diff --git a/annotations_1/--ABd2SeIGE_filtered.json b/annotations_1/--ABd2SeIGE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfd6a9a878edcc2ca6d7b9beeb40ae13edd76ae3 --- /dev/null +++ b/annotations_1/--ABd2SeIGE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.75], [15.0, 23.94], [27.0, 37.12], [48.0, 47.83], [51.0, 51.43], [60.0, 60.0], [62.0, 69.42], [86.0, 86.32], [93.0, 96.79], [98.0, 98.36], [99.0, 99.6], [100.0, 102.39], [106.0, 113.46]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [31.94, 30.17, 46.33, 0.0, 0.0, 0.0, 68.15, 0.0, 61.97, 0.0, 0.0, 38.33, 39.55], "audiomae_on_audioset": [[["theremin", 29.79], ["music", 28.67], ["hum", 7.9]], [["speech", 57.27], ["explosion", 14.36], ["burst, pop", 7.06]], [["music", 62.43], ["theremin", 8.26], ["cello", 4.68]], null, null, null, null, null, null, null, null, [["music", 21.78], ["musical instrument", 6.05], ["didgeridoo", 5.51]], [["music", 76.58], ["musical instrument", 3.22], ["theremin", 2.27]]], "duration": [4.75, 8.94, 10.12, -0.17, 0.43, 0.0, 7.42, 0.32, 3.79, 0.36, 0.6, 2.39, 7.46]} \ No newline at end of file diff --git a/annotations_1/--QCZKgJt6o_filtered.json b/annotations_1/--QCZKgJt6o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eda0024e4d05408c81e5065bd4807b883aae16d6 --- /dev/null +++ b/annotations_1/--QCZKgJt6o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [5.0, 6.37], [7.0, 9.76], [14.0, 16.93], [30.0, 31.36], [33.0, 33.54], [35.0, 35.72], [40.0, 46.94], [51.0, 50.68], [52.0, 61.47], [67.0, 69.9], [77.0, 77.35], [107.0, 108.08], [117.0, 117.19], [117.0, 118.18], [127.0, 128.22], [133.0, 134.74], [136.0, 136.24], [140.0, 142.8], [146.0, 149.35], [151.0, 151.31], [152.0, 153.35], [156.0, 156.61], [157.0, 159.6], [164.0, 165.43], [174.0, 175.02]], "keep_status": [false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 60.89, 45.59, 0.0, 0.0, 0.0, 35.85, 0.0, 34.71, 61.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 47.2, 0.0, 0.0, 0.0, 39.47, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 26.24], ["vocal music", 7.63], ["singing", 6.21]], null, null, null, [["speech", 18.36], ["moo", 9.75], ["livestock, farm animals, working animals", 8.42]], null, [["chant", 14.05], ["cattle, bovinae", 12.42], ["grunt", 10.88]], null, null, null, null, null, null, null, null, null, [["speech", 49.28], ["hum", 8.71], ["music", 5.69]], null, null, null, [["speech", 31.98], ["music", 6.36], ["hum", 5.44]], null, null], "duration": [1.3, 1.37, 2.76, 2.93, 1.36, 0.54, 0.72, 6.94, -0.32, 9.47, 2.9, 0.35, 1.08, 0.19, 1.18, 1.22, 1.74, 0.24, 2.8, 3.35, 0.31, 1.35, 0.61, 2.6, 1.43, 1.02]} \ No newline at end of file diff --git a/annotations_1/--hendERqm0_filtered.json b/annotations_1/--hendERqm0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0669cccee3e71d295a6ed82416912baafbbf25a --- /dev/null +++ b/annotations_1/--hendERqm0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.56], [14.0, 14.22], [16.0, 21.17], [28.0, 28.76], [32.0, 32.95], [34.0, 34.42], [36.0, 36.15], [38.0, 38.06], [40.0, 40.63], [41.0, 51.34], [53.0, 56.84], [58.0, 59.12], [61.0, 62.31], [66.0, 67.93], [70.0, 71.29], [74.0, 74.75], [77.0, 78.38], [82.0, 84.72]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 30.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.77, 31.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.95], "audiomae_on_audioset": [null, null, [["music", 67.55], ["electronic music", 5.78], ["house music", 4.08]], null, null, null, null, null, null, [["music", 45.64], ["speech", 12.16], ["techno", 9.56]], [["music", 51.69], ["speech", 33.92], ["drum machine", 1.58]], null, null, null, null, null, null, [["music", 30.48], ["sonar", 30.27], ["electronic music", 9.0]]], "duration": [0.56, 0.22, 5.17, 0.76, 0.95, 0.42, 0.15, 0.06, 0.63, 10.34, 3.84, 1.12, 1.31, 1.93, 1.29, 0.75, 1.38, 2.72]} \ No newline at end of file diff --git a/annotations_1/-0SHIbuEO3w_filtered.json b/annotations_1/-0SHIbuEO3w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ca78185f0eca138fe939cf67a75296c5456a9f6 --- /dev/null +++ b/annotations_1/-0SHIbuEO3w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 60.72], [63.0, 122.66], [127.0, 131.94]], "keep_status": [false, false, true], "silence_prob": [29.36, 0.0, 30.22], "audiomae_on_audioset": [[["music", 65.38], ["speech", 7.81], ["throbbing", 3.28]], null, [["speech", 22.67], ["music", 22.28], ["crowd", 5.83]]], "duration": [4.72, 59.66, 4.94]} \ No newline at end of file diff --git a/annotations_1/-19d_T472co_filtered.json b/annotations_1/-19d_T472co_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0437989b42eed3a8bcff6d44e94bbfb2b34a546f --- /dev/null +++ b/annotations_1/-19d_T472co_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 47.21], [48.0, 48.57], [53.0, 53.25], [53.0, 166.8], [167.0, 167.7], [168.0, 173.04], [175.0, 177.45], [180.0, 201.29], [205.0, 205.17], [206.0, 212.75]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 31.68, 35.71, 0.0, 74.76], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 76.85], ["speech", 5.82], ["boing", 1.78]], [["music", 32.21], ["fly, housefly", 10.63], ["buzz", 6.42]], null, null], "duration": [46.21, 0.57, 0.25, 113.8, 0.7, 5.04, 2.45, 21.29, 0.17, 6.75]} \ No newline at end of file diff --git a/annotations_1/-1W4xHNKvAk_filtered.json b/annotations_1/-1W4xHNKvAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9467dc1ee84c624e60243480b10c88ba9a32fa2 --- /dev/null +++ b/annotations_1/-1W4xHNKvAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.62], [16.0, 17.51], [35.0, 35.06], [36.0, 36.69], [50.0, 51.21], [52.0, 53.15], [73.0, 74.11], [85.0, 86.86], [100.0, 101.07], [102.0, 103.08], [114.0, 115.01], [117.0, 117.29], [120.0, 120.75], [135.0, 134.97], [150.0, 150.13], [208.0, 208.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 1.51, 0.06, 0.69, 1.21, 1.15, 1.11, 1.86, 1.07, 1.08, 1.01, 0.29, 0.75, -0.03, 0.13, 0.63]} \ No newline at end of file diff --git a/annotations_1/-1eKufUP5XQ_filtered.json b/annotations_1/-1eKufUP5XQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..603231b058b6f3ec8a1bba77d02a1e2ab295603a --- /dev/null +++ b/annotations_1/-1eKufUP5XQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.29], [11.0, 15.52], [20.0, 20.07], [24.0, 24.58], [40.0, 41.15], [44.0, 49.44], [50.0, 51.68], [53.0, 59.09], [64.0, 64.49], [65.0, 65.69], [66.0, 68.1], [79.0, 79.39], [80.0, 80.59], [83.0, 84.33], [89.0, 89.85], [91.0, 97.97], [99.0, 99.39], [100.0, 99.98], [100.0, 102.0], [104.0, 104.41], [105.0, 105.73], [106.0, 106.74], [107.0, 107.97], [110.0, 111.35], [112.0, 113.56], [114.0, 115.64], [116.0, 118.37], [119.0, 123.13]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.9, 0.0, 0.0, 0.0, 90.25, 0.0, 89.72, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 81.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.92, 94.66], "audiomae_on_audioset": [null, [["speech", 27.69], ["whack, thwack", 9.37], ["busy signal", 8.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 4.52, 0.07, 0.58, 1.15, 5.44, 1.68, 6.09, 0.49, 0.69, 2.1, 0.39, 0.59, 1.33, 0.85, 6.97, 0.39, -0.02, 2.0, 0.41, 0.73, 0.74, 0.97, 1.35, 1.56, 1.64, 2.37, 4.13]} \ No newline at end of file diff --git a/annotations_1/-1zLU5N6uBU_filtered.json b/annotations_1/-1zLU5N6uBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/-1zLU5N6uBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/-2KG4lLGEl0_filtered.json b/annotations_1/-2KG4lLGEl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a192524a4650c9672d503b8d0142c2a17d6edce2 --- /dev/null +++ b/annotations_1/-2KG4lLGEl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.27], [14.0, 15.26], [21.0, 21.66], [27.0, 27.48], [31.0, 32.09], [34.0, 34.03], [34.0, 34.96], [36.0, 36.54], [38.0, 39.01], [41.0, 42.52], [43.0, 43.6], [46.0, 46.41], [47.0, 49.2], [51.0, 51.33], [54.0, 55.85], [57.0, 58.55], [68.0, 68.88], [79.0, 79.73], [80.0, 80.94], [84.0, 84.54], [87.0, 87.52], [89.0, 90.24], [101.0, 101.85], [105.0, 105.51], [109.0, 109.65], [111.0, 112.77], [116.0, 116.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 1.26, 0.66, 0.48, 1.09, 0.03, 0.96, 0.54, 1.01, 1.52, 0.6, 0.41, 2.2, 0.33, 1.85, 1.55, 0.88, 0.73, 0.94, 0.54, 0.52, 1.24, 0.85, 0.51, 0.65, 1.77, 0.92]} \ No newline at end of file diff --git a/annotations_1/-2KGPYEFnsU_filtered.json b/annotations_1/-2KGPYEFnsU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bc5f9d2288921cfa708683de7b5429a18c6efc1 --- /dev/null +++ b/annotations_1/-2KGPYEFnsU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.39], [15.0, 16.73], [17.0, 17.9], [19.0, 20.11], [24.0, 24.53], [25.0, 25.76], [29.0, 33.12], [38.0, 39.55], [41.0, 43.04], [44.0, 44.71], [46.0, 47.39], [50.0, 50.03], [52.0, 53.38], [55.0, 56.1], [59.0, 60.71], [66.0, 66.9], [73.0, 73.94], [78.0, 78.9], [81.0, 80.79], [110.0, 110.1], [116.0, 117.9], [120.0, 119.8], [125.0, 127.04], [129.0, 129.41], [132.0, 132.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.63, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 1.73, 0.9, 1.11, 0.53, 0.76, 4.12, 1.55, 2.04, 0.71, 1.39, 0.03, 1.38, 1.1, 1.71, 0.9, 0.94, 0.9, -0.21, 0.1, 1.9, -0.2, 2.04, 0.41, 0.97]} \ No newline at end of file diff --git a/annotations_1/-2QFIXEHnOY_filtered.json b/annotations_1/-2QFIXEHnOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea4b135d467c6ccda9f2a044d3826870c6124d67 --- /dev/null +++ b/annotations_1/-2QFIXEHnOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 16.11], [19.0, 22.35], [24.0, 31.28], [33.0, 33.39], [34.0, 58.75], [59.0, 68.89]], "keep_status": [true, true, true, false, true, true], "silence_prob": [29.59, 29.9, 28.84, 0.0, 29.2, 29.4], "audiomae_on_audioset": [[["music", 34.03], ["buzz", 18.87], ["hum", 9.34]], [["hum", 17.0], ["mains hum", 12.84], ["throbbing", 7.47]], [["fly, housefly", 16.88], ["buzz", 13.34], ["mosquito", 12.24]], null, [["buzz", 13.81], ["hum", 12.07], ["electric shaver, electric razor", 6.64]], [["hum", 22.83], ["mains hum", 10.69], ["fly, housefly", 8.24]]], "duration": [10.11, 3.35, 7.28, 0.39, 24.75, 9.89]} \ No newline at end of file diff --git a/annotations_1/-5twCD8tAMc_filtered.json b/annotations_1/-5twCD8tAMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..191e5ec7d61aece63be80228ed9569155f898788 --- /dev/null +++ b/annotations_1/-5twCD8tAMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 23.65], [25.0, 25.08], [27.0, 28.24], [29.0, 30.91], [35.0, 35.61], [38.0, 42.33], [44.0, 75.29], [76.0, 76.72], [81.0, 89.38]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [33.09, 0.0, 0.0, 0.0, 0.0, 41.56, 0.0, 0.0, 30.12], "audiomae_on_audioset": [[["music", 83.83], ["theremin", 1.62], ["synthesizer", 1.3]], null, null, null, null, [["boat, water vehicle", 16.83], ["music", 14.4], ["vehicle", 11.07]], null, null, [["music", 72.52], ["musical instrument", 4.87], ["cacophony", 2.86]]], "duration": [15.65, 0.08, 1.24, 1.91, 0.61, 4.33, 31.29, 0.72, 8.38]} \ No newline at end of file diff --git a/annotations_1/-7-2-088LnM_filtered.json b/annotations_1/-7-2-088LnM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3037e77d9123ada38a370e4acab1bf677751cae0 --- /dev/null +++ b/annotations_1/-7-2-088LnM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.2], [23.0, 22.92], [23.0, 25.52], [28.0, 30.13], [35.0, 36.71], [40.0, 42.08], [44.0, 45.2], [45.0, 46.09], [46.0, 48.91], [49.0, 49.25], [50.0, 50.72], [51.0, 52.47], [53.0, 57.54], [59.0, 67.63], [70.0, 72.08], [72.0, 74.56], [82.0, 82.93], [87.0, 99.28], [99.0, 99.5], [100.0, 100.01], [100.0, 100.45], [101.0, 109.46]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 39.47, 36.04, 0.0, 97.11, 0.0, 0.0, 66.63, 0.0, 0.0, 0.0, 71.14, 67.63, 98.99, 43.85, 0.0, 37.46, 0.0, 0.0, 0.0, 42.74], "audiomae_on_audioset": [null, null, [["whale vocalization", 16.24], ["boing", 16.19], ["moo", 10.98]], [["speech", 72.48], ["applause", 5.84], ["radio", 2.77]], null, null, null, null, null, null, null, null, null, null, null, [["music", 62.7], ["burping, eructation", 2.31], ["percussion", 1.49]], null, [["music", 60.25], ["groan", 6.88], ["grunt", 5.85]], null, null, null, [["gasp", 19.11], ["speech", 13.68], ["breaking", 11.58]]], "duration": [0.2, -0.08, 2.52, 2.13, 1.71, 2.08, 1.2, 1.09, 2.91, 0.25, 0.72, 1.47, 4.54, 8.63, 2.08, 2.56, 0.93, 12.28, 0.5, 0.01, 0.45, 8.46]} \ No newline at end of file diff --git a/annotations_1/-7Sow81yi24_filtered.json b/annotations_1/-7Sow81yi24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac4b1a642f3eddad96ac0ab22d9e6bea1f00ecdd --- /dev/null +++ b/annotations_1/-7Sow81yi24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.53], [33.0, 38.33], [40.0, 42.58], [44.0, 45.69], [47.0, 63.64], [64.0, 66.07], [67.0, 73.43], [75.0, 76.65], [77.0, 79.95], [81.0, 84.52], [86.0, 89.21], [94.0, 96.35], [100.0, 101.29], [102.0, 103.87], [107.0, 107.33], [109.0, 110.39], [114.0, 124.66]], "keep_status": [false, true, false, false, false, true, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 49.92, 54.9, 0.0, 47.94, 35.61, 38.42, 0.0, 43.15, 38.54, 36.11, 45.14, 0.0, 0.0, 0.0, 0.0, 28.26], "audiomae_on_audioset": [null, [["music", 25.69], ["hum", 11.38], ["speech", 11.19]], null, null, [["hum", 39.29], ["mains hum", 20.44], ["music", 15.13]], [["gong", 43.33], ["hum", 9.03], ["singing bowl", 6.05]], [["hum", 50.46], ["throbbing", 24.51], ["mains hum", 10.71]], null, [["music", 41.92], ["mains hum", 17.04], ["hum", 14.08]], [["music", 40.52], ["mains hum", 12.71], ["hum", 12.62]], [["hum", 25.29], ["music", 24.57], ["mains hum", 18.16]], [["music", 60.94], ["theremin", 7.71], ["musical instrument", 3.84]], null, null, null, null, [["music", 56.16], ["vehicle", 7.08], ["car", 4.84]]], "duration": [0.53, 5.33, 2.58, 1.69, 16.64, 2.07, 6.43, 1.65, 2.95, 3.52, 3.21, 2.35, 1.29, 1.87, 0.33, 1.39, 10.66]} \ No newline at end of file diff --git a/annotations_1/-7cV5cWQmxg_filtered.json b/annotations_1/-7cV5cWQmxg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0503a47a9789adfbca6f2006310e7ee8a9edd172 --- /dev/null +++ b/annotations_1/-7cV5cWQmxg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.34], [8.0, 8.5], [9.0, 9.83], [17.0, 18.98], [21.0, 21.37], [22.0, 23.33], [27.0, 28.56], [32.0, 33.91], [34.0, 38.38], [39.0, 40.36], [42.0, 61.25], [64.0, 66.39], [68.0, 73.47], [80.0, 79.89], [80.0, 80.2], [88.0, 94.09]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.01, 0.0, 41.98, 94.81, 37.09, 0.0, 0.0, 41.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 28.43], ["music", 28.37], ["synthesizer", 5.19]], null, [["mosquito", 27.65], ["fly, housefly", 20.31], ["insect", 8.7]], null, [["speech", 72.72], ["stomach rumble", 4.04], ["animal", 2.28]], null, null, [["speech", 19.75], ["music", 18.08], ["throbbing", 13.72]]], "duration": [0.34, 0.5, 0.83, 1.98, 0.37, 1.33, 1.56, 1.91, 4.38, 1.36, 19.25, 2.39, 5.47, -0.11, 0.2, 6.09]} \ No newline at end of file diff --git a/annotations_1/-7mzQx0ebqk_filtered.json b/annotations_1/-7mzQx0ebqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c98ba98248ec2213a7d6e0a8ce39f81ef77b5f7 --- /dev/null +++ b/annotations_1/-7mzQx0ebqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [10.0, 10.27], [14.0, 14.88], [19.0, 20.17], [23.0, 23.01], [24.0, 28.61], [32.0, 34.43], [43.0, 43.29], [45.0, 45.52], [49.0, 49.55], [54.0, 54.06], [62.0, 63.85], [65.0, 72.45], [75.0, 79.84], [82.0, 82.54], [86.0, 89.4], [96.0, 97.44], [98.0, 100.3], [126.0, 125.73], [128.0, 127.7], [131.0, 132.16], [133.0, 133.22], [135.0, 136.95], [141.0, 141.61], [144.0, 143.95], [145.0, 148.66]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 48.27, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 61.67, 60.05, 0.0, 94.22, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7], "audiomae_on_audioset": [null, null, null, null, null, [["singing bowl", 23.82], ["music", 21.45], ["burping, eructation", 15.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.27, 0.88, 1.17, 0.01, 4.61, 2.43, 0.29, 0.52, 0.55, 0.06, 1.85, 7.45, 4.84, 0.54, 3.4, 1.44, 2.3, -0.27, -0.3, 1.16, 0.22, 1.95, 0.61, -0.05, 3.66]} \ No newline at end of file diff --git a/annotations_1/-8ajIeIeJpY_filtered.json b/annotations_1/-8ajIeIeJpY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97a7b5ed9d7fc58d336376fc01c0fbb6be058bac --- /dev/null +++ b/annotations_1/-8ajIeIeJpY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.89], [3.0, 5.76], [6.0, 6.86], [8.0, 8.73], [14.0, 15.4], [19.0, 19.99], [22.0, 23.03], [24.0, 24.53], [26.0, 26.33], [34.0, 33.86], [35.0, 35.43], [36.0, 36.31], [37.0, 37.89], [38.0, 39.29], [42.0, 43.29], [44.0, 44.58], [45.0, 45.4], [46.0, 46.4], [48.0, 48.32], [57.0, 57.15], [58.0, 59.56], [60.0, 61.32], [63.0, 63.66], [68.0, 68.47], [74.0, 76.0], [77.0, 78.85], [81.0, 85.8], [86.0, 86.41], [89.0, 90.75], [91.0, 91.93], [92.0, 92.62], [93.0, 93.85]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.92, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 34.69], ["radio", 21.67], ["croak", 11.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.11, 2.76, 0.86, 0.73, 1.4, 0.99, 1.03, 0.53, 0.33, -0.14, 0.43, 0.31, 0.89, 1.29, 1.29, 0.58, 0.4, 0.4, 0.32, 0.15, 1.56, 1.32, 0.66, 0.47, 2.0, 1.85, 4.8, 0.41, 1.75, 0.93, 0.62, 0.85]} \ No newline at end of file diff --git a/annotations_1/-AZg55qXj7U_filtered.json b/annotations_1/-AZg55qXj7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56f67b60fb7943a1bb1cd2b8011d60fd6e08a86a --- /dev/null +++ b/annotations_1/-AZg55qXj7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.62], [6.0, 61.82], [62.0, 86.7], [88.0, 106.52], [109.0, 152.19], [153.0, 178.44]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 35.0, 31.48, 0.0, 33.88], "audiomae_on_audioset": [null, null, [["music", 83.76], ["hum", 7.02], ["throbbing", 1.65]], [["music", 65.55], ["synthesizer", 5.15], ["hum", 4.37]], null, [["music", 22.0], ["hum", 20.87], ["speech", 11.7]]], "duration": [0.62, 55.82, 24.7, 18.52, 43.19, 25.44]} \ No newline at end of file diff --git a/annotations_1/-BgZFaMJRxM_filtered.json b/annotations_1/-BgZFaMJRxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b97362e90eb6f798daefc7d304a08330545147c9 --- /dev/null +++ b/annotations_1/-BgZFaMJRxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.34], [7.0, 7.79], [9.0, 10.56], [15.0, 17.19], [17.0, 18.17], [19.0, 19.72], [21.0, 23.97], [25.0, 28.31], [30.0, 32.85], [43.0, 43.6], [45.0, 45.55], [48.0, 52.08], [56.0, 61.15], [64.0, 65.4], [67.0, 68.32], [69.0, 69.89], [70.0, 72.89], [74.0, 77.5], [81.0, 83.39], [84.0, 104.89], [106.0, 106.46], [107.0, 108.24], [110.0, 111.57], [115.0, 116.75], [120.0, 120.61], [123.0, 124.21], [126.0, 127.99], [130.0, 131.03], [132.0, 134.27], [135.0, 135.68], [136.0, 137.03], [139.0, 141.13], [142.0, 142.92], [146.0, 145.71], [146.0, 147.06], [149.0, 149.44], [152.0, 156.36], [162.0, 163.31], [164.0, 165.11], [168.0, 168.91], [174.0, 174.97], [175.0, 176.34], [177.0, 178.58], [180.0, 179.91]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.75, 0.0, 0.0, 47.98, 0.0, 0.0, 54.43, 50.51, 56.25, 0.0, 0.0, 57.32, 61.67, 0.0, 0.0, 0.0, 39.86, 58.55, 52.51, 33.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.18, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 0.0, 47.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["chirp tone", 24.02], ["whale vocalization", 16.52], ["sine wave", 16.23]], null, null, [["music", 31.28], ["whale vocalization", 20.69], ["singing bowl", 6.34]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.97], ["whale vocalization", 14.45], ["hum", 11.47]], null, null, [["hum", 47.44], ["throbbing", 31.47], ["mains hum", 6.89]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 28.27], ["mains hum", 24.35], ["speech", 22.56]], null, null, null, null, null, null, null], "duration": [3.34, 0.79, 1.56, 2.19, 1.17, 0.72, 2.97, 3.31, 2.85, 0.6, 0.55, 4.08, 5.15, 1.4, 1.32, 0.89, 2.89, 3.5, 2.39, 20.89, 0.46, 1.24, 1.57, 1.75, 0.61, 1.21, 1.99, 1.03, 2.27, 0.68, 1.03, 2.13, 0.92, -0.29, 1.06, 0.44, 4.36, 1.31, 1.11, 0.91, 0.97, 1.34, 1.58, -0.09]} \ No newline at end of file diff --git a/annotations_1/-CSIqCS1WIk_filtered.json b/annotations_1/-CSIqCS1WIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43434f97cb91519933a57ebe7f1827c4ea60dc4e --- /dev/null +++ b/annotations_1/-CSIqCS1WIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.82], [5.0, 7.57], [9.0, 10.52], [11.0, 12.31], [14.0, 15.06], [18.0, 27.65], [30.0, 57.5], [58.0, 60.94], [62.0, 64.1], [67.0, 114.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.64, 100.0, 0.0, 0.0, 0.0, 100.0, 99.8, 98.51, 91.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [2.82, 2.57, 1.52, 1.31, 1.06, 9.65, 27.5, 2.94, 2.1, 47.57]} \ No newline at end of file diff --git a/annotations_1/-DXQJLwDAwg_filtered.json b/annotations_1/-DXQJLwDAwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c24741c221a08374bf5c5775183ea311bc2bfc22 --- /dev/null +++ b/annotations_1/-DXQJLwDAwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.73], [7.0, 7.91], [10.0, 10.0], [10.0, 10.49], [11.0, 12.66], [14.0, 14.22], [15.0, 19.21], [21.0, 21.81], [22.0, 23.03], [24.0, 25.22], [26.0, 28.39], [30.0, 33.35], [36.0, 37.74], [39.0, 43.75], [47.0, 48.32], [50.0, 50.84], [52.0, 54.65], [55.0, 55.95], [58.0, 58.68], [60.0, 59.86], [61.0, 61.82], [63.0, 66.48], [67.0, 67.81], [69.0, 69.42], [71.0, 74.07], [76.0, 76.44], [78.0, 78.39], [81.0, 81.19], [85.0, 85.46], [89.0, 89.78], [92.0, 92.52], [93.0, 93.53], [95.0, 95.79], [100.0, 100.55], [102.0, 103.28], [104.0, 104.95], [107.0, 107.64], [113.0, 114.08], [115.0, 116.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 82.43, 79.07, 0.0, 63.21, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 86.64, 0.0, 0.0, 74.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.91, 0.0, 0.49, 1.66, 0.22, 4.21, 0.81, 1.03, 1.22, 2.39, 3.35, 1.74, 4.75, 1.32, 0.84, 2.65, 0.95, 0.68, -0.14, 0.82, 3.48, 0.81, 0.42, 3.07, 0.44, 0.39, 0.19, 0.46, 0.78, 0.52, 0.53, 0.79, 0.55, 1.28, 0.95, 0.64, 1.08, 1.16]} \ No newline at end of file diff --git a/annotations_1/-DXU2ZHuiTs_filtered.json b/annotations_1/-DXU2ZHuiTs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3055202e3bd3de197e0c3ecf9b936f20c790d519 --- /dev/null +++ b/annotations_1/-DXU2ZHuiTs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.16], [1.0, 1.54], [8.0, 8.21], [12.0, 11.92], [13.0, 13.73], [16.0, 16.39], [17.0, 17.66], [23.0, 23.04], [27.0, 28.22], [29.0, 29.4], [31.0, 31.45], [33.0, 33.84], [34.0, 34.74], [36.0, 36.83], [39.0, 39.12], [40.0, 40.09], [41.0, 41.81], [48.0, 48.63], [52.0, 51.98], [55.0, 54.97], [56.0, 56.4], [60.0, 60.39], [62.0, 61.87], [63.0, 62.92], [65.0, 65.35], [67.0, 67.31], [69.0, 69.33], [73.0, 73.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.54, 0.21, -0.08, 0.73, 0.39, 0.66, 0.04, 1.22, 0.4, 0.45, 0.84, 0.74, 0.83, 0.12, 0.09, 0.81, 0.63, -0.02, -0.03, 0.4, 0.39, -0.13, -0.08, 0.35, 0.31, 0.33, 0.08]} \ No newline at end of file diff --git a/annotations_1/-DqmTaUK-Ow_filtered.json b/annotations_1/-DqmTaUK-Ow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d37022a6c4cb9f8dc6753bd66e848eb62155559b --- /dev/null +++ b/annotations_1/-DqmTaUK-Ow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.33], [24.0, 25.73], [26.0, 34.1], [35.0, 38.38], [40.0, 49.4], [50.0, 52.25], [58.0, 59.34], [65.0, 65.52], [66.0, 66.92]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.51, 99.31, 68.41, 69.34, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.33, 1.73, 8.1, 3.38, 9.4, 2.25, 1.34, 0.52, 0.92]} \ No newline at end of file diff --git a/annotations_1/-FQOaUEE69I_filtered.json b/annotations_1/-FQOaUEE69I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99b2fd5fdac71c95187c9a0091f61a3a7ba29df0 --- /dev/null +++ b/annotations_1/-FQOaUEE69I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.71], [4.0, 5.95], [15.0, 20.61], [22.0, 22.4], [23.0, 23.7], [24.0, 25.81], [26.0, 27.08], [28.0, 28.34], [30.0, 30.72], [31.0, 34.33], [35.0, 35.33], [40.0, 43.02], [44.0, 46.09], [48.0, 48.52], [50.0, 50.82], [52.0, 52.96], [57.0, 58.06], [62.0, 62.46], [64.0, 64.47], [66.0, 66.34], [68.0, 71.2], [73.0, 73.8], [75.0, 75.46], [77.0, 78.14], [79.0, 81.5], [84.0, 85.72], [87.0, 87.69], [91.0, 91.62], [93.0, 96.11], [97.0, 97.6], [99.0, 100.25], [104.0, 104.4], [107.0, 107.91], [110.0, 110.25], [111.0, 118.81], [120.0, 122.07], [123.0, 137.61], [139.0, 140.41], [143.0, 143.26], [148.0, 151.63], [152.0, 153.86], [154.0, 156.12], [156.0, 157.47], [158.0, 158.62], [160.0, 161.38], [162.0, 165.4], [166.0, 166.48], [167.0, 167.64], [175.0, 180.82]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 39.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.45, 0.0, 99.44, 91.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.14, 0.0, 0.0, 0.0, 34.43, 0.0, 0.0, 0.0, 84.43, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 56.1, 35.47, 0.0, 0.0, 52.39, 0.0, 47.12, 0.0, 0.0, 0.0, 30.41, 0.0, 0.0, 46.02], "audiomae_on_audioset": [null, null, [["speech", 44.89], ["sidetone", 13.71], ["chirp tone", 11.39]], null, null, null, null, null, null, [["speech", 42.88], ["crackle", 7.42], ["crushing", 4.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.83], ["sine wave", 15.21], ["sidetone", 8.1]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 32.18], ["music", 29.24], ["mains hum", 12.57]], null, null, null, null, [["speech", 36.44], ["sidetone", 31.39], ["music", 8.37]], null, null, null, [["speech", 27.73], ["livestock, farm animals, working animals", 11.15], ["cattle, bovinae", 5.06]], null, null, [["music", 18.98], ["chirp tone", 13.64], ["crushing", 12.95]]], "duration": [0.71, 1.95, 5.61, 0.4, 0.7, 1.81, 1.08, 0.34, 0.72, 3.33, 0.33, 3.02, 2.09, 0.52, 0.82, 0.96, 1.06, 0.46, 0.47, 0.34, 3.2, 0.8, 0.46, 1.14, 2.5, 1.72, 0.69, 0.62, 3.11, 0.6, 1.25, 0.4, 0.91, 0.25, 7.81, 2.07, 14.61, 1.41, 0.26, 3.63, 1.86, 2.12, 1.47, 0.62, 1.38, 3.4, 0.48, 0.64, 5.82]} \ No newline at end of file diff --git a/annotations_1/-FU65KX7aJs_filtered.json b/annotations_1/-FU65KX7aJs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09fa577aa9881c06d9cfe6230358c13bdaa9713b --- /dev/null +++ b/annotations_1/-FU65KX7aJs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.58], [14.0, 15.28], [17.0, 16.95], [19.0, 39.48], [41.0, 52.96], [54.0, 69.43], [70.0, 74.93], [76.0, 77.58], [78.0, 97.44], [98.0, 98.88], [99.0, 100.03], [102.0, 103.03], [104.0, 105.33], [111.0, 111.0], [116.0, 117.07], [121.0, 122.52], [125.0, 125.81], [126.0, 126.32], [126.0, 130.45], [132.0, 132.93], [134.0, 137.42], [138.0, 138.32], [139.0, 139.85], [141.0, 141.89], [145.0, 148.1], [149.0, 149.18], [171.0, 171.22], [171.0, 171.36], [175.0, 174.77]], "keep_status": [false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, false], "silence_prob": [59.24, 0.0, 0.0, 30.61, 32.83, 30.67, 39.7, 0.0, 36.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.69, 0.0, 49.54, 0.0, 0.0, 0.0, 41.34, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 39.55], ["didgeridoo", 17.69], ["fly, housefly", 10.38]], [["music", 58.18], ["synthesizer", 12.1], ["hum", 7.36]], [["music", 54.02], ["didgeridoo", 24.44], ["synthesizer", 4.28]], [["wheeze", 12.09], ["speech", 7.39], ["frog", 6.24]], null, [["speech", 38.1], ["animal", 17.99], ["livestock, farm animals, working animals", 12.74]], null, null, null, null, null, null, null, null, null, [["speech", 55.95], ["animal", 9.45], ["whale vocalization", 4.16]], null, [["hum", 29.43], ["mains hum", 18.48], ["music", 9.87]], null, null, null, [["mains hum", 28.61], ["hum", 27.62], ["radio", 8.48]], null, null, null, null], "duration": [4.58, 1.28, -0.05, 20.48, 11.96, 15.43, 4.93, 1.58, 19.44, 0.88, 1.03, 1.03, 1.33, 0.0, 1.07, 1.52, 0.81, 0.32, 4.45, 0.93, 3.42, 0.32, 0.85, 0.89, 3.1, 0.18, 0.22, 0.36, -0.23]} \ No newline at end of file diff --git a/annotations_1/-G7OPYUlnT0_filtered.json b/annotations_1/-G7OPYUlnT0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29b58ce6615e635f88882f33bc4ddbf4180d3b14 --- /dev/null +++ b/annotations_1/-G7OPYUlnT0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.89], [23.0, 23.26], [25.0, 25.29], [31.0, 30.89], [93.0, 93.24]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [-0.11, 0.26, 0.29, -0.11, 0.24]} \ No newline at end of file diff --git a/annotations_1/-H6l6-_elF0_filtered.json b/annotations_1/-H6l6-_elF0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c01e2c0c035ff57a527d11c6468e11aa68e16e51 --- /dev/null +++ b/annotations_1/-H6l6-_elF0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.13], [13.0, 14.25], [17.0, 17.69], [20.0, 21.29], [26.0, 37.62], [39.0, 48.19], [52.0, 52.44], [57.0, 57.79], [62.0, 62.53], [66.0, 67.32], [76.0, 76.86], [81.0, 81.7], [85.0, 86.36], [95.0, 96.08], [103.0, 105.76], [114.0, 115.53], [120.0, 120.78], [125.0, 125.81], [133.0, 133.24], [133.0, 138.7], [141.0, 142.01], [144.0, 145.56], [146.0, 148.44], [150.0, 150.35], [154.0, 154.97], [158.0, 157.72], [159.0, 159.95], [163.0, 163.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [96.17, 0.0, 0.0, 0.0, 78.55, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 0.0, 56.78, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 10.24], ["thunk", 7.46], ["speech", 7.36]], null, null, null, null, null, null, null, null], "duration": [2.13, 1.25, 0.69, 1.29, 11.62, 9.19, 0.44, 0.79, 0.53, 1.32, 0.86, 0.7, 1.36, 1.08, 2.76, 1.53, 0.78, 0.81, 0.24, 5.7, 1.01, 1.56, 2.44, 0.35, 0.97, -0.28, 0.95, 0.65]} \ No newline at end of file diff --git a/annotations_1/-IV-ZZwXUkw_filtered.json b/annotations_1/-IV-ZZwXUkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af85df172e7e75acb26c186d4c1e0eeb169fff24 --- /dev/null +++ b/annotations_1/-IV-ZZwXUkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 26.13], [29.0, 30.69], [35.0, 40.22], [41.0, 43.88], [47.0, 52.44], [52.0, 116.23], [118.0, 124.95], [125.0, 163.73]], "keep_status": [false, false, true, true, true, false, true, false], "silence_prob": [30.6, 0.0, 28.97, 29.44, 28.46, 0.0, 28.72, 0.0], "audiomae_on_audioset": [[["throbbing", 56.58], ["hum", 10.19], ["music", 9.05]], null, [["music", 33.25], ["grunt", 15.2], ["fart", 12.17]], [["breaking", 28.12], ["whack, thwack", 15.12], ["music", 8.46]], [["zipper (clothing)", 30.8], ["whack, thwack", 11.18], ["smash, crash", 7.28]], null, [["groan", 18.26], ["music", 13.46], ["whack, thwack", 11.18]], null], "duration": [17.13, 1.69, 5.22, 2.88, 5.44, 64.23, 6.95, 38.73]} \ No newline at end of file diff --git a/annotations_1/-JNyHnAi8zk_filtered.json b/annotations_1/-JNyHnAi8zk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7038be175df2b36f1954f88fb078ade8fde0e50 --- /dev/null +++ b/annotations_1/-JNyHnAi8zk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 20.11], [20.0, 20.73], [22.0, 23.35], [24.0, 25.44], [26.0, 35.33], [39.0, 40.05], [42.0, 53.35], [54.0, 55.71], [57.0, 57.11], [59.0, 65.6], [68.0, 85.14], [91.0, 100.55], [103.0, 119.28], [121.0, 123.5], [126.0, 148.81], [149.0, 150.21], [151.0, 151.56], [153.0, 170.6]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [28.69, 0.0, 0.0, 0.0, 28.99, 0.0, 29.89, 0.0, 0.0, 28.67, 28.77, 28.61, 28.68, 29.78, 28.67, 0.0, 0.0, 29.53], "audiomae_on_audioset": [[["music", 45.86], ["speech", 33.8], ["crowd", 1.63]], null, null, null, [["music", 48.28], ["speech", 5.84], ["buzz", 2.5]], null, [["music", 56.42], ["musical instrument", 3.38], ["middle eastern music", 3.11]], null, null, [["music", 55.47], ["speech", 22.82], ["electronic music", 4.18]], [["music", 61.66], ["speech", 7.65], ["vehicle", 5.05]], [["music", 91.63], ["ice cream truck, ice cream van", 1.27], ["speech", 1.13]], [["music", 83.45], ["speech", 12.02], ["electronic music", 0.56]], [["music", 44.67], ["middle eastern music", 9.38], ["musical instrument", 6.41]], [["music", 85.64], ["electronic music", 5.03], ["speech", 1.37]], null, null, [["music", 60.08], ["speech", 15.87], ["vehicle", 1.54]]], "duration": [12.11, 0.73, 1.35, 1.44, 9.33, 1.05, 11.35, 1.71, 0.11, 6.6, 17.14, 9.55, 16.28, 2.5, 22.81, 1.21, 0.56, 17.6]} \ No newline at end of file diff --git a/annotations_1/-Jf-E7oEguU_filtered.json b/annotations_1/-Jf-E7oEguU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cd507b521785b9cd717b45b43c4bd6a429b3224 --- /dev/null +++ b/annotations_1/-Jf-E7oEguU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 94.05]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [88.05]} \ No newline at end of file diff --git a/annotations_1/-JhNO_E3aEE_filtered.json b/annotations_1/-JhNO_E3aEE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45bc1e7124ee5fe53fe1920cf55cb47b12142924 --- /dev/null +++ b/annotations_1/-JhNO_E3aEE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.03], [7.0, 7.7], [8.0, 8.18], [10.0, 10.69], [12.0, 12.23], [14.0, 14.5], [24.0, 24.92], [26.0, 29.08], [30.0, 29.83], [31.0, 31.11], [32.0, 31.85], [33.0, 33.91], [38.0, 44.12], [45.0, 45.59], [46.0, 47.22], [48.0, 49.91], [51.0, 52.44], [54.0, 67.9], [69.0, 73.95], [76.0, 76.25], [77.0, 82.76], [84.0, 83.98], [85.0, 88.94], [91.0, 93.24], [94.0, 94.91], [96.0, 96.23], [97.0, 100.84], [102.0, 102.86], [104.0, 104.73], [106.0, 107.47], [112.0, 113.88], [115.0, 116.78], [118.0, 118.57], [119.0, 121.81], [123.0, 132.49], [134.0, 134.79], [135.0, 180.39], [181.0, 185.43], [187.0, 191.66], [193.0, 196.94], [200.0, 204.26], [209.0, 211.94], [214.0, 218.13], [218.0, 220.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.56, 0.0, 0.0, 0.0, 0.0, 45.65, 0.0, 0.0, 0.0, 0.0, 64.52, 45.75, 0.0, 96.77, 0.0, 58.89, 82.61, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 97.83, 0.0, 0.0, 99.31, 94.37, 81.71, 79.94, 81.17, 72.75, 65.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 73.25], ["thunk", 3.4], ["inside, small room", 1.41]], null, null, null, null, [["speech", 48.32], ["heart sounds, heartbeat", 12.75], ["stomach rumble", 11.88]], null, null, null, null, null, [["hum", 46.92], ["mains hum", 17.11], ["speech", 7.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.03, 0.7, 0.18, 0.69, 0.23, 0.5, 0.92, 3.08, -0.17, 0.11, -0.15, 0.91, 6.12, 0.59, 1.22, 1.91, 1.44, 13.9, 4.95, 0.25, 5.76, -0.02, 3.94, 2.24, 0.91, 0.23, 3.84, 0.86, 0.73, 1.47, 1.88, 1.78, 0.57, 2.81, 9.49, 0.79, 45.39, 4.43, 4.66, 3.94, 4.26, 2.94, 4.13, 2.75]} \ No newline at end of file diff --git a/annotations_1/-KVNfZo-cfc_filtered.json b/annotations_1/-KVNfZo-cfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2466a276d874959d071383550cfa5929ce89bc95 --- /dev/null +++ b/annotations_1/-KVNfZo-cfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.86], [4.0, 5.04], [6.0, 6.08], [10.0, 10.3], [11.0, 11.26], [12.0, 12.56], [15.0, 15.16], [18.0, 18.81], [21.0, 22.84], [23.0, 25.29], [26.0, 29.89], [33.0, 34.5], [36.0, 36.78], [37.0, 37.98], [39.0, 39.39], [40.0, 43.23], [46.0, 46.89], [48.0, 48.2], [49.0, 49.25], [50.0, 50.18], [50.0, 52.25], [55.0, 55.22], [56.0, 58.29], [60.0, 60.27], [63.0, 63.54], [66.0, 66.61], [71.0, 71.76], [91.0, 91.54], [93.0, 94.46], [95.0, 96.9], [98.0, 99.03], [100.0, 101.51], [102.0, 104.38], [106.0, 107.45], [109.0, 111.77], [113.0, 116.13], [118.0, 118.77], [120.0, 120.95], [122.0, 123.48], [126.0, 127.28], [128.0, 129.29], [131.0, 133.98], [136.0, 137.96], [139.0, 147.39], [151.0, 152.29], [155.0, 155.92], [158.0, 161.6], [168.0, 169.25], [171.0, 171.21], [173.0, 173.45], [175.0, 176.98], [180.0, 184.87], [186.0, 188.87], [190.0, 191.42], [193.0, 194.78], [196.0, 196.45], [198.0, 199.35], [201.0, 201.55], [203.0, 204.31], [205.0, 206.95], [209.0, 209.39], [210.0, 224.24], [228.0, 229.17], [231.0, 235.28], [236.0, 239.79], [241.0, 242.06], [244.0, 248.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.05, 94.37, 0.0, 0.0, 0.0, 0.0, 56.93, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.33, 0.0, 99.59, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 96.42, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 99.95, 65.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.2, 0.0, 85.17, 92.15, 0.0, 84.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["whale vocalization", 60.93], ["speech", 6.52], ["sidetone", 5.62]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 38.5], ["mains hum", 24.84], ["throbbing", 16.21]], null, null, null, null, null], "duration": [0.86, 1.04, 0.08, 0.3, 0.26, 0.56, 0.16, 0.81, 1.84, 2.29, 3.89, 1.5, 0.78, 0.98, 0.39, 3.23, 0.89, 0.2, 0.25, 0.18, 2.25, 0.22, 2.29, 0.27, 0.54, 0.61, 0.76, 0.54, 1.46, 1.9, 1.03, 1.51, 2.38, 1.45, 2.77, 3.13, 0.77, 0.95, 1.48, 1.28, 1.29, 2.98, 1.96, 8.39, 1.29, 0.92, 3.6, 1.25, 0.21, 0.45, 1.98, 4.87, 2.87, 1.42, 1.78, 0.45, 1.35, 0.55, 1.31, 1.95, 0.39, 14.24, 1.17, 4.28, 3.79, 1.06, 4.41]} \ No newline at end of file diff --git a/annotations_1/-KW0wz1xBfw_filtered.json b/annotations_1/-KW0wz1xBfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..624dedb84608a1e595f1dd53512b2cbb9acca7af --- /dev/null +++ b/annotations_1/-KW0wz1xBfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.09], [17.0, 19.9], [20.0, 26.03], [26.0, 26.5], [27.0, 27.62], [28.0, 27.89], [29.0, 29.64], [32.0, 96.55], [100.0, 121.73], [122.0, 127.13], [128.0, 130.57], [132.0, 134.91], [136.0, 138.37]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 63.53, 39.72, 0.0, 0.0, 0.0, 0.0, 0.0, 36.15, 99.99, 90.95, 99.26, 60.6], "audiomae_on_audioset": [null, null, [["music", 51.35], ["theremin", 7.7], ["singing bowl", 5.05]], null, null, null, null, null, [["rumble", 19.05], ["explosion", 14.27], ["hum", 9.71]], null, null, null, null], "duration": [0.09, 2.9, 6.03, 0.5, 0.62, -0.11, 0.64, 64.55, 21.73, 5.13, 2.57, 2.91, 2.37]} \ No newline at end of file diff --git a/annotations_1/-Koj9hvcBMk_filtered.json b/annotations_1/-Koj9hvcBMk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1450859ed17638a1d8bcfa004f964f709591061 --- /dev/null +++ b/annotations_1/-Koj9hvcBMk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.63], [25.0, 26.52], [27.0, 28.17], [37.0, 38.55], [43.0, 46.13], [47.0, 47.44], [48.0, 48.81], [51.0, 51.66], [53.0, 53.89], [56.0, 56.54], [58.0, 58.01], [59.0, 59.56], [61.0, 61.11], [77.0, 82.56], [85.0, 86.1], [86.0, 86.97], [89.0, 90.24], [98.0, 98.22], [99.0, 99.0], [104.0, 104.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.63, 1.52, 1.17, 1.55, 3.13, 0.44, 0.81, 0.66, 0.89, 0.54, 0.01, 0.56, 0.11, 5.56, 1.1, 0.97, 1.24, 0.22, 0.0, 0.63]} \ No newline at end of file diff --git a/annotations_1/-Kztqrjp2yw_filtered.json b/annotations_1/-Kztqrjp2yw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..870359429a856e8e507fad8d094cc9d7f271302b --- /dev/null +++ b/annotations_1/-Kztqrjp2yw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.75], [3.0, 3.5], [5.0, 5.48], [6.0, 6.67], [8.0, 90.78], [92.0, 92.53], [94.0, 97.19], [99.0, 102.49], [106.0, 107.77], [111.0, 114.93], [116.0, 117.59], [119.0, 122.47], [127.0, 129.19], [133.0, 133.78], [136.0, 140.86], [144.0, 144.32], [147.0, 160.79], [162.0, 175.36], [177.0, 184.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 99.84, 0.0, 100.0, 0.0, 99.76, 81.0, 0.0, 59.15, 0.0, 30.67, 32.25, 55.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 38.68], ["cattle, bovinae", 31.7], ["moo", 22.6]], [["music", 14.27], ["fly, housefly", 11.78], ["sidetone", 7.68]], null], "duration": [-0.25, 0.5, 0.48, 0.67, 82.78, 0.53, 3.19, 3.49, 1.77, 3.93, 1.59, 3.47, 2.19, 0.78, 4.86, 0.32, 13.79, 13.36, 7.47]} \ No newline at end of file diff --git a/annotations_1/-LCqZeb1de0_filtered.json b/annotations_1/-LCqZeb1de0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ff95584a343a0a3669a7a61562dbee0d3425469 --- /dev/null +++ b/annotations_1/-LCqZeb1de0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.48], [9.0, 10.02], [14.0, 15.04], [16.0, 20.28], [23.0, 23.09], [26.0, 26.22], [28.0, 28.29], [33.0, 35.14], [36.0, 38.13], [46.0, 47.95], [54.0, 62.11], [69.0, 69.99], [75.0, 88.37], [90.0, 90.59], [92.0, 92.67], [95.0, 103.05], [106.0, 108.55], [112.0, 113.0], [116.0, 123.25], [126.0, 127.82], [134.0, 135.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 88.83, 0.0, 0.0, 0.0, 89.9, 60.89, 0.0, 92.97, 0.0, 99.98, 0.0, 0.0, 99.88, 99.95, 0.0, 83.7, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 1.02, 1.04, 4.28, 0.09, 0.22, 0.29, 2.14, 2.13, 1.95, 8.11, 0.99, 13.37, 0.59, 0.67, 8.05, 2.55, 1.0, 7.25, 1.82, 1.94]} \ No newline at end of file diff --git a/annotations_1/-Lrndfrc9yU_filtered.json b/annotations_1/-Lrndfrc9yU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/-Lrndfrc9yU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/-MNpOKICOx8_filtered.json b/annotations_1/-MNpOKICOx8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f57ea9414141946842d323b760118425160aab3 --- /dev/null +++ b/annotations_1/-MNpOKICOx8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [5.0, 7.89], [10.0, 9.78], [11.0, 11.89], [18.0, 19.74], [22.0, 25.59], [26.0, 26.35], [34.0, 35.4], [38.0, 37.99], [48.0, 49.69], [50.0, 50.25], [51.0, 52.41], [54.0, 57.33], [59.0, 60.99], [63.0, 63.59], [64.0, 64.35], [66.0, 77.57], [80.0, 81.77], [86.0, 93.02], [93.0, 94.74], [96.0, 96.84], [97.0, 100.74], [103.0, 103.17], [106.0, 106.57], [112.0, 113.22], [114.0, 117.83], [118.0, 119.85], [121.0, 121.36], [122.0, 123.42], [124.0, 132.61], [133.0, 134.64], [138.0, 138.86], [140.0, 140.0]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.26, 0.0, 0.0, 0.0, 36.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.71, 0.0, 0.0, 0.0, 45.49, 0.0, 67.13, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 74.29, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["sidetone", 27.19], ["speech", 12.83], ["fly, housefly", 12.71]], null, null, null, [["music", 22.44], ["speech", 13.4], ["frog", 11.1]], null, null, null, null, null, null, null, null, null, null, [["thunk", 77.32], ["music", 10.1], ["mosquito", 3.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 2.89, -0.22, 0.89, 1.74, 3.59, 0.35, 1.4, -0.01, 1.69, 0.25, 1.41, 3.33, 1.99, 0.59, 0.35, 11.57, 1.77, 7.02, 1.74, 0.84, 3.74, 0.17, 0.57, 1.22, 3.83, 1.85, 0.36, 1.42, 8.61, 1.64, 0.86, 0.0]} \ No newline at end of file diff --git a/annotations_1/-Nzbwerwks8_filtered.json b/annotations_1/-Nzbwerwks8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcd6fecc044274505cb2ecf33e3948d318967d6a --- /dev/null +++ b/annotations_1/-Nzbwerwks8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [5.0, 5.86], [6.0, 12.97], [18.0, 19.21], [20.0, 23.06], [26.0, 28.95], [34.0, 39.63], [42.0, 42.09], [43.0, 44.83], [50.0, 54.41], [55.0, 73.7], [79.0, 82.31], [84.0, 84.86], [86.0, 92.77], [98.0, 101.33], [105.0, 108.51], [115.0, 119.62]], "keep_status": [false, false, false, false, true, true, true, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 39.11, 0.0, 34.11, 33.41, 31.43, 0.0, 0.0, 31.21, 30.91, 30.75, 0.0, 31.68, 47.54, 36.56, 32.04], "audiomae_on_audioset": [null, null, [["speech", 47.52], ["music", 15.35], ["hum", 12.1]], null, [["speech", 52.2], ["music", 8.99], ["sidetone", 8.27]], [["speech", 57.53], ["fly, housefly", 6.35], ["music", 3.85]], [["speech", 22.43], ["fart", 12.6], ["cattle, bovinae", 9.65]], null, null, [["speech", 71.3], ["music", 6.04], ["explosion", 2.52]], [["speech", 70.13], ["breaking", 8.66], ["music", 4.96]], [["speech", 63.9], ["music", 4.9], ["explosion", 3.03]], null, [["whack, thwack", 26.01], ["music", 22.96], ["groan", 9.42]], [["throbbing", 19.86], ["fly, housefly", 16.49], ["music", 11.74]], [["music", 42.78], ["hum", 13.51], ["didgeridoo", 6.94]], [["music", 41.78], ["speech", 22.02], ["drum machine", 6.29]]], "duration": [0.93, 0.86, 6.97, 1.21, 3.06, 2.95, 5.63, 0.09, 1.83, 4.41, 18.7, 3.31, 0.86, 6.77, 3.33, 3.51, 4.62]} \ No newline at end of file diff --git a/annotations_1/-OMiOIbouaA_filtered.json b/annotations_1/-OMiOIbouaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a5e4d69b700409de6d051cb8cac0bfa73cd2450 --- /dev/null +++ b/annotations_1/-OMiOIbouaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.3], [12.0, 13.78], [15.0, 16.83], [17.0, 26.6], [29.0, 41.88], [43.0, 44.95], [46.0, 48.12], [57.0, 61.13], [62.0, 63.8], [76.0, 76.89], [80.0, 80.7], [83.0, 85.8], [89.0, 89.38], [90.0, 90.83], [92.0, 92.16], [97.0, 98.05], [98.0, 102.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [96.17, 0.0, 0.0, 96.29, 91.64, 0.0, 93.76, 81.53, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 46.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.53], ["speech", 9.03], ["telephone", 2.99]]], "duration": [3.3, 1.78, 1.83, 9.6, 12.88, 1.95, 2.12, 4.13, 1.8, 0.89, 0.7, 2.8, 0.38, 0.83, 0.16, 1.05, 4.69]} \ No newline at end of file diff --git a/annotations_1/-ON8ZTCiuYo_filtered.json b/annotations_1/-ON8ZTCiuYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..075a770f0b5a1d786258cbf7c132015196f070d0 --- /dev/null +++ b/annotations_1/-ON8ZTCiuYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.47], [22.0, 22.92], [25.0, 30.74], [32.0, 38.31], [39.0, 39.31], [41.0, 52.03], [55.0, 57.35], [60.0, 65.16], [65.0, 66.8], [69.0, 72.5], [73.0, 75.17], [76.0, 81.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 80.82, 85.17, 0.0, 86.82, 38.59, 56.33, 0.0, 66.15, 57.09, 68.15], "audiomae_on_audioset": [null, null, null, null, null, null, [["sine wave", 32.95], ["chirp tone", 25.13], ["tuning fork", 17.12]], null, null, null, null, null], "duration": [1.47, 0.92, 5.74, 6.31, 0.31, 11.03, 2.35, 5.16, 1.8, 3.5, 2.17, 5.53]} \ No newline at end of file diff --git a/annotations_1/-OUuZojE3aM_filtered.json b/annotations_1/-OUuZojE3aM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa20e5defcd05ad72501ff83db73a29986ee2e84 --- /dev/null +++ b/annotations_1/-OUuZojE3aM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 33.02], [33.0, 35.07], [36.0, 100.26], [101.0, 101.66], [102.0, 104.99], [106.0, 132.7], [133.0, 144.86], [146.0, 161.6], [162.0, 161.64], [162.0, 161.72], [162.0, 161.77], [162.0, 162.01], [162.0, 162.06], [162.0, 162.13], [162.0, 162.16], [162.0, 162.3], [162.0, 162.45], [162.0, 162.48], [164.0, 168.07]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 70.16, 0.0, 0.0, 38.05, 44.2, 63.74, 43.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.26], "audiomae_on_audioset": [null, null, null, null, [["speech", 65.43], ["music", 11.35], ["inside, small room", 3.15]], [["music", 33.49], ["synthesizer", 10.78], ["sine wave", 7.62]], null, [["music", 49.94], ["theremin", 12.22], ["singing bowl", 7.74]], null, null, null, null, null, null, null, null, null, null, [["whimper", 30.1], ["speech", 8.43], ["groan", 7.73]]], "duration": [1.02, 2.07, 64.26, 0.66, 2.99, 26.7, 11.86, 15.6, -0.36, -0.28, -0.23, 0.01, 0.06, 0.13, 0.16, 0.3, 0.45, 0.48, 4.07]} \ No newline at end of file diff --git a/annotations_1/-QT_Af7RLjU_filtered.json b/annotations_1/-QT_Af7RLjU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7788ef1ed1d4e273f4874a283cc243ea98b543b8 --- /dev/null +++ b/annotations_1/-QT_Af7RLjU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 16.73], [17.0, 18.45], [23.0, 24.22], [34.0, 34.18], [38.0, 38.35], [42.0, 41.71], [42.0, 42.01], [48.0, 52.41], [57.0, 57.13], [58.0, 59.0], [66.0, 66.19], [69.0, 68.91], [74.0, 76.0], [79.0, 80.03], [82.0, 83.15], [84.0, 94.04], [102.0, 101.65], [102.0, 101.76], [113.0, 113.32], [122.0, 130.72], [133.0, 133.84]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.95, 0.0, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 51.28, 0.0, 0.0, 0.0, 37.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 27.06], ["animal", 11.71], ["whale vocalization", 10.93]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 79.45], ["whack, thwack", 3.97], ["breaking", 2.23]], null], "duration": [8.73, 1.45, 1.22, 0.18, 0.35, -0.29, 0.01, 4.41, 0.13, 1.0, 0.19, -0.09, 2.0, 1.03, 1.15, 10.04, -0.35, -0.24, 0.32, 8.72, 0.84]} \ No newline at end of file diff --git a/annotations_1/-QZzReak2Ck_filtered.json b/annotations_1/-QZzReak2Ck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f501243593b30206a753e9cba39bc3e03a6c6c6 --- /dev/null +++ b/annotations_1/-QZzReak2Ck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[73.0, 93.02], [96.0, 97.28], [98.0, 101.12], [101.0, 103.42], [104.0, 104.9], [106.0, 107.84], [109.0, 113.1], [114.0, 114.67], [118.0, 120.85], [122.0, 121.85], [123.0, 151.38], [151.0, 151.41], [151.0, 151.44], [151.0, 151.48], [153.0, 156.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.12, 0.0, 66.03, 54.17, 0.0, 0.0, 72.31, 0.0, 35.37, 0.0, 32.58, 0.0, 0.0, 0.0, 81.71], "audiomae_on_audioset": [[["music", 43.13], ["throbbing", 20.27], ["hum", 15.46]], null, null, null, null, null, null, null, [["music", 73.1], ["speech", 5.41], ["didgeridoo", 4.54]], null, [["music", 50.95], ["speech", 24.54], ["whack, thwack", 2.62]], null, null, null, null], "duration": [20.02, 1.28, 3.12, 2.42, 0.9, 1.84, 4.1, 0.67, 2.85, -0.15, 28.38, 0.41, 0.44, 0.48, 3.09]} \ No newline at end of file diff --git a/annotations_1/-QfKnft9uWY_filtered.json b/annotations_1/-QfKnft9uWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f9ad0e8bb42e557f458ba1e211ad1579195c763 --- /dev/null +++ b/annotations_1/-QfKnft9uWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[76.0, 76.37], [76.0, 76.4], [83.0, 87.86], [90.0, 95.49], [100.0, 141.94], [144.0, 149.89]], "keep_status": [false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 35.27, 39.77, 0.0, 31.75], "audiomae_on_audioset": [null, null, [["speech", 42.89], ["radio", 15.68], ["sidetone", 7.55]], [["fart", 25.2], ["speech", 23.95], ["fly, housefly", 8.6]], null, [["fart", 49.09], ["music", 8.72], ["sound effect", 4.1]]], "duration": [0.37, 0.4, 4.86, 5.49, 41.94, 5.89]} \ No newline at end of file diff --git a/annotations_1/-Qq6ZZy0yGg_filtered.json b/annotations_1/-Qq6ZZy0yGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49b0e01737c527b5ab3fa59f2e7d8433c7af6517 --- /dev/null +++ b/annotations_1/-Qq6ZZy0yGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.61], [3.0, 2.98], [7.0, 7.15], [13.0, 16.6], [17.0, 18.42], [22.0, 23.35], [26.0, 30.0], [36.0, 37.71], [45.0, 50.68], [61.0, 85.45], [85.0, 85.51], [88.0, 121.51], [127.0, 166.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.34, 0.0, 0.0, 29.25, 0.0, 29.51, 29.13, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 54.78], ["speech", 24.0], ["sidetone", 3.84]], null, null, [["music", 76.68], ["musical instrument", 4.58], ["speech", 2.85]], null, [["music", 74.26], ["boing", 4.46], ["musical instrument", 4.37]], [["music", 81.65], ["didgeridoo", 3.24], ["musical instrument", 1.66]], null, null, null], "duration": [0.61, -0.02, 0.15, 3.6, 1.42, 1.35, 4.0, 1.71, 5.68, 24.45, 0.51, 33.51, 39.8]} \ No newline at end of file diff --git a/annotations_1/-SkeK7t74oo_filtered.json b/annotations_1/-SkeK7t74oo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcf489bd3df204f55f91965ad7f8abeae845625e --- /dev/null +++ b/annotations_1/-SkeK7t74oo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.29], [14.0, 15.6], [16.0, 16.36], [17.0, 23.04], [33.0, 33.61], [40.0, 41.99], [45.0, 44.93], [47.0, 51.95], [60.0, 72.52], [82.0, 83.03], [88.0, 94.61], [99.0, 104.11], [105.0, 114.79], [118.0, 119.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.73, 0.0, 0.0, 0.0, 31.13, 32.7, 0.0, 33.21, 33.52, 34.03, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 53.63], ["speech", 13.05], ["saxophone", 3.62]], null, null, null, [["sidetone", 62.27], ["music", 15.8], ["throbbing", 3.05]], [["music", 47.52], ["speech", 27.62], ["sidetone", 5.08]], null, [["music", 61.33], ["sidetone", 11.47], ["speech", 6.25]], [["music", 60.48], ["house music", 4.09], ["sampler", 2.07]], [["music", 57.62], ["hum", 9.52], ["saxophone", 3.15]], null], "duration": [1.29, 1.6, 0.36, 6.04, 0.61, 1.99, -0.07, 4.95, 12.52, 1.03, 6.61, 5.11, 9.79, 1.1]} \ No newline at end of file diff --git a/annotations_1/-Svsz19yyPM_filtered.json b/annotations_1/-Svsz19yyPM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a14767bfb84cdc1d7c5e205bbffecf99bf5639f --- /dev/null +++ b/annotations_1/-Svsz19yyPM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.4], [9.0, 9.22], [11.0, 18.03], [19.0, 19.53], [21.0, 28.49], [31.0, 76.1], [78.0, 81.51], [84.0, 92.16], [94.0, 99.94], [102.0, 102.32], [103.0, 103.5], [106.0, 105.85], [106.0, 106.84], [109.0, 109.0], [111.0, 111.48], [112.0, 114.94], [120.0, 121.19], [123.0, 124.21], [126.0, 140.12], [141.0, 149.39], [153.0, 155.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.51, 0.0, 96.04, 0.0, 51.39, 0.0, 89.54, 68.67, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 45.46, 42.88, 45.14], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 76.66], ["sampler", 4.29], ["drum machine", 4.04]], [["music", 46.72], ["hum", 17.85], ["throbbing", 13.36]], [["beatboxing", 56.92], ["music", 17.26], ["speech", 6.22]]], "duration": [2.4, 0.22, 7.03, 0.53, 7.49, 45.1, 3.51, 8.16, 5.94, 0.32, 0.5, -0.15, 0.84, 0.0, 0.48, 2.94, 1.19, 1.21, 14.12, 8.39, 2.07]} \ No newline at end of file diff --git a/annotations_1/-U9v7Nz6hOs_filtered.json b/annotations_1/-U9v7Nz6hOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56cf3546c26581878023e636a38a6bda01c7c784 --- /dev/null +++ b/annotations_1/-U9v7Nz6hOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.0], [9.0, 10.74], [12.0, 12.11], [13.0, 14.52], [17.0, 23.11], [34.0, 55.49], [56.0, 64.27], [65.0, 67.34], [69.0, 68.91], [70.0, 70.88], [72.0, 85.77], [90.0, 89.95], [91.0, 91.0], [93.0, 98.34], [105.0, 120.36], [125.0, 126.33], [128.0, 134.54], [140.0, 140.73], [155.0, 155.34]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.42, 28.95, 29.06, 29.26, 0.0, 0.0, 29.05, 0.0, 0.0, 30.22, 30.86, 0.0, 31.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 63.5], ["quack", 6.9], ["livestock, farm animals, working animals", 2.75]], [["music", 53.48], ["speech", 18.34], ["electronic music", 10.32]], [["music", 12.99], ["vehicle", 11.55], ["whale vocalization", 8.26]], [["boing", 37.71], ["moo", 26.01], ["cattle, bovinae", 22.73]], null, null, [["music", 24.18], ["speech", 15.5], ["whip", 11.98]], null, null, [["speech", 60.38], ["hum", 12.69], ["music", 5.85]], [["music", 22.26], ["hum", 18.96], ["throbbing", 14.4]], null, [["music", 69.37], ["theremin", 10.04], ["musical instrument", 4.35]], null, null], "duration": [1.0, 1.74, 0.11, 1.52, 6.11, 21.49, 8.27, 2.34, -0.09, 0.88, 13.77, -0.05, 0.0, 5.34, 15.36, 1.33, 6.54, 0.73, 0.34]} \ No newline at end of file diff --git a/annotations_1/-VnQ_KpOBm4_filtered.json b/annotations_1/-VnQ_KpOBm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f079584b443ce674c1baac66acb4876a298c1645 --- /dev/null +++ b/annotations_1/-VnQ_KpOBm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [4.0, 6.37], [13.0, 13.83], [17.0, 18.18], [19.0, 19.92], [27.0, 27.75], [29.0, 30.13], [34.0, 34.05], [35.0, 35.58], [41.0, 42.55], [46.0, 46.6], [49.0, 50.14], [51.0, 51.14], [52.0, 52.86], [54.0, 55.53], [57.0, 57.16], [62.0, 62.06], [63.0, 64.45], [66.0, 66.7], [69.0, 69.74], [72.0, 72.62], [76.0, 76.57], [79.0, 80.2], [82.0, 84.45], [88.0, 88.94], [91.0, 91.25], [92.0, 92.21], [94.0, 94.34], [96.0, 96.82], [100.0, 100.18], [103.0, 103.4], [106.0, 106.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 47.03], ["musical instrument", 13.94], ["guitar", 13.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.35], ["speech", 8.29], ["musical instrument", 4.71]], null, null, null, null, null, null, null, null], "duration": [0.13, 2.37, 0.83, 1.18, 0.92, 0.75, 1.13, 0.05, 0.58, 1.55, 0.6, 1.14, 0.14, 0.86, 1.53, 0.16, 0.06, 1.45, 0.7, 0.74, 0.62, 0.57, 1.2, 2.45, 0.94, 0.25, 0.21, 0.34, 0.82, 0.18, 0.4, 0.76]} \ No newline at end of file diff --git a/annotations_1/-W8pOz1fsD0_filtered.json b/annotations_1/-W8pOz1fsD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01c367440a68d880637feb64392e6740bd31d09c --- /dev/null +++ b/annotations_1/-W8pOz1fsD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 44.96], [45.0, 45.08], [46.0, 63.59], [65.0, 70.41], [72.0, 73.09]], "keep_status": [false, false, true, true, false], "silence_prob": [0.0, 0.0, 29.42, 32.94, 0.0], "audiomae_on_audioset": [null, null, [["music", 54.68], ["throbbing", 6.95], ["hum", 5.56]], [["music", 33.15], ["throbbing", 20.68], ["hum", 14.39]], null], "duration": [40.96, 0.08, 17.59, 5.41, 1.09]} \ No newline at end of file diff --git a/annotations_1/-W_4EZvbrEI_filtered.json b/annotations_1/-W_4EZvbrEI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7238aeacf2a7e7b9ea7ef36681980041ec78499 --- /dev/null +++ b/annotations_1/-W_4EZvbrEI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 42.5], [44.0, 47.21], [49.0, 63.21], [70.0, 69.99], [81.0, 85.89], [87.0, 92.74], [93.0, 95.5], [97.0, 98.49], [101.0, 112.33]], "keep_status": [true, true, false, false, true, true, true, false, true], "silence_prob": [31.31, 30.0, 31.25, 0.0, 29.86, 30.14, 30.23, 0.0, 30.53], "audiomae_on_audioset": [[["speech", 46.94], ["music", 13.86], ["throbbing", 5.54]], [["music", 16.28], ["vehicle", 12.39], ["car", 11.42]], [["didgeridoo", 50.47], ["music", 36.43], ["electronic music", 1.59]], null, [["speech", 37.59], ["vehicle", 15.24], ["car", 10.97]], [["music", 24.08], ["boing", 18.44], ["speech", 17.03]], [["music", 22.51], ["speech", 8.93], ["jet engine", 5.49]], null, [["music", 51.01], ["fly, housefly", 5.83], ["buzz", 4.53]]], "duration": [8.5, 3.21, 14.21, -0.01, 4.89, 5.74, 2.5, 1.49, 11.33]} \ No newline at end of file diff --git a/annotations_1/-Ww_Bo5ghiw_filtered.json b/annotations_1/-Ww_Bo5ghiw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..005024017920beaf27fba0428f1c240ef686e839 --- /dev/null +++ b/annotations_1/-Ww_Bo5ghiw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.64], [8.0, 9.22], [10.0, 11.28], [12.0, 12.92], [16.0, 15.97], [21.0, 21.25], [26.0, 27.67], [29.0, 30.77], [33.0, 39.51], [41.0, 47.46], [48.0, 51.44], [54.0, 57.99], [59.0, 65.1], [68.0, 70.41], [78.0, 79.32], [81.0, 81.53], [83.0, 83.19], [84.0, 86.43], [89.0, 88.65], [91.0, 93.97], [95.0, 99.84], [103.0, 112.46], [116.0, 123.08], [125.0, 125.51], [127.0, 139.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.47, 74.13, 79.07, 72.46, 56.25, 68.41, 0.0, 0.0, 0.0, 59.24, 0.0, 57.4, 71.57, 73.67, 42.28, 0.0, 46.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 78.88], ["music", 8.69], ["hum", 2.18]], null, [["music", 55.1], ["hum", 16.62], ["electronic music", 4.06]]], "duration": [1.64, 1.22, 1.28, 0.92, -0.03, 0.25, 1.67, 1.77, 6.51, 6.46, 3.44, 3.99, 6.1, 2.41, 1.32, 0.53, 0.19, 2.43, -0.35, 2.97, 4.84, 9.46, 7.08, 0.51, 12.9]} \ No newline at end of file diff --git a/annotations_1/-Xb-ryuTDlE_filtered.json b/annotations_1/-Xb-ryuTDlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47a7f9a56490b0c8fdb7a24e5eeeb289af417827 --- /dev/null +++ b/annotations_1/-Xb-ryuTDlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.86], [16.0, 16.36], [17.0, 18.15], [19.0, 19.6], [21.0, 21.83], [24.0, 27.33], [28.0, 34.35], [36.0, 38.74]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 75.55, 74.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.86, 0.36, 1.15, 0.6, 0.83, 3.33, 6.35, 2.74]} \ No newline at end of file diff --git a/annotations_1/-XggDv2QdHg_filtered.json b/annotations_1/-XggDv2QdHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49153d9b2492cddd70320dd543776634fc0c2d27 --- /dev/null +++ b/annotations_1/-XggDv2QdHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 16.68], [17.0, 19.75], [23.0, 28.88], [32.0, 33.79], [36.0, 36.27], [38.0, 38.5], [40.0, 40.29], [52.0, 53.86], [55.0, 55.98], [58.0, 60.4], [62.0, 63.96], [65.0, 67.1], [69.0, 69.36], [70.0, 74.36], [82.0, 83.05], [84.0, 84.7], [86.0, 86.04], [87.0, 89.13], [91.0, 92.06], [95.0, 95.42], [98.0, 99.69], [100.0, 103.92], [107.0, 108.97], [111.0, 113.73], [114.0, 113.83], [114.0, 117.31], [119.0, 122.15], [124.0, 125.19], [126.0, 129.69], [131.0, 132.04], [132.0, 133.12], [134.0, 134.15], [136.0, 138.18], [138.0, 139.77], [141.0, 143.8], [145.0, 148.2], [149.0, 150.13], [151.0, 151.53], [154.0, 154.5], [155.0, 156.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.85, 99.96, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 99.59, 0.0, 100.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 100.0, 0.0, 99.95, 0.0, 81.0, 99.52, 0.0, 83.52, 0.0, 0.0, 0.0, 99.36, 0.0, 98.27, 95.09, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.68, 2.75, 5.88, 1.79, 0.27, 0.5, 0.29, 1.86, 0.98, 2.4, 1.96, 2.1, 0.36, 4.36, 1.05, 0.7, 0.04, 2.13, 1.06, 0.42, 1.69, 3.92, 1.97, 2.73, -0.17, 3.31, 3.15, 1.19, 3.69, 1.04, 1.12, 0.15, 2.18, 1.77, 2.8, 3.2, 1.13, 0.53, 0.5, 1.96]} \ No newline at end of file diff --git a/annotations_1/-YaPh7shnWQ_filtered.json b/annotations_1/-YaPh7shnWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..731184072009e93618da028a18f41f99eb0e7247 --- /dev/null +++ b/annotations_1/-YaPh7shnWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.15], [3.0, 4.04], [5.0, 6.81], [7.0, 9.46], [24.0, 24.38], [25.0, 25.84], [42.0, 42.62], [51.0, 51.16], [58.0, 58.77], [59.0, 60.22], [64.0, 65.62], [76.0, 78.95], [81.0, 81.6], [82.0, 81.63], [84.0, 83.67], [94.0, 96.15], [100.0, 101.06], [101.0, 101.49], [102.0, 101.6], [102.0, 104.01], [107.0, 110.05], [115.0, 116.82], [118.0, 119.94], [127.0, 128.19], [135.0, 142.99], [144.0, 148.29], [149.0, 149.5], [163.0, 164.91], [167.0, 173.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 57.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 92.48, 99.95, 0.0, 0.0, 0.0, 99.95, 84.62, 0.0, 0.0, 52.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.15, 1.04, 1.81, 2.46, 0.38, 0.84, 0.62, 0.16, 0.77, 1.22, 1.62, 2.95, 0.6, -0.37, -0.33, 2.15, 1.06, 0.49, -0.4, 2.01, 3.05, 1.82, 1.94, 1.19, 7.99, 4.29, 0.5, 1.91, 6.23]} \ No newline at end of file diff --git a/annotations_1/-YiImyOVCj4_filtered.json b/annotations_1/-YiImyOVCj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55bbfbbb3e0f7724b51ad8ecf4c8d450d69a8653 --- /dev/null +++ b/annotations_1/-YiImyOVCj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.56], [3.0, 4.99], [6.0, 7.59], [9.0, 9.85], [11.0, 12.33], [15.0, 19.36], [20.0, 20.66], [24.0, 23.94], [25.0, 26.28], [27.0, 27.92], [32.0, 31.95], [35.0, 36.81], [39.0, 40.07], [42.0, 43.02], [43.0, 43.98], [45.0, 46.38], [47.0, 48.52], [52.0, 53.35], [54.0, 56.12], [57.0, 60.24], [62.0, 63.64], [66.0, 66.26], [71.0, 71.56], [77.0, 83.0], [86.0, 86.83], [90.0, 91.45], [94.0, 94.76], [101.0, 101.8], [109.0, 109.61], [110.0, 111.18], [114.0, 116.18], [127.0, 127.36], [129.0, 130.08], [132.0, 132.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 51.44, 0.0, 0.0, 0.0, 74.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.42, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 1.99, 1.59, 0.85, 1.33, 4.36, 0.66, -0.06, 1.28, 0.92, -0.05, 1.81, 1.07, 1.02, 0.98, 1.38, 1.52, 1.35, 2.12, 3.24, 1.64, 0.26, 0.56, 6.0, 0.83, 1.45, 0.76, 0.8, 0.61, 1.18, 2.18, 0.36, 1.08, 0.61]} \ No newline at end of file diff --git a/annotations_1/-ZRSgs6PHaY_filtered.json b/annotations_1/-ZRSgs6PHaY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48f43f8cbb60bf47c456cbea9ddd59f71781e60e --- /dev/null +++ b/annotations_1/-ZRSgs6PHaY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.95], [26.0, 26.81], [28.0, 28.27], [29.0, 29.94], [31.0, 31.7], [32.0, 33.78], [34.0, 35.5], [39.0, 40.63], [43.0, 43.71], [48.0, 48.2], [48.0, 49.52], [50.0, 51.38], [54.0, 58.73], [63.0, 81.97], [85.0, 85.58], [86.0, 86.32], [111.0, 116.7], [118.0, 117.95], [118.0, 118.05], [118.0, 121.81], [122.0, 123.57], [127.0, 127.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 28.91, 0.0, 0.0, 30.01, 0.0, 0.0, 36.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 24.9], ["speech", 14.71], ["fly, housefly", 9.15]], [["speech", 54.11], ["music", 33.27], ["sound effect", 1.39]], null, null, [["mains hum", 49.27], ["hum", 34.45], ["throbbing", 5.39]], null, null, [["speech", 54.69], ["radio", 5.88], ["sneeze", 5.53]], null, null], "duration": [0.95, 0.81, 0.27, 0.94, 0.7, 1.78, 1.5, 1.63, 0.71, 0.2, 1.52, 1.38, 4.73, 18.97, 0.58, 0.32, 5.7, -0.05, 0.05, 3.81, 1.57, 0.74]} \ No newline at end of file diff --git a/annotations_1/-ZxtmDbqDRc_filtered.json b/annotations_1/-ZxtmDbqDRc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ee7befc5a36c161029c42bedef9014586caee25 --- /dev/null +++ b/annotations_1/-ZxtmDbqDRc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.53], [3.0, 4.9], [6.0, 6.13], [10.0, 10.88], [13.0, 13.29], [19.0, 30.13], [33.0, 33.49], [35.0, 35.5], [42.0, 42.55], [47.0, 47.01], [47.0, 47.22], [50.0, 50.82], [55.0, 55.73], [58.0, 57.74], [58.0, 62.56], [65.0, 66.07], [68.0, 67.86], [69.0, 69.85], [79.0, 79.68], [81.0, 81.21], [83.0, 83.71], [90.0, 90.31], [110.0, 110.13], [112.0, 112.04], [113.0, 113.83], [114.0, 114.54], [118.0, 118.47], [120.0, 120.85], [122.0, 123.43], [124.0, 124.71], [125.0, 125.61], [127.0, 129.79], [131.0, 136.93], [141.0, 144.46], [148.0, 155.85], [158.0, 158.28], [159.0, 163.66], [168.0, 170.16], [171.0, 172.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 28.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.38, 29.21, 30.81, 29.5, 0.0, 30.03, 29.75, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 80.42], ["music", 15.08], ["whack, thwack", 0.48]], null, null, null, null, null, null, null, null, [["speech", 55.72], ["whack, thwack", 7.75], ["music", 5.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.46], ["speech", 13.65], ["theremin", 3.32]], [["music", 32.61], ["speech", 24.87], ["throbbing", 5.52]], [["music", 47.35], ["throbbing", 29.94], ["electronic music", 4.61]], [["breaking", 33.03], ["music", 27.48], ["glass", 4.49]], null, [["music", 52.67], ["theremin", 21.57], ["hum", 3.74]], [["speech", 42.86], ["civil defense siren", 22.16], ["siren", 3.53]], null], "duration": [1.53, 1.9, 0.13, 0.88, 0.29, 11.13, 0.49, 0.5, 0.55, 0.01, 0.22, 0.82, 0.73, -0.26, 4.56, 1.07, -0.14, 0.85, 0.68, 0.21, 0.71, 0.31, 0.13, 0.04, 0.83, 0.54, 0.47, 0.85, 1.43, 0.71, 0.61, 2.79, 5.93, 3.46, 7.85, 0.28, 4.66, 2.16, 1.27]} \ No newline at end of file diff --git a/annotations_1/-a1FAp677Vo_filtered.json b/annotations_1/-a1FAp677Vo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a9be38ace351788cd0637180600013ce65c055a --- /dev/null +++ b/annotations_1/-a1FAp677Vo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.05], [7.0, 28.19], [30.0, 35.92], [36.0, 42.69], [43.0, 44.41], [46.0, 48.46], [49.0, 51.11], [52.0, 90.58], [92.0, 94.59]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [100.0, 71.29, 96.17, 66.03, 0.0, 100.0, 99.96, 0.0, 39.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 19.67], ["synthesizer", 16.89], ["effects unit", 9.86]]], "duration": [3.05, 21.19, 5.92, 6.69, 1.41, 2.46, 2.11, 38.58, 2.59]} \ No newline at end of file diff --git a/annotations_1/-agdK2N5wX4_filtered.json b/annotations_1/-agdK2N5wX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..611b60470ced1761cc3ea766efcaa94b840fd401 --- /dev/null +++ b/annotations_1/-agdK2N5wX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.36], [23.0, 23.75], [25.0, 25.93], [28.0, 30.77], [31.0, 32.64], [34.0, 35.82], [37.0, 39.12], [41.0, 41.54], [43.0, 43.66], [46.0, 46.35], [47.0, 52.37], [54.0, 58.94], [60.0, 62.51], [63.0, 70.6], [71.0, 72.93], [77.0, 78.97], [80.0, 81.8], [82.0, 88.28], [91.0, 94.73], [95.0, 120.41], [121.0, 124.31], [125.0, 126.22], [128.0, 129.07], [130.0, 132.12], [133.0, 166.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 72.6, 0.0, 0.0, 0.0, 70.86, 68.54, 69.47, 52.22, 0.0, 0.0, 0.0, 41.28, 41.5, 45.88, 61.77, 0.0, 0.0, 40.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.49], ["music", 26.07], ["quack", 4.73]], [["throbbing", 47.39], ["hum", 26.36], ["music", 9.93]], [["throbbing", 54.7], ["hum", 31.13], ["music", 5.59]], null, null, null, [["music", 16.53], ["sine wave", 13.52], ["sidetone", 6.44]], null], "duration": [0.36, 0.75, 0.93, 2.77, 1.64, 1.82, 2.12, 0.54, 0.66, 0.35, 5.37, 4.94, 2.51, 7.6, 1.93, 1.97, 1.8, 6.28, 3.73, 25.41, 3.31, 1.22, 1.07, 2.12, 33.24]} \ No newline at end of file diff --git a/annotations_1/-arTRBtT9d4_filtered.json b/annotations_1/-arTRBtT9d4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f22d5c10b4d5bbc6dc82a8bf1200f426ce0ecc1 --- /dev/null +++ b/annotations_1/-arTRBtT9d4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.44], [16.0, 17.22], [20.0, 23.63], [25.0, 24.98], [26.0, 27.04], [27.0, 28.05], [31.0, 32.61], [35.0, 39.68], [40.0, 42.11], [43.0, 45.79], [47.0, 47.51], [48.0, 49.96], [59.0, 65.91], [67.0, 73.35], [75.0, 74.9], [80.0, 81.92], [82.0, 88.8], [107.0, 107.18], [111.0, 113.09], [114.0, 115.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [42.46, 0.0, 35.34, 0.0, 0.0, 0.0, 0.0, 51.55, 91.64, 94.22, 0.0, 0.0, 30.09, 30.76, 0.0, 0.0, 29.75, 0.0, 35.35, 0.0], "audiomae_on_audioset": [[["speech", 60.81], ["fart", 27.92], ["fly, housefly", 1.66]], null, [["speech", 62.09], ["sidetone", 12.68], ["music", 5.46]], null, null, null, null, null, null, null, null, null, [["speech", 33.21], ["music", 26.39], ["boing", 13.13]], [["music", 61.79], ["speech", 18.46], ["boing", 2.09]], null, null, [["music", 35.71], ["boing", 31.4], ["speech", 11.65]], null, [["music", 45.77], ["dubstep", 10.8], ["electronic music", 8.43]], null], "duration": [7.44, 1.22, 3.63, -0.02, 1.04, 1.05, 1.61, 4.68, 2.11, 2.79, 0.51, 1.96, 6.91, 6.35, -0.1, 1.92, 6.8, 0.18, 2.09, 1.01]} \ No newline at end of file diff --git a/annotations_1/-cdk5mhKuWc_filtered.json b/annotations_1/-cdk5mhKuWc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fedf11a7dde5b59d41bdec82e51fdb204e1de615 --- /dev/null +++ b/annotations_1/-cdk5mhKuWc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [14.0, 25.52], [29.0, 33.88], [35.0, 34.96], [35.0, 70.95], [71.0, 81.97], [86.0, 114.72], [115.0, 116.43], [117.0, 123.96], [127.0, 129.46]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 49.4, 61.18, 0.0, 0.0, 37.38, 46.64, 0.0, 41.66, 39.21], "audiomae_on_audioset": [null, [["music", 67.95], ["musical instrument", 8.17], ["didgeridoo", 7.97]], null, null, null, [["music", 51.94], ["speech", 12.32], ["musical instrument", 9.97]], [["music", 25.42], ["gasp", 20.66], ["insect", 2.68]], null, [["music", 61.49], ["synthesizer", 8.01], ["effects unit", 7.18]], [["music", 66.92], ["sonar", 5.79], ["musical instrument", 4.29]]], "duration": [1.38, 11.52, 4.88, -0.04, 35.95, 10.97, 28.72, 1.43, 6.96, 2.46]} \ No newline at end of file diff --git a/annotations_1/-dWENMR2aag_filtered.json b/annotations_1/-dWENMR2aag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9dbeb656791e8698fb208f0ed6c433164a15d9d8 --- /dev/null +++ b/annotations_1/-dWENMR2aag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.34], [20.0, 23.53], [24.0, 24.61], [26.0, 26.64], [43.0, 53.23], [57.0, 57.03], [57.0, 57.94], [58.0, 58.38], [59.0, 59.53], [60.0, 61.13], [63.0, 63.42], [65.0, 65.72], [74.0, 76.3], [83.0, 83.51], [84.0, 83.61], [89.0, 91.02], [93.0, 93.41], [94.0, 94.91], [96.0, 96.43], [97.0, 97.6], [100.0, 99.64], [100.0, 100.7], [102.0, 102.64], [103.0, 113.07], [118.0, 118.15], [120.0, 120.14], [120.0, 121.31]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.55, 0.0, 0.0, 29.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.02, 0.0, 0.0, 35.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.8], ["didgeridoo", 29.74], ["musical instrument", 3.0]], null, null, [["music", 43.05], ["cattle, bovinae", 7.63], ["livestock, farm animals, working animals", 7.56]], null, null, null, null, null, null, null, [["speech", 22.27], ["music", 15.28], ["animal", 7.18]], null, null, [["speech", 28.75], ["livestock, farm animals, working animals", 9.55], ["boing", 9.05]], null, null, null, null, null, null, null, [["speech", 38.31], ["music", 32.51], ["didgeridoo", 7.01]], null, null, null], "duration": [1.34, 3.53, 0.61, 0.64, 10.23, 0.03, 0.94, 0.38, 0.53, 1.13, 0.42, 0.72, 2.3, 0.51, -0.39, 2.02, 0.41, 0.91, 0.43, 0.6, -0.36, 0.7, 0.64, 10.07, 0.15, 0.14, 1.31]} \ No newline at end of file diff --git a/annotations_1/-dlOM4ocKUM_filtered.json b/annotations_1/-dlOM4ocKUM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea07a6875f8c1e0788b85caa21e33659637a9f6b --- /dev/null +++ b/annotations_1/-dlOM4ocKUM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.96], [19.0, 20.38], [22.0, 43.95], [45.0, 44.95], [46.0, 54.77], [56.0, 58.06], [59.0, 59.71], [61.0, 61.82], [64.0, 65.28], [66.0, 66.53], [68.0, 68.72], [69.0, 72.28], [74.0, 73.63], [76.0, 77.3], [79.0, 84.69], [85.0, 84.77], [85.0, 91.77], [92.0, 103.01], [106.0, 110.47], [111.0, 111.91], [114.0, 116.56], [117.0, 117.32], [120.0, 123.47], [124.0, 131.7], [134.0, 134.91], [135.0, 136.43], [137.0, 138.13], [140.0, 140.26], [144.0, 152.73], [154.0, 159.44], [160.0, 162.72], [165.0, 165.99], [167.0, 167.76], [169.0, 169.4], [171.0, 171.0], [172.0, 176.86], [180.0, 182.78], [183.0, 184.64], [186.0, 185.67]], "keep_status": [false, false, true, false, true, true, false, false, false, false, false, true, false, false, true, false, false, true, false, false, true, false, true, true, false, false, false, false, true, true, true, false, false, false, false, true, true, false, false], "silence_prob": [34.78, 0.0, 30.36, 0.0, 39.4, 33.91, 0.0, 0.0, 0.0, 0.0, 0.0, 36.05, 0.0, 0.0, 29.88, 0.0, 29.45, 29.56, 32.06, 0.0, 34.12, 0.0, 30.17, 31.3, 0.0, 0.0, 0.0, 0.0, 30.87, 35.07, 35.94, 0.0, 0.0, 0.0, 0.0, 29.71, 29.89, 0.0, 0.0], "audiomae_on_audioset": [[["music", 32.51], ["mains hum", 27.84], ["hum", 12.36]], null, [["speech", 21.65], ["livestock, farm animals, working animals", 11.35], ["vehicle", 11.15]], null, [["music", 31.68], ["didgeridoo", 19.83], ["hum", 12.82]], [["music", 29.09], ["mains hum", 25.61], ["hum", 14.73]], null, null, null, null, null, [["hum", 23.8], ["mains hum", 23.76], ["speech", 15.3]], null, null, [["sidetone", 28.94], ["speech", 22.09], ["hum", 8.11]], null, [["music", 40.72], ["throbbing", 24.34], ["hum", 9.76]], [["speech", 46.18], ["music", 12.31], ["didgeridoo", 9.46]], [["sidetone", 53.08], ["speech", 13.66], ["music", 8.47]], null, [["speech", 24.13], ["music", 12.07], ["civil defense siren", 8.38]], null, [["explosion", 16.69], ["fart", 6.84], ["speech", 6.58]], [["speech", 21.64], ["music", 12.3], ["didgeridoo", 8.16]], null, null, null, null, [["music", 57.47], ["didgeridoo", 7.99], ["theremin", 3.71]], [["music", 31.24], ["hum", 17.93], ["throbbing", 16.31]], [["music", 52.7], ["theremin", 6.44], ["musical instrument", 5.65]], null, null, null, null, [["speech", 21.78], ["music", 15.32], ["animal", 10.53]], [["speech", 42.01], ["music", 7.49], ["fly, housefly", 4.68]], null, null], "duration": [3.96, 1.38, 21.95, -0.05, 8.77, 2.06, 0.71, 0.82, 1.28, 0.53, 0.72, 3.28, -0.37, 1.3, 5.69, -0.23, 6.77, 11.01, 4.47, 0.91, 2.56, 0.32, 3.47, 7.7, 0.91, 1.43, 1.13, 0.26, 8.73, 5.44, 2.72, 0.99, 0.76, 0.4, 0.0, 4.86, 2.78, 1.64, -0.33]} \ No newline at end of file diff --git a/annotations_1/-fRY1b6WAx4_filtered.json b/annotations_1/-fRY1b6WAx4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dbb29af5f0764cd7605cf41f4171a341af92fb6 --- /dev/null +++ b/annotations_1/-fRY1b6WAx4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.24], [5.0, 6.0], [9.0, 9.17], [17.0, 17.25], [18.0, 18.64], [21.0, 21.63], [22.0, 36.0], [38.0, 39.36], [40.0, 42.82], [45.0, 53.1], [59.0, 66.9], [68.0, 69.8], [70.0, 70.77], [72.0, 73.14], [76.0, 76.79], [78.0, 84.06], [85.0, 86.8], [88.0, 89.85], [91.0, 92.91], [94.0, 97.58], [99.0, 100.57], [101.0, 108.58], [109.0, 113.63], [124.0, 126.32], [128.0, 129.12], [132.0, 134.15], [135.0, 138.52], [139.0, 141.2], [151.0, 153.5], [154.0, 155.83], [161.0, 166.89], [168.0, 170.73], [172.0, 173.67], [174.0, 175.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 0.0, 69.61, 75.88, 94.22, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 88.83, 0.0, 88.46, 54.76, 80.29, 0.0, 61.47, 88.46, 51.77, 73.97, 0.0, 49.78, 67.89, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.74], ["tick-tock", 5.64], ["tick", 4.07]], null, null, null], "duration": [1.24, 1.0, 0.17, 0.25, 0.64, 0.63, 14.0, 1.36, 2.82, 8.1, 7.9, 1.8, 0.77, 1.14, 0.79, 6.06, 1.8, 1.85, 1.91, 3.58, 1.57, 7.58, 4.63, 2.32, 1.12, 2.15, 3.52, 2.2, 2.5, 1.83, 5.89, 2.73, 1.67, 1.42]} \ No newline at end of file diff --git a/annotations_1/-jg0_iXfTE4_filtered.json b/annotations_1/-jg0_iXfTE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e28a869681e66bc31e0768d03f395cec4e7ec9e5 --- /dev/null +++ b/annotations_1/-jg0_iXfTE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.03], [13.0, 12.97], [16.0, 16.87], [21.0, 22.91], [27.0, 27.08], [30.0, 29.88], [43.0, 43.65], [48.0, 49.2], [50.0, 52.59], [54.0, 56.3], [57.0, 62.02], [63.0, 65.75], [68.0, 68.61], [90.0, 94.9], [97.0, 99.33], [100.0, 99.54], [100.0, 100.03], [100.0, 100.4], [101.0, 125.9], [132.0, 132.39], [134.0, 145.81], [146.0, 149.72], [150.0, 152.93], [158.0, 159.44]], "keep_status": [false, false, false, false, false, false, false, false, true, true, true, true, false, false, true, false, false, false, true, false, true, true, true, false], "silence_prob": [30.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.72, 30.73, 35.01, 31.11, 0.0, 30.83, 30.31, 0.0, 0.0, 0.0, 30.37, 0.0, 30.58, 49.73, 34.2, 0.0], "audiomae_on_audioset": [[["crowd", 48.97], ["cheering", 29.59], ["speech", 4.71]], null, null, null, null, null, null, null, [["music", 55.7], ["theremin", 3.6], ["civil defense siren", 3.11]], [["speech", 14.86], ["sheep", 6.19], ["crowd", 5.93]], [["hum", 31.19], ["mains hum", 22.9], ["music", 15.38]], [["speech", 37.02], ["music", 12.1], ["sidetone", 4.74]], null, [["music", 35.14], ["didgeridoo", 26.67], ["sidetone", 12.25]], [["speech", 26.18], ["music", 19.43], ["boing", 14.47]], null, null, null, [["music", 64.48], ["throbbing", 2.95], ["livestock, farm animals, working animals", 2.16]], null, [["music", 40.87], ["speech", 10.05], ["cacophony", 5.82]], [["speech", 43.17], ["rumble", 10.32], ["music", 9.11]], [["speech", 31.96], ["music", 17.33], ["hum", 5.73]], null], "duration": [2.03, -0.03, 0.87, 1.91, 0.08, -0.12, 0.65, 1.2, 2.59, 2.3, 5.02, 2.75, 0.61, 4.9, 2.33, -0.46, 0.03, 0.4, 24.9, 0.39, 11.81, 3.72, 2.93, 1.44]} \ No newline at end of file diff --git a/annotations_1/-jpEsYBH3g4_filtered.json b/annotations_1/-jpEsYBH3g4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5c3b7742bc6f9d95096cb76a872d8685716c7df --- /dev/null +++ b/annotations_1/-jpEsYBH3g4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.6], [5.0, 5.0], [5.0, 5.44], [6.0, 6.81], [8.0, 8.43], [20.0, 21.46], [22.0, 23.11], [25.0, 26.2], [29.0, 28.78], [30.0, 29.98], [33.0, 41.15], [42.0, 44.96], [45.0, 46.41], [47.0, 47.38], [50.0, 50.25], [53.0, 56.39], [58.0, 62.38], [65.0, 76.06], [78.0, 78.53], [80.0, 81.09], [82.0, 83.52], [85.0, 86.59], [88.0, 89.02], [89.0, 91.66], [94.0, 109.98], [116.0, 116.73], [118.0, 118.44], [124.0, 129.15], [133.0, 134.45], [135.0, 135.67], [136.0, 136.71], [138.0, 137.76], [138.0, 139.21], [153.0, 160.37], [162.0, 162.04], [163.0, 166.06], [167.0, 166.75], [167.0, 168.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.53, 37.11, 0.0, 0.0, 0.0, 37.07, 96.66, 35.05, 0.0, 0.0, 0.0, 0.0, 0.0, 31.86, 29.7, 0.0, 0.0, 53.53, 0.0, 0.0, 0.0, 0.0, 0.0, 41.03, 0.0, 42.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 38.91], ["speech", 28.42], ["theremin", 6.51]], [["music", 22.96], ["cattle, bovinae", 13.09], ["livestock, farm animals, working animals", 9.74]], null, null, null, [["music", 41.77], ["theremin", 13.11], ["whale vocalization", 12.07]], null, [["music", 43.08], ["speech", 26.07], ["hum", 4.06]], null, null, null, null, null, [["music", 49.04], ["speech", 25.76], ["didgeridoo", 7.44]], [["livestock, farm animals, working animals", 26.33], ["cattle, bovinae", 11.87], ["music", 11.6]], null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 46.69], ["cattle, bovinae", 21.39], ["moo", 13.68]], null, [["music", 19.52], ["speech", 12.9], ["foghorn", 5.68]], null, null], "duration": [1.6, 0.0, 0.44, 0.81, 0.43, 1.46, 1.11, 1.2, -0.22, -0.02, 8.15, 2.96, 1.41, 0.38, 0.25, 3.39, 4.38, 11.06, 0.53, 1.09, 1.52, 1.59, 1.02, 2.66, 15.98, 0.73, 0.44, 5.15, 1.45, 0.67, 0.71, -0.24, 1.21, 7.37, 0.04, 3.06, -0.25, 1.3]} \ No newline at end of file diff --git a/annotations_1/-jtzzs0_bM4_filtered.json b/annotations_1/-jtzzs0_bM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6db02ebfedf227036339547e42e2278dc1a785a3 --- /dev/null +++ b/annotations_1/-jtzzs0_bM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.18], [32.0, 47.48], [49.0, 51.36], [53.0, 53.76], [56.0, 60.62], [64.0, 64.81], [68.0, 70.82], [72.0, 78.04], [78.0, 78.07], [78.0, 78.11], [80.0, 114.94], [117.0, 165.3]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.52, 46.36, 0.0, 37.16, 0.0, 64.41, 29.94, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 37.19], ["music", 29.79], ["hum", 13.01]], [["hum", 37.55], ["mains hum", 24.84], ["music", 18.87]], null, [["music", 33.38], ["electronic music", 11.88], ["rumble", 11.65]], null, null, [["music", 56.24], ["hum", 14.57], ["throbbing", 14.2]], null, null, null, null], "duration": [1.18, 15.48, 2.36, 0.76, 4.62, 0.81, 2.82, 6.04, 0.07, 0.11, 34.94, 48.3]} \ No newline at end of file diff --git a/annotations_1/-kHMOXNsE2k_filtered.json b/annotations_1/-kHMOXNsE2k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..464f698755645b2d342a8f5685b83ea1ea5f2f6d --- /dev/null +++ b/annotations_1/-kHMOXNsE2k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.08], [5.0, 5.48], [8.0, 8.78], [10.0, 10.91], [12.0, 12.18], [14.0, 16.85], [18.0, 18.05], [20.0, 20.71], [21.0, 21.54], [26.0, 28.05], [32.0, 31.87], [34.0, 35.21], [36.0, 43.39], [44.0, 46.53], [59.0, 59.0], [62.0, 62.31], [64.0, 64.59], [65.0, 66.66], [89.0, 89.75], [93.0, 95.17], [96.0, 96.16], [97.0, 98.51], [101.0, 100.99], [105.0, 105.8], [109.0, 111.23], [113.0, 113.14], [115.0, 115.7]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 84.98, 0.0, 0.0, 0.0, 38.22, 0.0, 0.0, 37.01, 40.64, 0.0, 0.0, 0.0, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 37.06, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 48.9], ["hiccup", 13.19], ["hum", 4.75]], null, null, [["clang", 18.0], ["music", 15.54], ["ding", 5.69]], [["speech", 49.62], ["crackle", 9.74], ["sidetone", 7.17]], null, null, null, null, null, null, null, null, null, null, [["music", 55.96], ["animal", 6.53], ["sneeze", 3.47]], null, null], "duration": [0.08, 0.48, 0.78, 0.91, 0.18, 2.85, 0.05, 0.71, 0.54, 2.05, -0.13, 1.21, 7.39, 2.53, 0.0, 0.31, 0.59, 1.66, 0.75, 2.17, 0.16, 1.51, -0.01, 0.8, 2.23, 0.14, 0.7]} \ No newline at end of file diff --git a/annotations_1/-kKqgjrbb6I_filtered.json b/annotations_1/-kKqgjrbb6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbab9e57f5154bb5842eb3f9d95a8a841e1d9739 --- /dev/null +++ b/annotations_1/-kKqgjrbb6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.05], [9.0, 12.6], [15.0, 16.77], [20.0, 42.48], [43.0, 44.98], [45.0, 48.34], [51.0, 53.27], [54.0, 59.48], [63.0, 63.48]], "keep_status": [true, true, false, false, false, true, false, false, false], "silence_prob": [30.57, 29.35, 0.0, 30.3, 0.0, 30.02, 44.26, 30.46, 0.0], "audiomae_on_audioset": [[["speech", 43.86], ["music", 6.87], ["sound effect", 3.91]], [["music", 19.88], ["speech", 13.71], ["boing", 10.51]], null, [["music", 59.99], ["speech", 21.97], ["throbbing", 2.18]], null, [["speech", 30.53], ["music", 21.81], ["hum", 16.51]], [["speech", 31.55], ["theremin", 22.62], ["music", 17.7]], [["speech", 51.79], ["music", 28.98], ["musical instrument", 1.15]], null], "duration": [2.05, 3.6, 1.77, 22.48, 1.98, 3.34, 2.27, 5.48, 0.48]} \ No newline at end of file diff --git a/annotations_1/-mXoZz1dqMQ_filtered.json b/annotations_1/-mXoZz1dqMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e3bc18341096c73c4be59c606642c84d531702a --- /dev/null +++ b/annotations_1/-mXoZz1dqMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 26.77], [29.0, 29.89], [32.0, 33.03], [51.0, 52.73], [66.0, 66.07], [68.0, 68.32], [69.0, 69.2], [74.0, 78.04], [83.0, 84.69], [87.0, 89.36], [90.0, 90.42], [94.0, 95.25], [98.0, 98.49], [104.0, 106.05], [110.0, 111.96], [112.0, 113.43], [114.0, 116.34], [119.0, 128.31]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [35.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0, 69.07, 0.0, 0.0, 0.0, 91.81, 0.0, 0.0, 70.72, 47.05], "audiomae_on_audioset": [[["music", 20.11], ["speech", 15.1], ["crowd", 11.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.81], ["hum", 16.45], ["mains hum", 5.0]]], "duration": [7.77, 0.89, 1.03, 1.73, 0.07, 0.32, 0.2, 4.04, 1.69, 2.36, 0.42, 1.25, 0.49, 2.05, 1.96, 1.43, 2.34, 9.31]} \ No newline at end of file diff --git a/annotations_1/-mexzYsMSro_filtered.json b/annotations_1/-mexzYsMSro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31fb1b9538cede61279b3d925483f0f002152a3e --- /dev/null +++ b/annotations_1/-mexzYsMSro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 19.65], [21.0, 23.38], [26.0, 26.1], [27.0, 28.53], [30.0, 41.2], [42.0, 43.82], [45.0, 46.23], [48.0, 48.36], [49.0, 52.39], [53.0, 64.67], [68.0, 70.65], [71.0, 73.26], [75.0, 78.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.52, 96.42, 0.0, 0.0, 85.17, 0.0, 0.0, 0.0, 98.19, 69.47, 78.89, 65.32, 89.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.65, 2.38, 0.1, 1.53, 11.2, 1.82, 1.23, 0.36, 3.39, 11.67, 2.65, 2.26, 3.68]} \ No newline at end of file diff --git a/annotations_1/-mlfefNP8cw_filtered.json b/annotations_1/-mlfefNP8cw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33d6de553379664fa529d5788ee2fb5a566a9974 --- /dev/null +++ b/annotations_1/-mlfefNP8cw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.72], [5.0, 5.21], [25.0, 25.12], [33.0, 46.65], [47.0, 48.24], [50.0, 51.78], [57.0, 57.65], [59.0, 62.45], [67.0, 74.09], [83.0, 85.09], [87.0, 88.47], [91.0, 91.17], [92.0, 91.94], [92.0, 93.24], [127.0, 127.5], [128.0, 127.58], [133.0, 133.22], [136.0, 135.73], [136.0, 142.45], [149.0, 149.69], [151.0, 151.97]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.89, 0.0, 0.0, 0.0, 35.6, 36.86, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 78.47], ["theremin", 2.65], ["musical instrument", 2.64]], null, null, null, [["music", 62.41], ["guitar", 5.82], ["bass guitar", 5.45]], [["music", 61.53], ["guitar", 4.97], ["effects unit", 3.02]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.28, 0.21, 0.12, 13.65, 1.24, 1.78, 0.65, 3.45, 7.09, 2.09, 1.47, 0.17, -0.06, 1.24, 0.5, -0.42, 0.22, -0.27, 6.45, 0.69, 0.97]} \ No newline at end of file diff --git a/annotations_1/-nk6Gs6Z_Bo_filtered.json b/annotations_1/-nk6Gs6Z_Bo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5826d21fed8a20770ab94e41aa7bd68e838aeb22 --- /dev/null +++ b/annotations_1/-nk6Gs6Z_Bo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.17], [11.0, 12.43], [13.0, 18.67], [45.0, 46.58], [49.0, 52.25], [63.0, 63.05], [63.0, 65.43], [74.0, 76.33], [83.0, 92.28], [93.0, 99.96], [101.0, 101.33], [102.0, 102.09], [103.0, 116.31], [117.0, 143.83], [144.0, 151.07]], "keep_status": [false, false, true, false, true, false, true, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 38.93, 0.0, 33.8, 0.0, 41.76, 56.33, 33.05, 37.19, 0.0, 0.0, 34.52, 34.32, 31.65], "audiomae_on_audioset": [null, null, [["thunk", 26.47], ["music", 19.13], ["speech", 12.03]], null, [["speech", 31.16], ["music", 19.87], ["fart", 6.86]], null, [["music", 35.67], ["speech", 24.05], ["didgeridoo", 2.79]], null, [["cattle, bovinae", 39.67], ["livestock, farm animals, working animals", 33.92], ["moo", 24.9]], [["music", 76.46], ["musical instrument", 3.1], ["synthesizer", 2.77]], null, null, [["fly, housefly", 61.23], ["insect", 10.26], ["music", 7.2]], [["music", 23.03], ["fly, housefly", 19.71], ["mosquito", 16.03]], [["music", 47.81], ["didgeridoo", 7.96], ["grunt", 5.63]]], "duration": [1.17, 1.43, 5.67, 1.58, 3.25, 0.05, 2.43, 2.33, 9.28, 6.96, 0.33, 0.09, 13.31, 26.83, 7.07]} \ No newline at end of file diff --git a/annotations_1/-npMZStX7dU_filtered.json b/annotations_1/-npMZStX7dU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f8dcf0ae8e3bee5958f60149bcfa55dd52a8d1c --- /dev/null +++ b/annotations_1/-npMZStX7dU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.83], [27.0, 43.34], [57.0, 57.45], [66.0, 68.39], [74.0, 88.5], [90.0, 97.92]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 34.78, 0.0, 32.93, 28.72, 28.99], "audiomae_on_audioset": [null, [["hum", 50.27], ["music", 17.5], ["mains hum", 12.81]], null, [["speech", 64.61], ["radio", 2.9], ["male speech, man speaking", 1.92]], [["music", 48.63], ["smash, crash", 22.59], ["whack, thwack", 5.34]], [["cattle, bovinae", 37.37], ["livestock, farm animals, working animals", 24.86], ["moo", 18.65]]], "duration": [1.83, 16.34, 0.45, 2.39, 14.5, 7.92]} \ No newline at end of file diff --git a/annotations_1/-nswXtzrfQU_filtered.json b/annotations_1/-nswXtzrfQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b4752bfc59fdb0f820b050912230bdc13733dac --- /dev/null +++ b/annotations_1/-nswXtzrfQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.06], [5.0, 8.83], [20.0, 23.08], [23.0, 24.17], [43.0, 46.23], [49.0, 49.84], [54.0, 54.87], [57.0, 57.33], [65.0, 65.82], [72.0, 72.55], [81.0, 80.86], [81.0, 83.44], [88.0, 87.99], [89.0, 91.05], [99.0, 99.98], [101.0, 101.29], [102.0, 102.64], [107.0, 107.54]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.26, 42.48, 0.0, 67.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 62.07, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 34.71], ["speech", 14.82], ["arrow", 7.84]], [["speech", 44.59], ["hum", 13.76], ["music", 9.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.06, 3.83, 3.08, 1.17, 3.23, 0.84, 0.87, 0.33, 0.82, 0.55, -0.14, 2.44, -0.01, 2.05, 0.98, 0.29, 0.64, 0.54]} \ No newline at end of file diff --git a/annotations_1/-oL4NpO7eAw_filtered.json b/annotations_1/-oL4NpO7eAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c24954907df1b3393089e10910e4e9ead66ffc0c --- /dev/null +++ b/annotations_1/-oL4NpO7eAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 23.84], [28.0, 29.74], [33.0, 32.73], [35.0, 35.75], [41.0, 43.83], [46.0, 46.18], [52.0, 52.88], [55.0, 57.72], [63.0, 63.15], [65.0, 72.67], [77.0, 78.7], [80.0, 80.82], [83.0, 83.32], [90.0, 90.39], [101.0, 101.46], [105.0, 105.83], [109.0, 110.76], [124.0, 125.39]], "keep_status": [true, false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [31.5, 0.0, 0.0, 0.0, 34.98, 0.0, 0.0, 32.18, 0.0, 31.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 55.16], ["boing", 9.03], ["musical instrument", 5.52]], null, null, null, [["music", 50.6], ["speech", 7.29], ["musical instrument", 2.85]], null, null, [["music", 50.28], ["boing", 3.59], ["music of latin america", 3.55]], null, [["music", 29.86], ["speech", 10.92], ["mosquito", 8.83]], null, null, null, null, null, null, null, null], "duration": [15.84, 1.74, -0.27, 0.75, 2.83, 0.18, 0.88, 2.72, 0.15, 7.67, 1.7, 0.82, 0.32, 0.39, 0.46, 0.83, 1.76, 1.39]} \ No newline at end of file diff --git a/annotations_1/-p4TkuB20bs_filtered.json b/annotations_1/-p4TkuB20bs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..019c7018b72f8aa75a739e6a18f0df31fdfe528f --- /dev/null +++ b/annotations_1/-p4TkuB20bs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.25], [16.0, 16.23], [18.0, 24.85], [33.0, 36.48], [43.0, 44.22], [44.0, 56.44], [66.0, 69.11]], "keep_status": [true, false, false, true, false, true, false], "silence_prob": [35.87, 0.0, 75.39, 36.97, 0.0, 29.99, 32.77], "audiomae_on_audioset": [[["speech", 36.11], ["music", 20.41], ["hum", 6.98]], null, null, [["speech", 30.55], ["hum", 26.34], ["rumble", 7.89]], null, [["throbbing", 29.68], ["hum", 19.35], ["music", 13.8]], [["music", 40.65], ["hum", 24.19], ["throbbing", 14.38]]], "duration": [9.25, 0.23, 6.85, 3.48, 1.22, 12.44, 3.11]} \ No newline at end of file diff --git a/annotations_1/-pKrpqoPu1o_filtered.json b/annotations_1/-pKrpqoPu1o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5433da0d80954e9304a5727e2e27ca70c9f860c --- /dev/null +++ b/annotations_1/-pKrpqoPu1o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 29.03], [40.0, 44.95], [47.0, 61.45], [66.0, 121.1]], "keep_status": [false, false, false, false], "silence_prob": [32.75, 37.77, 33.17, 0.0], "audiomae_on_audioset": [[["music", 54.98], ["throbbing", 12.11], ["hum", 8.72]], [["music", 66.88], ["throbbing", 4.95], ["musical instrument", 2.95]], [["music", 54.3], ["hum", 10.59], ["rumble", 8.22]], null], "duration": [24.03, 4.95, 14.45, 55.1]} \ No newline at end of file diff --git a/annotations_1/-pXlicO85dk_filtered.json b/annotations_1/-pXlicO85dk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5398d1743ab0de23af8e2f6ad5694733909db53 --- /dev/null +++ b/annotations_1/-pXlicO85dk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.24], [12.0, 15.16], [17.0, 19.41], [21.0, 21.98], [24.0, 28.02], [34.0, 35.4], [40.0, 42.6], [44.0, 49.82], [51.0, 56.29], [57.0, 58.78], [61.0, 62.58], [63.0, 69.69], [72.0, 73.04], [77.0, 80.45], [83.0, 89.23], [91.0, 92.82], [95.0, 97.02], [98.0, 99.13], [101.0, 101.66], [102.0, 112.14], [113.0, 121.98]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.78, 43.53, 0.0, 98.44, 0.0, 61.57, 33.83, 41.44, 0.0, 0.0, 38.15, 0.0, 93.13, 45.49, 0.0, 65.67, 0.0, 0.0, 38.22, 44.69], "audiomae_on_audioset": [null, null, [["speech", 59.91], ["sidetone", 5.42], ["hum", 4.71]], null, null, null, null, [["music", 39.43], ["speech", 23.02], ["ambient music", 6.75]], [["music", 33.62], ["theremin", 26.12], ["speech", 8.68]], null, null, [["music", 53.32], ["speech", 17.8], ["speech synthesizer", 7.59]], null, null, [["music", 40.18], ["singing bowl", 16.38], ["speech", 14.78]], null, null, null, null, [["music", 61.01], ["speech", 10.51], ["hum", 3.63]], [["music", 69.93], ["gong", 6.48], ["synthesizer", 3.09]]], "duration": [0.24, 3.16, 2.41, 0.98, 4.02, 1.4, 2.6, 5.82, 5.29, 1.78, 1.58, 6.69, 1.04, 3.45, 6.23, 1.82, 2.02, 1.13, 0.66, 10.14, 8.98]} \ No newline at end of file diff --git a/annotations_1/-pix6UL8ONk_filtered.json b/annotations_1/-pix6UL8ONk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42325b5cb5ec1948a78683d12e5c1c8719b3b27d --- /dev/null +++ b/annotations_1/-pix6UL8ONk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.88], [7.0, 7.47], [16.0, 19.23], [20.0, 19.77], [35.0, 35.19], [40.0, 40.81], [64.0, 66.5], [69.0, 68.79], [70.0, 71.54], [73.0, 75.95], [78.0, 79.08], [82.0, 84.64], [86.0, 97.24], [97.0, 100.77], [104.0, 103.92], [111.0, 111.47], [115.0, 131.55]], "keep_status": [false, false, true, false, false, false, true, false, false, true, false, true, true, true, false, false, true], "silence_prob": [0.0, 0.0, 40.09, 0.0, 0.0, 0.0, 41.56, 0.0, 0.0, 49.09, 0.0, 35.24, 41.58, 33.79, 0.0, 0.0, 30.26], "audiomae_on_audioset": [null, null, [["speech", 9.81], ["crying, sobbing", 7.2], ["baby cry, infant cry", 5.4]], null, null, null, [["speech", 12.57], ["rowboat, canoe, kayak", 12.32], ["horse", 10.92]], null, null, [["speech", 32.37], ["boat, water vehicle", 20.33], ["vehicle", 6.1]], null, [["speech", 29.53], ["hum", 12.96], ["eruption", 5.68]], [["music", 32.15], ["hum", 26.02], ["throbbing", 9.07]], [["music", 45.03], ["hum", 12.62], ["mains hum", 8.28]], null, null, [["music", 52.81], ["speech", 6.15], ["synthesizer", 5.21]]], "duration": [1.88, 0.47, 3.23, -0.23, 0.19, 0.81, 2.5, -0.21, 1.54, 2.95, 1.08, 2.64, 11.24, 3.77, -0.08, 0.47, 16.55]} \ No newline at end of file diff --git a/annotations_1/-pq4FpNnvcg_filtered.json b/annotations_1/-pq4FpNnvcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25017a6c5fd3033e722ed17b756a7876db112533 --- /dev/null +++ b/annotations_1/-pq4FpNnvcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 23.68], [24.0, 35.04], [36.0, 36.15], [41.0, 42.15], [43.0, 43.23], [58.0, 60.96], [65.0, 65.94], [69.0, 70.01], [70.0, 74.33], [75.0, 75.88], [77.0, 80.13], [83.0, 84.87], [91.0, 92.8], [94.0, 95.94], [98.0, 99.39], [100.0, 101.65], [105.0, 107.54], [109.0, 113.54], [118.0, 122.99], [124.0, 125.37], [126.0, 129.73], [131.0, 132.75], [136.0, 136.71], [138.0, 138.69], [140.0, 141.18], [145.0, 151.82], [153.0, 154.3], [155.0, 156.42], [158.0, 159.48], [166.0, 167.63], [169.0, 168.84], [169.0, 170.14], [172.0, 172.56], [175.0, 176.99], [178.0, 179.31]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.49, 44.43, 0.0, 0.0, 0.0, 84.62, 0.0, 0.0, 76.04, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 84.62, 64.07, 0.0, 81.53, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.51], ["sonar", 13.25], ["hum", 4.76]], [["mains hum", 21.47], ["fly, housefly", 10.83], ["insect", 10.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.68, 11.04, 0.15, 1.15, 0.23, 2.96, 0.94, 1.01, 4.33, 0.88, 3.13, 1.87, 1.8, 1.94, 1.39, 1.65, 2.54, 4.54, 4.99, 1.37, 3.73, 1.75, 0.71, 0.69, 1.18, 6.82, 1.3, 1.42, 1.48, 1.63, -0.16, 1.14, 0.56, 1.99, 1.31]} \ No newline at end of file diff --git a/annotations_1/-qGU1hiiJfU_filtered.json b/annotations_1/-qGU1hiiJfU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..195994a65dd66ad5a7a010eb3275f5a4f71f3a58 --- /dev/null +++ b/annotations_1/-qGU1hiiJfU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.36], [7.0, 8.34], [10.0, 10.4], [12.0, 12.51], [24.0, 26.91], [30.0, 31.94], [45.0, 46.82], [58.0, 57.97], [58.0, 58.8], [61.0, 62.41], [63.0, 63.96], [71.0, 73.52], [76.0, 76.44], [80.0, 83.25], [85.0, 86.04], [111.0, 111.74], [113.0, 114.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 57.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.99, 0.0, 82.61, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 38.33], ["moo", 32.03], ["livestock, farm animals, working animals", 23.09]], null, null, null, null, null], "duration": [0.36, 1.34, 0.4, 0.51, 2.91, 1.94, 1.82, -0.03, 0.8, 1.41, 0.96, 2.52, 0.44, 3.25, 1.04, 0.74, 1.12]} \ No newline at end of file diff --git a/annotations_1/-r_-EnupRXo_filtered.json b/annotations_1/-r_-EnupRXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/-r_-EnupRXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/-rkhqMzCUnA_filtered.json b/annotations_1/-rkhqMzCUnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d0b066052279cd9cadb243588d37b018d267ed7 --- /dev/null +++ b/annotations_1/-rkhqMzCUnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [5.0, 5.43], [19.0, 20.41], [24.0, 24.48], [26.0, 26.94], [30.0, 30.54], [43.0, 43.43], [45.0, 45.81], [50.0, 49.96], [76.0, 76.33], [90.0, 90.29], [95.0, 99.01], [102.0, 103.22], [104.0, 104.5], [106.0, 107.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.24, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["fart", 14.23], ["sidetone", 10.64], ["noise", 9.66]], null, null, null], "duration": [0.34, 0.43, 1.41, 0.48, 0.94, 0.54, 0.43, 0.81, -0.04, 0.33, 0.29, 4.01, 1.22, 0.5, 1.0]} \ No newline at end of file diff --git a/annotations_1/-rsImQShehk_filtered.json b/annotations_1/-rsImQShehk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46b11c51cfa59e230fb248107e28c98c7ee2148e --- /dev/null +++ b/annotations_1/-rsImQShehk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [4.0, 31.78], [33.0, 36.85], [37.0, 36.88], [37.0, 37.44], [37.0, 37.5], [38.0, 38.08], [41.0, 40.86], [42.0, 42.45], [43.0, 47.97], [48.0, 97.09], [101.0, 108.01]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 30.78, 54.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.43, 0.0, 30.51], "audiomae_on_audioset": [null, [["sheep", 19.58], ["livestock, farm animals, working animals", 17.46], ["cattle, bovinae", 16.0]], null, null, null, null, null, null, null, [["speech", 35.28], ["hum", 19.58], ["music", 9.9]], null, [["throbbing", 37.56], ["hum", 27.33], ["music", 14.82]]], "duration": [0.7, 27.78, 3.85, -0.12, 0.44, 0.5, 0.08, -0.14, 0.45, 4.97, 49.09, 7.01]} \ No newline at end of file diff --git a/annotations_1/-sD2jY0KMA8_filtered.json b/annotations_1/-sD2jY0KMA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62bc1200a72264af786ad118a1127fe02182c49f --- /dev/null +++ b/annotations_1/-sD2jY0KMA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.81], [17.0, 24.04], [26.0, 27.46], [39.0, 39.14], [43.0, 53.23], [57.0, 57.3], [59.0, 59.53], [62.0, 63.61], [64.0, 67.24], [70.0, 71.46], [80.0, 80.69], [83.0, 88.97], [91.0, 100.45], [105.0, 105.88], [112.0, 112.62]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [36.2, 32.0, 0.0, 0.0, 30.2, 0.0, 0.0, 0.0, 31.01, 0.0, 0.0, 33.01, 30.17, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.96], ["throbbing", 17.24], ["hum", 16.9]], [["music", 62.1], ["throbbing", 10.26], ["hum", 10.04]], null, null, [["music", 44.72], ["didgeridoo", 16.05], ["throbbing", 6.48]], null, null, null, [["didgeridoo", 46.37], ["music", 31.04], ["quack", 2.26]], null, null, [["speech", 36.66], ["throbbing", 14.81], ["music", 10.5]], [["music", 52.55], ["speech", 38.81], ["boing", 4.76]], null, null], "duration": [3.81, 7.04, 1.46, 0.14, 10.23, 0.3, 0.53, 1.61, 3.24, 1.46, 0.69, 5.97, 9.45, 0.88, 0.62]} \ No newline at end of file diff --git a/annotations_1/-t06SZje8O0_filtered.json b/annotations_1/-t06SZje8O0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f534ac2a46aa6371ffdd3be23694d5f4e73e821a --- /dev/null +++ b/annotations_1/-t06SZje8O0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 41.22], [43.0, 47.71], [49.0, 49.0], [49.0, 49.59], [51.0, 72.35]], "keep_status": [true, true, false, false, true], "silence_prob": [30.68, 30.19, 0.0, 0.0, 29.6], "audiomae_on_audioset": [[["music", 57.58], ["thunk", 6.6], ["hum", 5.1]], [["speech", 21.52], ["music", 19.94], ["rumble", 6.61]], null, null, [["speech", 39.86], ["music", 11.03], ["explosion", 5.14]]], "duration": [17.22, 4.71, 0.0, 0.59, 21.35]} \ No newline at end of file diff --git a/annotations_1/-u1uwI5qJ74_filtered.json b/annotations_1/-u1uwI5qJ74_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..370c09ea768e9c581a33f4bac114df0ee3f6625e --- /dev/null +++ b/annotations_1/-u1uwI5qJ74_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.03], [15.0, 20.06], [20.0, 21.74], [25.0, 28.71], [32.0, 40.0], [44.0, 52.2], [53.0, 56.64], [74.0, 76.6], [81.0, 82.22], [98.0, 113.51], [118.0, 122.27], [126.0, 133.98], [147.0, 152.02], [152.0, 154.7]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, true, false], "silence_prob": [46.79, 35.58, 0.0, 36.31, 33.48, 37.61, 36.2, 32.31, 0.0, 31.81, 32.36, 30.94, 31.87, 54.1], "audiomae_on_audioset": [[["speech", 76.95], ["burping, eructation", 4.68], ["male speech, man speaking", 3.51]], [["speech", 42.5], ["music", 29.1], ["thunk", 3.95]], null, [["music", 67.88], ["synthesizer", 3.22], ["whack, thwack", 2.51]], [["music", 62.57], ["speech", 16.83], ["groan", 5.21]], [["music", 46.6], ["speech", 18.77], ["boing", 11.21]], [["music", 18.98], ["fly, housefly", 8.67], ["speech", 6.46]], [["whack, thwack", 41.58], ["music", 20.14], ["thunk", 11.42]], null, [["music", 43.54], ["speech", 38.88], ["boing", 8.91]], [["music", 11.73], ["theremin", 11.64], ["speech", 10.43]], [["cattle, bovinae", 40.75], ["livestock, farm animals, working animals", 34.61], ["moo", 24.15]], [["music", 28.75], ["mosquito", 17.18], ["shofar", 4.72]], null], "duration": [3.03, 5.06, 1.74, 3.71, 8.0, 8.2, 3.64, 2.6, 1.22, 15.51, 4.27, 7.98, 5.02, 2.7]} \ No newline at end of file diff --git a/annotations_1/-uAEWFPmAwU_filtered.json b/annotations_1/-uAEWFPmAwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8dbf7fb5b1529de7d4e536d589dec0ef2d4ddb7 --- /dev/null +++ b/annotations_1/-uAEWFPmAwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [3.0, 3.16], [4.0, 4.11], [5.0, 6.83], [7.0, 8.77], [10.0, 10.1], [15.0, 15.67], [17.0, 18.64], [22.0, 25.54], [28.0, 28.11], [30.0, 30.3], [35.0, 36.46], [38.0, 40.59], [50.0, 50.58], [56.0, 57.16], [65.0, 65.92], [69.0, 68.88], [71.0, 71.29], [73.0, 73.31], [79.0, 80.18], [95.0, 95.23], [96.0, 96.26], [112.0, 113.29], [114.0, 114.56], [115.0, 125.34], [128.0, 129.74], [140.0, 141.71], [145.0, 144.95], [145.0, 163.92], [181.0, 195.61], [200.0, 204.23], [205.0, 208.55], [211.0, 210.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.6, 0.0, 0.0, 0.0, 31.91, 32.91, 53.1, 78.38, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 58.24], ["mains hum", 8.51], ["throbbing", 4.76]], null, null, null, [["music", 75.51], ["didgeridoo", 6.36], ["theremin", 4.59]], [["music", 82.0], ["theremin", 1.38], ["musical instrument", 1.37]], null, null, null], "duration": [0.29, 0.16, 0.11, 1.83, 1.77, 0.1, 0.67, 1.64, 3.54, 0.11, 0.3, 1.46, 2.59, 0.58, 1.16, 0.92, -0.12, 0.29, 0.31, 1.18, 0.23, 0.26, 1.29, 0.56, 10.34, 1.74, 1.71, -0.05, 18.92, 14.61, 4.23, 3.55, -0.04]} \ No newline at end of file diff --git a/annotations_1/-uPSVWxV6d8_filtered.json b/annotations_1/-uPSVWxV6d8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da03046e692908f111b6b45ecc97756624245a2f --- /dev/null +++ b/annotations_1/-uPSVWxV6d8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.99], [7.0, 7.11], [10.0, 10.69], [12.0, 12.73], [14.0, 14.93], [17.0, 17.79], [21.0, 21.76], [22.0, 22.55], [23.0, 23.9], [42.0, 41.89], [42.0, 47.97], [50.0, 53.0], [54.0, 55.81], [57.0, 59.54], [67.0, 68.13], [70.0, 72.45], [79.0, 80.76], [88.0, 89.31], [93.0, 95.96], [99.0, 100.28], [104.0, 104.6], [111.0, 110.94], [120.0, 127.01], [135.0, 136.24], [137.0, 137.69], [139.0, 139.38], [141.0, 141.3], [144.0, 149.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.97, 95.51, 0.0, 63.21, 0.0, 30.54, 0.0, 0.0, 36.73, 0.0, 0.0, 0.0, 39.89, 0.0, 0.0, 0.0, 0.0, 36.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.36], ["animal", 21.56], ["dog", 16.16]], null, null, [["music", 65.08], ["musical instrument", 2.12], ["didgeridoo", 1.73]], null, null, null, [["music", 39.29], ["speech", 9.45], ["cattle, bovinae", 3.79]], null, null, null, null, [["music", 72.51], ["speech", 11.24], ["fart", 1.7]]], "duration": [1.99, 0.11, 0.69, 0.73, 0.93, 0.79, 0.76, 0.55, 0.9, -0.11, 5.97, 3.0, 1.81, 2.54, 1.13, 2.45, 1.76, 1.31, 2.96, 1.28, 0.6, -0.06, 7.01, 1.24, 0.69, 0.38, 0.3, 5.4]} \ No newline at end of file diff --git a/annotations_1/-utei4CzIzc_filtered.json b/annotations_1/-utei4CzIzc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53046e84553195bfd03cdd199a50cf8e4f7a6651 --- /dev/null +++ b/annotations_1/-utei4CzIzc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.01], [7.0, 7.96], [8.0, 8.75], [11.0, 10.98], [12.0, 12.23], [13.0, 13.68], [15.0, 15.28], [18.0, 18.3], [19.0, 21.0], [22.0, 22.52], [24.0, 24.56], [28.0, 30.32], [53.0, 54.23], [55.0, 55.81], [63.0, 64.35], [70.0, 70.6], [73.0, 74.55], [76.0, 76.91], [78.0, 78.7], [80.0, 80.67], [82.0, 82.46], [84.0, 84.7], [85.0, 85.23], [86.0, 86.27], [88.0, 88.35], [90.0, 90.78], [92.0, 92.53], [95.0, 95.2], [97.0, 97.61], [100.0, 100.41], [102.0, 102.96], [105.0, 105.58], [107.0, 107.22], [110.0, 115.01], [117.0, 123.15], [124.0, 129.52], [133.0, 154.95], [156.0, 162.26], [165.0, 169.08], [181.0, 182.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.09, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.56, 34.21, 36.2, 53.65, 34.29, 46.05, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.78], ["wind instrument, woodwind instrument", 24.06], ["clarinet", 6.95]], [["music", 52.97], ["wind instrument, woodwind instrument", 20.28], ["musical instrument", 9.73]], [["wind instrument, woodwind instrument", 40.07], ["clarinet", 28.53], ["music", 20.29]], null, [["wind instrument, woodwind instrument", 47.33], ["music", 28.02], ["flute", 5.82]], [["speech", 24.03], ["fart", 4.86], ["crying, sobbing", 4.75]], null], "duration": [2.01, 0.96, 0.75, -0.02, 0.23, 0.68, 0.28, 0.3, 2.0, 0.52, 0.56, 2.32, 1.23, 0.81, 1.35, 0.6, 1.55, 0.91, 0.7, 0.67, 0.46, 0.7, 0.23, 0.27, 0.35, 0.78, 0.53, 0.2, 0.61, 0.41, 0.96, 0.58, 0.22, 5.01, 6.15, 5.52, 21.95, 6.26, 4.08, 1.61]} \ No newline at end of file diff --git a/annotations_1/-v8l6cCrf0w_filtered.json b/annotations_1/-v8l6cCrf0w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa3b761e410d497390fbd37a07c1b7130f4aab08 --- /dev/null +++ b/annotations_1/-v8l6cCrf0w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 57.48], [58.0, 59.44], [62.0, 63.0], [67.0, 68.66], [69.0, 69.6], [73.0, 84.38]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 28.78], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 32.38], ["buzz", 16.52], ["vehicle", 16.14]]], "duration": [41.48, 1.44, 1.0, 1.66, 0.6, 11.38]} \ No newline at end of file diff --git a/annotations_1/-vT2ztIXioo_filtered.json b/annotations_1/-vT2ztIXioo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79feee1c5d56ee51a769e05b3db0001a0ebbe952 --- /dev/null +++ b/annotations_1/-vT2ztIXioo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.07], [9.0, 19.43], [20.0, 20.6], [21.0, 21.19], [22.0, 29.27], [30.0, 98.56]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 30.23, 0.0, 0.0, 31.21, 0.0], "audiomae_on_audioset": [null, [["music", 67.68], ["boing", 11.38], ["didgeridoo", 6.31]], null, null, [["fly, housefly", 37.75], ["insect", 32.1], ["mosquito", 14.81]], null], "duration": [0.07, 10.43, 0.6, 0.19, 7.27, 68.56]} \ No newline at end of file diff --git a/annotations_1/-v_2hFPseDg_filtered.json b/annotations_1/-v_2hFPseDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc12dd00e3e9ba68e5cebf06dbaf66476d378148 --- /dev/null +++ b/annotations_1/-v_2hFPseDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.55], [18.0, 18.98], [20.0, 34.1], [40.0, 44.09], [46.0, 56.08], [57.0, 57.89], [59.0, 59.12], [62.0, 69.43], [70.0, 80.96], [82.0, 86.86], [90.0, 93.16], [96.0, 96.53], [97.0, 124.23], [125.0, 130.84], [131.0, 130.94]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 31.88, 28.89, 34.08, 0.0, 0.0, 33.17, 30.2, 28.66, 29.17, 0.0, 28.79, 28.76, 0.0], "audiomae_on_audioset": [null, null, [["speech", 47.47], ["music", 16.04], ["mains hum", 6.52]], [["explosion", 17.51], ["breaking", 16.71], ["bang", 13.64]], [["hum", 37.04], ["mains hum", 35.23], ["speech", 12.31]], null, null, [["hum", 30.68], ["throbbing", 22.07], ["music", 18.0]], [["music", 42.12], ["speech", 15.43], ["throbbing", 7.51]], [["music", 44.72], ["speech", 30.04], ["hum", 3.05]], [["music", 57.6], ["throbbing", 7.58], ["hum", 4.92]], null, [["speech", 29.98], ["music", 19.26], ["explosion", 10.89]], [["music", 39.87], ["hum", 10.26], ["throbbing", 7.56]], null], "duration": [1.55, 0.98, 14.1, 4.09, 10.08, 0.89, 0.12, 7.43, 10.96, 4.86, 3.16, 0.53, 27.23, 5.84, -0.06]} \ No newline at end of file diff --git a/annotations_1/-vvxRiJkXAs_filtered.json b/annotations_1/-vvxRiJkXAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae7b6167bf6ca56ca107ccfdc8ed7d004ac8647f --- /dev/null +++ b/annotations_1/-vvxRiJkXAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.21], [18.0, 18.1], [19.0, 22.08], [23.0, 23.62], [25.0, 28.59], [32.0, 32.64], [35.0, 39.14], [39.0, 40.34], [44.0, 46.62], [49.0, 54.45], [57.0, 56.89], [61.0, 60.94], [63.0, 67.1], [71.0, 71.42], [82.0, 87.37], [89.0, 92.92], [93.0, 108.67], [112.0, 123.62], [124.0, 128.21], [133.0, 134.08], [135.0, 135.21], [137.0, 139.4], [140.0, 141.15], [142.0, 144.34], [146.0, 146.08], [148.0, 148.69], [153.0, 155.53]], "keep_status": [true, false, true, false, false, false, false, false, true, true, false, false, false, false, true, true, true, true, false, false, false, false, false, false, false, false, true], "silence_prob": [42.58, 0.0, 39.94, 0.0, 34.55, 0.0, 40.82, 0.0, 29.62, 31.12, 0.0, 0.0, 33.31, 0.0, 29.18, 30.0, 29.65, 29.57, 28.74, 0.0, 0.0, 44.26, 0.0, 65.55, 0.0, 0.0, 29.48], "audiomae_on_audioset": [[["whale vocalization", 25.1], ["music", 19.63], ["hum", 10.81]], null, [["music", 39.36], ["didgeridoo", 16.38], ["whale vocalization", 7.12]], null, [["music", 56.6], ["theremin", 18.74], ["musical instrument", 5.37]], null, [["music", 53.88], ["synthesizer", 11.89], ["speech", 9.95]], null, [["music", 17.26], ["mosquito", 15.05], ["fly, housefly", 13.02]], [["didgeridoo", 22.68], ["music", 13.56], ["hum", 10.85]], null, null, [["hum", 39.93], ["mains hum", 23.43], ["music", 11.12]], null, [["music", 52.74], ["theremin", 5.49], ["musical instrument", 3.97]], [["didgeridoo", 35.39], ["music", 18.81], ["whip", 10.28]], [["music", 22.41], ["hum", 9.27], ["throbbing", 6.27]], [["music", 24.25], ["hum", 17.12], ["throbbing", 7.91]], [["speech", 51.52], ["music", 31.0], ["sound effect", 1.8]], null, null, [["music", 46.48], ["brass instrument", 19.27], ["trombone", 13.3]], null, null, null, null, [["music", 48.58], ["theremin", 13.6], ["foghorn", 5.09]]], "duration": [2.21, 0.1, 3.08, 0.62, 3.59, 0.64, 4.14, 1.34, 2.62, 5.45, -0.11, -0.06, 4.1, 0.42, 5.37, 3.92, 15.67, 11.62, 4.21, 1.08, 0.21, 2.4, 1.15, 2.34, 0.08, 0.69, 2.53]} \ No newline at end of file diff --git a/annotations_1/-wSqiksvdD8_filtered.json b/annotations_1/-wSqiksvdD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab87efbc3301c5031078aca5c1d6df5cdff1a68f --- /dev/null +++ b/annotations_1/-wSqiksvdD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [2.0, 3.89], [7.0, 11.33], [12.0, 17.47], [18.0, 18.57], [19.0, 19.45], [20.0, 20.44], [23.0, 27.24], [28.0, 28.46], [29.0, 29.57], [31.0, 32.66], [35.0, 35.8], [37.0, 38.48], [39.0, 42.08], [46.0, 47.56], [49.0, 63.0], [66.0, 66.48], [68.0, 69.69], [72.0, 89.31], [90.0, 93.33], [95.0, 108.89], [110.0, 110.86], [111.0, 117.9], [118.0, 119.79], [120.0, 126.87], [128.0, 127.75], [128.0, 128.07], [129.0, 130.79], [133.0, 135.65]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.25, 35.39, 0.0, 0.0, 0.0, 29.37, 0.0, 0.0, 0.0, 0.0, 0.0, 45.85, 0.0, 38.45, 0.0, 0.0, 50.86, 65.32, 55.53, 0.0, 49.73, 0.0, 38.93, 0.0, 0.0, 0.0, 70.16], "audiomae_on_audioset": [null, null, [["music", 42.26], ["hum", 20.21], ["mains hum", 8.28]], [["music", 26.21], ["animal", 15.35], ["didgeridoo", 11.52]], null, null, null, [["groan", 10.56], ["livestock, farm animals, working animals", 5.88], ["grunt", 5.42]], null, null, null, null, null, [["whale vocalization", 36.66], ["music", 10.48], ["speech", 7.62]], null, [["speech", 35.81], ["throbbing", 20.34], ["hum", 19.48]], null, null, null, null, null, null, [["hum", 38.96], ["mains hum", 26.78], ["speech", 21.8]], null, [["hum", 42.38], ["mains hum", 35.5], ["speech", 7.21]], null, null, null, null], "duration": [0.48, 1.89, 4.33, 5.47, 0.57, 0.45, 0.44, 4.24, 0.46, 0.57, 1.66, 0.8, 1.48, 3.08, 1.56, 14.0, 0.48, 1.69, 17.31, 3.33, 13.89, 0.86, 6.9, 1.79, 6.87, -0.25, 0.07, 1.79, 2.65]} \ No newline at end of file diff --git a/annotations_1/-wci2oycOQA_filtered.json b/annotations_1/-wci2oycOQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..feb7b59c8ba05a7044a67d7a2c7a6024491b8cbe --- /dev/null +++ b/annotations_1/-wci2oycOQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [2.0, 6.71], [9.0, 10.03], [12.0, 47.09], [49.0, 50.11], [51.0, 51.38], [62.0, 77.09]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [0.0, 60.7, 0.0, 0.0, 0.0, 0.0, 30.13], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 45.51], ["car", 8.27], ["skidding", 7.09]]], "duration": [0.43, 4.71, 1.03, 35.09, 1.11, 0.38, 15.09]} \ No newline at end of file diff --git a/annotations_1/-whQdRI7wUQ_filtered.json b/annotations_1/-whQdRI7wUQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5fe13776c82a00f0601e9a605b27c6e30e49a40 --- /dev/null +++ b/annotations_1/-whQdRI7wUQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.68], [14.0, 15.35], [19.0, 20.56], [21.0, 23.28], [24.0, 30.15], [31.0, 36.58], [38.0, 64.5], [65.0, 65.64], [67.0, 68.2], [71.0, 75.83], [84.0, 91.89], [92.0, 93.5], [97.0, 98.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [69.74, 0.0, 0.0, 92.48, 59.24, 72.9, 71.14, 0.0, 0.0, 53.47, 32.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 35.36], ["speech", 14.98], ["boing", 6.81]], null, null], "duration": [8.68, 1.35, 1.56, 2.28, 6.15, 5.58, 26.5, 0.64, 1.2, 4.83, 7.89, 1.5, 1.56]} \ No newline at end of file diff --git a/annotations_1/-wqnmuzG51c_filtered.json b/annotations_1/-wqnmuzG51c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fdceca134ca72aab0e3127d626df527efffaa1f --- /dev/null +++ b/annotations_1/-wqnmuzG51c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.13], [8.0, 9.12], [10.0, 10.45], [11.0, 17.44], [19.0, 35.55], [40.0, 40.88], [47.0, 48.54], [49.0, 71.12], [72.0, 74.97], [76.0, 78.19], [84.0, 86.37], [88.0, 96.28], [101.0, 102.49], [104.0, 104.94], [108.0, 108.46], [109.0, 111.59], [123.0, 130.03], [132.0, 135.7]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 46.19, 39.89, 0.0, 0.0, 66.27, 100.0, 100.0, 97.64, 98.66, 0.0, 0.0, 0.0, 80.82, 52.56, 48.06], "audiomae_on_audioset": [null, null, null, [["music", 48.35], ["speech", 21.86], ["didgeridoo", 4.49]], [["hum", 19.43], ["speech", 18.76], ["music", 12.89]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 26.83], ["music", 16.56], ["mosquito", 6.34]]], "duration": [1.13, 1.12, 0.45, 6.44, 16.55, 0.88, 1.54, 22.12, 2.97, 2.19, 2.37, 8.28, 1.49, 0.94, 0.46, 2.59, 7.03, 3.7]} \ No newline at end of file diff --git a/annotations_1/-xZKHX91z9I_filtered.json b/annotations_1/-xZKHX91z9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1b71c36484cbad99e407a43142380e65cc66eef --- /dev/null +++ b/annotations_1/-xZKHX91z9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.44], [16.0, 68.22], [69.0, 70.01], [75.0, 76.17], [82.0, 82.46], [88.0, 90.36], [91.0, 101.04], [102.0, 126.6], [131.0, 136.63]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [99.99, 0.0, 0.0, 0.0, 0.0, 100.0, 34.17, 88.64, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["explosion", 15.49], ["gunshot, gunfire", 9.11], ["burst, pop", 8.01]], null, null], "duration": [4.44, 52.22, 1.01, 1.17, 0.46, 2.36, 10.04, 24.6, 5.63]} \ No newline at end of file diff --git a/annotations_1/-yPwW5V4mhI_filtered.json b/annotations_1/-yPwW5V4mhI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..931cb341f92ed95ad6c74a2fe6dfb6ab7b28da67 --- /dev/null +++ b/annotations_1/-yPwW5V4mhI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.15], [5.0, 7.3], [10.0, 10.34], [15.0, 17.39], [21.0, 22.98], [27.0, 27.41], [40.0, 41.64], [44.0, 49.15], [52.0, 51.93], [53.0, 53.35], [54.0, 54.78], [56.0, 57.67], [60.0, 62.34], [63.0, 63.85], [66.0, 66.68], [67.0, 66.73], [67.0, 67.64], [68.0, 69.77], [77.0, 77.45], [81.0, 82.39], [91.0, 91.99], [96.0, 102.27], [103.0, 103.92], [106.0, 106.66], [109.0, 109.04], [111.0, 113.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.71, 0.0, 100.0, 0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.15, 2.3, 0.34, 2.39, 1.98, 0.41, 1.64, 5.15, -0.07, 0.35, 0.78, 1.67, 2.34, 0.85, 0.68, -0.27, 0.64, 1.77, 0.45, 1.39, 0.99, 6.27, 0.92, 0.66, 0.04, 2.32]} \ No newline at end of file diff --git a/annotations_1/-yyoLJuNIJU_filtered.json b/annotations_1/-yyoLJuNIJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e16ab9050e3876cce66915ce37f69391e4cc0b6 --- /dev/null +++ b/annotations_1/-yyoLJuNIJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.59], [13.0, 13.66], [14.0, 13.9], [14.0, 13.98], [15.0, 15.75], [18.0, 21.95], [26.0, 34.94], [37.0, 41.96], [43.0, 43.77], [47.0, 72.64], [75.0, 93.55], [94.0, 94.47], [97.0, 98.44], [103.0, 111.3], [117.0, 117.61], [118.0, 119.16], [122.0, 133.14], [135.0, 139.62], [140.0, 148.63], [155.0, 157.74], [158.0, 161.2], [163.0, 175.74]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false, true, true, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 28.46, 28.59, 29.09, 0.0, 28.53, 28.45, 0.0, 0.0, 28.56, 0.0, 0.0, 28.75, 28.77, 28.55, 28.32, 29.25, 28.5], "audiomae_on_audioset": [null, null, null, null, null, [["music", 35.7], ["foghorn", 9.43], ["speech", 4.88]], [["music", 44.44], ["speech", 28.07], ["whack, thwack", 4.65]], [["music", 69.71], ["breaking", 7.55], ["throbbing", 5.28]], null, [["speech", 60.76], ["vehicle", 10.58], ["music", 6.53]], [["speech", 24.11], ["vehicle", 22.62], ["car", 13.55]], null, null, [["vehicle", 30.25], ["skidding", 21.62], ["car", 17.3]], null, null, [["speech", 25.76], ["music", 23.33], ["vehicle", 16.46]], [["music", 38.34], ["hum", 12.42], ["throbbing", 10.87]], [["vehicle", 46.86], ["car", 22.01], ["speech", 9.6]], [["skidding", 26.75], ["music", 22.25], ["vehicle", 14.44]], [["music", 25.53], ["vehicle", 9.71], ["speech", 7.92]], [["music", 18.89], ["livestock, farm animals, working animals", 18.41], ["cattle, bovinae", 9.71]]], "duration": [0.59, 0.66, -0.1, -0.02, 0.75, 3.95, 8.94, 4.96, 0.77, 25.64, 18.55, 0.47, 1.44, 8.3, 0.61, 1.16, 11.14, 4.62, 8.63, 2.74, 3.2, 12.74]} \ No newline at end of file diff --git a/annotations_1/-zNnJiwo_5Y_filtered.json b/annotations_1/-zNnJiwo_5Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09d5d03bf4b451dc069f61f96301cb86c533590e --- /dev/null +++ b/annotations_1/-zNnJiwo_5Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 36.22], [38.0, 39.12], [44.0, 66.19], [68.0, 69.82], [72.0, 72.82], [79.0, 106.56], [109.0, 109.88], [112.0, 113.85]], "keep_status": [true, false, false, false, false, false, false, false], "silence_prob": [30.11, 0.0, 30.18, 0.0, 0.0, 30.43, 0.0, 0.0], "audiomae_on_audioset": [[["music", 36.13], ["didgeridoo", 9.52], ["wind instrument, woodwind instrument", 7.95]], null, [["music", 82.77], ["speech", 4.08], ["sampler", 1.59]], null, null, [["music", 74.49], ["psychedelic rock", 3.4], ["musical instrument", 2.66]], null, null], "duration": [2.22, 1.12, 22.19, 1.82, 0.82, 27.56, 0.88, 1.85]} \ No newline at end of file diff --git a/annotations_1/0-Whu5Hlbz8_filtered.json b/annotations_1/0-Whu5Hlbz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ed237ccbad1bb293a1639457c74abace44cb796 --- /dev/null +++ b/annotations_1/0-Whu5Hlbz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.33], [22.0, 30.75], [31.0, 30.79], [33.0, 34.32], [36.0, 36.8], [39.0, 39.41], [40.0, 40.81], [42.0, 43.07], [45.0, 46.38], [48.0, 48.49], [51.0, 52.22], [53.0, 54.21], [57.0, 56.83], [57.0, 59.88], [60.0, 61.48], [64.0, 65.85], [69.0, 71.04], [72.0, 72.62], [74.0, 75.59], [77.0, 77.5], [79.0, 79.2], [80.0, 80.25], [81.0, 82.12], [83.0, 83.67], [84.0, 85.77], [88.0, 88.94], [90.0, 89.88], [92.0, 108.6], [109.0, 117.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 64.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19, 47.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 68.71], ["fly, housefly", 4.16], ["explosion", 2.49]]], "duration": [0.33, 8.75, -0.21, 1.32, 0.8, 0.41, 0.81, 1.07, 1.38, 0.49, 1.22, 1.21, -0.17, 2.88, 1.48, 1.85, 2.04, 0.62, 1.59, 0.5, 0.2, 0.25, 1.12, 0.67, 1.77, 0.94, -0.12, 16.6, 8.73]} \ No newline at end of file diff --git a/annotations_1/003kLKX8n3E_filtered.json b/annotations_1/003kLKX8n3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..874dd3b54d5dbcfecaac8dc454d0c2d2077b229f --- /dev/null +++ b/annotations_1/003kLKX8n3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.25], [4.0, 4.38], [5.0, 5.81], [6.0, 11.26], [12.0, 13.05], [14.0, 14.54], [16.0, 32.24], [33.0, 34.59], [37.0, 43.11], [46.0, 48.96], [55.0, 55.9], [57.0, 60.0], [60.0, 61.18], [62.0, 63.81], [66.0, 66.51], [68.0, 76.81], [77.0, 76.96], [77.0, 80.27], [81.0, 87.34], [89.0, 89.53], [90.0, 90.17], [91.0, 91.45], [92.0, 92.25], [93.0, 92.91], [94.0, 95.18], [96.0, 99.49], [100.0, 100.11], [100.0, 101.36], [102.0, 105.44], [106.0, 107.76], [109.0, 112.04], [113.0, 115.4], [117.0, 118.49], [120.0, 120.28], [121.0, 121.44], [122.0, 122.66], [123.0, 123.28], [125.0, 124.88], [125.0, 125.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 60.89, 0.0, 0.0, 40.68, 0.0, 58.13, 75.55, 0.0, 57.4, 0.0, 0.0, 0.0, 51.23, 0.0, 70.86, 53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.43, 0.0, 0.0, 64.52, 0.0, 56.18, 56.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 64.46], ["didgeridoo", 8.5], ["musical instrument", 5.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.04], ["hum", 12.35], ["throbbing", 6.37]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 0.38, 0.81, 5.26, 1.05, 0.54, 16.24, 1.59, 6.11, 2.96, 0.9, 3.0, 1.18, 1.81, 0.51, 8.81, -0.04, 3.27, 6.34, 0.53, 0.17, 0.45, 0.25, -0.09, 1.18, 3.49, 0.11, 1.36, 3.44, 1.76, 3.04, 2.4, 1.49, 0.28, 0.44, 0.66, 0.28, -0.12, 0.74]} \ No newline at end of file diff --git a/annotations_1/00I2Ofraf4A_filtered.json b/annotations_1/00I2Ofraf4A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6df123e279367eff241e442e2cedb3038aae2ab0 --- /dev/null +++ b/annotations_1/00I2Ofraf4A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.25], [10.0, 21.51], [22.0, 22.4], [24.0, 24.7], [25.0, 30.84], [32.0, 33.93], [34.0, 35.92], [36.0, 37.25], [40.0, 42.47], [43.0, 47.21], [49.0, 50.43], [53.0, 57.7], [62.0, 62.43], [65.0, 75.15], [78.0, 82.0], [86.0, 92.55], [98.0, 98.39], [99.0, 99.98], [105.0, 106.22], [111.0, 113.86], [114.0, 122.94], [125.0, 140.32], [142.0, 142.25]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [41.2, 28.54, 0.0, 0.0, 35.62, 0.0, 0.0, 0.0, 54.36, 51.44, 0.0, 44.93, 0.0, 52.98, 55.11, 38.32, 0.0, 0.0, 0.0, 47.43, 39.94, 37.8, 0.0], "audiomae_on_audioset": [[["mechanical fan", 18.59], ["mains hum", 14.19], ["hum", 8.8]], [["music", 21.94], ["hum", 10.94], ["throbbing", 9.6]], null, null, [["sidetone", 40.89], ["speech", 37.8], ["music", 6.72]], null, null, null, null, null, null, [["sidetone", 43.6], ["speech", 20.46], ["hum", 6.8]], null, null, null, [["speech", 23.75], ["fly, housefly", 23.68], ["insect", 18.5]], null, null, null, [["speech", 20.82], ["hum", 18.78], ["rumble", 8.39]], [["speech", 64.62], ["music", 11.96], ["sidetone", 6.08]], [["speech", 56.82], ["hum", 16.89], ["sidetone", 7.17]], null], "duration": [2.25, 11.51, 0.4, 0.7, 5.84, 1.93, 1.92, 1.25, 2.47, 4.21, 1.43, 4.7, 0.43, 10.15, 4.0, 6.55, 0.39, 0.98, 1.22, 2.86, 8.94, 15.32, 0.25]} \ No newline at end of file diff --git a/annotations_1/00QMS3Ldb20_filtered.json b/annotations_1/00QMS3Ldb20_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd3038db201e628e85e91f1bde4d7abd4f71f44a --- /dev/null +++ b/annotations_1/00QMS3Ldb20_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 57.5], [58.0, 59.88], [61.0, 64.22], [65.0, 65.91], [67.0, 70.65], [71.0, 73.95], [76.0, 105.14], [106.0, 136.36], [139.0, 156.24], [159.0, 203.03], [204.0, 204.42], [207.0, 209.16], [211.0, 215.13]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, true, false], "silence_prob": [29.2, 0.0, 29.97, 0.0, 29.52, 28.74, 28.53, 0.0, 28.74, 0.0, 0.0, 38.43, 33.42], "audiomae_on_audioset": [[["music", 53.55], ["speech", 21.69], ["hum", 4.38]], null, [["music", 25.39], ["hum", 17.56], ["mains hum", 16.62]], null, [["speech", 45.16], ["music", 44.0], ["musical instrument", 2.37]], [["throbbing", 30.63], ["music", 27.0], ["hum", 21.52]], [["music", 58.26], ["musical instrument", 11.4], ["effects unit", 2.72]], null, [["music", 46.43], ["mains hum", 17.38], ["hum", 5.1]], null, null, [["hum", 37.84], ["mains hum", 18.79], ["throbbing", 5.32]], [["hum", 45.32], ["mains hum", 18.49], ["throbbing", 9.37]]], "duration": [7.5, 1.88, 3.22, 0.91, 3.65, 2.95, 29.14, 30.36, 17.24, 44.03, 0.42, 2.16, 4.13]} \ No newline at end of file diff --git a/annotations_1/02AyhONR_DQ_filtered.json b/annotations_1/02AyhONR_DQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec3c95032f54146d85087db81e27881cd3a342d1 --- /dev/null +++ b/annotations_1/02AyhONR_DQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.04], [7.0, 7.37], [8.0, 8.41], [15.0, 20.33], [28.0, 27.99], [32.0, 32.71], [35.0, 35.46], [37.0, 38.15], [38.0, 40.34], [43.0, 44.59], [45.0, 46.36], [51.0, 58.24], [60.0, 76.01], [76.0, 76.45], [77.0, 100.4], [105.0, 106.52], [113.0, 113.71], [115.0, 115.94], [118.0, 118.44], [119.0, 121.54]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 35.1, 0.0, 0.0, 0.0, 0.0, 42.06, 0.0, 0.0, 42.74, 39.05, 0.0, 31.44, 0.0, 0.0, 0.0, 0.0, 41.36], "audiomae_on_audioset": [null, null, null, [["speech", 47.38], ["music", 24.17], ["animal", 8.14]], null, null, null, null, [["music", 28.5], ["burping, eructation", 22.16], ["effects unit", 14.45]], null, null, [["animal", 38.69], ["music", 23.98], ["dog", 9.46]], [["animal", 24.79], ["ding", 10.85], ["music", 10.73]], null, [["music", 67.66], ["electronic music", 5.3], ["boing", 5.22]], null, null, null, null, [["music", 38.73], ["musical instrument", 6.99], ["effects unit", 6.34]]], "duration": [0.04, 0.37, 0.41, 5.33, -0.01, 0.71, 0.46, 1.15, 2.34, 1.59, 1.36, 7.24, 16.01, 0.45, 23.4, 1.52, 0.71, 0.94, 0.44, 2.54]} \ No newline at end of file diff --git a/annotations_1/03jGqiF-0Gg_filtered.json b/annotations_1/03jGqiF-0Gg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8b86eaf58a5148e20921cc3fb469ede5575284d --- /dev/null +++ b/annotations_1/03jGqiF-0Gg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.4], [6.0, 9.34], [11.0, 16.11], [17.0, 18.6], [21.0, 23.14], [24.0, 25.39], [26.0, 29.05], [33.0, 33.07], [37.0, 37.5], [52.0, 58.02]], "keep_status": [false, true, true, false, true, false, true, false, false, true], "silence_prob": [64.63, 40.26, 46.54, 0.0, 48.91, 0.0, 49.4, 0.0, 0.0, 37.85], "audiomae_on_audioset": [null, [["sidetone", 37.46], ["music", 10.98], ["speech", 10.23]], [["fly, housefly", 26.41], ["insect", 13.93], ["hum", 9.34]], null, [["music", 24.91], ["hum", 12.38], ["throbbing", 6.21]], null, [["hum", 25.63], ["music", 12.27], ["throbbing", 6.23]], null, null, [["mains hum", 23.56], ["hum", 15.96], ["noise", 12.73]]], "duration": [2.4, 3.34, 5.11, 1.6, 2.14, 1.39, 3.05, 0.07, 0.5, 6.02]} \ No newline at end of file diff --git a/annotations_1/03uEq5dKcFs_filtered.json b/annotations_1/03uEq5dKcFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad2599b8de1eb9e3e75038b7c243667c15ef68e4 --- /dev/null +++ b/annotations_1/03uEq5dKcFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.47], [15.0, 15.3], [19.0, 27.03], [32.0, 33.52], [34.0, 33.81], [34.0, 34.92], [36.0, 36.19], [38.0, 38.37], [39.0, 39.77], [41.0, 42.13], [47.0, 47.92], [49.0, 49.55], [50.0, 51.26], [52.0, 52.42], [54.0, 53.94], [56.0, 58.01], [59.0, 59.12], [65.0, 65.38], [69.0, 70.78], [73.0, 75.1], [78.0, 78.04], [87.0, 87.03], [89.0, 91.1], [93.0, 93.72], [100.0, 100.38], [106.0, 106.3], [116.0, 118.18], [123.0, 123.87], [125.0, 125.24], [126.0, 144.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 92.8], "audiomae_on_audioset": [null, null, [["speech", 90.01], ["radio", 1.0], ["inside, small room", 0.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.3, 8.03, 1.52, -0.19, 0.92, 0.19, 0.37, 0.77, 1.13, 0.92, 0.55, 1.26, 0.42, -0.06, 2.01, 0.12, 0.38, 1.78, 2.1, 0.04, 0.03, 2.1, 0.72, 0.38, 0.3, 2.18, 0.87, 0.24, 18.0]} \ No newline at end of file diff --git a/annotations_1/056HlHORCIU_filtered.json b/annotations_1/056HlHORCIU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7ef615d6de9348828f9dfb0ba6dabb7308f1525 --- /dev/null +++ b/annotations_1/056HlHORCIU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.02], [4.0, 4.58], [7.0, 7.89], [9.0, 10.69], [11.0, 20.46], [21.0, 21.61], [24.0, 28.38], [29.0, 29.3], [32.0, 37.32], [38.0, 48.74]], "keep_status": [false, false, false, false, true, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.1, 0.0, 30.59, 0.0, 29.99, 29.66], "audiomae_on_audioset": [null, null, null, null, [["hum", 23.75], ["speech", 21.77], ["mains hum", 14.05]], null, [["music", 49.09], ["buzz", 7.38], ["noise", 4.81]], null, [["music", 14.84], ["cacophony", 12.98], ["synthesizer", 10.44]], [["buzz", 32.4], ["vehicle", 14.19], ["music", 7.63]]], "duration": [1.02, 0.58, 0.89, 1.69, 9.46, 0.61, 4.38, 0.3, 5.32, 10.74]} \ No newline at end of file diff --git a/annotations_1/05foBuX_brU_filtered.json b/annotations_1/05foBuX_brU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed002d9c4baaa5e71e6325b96e26e66c3573f8f5 --- /dev/null +++ b/annotations_1/05foBuX_brU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.48], [13.0, 13.9], [18.0, 18.18], [19.0, 20.09], [20.0, 20.58], [26.0, 26.05], [32.0, 33.03], [34.0, 34.7], [36.0, 36.71], [42.0, 42.57], [43.0, 44.56], [45.0, 46.14], [46.0, 46.7], [65.0, 66.43], [71.0, 72.0], [73.0, 72.96], [75.0, 76.3], [83.0, 82.88], [84.0, 85.04], [86.0, 86.19], [86.0, 86.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.9, 0.18, 1.09, 0.58, 0.05, 1.03, 0.7, 0.71, 0.57, 1.56, 1.14, 0.7, 1.43, 1.0, -0.04, 1.3, -0.12, 1.04, 0.19, 0.32]} \ No newline at end of file diff --git a/annotations_1/05qid4p_cfw_filtered.json b/annotations_1/05qid4p_cfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fbc3dd4dfa01ae381bf0650f237b1c65a15522e --- /dev/null +++ b/annotations_1/05qid4p_cfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.36], [10.0, 10.23], [12.0, 11.97], [15.0, 16.04], [17.0, 18.57], [21.0, 21.84], [24.0, 26.06], [31.0, 32.93], [38.0, 39.16], [51.0, 51.12], [79.0, 79.57], [89.0, 90.59], [107.0, 106.79], [109.0, 110.4], [136.0, 137.19], [147.0, 148.07], [151.0, 156.1], [160.0, 162.19], [164.0, 168.12], [181.0, 183.51], [184.0, 185.52], [187.0, 192.06], [197.0, 198.56], [202.0, 203.77], [213.0, 212.8], [215.0, 215.0], [223.0, 224.4], [229.0, 230.77], [231.0, 234.67], [238.0, 238.84]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.72, 29.44, 29.05, 31.69, 0.0, 37.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 59.19], ["electronic music", 5.43], ["trance music", 3.77]], null, null, null, null, null, null, null, null, null, [["throbbing", 48.34], ["hum", 38.96], ["music", 6.13]], [["music", 61.62], ["speech", 5.42], ["electronic music", 4.35]], [["music", 70.83], ["electronic music", 5.54], ["static", 3.39]], [["music", 37.68], ["speech", 10.42], ["moo", 4.79]], null, [["music", 67.66], ["whack, thwack", 7.8], ["thunk", 2.1]], null, null, null, null, null, null, [["music", 67.71], ["lullaby", 1.74], ["singing", 1.74]], null], "duration": [0.36, 0.23, -0.03, 1.04, 1.57, 0.84, 2.06, 1.93, 1.16, 0.12, 0.57, 1.59, -0.21, 1.4, 1.19, 1.07, 5.1, 2.19, 4.12, 2.51, 1.52, 5.06, 1.56, 1.77, -0.2, 0.0, 1.4, 1.77, 3.67, 0.84]} \ No newline at end of file diff --git a/annotations_1/06DLNzLaTlE_filtered.json b/annotations_1/06DLNzLaTlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3555dedb97bc5e14a17c8728e72d34f116ece2d --- /dev/null +++ b/annotations_1/06DLNzLaTlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.53], [8.0, 8.41], [9.0, 9.66], [14.0, 23.63], [24.0, 34.86], [40.0, 47.85], [49.0, 51.19], [53.0, 53.27], [59.0, 58.94], [60.0, 60.45], [61.0, 61.53], [66.0, 66.36], [68.0, 68.47], [69.0, 70.48], [72.0, 72.32], [75.0, 75.46], [78.0, 79.79], [82.0, 82.41], [84.0, 84.87], [88.0, 88.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.99, 31.5, 33.42, 61.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 56.01], ["synthesizer", 10.4], ["theremin", 5.38]], [["music", 67.78], ["speech", 10.0], ["theremin", 4.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 0.41, 0.66, 9.63, 10.86, 7.85, 2.19, 0.27, -0.06, 0.45, 0.53, 0.36, 0.47, 1.48, 0.32, 0.46, 1.79, 0.41, 0.87, 0.38]} \ No newline at end of file diff --git a/annotations_1/06L5y4Z9KcE_filtered.json b/annotations_1/06L5y4Z9KcE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1de5b19eabc356809923f45f7fe3a66cf70930b3 --- /dev/null +++ b/annotations_1/06L5y4Z9KcE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.53], [21.0, 21.15], [28.0, 32.53], [34.0, 44.41], [44.0, 44.51], [45.0, 44.73], [45.0, 48.96], [50.0, 50.31], [52.0, 51.68], [54.0, 54.45], [69.0, 74.07], [75.0, 75.79], [81.0, 81.09], [83.0, 84.23], [86.0, 86.26], [88.0, 89.16], [92.0, 93.58], [95.0, 94.93], [97.0, 109.78], [112.0, 112.38], [113.0, 113.95], [124.0, 125.31], [126.0, 126.39], [128.0, 130.01], [132.0, 133.56], [138.0, 142.47], [145.0, 145.18], [146.0, 146.42], [147.0, 157.22], [158.0, 161.25], [165.0, 167.9], [168.0, 167.95], [169.0, 168.94]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.16, 33.87, 0.0, 0.0, 95.64, 0.0, 0.0, 0.0, 34.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.85, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 31.61, 0.0, 0.0, 33.0, 81.89, 82.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 43.04], ["mosquito", 12.57], ["insect", 12.29]], [["electric shaver, electric razor", 43.47], ["mains hum", 25.92], ["hum", 14.2]], null, null, null, null, null, null, [["music", 63.24], ["effects unit", 9.91], ["guitar", 6.26]], null, null, null, null, null, null, null, [["speech", 31.88], ["mains hum", 14.2], ["hum", 14.01]], null, null, null, null, null, null, [["fart", 17.88], ["music", 13.06], ["explosion", 12.87]], null, null, [["buzz", 50.24], ["fly, housefly", 17.78], ["insect", 10.61]], null, null, null, null], "duration": [1.53, 0.15, 4.53, 10.41, 0.51, -0.27, 3.96, 0.31, -0.32, 0.45, 5.07, 0.79, 0.09, 1.23, 0.26, 1.16, 1.58, -0.07, 12.78, 0.38, 0.95, 1.31, 0.39, 2.01, 1.56, 4.47, 0.18, 0.42, 10.22, 3.25, 2.9, -0.05, -0.06]} \ No newline at end of file diff --git a/annotations_1/06qgu4XoNL4_filtered.json b/annotations_1/06qgu4XoNL4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..119b179c7f49a953464730bf4545850f20fb8a87 --- /dev/null +++ b/annotations_1/06qgu4XoNL4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.17], [7.0, 8.36], [9.0, 9.69], [10.0, 11.08], [12.0, 13.22], [15.0, 17.86], [18.0, 19.2], [20.0, 21.98], [22.0, 22.23], [22.0, 24.56], [31.0, 34.21], [39.0, 41.98], [43.0, 51.97], [54.0, 54.51], [61.0, 62.58], [67.0, 69.89], [70.0, 71.22], [74.0, 77.57], [78.0, 78.87], [81.0, 81.87], [83.0, 85.56], [87.0, 87.18], [89.0, 89.94], [91.0, 94.1], [95.0, 95.89], [100.0, 100.26], [101.0, 101.53], [102.0, 102.03], [104.0, 104.6], [117.0, 116.88], [118.0, 118.81], [119.0, 120.04], [121.0, 121.27], [122.0, 129.9], [145.0, 146.42], [147.0, 153.86], [157.0, 157.05], [158.0, 158.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.48, 0.0, 0.0, 0.0, 32.94, 36.32, 32.13, 42.79, 0.0, 0.0, 39.86, 0.0, 42.08, 0.0, 0.0, 47.86, 0.0, 0.0, 45.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.44, 0.0, 41.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 83.86], ["musical instrument", 3.73], ["electronic music", 2.81]], null, null, null, [["speech", 41.07], ["music", 39.75], ["sonar", 2.58]], [["livestock, farm animals, working animals", 43.24], ["cattle, bovinae", 31.91], ["moo", 16.67]], [["cattle, bovinae", 22.43], ["speech", 22.12], ["livestock, farm animals, working animals", 17.92]], [["music", 25.76], ["didgeridoo", 19.8], ["speech", 15.61]], null, null, [["speech", 87.55], ["radio", 3.48], ["speech synthesizer", 0.77]], null, [["speech", 38.27], ["music", 14.65], ["boing", 6.65]], null, null, [["heart sounds, heartbeat", 22.74], ["throbbing", 18.96], ["hum", 15.19]], null, null, [["speech", 57.35], ["sidetone", 11.02], ["music", 9.47]], null, null, null, null, null, null, null, null, null, [["music", 71.6], ["guitar", 6.11], ["bass guitar", 5.83]], null, [["music", 28.15], ["hum", 12.62], ["throbbing", 11.28]], null, null], "duration": [1.17, 1.36, 0.69, 1.08, 1.22, 2.86, 1.2, 1.98, 0.23, 2.56, 3.21, 2.98, 8.97, 0.51, 1.58, 2.89, 1.22, 3.57, 0.87, 0.87, 2.56, 0.18, 0.94, 3.1, 0.89, 0.26, 0.53, 0.03, 0.6, -0.12, 0.81, 1.04, 0.27, 7.9, 1.42, 6.86, 0.05, 0.38]} \ No newline at end of file diff --git a/annotations_1/07GcBnddoMU_filtered.json b/annotations_1/07GcBnddoMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63cbee2fc67730a4ff1715fda124488e6cc0a1bc --- /dev/null +++ b/annotations_1/07GcBnddoMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 64.29], [65.0, 77.09], [79.0, 88.57], [91.0, 109.56], [112.0, 113.98], [115.0, 124.46], [126.0, 125.59], [126.0, 133.12], [134.0, 134.03], [138.0, 140.93], [142.0, 142.86], [146.0, 146.25], [148.0, 148.29], [152.0, 152.93], [156.0, 166.83]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.78, 55.39, 94.66, 0.0, 36.83, 0.0, 82.97, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 94.22], "audiomae_on_audioset": [null, [["music", 35.27], ["groan", 4.95], ["animal", 4.06]], null, null, null, [["speech", 52.58], ["whack, thwack", 24.32], ["breaking", 9.51]], null, null, null, null, null, null, null, null, null], "duration": [1.29, 12.09, 9.57, 18.56, 1.98, 9.46, -0.41, 7.12, 0.03, 2.93, 0.86, 0.25, 0.29, 0.93, 10.83]} \ No newline at end of file diff --git a/annotations_1/07kluxoO8j8_filtered.json b/annotations_1/07kluxoO8j8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e086ff25cf4031b6fb1f41cda36ea28a868c189c --- /dev/null +++ b/annotations_1/07kluxoO8j8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.32], [12.0, 12.6], [14.0, 14.98], [18.0, 18.22], [32.0, 34.01], [38.0, 40.05], [42.0, 44.39], [46.0, 52.12], [53.0, 64.59], [70.0, 74.21], [75.0, 81.5], [86.0, 98.64], [102.0, 111.92], [114.0, 123.69], [127.0, 126.64], [130.0, 130.92], [136.0, 139.53], [143.0, 143.88], [147.0, 150.72], [151.0, 154.08], [155.0, 157.89], [161.0, 164.81], [167.0, 171.71], [172.0, 184.54], [186.0, 200.04]], "keep_status": [false, false, false, false, false, false, true, true, true, true, true, true, false, false, false, false, false, false, true, true, true, true, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.73, 34.2, 33.72, 35.57, 33.89, 36.59, 35.76, 29.87, 29.42, 29.36, 0.0, 0.0, 30.8, 0.0, 28.7, 28.88, 29.27, 29.01, 30.75, 29.15, 29.25], "audiomae_on_audioset": [null, null, null, null, [["speech", 28.26], ["music", 24.28], ["hum", 21.43]], [["music", 73.34], ["hum", 4.63], ["electronic music", 3.03]], [["speech", 24.28], ["sidetone", 20.96], ["music", 15.12]], [["music", 43.26], ["hum", 15.94], ["noise", 7.85]], [["speech", 37.44], ["music", 18.56], ["hum", 10.47]], [["music", 37.86], ["effects unit", 8.16], ["synthesizer", 6.31]], [["music", 57.0], ["animal", 8.24], ["musical instrument", 4.41]], [["livestock, farm animals, working animals", 31.29], ["cattle, bovinae", 23.17], ["speech", 14.1]], [["music", 75.34], ["speech", 2.23], ["musical instrument", 1.92]], [["music", 39.57], ["hum", 21.75], ["mains hum", 9.2]], null, null, [["hum", 39.25], ["mains hum", 30.73], ["throbbing", 18.51]], null, [["music", 17.25], ["speech", 8.26], ["vehicle", 7.54]], [["music", 20.03], ["rumble", 14.29], ["mains hum", 7.13]], [["music", 32.78], ["whale vocalization", 13.05], ["speech", 8.58]], [["music", 48.44], ["cacophony", 17.03], ["throbbing", 3.41]], [["music", 55.04], ["brass instrument", 6.63], ["trombone", 6.42]], [["music", 34.22], ["throbbing", 11.13], ["hum", 8.52]], [["music", 38.14], ["speech", 22.32], ["throbbing", 4.56]]], "duration": [0.32, 0.6, 0.98, 0.22, 2.01, 2.05, 2.39, 6.12, 11.59, 4.21, 6.5, 12.64, 9.92, 9.69, -0.36, 0.92, 3.53, 0.88, 3.72, 3.08, 2.89, 3.81, 4.71, 12.54, 14.04]} \ No newline at end of file diff --git a/annotations_1/088CLxgnr8w_filtered.json b/annotations_1/088CLxgnr8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1550ad1855fe0025a3cada787b66ba55ed9f5ad6 --- /dev/null +++ b/annotations_1/088CLxgnr8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.54], [5.0, 5.66], [10.0, 11.47], [12.0, 15.58], [16.0, 18.39], [19.0, 20.88], [22.0, 23.36], [24.0, 25.66], [27.0, 31.51], [33.0, 34.75], [37.0, 37.54], [46.0, 46.3], [55.0, 65.37], [72.0, 73.28], [76.0, 76.76], [105.0, 109.17], [113.0, 114.4], [117.0, 117.56], [121.0, 126.77], [129.0, 141.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 52.1, 54.43, 0.0, 0.0, 0.0, 54.9, 0.0, 0.0, 0.0, 56.63, 0.0, 0.0, 54.56, 0.0, 0.0, 57.89, 54.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.54, 0.66, 1.47, 3.58, 2.39, 1.88, 1.36, 1.66, 4.51, 1.75, 0.54, 0.3, 10.37, 1.28, 0.76, 4.17, 1.4, 0.56, 5.77, 12.51]} \ No newline at end of file diff --git a/annotations_1/08NzJRNAFGc_filtered.json b/annotations_1/08NzJRNAFGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e80e9a4e5b715823bfa635b671450977fda8ee1 --- /dev/null +++ b/annotations_1/08NzJRNAFGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 19.82], [20.0, 23.9], [28.0, 28.53], [31.0, 32.37], [34.0, 34.82], [35.0, 35.94], [36.0, 37.94], [38.0, 40.59], [41.0, 42.03], [43.0, 44.31], [46.0, 49.33], [51.0, 53.54], [56.0, 57.13], [60.0, 67.05], [68.0, 70.43], [71.0, 72.96], [74.0, 76.69], [78.0, 78.95], [79.0, 81.53], [82.0, 83.73], [91.0, 90.85], [98.0, 98.86], [103.0, 104.14], [106.0, 107.7], [114.0, 114.2], [118.0, 118.42], [119.0, 119.62], [122.0, 124.31], [126.0, 126.67]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [50.06, 36.25, 0.0, 0.0, 0.0, 0.0, 0.0, 33.63, 0.0, 0.0, 54.97, 98.59, 0.0, 83.52, 92.15, 0.0, 70.02, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0], "audiomae_on_audioset": [null, [["speech", 29.92], ["sidetone", 22.5], ["hum", 10.62]], null, null, null, null, null, [["stomach rumble", 42.7], ["sine wave", 11.39], ["fart", 6.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.82, 3.9, 0.53, 1.37, 0.82, 0.94, 1.94, 2.59, 1.03, 1.31, 3.33, 2.54, 1.13, 7.05, 2.43, 1.96, 2.69, 0.95, 2.53, 1.73, -0.15, 0.86, 1.14, 1.7, 0.2, 0.42, 0.62, 2.31, 0.67]} \ No newline at end of file diff --git a/annotations_1/08rJmhhQHtY_filtered.json b/annotations_1/08rJmhhQHtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5b771ec777eb43b6839937638bb50f1a612ebac --- /dev/null +++ b/annotations_1/08rJmhhQHtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.83], [10.0, 12.38], [21.0, 33.42], [38.0, 45.1], [46.0, 46.36], [50.0, 50.97], [52.0, 54.33], [55.0, 56.02], [58.0, 58.77], [64.0, 64.59], [66.0, 67.42], [70.0, 70.21], [75.0, 85.21], [88.0, 89.68], [91.0, 91.25], [92.0, 92.06], [93.0, 98.66], [99.0, 100.04], [106.0, 106.76], [109.0, 114.71], [115.0, 119.3]], "keep_status": [false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 51.71, 44.69, 39.91, 0.0, 0.0, 41.62, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 81.0, 45.69], "audiomae_on_audioset": [null, null, [["male singing", 29.4], ["speech", 29.3], ["clapping", 10.78]], [["speech", 60.62], ["fart", 5.94], ["moo", 3.11]], null, null, [["speech", 21.71], ["clapping", 6.3], ["livestock, farm animals, working animals", 5.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.7], ["hands", 8.2], ["music", 8.1]]], "duration": [0.83, 2.38, 12.42, 7.1, 0.36, 0.97, 2.33, 1.02, 0.77, 0.59, 1.42, 0.21, 10.21, 1.68, 0.25, 0.06, 5.66, 1.04, 0.76, 5.71, 4.3]} \ No newline at end of file diff --git a/annotations_1/09zP4iK6QuI_filtered.json b/annotations_1/09zP4iK6QuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2d97763d47fc3c0312caa01f4d81179fd66e033 --- /dev/null +++ b/annotations_1/09zP4iK6QuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.88], [20.0, 24.65], [26.0, 28.27], [28.0, 28.39], [29.0, 31.4], [38.0, 38.26], [46.0, 46.21], [53.0, 56.52], [59.0, 79.62], [90.0, 90.41], [97.0, 96.92], [98.0, 99.25], [101.0, 102.84], [104.0, 104.82], [105.0, 111.08], [111.0, 112.36], [115.0, 117.53]], "keep_status": [false, true, true, false, true, false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 37.82, 30.39, 0.0, 46.72, 0.0, 0.0, 35.25, 37.1, 0.0, 0.0, 0.0, 0.0, 0.0, 36.49, 0.0, 39.52], "audiomae_on_audioset": [null, [["music", 40.62], ["throbbing", 14.04], ["hum", 12.85]], [["music", 37.31], ["throbbing", 17.45], ["hum", 11.19]], null, [["speech", 24.3], ["music", 17.77], ["radio", 16.7]], null, null, [["speech", 35.46], ["thunk", 8.59], ["music", 7.29]], [["music", 46.28], ["glass", 25.95], ["theremin", 3.11]], null, null, null, null, null, [["hum", 53.41], ["mains hum", 17.14], ["throbbing", 7.7]], null, [["speech", 16.14], ["rumble", 12.84], ["music", 7.88]]], "duration": [-0.12, 4.65, 2.27, 0.39, 2.4, 0.26, 0.21, 3.52, 20.62, 0.41, -0.08, 1.25, 1.84, 0.82, 6.08, 1.36, 2.53]} \ No newline at end of file diff --git a/annotations_1/0ACTvENkyD8_filtered.json b/annotations_1/0ACTvENkyD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3821fcdc7547a3af05260ffb660b2d3a41895d0a --- /dev/null +++ b/annotations_1/0ACTvENkyD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 20.02], [23.0, 23.99], [25.0, 27.4], [28.0, 30.38], [32.0, 34.05], [36.0, 36.86], [38.0, 39.21], [40.0, 42.4], [43.0, 53.67], [54.0, 60.0], [61.0, 76.72], [79.0, 88.48], [89.0, 118.4], [119.0, 119.42]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, true, false], "silence_prob": [29.52, 0.0, 84.98, 45.36, 79.07, 0.0, 0.0, 54.5, 38.42, 38.14, 28.74, 35.33, 28.92, 0.0], "audiomae_on_audioset": [[["speech", 41.36], ["music", 28.54], ["didgeridoo", 6.52]], null, null, [["busy signal", 52.25], ["music", 15.58], ["synthesizer", 5.23]], null, null, null, null, [["speech", 35.21], ["music", 24.17], ["animal", 4.96]], [["music", 29.32], ["dog", 15.91], ["animal", 10.52]], [["music", 74.38], ["throbbing", 4.72], ["sound effect", 2.06]], [["music", 50.89], ["speech", 16.07], ["livestock, farm animals, working animals", 4.29]], [["music", 48.79], ["groan", 6.93], ["fly, housefly", 6.43]], null], "duration": [19.02, 0.99, 2.4, 2.38, 2.05, 0.86, 1.21, 2.4, 10.67, 6.0, 15.72, 9.48, 29.4, 0.42]} \ No newline at end of file diff --git a/annotations_1/0BM-Q3BDrkw_filtered.json b/annotations_1/0BM-Q3BDrkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb956dc90f8b98665420d8bb0590d47a902fa352 --- /dev/null +++ b/annotations_1/0BM-Q3BDrkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.53], [14.0, 17.47], [20.0, 22.45], [25.0, 26.59], [28.0, 31.48], [35.0, 37.47], [41.0, 43.48], [46.0, 48.3], [55.0, 57.79], [62.0, 63.37], [67.0, 68.67], [73.0, 73.4], [78.0, 78.97], [83.0, 84.57], [87.0, 87.71], [89.0, 93.24], [95.0, 98.44], [100.0, 103.35], [107.0, 108.97], [113.0, 113.91], [116.0, 117.75], [122.0, 123.9], [128.0, 128.49], [131.0, 133.17], [136.0, 136.9], [146.0, 147.21], [150.0, 151.39], [155.0, 156.93], [160.0, 163.76], [168.0, 170.28], [174.0, 181.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 98.27, 82.43, 0.0, 99.97, 87.55, 95.64, 76.86, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 90.08, 63.96, 0.0, 0.0, 0.0, 0.0, 0.0, 30.8, 0.0, 0.0, 0.0, 0.0, 92.97, 100.0, 92.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 75.61], ["carnatic music", 3.11], ["musical instrument", 2.39]], null, null, null, null, null, null, null], "duration": [4.53, 3.47, 2.45, 1.59, 3.48, 2.47, 2.48, 2.3, 2.79, 1.37, 1.67, 0.4, 0.97, 1.57, 0.71, 4.24, 3.44, 3.35, 1.97, 0.91, 1.75, 1.9, 0.49, 2.17, 0.9, 1.21, 1.39, 1.93, 3.76, 2.28, 7.9]} \ No newline at end of file diff --git a/annotations_1/0C-qxjiDP1o_filtered.json b/annotations_1/0C-qxjiDP1o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dffedbcd69ffefce09f90b7f4727ce7ac611e9a1 --- /dev/null +++ b/annotations_1/0C-qxjiDP1o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.17], [6.0, 14.47], [28.0, 30.45], [40.0, 40.81]], "keep_status": [false, false, false, false], "silence_prob": [98.1, 30.49, 30.57, 0.0], "audiomae_on_audioset": [null, [["music", 68.45], ["synthesizer", 8.6], ["electronic music", 6.37]], [["music", 91.41], ["electronic music", 1.88], ["hip hop music", 1.61]], null], "duration": [3.17, 8.47, 2.45, 0.81]} \ No newline at end of file diff --git a/annotations_1/0C4yBk6syOE_filtered.json b/annotations_1/0C4yBk6syOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0287ce0bcd765b2fbdc23ba1598660f2d5a6331a --- /dev/null +++ b/annotations_1/0C4yBk6syOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [15.0, 14.79], [15.0, 15.67], [18.0, 18.54], [19.0, 20.71], [22.0, 22.99], [25.0, 25.3], [30.0, 29.94], [36.0, 36.59], [38.0, 37.79], [43.0, 44.93], [47.0, 48.36], [51.0, 52.2], [56.0, 56.22], [58.0, 61.21], [62.0, 66.51], [79.0, 78.87], [89.0, 89.53], [104.0, 104.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.3, 34.74, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.57], ["sidetone", 33.3], ["telephone", 7.37]], [["speech", 79.84], ["telephone", 4.75], ["inside, small room", 2.54]], null, null, null], "duration": [0.6, -0.21, 0.67, 0.54, 1.71, 0.99, 0.3, -0.06, 0.59, -0.21, 1.93, 1.36, 1.2, 0.22, 3.21, 4.51, -0.13, 0.53, 0.6]} \ No newline at end of file diff --git a/annotations_1/0CYdSfhwWVY_filtered.json b/annotations_1/0CYdSfhwWVY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94309ccbc1c651cfd99b83dd899e5b7ccb72fc69 --- /dev/null +++ b/annotations_1/0CYdSfhwWVY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.77], [10.0, 10.18], [34.0, 35.33], [38.0, 40.04], [43.0, 42.89], [43.0, 45.91], [47.0, 47.28], [48.0, 51.21], [51.0, 52.03], [55.0, 55.07], [58.0, 57.92], [58.0, 58.97], [60.0, 61.64], [62.0, 62.36], [64.0, 65.16], [67.0, 67.53], [71.0, 71.81], [85.0, 84.86], [89.0, 89.6], [91.0, 91.12], [92.0, 93.24], [97.0, 96.96], [98.0, 98.91], [102.0, 102.83], [104.0, 106.32], [109.0, 109.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 75.88, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.6, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.23, 0.18, 1.33, 2.04, -0.11, 2.91, 0.28, 3.21, 1.03, 0.07, -0.08, 0.97, 1.64, 0.36, 1.16, 0.53, 0.81, -0.14, 0.6, 0.12, 1.24, -0.04, 0.91, 0.83, 2.32, 0.43]} \ No newline at end of file diff --git a/annotations_1/0Cufl5Gao98_filtered.json b/annotations_1/0Cufl5Gao98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80b8918f2f6634898b29ed8be3baf975ce39e581 --- /dev/null +++ b/annotations_1/0Cufl5Gao98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.36], [12.0, 12.02], [12.0, 13.83], [15.0, 17.41], [20.0, 22.57], [23.0, 24.21], [31.0, 34.1], [36.0, 37.08], [37.0, 38.01], [40.0, 41.37], [47.0, 48.69], [52.0, 58.18], [59.0, 59.61], [61.0, 61.84], [63.0, 63.98], [69.0, 70.85], [72.0, 72.5], [77.0, 80.33], [82.0, 83.22], [86.0, 88.92], [92.0, 91.93], [95.0, 95.37], [100.0, 101.88], [103.0, 106.03], [108.0, 111.59], [115.0, 116.41], [117.0, 118.1], [119.0, 120.31], [124.0, 124.82], [127.0, 140.58], [141.0, 140.61], [148.0, 149.4], [165.0, 164.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.14, 66.39, 0.0, 70.44, 0.0, 0.0, 0.0, 0.0, 40.82, 0.0, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 100.0, 0.0, 0.0, 0.0, 99.95, 98.66, 0.0, 0.0, 0.0, 0.0, 41.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 74.61], ["boing", 4.4], ["music", 2.26]], null, null, null, null, null, null, null, [["applause", 72.44], ["clapping", 5.36], ["music", 4.7]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 81.34], ["applause", 4.44], ["sidetone", 2.31]], null, null, null], "duration": [0.36, 0.02, 1.83, 2.41, 2.57, 1.21, 3.1, 1.08, 1.01, 1.37, 1.69, 6.18, 0.61, 0.84, 0.98, 1.85, 0.5, 3.33, 1.22, 2.92, -0.07, 0.37, 1.88, 3.03, 3.59, 1.41, 1.1, 1.31, 0.82, 13.58, -0.39, 1.4, -0.06]} \ No newline at end of file diff --git a/annotations_1/0D35LZ4UBX8_filtered.json b/annotations_1/0D35LZ4UBX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0398e55a6b07868211c72e12f384b3ad4d8b8b3 --- /dev/null +++ b/annotations_1/0D35LZ4UBX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.5], [21.0, 21.24], [29.0, 30.84], [39.0, 40.98], [43.0, 43.66], [45.0, 45.66], [48.0, 50.19], [58.0, 59.07], [59.0, 65.69], [72.0, 72.06], [73.0, 74.55], [78.0, 79.27], [82.0, 82.26], [84.0, 86.63], [87.0, 88.18], [90.0, 91.54], [102.0, 104.6], [123.0, 123.35], [128.0, 133.12], [136.0, 136.63], [138.0, 140.95], [142.0, 152.05], [157.0, 163.29], [166.0, 166.58], [168.0, 170.31]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [30.28, 0.0, 0.0, 0.0, 0.0, 0.0, 31.86, 0.0, 31.99, 0.0, 0.0, 0.0, 0.0, 32.92, 0.0, 0.0, 30.7, 0.0, 31.19, 0.0, 81.35, 31.15, 31.25, 0.0, 34.75], "audiomae_on_audioset": [[["speech", 56.96], ["music", 6.34], ["applause", 5.59]], null, null, null, null, null, [["music", 40.55], ["didgeridoo", 40.25], ["musical instrument", 4.2]], null, [["music", 45.88], ["speech", 16.75], ["didgeridoo", 11.92]], null, null, null, null, [["speech", 69.63], ["music", 11.3], ["tap", 4.7]], null, null, [["speech", 39.13], ["music", 28.38], ["tap", 4.33]], null, [["music", 54.08], ["didgeridoo", 8.95], ["musical instrument", 4.2]], null, null, [["music", 53.4], ["didgeridoo", 35.1], ["musical instrument", 2.81]], [["music", 49.59], ["percussion", 11.05], ["didgeridoo", 10.18]], null, [["speech", 30.73], ["sidetone", 14.5], ["whale vocalization", 6.54]]], "duration": [2.5, 0.24, 1.84, 1.98, 0.66, 0.66, 2.19, 1.07, 6.69, 0.06, 1.55, 1.27, 0.26, 2.63, 1.18, 1.54, 2.6, 0.35, 5.12, 0.63, 2.95, 10.05, 6.29, 0.58, 2.31]} \ No newline at end of file diff --git a/annotations_1/0Dp--gKKMJ8_filtered.json b/annotations_1/0Dp--gKKMJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af2a595e48beb6e3c4da560897488fa944ddb501 --- /dev/null +++ b/annotations_1/0Dp--gKKMJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.53], [17.0, 19.21], [20.0, 21.24], [24.0, 23.63], [25.0, 25.52], [28.0, 28.56], [33.0, 34.05], [36.0, 37.1], [40.0, 43.44], [50.0, 55.12], [59.0, 65.53], [69.0, 70.75], [72.0, 73.47], [75.0, 76.0], [86.0, 86.61], [87.0, 86.98], [94.0, 109.32], [119.0, 126.25], [127.0, 127.13], [128.0, 130.23], [131.0, 132.75]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 37.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.28, 33.76, 32.92, 0.0, 0.0, 0.0, 0.0, 0.0, 33.53, 34.75, 0.0, 32.14, 0.0], "audiomae_on_audioset": [null, [["music", 58.91], ["speech", 9.99], ["musical instrument", 6.86]], null, null, null, null, null, null, [["music", 29.92], ["speech", 14.12], ["gobble", 8.87]], [["frog", 28.86], ["croak", 20.26], ["music", 16.56]], [["music", 80.41], ["musical instrument", 3.0], ["swing music", 1.67]], null, null, null, null, null, [["music", 64.29], ["speech", 10.67], ["didgeridoo", 7.42]], [["music", 55.28], ["speech", 23.93], ["didgeridoo", 2.96]], null, [["animal", 12.72], ["livestock, farm animals, working animals", 12.07], ["speech", 11.72]], null], "duration": [1.53, 2.21, 1.24, -0.37, 0.52, 0.56, 1.05, 1.1, 3.44, 5.12, 6.53, 1.75, 1.47, 1.0, 0.61, -0.02, 15.32, 7.25, 0.13, 2.23, 1.75]} \ No newline at end of file diff --git a/annotations_1/0EQXnRlIbXs_filtered.json b/annotations_1/0EQXnRlIbXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2edb2a33f4f082682b502924f779f0acdc7b3345 --- /dev/null +++ b/annotations_1/0EQXnRlIbXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 36.36], [38.0, 38.75], [42.0, 42.63], [46.0, 47.14], [48.0, 49.64], [54.0, 59.51], [63.0, 77.8], [79.0, 92.25], [93.0, 109.22], [111.0, 128.65], [132.0, 140.53], [143.0, 143.4], [144.0, 144.91]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [94.07, 0.0, 0.0, 0.0, 0.0, 40.82, 79.07, 67.25, 94.81, 93.6, 99.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 34.61], ["music", 22.12], ["boing", 4.45]], null, null, null, null, null, null, null], "duration": [6.36, 0.75, 0.63, 1.14, 1.64, 5.51, 14.8, 13.25, 16.22, 17.65, 8.53, 0.4, 0.91]} \ No newline at end of file diff --git a/annotations_1/0ERIepJUdPc_filtered.json b/annotations_1/0ERIepJUdPc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d87ddf4417bf94c1ab432cd0c9cce8aee202c2d --- /dev/null +++ b/annotations_1/0ERIepJUdPc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.56], [3.0, 3.38], [4.0, 4.33], [12.0, 11.67], [12.0, 25.95], [28.0, 35.04], [38.0, 59.46], [64.0, 64.86], [65.0, 70.97], [73.0, 87.1], [89.0, 91.07], [91.0, 95.45], [96.0, 97.14], [97.0, 97.73], [101.0, 103.74], [108.0, 114.98], [115.0, 122.67], [124.0, 138.62], [141.0, 153.35], [156.0, 182.11], [185.0, 187.44], [189.0, 189.03], [189.0, 191.54]], "keep_status": [false, false, false, false, true, false, true, false, false, false, true, false, false, false, true, true, true, true, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.18, 29.19, 28.78, 0.0, 28.23, 28.27, 29.83, 29.73, 0.0, 0.0, 30.56, 28.23, 28.3, 29.07, 29.66, 28.36, 29.53, 0.0, 28.65], "audiomae_on_audioset": [null, null, null, null, [["music", 32.88], ["hum", 7.61], ["whale vocalization", 5.94]], [["hum", 41.51], ["whale vocalization", 31.45], ["mains hum", 15.34]], [["hum", 33.59], ["music", 14.5], ["mains hum", 14.27]], null, [["music", 57.77], ["hum", 11.61], ["throbbing", 9.91]], [["music", 64.73], ["throbbing", 11.66], ["electronic music", 6.16]], [["vehicle", 20.01], ["eruption", 15.63], ["fixed-wing aircraft, airplane", 8.3]], [["hum", 36.24], ["mains hum", 27.86], ["speech", 18.65]], null, null, [["speech", 14.38], ["music", 14.37], ["hum", 13.37]], [["music", 22.44], ["mains hum", 16.71], ["hum", 15.75]], [["music", 53.65], ["speech", 8.81], ["electronic music", 4.7]], [["hum", 24.67], ["throbbing", 19.28], ["music", 16.43]], [["hum", 35.95], ["throbbing", 33.64], ["mains hum", 16.4]], [["speech", 37.06], ["vehicle", 33.95], ["motorboat, speedboat", 7.56]], [["speech", 25.16], ["hum", 14.62], ["mains hum", 8.7]], null, [["hum", 25.49], ["mains hum", 20.93], ["throbbing", 16.55]]], "duration": [0.56, 0.38, 0.33, -0.33, 13.95, 7.04, 21.46, 0.86, 5.97, 14.1, 2.07, 4.45, 1.14, 0.73, 2.74, 6.98, 7.67, 14.62, 12.35, 26.11, 2.44, 0.03, 2.54]} \ No newline at end of file diff --git a/annotations_1/0GCwhGQEZ90_filtered.json b/annotations_1/0GCwhGQEZ90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..924bfe2902068cc1d008769ed532415a88491daa --- /dev/null +++ b/annotations_1/0GCwhGQEZ90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.54], [6.0, 29.76], [32.0, 34.21], [35.0, 40.88], [45.0, 46.62], [49.0, 51.16], [55.0, 54.92], [61.0, 61.74], [75.0, 75.37], [80.0, 86.71], [94.0, 95.22], [99.0, 99.52], [101.0, 101.31], [105.0, 105.29], [109.0, 108.82], [152.0, 158.58], [160.0, 161.05], [171.0, 174.29], [183.0, 185.38], [186.0, 187.47], [190.0, 190.83], [193.0, 194.26], [194.0, 197.5], [200.0, 201.77], [211.0, 213.07], [213.0, 213.24]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.86, 98.66, 31.94, 0.0, 32.78, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 0.0, 0.0, 0.0, 29.5, 0.0, 29.98, 94.37, 0.0, 0.0, 0.0, 40.81, 0.0, 29.57, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 19.37], ["livestock, farm animals, working animals", 12.18], ["animal", 8.52]], null, [["livestock, farm animals, working animals", 57.83], ["cattle, bovinae", 26.82], ["moo", 10.14]], null, null, null, null, null, null, null, null, null, [["speech", 25.82], ["sidetone", 12.83], ["throbbing", 7.7]], null, [["music", 37.67], ["speech", 10.59], ["throbbing", 4.47]], null, null, null, null, [["throbbing", 30.67], ["hum", 22.03], ["music", 17.87]], null, [["groan", 51.09], ["music", 14.25], ["speech", 11.85]], null], "duration": [1.54, 23.76, 2.21, 5.88, 1.62, 2.16, -0.08, 0.74, 0.37, 6.71, 1.22, 0.52, 0.31, 0.29, -0.18, 6.58, 1.05, 3.29, 2.38, 1.47, 0.83, 1.26, 3.5, 1.77, 2.07, 0.24]} \ No newline at end of file diff --git a/annotations_1/0GEynXlmNYA_filtered.json b/annotations_1/0GEynXlmNYA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecbd767535826cb61cf350e6df454b831646b376 --- /dev/null +++ b/annotations_1/0GEynXlmNYA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.96], [15.0, 17.39], [20.0, 20.14], [21.0, 21.37], [25.0, 24.7], [28.0, 28.88], [36.0, 36.64], [39.0, 39.04], [46.0, 46.8], [51.0, 51.33], [53.0, 54.8], [58.0, 58.41], [63.0, 63.54], [79.0, 79.59], [84.0, 84.64], [96.0, 97.46], [104.0, 105.26], [126.0, 126.89], [128.0, 130.98]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 35.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.05], "audiomae_on_audioset": [null, [["cattle, bovinae", 15.81], ["moo", 13.28], ["music", 11.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.58], ["electronic music", 2.73], ["theremin", 2.42]]], "duration": [1.96, 2.39, 0.14, 0.37, -0.3, 0.88, 0.64, 0.04, 0.8, 0.33, 1.8, 0.41, 0.54, 0.59, 0.64, 1.46, 1.26, 0.89, 2.98]} \ No newline at end of file diff --git a/annotations_1/0GGOfY9uE1Y_filtered.json b/annotations_1/0GGOfY9uE1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc01e90587164c1c0cc0ccb7a9487e82147c4a85 --- /dev/null +++ b/annotations_1/0GGOfY9uE1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.18], [9.0, 10.25], [16.0, 17.0], [18.0, 19.16], [29.0, 30.37], [34.0, 33.62], [35.0, 35.19], [39.0, 38.67], [47.0, 47.36], [60.0, 61.47], [68.0, 67.88], [78.0, 77.85], [83.0, 82.86], [86.0, 87.3], [88.0, 88.45], [94.0, 95.27], [96.0, 96.75], [98.0, 98.88], [101.0, 101.28], [103.0, 105.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["croak", 23.14], ["frog", 18.5], ["fly, housefly", 11.41]]], "duration": [1.18, 1.25, 1.0, 1.16, 1.37, -0.38, 0.19, -0.33, 0.36, 1.47, -0.12, -0.15, -0.14, 1.3, 0.45, 1.27, 0.75, 0.88, 0.28, 2.49]} \ No newline at end of file diff --git a/annotations_1/0GYwcr3RD_k_filtered.json b/annotations_1/0GYwcr3RD_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12ce1fd7629caf54691c54fff35047b4a52fb5d4 --- /dev/null +++ b/annotations_1/0GYwcr3RD_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.05], [14.0, 14.49], [15.0, 17.32], [18.0, 19.43], [21.0, 21.76], [23.0, 24.75], [28.0, 28.75], [30.0, 31.11], [35.0, 35.97], [37.0, 38.18], [39.0, 41.03], [50.0, 50.53], [52.0, 52.57], [59.0, 59.46], [60.0, 61.06], [62.0, 63.39], [65.0, 65.94], [67.0, 68.32], [70.0, 72.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 61.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 0.49, 2.32, 1.43, 0.76, 1.75, 0.75, 1.11, 0.97, 1.18, 2.03, 0.53, 0.57, 0.46, 1.06, 1.39, 0.94, 1.32, 2.87]} \ No newline at end of file diff --git a/annotations_1/0IQgjMYWVGc_filtered.json b/annotations_1/0IQgjMYWVGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..455ccdd17c81d6a50568781b8d5370d05cc3573f --- /dev/null +++ b/annotations_1/0IQgjMYWVGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 19.8], [24.0, 26.54], [28.0, 28.85], [31.0, 55.65], [57.0, 59.07], [60.0, 61.28], [63.0, 80.27], [97.0, 97.31], [98.0, 98.64], [100.0, 101.63], [103.0, 103.94], [105.0, 106.96], [107.0, 107.72], [109.0, 108.89], [111.0, 119.8], [124.0, 138.3], [141.0, 143.29]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [41.05, 52.68, 0.0, 35.08, 100.0, 0.0, 31.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.18, 46.54, 42.48], "audiomae_on_audioset": [[["music", 41.07], ["hum", 8.2], ["noise", 5.53]], null, null, [["music", 46.64], ["thunk", 10.38], ["hum", 10.26]], null, null, [["music", 42.31], ["hum", 17.83], ["mains hum", 11.14]], null, null, null, null, null, null, null, [["hum", 54.29], ["throbbing", 16.04], ["music", 13.94]], [["music", 37.02], ["hum", 15.31], ["throbbing", 10.28]], [["music", 40.5], ["hum", 14.54], ["throbbing", 13.53]]], "duration": [9.8, 2.54, 0.85, 24.65, 2.07, 1.28, 17.27, 0.31, 0.64, 1.63, 0.94, 1.96, 0.72, -0.11, 8.8, 14.3, 2.29]} \ No newline at end of file diff --git a/annotations_1/0IWmniYe7aI_filtered.json b/annotations_1/0IWmniYe7aI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7d5eff34b7cad92b07a0975ccb688ee2e6f0f7b --- /dev/null +++ b/annotations_1/0IWmniYe7aI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.95], [15.0, 27.99], [30.0, 30.75], [31.0, 31.48], [32.0, 40.98], [42.0, 47.85], [50.0, 50.84], [55.0, 54.92], [58.0, 60.15], [66.0, 66.46], [68.0, 69.11], [79.0, 79.46], [81.0, 81.4], [83.0, 84.21], [86.0, 87.03], [89.0, 89.45], [90.0, 90.69], [93.0, 97.24], [98.0, 98.79], [104.0, 112.53], [114.0, 114.54], [120.0, 120.53], [124.0, 126.25]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 31.02, 0.0, 0.0, 31.01, 31.77, 0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 35.39, 0.0, 0.0, 39.27], "audiomae_on_audioset": [null, [["music", 62.39], ["throbbing", 8.19], ["electronic music", 5.14]], null, null, [["fly, housefly", 36.07], ["mosquito", 31.11], ["insect", 15.92]], [["music", 59.25], ["mains hum", 4.97], ["hum", 3.78]], null, null, null, null, null, null, null, null, null, null, null, [["mosquito", 24.01], ["music", 21.82], ["fly, housefly", 16.28]], null, [["music", 67.78], ["synthesizer", 7.67], ["didgeridoo", 2.47]], null, null, [["music", 62.75], ["synthesizer", 10.52], ["musical instrument", 8.18]]], "duration": [0.95, 12.99, 0.75, 0.48, 8.98, 5.85, 0.84, -0.08, 2.15, 0.46, 1.11, 0.46, 0.4, 1.21, 1.03, 0.45, 0.69, 4.24, 0.79, 8.53, 0.54, 0.53, 2.25]} \ No newline at end of file diff --git a/annotations_1/0IiCOhajpS8_filtered.json b/annotations_1/0IiCOhajpS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6183628173a505683e96da0afc8af6b10104a0ef --- /dev/null +++ b/annotations_1/0IiCOhajpS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.93], [9.0, 10.72], [11.0, 42.09], [43.0, 45.54], [47.0, 46.85], [50.0, 57.18], [58.0, 61.26], [63.0, 73.16], [74.0, 78.38], [79.0, 118.74], [120.0, 152.51]], "keep_status": [false, false, false, true, false, true, false, false, true, false, false], "silence_prob": [94.37, 0.0, 0.0, 34.8, 0.0, 37.06, 39.66, 41.93, 44.37, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 37.06], ["theremin", 3.76], ["speech", 3.48]], null, [["music", 54.68], ["percussion", 3.63], ["musical instrument", 2.79]], [["music", 62.03], ["musical instrument", 6.19], ["didgeridoo", 5.9]], [["music", 66.94], ["musical instrument", 6.19], ["theremin", 5.56]], [["speech", 28.89], ["music", 23.87], ["singing bowl", 6.21]], null, null], "duration": [3.93, 1.72, 31.09, 2.54, -0.15, 7.18, 3.26, 10.16, 4.38, 39.74, 32.51]} \ No newline at end of file diff --git a/annotations_1/0IuOpt3p3WE_filtered.json b/annotations_1/0IuOpt3p3WE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f5cdf30fca4852225b43228cc5697aed30498a2 --- /dev/null +++ b/annotations_1/0IuOpt3p3WE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.51], [19.0, 19.08], [34.0, 33.89], [35.0, 35.67], [37.0, 39.12], [41.0, 42.26], [44.0, 44.46], [51.0, 53.57], [57.0, 57.3], [58.0, 58.18], [59.0, 59.61], [60.0, 60.67], [61.0, 74.41], [81.0, 82.68], [85.0, 100.82], [101.0, 101.44], [101.0, 101.58], [102.0, 101.82], [102.0, 101.85], [102.0, 143.02], [146.0, 146.75], [148.0, 148.36], [159.0, 160.1], [168.0, 168.52], [170.0, 170.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 36.97, 0.0, 0.0, 0.0, 0.0, 29.53, 0.0, 29.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 57.74], ["music", 12.85], ["speech synthesizer", 2.36]], null, null, null, null, [["music", 88.1], ["electronic music", 1.44], ["male singing", 0.89]], null, [["music", 85.1], ["electronic music", 1.52], ["funny music", 1.46]], null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 0.08, -0.11, 0.67, 2.12, 1.26, 0.46, 2.57, 0.3, 0.18, 0.61, 0.67, 13.41, 1.68, 15.82, 0.44, 0.58, -0.18, -0.15, 41.02, 0.75, 0.36, 1.1, 0.52, 0.46]} \ No newline at end of file diff --git a/annotations_1/0IyuK069I-w_filtered.json b/annotations_1/0IyuK069I-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6905d2d31e09795c4a80111243d3ec9b986052af --- /dev/null +++ b/annotations_1/0IyuK069I-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.67], [18.0, 18.89], [30.0, 30.54], [40.0, 40.66], [63.0, 65.75], [90.0, 90.68], [91.0, 90.86], [91.0, 92.4], [107.0, 108.85], [134.0, 134.5], [139.0, 141.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 51.34, 0.0, 0.0, 0.0, 0.0, 0.0, 34.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 31.9], ["whack, thwack", 6.26], ["hum", 5.38]]], "duration": [0.67, 0.89, 0.54, 0.66, 2.75, 0.68, -0.14, 1.4, 1.85, 0.5, 2.17]} \ No newline at end of file diff --git a/annotations_1/0J4K03Owgwc_filtered.json b/annotations_1/0J4K03Owgwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/0J4K03Owgwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/0JVZ0bE8hpk_filtered.json b/annotations_1/0JVZ0bE8hpk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bc978756a4bf74100179e1cb8e315f0ebb3fa3f --- /dev/null +++ b/annotations_1/0JVZ0bE8hpk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.97], [6.0, 15.04], [17.0, 33.62], [36.0, 59.05], [60.0, 75.86], [82.0, 91.25], [96.0, 101.49], [102.0, 102.71], [104.0, 105.16], [107.0, 107.89], [109.0, 109.88]], "keep_status": [false, true, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 32.24, 32.64, 32.44, 31.82, 32.06, 31.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 35.99], ["didgeridoo", 11.34], ["speech", 6.64]], [["music", 36.68], ["speech", 26.41], ["synthesizer", 9.67]], [["music", 28.65], ["echo", 16.57], ["effects unit", 6.85]], [["music", 57.02], ["hum", 7.49], ["didgeridoo", 6.0]], [["music", 69.93], ["musical instrument", 7.74], ["effects unit", 3.03]], [["music", 51.4], ["hum", 13.99], ["throbbing", 4.61]], null, null, null, null], "duration": [1.97, 9.04, 16.62, 23.05, 15.86, 9.25, 5.49, 0.71, 1.16, 0.89, 0.88]} \ No newline at end of file diff --git a/annotations_1/0K6bVf4ra1w_filtered.json b/annotations_1/0K6bVf4ra1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bcb445c7d9e283a5c8aee3e12cf4bfe7e48dab7 --- /dev/null +++ b/annotations_1/0K6bVf4ra1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 29.81], [34.0, 34.18], [35.0, 38.57], [48.0, 94.58], [95.0, 112.77], [114.0, 114.0]], "keep_status": [true, false, false, false, false, false], "silence_prob": [29.85, 0.0, 30.03, 0.0, 30.18, 0.0], "audiomae_on_audioset": [[["music", 22.91], ["speech", 16.23], ["sidetone", 12.95]], null, [["music", 63.29], ["speech", 9.11], ["cacophony", 7.77]], null, [["speech", 40.35], ["music", 36.74], ["smash, crash", 2.36]], null], "duration": [21.81, 0.18, 3.57, 46.58, 17.77, 0.0]} \ No newline at end of file diff --git a/annotations_1/0KjO3YwlhEE_filtered.json b/annotations_1/0KjO3YwlhEE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fc5b7ac29e654cf4a5e6344e7508c932964480d --- /dev/null +++ b/annotations_1/0KjO3YwlhEE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.15], [11.0, 12.06], [21.0, 21.68], [24.0, 25.3], [26.0, 26.84], [31.0, 31.56], [34.0, 35.18], [36.0, 37.08], [38.0, 40.32], [42.0, 43.39], [45.0, 46.92], [51.0, 50.9], [52.0, 53.99], [55.0, 57.55], [59.0, 59.27], [60.0, 60.61], [61.0, 61.26], [63.0, 63.68], [67.0, 69.11], [70.0, 74.85], [77.0, 82.39], [85.0, 90.59], [92.0, 93.63], [96.0, 97.68], [102.0, 107.84], [110.0, 111.43], [117.0, 122.61], [126.0, 142.84], [145.0, 146.15], [149.0, 151.17], [153.0, 158.14], [160.0, 165.62], [167.0, 191.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [94.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 39.82, 0.0, 0.0, 0.0, 0.0, 43.85, 33.67, 33.77, 37.23, 0.0, 0.0, 47.23, 0.0, 33.22, 34.32, 0.0, 57.97, 75.72, 93.76, 35.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.32], ["musical instrument", 4.39], ["singing", 2.72]], null, null, null, null, [["music", 65.95], ["musical instrument", 6.09], ["guitar", 4.58]], [["music", 81.9], ["humming", 4.94], ["yodeling", 4.12]], [["music", 78.22], ["carnatic music", 3.66], ["singing", 2.76]], [["music", 61.93], ["guitar", 4.95], ["musical instrument", 4.4]], null, null, [["music", 41.72], ["bass guitar", 11.96], ["guitar", 11.86]], null, [["music", 64.76], ["yodeling", 6.21], ["singing", 3.53]], [["music", 80.88], ["humming", 5.7], ["carnatic music", 2.35]], null, null, null, null, [["music", 57.39], ["speech", 7.57], ["musical instrument", 5.0]]], "duration": [7.15, 1.06, 0.68, 1.3, 0.84, 0.56, 1.18, 1.08, 2.32, 1.39, 1.92, -0.1, 1.99, 2.55, 0.27, 0.61, 0.26, 0.68, 2.11, 4.85, 5.39, 5.59, 1.63, 1.68, 5.84, 1.43, 5.61, 16.84, 1.15, 2.17, 5.14, 5.62, 24.94]} \ No newline at end of file diff --git a/annotations_1/0L1sL54G45Q_filtered.json b/annotations_1/0L1sL54G45Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c0788b1dd66c561087e9528c976554e22ddfa3e --- /dev/null +++ b/annotations_1/0L1sL54G45Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.12], [39.0, 46.55], [49.0, 124.71], [125.0, 125.74], [127.0, 127.01]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 36.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.56], ["theremin", 33.15], ["singing", 1.46]], null, null, null], "duration": [0.12, 7.55, 75.71, 0.74, 0.01]} \ No newline at end of file diff --git a/annotations_1/0LArIo7OUJ8_filtered.json b/annotations_1/0LArIo7OUJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c77499edeeea83a13b17ac5f1212623f460cd3e --- /dev/null +++ b/annotations_1/0LArIo7OUJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 29.32], [32.0, 33.47], [43.0, 44.66], [46.0, 46.47], [49.0, 51.11], [58.0, 66.68], [69.0, 72.39], [74.0, 74.85], [81.0, 82.54], [83.0, 83.07], [87.0, 91.99], [93.0, 110.67], [113.0, 116.18], [116.0, 118.17], [119.0, 119.55], [120.0, 121.73], [123.0, 150.82], [151.0, 155.33], [156.0, 156.59]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [31.04, 0.0, 0.0, 0.0, 31.69, 30.74, 38.17, 0.0, 0.0, 0.0, 42.93, 29.62, 31.4, 28.71, 0.0, 0.0, 28.95, 30.55, 0.0], "audiomae_on_audioset": [[["music", 30.3], ["didgeridoo", 24.2], ["frog", 8.06]], null, null, null, [["didgeridoo", 61.78], ["music", 14.89], ["speech", 5.52]], [["music", 56.65], ["didgeridoo", 18.02], ["musical instrument", 4.49]], [["music", 66.86], ["didgeridoo", 14.6], ["hum", 2.23]], null, null, null, [["music", 67.28], ["didgeridoo", 8.33], ["hum", 2.14]], [["music", 38.29], ["didgeridoo", 14.36], ["speech", 7.32]], [["music", 23.12], ["foghorn", 12.47], ["didgeridoo", 8.53]], [["music", 58.06], ["theremin", 6.51], ["synthesizer", 3.88]], null, null, [["music", 89.26], ["didgeridoo", 2.28], ["musical instrument", 2.15]], [["music", 54.88], ["quack", 15.89], ["animal", 6.72]], null], "duration": [3.32, 1.47, 1.66, 0.47, 2.11, 8.68, 3.39, 0.85, 1.54, 0.07, 4.99, 17.67, 3.18, 2.17, 0.55, 1.73, 27.82, 4.33, 0.59]} \ No newline at end of file diff --git a/annotations_1/0N7ilB9wX3o_filtered.json b/annotations_1/0N7ilB9wX3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3a6c1b374a39a6a5fe0fdc9427c3efbc9718a80 --- /dev/null +++ b/annotations_1/0N7ilB9wX3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.73], [18.0, 18.1], [31.0, 31.53], [32.0, 32.68], [43.0, 42.79], [51.0, 51.71], [69.0, 69.58], [76.0, 76.03], [85.0, 87.2], [113.0, 114.07], [116.0, 116.88], [122.0, 122.22], [127.0, 128.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.27, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 78.33], ["speech", 2.9], ["musical instrument", 1.96]], null, null, null, null], "duration": [0.73, 0.1, 0.53, 0.68, -0.21, 0.71, 0.58, 0.03, 2.2, 1.07, 0.88, 0.22, 1.51]} \ No newline at end of file diff --git a/annotations_1/0NUDP-gxGyM_filtered.json b/annotations_1/0NUDP-gxGyM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e3d4a99da7e2b5d4ee6b9c4b470b7b2171ced1f --- /dev/null +++ b/annotations_1/0NUDP-gxGyM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.07], [11.0, 11.8], [13.0, 13.85], [17.0, 17.59], [20.0, 20.8], [21.0, 23.08], [26.0, 27.68], [31.0, 32.51], [33.0, 35.94], [37.0, 39.77], [42.0, 43.17], [52.0, 55.93], [59.0, 59.17], [64.0, 64.76], [67.0, 68.35], [73.0, 75.29], [76.0, 78.02], [80.0, 80.2], [87.0, 91.03], [94.0, 98.31], [99.0, 102.59], [104.0, 105.0], [105.0, 106.15], [110.0, 123.82], [124.0, 129.86], [130.0, 137.51], [141.0, 147.99], [150.0, 150.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 0.0, 99.94, 100.0, 0.0, 51.5, 0.0, 0.0, 0.0, 54.9, 98.59, 0.0, 99.73, 99.93, 99.99, 0.0, 0.0, 84.98, 74.13, 49.97, 44.87, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.14], ["hum", 26.47], ["throbbing", 12.16]], [["fly, housefly", 21.39], ["hum", 11.31], ["fart", 10.99]], null], "duration": [1.07, 0.8, 0.85, 0.59, 0.8, 2.08, 1.68, 1.51, 2.94, 2.77, 1.17, 3.93, 0.17, 0.76, 1.35, 2.29, 2.02, 0.2, 4.03, 4.31, 3.59, 1.0, 1.15, 13.82, 5.86, 7.51, 6.99, 0.67]} \ No newline at end of file diff --git a/annotations_1/0NXkZZqCGjs_filtered.json b/annotations_1/0NXkZZqCGjs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..548331b3efb78a3683b671dff676417cbb1bca75 --- /dev/null +++ b/annotations_1/0NXkZZqCGjs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.82], [29.0, 29.93], [39.0, 93.7], [94.0, 102.0], [105.0, 108.24], [111.0, 121.47]], "keep_status": [true, false, false, true, true, false], "silence_prob": [35.37, 0.0, 0.0, 33.23, 33.65, 33.19], "audiomae_on_audioset": [[["speech", 25.15], ["vehicle", 16.68], ["car", 8.78]], null, null, [["speech", 41.49], ["vehicle", 8.64], ["buzz", 5.27]], [["music", 30.74], ["speech", 13.7], ["whale vocalization", 9.0]], [["music", 77.4], ["buzz", 2.7], ["didgeridoo", 2.43]]], "duration": [2.82, 0.93, 54.7, 8.0, 3.24, 10.47]} \ No newline at end of file diff --git a/annotations_1/0ONU_H0EjIg_filtered.json b/annotations_1/0ONU_H0EjIg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d696c82284b40c4a3689233ff99d4db922c48c3 --- /dev/null +++ b/annotations_1/0ONU_H0EjIg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 31.62], [32.0, 35.16], [36.0, 38.91], [40.0, 40.74], [41.0, 43.7], [45.0, 48.0], [49.0, 54.67], [55.0, 56.05], [56.0, 57.03], [58.0, 59.56], [60.0, 60.74], [62.0, 62.63], [70.0, 71.04], [72.0, 73.45], [76.0, 77.04], [80.0, 81.24], [83.0, 85.21], [86.0, 88.96], [90.0, 91.94], [96.0, 97.34], [99.0, 100.4], [104.0, 105.41], [106.0, 107.76], [109.0, 117.05], [118.0, 119.82], [120.0, 123.23], [125.0, 126.79], [128.0, 130.87], [134.0, 135.3], [138.0, 139.67], [141.0, 142.03], [143.0, 147.87], [149.0, 151.07], [152.0, 156.22], [157.0, 157.62], [159.0, 161.67], [163.0, 164.25], [165.0, 169.45], [170.0, 175.15], [178.0, 181.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 87.55, 99.99, 0.0, 80.46, 80.64, 98.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 55.31, 0.0, 98.93, 0.0, 0.0, 0.0, 99.92, 83.16, 42.04, 0.0, 98.73, 0.0, 81.0, 90.6, 92.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.12], ["music", 23.32], ["sidetone", 14.23]], null, null, null, null, null, null], "duration": [1.62, 3.16, 2.91, 0.74, 2.7, 3.0, 5.67, 1.05, 1.03, 1.56, 0.74, 0.63, 1.04, 1.45, 1.04, 1.24, 2.21, 2.96, 1.94, 1.34, 1.4, 1.41, 1.76, 8.05, 1.82, 3.23, 1.79, 2.87, 1.3, 1.67, 1.03, 4.87, 2.07, 4.22, 0.62, 2.67, 1.25, 4.45, 5.15, 3.94]} \ No newline at end of file diff --git a/annotations_1/0PtKzdvq7bc_filtered.json b/annotations_1/0PtKzdvq7bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec390fe5a10d3d8fa680d2d903393f0cfad43ad2 --- /dev/null +++ b/annotations_1/0PtKzdvq7bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.66], [13.0, 14.03], [16.0, 26.03], [32.0, 35.19], [37.0, 38.06], [39.0, 40.85], [42.0, 42.74], [46.0, 46.99], [48.0, 49.89], [56.0, 65.16], [66.0, 67.91], [68.0, 68.89], [69.0, 70.53], [71.0, 71.31], [72.0, 73.08], [76.0, 78.46], [79.0, 80.0], [96.0, 98.63], [100.0, 101.7], [103.0, 103.76], [110.0, 110.74], [113.0, 114.18], [119.0, 120.06], [123.0, 122.93], [129.0, 130.17], [131.0, 133.79], [135.0, 136.76], [142.0, 142.92], [151.0, 155.51], [156.0, 157.76], [160.0, 162.73], [166.0, 167.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [87.92, 0.0, 44.07, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 67.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.26, 0.0, 0.0, 29.71, 0.0, 42.69, 0.0], "audiomae_on_audioset": [null, null, [["speech", 86.64], ["animal", 2.22], ["crowd", 1.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 58.64], ["speech", 24.41], ["musical instrument", 4.68]], null, null, [["music", 23.59], ["whack, thwack", 6.17], ["chant", 4.64]], null, [["music", 44.18], ["didgeridoo", 23.28], ["musical instrument", 6.4]], null], "duration": [2.66, 1.03, 10.03, 3.19, 1.06, 1.85, 0.74, 0.99, 1.89, 9.16, 1.91, 0.89, 1.53, 0.31, 1.08, 2.46, 1.0, 2.63, 1.7, 0.76, 0.74, 1.18, 1.06, -0.07, 1.17, 2.79, 1.76, 0.92, 4.51, 1.76, 2.73, 1.66]} \ No newline at end of file diff --git a/annotations_1/0RM_Ehtb5C4_filtered.json b/annotations_1/0RM_Ehtb5C4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b4ae52f89b49b31b36e8725202f20839d712689 --- /dev/null +++ b/annotations_1/0RM_Ehtb5C4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 17.14], [20.0, 23.82], [24.0, 27.09], [33.0, 33.05], [34.0, 35.92], [39.0, 42.25], [43.0, 55.51], [56.0, 56.54], [57.0, 71.19], [72.0, 72.67], [74.0, 79.1], [79.0, 80.25], [81.0, 81.3]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.2, 87.55, 52.1, 0.0, 0.0, 73.67, 51.18, 0.0, 51.28, 0.0, 57.48, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 34.73], ["cat", 8.14], ["animal", 7.64]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.14, 3.82, 3.09, 0.05, 1.92, 3.25, 12.51, 0.54, 14.19, 0.67, 5.1, 1.25, 0.3]} \ No newline at end of file diff --git a/annotations_1/0T3hXtyuX0g_filtered.json b/annotations_1/0T3hXtyuX0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfc82828b1a1544e295e8947315fa8f2eaba9c12 --- /dev/null +++ b/annotations_1/0T3hXtyuX0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.79], [29.0, 29.27], [57.0, 61.25], [65.0, 65.48], [70.0, 77.26], [81.0, 81.7], [85.0, 86.97], [90.0, 93.26], [95.0, 96.01], [98.0, 98.37], [100.0, 104.55], [105.0, 104.62], [105.0, 104.7], [105.0, 104.9], [108.0, 108.09], [111.0, 111.35], [113.0, 113.71], [116.0, 118.27], [123.0, 123.01], [125.0, 125.47], [127.0, 127.99], [130.0, 130.81], [132.0, 132.46], [134.0, 134.52], [138.0, 138.3], [139.0, 139.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.51, 0.0, 77.03, 0.0, 0.0, 76.53, 0.0, 0.0, 37.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 26.3], ["throbbing", 13.81], ["mains hum", 11.66]], null, null, null, null, null, null, [["speech", 60.22], ["animal", 2.96], ["outside, rural or natural", 2.04]], null, null, null, null, null, null, null, null], "duration": [0.79, 0.27, 4.25, 0.48, 7.26, 0.7, 1.97, 3.26, 1.01, 0.37, 4.55, -0.38, -0.3, -0.1, 0.09, 0.35, 0.71, 2.27, 0.01, 0.47, 0.99, 0.81, 0.46, 0.52, 0.3, 0.45]} \ No newline at end of file diff --git a/annotations_1/0WKopiIhAdI_filtered.json b/annotations_1/0WKopiIhAdI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3264ca6b89e1bdc5aff37e4db9e966a6b14d50f --- /dev/null +++ b/annotations_1/0WKopiIhAdI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.76], [6.0, 6.0], [6.0, 11.84], [13.0, 13.91], [25.0, 26.64], [38.0, 42.18], [45.0, 45.4], [46.0, 45.64], [46.0, 52.95], [53.0, 54.16], [55.0, 65.25], [67.0, 70.56], [74.0, 74.71], [75.0, 78.85], [79.0, 80.2], [87.0, 94.17], [110.0, 111.05], [112.0, 112.16], [114.0, 113.98], [114.0, 114.54], [118.0, 126.15], [127.0, 129.46], [132.0, 131.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 38.71, 0.0, 0.0, 32.93, 0.0, 0.0, 30.01, 0.0, 30.4, 32.28, 0.0, 30.56, 0.0, 33.7, 0.0, 0.0, 0.0, 0.0, 47.86, 30.55, 0.0], "audiomae_on_audioset": [null, null, [["speech", 36.51], ["hum", 27.89], ["mains hum", 13.02]], null, null, [["music", 74.8], ["electronic music", 9.66], ["throbbing", 2.91]], null, null, [["music", 79.95], ["sound effect", 2.95], ["boing", 1.86]], null, [["throbbing", 31.05], ["music", 27.65], ["hum", 13.26]], [["music", 58.81], ["speech", 10.24], ["electronic music", 6.58]], null, [["music", 51.76], ["throbbing", 16.55], ["hum", 7.73]], null, [["speech", 41.48], ["music", 32.14], ["echo", 5.16]], null, null, null, null, [["music", 61.83], ["whale vocalization", 6.5], ["squish", 6.37]], [["livestock, farm animals, working animals", 17.89], ["cattle, bovinae", 15.07], ["cowbell", 12.26]], null], "duration": [0.76, 0.0, 5.84, 0.91, 1.64, 4.18, 0.4, -0.36, 6.95, 1.16, 10.25, 3.56, 0.71, 3.85, 1.2, 7.17, 1.05, 0.16, -0.02, 0.54, 8.15, 2.46, -0.28]} \ No newline at end of file diff --git a/annotations_1/0WRtWiz_Xvg_filtered.json b/annotations_1/0WRtWiz_Xvg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cbdb43983e14c0d24fc9997be89e3d68a75261c --- /dev/null +++ b/annotations_1/0WRtWiz_Xvg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.58], [27.0, 27.87], [33.0, 48.93], [50.0, 54.33], [55.0, 56.42], [61.0, 61.28], [65.0, 65.82], [68.0, 70.56], [71.0, 72.42], [79.0, 80.45], [90.0, 90.96], [92.0, 93.14], [94.0, 94.26], [97.0, 103.2], [104.0, 104.08], [107.0, 110.66], [113.0, 117.78], [122.0, 123.89], [124.0, 125.22], [126.0, 136.22], [138.0, 140.12], [142.0, 153.6], [155.0, 166.65], [171.0, 194.53], [196.0, 196.5]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false], "silence_prob": [39.43, 0.0, 51.99, 49.97, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 0.0, 37.93, 44.6, 0.0, 0.0, 61.77, 76.86, 44.01, 54.3, 41.93, 0.0], "audiomae_on_audioset": [[["speech", 60.84], ["hum", 18.37], ["mains hum", 2.62]], null, null, [["speech", 38.97], ["music", 25.37], ["fart", 5.07]], null, null, null, null, null, null, null, null, null, null, null, [["music", 61.39], ["musical instrument", 4.02], ["breaking", 3.37]], [["music", 35.83], ["theremin", 13.87], ["speech", 7.33]], null, null, null, null, [["music", 55.01], ["speech", 4.75], ["didgeridoo", 3.7]], null, [["music", 68.26], ["didgeridoo", 8.83], ["theremin", 3.88]], null], "duration": [8.58, 0.87, 15.93, 4.33, 1.42, 0.28, 0.82, 2.56, 1.42, 1.45, 0.96, 1.14, 0.26, 6.2, 0.08, 3.66, 4.78, 1.89, 1.22, 10.22, 2.12, 11.6, 11.65, 23.53, 0.5]} \ No newline at end of file diff --git a/annotations_1/0XLEGFSKVhs_filtered.json b/annotations_1/0XLEGFSKVhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04b12fc737f14afbe25e5b0dc9ba16e0d7e746ee --- /dev/null +++ b/annotations_1/0XLEGFSKVhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.29], [13.0, 15.63], [16.0, 19.62], [26.0, 50.82], [53.0, 81.19], [81.0, 85.04]], "keep_status": [false, true, false, true, false, true], "silence_prob": [38.11, 36.31, 70.44, 28.94, 29.19, 37.78], "audiomae_on_audioset": [[["mains hum", 27.06], ["hum", 23.23], ["throbbing", 22.2]], [["music", 44.61], ["synthesizer", 11.21], ["musical instrument", 7.24]], null, [["music", 52.28], ["synthesizer", 8.78], ["electronic music", 6.38]], [["music", 91.29], ["drip", 2.47], ["liquid", 1.0]], [["speech", 30.52], ["frog", 12.5], ["croak", 8.13]]], "duration": [6.29, 2.63, 3.62, 24.82, 28.19, 4.04]} \ No newline at end of file diff --git a/annotations_1/0YOmyGX2kmQ_filtered.json b/annotations_1/0YOmyGX2kmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67d6485afca5d140db0bbed9ab6c785af53d3d29 --- /dev/null +++ b/annotations_1/0YOmyGX2kmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.33], [9.0, 13.19], [14.0, 17.66], [18.0, 18.22], [19.0, 24.0], [25.0, 33.24], [34.0, 34.87], [35.0, 36.19], [38.0, 50.04], [54.0, 55.97], [57.0, 64.0], [66.0, 66.02]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 50.16, 40.28, 0.0, 86.82, 89.01, 0.0, 0.0, 36.42, 0.0, 35.82, 0.0], "audiomae_on_audioset": [null, null, [["speech", 21.15], ["goose", 13.67], ["fowl", 12.77]], null, null, null, null, null, [["music", 51.04], ["speech", 18.95], ["animal", 4.44]], null, [["music", 28.39], ["speech", 19.02], ["foghorn", 6.53]], null], "duration": [1.33, 4.19, 3.66, 0.22, 5.0, 8.24, 0.87, 1.19, 12.04, 1.97, 7.0, 0.02]} \ No newline at end of file diff --git a/annotations_1/0_-45EGFtA4_filtered.json b/annotations_1/0_-45EGFtA4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f94911116513406f4155d2c86ed837bcf96c8c90 --- /dev/null +++ b/annotations_1/0_-45EGFtA4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.69]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [1.69]} \ No newline at end of file diff --git a/annotations_1/0_0U4bhe6ag_filtered.json b/annotations_1/0_0U4bhe6ag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0e6660e727674d230b0cdfdecc1e9848fc6fd62 --- /dev/null +++ b/annotations_1/0_0U4bhe6ag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.89], [10.0, 10.05], [18.0, 22.33], [28.0, 28.65], [39.0, 39.93], [50.0, 50.63], [57.0, 58.48], [61.0, 61.67], [65.0, 66.28], [67.0, 67.47], [68.0, 68.67], [82.0, 84.2], [84.0, 87.64], [91.0, 93.28], [96.0, 105.29], [109.0, 110.84], [112.0, 112.31], [115.0, 115.5], [116.0, 116.95]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 43.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.13, 35.5, 35.82, 32.52, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 54.91], ["effects unit", 4.16], ["musical instrument", 4.15]], null, null, null, null, null, null, null, null, [["whale vocalization", 32.63], ["speech", 13.33], ["music", 8.35]], [["music", 41.71], ["speech", 13.18], ["hum", 5.93]], [["music", 62.4], ["whale vocalization", 13.46], ["hum", 4.67]], [["speech", 23.5], ["music", 18.17], ["hum", 2.6]], null, null, null, null], "duration": [-0.11, 0.05, 4.33, 0.65, 0.93, 0.63, 1.48, 0.67, 1.28, 0.47, 0.67, 2.2, 3.64, 2.28, 9.29, 1.84, 0.31, 0.5, 0.95]} \ No newline at end of file diff --git a/annotations_1/0_1NU60qHWs_filtered.json b/annotations_1/0_1NU60qHWs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09414d554151477b07e0766d142aa78c142caf4c --- /dev/null +++ b/annotations_1/0_1NU60qHWs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.07], [13.0, 13.24], [14.0, 14.01], [18.0, 17.61], [18.0, 23.06], [29.0, 28.88], [30.0, 30.21], [46.0, 47.76], [51.0, 51.68], [54.0, 54.62], [56.0, 60.51], [65.0, 65.31], [65.0, 66.14], [66.0, 66.28], [66.0, 66.43], [71.0, 72.06], [78.0, 78.66], [81.0, 80.81], [84.0, 84.25], [85.0, 85.45], [88.0, 87.76], [91.0, 93.07], [95.0, 98.44], [107.0, 111.54], [125.0, 126.55], [127.0, 129.3], [132.0, 132.09], [142.0, 143.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 51.44, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.13, 53.28, 45.24, 0.0, 71.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.28], ["marimba, xylophone", 6.22], ["glockenspiel", 3.12]], null, [["speech", 33.35], ["music", 27.8], ["boing", 6.41]], null, null, null, null], "duration": [1.07, 0.24, 0.01, -0.39, 5.06, -0.12, 0.21, 1.76, 0.68, 0.62, 4.51, 0.31, 1.14, 0.28, 0.43, 1.06, 0.66, -0.19, 0.25, 0.45, -0.24, 2.07, 3.44, 4.54, 1.55, 2.3, 0.09, 1.09]} \ No newline at end of file diff --git a/annotations_1/0_7vIOvdKqY_filtered.json b/annotations_1/0_7vIOvdKqY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..726a259a3cd7d61fa98d3587186673eb550c720c --- /dev/null +++ b/annotations_1/0_7vIOvdKqY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [4.0, 13.85], [14.0, 19.48], [34.0, 35.01], [35.0, 36.86], [39.0, 39.58], [42.0, 43.34], [44.0, 45.35], [46.0, 49.4], [50.0, 58.51], [60.0, 60.2], [63.0, 64.25], [66.0, 67.36], [71.0, 72.55], [76.0, 76.45], [79.0, 81.85], [84.0, 85.09], [86.0, 86.78], [91.0, 95.17], [97.0, 98.05], [100.0, 100.09], [101.0, 104.18], [105.0, 107.33], [109.0, 110.49], [113.0, 115.11], [116.0, 117.12], [122.0, 123.4], [124.0, 123.9], [124.0, 124.34], [127.0, 129.37], [130.0, 129.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.26, 38.21, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 99.56, 0.0, 0.0, 99.65, 99.48, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0], "audiomae_on_audioset": [null, [["speech", 92.2], ["sidetone", 2.74], ["whale vocalization", 1.23]], [["speech", 80.91], ["fart", 6.56], ["beatboxing", 5.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.42, 9.85, 5.48, 1.01, 1.86, 0.58, 1.34, 1.35, 3.4, 8.51, 0.2, 1.25, 1.36, 1.55, 0.45, 2.85, 1.09, 0.78, 4.17, 1.05, 0.09, 3.18, 2.33, 1.49, 2.11, 1.12, 1.4, -0.1, 0.34, 2.37, -0.12]} \ No newline at end of file diff --git a/annotations_1/0_UCPY-mSZU_filtered.json b/annotations_1/0_UCPY-mSZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebf63341e69d780fbddf205105988a4297c2fb85 --- /dev/null +++ b/annotations_1/0_UCPY-mSZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.21], [25.0, 26.84], [28.0, 29.32], [32.0, 32.63], [39.0, 39.78], [44.0, 48.98], [49.0, 52.22], [58.0, 58.75], [65.0, 65.53], [66.0, 66.06], [68.0, 69.36], [70.0, 71.83], [75.0, 76.23], [82.0, 93.93], [95.0, 100.74], [103.0, 106.86], [108.0, 109.0], [111.0, 114.59], [116.0, 116.73], [118.0, 119.45], [124.0, 125.71], [127.0, 127.82], [132.0, 135.77], [137.0, 139.99], [142.0, 150.36], [153.0, 154.95], [155.0, 156.59], [158.0, 159.85], [160.0, 162.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 73.06, 68.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 99.99, 95.64, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 63.42, 51.94, 55.04, 0.0, 0.0, 0.0, 99.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 1.84, 1.32, 0.63, 0.78, 4.98, 3.22, 0.75, 0.53, 0.06, 1.36, 1.83, 1.23, 11.93, 5.74, 3.86, 1.0, 3.59, 0.73, 1.45, 1.71, 0.82, 3.77, 2.99, 8.36, 1.95, 1.59, 1.85, 2.3]} \ No newline at end of file diff --git a/annotations_1/0aKB_Qm-z6g_filtered.json b/annotations_1/0aKB_Qm-z6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..706634bfa859e153adffe1c29ecad8080dbdacee --- /dev/null +++ b/annotations_1/0aKB_Qm-z6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.88], [8.0, 8.28], [9.0, 10.79], [11.0, 13.71], [14.0, 15.21], [17.0, 22.38], [29.0, 29.66], [36.0, 36.56], [39.0, 39.46], [44.0, 44.95], [49.0, 50.09], [52.0, 54.45], [56.0, 58.36], [63.0, 64.1], [72.0, 74.12], [75.0, 76.06], [81.0, 83.27], [84.0, 91.2], [92.0, 92.5], [106.0, 106.54], [111.0, 117.39], [117.0, 118.89]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 40.59, 0.0, 34.56, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67, 51.02, 0.0, 99.98, 0.0, 79.59, 33.28, 0.0, 0.0, 34.03, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 54.9], ["sidetone", 24.84], ["hum", 2.83]], null, [["speech", 16.15], ["mosquito", 12.84], ["fly, housefly", 9.52]], null, null, null, null, null, null, null, null, null, null, null, [["whistling", 95.31], ["beatboxing", 1.41], ["speech", 0.59]], null, null, [["music", 49.71], ["guitar", 9.14], ["musical instrument", 4.78]], null], "duration": [0.88, 0.28, 1.79, 2.71, 1.21, 5.38, 0.66, 0.56, 0.46, 0.95, 1.09, 2.45, 2.36, 1.1, 2.12, 1.06, 2.27, 7.2, 0.5, 0.54, 6.39, 1.89]} \ No newline at end of file diff --git a/annotations_1/0aX79Yt3Bno_filtered.json b/annotations_1/0aX79Yt3Bno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5395bb81dd57e34f28c5d75a7d17e7048f6f1fd9 --- /dev/null +++ b/annotations_1/0aX79Yt3Bno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.18], [10.0, 16.29], [16.0, 17.19], [22.0, 22.06], [25.0, 26.72], [29.0, 31.24], [49.0, 53.03], [53.0, 60.39], [70.0, 72.57], [85.0, 85.5], [92.0, 94.49], [111.0, 113.27], [115.0, 124.06]], "keep_status": [true, true, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [33.95, 42.58, 0.0, 0.0, 0.0, 56.7, 80.29, 56.48, 59.77, 0.0, 30.64, 32.72, 30.65], "audiomae_on_audioset": [[["speech", 37.56], ["music", 9.27], ["explosion", 6.16]], [["speech", 47.93], ["frog", 11.28], ["animal", 7.89]], null, null, null, null, null, null, null, null, [["speech", 23.88], ["gunshot, gunfire", 13.29], ["whack, thwack", 12.82]], [["frog", 22.78], ["animal", 13.49], ["boing", 7.22]], [["cattle, bovinae", 20.96], ["speech", 19.67], ["animal", 10.16]]], "duration": [6.18, 6.29, 1.19, 0.06, 1.72, 2.24, 4.03, 7.39, 2.57, 0.5, 2.49, 2.27, 9.06]} \ No newline at end of file diff --git a/annotations_1/0bR6pUOhZo4_filtered.json b/annotations_1/0bR6pUOhZo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20c49615a738485c8d8099b4c35743bcca264a2e --- /dev/null +++ b/annotations_1/0bR6pUOhZo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.63], [17.0, 20.78], [24.0, 24.68], [30.0, 30.64], [44.0, 44.58], [48.0, 49.37], [53.0, 54.09], [55.0, 65.03], [67.0, 67.29], [70.0, 70.58], [72.0, 75.3], [77.0, 77.9], [80.0, 81.03], [83.0, 84.03], [86.0, 86.31], [89.0, 89.09], [91.0, 92.2], [97.0, 97.93], [101.0, 102.49], [105.0, 106.46], [109.0, 110.32], [116.0, 116.29], [122.0, 123.79], [126.0, 142.87], [144.0, 146.72], [151.0, 151.21], [151.0, 151.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.29, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 98.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.07, 68.28, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.63, 3.78, 0.68, 0.64, 0.58, 1.37, 1.09, 10.03, 0.29, 0.58, 3.3, 0.9, 1.03, 1.03, 0.31, 0.09, 1.2, 0.93, 1.49, 1.46, 1.32, 0.29, 1.79, 16.87, 2.72, 0.21, 0.41]} \ No newline at end of file diff --git a/annotations_1/0bw8UM1eLFo_filtered.json b/annotations_1/0bw8UM1eLFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21061c9aabeef186692011699d2dcb5d8282ace9 --- /dev/null +++ b/annotations_1/0bw8UM1eLFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.7], [6.0, 13.73], [16.0, 19.5], [21.0, 28.07], [29.0, 36.31], [39.0, 44.02], [45.0, 47.68], [49.0, 51.17], [55.0, 55.68], [57.0, 57.45], [59.0, 60.1], [64.0, 65.57], [67.0, 68.22], [69.0, 70.9], [72.0, 88.97], [90.0, 95.74], [98.0, 104.19], [107.0, 110.49], [112.0, 118.67], [120.0, 127.16], [127.0, 146.33], [148.0, 156.02], [165.0, 167.16], [169.0, 170.36], [172.0, 172.13], [179.0, 180.37], [181.0, 199.93], [200.0, 202.05], [203.0, 205.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 100.0, 100.0, 100.0, 98.86, 99.98, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 99.84, 96.42, 100.0, 100.0, 100.0, 97.73, 32.59, 37.34, 0.0, 0.0, 0.0, 56.48, 61.08, 69.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.83], ["sidetone", 17.23], ["noise", 2.15]], [["fly, housefly", 27.21], ["insect", 16.22], ["mosquito", 13.36]], null, null, null, null, null, null], "duration": [1.7, 7.73, 3.5, 7.07, 7.31, 5.02, 2.68, 2.17, 0.68, 0.45, 1.1, 1.57, 1.22, 1.9, 16.97, 5.74, 6.19, 3.49, 6.67, 7.16, 19.33, 8.02, 2.16, 1.36, 0.13, 1.37, 18.93, 2.05, 2.75]} \ No newline at end of file diff --git a/annotations_1/0ePC0mh4rCY_filtered.json b/annotations_1/0ePC0mh4rCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3fd920c5073072f9c6118e9a2ecde0ebd0c334c7 --- /dev/null +++ b/annotations_1/0ePC0mh4rCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.22], [2.0, 2.2], [3.0, 3.37], [4.0, 4.5], [5.0, 10.03], [13.0, 18.64], [19.0, 18.67], [19.0, 18.71], [19.0, 18.74], [19.0, 21.98], [23.0, 23.21], [24.0, 24.22], [27.0, 27.7], [29.0, 49.11], [49.0, 50.21], [55.0, 55.07], [57.0, 57.18], [58.0, 58.01], [59.0, 59.14], [60.0, 60.61], [61.0, 63.86], [64.0, 64.52], [74.0, 91.17], [95.0, 96.25], [100.0, 99.71], [102.0, 102.12], [103.0, 104.13], [107.0, 110.59], [112.0, 112.94], [113.0, 112.97]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.73, 30.05, 0.0, 0.0, 0.0, 31.24, 0.0, 0.0, 0.0, 32.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.3, 0.0, 37.17, 0.0, 0.0, 0.0, 0.0, 37.42, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 40.91], ["livestock, farm animals, working animals", 13.28], ["cattle, bovinae", 10.73]], [["music", 67.85], ["speech", 6.4], ["mosquito", 5.99]], null, null, null, [["electric shaver, electric razor", 34.81], ["cattle, bovinae", 20.04], ["speech", 12.07]], null, null, null, [["livestock, farm animals, working animals", 53.53], ["buzz", 10.25], ["cattle, bovinae", 6.93]], null, null, null, null, null, null, [["speech", 57.68], ["fly, housefly", 4.58], ["insect", 3.5]], null, [["beatboxing", 14.03], ["mosquito", 13.18], ["noise", 12.99]], null, null, null, null, [["livestock, farm animals, working animals", 25.27], ["fly, housefly", 19.78], ["insect", 9.92]], null, null], "duration": [1.22, 0.2, 0.37, 0.5, 5.03, 5.64, -0.33, -0.29, -0.26, 2.98, 0.21, 0.22, 0.7, 20.11, 1.21, 0.07, 0.18, 0.01, 0.14, 0.61, 2.86, 0.52, 17.17, 1.25, -0.29, 0.12, 1.13, 3.59, 0.94, -0.03]} \ No newline at end of file diff --git a/annotations_1/0ekAvNp_F9c_filtered.json b/annotations_1/0ekAvNp_F9c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ba935e339bc6c30eb598b490fb975d6c92dc35f --- /dev/null +++ b/annotations_1/0ekAvNp_F9c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [8.0, 9.07], [10.0, 10.34], [13.0, 14.03], [16.0, 17.02], [18.0, 20.65], [22.0, 22.4], [24.0, 23.79], [29.0, 29.73], [31.0, 32.66], [39.0, 39.6], [41.0, 41.5], [49.0, 52.68], [57.0, 58.48], [64.0, 66.12], [79.0, 80.13], [86.0, 88.33], [96.0, 100.7], [102.0, 112.11], [113.0, 113.31], [114.0, 152.49], [153.0, 152.86], [154.0, 162.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 69.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.9, 0.0, 72.75, 0.0, 73.21, 36.07, 32.96, 0.0, 0.0, 0.0, 29.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.78], ["singing bowl", 22.86], ["speech", 22.05]], null, null, null, null, [["music", 55.35], ["electronic music", 5.92], ["sonar", 4.85]], [["hum", 31.75], ["music", 28.14], ["gong", 9.61]], null, null, null, [["music", 41.49], ["speech", 11.54], ["scary music", 7.45]]], "duration": [1.0, 1.07, 0.34, 1.03, 1.02, 2.65, 0.4, -0.21, 0.73, 1.66, 0.6, 0.5, 3.68, 1.48, 2.12, 1.13, 2.33, 4.7, 10.11, 0.31, 38.49, -0.14, 8.36]} \ No newline at end of file diff --git a/annotations_1/0g2o-CfakW0_filtered.json b/annotations_1/0g2o-CfakW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b920f7a7e1c8ff05a8f2c44d2bf17a056c89608d --- /dev/null +++ b/annotations_1/0g2o-CfakW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.87], [5.0, 5.58], [6.0, 6.91], [7.0, 8.04], [10.0, 18.05], [19.0, 20.6], [22.0, 21.91], [23.0, 24.95], [28.0, 30.38], [33.0, 33.71], [34.0, 34.97], [36.0, 36.26], [37.0, 38.62], [40.0, 42.62], [44.0, 44.54], [46.0, 45.86], [47.0, 47.04], [48.0, 65.2], [67.0, 67.04], [68.0, 68.54], [69.0, 70.23], [73.0, 73.8], [76.0, 77.77], [79.0, 81.57], [82.0, 83.61], [85.0, 85.56], [86.0, 86.78], [87.0, 87.34], [88.0, 88.7], [89.0, 90.21], [91.0, 92.21], [95.0, 95.64], [96.0, 96.85], [97.0, 97.93], [98.0, 100.21], [101.0, 102.25], [103.0, 110.02], [111.0, 115.86], [117.0, 120.73], [125.0, 124.85], [126.0, 126.15], [127.0, 130.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 50.71, 0.0, 0.0, 0.0, 66.15, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 51.39, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.28, 0.0, 53.34, 39.17, 36.32, 0.0, 0.0, 38.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 63.96], ["creak", 5.63], ["whale vocalization", 2.44]], null, null, [["speech", 58.25], ["music", 14.96], ["mains hum", 1.83]], [["music", 20.36], ["hum", 12.12], ["speech", 10.9]], null, null, [["mains hum", 16.88], ["hum", 16.38], ["music", 14.62]]], "duration": [0.87, 0.58, 0.91, 1.04, 8.05, 1.6, -0.09, 1.95, 2.38, 0.71, 0.97, 0.26, 1.62, 2.62, 0.54, -0.14, 0.04, 17.2, 0.04, 0.54, 1.23, 0.8, 1.77, 2.57, 1.61, 0.56, 0.78, 0.34, 0.7, 1.21, 1.21, 0.64, 0.85, 0.93, 2.21, 1.25, 7.02, 4.86, 3.73, -0.15, 0.15, 3.77]} \ No newline at end of file diff --git a/annotations_1/0h0FeEzxCaM_filtered.json b/annotations_1/0h0FeEzxCaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c43ed34220ceaa5113b8326389d87bacfa304a94 --- /dev/null +++ b/annotations_1/0h0FeEzxCaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 57.99], [60.0, 63.49], [65.0, 86.58], [88.0, 88.42], [89.0, 94.29], [95.0, 95.81], [97.0, 97.88], [99.0, 99.45], [100.0, 114.84], [115.0, 124.09], [124.0, 128.12], [128.0, 196.53]], "keep_status": [false, false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 47.31, 31.52, 0.0, 40.88, 0.0, 0.0, 0.0, 32.29, 35.03, 51.07, 0.0], "audiomae_on_audioset": [null, [["music", 69.99], ["hum", 5.14], ["electronic music", 3.66]], [["mains hum", 33.39], ["music", 30.24], ["hum", 18.71]], null, [["sine wave", 19.41], ["speech", 17.53], ["tuning fork", 3.99]], null, null, null, [["fly, housefly", 15.51], ["speech", 8.33], ["insect", 7.51]], [["fly, housefly", 24.94], ["insect", 16.43], ["hum", 12.29]], null, null], "duration": [56.99, 3.49, 21.58, 0.42, 5.29, 0.81, 0.88, 0.45, 14.84, 9.09, 4.12, 68.53]} \ No newline at end of file diff --git a/annotations_1/0h0S6EmQWrI_filtered.json b/annotations_1/0h0S6EmQWrI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a04f853a749d0db4cbaca01b4bf05f75ffb5d152 --- /dev/null +++ b/annotations_1/0h0S6EmQWrI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.88], [15.0, 36.17], [38.0, 91.42], [96.0, 100.99], [102.0, 102.42], [103.0, 103.2], [108.0, 118.57], [121.0, 121.78], [122.0, 121.83], [122.0, 123.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.71, 0.0, 31.02, 0.0, 0.0, 30.75, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["throbbing", 41.03], ["music", 29.53], ["hum", 21.25]], null, [["whale vocalization", 68.18], ["music", 13.5], ["noise", 3.38]], null, null, [["music", 66.94], ["throbbing", 7.62], ["electronic music", 6.26]], null, null, null], "duration": [0.88, 21.17, 53.42, 4.99, 0.42, 0.2, 10.57, 0.78, -0.17, 1.57]} \ No newline at end of file diff --git a/annotations_1/0hNbRd78jOE_filtered.json b/annotations_1/0hNbRd78jOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb63a5fa9d2d8a852360f56a2342353e7050669c --- /dev/null +++ b/annotations_1/0hNbRd78jOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.44], [8.0, 9.05], [12.0, 11.84], [20.0, 20.39], [28.0, 31.65], [33.0, 33.34], [37.0, 37.37], [41.0, 41.81], [46.0, 46.89], [49.0, 49.71], [52.0, 53.38], [56.0, 57.16], [59.0, 59.56], [65.0, 70.07], [72.0, 72.84], [74.0, 76.0], [78.0, 78.75], [81.0, 85.58], [92.0, 93.38], [93.0, 94.53], [99.0, 99.76], [101.0, 103.08], [105.0, 105.6], [108.0, 109.46], [110.0, 111.87], [114.0, 114.15], [121.0, 122.08], [122.0, 123.36], [125.0, 125.29], [126.0, 126.45], [129.0, 131.73], [136.0, 137.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 46.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.47, 0.0, 35.85, 0.0, 37.99, 0.0, 0.0, 0.0, 49.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.41, 0.0], "audiomae_on_audioset": [null, null, null, null, [["moo", 36.0], ["cattle, bovinae", 32.17], ["livestock, farm animals, working animals", 28.38]], null, null, null, null, null, null, null, null, null, null, [["speech", 34.76], ["crowd", 8.95], ["fireworks", 4.79]], null, [["speech", 33.16], ["music", 15.6], ["boing", 9.01]], null, null, null, [["moo", 23.19], ["speech", 22.48], ["cattle, bovinae", 15.64]], null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 1.05, -0.16, 0.39, 3.65, 0.34, 0.37, 0.81, 0.89, 0.71, 1.38, 1.16, 0.56, 5.07, 0.84, 2.0, 0.75, 4.58, 1.38, 1.53, 0.76, 2.08, 0.6, 1.46, 1.87, 0.15, 1.08, 1.36, 0.29, 0.45, 2.73, 1.29]} \ No newline at end of file diff --git a/annotations_1/0iUKZskQEso_filtered.json b/annotations_1/0iUKZskQEso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80b742f63450fb0df3482ac16dcc80d308bd23de --- /dev/null +++ b/annotations_1/0iUKZskQEso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 22.96], [52.0, 52.2], [64.0, 65.01], [83.0, 97.55], [103.0, 103.18], [121.0, 121.9], [139.0, 165.86], [173.0, 174.04], [179.0, 179.85]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.99, 0.0, 0.0, 47.62, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 83.9], ["quack", 4.29], ["bleat", 1.55]], null, null, [["cattle, bovinae", 35.97], ["moo", 34.15], ["livestock, farm animals, working animals", 21.9]], null, null], "duration": [-0.04, 0.2, 1.01, 14.55, 0.18, 0.9, 26.86, 1.04, 0.85]} \ No newline at end of file diff --git a/annotations_1/0igqAlu8Oqc_filtered.json b/annotations_1/0igqAlu8Oqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e0b55a7b54dafa480c5f2366bab572e7e930981 --- /dev/null +++ b/annotations_1/0igqAlu8Oqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.25], [22.0, 23.43], [29.0, 29.81], [46.0, 46.53], [49.0, 50.67], [62.0, 62.94], [68.0, 68.0], [70.0, 75.25], [76.0, 77.03], [83.0, 84.06], [91.0, 91.08], [92.0, 92.33], [96.0, 105.29], [114.0, 124.44], [134.0, 136.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 34.32, 36.7, 52.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 24.92], ["explosion", 24.06], ["music", 20.63]], [["speech", 68.48], ["music", 15.67], ["sidetone", 2.96]], null], "duration": [1.25, 1.43, 0.81, 0.53, 1.67, 0.94, 0.0, 5.25, 1.03, 1.06, 0.08, 0.33, 9.29, 10.44, 2.14]} \ No newline at end of file diff --git a/annotations_1/0k_yjEiPLoc_filtered.json b/annotations_1/0k_yjEiPLoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d655308b574172dcf24d92d8a5f3244bd434dc61 --- /dev/null +++ b/annotations_1/0k_yjEiPLoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.46], [17.0, 23.16], [24.0, 24.83], [25.0, 26.28], [27.0, 32.04], [32.0, 33.94], [34.0, 35.67], [36.0, 38.57], [42.0, 43.46], [44.0, 45.37], [46.0, 48.22], [53.0, 54.41], [55.0, 55.76], [56.0, 56.47], [64.0, 64.88], [66.0, 65.87], [68.0, 68.08], [72.0, 73.18], [76.0, 96.94], [97.0, 113.29], [114.0, 131.55]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 41.07, 0.0, 0.0, 39.3, 0.0, 0.0, 44.32, 0.0, 0.0, 62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.76, 32.97, 32.1], "audiomae_on_audioset": [null, [["domestic animals, pets", 18.21], ["dog", 17.27], ["animal", 13.9]], null, null, [["speech", 72.58], ["inside, small room", 2.6], ["heart sounds, heartbeat", 2.26]], null, null, [["hum", 51.22], ["mains hum", 36.66], ["speech", 5.17]], null, null, null, null, null, null, null, null, null, null, [["speech", 13.07], ["burst, pop", 10.52], ["music", 10.27]], [["sidetone", 28.42], ["busy signal", 23.37], ["music", 5.35]], [["fly, housefly", 20.84], ["insect", 14.55], ["mosquito", 12.42]]], "duration": [1.46, 6.16, 0.83, 1.28, 5.04, 1.94, 1.67, 2.57, 1.46, 1.37, 2.22, 1.41, 0.76, 0.47, 0.88, -0.13, 0.08, 1.18, 20.94, 16.29, 17.55]} \ No newline at end of file diff --git a/annotations_1/0lCR_c5Su1M_filtered.json b/annotations_1/0lCR_c5Su1M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5477ae1a0d2fecabbce0d6c40461c4854e803c8 --- /dev/null +++ b/annotations_1/0lCR_c5Su1M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.86], [13.0, 33.56], [38.0, 42.11], [44.0, 53.45], [56.0, 82.09], [86.0, 121.1], [135.0, 148.04], [150.0, 150.26]], "keep_status": [false, false, true, true, false, false, false, false], "silence_prob": [30.85, 30.83, 31.59, 31.73, 30.36, 0.0, 31.08, 0.0], "audiomae_on_audioset": [[["didgeridoo", 45.36], ["music", 24.43], ["speech", 7.76]], [["didgeridoo", 45.96], ["music", 41.97], ["musical instrument", 2.4]], [["music", 42.22], ["effects unit", 9.8], ["hum", 7.5]], [["music", 33.66], ["throbbing", 15.46], ["hum", 14.49]], [["music", 74.79], ["musical instrument", 3.94], ["hum", 3.89]], null, [["music", 65.01], ["hum", 7.98], ["throbbing", 5.1]], null], "duration": [6.86, 20.56, 4.11, 9.45, 26.09, 35.1, 13.04, 0.26]} \ No newline at end of file diff --git a/annotations_1/0m5VGBc8VrQ_filtered.json b/annotations_1/0m5VGBc8VrQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2b85e3b55656c2ee6ff7229084cc9f2e5c309bb --- /dev/null +++ b/annotations_1/0m5VGBc8VrQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 37.81], [38.0, 38.65], [40.0, 40.49], [41.0, 42.47], [45.0, 48.51], [53.0, 53.82], [55.0, 56.17], [58.0, 59.02], [62.0, 63.48], [67.0, 67.44], [70.0, 70.82], [74.0, 74.21], [75.0, 76.62], [78.0, 78.17], [80.0, 80.76], [81.0, 83.22], [84.0, 85.11], [88.0, 89.34], [93.0, 94.58], [95.0, 96.11], [99.0, 99.44], [106.0, 106.47], [107.0, 109.39], [111.0, 111.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 72.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.65, 0.49, 1.47, 3.51, 0.82, 1.17, 1.02, 1.48, 0.44, 0.82, 0.21, 1.62, 0.17, 0.76, 2.22, 1.11, 1.34, 1.58, 1.11, 0.44, 0.47, 2.39, 0.97]} \ No newline at end of file diff --git a/annotations_1/0mPTGVoG248_filtered.json b/annotations_1/0mPTGVoG248_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2437c6555036c53fd9e3a5a4dd8ac65ca9873be --- /dev/null +++ b/annotations_1/0mPTGVoG248_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[58.0, 104.13], [106.0, 122.79], [124.0, 130.05], [130.0, 130.1], [131.0, 151.5]], "keep_status": [false, true, true, false, true], "silence_prob": [0.0, 29.22, 28.78, 0.0, 29.34], "audiomae_on_audioset": [null, [["whack, thwack", 30.18], ["sound effect", 13.52], ["music", 8.38]], [["music", 41.98], ["breaking", 15.96], ["reverberation", 6.81]], null, [["breaking", 21.5], ["smash, crash", 19.92], ["music", 7.89]]], "duration": [46.13, 16.79, 6.05, 0.1, 20.5]} \ No newline at end of file diff --git a/annotations_1/0mRRULBvuj0_filtered.json b/annotations_1/0mRRULBvuj0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89ba791e4f88ac564c0ad22aa41d7fe7384dc6bd --- /dev/null +++ b/annotations_1/0mRRULBvuj0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.2], [23.0, 24.49], [26.0, 27.03], [31.0, 32.36], [35.0, 35.88], [39.0, 39.72], [44.0, 44.19], [50.0, 50.58], [53.0, 54.11], [56.0, 56.2], [57.0, 60.44], [61.0, 63.04], [76.0, 77.36], [80.0, 80.69], [96.0, 97.46], [99.0, 100.45], [106.0, 106.19], [109.0, 173.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.82, 39.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 62.92], ["throbbing", 4.74], ["drum machine", 2.73]], [["music", 38.7], ["throbbing", 15.96], ["hum", 14.75]], null, null, null, null, null, null], "duration": [1.2, 1.49, 1.03, 1.36, 0.88, 0.72, 0.19, 0.58, 1.11, 0.2, 3.44, 2.04, 1.36, 0.69, 1.46, 1.45, 0.19, 64.89]} \ No newline at end of file diff --git a/annotations_1/0mjSZpCpsdc_filtered.json b/annotations_1/0mjSZpCpsdc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb4011abb76777d8eebb2ee00deeb77ffea32346 --- /dev/null +++ b/annotations_1/0mjSZpCpsdc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.72], [10.0, 10.4], [14.0, 27.21], [33.0, 33.4], [35.0, 92.15], [93.0, 95.32], [96.0, 98.41], [99.0, 101.93], [102.0, 111.21], [115.0, 117.69], [119.0, 119.35], [121.0, 123.79], [124.0, 124.39], [126.0, 127.89], [132.0, 132.26], [135.0, 135.35], [137.0, 136.95], [138.0, 139.14], [142.0, 142.87], [143.0, 143.99], [144.0, 146.11], [148.0, 149.12], [152.0, 152.04], [156.0, 157.1], [158.0, 158.87], [160.0, 161.82], [163.0, 165.79]], "keep_status": [false, false, true, false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [76.2, 0.0, 30.94, 0.0, 0.0, 46.05, 38.51, 39.96, 38.59, 46.57, 0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.85, 0.0, 0.0, 0.0, 0.0, 0.0, 75.55], "audiomae_on_audioset": [null, null, [["breaking", 27.64], ["music", 18.11], ["hum", 8.07]], null, null, [["music", 23.87], ["speech", 21.72], ["singing bowl", 20.71]], [["tuning fork", 42.59], ["sine wave", 32.82], ["chirp tone", 10.38]], [["speech", 31.74], ["music", 18.98], ["singing bowl", 16.37]], [["hum", 33.08], ["speech", 32.18], ["mains hum", 12.81]], [["hum", 31.94], ["speech", 20.27], ["throbbing", 14.94]], null, null, null, null, null, null, null, null, null, null, [["speech", 61.96], ["animal", 3.28], ["dog", 2.59]], null, null, null, null, null, null], "duration": [5.72, 0.4, 13.21, 0.4, 57.15, 2.32, 2.41, 2.93, 9.21, 2.69, 0.35, 2.79, 0.39, 1.89, 0.26, 0.35, -0.05, 1.14, 0.87, 0.99, 2.11, 1.12, 0.04, 1.1, 0.87, 1.82, 2.79]} \ No newline at end of file diff --git a/annotations_1/0mmSi-63Y9U_filtered.json b/annotations_1/0mmSi-63Y9U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..221928fd0780e3b7b2643f21a8e26da3a63133d0 --- /dev/null +++ b/annotations_1/0mmSi-63Y9U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.0], [4.0, 4.19], [8.0, 8.46], [14.0, 15.23], [22.0, 23.16], [25.0, 27.14], [32.0, 34.74], [35.0, 36.95], [43.0, 42.84], [46.0, 46.31], [48.0, 47.87], [48.0, 49.49], [53.0, 54.18], [56.0, 55.68], [56.0, 56.51], [59.0, 59.85], [63.0, 63.58], [65.0, 65.42], [77.0, 77.99], [78.0, 79.73], [88.0, 88.23], [89.0, 89.99], [98.0, 98.05], [100.0, 99.96], [102.0, 102.64], [104.0, 104.46], [116.0, 116.28], [125.0, 125.27], [126.0, 126.44], [128.0, 127.79], [130.0, 129.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 62.07, 52.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 0.19, 0.46, 1.23, 1.16, 2.14, 2.74, 1.95, -0.16, 0.31, -0.13, 1.49, 1.18, -0.32, 0.51, 0.85, 0.58, 0.42, 0.99, 1.73, 0.23, 0.99, 0.05, -0.04, 0.64, 0.46, 0.28, 0.27, 0.44, -0.21, -0.05]} \ No newline at end of file diff --git a/annotations_1/0noY-XrAJRg_filtered.json b/annotations_1/0noY-XrAJRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2a84c6f4f7ff1d3bd1f5665f9a50385c0b12c18 --- /dev/null +++ b/annotations_1/0noY-XrAJRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.74], [4.0, 5.7], [6.0, 7.72], [10.0, 11.92], [14.0, 22.18], [24.0, 24.54], [25.0, 25.56], [29.0, 30.38], [31.0, 32.66], [33.0, 36.24], [37.0, 38.3], [39.0, 39.04], [39.0, 39.95], [40.0, 40.34], [40.0, 40.8], [41.0, 41.2], [47.0, 47.17], [49.0, 48.66], [49.0, 49.28], [49.0, 49.96], [51.0, 51.34], [53.0, 53.5], [55.0, 55.8], [57.0, 56.84], [59.0, 59.44], [60.0, 61.53], [62.0, 62.92], [64.0, 67.19], [68.0, 69.13], [71.0, 70.97], [72.0, 72.45], [74.0, 91.03], [92.0, 92.23], [97.0, 97.7], [98.0, 150.13], [152.0, 154.01], [155.0, 157.96], [160.0, 160.88], [162.0, 165.03], [167.0, 176.17]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 0.0, 71.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 0.0, 33.26, 0.0, 0.0, 0.0, 46.29, 32.63, 0.0, 31.46, 32.15], "audiomae_on_audioset": [null, null, null, null, [["music", 35.74], ["hum", 10.53], ["mains hum", 7.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.14], ["speech", 28.29], ["hum", 4.79]], null, null, null, [["music", 68.15], ["scary music", 7.54], ["ambient music", 2.74]], [["music", 15.45], ["theremin", 9.62], ["didgeridoo", 8.93]], null, [["music", 27.84], ["hum", 17.24], ["throbbing", 13.45]], [["music", 31.36], ["speech", 16.8], ["thunk", 8.34]]], "duration": [1.74, 1.7, 1.72, 1.92, 8.18, 0.54, 0.56, 1.38, 1.66, 3.24, 1.3, 0.04, 0.95, 0.34, 0.8, 0.2, 0.17, -0.34, 0.28, 0.96, 0.34, 0.5, 0.8, -0.16, 0.44, 1.53, 0.92, 3.19, 1.13, -0.03, 0.45, 17.03, 0.23, 0.7, 52.13, 2.01, 2.96, 0.88, 3.03, 9.17]} \ No newline at end of file diff --git a/annotations_1/0o9Fm3hnpYQ_filtered.json b/annotations_1/0o9Fm3hnpYQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04877033f4a8cb3ac51f50d872f8502e0bb4571b --- /dev/null +++ b/annotations_1/0o9Fm3hnpYQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [10.0, 10.45], [12.0, 15.18], [22.0, 22.76], [27.0, 32.05], [39.0, 39.99], [41.0, 41.76], [43.0, 46.8], [48.0, 52.02], [65.0, 65.91], [66.0, 67.54], [82.0, 82.16], [84.0, 85.29], [96.0, 96.65], [97.0, 100.18], [101.0, 107.32], [110.0, 113.73], [123.0, 139.72], [142.0, 147.87], [149.0, 150.13], [150.0, 151.71], [152.0, 153.37], [164.0, 164.76], [168.0, 167.81], [173.0, 173.23]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, true, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.07, 0.0, 41.38, 0.0, 0.0, 46.22, 41.89, 0.0, 0.0, 0.0, 0.0, 0.0, 40.07, 38.71, 36.37, 42.51, 60.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 81.19], ["theremin", 6.56], ["musical instrument", 2.5]], null, [["music", 75.52], ["musical instrument", 3.12], ["synthesizer", 1.52]], null, null, [["music", 51.93], ["boing", 7.11], ["hum", 3.69]], [["music", 28.61], ["wail, moan", 6.22], ["fly, housefly", 5.13]], null, null, null, null, null, [["music", 40.69], ["speech", 25.13], ["musical instrument", 2.98]], [["music", 28.93], ["mains hum", 19.27], ["hum", 13.23]], [["music", 57.12], ["livestock, farm animals, working animals", 3.76], ["animal", 3.62]], [["music", 49.57], ["speech", 11.42], ["musical instrument", 7.51]], null, null, null, null, null, null, null], "duration": [0.64, 0.45, 3.18, 0.76, 5.05, 0.99, 0.76, 3.8, 4.02, 0.91, 1.54, 0.16, 1.29, 0.65, 3.18, 6.32, 3.73, 16.72, 5.87, 1.13, 1.71, 1.37, 0.76, -0.19, 0.23]} \ No newline at end of file diff --git a/annotations_1/0oFdsgLP8n8_filtered.json b/annotations_1/0oFdsgLP8n8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c483485b8350df26133ba2acffe2ca809b7d56fc --- /dev/null +++ b/annotations_1/0oFdsgLP8n8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [5.0, 6.02], [11.0, 13.69], [16.0, 16.44], [17.0, 17.58], [19.0, 20.21], [24.0, 25.22], [26.0, 26.47], [28.0, 30.11], [36.0, 36.54], [40.0, 41.76], [52.0, 52.57], [57.0, 59.58], [63.0, 65.08], [70.0, 71.04], [75.0, 75.36], [78.0, 78.26], [80.0, 82.65], [84.0, 84.01], [86.0, 88.08], [94.0, 94.49], [96.0, 96.84], [101.0, 100.9], [103.0, 103.72], [105.0, 105.0], [108.0, 109.59], [110.0, 110.4], [112.0, 113.53], [114.0, 115.05], [117.0, 118.25], [121.0, 122.18], [125.0, 125.34], [126.0, 126.44], [129.0, 129.93], [133.0, 135.84], [137.0, 137.76], [140.0, 141.35]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.2, 0.0, 0.0, 0.0, 32.1, 76.86, 0.0, 0.0, 0.0, 100.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["sine wave", 19.64], ["sidetone", 16.27], ["busy signal", 13.58]], null, null, null, [["speech", 56.03], ["quack", 10.18], ["music", 8.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 1.02, 2.69, 0.44, 0.58, 1.21, 1.22, 0.47, 2.11, 0.54, 1.76, 0.57, 2.58, 2.08, 1.04, 0.36, 0.26, 2.65, 0.01, 2.08, 0.49, 0.84, -0.1, 0.72, 0.0, 1.59, 0.4, 1.53, 1.05, 1.25, 1.18, 0.34, 0.44, 0.93, 2.84, 0.76, 1.35]} \ No newline at end of file diff --git a/annotations_1/0osA8jKKotc_filtered.json b/annotations_1/0osA8jKKotc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..642baf7ec41615a654ed5d7bb20c012f687b6d5c --- /dev/null +++ b/annotations_1/0osA8jKKotc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.68], [11.0, 12.06], [13.0, 15.4], [16.0, 18.94], [22.0, 23.7], [24.0, 27.41], [29.0, 32.66], [36.0, 52.0], [52.0, 60.57], [65.0, 66.53], [67.0, 70.77], [72.0, 71.79], [73.0, 73.65], [75.0, 75.2], [76.0, 78.51], [80.0, 80.05], [81.0, 82.27], [83.0, 114.94], [116.0, 136.85], [140.0, 140.49], [142.0, 148.29], [149.0, 149.49], [150.0, 151.09], [153.0, 157.45], [158.0, 158.5], [159.0, 162.3], [165.0, 164.78], [172.0, 173.4], [175.0, 175.02], [175.0, 176.42], [181.0, 192.33], [194.0, 194.05], [196.0, 197.28], [198.0, 198.63], [202.0, 202.32], [203.0, 204.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.05, 95.51, 0.0, 98.36, 97.54, 99.16, 99.98, 0.0, 80.46, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 32.94, 0.0, 74.92, 0.0, 0.0, 43.93, 0.0, 39.8, 0.0, 0.0, 0.0, 0.0, 31.19, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 31.99], ["grunt", 22.55], ["cattle, bovinae", 16.11]], null, null, null, null, [["music", 40.69], ["speech", 10.2], ["synthesizer", 8.17]], null, [["music", 37.02], ["speech", 24.36], ["foghorn", 4.94]], null, null, null, null, [["music", 36.39], ["theremin", 29.74], ["synthesizer", 10.16]], null, null, null, null, null], "duration": [1.68, 1.06, 2.4, 2.94, 1.7, 3.41, 3.66, 16.0, 8.57, 1.53, 3.77, -0.21, 0.65, 0.2, 2.51, 0.05, 1.27, 31.94, 20.85, 0.49, 6.29, 0.49, 1.09, 4.45, 0.5, 3.3, -0.22, 1.4, 0.02, 1.42, 11.33, 0.05, 1.28, 0.63, 0.32, 1.97]} \ No newline at end of file diff --git a/annotations_1/0p2Oyd040pg_filtered.json b/annotations_1/0p2Oyd040pg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27dd3ff9cd348b46dfc97a4cf7c72359cc092e1c --- /dev/null +++ b/annotations_1/0p2Oyd040pg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.45], [12.0, 14.71], [15.0, 16.73], [17.0, 17.56], [18.0, 19.63], [22.0, 22.55], [25.0, 26.08], [27.0, 28.05], [30.0, 33.44], [35.0, 43.21], [46.0, 46.33], [50.0, 50.16], [60.0, 62.23], [71.0, 71.2], [73.0, 72.66], [73.0, 73.58], [75.0, 75.27], [77.0, 78.21], [79.0, 88.96], [91.0, 92.75], [94.0, 95.32], [96.0, 97.95], [99.0, 99.55], [101.0, 104.06], [104.0, 104.72], [110.0, 112.83], [116.0, 155.75], [156.0, 158.21], [161.0, 161.81], [163.0, 163.58], [171.0, 193.89], [196.0, 235.75], [238.0, 238.74], [240.0, 255.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 39.17, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 31.31, 0.0, 98.27, 0.0, 87.92, 0.0, 0.0, 32.0, 0.0, 0.0, 30.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 71.71], ["hum", 4.69], ["sidetone", 3.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 17.52], ["speech", 16.22], ["inside, small room", 6.27]], null, null, null, null, null, null, [["noise", 35.34], ["hum", 7.87], ["music", 7.87]], null, null, [["music", 36.42], ["speech", 22.17], ["synthesizer", 6.06]]], "duration": [0.45, 2.71, 1.73, 0.56, 1.63, 0.55, 1.08, 1.05, 3.44, 8.21, 0.33, 0.16, 2.23, 0.2, -0.34, 0.58, 0.27, 1.21, 9.96, 1.75, 1.32, 1.95, 0.55, 3.06, 0.72, 2.83, 39.75, 2.21, 0.81, 0.58, 22.89, 39.75, 0.74, 15.9]} \ No newline at end of file diff --git a/annotations_1/0p9Q6tDJJ1w_filtered.json b/annotations_1/0p9Q6tDJJ1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..031ab03aead9de9f30447ad1564c806ab366d6d2 --- /dev/null +++ b/annotations_1/0p9Q6tDJJ1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.77], [9.0, 9.76], [12.0, 13.09], [14.0, 15.77], [18.0, 41.47], [43.0, 42.77], [44.0, 44.37], [48.0, 48.79], [50.0, 51.07], [53.0, 55.54], [57.0, 58.08], [62.0, 62.51], [63.0, 63.48], [66.0, 66.29], [75.0, 77.5], [80.0, 80.2], [83.0, 83.67], [85.0, 90.24], [90.0, 91.18], [94.0, 94.09], [96.0, 96.25], [97.0, 97.97], [100.0, 103.77], [104.0, 106.74], [108.0, 108.85], [113.0, 113.8], [116.0, 117.1], [123.0, 124.53], [126.0, 131.46], [135.0, 136.98], [137.0, 138.77], [139.0, 159.36], [161.0, 161.55], [162.0, 161.89], [164.0, 164.24], [165.0, 165.99]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.26, 0.0, 0.0, 0.0, 0.0, 99.36, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 82.61, 0.0, 0.0, 0.0, 0.0, 91.13, 99.21, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 57.97, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 25.25], ["didgeridoo", 14.19], ["music", 11.99]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.77, 0.76, 1.09, 1.77, 23.47, -0.23, 0.37, 0.79, 1.07, 2.54, 1.08, 0.51, 0.48, 0.29, 2.5, 0.2, 0.67, 5.24, 1.18, 0.09, 0.25, 0.97, 3.77, 2.74, 0.85, 0.8, 1.1, 1.53, 5.46, 1.98, 1.77, 20.36, 0.55, -0.11, 0.24, 0.99]} \ No newline at end of file diff --git a/annotations_1/0pRYoClF9w4_filtered.json b/annotations_1/0pRYoClF9w4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76cd5153add907b4c55c9108cc0ed55f9510e13b --- /dev/null +++ b/annotations_1/0pRYoClF9w4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.11], [9.0, 9.15], [14.0, 15.08], [16.0, 19.9], [27.0, 27.73], [30.0, 31.23], [35.0, 36.26], [40.0, 43.04], [48.0, 56.88], [59.0, 60.93], [64.0, 65.7], [67.0, 68.77], [73.0, 73.74], [78.0, 84.81], [89.0, 90.56], [92.0, 91.99], [92.0, 92.1], [94.0, 116.53], [126.0, 126.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [62.17, 0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 67.25, 91.81, 0.0, 0.0, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 50.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.11, 0.15, 1.08, 3.9, 0.73, 1.23, 1.26, 3.04, 8.88, 1.93, 1.7, 1.77, 0.74, 6.81, 1.56, -0.01, 0.1, 22.53, 0.74]} \ No newline at end of file diff --git a/annotations_1/0pUMzDEV-DE_filtered.json b/annotations_1/0pUMzDEV-DE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a1ae652a0eb39afed853e0a19e15bdfc252f086 --- /dev/null +++ b/annotations_1/0pUMzDEV-DE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 20.87], [23.0, 22.99], [25.0, 31.46], [32.0, 32.91], [38.0, 42.69], [44.0, 51.87], [53.0, 59.53], [63.0, 83.1], [83.0, 84.25], [87.0, 109.19], [110.0, 118.39]], "keep_status": [true, false, true, false, true, false, false, false, false, true, true], "silence_prob": [29.9, 0.0, 32.38, 0.0, 29.36, 29.54, 29.63, 29.58, 0.0, 29.52, 29.5], "audiomae_on_audioset": [[["music", 51.25], ["throbbing", 8.94], ["hum", 5.97]], null, [["sonar", 22.16], ["rumble", 22.15], ["music", 13.55]], null, [["hum", 30.36], ["mains hum", 21.56], ["throbbing", 12.03]], [["music", 53.81], ["didgeridoo", 10.6], ["throbbing", 9.18]], [["music", 58.99], ["throbbing", 12.65], ["didgeridoo", 6.33]], [["music", 49.89], ["speech", 14.18], ["throbbing", 7.4]], null, [["music", 31.35], ["speech", 20.29], ["hum", 16.42]], [["speech", 36.74], ["hum", 12.46], ["music", 10.54]]], "duration": [4.87, -0.01, 6.46, 0.91, 4.69, 7.87, 6.53, 20.1, 1.25, 22.19, 8.39]} \ No newline at end of file diff --git a/annotations_1/0qkVyahL10U_filtered.json b/annotations_1/0qkVyahL10U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e42a0a98e841e7c0794846b0ef5a84f231666b6 --- /dev/null +++ b/annotations_1/0qkVyahL10U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.65], [7.0, 8.68], [16.0, 16.26], [18.0, 18.5], [27.0, 27.7], [46.0, 46.82], [49.0, 50.5], [53.0, 54.99], [59.0, 59.98], [66.0, 66.5], [78.0, 78.75], [83.0, 84.54], [86.0, 87.07], [88.0, 89.11], [90.0, 90.29], [91.0, 92.2], [92.0, 94.12], [104.0, 104.19], [115.0, 115.92], [144.0, 160.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.69, 0.0, 0.0, 74.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.29], ["sine wave", 22.56], ["dial tone", 10.88]], null, null, null], "duration": [0.65, 1.68, 0.26, 0.5, 0.7, 0.82, 1.5, 1.99, 0.98, 0.5, 0.75, 1.54, 1.07, 1.11, 0.29, 1.2, 2.12, 0.19, 0.92, 16.95]} \ No newline at end of file diff --git a/annotations_1/0quxzV2i_gQ_filtered.json b/annotations_1/0quxzV2i_gQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2db3fbfb80c9d5f68980a7155c5d7446914fe3e --- /dev/null +++ b/annotations_1/0quxzV2i_gQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.91], [25.0, 26.0], [33.0, 35.88], [37.0, 38.21], [39.0, 39.36], [44.0, 44.58], [47.0, 47.61], [48.0, 49.03], [50.0, 50.36], [54.0, 54.63], [56.0, 56.88], [58.0, 58.83], [59.0, 59.43], [62.0, 62.18], [66.0, 66.29], [69.0, 70.06], [73.0, 73.38], [78.0, 79.47], [81.0, 82.39], [87.0, 101.92], [105.0, 112.95], [116.0, 117.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 40.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.01, 28.54, 0.0], "audiomae_on_audioset": [null, null, [["hum", 50.72], ["mains hum", 15.49], ["throbbing", 9.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 55.07], ["throbbing", 21.17], ["music", 8.92]], [["music", 82.25], ["beatboxing", 2.39], ["synthetic singing", 1.09]], null], "duration": [0.91, 1.0, 2.88, 1.21, 0.36, 0.58, 0.61, 1.03, 0.36, 0.63, 0.88, 0.83, 0.43, 0.18, 0.29, 1.06, 0.38, 1.47, 1.39, 14.92, 7.95, 1.34]} \ No newline at end of file diff --git a/annotations_1/0qzRQ3qxv5Y_filtered.json b/annotations_1/0qzRQ3qxv5Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61abea0fc1166cff88c756632cc6843419f6d436 --- /dev/null +++ b/annotations_1/0qzRQ3qxv5Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.92], [10.0, 20.82], [24.0, 47.87], [50.0, 51.14], [53.0, 53.49], [60.0, 72.39], [74.0, 139.29]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [64.52, 33.6, 37.46, 0.0, 0.0, 50.41, 0.0], "audiomae_on_audioset": [null, [["music", 79.57], ["speech", 3.69], ["boing", 1.73]], [["music", 54.39], ["bird", 4.82], ["bird vocalization, bird call, bird song", 4.52]], null, null, null, null], "duration": [3.92, 10.82, 23.87, 1.14, 0.49, 12.39, 65.29]} \ No newline at end of file diff --git a/annotations_1/0tnKF_qcXTo_filtered.json b/annotations_1/0tnKF_qcXTo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41f3ebe950caf836be0ba4031a36d6ea5553bd04 --- /dev/null +++ b/annotations_1/0tnKF_qcXTo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 88.23], [91.0, 126.84], [130.0, 171.29], [174.0, 187.96], [189.0, 189.46], [191.0, 191.81], [195.0, 201.07]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [30.05, 0.0, 0.0, 28.74, 0.0, 0.0, 30.24], "audiomae_on_audioset": [[["music", 39.56], ["throbbing", 30.89], ["hum", 16.81]], null, null, [["music", 71.58], ["throbbing", 5.63], ["speech", 5.42]], null, null, [["music", 33.03], ["throbbing", 11.89], ["hum", 9.66]]], "duration": [28.23, 35.84, 41.29, 13.96, 0.46, 0.81, 6.07]} \ No newline at end of file diff --git a/annotations_1/0tq44zxA0Ao_filtered.json b/annotations_1/0tq44zxA0Ao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1d7949963934d4dbbe2352191e8e82578f1064d --- /dev/null +++ b/annotations_1/0tq44zxA0Ao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.58], [12.0, 13.05], [17.0, 18.12], [22.0, 22.47], [25.0, 25.76], [28.0, 29.2], [30.0, 31.04], [32.0, 33.17], [34.0, 35.85], [39.0, 42.03], [46.0, 46.43], [54.0, 55.31], [57.0, 57.06], [59.0, 62.41], [64.0, 108.73], [116.0, 117.49], [121.0, 124.06], [124.0, 125.51], [127.0, 129.07], [131.0, 132.73], [137.0, 139.87], [143.0, 146.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0, 0.0, 79.41, 0.0, 0.0, 51.39, 0.0, 40.79, 0.0, 47.46, 37.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.94], ["speech", 17.71], ["hum", 4.19]], null, [["music", 65.83], ["didgeridoo", 15.44], ["hum", 3.28]], [["music", 41.99], ["speech", 20.45], ["slap, smack", 3.84]]], "duration": [1.58, 1.05, 1.12, 0.47, 0.76, 1.2, 1.04, 1.17, 1.85, 3.03, 0.43, 1.31, 0.06, 3.41, 44.73, 1.49, 3.06, 1.51, 2.07, 1.73, 2.87, 3.18]} \ No newline at end of file diff --git a/annotations_1/0tro-o0fOk4_filtered.json b/annotations_1/0tro-o0fOk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac6c9db7d9377fc26ce8d8c2efd1ea3fae1f3323 --- /dev/null +++ b/annotations_1/0tro-o0fOk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 19.97], [22.0, 24.27], [27.0, 27.94], [30.0, 30.32], [33.0, 34.33], [37.0, 37.94], [39.0, 40.07], [41.0, 43.23], [46.0, 47.44], [49.0, 49.65], [51.0, 52.68], [56.0, 57.37], [59.0, 59.81], [60.0, 71.29], [72.0, 77.21], [78.0, 82.65], [85.0, 90.66], [91.0, 92.74], [99.0, 99.62], [101.0, 101.87], [103.0, 106.73], [109.0, 111.99], [113.0, 131.13]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [41.26, 48.23, 0.0, 0.0, 0.0, 0.0, 0.0, 38.03, 0.0, 0.0, 0.0, 0.0, 0.0, 40.93, 39.46, 46.05, 44.6, 0.0, 0.0, 0.0, 36.03, 49.45, 29.95], "audiomae_on_audioset": [[["hum", 19.31], ["walk, footsteps", 16.1], ["music", 13.78]], [["music", 53.13], ["speech", 8.11], ["hum", 7.55]], null, null, null, null, null, [["music", 58.41], ["gong", 10.42], ["synthesizer", 3.19]], null, null, null, null, null, [["music", 69.42], ["speech", 7.34], ["chirp tone", 2.95]], [["music", 46.58], ["speech", 21.5], ["beep, bleep", 4.58]], [["music", 78.64], ["synthesizer", 3.43], ["ambient music", 2.28]], [["music", 72.99], ["speech", 12.18], ["bass guitar", 2.02]], null, null, null, [["music", 68.04], ["guitar", 5.46], ["musical instrument", 4.75]], [["music", 31.07], ["alarm clock", 22.59], ["gong", 10.78]], [["music", 83.66], ["throbbing", 2.47], ["cacophony", 1.59]]], "duration": [10.97, 2.27, 0.94, 0.32, 1.33, 0.94, 1.07, 2.23, 1.44, 0.65, 1.68, 1.37, 0.81, 11.29, 5.21, 4.65, 5.66, 1.74, 0.62, 0.87, 3.73, 2.99, 18.13]} \ No newline at end of file diff --git a/annotations_1/0uyVs4iKp_E_filtered.json b/annotations_1/0uyVs4iKp_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2dab0425dfb968ffe53698346f645361952bbc35 --- /dev/null +++ b/annotations_1/0uyVs4iKp_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 69.74], [71.0, 71.91], [73.0, 77.8], [80.0, 82.05], [83.0, 84.94], [85.0, 86.09], [87.0, 88.91], [90.0, 106.08], [107.0, 201.95], [204.0, 220.68], [221.0, 225.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.85, 98.44, 0.0, 0.0, 0.0, 66.63, 0.0, 78.89, 74.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [63.74, 0.91, 4.8, 2.05, 1.94, 1.09, 1.91, 16.08, 94.95, 16.68, 4.96]} \ No newline at end of file diff --git a/annotations_1/0v74ANWBqv0_filtered.json b/annotations_1/0v74ANWBqv0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d29c31140087a91651e075d8e27bbba94b3a7a2 --- /dev/null +++ b/annotations_1/0v74ANWBqv0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.49], [17.0, 18.67], [21.0, 21.88], [25.0, 49.54], [50.0, 50.14], [50.0, 50.43], [52.0, 52.29], [53.0, 58.55], [59.0, 60.18], [65.0, 65.43], [68.0, 69.06], [72.0, 81.18], [82.0, 89.51], [90.0, 102.47], [104.0, 113.81], [115.0, 116.73], [118.0, 145.52], [149.0, 151.26], [152.0, 157.22], [159.0, 162.57], [164.0, 164.0], [164.0, 195.32], [196.0, 196.4]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, true, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.62, 0.0, 0.0, 0.0, 49.45, 0.0, 0.0, 0.0, 42.26, 45.43, 31.1, 28.53, 0.0, 28.15, 28.44, 28.55, 29.35, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 56.59], ["throbbing", 22.15], ["hum", 10.52]], null, null, null, [["hum", 29.58], ["mains hum", 27.09], ["music", 11.23]], null, null, null, [["music", 29.6], ["hum", 22.46], ["mains hum", 10.37]], [["music", 42.72], ["hum", 15.82], ["mains hum", 11.56]], [["music", 76.18], ["ambient music", 4.78], ["synthesizer", 3.53]], [["music", 75.01], ["rumble", 6.31], ["mains hum", 2.82]], null, [["hum", 45.87], ["music", 13.24], ["throbbing", 6.86]], [["sound effect", 10.6], ["music", 8.93], ["speech", 7.01]], [["music", 25.58], ["mains hum", 21.21], ["hum", 14.7]], [["throbbing", 26.43], ["hum", 24.62], ["music", 13.78]], null, null, null], "duration": [1.49, 1.67, 0.88, 24.54, 0.14, 0.43, 0.29, 5.55, 1.18, 0.43, 1.06, 9.18, 7.51, 12.47, 9.81, 1.73, 27.52, 2.26, 5.22, 3.57, 0.0, 31.32, 0.4]} \ No newline at end of file diff --git a/annotations_1/0vcXvLUt1E4_filtered.json b/annotations_1/0vcXvLUt1E4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc8b2ea9dd4755c3f9e9a98ac5e40eb75f1c84f4 --- /dev/null +++ b/annotations_1/0vcXvLUt1E4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.73], [8.0, 9.64]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.73, 1.64]} \ No newline at end of file diff --git a/annotations_1/0w8oeXvLXOw_filtered.json b/annotations_1/0w8oeXvLXOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91c6b19c9353c13cbcb81d8ea93f3efc0815008b --- /dev/null +++ b/annotations_1/0w8oeXvLXOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 19.31], [23.0, 37.44], [42.0, 42.55], [44.0, 58.06], [60.0, 60.05], [60.0, 60.08], [60.0, 60.12], [60.0, 76.05], [77.0, 77.75], [78.0, 105.26], [107.0, 106.96], [109.0, 138.4], [140.0, 153.05], [155.0, 155.63], [156.0, 156.56]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [29.86, 29.4, 0.0, 28.73, 0.0, 0.0, 0.0, 29.12, 0.0, 28.68, 0.0, 28.58, 29.56, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 52.0], ["music", 29.69], ["hum", 9.24]], [["throbbing", 28.73], ["hum", 17.56], ["music", 17.52]], null, [["hum", 51.28], ["mains hum", 29.45], ["music", 10.42]], null, null, null, [["hum", 57.55], ["throbbing", 22.29], ["mains hum", 17.84]], null, [["music", 38.9], ["throbbing", 17.56], ["hum", 8.82]], null, [["music", 40.68], ["throbbing", 24.72], ["hum", 13.63]], [["throbbing", 48.65], ["hum", 26.97], ["music", 9.69]], null, null], "duration": [9.31, 14.44, 0.55, 14.06, 0.05, 0.08, 0.12, 16.05, 0.75, 27.26, -0.04, 29.4, 13.05, 0.63, 0.56]} \ No newline at end of file diff --git a/annotations_1/0wTKzzRtGqY_filtered.json b/annotations_1/0wTKzzRtGqY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a55e8b10af1d6fe54ab1e04abc0171ab5b335e4 --- /dev/null +++ b/annotations_1/0wTKzzRtGqY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.62], [17.0, 29.46], [36.0, 38.26], [39.0, 40.37], [41.0, 45.0], [47.0, 47.92], [50.0, 50.53], [52.0, 52.25], [55.0, 55.66], [57.0, 57.89], [60.0, 60.29], [61.0, 61.92], [64.0, 63.91], [66.0, 66.83], [78.0, 78.0], [81.0, 80.99], [82.0, 83.93], [87.0, 90.48], [91.0, 91.84], [93.0, 93.34], [95.0, 95.76], [97.0, 98.25], [99.0, 99.98], [101.0, 101.9], [105.0, 110.93], [112.0, 112.87], [116.0, 115.74], [122.0, 122.13], [125.0, 125.68], [126.0, 127.55], [129.0, 130.92], [133.0, 133.44], [135.0, 135.5], [138.0, 137.79], [140.0, 142.5], [144.0, 144.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.56, 86.82, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.67, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.21], ["insect", 13.62], ["fly, housefly", 7.51]], null, null, null, null, null, null, null, null, null, [["sidetone", 40.87], ["speech", 23.08], ["hum", 9.68]], null], "duration": [0.62, 12.46, 2.26, 1.37, 4.0, 0.92, 0.53, 0.25, 0.66, 0.89, 0.29, 0.92, -0.09, 0.83, 0.0, -0.01, 1.93, 3.48, 0.84, 0.34, 0.76, 1.25, 0.98, 0.9, 5.93, 0.87, -0.26, 0.13, 0.68, 1.55, 1.92, 0.44, 0.5, -0.21, 2.5, 0.61]} \ No newline at end of file diff --git a/annotations_1/0xHe1zkABYo_filtered.json b/annotations_1/0xHe1zkABYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e8d33f60be399cf1d5bb769860c483e82c972db --- /dev/null +++ b/annotations_1/0xHe1zkABYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 25.79], [34.0, 34.7], [36.0, 38.16], [39.0, 40.53], [44.0, 60.66], [62.0, 63.09], [64.0, 65.45], [67.0, 67.42], [70.0, 72.33], [74.0, 75.27], [77.0, 77.94], [80.0, 80.18], [83.0, 85.36], [88.0, 92.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.8, 0.0, 99.97, 0.0, 40.4, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 97.73, 81.35], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 36.83], ["hum", 29.55], ["buzz", 7.93]], null, null, null, null, null, null, null, null, null], "duration": [18.79, 0.7, 2.16, 1.53, 16.66, 1.09, 1.45, 0.42, 2.33, 1.27, 0.94, 0.18, 2.36, 4.94]} \ No newline at end of file diff --git a/annotations_1/0xSSnfRYBQY_filtered.json b/annotations_1/0xSSnfRYBQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1611ed721edf2ad5afe21a9e1d5285d7ab62c1c4 --- /dev/null +++ b/annotations_1/0xSSnfRYBQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 29.57], [30.0, 33.52], [34.0, 36.86], [37.0, 38.84], [39.0, 41.32], [42.0, 45.86], [47.0, 50.65], [51.0, 53.59]], "keep_status": [true, false, false, false, true, false, false, false], "silence_prob": [29.73, 30.05, 30.11, 0.0, 30.15, 30.15, 30.19, 30.29], "audiomae_on_audioset": [[["hum", 32.01], ["music", 21.09], ["throbbing", 16.49]], [["throbbing", 43.13], ["music", 29.5], ["hum", 8.59]], [["throbbing", 28.1], ["music", 25.03], ["hum", 18.3]], null, [["music", 40.23], ["throbbing", 15.06], ["speech", 11.03]], [["music", 33.76], ["throbbing", 28.29], ["hum", 16.14]], [["music", 54.02], ["throbbing", 16.54], ["hum", 8.92]], [["music", 56.71], ["electronic music", 9.4], ["throbbing", 8.99]]], "duration": [6.57, 3.52, 2.86, 1.84, 2.32, 3.86, 3.65, 2.59]} \ No newline at end of file diff --git a/annotations_1/0y5KiKKCD7A_filtered.json b/annotations_1/0y5KiKKCD7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56d3fd684c38a8bd97b5b83a240d54ed5009fa07 --- /dev/null +++ b/annotations_1/0y5KiKKCD7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 26.03], [27.0, 27.72], [29.0, 31.18], [35.0, 40.02], [40.0, 41.82], [45.0, 57.32], [59.0, 61.67], [65.0, 68.61], [74.0, 77.23], [78.0, 80.86], [83.0, 192.23]], "keep_status": [false, false, true, true, false, false, true, false, false, false, false], "silence_prob": [28.26, 0.0, 37.25, 29.02, 0.0, 29.2, 41.28, 39.43, 28.98, 28.44, 0.0], "audiomae_on_audioset": [[["throbbing", 33.6], ["hum", 30.16], ["music", 14.97]], null, [["music", 28.3], ["hum", 11.45], ["speech", 10.69]], [["hum", 25.87], ["music", 25.56], ["throbbing", 17.19]], null, [["speech", 56.47], ["music", 22.01], ["electronic music", 4.01]], [["music", 42.44], ["synthesizer", 6.41], ["didgeridoo", 5.59]], [["music", 40.83], ["theremin", 27.66], ["didgeridoo", 5.23]], [["music", 56.52], ["scary music", 10.33], ["throbbing", 5.91]], [["speech", 36.79], ["gong", 28.61], ["music", 5.53]], null], "duration": [8.03, 0.72, 2.18, 5.02, 1.82, 12.32, 2.67, 3.61, 3.23, 2.86, 109.23]} \ No newline at end of file diff --git a/annotations_1/0yAYgv2YQ5k_filtered.json b/annotations_1/0yAYgv2YQ5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..171a1f228d613569e66d58f743f8ba924811988d --- /dev/null +++ b/annotations_1/0yAYgv2YQ5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.24], [23.0, 24.43], [27.0, 29.22], [31.0, 48.98], [52.0, 64.07]], "keep_status": [false, false, true, true, true], "silence_prob": [0.0, 0.0, 29.91, 29.0, 28.63], "audiomae_on_audioset": [null, null, [["groan", 17.06], ["sound effect", 14.33], ["whack, thwack", 12.03]], [["screaming", 27.82], ["music", 22.22], ["speech", 5.78]], [["speech", 36.78], ["whack, thwack", 18.17], ["thunk", 6.8]]], "duration": [0.24, 1.43, 2.22, 17.98, 12.07]} \ No newline at end of file diff --git a/annotations_1/0yDzNGZc9DI_filtered.json b/annotations_1/0yDzNGZc9DI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4810f0d32864746a95e76e4ecb08ef269c258d41 --- /dev/null +++ b/annotations_1/0yDzNGZc9DI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.64], [11.0, 52.69], [57.0, 63.07], [66.0, 107.27], [110.0, 121.1]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 0.0, 36.86, 0.0, 35.38], "audiomae_on_audioset": [null, null, [["speech", 47.72], ["music", 39.94], ["whale vocalization", 2.75]], null, [["whale vocalization", 14.98], ["noise", 11.62], ["livestock, farm animals, working animals", 10.98]]], "duration": [-0.36, 41.69, 6.07, 41.27, 11.1]} \ No newline at end of file diff --git a/annotations_1/0yngsYrBCLg_filtered.json b/annotations_1/0yngsYrBCLg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99140df6fd7aada5cb6d14b3c6599210235ba977 --- /dev/null +++ b/annotations_1/0yngsYrBCLg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.32], [15.0, 15.42], [17.0, 18.52], [52.0, 51.76], [53.0, 53.87], [58.0, 58.01], [61.0, 61.28], [61.0, 61.33]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.32, 0.42, 1.52, -0.24, 0.87, 0.01, 0.28, 0.33]} \ No newline at end of file diff --git a/annotations_1/0z-FtAMg6Vw_filtered.json b/annotations_1/0z-FtAMg6Vw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a314a004e271c3a8c869a55342ea9ec2774d8762 --- /dev/null +++ b/annotations_1/0z-FtAMg6Vw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.43], [6.0, 7.01], [9.0, 9.73], [18.0, 18.64], [19.0, 20.24], [22.0, 23.85], [24.0, 33.17], [38.0, 47.9]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.41, 36.54], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 58.6], ["musical instrument", 10.5], ["echo", 5.22]], [["music", 36.3], ["noise", 21.02], ["effects unit", 13.63]]], "duration": [1.43, 1.01, 0.73, 0.64, 1.24, 1.85, 9.17, 9.9]} \ No newline at end of file diff --git a/annotations_1/0z9b9_n8-Ek_filtered.json b/annotations_1/0z9b9_n8-Ek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..286c7414fbd92970550111f566a0df38a73b1467 --- /dev/null +++ b/annotations_1/0z9b9_n8-Ek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 50.58], [51.0, 59.14], [60.0, 65.79], [66.0, 68.66], [69.0, 74.63], [75.0, 84.21], [85.0, 86.1], [88.0, 89.97], [92.0, 105.24], [107.0, 113.31], [114.0, 121.32], [122.0, 133.44], [136.0, 136.85]], "keep_status": [false, true, true, false, false, true, false, false, true, false, true, true, false], "silence_prob": [45.46, 40.12, 46.12, 56.25, 56.25, 43.53, 0.0, 0.0, 42.53, 52.27, 34.37, 30.0, 0.0], "audiomae_on_audioset": [[["insect", 45.18], ["fly, housefly", 30.16], ["bee, wasp, etc.", 17.48]], [["speech", 28.43], ["hum", 11.0], ["noise", 7.7]], [["sidetone", 19.39], ["noise", 12.21], ["whale vocalization", 9.51]], null, null, [["fly, housefly", 34.05], ["insect", 16.29], ["bee, wasp, etc.", 14.61]], null, null, [["hum", 36.93], ["animal", 25.32], ["mains hum", 5.61]], null, [["hum", 23.38], ["bee, wasp, etc.", 16.86], ["speech", 7.31]], [["speech", 40.55], ["hum", 12.49], ["mains hum", 11.38]], null], "duration": [2.58, 8.14, 5.79, 2.66, 5.63, 9.21, 1.1, 1.97, 13.24, 6.31, 7.32, 11.44, 0.85]} \ No newline at end of file diff --git a/annotations_1/0zHERbRFxTU_filtered.json b/annotations_1/0zHERbRFxTU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a79c027c08e424d8aa1ed67c79cc56c9fb355b3c --- /dev/null +++ b/annotations_1/0zHERbRFxTU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.57], [31.0, 31.94], [35.0, 35.11], [36.0, 41.17], [42.0, 42.79], [45.0, 49.47], [52.0, 54.04], [57.0, 62.97], [63.0, 63.81], [64.0, 64.25], [66.0, 71.15], [77.0, 77.41], [85.0, 85.77], [88.0, 88.5], [89.0, 88.75], [94.0, 97.73], [106.0, 106.96], [111.0, 112.83], [115.0, 126.89], [127.0, 129.17], [139.0, 140.98], [144.0, 147.6]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.95, 0.0, 32.18, 35.68, 42.22, 0.0, 0.0, 51.71, 0.0, 0.0, 0.0, 0.0, 34.6, 0.0, 0.0, 36.54, 38.86, 0.0, 31.86], "audiomae_on_audioset": [null, null, null, [["music", 53.84], ["speech", 23.22], ["boing", 5.3]], null, [["cattle, bovinae", 22.1], ["livestock, farm animals, working animals", 18.73], ["moo", 16.35]], [["music", 44.2], ["musical instrument", 10.56], ["guitar", 8.43]], [["speech", 80.27], ["animal", 2.6], ["outside, rural or natural", 1.95]], null, null, null, null, null, null, null, [["music", 49.68], ["speech", 18.33], ["boing", 7.06]], null, null, [["whale vocalization", 77.72], ["music", 11.8], ["animal", 2.35]], [["music", 66.31], ["musical instrument", 4.98], ["guitar", 4.25]], null, [["whale vocalization", 89.01], ["speech", 2.66], ["animal", 1.04]]], "duration": [1.57, 0.94, 0.11, 5.17, 0.79, 4.47, 2.04, 5.97, 0.81, 0.25, 5.15, 0.41, 0.77, 0.5, -0.25, 3.73, 0.96, 1.83, 11.89, 2.17, 1.98, 3.6]} \ No newline at end of file diff --git a/annotations_1/0zImze5PCFg_filtered.json b/annotations_1/0zImze5PCFg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d51c9a9256e21cb019a47cb2bdc872c2acec641 --- /dev/null +++ b/annotations_1/0zImze5PCFg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.06], [12.0, 12.45], [20.0, 20.66], [24.0, 26.77], [27.0, 27.46], [29.0, 29.3], [33.0, 33.0], [36.0, 36.73], [38.0, 38.25], [39.0, 39.83], [46.0, 46.63], [49.0, 48.91], [58.0, 58.24], [59.0, 66.39], [70.0, 69.74], [78.0, 78.36], [81.0, 81.26], [82.0, 83.84], [86.0, 88.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 87.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 87.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.06, 0.45, 0.66, 2.77, 0.46, 0.3, 0.0, 0.73, 0.25, 0.83, 0.63, -0.09, 0.24, 7.39, -0.26, 0.36, 0.26, 1.84, 2.2]} \ No newline at end of file diff --git a/annotations_1/0zQAUQGwv4A_filtered.json b/annotations_1/0zQAUQGwv4A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..227910dbb97dc1fa9895db66fd4d37388b7a76af --- /dev/null +++ b/annotations_1/0zQAUQGwv4A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.16], [5.0, 6.02], [6.0, 6.69], [12.0, 13.86], [15.0, 16.83], [18.0, 21.88], [23.0, 23.77], [25.0, 26.4], [27.0, 30.91], [32.0, 32.93], [41.0, 42.63], [43.0, 44.73], [46.0, 46.5], [47.0, 48.86], [50.0, 50.08], [51.0, 51.12], [57.0, 57.67], [58.0, 58.95], [60.0, 60.74], [61.0, 61.75], [62.0, 64.61], [70.0, 70.02], [70.0, 73.77], [75.0, 75.07], [79.0, 80.84], [82.0, 86.07], [90.0, 92.89], [96.0, 100.16], [102.0, 108.58], [112.0, 113.09], [114.0, 114.51], [119.0, 119.94], [121.0, 121.9], [124.0, 124.61], [127.0, 127.67], [130.0, 129.86], [134.0, 135.78], [136.0, 137.89], [138.0, 140.75], [141.0, 154.26], [155.0, 165.74], [167.0, 168.17], [169.0, 175.02], [176.0, 178.75]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [59.51, 0.0, 0.0, 0.0, 0.0, 45.59, 0.0, 0.0, 29.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.38, 0.0, 55.31, 0.0, 0.0, 37.96, 36.47, 32.42, 32.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.08, 42.91, 32.03, 0.0, 47.31, 34.28], "audiomae_on_audioset": [null, null, null, null, null, [["music", 49.26], ["theremin", 22.9], ["wind instrument, woodwind instrument", 3.48]], null, null, [["music", 18.93], ["foghorn", 11.94], ["gong", 9.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 45.88], ["mains hum", 15.01], ["music", 13.17]], [["music", 47.61], ["synthesizer", 8.35], ["hum", 4.93]], [["music", 57.66], ["cowbell", 3.58], ["cacophony", 3.22]], [["music", 83.22], ["synthesizer", 6.52], ["electronic music", 2.43]], null, null, null, null, null, null, null, null, null, null, [["music", 46.34], ["theremin", 29.66], ["whale vocalization", 2.17]], [["theremin", 71.7], ["music", 23.88], ["musical instrument", 1.72]], null, [["music", 42.52], ["theremin", 11.02], ["flute", 5.06]], [["trombone", 28.63], ["music", 23.37], ["brass instrument", 21.01]]], "duration": [2.16, 1.02, 0.69, 1.86, 1.83, 3.88, 0.77, 1.4, 3.91, 0.93, 1.63, 1.73, 0.5, 1.86, 0.08, 0.12, 0.67, 0.95, 0.74, 0.75, 2.61, 0.02, 3.77, 0.07, 1.84, 4.07, 2.89, 4.16, 6.58, 1.09, 0.51, 0.94, 0.9, 0.61, 0.67, -0.14, 1.78, 1.89, 2.75, 13.26, 10.74, 1.17, 6.02, 2.75]} \ No newline at end of file diff --git a/annotations_1/0zsUFpPjt8g_filtered.json b/annotations_1/0zsUFpPjt8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70698f2df0d1ef0133a30887aaae3d4be1e9258c --- /dev/null +++ b/annotations_1/0zsUFpPjt8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.19], [15.0, 15.92], [19.0, 19.75], [20.0, 21.68], [23.0, 24.07], [25.0, 30.11], [32.0, 33.51], [34.0, 35.45], [36.0, 36.91], [39.0, 40.19], [41.0, 41.5], [42.0, 43.11], [51.0, 51.02], [55.0, 56.17], [58.0, 62.51], [63.0, 64.22], [64.0, 67.9], [84.0, 85.92], [86.0, 87.13], [90.0, 93.82], [96.0, 96.08], [97.0, 97.21], [99.0, 102.29], [117.0, 122.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [40.61, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 50.11, 0.0, 0.0, 65.67, 0.0, 0.0, 45.52, 38.51], "audiomae_on_audioset": [[["music", 35.11], ["throbbing", 20.5], ["speech", 17.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 20.36], ["music", 14.08], ["speech", 9.02]], [["hum", 31.93], ["mains hum", 23.0], ["music", 10.99]]], "duration": [3.19, 0.92, 0.75, 1.68, 1.07, 5.11, 1.51, 1.45, 0.91, 1.19, 0.5, 1.11, 0.02, 1.17, 4.51, 1.22, 3.9, 1.92, 1.13, 3.82, 0.08, 0.21, 3.29, 5.67]} \ No newline at end of file diff --git a/annotations_1/0zuW4KMG7XQ_filtered.json b/annotations_1/0zuW4KMG7XQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f27d3d14eb16485ad3b0b57bd53c072f84635301 --- /dev/null +++ b/annotations_1/0zuW4KMG7XQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.91], [8.0, 10.77], [11.0, 12.5], [13.0, 13.17], [14.0, 15.94], [17.0, 16.9], [25.0, 25.84], [28.0, 28.26], [29.0, 30.86], [40.0, 41.84], [47.0, 48.49], [50.0, 50.33], [51.0, 51.44], [59.0, 59.26], [63.0, 63.69], [67.0, 67.27], [72.0, 72.99], [74.0, 76.37], [78.0, 79.91], [81.0, 82.31], [83.0, 83.79], [95.0, 95.45], [124.0, 125.58], [132.0, 141.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 35.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 0.0, 0.0, 0.0, 0.0, 39.61], "audiomae_on_audioset": [null, [["music", 62.81], ["throbbing", 5.69], ["video game music", 4.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 16.96], ["groan", 14.17], ["wail, moan", 10.68]]], "duration": [-0.09, 2.77, 1.5, 0.17, 1.94, -0.1, 0.84, 0.26, 1.86, 1.84, 1.49, 0.33, 0.44, 0.26, 0.69, 0.27, 0.99, 2.37, 1.91, 1.31, 0.79, 0.45, 1.58, 9.08]} \ No newline at end of file diff --git a/annotations_1/1-9573qxk5g_filtered.json b/annotations_1/1-9573qxk5g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78d236ed6dd1f369fdc971fdd0f0d898e35b2655 --- /dev/null +++ b/annotations_1/1-9573qxk5g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.26], [14.0, 15.42], [17.0, 17.78], [21.0, 22.5], [26.0, 25.83], [28.0, 28.46], [29.0, 29.13], [29.0, 44.25], [45.0, 68.64], [70.0, 72.71], [73.0, 79.91], [85.0, 85.8], [87.0, 94.53], [96.0, 97.68]], "keep_status": [false, false, false, false, false, false, false, false, true, true, true, false, false, false], "silence_prob": [47.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.47, 30.14, 37.65, 31.94, 0.0, 39.72, 0.0], "audiomae_on_audioset": [[["music", 43.3], ["hum", 20.35], ["throbbing", 11.41]], null, null, null, null, null, null, [["speech", 56.17], ["music", 14.41], ["whack, thwack", 7.41]], [["speech", 18.17], ["music", 17.65], ["clang", 13.35]], [["speech", 39.94], ["hum", 11.57], ["mains hum", 6.22]], [["didgeridoo", 11.16], ["mains hum", 10.73], ["fly, housefly", 10.49]], null, [["hum", 36.63], ["throbbing", 29.11], ["music", 9.67]], null], "duration": [8.26, 1.42, 0.78, 1.5, -0.17, 0.46, 0.13, 15.25, 23.64, 2.71, 6.91, 0.8, 7.53, 1.68]} \ No newline at end of file diff --git a/annotations_1/1-WimijgGEU_filtered.json b/annotations_1/1-WimijgGEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d684799157475e9ccfd8424609d941c00f3cc0c --- /dev/null +++ b/annotations_1/1-WimijgGEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.66], [33.0, 33.02], [34.0, 40.2], [40.0, 47.98], [57.0, 58.77], [62.0, 64.54], [67.0, 66.78], [71.0, 71.81], [73.0, 92.33], [93.0, 157.28], [158.0, 160.1], [167.0, 166.92], [174.0, 174.21], [181.0, 181.25], [182.0, 182.66], [184.0, 184.54], [185.0, 198.19], [202.0, 203.52], [205.0, 207.44], [210.0, 234.76]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 43.2, 40.47, 0.0, 33.92, 0.0, 0.0, 32.19, 0.0, 64.29, 0.0, 0.0, 0.0, 0.0, 0.0, 54.83, 0.0, 37.99, 32.33], "audiomae_on_audioset": [null, null, [["music", 77.05], ["theremin", 5.06], ["musical instrument", 2.66]], [["music", 44.14], ["carnatic music", 15.31], ["sitar", 6.05]], null, [["music", 61.44], ["carnatic music", 17.42], ["yodeling", 1.96]], null, null, [["music", 68.27], ["theremin", 19.55], ["carnatic music", 2.07]], null, null, null, null, null, null, null, null, null, [["music", 59.78], ["theremin", 11.71], ["didgeridoo", 5.24]], [["music", 71.52], ["theremin", 12.28], ["didgeridoo", 3.16]]], "duration": [0.66, 0.02, 6.2, 7.98, 1.77, 2.54, -0.22, 0.81, 19.33, 64.28, 2.1, -0.08, 0.21, 0.25, 0.66, 0.54, 13.19, 1.52, 2.44, 24.76]} \ No newline at end of file diff --git a/annotations_1/10khF4-1rbU_filtered.json b/annotations_1/10khF4-1rbU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0312194a2db8b93b8e1783e4e18737cc1718bda --- /dev/null +++ b/annotations_1/10khF4-1rbU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 22.94], [23.0, 34.8], [41.0, 41.17], [46.0, 46.58], [59.0, 59.29], [60.0, 60.57], [61.0, 61.03], [69.0, 72.03], [78.0, 83.76], [91.0, 95.52], [100.0, 100.94], [103.0, 104.25], [108.0, 109.02], [110.0, 116.09], [133.0, 144.02]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, true, false], "silence_prob": [34.64, 36.03, 0.0, 0.0, 0.0, 0.0, 0.0, 39.58, 33.42, 34.01, 0.0, 0.0, 0.0, 36.46, 35.05], "audiomae_on_audioset": [[["music", 62.24], ["speech", 10.65], ["boing", 4.45]], [["music", 74.29], ["singing", 3.17], ["music of latin america", 2.11]], null, null, null, null, null, [["music", 43.22], ["drum machine", 10.24], ["synthesizer", 7.51]], [["hum", 29.22], ["speech", 21.14], ["music", 18.81]], [["music", 55.4], ["swing music", 23.86], ["brass instrument", 2.97]], null, null, null, [["fly, housefly", 33.04], ["insect", 18.19], ["music", 12.47]], [["music", 68.53], ["throbbing", 4.62], ["synthesizer", 3.72]]], "duration": [4.94, 11.8, 0.17, 0.58, 0.29, 0.57, 0.03, 3.03, 5.76, 4.52, 0.94, 1.25, 1.02, 6.09, 11.02]} \ No newline at end of file diff --git a/annotations_1/11-AlLawdeg_filtered.json b/annotations_1/11-AlLawdeg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4203864bbdf21fded27001aea01b48f8103ac7b0 --- /dev/null +++ b/annotations_1/11-AlLawdeg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 23.23], [24.0, 24.02], [25.0, 27.28], [28.0, 28.8], [33.0, 33.99], [41.0, 42.6], [58.0, 58.82], [59.0, 59.64], [71.0, 71.59], [73.0, 75.74], [76.0, 78.14], [79.0, 84.55], [85.0, 89.07], [89.0, 89.23], [91.0, 92.72], [102.0, 104.14], [106.0, 106.47], [111.0, 119.18], [125.0, 126.08], [127.0, 128.76], [130.0, 135.92], [140.0, 143.45]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false, false, true, true], "silence_prob": [48.19, 0.0, 62.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 99.1, 56.63, 31.99, 0.0, 0.0, 42.91, 0.0, 29.35, 0.0, 0.0, 31.07, 29.33], "audiomae_on_audioset": [[["sidetone", 12.08], ["busy signal", 11.3], ["synthesizer", 9.63]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.43], ["groan", 14.11], ["music", 10.83]], null, null, [["music", 22.29], ["hum", 9.71], ["synthesizer", 7.83]], null, [["music", 22.55], ["speech", 16.74], ["hum", 14.26]], null, null, [["music", 33.4], ["sidetone", 14.67], ["hum", 9.24]], [["explosion", 26.04], ["fart", 11.4], ["burst, pop", 8.26]]], "duration": [19.23, 0.02, 2.28, 0.8, 0.99, 1.6, 0.82, 0.64, 0.59, 2.74, 2.14, 5.55, 4.07, 0.23, 1.72, 2.14, 0.47, 8.18, 1.08, 1.76, 5.92, 3.45]} \ No newline at end of file diff --git a/annotations_1/12KcnPMV3OM_filtered.json b/annotations_1/12KcnPMV3OM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ffc701a1c461b6194e1c651026d275e272f5065 --- /dev/null +++ b/annotations_1/12KcnPMV3OM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.39], [11.0, 12.46], [13.0, 15.16], [15.0, 16.6], [20.0, 20.09], [21.0, 21.34], [22.0, 22.69], [35.0, 35.43], [46.0, 47.14], [47.0, 47.8], [49.0, 49.6], [50.0, 51.66], [59.0, 59.34], [71.0, 72.23], [74.0, 76.38], [77.0, 78.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 1.46, 2.16, 1.6, 0.09, 0.34, 0.69, 0.43, 1.14, 0.8, 0.6, 1.66, 0.34, 1.23, 2.38, 1.19]} \ No newline at end of file diff --git a/annotations_1/12iewuXNhbE_filtered.json b/annotations_1/12iewuXNhbE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d93840023178fc46737d85bf8d329089a0bdbb1 --- /dev/null +++ b/annotations_1/12iewuXNhbE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.58], [5.0, 6.49], [8.0, 9.61], [11.0, 11.35], [13.0, 13.24], [21.0, 22.62], [24.0, 24.44], [25.0, 25.95], [28.0, 31.36], [32.0, 39.83], [40.0, 42.23], [47.0, 48.37], [49.0, 52.15], [53.0, 55.48], [56.0, 58.83], [59.0, 59.88], [61.0, 63.42], [65.0, 65.69], [69.0, 69.3], [72.0, 72.54], [75.0, 76.5], [78.0, 80.06], [86.0, 87.52], [88.0, 92.45], [98.0, 98.64], [101.0, 100.7], [103.0, 103.4], [109.0, 111.43], [112.0, 114.29], [116.0, 117.24], [119.0, 119.5], [121.0, 121.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 61.08, 78.89, 0.0, 94.66, 71.72, 71.72, 0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 89.9, 0.0, 99.26, 0.0, 0.0, 0.0, 52.33, 99.96, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.58, 1.49, 1.61, 0.35, 0.24, 1.62, 0.44, 0.95, 3.36, 7.83, 2.23, 1.37, 3.15, 2.48, 2.83, 0.88, 2.42, 0.69, 0.3, 0.54, 1.5, 2.06, 1.52, 4.45, 0.64, -0.3, 0.4, 2.43, 2.29, 1.24, 0.5, 0.76]} \ No newline at end of file diff --git a/annotations_1/13h4zTXEjvw_filtered.json b/annotations_1/13h4zTXEjvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc40b59a3c9b8c3af8ed1de7f982a2a917cbfa1f --- /dev/null +++ b/annotations_1/13h4zTXEjvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 96.77], [98.0, 126.39], [130.0, 134.67]], "keep_status": [false, true, false], "silence_prob": [30.1, 29.58, 40.22], "audiomae_on_audioset": [[["hum", 49.05], ["music", 20.43], ["mains hum", 7.5]], [["hum", 25.03], ["speech", 22.52], ["mains hum", 7.72]], [["whale vocalization", 95.36], ["music", 0.95], ["livestock, farm animals, working animals", 0.54]]], "duration": [29.77, 28.39, 4.67]} \ No newline at end of file diff --git a/annotations_1/14Et05Okf8w_filtered.json b/annotations_1/14Et05Okf8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71e2b80bdfcafcc9998a62d9f5fda144438fc76c --- /dev/null +++ b/annotations_1/14Et05Okf8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.57], [10.0, 10.49], [12.0, 12.23], [14.0, 14.69], [17.0, 17.46], [20.0, 20.55], [21.0, 22.6], [24.0, 24.11], [29.0, 29.71], [31.0, 31.89], [37.0, 38.37], [40.0, 41.32], [44.0, 45.55], [49.0, 49.42], [50.0, 50.97], [52.0, 52.76], [55.0, 57.48], [58.0, 59.43], [61.0, 61.65], [63.0, 63.93], [65.0, 65.48], [66.0, 67.8], [70.0, 71.07], [74.0, 75.54], [77.0, 78.21], [80.0, 81.41], [84.0, 84.06], [87.0, 87.83], [92.0, 92.55], [95.0, 95.88], [98.0, 99.57], [101.0, 102.79], [104.0, 105.38], [107.0, 114.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 0.49, 0.23, 0.69, 0.46, 0.55, 1.6, 0.11, 0.71, 0.89, 1.37, 1.32, 1.55, 0.42, 0.97, 0.76, 2.48, 1.43, 0.65, 0.93, 0.48, 1.8, 1.07, 1.54, 1.21, 1.41, 0.06, 0.83, 0.55, 0.88, 1.57, 1.79, 1.38, 7.71]} \ No newline at end of file diff --git a/annotations_1/14nilke-mtQ_filtered.json b/annotations_1/14nilke-mtQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01441610537622beed057ef4529d2db9a0e15448 --- /dev/null +++ b/annotations_1/14nilke-mtQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.21], [13.0, 27.04], [27.0, 30.48], [32.0, 33.54], [35.0, 35.21], [38.0, 41.81], [42.0, 47.65], [48.0, 49.76], [50.0, 70.75], [72.0, 74.8], [75.0, 78.16], [82.0, 82.8], [85.0, 85.89], [86.0, 87.45], [104.0, 105.12], [108.0, 109.97]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 59.33, 61.37, 0.0, 0.0, 99.95, 34.22, 0.0, 37.61, 100.0, 60.6, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 30.91], ["dog", 10.05], ["mains hum", 7.41]], null, [["hum", 20.6], ["heart sounds, heartbeat", 13.59], ["walk, footsteps", 13.53]], null, null, null, null, null, null, null], "duration": [1.21, 14.04, 3.48, 1.54, 0.21, 3.81, 5.65, 1.76, 20.75, 2.8, 3.16, 0.8, 0.89, 1.45, 1.12, 1.97]} \ No newline at end of file diff --git a/annotations_1/14t7g8Yq8vE_filtered.json b/annotations_1/14t7g8Yq8vE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43f5109c3ef02a759ad426c5bc198bb1e30f3306 --- /dev/null +++ b/annotations_1/14t7g8Yq8vE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.49], [7.0, 8.11], [11.0, 11.21], [14.0, 15.58], [20.0, 20.51], [22.0, 23.52], [26.0, 26.67], [27.0, 32.81], [37.0, 43.09], [47.0, 48.39], [55.0, 59.27], [63.0, 67.24], [70.0, 70.16], [73.0, 74.55], [75.0, 77.95], [79.0, 78.8], [82.0, 83.07], [90.0, 91.72], [109.0, 109.38], [109.0, 109.41], [109.0, 112.02], [117.0, 116.78], [117.0, 116.83], [124.0, 140.22]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.46, 38.83, 0.0, 37.9, 37.16, 0.0, 0.0, 31.12, 0.0, 0.0, 0.0, 0.0, 0.0, 34.02, 0.0, 0.0, 33.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 62.0], ["guitar", 12.34], ["effects unit", 6.66]], [["music", 56.27], ["musical instrument", 6.38], ["guitar", 4.25]], null, [["music", 71.32], ["guitar", 9.07], ["plucked string instrument", 5.31]], [["music", 34.4], ["cattle, bovinae", 15.2], ["livestock, farm animals, working animals", 15.16]], null, null, [["music", 56.41], ["chant", 8.92], ["mantra", 5.51]], null, null, null, null, null, [["music", 65.93], ["didgeridoo", 11.79], ["theremin", 4.1]], null, null, [["music", 81.68], ["musical instrument", 4.45], ["guitar", 1.47]]], "duration": [1.49, 1.11, 0.21, 1.58, 0.51, 1.52, 0.67, 5.81, 6.09, 1.39, 4.27, 4.24, 0.16, 1.55, 2.95, -0.2, 1.07, 1.72, 0.38, 0.41, 3.02, -0.22, -0.17, 16.22]} \ No newline at end of file diff --git a/annotations_1/14zxmnIDoLs_filtered.json b/annotations_1/14zxmnIDoLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/14zxmnIDoLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/15MbDpZad74_filtered.json b/annotations_1/15MbDpZad74_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1fc5d2476601822f38427baa3b7c3ee25d67a5be --- /dev/null +++ b/annotations_1/15MbDpZad74_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 18.2], [20.0, 19.92], [20.0, 69.53], [71.0, 74.29], [76.0, 77.6], [79.0, 80.27], [82.0, 81.94], [85.0, 97.09], [98.0, 107.23], [108.0, 108.45], [108.0, 157.37]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [30.92, 0.0, 0.0, 39.63, 0.0, 0.0, 0.0, 30.09, 30.16, 0.0, 0.0], "audiomae_on_audioset": [[["music", 38.34], ["throbbing", 9.32], ["electronic music", 5.93]], null, null, [["theremin", 23.31], ["music", 19.61], ["hum", 8.41]], null, null, null, [["music", 67.25], ["throbbing", 5.47], ["hum", 4.28]], [["music", 81.86], ["dubstep", 3.85], ["electronic music", 2.76]], null, null], "duration": [4.2, -0.08, 49.53, 3.29, 1.6, 1.27, -0.06, 12.09, 9.23, 0.45, 49.37]} \ No newline at end of file diff --git a/annotations_1/15WevUMiJI8_filtered.json b/annotations_1/15WevUMiJI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e914b5175dd1fab4cece9feaaf5c79f4d34356dd --- /dev/null +++ b/annotations_1/15WevUMiJI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.1], [12.0, 42.89], [47.0, 52.76], [57.0, 121.93], [123.0, 123.72], [124.0, 153.1], [156.0, 163.51], [166.0, 169.65], [171.0, 171.96], [172.0, 176.01]], "keep_status": [false, false, true, false, false, false, false, false, false, true], "silence_prob": [60.7, 0.0, 45.49, 0.0, 0.0, 34.24, 33.12, 31.08, 0.0, 44.52], "audiomae_on_audioset": [null, null, [["music", 43.27], ["synthesizer", 11.39], ["electronic music", 7.68]], null, null, [["music", 54.14], ["theremin", 18.17], ["musical instrument", 4.07]], [["music", 72.1], ["theremin", 9.63], ["ambient music", 5.48]], [["music", 74.89], ["theremin", 4.52], ["animal", 3.9]], null, [["music", 44.23], ["speech", 10.49], ["ambient music", 5.16]]], "duration": [8.1, 30.89, 5.76, 64.93, 0.72, 29.1, 7.51, 3.65, 0.96, 4.01]} \ No newline at end of file diff --git a/annotations_1/15XqLhQ0_Oo_filtered.json b/annotations_1/15XqLhQ0_Oo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed1d12aa6db16c5dda2d24350e8c22c0992ab42a --- /dev/null +++ b/annotations_1/15XqLhQ0_Oo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 25.07], [26.0, 27.51], [30.0, 29.93], [32.0, 41.77], [42.0, 42.63], [44.0, 47.56], [48.0, 48.91], [50.0, 63.07], [65.0, 71.46]], "keep_status": [false, false, false, false, false, true, false, true, false], "silence_prob": [42.81, 0.0, 0.0, 56.63, 0.0, 40.64, 0.0, 43.53, 58.3], "audiomae_on_audioset": [[["music", 71.35], ["ambient music", 4.42], ["hum", 3.62]], null, null, null, null, [["music", 12.68], ["hum", 12.04], ["throbbing", 11.53]], null, [["hum", 37.54], ["mains hum", 21.82], ["music", 7.66]], null], "duration": [21.07, 1.51, -0.07, 9.77, 0.63, 3.56, 0.91, 13.07, 6.46]} \ No newline at end of file diff --git a/annotations_1/16op1FeUX1A_filtered.json b/annotations_1/16op1FeUX1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..caa4abd2506864ba8510f688e50b7154eaff4f7d --- /dev/null +++ b/annotations_1/16op1FeUX1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 14.12], [14.0, 19.68], [20.0, 20.93], [21.0, 23.43], [29.0, 28.75], [29.0, 32.85], [34.0, 40.19], [42.0, 42.84], [44.0, 45.45], [47.0, 47.33], [49.0, 53.7], [54.0, 75.41], [77.0, 78.48], [80.0, 96.28], [97.0, 100.08], [101.0, 103.25], [104.0, 104.7], [106.0, 109.41], [111.0, 112.8], [116.0, 117.71], [121.0, 121.44], [122.0, 128.65], [130.0, 131.99]], "keep_status": [false, true, false, true, false, true, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, true, false], "silence_prob": [89.54, 28.44, 0.0, 31.22, 0.0, 39.12, 54.7, 0.0, 0.0, 0.0, 74.44, 29.03, 0.0, 30.19, 45.59, 36.62, 0.0, 42.84, 0.0, 0.0, 0.0, 43.08, 0.0], "audiomae_on_audioset": [null, [["speech", 52.87], ["fart", 4.36], ["field recording", 3.27]], null, [["speech", 35.48], ["didgeridoo", 11.16], ["noise", 7.04]], null, [["music", 28.86], ["creak", 8.35], ["didgeridoo", 6.88]], null, null, null, null, null, [["music", 68.14], ["animal", 3.06], ["speech", 2.71]], null, [["hum", 46.53], ["music", 24.53], ["throbbing", 12.33]], [["music", 38.51], ["fly, housefly", 3.55], ["throbbing", 2.6]], [["music", 28.51], ["throbbing", 21.77], ["hum", 10.77]], null, [["door", 17.14], ["music", 15.78], ["electric shaver, electric razor", 6.59]], null, null, null, [["fly, housefly", 39.21], ["mosquito", 11.2], ["insect", 7.93]], null], "duration": [13.12, 5.68, 0.93, 2.43, -0.25, 3.85, 6.19, 0.84, 1.45, 0.33, 4.7, 21.41, 1.48, 16.28, 3.08, 2.25, 0.7, 3.41, 1.8, 1.71, 0.44, 6.65, 1.99]} \ No newline at end of file diff --git a/annotations_1/16xSXPPqBfM_filtered.json b/annotations_1/16xSXPPqBfM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a626e96c3d88f2cb4e353828474dda123ef5657 --- /dev/null +++ b/annotations_1/16xSXPPqBfM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 37.25], [38.0, 47.82], [50.0, 50.87], [54.0, 54.33], [61.0, 63.41], [68.0, 68.74], [71.0, 81.75], [82.0, 92.16]], "keep_status": [false, false, false, false, true, false, false, true], "silence_prob": [0.0, 51.28, 0.0, 0.0, 44.52, 0.0, 41.34, 45.05], "audiomae_on_audioset": [null, null, null, null, [["music", 52.88], ["clarinet", 6.77], ["musical instrument", 6.48]], null, [["theremin", 48.65], ["music", 32.46], ["musical instrument", 4.33]], [["music", 28.18], ["theremin", 21.14], ["cello", 13.67]]], "duration": [0.25, 9.82, 0.87, 0.33, 2.41, 0.74, 10.75, 10.16]} \ No newline at end of file diff --git a/annotations_1/18ARBQLResg_filtered.json b/annotations_1/18ARBQLResg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c256d48e9cf5e39e00a431f783555b1846e1666a --- /dev/null +++ b/annotations_1/18ARBQLResg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 14.03], [16.0, 16.6], [18.0, 54.77], [55.0, 56.12], [57.0, 58.19], [59.0, 63.22], [65.0, 68.76], [69.0, 71.31], [72.0, 73.25], [74.0, 74.95], [77.0, 83.96], [88.0, 93.5], [95.0, 107.38]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, true, false], "silence_prob": [57.64, 0.0, 0.0, 0.0, 0.0, 45.82, 55.46, 45.56, 0.0, 0.0, 33.89, 30.91, 38.98], "audiomae_on_audioset": [null, null, null, null, null, [["sidetone", 39.4], ["speech", 24.22], ["music", 9.43]], null, [["speech", 19.68], ["music", 12.9], ["sidetone", 10.46]], null, null, [["effects unit", 22.23], ["music", 11.22], ["distortion", 8.13]], [["music", 38.49], ["musical instrument", 11.36], ["effects unit", 10.53]], [["music", 52.55], ["synthesizer", 13.44], ["musical instrument", 6.56]]], "duration": [14.03, 0.6, 36.77, 1.12, 1.19, 4.22, 3.76, 2.31, 1.25, 0.95, 6.96, 5.5, 12.38]} \ No newline at end of file diff --git a/annotations_1/18Qa__JYKdc_filtered.json b/annotations_1/18Qa__JYKdc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74911dffab373e76532fa962bda29a14b41cc36b --- /dev/null +++ b/annotations_1/18Qa__JYKdc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.59], [29.0, 29.64], [58.0, 57.81], [59.0, 64.56], [65.0, 76.03], [77.0, 77.35], [93.0, 94.44], [105.0, 105.66], [106.0, 106.95], [110.0, 110.2], [112.0, 117.34], [118.0, 118.64], [120.0, 126.15], [138.0, 149.61], [151.0, 154.57], [156.0, 157.08], [158.0, 161.35], [163.0, 167.91], [173.0, 174.12]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 64.07, 40.07, 0.0, 0.0, 0.0, 0.0, 0.0, 30.53, 0.0, 36.38, 49.59, 48.52, 0.0, 59.59, 74.29, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 34.39], ["hum", 22.3], ["mains hum", 11.86]], null, null, null, null, null, [["speech", 24.89], ["fart", 12.62], ["explosion", 9.36]], null, [["fly, housefly", 14.61], ["screaming", 13.28], ["speech", 10.25]], [["music", 67.92], ["musical instrument", 8.49], ["guitar", 5.98]], [["music", 66.29], ["electronic music", 3.62], ["musical instrument", 2.36]], null, null, null, null], "duration": [-0.41, 0.64, -0.19, 5.56, 11.03, 0.35, 1.44, 0.66, 0.95, 0.2, 5.34, 0.64, 6.15, 11.61, 3.57, 1.08, 3.35, 4.91, 1.12]} \ No newline at end of file diff --git a/annotations_1/193KvPnLO4I_filtered.json b/annotations_1/193KvPnLO4I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da3909590b5c9175a963565048ad3ebe42899cc6 --- /dev/null +++ b/annotations_1/193KvPnLO4I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.57], [10.0, 10.3], [17.0, 17.49], [18.0, 19.84], [33.0, 33.66], [34.0, 34.55], [38.0, 38.33], [43.0, 43.65], [46.0, 46.09], [47.0, 47.8], [49.0, 49.87], [73.0, 72.86], [74.0, 75.1], [78.0, 78.63], [80.0, 80.22], [111.0, 114.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 74.0], ["singing", 3.76], ["male singing", 3.14]]], "duration": [0.57, 0.3, 0.49, 1.84, 0.66, 0.55, 0.33, 0.65, 0.09, 0.8, 0.87, -0.14, 1.1, 0.63, 0.22, 3.99]} \ No newline at end of file diff --git a/annotations_1/198uP07pieE_filtered.json b/annotations_1/198uP07pieE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/198uP07pieE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/1AhrD2-cvrw_filtered.json b/annotations_1/1AhrD2-cvrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af03cc97a26d98f5f59e4008e6a3957c4a0fa4fc --- /dev/null +++ b/annotations_1/1AhrD2-cvrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.43], [5.0, 5.44], [9.0, 10.15], [11.0, 13.69], [14.0, 20.61], [22.0, 23.58], [25.0, 25.64], [28.0, 28.66], [32.0, 32.19], [33.0, 35.02], [36.0, 38.89], [43.0, 43.66], [45.0, 46.28], [48.0, 49.18], [50.0, 50.68], [52.0, 53.28], [54.0, 55.16], [57.0, 57.3], [59.0, 61.38], [62.0, 63.09], [66.0, 67.12], [68.0, 68.45], [70.0, 71.25], [77.0, 78.0], [80.0, 81.21], [85.0, 85.78], [87.0, 87.2], [88.0, 87.94], [88.0, 88.5], [89.0, 96.97], [101.0, 103.5], [107.0, 108.53], [110.0, 112.02], [113.0, 115.11], [116.0, 117.27], [121.0, 125.2], [127.0, 129.22], [133.0, 134.94], [136.0, 136.86], [138.0, 138.45], [140.0, 147.85], [150.0, 150.74], [152.0, 156.29], [159.0, 159.85], [164.0, 170.04], [170.0, 170.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 70.16, 59.59, 0.0, 0.0, 0.0, 0.0, 73.36, 61.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.7, 62.07, 0.0, 58.55, 62.17, 0.0, 35.33, 35.41, 0.0, 0.0, 0.0, 30.12, 0.0, 49.36, 0.0, 61.67, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 72.79], ["musical instrument", 2.67], ["plucked string instrument", 2.01]], [["music", 74.7], ["musical instrument", 2.23], ["ambient music", 2.01]], null, null, null, [["music", 40.2], ["noise", 9.28], ["hum", 7.6]], null, [["music", 19.73], ["hum", 10.33], ["speech", 10.23]], null, null, null], "duration": [1.43, 0.44, 1.15, 2.69, 6.61, 1.58, 0.64, 0.66, 0.19, 2.02, 2.89, 0.66, 1.28, 1.18, 0.68, 1.28, 1.16, 0.3, 2.38, 1.09, 1.12, 0.45, 1.25, 1.0, 1.21, 0.78, 0.2, -0.06, 0.5, 7.97, 2.5, 1.53, 2.02, 2.11, 1.27, 4.2, 2.22, 1.94, 0.86, 0.45, 7.85, 0.74, 4.29, 0.85, 6.04, 0.7]} \ No newline at end of file diff --git a/annotations_1/1Aoukxd0GvI_filtered.json b/annotations_1/1Aoukxd0GvI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c6c27a4d4f014db13e4c6a21c8bb4714cd0ea7a --- /dev/null +++ b/annotations_1/1Aoukxd0GvI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.17], [17.0, 18.01], [19.0, 21.15], [23.0, 24.09], [25.0, 26.4], [27.0, 30.7], [32.0, 34.03], [40.0, 42.38], [44.0, 46.47], [48.0, 49.28], [52.0, 52.35], [60.0, 60.91], [63.0, 63.36], [64.0, 64.98], [66.0, 66.95], [69.0, 70.43], [71.0, 71.73], [73.0, 73.48], [74.0, 75.22], [77.0, 77.3], [79.0, 81.87], [85.0, 87.3], [88.0, 90.0], [92.0, 92.18], [98.0, 98.39], [100.0, 101.43], [102.0, 111.6], [112.0, 113.24], [115.0, 115.4], [117.0, 117.78], [120.0, 122.37], [124.0, 124.73], [125.0, 126.96], [129.0, 130.49], [132.0, 135.97], [137.0, 139.43], [140.0, 143.85], [145.0, 147.48], [149.0, 149.59], [150.0, 150.92], [151.0, 154.4], [156.0, 156.9], [158.0, 158.9], [161.0, 161.7], [164.0, 165.4], [166.0, 168.56], [172.0, 172.79], [177.0, 178.38], [181.0, 180.94], [191.0, 193.78], [195.0, 195.88], [196.0, 198.19], [202.0, 202.39], [203.0, 204.28], [210.0, 215.5], [217.0, 218.54], [219.0, 225.53], [227.0, 227.01], [228.0, 228.51], [230.0, 230.37], [231.0, 231.65], [232.0, 233.76], [234.0, 236.38], [239.0, 239.6], [241.0, 241.44], [243.0, 243.06], [245.0, 245.76], [246.0, 246.72], [257.0, 257.66], [258.0, 260.07], [261.0, 262.16], [263.0, 265.33], [268.0, 268.27], [269.0, 271.29], [275.0, 276.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.18, 0.0, 52.92, 0.0, 0.0, 76.04, 85.54, 58.98, 70.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 40.77, 70.3, 0.0, 0.0, 0.0, 39.61, 0.0, 0.0, 0.0, 74.29, 0.0, 0.0, 0.0, 74.44, 37.88, 99.87, 98.8, 0.0, 0.0, 63.53, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 0.0, 0.0, 96.66, 0.0, 60.51, 0.0, 0.0, 39.86, 0.0, 44.49, 0.0, 0.0, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.98, 0.0, 90.95, 0.0, 64.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.37], ["hum", 8.33], ["whale vocalization", 4.95]], null, null, null, null, [["speech", 53.5], ["music", 20.55], ["hum", 6.35]], null, null, null, null, null, null, null, null, [["whale vocalization", 54.4], ["animal", 8.17], ["roaring cats (lions, tigers)", 7.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.25], ["speech", 29.89], ["didgeridoo", 11.03]], null, [["music", 41.23], ["speech", 31.81], ["hum", 5.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.17, 1.01, 2.15, 1.09, 1.4, 3.7, 2.03, 2.38, 2.47, 1.28, 0.35, 0.91, 0.36, 0.98, 0.95, 1.43, 0.73, 0.48, 1.22, 0.3, 2.87, 2.3, 2.0, 0.18, 0.39, 1.43, 9.6, 1.24, 0.4, 0.78, 2.37, 0.73, 1.96, 1.49, 3.97, 2.43, 3.85, 2.48, 0.59, 0.92, 3.4, 0.9, 0.9, 0.7, 1.4, 2.56, 0.79, 1.38, -0.06, 2.78, 0.88, 2.19, 0.39, 1.28, 5.5, 1.54, 6.53, 0.01, 0.51, 0.37, 0.65, 1.76, 2.38, 0.6, 0.44, 0.06, 0.76, 0.72, 0.66, 2.07, 1.16, 2.33, 0.27, 2.29, 1.84]} \ No newline at end of file diff --git a/annotations_1/1BS3mo_yHvY_filtered.json b/annotations_1/1BS3mo_yHvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3fe4be9e2e540e65f0d5fed18cb73f34d3aa2e1 --- /dev/null +++ b/annotations_1/1BS3mo_yHvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.63], [13.0, 17.47], [19.0, 22.1], [23.0, 24.02], [25.0, 26.1], [27.0, 31.26], [38.0, 44.27], [45.0, 54.14], [55.0, 75.64], [77.0, 78.56], [80.0, 84.38], [87.0, 87.79], [90.0, 90.17], [92.0, 99.86], [100.0, 105.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.25, 51.02, 61.47, 0.0, 0.0, 54.63, 59.07, 44.75, 29.56, 0.0, 39.38, 0.0, 0.0, 28.91, 28.41], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 72.04], ["scary music", 5.58], ["hum", 4.85]], [["throbbing", 29.58], ["hum", 29.19], ["music", 18.85]], null, [["music", 72.25], ["throbbing", 5.43], ["electronic music", 2.88]], null, null, [["music", 31.99], ["throbbing", 25.41], ["hum", 13.95]], [["music", 71.93], ["speech", 10.65], ["groan", 3.88]]], "duration": [9.63, 4.47, 3.1, 1.02, 1.1, 4.26, 6.27, 9.14, 20.64, 1.56, 4.38, 0.79, 0.17, 7.86, 5.06]} \ No newline at end of file diff --git a/annotations_1/1C84oQva04A_filtered.json b/annotations_1/1C84oQva04A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb406ceb9862d9db5a26d59111bdc54afb7a57b6 --- /dev/null +++ b/annotations_1/1C84oQva04A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.69], [16.0, 16.73], [19.0, 21.66], [23.0, 24.07], [25.0, 29.47], [31.0, 32.19], [36.0, 36.24], [44.0, 46.72], [48.0, 48.25], [49.0, 49.52], [51.0, 51.34], [53.0, 52.78], [56.0, 56.64], [58.0, 59.36], [65.0, 65.91], [69.0, 94.44], [95.0, 95.71], [96.0, 97.02], [99.0, 99.91], [101.0, 102.49]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 36.7, 0.0, 33.92, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.37, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["whale vocalization", 22.5], ["sidetone", 20.78], ["hum", 19.09]], null, [["speech", 39.38], ["hum", 14.88], ["tuning fork", 10.86]], null, null, null, null, null, null, null, null, null, null, [["music", 32.66], ["throbbing", 19.05], ["speech", 14.28]], null, null, null, null], "duration": [0.69, 0.73, 2.66, 1.07, 4.47, 1.19, 0.24, 2.72, 0.25, 0.52, 0.34, -0.22, 0.64, 1.36, 0.91, 25.44, 0.71, 1.02, 0.91, 1.49]} \ No newline at end of file diff --git a/annotations_1/1CKEXvHN9es_filtered.json b/annotations_1/1CKEXvHN9es_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc037757ae90def586ea6e544db74852508e8c47 --- /dev/null +++ b/annotations_1/1CKEXvHN9es_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.15], [10.0, 10.69], [13.0, 13.19], [15.0, 20.33], [22.0, 27.36], [30.0, 31.63], [33.0, 33.89], [36.0, 36.9], [44.0, 44.64], [67.0, 68.18], [76.0, 76.87], [93.0, 93.48], [102.0, 103.11], [106.0, 106.0], [107.0, 108.01], [109.0, 109.68], [111.0, 113.64], [140.0, 140.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 79.94, 96.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.15, 0.69, 0.19, 5.33, 5.36, 1.63, 0.89, 0.9, 0.64, 1.18, 0.87, 0.48, 1.11, 0.0, 1.01, 0.68, 2.64, 0.63]} \ No newline at end of file diff --git a/annotations_1/1CTjGKT-hDY_filtered.json b/annotations_1/1CTjGKT-hDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b821f1328939e0eb545dc6ce8bba2d013ca30f10 --- /dev/null +++ b/annotations_1/1CTjGKT-hDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.88], [21.0, 24.8], [31.0, 33.69], [34.0, 35.7], [37.0, 37.0], [41.0, 41.12], [44.0, 53.38], [55.0, 55.51], [56.0, 57.54], [59.0, 62.61], [63.0, 66.56], [69.0, 69.53], [70.0, 72.37], [74.0, 77.46], [80.0, 81.78], [83.0, 84.52], [87.0, 87.44], [88.0, 88.96], [90.0, 90.39], [92.0, 116.06]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.34, 34.71, 0.0, 0.0, 0.0, 36.63, 0.0, 0.0, 36.99, 36.61, 0.0, 36.7, 34.67, 0.0, 0.0, 0.0, 0.0, 0.0, 31.4], "audiomae_on_audioset": [null, [["music", 66.68], ["speech", 4.4], ["throbbing", 4.2]], [["music", 39.99], ["throbbing", 19.24], ["hum", 15.93]], null, null, null, [["music", 66.16], ["speech", 20.81], ["effects unit", 4.86]], null, null, [["music", 33.53], ["didgeridoo", 16.95], ["clang", 5.24]], [["music", 69.65], ["speech", 11.09], ["synthesizer", 2.09]], null, [["music", 81.95], ["speech", 5.53], ["didgeridoo", 2.68]], [["music", 88.6], ["single-lens reflex camera", 1.18], ["camera", 1.04]], null, null, null, null, null, [["music", 46.18], ["synthesizer", 14.07], ["speech", 10.34]]], "duration": [-0.12, 3.8, 2.69, 1.7, 0.0, 0.12, 9.38, 0.51, 1.54, 3.61, 3.56, 0.53, 2.37, 3.46, 1.78, 1.52, 0.44, 0.96, 0.39, 24.06]} \ No newline at end of file diff --git a/annotations_1/1CXkATQLZGk_filtered.json b/annotations_1/1CXkATQLZGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8b9890f561374ef924fdaa47a9843e1680aee88 --- /dev/null +++ b/annotations_1/1CXkATQLZGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 49.64], [51.0, 51.0], [51.0, 57.15], [60.0, 63.59], [65.0, 68.66], [69.0, 70.17], [71.0, 71.83], [73.0, 75.93], [79.0, 82.19], [83.0, 109.88], [112.0, 133.73]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [47.5, 0.0, 43.79, 78.89, 92.64, 0.0, 0.0, 44.15, 67.89, 31.8, 32.98], "audiomae_on_audioset": [[["speech", 52.11], ["music", 24.92], ["hum", 2.35]], null, [["speech", 61.55], ["fly, housefly", 9.87], ["insect", 4.31]], null, null, null, null, [["music", 51.2], ["didgeridoo", 6.59], ["foghorn", 5.28]], null, [["music", 47.6], ["throbbing", 15.07], ["hum", 13.29]], [["mains hum", 28.78], ["hum", 28.19], ["music", 26.36]]], "duration": [4.64, 0.0, 6.15, 3.59, 3.66, 1.17, 0.83, 2.93, 3.19, 26.88, 21.73]} \ No newline at end of file diff --git a/annotations_1/1D4VF4WqJSE_filtered.json b/annotations_1/1D4VF4WqJSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a61b137c85de80b9c6caf305546289bf08aceead --- /dev/null +++ b/annotations_1/1D4VF4WqJSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.21], [8.0, 9.66], [11.0, 11.28], [13.0, 13.47], [15.0, 16.5], [18.0, 19.03], [19.0, 20.11], [22.0, 22.77], [24.0, 25.12], [29.0, 30.0], [34.0, 34.59], [42.0, 43.24], [45.0, 46.9], [49.0, 50.09], [51.0, 51.95], [59.0, 59.54], [62.0, 62.88], [64.0, 64.81], [66.0, 67.2], [69.0, 69.21], [70.0, 76.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.01], ["speech", 38.1], ["musical instrument", 2.39]]], "duration": [1.21, 1.66, 0.28, 0.47, 1.5, 1.03, 1.11, 0.77, 1.12, 1.0, 0.59, 1.24, 1.9, 1.09, 0.95, 0.54, 0.88, 0.81, 1.2, 0.21, 6.96]} \ No newline at end of file diff --git a/annotations_1/1D8CfzvSy7g_filtered.json b/annotations_1/1D8CfzvSy7g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8990c60ba1c657ca7bcda25d8649762d74910546 --- /dev/null +++ b/annotations_1/1D8CfzvSy7g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.64], [9.0, 8.65], [13.0, 17.74], [18.0, 19.4], [20.0, 21.15], [22.0, 32.86], [34.0, 35.43], [39.0, 39.5], [43.0, 66.33], [67.0, 74.33], [75.0, 76.13], [77.0, 78.0], [79.0, 79.81], [81.0, 81.45], [81.0, 81.82], [84.0, 85.53], [86.0, 87.45], [88.0, 90.81], [91.0, 92.57], [95.0, 96.47], [97.0, 97.33], [101.0, 101.75], [108.0, 109.53], [111.0, 113.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 82.97, 0.0, 0.0, 56.25, 0.0, 0.0, 30.78, 30.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.15, 0.0, 0.0, 0.0, 0.0, 0.0, 59.24], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 53.57], ["music", 13.22], ["radio", 7.21]], [["speech", 71.4], ["vehicle", 8.07], ["radio", 3.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, -0.35, 4.74, 1.4, 1.15, 10.86, 1.43, 0.5, 23.33, 7.33, 1.13, 1.0, 0.81, 0.45, 0.82, 1.53, 1.45, 2.81, 1.57, 1.47, 0.33, 0.75, 1.53, 2.16]} \ No newline at end of file diff --git a/annotations_1/1DGrM6qhZHY_filtered.json b/annotations_1/1DGrM6qhZHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6804974e69ae4cc78c58c5405adbd7da9ca1297 --- /dev/null +++ b/annotations_1/1DGrM6qhZHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 24.39], [25.0, 41.54], [42.0, 46.57], [51.0, 54.8], [58.0, 63.07], [66.0, 66.01], [72.0, 80.65], [81.0, 86.88], [88.0, 89.07], [91.0, 92.74], [95.0, 97.38]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [93.45, 96.54, 34.1, 78.55, 47.86, 0.0, 70.44, 50.56, 0.0, 0.0, 85.35], "audiomae_on_audioset": [null, null, [["music", 26.47], ["hum", 17.49], ["mains hum", 10.92]], null, [["throbbing", 44.57], ["hum", 23.46], ["music", 14.25]], null, null, null, null, null, null], "duration": [23.39, 16.54, 4.57, 3.8, 5.07, 0.01, 8.65, 5.88, 1.07, 1.74, 2.38]} \ No newline at end of file diff --git a/annotations_1/1DTrvZ3wxy0_filtered.json b/annotations_1/1DTrvZ3wxy0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1059dcaa4d1c67a1c1f599c2fdfbc9c4599151c2 --- /dev/null +++ b/annotations_1/1DTrvZ3wxy0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.69], [17.0, 20.95], [21.0, 23.87], [28.0, 29.44], [33.0, 33.93], [37.0, 43.75], [45.0, 49.18], [50.0, 54.8], [57.0, 76.11], [77.0, 117.49], [118.0, 120.12], [121.0, 127.55], [128.0, 129.17]], "keep_status": [false, false, false, false, false, true, true, false, true, false, false, false, false], "silence_prob": [0.0, 32.72, 41.07, 0.0, 0.0, 33.54, 34.32, 31.45, 31.28, 0.0, 34.36, 31.72, 0.0], "audiomae_on_audioset": [null, [["music", 57.11], ["musical instrument", 11.44], ["guitar", 2.85]], [["music", 54.17], ["musical instrument", 8.5], ["guitar", 7.99]], null, null, [["throbbing", 20.1], ["hum", 19.94], ["music", 16.9]], [["music", 29.74], ["throbbing", 19.21], ["hum", 11.73]], [["music", 59.43], ["throbbing", 7.77], ["hum", 6.82]], [["music", 36.69], ["speech", 17.69], ["hum", 9.51]], null, [["music", 66.4], ["speech", 5.35], ["electronic music", 3.04]], [["throbbing", 48.97], ["hum", 24.7], ["music", 10.94]], null], "duration": [0.69, 3.95, 2.87, 1.44, 0.93, 6.75, 4.18, 4.8, 19.11, 40.49, 2.12, 6.55, 1.17]} \ No newline at end of file diff --git a/annotations_1/1DgOAPBMXws_filtered.json b/annotations_1/1DgOAPBMXws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..684e5cdaf5d4591485fc72f3b42fc517cf9c1060 --- /dev/null +++ b/annotations_1/1DgOAPBMXws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.12], [6.0, 6.88], [9.0, 9.12], [13.0, 13.81], [18.0, 36.42], [37.0, 41.34], [42.0, 44.98], [48.0, 52.86], [57.0, 71.14], [72.0, 72.72], [74.0, 75.15], [78.0, 82.32], [83.0, 85.85], [88.0, 88.48], [93.0, 93.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 90.43, 72.31, 73.21, 77.53, 59.59, 0.0, 0.0, 95.09, 77.87, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 0.88, 0.12, 0.81, 18.42, 4.34, 2.98, 4.86, 14.14, 0.72, 1.15, 4.32, 2.85, 0.48, 0.65]} \ No newline at end of file diff --git a/annotations_1/1DvFzLRPc_w_filtered.json b/annotations_1/1DvFzLRPc_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b32b38ae7b1047363358b441a0393fcde610aa6c --- /dev/null +++ b/annotations_1/1DvFzLRPc_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.53], [7.0, 7.25], [7.0, 8.99], [9.0, 10.83], [14.0, 15.21], [17.0, 18.52], [25.0, 26.05], [28.0, 29.29], [30.0, 33.83], [34.0, 36.34]], "keep_status": [true, false, false, false, false, false, false, false, true, false], "silence_prob": [34.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.98, 55.46], "audiomae_on_audioset": [[["music", 20.08], ["hum", 11.52], ["electronic music", 11.33]], null, null, null, null, null, null, null, [["speech", 30.98], ["sidetone", 17.42], ["whale vocalization", 17.3]], null], "duration": [3.53, 0.25, 1.99, 1.83, 1.21, 1.52, 1.05, 1.29, 3.83, 2.34]} \ No newline at end of file diff --git a/annotations_1/1Dvx_8APGEo_filtered.json b/annotations_1/1Dvx_8APGEo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0319e82b2075089c3375b8439049b7f205bada10 --- /dev/null +++ b/annotations_1/1Dvx_8APGEo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.72], [19.0, 20.48], [21.0, 22.03], [22.0, 23.23], [23.0, 24.07], [25.0, 26.16], [28.0, 28.65], [31.0, 33.74], [34.0, 35.99], [37.0, 37.35], [38.0, 38.57], [40.0, 41.07], [41.0, 42.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 1.48, 1.03, 1.23, 1.07, 1.16, 0.65, 2.74, 1.99, 0.35, 0.57, 1.07, 1.62]} \ No newline at end of file diff --git a/annotations_1/1EcAcWe08NU_filtered.json b/annotations_1/1EcAcWe08NU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5def0daa97d205f47b7cee4f9314b886991c81e1 --- /dev/null +++ b/annotations_1/1EcAcWe08NU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.45], [21.0, 21.59], [22.0, 25.07], [29.0, 39.6], [44.0, 46.28], [54.0, 60.0], [61.0, 61.35], [94.0, 95.52], [145.0, 145.67], [148.0, 151.98], [153.0, 153.47], [154.0, 155.19], [156.0, 156.95], [157.0, 158.85], [162.0, 163.48], [167.0, 168.4], [173.0, 175.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [34.48, 0.0, 28.93, 29.1, 29.48, 29.91, 0.0, 0.0, 0.0, 49.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.64], "audiomae_on_audioset": [[["music", 58.32], ["speech", 9.15], ["electronic music", 5.52]], null, [["music", 63.32], ["speech", 10.41], ["electronic music", 3.77]], [["music", 63.81], ["speech", 5.95], ["electronic music", 5.2]], [["music", 74.93], ["throbbing", 4.63], ["electronic music", 2.37]], [["music", 62.01], ["buzz", 7.41], ["speech", 5.08]], null, null, null, [["speech", 68.89], ["burping, eructation", 5.32], ["throat clearing", 3.02]], null, null, null, null, null, null, [["music", 20.07], ["speech", 13.02], ["throbbing", 11.13]]], "duration": [2.45, 0.59, 3.07, 10.6, 2.28, 6.0, 0.35, 1.52, 0.67, 3.98, 0.47, 1.19, 0.95, 1.85, 1.48, 1.4, 2.54]} \ No newline at end of file diff --git a/annotations_1/1EtA0HrUrYM_filtered.json b/annotations_1/1EtA0HrUrYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e44400119ee7b30b829849f16db2fa875935fe1 --- /dev/null +++ b/annotations_1/1EtA0HrUrYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.26], [25.0, 25.79], [32.0, 35.87], [39.0, 42.09], [49.0, 58.85], [62.0, 62.88], [64.0, 64.83], [65.0, 70.02], [77.0, 77.99], [83.0, 83.56], [89.0, 89.58], [95.0, 95.42], [97.0, 98.47], [102.0, 102.3]], "keep_status": [true, false, true, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [36.07, 0.0, 39.19, 49.22, 30.38, 0.0, 0.0, 31.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.74], ["speech", 8.79], ["musical instrument", 5.19]], null, [["fly, housefly", 49.54], ["speech", 9.37], ["insect", 7.41]], [["music", 39.77], ["speech", 22.46], ["radio", 3.15]], [["speech", 23.24], ["crowd", 14.59], ["music", 12.72]], null, null, [["cattle, bovinae", 32.43], ["moo", 32.06], ["livestock, farm animals, working animals", 15.83]], null, null, null, null, null, null], "duration": [2.26, 0.79, 3.87, 3.09, 9.85, 0.88, 0.83, 5.02, 0.99, 0.56, 0.58, 0.42, 1.47, 0.3]} \ No newline at end of file diff --git a/annotations_1/1Fxq_n8e1qA_filtered.json b/annotations_1/1Fxq_n8e1qA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19b31c8f54b7d58b5b070142d95bf87fec523919 --- /dev/null +++ b/annotations_1/1Fxq_n8e1qA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.19], [3.0, 2.81], [6.0, 6.51], [7.0, 7.79], [13.0, 14.81], [17.0, 30.11], [30.0, 30.16], [35.0, 35.33], [36.0, 36.07], [37.0, 45.15], [49.0, 50.9], [54.0, 58.65], [60.0, 61.55], [76.0, 76.35], [85.0, 89.13], [91.0, 95.82], [97.0, 127.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 99.85, 0.0, 66.27, 0.0, 0.0, 37.51, 54.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 24.57], ["music", 20.44], ["theremin", 13.98]], null, null], "duration": [1.19, -0.19, 0.51, 0.79, 1.81, 13.11, 0.16, 0.33, 0.07, 8.15, 1.9, 4.65, 1.55, 0.35, 4.13, 4.82, 30.14]} \ No newline at end of file diff --git a/annotations_1/1GYZPg_aQdw_filtered.json b/annotations_1/1GYZPg_aQdw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc8dea41e7721b32846c2025127ed18a62da6ccd --- /dev/null +++ b/annotations_1/1GYZPg_aQdw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.47], [4.0, 6.17], [21.0, 21.51], [23.0, 25.0], [25.0, 42.52], [44.0, 46.85], [48.0, 48.12], [51.0, 57.01], [57.0, 58.63], [62.0, 62.72], [66.0, 83.57], [84.0, 84.92], [85.0, 86.36], [88.0, 90.17], [94.0, 101.29], [102.0, 103.23], [105.0, 113.09], [117.0, 117.53], [120.0, 121.64], [127.0, 130.1], [133.0, 134.74], [136.0, 136.19], [138.0, 138.64], [139.0, 139.01], [139.0, 141.81], [151.0, 151.07], [152.0, 153.1], [154.0, 155.75], [156.0, 156.9], [159.0, 159.44], [160.0, 159.93], [160.0, 162.21], [165.0, 165.57], [167.0, 166.92], [169.0, 169.5], [170.0, 173.67], [177.0, 178.7], [179.0, 180.62], [182.0, 182.24], [184.0, 194.44], [195.0, 195.56], [197.0, 197.99], [199.0, 200.26], [203.0, 202.95], [203.0, 203.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 82.25, 0.0, 67.13, 35.64, 87.37, 0.0, 52.45, 0.0, 0.0, 75.39, 0.0, 0.0, 62.37, 34.85, 0.0, 42.72, 0.0, 0.0, 34.61, 0.0, 0.0, 0.0, 0.0, 45.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.39, 0.0, 0.0, 0.0, 48.78, 0.0, 0.0, 0.0, 29.69, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 39.85], ["didgeridoo", 29.28], ["musical instrument", 12.86]], null, null, null, null, null, null, null, null, null, [["throbbing", 39.04], ["hum", 28.71], ["music", 17.43]], null, [["chirp tone", 23.64], ["music", 14.87], ["glass", 8.76]], null, null, [["boing", 26.42], ["cattle, bovinae", 14.29], ["grunt", 7.7]], null, null, null, null, [["speech", 25.34], ["throbbing", 16.55], ["hum", 10.97]], null, null, null, null, null, null, null, null, null, null, [["hum", 44.01], ["throbbing", 13.45], ["music", 12.67]], null, null, null, [["music", 45.56], ["speech", 39.92], ["throbbing", 1.85]], null, null, null, null, null], "duration": [1.47, 2.17, 0.51, 2.0, 17.52, 2.85, 0.12, 6.01, 1.63, 0.72, 17.57, 0.92, 1.36, 2.17, 7.29, 1.23, 8.09, 0.53, 1.64, 3.1, 1.74, 0.19, 0.64, 0.01, 2.81, 0.07, 1.1, 1.75, 0.9, 0.44, -0.07, 2.21, 0.57, -0.08, 0.5, 3.67, 1.7, 1.62, 0.24, 10.44, 0.56, 0.99, 1.26, -0.05, 0.2]} \ No newline at end of file diff --git a/annotations_1/1GbNS7IcCj0_filtered.json b/annotations_1/1GbNS7IcCj0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5d3e8ff623486c6ab7eb2194d2ce5760af0da76 --- /dev/null +++ b/annotations_1/1GbNS7IcCj0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.82], [5.0, 5.75], [15.0, 16.66], [75.0, 75.03], [82.0, 93.29], [98.0, 97.95], [103.0, 103.42], [105.0, 106.61], [117.0, 120.09], [123.0, 123.28], [124.0, 124.58]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.82, 0.0, 0.0, 0.0, 45.02, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["mosquito", 34.68], ["fly, housefly", 16.39], ["speech", 13.33]], null, null, null, [["speech", 17.92], ["moo", 13.48], ["cattle, bovinae", 13.39]], null, null], "duration": [0.82, 0.75, 1.66, 0.03, 11.29, -0.05, 0.42, 1.61, 3.09, 0.28, 0.58]} \ No newline at end of file diff --git a/annotations_1/1GfDQpfUaHQ_filtered.json b/annotations_1/1GfDQpfUaHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c81979434985fb32c698b2cccc0dab76f6236e7d --- /dev/null +++ b/annotations_1/1GfDQpfUaHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 28.41], [29.0, 31.78], [34.0, 35.46], [38.0, 38.47], [41.0, 43.36], [44.0, 44.04], [45.0, 45.23], [46.0, 47.61], [48.0, 49.69], [50.0, 58.94], [59.0, 63.95], [65.0, 67.47], [68.0, 71.63], [73.0, 75.54], [76.0, 76.81], [77.0, 80.25], [81.0, 84.99], [88.0, 88.79], [90.0, 89.83], [91.0, 99.76], [100.0, 100.62], [102.0, 103.3], [105.0, 105.65], [106.0, 111.6], [113.0, 114.91], [116.0, 118.42], [122.0, 125.76], [128.0, 129.57], [131.0, 137.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [71.14, 66.15, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0, 0.0, 73.21, 70.02, 64.63, 79.94, 87.19, 0.0, 64.07, 66.03, 0.0, 0.0, 51.34, 0.0, 0.0, 0.0, 56.33, 0.0, 85.72, 98.59, 0.0, 69.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.41, 2.78, 1.46, 0.47, 2.36, 0.04, 0.23, 1.61, 1.69, 8.94, 4.95, 2.47, 3.63, 2.54, 0.81, 3.25, 3.99, 0.79, -0.17, 8.76, 0.62, 1.3, 0.65, 5.6, 1.91, 2.42, 3.76, 1.57, 6.79]} \ No newline at end of file diff --git a/annotations_1/1GiYwJRA2NA_filtered.json b/annotations_1/1GiYwJRA2NA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efddd12fd0676f09b2a475f40393ff2f710b5df8 --- /dev/null +++ b/annotations_1/1GiYwJRA2NA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.43], [9.0, 9.75], [13.0, 12.85], [13.0, 21.41], [24.0, 25.93], [27.0, 26.77], [28.0, 28.34], [29.0, 33.35], [34.0, 39.43], [40.0, 41.35], [42.0, 42.53], [50.0, 51.43], [53.0, 56.59], [62.0, 63.36], [64.0, 65.33], [68.0, 69.23], [71.0, 71.47], [82.0, 85.78], [88.0, 102.44], [104.0, 104.38], [108.0, 108.72], [111.0, 111.37], [113.0, 113.41], [116.0, 117.61], [119.0, 120.19], [122.0, 123.21], [124.0, 128.28], [129.0, 130.3], [134.0, 138.77], [142.0, 149.61], [160.0, 159.95], [162.0, 162.53], [163.0, 168.51], [169.0, 171.63], [174.0, 177.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.31, 0.0, 0.0, 0.0, 97.92, 57.17, 0.0, 0.0, 0.0, 81.89, 0.0, 0.0, 0.0, 0.0, 62.17, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 99.98, 99.96, 0.0, 0.0, 65.2, 89.19, 64.29], "audiomae_on_audioset": [null, null, null, [["speech", 56.41], ["telephone", 11.53], ["dial tone", 6.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.43, 0.75, -0.15, 8.41, 1.93, -0.23, 0.34, 4.35, 5.43, 1.35, 0.53, 1.43, 3.59, 1.36, 1.33, 1.23, 0.47, 3.78, 14.44, 0.38, 0.72, 0.37, 0.41, 1.61, 1.19, 1.21, 4.28, 1.3, 4.77, 7.61, -0.05, 0.53, 5.51, 2.63, 3.48]} \ No newline at end of file diff --git a/annotations_1/1HfZYZ2sDwE_filtered.json b/annotations_1/1HfZYZ2sDwE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f58b3250b7bcb7ff57d019a9e03341680972dba3 --- /dev/null +++ b/annotations_1/1HfZYZ2sDwE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 39.48], [45.0, 45.4], [48.0, 82.95]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [37.48, 0.4, 34.95]} \ No newline at end of file diff --git a/annotations_1/1I2xNdoQXM4_filtered.json b/annotations_1/1I2xNdoQXM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c18fe424d5df1342249a3f4addfe87decb1387e7 --- /dev/null +++ b/annotations_1/1I2xNdoQXM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [3.0, 5.86], [7.0, 7.72], [9.0, 9.95], [12.0, 13.32], [15.0, 16.19], [18.0, 18.23], [19.0, 19.4], [21.0, 21.69], [26.0, 27.08], [28.0, 28.07], [30.0, 30.43], [31.0, 34.8], [35.0, 37.17], [38.0, 47.51], [49.0, 56.59], [58.0, 58.8], [60.0, 61.86], [66.0, 67.86], [70.0, 70.66], [75.0, 77.68], [79.0, 80.52], [83.0, 86.75], [88.0, 89.94], [93.0, 94.26], [99.0, 99.82], [103.0, 103.3], [104.0, 107.11], [109.0, 109.65], [116.0, 116.01], [117.0, 117.91], [120.0, 121.53], [123.0, 123.33], [124.0, 125.39], [130.0, 131.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 99.4, 68.15, 92.8, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.35, 2.86, 0.72, 0.95, 1.32, 1.19, 0.23, 0.4, 0.69, 1.08, 0.07, 0.43, 3.8, 2.17, 9.51, 7.59, 0.8, 1.86, 1.86, 0.66, 2.68, 1.52, 3.75, 1.94, 1.26, 0.82, 0.3, 3.11, 0.65, 0.01, 0.91, 1.53, 0.33, 1.39, 1.82]} \ No newline at end of file diff --git a/annotations_1/1IaDQdo8x1I_filtered.json b/annotations_1/1IaDQdo8x1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d3bb21eee44d4747f65f3df5174d9e99308adae --- /dev/null +++ b/annotations_1/1IaDQdo8x1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.41], [27.0, 27.13], [28.0, 29.88], [31.0, 35.13], [36.0, 41.01], [70.0, 72.57], [75.0, 75.52], [77.0, 77.75], [80.0, 82.22], [84.0, 85.28], [93.0, 99.47], [119.0, 125.61], [126.0, 130.5], [134.0, 138.65], [141.0, 144.04], [147.0, 151.71], [153.0, 154.74], [174.0, 175.02], [178.0, 178.53], [179.0, 179.15], [185.0, 198.34], [202.0, 201.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 63.1, 37.84, 34.02, 0.0, 0.0, 69.47, 0.0, 32.76, 35.05, 47.74, 47.9, 35.47, 45.85, 0.0, 0.0, 0.0, 0.0, 38.78, 0.0], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 69.83], ["music", 9.98], ["livestock, farm animals, working animals", 5.73]], [["throbbing", 39.73], ["music", 34.76], ["hum", 9.44]], null, null, null, null, [["music", 62.11], ["synthesizer", 5.01], ["hum", 4.91]], [["music", 30.65], ["speech", 17.51], ["thunk", 12.47]], [["music", 55.83], ["synthesizer", 13.96], ["musical instrument", 4.74]], [["music", 64.91], ["theremin", 3.1], ["musical instrument", 2.57]], [["music", 52.02], ["breaking", 8.04], ["thump, thud", 7.17]], [["music", 42.98], ["fart", 10.71], ["fly, housefly", 4.25]], null, null, null, null, [["speech", 78.47], ["music", 6.09], ["fart", 4.24]], null], "duration": [0.41, 0.13, 1.88, 4.13, 5.01, 2.57, 0.52, 0.75, 2.22, 1.28, 6.47, 6.61, 4.5, 4.65, 3.04, 4.71, 1.74, 1.02, 0.53, 0.15, 13.34, -0.17]} \ No newline at end of file diff --git a/annotations_1/1IyD0DjLrrc_filtered.json b/annotations_1/1IyD0DjLrrc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a867d35984aa9dd9bbe2038c9a7e206d9b08733 --- /dev/null +++ b/annotations_1/1IyD0DjLrrc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.9], [8.0, 9.36], [15.0, 19.03], [25.0, 27.73], [30.0, 33.96], [34.0, 37.07], [38.0, 42.28], [44.0, 45.72], [47.0, 48.56], [51.0, 52.66], [54.0, 54.26], [56.0, 58.97], [61.0, 62.33], [64.0, 65.26], [68.0, 68.0], [72.0, 73.87], [75.0, 76.99], [79.0, 79.84], [81.0, 82.78], [84.0, 84.89], [86.0, 86.83], [89.0, 90.0], [94.0, 97.14], [98.0, 106.12], [110.0, 114.96], [120.0, 120.65], [131.0, 131.94], [137.0, 140.8]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.73, 44.29, 47.31, 67.89, 69.61, 0.0, 0.0, 0.0, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.79, 49.04, 47.94, 0.0, 0.0, 64.63], "audiomae_on_audioset": [null, null, null, [["snicker", 29.4], ["chuckle, chortle", 18.04], ["laughter", 9.96]], [["speech", 43.31], ["animal", 13.76], ["livestock, farm animals, working animals", 5.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.73], ["speech", 18.79], ["outside, urban or manmade", 2.18]], [["music", 40.74], ["theremin", 27.28], ["synthesizer", 5.26]], null, null, null], "duration": [1.9, 1.36, 4.03, 2.73, 3.96, 3.07, 4.28, 1.72, 1.56, 1.66, 0.26, 2.97, 1.33, 1.26, 0.0, 1.87, 1.99, 0.84, 1.78, 0.89, 0.83, 1.0, 3.14, 8.12, 4.96, 0.65, 0.94, 3.8]} \ No newline at end of file diff --git a/annotations_1/1J-U8tLUlsg_filtered.json b/annotations_1/1J-U8tLUlsg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18b28fe54fb8d7f190953df5ee89c9bcb01e3aa4 --- /dev/null +++ b/annotations_1/1J-U8tLUlsg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.27], [16.0, 18.52], [20.0, 23.31], [29.0, 30.97], [33.0, 40.22], [41.0, 50.23], [56.0, 61.21], [62.0, 63.81], [64.0, 65.06], [66.0, 66.09], [68.0, 67.68], [68.0, 68.57], [70.0, 71.58], [73.0, 75.2], [77.0, 78.66], [80.0, 82.21], [85.0, 87.05], [88.0, 90.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 85.9, 76.04, 0.0, 58.72, 69.47, 91.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 91.3, 68.15, 57.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.27, 2.52, 3.31, 1.97, 7.22, 9.23, 5.21, 1.81, 1.06, 0.09, -0.32, 0.57, 1.58, 2.2, 1.66, 2.21, 2.05, 2.02]} \ No newline at end of file diff --git a/annotations_1/1J1osn73VYs_filtered.json b/annotations_1/1J1osn73VYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19173fbea437e89f55d1cdd62cb1b3edde4d0ab8 --- /dev/null +++ b/annotations_1/1J1osn73VYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.96], [5.0, 5.41], [7.0, 8.88], [10.0, 11.67], [13.0, 13.83], [15.0, 18.33], [19.0, 20.09], [22.0, 29.25], [31.0, 31.58], [32.0, 33.07], [34.0, 36.39], [37.0, 42.85], [43.0, 57.43], [59.0, 61.69], [63.0, 63.46], [64.0, 78.12], [83.0, 87.94], [90.0, 105.07], [106.0, 106.47], [107.0, 106.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 75.72, 0.0, 68.67, 0.0, 0.0, 59.42, 81.89, 63.85, 73.51, 0.0, 35.09, 31.88, 28.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.75], ["theremin", 9.04], ["hum", 8.27]], [["music", 65.58], ["bass guitar", 7.67], ["guitar", 3.95]], [["music", 78.49], ["didgeridoo", 3.63], ["throbbing", 3.04]], null, null], "duration": [-0.04, 0.41, 1.88, 1.67, 0.83, 3.33, 1.09, 7.25, 0.58, 1.07, 2.39, 5.85, 14.43, 2.69, 0.46, 14.12, 4.94, 15.07, 0.47, -0.38]} \ No newline at end of file diff --git a/annotations_1/1J3WNRR4O60_filtered.json b/annotations_1/1J3WNRR4O60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6edb0f840c3fe8ddc1cfc7e79a22be36b2cfdee --- /dev/null +++ b/annotations_1/1J3WNRR4O60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.84], [12.0, 12.72], [23.0, 26.99], [35.0, 34.89], [37.0, 39.5], [51.0, 51.27], [55.0, 55.07], [57.0, 57.37], [58.0, 60.49], [64.0, 65.5], [67.0, 67.42], [68.0, 69.38], [74.0, 74.61], [77.0, 78.24], [80.0, 82.48], [88.0, 91.0], [91.0, 98.49], [111.0, 116.94], [118.0, 120.14], [125.0, 126.49], [131.0, 134.08], [135.0, 135.85], [138.0, 140.95], [145.0, 145.35], [185.0, 190.92], [193.0, 192.94], [193.0, 194.68], [198.0, 198.0], [204.0, 204.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 35.36, 0.0, 57.56, 0.0, 0.0, 0.0, 54.43, 0.0, 0.0, 0.0, 0.0, 0.0, 50.56, 51.88, 34.13, 31.94, 35.99, 0.0, 35.1, 0.0, 32.86, 0.0, 31.03, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 36.36], ["moo", 30.11], ["livestock, farm animals, working animals", 10.84]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.73], ["moo", 17.78], ["cattle, bovinae", 12.94]], [["music", 28.85], ["battle cry", 23.75], ["crowd", 18.31]], [["speech", 36.13], ["animal", 9.34], ["whale vocalization", 8.12]], null, [["mains hum", 51.51], ["hum", 29.75], ["music", 6.06]], null, [["livestock, farm animals, working animals", 47.4], ["music", 11.69], ["cattle, bovinae", 7.93]], null, [["hum", 18.38], ["music", 17.9], ["throbbing", 12.26]], null, null, null, null], "duration": [1.84, 0.72, 3.99, -0.11, 2.5, 0.27, 0.07, 0.37, 2.49, 1.5, 0.42, 1.38, 0.61, 1.24, 2.48, 3.0, 7.49, 5.94, 2.14, 1.49, 3.08, 0.85, 2.95, 0.35, 5.92, -0.06, 1.68, 0.0, 0.99]} \ No newline at end of file diff --git a/annotations_1/1JHqVsXnQxQ_filtered.json b/annotations_1/1JHqVsXnQxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39c6b54044d4e9acd32a7feef4e582b343e8a05a --- /dev/null +++ b/annotations_1/1JHqVsXnQxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.76], [17.0, 17.79], [20.0, 21.57], [26.0, 26.62], [30.0, 44.98], [50.0, 50.3], [52.0, 56.73], [61.0, 75.54], [78.0, 82.16], [85.0, 94.17], [96.0, 96.57], [99.0, 104.97], [113.0, 113.19], [113.0, 116.07], [118.0, 120.34], [121.0, 120.99], [121.0, 121.07], [122.0, 121.98]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.15, 0.0, 34.06, 42.24, 31.73, 32.59, 0.0, 30.8, 0.0, 32.38, 33.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 80.67], ["hip hop music", 2.2], ["funk", 1.76]], null, [["speech", 58.9], ["music", 18.77], ["percussion", 2.58]], [["music", 34.45], ["speech", 24.26], ["throbbing", 7.61]], [["music", 36.15], ["speech", 16.07], ["throbbing", 7.53]], [["music", 83.19], ["didgeridoo", 5.58], ["throbbing", 2.89]], null, [["music", 83.86], ["synthesizer", 3.94], ["musical instrument", 1.89]], null, [["speech", 32.88], ["boing", 18.87], ["music", 18.04]], [["music", 37.5], ["speech", 14.08], ["throbbing", 9.49]], null, null, null], "duration": [0.76, 0.79, 1.57, 0.62, 14.98, 0.3, 4.73, 14.54, 4.16, 9.17, 0.57, 5.97, 0.19, 3.07, 2.34, -0.01, 0.07, -0.02]} \ No newline at end of file diff --git a/annotations_1/1JJjo2GcRrg_filtered.json b/annotations_1/1JJjo2GcRrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e6210266d2179b73870f3a8014a4ea6a3b555d9 --- /dev/null +++ b/annotations_1/1JJjo2GcRrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.03], [44.0, 50.41], [52.0, 55.31], [59.0, 69.65], [80.0, 80.69], [82.0, 82.11], [83.0, 87.74], [96.0, 99.62], [100.0, 100.45], [109.0, 109.48], [120.0, 136.71]], "keep_status": [false, true, true, true, false, false, false, true, false, false, true], "silence_prob": [32.28, 31.26, 30.48, 37.09, 0.0, 0.0, 31.39, 32.14, 0.0, 0.0, 32.0], "audiomae_on_audioset": [[["music", 67.75], ["musical instrument", 5.18], ["speech", 4.24]], [["music", 42.99], ["speech", 6.68], ["frog", 6.48]], [["whistle", 27.16], ["music", 26.76], ["buzzer", 8.84]], [["speech", 20.28], ["music", 17.17], ["animal", 9.09]], null, null, [["music", 30.55], ["speech", 25.83], ["boing", 15.47]], [["music", 37.3], ["boing", 19.27], ["guitar", 5.23]], null, null, [["music", 57.16], ["musical instrument", 3.98], ["sheep", 2.06]]], "duration": [3.03, 6.41, 3.31, 10.65, 0.69, 0.11, 4.74, 3.62, 0.45, 0.48, 16.71]} \ No newline at end of file diff --git a/annotations_1/1Jk8IZYcxmQ_filtered.json b/annotations_1/1Jk8IZYcxmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c80b1429a8fb670a98d30dbe32bf03837a97393 --- /dev/null +++ b/annotations_1/1Jk8IZYcxmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.0], [10.0, 10.39], [14.0, 14.93], [48.0, 48.37], [51.0, 53.28], [64.0, 64.15], [70.0, 72.0], [96.0, 97.34], [100.0, 99.86], [103.0, 103.6], [108.0, 108.75], [118.0, 117.95], [121.0, 121.76], [131.0, 133.56]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.68, 0.0, 39.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.56], "audiomae_on_audioset": [null, null, null, null, [["cattle, bovinae", 40.63], ["moo", 26.32], ["livestock, farm animals, working animals", 20.95]], null, [["music", 32.49], ["speech", 13.6], ["theremin", 5.14]], null, null, null, null, null, null, [["music", 37.66], ["speech", 27.74], ["bang", 6.12]]], "duration": [0.0, 0.39, 0.93, 0.37, 2.28, 0.15, 2.0, 1.34, -0.14, 0.6, 0.75, -0.05, 0.76, 2.56]} \ No newline at end of file diff --git a/annotations_1/1Kk_oah-wCM_filtered.json b/annotations_1/1Kk_oah-wCM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02f2ef1324a1973c3aa8e12decebd77461d040ea --- /dev/null +++ b/annotations_1/1Kk_oah-wCM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 16.87], [23.0, 24.26], [30.0, 31.13], [45.0, 48.57], [50.0, 54.94], [63.0, 69.28], [72.0, 71.54]], "keep_status": [true, false, false, false, true, false, false], "silence_prob": [35.19, 0.0, 0.0, 28.76, 29.06, 30.43, 0.0], "audiomae_on_audioset": [[["hum", 23.98], ["music", 18.82], ["throbbing", 14.61]], null, null, [["foghorn", 41.78], ["speech", 17.7], ["music", 12.07]], [["speech", 43.42], ["music", 17.95], ["foghorn", 6.18]], [["music", 42.9], ["theremin", 23.14], ["speech", 4.86]], null], "duration": [7.87, 1.26, 1.13, 3.57, 4.94, 6.28, -0.46]} \ No newline at end of file diff --git a/annotations_1/1LoGtPIr2-k_filtered.json b/annotations_1/1LoGtPIr2-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d85fc1821896ba0ff8210d64eade6eb60f52f372 --- /dev/null +++ b/annotations_1/1LoGtPIr2-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.55], [6.0, 8.41], [10.0, 11.85], [14.0, 15.47], [17.0, 21.66], [23.0, 25.02], [26.0, 30.55], [31.0, 34.43], [36.0, 37.99], [39.0, 39.97], [41.0, 42.58], [43.0, 44.88], [46.0, 47.75], [50.0, 52.07], [55.0, 56.78], [59.0, 63.73], [64.0, 65.48], [66.0, 68.07], [69.0, 70.55], [72.0, 76.69], [79.0, 80.4], [82.0, 83.42], [85.0, 86.26], [88.0, 88.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.52, 66.76, 0.0, 0.0, 99.52, 99.44, 55.67, 73.06, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 0.0, 99.82, 0.0, 42.37, 0.0, 96.29, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 95.95], ["speech", 1.21], ["music", 0.89]], null, null, null, null, null, null], "duration": [2.55, 2.41, 1.85, 1.47, 4.66, 2.02, 4.55, 3.43, 1.99, 0.97, 1.58, 1.88, 1.75, 2.07, 1.78, 4.73, 1.48, 2.07, 1.55, 4.69, 1.4, 1.42, 1.26, 0.1]} \ No newline at end of file diff --git a/annotations_1/1Ltz-vQPqgo_filtered.json b/annotations_1/1Ltz-vQPqgo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a76467ed965e2b3d8d232b0b0b3d6ee114ff72a7 --- /dev/null +++ b/annotations_1/1Ltz-vQPqgo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.25], [5.0, 6.15], [7.0, 7.64], [10.0, 33.59], [36.0, 36.17], [36.0, 68.91], [70.0, 80.97], [83.0, 89.06], [90.0, 95.59], [97.0, 102.41], [103.0, 104.21]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [98.36, 0.0, 0.0, 34.39, 0.0, 0.0, 51.44, 73.82, 32.74, 46.61, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 33.8], ["rumble", 14.52], ["hum", 10.37]], null, null, null, null, [["speech", 44.83], ["music", 23.56], ["mains hum", 8.6]], [["beatboxing", 29.59], ["squawk", 12.81], ["speech", 9.01]], null], "duration": [2.25, 1.15, 0.64, 23.59, 0.17, 32.91, 10.97, 6.06, 5.59, 5.41, 1.21]} \ No newline at end of file diff --git a/annotations_1/1M00J5Q1Vv8_filtered.json b/annotations_1/1M00J5Q1Vv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..438ffbcf00227d36f86a301696329daffa910428 --- /dev/null +++ b/annotations_1/1M00J5Q1Vv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.35], [4.0, 5.22], [7.0, 7.3], [8.0, 13.71], [14.0, 16.09], [17.0, 75.96], [78.0, 79.66]], "keep_status": [false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.98, 36.03, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["rumble", 45.47], ["music", 12.24], ["hum", 9.62]], [["speech", 55.11], ["sine wave", 5.99], ["hum", 4.47]], null, null], "duration": [0.35, 1.22, 0.3, 5.71, 2.09, 58.96, 1.66]} \ No newline at end of file diff --git a/annotations_1/1N81Dwye3VM_filtered.json b/annotations_1/1N81Dwye3VM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f9bde7d54503700cf1b0b033ce6dd9dd6fda06 --- /dev/null +++ b/annotations_1/1N81Dwye3VM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.27], [18.0, 17.98], [31.0, 31.77], [34.0, 36.09], [37.0, 41.69], [43.0, 49.01], [51.0, 51.88], [53.0, 56.89], [58.0, 58.38], [61.0, 61.97], [62.0, 68.62], [70.0, 84.74], [87.0, 89.9], [90.0, 90.15], [90.0, 91.02], [91.0, 92.35], [96.0, 101.07], [101.0, 101.87], [111.0, 111.32], [119.0, 125.36], [127.0, 130.37]], "keep_status": [false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 30.47, 29.28, 29.45, 0.0, 29.71, 0.0, 0.0, 30.82, 30.31, 31.25, 0.0, 0.0, 0.0, 30.37, 0.0, 0.0, 29.23, 38.71], "audiomae_on_audioset": [null, null, null, [["music", 27.79], ["cattle, bovinae", 21.71], ["moo", 21.16]], [["music", 44.79], ["vehicle", 7.28], ["motorcycle", 5.51]], [["music", 32.52], ["buzz", 17.68], ["speech", 9.04]], null, [["music", 72.94], ["speech", 4.96], ["electronic music", 2.62]], null, null, [["music", 27.31], ["vehicle", 14.25], ["motorcycle", 10.85]], [["music", 63.21], ["buzz", 5.9], ["cacophony", 4.89]], [["music", 48.34], ["boing", 20.58], ["sidetone", 10.19]], null, null, null, [["music", 40.22], ["cattle, bovinae", 12.36], ["speech", 11.34]], null, null, [["music", 27.03], ["speech", 9.95], ["fly, housefly", 6.83]], [["sneeze", 42.32], ["fart", 3.87], ["throbbing", 2.7]]], "duration": [1.27, -0.02, 0.77, 2.09, 4.69, 6.01, 0.88, 3.89, 0.38, 0.97, 6.62, 14.74, 2.9, 0.15, 1.02, 1.35, 5.07, 0.87, 0.32, 6.36, 3.37]} \ No newline at end of file diff --git a/annotations_1/1OxDZKordaM_filtered.json b/annotations_1/1OxDZKordaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c82139e8e9f0b3df35b427ec30131a0836977812 --- /dev/null +++ b/annotations_1/1OxDZKordaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.13], [11.0, 13.59], [20.0, 20.51], [30.0, 30.52], [39.0, 40.58], [46.0, 46.48], [47.0, 47.55], [49.0, 48.86], [51.0, 55.07], [59.0, 59.63], [72.0, 72.01], [75.0, 75.52], [81.0, 88.77], [92.0, 116.92], [119.0, 119.55], [120.0, 121.44], [123.0, 124.93], [126.0, 128.63], [130.0, 130.72], [131.0, 132.29], [133.0, 134.33], [136.0, 137.62], [141.0, 141.49], [147.0, 146.99], [150.0, 149.96], [153.0, 153.64], [161.0, 163.95], [166.0, 166.19], [175.0, 174.99], [176.0, 176.15], [188.0, 188.76], [189.0, 189.4], [192.0, 191.76], [193.0, 195.22], [196.0, 197.75], [202.0, 204.11], [206.0, 207.3], [218.0, 218.27], [221.0, 221.64], [225.0, 225.34], [232.0, 232.12], [243.0, 244.26], [259.0, 259.43], [264.0, 270.8], [271.0, 272.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.47, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 32.8, 31.4, 0.0, 0.0, 0.0, 40.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 68.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.14], ["speech", 18.62], ["trombone", 6.03]], [["music", 58.59], ["jingle bell", 7.58], ["tambourine", 4.35]], null, null, null, [["goose", 24.68], ["animal", 24.37], ["honk", 15.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.13, 2.59, 0.51, 0.52, 1.58, 0.48, 0.55, -0.14, 4.07, 0.63, 0.01, 0.52, 7.77, 24.92, 0.55, 1.44, 1.93, 2.63, 0.72, 1.29, 1.33, 1.62, 0.49, -0.01, -0.04, 0.64, 2.95, 0.19, -0.01, 0.15, 0.76, 0.4, -0.24, 2.22, 1.75, 2.11, 1.3, 0.27, 0.64, 0.34, 0.12, 1.26, 0.43, 6.8, 1.84]} \ No newline at end of file diff --git a/annotations_1/1PRZi8t38OQ_filtered.json b/annotations_1/1PRZi8t38OQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a6218189dff3b8602f904e7b6433f3dd003c97d --- /dev/null +++ b/annotations_1/1PRZi8t38OQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.5], [27.0, 32.46], [34.0, 42.45], [45.0, 45.25], [46.0, 49.22], [50.0, 54.5], [57.0, 59.91], [62.0, 62.87], [63.0, 64.35], [65.0, 67.22], [68.0, 81.6], [83.0, 96.31]], "keep_status": [false, true, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 41.56, 55.18, 0.0, 61.18, 64.18, 71.14, 0.0, 0.0, 47.54, 47.16, 67.38], "audiomae_on_audioset": [null, [["music", 43.48], ["synthesizer", 11.99], ["theremin", 9.18]], null, null, null, null, null, null, null, [["gong", 42.61], ["sine wave", 12.22], ["speech", 8.0]], [["music", 46.64], ["ambient music", 9.37], ["speech", 9.19]], null], "duration": [1.5, 5.46, 8.45, 0.25, 3.22, 4.5, 2.91, 0.87, 1.35, 2.22, 13.6, 13.31]} \ No newline at end of file diff --git a/annotations_1/1Pk2FQUbnm0_filtered.json b/annotations_1/1Pk2FQUbnm0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57dd242241c71cee308025c029334977b9616bba --- /dev/null +++ b/annotations_1/1Pk2FQUbnm0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.3], [22.0, 22.91], [23.0, 24.78], [27.0, 28.0], [31.0, 31.6], [33.0, 33.99], [34.0, 35.9], [40.0, 40.81], [42.0, 43.6], [46.0, 46.79], [48.0, 53.27], [57.0, 59.73], [60.0, 71.46], [74.0, 87.69], [88.0, 89.45], [91.0, 104.95], [107.0, 121.49], [126.0, 126.1], [127.0, 127.01], [127.0, 129.56], [132.0, 132.66], [136.0, 136.53], [137.0, 137.83], [139.0, 146.08], [150.0, 152.34], [156.0, 160.79], [163.0, 176.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [31.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.16, 42.44, 36.36, 31.28, 0.0, 55.89, 45.02, 0.0, 0.0, 63.96, 0.0, 0.0, 0.0, 42.88, 59.07, 38.0, 31.13], "audiomae_on_audioset": [[["music", 71.54], ["theremin", 4.06], ["civil defense siren", 3.37]], null, null, null, null, null, null, null, null, null, [["music", 52.96], ["speech", 8.32], ["synthesizer", 7.31]], [["music", 60.31], ["theremin", 6.32], ["musical instrument", 3.78]], [["music", 76.57], ["theremin", 5.64], ["synthesizer", 3.72]], [["throbbing", 37.62], ["hum", 36.68], ["mains hum", 11.18]], null, null, [["music", 65.24], ["synthesizer", 7.95], ["ambient music", 5.28]], null, null, null, null, null, null, [["music", 57.86], ["hum", 14.4], ["mains hum", 9.39]], null, [["music", 57.28], ["synthesizer", 5.1], ["sampler", 3.7]], [["music", 53.27], ["musical instrument", 5.7], ["sitar", 4.69]]], "duration": [3.3, 0.91, 1.78, 1.0, 0.6, 0.99, 1.9, 0.81, 1.6, 0.79, 5.27, 2.73, 11.46, 13.69, 1.45, 13.95, 14.49, 0.1, 0.01, 2.56, 0.66, 0.53, 0.83, 7.08, 2.34, 4.79, 13.4]} \ No newline at end of file diff --git a/annotations_1/1PkqpkQQmwg_filtered.json b/annotations_1/1PkqpkQQmwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0835de91d6b3dde7394841266ddedc303ab781d --- /dev/null +++ b/annotations_1/1PkqpkQQmwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.38], [5.0, 9.95], [12.0, 13.49], [15.0, 15.48], [16.0, 16.31], [19.0, 20.16], [25.0, 26.91], [27.0, 29.67], [32.0, 32.97], [34.0, 37.37], [38.0, 43.26], [46.0, 47.78], [49.0, 50.95], [54.0, 53.82], [56.0, 56.17], [58.0, 60.61], [61.0, 69.01], [69.0, 71.83], [75.0, 75.25], [77.0, 78.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.62, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 86.64, 0.0, 96.66, 40.55, 0.0, 0.0, 0.0, 0.0, 68.54, 87.55, 73.67, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 77.32], ["sidetone", 5.25], ["busy signal", 2.69]], null, null, null, null, null, null, null, null, null, [["speech", 65.74], ["sidetone", 8.93], ["music", 4.31]], null, null, null, null, null, null, null, null, null], "duration": [2.38, 4.95, 1.49, 0.48, 0.31, 1.16, 1.91, 2.67, 0.97, 3.37, 5.26, 1.78, 1.95, -0.18, 0.17, 2.61, 8.01, 2.83, 0.25, 1.54]} \ No newline at end of file diff --git a/annotations_1/1QC88NQZM-8_filtered.json b/annotations_1/1QC88NQZM-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5ecf52639a62989b6ca84096f18f8e79ff95572 --- /dev/null +++ b/annotations_1/1QC88NQZM-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.53], [23.0, 26.64], [34.0, 35.29], [37.0, 37.35], [39.0, 40.12], [42.0, 43.11], [45.0, 56.69], [63.0, 65.25]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [64.63, 79.07, 0.0, 0.0, 0.0, 0.0, 34.96, 32.04], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 20.54], ["whale vocalization", 15.31], ["animal", 9.14]], [["fly, housefly", 28.07], ["fart", 24.36], ["mosquito", 20.0]]], "duration": [2.53, 3.64, 1.29, 0.35, 1.12, 1.11, 11.69, 2.25]} \ No newline at end of file diff --git a/annotations_1/1Qd2hicvxBc_filtered.json b/annotations_1/1Qd2hicvxBc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a70c7f62223a4d15585551924865d4331ea44c9 --- /dev/null +++ b/annotations_1/1Qd2hicvxBc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.54], [17.0, 17.12], [25.0, 28.39], [30.0, 31.92], [32.0, 33.08], [37.0, 42.3], [45.0, 46.38], [50.0, 50.89], [52.0, 59.41], [65.0, 66.85], [72.0, 72.82], [81.0, 80.99], [81.0, 82.43], [86.0, 86.71], [89.0, 89.85], [92.0, 92.97], [94.0, 95.03], [96.0, 108.33], [112.0, 112.4], [114.0, 114.69], [116.0, 116.4], [120.0, 122.62], [123.0, 130.13]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 39.94, 0.0, 0.0, 60.6, 0.0, 0.0, 67.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.65, 0.0, 0.0, 0.0, 69.07, 31.49], "audiomae_on_audioset": [null, null, [["speech", 47.91], ["music", 5.85], ["livestock, farm animals, working animals", 3.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 22.42], ["music", 19.08], ["moo", 12.6]], null, null, null, null, [["music", 28.16], ["vehicle", 6.07], ["explosion", 4.89]]], "duration": [-0.46, 0.12, 3.39, 1.92, 1.08, 5.3, 1.38, 0.89, 7.41, 1.85, 0.82, -0.01, 1.43, 0.71, 0.85, 0.97, 1.03, 12.33, 0.4, 0.69, 0.4, 2.62, 7.13]} \ No newline at end of file diff --git a/annotations_1/1R4FATHHlTU_filtered.json b/annotations_1/1R4FATHHlTU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7112d7fed0901f24a0fc2698d891677e92d9034f --- /dev/null +++ b/annotations_1/1R4FATHHlTU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 21.96], [23.0, 25.19], [29.0, 30.38], [32.0, 32.97], [38.0, 75.51], [84.0, 84.72], [89.0, 91.22], [93.0, 92.97], [96.0, 96.82], [97.0, 97.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.71, 33.17, 0.0, 0.0, 0.0, 0.0, 31.65, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 75.26], ["guitar", 3.26], ["musical instrument", 2.45]], [["music", 67.54], ["musical instrument", 5.55], ["guitar", 3.72]], null, null, null, null, [["music", 63.01], ["didgeridoo", 6.01], ["hum", 4.33]], null, null, null], "duration": [19.96, 2.19, 1.38, 0.97, 37.51, 0.72, 2.22, -0.03, 0.82, 0.83]} \ No newline at end of file diff --git a/annotations_1/1SPMnqTUu1A_filtered.json b/annotations_1/1SPMnqTUu1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db9e8887b4fb4bf380f830d64a12a7ea448a5c75 --- /dev/null +++ b/annotations_1/1SPMnqTUu1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 18.4], [19.0, 21.24], [22.0, 22.35], [24.0, 24.98], [26.0, 26.62], [28.0, 28.39], [30.0, 32.05], [43.0, 47.63], [50.0, 51.24], [53.0, 54.72], [58.0, 59.22], [60.0, 63.34], [66.0, 74.53], [76.0, 79.22], [81.0, 89.99], [92.0, 101.51], [104.0, 122.18], [123.0, 122.91], [135.0, 138.5], [143.0, 151.44], [152.0, 151.56], [152.0, 162.58], [164.0, 207.37], [209.0, 213.92], [214.0, 215.11], [217.0, 217.75], [220.0, 220.08], [221.0, 222.17]], "keep_status": [true, false, false, false, false, false, true, true, false, false, false, true, true, true, true, true, false, false, true, true, false, true, false, false, false, false, false, false], "silence_prob": [42.22, 81.71, 0.0, 0.0, 0.0, 0.0, 46.19, 40.36, 0.0, 0.0, 0.0, 48.74, 34.26, 33.15, 29.34, 29.94, 31.09, 0.0, 32.9, 28.67, 0.0, 29.92, 0.0, 29.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 21.34], ["speech", 18.92], ["foghorn", 5.51]], null, null, null, null, null, [["music", 28.18], ["speech", 18.24], ["didgeridoo", 17.48]], [["hum", 29.88], ["music", 18.27], ["speech", 12.47]], null, null, null, [["music", 51.3], ["didgeridoo", 5.06], ["ambient music", 4.95]], [["music", 21.02], ["duck", 13.29], ["ambient music", 11.77]], [["music", 41.18], ["trombone", 7.33], ["theremin", 6.76]], [["music", 55.89], ["theremin", 6.77], ["throbbing", 5.57]], [["music", 49.84], ["musical instrument", 5.96], ["didgeridoo", 5.76]], [["music", 61.55], ["speech", 13.58], ["throbbing", 6.73]], null, [["music", 25.71], ["speech", 24.55], ["trombone", 11.05]], [["music", 27.9], ["animal", 13.17], ["speech", 4.34]], null, [["livestock, farm animals, working animals", 23.66], ["music", 17.61], ["cattle, bovinae", 14.05]], null, [["cattle, bovinae", 56.05], ["moo", 25.61], ["livestock, farm animals, working animals", 16.32]], null, null, null, null], "duration": [9.4, 2.24, 0.35, 0.98, 0.62, 0.39, 2.05, 4.63, 1.24, 1.72, 1.22, 3.34, 8.53, 3.22, 8.99, 9.51, 18.18, -0.09, 3.5, 8.44, -0.44, 10.58, 43.37, 4.92, 1.11, 0.75, 0.08, 1.17]} \ No newline at end of file diff --git a/annotations_1/1SkWbujEeLM_filtered.json b/annotations_1/1SkWbujEeLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27c04a7c0ec632e0f4d33d5263a0d62cf039f975 --- /dev/null +++ b/annotations_1/1SkWbujEeLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.8], [11.0, 12.11], [13.0, 14.57], [23.0, 24.06], [26.0, 29.51], [33.0, 35.65], [37.0, 37.67], [40.0, 43.41], [46.0, 52.49], [56.0, 57.32], [58.0, 58.89], [61.0, 63.07], [65.0, 66.8], [71.0, 72.32], [73.0, 74.09], [75.0, 77.26], [79.0, 86.04], [88.0, 89.43], [92.0, 93.24], [95.0, 96.16], [97.0, 102.9], [107.0, 107.42], [108.0, 109.73], [111.0, 112.24], [114.0, 115.6], [118.0, 119.21], [120.0, 120.65], [123.0, 122.74], [127.0, 128.22], [130.0, 130.42], [131.0, 132.27], [133.0, 133.37], [135.0, 135.82], [137.0, 137.88], [140.0, 141.79], [144.0, 146.2], [147.0, 148.26], [154.0, 158.04], [159.0, 164.49], [167.0, 167.73], [170.0, 175.04], [176.0, 176.3], [178.0, 179.05], [180.0, 183.83], [188.0, 189.24], [201.0, 204.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.62, 99.87, 0.0, 97.33, 91.81, 0.0, 0.0, 79.07, 0.0, 0.0, 0.0, 71.72, 55.96, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.43, 0.0, 39.98, 95.09, 0.0, 99.65, 0.0, 0.0, 57.17, 0.0, 90.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.32], ["dial tone", 8.53], ["whale vocalization", 6.95]], null, null, null, null, null, null, null, null], "duration": [0.8, 1.11, 1.57, 1.06, 3.51, 2.65, 0.67, 3.41, 6.49, 1.32, 0.89, 2.07, 1.8, 1.32, 1.09, 2.26, 7.04, 1.43, 1.24, 1.16, 5.9, 0.42, 1.73, 1.24, 1.6, 1.21, 0.65, -0.26, 1.22, 0.42, 1.27, 0.37, 0.82, 0.88, 1.79, 2.2, 1.26, 4.04, 5.49, 0.73, 5.04, 0.3, 1.05, 3.83, 1.24, 3.67]} \ No newline at end of file diff --git a/annotations_1/1TX6svl0Qjc_filtered.json b/annotations_1/1TX6svl0Qjc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fefd4973bd1ad15c8f57f3f83e7ad5c888655ca4 --- /dev/null +++ b/annotations_1/1TX6svl0Qjc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 79.52], [82.0, 86.71], [88.0, 112.13], [113.0, 112.9], [114.0, 116.04], [117.0, 117.59], [121.0, 121.32], [130.0, 131.5], [133.0, 134.69], [139.0, 139.83], [142.0, 142.43], [145.0, 147.88], [156.0, 157.77], [159.0, 160.15]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 67.76, 36.58, 0.0, 48.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 29.53], ["music", 26.23], ["hum", 25.86]], null, [["music", 26.15], ["hum", 19.3], ["speech", 12.29]], null, null, null, null, null, null, null, null, null], "duration": [75.52, 4.71, 24.13, -0.1, 2.04, 0.59, 0.32, 1.5, 1.69, 0.83, 0.43, 2.88, 1.77, 1.15]} \ No newline at end of file diff --git a/annotations_1/1UXl3LGnRR4_filtered.json b/annotations_1/1UXl3LGnRR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f36eca4a65e76aad12e620f4ccd603d30ab0ed3 --- /dev/null +++ b/annotations_1/1UXl3LGnRR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.5], [21.0, 22.72], [26.0, 38.47], [40.0, 42.16], [43.0, 43.95], [48.0, 48.14], [50.0, 50.94], [55.0, 56.34], [58.0, 58.16], [60.0, 60.25], [61.0, 68.15], [71.0, 70.88], [71.0, 71.91], [73.0, 75.49], [76.0, 76.57], [83.0, 105.71], [109.0, 109.78], [111.0, 111.55], [116.0, 116.06], [119.0, 119.69], [131.0, 142.15], [145.0, 146.52], [150.0, 152.49], [157.0, 157.57], [160.0, 160.49], [173.0, 198.19], [199.0, 199.08], [200.0, 201.45]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.9, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.99, 0.0, 0.0, 37.16, 0.0, 34.78, 0.0, 0.0, 0.0, 0.0, 31.42, 0.0, 31.47, 0.0, 0.0, 30.08, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 76.82], ["didgeridoo", 6.07], ["speech", 3.7]], [["music", 56.62], ["musical instrument", 4.47], ["percussion", 3.63]], null, null, null, null, null, null, [["music", 62.11], ["didgeridoo", 23.63], ["musical instrument", 0.82]], null, null, [["music", 64.73], ["speech", 13.61], ["radio", 1.79]], null, [["explosion", 14.55], ["burst, pop", 11.98], ["animal", 11.93]], null, null, null, null, [["music", 86.7], ["electronic music", 1.28], ["speech", 0.98]], null, [["music", 37.84], ["moo", 5.23], ["cattle, bovinae", 4.89]], null, null, [["music", 51.15], ["speech", 14.08], ["fart", 6.8]], null, null], "duration": [0.5, 1.72, 12.47, 2.16, 0.95, 0.14, 0.94, 1.34, 0.16, 0.25, 7.15, -0.12, 0.91, 2.49, 0.57, 22.71, 0.78, 0.55, 0.06, 0.69, 11.15, 1.52, 2.49, 0.57, 0.49, 25.19, 0.08, 1.45]} \ No newline at end of file diff --git a/annotations_1/1UbxL1MVZ7o_filtered.json b/annotations_1/1UbxL1MVZ7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c62d946803dfedd52742b83134e25dd2dc6214ed --- /dev/null +++ b/annotations_1/1UbxL1MVZ7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.76], [15.0, 18.25], [20.0, 20.8], [22.0, 23.53], [26.0, 26.87], [28.0, 28.65], [30.0, 31.46], [33.0, 33.34], [36.0, 44.37], [45.0, 48.24], [50.0, 52.35], [53.0, 65.53], [67.0, 69.97], [71.0, 72.15], [73.0, 77.82], [79.0, 83.81], [85.0, 96.13], [99.0, 99.4], [102.0, 102.51], [103.0, 102.83], [103.0, 104.48], [105.0, 107.79]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.06, 72.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 79.94, 44.93, 98.93, 97.22, 0.0, 95.64, 55.46, 70.72, 0.0, 0.0, 0.0, 0.0, 91.98], "audiomae_on_audioset": [[["music", 54.73], ["speech", 8.12], ["synthesizer", 6.39]], null, null, null, null, null, null, null, null, null, [["sidetone", 36.34], ["hum", 18.33], ["speech", 9.76]], null, null, null, null, null, null, null, null, null, null, null], "duration": [6.76, 3.25, 0.8, 1.53, 0.87, 0.65, 1.46, 0.34, 8.37, 3.24, 2.35, 12.53, 2.97, 1.15, 4.82, 4.81, 11.13, 0.4, 0.51, -0.17, 1.48, 2.79]} \ No newline at end of file diff --git a/annotations_1/1UtDbLZsJ4Q_filtered.json b/annotations_1/1UtDbLZsJ4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3da9b899185397293602c399103ad77f9860de9 --- /dev/null +++ b/annotations_1/1UtDbLZsJ4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 24.8], [25.0, 72.99], [76.0, 90.75]], "keep_status": [false, false, true], "silence_prob": [38.97, 0.0, 30.14], "audiomae_on_audioset": [[["music", 36.78], ["speech", 27.28], ["breaking", 9.32]], null, [["buzz", 18.73], ["music", 18.38], ["speech", 15.05]]], "duration": [21.8, 47.99, 14.75]} \ No newline at end of file diff --git a/annotations_1/1V4SU2_-Ppg_filtered.json b/annotations_1/1V4SU2_-Ppg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..343df4c1c90f45fbe57822adb902a67cb60faa3e --- /dev/null +++ b/annotations_1/1V4SU2_-Ppg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [5.0, 5.95], [7.0, 7.11], [8.0, 9.34], [11.0, 10.79], [11.0, 14.42], [17.0, 104.79]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 52.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.72, 0.95, 0.11, 1.34, -0.21, 3.42, 87.79]} \ No newline at end of file diff --git a/annotations_1/1VEMit7JERo_filtered.json b/annotations_1/1VEMit7JERo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c26c6b20788ef24150877a9b84232271f087a8f9 --- /dev/null +++ b/annotations_1/1VEMit7JERo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [4.0, 3.99], [5.0, 6.74], [7.0, 8.07], [14.0, 20.21], [26.0, 26.52], [29.0, 29.84], [34.0, 34.38], [37.0, 39.23], [42.0, 42.65], [46.0, 48.57], [49.0, 49.33], [50.0, 50.21], [55.0, 55.19], [56.0, 57.42], [58.0, 58.85], [65.0, 65.52], [68.0, 68.96], [74.0, 74.14], [78.0, 77.84], [91.0, 91.4], [93.0, 93.55], [105.0, 107.13], [108.0, 109.71], [111.0, 111.55], [114.0, 114.27], [116.0, 117.85], [118.0, 119.38], [120.0, 121.31], [129.0, 131.06], [132.0, 137.27], [142.0, 143.85], [147.0, 148.44], [150.0, 150.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.93, 0.0, 0.0, 0.0, 34.72, 0.0, 42.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.74, 70.58, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 86.42], ["shuffling cards", 2.56], ["synthesizer", 1.97]], null, null, null, [["music", 75.99], ["synthesizer", 5.2], ["musical instrument", 4.49]], null, [["music", 54.48], ["synthesizer", 11.8], ["musical instrument", 9.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, -0.01, 1.74, 1.07, 6.21, 0.52, 0.84, 0.38, 2.23, 0.65, 2.57, 0.33, 0.21, 0.19, 1.42, 0.85, 0.52, 0.96, 0.14, -0.16, 0.4, 0.55, 2.13, 1.71, 0.55, 0.27, 1.85, 1.38, 1.31, 2.06, 5.27, 1.85, 1.44, 0.84]} \ No newline at end of file diff --git a/annotations_1/1WwlHv69kik_filtered.json b/annotations_1/1WwlHv69kik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ab00438a4ed2a06eb5a2f00412d4ee079e324a9 --- /dev/null +++ b/annotations_1/1WwlHv69kik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 25.91], [28.0, 28.66], [30.0, 34.55], [35.0, 35.43], [36.0, 38.48], [39.0, 42.62], [43.0, 44.81], [46.0, 46.87], [48.0, 48.49], [51.0, 51.63], [53.0, 53.97], [56.0, 59.32], [60.0, 62.88], [63.0, 63.91], [65.0, 70.61], [71.0, 73.08], [74.0, 76.27], [77.0, 80.1], [81.0, 83.49], [85.0, 87.15], [89.0, 99.25], [101.0, 105.49], [108.0, 109.59], [110.0, 118.67], [121.0, 121.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [82.61, 0.0, 92.48, 0.0, 89.01, 90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 73.51, 0.0, 91.81, 83.16, 89.9, 87.55, 90.25, 94.66, 77.53, 80.46, 0.0, 47.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.03], ["sheep", 7.51], ["hum", 6.23]], null], "duration": [5.91, 0.66, 4.55, 0.43, 2.48, 3.62, 1.81, 0.87, 0.49, 0.63, 0.97, 3.32, 2.88, 0.91, 5.61, 2.08, 2.27, 3.1, 2.49, 2.15, 10.25, 4.49, 1.59, 8.67, 0.42]} \ No newline at end of file diff --git a/annotations_1/1Ylk2e-x--8_filtered.json b/annotations_1/1Ylk2e-x--8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb681e0129eae5f32652849bd32598c2fbddaa25 --- /dev/null +++ b/annotations_1/1Ylk2e-x--8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.92], [3.0, 17.78], [20.0, 23.14], [41.0, 43.78], [44.0, 45.01], [46.0, 47.02], [49.0, 51.6], [53.0, 54.23], [56.0, 57.45], [59.0, 59.41], [62.0, 62.61], [65.0, 65.64], [68.0, 69.48], [70.0, 70.46], [74.0, 74.51], [76.0, 77.85], [78.0, 79.42], [81.0, 84.13], [85.0, 88.43], [89.0, 89.65], [92.0, 91.74], [104.0, 104.58], [105.0, 106.27], [110.0, 111.89], [114.0, 114.57], [116.0, 117.51], [119.0, 120.8], [121.0, 122.88], [124.0, 124.53], [126.0, 127.03], [135.0, 135.53], [137.0, 140.68], [143.0, 144.85], [145.0, 146.84], [149.0, 149.86], [151.0, 158.3], [160.0, 164.54], [167.0, 170.87], [172.0, 177.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, true, true], "silence_prob": [0.0, 38.11, 65.55, 91.98, 0.0, 0.0, 52.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.45, 39.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.08, 0.0, 0.0, 0.0, 34.01, 33.22, 33.49, 29.8], "audiomae_on_audioset": [null, [["theremin", 34.97], ["music", 32.99], ["hum", 15.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["rain", 28.72], ["rain on surface", 22.18], ["raindrop", 15.03]], [["speech", 29.56], ["eruption", 15.19], ["rain", 11.5]], null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 8.15], ["hum", 6.48], ["livestock, farm animals, working animals", 5.95]], null, null, null, [["speech", 23.37], ["hum", 14.4], ["rain on surface", 8.17]], [["music", 46.46], ["hum", 4.81], ["rain on surface", 4.32]], [["music", 42.31], ["hum", 12.13], ["throbbing", 7.29]], [["music", 55.36], ["theremin", 8.78], ["cello", 5.09]]], "duration": [1.92, 14.78, 3.14, 2.78, 1.01, 1.02, 2.6, 1.23, 1.45, 0.41, 0.61, 0.64, 1.48, 0.46, 0.51, 1.85, 1.42, 3.13, 3.43, 0.65, -0.26, 0.58, 1.27, 1.89, 0.57, 1.51, 1.8, 1.88, 0.53, 1.03, 0.53, 3.68, 1.85, 1.84, 0.86, 7.3, 4.54, 3.87, 5.62]} \ No newline at end of file diff --git a/annotations_1/1YpDd1nVthI_filtered.json b/annotations_1/1YpDd1nVthI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..089c6481ff751f7f33b9527ef5f160ec6dee1e07 --- /dev/null +++ b/annotations_1/1YpDd1nVthI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.67], [12.0, 13.83], [15.0, 16.87], [18.0, 21.96], [25.0, 28.24], [30.0, 41.99], [43.0, 44.14], [46.0, 46.06], [51.0, 51.22], [53.0, 54.97], [56.0, 56.69], [61.0, 60.96], [78.0, 78.14], [97.0, 97.39], [104.0, 107.55], [116.0, 118.96], [120.0, 121.42], [124.0, 128.17], [134.0, 155.01], [166.0, 167.02], [168.0, 169.8], [170.0, 172.76], [175.0, 177.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 95.23, 93.29, 82.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 46.57, 0.0, 62.07, 55.46, 0.0, 0.0, 39.22, 49.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.63], ["music", 15.81], ["theremin", 5.55]], null, null, null, null, null, [["mains hum", 28.27], ["hum", 23.91], ["speech", 14.39]], [["hum", 40.26], ["throbbing", 27.14], ["mains hum", 9.35]]], "duration": [0.67, 1.83, 1.87, 3.96, 3.24, 11.99, 1.14, 0.06, 0.22, 1.97, 0.69, -0.04, 0.14, 0.39, 3.55, 2.96, 1.42, 4.17, 21.01, 1.02, 1.8, 2.76, 2.52]} \ No newline at end of file diff --git a/annotations_1/1YrP2ICd6ro_filtered.json b/annotations_1/1YrP2ICd6ro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3572ae9f0b0b1f42d8763d3b789b3772eca726b7 --- /dev/null +++ b/annotations_1/1YrP2ICd6ro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [14.0, 15.06], [43.0, 43.78], [45.0, 47.11], [54.0, 54.43], [61.0, 63.07], [75.0, 75.51], [80.0, 106.22], [106.0, 106.25], [106.0, 106.44], [113.0, 113.1], [115.0, 115.01], [121.0, 158.89], [159.0, 166.45]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 34.93, 0.0, 57.25, 0.0, 32.81, 0.0, 0.0, 0.0, 0.0, 0.0, 30.26], "audiomae_on_audioset": [null, null, null, [["speech", 34.28], ["music", 10.73], ["mantra", 8.94]], null, null, null, [["music", 83.02], ["musical instrument", 3.23], ["theremin", 2.81]], null, null, null, null, null, [["speech", 28.49], ["mains hum", 9.14], ["hum", 7.28]]], "duration": [0.45, 1.06, 0.78, 2.11, 0.43, 2.07, 0.51, 26.22, 0.25, 0.44, 0.1, 0.01, 37.89, 7.45]} \ No newline at end of file diff --git a/annotations_1/1ZJEtM585x0_filtered.json b/annotations_1/1ZJEtM585x0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/1ZJEtM585x0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/1ZVcZnWu57k_filtered.json b/annotations_1/1ZVcZnWu57k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..559ebd97ca5f2dcd64578666f2400af56a889b13 --- /dev/null +++ b/annotations_1/1ZVcZnWu57k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 11.8], [12.0, 27.41], [30.0, 33.52], [37.0, 44.54], [45.0, 60.47], [61.0, 63.96], [66.0, 84.32], [85.0, 87.66], [88.0, 89.45], [90.0, 98.05], [98.0, 98.81], [101.0, 109.71], [111.0, 111.55]], "keep_status": [true, true, true, true, false, true, true, true, false, true, false, true, false], "silence_prob": [37.12, 37.25, 37.35, 37.17, 35.67, 36.7, 39.75, 40.29, 0.0, 33.38, 0.0, 32.2, 0.0], "audiomae_on_audioset": [[["hum", 20.96], ["music", 19.96], ["synthesizer", 9.04]], [["speech", 38.87], ["insect", 9.12], ["sidetone", 6.64]], [["effects unit", 18.35], ["music", 17.94], ["distortion", 13.87]], [["sine wave", 39.62], ["hum", 8.35], ["chirp tone", 6.55]], [["throbbing", 52.22], ["hum", 29.2], ["heart sounds, heartbeat", 6.54]], [["sine wave", 31.52], ["chirp tone", 14.55], ["music", 9.7]], [["music", 14.7], ["singing bowl", 12.81], ["hum", 12.79]], [["sine wave", 51.34], ["singing bowl", 9.48], ["chirp tone", 6.13]], null, [["speech", 21.6], ["sine wave", 14.21], ["sidetone", 11.05]], null, [["sidetone", 36.44], ["sine wave", 23.29], ["chirp tone", 10.26]], null], "duration": [10.8, 15.41, 3.52, 7.54, 15.47, 2.96, 18.32, 2.66, 1.45, 8.05, 0.81, 8.71, 0.55]} \ No newline at end of file diff --git a/annotations_1/1Zwl6vfqjNQ_filtered.json b/annotations_1/1Zwl6vfqjNQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17cdfbc188bae3a59336848676b2d69e002e50a2 --- /dev/null +++ b/annotations_1/1Zwl6vfqjNQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.21], [6.0, 10.03], [17.0, 16.7], [19.0, 19.38], [21.0, 21.05], [24.0, 25.52], [31.0, 42.8], [44.0, 45.66], [48.0, 51.19], [54.0, 54.46], [58.0, 59.07], [62.0, 66.06], [67.0, 68.64], [70.0, 71.41], [72.0, 74.44], [75.0, 75.76], [77.0, 104.21], [106.0, 112.83], [113.0, 114.62], [125.0, 125.93], [126.0, 132.33], [137.0, 137.94]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, true, false], "silence_prob": [0.0, 38.84, 0.0, 0.0, 0.0, 0.0, 35.77, 0.0, 40.28, 0.0, 0.0, 40.34, 0.0, 0.0, 37.09, 0.0, 28.55, 28.09, 0.0, 0.0, 28.44, 0.0], "audiomae_on_audioset": [null, [["speech", 18.02], ["hum", 13.84], ["mains hum", 9.09]], null, null, null, null, [["fly, housefly", 49.71], ["insect", 31.2], ["mosquito", 14.34]], null, [["speech", 27.75], ["music", 27.6], ["sonar", 6.76]], null, null, [["music", 49.9], ["synthesizer", 15.23], ["theremin", 6.95]], null, null, [["speech", 53.73], ["music", 4.84], ["rumble", 4.17]], null, [["rumble", 31.04], ["music", 26.75], ["hum", 11.73]], [["music", 69.63], ["electronic music", 3.95], ["throbbing", 3.78]], null, null, [["music", 29.51], ["didgeridoo", 14.44], ["electric shaver, electric razor", 14.06]], null], "duration": [0.21, 4.03, -0.3, 0.38, 0.05, 1.52, 11.8, 1.66, 3.19, 0.46, 1.07, 4.06, 1.64, 1.41, 2.44, 0.76, 27.21, 6.83, 1.62, 0.93, 6.33, 0.94]} \ No newline at end of file diff --git a/annotations_1/1afS6fOeldc_filtered.json b/annotations_1/1afS6fOeldc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e776dafe6760bc467931dbc5b17de69a5d05bb86 --- /dev/null +++ b/annotations_1/1afS6fOeldc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 17.9], [18.0, 19.79], [20.0, 29.02], [30.0, 72.59], [73.0, 79.0], [80.0, 80.99], [81.0, 81.03], [82.0, 99.84], [101.0, 101.63], [106.0, 106.74], [108.0, 138.37], [139.0, 161.59]], "keep_status": [false, false, true, false, true, false, false, true, false, false, false, false], "silence_prob": [30.72, 0.0, 30.38, 0.0, 30.64, 0.0, 0.0, 30.14, 0.0, 0.0, 0.0, 30.97], "audiomae_on_audioset": [[["music", 66.34], ["throbbing", 10.6], ["synthesizer", 4.13]], null, [["music", 33.08], ["hum", 11.69], ["speech", 11.38]], null, [["music", 41.24], ["speech", 14.29], ["hum", 7.1]], null, null, [["music", 62.75], ["electronic music", 3.7], ["sound effect", 3.26]], null, null, null, [["music", 69.91], ["throbbing", 7.83], ["electronic music", 5.15]]], "duration": [14.9, 1.79, 9.02, 42.59, 6.0, 0.99, 0.03, 17.84, 0.63, 0.74, 30.37, 22.59]} \ No newline at end of file diff --git a/annotations_1/1bBOUr7rAHw_filtered.json b/annotations_1/1bBOUr7rAHw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..483d9ef773640d049453ba778cfd18bae136ae82 --- /dev/null +++ b/annotations_1/1bBOUr7rAHw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.57], [4.0, 7.91], [9.0, 11.58], [12.0, 15.57], [16.0, 21.2], [23.0, 25.42], [29.0, 32.27], [36.0, 37.29], [39.0, 39.75], [40.0, 40.66], [43.0, 48.56], [52.0, 53.37], [57.0, 59.04], [60.0, 61.79], [66.0, 67.14], [70.0, 71.85], [74.0, 76.65], [78.0, 79.35], [84.0, 86.81], [91.0, 94.22], [95.0, 96.55], [97.0, 99.42], [105.0, 106.96], [111.0, 112.97], [118.0, 119.92], [125.0, 126.18], [132.0, 134.79], [138.0, 137.86], [138.0, 139.9], [141.0, 142.62], [154.0, 155.04], [155.0, 163.88], [165.0, 168.42], [169.0, 170.36]], "keep_status": [false, false, false, true, true, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 89.01, 73.51, 37.74, 35.28, 37.44, 38.75, 0.0, 0.0, 0.0, 36.28, 0.0, 35.58, 0.0, 0.0, 0.0, 36.44, 0.0, 96.77, 36.58, 0.0, 35.54, 0.0, 0.0, 0.0, 0.0, 36.6, 0.0, 0.0, 0.0, 0.0, 53.34, 95.37, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 36.44], ["speech", 9.35], ["musical instrument", 5.59]], [["music", 49.96], ["didgeridoo", 8.33], ["speech", 3.93]], [["music", 52.75], ["bass guitar", 10.92], ["musical instrument", 5.54]], [["music", 53.71], ["effects unit", 8.82], ["bass guitar", 7.58]], null, null, null, [["music", 40.28], ["bass guitar", 13.64], ["speech", 11.12]], null, [["music", 47.26], ["theremin", 16.89], ["musical instrument", 4.35]], null, null, null, [["music", 66.38], ["speech", 11.08], ["musical instrument", 3.69]], null, null, [["music", 64.91], ["guitar", 7.65], ["bass guitar", 6.95]], null, [["music", 35.01], ["speech", 10.51], ["musical instrument", 9.09]], null, null, null, null, [["music", 71.05], ["guitar", 9.28], ["musical instrument", 5.53]], null, null, null, null, null, null, null], "duration": [1.57, 3.91, 2.58, 3.57, 5.2, 2.42, 3.27, 1.29, 0.75, 0.66, 5.56, 1.37, 2.04, 1.79, 1.14, 1.85, 2.65, 1.35, 2.81, 3.22, 1.55, 2.42, 1.96, 1.97, 1.92, 1.18, 2.79, -0.14, 1.9, 1.62, 1.04, 8.88, 3.42, 1.36]} \ No newline at end of file diff --git a/annotations_1/1c5xWXSWSgo_filtered.json b/annotations_1/1c5xWXSWSgo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df0e61cae72391b37328fb7a5a388a1dce50ab4a --- /dev/null +++ b/annotations_1/1c5xWXSWSgo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.43], [35.0, 42.04], [43.0, 69.16], [70.0, 72.25], [73.0, 122.4], [123.0, 123.9], [126.0, 127.5], [128.0, 130.2], [130.0, 139.21], [141.0, 141.02], [142.0, 143.24], [147.0, 151.85], [152.0, 153.87], [154.0, 170.55], [173.0, 174.56], [177.0, 178.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 81.0, 57.48, 99.99, 0.0, 0.0, 0.0, 78.04, 51.23, 0.0, 0.0, 47.43, 0.0, 51.23, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 19.78], ["fly, housefly", 13.86], ["fart", 9.78]], null, null, null, null], "duration": [0.43, 7.04, 26.16, 2.25, 49.4, 0.9, 1.5, 2.2, 9.21, 0.02, 1.24, 4.85, 1.87, 16.55, 1.56, 1.24]} \ No newline at end of file diff --git a/annotations_1/1cHRBd6l2UM_filtered.json b/annotations_1/1cHRBd6l2UM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e00e8b24ffd3ccd0fc5ef5b64d35f7b7dfc525a1 --- /dev/null +++ b/annotations_1/1cHRBd6l2UM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.93], [6.0, 7.65], [9.0, 9.48], [13.0, 13.8], [15.0, 16.58], [17.0, 19.2], [25.0, 32.58], [34.0, 40.12], [43.0, 55.34], [56.0, 56.3], [62.0, 70.14], [71.0, 72.59], [73.0, 73.55], [77.0, 77.79], [81.0, 81.72], [88.0, 94.63], [99.0, 100.18], [101.0, 102.15], [108.0, 108.46], [109.0, 109.65], [111.0, 116.55], [126.0, 127.4], [130.0, 134.27], [135.0, 135.57], [139.0, 143.28], [145.0, 145.91], [147.0, 146.99], [148.0, 148.14], [153.0, 159.24], [161.0, 162.04], [163.0, 163.66], [165.0, 166.77]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.87, 32.56, 37.67, 36.56, 0.0, 37.24, 0.0, 0.0, 0.0, 0.0, 47.27, 0.0, 0.0, 0.0, 0.0, 31.8, 0.0, 41.98, 0.0, 31.46, 0.0, 0.0, 0.0, 31.78, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 30.42], ["hum", 17.19], ["synthesizer", 8.28]], [["hum", 42.06], ["music", 21.71], ["throbbing", 17.88]], [["music", 27.64], ["throbbing", 26.8], ["hum", 25.92]], [["hum", 44.44], ["music", 14.46], ["throbbing", 13.43]], null, [["music", 61.39], ["throbbing", 14.55], ["hum", 6.22]], null, null, null, null, [["music", 36.42], ["hum", 21.71], ["throbbing", 21.1]], null, null, null, null, [["music", 35.57], ["speech", 28.68], ["throbbing", 5.93]], null, [["music", 47.83], ["throbbing", 24.56], ["didgeridoo", 5.63]], null, [["throbbing", 67.59], ["hum", 16.03], ["music", 6.81]], null, null, null, [["music", 21.42], ["hum", 17.98], ["electronic music", 13.97]], null, null, null], "duration": [0.93, 1.65, 0.48, 0.8, 1.58, 2.2, 7.58, 6.12, 12.34, 0.3, 8.14, 1.59, 0.55, 0.79, 0.72, 6.63, 1.18, 1.15, 0.46, 0.65, 5.55, 1.4, 4.27, 0.57, 4.28, 0.91, -0.01, 0.14, 6.24, 1.04, 0.66, 1.77]} \ No newline at end of file diff --git a/annotations_1/1ccMqOW6LMs_filtered.json b/annotations_1/1ccMqOW6LMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b056dd21fcb7e7e0e16601ddac91c4e700d1c71 --- /dev/null +++ b/annotations_1/1ccMqOW6LMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.25], [24.0, 24.56], [25.0, 26.03], [27.0, 29.13], [32.0, 34.45], [38.0, 38.75], [49.0, 49.69], [51.0, 51.19], [53.0, 53.96], [61.0, 61.18], [68.0, 68.17], [82.0, 82.17], [88.0, 87.71], [88.0, 87.81], [97.0, 98.39], [112.0, 112.51], [114.0, 114.08], [124.0, 124.63], [131.0, 131.46], [132.0, 133.03], [143.0, 142.96], [144.0, 144.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.09, 72.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 43.01], ["sidetone", 24.73], ["busy signal", 5.11]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 0.56, 1.03, 2.13, 2.45, 0.75, 0.69, 0.19, 0.96, 0.18, 0.17, 0.17, -0.29, -0.19, 1.39, 0.51, 0.08, 0.63, 0.46, 1.03, -0.04, 0.53]} \ No newline at end of file diff --git a/annotations_1/1d-Q6pT4pxo_filtered.json b/annotations_1/1d-Q6pT4pxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23407980aaf554c059ff1a1c2ba7a6419424f767 --- /dev/null +++ b/annotations_1/1d-Q6pT4pxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 38.5], [42.0, 45.66], [47.0, 51.06], [52.0, 106.51], [109.0, 109.56], [115.0, 127.58], [128.0, 128.17]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [0.0, 55.04, 64.97, 0.0, 0.0, 43.77, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 37.04], ["hum", 9.63], ["theremin", 7.49]], null], "duration": [1.5, 3.66, 4.06, 54.51, 0.56, 12.58, 0.17]} \ No newline at end of file diff --git a/annotations_1/1dLZuGiJRXA_filtered.json b/annotations_1/1dLZuGiJRXA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8608d25179b75555da5f429b6374aa5c01639f71 --- /dev/null +++ b/annotations_1/1dLZuGiJRXA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.92], [11.0, 11.57], [17.0, 19.14], [23.0, 27.92], [29.0, 35.18], [36.0, 39.68], [48.0, 48.61], [49.0, 49.94], [53.0, 52.89], [61.0, 60.83], [63.0, 63.42], [71.0, 72.05], [76.0, 76.52], [82.0, 82.11], [97.0, 97.92], [110.0, 110.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.62, 0.0, 87.74, 87.0, 74.29, 93.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.92, 0.57, 2.14, 4.92, 6.18, 3.68, 0.61, 0.94, -0.11, -0.17, 0.42, 1.05, 0.52, 0.11, 0.92, 0.96]} \ No newline at end of file diff --git a/annotations_1/1didVrNjTpQ_filtered.json b/annotations_1/1didVrNjTpQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1e9b43023ac77ab303958a53bc18506cfc4ed16 --- /dev/null +++ b/annotations_1/1didVrNjTpQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.37], [20.0, 20.88], [22.0, 22.99], [24.0, 25.02], [26.0, 27.63], [30.0, 32.21], [37.0, 36.66], [37.0, 38.48], [42.0, 41.91], [44.0, 44.37], [46.0, 47.29], [54.0, 54.21], [57.0, 57.38], [58.0, 59.83], [64.0, 64.52], [69.0, 69.55], [70.0, 70.33], [71.0, 71.52], [93.0, 93.95], [96.0, 97.31], [113.0, 113.95], [116.0, 117.32], [117.0, 117.36], [119.0, 120.01]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.62, 0.0, 0.0, 0.0, 0.0, 49.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 37.11], ["rumble", 9.44], ["bee, wasp, etc.", 8.05]], null, null, null, null, [["effects unit", 17.79], ["music", 15.23], ["guitar", 9.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.37, 0.88, 0.99, 1.02, 1.63, 2.21, -0.34, 1.48, -0.09, 0.37, 1.29, 0.21, 0.38, 1.83, 0.52, 0.55, 0.33, 0.52, 0.95, 1.31, 0.95, 1.32, 0.36, 1.01]} \ No newline at end of file diff --git a/annotations_1/1dwtsZ4IJQE_filtered.json b/annotations_1/1dwtsZ4IJQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b881197dfed6d4cd96a5206320da0083a25ef75 --- /dev/null +++ b/annotations_1/1dwtsZ4IJQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.76], [5.0, 27.46], [28.0, 31.01], [32.0, 34.18], [35.0, 42.74], [44.0, 45.66], [48.0, 51.14], [52.0, 56.3], [58.0, 59.81], [61.0, 68.76], [72.0, 75.05], [76.0, 81.19], [82.0, 82.36], [87.0, 97.87], [99.0, 100.87], [102.0, 105.22], [106.0, 108.09], [110.0, 111.25], [117.0, 125.69], [128.0, 128.55], [137.0, 139.51], [141.0, 142.82], [145.0, 147.19], [150.0, 151.7], [157.0, 157.77], [160.0, 161.47], [163.0, 166.14], [168.0, 168.12], [171.0, 173.91], [176.0, 205.48], [207.0, 207.66], [215.0, 219.21], [220.0, 224.78], [229.0, 229.1]], "keep_status": [false, true, false, false, true, false, false, true, false, true, true, true, false, true, false, true, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, true, false, false], "silence_prob": [0.0, 36.25, 58.89, 57.09, 30.74, 0.0, 36.11, 43.48, 0.0, 37.36, 29.8, 38.27, 0.0, 46.05, 0.0, 46.54, 51.55, 0.0, 29.85, 0.0, 51.39, 0.0, 34.9, 0.0, 0.0, 0.0, 45.05, 0.0, 60.7, 29.63, 0.0, 30.8, 29.93, 0.0], "audiomae_on_audioset": [null, [["gong", 23.38], ["speech", 13.71], ["music", 10.38]], null, null, [["music", 24.1], ["speech", 17.63], ["hum", 16.98]], null, [["hum", 28.87], ["throbbing", 27.97], ["music", 19.53]], [["music", 25.31], ["speech", 20.0], ["hum", 14.84]], null, [["music", 51.64], ["hum", 11.98], ["throbbing", 5.69]], [["music", 20.45], ["speech", 11.56], ["rumble", 9.98]], [["music", 26.97], ["scary music", 12.83], ["speech", 12.2]], null, [["speech", 22.9], ["hum", 16.88], ["music", 16.65]], null, [["music", 34.7], ["hum", 10.7], ["synthesizer", 7.23]], null, null, [["speech", 63.72], ["explosion", 9.11], ["music", 5.32]], null, null, null, [["didgeridoo", 23.32], ["music", 20.45], ["speech", 11.22]], null, null, null, [["music", 47.96], ["fart", 3.42], ["hum", 2.31]], null, null, [["music", 55.1], ["thump, thud", 7.55], ["speech", 4.9]], null, [["music", 35.9], ["speech", 15.82], ["electric shaver, electric razor", 7.73]], [["music", 73.63], ["speech", 4.84], ["thump, thud", 3.16]], null], "duration": [1.76, 22.46, 3.01, 2.18, 7.74, 1.66, 3.14, 4.3, 1.81, 7.76, 3.05, 5.19, 0.36, 10.87, 1.87, 3.22, 2.09, 1.25, 8.69, 0.55, 2.51, 1.82, 2.19, 1.7, 0.77, 1.47, 3.14, 0.12, 2.91, 29.48, 0.66, 4.21, 4.78, 0.1]} \ No newline at end of file diff --git a/annotations_1/1eN1O1j3LcY_filtered.json b/annotations_1/1eN1O1j3LcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..901e79be72a0c96114c8b0625ab7ebf950b5df5d --- /dev/null +++ b/annotations_1/1eN1O1j3LcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [10.0, 10.91], [12.0, 12.12], [13.0, 13.83], [17.0, 32.12], [35.0, 35.55], [37.0, 37.56], [45.0, 46.65], [50.0, 50.8], [52.0, 52.47], [53.0, 54.09], [55.0, 55.92], [59.0, 62.72], [64.0, 64.2], [67.0, 67.56], [69.0, 71.78], [73.0, 74.8], [76.0, 76.5], [79.0, 82.38], [85.0, 87.03], [89.0, 92.33], [95.0, 95.2], [98.0, 98.69], [109.0, 109.31], [111.0, 111.27], [113.0, 114.37], [115.0, 116.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 0.0, 88.46, 0.0, 0.0, 100.0, 95.09, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 0.91, 0.12, 0.83, 15.12, 0.55, 0.56, 1.65, 0.8, 0.47, 1.09, 0.92, 3.72, 0.2, 0.56, 2.78, 1.8, 0.5, 3.38, 2.03, 3.33, 0.2, 0.69, 0.31, 0.27, 1.37, 1.4]} \ No newline at end of file diff --git a/annotations_1/1eP7huR6T3U_filtered.json b/annotations_1/1eP7huR6T3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a29683912dac551fcfe1f2e547a28525653f842e --- /dev/null +++ b/annotations_1/1eP7huR6T3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.72], [14.0, 14.25], [17.0, 19.85], [23.0, 23.3], [24.0, 25.62], [26.0, 27.75], [31.0, 31.97], [35.0, 36.31], [38.0, 38.65], [40.0, 78.22], [79.0, 93.33], [97.0, 98.83], [102.0, 121.47], [122.0, 150.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.11, 0.0, 62.68, 32.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 26.88], ["fart", 21.26], ["animal", 6.98]]], "duration": [0.72, 0.25, 2.85, 0.3, 1.62, 1.75, 0.97, 1.31, 0.65, 38.22, 14.33, 1.83, 19.47, 28.23]} \ No newline at end of file diff --git a/annotations_1/1eSURYocFiM_filtered.json b/annotations_1/1eSURYocFiM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80d6a3ad2916eaeb141e4b65d6a5ba59aa88d27b --- /dev/null +++ b/annotations_1/1eSURYocFiM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.78], [3.0, 3.5], [8.0, 8.53], [9.0, 9.07], [21.0, 21.14], [23.0, 23.55], [45.0, 46.43], [50.0, 49.98], [52.0, 52.76], [62.0, 62.01], [70.0, 70.53], [71.0, 72.05], [74.0, 77.19], [91.0, 92.15], [93.0, 93.61], [95.0, 100.67], [103.0, 102.61], [107.0, 112.02], [113.0, 119.75], [120.0, 121.53], [122.0, 123.47], [127.0, 127.18], [147.0, 149.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 50.91, 0.0, 71.14, 89.01, 0.0, 0.0, 0.0, 51.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.78, 0.5, 0.53, 0.07, 0.14, 0.55, 1.43, -0.02, 0.76, 0.01, 0.53, 1.05, 3.19, 1.15, 0.61, 5.67, -0.39, 5.02, 6.75, 1.53, 1.47, 0.18, 2.18]} \ No newline at end of file diff --git a/annotations_1/1e_9GirqmoI_filtered.json b/annotations_1/1e_9GirqmoI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cbb77707d70e13366dd02926e8635b27086f106 --- /dev/null +++ b/annotations_1/1e_9GirqmoI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 49.71], [51.0, 52.73], [55.0, 56.1], [58.0, 58.21], [61.0, 62.01], [65.0, 74.09], [74.0, 74.76], [75.0, 75.2], [80.0, 80.28], [84.0, 86.05], [87.0, 87.69], [101.0, 110.62], [111.0, 110.74], [111.0, 120.43]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 37.07, 0.0, 0.0, 0.0, 54.97, 0.0, 42.58, 0.0, 43.33], "audiomae_on_audioset": [null, null, null, null, null, [["mains hum", 34.41], ["hum", 21.74], ["noise", 13.18]], null, null, null, null, null, [["music", 37.96], ["electronic music", 17.2], ["fly, housefly", 8.79]], null, [["fly, housefly", 27.62], ["bee, wasp, etc.", 25.67], ["insect", 17.68]]], "duration": [38.71, 1.73, 1.1, 0.21, 1.01, 9.09, 0.76, 0.2, 0.28, 2.05, 0.69, 9.62, -0.26, 9.43]} \ No newline at end of file diff --git a/annotations_1/1eoKvx5X9JQ_filtered.json b/annotations_1/1eoKvx5X9JQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/1eoKvx5X9JQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/1etjTR5wYhU_filtered.json b/annotations_1/1etjTR5wYhU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49876c6998cfb7676e6a30a376aa32a5c81c0ed0 --- /dev/null +++ b/annotations_1/1etjTR5wYhU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.64], [8.0, 9.09], [15.0, 15.47], [18.0, 19.41], [40.0, 42.28], [51.0, 55.7], [58.0, 58.63], [61.0, 62.85], [65.0, 70.93], [71.0, 74.34], [75.0, 76.38], [78.0, 101.38], [103.0, 103.1], [103.0, 104.04], [110.0, 110.37], [114.0, 117.05], [117.0, 118.07], [122.0, 122.61], [125.0, 125.93], [127.0, 127.04], [127.0, 129.81], [131.0, 132.19], [133.0, 138.11], [139.0, 141.0]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [55.81, 0.0, 0.0, 0.0, 31.02, 31.38, 0.0, 0.0, 43.69, 46.33, 0.0, 30.3, 0.0, 0.0, 0.0, 46.4, 0.0, 0.0, 0.0, 0.0, 43.0, 0.0, 46.97, 77.7], "audiomae_on_audioset": [null, null, null, null, [["cattle, bovinae", 32.02], ["speech", 23.79], ["moo", 14.59]], [["speech", 29.14], ["cattle, bovinae", 11.94], ["music", 9.89]], null, null, [["music", 48.95], ["throbbing", 13.86], ["single-lens reflex camera", 12.95]], [["sidetone", 32.36], ["speech", 22.2], ["hum", 15.55]], null, [["music", 46.3], ["speech", 9.69], ["animal", 5.59]], null, null, null, [["speech", 22.8], ["livestock, farm animals, working animals", 19.33], ["cattle, bovinae", 8.66]], null, null, null, null, [["speech", 73.08], ["electric shaver, electric razor", 6.5], ["music", 4.36]], null, [["speech", 19.04], ["fly, housefly", 15.7], ["insect", 8.17]], null], "duration": [3.64, 1.09, 0.47, 1.41, 2.28, 4.7, 0.63, 1.85, 5.93, 3.34, 1.38, 23.38, 0.1, 1.04, 0.37, 3.05, 1.07, 0.61, 0.93, 0.04, 2.81, 1.19, 5.11, 2.0]} \ No newline at end of file diff --git a/annotations_1/1fp6lBNB7aw_filtered.json b/annotations_1/1fp6lBNB7aw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6385d211a48cf14b4e51ad020725e5c11bbcf265 --- /dev/null +++ b/annotations_1/1fp6lBNB7aw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 27.53], [31.0, 39.23], [40.0, 52.84], [53.0, 54.43], [55.0, 55.32], [65.0, 68.5], [69.0, 70.17], [71.0, 71.81], [75.0, 75.54], [76.0, 79.78], [108.0, 114.98], [117.0, 117.32], [118.0, 118.2], [119.0, 120.45], [127.0, 126.91], [140.0, 141.18]], "keep_status": [false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [33.89, 31.08, 48.87, 0.0, 0.0, 63.64, 0.0, 0.0, 0.0, 37.14, 30.46, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 64.32], ["chime", 4.52], ["glockenspiel", 4.17]], [["music", 22.21], ["speech", 16.33], ["noise", 7.45]], [["speech", 17.01], ["cattle, bovinae", 8.82], ["animal", 8.24]], null, null, null, null, null, null, [["speech", 61.28], ["radio", 11.3], ["outside, rural or natural", 2.62]], [["music", 37.56], ["musical instrument", 12.81], ["noise", 7.34]], null, null, null, null, null], "duration": [12.53, 8.23, 12.84, 1.43, 0.32, 3.5, 1.17, 0.81, 0.54, 3.78, 6.98, 0.32, 0.2, 1.45, -0.09, 1.18]} \ No newline at end of file diff --git a/annotations_1/1gj7X8C31Tg_filtered.json b/annotations_1/1gj7X8C31Tg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..893e9d36d6d7a5b0a9240e2a7217b48336f9d74c --- /dev/null +++ b/annotations_1/1gj7X8C31Tg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 30.99], [31.0, 31.67], [32.0, 33.05], [34.0, 34.57], [35.0, 54.33], [58.0, 58.38], [59.0, 95.67], [97.0, 137.73], [139.0, 144.34], [145.0, 151.56], [161.0, 168.67], [170.0, 170.63]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.02, 0.0, 0.0, 0.0, 31.91, 37.24, 34.37, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 15.06], ["hum", 11.68], ["throbbing", 6.63]], null, null, null, [["animal", 22.77], ["neigh, whinny", 17.56], ["horse", 9.01]], [["noise", 58.59], ["radio", 12.48], ["speech", 11.54]], [["whale vocalization", 50.53], ["animal", 17.16], ["speech", 11.24]], null], "duration": [-0.01, 0.67, 1.05, 0.57, 19.33, 0.38, 36.67, 40.73, 5.34, 6.56, 7.67, 0.63]} \ No newline at end of file diff --git a/annotations_1/1iEOBKuW9TQ_filtered.json b/annotations_1/1iEOBKuW9TQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..585f0fed4fd0e90005a59f2e7464497b3d0188b9 --- /dev/null +++ b/annotations_1/1iEOBKuW9TQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 20.41], [22.0, 27.87], [28.0, 32.04], [33.0, 34.21], [38.0, 38.92], [39.0, 39.77], [40.0, 46.16], [48.0, 56.08], [57.0, 57.06], [65.0, 65.92], [69.0, 69.28], [82.0, 93.12], [96.0, 104.5], [105.0, 105.54], [107.0, 156.14], [157.0, 156.76], [158.0, 158.35], [159.0, 162.55], [164.0, 166.55], [169.0, 168.99], [169.0, 169.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [31.12, 28.7, 28.58, 0.0, 0.0, 0.0, 28.95, 33.68, 0.0, 0.0, 0.0, 29.4, 29.59, 0.0, 0.0, 0.0, 0.0, 29.22, 39.77, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.98], ["throbbing", 16.49], ["speech", 16.39]], [["music", 85.16], ["throbbing", 4.94], ["hum", 3.06]], [["music", 74.06], ["throbbing", 9.59], ["hum", 7.57]], null, null, null, [["music", 56.78], ["throbbing", 17.63], ["electronic music", 8.62]], [["hum", 39.47], ["throbbing", 25.09], ["music", 20.68]], null, null, null, [["music", 58.61], ["speech", 25.11], ["didgeridoo", 6.03]], [["music", 40.75], ["speech", 21.78], ["electronic music", 7.92]], null, null, null, null, [["music", 83.99], ["synthesizer", 2.04], ["musical instrument", 1.92]], [["music", 24.73], ["throbbing", 12.03], ["hum", 8.48]], null, null], "duration": [13.41, 5.87, 4.04, 1.21, 0.92, 0.77, 6.16, 8.08, 0.06, 0.92, 0.28, 11.12, 8.5, 0.54, 49.14, -0.24, 0.35, 3.55, 2.55, -0.01, 0.03]} \ No newline at end of file diff --git a/annotations_1/1iOnKJA2H7I_filtered.json b/annotations_1/1iOnKJA2H7I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d19e2370268f8db62b6975a1528d76fb2ee7df0a --- /dev/null +++ b/annotations_1/1iOnKJA2H7I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 20.55], [22.0, 28.19], [30.0, 32.48], [40.0, 46.7], [48.0, 50.79], [57.0, 58.09], [60.0, 60.84], [63.0, 84.13], [85.0, 87.24], [88.0, 98.37], [99.0, 99.77], [103.0, 103.23], [107.0, 107.76], [118.0, 118.29], [121.0, 120.93], [121.0, 123.11], [124.0, 127.48], [129.0, 153.28], [154.0, 154.8], [156.0, 163.09], [164.0, 180.33]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [77.53, 94.37, 69.88, 93.13, 94.22, 0.0, 0.0, 49.59, 96.42, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 60.6, 91.64, 97.22, 0.0, 98.36, 44.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["fly, housefly", 34.03], ["insect", 11.35], ["mosquito", 7.46]], null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 18.1], ["animal", 15.03], ["moo", 9.89]]], "duration": [13.55, 6.19, 2.48, 6.7, 2.79, 1.09, 0.84, 21.13, 2.24, 10.37, 0.77, 0.23, 0.76, 0.29, -0.07, 2.11, 3.48, 24.28, 0.8, 7.09, 16.33]} \ No newline at end of file diff --git a/annotations_1/1id63E3KgH0_filtered.json b/annotations_1/1id63E3KgH0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0baa174c32ffe87ca54f0f77a269ff04ce75abdc --- /dev/null +++ b/annotations_1/1id63E3KgH0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.88], [11.0, 31.82], [37.0, 36.81], [38.0, 38.55], [39.0, 39.68], [41.0, 45.5], [47.0, 68.1], [75.0, 111.48], [114.0, 124.55], [126.0, 153.62], [155.0, 171.49]], "keep_status": [false, false, false, false, false, true, true, false, true, true, true], "silence_prob": [0.0, 28.88, 0.0, 0.0, 0.0, 28.94, 29.15, 0.0, 28.91, 28.36, 28.54], "audiomae_on_audioset": [null, [["music", 40.97], ["speech", 27.78], ["throbbing", 6.39]], null, null, null, [["music", 51.84], ["speech", 7.66], ["throbbing", 7.35]], [["livestock, farm animals, working animals", 24.16], ["speech", 20.52], ["cattle, bovinae", 10.05]], null, [["music", 38.29], ["speech", 23.22], ["whack, thwack", 7.77]], [["speech", 35.98], ["music", 15.38], ["mains hum", 14.61]], [["music", 33.34], ["hum", 16.26], ["mains hum", 10.11]]], "duration": [1.88, 20.82, -0.19, 0.55, 0.68, 4.5, 21.1, 36.48, 10.55, 27.62, 16.49]} \ No newline at end of file diff --git a/annotations_1/1jEe_vPgNJE_filtered.json b/annotations_1/1jEe_vPgNJE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d598dd8a3b4ab6f17ad729b19142589c8cf29809 --- /dev/null +++ b/annotations_1/1jEe_vPgNJE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.94], [7.0, 7.75], [10.0, 17.81], [21.0, 21.36], [23.0, 25.1], [44.0, 44.74], [50.0, 51.21], [54.0, 57.59], [67.0, 69.8], [71.0, 72.17], [80.0, 82.26], [88.0, 91.03], [95.0, 95.15], [99.0, 102.76], [107.0, 107.92], [108.0, 109.16], [111.0, 111.37], [114.0, 143.26], [144.0, 144.29], [145.0, 145.32]], "keep_status": [false, false, true, false, false, false, false, true, false, false, true, true, false, true, false, false, false, true, false, false], "silence_prob": [50.56, 0.0, 42.81, 0.0, 69.88, 0.0, 0.0, 29.06, 29.62, 0.0, 31.4, 30.08, 0.0, 28.24, 0.0, 0.0, 0.0, 28.71, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 47.87], ["speech", 7.48], ["theremin", 6.43]], null, null, null, null, [["hum", 21.74], ["mains hum", 20.36], ["music", 17.63]], [["hum", 28.25], ["music", 25.9], ["mains hum", 21.74]], null, [["music", 50.66], ["didgeridoo", 6.66], ["mains hum", 5.35]], [["music", 24.02], ["speech", 21.74], ["rumble", 8.0]], null, [["music", 31.04], ["speech", 18.29], ["cattle, bovinae", 10.11]], null, null, null, [["hum", 23.68], ["buzz", 22.18], ["mains hum", 16.27]], null, null], "duration": [3.94, 0.75, 7.81, 0.36, 2.1, 0.74, 1.21, 3.59, 2.8, 1.17, 2.26, 3.03, 0.15, 3.76, 0.92, 1.16, 0.37, 29.26, 0.29, 0.32]} \ No newline at end of file diff --git a/annotations_1/1jK2Y8vAM1A_filtered.json b/annotations_1/1jK2Y8vAM1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b7a98730482c7bc7721920d976b52d68cf6701b --- /dev/null +++ b/annotations_1/1jK2Y8vAM1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [4.0, 4.89], [5.0, 5.66], [6.0, 6.44], [17.0, 16.87], [18.0, 19.4], [20.0, 21.0], [22.0, 23.35], [24.0, 26.42], [35.0, 35.36], [40.0, 40.14], [65.0, 65.69], [68.0, 68.27], [73.0, 73.08], [75.0, 74.58], [76.0, 76.67], [77.0, 77.63], [80.0, 79.74], [86.0, 86.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 0.89, 0.66, 0.44, -0.13, 1.4, 1.0, 1.35, 2.42, 0.36, 0.14, 0.69, 0.27, 0.08, -0.42, 0.67, 0.63, -0.26, 0.22]} \ No newline at end of file diff --git a/annotations_1/1jjQuF3a-7U_filtered.json b/annotations_1/1jjQuF3a-7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da5d80ebe1e5769c2b97197b752d6c069752e3b5 --- /dev/null +++ b/annotations_1/1jjQuF3a-7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.37], [3.0, 4.29], [5.0, 5.36], [6.0, 6.47], [8.0, 12.41], [14.0, 19.38], [20.0, 20.29], [31.0, 30.99], [33.0, 32.73], [33.0, 33.44], [40.0, 61.33], [64.0, 65.1], [67.0, 87.05], [102.0, 102.66], [105.0, 109.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.94, 34.03, 0.0, 0.0, 0.0, 0.0, 35.61, 0.0, 32.21, 0.0, 55.67], "audiomae_on_audioset": [null, null, null, null, [["music", 76.33], ["speech", 9.53], ["ambient music", 2.63]], [["ding", 35.88], ["music", 29.17], ["clang", 11.97]], null, null, null, null, [["music", 50.55], ["sonar", 9.99], ["throbbing", 4.95]], null, [["music", 59.43], ["boing", 10.55], ["synthesizer", 7.23]], null, null], "duration": [0.37, 1.29, 0.36, 0.47, 4.41, 5.38, 0.29, -0.01, -0.27, 0.44, 21.33, 1.1, 20.05, 0.66, 4.31]} \ No newline at end of file diff --git a/annotations_1/1kNZdy-IxNQ_filtered.json b/annotations_1/1kNZdy-IxNQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7590c0b6327d4982d22c3eafd8048abea883edfe --- /dev/null +++ b/annotations_1/1kNZdy-IxNQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 34.32], [36.0, 39.46], [41.0, 51.31], [54.0, 73.09], [76.0, 92.2], [94.0, 94.83], [96.0, 133.14], [136.0, 182.36], [183.0, 195.1]], "keep_status": [false, true, false, false, true, false, false, false, false], "silence_prob": [30.59, 34.51, 30.32, 31.72, 31.29, 0.0, 0.0, 0.0, 32.99], "audiomae_on_audioset": [[["rumble", 42.66], ["whale vocalization", 27.19], ["music", 11.27]], [["hum", 22.47], ["mains hum", 19.86], ["speech", 14.42]], [["music", 32.79], ["mains hum", 21.15], ["hum", 16.25]], [["music", 49.01], ["sonar", 40.5], ["electronic music", 2.83]], [["music", 24.71], ["hum", 14.47], ["mains hum", 6.89]], null, null, null, [["hum", 50.5], ["mains hum", 20.85], ["music", 5.74]]], "duration": [5.32, 3.46, 10.31, 19.09, 16.2, 0.83, 37.14, 46.36, 12.1]} \ No newline at end of file diff --git a/annotations_1/1kPvrYaCi4c_filtered.json b/annotations_1/1kPvrYaCi4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95b5143ea88607f6c504501fa8961637c44a7de5 --- /dev/null +++ b/annotations_1/1kPvrYaCi4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 28.85], [31.0, 41.05], [42.0, 74.58], [78.0, 81.19], [86.0, 99.37], [103.0, 109.05], [112.0, 116.14], [120.0, 133.73], [135.0, 139.48], [141.0, 142.23], [143.0, 145.79]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [100.0, 34.2, 0.0, 46.05, 31.69, 34.96, 99.52, 59.96, 99.05, 0.0, 81.89], "audiomae_on_audioset": [null, [["music", 76.78], ["grunt", 5.35], ["groan", 2.49]], null, [["fly, housefly", 56.49], ["insect", 12.0], ["mosquito", 10.2]], [["music", 15.74], ["speech", 12.72], ["groan", 4.73]], [["speech", 31.08], ["animal", 15.13], ["whale vocalization", 12.61]], null, null, null, null, null], "duration": [4.85, 10.05, 32.58, 3.19, 13.37, 6.05, 4.14, 13.73, 4.48, 1.23, 2.79]} \ No newline at end of file diff --git a/annotations_1/1kuNl2T_mjQ_filtered.json b/annotations_1/1kuNl2T_mjQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b1b6c4b28c3ad0b1e0efb2b77f72c563f5e29a2 --- /dev/null +++ b/annotations_1/1kuNl2T_mjQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.42], [12.0, 13.59], [27.0, 34.55], [35.0, 38.48], [40.0, 39.83], [42.0, 42.85], [44.0, 50.45], [52.0, 54.28], [55.0, 86.24], [92.0, 103.11], [110.0, 110.22], [113.0, 117.22], [123.0, 127.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 76.37, 91.98, 0.0, 0.0, 96.42, 37.21, 0.0, 29.25, 0.0, 29.24, 29.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 62.15], ["musical instrument", 8.12], ["synthesizer", 7.48]], null, [["music", 82.5], ["musical instrument", 1.24], ["singing", 1.21]], null, [["music", 79.31], ["didgeridoo", 2.11], ["musical instrument", 1.78]], [["music", 61.13], ["singing", 3.68], ["musical instrument", 1.87]]], "duration": [1.42, 1.59, 7.55, 3.48, -0.17, 0.85, 6.45, 2.28, 31.24, 11.11, 0.22, 4.22, 4.52]} \ No newline at end of file diff --git a/annotations_1/1lt4euqZLsY_filtered.json b/annotations_1/1lt4euqZLsY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a51c03ae1efc7c9fab715c87a742f0d884b3e6b3 --- /dev/null +++ b/annotations_1/1lt4euqZLsY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.95], [15.0, 17.54], [35.0, 35.77], [62.0, 65.72]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 44.57, 0.0, 30.41], "audiomae_on_audioset": [null, [["music", 50.78], ["throbbing", 16.1], ["hum", 6.11]], null, [["music", 55.74], ["didgeridoo", 37.3], ["musical instrument", 2.19]]], "duration": [-0.05, 2.54, 0.77, 3.72]} \ No newline at end of file diff --git a/annotations_1/1lxY4Sc9eNg_filtered.json b/annotations_1/1lxY4Sc9eNg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4209952c9fe75331f29c01924eb1d1e44c9d6775 --- /dev/null +++ b/annotations_1/1lxY4Sc9eNg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.3], [10.0, 11.72], [12.0, 13.29], [15.0, 16.29], [18.0, 19.95], [21.0, 23.89], [30.0, 31.41], [33.0, 34.55], [36.0, 38.13], [41.0, 45.57], [49.0, 59.78], [62.0, 63.9], [67.0, 69.57], [70.0, 72.33], [74.0, 77.52], [79.0, 84.06], [86.0, 102.25], [104.0, 104.48], [106.0, 128.66], [129.0, 136.38], [137.0, 137.37]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [47.98, 0.0, 0.0, 0.0, 0.0, 33.95, 0.0, 0.0, 45.4, 52.27, 47.23, 0.0, 68.54, 41.87, 56.86, 47.94, 41.64, 0.0, 32.21, 36.48, 0.0], "audiomae_on_audioset": [[["fly, housefly", 31.5], ["bee, wasp, etc.", 19.48], ["insect", 13.25]], null, null, null, null, [["sidetone", 46.45], ["bee, wasp, etc.", 9.84], ["speech", 8.49]], null, null, [["fly, housefly", 35.78], ["bee, wasp, etc.", 22.76], ["insect", 20.28]], null, [["hum", 42.9], ["mains hum", 27.41], ["speech", 5.17]], null, null, [["sine wave", 16.38], ["sidetone", 14.71], ["fly, housefly", 13.78]], null, [["hum", 55.25], ["mains hum", 27.09], ["sidetone", 5.22]], [["fly, housefly", 43.48], ["insect", 37.33], ["bee, wasp, etc.", 6.28]], null, [["hum", 27.46], ["speech", 27.24], ["mains hum", 7.82]], [["hum", 45.52], ["mains hum", 35.19], ["speech", 6.9]], null], "duration": [5.3, 1.72, 1.29, 1.29, 1.95, 2.89, 1.41, 1.55, 2.13, 4.57, 10.78, 1.9, 2.57, 2.33, 3.52, 5.06, 16.25, 0.48, 22.66, 7.38, 0.37]} \ No newline at end of file diff --git a/annotations_1/1m8Ac21hxO4_filtered.json b/annotations_1/1m8Ac21hxO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..865fe80672ba9334ef56cf1eaf93987ff9da16d9 --- /dev/null +++ b/annotations_1/1m8Ac21hxO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.46], [14.0, 14.91], [17.0, 19.33], [22.0, 22.69], [24.0, 37.0], [38.0, 46.35], [60.0, 65.79], [74.0, 74.82], [80.0, 115.13], [116.0, 132.46], [136.0, 151.17]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [73.21, 0.0, 94.37, 0.0, 63.31, 55.74, 51.34, 0.0, 0.0, 37.22, 29.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 25.0], ["speech", 23.35], ["music", 20.45]], [["insect", 15.9], ["music", 13.53], ["livestock, farm animals, working animals", 11.86]]], "duration": [11.46, 0.91, 2.33, 0.69, 13.0, 8.35, 5.79, 0.82, 35.13, 16.46, 15.17]} \ No newline at end of file diff --git a/annotations_1/1mLEN1SN9Eo_filtered.json b/annotations_1/1mLEN1SN9Eo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97161e17df9af658e6d0b7699af28359a9f1fbd5 --- /dev/null +++ b/annotations_1/1mLEN1SN9Eo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.59], [13.0, 13.04], [14.0, 15.35], [19.0, 18.94], [20.0, 22.82], [31.0, 31.97], [33.0, 34.72], [37.0, 47.16], [49.0, 49.2], [51.0, 52.27], [56.0, 63.27], [82.0, 88.28], [89.0, 88.92], [94.0, 100.08], [102.0, 102.63], [104.0, 105.76], [110.0, 110.3], [112.0, 112.43], [115.0, 115.18], [116.0, 117.37], [119.0, 119.3], [121.0, 120.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 43.58, 0.0, 0.0, 33.81, 35.01, 0.0, 31.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 38.59], ["throbbing", 30.83], ["hum", 13.83]], null, null, [["music", 73.73], ["boing", 5.82], ["drum machine", 2.14]], [["music", 78.25], ["musical instrument", 7.97], ["singing", 2.13]], null, [["music", 42.26], ["musical instrument", 5.24], ["speech", 5.12]], null, null, null, null, null, null, null, null], "duration": [-0.41, 0.04, 1.35, -0.06, 2.82, 0.97, 1.72, 10.16, 0.2, 1.27, 7.27, 6.28, -0.08, 6.08, 0.63, 1.76, 0.3, 0.43, 0.18, 1.37, 0.3, -0.15]} \ No newline at end of file diff --git a/annotations_1/1mVk7wal9bk_filtered.json b/annotations_1/1mVk7wal9bk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cb41092a741967c77de8150bd412cd43b5203ee --- /dev/null +++ b/annotations_1/1mVk7wal9bk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.62], [8.0, 8.6], [25.0, 31.41], [32.0, 41.08], [41.0, 42.09], [44.0, 44.44], [45.0, 48.88], [50.0, 50.82], [52.0, 52.1], [56.0, 57.32], [65.0, 72.06], [76.0, 79.03], [81.0, 80.76], [82.0, 85.67], [86.0, 89.21], [90.0, 110.32], [111.0, 139.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 42.65, 30.01, 0.0, 0.0, 29.58, 0.0, 0.0, 0.0, 29.29, 29.53, 0.0, 30.45, 29.75, 29.88, 29.2], "audiomae_on_audioset": [null, null, [["music", 59.56], ["didgeridoo", 8.62], ["speech", 5.72]], [["cattle, bovinae", 36.55], ["livestock, farm animals, working animals", 27.79], ["moo", 26.01]], null, null, [["cattle, bovinae", 40.82], ["livestock, farm animals, working animals", 19.5], ["moo", 17.74]], null, null, null, [["speech", 27.09], ["vehicle", 16.79], ["car", 13.57]], [["music", 26.19], ["noise", 10.9], ["effects unit", 10.37]], null, [["music", 23.68], ["cattle, bovinae", 15.33], ["moo", 12.41]], [["music", 47.08], ["tubular bells", 5.62], ["speech", 3.48]], [["throbbing", 38.83], ["hum", 30.04], ["music", 16.36]], [["music", 76.25], ["throbbing", 4.48], ["electronic music", 2.71]]], "duration": [0.62, 0.6, 6.41, 9.08, 1.09, 0.44, 3.88, 0.82, 0.1, 1.32, 7.06, 3.03, -0.24, 3.67, 3.21, 20.32, 28.87]} \ No newline at end of file diff --git a/annotations_1/1maNhuFVhmk_filtered.json b/annotations_1/1maNhuFVhmk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..838a5d5531270ad1527e8517d25d7a69aa4696e6 --- /dev/null +++ b/annotations_1/1maNhuFVhmk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.98], [17.0, 17.61], [21.0, 21.66], [28.0, 28.44], [30.0, 29.89], [35.0, 35.72], [49.0, 49.44], [54.0, 54.46], [65.0, 65.97], [86.0, 86.59], [89.0, 89.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.02, 0.61, 0.66, 0.44, -0.11, 0.72, 0.44, 0.46, 0.97, 0.59, 0.48]} \ No newline at end of file diff --git a/annotations_1/1mqubJrf6KA_filtered.json b/annotations_1/1mqubJrf6KA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1f930888b3d174061e7fc7ae8ef1b6f73e42238 --- /dev/null +++ b/annotations_1/1mqubJrf6KA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [4.0, 4.83], [5.0, 7.75], [8.0, 12.63], [14.0, 16.31], [18.0, 18.84], [21.0, 21.86], [31.0, 37.77], [39.0, 40.83], [41.0, 99.74], [100.0, 100.16], [100.0, 171.15]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 42.98, 58.81, 60.23, 0.0, 0.0, 30.56, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 57.49], ["sine wave", 17.86], ["dial tone", 8.46]], null, null, null, null, [["animal", 31.61], ["wild animals", 18.27], ["roar", 7.91]], null, null, null, null], "duration": [0.47, 0.83, 2.75, 4.63, 2.31, 0.84, 0.86, 6.77, 1.83, 58.74, 0.16, 71.15]} \ No newline at end of file diff --git a/annotations_1/1ovQhqQy7bE_filtered.json b/annotations_1/1ovQhqQy7bE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b4e719576346bfc15f1ccfeb5b8c9e07a642ce3 --- /dev/null +++ b/annotations_1/1ovQhqQy7bE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.28], [47.0, 57.4], [62.0, 63.69], [64.0, 65.01], [66.0, 68.03], [69.0, 69.96], [72.0, 72.54], [80.0, 80.7], [82.0, 82.58], [85.0, 86.05], [89.0, 89.02], [90.0, 91.18], [92.0, 93.19], [95.0, 115.69], [117.0, 117.07], [118.0, 119.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.43, 38.08, 0.0, 0.0, 64.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.74, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 56.33], ["music", 15.96], ["sidetone", 3.23]], [["speech", 62.6], ["hum", 8.29], ["sidetone", 6.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.28, 10.4, 1.69, 1.01, 2.03, 0.96, 0.54, 0.7, 0.58, 1.05, 0.02, 1.18, 1.19, 20.69, 0.07, 1.7]} \ No newline at end of file diff --git a/annotations_1/1pzV9GoSuys_filtered.json b/annotations_1/1pzV9GoSuys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6f5071d92d1310a393aee7ec3d798c8f89169b0 --- /dev/null +++ b/annotations_1/1pzV9GoSuys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.96], [12.0, 12.83], [15.0, 18.03], [19.0, 19.43], [20.0, 23.25], [25.0, 31.01], [33.0, 33.37], [35.0, 35.6], [37.0, 38.37], [40.0, 41.76], [44.0, 44.86], [46.0, 47.22], [48.0, 49.25], [52.0, 54.26], [55.0, 55.49], [56.0, 57.77], [60.0, 61.43]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 47.05, 0.0, 38.45, 38.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 22.2], ["rumble", 13.94], ["throbbing", 6.34]], null, [["speech", 60.23], ["rumble", 17.35], ["hum", 3.28]], [["hum", 29.84], ["throbbing", 13.61], ["gong", 11.58]], null, null, null, null, null, null, null, [["speech", 11.84], ["gong", 9.72], ["hum", 9.09]], null, null, null], "duration": [0.96, 0.83, 3.03, 0.43, 3.25, 6.01, 0.37, 0.6, 1.37, 1.76, 0.86, 1.22, 1.25, 2.26, 0.49, 1.77, 1.43]} \ No newline at end of file diff --git a/annotations_1/1q-FL1Wd0EE_filtered.json b/annotations_1/1q-FL1Wd0EE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9cfddd1b43f00112ee21d61c67161d5c6cc8ec31 --- /dev/null +++ b/annotations_1/1q-FL1Wd0EE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.23], [10.0, 15.09], [19.0, 36.31], [38.0, 42.65], [43.0, 45.66], [47.0, 48.88], [51.0, 56.0], [57.0, 67.26], [67.0, 68.45], [69.0, 72.44], [74.0, 76.18], [77.0, 78.22], [80.0, 81.89], [83.0, 87.93], [89.0, 90.29], [92.0, 93.43], [95.0, 96.8], [97.0, 98.32], [100.0, 100.92], [102.0, 109.02], [110.0, 112.45], [113.0, 122.32], [123.0, 133.64], [136.0, 139.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.17, 83.16, 85.17, 99.56, 0.0, 99.44, 70.3, 0.0, 74.76, 100.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 99.98, 91.81, 98.73, 97.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 5.09, 17.31, 4.65, 2.66, 1.88, 5.0, 10.26, 1.45, 3.44, 2.18, 1.22, 1.89, 4.93, 1.29, 1.43, 1.8, 1.32, 0.92, 7.02, 2.45, 9.32, 10.64, 3.62]} \ No newline at end of file diff --git a/annotations_1/1qYVJgixc3U_filtered.json b/annotations_1/1qYVJgixc3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..756d377fd5fbf195c39605fcafb33b8ae07bec1d --- /dev/null +++ b/annotations_1/1qYVJgixc3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 36.78], [39.0, 39.34], [40.0, 69.33], [70.0, 76.79], [92.0, 92.64], [98.0, 98.47], [99.0, 152.32], [152.0, 163.68], [169.0, 185.7], [187.0, 213.06], [219.0, 219.18], [221.0, 234.79], [238.0, 256.78], [261.0, 271.9]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 30.02, 30.95, 0.0, 0.0, 0.0, 30.27, 29.92, 30.28, 0.0, 30.03, 30.28, 30.42], "audiomae_on_audioset": [null, null, [["music", 43.67], ["hum", 9.28], ["throbbing", 9.04]], [["music", 30.85], ["mains hum", 20.99], ["hum", 19.58]], null, null, null, [["music", 41.68], ["mosquito", 11.23], ["fly, housefly", 9.83]], [["music", 57.81], ["hum", 13.39], ["throbbing", 6.27]], [["speech", 55.13], ["music", 18.33], ["fart", 3.88]], null, [["music", 40.75], ["machine gun", 6.96], ["effects unit", 4.18]], [["music", 31.85], ["noise", 9.57], ["throbbing", 9.01]], [["music", 45.74], ["hum", 20.99], ["throbbing", 16.87]]], "duration": [-0.22, 0.34, 29.33, 6.79, 0.64, 0.47, 53.32, 11.68, 16.7, 26.06, 0.18, 13.79, 18.78, 10.9]} \ No newline at end of file diff --git a/annotations_1/1rJ_NvTBOmc_filtered.json b/annotations_1/1rJ_NvTBOmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66073d21259fd0aa451da15c25d8149b5d373cdc --- /dev/null +++ b/annotations_1/1rJ_NvTBOmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.91], [22.0, 22.13], [25.0, 25.81], [28.0, 29.49], [51.0, 50.85], [52.0, 52.56], [54.0, 55.16], [56.0, 56.32], [73.0, 74.01], [83.0, 83.91], [88.0, 88.38], [90.0, 89.9], [92.0, 93.48], [108.0, 107.99], [110.0, 111.15], [113.0, 117.1], [121.0, 122.55], [124.0, 124.06], [129.0, 129.76], [133.0, 133.57], [136.0, 136.21], [139.0, 139.5], [140.0, 141.86], [143.0, 143.07], [147.0, 148.1], [150.0, 150.99], [152.0, 158.48], [160.0, 162.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.91, 0.13, 0.81, 1.49, -0.15, 0.56, 1.16, 0.32, 1.01, 0.91, 0.38, -0.1, 1.48, -0.01, 1.15, 4.1, 1.55, 0.06, 0.76, 0.57, 0.21, 0.5, 1.86, 0.07, 1.1, 0.99, 6.48, 2.01]} \ No newline at end of file diff --git a/annotations_1/1rKzD4yNMoc_filtered.json b/annotations_1/1rKzD4yNMoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87497405a62f71ea59eca708e01e26b029825e45 --- /dev/null +++ b/annotations_1/1rKzD4yNMoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 91.4]], "keep_status": [true], "silence_prob": [31.8], "audiomae_on_audioset": [[["music", 45.83], ["animal", 8.61], ["speech", 5.87]]], "duration": [10.4]} \ No newline at end of file diff --git a/annotations_1/1rP402h6Euo_filtered.json b/annotations_1/1rP402h6Euo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3712a804c0dbba30bf3c1a2fcb1f93a62593790 --- /dev/null +++ b/annotations_1/1rP402h6Euo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.82], [15.0, 15.58], [18.0, 20.41], [21.0, 21.81], [25.0, 95.96], [99.0, 110.81]], "keep_status": [false, false, false, false, false, true], "silence_prob": [84.98, 0.0, 98.93, 0.0, 0.0, 33.06], "audiomae_on_audioset": [null, null, null, null, null, [["music", 49.12], ["hum", 9.83], ["throbbing", 8.37]]], "duration": [2.82, 0.58, 2.41, 0.81, 70.96, 11.81]} \ No newline at end of file diff --git a/annotations_1/1sz2oWajICY_filtered.json b/annotations_1/1sz2oWajICY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2544f68e84657d3018027b2dda62a99b472357c6 --- /dev/null +++ b/annotations_1/1sz2oWajICY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.37], [19.0, 25.95], [28.0, 29.62], [32.0, 32.58], [37.0, 39.09], [41.0, 41.86], [42.0, 47.02], [48.0, 50.36], [51.0, 62.94], [64.0, 70.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 78.72, 0.0, 0.0, 96.29, 0.0, 84.62, 100.0, 99.78, 99.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.37, 6.95, 1.62, 0.58, 2.09, 0.86, 5.02, 2.36, 11.94, 6.97]} \ No newline at end of file diff --git a/annotations_1/1ugiiAH40_w_filtered.json b/annotations_1/1ugiiAH40_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..745712e6c692e19e4686c1968f3e63f540bf1905 --- /dev/null +++ b/annotations_1/1ugiiAH40_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.94], [7.0, 7.6], [8.0, 13.61], [14.0, 25.22], [26.0, 27.99], [30.0, 35.28], [37.0, 37.25], [65.0, 65.91], [67.0, 67.05], [72.0, 74.43], [87.0, 96.6], [101.0, 101.78], [104.0, 104.89], [107.0, 108.68], [110.0, 116.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 79.76, 52.22, 0.0, 93.45, 0.0, 0.0, 0.0, 83.16, 81.89, 0.0, 0.0, 0.0, 93.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 0.6, 5.61, 11.22, 1.99, 5.28, 0.25, 0.91, 0.05, 2.43, 9.6, 0.78, 0.89, 1.68, 6.61]} \ No newline at end of file diff --git a/annotations_1/1vNv-pE8I_c_filtered.json b/annotations_1/1vNv-pE8I_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88bf4b8785edb6b52ba24739bbc2347a861a0c16 --- /dev/null +++ b/annotations_1/1vNv-pE8I_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.71], [2.0, 27.46], [32.0, 43.75], [49.0, 63.83], [67.0, 67.76], [69.0, 69.72], [71.0, 120.09], [121.0, 121.73], [123.0, 137.62], [139.0, 139.31], [140.0, 148.81], [153.0, 160.74]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 33.14, 32.14, 31.85, 0.0, 0.0, 0.0, 0.0, 43.85, 0.0, 59.96, 37.2], "audiomae_on_audioset": [null, [["music", 73.66], ["musical instrument", 3.72], ["trombone", 2.12]], [["music", 58.15], ["trombone", 9.75], ["musical instrument", 6.52]], [["music", 56.04], ["cacophony", 5.58], ["musical instrument", 5.39]], null, null, null, null, [["music", 29.11], ["mains hum", 15.69], ["hum", 12.83]], null, null, [["music", 64.65], ["theremin", 3.89], ["musical instrument", 3.31]]], "duration": [-0.29, 25.46, 11.75, 14.83, 0.76, 0.72, 49.09, 0.73, 14.62, 0.31, 8.81, 7.74]} \ No newline at end of file diff --git a/annotations_1/1vhyMvNS3Ek_filtered.json b/annotations_1/1vhyMvNS3Ek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f37b235fdf06ebcb1e7d370c1e83546e0112a42f --- /dev/null +++ b/annotations_1/1vhyMvNS3Ek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 24.81], [26.0, 27.58], [43.0, 43.33], [47.0, 47.61], [56.0, 57.28], [59.0, 59.88], [61.0, 63.93], [64.0, 66.99], [68.0, 68.93], [74.0, 75.61], [78.0, 78.7], [84.0, 85.36], [88.0, 88.38], [93.0, 93.51], [97.0, 97.46], [99.0, 100.08], [104.0, 105.12], [107.0, 106.79], [113.0, 113.53], [127.0, 126.93], [130.0, 132.41], [139.0, 139.72], [145.0, 145.32], [155.0, 155.53], [157.0, 157.01], [158.0, 159.46], [160.0, 160.52], [164.0, 166.08], [169.0, 169.8], [171.0, 172.76], [174.0, 174.36], [178.0, 177.77], [180.0, 184.99]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.63, 49.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67, 0.0, 0.0, 0.0, 0.0, 71.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 38.72], ["didgeridoo", 9.66], ["speech", 7.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.19, 1.58, 0.33, 0.61, 1.28, 0.88, 2.93, 2.99, 0.93, 1.61, 0.7, 1.36, 0.38, 0.51, 0.46, 1.08, 1.12, -0.21, 0.53, -0.07, 2.41, 0.72, 0.32, 0.53, 0.01, 1.46, 0.52, 2.08, 0.8, 1.76, 0.36, -0.23, 4.99]} \ No newline at end of file diff --git a/annotations_1/1x3IKujLO-E_filtered.json b/annotations_1/1x3IKujLO-E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3e06ba1eaea04b785ccfede5112ed37b94cfe8e --- /dev/null +++ b/annotations_1/1x3IKujLO-E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 25.1], [26.0, 31.04], [32.0, 33.86], [35.0, 36.02], [37.0, 59.97], [61.0, 61.97], [67.0, 68.59], [71.0, 89.41], [91.0, 91.25], [94.0, 141.51], [142.0, 163.26], [163.0, 163.32], [166.0, 189.99]], "keep_status": [true, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [28.91, 30.1, 0.0, 0.0, 29.03, 0.0, 0.0, 29.23, 0.0, 0.0, 29.29, 0.0, 28.4], "audiomae_on_audioset": [[["music", 20.83], ["vehicle", 12.69], ["explosion", 7.09]], [["music", 54.01], ["emergency vehicle", 3.91], ["siren", 3.56]], null, null, [["clang", 29.38], ["music", 18.18], ["ding", 11.07]], null, null, [["speech", 45.24], ["music", 19.82], ["buzz", 6.36]], null, null, [["hum", 62.06], ["mains hum", 14.65], ["throbbing", 6.53]], null, [["speech", 49.69], ["vehicle", 15.6], ["car", 8.28]]], "duration": [25.1, 5.04, 1.86, 1.02, 22.97, 0.97, 1.59, 18.41, 0.25, 47.51, 21.26, 0.32, 23.99]} \ No newline at end of file diff --git a/annotations_1/1xXjjahIwr8_filtered.json b/annotations_1/1xXjjahIwr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3215f56187c648a02579a1c40d2af23f25b2c9c2 --- /dev/null +++ b/annotations_1/1xXjjahIwr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.66], [7.0, 9.27], [10.0, 21.88], [22.0, 24.66], [25.0, 26.59], [30.0, 34.69], [37.0, 39.39], [40.0, 41.54], [43.0, 44.85], [46.0, 74.58], [75.0, 76.62], [77.0, 81.82], [83.0, 84.92], [86.0, 87.25], [88.0, 88.84], [89.0, 90.05], [91.0, 95.71], [98.0, 108.03], [109.0, 153.72]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [64.52, 59.33, 30.22, 51.6, 0.0, 65.91, 60.98, 0.0, 0.0, 28.77, 0.0, 39.09, 0.0, 0.0, 0.0, 0.0, 34.62, 35.62, 0.0], "audiomae_on_audioset": [null, null, [["ding", 32.73], ["clang", 32.28], ["thunk", 9.62]], null, null, null, null, null, null, [["explosion", 18.84], ["music", 18.59], ["whack, thwack", 11.23]], null, [["music", 58.78], ["hum", 5.3], ["synthesizer", 4.69]], null, null, null, null, [["mains hum", 31.61], ["hum", 29.9], ["speech", 15.76]], [["theremin", 45.59], ["hum", 24.87], ["mains hum", 13.22]], null], "duration": [2.66, 2.27, 11.88, 2.66, 1.59, 4.69, 2.39, 1.54, 1.85, 28.58, 1.62, 4.82, 1.92, 1.25, 0.84, 1.05, 4.71, 10.03, 44.72]} \ No newline at end of file diff --git a/annotations_1/1xhIWaxWINs_filtered.json b/annotations_1/1xhIWaxWINs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23f30f78f486fded72d6d203a9c341075e84d9ea --- /dev/null +++ b/annotations_1/1xhIWaxWINs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.02], [5.0, 11.85], [14.0, 15.04], [19.0, 21.68], [44.0, 44.14], [44.0, 44.46], [46.0, 46.94], [47.0, 48.25], [51.0, 57.86], [61.0, 63.68], [68.0, 69.63], [84.0, 84.69], [85.0, 86.93], [88.0, 88.6], [104.0, 104.28], [108.0, 112.83], [117.0, 116.67], [117.0, 118.45], [120.0, 121.96], [125.0, 125.93], [127.0, 127.5], [129.0, 129.2], [132.0, 133.02], [134.0, 134.59], [136.0, 142.35], [145.0, 149.37], [171.0, 179.88], [186.0, 187.44], [192.0, 194.68], [195.0, 195.05], [195.0, 195.12], [195.0, 195.15], [195.0, 195.18], [195.0, 195.22]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 60.14, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 41.93, 59.96, 0.0, 0.0, 0.0, 0.0, 0.0, 39.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.06, 29.44, 30.15, 0.0, 28.7, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 30.04], ["speech", 22.91], ["sidetone", 12.8]], null, null, null, null, null, null, [["music", 39.35], ["speech", 17.35], ["hum", 7.68]], null, null, null, null, null, null, null, null, [["boing", 33.63], ["livestock, farm animals, working animals", 22.71], ["cattle, bovinae", 22.26]], [["music", 51.13], ["speech", 19.04], ["boing", 9.15]], [["music", 43.72], ["speech", 25.41], ["boing", 4.9]], null, [["livestock, farm animals, working animals", 28.98], ["artillery fire", 16.19], ["cattle, bovinae", 8.98]], null, null, null, null, null], "duration": [0.02, 6.85, 1.04, 2.68, 0.14, 0.46, 0.94, 1.25, 6.86, 2.68, 1.63, 0.69, 1.93, 0.6, 0.28, 4.83, -0.33, 1.45, 1.96, 0.93, 0.5, 0.2, 1.02, 0.59, 6.35, 4.37, 8.88, 1.44, 2.68, 0.05, 0.12, 0.15, 0.18, 0.22]} \ No newline at end of file diff --git a/annotations_1/1y7cZSWu93k_filtered.json b/annotations_1/1y7cZSWu93k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..037280c29f756c0dfdf2eefe72025e81c2d094c5 --- /dev/null +++ b/annotations_1/1y7cZSWu93k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.84], [25.0, 27.46], [28.0, 29.13], [32.0, 31.95], [35.0, 36.37], [45.0, 46.23], [50.0, 50.75], [53.0, 54.53], [58.0, 59.61], [67.0, 67.73], [68.0, 72.99], [78.0, 79.02], [87.0, 87.44], [90.0, 98.85], [100.0, 102.44], [105.0, 108.68], [111.0, 112.94], [121.0, 127.06], [129.0, 130.69]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false], "silence_prob": [33.02, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.35, 0.0, 0.0, 34.27, 38.51, 56.78, 0.0, 36.95, 0.0], "audiomae_on_audioset": [[["wild animals", 23.63], ["animal", 10.94], ["speech", 10.73]], null, null, null, null, null, null, null, null, null, [["speech", 13.62], ["music", 9.03], ["burping, eructation", 6.62]], null, null, [["insect", 27.74], ["electric shaver, electric razor", 19.33], ["fly, housefly", 17.98]], [["mosquito", 64.65], ["fly, housefly", 9.76], ["frog", 7.2]], null, null, [["cough", 13.99], ["speech", 13.95], ["bird", 7.73]], null], "duration": [3.84, 2.46, 1.13, -0.05, 1.37, 1.23, 0.75, 1.53, 1.61, 0.73, 4.99, 1.02, 0.44, 8.85, 2.44, 3.68, 1.94, 6.06, 1.69]} \ No newline at end of file diff --git a/annotations_1/1zi4R4EklsI_filtered.json b/annotations_1/1zi4R4EklsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..793ab0ac8d180116449ff4ac0e6a848ae59a5966 --- /dev/null +++ b/annotations_1/1zi4R4EklsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.86], [12.0, 15.75], [17.0, 19.58], [21.0, 21.22], [29.0, 30.21], [31.0, 34.72], [35.0, 49.13], [55.0, 54.97], [55.0, 57.16], [58.0, 58.53], [60.0, 60.74], [67.0, 68.15], [70.0, 71.14], [73.0, 80.0], [88.0, 89.78], [90.0, 92.7], [95.0, 102.61], [104.0, 115.06], [118.0, 124.77], [132.0, 132.58], [135.0, 151.41], [152.0, 154.7], [158.0, 173.5], [175.0, 177.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [99.99, 97.22, 99.99, 0.0, 0.0, 100.0, 100.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 54.63, 50.21, 36.71, 31.28, 0.0, 39.01, 96.66, 99.16, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.57], ["scary music", 12.7], ["hum", 7.57]], [["music", 53.53], ["scary music", 14.47], ["hum", 7.74]], null, [["music", 50.59], ["hum", 10.74], ["electric shaver, electric razor", 5.08]], null, null, null], "duration": [2.86, 3.75, 2.58, 0.22, 1.21, 3.72, 14.13, -0.03, 2.16, 0.53, 0.74, 1.15, 1.14, 7.0, 1.78, 2.7, 7.61, 11.06, 6.77, 0.58, 16.41, 2.7, 15.5, 2.09]} \ No newline at end of file diff --git a/annotations_1/2-1_64NeG_E_filtered.json b/annotations_1/2-1_64NeG_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0847175df9489a2654bb46ec85aa71121758933d --- /dev/null +++ b/annotations_1/2-1_64NeG_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.44], [16.0, 55.8], [58.0, 58.99], [62.0, 71.24], [72.0, 89.68], [92.0, 117.8], [118.0, 132.41], [132.0, 132.44], [136.0, 144.76]], "keep_status": [true, false, false, true, true, false, false, false, true], "silence_prob": [40.97, 0.0, 0.0, 46.64, 29.07, 33.14, 30.56, 0.0, 34.52], "audiomae_on_audioset": [[["music", 41.9], ["hum", 8.02], ["throbbing", 5.75]], null, null, [["speech", 15.69], ["whale vocalization", 15.63], ["music", 12.96]], [["whale vocalization", 18.26], ["music", 12.36], ["grunt", 9.43]], [["music", 57.47], ["throbbing", 22.12], ["hum", 6.17]], [["speech", 49.32], ["music", 19.49], ["hum", 4.12]], null, [["speech", 30.89], ["hum", 19.6], ["mains hum", 8.69]]], "duration": [5.44, 39.8, 0.99, 9.24, 17.68, 25.8, 14.41, 0.44, 8.76]} \ No newline at end of file diff --git a/annotations_1/2-L4tBlUJos_filtered.json b/annotations_1/2-L4tBlUJos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8331531b520a72530f58a71b88a18ad0712451d4 --- /dev/null +++ b/annotations_1/2-L4tBlUJos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 25.41], [26.0, 37.0], [39.0, 40.07], [40.0, 42.18], [44.0, 45.99], [52.0, 54.36], [61.0, 61.16], [62.0, 62.33], [62.0, 62.5], [63.0, 64.0], [67.0, 67.12], [69.0, 71.68], [77.0, 77.33], [82.0, 82.51]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [68.02, 76.2, 0.0, 34.93, 0.0, 39.86, 0.0, 0.0, 0.0, 0.0, 0.0, 55.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 43.49], ["music", 6.06], ["cattle, bovinae", 4.1]], null, [["music", 39.93], ["synthesizer", 6.65], ["echo", 4.07]], null, null, null, null, null, null, null, null], "duration": [9.41, 11.0, 1.07, 2.18, 1.99, 2.36, 0.16, 0.33, 0.5, 1.0, 0.12, 2.68, 0.33, 0.51]} \ No newline at end of file diff --git a/annotations_1/208MQEPGWLA_filtered.json b/annotations_1/208MQEPGWLA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6f18a03d2bf1f9afd05237e22f418d1359f60a9 --- /dev/null +++ b/annotations_1/208MQEPGWLA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.95], [12.0, 14.93], [17.0, 22.87], [28.0, 29.3], [31.0, 34.3], [36.0, 40.44], [45.0, 50.63], [51.0, 53.01], [54.0, 59.19], [60.0, 61.3], [69.0, 70.19], [75.0, 78.36], [82.0, 87.52], [91.0, 91.72], [93.0, 94.41], [95.0, 98.12], [103.0, 103.22], [104.0, 118.61], [126.0, 127.14], [136.0, 139.31], [145.0, 146.62], [149.0, 163.41], [164.0, 164.1], [164.0, 165.27], [167.0, 168.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.59, 72.75, 74.76, 0.0, 59.96, 70.3, 83.34, 65.91, 72.46, 0.0, 0.0, 82.97, 86.64, 0.0, 0.0, 64.07, 0.0, 41.09, 0.0, 40.28, 0.0, 43.43, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 66.52], ["hum", 9.41], ["throbbing", 4.58]], null, [["music", 36.01], ["speech", 34.52], ["sheep", 4.64]], null, [["music", 57.05], ["speech", 10.88], ["theremin", 4.49]], null, null, null], "duration": [2.95, 2.93, 5.87, 1.3, 3.3, 4.44, 5.63, 2.01, 5.19, 1.3, 1.19, 3.36, 5.52, 0.72, 1.41, 3.12, 0.22, 14.61, 1.14, 3.31, 1.62, 14.41, 0.1, 1.27, 1.08]} \ No newline at end of file diff --git a/annotations_1/218nJYQ3oMI_filtered.json b/annotations_1/218nJYQ3oMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..becc1d442f379f2fe56a3fe536340f657f059ba4 --- /dev/null +++ b/annotations_1/218nJYQ3oMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.08], [14.0, 14.79], [22.0, 29.24], [40.0, 41.03], [45.0, 48.14], [61.0, 66.65], [71.0, 74.44], [81.0, 81.85], [85.0, 88.3], [89.0, 90.24], [93.0, 94.24], [95.0, 96.36], [101.0, 101.76], [103.0, 105.21], [118.0, 119.96], [121.0, 124.36], [128.0, 128.71]], "keep_status": [true, false, true, false, false, false, true, false, false, false, false, false, false, true, false, true, false], "silence_prob": [33.43, 0.0, 35.38, 0.0, 33.28, 31.27, 32.17, 0.0, 38.04, 0.0, 0.0, 0.0, 0.0, 29.41, 0.0, 31.98, 0.0], "audiomae_on_audioset": [[["moo", 16.75], ["cattle, bovinae", 12.2], ["livestock, farm animals, working animals", 11.33]], null, [["music", 37.55], ["speech", 18.54], ["hum", 6.55]], null, [["music", 66.6], ["throbbing", 15.06], ["hum", 6.65]], [["cattle, bovinae", 40.12], ["moo", 32.57], ["livestock, farm animals, working animals", 25.63]], [["music", 37.95], ["throbbing", 8.9], ["hum", 6.63]], null, [["music", 72.71], ["throbbing", 7.91], ["hum", 2.56]], null, null, null, null, [["music", 26.44], ["didgeridoo", 23.17], ["boing", 8.0]], null, [["music", 36.48], ["mains hum", 15.31], ["throbbing", 12.26]], null], "duration": [3.08, 0.79, 7.24, 1.03, 3.14, 5.65, 3.44, 0.85, 3.3, 1.24, 1.24, 1.36, 0.76, 2.21, 1.96, 3.36, 0.71]} \ No newline at end of file diff --git a/annotations_1/21Vg94SOqk0_filtered.json b/annotations_1/21Vg94SOqk0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71e1003c3987a1f2ad769678e14e11ddda8f063a --- /dev/null +++ b/annotations_1/21Vg94SOqk0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [7.0, 15.45], [18.0, 18.23], [22.0, 48.49], [52.0, 53.01], [54.0, 69.9], [72.0, 73.08], [74.0, 78.07], [89.0, 89.99]], "keep_status": [false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.2, 0.0, 31.15, 0.0, 30.34, 0.0, 30.12, 0.0], "audiomae_on_audioset": [null, [["music", 20.29], ["throbbing", 16.79], ["hum", 11.4]], null, [["music", 68.83], ["didgeridoo", 4.41], ["singing", 4.12]], null, [["music", 56.64], ["didgeridoo", 7.76], ["musical instrument", 6.65]], null, [["music", 55.48], ["didgeridoo", 13.99], ["speech", 5.51]], null], "duration": [0.72, 8.45, 0.23, 26.49, 1.01, 15.9, 1.08, 4.07, 0.99]} \ No newline at end of file diff --git a/annotations_1/21aXGNHDBWQ_filtered.json b/annotations_1/21aXGNHDBWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a49f7786437c3886bd3b6e856a059e5918e870d3 --- /dev/null +++ b/annotations_1/21aXGNHDBWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.61], [19.0, 19.48], [21.0, 23.26], [26.0, 26.42], [27.0, 42.52], [44.0, 45.23], [47.0, 47.19], [50.0, 51.75], [52.0, 53.52], [55.0, 55.46], [58.0, 58.9], [61.0, 65.72], [66.0, 68.28], [68.0, 70.21], [72.0, 72.98], [75.0, 92.16], [93.0, 101.71], [103.0, 109.56], [111.0, 121.98], [123.0, 124.56], [126.0, 128.11]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, true, true, false, true], "silence_prob": [45.98, 0.0, 46.02, 0.0, 83.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.08, 41.01, 34.7, 0.0, 36.28, 32.8, 29.33, 29.65, 0.0, 29.76], "audiomae_on_audioset": [[["whale vocalization", 29.76], ["music", 20.03], ["synthesizer", 4.0]], null, [["speech", 43.62], ["music", 16.98], ["sidetone", 13.26]], null, null, null, null, null, null, null, null, null, [["speech", 29.04], ["music", 23.89], ["ambient music", 10.27]], [["singing bowl", 35.81], ["music", 19.47], ["speech", 13.97]], null, [["singing bowl", 22.08], ["music", 21.71], ["gong", 18.71]], [["hum", 47.76], ["mains hum", 12.59], ["music", 10.39]], [["hum", 15.12], ["music", 8.35], ["grunt", 6.98]], [["speech", 17.51], ["noise", 11.08], ["rumble", 9.01]], null, [["grunt", 17.36], ["effects unit", 6.66], ["hum", 5.58]]], "duration": [3.61, 0.48, 2.26, 0.42, 15.52, 1.23, 0.19, 1.75, 1.52, 0.46, 0.9, 4.72, 2.28, 2.21, 0.98, 17.16, 8.71, 6.56, 10.98, 1.56, 2.11]} \ No newline at end of file diff --git a/annotations_1/21b9Nr4VIcI_filtered.json b/annotations_1/21b9Nr4VIcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79c6785df8ec0a46289d14ea2e05b0716cf45580 --- /dev/null +++ b/annotations_1/21b9Nr4VIcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.33], [5.0, 6.91], [9.0, 22.52], [24.0, 24.49], [25.0, 25.88], [26.0, 26.81], [27.0, 32.36], [34.0, 39.53], [40.0, 39.61], [40.0, 56.54], [58.0, 57.92], [59.0, 59.32], [60.0, 62.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 67.13, 0.0, 0.0, 0.0, 33.1, 99.97, 0.0, 93.45, 0.0, 0.0, 44.99], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 66.15], ["explosion", 10.82], ["burst, pop", 5.8]], null, null, null, null, null, [["mosquito", 33.79], ["music", 21.12], ["fly, housefly", 3.73]]], "duration": [0.33, 1.91, 13.52, 0.49, 0.88, 0.81, 5.36, 5.53, -0.39, 16.54, -0.08, 0.32, 2.07]} \ No newline at end of file diff --git a/annotations_1/22Xiae6LXdU_filtered.json b/annotations_1/22Xiae6LXdU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5de7e955e187672a753efe7cfdf416e830f190a4 --- /dev/null +++ b/annotations_1/22Xiae6LXdU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.69], [14.0, 14.17], [16.0, 16.01], [17.0, 17.47], [19.0, 19.8], [27.0, 27.5], [28.0, 39.33], [49.0, 61.06], [64.0, 63.75], [67.0, 113.43], [114.0, 120.38], [121.0, 121.83], [123.0, 138.23], [140.0, 144.53], [147.0, 147.55], [151.0, 152.63], [160.0, 160.35], [167.0, 166.8]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [38.35, 0.0, 0.0, 0.0, 0.0, 0.0, 31.35, 32.04, 0.0, 0.0, 37.47, 0.0, 31.5, 32.94, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 21.81], ["speech", 10.65], ["throbbing", 6.62]], null, null, null, null, null, [["speech", 44.98], ["music", 33.07], ["outside, rural or natural", 3.33]], [["speech", 48.06], ["music", 9.27], ["throbbing", 5.15]], null, null, [["hum", 32.73], ["throbbing", 24.77], ["music", 24.31]], null, [["music", 54.48], ["boing", 9.26], ["livestock, farm animals, working animals", 4.08]], [["speech", 39.59], ["music", 29.57], ["throbbing", 8.29]], null, null, null, null], "duration": [2.69, 0.17, 0.01, 0.47, 0.8, 0.5, 11.33, 12.06, -0.25, 46.43, 6.38, 0.83, 15.23, 4.53, 0.55, 1.63, 0.35, -0.2]} \ No newline at end of file diff --git a/annotations_1/22xJjwTRC10_filtered.json b/annotations_1/22xJjwTRC10_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09c1b7a8cffc2d6a8e1cb8636fc65c89d6acc0b4 --- /dev/null +++ b/annotations_1/22xJjwTRC10_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 8.28], [11.0, 22.0], [24.0, 25.56], [27.0, 42.33], [46.0, 56.49], [57.0, 57.52], [59.0, 77.5], [78.0, 77.94], [81.0, 104.73], [107.0, 108.95], [112.0, 116.68], [117.0, 118.66], [124.0, 127.5], [131.0, 133.39], [137.0, 141.91]], "keep_status": [false, false, false, false, true, false, false, false, true, false, true, false, false, false, true], "silence_prob": [30.92, 51.71, 0.0, 32.1, 31.82, 0.0, 31.93, 0.0, 31.47, 0.0, 32.07, 0.0, 31.36, 33.61, 39.31], "audiomae_on_audioset": [[["hum", 49.09], ["mains hum", 18.94], ["throbbing", 14.67]], null, null, [["music", 71.68], ["hum", 5.49], ["mains hum", 5.46]], [["music", 33.86], ["speech", 13.55], ["whack, thwack", 7.34]], null, [["speech", 34.86], ["music", 33.12], ["synthesizer", 5.08]], null, [["music", 33.52], ["throbbing", 13.33], ["cattle, bovinae", 10.07]], null, [["throbbing", 33.55], ["speech", 16.35], ["music", 13.26]], null, [["music", 52.94], ["speech", 12.66], ["throbbing", 9.55]], [["music", 67.89], ["theremin", 7.74], ["effects unit", 2.8]], [["whale vocalization", 32.67], ["music", 25.67], ["speech", 9.97]]], "duration": [7.28, 11.0, 1.56, 15.33, 10.49, 0.52, 18.5, -0.06, 23.73, 1.95, 4.68, 1.66, 3.5, 2.39, 4.91]} \ No newline at end of file diff --git a/annotations_1/23uAYGDpS_I_filtered.json b/annotations_1/23uAYGDpS_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d8c1d9bb60b70e37414386d925f533bd492dac1 --- /dev/null +++ b/annotations_1/23uAYGDpS_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [5.0, 5.22], [8.0, 8.31], [11.0, 12.56], [16.0, 16.55], [18.0, 21.22], [25.0, 25.96], [28.0, 29.0], [31.0, 37.13], [38.0, 43.12], [45.0, 45.27], [47.0, 52.3], [54.0, 56.17], [60.0, 63.9], [65.0, 66.07], [67.0, 68.76], [71.0, 72.72], [73.0, 74.38], [75.0, 75.69], [77.0, 77.75], [79.0, 81.26], [84.0, 88.94], [91.0, 91.42], [96.0, 102.79], [105.0, 106.62], [108.0, 114.93], [116.0, 117.21], [120.0, 125.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 92.48, 92.8, 0.0, 92.15, 72.9, 76.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.07, 82.79, 0.0, 92.97, 0.0, 91.98, 0.0, 79.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 0.22, 0.31, 1.56, 0.55, 3.22, 0.96, 1.0, 6.13, 5.12, 0.27, 5.3, 2.17, 3.9, 1.07, 1.76, 1.72, 1.38, 0.69, 0.75, 2.26, 4.94, 0.42, 6.79, 1.62, 6.93, 1.21, 5.44]} \ No newline at end of file diff --git a/annotations_1/24B-_HU7NLs_filtered.json b/annotations_1/24B-_HU7NLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d7dc8305deb70199b982fcdc37dfff8d22ba280 --- /dev/null +++ b/annotations_1/24B-_HU7NLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.0], [5.0, 18.03], [19.0, 19.9], [21.0, 25.81], [27.0, 35.53], [36.0, 38.35], [41.0, 42.92], [46.0, 64.69], [67.0, 67.39], [68.0, 69.21], [69.0, 74.56], [76.0, 79.66], [80.0, 87.03], [88.0, 94.37], [96.0, 96.45], [97.0, 111.06], [112.0, 112.77], [120.0, 120.39]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 47.23, 0.0, 99.05, 98.66, 94.95, 0.0, 53.53, 0.0, 0.0, 44.18, 52.8, 44.96, 45.08, 0.0, 48.48, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 56.47], ["sidetone", 9.38], ["animal", 2.82]], null, null, null, null, null, null, null, null, [["hum", 44.18], ["mains hum", 15.83], ["throbbing", 15.61]], null, [["speech", 48.59], ["drip", 5.89], ["hum", 5.53]], [["hum", 20.92], ["sidetone", 10.06], ["sine wave", 6.79]], null, [["tubular bells", 21.89], ["hum", 10.55], ["clang", 6.0]], null, null], "duration": [1.0, 13.03, 0.9, 4.81, 8.53, 2.35, 1.92, 18.69, 0.39, 1.21, 5.56, 3.66, 7.03, 6.37, 0.45, 14.06, 0.77, 0.39]} \ No newline at end of file diff --git a/annotations_1/24adocMDT_U_filtered.json b/annotations_1/24adocMDT_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5468f03fba330d0351c44ba4342831ffa956b176 --- /dev/null +++ b/annotations_1/24adocMDT_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.96], [8.0, 11.94], [14.0, 13.58], [19.0, 20.97], [22.0, 23.14], [31.0, 31.16], [31.0, 43.87], [47.0, 56.69], [59.0, 59.21], [60.0, 68.37], [76.0, 80.0], [82.0, 81.9], [85.0, 89.13], [90.0, 94.88], [114.0, 118.62], [119.0, 120.11], [121.0, 128.22], [131.0, 131.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 53.53, 0.0, 0.0, 0.0, 0.0, 42.86, 31.9, 0.0, 31.69, 31.81, 0.0, 32.09, 32.0, 31.38, 0.0, 33.88, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 71.35], ["speech", 11.22], ["scratching (performance technique)", 3.59]], [["music", 73.23], ["drum machine", 5.94], ["singing", 4.9]], null, [["music", 70.49], ["sampler", 3.74], ["drum machine", 3.2]], [["music", 70.69], ["hip hop music", 3.33], ["drum machine", 2.33]], null, [["music", 42.43], ["drum machine", 5.11], ["bow-wow", 4.97]], [["music", 73.31], ["synthesizer", 3.18], ["sampler", 2.5]], [["cattle, bovinae", 25.53], ["moo", 25.34], ["music", 11.08]], null, [["speech", 68.33], ["cattle, bovinae", 5.67], ["music", 5.38]], null], "duration": [0.96, 3.94, -0.42, 1.97, 1.14, 0.16, 12.87, 9.69, 0.21, 8.37, 4.0, -0.1, 4.13, 4.88, 4.62, 1.11, 7.22, 0.48]} \ No newline at end of file diff --git a/annotations_1/25_58Uww0bc_filtered.json b/annotations_1/25_58Uww0bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebb57c3b9a87e688f086b68cf5ee8846773f4f25 --- /dev/null +++ b/annotations_1/25_58Uww0bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.65], [1.0, 5.05], [8.0, 10.1], [11.0, 12.7], [14.0, 15.52], [17.0, 19.21], [19.0, 21.91], [23.0, 23.75], [26.0, 28.44], [30.0, 30.94], [32.0, 35.34], [36.0, 37.77], [39.0, 41.84], [43.0, 44.2], [46.0, 47.53], [48.0, 50.13], [53.0, 53.86], [55.0, 55.81], [57.0, 58.4], [60.0, 65.69], [66.0, 67.05], [70.0, 89.45], [98.0, 100.04], [102.0, 103.89], [105.0, 109.21], [111.0, 118.69], [120.0, 132.21], [134.0, 135.5], [139.0, 140.46], [142.0, 143.58], [147.0, 147.28], [150.0, 150.87], [153.0, 153.67], [154.0, 154.01], [156.0, 158.7], [163.0, 164.34], [169.0, 169.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 56.7, 93.13, 0.0, 0.0, 82.61, 73.82, 0.0, 82.07, 0.0, 63.74, 0.0, 56.63, 0.0, 0.0, 57.4, 0.0, 0.0, 0.0, 36.37, 0.0, 35.4, 62.47, 0.0, 38.41, 32.57, 42.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 36.6], ["rumble", 19.99], ["mains hum", 14.45]], null, [["hum", 39.15], ["music", 26.04], ["mains hum", 8.72]], null, null, [["music", 49.53], ["hum", 6.12], ["synthesizer", 5.87]], [["mains hum", 53.66], ["hum", 31.13], ["music", 3.49]], [["music", 24.61], ["didgeridoo", 22.92], ["hum", 15.49]], null, null, null, null, null, null, null, null, null, null], "duration": [-0.35, 4.05, 2.1, 1.7, 1.52, 2.21, 2.91, 0.75, 2.44, 0.94, 3.34, 1.77, 2.84, 1.2, 1.53, 2.13, 0.86, 0.81, 1.4, 5.69, 1.05, 19.45, 2.04, 1.89, 4.21, 7.69, 12.21, 1.5, 1.46, 1.58, 0.28, 0.87, 0.67, 0.01, 2.7, 1.34, 0.89]} \ No newline at end of file diff --git a/annotations_1/271ymG6B7aw_filtered.json b/annotations_1/271ymG6B7aw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84e31b05c874200b92f9e252e8e191714083cdf3 --- /dev/null +++ b/annotations_1/271ymG6B7aw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.07], [3.0, 4.43], [18.0, 18.47], [20.0, 20.41], [28.0, 28.73], [30.0, 31.97], [39.0, 44.04], [52.0, 54.24], [56.0, 56.2], [57.0, 57.45], [63.0, 63.51], [67.0, 67.68], [68.0, 75.03], [81.0, 82.02], [83.0, 82.88], [86.0, 87.45], [90.0, 90.34], [99.0, 99.93], [101.0, 101.93], [103.0, 103.71], [105.0, 112.38], [113.0, 124.44], [125.0, 144.44], [145.0, 156.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.8, 0.0, 0.0, 0.0, 0.0, 59.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 98.19, 100.0, 99.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.07, 1.43, 0.47, 0.41, 0.73, 1.97, 5.04, 2.24, 0.2, 0.45, 0.51, 0.68, 7.03, 1.02, -0.12, 1.45, 0.34, 0.93, 0.93, 0.71, 7.38, 11.44, 19.44, 11.0]} \ No newline at end of file diff --git a/annotations_1/276AIPEK_JA_filtered.json b/annotations_1/276AIPEK_JA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b337acb17068bb6a5a1aee8f25cf39a148a65a72 --- /dev/null +++ b/annotations_1/276AIPEK_JA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.04], [20.0, 21.98], [30.0, 30.45], [31.0, 35.16], [36.0, 36.86], [49.0, 51.65], [69.0, 68.79], [70.0, 70.24], [72.0, 73.03], [85.0, 87.61], [88.0, 93.45], [96.0, 97.24], [99.0, 99.59], [101.0, 106.03], [108.0, 113.71], [115.0, 115.67], [116.0, 116.53], [117.0, 118.12], [120.0, 124.9], [125.0, 125.93], [127.0, 129.14], [136.0, 143.78], [151.0, 152.56], [153.0, 154.99], [156.0, 157.38], [158.0, 162.67], [164.0, 166.28], [168.0, 173.65], [176.0, 179.14], [180.0, 186.29], [186.0, 189.33], [192.0, 193.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 67.76, 0.0, 72.16, 0.0, 0.0, 0.0, 98.44, 62.47, 0.0, 0.0, 90.6, 97.0, 0.0, 0.0, 0.0, 60.32, 0.0, 77.7, 42.0, 0.0, 0.0, 0.0, 66.03, 75.88, 58.22, 51.99, 54.23, 67.63, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 80.64], ["music", 4.32], ["sidetone", 2.89]], null, null, null, null, null, null, null, null, null, null], "duration": [1.04, 1.98, 0.45, 4.16, 0.86, 2.65, -0.21, 0.24, 1.03, 2.61, 5.45, 1.24, 0.59, 5.03, 5.71, 0.67, 0.53, 1.12, 4.9, 0.93, 2.14, 7.78, 1.56, 1.99, 1.38, 4.67, 2.28, 5.65, 3.14, 6.29, 3.33, 1.29]} \ No newline at end of file diff --git a/annotations_1/27ARVhE-a58_filtered.json b/annotations_1/27ARVhE-a58_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41887d7805d34982195de929765b8a6dd96a34ff --- /dev/null +++ b/annotations_1/27ARVhE-a58_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.35], [10.0, 11.3], [16.0, 18.54], [21.0, 32.05], [35.0, 133.52], [135.0, 136.73], [147.0, 147.26], [148.0, 148.95], [151.0, 151.71]], "keep_status": [false, false, false, true, false, false, false, false, false], "silence_prob": [70.86, 0.0, 32.98, 32.85, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 45.6], ["throbbing", 23.14], ["hum", 9.93]], [["throbbing", 20.59], ["music", 17.69], ["speech", 17.63]], null, null, null, null, null], "duration": [3.35, 1.3, 2.54, 11.05, 98.52, 1.73, 0.26, 0.95, 0.71]} \ No newline at end of file diff --git a/annotations_1/27moTiftkCc_filtered.json b/annotations_1/27moTiftkCc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a71ace7053435e81b730f3ec61d80ea5e3bda8d --- /dev/null +++ b/annotations_1/27moTiftkCc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.3], [9.0, 9.14], [10.0, 11.2], [12.0, 13.12], [20.0, 20.9], [27.0, 27.51], [29.0, 29.83], [35.0, 36.49], [41.0, 41.67]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.3, 0.14, 1.2, 1.12, 0.9, 0.51, 0.83, 1.49, 0.67]} \ No newline at end of file diff --git a/annotations_1/282_VCffiTo_filtered.json b/annotations_1/282_VCffiTo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05432106346602c1c512141aad00daafd6108a60 --- /dev/null +++ b/annotations_1/282_VCffiTo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.24], [6.0, 7.65], [11.0, 12.51], [14.0, 16.14], [17.0, 61.23], [62.0, 64.3], [65.0, 71.74], [73.0, 81.33]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 96.89, 0.0, 99.88, 99.87, 99.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.24, 1.65, 1.51, 2.14, 44.23, 2.3, 6.74, 8.33]} \ No newline at end of file diff --git a/annotations_1/29Pg9Oo6P2w_filtered.json b/annotations_1/29Pg9Oo6P2w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7355f9b312988122851139cedfcdd4c4bd84cd5 --- /dev/null +++ b/annotations_1/29Pg9Oo6P2w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [5.0, 5.73], [9.0, 11.2], [16.0, 18.23], [19.0, 29.15], [30.0, 32.75], [36.0, 37.08], [37.0, 37.79], [39.0, 39.87], [41.0, 75.37], [76.0, 76.4], [77.0, 80.72], [83.0, 83.1], [84.0, 85.18], [86.0, 86.53], [87.0, 96.43], [97.0, 105.61], [106.0, 123.57], [126.0, 127.35], [128.0, 128.58], [130.0, 131.35], [132.0, 140.1], [141.0, 141.81], [143.0, 143.14], [146.0, 146.58], [149.0, 149.34], [151.0, 154.68], [156.0, 157.81], [159.0, 160.02], [163.0, 164.29], [167.0, 168.62], [170.0, 170.68], [174.0, 180.59], [181.0, 192.25], [195.0, 196.4], [198.0, 203.77], [208.0, 236.43]], "keep_status": [false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 33.35, 48.1, 41.54, 47.54, 0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 0.0, 0.0, 31.46, 39.17, 42.13, 0.0, 0.0, 0.0, 36.25, 0.0, 0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 51.07, 29.68, 0.0, 29.95, 28.85], "audiomae_on_audioset": [null, null, [["hum", 31.26], ["music", 14.73], ["mains hum", 14.15]], [["music", 57.18], ["scary music", 9.37], ["theremin", 5.56]], [["music", 21.55], ["whale vocalization", 21.03], ["speech", 12.51]], [["music", 28.54], ["hum", 16.22], ["throbbing", 15.25]], null, null, null, null, null, null, null, null, null, [["music", 45.54], ["livestock, farm animals, working animals", 13.64], ["moo", 9.53]], [["music", 63.19], ["theremin", 4.89], ["synthesizer", 4.14]], [["speech", 50.63], ["music", 23.12], ["sonar", 3.95]], null, null, null, [["music", 48.49], ["bleat", 10.96], ["sheep", 8.21]], null, null, null, null, null, null, null, null, null, null, null, [["music", 38.05], ["speech", 26.8], ["eruption", 4.06]], null, [["music", 39.67], ["hum", 22.5], ["throbbing", 14.64]], [["music", 12.16], ["hum", 11.21], ["vehicle", 10.68]]], "duration": [1.3, 0.73, 2.2, 2.23, 10.15, 2.75, 1.08, 0.79, 0.87, 34.37, 0.4, 3.72, 0.1, 1.18, 0.53, 9.43, 8.61, 17.57, 1.35, 0.58, 1.35, 8.1, 0.81, 0.14, 0.58, 0.34, 3.68, 1.81, 1.02, 1.29, 1.62, 0.68, 6.59, 11.25, 1.4, 5.77, 28.43]} \ No newline at end of file diff --git a/annotations_1/29VjYkPPY2s_filtered.json b/annotations_1/29VjYkPPY2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e8196d7de7512619f48e43a2e83ac58ac2d9d4f --- /dev/null +++ b/annotations_1/29VjYkPPY2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.89], [12.0, 14.45], [15.0, 16.68], [18.0, 18.87], [24.0, 25.29], [27.0, 27.3], [35.0, 35.8], [36.0, 37.03], [42.0, 43.63], [45.0, 50.67], [57.0, 65.72], [72.0, 72.33], [77.0, 78.0], [80.0, 80.2], [84.0, 84.92], [87.0, 88.94], [90.0, 91.35], [94.0, 95.25], [98.0, 98.81], [102.0, 103.84], [106.0, 108.24], [110.0, 112.04], [115.0, 115.97], [118.0, 119.7], [124.0, 124.95]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 47.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.26, 33.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.74, 49.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 52.01], ["sine wave", 19.2], ["chirp tone", 8.87]], null, null, null, null, null, null, null, [["speech", 47.67], ["mains hum", 10.77], ["hum", 10.76]], [["speech", 40.99], ["music", 8.04], ["whack, thwack", 6.06]], null, null, null, null, null, null, null, null, null, [["music", 24.5], ["speech", 17.11], ["hum", 13.93]], [["speech", 31.69], ["music", 22.34], ["hum", 9.15]], null, null, null], "duration": [0.89, 2.45, 1.68, 0.87, 1.29, 0.3, 0.8, 1.03, 1.63, 5.67, 8.72, 0.33, 1.0, 0.2, 0.92, 1.94, 1.35, 1.25, 0.81, 1.84, 2.24, 2.04, 0.97, 1.7, 0.95]} \ No newline at end of file diff --git a/annotations_1/29YDqiuyaOU_filtered.json b/annotations_1/29YDqiuyaOU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..604f9b2428c52f72de6aeb64b6c238404912e76b --- /dev/null +++ b/annotations_1/29YDqiuyaOU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 32.66], [34.0, 51.46], [53.0, 75.15]], "keep_status": [false, true, false], "silence_prob": [31.62, 33.79, 32.37], "audiomae_on_audioset": [[["hum", 67.77], ["throbbing", 14.57], ["mains hum", 5.76]], [["fire", 24.12], ["music", 21.53], ["hum", 5.51]], [["music", 45.23], ["hum", 19.54], ["throbbing", 14.13]]], "duration": [13.66, 17.46, 22.15]} \ No newline at end of file diff --git a/annotations_1/2ADaXnuG-YM_filtered.json b/annotations_1/2ADaXnuG-YM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7e5a0709019d4cfdb026b0935d5337c16b81dcd --- /dev/null +++ b/annotations_1/2ADaXnuG-YM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.15], [14.0, 15.84], [30.0, 30.13], [31.0, 31.94], [35.0, 35.53], [40.0, 40.12], [53.0, 52.93], [88.0, 88.13], [90.0, 91.18], [93.0, 93.72], [95.0, 95.17], [95.0, 99.49], [110.0, 110.15], [111.0, 113.59], [116.0, 118.18], [120.0, 130.5], [144.0, 144.91], [149.0, 149.15], [157.0, 157.42], [158.0, 158.79], [160.0, 160.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.78, 0.0, 32.13, 32.49, 36.88, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["car alarm", 57.0], ["emergency vehicle", 14.48], ["siren", 11.15]], null, [["percussion", 29.16], ["moo", 15.1], ["cattle, bovinae", 13.33]], [["music", 31.98], ["speech", 14.3], ["animal", 5.75]], [["music", 66.45], ["speech", 8.45], ["brass instrument", 4.31]], null, null, null, null, null], "duration": [0.15, 1.84, 0.13, 0.94, 0.53, 0.12, -0.07, 0.13, 1.18, 0.72, 0.17, 4.49, 0.15, 2.59, 2.18, 10.5, 0.91, 0.15, 0.42, 0.79, 0.89]} \ No newline at end of file diff --git a/annotations_1/2AmY_TaUh8M_filtered.json b/annotations_1/2AmY_TaUh8M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1a5fb1b86190e55caf426632dcc394c51fb0697 --- /dev/null +++ b/annotations_1/2AmY_TaUh8M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.02], [10.0, 11.25], [13.0, 14.13], [15.0, 15.57], [16.0, 17.32], [21.0, 23.14], [24.0, 26.03], [26.0, 26.97], [28.0, 29.44], [30.0, 30.7], [32.0, 32.36], [34.0, 35.23], [36.0, 36.12], [36.0, 37.25], [38.0, 39.51], [41.0, 41.42], [42.0, 43.51], [44.0, 45.74], [49.0, 86.36], [87.0, 87.69], [89.0, 96.15], [99.0, 133.83], [140.0, 149.17], [152.0, 154.94], [157.0, 165.13], [167.0, 170.55], [171.0, 172.05], [174.0, 174.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 90.08, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.28, 0.0, 59.96, 39.77, 93.76, 48.19, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 58.87], ["didgeridoo", 11.6], ["musical instrument", 4.63]], null, null, [["speech", 25.27], ["fly, housefly", 12.03], ["mosquito", 7.66]], null, [["music", 55.49], ["fart", 9.88], ["speech", 9.85]], null, null], "duration": [0.02, 1.25, 1.13, 0.57, 1.32, 2.14, 2.03, 0.97, 1.44, 0.7, 0.36, 1.23, 0.12, 1.25, 1.51, 0.42, 1.51, 1.74, 37.36, 0.69, 7.15, 34.83, 9.17, 2.94, 8.13, 3.55, 1.05, 0.85]} \ No newline at end of file diff --git a/annotations_1/2AoKTalyiUA_filtered.json b/annotations_1/2AoKTalyiUA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2748e76217de254c59ec05de1e3a627dc0b9f4a3 --- /dev/null +++ b/annotations_1/2AoKTalyiUA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 25.49], [26.0, 26.6], [28.0, 30.81], [31.0, 32.54], [34.0, 36.56], [37.0, 43.92], [45.0, 46.72], [49.0, 50.18], [54.0, 54.14], [55.0, 55.51], [62.0, 61.99], [64.0, 65.2], [66.0, 67.29], [70.0, 71.31], [73.0, 73.65], [75.0, 76.05], [77.0, 77.75], [83.0, 84.06], [87.0, 88.47], [90.0, 90.61], [96.0, 97.23], [107.0, 110.2], [112.0, 112.29], [113.0, 118.61], [125.0, 126.66], [128.0, 128.02], [129.0, 137.44], [138.0, 139.02], [140.0, 147.99], [149.0, 153.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [75.88, 0.0, 99.8, 0.0, 93.91, 99.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.71, 0.0, 0.0, 99.97, 0.0, 85.17, 51.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [15.49, 0.6, 2.81, 1.54, 2.56, 6.92, 1.72, 1.18, 0.14, 0.51, -0.01, 1.2, 1.29, 1.31, 0.65, 1.05, 0.75, 1.06, 1.47, 0.61, 1.23, 3.2, 0.29, 5.61, 1.66, 0.02, 8.44, 1.02, 7.99, 4.1]} \ No newline at end of file diff --git a/annotations_1/2BaBf4EEO10_filtered.json b/annotations_1/2BaBf4EEO10_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2a93ff00b5d066fd19fd0799c428b73f3c0f5fd --- /dev/null +++ b/annotations_1/2BaBf4EEO10_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.45], [5.0, 5.46], [7.0, 8.04], [10.0, 10.99], [12.0, 13.17]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [1.45, 0.46, 1.04, 0.99, 1.17]} \ No newline at end of file diff --git a/annotations_1/2BofOahaB0w_filtered.json b/annotations_1/2BofOahaB0w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93d8cabee0b47ff328435f1b6d5fddbd679d8131 --- /dev/null +++ b/annotations_1/2BofOahaB0w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.27], [25.0, 25.47], [28.0, 28.61], [30.0, 31.24], [34.0, 34.82], [38.0, 38.74], [41.0, 42.36], [44.0, 44.76], [45.0, 45.03], [45.0, 45.06], [45.0, 50.77], [51.0, 51.14], [55.0, 56.52], [60.0, 81.28], [82.0, 83.05], [84.0, 87.24], [93.0, 94.24], [96.0, 95.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.92, 0.0, 0.0, 99.78, 0.0, 78.55, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.27, 0.47, 0.61, 1.24, 0.82, 0.74, 1.36, 0.76, 0.03, 0.06, 5.77, 0.14, 1.52, 21.28, 1.05, 3.24, 1.24, -0.04]} \ No newline at end of file diff --git a/annotations_1/2C8fB8p6crY_filtered.json b/annotations_1/2C8fB8p6crY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60bd5847665e05a5fd1f19eec03f99fd9d95edb0 --- /dev/null +++ b/annotations_1/2C8fB8p6crY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.59], [24.0, 24.14], [25.0, 45.55], [47.0, 50.04], [51.0, 52.78], [54.0, 57.65], [58.0, 58.89], [59.0, 60.54], [61.0, 62.9], [64.0, 65.28], [67.0, 71.22], [72.0, 73.23], [75.0, 75.19], [76.0, 77.3], [80.0, 81.06], [88.0, 89.18], [92.0, 94.27], [95.0, 96.15], [96.0, 117.27], [118.0, 126.55], [128.0, 128.71], [131.0, 186.76], [189.0, 191.57], [193.0, 194.12], [195.0, 196.53], [198.0, 198.83]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 35.26, 76.86, 0.0, 99.36, 0.0, 0.0, 0.0, 0.0, 56.1, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 57.72, 51.07, 0.0, 0.0, 45.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["whale vocalization", 31.85], ["grunt", 21.16], ["music", 9.84]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["burping, eructation", 35.38], ["fart", 22.09], ["cough", 5.3]], null, null, null], "duration": [1.59, 0.14, 20.55, 3.04, 1.78, 3.65, 0.89, 1.54, 1.9, 1.28, 4.22, 1.23, 0.19, 1.3, 1.06, 1.18, 2.27, 1.15, 21.27, 8.55, 0.71, 55.76, 2.57, 1.12, 1.53, 0.83]} \ No newline at end of file diff --git a/annotations_1/2DCjXk4qpLo_filtered.json b/annotations_1/2DCjXk4qpLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf36111ae362fcbddb2fd451a0b76f11bb2bedd1 --- /dev/null +++ b/annotations_1/2DCjXk4qpLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.17], [3.0, 3.2], [4.0, 4.16], [10.0, 11.21], [13.0, 13.12], [15.0, 14.89], [15.0, 14.93], [16.0, 16.87], [19.0, 19.45], [21.0, 21.57], [29.0, 30.55], [31.0, 33.02], [36.0, 36.14], [40.0, 40.53], [41.0, 42.04], [44.0, 45.0], [50.0, 53.47], [58.0, 57.7], [58.0, 59.16], [60.0, 60.47], [67.0, 67.58], [69.0, 70.11], [75.0, 75.63], [93.0, 92.94], [96.0, 97.38], [100.0, 100.36], [105.0, 105.22], [107.0, 107.38], [110.0, 109.81], [111.0, 111.33], [113.0, 112.82], [113.0, 113.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.17, 0.2, 0.16, 1.21, 0.12, -0.11, -0.07, 0.87, 0.45, 0.57, 1.55, 2.02, 0.14, 0.53, 1.04, 1.0, 3.47, -0.3, 1.16, 0.47, 0.58, 1.11, 0.63, -0.06, 1.38, 0.36, 0.22, 0.38, -0.19, 0.33, -0.18, 0.91]} \ No newline at end of file diff --git a/annotations_1/2DgFlZwrD-Q_filtered.json b/annotations_1/2DgFlZwrD-Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85a63c88b2486fa32e3e8593a6a9756fe1865021 --- /dev/null +++ b/annotations_1/2DgFlZwrD-Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.82], [18.0, 18.49], [20.0, 21.14], [21.0, 22.81], [25.0, 27.8], [30.0, 31.4], [32.0, 34.05], [35.0, 36.44], [37.0, 38.1], [40.0, 41.18], [44.0, 44.22], [46.0, 46.97], [49.0, 49.77], [53.0, 54.14], [56.0, 57.13], [58.0, 58.63], [60.0, 61.35], [66.0, 66.31], [69.0, 70.63], [72.0, 72.82], [76.0, 77.6], [78.0, 85.94]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.27, 0.0, 0.0, 0.0, 99.48, 0.0, 65.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.67], "audiomae_on_audioset": [[["hum", 20.55], ["music", 14.15], ["singing bowl", 12.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.82, 0.49, 1.14, 1.81, 2.8, 1.4, 2.05, 1.44, 1.1, 1.18, 0.22, 0.97, 0.77, 1.14, 1.13, 0.63, 1.35, 0.31, 1.63, 0.82, 1.6, 7.94]} \ No newline at end of file diff --git a/annotations_1/2DpotjffI6U_filtered.json b/annotations_1/2DpotjffI6U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6aa3de3c6484aca918b25f876acd3cd7b8a24d82 --- /dev/null +++ b/annotations_1/2DpotjffI6U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[101.0, 103.5]], "keep_status": [true], "silence_prob": [28.97], "audiomae_on_audioset": [[["noise", 30.24], ["music", 24.98], ["reverberation", 4.67]]], "duration": [2.5]} \ No newline at end of file diff --git a/annotations_1/2EQCpQbUrzI_filtered.json b/annotations_1/2EQCpQbUrzI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ae7880f20ce7328ce0a0bbb0288ce3828cff815 --- /dev/null +++ b/annotations_1/2EQCpQbUrzI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.61], [11.0, 14.01], [15.0, 17.29], [19.0, 20.44], [21.0, 22.98], [23.0, 29.61], [36.0, 38.28], [41.0, 43.36], [46.0, 46.2], [47.0, 47.55], [48.0, 49.25], [50.0, 63.69], [66.0, 66.63], [68.0, 69.3], [72.0, 74.87], [77.0, 93.53], [101.0, 110.0], [115.0, 121.2], [127.0, 132.56], [134.0, 139.7], [142.0, 142.72], [146.0, 146.64], [148.0, 173.82], [175.0, 181.9], [187.0, 188.25], [190.0, 197.55]], "keep_status": [true, true, true, false, false, true, true, true, false, false, false, false, false, false, true, true, false, false, true, true, false, false, true, false, false, false], "silence_prob": [45.88, 40.7, 43.25, 0.0, 0.0, 37.98, 34.27, 33.04, 0.0, 0.0, 0.0, 32.89, 0.0, 0.0, 32.86, 28.81, 29.02, 29.75, 28.7, 28.41, 0.0, 0.0, 28.27, 28.44, 0.0, 30.75], "audiomae_on_audioset": [[["speech", 24.4], ["music", 7.11], ["mains hum", 4.22]], [["music", 14.56], ["didgeridoo", 10.62], ["speech", 10.26]], [["frog", 20.6], ["croak", 13.42], ["music", 8.7]], null, null, [["music", 39.49], ["tubular bells", 9.8], ["piano", 9.23]], [["music", 29.97], ["musical instrument", 16.23], ["keyboard (musical)", 14.44]], [["music", 48.79], ["musical instrument", 10.2], ["synthesizer", 6.43]], null, null, null, [["music", 33.11], ["speech", 26.18], ["piano", 11.58]], null, null, [["music", 38.05], ["keyboard (musical)", 10.72], ["piano", 8.02]], [["music", 11.28], ["effects unit", 10.98], ["distortion", 8.59]], [["cattle, bovinae", 43.76], ["moo", 27.85], ["livestock, farm animals, working animals", 24.42]], [["music", 44.74], ["didgeridoo", 23.45], ["musical instrument", 5.16]], [["music", 40.05], ["livestock, farm animals, working animals", 7.86], ["cattle, bovinae", 6.93]], [["music", 42.2], ["chant", 16.4], ["musical instrument", 5.24]], null, null, [["music", 53.32], ["chant", 12.35], ["vocal music", 3.96]], [["music", 53.21], ["hum", 14.62], ["mains hum", 14.11]], null, [["music", 56.69], ["throbbing", 10.7], ["hum", 5.85]]], "duration": [3.61, 3.01, 2.29, 1.44, 1.98, 6.61, 2.28, 2.36, 0.2, 0.55, 1.25, 13.69, 0.63, 1.3, 2.87, 16.53, 9.0, 6.2, 5.56, 5.7, 0.72, 0.64, 25.82, 6.9, 1.25, 7.55]} \ No newline at end of file diff --git a/annotations_1/2EojVDDg3xM_filtered.json b/annotations_1/2EojVDDg3xM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..284393cf53b7206c55048e939e661df69146ca46 --- /dev/null +++ b/annotations_1/2EojVDDg3xM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.61], [9.0, 9.34], [13.0, 15.43], [17.0, 43.7], [44.0, 48.51], [50.0, 65.45], [67.0, 94.73], [96.0, 97.01], [97.0, 102.34], [103.0, 105.81], [108.0, 119.2], [121.0, 125.12], [126.0, 128.07], [129.0, 131.55], [133.0, 134.33], [136.0, 138.28], [139.0, 142.32], [143.0, 144.88], [146.0, 147.39], [148.0, 152.93], [154.0, 159.56]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [51.82, 0.0, 50.36, 40.54, 38.19, 33.35, 41.1, 0.0, 81.17, 84.62, 86.27, 80.64, 85.9, 85.9, 0.0, 88.1, 77.7, 0.0, 0.0, 98.66, 98.1], "audiomae_on_audioset": [null, null, null, [["hum", 50.33], ["mains hum", 33.5], ["music", 7.83]], [["sine wave", 76.46], ["chirp tone", 9.01], ["foghorn", 4.58]], [["music", 36.42], ["wind instrument, woodwind instrument", 15.23], ["harmonic", 8.48]], [["sine wave", 57.91], ["chirp tone", 16.21], ["wind instrument, woodwind instrument", 4.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.61, 0.34, 2.43, 26.7, 4.51, 15.45, 27.73, 1.01, 5.34, 2.81, 11.2, 4.12, 2.07, 2.55, 1.33, 2.28, 3.32, 1.88, 1.39, 4.93, 5.56]} \ No newline at end of file diff --git a/annotations_1/2F4ExP0q6RU_filtered.json b/annotations_1/2F4ExP0q6RU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/2F4ExP0q6RU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/2FlG1Z6jY-0_filtered.json b/annotations_1/2FlG1Z6jY-0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffa33bb159c2e4fc187445543b8df70b0fff94a1 --- /dev/null +++ b/annotations_1/2FlG1Z6jY-0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 10.79], [11.0, 13.9], [15.0, 15.48], [16.0, 17.2], [19.0, 19.09], [23.0, 23.65], [34.0, 36.02], [40.0, 40.9], [55.0, 56.1], [58.0, 75.86], [77.0, 86.61], [89.0, 90.32], [92.0, 93.11], [94.0, 97.38], [99.0, 101.93], [104.0, 104.45], [106.0, 128.76], [131.0, 133.2], [134.0, 135.68], [136.0, 137.24], [155.0, 156.57], [157.0, 157.77], [160.0, 163.83], [165.0, 166.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.76, 66.76, 0.0, 0.0, 0.0, 0.0, 52.62, 0.0, 0.0, 90.6, 96.04, 0.0, 0.0, 31.84, 34.25, 0.0, 34.08, 96.42, 0.0, 0.0, 0.0, 0.0, 60.6, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.27], ["singing bowl", 14.65], ["hum", 10.26]], [["music", 66.02], ["musical instrument", 10.27], ["theremin", 1.97]], null, [["music", 71.18], ["hum", 3.71], ["electronic music", 2.92]], null, null, null, null, null, null, null], "duration": [9.79, 2.9, 0.48, 1.2, 0.09, 0.65, 2.02, 0.9, 1.1, 17.86, 9.61, 1.32, 1.11, 3.38, 2.93, 0.45, 22.76, 2.2, 1.68, 1.24, 1.57, 0.77, 3.83, 1.68]} \ No newline at end of file diff --git a/annotations_1/2G5KN2wt048_filtered.json b/annotations_1/2G5KN2wt048_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a7a255b05d198f95bcab86e95f9274246098608 --- /dev/null +++ b/annotations_1/2G5KN2wt048_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.83], [5.0, 10.0], [13.0, 13.17], [14.0, 23.01], [34.0, 43.28], [45.0, 50.25], [52.0, 53.92], [55.0, 55.97], [58.0, 64.27], [64.0, 75.71], [78.0, 86.22], [87.0, 88.69], [89.0, 91.18], [92.0, 92.64], [95.0, 95.67], [98.0, 119.25], [120.0, 121.26], [123.0, 129.17], [130.0, 132.8], [134.0, 134.5], [136.0, 136.61], [138.0, 145.91], [146.0, 146.52], [149.0, 149.3], [151.0, 154.47]], "keep_status": [false, false, false, true, true, false, false, false, false, true, true, false, false, false, false, true, false, true, true, false, false, true, false, false, true], "silence_prob": [0.0, 38.71, 0.0, 32.41, 34.39, 32.3, 0.0, 0.0, 34.33, 30.07, 32.9, 0.0, 39.47, 0.0, 0.0, 33.02, 0.0, 32.21, 31.7, 0.0, 0.0, 31.33, 0.0, 0.0, 41.48], "audiomae_on_audioset": [null, [["hum", 32.76], ["mains hum", 25.22], ["speech", 14.4]], null, [["music", 25.74], ["moo", 19.38], ["cattle, bovinae", 14.3]], [["cattle, bovinae", 24.93], ["music", 24.62], ["moo", 19.42]], [["music", 44.17], ["speech", 29.52], ["boing", 5.35]], null, null, [["music", 50.17], ["speech", 18.15], ["hum", 7.48]], [["noise", 22.01], ["mains hum", 18.54], ["hum", 16.86]], [["explosion", 25.7], ["speech", 19.45], ["hum", 8.02]], null, [["speech", 66.77], ["clip-clop", 2.94], ["music", 2.05]], null, null, [["music", 40.24], ["throbbing", 10.1], ["speech", 8.09]], null, [["music", 22.74], ["speech", 18.84], ["throbbing", 16.67]], [["hum", 22.79], ["mains hum", 15.22], ["throbbing", 6.83]], null, null, [["speech", 33.04], ["music", 17.24], ["foghorn", 7.87]], null, null, [["sine wave", 36.56], ["chirp tone", 8.81], ["hum", 8.81]]], "duration": [1.83, 5.0, 0.17, 9.01, 9.28, 5.25, 1.92, 0.97, 6.27, 11.71, 8.22, 1.69, 2.18, 0.64, 0.67, 21.25, 1.26, 6.17, 2.8, 0.5, 0.61, 7.91, 0.52, 0.3, 3.47]} \ No newline at end of file diff --git a/annotations_1/2GFzqqC8iUg_filtered.json b/annotations_1/2GFzqqC8iUg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6321cfbb2d583cf4adfb5fe64da624f02011b50a --- /dev/null +++ b/annotations_1/2GFzqqC8iUg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.67], [7.0, 7.82], [12.0, 13.12], [16.0, 16.58], [18.0, 18.93], [20.0, 20.02], [23.0, 27.18], [27.0, 28.22], [32.0, 32.44], [37.0, 39.24], [47.0, 48.93], [52.0, 52.41], [59.0, 59.39], [64.0, 64.83], [66.0, 66.92], [74.0, 74.61], [82.0, 89.29], [90.0, 92.45], [93.0, 93.88], [96.0, 96.72], [97.0, 98.39], [99.0, 99.79], [101.0, 101.53], [103.0, 103.06], [104.0, 104.35], [106.0, 106.27], [108.0, 108.31], [110.0, 110.32], [112.0, 112.53], [118.0, 118.15], [119.0, 118.99], [119.0, 120.01], [120.0, 121.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.68, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.78, 56.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 45.67], ["didgeridoo", 21.37], ["musical instrument", 5.8]], null, null, null, null, null, null, null, null, null, [["music", 51.07], ["musical instrument", 7.78], ["trombone", 6.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 0.82, 1.12, 0.58, 0.93, 0.02, 4.18, 1.22, 0.44, 2.24, 1.93, 0.41, 0.39, 0.83, 0.92, 0.61, 7.29, 2.45, 0.88, 0.72, 1.39, 0.79, 0.53, 0.06, 0.35, 0.27, 0.31, 0.32, 0.53, 0.15, -0.01, 1.01, 1.14]} \ No newline at end of file diff --git a/annotations_1/2GM0LKQ-ml0_filtered.json b/annotations_1/2GM0LKQ-ml0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0f4f501b7916681b56d78ccd694528fa7f3c5d5 --- /dev/null +++ b/annotations_1/2GM0LKQ-ml0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [3.0, 5.46], [6.0, 6.98], [8.0, 9.68], [14.0, 14.64], [17.0, 22.38], [32.0, 34.26], [35.0, 35.5], [36.0, 37.99], [39.0, 39.77], [40.0, 50.95], [52.0, 53.74], [55.0, 57.54], [58.0, 64.69], [66.0, 67.46], [69.0, 73.18], [75.0, 74.98], [76.0, 82.11], [84.0, 86.83], [87.0, 87.91], [89.0, 89.46], [91.0, 113.9], [115.0, 115.43], [118.0, 131.73], [132.0, 137.56], [138.0, 151.73], [152.0, 153.3], [155.0, 155.28], [158.0, 158.31], [162.0, 167.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 99.48, 0.0, 0.0, 0.0, 36.27, 98.86, 0.0, 0.0, 0.0, 94.95, 0.0, 99.05, 89.9, 0.0, 99.05, 0.0, 92.48, 97.83, 0.0, 0.0, 36.55, 0.0, 40.75, 82.79, 37.91, 0.0, 0.0, 0.0, 61.57], "audiomae_on_audioset": [null, null, null, null, null, [["explosion", 66.85], ["burst, pop", 13.96], ["artillery fire", 3.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.51], ["music", 12.88], ["radio", 4.27]], null, [["explosion", 21.78], ["hum", 12.47], ["noise", 10.38]], null, [["speech", 30.37], ["explosion", 5.72], ["breaking", 5.59]], null, null, null, null], "duration": [0.64, 2.46, 0.98, 1.68, 0.64, 5.38, 2.26, 0.5, 1.99, 0.77, 10.95, 1.74, 2.54, 6.69, 1.46, 4.18, -0.02, 6.11, 2.83, 0.91, 0.46, 22.9, 0.43, 13.73, 5.56, 13.73, 1.3, 0.28, 0.31, 5.39]} \ No newline at end of file diff --git a/annotations_1/2GvL0jFY7u8_filtered.json b/annotations_1/2GvL0jFY7u8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8695cd7e15df242b7e9a67d1f8957d801f85c141 --- /dev/null +++ b/annotations_1/2GvL0jFY7u8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 54.06], [57.0, 57.28], [59.0, 97.11], [99.0, 101.6], [102.0, 103.08]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 29.2, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 51.39], ["guitar", 5.72], ["musical instrument", 4.2]], null], "duration": [1.06, 0.28, 38.11, 2.6, 1.08]} \ No newline at end of file diff --git a/annotations_1/2GvyC7s3RpU_filtered.json b/annotations_1/2GvyC7s3RpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df8616e2ed2d7b9635de05513c2dd10d2e554bab --- /dev/null +++ b/annotations_1/2GvyC7s3RpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [5.0, 5.71], [7.0, 9.61], [10.0, 13.44], [15.0, 16.7], [17.0, 18.87], [20.0, 48.36], [50.0, 56.0], [57.0, 76.5], [77.0, 80.62], [83.0, 84.08], [88.0, 89.01], [94.0, 94.81], [97.0, 97.56], [103.0, 110.96], [119.0, 137.29], [141.0, 144.61], [147.0, 147.83], [156.0, 167.98], [170.0, 170.67]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false, false, true, true, true, false, false, false], "silence_prob": [0.0, 0.0, 29.91, 29.44, 0.0, 0.0, 28.4, 29.11, 28.66, 28.25, 0.0, 0.0, 0.0, 0.0, 29.91, 28.29, 28.78, 0.0, 29.47, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 36.1], ["hum", 22.41], ["rumble", 7.97]], [["music", 44.97], ["hum", 15.54], ["throbbing", 10.52]], null, null, [["hum", 29.34], ["throbbing", 27.05], ["music", 19.05]], [["speech", 33.16], ["hum", 15.89], ["music", 15.22]], [["hum", 45.59], ["throbbing", 21.3], ["music", 13.22]], [["music", 66.99], ["theremin", 12.19], ["mains hum", 2.74]], null, null, null, null, [["music", 38.86], ["hum", 14.26], ["sonar", 9.7]], [["music", 23.85], ["crushing", 22.52], ["breaking", 10.48]], [["music", 22.92], ["hum", 11.34], ["mains hum", 8.78]], null, [["music", 37.71], ["throbbing", 21.72], ["hum", 16.3]], null], "duration": [1.57, 0.71, 2.61, 3.44, 1.7, 1.87, 28.36, 6.0, 19.5, 3.62, 1.08, 1.01, 0.81, 0.56, 7.96, 18.29, 3.61, 0.83, 11.98, 0.67]} \ No newline at end of file diff --git a/annotations_1/2HMLj2siVxY_filtered.json b/annotations_1/2HMLj2siVxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8adf9ae4af51e5b82c777eb5fdfe38511640555 --- /dev/null +++ b/annotations_1/2HMLj2siVxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 46.33], [50.0, 98.49]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.33, 48.49]} \ No newline at end of file diff --git a/annotations_1/2HuQzKat6hU_filtered.json b/annotations_1/2HuQzKat6hU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9de763f9c111c478fb6d1bf6bcb12443bd8ab757 --- /dev/null +++ b/annotations_1/2HuQzKat6hU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 35.92], [38.0, 37.93], [39.0, 39.72], [41.0, 42.16], [43.0, 44.02], [47.0, 47.14], [48.0, 48.63], [49.0, 49.96], [51.0, 52.93], [54.0, 58.04], [59.0, 59.88], [61.0, 61.7], [63.0, 66.83], [70.0, 70.19], [71.0, 71.07], [75.0, 75.03], [76.0, 76.96], [82.0, 82.93], [84.0, 84.57], [88.0, 88.43], [90.0, 91.12], [92.0, 92.87], [93.0, 97.04], [99.0, 100.48], [103.0, 104.21], [105.0, 106.44], [108.0, 107.99], [110.0, 110.61], [111.0, 111.79], [113.0, 115.5], [116.0, 117.12], [118.0, 119.04], [121.0, 121.76], [125.0, 125.47], [127.0, 127.36], [129.0, 129.63], [131.0, 131.33], [132.0, 135.09], [138.0, 143.02], [145.0, 145.27], [146.0, 146.53], [147.0, 147.31], [150.0, 150.48], [166.0, 184.5], [186.0, 187.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 94.22, 0.0, 0.0, 0.0, 0.0, 38.09, 0.0], "audiomae_on_audioset": [[["music", 63.85], ["theremin", 28.36], ["soundtrack music", 1.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 81.15], ["fart", 5.17], ["thunk", 1.15]], null], "duration": [12.92, -0.07, 0.72, 1.16, 1.02, 0.14, 0.63, 0.96, 1.93, 4.04, 0.88, 0.7, 3.83, 0.19, 0.07, 0.03, 0.96, 0.93, 0.57, 0.43, 1.12, 0.87, 4.04, 1.48, 1.21, 1.44, -0.01, 0.61, 0.79, 2.5, 1.12, 1.04, 0.76, 0.47, 0.36, 0.63, 0.33, 3.09, 5.02, 0.27, 0.53, 0.31, 0.48, 18.5, 1.22]} \ No newline at end of file diff --git a/annotations_1/2HwVVwlGHU0_filtered.json b/annotations_1/2HwVVwlGHU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3446be4a6818813381c338beafe3e27236a86af5 --- /dev/null +++ b/annotations_1/2HwVVwlGHU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.69], [21.0, 23.43], [28.0, 28.71], [32.0, 32.44], [35.0, 41.3], [42.0, 44.46], [45.0, 46.16], [48.0, 53.28], [54.0, 55.31], [59.0, 62.82], [73.0, 73.87], [81.0, 80.81], [83.0, 84.55], [85.0, 86.43], [90.0, 90.53], [94.0, 97.21], [98.0, 99.45], [101.0, 102.24], [105.0, 105.19], [112.0, 112.19], [113.0, 113.54], [127.0, 127.21], [129.0, 129.51], [130.0, 130.13], [134.0, 134.23], [134.0, 135.63], [140.0, 142.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.93, 0.0, 0.0, 97.92, 87.37, 0.0, 99.99, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 2.43, 0.71, 0.44, 6.3, 2.46, 1.16, 5.28, 1.31, 3.82, 0.87, -0.19, 1.55, 1.43, 0.53, 3.21, 1.45, 1.24, 0.19, 0.19, 0.54, 0.21, 0.51, 0.13, 0.23, 1.63, 2.91]} \ No newline at end of file diff --git a/annotations_1/2IIA6TYZynQ_filtered.json b/annotations_1/2IIA6TYZynQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0302e21a3d7a0d81f213fa127cf5e901a232f27 --- /dev/null +++ b/annotations_1/2IIA6TYZynQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 46.92], [51.0, 60.13], [64.0, 95.25], [98.0, 99.12], [102.0, 102.76], [103.0, 103.0], [103.0, 114.72], [115.0, 115.65], [116.0, 122.67], [124.0, 139.7], [141.0, 149.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.24, 50.61, 0.0, 0.0, 0.0, 0.0, 42.39, 0.0, 38.37, 31.0, 29.63], "audiomae_on_audioset": [[["theremin", 36.62], ["music", 30.06], ["didgeridoo", 4.44]], null, null, null, null, null, [["music", 44.78], ["theremin", 22.66], ["wind instrument, woodwind instrument", 6.44]], null, [["music", 58.14], ["clarinet", 12.4], ["musical instrument", 7.33]], [["music", 63.46], ["theremin", 19.85], ["clarinet", 4.09]], [["music", 88.42], ["musical instrument", 4.61], ["bowed string instrument", 0.71]]], "duration": [11.92, 9.13, 31.25, 1.12, 0.76, 0.0, 11.72, 0.65, 6.67, 15.7, 8.3]} \ No newline at end of file diff --git a/annotations_1/2LX27W51kB0_filtered.json b/annotations_1/2LX27W51kB0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ecee514f451e4c27a961657b36deaab69842ef5 --- /dev/null +++ b/annotations_1/2LX27W51kB0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.13], [11.0, 11.87], [14.0, 14.55], [26.0, 26.03], [72.0, 72.79], [81.0, 81.73], [85.0, 90.51], [95.0, 96.3], [106.0, 106.81], [109.0, 112.02], [113.0, 113.32], [114.0, 114.71], [116.0, 116.87], [118.0, 119.06], [120.0, 122.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 0.0, 0.0, 57.56, 0.0, 0.0, 0.0, 0.0, 67.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.13, 0.87, 0.55, 0.03, 0.79, 0.73, 5.51, 1.3, 0.81, 3.02, 0.32, 0.71, 0.87, 1.06, 2.47]} \ No newline at end of file diff --git a/annotations_1/2LhsuPLvtFk_filtered.json b/annotations_1/2LhsuPLvtFk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69a07059a91a055fbe5dc871a5d038f28f4d8960 --- /dev/null +++ b/annotations_1/2LhsuPLvtFk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [4.0, 4.46], [7.0, 8.06], [16.0, 16.41], [18.0, 19.89], [22.0, 22.47], [24.0, 25.35], [31.0, 31.9], [34.0, 36.19], [39.0, 40.27], [42.0, 42.67], [46.0, 46.72], [48.0, 49.49], [53.0, 53.62], [54.0, 56.12], [57.0, 57.28], [57.0, 63.73], [66.0, 67.09], [82.0, 83.79], [91.0, 91.18], [102.0, 102.57], [105.0, 105.53], [108.0, 108.7], [110.0, 110.1], [112.0, 112.5], [116.0, 116.63], [121.0, 121.27], [123.0, 123.47], [125.0, 126.32], [129.0, 130.06], [132.0, 132.31], [134.0, 134.52], [144.0, 145.02], [148.0, 149.5], [152.0, 152.96], [155.0, 155.49], [156.0, 157.05], [160.0, 160.76], [163.0, 164.52], [167.0, 167.29], [169.0, 170.16], [173.0, 173.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.72, 0.0, 0.0, 0.0, 0.0, 0.0, 46.97, 0.0, 41.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 20.11], ["music", 18.29], ["hum", 16.69]], null, [["music", 37.1], ["speech", 17.76], ["hum", 17.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 0.46, 1.06, 0.41, 1.89, 0.47, 1.35, 0.9, 2.19, 1.27, 0.67, 0.72, 1.49, 0.62, 2.12, 0.28, 6.73, 1.09, 1.79, 0.18, 0.57, 0.53, 0.7, 0.1, 0.5, 0.63, 0.27, 0.47, 1.32, 1.06, 0.31, 0.52, 1.02, 1.5, 0.96, 0.49, 1.05, 0.76, 1.52, 0.29, 1.16, 0.53]} \ No newline at end of file diff --git a/annotations_1/2LwWmJojqvM_filtered.json b/annotations_1/2LwWmJojqvM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bce9111f3170b7749a6b27973610f27cae42ceb4 --- /dev/null +++ b/annotations_1/2LwWmJojqvM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.91], [4.0, 6.13], [8.0, 12.23], [13.0, 17.04], [18.0, 27.41], [28.0, 30.06], [31.0, 31.75], [32.0, 41.47], [42.0, 43.6], [44.0, 44.64], [46.0, 47.16], [48.0, 49.3], [50.0, 50.77], [51.0, 51.63], [54.0, 54.63], [56.0, 57.67], [59.0, 61.62], [62.0, 63.19], [63.0, 65.75], [66.0, 67.26], [67.0, 70.31], [71.0, 71.61], [73.0, 73.82], [74.0, 76.18], [79.0, 79.3], [81.0, 81.97], [82.0, 84.11], [86.0, 86.63], [88.0, 89.14], [92.0, 92.4], [94.0, 94.85], [96.0, 97.19], [98.0, 104.18], [105.0, 107.05], [109.0, 110.69], [112.0, 113.41], [115.0, 119.13], [120.0, 120.12], [120.0, 121.93], [123.0, 123.03], [123.0, 123.97], [124.0, 125.29], [128.0, 128.97], [129.0, 131.55], [135.0, 136.22], [137.0, 137.64], [139.0, 140.02], [141.0, 141.66], [143.0, 143.34], [144.0, 144.71], [145.0, 146.25], [148.0, 149.64], [150.0, 151.34], [154.0, 154.94], [160.0, 160.73], [162.0, 162.67], [165.0, 165.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 82.07, 98.27, 98.59, 33.25, 99.85, 0.0, 93.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 47.98, 0.0, 90.6, 0.0, 0.0, 36.48, 0.0, 0.0, 59.15, 0.0, 0.0, 0.0, 0.0, 0.0, 66.15, 99.85, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 41.86], ["telephone bell ringing", 37.1], ["telephone", 10.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 39.58], ["speech", 16.22], ["dial tone", 14.87]], null, null, null, null, [["chirp tone", 35.55], ["tuning fork", 25.17], ["speech", 21.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.09, 2.13, 4.23, 4.04, 9.41, 2.06, 0.75, 9.47, 1.6, 0.64, 1.16, 1.3, 0.77, 0.63, 0.63, 1.67, 2.62, 1.19, 2.75, 1.26, 3.31, 0.61, 0.82, 2.18, 0.3, 0.97, 2.11, 0.63, 1.14, 0.4, 0.85, 1.19, 6.18, 2.05, 1.69, 1.41, 4.13, 0.12, 1.93, 0.03, 0.97, 1.29, 0.97, 2.55, 1.22, 0.64, 1.02, 0.66, 0.34, 0.71, 1.25, 1.64, 1.34, 0.94, 0.73, 0.67, 0.77]} \ No newline at end of file diff --git a/annotations_1/2MxnokvI6c0_filtered.json b/annotations_1/2MxnokvI6c0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1225b47d9732c71599de4b8825bf37182ca3621a --- /dev/null +++ b/annotations_1/2MxnokvI6c0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.57], [15.0, 16.65], [17.0, 38.28], [42.0, 44.46], [45.0, 45.55], [48.0, 53.37], [54.0, 75.24], [76.0, 78.63], [81.0, 157.1], [160.0, 170.01], [176.0, 175.71], [178.0, 180.42], [181.0, 183.22], [186.0, 190.76], [193.0, 196.86]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [89.19, 0.0, 32.91, 40.24, 0.0, 93.76, 33.38, 55.31, 0.0, 33.91, 0.0, 45.27, 58.05, 30.12, 60.23], "audiomae_on_audioset": [null, null, [["music", 35.71], ["speech", 18.52], ["hum", 7.77]], [["music", 29.26], ["theremin", 13.12], ["musical instrument", 6.38]], null, null, [["music", 53.77], ["saxophone", 22.22], ["brass instrument", 8.42]], null, null, [["speech", 64.89], ["music", 5.92], ["outside, rural or natural", 2.69]], null, [["cattle, bovinae", 43.51], ["livestock, farm animals, working animals", 33.26], ["moo", 22.46]], null, [["cattle, bovinae", 39.34], ["moo", 21.7], ["livestock, farm animals, working animals", 11.47]], null], "duration": [4.57, 1.65, 21.28, 2.46, 0.55, 5.37, 21.24, 2.63, 76.1, 10.01, -0.29, 2.42, 2.22, 4.76, 3.86]} \ No newline at end of file diff --git a/annotations_1/2NA_wZ2MWBc_filtered.json b/annotations_1/2NA_wZ2MWBc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dcb9620c758e0b671b2f8f7e5679d94457ddb49 --- /dev/null +++ b/annotations_1/2NA_wZ2MWBc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.9], [10.0, 10.1], [12.0, 12.65], [13.0, 15.11], [26.0, 26.49], [27.0, 28.83], [30.0, 32.19], [34.0, 34.35], [38.0, 39.78], [41.0, 44.24], [45.0, 47.51], [48.0, 54.95], [55.0, 55.73], [58.0, 58.75], [60.0, 60.81], [62.0, 64.94], [69.0, 69.79], [70.0, 70.78], [73.0, 73.26], [75.0, 76.3], [82.0, 84.69], [86.0, 94.54], [99.0, 99.94], [105.0, 105.76], [108.0, 118.84], [121.0, 121.41], [122.0, 127.16]], "keep_status": [true, false, false, true, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [33.66, 0.0, 0.0, 32.92, 0.0, 0.0, 39.25, 0.0, 0.0, 31.72, 30.15, 30.45, 0.0, 0.0, 0.0, 40.97, 0.0, 0.0, 0.0, 0.0, 48.48, 39.21, 0.0, 0.0, 74.44, 0.0, 65.32], "audiomae_on_audioset": [[["speech", 42.89], ["fly, housefly", 9.84], ["hum", 6.68]], null, null, [["speech", 20.62], ["fly, housefly", 11.57], ["insect", 3.59]], null, null, [["music", 71.29], ["speech", 3.88], ["electronic music", 3.33]], null, null, [["music", 29.73], ["speech", 26.88], ["livestock, farm animals, working animals", 6.49]], [["trombone", 41.91], ["brass instrument", 14.4], ["trumpet", 10.14]], [["music", 59.68], ["speech", 5.65], ["hum", 5.1]], null, null, null, [["electric shaver, electric razor", 21.62], ["music", 9.77], ["hum", 6.67]], null, null, null, null, [["fly, housefly", 19.84], ["speech", 15.98], ["insect", 10.68]], [["speech", 30.32], ["fly, housefly", 20.95], ["insect", 14.71]], null, null, null, null, null], "duration": [2.9, 0.1, 0.65, 2.11, 0.49, 1.83, 2.19, 0.35, 1.78, 3.24, 2.51, 6.95, 0.73, 0.75, 0.81, 2.94, 0.79, 0.78, 0.26, 1.3, 2.69, 8.54, 0.94, 0.76, 10.84, 0.41, 5.16]} \ No newline at end of file diff --git a/annotations_1/2NNTVLRN-Ms_filtered.json b/annotations_1/2NNTVLRN-Ms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3b3016152b71a11da6b1f3f8d48686fb2605da9 --- /dev/null +++ b/annotations_1/2NNTVLRN-Ms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.3]], "keep_status": [true], "silence_prob": [30.95], "audiomae_on_audioset": [[["throbbing", 14.22], ["hum", 14.19], ["mains hum", 11.35]]], "duration": [6.3]} \ No newline at end of file diff --git a/annotations_1/2NR-tebGw3U_filtered.json b/annotations_1/2NR-tebGw3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d17e16a7d8138f46367998e11dc725415e52e46b --- /dev/null +++ b/annotations_1/2NR-tebGw3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.13], [13.0, 14.69], [16.0, 24.78], [25.0, 25.76], [28.0, 28.26], [30.0, 37.12], [38.0, 43.93], [45.0, 45.91], [47.0, 52.0], [55.0, 55.56], [60.0, 64.1], [67.0, 67.22], [73.0, 77.87], [79.0, 79.79], [81.0, 82.98], [90.0, 109.02], [113.0, 113.61], [116.0, 116.46], [122.0, 123.21], [125.0, 125.31], [134.0, 134.23], [135.0, 136.21], [140.0, 140.22], [142.0, 142.7], [147.0, 149.54], [151.0, 155.12]], "keep_status": [false, false, true, false, false, true, true, false, true, false, true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.37, 0.0, 0.0, 43.43, 39.21, 0.0, 41.1, 0.0, 46.97, 0.0, 42.08, 0.0, 0.0, 32.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.97, 62.89], "audiomae_on_audioset": [null, null, [["gong", 22.3], ["whale vocalization", 21.07], ["music", 11.39]], null, null, [["hum", 15.43], ["mains hum", 7.39], ["vehicle", 6.76]], [["hum", 12.74], ["music", 10.09], ["throbbing", 7.51]], null, [["speech", 20.6], ["hum", 19.8], ["music", 7.28]], null, [["hum", 37.23], ["mains hum", 13.31], ["throbbing", 7.28]], null, [["noise", 34.75], ["music", 17.86], ["synthesizer", 11.9]], null, null, [["speech", 25.47], ["buzz", 21.16], ["music", 5.71]], null, null, null, null, null, null, null, null, null, null], "duration": [0.13, 1.69, 8.78, 0.76, 0.26, 7.12, 5.93, 0.91, 5.0, 0.56, 4.1, 0.22, 4.87, 0.79, 1.98, 19.02, 0.61, 0.46, 1.21, 0.31, 0.23, 1.21, 0.22, 0.7, 2.54, 4.12]} \ No newline at end of file diff --git a/annotations_1/2NkV6POGLOc_filtered.json b/annotations_1/2NkV6POGLOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34c7c3d03e80b5c64def73ec0e1a52bbc0fae148 --- /dev/null +++ b/annotations_1/2NkV6POGLOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.43], [2.0, 2.91], [3.0, 3.82], [6.0, 6.84], [9.0, 10.12], [12.0, 12.19], [19.0, 19.36], [22.0, 21.76], [24.0, 27.38], [29.0, 29.67], [30.0, 31.08], [32.0, 32.41], [36.0, 36.73], [39.0, 40.12], [45.0, 45.99], [46.0, 46.11], [46.0, 46.5], [48.0, 49.67], [56.0, 57.6], [59.0, 59.85], [60.0, 61.48], [64.0, 64.62], [65.0, 66.61], [69.0, 73.85], [75.0, 79.35], [80.0, 85.51], [89.0, 89.36], [91.0, 100.99], [102.0, 111.94], [114.0, 116.95], [118.0, 120.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 57.48, 52.68, 0.0, 97.33, 91.13, 98.99, 95.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 0.91, 0.82, 0.84, 1.12, 0.19, 0.36, -0.24, 3.38, 0.67, 1.08, 0.41, 0.73, 1.12, 0.99, 0.11, 0.5, 1.67, 1.6, 0.85, 1.48, 0.62, 1.61, 4.85, 4.35, 5.51, 0.36, 9.99, 9.94, 2.95, 2.43]} \ No newline at end of file diff --git a/annotations_1/2OXtHJgLJr0_filtered.json b/annotations_1/2OXtHJgLJr0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b2d4333d926ef640132f304a8ac6d020a68f7dc --- /dev/null +++ b/annotations_1/2OXtHJgLJr0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.69], [8.0, 16.88], [18.0, 19.43], [20.0, 20.73], [21.0, 43.31], [45.0, 44.69], [46.0, 47.14], [48.0, 49.32], [53.0, 75.0], [77.0, 77.33], [78.0, 124.04], [124.0, 124.14], [128.0, 130.0], [134.0, 170.45]], "keep_status": [true, false, false, false, true, false, false, false, true, false, false, false, true, false], "silence_prob": [34.98, 36.72, 0.0, 0.0, 33.14, 0.0, 0.0, 0.0, 31.6, 0.0, 0.0, 0.0, 47.08, 0.0], "audiomae_on_audioset": [[["music", 26.94], ["trombone", 13.75], ["brass instrument", 7.79]], [["music", 73.42], ["musical instrument", 4.35], ["synthesizer", 3.59]], null, null, [["music", 31.95], ["speech", 16.4], ["hum", 14.62]], null, null, null, [["music", 14.4], ["noise", 13.82], ["hum", 11.25]], null, null, null, [["music", 28.05], ["synthesizer", 10.64], ["mains hum", 8.39]], null], "duration": [2.69, 8.88, 1.43, 0.73, 22.31, -0.31, 1.14, 1.32, 22.0, 0.33, 46.04, 0.14, 2.0, 36.45]} \ No newline at end of file diff --git a/annotations_1/2OrlbOFhcUs_filtered.json b/annotations_1/2OrlbOFhcUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff11f4d24793ce5e3cc2d1b8639d2273174e8f06 --- /dev/null +++ b/annotations_1/2OrlbOFhcUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 8.21], [9.0, 24.76], [25.0, 27.73], [28.0, 68.89], [70.0, 75.57], [78.0, 78.51], [80.0, 121.0]], "keep_status": [true, false, false, false, true, false, false], "silence_prob": [36.73, 33.79, 34.72, 0.0, 39.75, 0.0, 0.0], "audiomae_on_audioset": [[["music", 19.32], ["electric shaver, electric razor", 10.8], ["didgeridoo", 10.59]], [["mains hum", 43.07], ["hum", 25.03], ["electric shaver, electric razor", 8.44]], [["tuning fork", 48.96], ["sine wave", 27.02], ["hum", 5.83]], null, [["music", 38.28], ["didgeridoo", 15.73], ["throbbing", 13.11]], null, null], "duration": [8.21, 15.76, 2.73, 40.89, 5.57, 0.51, 41.0]} \ No newline at end of file diff --git a/annotations_1/2Q0IkYxSo3w_filtered.json b/annotations_1/2Q0IkYxSo3w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8dee5af05546daa96bdfe3c0ac0a52394f97b138 --- /dev/null +++ b/annotations_1/2Q0IkYxSo3w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.92], [18.0, 20.04], [21.0, 21.91], [24.0, 23.87], [24.0, 24.04], [26.0, 26.42], [30.0, 30.82], [32.0, 32.49], [34.0, 34.65], [45.0, 45.86], [47.0, 47.92], [49.0, 49.17], [50.0, 50.55], [52.0, 52.12], [53.0, 53.65], [57.0, 57.13], [58.0, 58.63], [68.0, 69.04], [72.0, 73.09], [74.0, 75.22], [77.0, 77.21], [81.0, 82.04], [83.0, 83.08], [84.0, 84.52], [88.0, 89.31], [90.0, 92.47], [93.0, 94.19], [95.0, 95.23], [96.0, 98.88], [101.0, 102.64], [108.0, 109.7], [111.0, 111.6], [114.0, 115.01], [116.0, 116.85], [118.0, 118.98], [121.0, 127.01], [128.0, 130.23], [132.0, 132.34], [134.0, 134.74], [142.0, 142.8], [146.0, 145.77], [148.0, 149.86], [152.0, 153.15], [154.0, 154.36], [155.0, 156.61], [158.0, 158.82], [159.0, 160.46], [162.0, 161.84], [163.0, 163.11], [164.0, 172.13], [173.0, 181.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.57, 57.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.36, 99.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 23.4], ["mains hum", 17.57], ["music", 8.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.92, 2.04, 0.91, -0.13, 0.04, 0.42, 0.82, 0.49, 0.65, 0.86, 0.92, 0.17, 0.55, 0.12, 0.65, 0.13, 0.63, 1.04, 1.09, 1.22, 0.21, 1.04, 0.08, 0.52, 1.31, 2.47, 1.19, 0.23, 2.88, 1.64, 1.7, 0.6, 1.01, 0.85, 0.98, 6.01, 2.23, 0.34, 0.74, 0.8, -0.23, 1.86, 1.15, 0.36, 1.61, 0.82, 1.46, -0.16, 0.11, 8.13, 8.18]} \ No newline at end of file diff --git a/annotations_1/2Q7wnttjQgw_filtered.json b/annotations_1/2Q7wnttjQgw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64bbacd9fa58451b1847b0eb2b9d4616e3741e51 --- /dev/null +++ b/annotations_1/2Q7wnttjQgw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.73], [8.0, 8.38], [11.0, 14.45], [21.0, 22.25], [25.0, 25.76], [33.0, 34.64], [36.0, 36.39], [37.0, 44.12], [47.0, 47.33], [53.0, 59.58], [65.0, 65.26], [70.0, 74.7], [76.0, 76.62], [83.0, 89.7], [92.0, 93.58], [94.0, 102.34], [104.0, 105.78], [109.0, 110.83], [112.0, 113.02], [116.0, 120.55], [122.0, 123.3], [125.0, 130.18], [131.0, 140.19], [143.0, 144.26], [145.0, 148.2], [150.0, 151.66], [153.0, 154.97], [155.0, 161.82]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [33.67, 0.0, 33.77, 0.0, 0.0, 0.0, 0.0, 33.98, 0.0, 35.22, 0.0, 36.89, 0.0, 47.23, 0.0, 43.51, 0.0, 0.0, 0.0, 36.42, 0.0, 36.04, 33.7, 0.0, 87.37, 0.0, 0.0, 73.82], "audiomae_on_audioset": [[["cattle, bovinae", 30.87], ["livestock, farm animals, working animals", 29.02], ["moo", 19.2]], null, [["hum", 22.16], ["music", 17.4], ["mains hum", 15.14]], null, null, null, null, [["music", 56.88], ["speech", 16.9], ["didgeridoo", 6.1]], null, [["music", 41.23], ["fart", 17.85], ["groan", 6.04]], null, [["moo", 24.44], ["cattle, bovinae", 20.79], ["speech", 12.52]], null, [["music", 32.83], ["fart", 28.83], ["fly, housefly", 10.21]], null, [["music", 69.43], ["musical instrument", 4.79], ["synthesizer", 3.68]], null, null, null, [["music", 72.0], ["synthesizer", 3.35], ["electronic music", 1.97]], null, [["music", 49.52], ["fly, housefly", 10.59], ["insect", 3.88]], [["music", 50.23], ["boing", 13.56], ["speech", 5.81]], null, null, null, null, null], "duration": [4.73, 0.38, 3.45, 1.25, 0.76, 1.64, 0.39, 7.12, 0.33, 6.58, 0.26, 4.7, 0.62, 6.7, 1.58, 8.34, 1.78, 1.83, 1.02, 4.55, 1.3, 5.18, 9.19, 1.26, 3.2, 1.66, 1.97, 6.82]} \ No newline at end of file diff --git a/annotations_1/2Qz0AREgsdQ_filtered.json b/annotations_1/2Qz0AREgsdQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..637b81143f18dede92d03c1dfbe44a78d5d982e1 --- /dev/null +++ b/annotations_1/2Qz0AREgsdQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.33], [26.0, 28.36], [29.0, 30.91], [31.0, 32.26], [34.0, 34.69], [37.0, 37.25], [38.0, 39.88], [41.0, 41.89], [43.0, 44.0], [47.0, 50.68], [55.0, 55.78], [57.0, 57.62], [61.0, 62.16], [66.0, 66.93], [67.0, 68.23], [69.0, 69.55], [71.0, 75.27], [77.0, 77.8], [85.0, 85.82], [91.0, 91.23], [96.0, 96.74], [113.0, 114.27], [115.0, 115.75], [123.0, 128.85], [132.0, 132.41], [136.0, 136.66], [143.0, 145.35], [151.0, 151.88], [164.0, 165.72], [171.0, 172.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 88.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.99, 0.0, 0.0, 54.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.42], ["hum", 19.74], ["throbbing", 9.06]], null, null, null, null, null, null, [["speech", 26.65], ["music", 23.69], ["hum", 5.37]], null, null, null, null, null, null], "duration": [0.33, 2.36, 1.91, 1.26, 0.69, 0.25, 1.88, 0.89, 1.0, 3.68, 0.78, 0.62, 1.16, 0.93, 1.23, 0.55, 4.27, 0.8, 0.82, 0.23, 0.74, 1.27, 0.75, 5.85, 0.41, 0.66, 2.35, 0.88, 1.72, 1.23]} \ No newline at end of file diff --git a/annotations_1/2T51K4xsBjg_filtered.json b/annotations_1/2T51K4xsBjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93345c5743f4f6a7e450413041c720b57d122953 --- /dev/null +++ b/annotations_1/2T51K4xsBjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.17], [20.0, 20.11], [22.0, 22.0], [24.0, 24.31], [27.0, 27.13], [31.0, 32.61], [52.0, 52.22], [53.0, 54.72], [58.0, 59.9], [60.0, 61.45], [63.0, 65.77], [67.0, 67.47], [70.0, 70.16], [70.0, 71.32], [72.0, 72.57], [78.0, 78.56], [79.0, 80.4], [92.0, 92.57], [94.0, 93.73], [96.0, 97.02], [100.0, 102.86], [113.0, 113.22], [116.0, 119.13], [120.0, 120.39], [121.0, 122.45], [124.0, 123.97], [125.0, 126.06], [126.0, 126.52], [128.0, 128.8], [131.0, 132.88], [134.0, 134.18], [136.0, 137.89], [138.0, 141.18], [144.0, 144.14], [145.0, 145.02], [145.0, 146.52], [148.0, 150.23], [151.0, 151.73], [153.0, 155.48], [159.0, 158.65], [159.0, 160.59], [166.0, 167.26], [170.0, 171.49], [172.0, 172.79], [176.0, 177.85], [181.0, 183.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [51.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.97, 0.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.89, 0.0, 0.0, 0.0, 43.15, 0.0, 32.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 77.89], ["musical instrument", 4.59], ["guitar", 3.93]], null, null, null, [["music", 47.78], ["throbbing", 4.91], ["electronic music", 4.87]], null, [["livestock, farm animals, working animals", 29.13], ["cattle, bovinae", 26.59], ["moo", 25.59]], null, null, null, null, null, null, [["music", 41.49], ["didgeridoo", 27.37], ["musical instrument", 4.44]]], "duration": [9.17, 0.11, 0.0, 0.31, 0.13, 1.61, 0.22, 1.72, 1.9, 1.45, 2.77, 0.47, 0.16, 1.32, 0.57, 0.56, 1.4, 0.57, -0.27, 1.02, 2.86, 0.22, 3.13, 0.39, 1.45, -0.03, 1.06, 0.52, 0.8, 1.88, 0.18, 1.89, 3.18, 0.14, 0.02, 1.52, 2.23, 0.73, 2.48, -0.35, 1.59, 1.26, 1.49, 0.79, 1.85, 2.83]} \ No newline at end of file diff --git a/annotations_1/2UBYT9teTIs_filtered.json b/annotations_1/2UBYT9teTIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..969f413f1ccc771ce7935f48fc6b88515253a474 --- /dev/null +++ b/annotations_1/2UBYT9teTIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.79], [20.0, 20.68], [25.0, 25.02], [38.0, 41.74], [49.0, 49.69], [51.0, 51.51], [53.0, 55.22], [57.0, 60.76], [62.0, 62.75], [64.0, 73.43], [75.0, 76.38], [84.0, 84.2], [85.0, 85.63], [89.0, 89.06], [93.0, 94.19], [96.0, 96.87], [99.0, 100.33], [101.0, 101.66], [102.0, 104.31], [105.0, 108.28], [115.0, 115.08], [127.0, 127.09], [131.0, 131.82], [142.0, 142.84], [144.0, 144.54], [145.0, 146.35], [156.0, 155.93], [157.0, 158.03]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.93, 0.0, 0.0, 57.48, 38.52, 0.0, 44.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.97, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 25.47], ["speech", 14.91], ["sheep", 8.37]], null, null, null, [["music", 44.68], ["musical instrument", 6.4], ["effects unit", 6.11]], null, [["speech", 84.34], ["music", 2.5], ["whack, thwack", 2.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 0.68, 0.02, 3.74, 0.69, 0.51, 2.22, 3.76, 0.75, 9.43, 1.38, 0.2, 0.63, 0.06, 1.19, 0.87, 1.33, 0.66, 2.31, 3.28, 0.08, 0.09, 0.82, 0.84, 0.54, 1.35, -0.07, 1.03]} \ No newline at end of file diff --git a/annotations_1/2UK1aSp3bUY_filtered.json b/annotations_1/2UK1aSp3bUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb3bed840af399a8e506961180e53b757a0b4bbb --- /dev/null +++ b/annotations_1/2UK1aSp3bUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.22], [12.0, 34.96], [36.0, 37.35], [39.0, 41.93], [46.0, 50.77], [54.0, 56.34], [57.0, 64.49], [68.0, 67.91], [72.0, 72.45], [74.0, 74.29], [76.0, 78.22], [80.0, 80.77], [81.0, 81.85], [84.0, 84.16], [84.0, 84.25], [85.0, 85.72], [90.0, 91.88], [93.0, 95.3], [98.0, 98.52], [99.0, 99.89], [101.0, 102.59], [107.0, 106.76], [111.0, 112.09], [116.0, 116.61], [118.0, 119.45], [120.0, 121.02], [122.0, 129.66], [134.0, 144.53], [146.0, 147.38], [149.0, 149.86], [151.0, 151.8], [153.0, 153.33], [156.0, 156.42], [160.0, 162.82], [171.0, 171.05], [172.0, 174.06]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [65.32, 69.74, 0.0, 70.02, 49.4, 53.22, 62.78, 0.0, 0.0, 0.0, 45.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.51, 38.05, 0.0, 0.0, 0.0, 0.0, 0.0, 56.63, 0.0, 66.27], "audiomae_on_audioset": [null, null, null, null, [["music", 38.02], ["speech", 8.3], ["didgeridoo", 7.03]], null, null, null, null, null, [["music", 34.07], ["singing bowl", 12.74], ["mains hum", 7.68]], null, null, null, null, null, null, [["canidae, dogs, wolves", 14.56], ["howl", 8.73], ["dog", 7.84]], null, null, null, null, null, null, null, null, [["music", 35.41], ["groan", 15.06], ["speech", 14.37]], [["music", 52.11], ["speech", 12.3], ["theremin", 6.39]], null, null, null, null, null, null, null, null], "duration": [4.22, 22.96, 1.35, 2.93, 4.77, 2.34, 7.49, -0.09, 0.45, 0.29, 2.22, 0.77, 0.85, 0.16, 0.25, 0.72, 1.88, 2.3, 0.52, 0.89, 1.59, -0.24, 1.09, 0.61, 1.45, 1.02, 7.66, 10.53, 1.38, 0.86, 0.8, 0.33, 0.42, 2.82, 0.05, 2.06]} \ No newline at end of file diff --git a/annotations_1/2UOL-ZHUOC4_filtered.json b/annotations_1/2UOL-ZHUOC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40e2ae8ff62e655692e0442be4cf2be15e8cc46c --- /dev/null +++ b/annotations_1/2UOL-ZHUOC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.06], [9.0, 9.24], [11.0, 10.93], [14.0, 17.74], [18.0, 20.12], [20.0, 20.56], [22.0, 26.03], [27.0, 29.74], [31.0, 32.31], [34.0, 34.06], [35.0, 44.24], [46.0, 47.01], [48.0, 49.42], [50.0, 52.73], [55.0, 60.94], [62.0, 62.68], [65.0, 66.19], [67.0, 72.6], [75.0, 75.27], [76.0, 79.2], [80.0, 81.8], [84.0, 85.67], [86.0, 86.53], [87.0, 89.09], [93.0, 102.81], [103.0, 105.88], [108.0, 113.14], [119.0, 119.74], [128.0, 128.33], [128.0, 129.66], [131.0, 132.75], [134.0, 140.14], [141.0, 144.93], [147.0, 149.52], [151.0, 153.23], [156.0, 155.7], [156.0, 155.88], [157.0, 168.03], [170.0, 171.95], [175.0, 175.36], [180.0, 180.62], [182.0, 187.24]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 52.68, 43.58, 0.0, 77.03, 51.55, 0.0, 0.0, 35.0, 0.0, 0.0, 48.91, 72.75, 0.0, 0.0, 47.05, 0.0, 92.97, 0.0, 0.0, 0.0, 45.3, 90.95, 54.43, 67.38, 0.0, 0.0, 0.0, 0.0, 54.7, 81.17, 82.07, 99.16, 0.0, 0.0, 37.21, 0.0, 0.0, 0.0, 36.24], "audiomae_on_audioset": [null, null, null, null, [["speech", 47.48], ["sidetone", 8.98], ["radio", 5.88]], null, null, null, null, null, [["music", 62.2], ["didgeridoo", 17.27], ["musical instrument", 3.69]], null, null, [["music", 22.98], ["speech", 16.76], ["hum", 9.21]], null, null, null, [["music", 34.92], ["didgeridoo", 7.66], ["gong", 6.09]], null, null, null, null, null, [["music", 35.48], ["didgeridoo", 21.51], ["hum", 6.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 30.86], ["livestock, farm animals, working animals", 8.39], ["cattle, bovinae", 5.39]], null, null, null, [["speech", 22.72], ["dog", 7.27], ["bark", 6.08]]], "duration": [1.06, 0.24, -0.07, 3.74, 2.12, 0.56, 4.03, 2.74, 1.31, 0.06, 9.24, 1.01, 1.42, 2.73, 5.94, 0.68, 1.19, 5.6, 0.27, 3.2, 1.8, 1.67, 0.53, 2.09, 9.81, 2.88, 5.14, 0.74, 0.33, 1.66, 1.75, 6.14, 3.93, 2.52, 2.23, -0.3, -0.12, 11.03, 1.95, 0.36, 0.62, 5.24]} \ No newline at end of file diff --git a/annotations_1/2UPj8FTPaXg_filtered.json b/annotations_1/2UPj8FTPaXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a82e55af57a11b39ad00ea3b07950e1ea774fb17 --- /dev/null +++ b/annotations_1/2UPj8FTPaXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [9.0, 8.87], [11.0, 55.66], [56.0, 57.06], [60.0, 62.63], [64.0, 64.88], [74.0, 78.98], [81.0, 82.09], [84.0, 99.35], [100.0, 112.13], [113.0, 115.45], [121.0, 122.18], [123.0, 123.35], [124.0, 130.0], [135.0, 162.82], [164.0, 164.51], [166.0, 166.29], [167.0, 167.41]], "keep_status": [false, false, false, false, true, false, true, false, false, true, true, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.81, 0.0, 30.93, 0.0, 34.62, 28.82, 43.25, 0.0, 0.0, 28.75, 29.36, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["cattle, bovinae", 28.75], ["speech", 12.94], ["livestock, farm animals, working animals", 9.74]], null, [["cattle, bovinae", 24.71], ["moo", 12.03], ["speech", 11.75]], null, [["throbbing", 33.21], ["hum", 25.26], ["music", 11.85]], [["music", 29.98], ["explosion", 21.21], ["hum", 7.68]], [["fly, housefly", 30.71], ["bee, wasp, etc.", 17.08], ["insect", 10.91]], null, null, [["livestock, farm animals, working animals", 22.96], ["cattle, bovinae", 20.7], ["moo", 11.05]], [["speech", 32.6], ["livestock, farm animals, working animals", 6.46], ["explosion", 5.46]], null, null, null], "duration": [0.89, -0.13, 44.66, 1.06, 2.63, 0.88, 4.98, 1.09, 15.35, 12.13, 2.45, 1.18, 0.35, 6.0, 27.82, 0.51, 0.29, 0.41]} \ No newline at end of file diff --git a/annotations_1/2UuM47BOqNA_filtered.json b/annotations_1/2UuM47BOqNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f99ffec8cadc0b419f1d279a3cea65517f168167 --- /dev/null +++ b/annotations_1/2UuM47BOqNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.96], [5.0, 11.37], [15.0, 18.91], [20.0, 28.85], [30.0, 34.57], [35.0, 36.04], [38.0, 40.0], [41.0, 48.22], [50.0, 56.02], [56.0, 66.66], [71.0, 72.49], [75.0, 75.91], [79.0, 80.99], [82.0, 82.04], [84.0, 85.36], [87.0, 88.11], [91.0, 94.12], [95.0, 95.64], [100.0, 102.68], [107.0, 107.15], [109.0, 109.92], [111.0, 111.01], [112.0, 117.27], [121.0, 121.69], [122.0, 127.7], [130.0, 169.8], [173.0, 174.34]], "keep_status": [false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 36.8, 89.54, 50.11, 48.74, 0.0, 35.5, 39.14, 61.57, 41.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.52, 0.0, 43.61, 0.0, 0.0, 0.0, 44.15, 0.0, 49.87, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 38.14], ["music", 24.1], ["thunk", 4.17]], null, null, [["speech", 21.72], ["music", 18.69], ["mains hum", 6.4]], null, [["music", 52.75], ["musical instrument", 6.4], ["effects unit", 3.08]], [["music", 65.7], ["speech", 8.36], ["theremin", 4.84]], null, [["music", 68.23], ["synthesizer", 4.85], ["theremin", 3.52]], null, null, null, null, null, null, [["music", 36.93], ["tabla", 9.93], ["sitar", 8.9]], null, [["speech", 20.14], ["music", 15.92], ["electric shaver, electric razor", 15.82]], null, null, null, [["music", 20.6], ["hum", 7.5], ["mains hum", 6.16]], null, [["thunk", 30.45], ["music", 27.79], ["didgeridoo", 13.79]], null, null], "duration": [0.96, 6.37, 3.91, 8.85, 4.57, 1.04, 2.0, 7.22, 6.02, 10.66, 1.49, 0.91, 1.99, 0.04, 1.36, 1.11, 3.12, 0.64, 2.68, 0.15, 0.92, 0.01, 5.27, 0.69, 5.7, 39.8, 1.34]} \ No newline at end of file diff --git a/annotations_1/2VgamrBe_vM_filtered.json b/annotations_1/2VgamrBe_vM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c3d3519e07150236b3dfc218d157388a23f4880 --- /dev/null +++ b/annotations_1/2VgamrBe_vM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.4], [9.0, 9.37], [12.0, 12.8], [13.0, 15.26], [22.0, 22.89], [23.0, 26.64], [29.0, 33.44], [34.0, 42.57], [43.0, 45.1], [57.0, 56.81], [60.0, 60.61], [62.0, 69.79], [77.0, 78.38], [82.0, 83.15], [84.0, 101.19], [104.0, 104.11], [107.0, 107.38], [108.0, 108.4], [109.0, 109.31], [110.0, 110.42], [113.0, 119.04], [122.0, 121.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.82, 0.0, 55.39, 95.37, 39.41, 82.79, 0.0, 0.0, 40.68, 0.0, 0.0, 33.36, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 74.01], ["sidetone", 10.92], ["dial tone", 5.7]], null, null, null, [["speech", 58.69], ["music", 9.08], ["effects unit", 3.31]], null, null, [["hum", 13.41], ["music", 12.6], ["speech", 11.75]], null, null, null, null, null, null, null], "duration": [0.4, 0.37, 0.8, 2.26, 0.89, 3.64, 4.44, 8.57, 2.1, -0.19, 0.61, 7.79, 1.38, 1.15, 17.19, 0.11, 0.38, 0.4, 0.31, 0.42, 6.04, -0.31]} \ No newline at end of file diff --git a/annotations_1/2W3KDB0yHYM_filtered.json b/annotations_1/2W3KDB0yHYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2cb9b70244d3076546adec0ab5e4cd5cddd9c14 --- /dev/null +++ b/annotations_1/2W3KDB0yHYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.67], [22.0, 108.87]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.67, 86.87]} \ No newline at end of file diff --git a/annotations_1/2WDIu8XbVD8_filtered.json b/annotations_1/2WDIu8XbVD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a60c9d11acbbb992cf86fa67465259f003bcac8c --- /dev/null +++ b/annotations_1/2WDIu8XbVD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [5.0, 5.63], [16.0, 16.23], [17.0, 18.98], [22.0, 22.54], [25.0, 28.09], [31.0, 32.31], [33.0, 33.89], [35.0, 36.34], [38.0, 38.99], [48.0, 48.3], [72.0, 73.57], [75.0, 75.1], [78.0, 78.14], [85.0, 84.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["fly, housefly", 64.48], ["insect", 17.99], ["mosquito", 9.01]], null, null, null, null, null, null, null, null, null], "duration": [1.04, 0.63, 0.23, 1.98, 0.54, 3.09, 1.31, 0.89, 1.34, 0.99, 0.3, 1.57, 0.1, 0.14, -0.19]} \ No newline at end of file diff --git a/annotations_1/2WJjBuXiXK0_filtered.json b/annotations_1/2WJjBuXiXK0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8de0daacc478430fd3edc780c76c893db134e8f --- /dev/null +++ b/annotations_1/2WJjBuXiXK0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.02], [7.0, 11.67], [12.0, 15.13], [16.0, 17.31], [18.0, 20.39], [21.0, 31.9], [32.0, 34.62], [36.0, 38.62], [39.0, 40.29], [41.0, 42.3], [44.0, 47.01], [48.0, 51.51], [53.0, 55.27], [57.0, 59.29], [61.0, 62.48], [64.0, 64.61], [66.0, 69.23], [72.0, 73.23], [75.0, 75.74], [79.0, 88.21], [90.0, 91.25], [92.0, 100.77], [103.0, 103.4], [105.0, 105.73], [107.0, 111.6], [112.0, 113.21], [116.0, 116.23], [117.0, 123.43], [125.0, 128.44], [129.0, 136.12], [137.0, 141.66], [143.0, 143.06], [144.0, 150.48], [151.0, 153.49], [154.0, 174.97], [176.0, 181.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [72.75, 79.94, 61.97, 0.0, 90.6, 80.29, 62.17, 88.83, 0.0, 0.0, 79.07, 88.28, 66.88, 63.21, 0.0, 0.0, 64.63, 0.0, 0.0, 60.32, 0.0, 60.32, 0.0, 0.0, 59.15, 0.0, 0.0, 60.51, 59.59, 58.72, 59.24, 0.0, 55.74, 65.55, 58.55, 49.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.1], ["hum", 6.23], ["musical instrument", 3.77]]], "duration": [3.02, 4.67, 3.13, 1.31, 2.39, 10.9, 2.62, 2.62, 1.29, 1.3, 3.01, 3.51, 2.27, 2.29, 1.48, 0.61, 3.23, 1.23, 0.74, 9.21, 1.25, 8.77, 0.4, 0.73, 4.6, 1.21, 0.23, 6.43, 3.44, 7.12, 4.66, 0.06, 6.48, 2.49, 20.97, 5.23]} \ No newline at end of file diff --git a/annotations_1/2X8O8PN7GOQ_filtered.json b/annotations_1/2X8O8PN7GOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e361ce0eeae1ef5ecbbd6b0e4cdfd81c2f6ab84 --- /dev/null +++ b/annotations_1/2X8O8PN7GOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 143.45], [144.0, 158.57]], "keep_status": [false, false], "silence_prob": [0.0, 29.4], "audiomae_on_audioset": [null, [["speech", 48.2], ["music", 15.92], ["mains hum", 6.18]]], "duration": [121.45, 14.57]} \ No newline at end of file diff --git a/annotations_1/2XmLLBZnvDg_filtered.json b/annotations_1/2XmLLBZnvDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ac7aa90d73df844896bc6eac406e6749f4e28cf --- /dev/null +++ b/annotations_1/2XmLLBZnvDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.86], [10.0, 10.91], [12.0, 12.92], [18.0, 19.5], [27.0, 28.14], [33.0, 35.73], [38.0, 38.99], [39.0, 43.82], [45.0, 50.06], [51.0, 51.83], [53.0, 55.07], [57.0, 71.2], [72.0, 72.79], [75.0, 75.22], [75.0, 84.01], [85.0, 85.9], [93.0, 92.7], [96.0, 96.69], [98.0, 98.09], [100.0, 100.01], [102.0, 102.41], [108.0, 108.95], [111.0, 112.19], [118.0, 118.86], [119.0, 120.58], [121.0, 121.32], [123.0, 123.15], [124.0, 128.63], [131.0, 131.5], [135.0, 135.82], [137.0, 141.51], [145.0, 147.55], [150.0, 150.4], [152.0, 158.75], [159.0, 159.54], [161.0, 161.7], [162.0, 164.88], [168.0, 170.24], [172.0, 174.82], [179.0, 191.46], [195.0, 201.99], [209.0, 209.6], [213.0, 259.31], [261.0, 263.56], [264.0, 265.71]], "keep_status": [false, false, false, false, false, true, false, true, true, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.69, 0.0, 32.7, 34.16, 0.0, 40.92, 43.33, 0.0, 0.0, 40.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 62.58, 77.87, 0.0, 88.46, 0.0, 0.0, 59.59, 99.21, 78.89, 29.16, 29.56, 0.0, 0.0, 31.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 25.17], ["throbbing", 6.22], ["frog", 6.12]], null, [["music", 32.2], ["speech", 26.82], ["hum", 4.4]], [["speech", 22.69], ["music", 18.29], ["hum", 12.15]], null, [["music", 28.73], ["noise", 16.53], ["synthesizer", 7.49]], [["hum", 16.61], ["electric shaver, electric razor", 13.86], ["mains hum", 9.93]], null, null, [["hum", 19.04], ["whale vocalization", 14.24], ["fly, housefly", 8.49]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["vehicle", 38.92], ["speech", 17.86], ["outside, rural or natural", 6.03]], [["mains hum", 28.53], ["hum", 27.52], ["buzz", 14.03]], null, null, [["mains hum", 71.92], ["hum", 23.03], ["throbbing", 1.81]], null], "duration": [0.86, 0.91, 0.92, 1.5, 1.14, 2.73, 0.99, 4.82, 5.06, 0.83, 2.07, 14.2, 0.79, 0.22, 9.01, 0.9, -0.3, 0.69, 0.09, 0.01, 0.41, 0.95, 1.19, 0.86, 1.58, 0.32, 0.15, 4.63, 0.5, 0.82, 4.51, 2.55, 0.4, 6.75, 0.54, 0.7, 2.88, 2.24, 2.82, 12.46, 6.99, 0.6, 46.31, 2.56, 1.71]} \ No newline at end of file diff --git a/annotations_1/2Y_CzHI89mQ_filtered.json b/annotations_1/2Y_CzHI89mQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0c32c920993e67e34bcca9a53f2b8eecf516889 --- /dev/null +++ b/annotations_1/2Y_CzHI89mQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 23.3], [27.0, 28.22], [31.0, 32.24], [33.0, 36.19], [40.0, 40.42], [41.0, 43.06], [45.0, 49.01], [51.0, 52.44], [55.0, 56.24], [59.0, 61.57], [64.0, 74.11], [75.0, 77.87], [78.0, 90.05], [92.0, 95.3], [97.0, 98.31], [106.0, 105.87], [107.0, 122.42], [123.0, 137.54], [138.0, 171.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.89, 0.0, 0.0, 64.75, 0.0, 83.16, 81.89, 0.0, 0.0, 98.36, 99.92, 99.97, 95.78, 99.65, 0.0, 0.0, 99.96, 86.45, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.3, 1.22, 1.24, 3.19, 0.42, 2.06, 4.01, 1.44, 1.24, 2.57, 10.11, 2.87, 12.05, 3.3, 1.31, -0.13, 15.42, 14.54, 33.73]} \ No newline at end of file diff --git a/annotations_1/2ZTrUc824oI_filtered.json b/annotations_1/2ZTrUc824oI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83264a3bff97fe14a9e6abc23ec690db533f9fb2 --- /dev/null +++ b/annotations_1/2ZTrUc824oI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [4.0, 6.03], [8.0, 9.04], [12.0, 12.78], [15.0, 17.15], [22.0, 21.81], [25.0, 25.93], [29.0, 29.83], [31.0, 32.68], [34.0, 36.53], [39.0, 40.8], [45.0, 45.57], [50.0, 50.35], [50.0, 50.46], [51.0, 51.44], [54.0, 55.21], [88.0, 90.96], [96.0, 110.51], [112.0, 113.0], [114.0, 115.3], [124.0, 133.88], [139.0, 142.28], [143.0, 145.02], [146.0, 147.12], [149.0, 149.98], [152.0, 158.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 63.96, 0.0, 0.0, 65.32, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 62.89, 0.0, 0.0, 33.29, 55.96, 81.71, 0.0, 0.0, 36.08], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 21.35], ["dog", 12.79], ["speech", 12.4]], null, null, null, null, [["speech", 80.8], ["whack, thwack", 2.75], ["gunshot, gunfire", 2.21]]], "duration": [0.43, 2.03, 1.04, 0.78, 2.15, -0.19, 0.93, 0.83, 1.68, 2.53, 1.8, 0.57, 0.35, 0.46, 0.44, 1.21, 2.96, 14.51, 1.0, 1.3, 9.88, 3.28, 2.02, 1.12, 0.98, 6.6]} \ No newline at end of file diff --git a/annotations_1/2_BwhA8M9-w_filtered.json b/annotations_1/2_BwhA8M9-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ae9944e3a39b056411517da154731be64c0c6e8 --- /dev/null +++ b/annotations_1/2_BwhA8M9-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.3], [2.0, 2.24], [3.0, 4.95], [6.0, 6.27], [8.0, 12.7], [13.0, 12.9], [13.0, 16.92], [18.0, 18.35], [19.0, 19.33], [20.0, 21.25], [23.0, 23.77], [25.0, 25.2], [26.0, 28.48], [29.0, 31.04], [32.0, 38.58], [42.0, 42.94], [47.0, 48.19], [50.0, 50.46], [51.0, 52.44], [55.0, 59.49], [61.0, 61.86], [65.0, 67.12], [68.0, 71.22], [73.0, 74.33], [77.0, 79.19], [80.0, 96.31], [98.0, 98.15], [99.0, 99.57], [103.0, 103.82], [106.0, 106.71], [107.0, 107.84], [110.0, 111.5], [129.0, 129.46], [132.0, 132.21], [134.0, 134.11], [137.0, 137.81], [148.0, 150.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 51.82, 0.0, 51.94, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89, 45.14, 35.5, 0.0, 0.0, 0.0, 0.0, 33.02, 0.0, 37.03, 33.71, 0.0, 30.73, 30.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 41.86], ["speech", 31.35], ["music", 5.11]], [["music", 70.09], ["musical instrument", 5.05], ["guitar", 4.05]], null, null, null, null, [["music", 58.79], ["vocal music", 5.07], ["singing", 4.75]], null, [["music", 45.01], ["theremin", 15.22], ["synthesizer", 5.15]], [["music", 66.03], ["musical instrument", 4.59], ["guitar", 4.43]], null, [["music", 61.08], ["didgeridoo", 16.63], ["musical instrument", 4.75]], [["music", 61.92], ["carnatic music", 11.33], ["musical instrument", 5.59]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 0.24, 1.95, 0.27, 4.7, -0.1, 3.92, 0.35, 0.33, 1.25, 0.77, 0.2, 2.48, 2.04, 6.58, 0.94, 1.19, 0.46, 1.44, 4.49, 0.86, 2.12, 3.22, 1.33, 2.19, 16.31, 0.15, 0.57, 0.82, 0.71, 0.84, 1.5, 0.46, 0.21, 0.11, 0.81, 2.94]} \ No newline at end of file diff --git a/annotations_1/2aKkSYvLvXk_filtered.json b/annotations_1/2aKkSYvLvXk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce887c2f28ee4da24cab926d85248650d2113148 --- /dev/null +++ b/annotations_1/2aKkSYvLvXk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.17], [20.0, 22.25], [55.0, 60.83], [62.0, 68.17], [72.0, 72.3], [90.0, 90.93], [93.0, 100.6], [113.0, 115.38], [119.0, 119.38], [121.0, 123.6], [153.0, 153.76]], "keep_status": [false, true, true, true, false, false, false, true, false, false, false], "silence_prob": [42.79, 33.87, 31.93, 32.71, 0.0, 0.0, 39.99, 32.71, 0.0, 32.65, 0.0], "audiomae_on_audioset": [[["music", 73.66], ["beatboxing", 9.89], ["electronic music", 2.17]], [["speech", 35.69], ["music", 20.81], ["effects unit", 6.88]], [["theremin", 18.26], ["music", 14.39], ["vocal music", 5.51]], [["music", 8.08], ["vocal music", 7.32], ["echo", 6.99]], null, null, [["speech", 42.99], ["music", 22.47], ["sidetone", 5.7]], [["speech", 15.54], ["wail, moan", 13.82], ["beatboxing", 13.32]], null, [["music", 62.07], ["vocal music", 11.13], ["a capella", 9.77]], null], "duration": [8.17, 2.25, 5.83, 6.17, 0.3, 0.93, 7.6, 2.38, 0.38, 2.6, 0.76]} \ No newline at end of file diff --git a/annotations_1/2b-ip6hZYgE_filtered.json b/annotations_1/2b-ip6hZYgE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..137b08894609cb21885e2518a0bac87b0ccd2f53 --- /dev/null +++ b/annotations_1/2b-ip6hZYgE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 38.2], [40.0, 41.52], [42.0, 52.32], [58.0, 58.85], [65.0, 64.98], [66.0, 87.47], [88.0, 89.13], [92.0, 91.64], [92.0, 92.57], [93.0, 93.68], [102.0, 122.34], [124.0, 131.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [43.96, 0.0, 34.06, 0.0, 0.0, 33.03, 0.0, 0.0, 0.0, 0.0, 34.07, 31.0], "audiomae_on_audioset": [[["speech", 42.16], ["music", 31.2], ["radio", 14.38]], null, [["speech", 56.41], ["radio", 11.36], ["sidetone", 9.96]], null, null, [["mains hum", 47.85], ["hum", 37.93], ["music", 5.61]], null, null, null, null, [["hum", 38.98], ["mains hum", 27.34], ["music", 20.12]], [["hum", 24.61], ["electric shaver, electric razor", 10.25], ["livestock, farm animals, working animals", 7.97]]], "duration": [3.2, 1.52, 10.32, 0.85, -0.02, 21.47, 1.13, -0.36, 0.57, 0.68, 20.34, 7.16]} \ No newline at end of file diff --git a/annotations_1/2cJGGVlQ8X8_filtered.json b/annotations_1/2cJGGVlQ8X8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8628c448da905e37cbfe359061f6558e1262e755 --- /dev/null +++ b/annotations_1/2cJGGVlQ8X8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 33.03], [35.0, 34.94], [36.0, 36.21], [37.0, 39.46], [42.0, 42.38], [44.0, 53.01], [56.0, 66.02], [69.0, 76.82], [79.0, 79.79], [81.0, 81.9], [82.0, 81.94], [82.0, 81.97], [83.0, 86.14], [89.0, 90.26], [94.0, 104.75], [107.0, 114.93], [115.0, 121.81], [124.0, 124.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [45.43, 0.0, 0.0, 54.04, 0.0, 36.98, 47.62, 51.18, 0.0, 0.0, 0.0, 0.0, 66.27, 0.0, 45.62, 38.71, 45.92, 0.0], "audiomae_on_audioset": [[["speech", 35.2], ["music", 34.07], ["mains hum", 3.76]], null, null, null, null, [["music", 63.08], ["chant", 9.55], ["mantra", 6.13]], [["music", 60.9], ["scary music", 12.64], ["ambient music", 5.97]], null, null, null, null, null, null, null, [["music", 77.25], ["ambient music", 5.41], ["singing bowl", 5.21]], [["mains hum", 32.54], ["hum", 24.06], ["music", 19.31]], [["music", 36.45], ["speech", 18.33], ["didgeridoo", 14.87]], null], "duration": [6.03, -0.06, 0.21, 2.46, 0.38, 9.01, 10.02, 7.82, 0.79, 0.9, -0.06, -0.03, 3.14, 1.26, 10.75, 7.93, 6.81, 0.66]} \ No newline at end of file diff --git a/annotations_1/2cxG6iiqEdk_filtered.json b/annotations_1/2cxG6iiqEdk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f03d7d011c3190aed6db297496b950bcbeb2cdb0 --- /dev/null +++ b/annotations_1/2cxG6iiqEdk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.9], [17.0, 17.34], [32.0, 33.84], [37.0, 37.91], [39.0, 39.93], [44.0, 45.55], [50.0, 55.05], [55.0, 56.19], [65.0, 65.94], [67.0, 67.74], [77.0, 77.33], [78.0, 80.1], [84.0, 84.54], [86.0, 87.91], [91.0, 91.12], [99.0, 99.81], [109.0, 109.66], [111.0, 111.67], [112.0, 114.08], [117.0, 117.09], [121.0, 123.2], [128.0, 129.47], [130.0, 129.69], [130.0, 131.21], [132.0, 132.46], [143.0, 143.46], [147.0, 148.0], [149.0, 150.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [60.42, 0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.41, 0.0, 46.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.12], ["music", 26.76], ["hum", 2.48]], null, null, null, null, null, null, null], "duration": [4.9, 0.34, 1.84, 0.91, 0.93, 1.55, 5.05, 1.19, 0.94, 0.74, 0.33, 2.1, 0.54, 1.91, 0.12, 0.81, 0.66, 0.67, 2.08, 0.09, 2.2, 1.47, -0.31, 1.21, 0.46, 0.46, 1.0, 1.43]} \ No newline at end of file diff --git a/annotations_1/2dB26bOiT4E_filtered.json b/annotations_1/2dB26bOiT4E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50737b2d61e8374d730af713ed1b6fed041e5709 --- /dev/null +++ b/annotations_1/2dB26bOiT4E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.98], [8.0, 9.71], [14.0, 14.4], [21.0, 41.3], [41.0, 41.37], [45.0, 46.36], [46.0, 63.48]], "keep_status": [false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 28.17, 0.0, 0.0, 28.1], "audiomae_on_audioset": [null, null, null, [["music", 51.75], ["speech", 10.46], ["cacophony", 7.14]], null, null, [["speech", 52.84], ["music", 9.18], ["aircraft", 6.0]]], "duration": [0.98, 1.71, 0.4, 20.3, 0.37, 1.36, 17.48]} \ No newline at end of file diff --git a/annotations_1/2dn_r_sgBEE_filtered.json b/annotations_1/2dn_r_sgBEE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77b460e01361746440e8484061dec8a0146bbfaf --- /dev/null +++ b/annotations_1/2dn_r_sgBEE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 16.21], [19.0, 29.02], [30.0, 49.13], [53.0, 62.78], [66.0, 66.77], [70.0, 71.15], [72.0, 74.82]], "keep_status": [false, false, false, true, false, false, true], "silence_prob": [70.16, 85.17, 46.94, 30.72, 0.0, 0.0, 28.52], "audiomae_on_audioset": [null, null, [["music", 67.35], ["hum", 9.32], ["electronic music", 5.28]], [["music", 23.84], ["gong", 13.28], ["theremin", 6.8]], null, null, [["sound effect", 15.52], ["music", 12.16], ["livestock, farm animals, working animals", 11.35]]], "duration": [6.21, 10.02, 19.13, 9.78, 0.77, 1.15, 2.82]} \ No newline at end of file diff --git a/annotations_1/2dvchK48Z-o_filtered.json b/annotations_1/2dvchK48Z-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7723215ea7b973d1f9ff1fd99b58179740b1950f --- /dev/null +++ b/annotations_1/2dvchK48Z-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 11.91], [20.0, 21.86], [23.0, 23.03], [24.0, 25.2], [26.0, 26.47], [34.0, 36.04], [38.0, 38.53], [39.0, 42.5], [43.0, 49.91], [50.0, 51.97], [53.0, 59.24], [60.0, 60.37], [61.0, 63.88], [67.0, 75.51], [77.0, 80.7], [82.0, 93.68], [96.0, 100.72], [102.0, 102.24], [106.0, 107.54], [111.0, 111.32], [112.0, 113.0], [115.0, 117.21], [121.0, 121.07], [125.0, 125.71], [131.0, 136.24], [138.0, 139.56], [153.0, 157.71], [168.0, 172.37], [175.0, 177.92], [191.0, 192.05]], "keep_status": [false, false, false, false, false, true, false, true, true, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.75, 0.0, 0.0, 0.0, 0.0, 29.7, 0.0, 33.17, 31.62, 0.0, 31.28, 0.0, 32.83, 31.42, 64.63, 33.99, 75.55, 0.0, 0.0, 0.0, 0.0, 48.69, 0.0, 0.0, 89.36, 0.0, 72.16, 79.94, 59.77, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 15.75], ["whale vocalization", 13.85], ["sonar", 12.09]], null, [["frog", 26.48], ["music", 19.05], ["croak", 8.43]], [["speech", 31.9], ["music", 12.66], ["gong", 9.04]], null, [["music", 34.85], ["speech", 23.51], ["hum", 11.35]], null, [["speech", 37.71], ["sidetone", 34.38], ["music", 6.65]], [["music", 36.59], ["electronic music", 21.13], ["sidetone", 5.31]], null, [["music", 24.55], ["speech", 23.01], ["sidetone", 17.32]], null, null, null, null, null, [["music", 48.31], ["speech", 29.84], ["sidetone", 3.37]], null, null, null, null, null, null, null, null], "duration": [11.91, 1.86, 0.03, 1.2, 0.47, 2.04, 0.53, 3.5, 6.91, 1.97, 6.24, 0.37, 2.88, 8.51, 3.7, 11.68, 4.72, 0.24, 1.54, 0.32, 1.0, 2.21, 0.07, 0.71, 5.24, 1.56, 4.71, 4.37, 2.92, 1.05]} \ No newline at end of file diff --git a/annotations_1/2g96QnNekOc_filtered.json b/annotations_1/2g96QnNekOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddb0eddf6edafd76a83f5caf0a80a207031d6d6e --- /dev/null +++ b/annotations_1/2g96QnNekOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.02], [5.0, 7.21], [12.0, 12.33], [20.0, 21.54], [23.0, 23.92], [24.0, 24.49], [26.0, 28.02], [29.0, 33.44], [36.0, 39.8], [41.0, 41.34], [42.0, 43.7], [45.0, 45.55], [47.0, 47.65], [49.0, 52.54], [54.0, 55.93], [56.0, 57.94], [61.0, 61.53], [63.0, 63.54], [64.0, 67.71], [68.0, 71.95], [73.0, 73.08], [78.0, 77.9], [80.0, 80.15], [80.0, 82.05], [85.0, 85.68], [86.0, 112.8], [113.0, 115.25], [130.0, 130.6], [133.0, 132.97], [139.0, 139.89], [145.0, 144.69], [145.0, 146.55], [150.0, 150.8], [151.0, 158.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 71.57, 90.43, 61.57, 0.0, 0.0, 0.0, 0.0, 99.44, 0.0, 0.0, 0.0, 0.0, 92.64, 99.68, 0.0, 0.0, 0.0, 53.84, 0.0, 62.58, 41.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.99], ["mains hum", 13.98], ["music", 12.94]], null, null, null, null, null, null, null], "duration": [0.02, 2.21, 0.33, 1.54, 0.92, 0.49, 2.02, 4.44, 3.8, 0.34, 1.7, 0.55, 0.65, 3.54, 1.93, 1.94, 0.53, 0.54, 3.71, 3.95, 0.08, -0.1, 0.15, 2.05, 0.68, 26.8, 2.25, 0.6, -0.03, 0.89, -0.31, 1.55, 0.8, 7.9]} \ No newline at end of file diff --git a/annotations_1/2gUFZCRHHvE_filtered.json b/annotations_1/2gUFZCRHHvE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa2b74be82b7b463f4ec02192c833f3fd5fc8c16 --- /dev/null +++ b/annotations_1/2gUFZCRHHvE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.21], [9.0, 9.63], [17.0, 17.41], [45.0, 50.73], [85.0, 90.04], [102.0, 103.65], [108.0, 111.15], [116.0, 119.26], [122.0, 133.52], [134.0, 154.5]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.22, 29.26, 0.0, 29.34, 29.1, 29.43, 30.59], "audiomae_on_audioset": [null, null, null, [["music", 82.07], ["musical instrument", 2.35], ["didgeridoo", 1.93]], [["music", 71.29], ["didgeridoo", 3.75], ["musical instrument", 3.25]], null, [["music", 34.05], ["didgeridoo", 28.1], ["throbbing", 9.24]], [["music", 61.37], ["swing music", 3.47], ["funny music", 1.43]], [["music", 59.77], ["speech", 21.14], ["throbbing", 1.68]], [["music", 53.09], ["throbbing", 25.2], ["hum", 4.71]]], "duration": [0.21, 0.63, 0.41, 5.73, 5.04, 1.65, 3.15, 3.26, 11.52, 20.5]} \ No newline at end of file diff --git a/annotations_1/2gzVWIUhUOg_filtered.json b/annotations_1/2gzVWIUhUOg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..290aa93796e14bcf6bb29e2bd7b6fd905e00e8fd --- /dev/null +++ b/annotations_1/2gzVWIUhUOg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.22], [15.0, 15.38], [21.0, 33.27], [38.0, 58.56], [60.0, 64.13], [65.0, 78.83], [85.0, 88.8], [90.0, 95.37], [109.0, 112.77], [123.0, 128.21], [140.0, 142.5]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 53.59, 38.23, 75.55, 33.07, 34.37, 33.94, 32.17, 32.66, 40.84], "audiomae_on_audioset": [null, null, null, [["fart", 77.56], ["music", 4.02], ["effects unit", 2.2]], null, [["music", 22.89], ["effects unit", 20.21], ["whale vocalization", 14.09]], [["music", 70.0], ["musical instrument", 10.19], ["brass instrument", 2.58]], [["music", 66.1], ["effects unit", 8.79], ["musical instrument", 5.43]], [["sidetone", 69.26], ["speech", 5.29], ["white noise", 3.22]], [["music", 41.35], ["effects unit", 9.51], ["chorus effect", 6.66]], [["music", 34.6], ["foghorn", 11.41], ["musical instrument", 5.5]]], "duration": [1.22, 0.38, 12.27, 20.56, 4.13, 13.83, 3.8, 5.37, 3.77, 5.21, 2.5]} \ No newline at end of file diff --git a/annotations_1/2hcGeToc17I_filtered.json b/annotations_1/2hcGeToc17I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1327dc198abe8558821f703b15ff0be476d3eea --- /dev/null +++ b/annotations_1/2hcGeToc17I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.83], [7.0, 16.36], [17.0, 17.19], [19.0, 21.32], [24.0, 24.87], [25.0, 44.19], [44.0, 44.22], [45.0, 56.46], [60.0, 59.95], [61.0, 72.87], [73.0, 72.91], [73.0, 72.94], [75.0, 79.05], [80.0, 81.99], [83.0, 83.74], [85.0, 92.38], [99.0, 99.42], [101.0, 109.02], [109.0, 115.3], [117.0, 118.0], [120.0, 129.25], [134.0, 154.36], [155.0, 161.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 50.61, 0.0, 49.27, 0.0, 40.38, 0.0, 32.11, 0.0, 39.82, 0.0, 0.0, 33.06, 0.0, 0.0, 34.85, 0.0, 40.93, 40.71, 0.0, 33.12, 33.15, 33.86], "audiomae_on_audioset": [null, null, null, [["music", 67.99], ["musical instrument", 5.91], ["synthesizer", 4.13]], null, [["music", 40.97], ["hum", 21.01], ["mains hum", 12.18]], null, [["speech", 74.34], ["music", 17.42], ["didgeridoo", 2.48]], null, [["music", 60.8], ["synthesizer", 7.32], ["musical instrument", 7.05]], null, null, [["speech", 54.67], ["music", 23.48], ["theremin", 3.12]], null, null, [["music", 75.01], ["speech", 12.91], ["musical instrument", 2.02]], null, [["music", 47.67], ["speech", 21.36], ["throbbing", 3.76]], [["music", 25.59], ["speech", 17.34], ["honk", 8.46]], null, [["music", 66.29], ["didgeridoo", 7.29], ["theremin", 2.19]], [["music", 78.05], ["musical instrument", 3.63], ["theremin", 3.04]], [["music", 55.31], ["bleat", 6.38], ["sheep", 3.65]]], "duration": [0.83, 9.36, 0.19, 2.32, 0.87, 19.19, 0.22, 11.46, -0.05, 11.87, -0.09, -0.06, 4.05, 1.99, 0.74, 7.38, 0.42, 8.02, 6.3, 1.0, 9.25, 20.36, 6.3]} \ No newline at end of file diff --git a/annotations_1/2heRUn56wrg_filtered.json b/annotations_1/2heRUn56wrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c206a98fdc35f402b4ef7faa70cb7a1a6d8c0551 --- /dev/null +++ b/annotations_1/2heRUn56wrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.97], [26.0, 32.66], [34.0, 34.37], [38.0, 39.6], [41.0, 41.44], [43.0, 44.59], [47.0, 47.44], [52.0, 53.59], [57.0, 57.52], [58.0, 68.44], [69.0, 70.12], [72.0, 74.6], [75.0, 76.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 96.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 6.66, 0.37, 1.6, 0.44, 1.59, 0.44, 1.59, 0.52, 10.44, 1.12, 2.6, 1.2]} \ No newline at end of file diff --git a/annotations_1/2hs-yt-Pmk0_filtered.json b/annotations_1/2hs-yt-Pmk0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e4c9e0624dba64cadbe56d255af194af08bae76 --- /dev/null +++ b/annotations_1/2hs-yt-Pmk0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.62], [12.0, 14.08], [20.0, 21.27], [23.0, 23.55], [29.0, 29.76], [36.0, 36.69], [51.0, 51.7], [69.0, 69.36], [74.0, 74.43], [76.0, 76.03], [83.0, 83.98], [85.0, 86.09], [95.0, 97.65], [100.0, 101.76], [106.0, 106.1], [120.0, 119.84], [120.0, 121.76], [122.0, 123.84], [125.0, 126.23], [128.0, 129.02], [130.0, 132.21]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.07], "audiomae_on_audioset": [null, [["sidetone", 30.4], ["speech", 22.28], ["moo", 7.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 2.08, 1.27, 0.55, 0.76, 0.69, 0.7, 0.36, 0.43, 0.03, 0.98, 1.09, 2.65, 1.76, 0.1, -0.16, 1.76, 1.84, 1.23, 1.02, 2.21]} \ No newline at end of file diff --git a/annotations_1/2i8C-GOsHo0_filtered.json b/annotations_1/2i8C-GOsHo0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18bd9a3f94ea118236c7ead7218b6a4ed3f25af8 --- /dev/null +++ b/annotations_1/2i8C-GOsHo0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.43], [6.0, 6.83], [15.0, 14.99], [23.0, 24.24], [26.0, 26.47], [27.0, 28.88], [30.0, 31.58], [33.0, 36.96], [38.0, 44.17], [45.0, 46.01], [47.0, 50.95], [52.0, 57.21], [59.0, 59.83], [61.0, 63.73], [75.0, 78.14], [80.0, 85.41], [89.0, 93.28], [95.0, 97.6], [99.0, 101.01], [104.0, 110.24], [112.0, 113.36], [116.0, 128.44], [130.0, 130.35], [133.0, 134.47], [135.0, 140.31]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.66, 56.7, 0.0, 58.47, 52.05, 0.0, 55.74, 53.47, 54.43, 47.78, 77.87, 87.92, 84.98, 0.0, 29.84, 0.0, 0.0, 69.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 17.32], ["hum", 16.92], ["mains hum", 7.98]], null, null, null, null, null, null, null, null, [["speech", 40.13], ["rumble", 8.44], ["hum", 6.19]], null, null, null, null, [["speech", 50.95], ["whack, thwack", 10.32], ["sound effect", 4.7]], null, null, null], "duration": [0.43, 0.83, -0.01, 1.24, 0.47, 1.88, 1.58, 3.96, 6.17, 1.01, 3.95, 5.21, 0.83, 2.73, 3.14, 5.41, 4.28, 2.6, 2.01, 6.24, 1.36, 12.44, 0.35, 1.47, 5.31]} \ No newline at end of file diff --git a/annotations_1/2iD5pPwbDJ8_filtered.json b/annotations_1/2iD5pPwbDJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3b7d8ecee544c8807c25f44a4005ac8c948d4a2 --- /dev/null +++ b/annotations_1/2iD5pPwbDJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 29.02], [31.0, 32.39], [33.0, 49.99], [54.0, 56.46], [58.0, 64.76], [72.0, 76.76], [79.0, 83.1], [85.0, 84.86], [85.0, 85.77], [89.0, 90.48], [94.0, 105.73], [106.0, 117.9], [118.0, 122.17], [127.0, 129.95], [132.0, 143.23], [146.0, 176.62], [179.0, 192.0], [194.0, 201.28], [209.0, 211.87]], "keep_status": [false, false, true, true, true, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.95, 32.63, 29.55, 30.42, 29.71, 0.0, 0.0, 0.0, 32.09, 49.13, 50.56, 36.13, 35.04, 0.0, 31.47, 34.51, 50.21], "audiomae_on_audioset": [null, null, [["speech", 20.69], ["fart", 16.3], ["buzz", 13.72]], [["speech", 38.9], ["hum", 12.67], ["mains hum", 5.63]], [["speech", 21.16], ["music", 13.51], ["theremin", 10.53]], [["music", 64.22], ["theremin", 9.04], ["noise", 6.24]], [["music", 22.18], ["whip", 18.91], ["brass instrument", 6.4]], null, null, null, [["music", 42.23], ["theremin", 33.22], ["musical instrument", 3.89]], [["music", 53.58], ["musical instrument", 12.78], ["theremin", 9.41]], null, [["music", 58.41], ["didgeridoo", 5.83], ["synthesizer", 5.58]], [["music", 64.98], ["theremin", 18.79], ["synthesizer", 4.86]], null, [["music", 51.41], ["theremin", 31.71], ["musical instrument", 2.04]], [["music", 49.28], ["theremin", 26.21], ["foghorn", 4.38]], null], "duration": [0.02, 1.39, 16.99, 2.46, 6.76, 4.76, 4.1, -0.14, 0.77, 1.48, 11.73, 11.9, 4.17, 2.95, 11.23, 30.62, 13.0, 7.28, 2.87]} \ No newline at end of file diff --git a/annotations_1/2iF-cU-qnbc_filtered.json b/annotations_1/2iF-cU-qnbc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a0ac857ca00285816d7b16a2e47b5e44b8e1bd2 --- /dev/null +++ b/annotations_1/2iF-cU-qnbc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.81], [10.0, 9.71], [32.0, 32.85], [34.0, 34.42], [38.0, 38.08], [77.0, 77.16], [89.0, 90.12], [109.0, 109.7], [133.0, 133.12], [146.0, 146.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.81, -0.29, 0.85, 0.42, 0.08, 0.16, 1.12, 0.7, 0.12, 0.08]} \ No newline at end of file diff --git a/annotations_1/2jzlSeFLr7A_filtered.json b/annotations_1/2jzlSeFLr7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..646036c0768f1b525492b9a0b1580ae4bb3d3835 --- /dev/null +++ b/annotations_1/2jzlSeFLr7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.36], [7.0, 8.99], [10.0, 10.64], [12.0, 12.24], [14.0, 15.8], [16.0, 17.05], [18.0, 27.89], [31.0, 38.55], [49.0, 52.32], [59.0, 59.98], [66.0, 66.33], [70.0, 72.13], [83.0, 85.24], [91.0, 91.72], [114.0, 114.59], [124.0, 126.45], [132.0, 131.82], [134.0, 133.83], [135.0, 135.46], [136.0, 139.28], [142.0, 144.31], [147.0, 147.53]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 54.83, 43.18, 0.0, 0.0, 54.63, 81.35, 0.0, 0.0, 47.74, 0.0, 0.0, 0.0, 41.09, 50.21, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 45.43], ["mantra", 14.72], ["lullaby", 7.79]], null, null, null, null, null, null, [["music", 40.54], ["synthesizer", 9.46], ["theremin", 9.45]], null, null, null, [["music", 36.27], ["mantra", 9.35], ["speech", 4.96]], null, null], "duration": [1.36, 1.99, 0.64, 0.24, 1.8, 1.05, 9.89, 7.55, 3.32, 0.98, 0.33, 2.13, 2.24, 0.72, 0.59, 2.45, -0.18, -0.17, 0.46, 3.28, 2.31, 0.53]} \ No newline at end of file diff --git a/annotations_1/2k0S-F8VIhI_filtered.json b/annotations_1/2k0S-F8VIhI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b594f1d5a094da3e6ce328a8dc292a5895f7aad --- /dev/null +++ b/annotations_1/2k0S-F8VIhI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.15], [12.0, 12.09], [16.0, 16.83], [18.0, 19.85], [22.0, 23.26], [29.0, 30.42], [34.0, 36.09], [50.0, 50.55], [55.0, 57.37], [64.0, 66.12], [70.0, 77.19], [78.0, 83.49], [92.0, 92.67], [94.0, 96.79], [111.0, 116.95], [120.0, 135.45], [137.0, 158.62], [160.0, 159.88], [162.0, 168.62], [169.0, 174.72], [176.0, 176.93], [178.0, 177.89], [179.0, 179.83]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.39, 0.0, 36.45, 30.03, 30.81, 30.45, 0.0, 30.69, 28.04, 27.98, 28.14, 0.0, 29.32, 30.63, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 63.14], ["synthesizer", 6.38], ["electronic music", 4.41]], null, [["music", 53.33], ["electronic music", 3.53], ["musical instrument", 2.43]], [["music", 36.38], ["speech", 18.44], ["synthesizer", 12.01]], [["throbbing", 47.18], ["hum", 35.14], ["music", 7.18]], [["music", 60.83], ["musical instrument", 5.58], ["speech", 5.37]], null, [["music", 42.44], ["didgeridoo", 14.38], ["theremin", 13.0]], [["music", 81.98], ["musical instrument", 1.88], ["singing", 1.21]], [["music", 66.86], ["throbbing", 10.23], ["electronic music", 3.38]], [["music", 56.13], ["hum", 14.97], ["throbbing", 13.48]], null, [["music", 59.11], ["throbbing", 12.5], ["hum", 7.22]], [["music", 73.64], ["musical instrument", 7.27], ["didgeridoo", 6.84]], null, null, null], "duration": [0.15, 0.09, 0.83, 1.85, 1.26, 1.42, 2.09, 0.55, 2.37, 2.12, 7.19, 5.49, 0.67, 2.79, 5.95, 15.45, 21.62, -0.12, 6.62, 5.72, 0.93, -0.11, 0.83]} \ No newline at end of file diff --git a/annotations_1/2k6F2WITgac_filtered.json b/annotations_1/2k6F2WITgac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ab7482cbe4c1dd68b7de68b0c98f18b39a05445 --- /dev/null +++ b/annotations_1/2k6F2WITgac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.97], [8.0, 9.41], [10.0, 12.8], [13.0, 13.68], [14.0, 14.54], [15.0, 15.77], [16.0, 16.87], [18.0, 18.91], [22.0, 24.33], [24.0, 29.27], [30.0, 31.11], [33.0, 41.49], [42.0, 42.5], [43.0, 43.48], [56.0, 57.43], [59.0, 60.39], [71.0, 71.85], [74.0, 82.59], [90.0, 89.99], [91.0, 91.07], [92.0, 94.37], [96.0, 98.31], [99.0, 101.85], [102.0, 101.92], [102.0, 102.52], [105.0, 106.32], [113.0, 114.86], [117.0, 120.95], [123.0, 124.23], [125.0, 127.57], [128.0, 128.6], [129.0, 130.44], [132.0, 136.65], [138.0, 138.4], [139.0, 140.64], [142.0, 143.68], [145.0, 149.5], [153.0, 152.58], [155.0, 156.02], [157.0, 158.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 56.78, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 93.29, 0.0, 59.33, 0.0, 0.0, 0.0, 0.0, 0.0, 59.24, 0.0, 0.0, 73.82, 94.95, 52.22, 0.0, 0.0, 0.0, 0.0, 84.62, 0.0, 84.98, 0.0, 0.0, 75.88, 0.0, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.03, 1.41, 2.8, 0.68, 0.54, 0.77, 0.87, 0.91, 2.33, 5.27, 1.11, 8.49, 0.5, 0.48, 1.43, 1.39, 0.85, 8.59, -0.01, 0.07, 2.37, 2.31, 2.85, -0.08, 0.52, 1.32, 1.86, 3.95, 1.23, 2.57, 0.6, 1.44, 4.65, 0.4, 1.64, 1.68, 4.5, -0.42, 1.02, 1.06]} \ No newline at end of file diff --git a/annotations_1/2kK1wyTEMUQ_filtered.json b/annotations_1/2kK1wyTEMUQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d505c05695a0ae0216cb5ff22df13418425a25e --- /dev/null +++ b/annotations_1/2kK1wyTEMUQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 40.59], [41.0, 42.65], [45.0, 45.89], [46.0, 47.93], [51.0, 51.83], [53.0, 53.79], [55.0, 70.46], [72.0, 78.29], [79.0, 83.19], [84.0, 84.55], [87.0, 89.33], [92.0, 94.26], [96.0, 98.39], [101.0, 102.22], [104.0, 104.33], [107.0, 107.38], [109.0, 109.63], [113.0, 117.39], [119.0, 120.5], [122.0, 123.72], [125.0, 149.01], [151.0, 153.3], [154.0, 154.55], [159.0, 158.89], [159.0, 161.54], [164.0, 166.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.03, 52.05, 43.51, 0.0, 70.44, 97.0, 57.4, 0.0, 0.0, 0.0, 0.0, 38.94, 0.0, 0.0, 30.52, 53.16, 0.0, 0.0, 77.7, 52.92], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 47.1], ["throbbing", 25.94], ["hum", 3.78]], null, [["music", 37.35], ["speech", 24.91], ["throbbing", 8.82]], null, null, null, null, null, null, null, null, [["hum", 30.16], ["music", 23.33], ["throbbing", 9.22]], null, null, [["music", 21.37], ["hum", 20.2], ["explosion", 19.68]], null, null, null, null, null], "duration": [38.59, 1.65, 0.89, 1.93, 0.83, 0.79, 15.46, 6.29, 4.19, 0.55, 2.33, 2.26, 2.39, 1.22, 0.33, 0.38, 0.63, 4.39, 1.5, 1.72, 24.01, 2.3, 0.55, -0.11, 2.54, 2.72]} \ No newline at end of file diff --git a/annotations_1/2kV2EVWNqXQ_filtered.json b/annotations_1/2kV2EVWNqXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6e8267be0c6a25f722bfed110c703bc50396c70 --- /dev/null +++ b/annotations_1/2kV2EVWNqXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.67], [10.0, 11.75], [12.0, 24.11], [25.0, 25.74], [27.0, 38.18], [41.0, 41.39], [50.0, 52.56]], "keep_status": [false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 41.48, 0.0, 38.91, 0.0, 41.32], "audiomae_on_audioset": [null, null, [["fly, housefly", 45.98], ["insect", 19.16], ["music", 8.56]], null, [["music", 53.36], ["speech", 12.64], ["buzz", 2.67]], null, [["speech", 11.63], ["whale vocalization", 9.65], ["electric shaver, electric razor", 8.45]]], "duration": [0.67, 1.75, 12.11, 0.74, 11.18, 0.39, 2.56]} \ No newline at end of file diff --git a/annotations_1/2kdSBZ2QieY_filtered.json b/annotations_1/2kdSBZ2QieY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50274fdda4fa88ed74f6e296c021170f89a89910 --- /dev/null +++ b/annotations_1/2kdSBZ2QieY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.69], [4.0, 10.74], [11.0, 13.95], [15.0, 15.63], [21.0, 23.13], [25.0, 26.16], [31.0, 31.65], [54.0, 54.51], [61.0, 61.96], [76.0, 76.47], [77.0, 79.37], [85.0, 90.66], [94.0, 113.34], [114.0, 120.73], [122.0, 129.71], [130.0, 135.63], [136.0, 141.47], [143.0, 154.01], [156.0, 172.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, true, false, false, true], "silence_prob": [100.0, 87.55, 74.6, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 30.62, 31.32, 35.06, 36.22, 36.16, 32.57, 43.13, 93.76, 35.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 17.25], ["pig", 9.09], ["mosquito", 6.27]], [["mosquito", 80.21], ["fly, housefly", 10.7], ["insect", 2.87]], [["gasp", 60.39], ["hiccup", 8.85], ["speech", 5.35]], [["sine wave", 44.9], ["singing bowl", 17.1], ["chirp tone", 7.96]], [["hum", 22.73], ["speech", 15.82], ["music", 11.27]], [["hum", 17.16], ["singing bowl", 15.49], ["mains hum", 8.44]], [["singing bowl", 56.79], ["sine wave", 15.08], ["tuning fork", 7.14]], null, [["thunk", 25.76], ["arrow", 17.73], ["hum", 11.33]]], "duration": [2.69, 6.74, 2.95, 0.63, 2.13, 1.16, 0.65, 0.51, 0.96, 0.47, 2.37, 5.66, 19.34, 6.73, 7.71, 5.63, 5.47, 11.01, 16.57]} \ No newline at end of file diff --git a/annotations_1/2l_mfcc2I8E_filtered.json b/annotations_1/2l_mfcc2I8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70670a2698aadd536f56678d073a02bd64cd35a4 --- /dev/null +++ b/annotations_1/2l_mfcc2I8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.98], [7.0, 19.67], [21.0, 36.15], [38.0, 38.28], [40.0, 41.4], [43.0, 44.61], [46.0, 47.41], [50.0, 50.7], [53.0, 66.5], [67.0, 85.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 76.7, 53.47, 0.0, 0.0, 0.0, 0.0, 0.0, 59.59, 67.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.98, 12.67, 15.15, 0.28, 1.4, 1.61, 1.41, 0.7, 13.5, 18.09]} \ No newline at end of file diff --git a/annotations_1/2lh1uIhuujc_filtered.json b/annotations_1/2lh1uIhuujc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab8bd61db8dad8ba2c7148b71c2dbe21796092cd --- /dev/null +++ b/annotations_1/2lh1uIhuujc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.07], [8.0, 8.82], [19.0, 19.52], [25.0, 25.51], [28.0, 29.13], [30.0, 31.33], [32.0, 32.26], [40.0, 40.24], [41.0, 42.65], [49.0, 49.18], [51.0, 50.84], [54.0, 55.38], [57.0, 58.46], [63.0, 62.7], [64.0, 65.26], [67.0, 68.12], [73.0, 74.63], [76.0, 78.88], [84.0, 85.7], [87.0, 88.16], [89.0, 90.29], [94.0, 95.4], [97.0, 98.41], [102.0, 102.51], [103.0, 109.61], [111.0, 112.6], [113.0, 114.52], [117.0, 118.34], [120.0, 124.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.07, 0.82, 0.52, 0.51, 1.13, 1.33, 0.26, 0.24, 1.65, 0.18, -0.16, 1.38, 1.46, -0.3, 1.26, 1.12, 1.63, 2.88, 1.7, 1.16, 1.29, 1.4, 1.41, 0.51, 6.61, 1.6, 1.52, 1.34, 4.01]} \ No newline at end of file diff --git a/annotations_1/2m-I23sWzEI_filtered.json b/annotations_1/2m-I23sWzEI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5251aaab60f3050cc9f0460c774bf6a0f49c43a7 --- /dev/null +++ b/annotations_1/2m-I23sWzEI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.86], [5.0, 5.7], [7.0, 10.25], [12.0, 12.75], [54.0, 54.65], [76.0, 78.97], [83.0, 83.56], [86.0, 85.99]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 95.09, 0.0, 0.0, 62.47, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.86, 0.7, 3.25, 0.75, 0.65, 2.97, 0.56, -0.01]} \ No newline at end of file diff --git a/annotations_1/2nclzm_QlLw_filtered.json b/annotations_1/2nclzm_QlLw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..233ac5bd9e3baa076377a1efaa150fc8c1df2f89 --- /dev/null +++ b/annotations_1/2nclzm_QlLw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.51], [9.0, 13.42], [15.0, 15.63], [16.0, 16.93], [19.0, 19.82], [22.0, 34.72], [38.0, 55.98], [58.0, 61.53], [63.0, 64.37], [67.0, 67.24], [70.0, 70.16], [71.0, 72.05], [77.0, 77.72], [80.0, 82.9], [84.0, 84.59], [86.0, 93.28], [95.0, 96.25], [99.0, 100.82], [102.0, 105.98], [107.0, 109.36], [111.0, 115.21], [116.0, 118.1], [118.0, 119.31], [120.0, 126.13], [128.0, 130.17], [133.0, 136.75], [140.0, 140.16], [143.0, 144.46], [146.0, 146.8], [147.0, 149.28]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 90.6, 0.0, 0.0, 0.0, 29.39, 35.4, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 81.89, 0.0, 0.0, 89.54, 93.76, 95.23, 97.83, 0.0, 68.8, 86.09, 32.92, 0.0, 0.0, 0.0, 45.49], "audiomae_on_audioset": [null, null, null, null, null, [["music", 54.4], ["didgeridoo", 4.71], ["thump, thud", 4.62]], [["buzz", 19.84], ["fart", 10.58], ["insect", 9.85]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["breaking", 56.26], ["crushing", 10.65], ["glass", 7.99]], null, null, null, [["sidetone", 30.82], ["speech", 27.82], ["chirp tone", 8.35]]], "duration": [0.51, 4.42, 0.63, 0.93, 0.82, 12.72, 17.98, 3.53, 1.37, 0.24, 0.16, 1.05, 0.72, 2.9, 0.59, 7.28, 1.25, 1.82, 3.98, 2.36, 4.21, 2.1, 1.31, 6.13, 2.17, 3.75, 0.16, 1.46, 0.8, 2.28]} \ No newline at end of file diff --git a/annotations_1/2oFuSvs-WU0_filtered.json b/annotations_1/2oFuSvs-WU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b68800931339b8f53f37c727e973c78f7868932 --- /dev/null +++ b/annotations_1/2oFuSvs-WU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.19], [6.0, 11.97], [19.0, 20.61], [29.0, 29.3], [35.0, 36.95], [39.0, 39.45], [41.0, 41.28], [48.0, 48.49], [50.0, 50.21], [56.0, 58.78], [62.0, 66.02], [73.0, 73.47], [79.0, 79.59], [81.0, 81.46], [87.0, 89.58], [92.0, 92.47], [93.0, 93.93], [99.0, 99.64], [102.0, 102.37], [109.0, 111.75], [114.0, 121.59], [122.0, 123.77], [125.0, 128.16], [129.0, 131.52], [136.0, 136.21], [137.0, 139.46], [141.0, 142.86], [145.0, 146.2]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [89.54, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.58, 100.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 51.12, 95.78, 0.0, 100.0, 99.99, 0.0, 98.51, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 39.58], ["carnatic music", 13.85], ["vocal music", 6.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.19, 5.97, 1.61, 0.3, 1.95, 0.45, 0.28, 0.49, 0.21, 2.78, 4.02, 0.47, 0.59, 0.46, 2.58, 0.47, 0.93, 0.64, 0.37, 2.75, 7.59, 1.77, 3.16, 2.52, 0.21, 2.46, 1.86, 1.2]} \ No newline at end of file diff --git a/annotations_1/2oLqQw8jHts_filtered.json b/annotations_1/2oLqQw8jHts_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c79f32d906995f59bd3fa59413a3725c611c89b1 --- /dev/null +++ b/annotations_1/2oLqQw8jHts_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.37], [8.0, 9.96], [13.0, 16.33], [17.0, 17.88], [19.0, 20.76], [22.0, 40.24], [41.0, 42.43], [43.0, 43.8], [45.0, 48.14], [49.0, 50.26], [53.0, 59.49], [60.0, 60.29], [64.0, 66.04], [68.0, 73.84], [78.0, 80.67], [86.0, 86.8], [87.0, 92.03], [95.0, 96.4], [97.0, 103.72], [104.0, 105.09], [108.0, 108.35], [109.0, 112.11], [115.0, 114.96], [119.0, 123.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.02, 0.0, 0.0, 99.16, 0.0, 0.0, 56.86, 0.0, 81.17, 0.0, 99.62, 54.3, 100.0, 0.0, 93.76, 0.0, 100.0, 0.0, 0.0, 92.15, 0.0, 98.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.37, 1.96, 3.33, 0.88, 1.76, 18.24, 1.43, 0.8, 3.14, 1.26, 6.49, 0.29, 2.04, 5.84, 2.67, 0.8, 5.03, 1.4, 6.72, 1.09, 0.35, 3.11, -0.04, 4.92]} \ No newline at end of file diff --git a/annotations_1/2pCUsMk0Zs0_filtered.json b/annotations_1/2pCUsMk0Zs0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9f40bad4bf97a60b9c8cc0e892d83b5285c8bcd --- /dev/null +++ b/annotations_1/2pCUsMk0Zs0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.71], [16.0, 16.44], [19.0, 19.23], [21.0, 26.15], [28.0, 32.59], [36.0, 36.85], [38.0, 38.15], [40.0, 41.17], [42.0, 43.56], [47.0, 54.57], [57.0, 57.15], [57.0, 62.63], [65.0, 66.78], [68.0, 72.55], [77.0, 84.87], [87.0, 97.41], [98.0, 104.79], [105.0, 125.22], [127.0, 127.31]], "keep_status": [false, false, false, true, true, false, false, false, false, true, false, true, false, true, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 38.93, 41.44, 0.0, 0.0, 0.0, 0.0, 42.53, 0.0, 37.03, 0.0, 35.62, 34.02, 34.74, 41.44, 34.26, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 41.72], ["hum", 9.43], ["mains hum", 4.85]], [["speech", 39.46], ["music", 20.59], ["noise", 4.77]], null, null, null, null, [["music", 27.44], ["speech", 7.28], ["oink", 6.25]], null, [["speech", 53.53], ["music", 11.63], ["fly, housefly", 4.63]], null, [["roaring cats (lions, tigers)", 15.37], ["wild animals", 13.51], ["music", 7.55]], [["speech", 43.05], ["music", 28.19], ["sidetone", 8.48]], [["music", 39.28], ["gong", 13.01], ["hum", 9.26]], [["music", 55.92], ["hum", 7.82], ["ambient music", 7.39]], [["music", 29.73], ["ambient music", 13.21], ["speech", 7.49]], null], "duration": [0.71, 0.44, 0.23, 5.15, 4.59, 0.85, 0.15, 1.17, 1.56, 7.57, 0.15, 5.63, 1.78, 4.55, 7.87, 10.41, 6.79, 20.22, 0.31]} \ No newline at end of file diff --git a/annotations_1/2pw_36yxgXI_filtered.json b/annotations_1/2pw_36yxgXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c362b6862740b5e71d332020bd6b6997088839ec --- /dev/null +++ b/annotations_1/2pw_36yxgXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.15], [5.0, 5.43], [6.0, 7.99], [10.0, 12.16], [13.0, 14.74], [16.0, 16.09], [17.0, 17.52], [19.0, 20.22], [21.0, 22.67], [24.0, 24.7], [28.0, 28.22], [29.0, 29.42], [30.0, 31.75], [32.0, 34.35], [40.0, 42.35], [48.0, 48.29], [51.0, 53.23], [58.0, 58.51], [59.0, 60.02], [66.0, 66.58], [72.0, 71.98], [77.0, 77.89], [81.0, 82.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.2, 45.27, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 31.86], ["moo", 20.07], ["insect", 14.2]], null, null, null, null, null, null, null, null], "duration": [1.15, 0.43, 1.99, 2.16, 1.74, 0.09, 0.52, 1.22, 1.67, 0.7, 0.22, 0.42, 1.75, 2.35, 2.35, 0.29, 2.23, 0.51, 1.02, 0.58, -0.02, 0.89, 1.22]} \ No newline at end of file diff --git a/annotations_1/2qyJ5r7Wink_filtered.json b/annotations_1/2qyJ5r7Wink_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1221b4f8fc2533de17e6a984be7a1dfe3339a67a --- /dev/null +++ b/annotations_1/2qyJ5r7Wink_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 25.57], [28.0, 91.74], [96.0, 102.02], [105.0, 105.93], [107.0, 123.15], [130.0, 131.09]], "keep_status": [false, false, false, false, false, false], "silence_prob": [36.61, 0.0, 31.33, 0.0, 32.57, 0.0], "audiomae_on_audioset": [[["hum", 35.36], ["throbbing", 22.84], ["music", 15.97]], null, [["speech", 51.73], ["music", 13.15], ["didgeridoo", 10.36]], null, [["throbbing", 45.39], ["music", 24.74], ["hum", 12.26]], null], "duration": [19.57, 63.74, 6.02, 0.93, 16.15, 1.09]} \ No newline at end of file diff --git a/annotations_1/2rFXR3_DeMU_filtered.json b/annotations_1/2rFXR3_DeMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d64cb96fd3b691d1836c89e779b23257ade30fc5 --- /dev/null +++ b/annotations_1/2rFXR3_DeMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 29.89]], "keep_status": [false], "silence_prob": [28.7], "audiomae_on_audioset": [[["music", 78.41], ["funny music", 4.95], ["air horn, truck horn", 2.98]]], "duration": [23.89]} \ No newline at end of file diff --git a/annotations_1/2rPDGz_0qvw_filtered.json b/annotations_1/2rPDGz_0qvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..753770ffc8978e55d4394df55d5610fed228b8a6 --- /dev/null +++ b/annotations_1/2rPDGz_0qvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.14], [16.0, 17.51], [18.0, 19.94], [22.0, 23.11], [25.0, 44.47], [46.0, 46.97], [47.0, 51.58], [55.0, 103.0], [109.0, 109.86], [110.0, 159.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.39, 0.0, 32.19, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 41.27], ["hum", 18.49], ["mains hum", 15.53]], null, [["music", 66.56], ["theremin", 6.05], ["musical instrument", 3.69]], null, null, null], "duration": [0.14, 1.51, 1.94, 1.11, 19.47, 0.97, 4.58, 48.0, 0.86, 49.92]} \ No newline at end of file diff --git a/annotations_1/2rSSxAdDhuU_filtered.json b/annotations_1/2rSSxAdDhuU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b75949ed590b98cc7eee09948c718654782ad197 --- /dev/null +++ b/annotations_1/2rSSxAdDhuU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.24], [14.0, 16.85], [18.0, 19.82], [21.0, 49.57], [55.0, 55.14], [56.0, 57.64], [68.0, 69.67], [70.0, 71.05], [76.0, 76.71], [81.0, 81.41], [87.0, 87.29], [95.0, 94.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.17, 30.76, 0.0, 29.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 30.8], ["music", 26.25], ["hum", 24.08]], [["music", 63.72], ["throbbing", 10.42], ["electronic music", 4.93]], null, [["music", 61.45], ["throbbing", 4.94], ["musical instrument", 4.88]], null, null, null, null, null, null, null, null], "duration": [5.24, 2.85, 1.82, 28.57, 0.14, 1.64, 1.67, 1.05, 0.71, 0.41, 0.29, -0.24]} \ No newline at end of file diff --git a/annotations_1/2rSnCcaMDdg_filtered.json b/annotations_1/2rSnCcaMDdg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e27e307f8430da2ba9b815e3077130a5a4c30369 --- /dev/null +++ b/annotations_1/2rSnCcaMDdg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 38.5], [40.0, 39.99], [41.0, 42.01], [43.0, 44.42], [46.0, 46.8], [49.0, 49.62], [51.0, 58.33], [60.0, 60.39], [61.0, 66.53], [86.0, 85.92], [87.0, 89.09], [101.0, 101.75], [107.0, 108.63], [111.0, 111.79], [116.0, 116.43], [118.0, 119.42], [121.0, 126.57]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.46, 0.0, 34.14, 0.0, 51.23, 0.0, 0.0, 0.0, 0.0, 0.0, 31.26], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 32.88], ["vehicle", 10.05], ["crowd", 6.04]], null, [["cattle, bovinae", 38.29], ["moo", 27.85], ["livestock, farm animals, working animals", 17.63]], null, null, null, null, null, null, null, [["whale vocalization", 18.64], ["crowd", 8.71], ["sound effect", 5.43]]], "duration": [0.5, -0.01, 1.01, 1.42, 0.8, 0.62, 7.33, 0.39, 5.53, -0.08, 2.09, 0.75, 1.63, 0.79, 0.43, 1.42, 5.57]} \ No newline at end of file diff --git a/annotations_1/2r_EHD8QVYg_filtered.json b/annotations_1/2r_EHD8QVYg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62b203f846209b5f0734a26bcefed936fe29be6f --- /dev/null +++ b/annotations_1/2r_EHD8QVYg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.07], [3.0, 4.14], [9.0, 12.68], [14.0, 15.33], [17.0, 22.74], [25.0, 26.55], [28.0, 30.03], [31.0, 34.05], [35.0, 35.9], [37.0, 50.33], [51.0, 58.89], [63.0, 64.27], [68.0, 67.91], [69.0, 70.24], [73.0, 74.29], [77.0, 77.48], [78.0, 78.7], [81.0, 82.05], [84.0, 84.72], [86.0, 86.48], [91.0, 96.04], [97.0, 100.87], [102.0, 102.69], [107.0, 107.65], [109.0, 110.76], [114.0, 113.71], [116.0, 115.97], [118.0, 119.72], [120.0, 121.22], [124.0, 124.92], [126.0, 126.42], [128.0, 127.94], [131.0, 135.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.91, 0.0, 51.82, 0.0, 50.76, 50.36, 0.0, 37.65, 33.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 34.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["animal", 34.27], ["horse", 29.82], ["clip-clop", 28.85]], [["speech", 28.91], ["hum", 10.73], ["eruption", 9.08]], null, null, null, null, null, null, null, null, null, null, [["speech", 25.93], ["sidetone", 15.08], ["hum", 13.78]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.07, 1.14, 3.68, 1.33, 5.74, 1.55, 2.03, 3.05, 0.9, 13.33, 7.89, 1.27, -0.09, 1.24, 1.29, 0.48, 0.7, 1.05, 0.72, 0.48, 5.04, 3.87, 0.69, 0.65, 1.76, -0.29, -0.03, 1.72, 1.22, 0.92, 0.42, -0.06, 4.48]} \ No newline at end of file diff --git a/annotations_1/2sX5DMSCipI_filtered.json b/annotations_1/2sX5DMSCipI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1463e0faccd30f87ac4b546f9b32def289d90a97 --- /dev/null +++ b/annotations_1/2sX5DMSCipI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 24.93], [26.0, 26.38], [26.0, 28.66], [38.0, 41.61], [43.0, 43.16], [46.0, 54.94], [55.0, 55.02], [57.0, 64.12], [69.0, 81.24], [82.0, 92.72], [96.0, 96.58], [99.0, 99.93], [102.0, 107.06]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, true], "silence_prob": [31.62, 0.0, 56.18, 98.59, 0.0, 37.24, 0.0, 31.51, 47.12, 41.72, 0.0, 0.0, 34.61], "audiomae_on_audioset": [[["speech", 50.01], ["music", 30.75], ["didgeridoo", 3.0]], null, null, null, null, [["music", 31.19], ["hum", 21.66], ["speech", 14.19]], null, [["music", 48.37], ["speech", 28.14], ["throbbing", 3.07]], [["music", 34.09], ["hum", 29.43], ["mains hum", 7.67]], [["music", 18.83], ["throbbing", 16.63], ["hum", 10.43]], null, null, [["theremin", 23.6], ["music", 13.25], ["speech", 11.84]]], "duration": [20.93, 0.38, 2.66, 3.61, 0.16, 8.94, 0.02, 7.12, 12.24, 10.72, 0.58, 0.93, 5.06]} \ No newline at end of file diff --git a/annotations_1/2tqG6KMgyv8_filtered.json b/annotations_1/2tqG6KMgyv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c5da22f16456880cfd6fd9f256faf8fdabfda09 --- /dev/null +++ b/annotations_1/2tqG6KMgyv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.99], [16.0, 15.96], [16.0, 18.08], [27.0, 27.55], [37.0, 38.04], [47.0, 47.78], [51.0, 52.1], [53.0, 54.85], [59.0, 59.9], [74.0, 75.19], [86.0, 85.78], [86.0, 86.88], [115.0, 118.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9], "audiomae_on_audioset": [null, null, [["music", 74.23], ["boing", 7.0], ["animal", 1.78]], null, null, null, null, null, null, null, null, null, null], "duration": [0.99, -0.04, 2.08, 0.55, 1.04, 0.78, 1.1, 1.85, 0.9, 1.19, -0.22, 0.88, 3.37]} \ No newline at end of file diff --git a/annotations_1/2uZV27BttLM_filtered.json b/annotations_1/2uZV27BttLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2246f366e389c8b329ead5eb0e3ba3fa13971b0 --- /dev/null +++ b/annotations_1/2uZV27BttLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 59.32], [63.0, 84.42], [88.0, 109.95], [112.0, 113.66], [116.0, 117.69], [118.0, 119.57], [121.0, 120.93], [127.0, 126.62], [130.0, 129.88], [134.0, 134.23], [139.0, 140.19], [143.0, 150.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.55, 30.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.93], "audiomae_on_audioset": [null, [["music", 69.95], ["boom", 4.1], ["gunshot, gunfire", 3.03]], [["speech", 38.21], ["music", 37.52], ["hum", 3.49]], null, null, null, null, null, null, null, null, [["music", 46.33], ["throbbing", 25.12], ["hum", 13.14]]], "duration": [36.32, 21.42, 21.95, 1.66, 1.69, 1.57, -0.07, -0.38, -0.12, 0.23, 1.19, 7.2]} \ No newline at end of file diff --git a/annotations_1/2vIINq7m10Q_filtered.json b/annotations_1/2vIINq7m10Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..278b5c1b220310d10898faffae5c3656fff29542 --- /dev/null +++ b/annotations_1/2vIINq7m10Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.96], [13.0, 20.09], [22.0, 28.66], [34.0, 36.1], [37.0, 37.12], [42.0, 77.11], [80.0, 80.67], [87.0, 88.2], [91.0, 96.65], [99.0, 110.12], [110.0, 120.48]], "keep_status": [false, false, true, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 29.31, 29.09, 29.22, 0.0, 0.0, 0.0, 0.0, 29.17, 30.01, 29.78], "audiomae_on_audioset": [null, [["boing", 57.12], ["music", 26.78], ["speech", 5.28]], [["vehicle", 15.31], ["music", 13.74], ["speech", 11.37]], [["music", 15.18], ["speech", 14.83], ["animal", 6.16]], null, null, null, null, [["music", 35.87], ["speech", 17.94], ["fart", 6.03]], [["music", 79.92], ["boing", 4.07], ["speech", 1.8]], [["music", 52.1], ["boing", 32.52], ["speech", 2.77]]], "duration": [-0.04, 7.09, 6.66, 2.1, 0.12, 35.11, 0.67, 1.2, 5.65, 11.12, 10.48]} \ No newline at end of file diff --git a/annotations_1/2vJOE2qvIEM_filtered.json b/annotations_1/2vJOE2qvIEM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a74653e2a66436dc9162f2da10e74f50a73d1ae0 --- /dev/null +++ b/annotations_1/2vJOE2qvIEM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.39], [6.0, 6.35], [13.0, 14.23], [20.0, 21.03], [22.0, 22.62], [24.0, 24.04], [26.0, 27.13], [30.0, 30.69], [34.0, 34.16], [38.0, 38.6], [41.0, 41.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 0.35, 1.23, 1.03, 0.62, 0.04, 1.13, 0.69, 0.16, 0.6, 0.86]} \ No newline at end of file diff --git a/annotations_1/2vbGcYm8u1o_filtered.json b/annotations_1/2vbGcYm8u1o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa217d32c01e74a3677b746e429ae49232755550 --- /dev/null +++ b/annotations_1/2vbGcYm8u1o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.99], [6.0, 7.13], [8.0, 10.49], [11.0, 13.69], [15.0, 19.94], [21.0, 24.02], [27.0, 33.22], [35.0, 40.27], [41.0, 42.15], [43.0, 52.86], [55.0, 55.86], [57.0, 58.95], [61.0, 61.96], [64.0, 65.82], [67.0, 68.32], [71.0, 72.06], [74.0, 75.46], [78.0, 79.27], [82.0, 82.61], [85.0, 86.31], [87.0, 87.71], [89.0, 90.36], [92.0, 97.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.89, 0.0, 71.57, 56.78, 99.84, 79.59, 67.51, 99.85, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.99, 1.13, 2.49, 2.69, 4.94, 3.02, 6.22, 5.27, 1.15, 9.86, 0.86, 1.95, 0.96, 1.82, 1.32, 1.06, 1.46, 1.27, 0.61, 1.31, 0.71, 1.36, 5.43]} \ No newline at end of file diff --git a/annotations_1/2vi_VeRSHbM_filtered.json b/annotations_1/2vi_VeRSHbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a177e916f2cba5800dd4edcd65e2bf9359d82eb9 --- /dev/null +++ b/annotations_1/2vi_VeRSHbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 33.86], [42.0, 46.87], [47.0, 47.88], [64.0, 68.91], [70.0, 71.32], [72.0, 78.0], [82.0, 93.16], [97.0, 112.08], [113.0, 114.18], [117.0, 119.37], [121.0, 121.68]], "keep_status": [true, true, false, false, false, true, true, true, false, true, false], "silence_prob": [32.23, 34.83, 0.0, 53.91, 0.0, 45.05, 41.36, 33.27, 0.0, 34.97, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 16.28], ["fly, housefly", 10.87], ["insect", 6.87]], [["fly, housefly", 11.75], ["radio", 8.34], ["mosquito", 8.16]], null, null, null, [["mains hum", 17.19], ["music", 16.2], ["hum", 15.22]], [["music", 31.68], ["mains hum", 10.01], ["musical instrument", 6.3]], [["music", 25.46], ["hum", 22.78], ["mains hum", 10.43]], null, [["music", 57.42], ["throbbing", 3.39], ["didgeridoo", 2.93]], null], "duration": [11.86, 4.87, 0.88, 4.91, 1.32, 6.0, 11.16, 15.08, 1.18, 2.37, 0.68]} \ No newline at end of file diff --git a/annotations_1/2yWYCKoqKmE_filtered.json b/annotations_1/2yWYCKoqKmE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db00387e26f2b443ada3f7aae2febfeb6ecc2919 --- /dev/null +++ b/annotations_1/2yWYCKoqKmE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [9.0, 10.08], [11.0, 11.97], [13.0, 13.73], [16.0, 16.24], [17.0, 17.64], [19.0, 19.7], [22.0, 25.32], [26.0, 26.77], [27.0, 27.82], [30.0, 37.86], [40.0, 40.64], [45.0, 45.64], [49.0, 52.57], [56.0, 61.15], [62.0, 69.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.07, 0.0, 0.0, 42.72, 0.0, 0.0, 93.76, 86.45, 31.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["mains hum", 49.14], ["hum", 35.76], ["music", 1.78]], null, null, null, null, [["explosion", 33.26], ["speech", 17.36], ["fly, housefly", 10.71]]], "duration": [0.51, 1.08, 0.97, 0.73, 0.24, 0.64, 0.7, 3.32, 0.77, 0.82, 7.86, 0.64, 0.64, 3.57, 5.15, 7.36]} \ No newline at end of file diff --git a/annotations_1/2yZlrJWBLac_filtered.json b/annotations_1/2yZlrJWBLac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e20cfa167b09091a666ab7ac823fd631cc63c124 --- /dev/null +++ b/annotations_1/2yZlrJWBLac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.38], [4.0, 4.87], [8.0, 29.51], [30.0, 31.77], [33.0, 35.83], [39.0, 39.58], [40.0, 41.98], [43.0, 44.1], [45.0, 46.7], [47.0, 48.64], [50.0, 51.43], [56.0, 58.31], [59.0, 59.76], [65.0, 65.01], [69.0, 71.49], [72.0, 77.01], [78.0, 81.21], [97.0, 101.53], [105.0, 105.02], [116.0, 116.29], [118.0, 119.87], [121.0, 122.69], [125.0, 130.69], [131.0, 132.48]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [42.72, 0.0, 47.2, 0.0, 81.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0, 89.9, 66.88, 87.37, 36.11, 0.0, 0.0, 0.0, 0.0, 95.78, 0.0], "audiomae_on_audioset": [[["music", 17.8], ["radio", 5.59], ["frog", 4.06]], null, [["livestock, farm animals, working animals", 13.59], ["animal", 11.68], ["hum", 8.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.69], ["sidetone", 26.63], ["radio", 13.14]], null, null, null, null, null, null], "duration": [2.38, 0.87, 21.51, 1.77, 2.83, 0.58, 1.98, 1.1, 1.7, 1.64, 1.43, 2.31, 0.76, 0.01, 2.49, 5.01, 3.21, 4.53, 0.02, 0.29, 1.87, 1.69, 5.69, 1.48]} \ No newline at end of file diff --git a/annotations_1/2ycw0UUyCm0_filtered.json b/annotations_1/2ycw0UUyCm0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ce93f1adb74aebcce33e625af50a97f5d4598ea --- /dev/null +++ b/annotations_1/2ycw0UUyCm0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.9], [14.0, 19.87], [20.0, 23.5], [25.0, 25.93], [27.0, 28.51], [29.0, 29.89], [43.0, 53.38], [57.0, 56.56], [57.0, 85.83], [87.0, 99.57], [101.0, 105.9], [107.0, 144.24], [147.0, 149.18], [155.0, 158.3], [161.0, 165.25], [166.0, 167.44], [168.0, 168.34]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, true, true, true, false, false], "silence_prob": [55.96, 31.96, 34.29, 0.0, 0.0, 0.0, 41.24, 0.0, 29.67, 29.48, 30.32, 0.0, 28.98, 28.94, 33.62, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 49.96], ["whale vocalization", 13.12], ["music", 10.71]], [["music", 43.63], ["whale vocalization", 23.17], ["didgeridoo", 4.03]], null, null, null, [["music", 35.72], ["speech", 34.69], ["sidetone", 5.06]], null, [["music", 34.07], ["speech", 19.37], ["electric shaver, electric razor", 8.07]], [["speech", 33.96], ["music", 23.59], ["thump, thud", 5.92]], [["music", 58.91], ["throbbing", 9.54], ["mains hum", 5.42]], null, [["music", 26.5], ["whack, thwack", 16.9], ["speech", 6.46]], [["rumble", 47.3], ["hum", 9.96], ["whoosh, swoosh, swish", 5.72]], [["hum", 43.11], ["rumble", 13.47], ["whale vocalization", 10.71]], null, null], "duration": [3.9, 5.87, 3.5, 0.93, 1.51, 0.89, 10.38, -0.44, 28.83, 12.57, 4.9, 37.24, 2.18, 3.3, 4.25, 1.44, 0.34]} \ No newline at end of file diff --git a/annotations_1/2zHHkSu1br4_filtered.json b/annotations_1/2zHHkSu1br4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab6981ce67e53365e52417fe78ea2873659e56e9 --- /dev/null +++ b/annotations_1/2zHHkSu1br4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.21], [19.0, 22.71], [42.0, 41.98], [48.0, 47.93], [55.0, 55.56], [56.0, 60.07], [61.0, 67.85], [83.0, 83.39], [92.0, 92.8], [94.0, 94.29], [97.0, 97.14], [98.0, 99.91], [104.0, 105.54], [107.0, 109.59], [111.0, 112.36], [114.0, 117.59], [118.0, 118.29], [118.0, 118.32], [120.0, 126.54], [131.0, 131.55], [136.0, 138.55], [141.0, 141.76], [143.0, 143.58], [144.0, 144.83]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false], "silence_prob": [34.82, 29.73, 0.0, 0.0, 0.0, 32.68, 28.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.44, 0.0, 29.53, 0.0, 0.0, 32.46, 0.0, 29.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 68.25], ["didgeridoo", 2.4], ["musical instrument", 2.07]], [["livestock, farm animals, working animals", 48.96], ["moo", 12.34], ["cattle, bovinae", 11.66]], null, null, null, [["music", 37.59], ["synthesizer", 8.53], ["echo", 6.97]], [["music", 84.21], ["foghorn", 1.54], ["musical instrument", 1.22]], null, null, null, null, null, null, null, null, [["music", 29.29], ["noise", 9.68], ["buzz", 8.38]], null, null, [["music", 32.22], ["throbbing", 16.12], ["hum", 12.33]], null, [["music", 40.14], ["throbbing", 5.34], ["creak", 4.82]], null, null, null], "duration": [2.21, 3.71, -0.02, -0.07, 0.56, 4.07, 6.85, 0.39, 0.8, 0.29, 0.14, 1.91, 1.54, 2.59, 1.36, 3.59, 0.29, 0.32, 6.54, 0.55, 2.55, 0.76, 0.58, 0.83]} \ No newline at end of file diff --git a/annotations_1/2zSE8r8jU_U_filtered.json b/annotations_1/2zSE8r8jU_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..763eff10171139bf08111fb1ff1a4a6fcfcf0e22 --- /dev/null +++ b/annotations_1/2zSE8r8jU_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.12], [6.0, 6.66], [8.0, 22.64], [24.0, 25.41], [26.0, 27.28], [29.0, 31.18], [32.0, 43.16], [46.0, 46.62], [48.0, 52.14], [53.0, 65.23], [69.0, 69.69], [70.0, 72.84], [74.0, 74.24], [75.0, 76.11], [77.0, 78.14], [81.0, 81.33], [83.0, 121.8], [122.0, 122.94], [124.0, 124.87], [127.0, 127.58], [131.0, 131.36], [133.0, 137.94], [138.0, 138.06], [140.0, 141.79], [143.0, 143.04], [144.0, 153.27], [154.0, 164.0], [165.0, 164.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 90.6, 0.0, 0.0, 99.87, 68.28, 0.0, 68.41, 93.45, 0.0, 95.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 98.19, 52.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.12, 0.66, 14.64, 1.41, 1.28, 2.18, 11.16, 0.62, 4.14, 12.23, 0.69, 2.84, 0.24, 1.11, 1.14, 0.33, 38.8, 0.94, 0.87, 0.58, 0.36, 4.94, 0.06, 1.79, 0.04, 9.27, 10.0, -0.06]} \ No newline at end of file diff --git a/annotations_1/30IrWTTMWos_filtered.json b/annotations_1/30IrWTTMWos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..837d431675b67a7c2faf835eb43b59495a55350e --- /dev/null +++ b/annotations_1/30IrWTTMWos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.44], [4.0, 9.86], [12.0, 13.88], [21.0, 21.3], [25.0, 28.46], [38.0, 41.35], [43.0, 43.5], [44.0, 45.98], [47.0, 50.58], [52.0, 53.84], [55.0, 58.51], [60.0, 66.56], [74.0, 75.98], [84.0, 85.94], [95.0, 96.6], [115.0, 118.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 97.11, 100.0, 0.0, 0.0, 100.0, 0.0, 99.21, 39.25, 0.0, 0.0, 0.0, 30.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 53.85], ["piano", 9.42], ["keyboard (musical)", 8.46]], null, null, null, [["music", 69.78], ["musical instrument", 3.73], ["didgeridoo", 2.34]]], "duration": [1.44, 5.86, 1.88, 0.3, 3.46, 3.35, 0.5, 1.98, 3.58, 1.84, 3.51, 6.56, 1.98, 1.94, 1.6, 3.99]} \ No newline at end of file diff --git a/annotations_1/30VlDItRAVk_filtered.json b/annotations_1/30VlDItRAVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a0aeede1af7d3c6e37daaa7c23ee1deb4c503b6 --- /dev/null +++ b/annotations_1/30VlDItRAVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.74], [25.0, 26.2], [27.0, 36.69], [39.0, 40.51], [43.0, 44.58], [51.0, 67.2], [68.0, 74.8], [76.0, 77.26], [79.0, 81.62], [84.0, 95.44], [95.0, 104.08], [105.0, 125.71], [137.0, 140.49], [144.0, 147.06], [148.0, 149.57], [151.0, 158.21], [162.0, 164.29]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, true, false, false, true], "silence_prob": [55.89, 0.0, 31.83, 0.0, 0.0, 31.09, 29.67, 0.0, 31.36, 30.95, 30.36, 29.96, 31.87, 33.41, 0.0, 28.95, 31.66], "audiomae_on_audioset": [null, null, [["music", 66.47], ["hum", 9.31], ["speech", 6.07]], null, null, [["music", 69.19], ["throbbing", 5.01], ["didgeridoo", 3.23]], [["music", 68.21], ["groan", 3.89], ["throbbing", 2.93]], null, [["music", 45.2], ["throbbing", 19.36], ["techno", 2.52]], [["music", 64.27], ["throbbing", 7.23], ["hum", 3.32]], [["music", 62.87], ["speech", 6.57], ["foghorn", 4.78]], [["music", 41.8], ["speech", 13.63], ["hum", 6.37]], [["cattle, bovinae", 38.23], ["moo", 26.46], ["livestock, farm animals, working animals", 20.85]], [["music", 42.21], ["sitar", 7.29], ["scary music", 6.88]], null, [["music", 54.53], ["theremin", 12.9], ["hum", 7.48]], [["music", 43.3], ["theremin", 7.67], ["musical instrument", 2.91]]], "duration": [4.74, 1.2, 9.69, 1.51, 1.58, 16.2, 6.8, 1.26, 2.62, 11.44, 9.08, 20.71, 3.49, 3.06, 1.57, 7.21, 2.29]} \ No newline at end of file diff --git a/annotations_1/318L0jBVIKM_filtered.json b/annotations_1/318L0jBVIKM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e08c2de204cdb957a21232cac5462f06aa23ae9 --- /dev/null +++ b/annotations_1/318L0jBVIKM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.01], [8.0, 9.66], [14.0, 15.3], [19.0, 19.85], [25.0, 26.06], [27.0, 30.0], [35.0, 36.09], [43.0, 43.7], [47.0, 49.13], [50.0, 50.97], [51.0, 60.1], [61.0, 63.32], [70.0, 71.93], [75.0, 104.89], [106.0, 107.37], [109.0, 110.42], [112.0, 116.19], [117.0, 119.8], [120.0, 134.47], [136.0, 136.98], [138.0, 170.31], [173.0, 174.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 66.15, 0.0, 0.0, 56.4, 0.0, 42.39, 54.9, 0.0, 41.38, 0.0, 0.0, 50.51, 43.61, 38.17, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 52.06], ["speech", 27.36], ["didgeridoo", 3.84]], null, null, [["music", 42.37], ["synthesizer", 9.23], ["throbbing", 4.33]], null, null, null, [["music", 62.95], ["didgeridoo", 3.86], ["synthesizer", 3.75]], [["music", 78.18], ["synthetic singing", 2.64], ["male singing", 1.7]], null, null, null], "duration": [0.01, 1.66, 1.3, 0.85, 1.06, 3.0, 1.09, 0.7, 2.13, 0.97, 9.1, 2.32, 1.93, 29.89, 1.37, 1.42, 4.19, 2.8, 14.47, 0.98, 32.31, 1.66]} \ No newline at end of file diff --git a/annotations_1/31LlQhZmSYs_filtered.json b/annotations_1/31LlQhZmSYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ac88f4b029f1bff3245cded7d3d2b07dc6e6547 --- /dev/null +++ b/annotations_1/31LlQhZmSYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 14.66], [17.0, 21.83], [22.0, 22.94], [24.0, 24.48], [24.0, 29.81], [36.0, 39.56], [42.0, 43.98], [49.0, 49.05], [51.0, 51.48], [62.0, 62.73], [65.0, 65.15], [67.0, 67.53], [69.0, 69.18], [71.0, 72.15], [74.0, 75.25], [77.0, 77.03], [79.0, 90.12]], "keep_status": [false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [31.71, 32.3, 0.0, 0.0, 32.43, 37.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.36], "audiomae_on_audioset": [[["music", 46.15], ["theremin", 19.24], ["hum", 6.04]], [["moo", 19.42], ["livestock, farm animals, working animals", 17.08], ["speech", 15.62]], null, null, [["speech", 16.98], ["music", 16.56], ["fly, housefly", 7.48]], [["music", 38.18], ["speech", 22.53], ["hum", 6.19]], null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 19.5], ["cattle, bovinae", 11.75], ["whack, thwack", 10.84]]], "duration": [14.66, 4.83, 0.94, 0.48, 5.81, 3.56, 1.98, 0.05, 0.48, 0.73, 0.15, 0.53, 0.18, 1.15, 1.25, 0.03, 11.12]} \ No newline at end of file diff --git a/annotations_1/31fx9aF04ww_filtered.json b/annotations_1/31fx9aF04ww_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8853abedade263e5928440080b216b6002acc767 --- /dev/null +++ b/annotations_1/31fx9aF04ww_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 69.23], [70.0, 71.54]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [68.23, 1.54]} \ No newline at end of file diff --git a/annotations_1/31sP1-4GgsA_filtered.json b/annotations_1/31sP1-4GgsA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6503095f156f7adb73e2197410d418ba116ebbb4 --- /dev/null +++ b/annotations_1/31sP1-4GgsA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.76], [15.0, 47.66], [48.0, 88.82], [89.0, 104.68], [108.0, 116.9]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 33.54, 32.61], "audiomae_on_audioset": [null, null, null, [["music", 41.42], ["hum", 14.66], ["throbbing", 7.41]], [["music", 63.73], ["hum", 8.26], ["electronic music", 3.58]]], "duration": [1.76, 32.66, 40.82, 15.68, 8.9]} \ No newline at end of file diff --git a/annotations_1/31vkz05skoc_filtered.json b/annotations_1/31vkz05skoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb1eb0175d87f14c482df072ad01406125e4d5ce --- /dev/null +++ b/annotations_1/31vkz05skoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.98], [4.0, 5.22], [6.0, 6.15], [7.0, 9.88], [11.0, 11.99], [12.0, 13.73], [17.0, 23.7], [24.0, 25.73], [27.0, 27.11], [29.0, 30.11], [33.0, 34.15], [37.0, 37.66], [42.0, 43.65], [48.0, 60.07], [61.0, 65.11], [74.0, 75.61], [78.0, 80.91], [81.0, 82.22], [83.0, 84.03], [86.0, 86.7], [90.0, 91.0], [95.0, 98.24], [103.0, 104.23], [112.0, 113.21], [117.0, 121.09], [124.0, 127.65], [131.0, 130.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.92, 100.0, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 33.16, 0.0, 0.0, 36.87, 38.35, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 57.78], ["synthetic singing", 7.14], ["singing", 3.95]], null, null, [["music", 68.43], ["speech", 10.34], ["didgeridoo", 7.0]], [["music", 36.63], ["didgeridoo", 30.23], ["theremin", 5.66]], null], "duration": [0.98, 1.22, 0.15, 2.88, 0.99, 1.73, 6.7, 1.73, 0.11, 1.11, 1.15, 0.66, 1.65, 12.07, 4.11, 1.61, 2.91, 1.22, 1.03, 0.7, 1.0, 3.24, 1.23, 1.21, 4.09, 3.65, -0.06]} \ No newline at end of file diff --git a/annotations_1/326RvY72nmE_filtered.json b/annotations_1/326RvY72nmE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..543984fad8101c575aa955e60dbd4c65d008486a --- /dev/null +++ b/annotations_1/326RvY72nmE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.39], [7.0, 7.62], [11.0, 11.3], [15.0, 17.0], [18.0, 21.51], [23.0, 23.14], [24.0, 26.05], [31.0, 32.54], [35.0, 35.14], [36.0, 35.9], [37.0, 37.12], [38.0, 40.37], [44.0, 46.18], [49.0, 52.52], [54.0, 55.05], [61.0, 62.01], [66.0, 66.83], [68.0, 67.98], [68.0, 70.24], [80.0, 82.11], [83.0, 83.42], [84.0, 85.13], [89.0, 92.72], [95.0, 102.76], [103.0, 107.59], [112.0, 114.62], [116.0, 116.7], [120.0, 134.72], [135.0, 136.32], [138.0, 139.73], [147.0, 146.94], [148.0, 148.41], [151.0, 155.43]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [56.78, 0.0, 0.0, 90.25, 38.82, 0.0, 41.32, 0.0, 0.0, 0.0, 0.0, 99.93, 99.59, 100.0, 0.0, 0.0, 0.0, 0.0, 99.31, 100.0, 0.0, 0.0, 100.0, 74.44, 68.28, 92.64, 0.0, 69.88, 0.0, 0.0, 0.0, 0.0, 43.33], "audiomae_on_audioset": [null, null, null, null, [["noise", 17.67], ["mains hum", 9.67], ["hum", 9.43]], null, [["vehicle", 13.18], ["insect", 5.82], ["fly, housefly", 5.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.33], ["speech", 8.48], ["throbbing", 6.86]]], "duration": [4.39, 0.62, 0.3, 2.0, 3.51, 0.14, 2.05, 1.54, 0.14, -0.1, 0.12, 2.37, 2.18, 3.52, 1.05, 1.01, 0.83, -0.02, 2.24, 2.11, 0.42, 1.13, 3.72, 7.76, 4.59, 2.62, 0.7, 14.72, 1.32, 1.73, -0.06, 0.41, 4.43]} \ No newline at end of file diff --git a/annotations_1/32Fz-BBjVXs_filtered.json b/annotations_1/32Fz-BBjVXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..777c684c81ea44952395696ccbac9a8e08b0caa5 --- /dev/null +++ b/annotations_1/32Fz-BBjVXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.61], [15.0, 15.09], [15.0, 15.87], [18.0, 19.21], [24.0, 24.93], [26.0, 29.42], [31.0, 33.49], [35.0, 35.83], [36.0, 37.94], [38.0, 39.11], [40.0, 41.03], [48.0, 48.73], [51.0, 62.55], [64.0, 64.66], [67.0, 67.96], [68.0, 68.08], [69.0, 71.44], [75.0, 76.79], [79.0, 79.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.62, 0.0, 0.0, 0.0, 0.0, 88.46, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 64.29, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.61, 0.09, 0.87, 1.21, 0.93, 3.42, 2.49, 0.83, 1.94, 1.11, 1.03, 0.73, 11.55, 0.66, 0.96, 0.08, 2.44, 1.79, 0.39]} \ No newline at end of file diff --git a/annotations_1/32I5RODje3o_filtered.json b/annotations_1/32I5RODje3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95213422da9118551efcf887d316c6683ceddd1f --- /dev/null +++ b/annotations_1/32I5RODje3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.82], [5.0, 5.16], [5.0, 6.13], [9.0, 9.27], [11.0, 11.72], [15.0, 15.04], [28.0, 28.48], [37.0, 38.1], [52.0, 53.01], [54.0, 55.36], [57.0, 57.4], [60.0, 60.45], [61.0, 61.57], [63.0, 63.88], [66.0, 69.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.82, 0.16, 1.13, 0.27, 0.72, 0.04, 0.48, 1.1, 1.01, 1.36, 0.4, 0.45, 0.57, 0.88, 3.77]} \ No newline at end of file diff --git a/annotations_1/32OSGQmjP1Y_filtered.json b/annotations_1/32OSGQmjP1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b7b169167e8fcea508c0200a07354740de82e32 --- /dev/null +++ b/annotations_1/32OSGQmjP1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.11], [11.0, 21.3], [24.0, 24.36], [26.0, 27.85], [30.0, 32.73], [33.0, 40.51], [66.0, 73.75], [77.0, 87.44], [90.0, 95.99], [100.0, 100.13], [100.0, 104.67], [107.0, 113.37], [114.0, 124.5]], "keep_status": [false, true, false, false, true, true, true, false, true, false, true, false, true], "silence_prob": [31.1, 30.19, 0.0, 0.0, 31.95, 33.92, 30.8, 31.7, 29.8, 0.0, 30.02, 30.6, 29.33], "audiomae_on_audioset": [[["music", 36.23], ["didgeridoo", 26.17], ["speech", 7.99]], [["music", 54.63], ["speech", 5.26], ["fly, housefly", 4.27]], null, null, [["speech", 37.6], ["music", 24.09], ["creak", 3.09]], [["whack, thwack", 40.55], ["speech", 11.76], ["boing", 7.13]], [["music", 29.91], ["fly, housefly", 16.24], ["mosquito", 14.7]], [["moo", 35.51], ["livestock, farm animals, working animals", 34.57], ["cattle, bovinae", 14.07]], [["music", 23.96], ["throbbing", 12.45], ["mosquito", 8.2]], null, [["music", 48.9], ["speech", 16.21], ["rumble", 4.47]], [["speech", 71.81], ["fart", 7.18], ["music", 6.95]], [["music", 43.47], ["musical instrument", 7.73], ["hum", 6.15]]], "duration": [6.11, 10.3, 0.36, 1.85, 2.73, 7.51, 7.75, 10.44, 5.99, 0.13, 4.67, 6.37, 10.5]} \ No newline at end of file diff --git a/annotations_1/32iBCneCYcI_filtered.json b/annotations_1/32iBCneCYcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cec6bd84e226316789a7a5b5d74284c438feb584 --- /dev/null +++ b/annotations_1/32iBCneCYcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 30.06], [30.0, 37.12], [38.0, 63.19], [65.0, 80.76], [81.0, 93.34], [94.0, 96.08], [97.0, 133.74], [134.0, 156.68], [158.0, 164.76]], "keep_status": [true, true, false, false, false, true, false, false, true], "silence_prob": [29.19, 29.58, 29.46, 30.71, 30.14, 31.94, 0.0, 53.28, 43.4], "audiomae_on_audioset": [[["whack, thwack", 36.87], ["hum", 13.41], ["music", 9.35]], [["speech", 29.36], ["fart", 8.02], ["livestock, farm animals, working animals", 5.79]], [["speech", 56.28], ["music", 12.45], ["whack, thwack", 2.71]], [["music", 34.37], ["hum", 29.36], ["mains hum", 13.21]], [["speech", 46.58], ["music", 23.5], ["hum", 6.14]], [["music", 29.24], ["hum", 18.76], ["speech", 14.22]], null, null, [["music", 29.68], ["didgeridoo", 15.91], ["animal", 5.84]]], "duration": [27.06, 7.12, 25.19, 15.76, 12.34, 2.08, 36.74, 22.68, 6.76]} \ No newline at end of file diff --git a/annotations_1/32pZcw3acD0_filtered.json b/annotations_1/32pZcw3acD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f03c8dda3243ba912a670eab2ccd5d00e4188d78 --- /dev/null +++ b/annotations_1/32pZcw3acD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.98], [22.0, 22.84], [23.0, 27.18], [29.0, 29.42], [34.0, 58.94], [60.0, 74.02], [76.0, 87.54], [94.0, 103.47]], "keep_status": [false, false, true, false, true, false, false, false], "silence_prob": [41.26, 0.0, 38.5, 0.0, 41.83, 29.72, 29.9, 29.26], "audiomae_on_audioset": [[["music", 55.09], ["harp", 12.96], ["musical instrument", 8.13]], null, [["speech", 42.33], ["music", 13.81], ["sidetone", 9.98]], null, [["hum", 16.67], ["music", 14.01], ["noise", 10.92]], [["music", 73.47], ["speech", 10.96], ["didgeridoo", 2.24]], [["music", 83.7], ["sampler", 2.02], ["synthesizer", 1.09]], [["music", 87.61], ["singing", 1.36], ["boing", 1.08]]], "duration": [2.98, 0.84, 4.18, 0.42, 24.94, 14.02, 11.54, 9.47]} \ No newline at end of file diff --git a/annotations_1/33uE1YctOf4_filtered.json b/annotations_1/33uE1YctOf4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eee9a3bab23858967692afd039aaf29ea63a99eb --- /dev/null +++ b/annotations_1/33uE1YctOf4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.76], [9.0, 14.2], [18.0, 25.42], [26.0, 26.99], [33.0, 32.63], [34.0, 39.04], [41.0, 76.74], [80.0, 80.69], [84.0, 85.06], [86.0, 86.41], [88.0, 88.79], [90.0, 90.81], [92.0, 94.44], [95.0, 97.06], [99.0, 121.64], [123.0, 123.01], [124.0, 124.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 29.71, 30.07, 0.0, 0.0, 32.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.84, 47.35, 29.38, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 66.44], ["musical instrument", 11.37], ["brass instrument", 4.63]], [["music", 47.22], ["didgeridoo", 13.8], ["brass instrument", 9.38]], null, null, [["music", 46.55], ["theremin", 28.13], ["musical instrument", 5.13]], null, null, null, null, null, null, [["music", 46.97], ["hum", 6.59], ["ambient music", 5.28]], [["music", 43.54], ["synthesizer", 8.12], ["didgeridoo", 8.1]], [["music", 63.44], ["theremin", 15.91], ["musical instrument", 6.08]], null, null], "duration": [-0.24, 5.2, 7.42, 0.99, -0.37, 5.04, 35.74, 0.69, 1.06, 0.41, 0.79, 0.81, 2.44, 2.06, 22.64, 0.01, 0.92]} \ No newline at end of file diff --git a/annotations_1/34FTDewDftA_filtered.json b/annotations_1/34FTDewDftA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e78f487a41a0d8ec10fbe20a834f691e2104b9f6 --- /dev/null +++ b/annotations_1/34FTDewDftA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 16.71], [18.0, 20.07], [20.0, 22.4], [24.0, 27.53], [31.0, 36.05], [47.0, 47.53], [48.0, 53.3], [58.0, 59.76], [60.0, 62.13], [66.0, 71.07], [72.0, 124.14], [131.0, 131.23], [133.0, 136.8], [137.0, 137.76], [139.0, 139.19], [143.0, 142.82], [154.0, 154.68], [155.0, 156.93], [158.0, 158.73], [159.0, 159.63]], "keep_status": [true, false, false, true, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.21, 55.67, 39.5, 30.89, 29.36, 0.0, 33.04, 0.0, 42.42, 95.78, 0.0, 0.0, 31.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 17.96], ["clip-clop", 16.55], ["horse", 9.63]], null, [["livestock, farm animals, working animals", 43.41], ["cattle, bovinae", 23.27], ["moo", 12.85]], [["speech", 38.58], ["crowd", 14.95], ["animal", 4.86]], [["speech", 16.99], ["throbbing", 9.42], ["crowd", 9.25]], null, [["speech", 24.98], ["cattle, bovinae", 7.86], ["animal", 7.25]], null, [["music", 12.08], ["speech", 8.66], ["chirp tone", 7.34]], null, null, null, [["speech", 81.14], ["inside, small room", 3.07], ["fart", 2.5]], null, null, null, null, null, null, null], "duration": [13.71, 2.07, 2.4, 3.53, 5.05, 0.53, 5.3, 1.76, 2.13, 5.07, 52.14, 0.23, 3.8, 0.76, 0.19, -0.18, 0.68, 1.93, 0.73, 0.63]} \ No newline at end of file diff --git a/annotations_1/34K-mcoEFuk_filtered.json b/annotations_1/34K-mcoEFuk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25a469de9ca041bd215dcaf063378689c3504378 --- /dev/null +++ b/annotations_1/34K-mcoEFuk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.52], [3.0, 8.01], [9.0, 11.11], [12.0, 13.73], [14.0, 15.62], [17.0, 42.2], [44.0, 45.17], [46.0, 55.73], [57.0, 60.08], [61.0, 62.92], [65.0, 67.66], [70.0, 73.47], [75.0, 79.2], [80.0, 81.09], [82.0, 86.73], [88.0, 90.42], [93.0, 93.46], [94.0, 97.97], [100.0, 104.46], [106.0, 111.27], [112.0, 115.13], [117.0, 123.35], [124.0, 126.52], [128.0, 135.48], [137.0, 151.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.65, 66.63, 0.0, 0.0, 58.22, 0.0, 84.25, 91.13, 0.0, 82.97, 90.95, 93.6, 0.0, 66.76, 93.91, 0.0, 55.6, 88.83, 84.62, 86.09, 80.64, 82.43, 87.92, 82.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.48, 5.01, 2.11, 1.73, 1.62, 25.2, 1.17, 9.73, 3.08, 1.92, 2.66, 3.47, 4.2, 1.09, 4.73, 2.42, 0.46, 3.97, 4.46, 5.27, 3.13, 6.35, 2.52, 7.48, 14.21]} \ No newline at end of file diff --git a/annotations_1/35FF7e1-zCg_filtered.json b/annotations_1/35FF7e1-zCg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e122bebb3cbb66ad991b81b111a821567e77e64 --- /dev/null +++ b/annotations_1/35FF7e1-zCg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.55], [24.0, 23.89], [27.0, 27.8], [32.0, 32.56], [68.0, 70.68], [72.0, 73.87], [76.0, 75.9], [83.0, 83.83], [85.0, 85.26], [86.0, 88.45], [90.0, 90.31], [95.0, 95.52], [116.0, 117.64], [120.0, 119.7], [120.0, 119.82], [120.0, 119.97], [120.0, 120.01], [120.0, 120.04], [120.0, 120.07], [120.0, 120.11], [120.0, 120.14], [120.0, 120.26], [125.0, 125.22], [137.0, 137.24], [147.0, 147.6], [154.0, 154.9], [156.0, 156.25], [163.0, 163.83], [171.0, 173.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.4, 0.0, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.55, -0.11, 0.8, 0.56, 2.68, 1.87, -0.1, 0.83, 0.26, 2.45, 0.31, 0.52, 1.64, -0.3, -0.18, -0.03, 0.01, 0.04, 0.07, 0.11, 0.14, 0.26, 0.22, 0.24, 0.6, 0.9, 0.25, 0.83, 2.16]} \ No newline at end of file diff --git a/annotations_1/37O1H9YiBJo_filtered.json b/annotations_1/37O1H9YiBJo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..319a1d345b41a598c13d20af64e934511ddfa181 --- /dev/null +++ b/annotations_1/37O1H9YiBJo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.05], [35.0, 34.97], [38.0, 37.72], [43.0, 44.22], [55.0, 58.56], [74.0, 74.26], [75.0, 75.96], [78.0, 83.0], [83.0, 102.1], [105.0, 107.22]], "keep_status": [false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.68, 0.0, 0.0, 45.95, 36.0, 45.46], "audiomae_on_audioset": [null, null, null, null, [["speech", 50.79], ["fart", 9.42], ["whack, thwack", 3.76]], null, null, [["sine wave", 42.12], ["hum", 18.68], ["chirp tone", 12.96]], [["hum", 35.98], ["sidetone", 15.41], ["mains hum", 13.89]], [["hum", 28.76], ["throbbing", 15.92], ["music", 7.62]]], "duration": [1.05, -0.03, -0.28, 1.22, 3.56, 0.26, 0.96, 5.0, 19.1, 2.22]} \ No newline at end of file diff --git a/annotations_1/38AYeNGjqg0_filtered.json b/annotations_1/38AYeNGjqg0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb4a427c0544f4836e526e66251a21e7bf467cf1 --- /dev/null +++ b/annotations_1/38AYeNGjqg0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.76], [14.0, 16.9], [19.0, 29.81], [31.0, 38.65]], "keep_status": [false, true, true, true], "silence_prob": [0.0, 47.12, 45.56, 43.03], "audiomae_on_audioset": [null, [["music", 23.52], ["sonar", 9.74], ["sine wave", 8.1]], [["sonar", 35.33], ["music", 22.84], ["singing bowl", 8.98]], [["music", 24.85], ["hum", 14.27], ["sonar", 10.5]]], "duration": [1.76, 2.9, 10.81, 7.65]} \ No newline at end of file diff --git a/annotations_1/38jXOaoZQZI_filtered.json b/annotations_1/38jXOaoZQZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec5ec1e64477b22485466dab1ae48e4d660307e5 --- /dev/null +++ b/annotations_1/38jXOaoZQZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.6], [9.0, 8.7], [9.0, 12.26], [15.0, 15.01], [27.0, 29.3], [32.0, 33.17], [34.0, 34.99], [37.0, 45.3], [60.0, 69.06], [70.0, 73.28], [76.0, 76.45], [79.0, 79.71], [81.0, 82.58], [83.0, 83.15], [84.0, 89.67], [95.0, 104.52], [106.0, 107.05], [109.0, 110.3], [116.0, 119.58], [129.0, 129.19], [135.0, 135.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [50.61, 0.0, 53.53, 0.0, 94.52, 0.0, 0.0, 37.33, 39.86, 74.13, 0.0, 0.0, 0.0, 0.0, 36.17, 31.48, 0.0, 0.0, 39.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 82.24], ["telephone", 3.82], ["noise", 2.66]], [["sidetone", 56.42], ["speech", 25.31], ["noise", 7.5]], null, null, null, null, null, [["speech", 55.66], ["music", 19.1], ["mains hum", 5.87]], [["fart", 44.59], ["speech", 44.37], ["music", 3.18]], null, null, [["speech", 78.06], ["hiccup", 3.35], ["sidetone", 2.61]], null, null], "duration": [5.6, -0.3, 3.26, 0.01, 2.3, 1.17, 0.99, 8.3, 9.06, 3.28, 0.45, 0.71, 1.58, 0.15, 5.67, 9.52, 1.05, 1.3, 3.58, 0.19, 0.72]} \ No newline at end of file diff --git a/annotations_1/39471A71y3w_filtered.json b/annotations_1/39471A71y3w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73dd77fd4f507babe75a637adf926ed5b93bdc59 --- /dev/null +++ b/annotations_1/39471A71y3w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.1], [12.0, 12.97], [20.0, 19.89], [21.0, 21.66], [24.0, 24.85], [27.0, 29.52], [31.0, 30.59], [38.0, 38.43], [41.0, 41.32], [42.0, 42.18], [51.0, 53.08], [54.0, 55.36], [57.0, 58.19], [59.0, 64.52], [67.0, 68.59], [70.0, 71.0], [77.0, 77.79], [86.0, 95.13], [96.0, 109.19], [111.0, 112.73], [113.0, 118.25], [120.0, 123.85], [124.0, 127.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 78.89, 0.0, 0.0, 0.0, 0.0, 41.68, 0.0, 0.0, 49.31, 0.0, 0.0, 0.0, 56.48, 53.53, 0.0, 62.37, 57.01, 54.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 53.01], ["speech", 7.19], ["guitar", 6.12]], null, null, [["music", 25.7], ["hum", 16.3], ["speech", 15.27]], null, null, null, null, null, null, null, null, null], "duration": [1.1, 0.97, -0.11, 0.66, 0.85, 2.52, -0.41, 0.43, 0.32, 0.18, 2.08, 1.36, 1.19, 5.52, 1.59, 1.0, 0.79, 9.13, 13.19, 1.73, 5.25, 3.85, 3.08]} \ No newline at end of file diff --git a/annotations_1/39Bnk6VU53Y_filtered.json b/annotations_1/39Bnk6VU53Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08f2047dd73bcf88eaee5ae4639cdd103d381f68 --- /dev/null +++ b/annotations_1/39Bnk6VU53Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.03], [20.0, 20.75], [30.0, 67.04], [68.0, 68.22], [69.0, 82.44], [89.0, 90.58], [91.0, 90.93], [91.0, 91.0], [97.0, 97.34], [98.0, 98.58], [99.0, 99.37], [100.0, 100.36], [101.0, 102.44], [104.0, 103.98], [105.0, 113.16], [116.0, 116.9], [119.0, 120.26], [121.0, 121.47], [123.0, 123.53], [125.0, 124.98], [126.0, 126.94], [128.0, 128.71], [130.0, 130.6], [132.0, 133.25], [135.0, 134.97], [136.0, 139.28], [140.0, 140.64], [145.0, 145.59], [147.0, 147.24], [150.0, 150.62], [159.0, 169.6], [170.0, 169.74], [170.0, 170.99], [171.0, 171.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.39, 0.0, 0.0, 0.0, 0.0, 38.42, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 83.93], ["christmas music", 2.26], ["musical instrument", 1.38]], null, null, null, null, null, null, null, null, null, [["speech", 48.43], ["echo", 9.03], ["crying, sobbing", 4.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 23.73], ["animal", 18.15], ["howl", 8.79]], null, null, null], "duration": [0.03, 0.75, 37.04, 0.22, 13.44, 1.58, -0.07, 0.0, 0.34, 0.58, 0.37, 0.36, 1.44, -0.02, 8.16, 0.9, 1.26, 0.47, 0.53, -0.02, 0.94, 0.71, 0.6, 1.25, -0.03, 3.28, 0.64, 0.59, 0.24, 0.62, 10.6, -0.26, 0.99, 0.71]} \ No newline at end of file diff --git a/annotations_1/3A97Vc1eExE_filtered.json b/annotations_1/3A97Vc1eExE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad3a33d2544d668591b62a01be316199a15dd605 --- /dev/null +++ b/annotations_1/3A97Vc1eExE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.43], [28.0, 28.46], [29.0, 30.0], [33.0, 45.99], [46.0, 49.08], [53.0, 53.59], [54.0, 54.33], [56.0, 56.56], [57.0, 61.75], [62.0, 68.1], [69.0, 72.37], [73.0, 74.51], [75.0, 75.84], [77.0, 78.21], [79.0, 83.05], [92.0, 92.96], [94.0, 95.35], [97.0, 100.67], [105.0, 105.71], [106.0, 107.18], [107.0, 107.55], [117.0, 118.54], [121.0, 122.49], [123.0, 124.78], [126.0, 129.44]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.0, 39.0, 0.0, 0.0, 0.0, 33.14, 43.51, 46.02, 0.0, 0.0, 0.0, 30.89, 0.0, 0.0, 52.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.02], "audiomae_on_audioset": [null, null, null, [["music", 73.61], ["synthesizer", 3.78], ["electronic music", 3.2]], [["sidetone", 58.53], ["speech", 22.97], ["music", 4.26]], null, null, null, [["whale vocalization", 34.76], ["hum", 17.59], ["speech", 11.9]], [["mains hum", 45.61], ["hum", 33.49], ["speech", 6.15]], [["hum", 47.78], ["mains hum", 30.42], ["throbbing", 5.57]], null, null, null, [["music", 50.76], ["hum", 7.63], ["throbbing", 6.31]], null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 0.46, 1.0, 12.99, 3.08, 0.59, 0.33, 0.56, 4.75, 6.1, 3.37, 1.51, 0.84, 1.21, 4.05, 0.96, 1.35, 3.67, 0.71, 1.18, 0.55, 1.54, 1.49, 1.78, 3.44]} \ No newline at end of file diff --git a/annotations_1/3Avu3KdHGdo_filtered.json b/annotations_1/3Avu3KdHGdo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40b6d695078e1af85ebbd85f4e52958a9e8c183d --- /dev/null +++ b/annotations_1/3Avu3KdHGdo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.28], [9.0, 10.72], [11.0, 11.97], [14.0, 14.79], [17.0, 19.11], [23.0, 24.53], [27.0, 32.14], [35.0, 36.0], [38.0, 38.96], [44.0, 47.19], [54.0, 56.49], [57.0, 59.31], [63.0, 63.58], [70.0, 72.67]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [44.69, 0.0, 0.0, 0.0, 89.36, 0.0, 40.9, 0.0, 0.0, 52.86, 54.83, 60.7, 0.0, 49.18], "audiomae_on_audioset": [[["music", 11.98], ["hum", 10.91], ["whale vocalization", 8.86]], null, null, null, null, null, [["fly, housefly", 24.59], ["insect", 20.19], ["bee, wasp, etc.", 15.61]], null, null, null, null, null, null, [["speech", 46.59], ["cattle, bovinae", 6.72], ["music", 6.31]]], "duration": [5.28, 1.72, 0.97, 0.79, 2.11, 1.53, 5.14, 1.0, 0.96, 3.19, 2.49, 2.31, 0.58, 2.67]} \ No newline at end of file diff --git a/annotations_1/3B40Rhnt4PA_filtered.json b/annotations_1/3B40Rhnt4PA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c15f70075c8595253c3f682307a1d4b929a133e --- /dev/null +++ b/annotations_1/3B40Rhnt4PA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.63], [24.0, 24.36], [26.0, 27.31], [31.0, 31.56], [39.0, 41.91], [45.0, 44.95], [53.0, 53.96], [56.0, 56.69], [73.0, 72.99], [87.0, 95.45], [99.0, 100.2], [101.0, 100.97], [101.0, 101.01], [101.0, 103.69], [119.0, 126.94], [137.0, 157.67], [159.0, 159.33], [160.0, 161.62], [162.0, 163.21]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0, 0.0, 0.0, 29.16, 0.0, 0.0, 0.0, 29.4, 29.79, 29.11, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 33.17], ["speech", 20.43], ["moo", 6.49]], null, null, null, [["music", 38.61], ["boing", 33.35], ["speech", 10.35]], [["music", 22.14], ["moo", 16.99], ["cattle, bovinae", 16.78]], [["moo", 22.63], ["music", 22.55], ["cattle, bovinae", 19.4]], null, null, null], "duration": [0.63, 0.36, 1.31, 0.56, 2.91, -0.05, 0.96, 0.69, -0.01, 8.45, 1.2, -0.03, 0.01, 2.69, 7.94, 20.67, 0.33, 1.62, 1.21]} \ No newline at end of file diff --git a/annotations_1/3Blk7Vo0abY_filtered.json b/annotations_1/3Blk7Vo0abY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0146c809b25005b90f43ad3fa4aa2ed8f121f529 --- /dev/null +++ b/annotations_1/3Blk7Vo0abY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.39], [8.0, 8.33], [9.0, 10.61], [14.0, 14.39], [15.0, 19.36], [21.0, 21.19], [23.0, 23.68], [31.0, 32.29], [37.0, 37.66], [40.0, 40.32], [43.0, 45.79], [46.0, 47.8], [51.0, 53.2], [54.0, 55.04], [58.0, 60.29], [64.0, 69.2], [74.0, 75.2], [80.0, 81.68], [83.0, 85.13], [90.0, 91.62], [94.0, 97.31], [99.0, 110.78], [112.0, 130.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [70.44, 0.0, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 99.95, 0.0, 62.89, 77.36, 0.0, 0.0, 99.99, 0.0, 90.78, 90.95, 31.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.26], ["synthesizer", 13.96], ["theremin", 8.63]]], "duration": [5.39, 0.33, 1.61, 0.39, 4.36, 0.19, 0.68, 1.29, 0.66, 0.32, 2.79, 1.8, 2.2, 1.04, 2.29, 5.2, 1.2, 1.68, 2.13, 1.62, 3.31, 11.78, 18.55]} \ No newline at end of file diff --git a/annotations_1/3Cf6HfBCcso_filtered.json b/annotations_1/3Cf6HfBCcso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c2da00907401d1f7a55d8a7e7f9fe1279bb5c53 --- /dev/null +++ b/annotations_1/3Cf6HfBCcso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.9], [6.0, 25.68], [27.0, 28.0], [29.0, 79.81], [85.0, 88.28], [92.0, 93.07], [94.0, 94.63], [97.0, 113.44], [114.0, 115.74], [117.0, 117.91], [123.0, 124.41], [125.0, 125.74], [128.0, 129.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.51, 34.26, 0.0, 0.0, 38.51, 0.0, 0.0, 31.45, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 67.65], ["didgeridoo", 13.38], ["musical instrument", 4.16]], [["speech", 46.03], ["music", 30.04], ["sidetone", 3.95]], null, null, [["music", 40.97], ["speech", 39.25], ["guitar", 2.6]], null, null, [["hum", 39.83], ["mains hum", 18.3], ["music", 14.21]], null, null, null, null, null], "duration": [2.9, 19.68, 1.0, 50.81, 3.28, 1.07, 0.63, 16.44, 1.74, 0.91, 1.41, 0.74, 1.27]} \ No newline at end of file diff --git a/annotations_1/3D0gGgMTylk_filtered.json b/annotations_1/3D0gGgMTylk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72d53015a71e63a9c042063a483740c313459f31 --- /dev/null +++ b/annotations_1/3D0gGgMTylk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [5.0, 5.83], [17.0, 18.49], [19.0, 19.87], [24.0, 24.07], [37.0, 37.37], [38.0, 40.81], [48.0, 47.95], [51.0, 54.06], [62.0, 62.53], [67.0, 68.39], [70.0, 70.33], [78.0, 79.25], [86.0, 88.86], [90.0, 94.34], [96.0, 98.29], [100.0, 103.94], [108.0, 108.43], [111.0, 116.04], [129.0, 130.92]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.16, 0.0, 30.46, 0.0, 0.0, 0.0, 0.0, 100.0, 47.54, 100.0, 99.98, 0.0, 31.85, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 21.74], ["livestock, farm animals, working animals", 15.79], ["cattle, bovinae", 14.83]], null, [["speech", 27.23], ["fart", 8.32], ["whale vocalization", 4.41]], null, null, null, null, null, [["sidetone", 48.29], ["speech", 26.22], ["music", 3.11]], null, null, null, [["music", 77.06], ["musical instrument", 4.54], ["fly, housefly", 2.75]], null], "duration": [0.94, 0.83, 1.49, 0.87, 0.07, 0.37, 2.81, -0.05, 3.06, 0.53, 1.39, 0.33, 1.25, 2.86, 4.34, 2.29, 3.94, 0.43, 5.04, 1.92]} \ No newline at end of file diff --git a/annotations_1/3EIqxstBVCs_filtered.json b/annotations_1/3EIqxstBVCs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3b679c09fce12a2f5252191da649783785ae628 --- /dev/null +++ b/annotations_1/3EIqxstBVCs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.67], [10.0, 10.15], [13.0, 30.06], [30.0, 38.33], [40.0, 41.49], [42.0, 45.81], [47.0, 56.15]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.36, 80.46, 0.0, 54.7, 54.56], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.67, 0.15, 17.06, 8.33, 1.49, 3.81, 9.15]} \ No newline at end of file diff --git a/annotations_1/3EdXrMS1gJc_filtered.json b/annotations_1/3EdXrMS1gJc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1c995d0b4187bcc92cac09e5f04831b9ee1199a --- /dev/null +++ b/annotations_1/3EdXrMS1gJc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.32], [5.0, 5.04], [42.0, 42.15], [44.0, 44.49], [65.0, 65.47]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.32, 0.04, 0.15, 0.49, 0.47]} \ No newline at end of file diff --git a/annotations_1/3EeGyS1BOGk_filtered.json b/annotations_1/3EeGyS1BOGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab0525cbb958ab666b10436001d8aa0969a62d2f --- /dev/null +++ b/annotations_1/3EeGyS1BOGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.15], [6.0, 7.18], [9.0, 9.91], [11.0, 12.06], [16.0, 16.63], [19.0, 19.95], [21.0, 22.67], [25.0, 25.37], [28.0, 29.15], [31.0, 32.04], [32.0, 33.12], [35.0, 35.5], [37.0, 37.88], [39.0, 41.44], [45.0, 46.21], [47.0, 48.73], [50.0, 50.41], [51.0, 51.78], [53.0, 53.55], [57.0, 58.29], [60.0, 61.16], [64.0, 65.26], [66.0, 66.68], [67.0, 68.34], [72.0, 73.3], [77.0, 77.06], [78.0, 78.44], [79.0, 80.32], [81.0, 81.7], [84.0, 83.98], [86.0, 86.21], [87.0, 88.21], [90.0, 89.99], [92.0, 92.28], [93.0, 92.94], [96.0, 96.85], [98.0, 99.17], [104.0, 104.19], [105.0, 104.85], [107.0, 107.32], [110.0, 111.59], [113.0, 113.49], [116.0, 116.7], [117.0, 118.39], [120.0, 120.29], [123.0, 124.77], [129.0, 130.01], [132.0, 132.14], [139.0, 139.56], [141.0, 144.1], [146.0, 148.09], [150.0, 150.45], [161.0, 161.62], [163.0, 163.59], [165.0, 165.57], [167.0, 167.63], [171.0, 171.51], [175.0, 175.0], [178.0, 179.2], [182.0, 182.53], [187.0, 187.64], [188.0, 189.01], [190.0, 190.54], [191.0, 191.4], [196.0, 196.15], [198.0, 199.07], [200.0, 201.36], [202.0, 203.39], [205.0, 205.78], [206.0, 206.86], [208.0, 208.36], [209.0, 209.06], [211.0, 211.22], [214.0, 214.59], [217.0, 217.63], [218.0, 219.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 88.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.28], ["dial tone", 30.13], ["busy signal", 5.85]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.15, 1.18, 0.91, 1.06, 0.63, 0.95, 1.67, 0.37, 1.15, 1.04, 1.12, 0.5, 0.88, 2.44, 1.21, 1.73, 0.41, 0.78, 0.55, 1.29, 1.16, 1.26, 0.68, 1.34, 1.3, 0.06, 0.44, 1.32, 0.7, -0.02, 0.21, 1.21, -0.01, 0.28, -0.06, 0.85, 1.17, 0.19, -0.15, 0.32, 1.59, 0.49, 0.7, 1.39, 0.29, 1.77, 1.01, 0.14, 0.56, 3.1, 2.09, 0.45, 0.62, 0.59, 0.57, 0.63, 0.51, 0.0, 1.2, 0.53, 0.64, 1.01, 0.54, 0.4, 0.15, 1.07, 1.36, 1.39, 0.78, 0.86, 0.36, 0.06, 0.22, 0.59, 0.63, 1.1]} \ No newline at end of file diff --git a/annotations_1/3FKMUa7vCZU_filtered.json b/annotations_1/3FKMUa7vCZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffd69c9853f1048bc22c17e2abbbad38a23b7b34 --- /dev/null +++ b/annotations_1/3FKMUa7vCZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.05], [2.0, 2.78], [12.0, 11.84], [13.0, 14.49], [28.0, 28.9], [32.0, 33.08], [36.0, 35.9], [38.0, 38.45], [39.0, 40.9], [46.0, 47.68], [48.0, 49.45], [50.0, 51.24], [56.0, 65.55], [68.0, 68.94], [71.0, 71.44], [75.0, 75.54], [77.0, 80.86], [84.0, 84.84], [91.0, 96.09], [98.0, 101.12], [120.0, 120.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.89, 0.0, 0.0, 0.0, 36.52, 0.0, 31.6, 31.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["grunt", 44.94], ["groan", 20.29], ["animal", 5.6]], null, null, null, [["mosquito", 27.38], ["fly, housefly", 12.09], ["speech", 6.03]], null, [["music", 71.04], ["speech", 9.9], ["screaming", 3.45]], [["music", 37.31], ["fly, housefly", 11.7], ["synthesizer", 5.32]], null], "duration": [0.05, 0.78, -0.16, 1.49, 0.9, 1.08, -0.1, 0.45, 1.9, 1.68, 1.45, 1.24, 9.55, 0.94, 0.44, 0.54, 3.86, 0.84, 5.09, 3.12, 0.85]} \ No newline at end of file diff --git a/annotations_1/3GrjR4Fib1M_filtered.json b/annotations_1/3GrjR4Fib1M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..573ac65d660039fa088495b2b66fed2502baf5cb --- /dev/null +++ b/annotations_1/3GrjR4Fib1M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.04], [8.0, 8.07], [8.0, 8.24], [9.0, 8.67], [9.0, 9.64], [12.0, 12.75], [14.0, 14.79], [41.0, 41.2], [51.0, 51.09], [52.0, 51.92], [69.0, 68.71], [84.0, 84.3], [103.0, 104.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.07, 0.24, -0.33, 0.64, 0.75, 0.79, 0.2, 0.09, -0.08, -0.29, 0.3, 1.84]} \ No newline at end of file diff --git a/annotations_1/3IUoqFHJ6wk_filtered.json b/annotations_1/3IUoqFHJ6wk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cd220c40050dcd768e1faf5686c96f20e653484 --- /dev/null +++ b/annotations_1/3IUoqFHJ6wk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.25], [4.0, 4.9], [5.0, 6.88], [8.0, 11.5], [13.0, 16.28], [18.0, 19.43], [21.0, 22.69], [24.0, 25.14], [25.0, 26.59], [28.0, 30.03], [31.0, 33.29], [34.0, 35.92], [37.0, 44.91], [45.0, 56.98], [61.0, 63.71], [65.0, 66.18], [66.0, 68.2], [69.0, 70.26], [71.0, 72.32], [73.0, 72.98], [73.0, 73.11], [73.0, 78.39], [79.0, 80.97], [85.0, 89.33], [91.0, 93.73], [95.0, 96.25], [97.0, 98.49], [101.0, 110.47], [113.0, 114.78], [116.0, 118.47], [119.0, 122.2], [125.0, 128.21], [131.0, 131.04], [132.0, 132.04], [133.0, 135.16], [137.0, 143.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 94.37, 95.09, 0.0, 0.0, 0.0, 0.0, 93.6, 71.72, 0.0, 68.15, 95.78, 88.1, 0.0, 86.45, 0.0, 0.0, 0.0, 0.0, 91.13, 0.0, 77.36, 62.89, 0.0, 0.0, 53.16, 0.0, 52.98, 46.29, 49.18, 0.0, 0.0, 44.34, 47.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.27], ["speech", 10.02], ["musical instrument", 7.67]], [["music", 48.71], ["ambient music", 5.74], ["theremin", 3.07]], null, null, [["music", 36.16], ["speech", 25.3], ["foghorn", 2.73]], [["music", 57.23], ["hum", 3.07], ["ambient music", 2.58]]], "duration": [0.25, 0.9, 1.88, 3.5, 3.28, 1.43, 1.69, 1.14, 1.59, 2.03, 2.29, 1.92, 7.91, 11.98, 2.71, 1.18, 2.2, 1.26, 1.32, -0.02, 0.11, 5.39, 1.97, 4.33, 2.73, 1.25, 1.49, 9.47, 1.78, 2.47, 3.2, 3.21, 0.04, 0.04, 2.16, 6.43]} \ No newline at end of file diff --git a/annotations_1/3IVugy6dK3E_filtered.json b/annotations_1/3IVugy6dK3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71b3f47fa0fe3cdc90d4b384cdbb20ef434de59b --- /dev/null +++ b/annotations_1/3IVugy6dK3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.73], [9.0, 9.46], [10.0, 13.24], [14.0, 14.15], [15.0, 15.67], [18.0, 17.59], [20.0, 35.7], [38.0, 39.82], [42.0, 43.55], [46.0, 58.14], [64.0, 64.96], [66.0, 67.73], [69.0, 72.87], [77.0, 80.1], [81.0, 81.43], [89.0, 89.78], [90.0, 90.54], [91.0, 91.3], [92.0, 92.26], [99.0, 103.44], [104.0, 104.82], [106.0, 113.85], [118.0, 119.06], [128.0, 142.45]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 47.31, 0.0, 0.0, 0.0, 35.5, 0.0, 0.0, 37.99, 0.0, 0.0, 64.97, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 84.62, 0.0, 29.56, 0.0, 30.09], "audiomae_on_audioset": [null, null, [["speech", 27.58], ["music", 22.53], ["fly, housefly", 12.03]], null, null, null, [["music", 51.96], ["speech", 12.37], ["throbbing", 9.23]], null, null, [["music", 67.82], ["throbbing", 4.4], ["speech", 3.85]], null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 25.82], ["music", 18.91], ["speech", 15.6]], null, [["music", 75.09], ["throbbing", 4.32], ["drum machine", 1.81]]], "duration": [0.73, 0.46, 3.24, 0.15, 0.67, -0.41, 15.7, 1.82, 1.55, 12.14, 0.96, 1.73, 3.87, 3.1, 0.43, 0.78, 0.54, 0.3, 0.26, 4.44, 0.82, 7.85, 1.06, 14.45]} \ No newline at end of file diff --git a/annotations_1/3IZVz7ukKyU_filtered.json b/annotations_1/3IZVz7ukKyU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ea7b6202062fab577e9c114477299bd20bad50b --- /dev/null +++ b/annotations_1/3IZVz7ukKyU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 62.09], [63.0, 68.1]], "keep_status": [false, false], "silence_prob": [0.0, 32.62], "audiomae_on_audioset": [null, [["speech", 56.75], ["music", 12.88], ["hum", 7.24]]], "duration": [32.09, 5.1]} \ No newline at end of file diff --git a/annotations_1/3Iy44xwjtQA_filtered.json b/annotations_1/3Iy44xwjtQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8cc02962b117e7d226630801132a4a31a6b805d --- /dev/null +++ b/annotations_1/3Iy44xwjtQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.97], [7.0, 8.38], [14.0, 18.13], [19.0, 22.6], [24.0, 28.21], [29.0, 33.76], [38.0, 39.02], [42.0, 42.25], [53.0, 53.57], [62.0, 62.02], [69.0, 70.19], [71.0, 75.29], [78.0, 78.92], [80.0, 82.19], [87.0, 88.2], [93.0, 94.74], [97.0, 97.95], [105.0, 106.25], [107.0, 109.09], [117.0, 119.58], [121.0, 124.29], [126.0, 126.45], [136.0, 138.1], [142.0, 143.5], [146.0, 146.23], [147.0, 148.37], [150.0, 150.42], [151.0, 152.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 81.0, 79.76, 67.63, 58.22, 0.0, 0.0, 0.0, 0.0, 0.0, 36.61, 0.0, 55.6, 0.0, 0.0, 0.0, 0.0, 48.35, 51.18, 54.63, 0.0, 40.88, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 32.88], ["speech", 27.99], ["mains hum", 12.08]], null, null, null, null, null, null, [["hum", 20.43], ["throbbing", 11.78], ["speech", 11.14]], null, null, null, [["hum", 37.8], ["music", 19.82], ["mains hum", 9.47]], null, null, null, null, null], "duration": [1.97, 1.38, 4.13, 3.6, 4.21, 4.76, 1.02, 0.25, 0.57, 0.02, 1.19, 4.29, 0.92, 2.19, 1.2, 1.74, 0.95, 1.25, 2.09, 2.58, 3.29, 0.45, 2.1, 1.5, 0.23, 1.37, 0.42, 1.2]} \ No newline at end of file diff --git a/annotations_1/3J0d3ZwHy-Y_filtered.json b/annotations_1/3J0d3ZwHy-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d04ffad86bef6aed2182e0b5ee7df19f392cce29 --- /dev/null +++ b/annotations_1/3J0d3ZwHy-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.96], [23.0, 27.78], [29.0, 29.49], [31.0, 31.94], [33.0, 34.21], [37.0, 36.91], [37.0, 38.42], [39.0, 39.8], [41.0, 91.39], [93.0, 94.31], [95.0, 95.13], [96.0, 96.69], [97.0, 114.35], [118.0, 132.34], [134.0, 135.82], [137.0, 139.29], [142.0, 142.94], [145.0, 147.29], [149.0, 155.33], [158.0, 161.55], [162.0, 175.04], [181.0, 181.85], [192.0, 197.58], [199.0, 199.39], [200.0, 201.85], [202.0, 203.49], [205.0, 206.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.69, 51.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.74, 57.4, 0.0, 99.82, 0.0, 99.4, 90.25, 98.59, 57.17, 0.0, 68.67, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 42.95], ["radio", 18.3], ["whale vocalization", 13.48]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.78], ["whack, thwack", 18.38], ["groan", 7.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.96, 4.78, 0.49, 0.94, 1.21, -0.09, 1.42, 0.8, 50.39, 1.31, 0.13, 0.69, 17.35, 14.34, 1.82, 2.29, 0.94, 2.29, 6.33, 3.55, 13.04, 0.85, 5.58, 0.39, 1.85, 1.49, 1.49]} \ No newline at end of file diff --git a/annotations_1/3K0KQCvu2Xo_filtered.json b/annotations_1/3K0KQCvu2Xo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..309648bd6c51db9a8fb8426083fac17a2e75ce20 --- /dev/null +++ b/annotations_1/3K0KQCvu2Xo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.46], [26.0, 26.22], [27.0, 29.64], [30.0, 31.26], [33.0, 33.02], [33.0, 34.3], [35.0, 35.61], [37.0, 37.32], [38.0, 39.77], [41.0, 47.56], [48.0, 49.13], [50.0, 56.91], [58.0, 92.64], [93.0, 94.68], [96.0, 96.72], [100.0, 101.44], [103.0, 104.01], [106.0, 106.0], [107.0, 107.25], [107.0, 107.76], [109.0, 109.27], [110.0, 110.32], [111.0, 111.6], [112.0, 112.45], [113.0, 113.78], [115.0, 115.52], [116.0, 115.72], [119.0, 119.35], [120.0, 121.93], [123.0, 126.87], [129.0, 129.56], [130.0, 134.0], [135.0, 135.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.15, 0.0, 47.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 99.48, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["bouncing", 46.85], ["speech", 43.48], ["thunk", 4.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 0.22, 2.64, 1.26, 0.02, 1.3, 0.61, 0.32, 1.77, 6.56, 1.13, 6.91, 34.64, 1.68, 0.72, 1.44, 1.01, 0.0, 0.25, 0.76, 0.27, 0.32, 0.6, 0.45, 0.78, 0.52, -0.28, 0.35, 1.93, 3.87, 0.56, 4.0, 0.78]} \ No newline at end of file diff --git a/annotations_1/3KdgZgQRDU0_filtered.json b/annotations_1/3KdgZgQRDU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f53b12fd067b204464e512808a3e0daa70363b4 --- /dev/null +++ b/annotations_1/3KdgZgQRDU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.4], [21.0, 21.3], [25.0, 44.27], [45.0, 48.69], [54.0, 56.73], [59.0, 60.44], [62.0, 63.05], [64.0, 64.71], [66.0, 67.17], [73.0, 73.4], [74.0, 74.75], [75.0, 97.02], [100.0, 101.85], [104.0, 107.99], [111.0, 111.28], [120.0, 121.85], [122.0, 122.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.71, 44.12, 54.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.9, 0.0, 99.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["machine gun", 37.39], ["gunshot, gunfire", 23.05], ["speech", 19.24]], [["cattle, bovinae", 52.51], ["moo", 34.91], ["livestock, farm animals, working animals", 12.26]], null, null, null, null, null, null, null, [["speech", 73.69], ["groan", 8.41], ["animal", 2.68]], null, null, null, null, null], "duration": [0.4, 0.3, 19.27, 3.69, 2.73, 1.44, 1.05, 0.71, 1.17, 0.4, 0.75, 22.02, 1.85, 3.99, 0.28, 1.85, 0.57]} \ No newline at end of file diff --git a/annotations_1/3MhzaQnLhRY_filtered.json b/annotations_1/3MhzaQnLhRY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e34a112b0c8bd11580c1ba10c8e41ef21dddccf1 --- /dev/null +++ b/annotations_1/3MhzaQnLhRY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.15], [6.0, 6.67], [8.0, 9.73], [17.0, 17.15], [27.0, 26.77], [31.0, 30.99], [35.0, 36.44], [41.0, 42.89], [45.0, 49.18], [50.0, 52.34], [58.0, 58.35], [65.0, 67.47], [75.0, 76.27], [77.0, 78.26], [79.0, 79.96], [81.0, 82.58], [86.0, 86.54], [88.0, 88.8], [91.0, 91.2], [94.0, 94.2], [98.0, 98.27], [99.0, 99.0], [100.0, 101.78], [102.0, 101.98], [110.0, 109.7], [119.0, 118.54], [119.0, 118.96], [119.0, 121.61], [128.0, 129.81], [134.0, 134.94], [137.0, 138.13], [156.0, 156.0], [163.0, 166.13], [170.0, 172.0], [172.0, 174.56]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.28, 94.81, 0.0, 54.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.21, 0.0, 0.0, 0.0, 0.0, 75.07, 58.64, 56.78], "audiomae_on_audioset": [[["music", 26.04], ["hum", 14.06], ["mains hum", 9.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 65.39], ["male speech, man speaking", 4.96], ["speech synthesizer", 4.83]], null, null, null, null, null, null, null], "duration": [2.15, 0.67, 1.73, 0.15, -0.23, -0.01, 1.44, 1.89, 4.18, 2.34, 0.35, 2.47, 1.27, 1.26, 0.96, 1.58, 0.54, 0.8, 0.2, 0.2, 0.27, 0.0, 1.78, -0.02, -0.3, -0.46, -0.04, 2.61, 1.81, 0.94, 1.13, 0.0, 3.13, 2.0, 2.56]} \ No newline at end of file diff --git a/annotations_1/3NRVJdoihjY_filtered.json b/annotations_1/3NRVJdoihjY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f30065078762b0eecc1ecb39c03aba01997d0dba --- /dev/null +++ b/annotations_1/3NRVJdoihjY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.83], [17.0, 18.64], [21.0, 22.64], [25.0, 28.83], [32.0, 69.5], [70.0, 79.24], [80.0, 105.7], [108.0, 112.6]], "keep_status": [false, false, false, false, false, true, true, true], "silence_prob": [100.0, 0.0, 0.0, 100.0, 0.0, 32.2, 33.54, 36.27], "audiomae_on_audioset": [null, null, null, null, null, [["music", 41.89], ["sidetone", 11.61], ["didgeridoo", 4.36]], [["music", 39.07], ["flute", 8.75], ["hum", 7.77]], [["hum", 31.21], ["speech", 13.75], ["mains hum", 13.44]]], "duration": [7.83, 1.64, 1.64, 3.83, 37.5, 9.24, 25.7, 4.6]} \ No newline at end of file diff --git a/annotations_1/3NpYTks1mDI_filtered.json b/annotations_1/3NpYTks1mDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97fe5c08a66db7810ce210c278d5094a5a193660 --- /dev/null +++ b/annotations_1/3NpYTks1mDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.97], [5.0, 7.7], [12.0, 12.23], [12.0, 42.63], [47.0, 47.93], [54.0, 55.0], [56.0, 72.77], [73.0, 81.53], [82.0, 102.98], [105.0, 107.57], [108.0, 114.99], [117.0, 118.76], [120.0, 135.13]], "keep_status": [false, true, false, false, false, false, false, true, true, true, true, false, false], "silence_prob": [0.0, 47.62, 0.0, 0.0, 0.0, 0.0, 32.86, 34.21, 33.43, 36.15, 35.26, 0.0, 33.65], "audiomae_on_audioset": [null, [["speech", 20.41], ["animal", 8.71], ["cat", 5.56]], null, null, null, null, [["music", 66.97], ["groan", 7.9], ["speech", 6.98]], [["music", 47.57], ["cacophony", 9.52], ["hum", 8.09]], [["music", 32.09], ["speech", 12.29], ["groan", 11.13]], [["music", 29.34], ["speech", 21.82], ["foghorn", 3.74]], [["music", 33.16], ["fly, housefly", 8.38], ["hum", 7.13]], null, [["music", 62.18], ["hum", 9.45], ["mains hum", 4.85]]], "duration": [0.97, 2.7, 0.23, 30.63, 0.93, 1.0, 16.77, 8.53, 20.98, 2.57, 6.99, 1.76, 15.13]} \ No newline at end of file diff --git a/annotations_1/3OFda9AT-U4_filtered.json b/annotations_1/3OFda9AT-U4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dea16ec3cf22885c94718c31762e4fbb616b822f --- /dev/null +++ b/annotations_1/3OFda9AT-U4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.1], [19.0, 20.31], [22.0, 22.89], [48.0, 48.42], [87.0, 87.62], [90.0, 93.14], [97.0, 97.11], [97.0, 100.75], [102.0, 102.02], [104.0, 104.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 63.96, 0.0, 55.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.1, 1.31, 0.89, 0.42, 0.62, 3.14, 0.11, 3.75, 0.02, 0.45]} \ No newline at end of file diff --git a/annotations_1/3PBo1ef-18Y_filtered.json b/annotations_1/3PBo1ef-18Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78a4b4bde9f21b58c866a69693b94164ba8c7781 --- /dev/null +++ b/annotations_1/3PBo1ef-18Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.66], [10.0, 25.98], [27.0, 42.7], [48.0, 48.59], [52.0, 54.01], [57.0, 60.02], [61.0, 63.51], [65.0, 68.1], [77.0, 77.48], [80.0, 82.34], [86.0, 87.45], [92.0, 91.52], [92.0, 91.56], [92.0, 91.59], [92.0, 91.62], [92.0, 91.66], [92.0, 96.45], [103.0, 103.76], [106.0, 106.73], [113.0, 124.85], [126.0, 135.68], [138.0, 137.88]], "keep_status": [false, true, true, false, true, true, true, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 30.22, 31.34, 0.0, 46.09, 37.75, 36.19, 39.64, 0.0, 33.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.81, 0.0, 0.0, 30.06, 31.08, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 26.11], ["insect", 22.72], ["mosquito", 12.14]], [["music", 36.0], ["fly, housefly", 11.18], ["insect", 5.68]], null, [["speech", 28.94], ["mains hum", 14.43], ["hum", 6.09]], [["speech", 29.96], ["music", 17.2], ["whale vocalization", 6.6]], [["roaring cats (lions, tigers)", 16.73], ["music", 14.53], ["animal", 10.48]], [["music", 43.1], ["quack", 9.47], ["duck", 6.17]], null, [["speech", 41.38], ["music", 22.17], ["musical instrument", 3.36]], null, null, null, null, null, null, [["speech", 56.53], ["whack, thwack", 11.91], ["music", 7.7]], null, null, [["music", 78.68], ["vehicle", 2.61], ["car", 2.54]], [["speech", 30.99], ["music", 21.15], ["vehicle", 4.16]], null], "duration": [0.66, 15.98, 15.7, 0.59, 2.01, 3.02, 2.51, 3.1, 0.48, 2.34, 1.45, -0.48, -0.44, -0.41, -0.38, -0.34, 4.45, 0.76, 0.73, 11.85, 9.68, -0.12]} \ No newline at end of file diff --git a/annotations_1/3PoW8y_3rzU_filtered.json b/annotations_1/3PoW8y_3rzU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad1060d7a7d80aaca099c0b7f2c535350fc43f74 --- /dev/null +++ b/annotations_1/3PoW8y_3rzU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.51], [19.0, 20.12], [21.0, 22.08], [23.0, 24.95], [26.0, 26.57], [28.0, 28.63], [29.0, 28.66], [29.0, 29.34], [30.0, 31.95], [35.0, 37.22], [39.0, 41.4], [43.0, 43.04], [44.0, 44.69], [48.0, 48.95], [51.0, 57.86], [59.0, 59.54], [60.0, 60.84], [61.0, 64.27], [65.0, 65.67], [67.0, 67.68], [69.0, 71.44], [72.0, 95.71], [97.0, 121.09], [123.0, 133.24], [135.0, 148.51]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false, true, false, true, true, true], "silence_prob": [49.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.91, 44.2, 0.0, 0.0, 0.0, 40.01, 0.0, 0.0, 44.63, 0.0, 0.0, 45.3, 31.22, 48.14, 30.69, 31.29], "audiomae_on_audioset": [[["throbbing", 30.67], ["hum", 23.0], ["music", 17.44]], null, null, null, null, null, null, null, null, [["speech", 52.0], ["sidetone", 7.59], ["hum", 5.31]], [["music", 38.49], ["hum", 7.27], ["throbbing", 4.41]], null, null, null, [["hum", 31.2], ["mains hum", 15.21], ["music", 14.91]], null, null, [["speech", 45.73], ["hum", 15.92], ["rumble", 8.74]], null, null, [["music", 28.05], ["noise", 15.9], ["hum", 9.27]], [["music", 50.64], ["speech", 20.23], ["burst, pop", 3.49]], [["music", 29.37], ["hum", 21.92], ["throbbing", 7.61]], [["music", 26.93], ["machine gun", 11.65], ["hum", 5.88]], [["hum", 25.87], ["smash, crash", 15.02], ["mains hum", 14.98]]], "duration": [3.51, 1.12, 1.08, 1.95, 0.57, 0.63, -0.34, 0.34, 1.95, 2.22, 2.4, 0.04, 0.69, 0.95, 6.86, 0.54, 0.84, 3.27, 0.67, 0.68, 2.44, 23.71, 24.09, 10.24, 13.51]} \ No newline at end of file diff --git a/annotations_1/3S5E22b49-Q_filtered.json b/annotations_1/3S5E22b49-Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..339210b2a96da8eb0bd592ba4c8925d777b664c5 --- /dev/null +++ b/annotations_1/3S5E22b49-Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.74], [16.0, 42.58], [51.0, 53.11], [57.0, 58.51], [60.0, 60.03], [61.0, 66.36]], "keep_status": [false, false, false, false, false, false], "silence_prob": [99.97, 98.99, 93.76, 0.0, 0.0, 90.6], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [2.74, 26.58, 2.11, 1.51, 0.03, 5.36]} \ No newline at end of file diff --git a/annotations_1/3SKk58UngIk_filtered.json b/annotations_1/3SKk58UngIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c9b5c36cfeae05232a0ae7969b64abf366ee9c5 --- /dev/null +++ b/annotations_1/3SKk58UngIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.92], [9.0, 9.88], [10.0, 10.27], [13.0, 12.6], [15.0, 18.17], [20.0, 22.06], [23.0, 25.17], [25.0, 27.45], [28.0, 36.75], [39.0, 39.48], [41.0, 41.37], [42.0, 43.61], [45.0, 45.72], [51.0, 50.92], [55.0, 55.12], [62.0, 62.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 76.53, 82.43, 74.13, 66.51, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 0.88, 0.27, -0.4, 3.17, 2.06, 2.17, 2.45, 8.75, 0.48, 0.37, 1.61, 0.72, -0.08, 0.12, 0.7]} \ No newline at end of file diff --git a/annotations_1/3SsvC_2wKI0_filtered.json b/annotations_1/3SsvC_2wKI0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ffba5533b04ea3a05cc8f6e241bffa5e0e36db1 --- /dev/null +++ b/annotations_1/3SsvC_2wKI0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [2.0, 3.87], [4.0, 7.75], [11.0, 12.9], [14.0, 15.52], [17.0, 18.13], [19.0, 21.02], [24.0, 27.72], [30.0, 33.88], [35.0, 37.99], [39.0, 39.58], [56.0, 56.34], [69.0, 69.74], [89.0, 89.85], [93.0, 93.56], [96.0, 107.33], [108.0, 108.26], [109.0, 109.73], [112.0, 113.24], [115.0, 115.57], [116.0, 117.63], [119.0, 121.44], [125.0, 125.15], [125.0, 125.76], [128.0, 127.97], [131.0, 132.11], [135.0, 137.39], [139.0, 139.94], [146.0, 148.27], [152.0, 152.36]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 75.88, 0.0, 0.0, 0.0, 94.95, 83.88, 70.72, 34.55, 0.0, 0.0, 0.0, 0.0, 0.0, 48.19, 0.0, 0.0, 0.0, 0.0, 0.0, 37.11, 0.0, 0.0, 0.0, 0.0, 48.56, 0.0, 33.23, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["fart", 44.16], ["laughter", 11.89], ["snicker", 8.9]], null, null, null, null, null, [["music", 47.67], ["speech", 38.34], ["guitar", 2.57]], null, null, null, null, null, [["speech", 70.87], ["music", 10.6], ["synthesizer", 3.18]], null, null, null, null, [["throbbing", 17.19], ["hum", 12.91], ["chirp tone", 11.89]], null, [["music", 36.69], ["speech", 27.25], ["thunk", 12.42]], null], "duration": [0.49, 1.87, 3.75, 1.9, 1.52, 1.13, 2.02, 3.72, 3.88, 2.99, 0.58, 0.34, 0.74, 0.85, 0.56, 11.33, 0.26, 0.73, 1.24, 0.57, 1.63, 2.44, 0.15, 0.76, -0.03, 1.11, 2.39, 0.94, 2.27, 0.36]} \ No newline at end of file diff --git a/annotations_1/3Sz7dbX2kTY_filtered.json b/annotations_1/3Sz7dbX2kTY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82c14dc890d89916f8dea7ad5277096546c15dba --- /dev/null +++ b/annotations_1/3Sz7dbX2kTY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.84], [9.0, 9.0], [19.0, 24.11], [27.0, 27.08], [27.0, 27.97], [46.0, 49.22], [51.0, 53.87], [67.0, 67.98], [69.0, 69.15], [113.0, 114.12], [115.0, 116.24], [118.0, 119.18], [120.0, 120.33], [121.0, 122.2], [125.0, 127.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.97, 0.0, 0.0, 88.1, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 0.0, 5.11, 0.08, 0.97, 3.22, 2.87, 0.98, 0.15, 1.12, 1.24, 1.18, 0.33, 1.2, 2.9]} \ No newline at end of file diff --git a/annotations_1/3TzAJdCNpZw_filtered.json b/annotations_1/3TzAJdCNpZw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ef2bde783f1098993747fb08e46fb2ceba32dd1 --- /dev/null +++ b/annotations_1/3TzAJdCNpZw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.97], [10.0, 11.75], [14.0, 15.94], [17.0, 24.07], [25.0, 28.51], [30.0, 31.75], [34.0, 35.33], [36.0, 37.57], [41.0, 41.27], [42.0, 45.67], [47.0, 48.34], [49.0, 51.36], [53.0, 56.25], [57.0, 59.97], [61.0, 66.56], [67.0, 68.13], [69.0, 72.23], [73.0, 77.75], [80.0, 80.37], [83.0, 83.32], [85.0, 96.06], [96.0, 96.11], [96.0, 98.41], [99.0, 112.04], [112.0, 112.65], [113.0, 115.43], [116.0, 117.07], [117.0, 117.66], [118.0, 122.66], [124.0, 125.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.98, 99.85, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 99.16, 100.0, 99.99, 95.51, 0.0, 97.83, 98.73, 0.0, 0.0, 91.98, 0.0, 98.27, 99.96, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.97, 1.75, 1.94, 7.07, 3.51, 1.75, 1.33, 1.57, 0.27, 3.67, 1.34, 2.36, 3.25, 2.97, 5.56, 1.13, 3.23, 4.75, 0.37, 0.32, 11.06, 0.11, 2.41, 13.04, 0.65, 2.43, 1.07, 0.66, 4.66, 1.05]} \ No newline at end of file diff --git a/annotations_1/3UbNdsZot98_filtered.json b/annotations_1/3UbNdsZot98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..416f8b4edf978c7dbaed7b123f8698918a402ded --- /dev/null +++ b/annotations_1/3UbNdsZot98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.57], [14.0, 17.56], [19.0, 19.28], [20.0, 24.31], [25.0, 30.79], [32.0, 33.4], [35.0, 35.67], [37.0, 36.95], [37.0, 39.09], [41.0, 41.54], [43.0, 43.55], [50.0, 50.7], [51.0, 52.41], [54.0, 57.99], [61.0, 71.51], [73.0, 74.02], [75.0, 77.11], [78.0, 79.57], [80.0, 81.72], [86.0, 86.31], [87.0, 90.68], [93.0, 93.77], [95.0, 96.26], [99.0, 100.21], [101.0, 102.96], [105.0, 105.04], [113.0, 114.76], [115.0, 116.01], [117.0, 121.17], [125.0, 126.35], [128.0, 128.43], [129.0, 130.72], [139.0, 138.81], [140.0, 140.07], [142.0, 141.99], [144.0, 145.1]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 78.04, 0.0, 85.72, 31.6, 0.0, 0.0, 0.0, 68.02, 0.0, 0.0, 0.0, 0.0, 78.38, 38.03, 0.0, 91.81, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 21.93], ["cattle, bovinae", 19.05], ["moo", 14.76]], null, null, null, null, null, null, null, null, null, [["speech", 22.85], ["animal", 22.41], ["livestock, farm animals, working animals", 10.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 3.56, 0.28, 4.31, 5.79, 1.4, 0.67, -0.05, 2.09, 0.54, 0.55, 0.7, 1.41, 3.99, 10.51, 1.02, 2.11, 1.57, 1.72, 0.31, 3.68, 0.77, 1.26, 1.21, 1.96, 0.04, 1.76, 1.01, 4.17, 1.35, 0.43, 1.72, -0.19, 0.07, -0.01, 1.1]} \ No newline at end of file diff --git a/annotations_1/3WfRT1c7Tz0_filtered.json b/annotations_1/3WfRT1c7Tz0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2b97f3ff68d1817c480c7188013573f51783b99 --- /dev/null +++ b/annotations_1/3WfRT1c7Tz0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.64], [29.0, 31.6], [46.0, 56.46], [57.0, 76.22], [77.0, 141.22], [142.0, 142.87], [148.0, 153.47]], "keep_status": [true, true, true, true, false, false, true], "silence_prob": [30.97, 34.02, 30.58, 34.43, 0.0, 0.0, 40.92], "audiomae_on_audioset": [[["music", 21.46], ["mains hum", 18.71], ["speech", 12.69]], [["music", 52.14], ["speech", 3.45], ["percussion", 3.33]], [["speech", 48.38], ["music", 17.19], ["didgeridoo", 2.43]], [["fart", 27.67], ["speech", 15.79], ["hum", 12.87]], null, null, [["speech", 35.57], ["hum", 14.2], ["mains hum", 8.82]]], "duration": [4.64, 2.6, 10.46, 19.22, 64.22, 0.87, 5.47]} \ No newline at end of file diff --git a/annotations_1/3WmyeqVxCV0_filtered.json b/annotations_1/3WmyeqVxCV0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fac958f04344cee639e3a5dbd05f800a21e1032f --- /dev/null +++ b/annotations_1/3WmyeqVxCV0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.28], [7.0, 10.2], [24.0, 25.69], [27.0, 32.51], [39.0, 38.99], [48.0, 53.81], [55.0, 66.78], [74.0, 76.13], [80.0, 84.96], [86.0, 98.07], [99.0, 100.62], [101.0, 103.64], [104.0, 113.27], [118.0, 148.83]], "keep_status": [false, false, false, false, false, false, true, false, true, true, false, false, true, false], "silence_prob": [0.0, 46.5, 0.0, 45.3, 0.0, 36.85, 39.14, 48.65, 43.61, 35.7, 0.0, 99.71, 39.55, 0.0], "audiomae_on_audioset": [null, [["music", 50.59], ["didgeridoo", 30.29], ["musical instrument", 3.92]], null, [["music", 52.59], ["speech", 24.37], ["quack", 5.2]], null, [["music", 35.95], ["speech", 34.14], ["sidetone", 8.33]], [["music", 19.09], ["livestock, farm animals, working animals", 15.61], ["speech", 10.17]], [["music", 60.45], ["speech", 8.44], ["didgeridoo", 2.61]], [["music", 37.22], ["hum", 11.86], ["throbbing", 10.6]], [["music", 40.29], ["whale vocalization", 15.95], ["speech", 8.04]], null, null, [["cowbell", 32.55], ["music", 27.59], ["speech", 4.46]], null], "duration": [0.28, 3.2, 1.69, 5.51, -0.01, 5.81, 11.78, 2.13, 4.96, 12.07, 1.62, 2.64, 9.27, 30.83]} \ No newline at end of file diff --git a/annotations_1/3XD34HIx-00_filtered.json b/annotations_1/3XD34HIx-00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39fbd71725c886e52519680cdb1803a35fc82a50 --- /dev/null +++ b/annotations_1/3XD34HIx-00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [12.0, 17.09], [18.0, 18.25], [19.0, 19.82], [21.0, 20.73], [24.0, 23.89], [24.0, 24.7], [35.0, 35.14], [39.0, 40.26], [43.0, 43.82], [46.0, 46.31], [49.0, 48.98], [58.0, 59.48], [67.0, 67.12], [69.0, 71.0], [82.0, 82.22], [86.0, 86.59], [88.0, 91.96], [98.0, 98.14], [101.0, 104.57], [106.0, 107.25], [111.0, 111.21], [112.0, 112.99], [119.0, 119.26], [121.0, 121.36], [124.0, 127.31], [129.0, 131.11], [137.0, 137.03]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.5, 0.0, 0.0, 36.27, 0.0, 44.07, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 73.51, 0.0], "audiomae_on_audioset": [null, [["music", 34.23], ["speech", 9.53], ["throbbing", 7.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.72], ["speech", 16.46], ["electronic music", 5.12]], null, [["music", 71.65], ["musical instrument", 4.51], ["guitar", 4.03]], null, null, null, null, null, null, null, null], "duration": [0.22, 5.09, 0.25, 0.82, -0.27, -0.11, 0.7, 0.14, 1.26, 0.82, 0.31, -0.02, 1.48, 0.12, 2.0, 0.22, 0.59, 3.96, 0.14, 3.57, 1.25, 0.21, 0.99, 0.26, 0.36, 3.31, 2.11, 0.03]} \ No newline at end of file diff --git a/annotations_1/3XZ9vtsDiuM_filtered.json b/annotations_1/3XZ9vtsDiuM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8aaf65d8d5fe2c4c66332663b0b1cd915f0b4760 --- /dev/null +++ b/annotations_1/3XZ9vtsDiuM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 27.85]], "keep_status": [false], "silence_prob": [98.1], "audiomae_on_audioset": [null], "duration": [7.85]} \ No newline at end of file diff --git a/annotations_1/3Y-pMJ4IcTY_filtered.json b/annotations_1/3Y-pMJ4IcTY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..932f7e628c2c6d4e7992fb8f23620d506443dfe8 --- /dev/null +++ b/annotations_1/3Y-pMJ4IcTY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [3.0, 3.94], [10.0, 10.94], [21.0, 46.13], [50.0, 50.21], [52.0, 59.44], [63.0, 64.25], [69.0, 69.31], [70.0, 70.93], [96.0, 95.89], [102.0, 106.15], [109.0, 113.68], [123.0, 124.66], [126.0, 128.92], [133.0, 133.19], [138.0, 138.69], [142.0, 141.59], [145.0, 147.11], [147.0, 147.92], [149.0, 151.71], [154.0, 157.57], [160.0, 173.01], [173.0, 190.09], [191.0, 191.42], [193.0, 193.97], [194.0, 194.98], [198.0, 197.87], [200.0, 201.09], [202.0, 202.47], [204.0, 204.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 99.98, 41.42, 0.0, 37.25, 0.0, 0.0, 0.0, 39.64, 0.0, 39.04, 52.1, 45.49, 64.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 65.33], ["musical instrument", 5.95], ["lullaby", 3.06]], null, [["music", 50.13], ["musical instrument", 6.72], ["guitar", 3.31]], null, null, null, [["music", 56.26], ["musical instrument", 4.43], ["speech", 1.54]], null, [["music", 54.51], ["humming", 8.51], ["mantra", 7.12]], null, [["music", 58.52], ["harmonica", 9.99], ["musical instrument", 6.13]], null, null, null, null, null, null, null, null], "duration": [0.52, 0.94, 0.94, 25.13, 0.21, 7.44, 1.25, 0.31, 0.93, -0.11, 4.15, 4.68, 1.66, 2.92, 0.19, 0.69, -0.41, 2.11, 0.92, 2.71, 3.57, 13.01, 17.09, 0.42, 0.97, 0.98, -0.13, 1.09, 0.47, 0.35]} \ No newline at end of file diff --git a/annotations_1/3a6TxHEyLdo_filtered.json b/annotations_1/3a6TxHEyLdo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a47c9d4faf4766709663589a238157e87d944a58 --- /dev/null +++ b/annotations_1/3a6TxHEyLdo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [5.0, 10.05], [11.0, 11.62], [13.0, 14.42], [14.0, 14.45], [15.0, 15.96], [17.0, 17.59], [24.0, 25.39], [29.0, 29.12], [32.0, 33.32], [54.0, 55.38], [63.0, 63.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 53.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 5.05, 0.62, 1.42, 0.45, 0.96, 0.59, 1.39, 0.12, 1.32, 1.38, 0.83]} \ No newline at end of file diff --git a/annotations_1/3bHDHRxatZg_filtered.json b/annotations_1/3bHDHRxatZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9af22034387293f6d4befd17a447892196683901 --- /dev/null +++ b/annotations_1/3bHDHRxatZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 26.91], [32.0, 38.65], [41.0, 43.31], [46.0, 55.66], [58.0, 68.47], [69.0, 70.09], [70.0, 70.66], [71.0, 82.0], [83.0, 83.42], [85.0, 85.23], [87.0, 105.88], [108.0, 112.18], [114.0, 119.16], [122.0, 122.42], [123.0, 123.18], [124.0, 124.95], [126.0, 127.3]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, true, true, false, false, false, false], "silence_prob": [29.71, 28.89, 30.44, 29.98, 29.99, 0.0, 0.0, 29.14, 0.0, 0.0, 29.58, 29.24, 31.95, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 27.6], ["music", 22.97], ["throbbing", 22.35]], [["music", 41.49], ["speech", 36.52], ["hum", 3.79]], [["music", 27.88], ["speech", 8.07], ["hum", 4.09]], [["hum", 31.86], ["mains hum", 26.1], ["speech", 18.26]], [["mains hum", 37.34], ["hum", 32.08], ["speech", 7.67]], null, null, [["music", 48.84], ["hum", 16.68], ["throbbing", 14.16]], null, null, [["music", 20.02], ["speech", 11.61], ["hum", 6.37]], [["music", 35.21], ["boom", 21.24], ["speech", 8.71]], [["music", 36.98], ["speech", 9.94], ["throbbing", 8.89]], null, null, null, null], "duration": [16.91, 6.65, 2.31, 9.66, 10.47, 1.09, 0.66, 11.0, 0.42, 0.23, 18.88, 4.18, 5.16, 0.42, 0.18, 0.95, 1.3]} \ No newline at end of file diff --git a/annotations_1/3cBAmkzKEBU_filtered.json b/annotations_1/3cBAmkzKEBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cf3ea432a265a16449212554ad62a1cf47bc690 --- /dev/null +++ b/annotations_1/3cBAmkzKEBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.09], [6.0, 6.44], [9.0, 12.09], [13.0, 13.58], [14.0, 15.87], [24.0, 28.24], [41.0, 43.24], [44.0, 47.93], [49.0, 49.18], [54.0, 53.69], [55.0, 56.02], [63.0, 62.95], [64.0, 64.62], [72.0, 73.41], [76.0, 76.11], [79.0, 79.62], [84.0, 85.28], [88.0, 88.96], [97.0, 99.08], [102.0, 104.4]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.18, 0.0, 31.15, 0.0, 0.0, 33.49, 33.71, 64.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.05, 38.09], "audiomae_on_audioset": [[["music", 59.2], ["speech", 13.66], ["outside, rural or natural", 6.41]], null, [["music", 51.6], ["synthesizer", 15.82], ["boing", 4.74]], null, null, [["music", 27.84], ["boing", 24.54], ["siren", 12.13]], [["music", 54.5], ["musical instrument", 6.41], ["synthesizer", 5.51]], null, null, null, null, null, null, null, null, null, null, null, [["music", 54.54], ["synthesizer", 10.47], ["sampler", 5.1]], [["music", 62.46], ["synthesizer", 6.72], ["boing", 5.62]]], "duration": [3.09, 0.44, 3.09, 0.58, 1.87, 4.24, 2.24, 3.93, 0.18, -0.31, 1.02, -0.05, 0.62, 1.41, 0.11, 0.62, 1.28, 0.96, 2.08, 2.4]} \ No newline at end of file diff --git a/annotations_1/3cdlwCCzujo_filtered.json b/annotations_1/3cdlwCCzujo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b417b9a50bee7e54d48cdc21fbec78a2fce7d94a --- /dev/null +++ b/annotations_1/3cdlwCCzujo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.47], [16.0, 17.02], [20.0, 20.17], [26.0, 29.51], [30.0, 30.32], [33.0, 34.3], [36.0, 40.14], [44.0, 44.32], [48.0, 49.6], [51.0, 51.65], [55.0, 55.58], [68.0, 69.09], [74.0, 76.6], [78.0, 81.06], [93.0, 95.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 29.21, 0.0, 0.0, 30.21, 0.0, 0.0, 0.0, 0.0, 0.0, 49.68, 60.6, 34.17], "audiomae_on_audioset": [null, null, null, [["music", 74.81], ["dubstep", 4.03], ["electronic music", 2.86]], null, null, [["music", 73.01], ["electronic music", 2.21], ["singing", 1.94]], null, null, null, null, null, [["whale vocalization", 17.58], ["hum", 8.4], ["throbbing", 4.89]], null, [["music", 39.45], ["boing", 5.82], ["whack, thwack", 5.52]]], "duration": [0.47, 1.02, 0.17, 3.51, 0.32, 1.3, 4.14, 0.32, 1.6, 0.65, 0.58, 1.09, 2.6, 3.06, 2.49]} \ No newline at end of file diff --git a/annotations_1/3gD5egw3-Lg_filtered.json b/annotations_1/3gD5egw3-Lg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/3gD5egw3-Lg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/3gLxv0qizPY_filtered.json b/annotations_1/3gLxv0qizPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42a28c79ae0d65b2f7f550f2ba29072fb1489a46 --- /dev/null +++ b/annotations_1/3gLxv0qizPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 18.96], [24.0, 25.05], [39.0, 39.24], [40.0, 40.51], [44.0, 46.52], [47.0, 56.05], [58.0, 60.94], [61.0, 67.76], [74.0, 79.1], [81.0, 102.37], [105.0, 120.58], [122.0, 121.59], [122.0, 124.39], [133.0, 132.97]], "keep_status": [true, false, false, false, false, true, false, true, true, true, false, false, false, false], "silence_prob": [30.55, 0.0, 0.0, 0.0, 31.51, 30.71, 29.93, 30.8, 30.15, 30.32, 30.18, 0.0, 31.06, 0.0], "audiomae_on_audioset": [[["vehicle", 15.13], ["car", 13.17], ["speech", 11.09]], null, null, null, [["speech", 62.24], ["music", 6.79], ["hum", 3.01]], [["speech", 42.57], ["hum", 14.66], ["mains hum", 8.72]], [["speech", 60.86], ["music", 23.42], ["boing", 1.03]], [["music", 32.09], ["fly, housefly", 19.69], ["insect", 8.37]], [["speech", 27.96], ["music", 17.53], ["buzz", 16.19]], [["music", 34.37], ["throbbing", 13.09], ["hum", 11.05]], [["buzz", 39.39], ["speech", 16.67], ["music", 16.21]], null, [["whale vocalization", 90.36], ["speech", 2.36], ["animal", 1.35]], null], "duration": [15.96, 1.05, 0.24, 0.51, 2.52, 9.05, 2.94, 6.76, 5.1, 21.37, 15.58, -0.41, 2.39, -0.03]} \ No newline at end of file diff --git a/annotations_1/3gSOZW-vNFk_filtered.json b/annotations_1/3gSOZW-vNFk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cca3f94c038ef084fa43b2b0c2d638483bf8a500 --- /dev/null +++ b/annotations_1/3gSOZW-vNFk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 44.98], [47.0, 61.38], [63.0, 73.14], [74.0, 74.44], [74.0, 82.53], [85.0, 98.83], [101.0, 104.9], [108.0, 144.85]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [0.0, 32.56, 37.55, 0.0, 46.97, 90.95, 99.82, 0.0], "audiomae_on_audioset": [null, [["music", 59.4], ["theremin", 9.0], ["buzz", 4.52]], [["noise", 20.24], ["music", 17.11], ["buzz", 15.9]], null, [["music", 48.36], ["didgeridoo", 26.98], ["brass instrument", 4.37]], null, null, null], "duration": [42.98, 14.38, 10.14, 0.44, 8.53, 13.83, 3.9, 36.85]} \ No newline at end of file diff --git a/annotations_1/3ge07nbMna0_filtered.json b/annotations_1/3ge07nbMna0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/3ge07nbMna0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/3ghKgAcPBC8_filtered.json b/annotations_1/3ghKgAcPBC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e96a72b5d78836f7dee25ba11d9bf94b03cc28b --- /dev/null +++ b/annotations_1/3ghKgAcPBC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 51.12], [54.0, 54.18], [55.0, 57.3], [59.0, 59.97], [63.0, 67.24], [68.0, 69.25], [72.0, 72.62], [73.0, 75.24], [76.0, 78.31], [80.0, 80.69], [81.0, 81.73], [83.0, 83.71], [87.0, 89.78], [91.0, 92.91], [94.0, 98.24], [99.0, 100.47], [101.0, 102.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 83.34, 0.0, 66.88, 0.0, 0.0, 55.67, 72.75, 0.0, 0.0, 0.0, 71.87, 0.0, 62.47, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 0.18, 2.3, 0.97, 4.24, 1.25, 0.62, 2.24, 2.31, 0.69, 0.73, 0.71, 2.78, 1.91, 4.24, 1.47, 1.17]} \ No newline at end of file diff --git a/annotations_1/3hUkHF18IrI_filtered.json b/annotations_1/3hUkHF18IrI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c92a03eaf494266fbcbad3b2960e7d4e28e36ff4 --- /dev/null +++ b/annotations_1/3hUkHF18IrI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.5], [15.0, 15.65], [17.0, 19.04], [20.0, 22.18], [27.0, 28.81], [32.0, 33.37], [34.0, 35.87], [37.0, 41.71], [43.0, 45.64], [46.0, 48.56], [53.0, 54.09], [55.0, 56.3], [59.0, 69.09], [69.0, 69.25], [69.0, 76.82], [77.0, 77.82]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.36, 0.0, 51.23, 65.67, 0.0, 0.0, 0.0, 36.47, 44.84, 56.48, 0.0, 0.0, 37.52, 0.0, 39.86, 0.0], "audiomae_on_audioset": [[["music", 47.96], ["speech", 8.96], ["musical instrument", 6.36]], null, null, null, null, null, null, [["music", 52.22], ["musical instrument", 11.21], ["wind instrument, woodwind instrument", 10.35]], [["music", 49.37], ["clarinet", 10.81], ["wind instrument, woodwind instrument", 10.35]], null, null, null, [["music", 44.46], ["synthesizer", 16.87], ["musical instrument", 9.39]], null, [["music", 47.61], ["synthesizer", 19.05], ["musical instrument", 8.63]], null], "duration": [4.5, 0.65, 2.04, 2.18, 1.81, 1.37, 1.87, 4.71, 2.64, 2.56, 1.09, 1.3, 10.09, 0.25, 7.82, 0.82]} \ No newline at end of file diff --git a/annotations_1/3i7EvW15Lyk_filtered.json b/annotations_1/3i7EvW15Lyk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19a367e178d525e24252bcd28dbbc47aadf4e549 --- /dev/null +++ b/annotations_1/3i7EvW15Lyk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.83], [16.0, 16.7], [18.0, 18.15], [25.0, 26.15], [27.0, 26.76], [28.0, 28.26], [29.0, 29.78], [43.0, 47.44], [51.0, 54.28], [57.0, 57.3], [59.0, 60.57], [61.0, 62.28], [66.0, 66.61], [81.0, 82.26], [84.0, 84.03], [90.0, 93.88], [105.0, 105.26], [117.0, 123.15], [124.0, 124.98], [126.0, 126.47], [127.0, 128.02]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.37, 36.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.15, 0.0, 31.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 32.1], ["fly, housefly", 14.18], ["insect", 10.01]], [["speech", 77.4], ["inside, small room", 2.46], ["music", 1.53]], null, null, null, null, null, null, [["cattle, bovinae", 46.31], ["moo", 29.84], ["livestock, farm animals, working animals", 10.04]], null, [["music", 36.08], ["speech", 17.85], ["groan", 8.99]], null, null, null], "duration": [0.83, 0.7, 0.15, 1.15, -0.24, 0.26, 0.78, 4.44, 3.28, 0.3, 1.57, 1.28, 0.61, 1.26, 0.03, 3.88, 0.26, 6.15, 0.98, 0.47, 1.02]} \ No newline at end of file diff --git a/annotations_1/3jWrsTACVn4_filtered.json b/annotations_1/3jWrsTACVn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f530e3767a76f8a11c0569739ebe6238ddbda745 --- /dev/null +++ b/annotations_1/3jWrsTACVn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [9.0, 9.58], [11.0, 11.52], [16.0, 16.75], [19.0, 22.15], [23.0, 23.92], [26.0, 26.37], [27.0, 28.19], [31.0, 31.29], [32.0, 33.84], [38.0, 38.13], [41.0, 41.64], [45.0, 51.51], [54.0, 59.46], [60.0, 96.04], [97.0, 98.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 62.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 79.41, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 0.58, 0.52, 0.75, 3.15, 0.92, 0.37, 1.19, 0.29, 1.84, 0.13, 0.64, 6.51, 5.46, 36.04, 1.36]} \ No newline at end of file diff --git a/annotations_1/3k7E9zkTPLA_filtered.json b/annotations_1/3k7E9zkTPLA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6decd10078f9e91df0785fff91fd4ce384eec27 --- /dev/null +++ b/annotations_1/3k7E9zkTPLA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.31], [8.0, 8.18], [17.0, 19.84], [30.0, 42.94], [44.0, 45.17], [71.0, 70.77], [71.0, 74.16], [76.0, 77.6], [79.0, 100.18], [111.0, 111.43], [112.0, 111.55], [112.0, 111.97], [112.0, 112.01], [139.0, 143.13], [146.0, 146.25], [154.0, 154.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 99.48, 58.64, 0.0, 0.0, 93.13, 0.0, 43.28, 0.0, 0.0, 0.0, 0.0, 35.83, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 53.56], ["breaking", 13.79], ["glass", 9.56]], null, null, null, null, [["music", 44.92], ["breaking", 9.74], ["shatter", 8.23]], null, null], "duration": [0.31, 0.18, 2.84, 12.94, 1.17, -0.23, 3.16, 1.6, 21.18, 0.43, -0.45, -0.03, 0.01, 4.13, 0.25, 0.48]} \ No newline at end of file diff --git a/annotations_1/3kEL1doAC4M_filtered.json b/annotations_1/3kEL1doAC4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa35a3955bf99ce7634740eb53613c0a1fc0f93e --- /dev/null +++ b/annotations_1/3kEL1doAC4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 44.64], [46.0, 56.0], [59.0, 62.34], [66.0, 78.87], [81.0, 81.06], [83.0, 139.63], [141.0, 155.19], [156.0, 156.95]], "keep_status": [false, true, true, true, false, false, true, false], "silence_prob": [0.0, 29.77, 28.76, 30.19, 0.0, 0.0, 28.88, 0.0], "audiomae_on_audioset": [null, [["music", 50.54], ["hum", 9.12], ["mains hum", 6.26]], [["reverberation", 13.74], ["music", 10.96], ["thump, thud", 9.0]], [["whale vocalization", 13.5], ["vehicle", 13.17], ["music", 8.0]], null, null, [["music", 30.93], ["cacophony", 13.76], ["didgeridoo", 6.05]], null], "duration": [0.64, 10.0, 3.34, 12.87, 0.06, 56.63, 14.19, 0.95]} \ No newline at end of file diff --git a/annotations_1/3kNqc5Hrh0M_filtered.json b/annotations_1/3kNqc5Hrh0M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f58123767e953ff777f70180ff81c12ce5041d45 --- /dev/null +++ b/annotations_1/3kNqc5Hrh0M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[79.0, 82.65], [85.0, 103.5], [107.0, 157.74]], "keep_status": [false, false, false], "silence_prob": [30.0, 32.19, 0.0], "audiomae_on_audioset": [[["music", 63.12], ["fart", 7.4], ["speech", 4.48]], [["music", 72.27], ["fly, housefly", 3.15], ["buzz", 1.8]], null], "duration": [3.65, 18.5, 50.74]} \ No newline at end of file diff --git a/annotations_1/3l3rJxuxpDo_filtered.json b/annotations_1/3l3rJxuxpDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4b31251d7db0c6300d7382cb4b277d296d012a0 --- /dev/null +++ b/annotations_1/3l3rJxuxpDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.67], [9.0, 9.49], [10.0, 13.54], [15.0, 17.96], [19.0, 20.55], [21.0, 22.42], [23.0, 23.68], [24.0, 25.39], [28.0, 28.61], [38.0, 37.89], [40.0, 40.83], [45.0, 45.45], [46.0, 46.9], [60.0, 60.25], [64.0, 65.08], [66.0, 66.85], [69.0, 73.6], [77.0, 79.17], [80.0, 81.68], [83.0, 83.42], [86.0, 87.24], [100.0, 99.98], [102.0, 102.51], [104.0, 109.05], [110.0, 114.24], [119.0, 119.92], [121.0, 121.58], [125.0, 125.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.2, 0.0, 69.07, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.28, 55.6, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 90.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.67, 0.49, 3.54, 2.96, 1.55, 1.42, 0.68, 1.39, 0.61, -0.11, 0.83, 0.45, 0.9, 0.25, 1.08, 0.85, 4.6, 2.17, 1.68, 0.42, 1.24, -0.02, 0.51, 5.05, 4.24, 0.92, 0.58, 0.34]} \ No newline at end of file diff --git a/annotations_1/3lQ1fd0hBe0_filtered.json b/annotations_1/3lQ1fd0hBe0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e70486c965ca41b19677574cda5b66b3422e562 --- /dev/null +++ b/annotations_1/3lQ1fd0hBe0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.57], [12.0, 14.44], [15.0, 16.51], [18.0, 27.18], [32.0, 48.73], [49.0, 78.26], [79.0, 86.85], [88.0, 108.63], [110.0, 112.67], [113.0, 115.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 35.05, 0.0, 98.01, 100.0, 99.87, 99.88, 99.68, 100.0, 100.0], "audiomae_on_audioset": [null, [["sidetone", 39.29], ["dial tone", 20.07], ["speech", 17.61]], null, null, null, null, null, null, null, null], "duration": [8.57, 2.44, 1.51, 9.18, 16.73, 29.26, 7.85, 20.63, 2.67, 2.6]} \ No newline at end of file diff --git a/annotations_1/3lR-s-Q5XsQ_filtered.json b/annotations_1/3lR-s-Q5XsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fd01a64786122dd3b60422b900451e1305ad1fd --- /dev/null +++ b/annotations_1/3lR-s-Q5XsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.78], [12.0, 33.64], [38.0, 42.08], [49.0, 58.78], [60.0, 68.69], [70.0, 75.95], [78.0, 80.64], [83.0, 97.5], [98.0, 98.73], [104.0, 127.94], [132.0, 147.95], [152.0, 152.74], [155.0, 155.21], [155.0, 161.11], [161.0, 161.81], [162.0, 170.72], [175.0, 191.67], [196.0, 199.99], [202.0, 209.88], [211.0, 212.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 31.34, 30.38, 30.88, 31.96, 32.08, 30.26, 31.24, 0.0, 30.85, 30.67, 0.0, 0.0, 31.5, 0.0, 31.48, 30.58, 30.4, 30.61, 0.0], "audiomae_on_audioset": [null, [["music", 65.89], ["speech", 11.31], ["foghorn", 3.81]], [["music", 63.23], ["didgeridoo", 4.86], ["salsa music", 3.12]], [["music", 81.27], ["didgeridoo", 6.56], ["reggae", 1.53]], [["music", 88.76], ["didgeridoo", 6.07], ["sampler", 0.61]], [["music", 66.85], ["didgeridoo", 25.27], ["musical instrument", 2.12]], [["music", 75.88], ["salsa music", 1.74], ["singing", 1.52]], [["music", 84.24], ["didgeridoo", 10.49], ["musical instrument", 0.65]], null, [["music", 91.05], ["christmas music", 0.85], ["christian music", 0.72]], [["music", 78.75], ["reggae", 2.19], ["singing", 1.79]], null, null, [["music", 78.9], ["didgeridoo", 6.27], ["musical instrument", 3.45]], null, [["music", 72.35], ["didgeridoo", 11.91], ["synthesizer", 1.79]], [["music", 70.96], ["didgeridoo", 3.11], ["singing", 1.76]], [["music", 56.13], ["drum machine", 5.06], ["didgeridoo", 3.77]], [["music", 65.05], ["didgeridoo", 18.18], ["drum machine", 1.72]], null], "duration": [0.78, 21.64, 4.08, 9.78, 8.69, 5.95, 2.64, 14.5, 0.73, 23.94, 15.95, 0.74, 0.21, 6.11, 0.81, 8.72, 16.67, 3.99, 7.88, 1.03]} \ No newline at end of file diff --git a/annotations_1/3lex4AAgAfs_filtered.json b/annotations_1/3lex4AAgAfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..917245a74444c873b0ae7407e9ec77ce5ce685c5 --- /dev/null +++ b/annotations_1/3lex4AAgAfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.64], [10.0, 10.94], [15.0, 16.68], [18.0, 61.5], [62.0, 67.17], [69.0, 122.35], [126.0, 126.6], [141.0, 141.2], [143.0, 143.99], [147.0, 147.33], [149.0, 151.63], [152.0, 153.18], [154.0, 154.95], [166.0, 166.02], [173.0, 173.35], [174.0, 175.85], [177.0, 178.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.82, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 85.42], ["electric shaver, electric razor", 3.81], ["fart", 1.84]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.64, 0.94, 1.68, 43.5, 5.17, 53.35, 0.6, 0.2, 0.99, 0.33, 2.63, 1.18, 0.95, 0.02, 0.35, 1.85, 1.09]} \ No newline at end of file diff --git a/annotations_1/3lxLsyE0CRo_filtered.json b/annotations_1/3lxLsyE0CRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2ad7f3f1db98736a28bdc8bd740513ae91f8c38 --- /dev/null +++ b/annotations_1/3lxLsyE0CRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.72], [8.0, 9.76], [11.0, 11.72], [14.0, 16.98], [17.0, 19.75], [38.0, 39.51], [43.0, 45.5], [51.0, 57.55], [61.0, 61.13], [63.0, 63.48], [67.0, 67.2], [68.0, 73.92], [78.0, 82.02], [83.0, 83.29], [87.0, 88.18], [90.0, 93.51], [94.0, 94.93], [96.0, 96.89], [99.0, 103.47], [110.0, 120.19]], "keep_status": [false, false, false, true, false, false, true, true, false, false, false, true, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 35.18, 35.26, 0.0, 43.0, 38.72, 0.0, 0.0, 0.0, 42.69, 40.45, 0.0, 0.0, 36.69, 0.0, 0.0, 38.58, 32.18], "audiomae_on_audioset": [null, null, null, [["rumble", 33.44], ["throbbing", 13.64], ["hum", 7.85]], [["speech", 66.73], ["rumble", 14.08], ["sidetone", 2.19]], null, [["sine wave", 16.78], ["whale vocalization", 13.78], ["music", 11.27]], [["rumble", 15.42], ["sine wave", 12.77], ["buzz", 8.49]], null, null, null, [["sine wave", 18.88], ["music", 13.39], ["rumble", 12.21]], [["speech", 49.39], ["sine wave", 24.88], ["chirp tone", 10.09]], null, null, [["music", 35.67], ["effects unit", 12.46], ["noise", 8.62]], null, null, [["speech", 27.05], ["hum", 19.73], ["sidetone", 14.73]], [["speech", 72.44], ["fart", 6.67], ["explosion", 4.83]]], "duration": [1.72, 1.76, 0.72, 2.98, 2.75, 1.51, 2.5, 6.55, 0.13, 0.48, 0.2, 5.92, 4.02, 0.29, 1.18, 3.51, 0.93, 0.89, 4.47, 10.19]} \ No newline at end of file diff --git a/annotations_1/3nVP-DM1egA_filtered.json b/annotations_1/3nVP-DM1egA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b97964e63e8b236882ebfa9b66d652f6c274703 --- /dev/null +++ b/annotations_1/3nVP-DM1egA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.34], [3.0, 3.87], [4.0, 6.49], [8.0, 9.96], [11.0, 12.11], [14.0, 16.23], [18.0, 19.75], [20.0, 21.9], [26.0, 27.9], [29.0, 33.27], [35.0, 36.37], [41.0, 41.08], [44.0, 46.82], [48.0, 51.78], [56.0, 58.06], [64.0, 64.64], [70.0, 74.73], [78.0, 78.7], [82.0, 85.31], [86.0, 86.29], [89.0, 89.04], [89.0, 93.04], [96.0, 96.48], [98.0, 112.38], [119.0, 129.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.21, 0.0, 0.0, 52.98, 0.0, 0.0, 0.0, 45.11, 0.0, 0.0, 79.94, 84.25, 83.34, 0.0, 88.46, 0.0, 89.72, 0.0, 0.0, 67.89, 0.0, 67.13, 95.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["caw", 38.45], ["crow", 26.54], ["frog", 10.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 0.87, 2.49, 1.96, 1.11, 2.23, 1.75, 1.9, 1.9, 4.27, 1.37, 0.08, 2.82, 3.78, 2.06, 0.64, 4.73, 0.7, 3.31, 0.29, 0.04, 4.04, 0.48, 14.38, 10.17]} \ No newline at end of file diff --git a/annotations_1/3oIQCt6GVcY_filtered.json b/annotations_1/3oIQCt6GVcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58a3d14bcb9327a818fb22ebf13399a273061844 --- /dev/null +++ b/annotations_1/3oIQCt6GVcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 31.92], [33.0, 49.42], [51.0, 56.03], [59.0, 68.3], [70.0, 75.86], [77.0, 76.92], [78.0, 126.44], [129.0, 147.55], [150.0, 149.54], [150.0, 150.31], [152.0, 180.17]], "keep_status": [true, false, true, true, true, false, false, true, false, false, false], "silence_prob": [30.87, 31.54, 31.85, 30.67, 30.66, 0.0, 0.0, 32.91, 0.0, 0.0, 31.14], "audiomae_on_audioset": [[["music", 26.83], ["hum", 22.46], ["mains hum", 13.17]], [["speech", 45.07], ["sidetone", 20.18], ["explosion", 7.12]], [["sidetone", 14.45], ["music", 12.28], ["explosion", 11.22]], [["speech", 46.97], ["music", 12.36], ["sidetone", 8.88]], [["speech", 34.12], ["hum", 19.46], ["music", 10.4]], null, null, [["speech", 26.88], ["music", 16.39], ["explosion", 14.12]], null, null, [["music", 59.29], ["speech", 14.5], ["throbbing", 10.99]]], "duration": [14.92, 16.42, 5.03, 9.3, 5.86, -0.08, 48.44, 18.55, -0.46, 0.31, 28.17]} \ No newline at end of file diff --git a/annotations_1/3oqt6V9aJIM_filtered.json b/annotations_1/3oqt6V9aJIM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..917f80524b6a56eeef451e50f8aa17808b8d7d35 --- /dev/null +++ b/annotations_1/3oqt6V9aJIM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 18.1], [20.0, 19.84], [27.0, 31.18], [34.0, 34.35], [36.0, 36.73], [38.0, 38.62], [41.0, 42.28], [50.0, 50.36], [52.0, 53.35], [54.0, 54.48], [57.0, 58.08], [61.0, 62.82], [67.0, 68.88], [87.0, 87.56], [102.0, 102.69], [104.0, 104.03], [106.0, 106.24], [110.0, 110.57], [119.0, 119.5], [121.0, 123.28], [126.0, 135.14], [137.0, 137.47], [139.0, 139.48], [143.0, 144.9], [152.0, 152.52], [167.0, 168.1], [170.0, 170.87], [173.0, 174.83], [177.0, 177.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.9, 0.0, 62.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.98, 35.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 46.18], ["hum", 25.22], ["music", 17.13]], null, null, null, null, null, null, null, null], "duration": [5.1, -0.16, 4.18, 0.35, 0.73, 0.62, 1.28, 0.36, 1.35, 0.48, 1.08, 1.82, 1.88, 0.56, 0.69, 0.03, 0.24, 0.57, 0.5, 2.28, 9.14, 0.47, 0.48, 1.9, 0.52, 1.1, 0.87, 1.83, 0.72]} \ No newline at end of file diff --git a/annotations_1/3pEtiCv07Yc_filtered.json b/annotations_1/3pEtiCv07Yc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f369047b40ab5f71518788920fbed1769080467d --- /dev/null +++ b/annotations_1/3pEtiCv07Yc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [7.0, 7.52], [17.0, 17.29], [19.0, 18.91], [24.0, 25.98], [31.0, 31.72], [38.0, 39.01], [45.0, 45.64], [47.0, 48.39], [52.0, 52.93], [56.0, 56.91], [59.0, 59.76], [62.0, 61.75], [64.0, 64.69], [68.0, 68.89], [72.0, 72.08], [73.0, 73.82], [77.0, 77.79], [82.0, 84.01], [85.0, 84.87], [85.0, 86.12], [87.0, 88.2], [91.0, 90.95], [94.0, 95.4], [96.0, 97.09], [99.0, 101.63], [102.0, 102.86], [105.0, 105.68], [108.0, 108.55], [111.0, 111.47], [113.0, 114.93], [117.0, 117.32], [120.0, 121.02], [123.0, 124.01], [127.0, 127.8], [129.0, 129.09], [130.0, 130.59], [132.0, 132.26], [134.0, 134.69], [136.0, 136.39], [137.0, 138.62], [141.0, 141.0], [142.0, 143.6], [144.0, 145.37], [148.0, 148.19], [152.0, 152.39], [155.0, 155.44], [158.0, 159.0], [161.0, 161.16], [166.0, 166.55], [171.0, 171.48], [176.0, 176.49], [181.0, 181.65], [183.0, 183.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 66.33], ["musical instrument", 4.67], ["theremin", 2.59]], null, null, null, null, null, null, [["music", 57.99], ["theremin", 11.43], ["musical instrument", 5.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.52, 0.29, -0.09, 1.98, 0.72, 1.01, 0.64, 1.39, 0.93, 0.91, 0.76, -0.25, 0.69, 0.89, 0.08, 0.82, 0.79, 2.01, -0.13, 1.12, 1.2, -0.05, 1.4, 1.09, 2.63, 0.86, 0.68, 0.55, 0.47, 1.93, 0.32, 1.02, 1.01, 0.8, 0.09, 0.59, 0.26, 0.69, 0.39, 1.62, 0.0, 1.6, 1.37, 0.19, 0.39, 0.44, 1.0, 0.16, 0.55, 0.48, 0.49, 0.65, 0.14]} \ No newline at end of file diff --git a/annotations_1/3reg2k9xS9k_filtered.json b/annotations_1/3reg2k9xS9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e951588702bedaeb26ca026844f183ae39bd9f1 --- /dev/null +++ b/annotations_1/3reg2k9xS9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.34], [6.0, 6.57], [7.0, 7.96], [10.0, 11.45], [18.0, 18.87], [20.0, 21.03], [25.0, 25.91], [27.0, 27.95], [31.0, 31.68], [33.0, 33.88], [36.0, 36.48], [43.0, 43.75], [47.0, 47.11], [48.0, 49.55], [51.0, 52.47], [58.0, 59.51], [63.0, 64.29], [68.0, 70.28], [73.0, 73.68], [78.0, 79.05], [83.0, 83.93], [86.0, 86.8], [92.0, 92.15], [96.0, 96.52], [100.0, 99.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.51], ["brass instrument", 14.55], ["trombone", 12.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.34, 0.57, 0.96, 1.45, 0.87, 1.03, 0.91, 0.95, 0.68, 0.88, 0.48, 0.75, 0.11, 1.55, 1.47, 1.51, 1.29, 2.28, 0.68, 1.05, 0.93, 0.8, 0.15, 0.52, -0.21]} \ No newline at end of file diff --git a/annotations_1/3s2XMsUdd1k_filtered.json b/annotations_1/3s2XMsUdd1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dec9e0a72531259fa98cd23940daa2a9a46b6837 --- /dev/null +++ b/annotations_1/3s2XMsUdd1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.94], [11.0, 57.72], [60.0, 61.21], [63.0, 113.7], [115.0, 116.36], [117.0, 118.27], [122.0, 163.75], [164.0, 164.44], [164.0, 202.44]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.94, 46.72, 1.21, 50.7, 1.36, 1.27, 41.75, 0.44, 38.44]} \ No newline at end of file diff --git a/annotations_1/3sP7UMxhGYw_filtered.json b/annotations_1/3sP7UMxhGYw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ab0bf6256ac9d09398f3b37c9e6f4860f43c6d4 --- /dev/null +++ b/annotations_1/3sP7UMxhGYw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.55], [15.0, 15.35], [16.0, 22.2], [23.0, 23.23], [24.0, 48.79], [52.0, 53.35], [55.0, 57.37], [59.0, 110.79], [113.0, 116.34], [117.0, 129.64], [131.0, 138.47], [140.0, 160.14], [162.0, 175.86], [177.0, 177.48], [178.0, 185.52], [188.0, 195.86], [198.0, 198.53], [199.0, 218.94], [219.0, 227.37], [229.0, 229.29], [230.0, 233.61]], "keep_status": [true, false, true, false, true, false, false, false, true, false, false, true, true, false, true, false, false, false, false, false, false], "silence_prob": [28.84, 0.0, 29.68, 0.0, 29.9, 0.0, 43.0, 0.0, 40.7, 35.28, 30.15, 29.48, 34.14, 0.0, 40.84, 70.02, 0.0, 64.86, 73.67, 0.0, 71.14], "audiomae_on_audioset": [[["electric shaver, electric razor", 24.53], ["music", 14.06], ["hum", 10.66]], null, [["music", 52.43], ["mains hum", 6.19], ["noise", 5.16]], null, [["music", 45.94], ["speech", 16.69], ["hum", 4.42]], null, [["hum", 29.96], ["mains hum", 21.86], ["music", 21.21]], null, [["music", 32.92], ["hum", 10.4], ["throbbing", 9.53]], [["music", 53.26], ["speech", 9.81], ["hum", 7.39]], [["mains hum", 56.9], ["hum", 28.55], ["music", 6.88]], [["music", 38.13], ["speech", 10.04], ["whack, thwack", 5.8]], [["speech", 46.27], ["music", 8.74], ["hum", 8.61]], null, [["music", 26.32], ["fly, housefly", 16.38], ["hum", 11.08]], null, null, null, null, null, null], "duration": [8.55, 0.35, 6.2, 0.23, 24.79, 1.35, 2.37, 51.79, 3.34, 12.64, 7.47, 20.14, 13.86, 0.48, 7.52, 7.86, 0.53, 19.94, 8.37, 0.29, 3.61]} \ No newline at end of file diff --git a/annotations_1/3tMHSQGSUzc_filtered.json b/annotations_1/3tMHSQGSUzc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2461b709b0866d5505b24b4fafb0c499f3b83fb --- /dev/null +++ b/annotations_1/3tMHSQGSUzc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.74], [11.0, 15.36], [17.0, 17.66], [19.0, 18.82], [20.0, 21.34], [22.0, 22.89], [24.0, 24.41], [26.0, 27.53], [28.0, 29.32], [71.0, 71.83], [76.0, 76.64], [81.0, 81.36], [82.0, 82.66], [84.0, 86.59], [89.0, 91.18], [93.0, 92.91], [95.0, 96.87], [99.0, 104.11], [105.0, 119.38], [121.0, 122.37], [124.0, 127.67], [134.0, 134.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 98.27, 0.0, 0.0, 92.48, 43.18, 0.0, 99.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 40.91], ["music", 17.29], ["mains hum", 16.39]], null, null, null], "duration": [0.74, 4.36, 0.66, -0.18, 1.34, 0.89, 0.41, 1.53, 1.32, 0.83, 0.64, 0.36, 0.66, 2.59, 2.18, -0.09, 1.87, 5.11, 14.38, 1.37, 3.67, 0.4]} \ No newline at end of file diff --git a/annotations_1/3tuV7dBxBPU_filtered.json b/annotations_1/3tuV7dBxBPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..065a1c75b7a413477428711962f22096764f1d82 --- /dev/null +++ b/annotations_1/3tuV7dBxBPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 19.79], [24.0, 29.59], [30.0, 29.62], [34.0, 36.34], [41.0, 42.72], [52.0, 53.79], [56.0, 57.87], [60.0, 63.19], [69.0, 71.02]], "keep_status": [false, false, false, true, false, false, false, false, false], "silence_prob": [32.22, 32.2, 0.0, 32.47, 0.0, 0.0, 0.0, 34.03, 32.75], "audiomae_on_audioset": [[["music", 76.6], ["bass guitar", 5.39], ["didgeridoo", 3.44]], [["music", 72.41], ["didgeridoo", 4.76], ["musical instrument", 3.43]], null, [["music", 56.16], ["musical instrument", 5.77], ["guitar", 4.24]], null, null, null, [["music", 62.95], ["guitar", 9.16], ["musical instrument", 7.19]], [["music", 65.59], ["skateboard", 3.09], ["synthesizer", 2.62]]], "duration": [13.79, 5.59, -0.38, 2.34, 1.72, 1.79, 1.87, 3.19, 2.02]} \ No newline at end of file diff --git a/annotations_1/3tvpgXQ4y4Q_filtered.json b/annotations_1/3tvpgXQ4y4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0828630396282b9e48e63b300325d5a0ced1d3b --- /dev/null +++ b/annotations_1/3tvpgXQ4y4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[134.0, 134.0], [135.0, 135.41], [137.0, 153.37], [156.0, 161.0], [163.0, 163.34], [164.0, 165.32], [167.0, 167.41]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 34.21, 33.78, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 57.41], ["whack, thwack", 19.46], ["breaking", 3.39]], [["speech", 49.45], ["hum", 6.97], ["mains hum", 5.51]], null, null, null], "duration": [0.0, 0.41, 16.37, 5.0, 0.34, 1.32, 0.41]} \ No newline at end of file diff --git a/annotations_1/3uUUeNqdMMU_filtered.json b/annotations_1/3uUUeNqdMMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77036be3893e1a9ff4241280197d7c23f242ebd7 --- /dev/null +++ b/annotations_1/3uUUeNqdMMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 33.29], [36.0, 46.45], [49.0, 49.11], [51.0, 52.44], [53.0, 54.14], [55.0, 56.91], [59.0, 59.78], [63.0, 66.5], [69.0, 69.42], [70.0, 69.99], [72.0, 72.3]], "keep_status": [true, true, false, false, false, false, false, true, false, false, false], "silence_prob": [30.76, 35.29, 0.0, 0.0, 0.0, 0.0, 0.0, 31.34, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 39.27], ["vehicle", 9.4], ["hum", 6.05]], [["music", 35.23], ["noise", 17.03], ["speech", 13.67]], null, null, null, null, null, [["speech", 38.99], ["hum", 14.13], ["throbbing", 9.85]], null, null, null], "duration": [25.29, 10.45, 0.11, 1.44, 1.14, 1.91, 0.78, 3.5, 0.42, -0.01, 0.3]} \ No newline at end of file diff --git a/annotations_1/3v-e25d34pY_filtered.json b/annotations_1/3v-e25d34pY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f2314b71a179169542c59a9ec8f37bf3edceb4a --- /dev/null +++ b/annotations_1/3v-e25d34pY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.83], [10.0, 10.07], [14.0, 17.98], [21.0, 25.02], [28.0, 29.35], [33.0, 35.06], [35.0, 37.93], [39.0, 49.4], [50.0, 53.7], [69.0, 70.95], [73.0, 90.49], [92.0, 97.43], [98.0, 98.86], [100.0, 103.99], [108.0, 108.5], [109.0, 108.55], [109.0, 109.68], [110.0, 113.27], [114.0, 116.83], [118.0, 120.39], [122.0, 124.12], [125.0, 125.61], [127.0, 128.53], [132.0, 133.3], [135.0, 135.4], [137.0, 139.56], [141.0, 166.45], [167.0, 171.66], [172.0, 174.68], [176.0, 177.9], [179.0, 182.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 99.36, 100.0, 0.0, 100.0, 77.7, 77.7, 80.46, 0.0, 77.87, 99.99, 0.0, 92.97, 0.0, 0.0, 0.0, 70.02, 77.36, 95.64, 98.44, 0.0, 0.0, 0.0, 0.0, 98.99, 58.55, 53.4, 53.28, 0.0, 53.53], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.83, 0.07, 3.98, 4.02, 1.35, 2.06, 2.93, 10.4, 3.7, 1.95, 17.49, 5.43, 0.86, 3.99, 0.5, -0.45, 0.68, 3.27, 2.83, 2.39, 2.12, 0.61, 1.53, 1.3, 0.4, 2.56, 25.45, 4.66, 2.68, 1.9, 3.09]} \ No newline at end of file diff --git a/annotations_1/3v9Pfg4Ocbg_filtered.json b/annotations_1/3v9Pfg4Ocbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee6185d6e0fbd83c12f86a672cdd3fcfc5884347 --- /dev/null +++ b/annotations_1/3v9Pfg4Ocbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.1], [6.0, 6.91], [7.0, 7.75], [19.0, 19.77], [21.0, 25.71], [28.0, 54.48]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 64.07, 30.36], "audiomae_on_audioset": [null, null, null, null, null, [["walk, footsteps", 20.75], ["noise", 14.21], ["hum", 13.81]]], "duration": [0.1, 0.91, 0.75, 0.77, 4.71, 26.48]} \ No newline at end of file diff --git a/annotations_1/3wLF8oDA3ZM_filtered.json b/annotations_1/3wLF8oDA3ZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ca7cdffd321d548af7648876e16390d2d2c556a --- /dev/null +++ b/annotations_1/3wLF8oDA3ZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.47], [36.0, 36.68], [41.0, 42.15], [42.0, 43.23], [44.0, 44.37], [53.0, 53.1], [54.0, 55.38], [57.0, 57.42], [63.0, 64.27], [70.0, 70.16], [71.0, 72.27], [73.0, 74.44], [79.0, 86.24], [88.0, 88.97], [90.0, 90.49], [91.0, 91.79], [96.0, 105.9], [107.0, 108.8], [110.0, 114.67], [117.0, 120.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.81, 0.0, 0.0, 0.0, 31.11, 0.0, 29.13, 29.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 61.68], ["throbbing", 6.38], ["didgeridoo", 6.25]], null, [["boing", 33.51], ["music", 27.96], ["speech", 5.04]], [["fly, housefly", 17.58], ["mosquito", 13.09], ["insect", 7.4]]], "duration": [0.47, 0.68, 1.15, 1.23, 0.37, 0.1, 1.38, 0.42, 1.27, 0.16, 1.27, 1.44, 7.24, 0.97, 0.49, 0.79, 9.9, 1.8, 4.67, 3.36]} \ No newline at end of file diff --git a/annotations_1/3wqXNKYn-fQ_filtered.json b/annotations_1/3wqXNKYn-fQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c26a48ec7e4f219f5520f51a33002585d247bfb7 --- /dev/null +++ b/annotations_1/3wqXNKYn-fQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.16], [10.0, 10.71], [12.0, 14.71], [16.0, 17.1], [20.0, 21.07], [25.0, 25.51], [28.0, 29.57], [30.0, 30.77], [32.0, 32.05], [33.0, 34.21], [35.0, 37.08], [41.0, 42.53], [44.0, 44.17], [45.0, 45.82], [48.0, 49.59], [50.0, 52.08], [54.0, 54.65], [56.0, 55.83], [57.0, 58.09], [60.0, 60.79], [64.0, 64.72], [67.0, 68.4], [74.0, 74.97], [76.0, 78.21], [85.0, 87.44], [89.0, 90.73], [94.0, 95.34], [96.0, 97.34], [98.0, 99.22], [100.0, 102.02], [103.0, 104.14], [105.0, 105.68], [109.0, 110.42], [111.0, 117.02], [118.0, 119.15], [120.0, 121.68], [123.0, 126.79], [128.0, 129.2], [132.0, 131.79], [135.0, 136.63], [138.0, 138.96], [141.0, 143.8], [144.0, 144.93], [147.0, 149.62], [150.0, 151.28]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 42.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.71, 0.0, 0.0, 0.0, 0.0, 45.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.21, 38.54, 0.0, 0.0, 0.0, 0.0, 36.27, 0.0, 0.0, 0.0, 44.6, 0.0, 0.0, 50.66, 0.0, 0.0, 0.0, 0.0, 33.5, 0.0, 31.98, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 30.53], ["speech", 28.87], ["hum", 10.57]], null, null, null, null, null, null, null, [["speech", 69.09], ["busy signal", 4.4], ["dog", 2.97]], null, null, null, null, [["speech", 38.62], ["music", 10.76], ["sidetone", 9.42]], null, null, null, null, null, null, null, null, [["speech", 58.49], ["tuning fork", 5.33], ["sidetone", 5.19]], null, null, null, null, [["music", 26.88], ["burping, eructation", 9.78], ["speech", 8.91]], null, null, null, [["speech", 56.44], ["singing bowl", 14.72], ["music", 6.26]], null, null, null, null, null, null, null, [["speech", 32.5], ["music", 12.68], ["radio", 8.27]], null, [["music", 39.03], ["speech", 11.74], ["hum", 2.82]], null], "duration": [0.16, 0.71, 2.71, 1.1, 1.07, 0.51, 1.57, 0.77, 0.05, 1.21, 2.08, 1.53, 0.17, 0.82, 1.59, 2.08, 0.65, -0.17, 1.09, 0.79, 0.72, 1.4, 0.97, 2.21, 2.44, 1.73, 1.34, 1.34, 1.22, 2.02, 1.14, 0.68, 1.42, 6.02, 1.15, 1.68, 3.79, 1.2, -0.21, 1.63, 0.96, 2.8, 0.93, 2.62, 1.28]} \ No newline at end of file diff --git a/annotations_1/3x0UxzeZBso_filtered.json b/annotations_1/3x0UxzeZBso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c0947848d68e4d1a0c4389dec2ddd9f0bc18f0c --- /dev/null +++ b/annotations_1/3x0UxzeZBso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [5.0, 11.21], [12.0, 15.15], [17.0, 20.16], [22.0, 22.03], [23.0, 24.63], [26.0, 26.3], [27.0, 28.83], [30.0, 32.58], [34.0, 34.82], [37.0, 43.09], [45.0, 46.87], [48.0, 51.12], [52.0, 54.04], [55.0, 55.44], [59.0, 59.9], [61.0, 64.39], [65.0, 64.93], [67.0, 69.94], [71.0, 77.6], [78.0, 109.59], [110.0, 119.35], [120.0, 122.17], [123.0, 128.22], [128.0, 128.44], [128.0, 128.49], [129.0, 130.62], [132.0, 182.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 51.94, 81.71, 99.36, 0.0, 0.0, 0.0, 0.0, 49.18, 0.0, 39.94, 0.0, 48.69, 68.02, 0.0, 0.0, 31.2, 0.0, 28.61, 28.61, 0.0, 35.22, 41.74, 33.5, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 64.36], ["whale vocalization", 4.14], ["synthetic singing", 2.79]], null, [["whale vocalization", 42.87], ["speech", 15.78], ["music", 11.68]], null, [["didgeridoo", 23.97], ["music", 17.68], ["hum", 13.46]], null, null, null, [["music", 41.59], ["speech", 25.26], ["hum", 4.28]], null, [["music", 28.82], ["sonar", 16.44], ["hum", 15.95]], [["breaking", 60.03], ["music", 11.67], ["whack, thwack", 6.34]], null, [["burping, eructation", 55.87], ["music", 10.5], ["speech", 4.43]], [["music", 26.49], ["speech", 19.43], ["didgeridoo", 10.07]], [["didgeridoo", 30.99], ["music", 15.39], ["fart", 5.86]], null, null, null, null], "duration": [0.64, 6.21, 3.15, 3.16, 0.03, 1.63, 0.3, 1.83, 2.58, 0.82, 6.09, 1.87, 3.12, 2.04, 0.44, 0.9, 3.39, -0.07, 2.94, 6.6, 31.59, 9.35, 2.17, 5.22, 0.44, 0.49, 1.62, 50.82]} \ No newline at end of file diff --git a/annotations_1/3xtKas3-ctQ_filtered.json b/annotations_1/3xtKas3-ctQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..412275367dc98a5c200d017e6b555d552a108c66 --- /dev/null +++ b/annotations_1/3xtKas3-ctQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 27.11], [34.0, 35.83], [38.0, 39.23], [40.0, 42.63], [46.0, 50.45], [51.0, 51.17], [52.0, 51.95], [53.0, 55.16], [59.0, 60.64], [62.0, 62.85], [67.0, 68.07], [80.0, 80.64], [86.0, 88.55], [90.0, 90.86], [92.0, 96.06], [99.0, 101.8], [102.0, 103.47], [105.0, 106.81], [107.0, 107.62], [109.0, 109.98], [113.0, 112.9], [137.0, 137.71], [138.0, 139.14], [140.0, 140.98], [152.0, 153.3]], "keep_status": [true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.28, 0.0, 0.0, 29.71, 28.97, 0.0, 0.0, 42.67, 0.0, 0.0, 0.0, 0.0, 83.16, 0.0, 70.16, 65.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 33.53], ["vehicle", 6.97], ["car", 5.86]], null, null, [["mains hum", 29.77], ["hum", 28.41], ["rumble", 12.83]], [["music", 34.36], ["speech", 24.69], ["whip", 4.94]], null, null, [["speech", 26.71], ["fart", 9.5], ["fly, housefly", 8.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [18.11, 1.83, 1.23, 2.63, 4.45, 0.17, -0.05, 2.16, 1.64, 0.85, 1.07, 0.64, 2.55, 0.86, 4.06, 2.8, 1.47, 1.81, 0.62, 0.98, -0.1, 0.71, 1.14, 0.98, 1.3]} \ No newline at end of file diff --git a/annotations_1/3yVGaKmJrUY_filtered.json b/annotations_1/3yVGaKmJrUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c574b30a402b76d4f83dea3c20c8e2401c08078 --- /dev/null +++ b/annotations_1/3yVGaKmJrUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [5.0, 4.97], [9.0, 9.42], [19.0, 22.94], [25.0, 25.15], [26.0, 26.43], [38.0, 38.55], [43.0, 43.28], [45.0, 46.48], [58.0, 58.62], [59.0, 60.4], [63.0, 64.1], [65.0, 65.84], [74.0, 76.49], [91.0, 91.49], [94.0, 95.27], [96.0, 97.28], [98.0, 98.0], [101.0, 101.29], [106.0, 106.08], [114.0, 115.06], [118.0, 121.27], [122.0, 122.39], [123.0, 124.16], [125.0, 127.89], [129.0, 132.27], [135.0, 135.5], [142.0, 144.32], [147.0, 147.95], [149.0, 166.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 73.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0, 44.55, 59.51, 0.0, 41.85, 0.0, 29.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 16.4], ["speech", 13.28], ["mains hum", 9.1]], null, null, [["music", 65.88], ["musical instrument", 4.53], ["guitar", 3.83]], null, [["music", 44.46], ["whack, thwack", 26.94], ["boing", 3.3]]], "duration": [0.24, -0.03, 0.42, 3.94, 0.15, 0.43, 0.55, 0.28, 1.48, 0.62, 1.4, 1.1, 0.84, 2.49, 0.49, 1.27, 1.28, 0.0, 0.29, 0.08, 1.06, 3.27, 0.39, 1.16, 2.89, 3.27, 0.5, 2.32, 0.95, 17.46]} \ No newline at end of file diff --git a/annotations_1/3yjYPrkMGdk_filtered.json b/annotations_1/3yjYPrkMGdk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20c929fd4d1106d8453abc4575a64286bc43bc1c --- /dev/null +++ b/annotations_1/3yjYPrkMGdk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.44], [37.0, 37.71], [41.0, 41.5], [53.0, 78.41], [79.0, 82.17], [84.0, 85.48], [89.0, 99.25], [102.0, 109.29], [111.0, 113.27], [114.0, 115.92], [117.0, 118.2], [119.0, 118.81], [119.0, 126.12], [126.0, 126.37], [126.0, 159.75], [161.0, 162.16], [165.0, 170.46]], "keep_status": [false, false, false, false, true, false, true, true, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 28.88, 40.43, 0.0, 32.6, 28.86, 36.49, 0.0, 0.0, 0.0, 28.65, 0.0, 0.0, 0.0, 39.4], "audiomae_on_audioset": [null, null, null, [["music", 45.37], ["throbbing", 14.98], ["cacophony", 10.14]], [["music", 28.61], ["sine wave", 14.99], ["chirp tone", 9.39]], null, [["noise", 24.1], ["music", 14.43], ["hum", 12.9]], [["speech", 37.12], ["vehicle", 16.14], ["car", 13.91]], [["vehicle", 33.75], ["car", 13.83], ["music", 9.71]], null, null, null, [["vehicle", 59.76], ["car", 17.7], ["skidding", 8.66]], null, null, null, [["music", 20.62], ["buzz", 13.67], ["mains hum", 10.18]]], "duration": [0.44, 0.71, 0.5, 25.41, 3.17, 1.48, 10.25, 7.29, 2.27, 1.92, 1.2, -0.19, 7.12, 0.37, 33.75, 1.16, 5.46]} \ No newline at end of file diff --git a/annotations_1/4-3B-Y9bM0M_filtered.json b/annotations_1/4-3B-Y9bM0M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dcc11c1605c5830d4e448c50324146f0d457918 --- /dev/null +++ b/annotations_1/4-3B-Y9bM0M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.07], [15.0, 26.94], [27.0, 28.92], [29.0, 85.77], [88.0, 89.06]], "keep_status": [true, false, false, false, false], "silence_prob": [45.95, 56.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 14.54], ["speech", 12.85], ["sine wave", 10.32]], null, null, null, null], "duration": [7.07, 11.94, 1.92, 56.77, 1.06]} \ No newline at end of file diff --git a/annotations_1/4-BWFsE_TQE_filtered.json b/annotations_1/4-BWFsE_TQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f49932ad69db8b22e8a76a18fd3d22aedeb61da8 --- /dev/null +++ b/annotations_1/4-BWFsE_TQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [5.0, 9.09], [10.0, 10.12], [19.0, 20.71], [23.0, 23.14], [25.0, 27.3], [28.0, 28.76], [31.0, 36.19], [37.0, 38.35], [39.0, 45.91], [48.0, 47.95], [50.0, 53.7], [54.0, 54.72], [58.0, 66.92], [67.0, 68.82], [69.0, 72.55], [74.0, 74.71], [76.0, 78.19], [80.0, 81.09], [86.0, 87.29], [92.0, 94.02], [97.0, 98.31], [100.0, 102.15], [105.0, 105.73], [108.0, 109.51], [111.0, 113.78], [115.0, 116.04], [118.0, 119.85], [120.0, 123.75], [139.0, 139.23], [141.0, 141.91], [142.0, 145.13], [147.0, 148.61], [150.0, 151.5], [153.0, 160.25], [162.0, 162.04], [163.0, 194.8], [195.0, 194.95], [195.0, 195.17], [197.0, 201.5], [207.0, 209.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.14, 0.0, 0.0, 0.0, 99.98, 0.0, 78.38, 0.0, 63.64, 0.0, 47.23, 0.0, 60.6, 0.0, 36.67, 0.0, 52.51, 0.0, 0.0, 58.13, 0.0, 72.46, 0.0, 0.0, 84.25, 0.0, 0.0, 32.65, 0.0, 0.0, 59.07, 0.0, 0.0, 28.8, 0.0, 0.0, 0.0, 0.0, 29.28, 29.93], "audiomae_on_audioset": [null, [["sine wave", 60.76], ["speech", 9.76], ["tuning fork", 7.84]], null, null, null, null, null, null, null, null, null, [["speech", 42.5], ["cough", 17.58], ["music", 13.37]], null, null, null, [["didgeridoo", 12.24], ["music", 9.3], ["whale vocalization", 7.83]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.75], ["thunk", 2.75], ["inside, small room", 1.82]], null, null, null, null, null, [["music", 55.81], ["speech", 18.44], ["whack, thwack", 3.86]], null, null, null, null, [["music", 69.1], ["speech", 5.85], ["cacophony", 2.65]], [["speech", 42.17], ["music", 35.9], ["didgeridoo", 3.04]]], "duration": [0.84, 4.09, 0.12, 1.71, 0.14, 2.3, 0.76, 5.19, 1.35, 6.91, -0.05, 3.7, 0.72, 8.92, 1.82, 3.55, 0.71, 2.19, 1.09, 1.29, 2.02, 1.31, 2.15, 0.73, 1.51, 2.78, 1.04, 1.85, 3.75, 0.23, 0.91, 3.13, 1.61, 1.5, 7.25, 0.04, 31.8, -0.05, 0.17, 4.5, 2.02]} \ No newline at end of file diff --git a/annotations_1/4-hiooEmi-I_filtered.json b/annotations_1/4-hiooEmi-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9d4dc3a69989ed146c7f0705da0bdef6f254576 --- /dev/null +++ b/annotations_1/4-hiooEmi-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[144.0, 145.86], [147.0, 151.65]], "keep_status": [false, true], "silence_prob": [0.0, 31.15], "audiomae_on_audioset": [null, [["cattle, bovinae", 16.92], ["roaring cats (lions, tigers)", 14.41], ["livestock, farm animals, working animals", 11.33]]], "duration": [1.86, 4.65]} \ No newline at end of file diff --git a/annotations_1/40JQrUnvKUw_filtered.json b/annotations_1/40JQrUnvKUw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c87da5cdce7a9265fd5eba907c3dcef71775792 --- /dev/null +++ b/annotations_1/40JQrUnvKUw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.53], [5.0, 12.12], [14.0, 14.64], [17.0, 46.09], [48.0, 49.67], [52.0, 52.15], [63.0, 69.52], [72.0, 73.25], [75.0, 75.19], [76.0, 79.25], [85.0, 85.06], [88.0, 87.98], [96.0, 96.28], [97.0, 97.48], [98.0, 98.66], [108.0, 109.48], [112.0, 113.41], [116.0, 117.37], [127.0, 126.72], [131.0, 131.43], [134.0, 139.5]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.33, 62.58, 0.0, 35.42, 0.0, 0.0, 57.72, 0.0, 0.0, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.74], "audiomae_on_audioset": [[["speech", 46.23], ["tuning fork", 13.19], ["dial tone", 12.76]], null, null, [["music", 50.64], ["musical instrument", 9.79], ["effects unit", 4.62]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 41.75], ["mains hum", 24.07], ["speech", 10.4]]], "duration": [2.53, 7.12, 0.64, 29.09, 1.67, 0.15, 6.52, 1.25, 0.19, 3.25, 0.06, -0.02, 0.28, 0.48, 0.66, 1.48, 1.41, 1.37, -0.28, 0.43, 5.5]} \ No newline at end of file diff --git a/annotations_1/40NyqKryTUU_filtered.json b/annotations_1/40NyqKryTUU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a6f8bfeee2af9ff060c595b671fb56025971e40 --- /dev/null +++ b/annotations_1/40NyqKryTUU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.12], [8.0, 12.18], [22.0, 23.46], [24.0, 24.56], [37.0, 37.76], [40.0, 40.64], [61.0, 61.4], [68.0, 72.89], [78.0, 79.93], [82.0, 84.21], [84.0, 84.94], [85.0, 85.83], [86.0, 89.48], [94.0, 100.72], [103.0, 104.79], [106.0, 106.08], [107.0, 108.16], [115.0, 115.13], [118.0, 120.09], [129.0, 129.78], [134.0, 134.3], [143.0, 143.38]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.58, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 39.24, 0.0, 0.0, 37.68, 32.56, 0.0, 0.0, 0.0, 0.0, 43.28, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 48.66], ["synthesizer", 4.72], ["boing", 4.32]], null, null, null, null, null, null, null, [["music", 56.48], ["didgeridoo", 8.36], ["boing", 4.76]], null, null, [["music", 19.47], ["speech", 15.98], ["musical instrument", 7.25]], [["music", 49.92], ["boing", 9.23], ["speech", 5.43]], null, null, null, null, [["boing", 45.29], ["music", 39.25], ["musical instrument", 3.46]], null, null, null], "duration": [1.12, 4.18, 1.46, 0.56, 0.76, 0.64, 0.4, 4.89, 1.93, 2.21, 0.94, 0.83, 3.48, 6.72, 1.79, 0.08, 1.16, 0.13, 2.09, 0.78, 0.3, 0.38]} \ No newline at end of file diff --git a/annotations_1/40p6dkKil_8_filtered.json b/annotations_1/40p6dkKil_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7ab46104b5090935a52f4c8ea91a3cc83c7a107 --- /dev/null +++ b/annotations_1/40p6dkKil_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 53.96], [55.0, 58.7], [66.0, 66.95], [73.0, 93.72], [95.0, 97.48], [99.0, 99.39], [101.0, 103.44], [104.0, 104.84]], "keep_status": [false, false, false, true, true, false, true, false], "silence_prob": [0.0, 32.39, 0.0, 30.18, 34.01, 0.0, 35.19, 0.0], "audiomae_on_audioset": [null, [["radio", 41.04], ["sidetone", 18.17], ["speech", 16.85]], null, [["vehicle", 27.4], ["car", 9.72], ["hum", 8.02]], [["music", 42.28], ["throbbing", 11.99], ["noise", 4.94]], null, [["fly, housefly", 29.04], ["insect", 14.48], ["bee, wasp, etc.", 5.81]], null], "duration": [-0.04, 3.7, 0.95, 20.72, 2.48, 0.39, 2.44, 0.84]} \ No newline at end of file diff --git a/annotations_1/40ryheWGyZY_filtered.json b/annotations_1/40ryheWGyZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..790af7b193eedeca8ff772c66ba7035f33099810 --- /dev/null +++ b/annotations_1/40ryheWGyZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.0], [5.0, 6.22], [8.0, 8.99], [11.0, 13.22], [15.0, 16.58], [18.0, 19.75], [21.0, 21.37], [29.0, 30.59], [32.0, 34.96], [36.0, 37.1], [38.0, 40.27], [42.0, 44.02], [45.0, 45.5], [47.0, 48.19], [50.0, 53.2], [54.0, 58.08], [59.0, 61.62], [63.0, 63.26], [65.0, 66.75], [68.0, 68.45], [74.0, 79.76], [81.0, 84.35], [86.0, 88.42], [90.0, 91.57], [92.0, 99.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, true, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 59.07, 0.0, 0.0, 0.0, 0.0, 78.72, 0.0, 45.3, 36.65, 0.0, 0.0, 31.7, 32.74, 32.64, 0.0, 0.0, 0.0, 32.61, 35.6, 35.68, 0.0, 33.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 21.71], ["sidetone", 18.31], ["synthesizer", 8.32]], [["hum", 34.59], ["throbbing", 16.52], ["mains hum", 10.26]], null, null, [["hum", 44.91], ["mains hum", 26.05], ["throbbing", 6.05]], [["hum", 27.57], ["mains hum", 24.3], ["throbbing", 7.76]], [["fly, housefly", 15.12], ["bee, wasp, etc.", 12.02], ["speech", 11.98]], null, null, null, [["hum", 31.23], ["throbbing", 27.24], ["mains hum", 21.55]], [["hum", 27.05], ["music", 20.1], ["throbbing", 7.47]], [["hum", 33.46], ["throbbing", 20.7], ["music", 11.92]], null, [["hum", 32.95], ["throbbing", 22.03], ["speech", 17.23]]], "duration": [0.0, 1.22, 0.99, 2.22, 1.58, 1.75, 0.37, 1.59, 2.96, 1.1, 2.27, 2.02, 0.5, 1.19, 3.2, 4.08, 2.62, 0.26, 1.75, 0.45, 5.76, 3.35, 2.42, 1.57, 7.2]} \ No newline at end of file diff --git a/annotations_1/41BnkhKxWHA_filtered.json b/annotations_1/41BnkhKxWHA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1b2fcd396ab99ef0eb23decd0f54b640cee5cc2 --- /dev/null +++ b/annotations_1/41BnkhKxWHA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [7.0, 7.72], [9.0, 9.71], [14.0, 16.78], [17.0, 18.69], [30.0, 44.25], [47.0, 60.02], [62.0, 67.71], [71.0, 78.24], [82.0, 83.44], [92.0, 94.0], [99.0, 111.35]], "keep_status": [false, false, false, true, false, true, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 44.66, 0.0, 30.18, 31.1, 29.97, 33.38, 0.0, 39.55, 49.73], "audiomae_on_audioset": [null, null, null, [["music", 53.63], ["speech", 10.06], ["didgeridoo", 5.51]], null, [["speech", 47.29], ["music", 12.71], ["crowd", 4.67]], [["music", 36.15], ["speech", 29.18], ["buzz", 4.75]], [["mains hum", 27.89], ["hum", 22.37], ["music", 21.11]], [["music", 34.46], ["synthesizer", 12.15], ["musical instrument", 7.34]], null, [["speech", 7.45], ["animal", 7.3], ["livestock, farm animals, working animals", 7.3]], [["cough", 36.45], ["speech", 29.11], ["throat clearing", 10.06]]], "duration": [0.45, 0.72, 0.71, 2.78, 1.69, 14.25, 13.02, 5.71, 7.24, 1.44, 2.0, 12.35]} \ No newline at end of file diff --git a/annotations_1/43OVm86-4rU_filtered.json b/annotations_1/43OVm86-4rU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f77fb3081036cabfe5121872b8396b2226cecc3f --- /dev/null +++ b/annotations_1/43OVm86-4rU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.68], [11.0, 17.78], [27.0, 26.87], [40.0, 40.32], [43.0, 46.26], [55.0, 63.51], [65.0, 68.77], [73.0, 102.14], [108.0, 116.43], [118.0, 120.06], [126.0, 127.75], [131.0, 132.29], [134.0, 135.14], [137.0, 160.76], [167.0, 171.24], [173.0, 173.13], [173.0, 177.82], [179.0, 182.49], [183.0, 199.91], [200.0, 232.56], [239.0, 245.35]], "keep_status": [false, true, false, false, true, false, true, false, false, true, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 31.27, 0.0, 0.0, 29.6, 29.79, 32.16, 29.19, 31.4, 32.7, 0.0, 0.0, 0.0, 28.47, 29.02, 0.0, 29.7, 30.27, 31.22, 0.0, 31.58], "audiomae_on_audioset": [null, [["music", 39.57], ["smash, crash", 10.55], ["clang", 6.67]], null, null, [["music", 23.68], ["mains hum", 17.24], ["hum", 8.88]], [["music", 40.97], ["didgeridoo", 28.07], ["livestock, farm animals, working animals", 1.91]], [["music", 42.2], ["didgeridoo", 7.45], ["cattle, bovinae", 6.52]], [["music", 69.47], ["electronic music", 6.84], ["throbbing", 3.57]], [["music", 66.73], ["theremin", 7.82], ["throbbing", 3.49]], [["music", 12.54], ["boing", 12.33], ["throbbing", 10.34]], null, null, null, [["music", 62.15], ["electronic music", 9.76], ["throbbing", 6.14]], [["throbbing", 28.81], ["music", 27.4], ["hum", 11.51]], null, [["music", 44.98], ["speech", 27.69], ["sidetone", 6.08]], [["music", 37.05], ["hum", 18.75], ["throbbing", 18.01]], [["music", 35.5], ["throbbing", 22.41], ["hum", 11.75]], null, [["music", 68.2], ["didgeridoo", 4.88], ["sampler", 3.51]]], "duration": [0.68, 6.78, -0.13, 0.32, 3.26, 8.51, 3.77, 29.14, 8.43, 2.06, 1.75, 1.29, 1.14, 23.76, 4.24, 0.13, 4.82, 3.49, 16.91, 32.56, 6.35]} \ No newline at end of file diff --git a/annotations_1/44BkOqV2jDc_filtered.json b/annotations_1/44BkOqV2jDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56ee2bbfde7d169686c72e1d797d3e694ae930e5 --- /dev/null +++ b/annotations_1/44BkOqV2jDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.11], [4.0, 7.35], [8.0, 8.14], [8.0, 8.94], [10.0, 10.83], [14.0, 15.03], [16.0, 17.34], [20.0, 20.95], [22.0, 22.17], [30.0, 30.01], [37.0, 38.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.11, 3.35, 0.14, 0.94, 0.83, 1.03, 1.34, 0.95, 0.17, 0.01, 1.4]} \ No newline at end of file diff --git a/annotations_1/44MohOiWwnA_filtered.json b/annotations_1/44MohOiWwnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cafb5c863671ece7d0b259a8a276e1d12c07d77c --- /dev/null +++ b/annotations_1/44MohOiWwnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 42.23], [46.0, 66.51], [69.0, 115.92], [117.0, 117.81], [122.0, 122.57], [124.0, 132.66]], "keep_status": [false, false, false, false, false, true], "silence_prob": [29.24, 28.9, 0.0, 0.0, 0.0, 29.4], "audiomae_on_audioset": [[["music", 44.63], ["throbbing", 14.57], ["hum", 13.9]], [["hum", 35.39], ["music", 30.0], ["throbbing", 20.77]], null, null, null, [["whack, thwack", 32.41], ["music", 18.36], ["speech", 15.77]]], "duration": [19.23, 20.51, 46.92, 0.81, 0.57, 8.66]} \ No newline at end of file diff --git a/annotations_1/480Hw45m9v8_filtered.json b/annotations_1/480Hw45m9v8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d5764171ad164c5c446c0698acf6dee0c483a44 --- /dev/null +++ b/annotations_1/480Hw45m9v8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.32], [15.0, 29.4], [36.0, 50.73], [59.0, 59.95], [63.0, 63.15], [70.0, 70.21], [81.0, 82.7], [85.0, 85.36], [93.0, 94.53], [95.0, 95.89], [98.0, 104.31], [106.0, 109.66], [110.0, 110.89], [112.0, 112.58], [113.0, 115.01], [117.0, 125.74], [131.0, 131.58], [133.0, 133.52], [134.0, 134.76], [136.0, 140.98], [142.0, 144.54], [148.0, 148.39]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [30.87, 30.93, 31.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.86, 31.39, 0.0, 0.0, 33.26, 32.32, 0.0, 0.0, 0.0, 31.02, 34.77, 0.0], "audiomae_on_audioset": [[["music", 61.17], ["hip hop music", 8.8], ["static", 4.29]], [["music", 88.17], ["hip hop music", 2.68], ["sampler", 0.89]], [["speech", 32.3], ["sidetone", 17.02], ["whack, thwack", 12.28]], null, null, null, null, null, null, null, [["music", 26.77], ["boing", 21.34], ["hum", 9.93]], [["music", 64.34], ["speech", 4.37], ["singing", 2.11]], null, null, [["music", 74.31], ["didgeridoo", 2.09], ["electronic music", 1.41]], [["music", 68.93], ["boing", 7.76], ["synthetic singing", 2.65]], null, null, null, [["music", 46.9], ["throbbing", 25.11], ["hum", 7.31]], [["music", 29.71], ["speech", 19.42], ["didgeridoo", 8.54]], null], "duration": [3.32, 14.4, 14.73, 0.95, 0.15, 0.21, 1.7, 0.36, 1.53, 0.89, 6.31, 3.66, 0.89, 0.58, 2.01, 8.74, 0.58, 0.52, 0.76, 4.98, 2.54, 0.39]} \ No newline at end of file diff --git a/annotations_1/485KJTKt6RE_filtered.json b/annotations_1/485KJTKt6RE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a26207a1180a583ca4de833fb758f206357ff59 --- /dev/null +++ b/annotations_1/485KJTKt6RE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 62.14], [79.0, 79.05], [93.0, 92.96], [95.0, 96.72], [97.0, 97.5]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [1.14, 0.05, -0.04, 1.72, 0.5]} \ No newline at end of file diff --git a/annotations_1/4A-hmyHNaxM_filtered.json b/annotations_1/4A-hmyHNaxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e3be0a25ce290131fbcbd6b6d5b3af3172eb9b8 --- /dev/null +++ b/annotations_1/4A-hmyHNaxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.8], [16.0, 18.01], [19.0, 31.45], [34.0, 62.48], [63.0, 64.35], [67.0, 68.17], [74.0, 75.19], [76.0, 81.06], [81.0, 82.46], [85.0, 85.28], [86.0, 93.19], [95.0, 103.44], [106.0, 116.31], [117.0, 118.71], [119.0, 120.92], [121.0, 123.74], [125.0, 126.82], [128.0, 128.16], [129.0, 129.34], [130.0, 130.94], [131.0, 132.19], [134.0, 136.85], [137.0, 144.32], [145.0, 145.27], [146.0, 152.95], [156.0, 156.3], [157.0, 160.96], [161.0, 163.85], [165.0, 171.37]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 80.46, 47.01, 61.97, 0.0, 0.0, 0.0, 30.79, 0.0, 0.0, 32.13, 50.06, 46.29, 0.0, 0.0, 50.21, 0.0, 0.0, 0.0, 0.0, 0.0, 61.97, 42.17, 0.0, 64.75, 0.0, 42.91, 32.52, 64.52], "audiomae_on_audioset": [null, null, [["speech", 77.08], ["effects unit", 2.17], ["music", 2.01]], null, null, null, null, [["hum", 32.08], ["music", 14.06], ["throbbing", 14.03]], null, null, [["speech", 41.53], ["noise", 32.85], ["music", 7.34]], null, [["whale vocalization", 35.17], ["hum", 16.2], ["throbbing", 11.06]], null, null, null, null, null, null, null, null, null, [["sidetone", 41.16], ["speech", 31.89], ["hum", 9.55]], null, null, null, [["effects unit", 21.66], ["distortion", 10.93], ["music", 10.83]], [["speech", 65.66], ["dial tone", 7.88], ["whale vocalization", 7.31]], null], "duration": [1.8, 2.01, 12.45, 28.48, 1.35, 1.17, 1.19, 5.06, 1.46, 0.28, 7.19, 8.44, 10.31, 1.71, 1.92, 2.74, 1.82, 0.16, 0.34, 0.94, 1.19, 2.85, 7.32, 0.27, 6.95, 0.3, 3.96, 2.85, 6.37]} \ No newline at end of file diff --git a/annotations_1/4At_9_s2lDY_filtered.json b/annotations_1/4At_9_s2lDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e801fd03f61493a3ff1d18380fb60f6afa4a93e4 --- /dev/null +++ b/annotations_1/4At_9_s2lDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.45], [21.0, 23.38], [26.0, 28.93], [29.0, 29.03], [30.0, 72.32], [77.0, 80.91], [82.0, 82.63], [84.0, 89.75], [90.0, 94.86]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.09, 28.99, 0.0, 0.0, 28.98, 0.0, 29.05, 29.29], "audiomae_on_audioset": [null, [["music", 45.81], ["dubstep", 29.42], ["electronic music", 11.16]], [["music", 59.38], ["reggae", 12.36], ["dubstep", 5.74]], null, null, [["music", 73.07], ["didgeridoo", 6.06], ["rattle (instrument)", 1.55]], null, [["music", 95.52], ["swing music", 0.5], ["didgeridoo", 0.44]], [["music", 65.88], ["didgeridoo", 3.37], ["reggae", 3.23]]], "duration": [0.45, 2.38, 2.93, 0.03, 42.32, 3.91, 0.63, 5.75, 4.86]} \ No newline at end of file diff --git a/annotations_1/4C7VpH9VvC0_filtered.json b/annotations_1/4C7VpH9VvC0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9f1c5f3ee2854852a5f34f6252459b941f47e75 --- /dev/null +++ b/annotations_1/4C7VpH9VvC0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.88], [11.0, 11.33], [29.0, 29.37], [32.0, 32.39], [37.0, 37.69], [44.0, 44.54], [46.0, 46.5], [50.0, 50.6], [51.0, 51.04], [53.0, 55.81], [58.0, 63.86], [68.0, 68.81], [78.0, 81.75], [88.0, 91.1], [99.0, 98.96]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.36, 35.23, 0.0, 35.1, 33.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 28.5], ["mains hum", 20.45], ["hum", 17.98]], [["hum", 30.36], ["mains hum", 17.2], ["music", 16.5]], null, [["hum", 23.61], ["mains hum", 20.47], ["music", 15.07]], [["music", 36.91], ["drum machine", 11.82], ["throbbing", 7.1]], null], "duration": [0.88, 0.33, 0.37, 0.39, 0.69, 0.54, 0.5, 0.6, 0.04, 2.81, 5.86, 0.81, 3.75, 3.1, -0.04]} \ No newline at end of file diff --git a/annotations_1/4CVFOnmW6v8_filtered.json b/annotations_1/4CVFOnmW6v8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28e2bf41891901670e7d42b93d14fe526e9613fc --- /dev/null +++ b/annotations_1/4CVFOnmW6v8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.38], [15.0, 14.88], [19.0, 21.41], [23.0, 25.25], [29.0, 30.97], [34.0, 35.36], [37.0, 39.33], [41.0, 42.62], [45.0, 48.76], [50.0, 51.06], [58.0, 58.85], [60.0, 60.24], [61.0, 61.74], [63.0, 64.42], [65.0, 67.51], [69.0, 79.42]], "keep_status": [true, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [30.41, 0.0, 31.67, 36.02, 0.0, 0.0, 33.53, 0.0, 30.45, 0.0, 0.0, 0.0, 0.0, 0.0, 35.51, 29.36], "audiomae_on_audioset": [[["music", 32.88], ["speech", 16.9], ["applause", 9.02]], null, [["speech", 23.28], ["crowd", 22.07], ["cheering", 11.48]], [["moo", 27.34], ["cattle, bovinae", 26.99], ["livestock, farm animals, working animals", 25.88]], null, null, [["livestock, farm animals, working animals", 42.68], ["cattle, bovinae", 31.47], ["moo", 22.94]], null, [["speech", 21.53], ["crowd", 14.9], ["applause", 9.37]], null, null, null, null, null, [["speech", 70.0], ["boing", 8.17], ["radio", 7.05]], [["speech", 37.86], ["music", 20.99], ["crowd", 4.79]]], "duration": [8.38, -0.12, 2.41, 2.25, 1.97, 1.36, 2.33, 1.62, 3.76, 1.06, 0.85, 0.24, 0.74, 1.42, 2.51, 10.42]} \ No newline at end of file diff --git a/annotations_1/4CmmKmlXD9I_filtered.json b/annotations_1/4CmmKmlXD9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd8f16911a8b48b792686abe1cc0beca122fd188 --- /dev/null +++ b/annotations_1/4CmmKmlXD9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[94.0, 102.95], [103.0, 103.03], [103.0, 103.06]], "keep_status": [true, false, false], "silence_prob": [32.26, 0.0, 0.0], "audiomae_on_audioset": [[["music", 55.66], ["theremin", 8.62], ["throbbing", 4.76]], null, null], "duration": [8.95, 0.03, 0.06]} \ No newline at end of file diff --git a/annotations_1/4Cw7JHJuTt8_filtered.json b/annotations_1/4Cw7JHJuTt8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/4Cw7JHJuTt8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/4DD8QRsms1s_filtered.json b/annotations_1/4DD8QRsms1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f58189acedaf165add334541561335aa15f97482 --- /dev/null +++ b/annotations_1/4DD8QRsms1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.16], [24.0, 24.44], [26.0, 26.55], [27.0, 27.36], [28.0, 30.3], [38.0, 38.01], [41.0, 49.52], [55.0, 55.81], [57.0, 57.06], [58.0, 65.62], [66.0, 66.6], [69.0, 82.51], [85.0, 85.67], [86.0, 106.29], [118.0, 118.57], [120.0, 120.88], [124.0, 132.16], [136.0, 142.35], [144.0, 145.96], [157.0, 162.65], [167.0, 171.48]], "keep_status": [true, false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [36.63, 0.0, 0.0, 0.0, 32.46, 0.0, 37.23, 0.0, 0.0, 29.99, 0.0, 34.43, 0.0, 30.68, 0.0, 0.0, 31.0, 32.9, 0.0, 31.27, 35.06], "audiomae_on_audioset": [[["speech", 10.32], ["grunt", 8.43], ["fly, housefly", 6.44]], null, null, null, [["speech", 20.12], ["wail, moan", 13.72], ["animal", 4.93]], null, [["whack, thwack", 39.09], ["speech", 26.83], ["noise", 9.25]], null, null, [["breaking", 44.05], ["speech", 16.95], ["grunt", 4.59]], null, [["speech", 71.06], ["whack, thwack", 5.32], ["thump, thud", 4.39]], null, [["speech", 55.75], ["whack, thwack", 6.53], ["groan", 6.5]], null, null, [["whack, thwack", 72.31], ["speech", 9.38], ["smash, crash", 6.73]], [["speech", 45.04], ["whack, thwack", 25.92], ["fart", 4.96]], null, [["breaking", 37.05], ["whack, thwack", 11.47], ["animal", 7.93]], [["speech", 51.2], ["grunt", 13.95], ["music", 10.81]]], "duration": [2.16, 0.44, 0.55, 0.36, 2.3, 0.01, 8.52, 0.81, 0.06, 7.62, 0.6, 13.51, 0.67, 20.29, 0.57, 0.88, 8.16, 6.35, 1.96, 5.65, 4.48]} \ No newline at end of file diff --git a/annotations_1/4DKTOdul0_I_filtered.json b/annotations_1/4DKTOdul0_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30bae778c4239ff525ebe720e3e54561848041c3 --- /dev/null +++ b/annotations_1/4DKTOdul0_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.12], [13.0, 27.5], [29.0, 29.83], [30.0, 31.75], [33.0, 33.47], [34.0, 34.52], [35.0, 35.23], [35.0, 39.41], [40.0, 41.25], [45.0, 48.56], [49.0, 51.24], [53.0, 55.11], [57.0, 58.01], [59.0, 59.81], [62.0, 64.1], [66.0, 72.99], [74.0, 75.63], [77.0, 83.56], [85.0, 86.02], [88.0, 89.19], [93.0, 93.63], [95.0, 96.4], [99.0, 100.13], [101.0, 102.1], [103.0, 102.86], [104.0, 105.09], [106.0, 122.94], [132.0, 132.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.39, 51.82, 0.0, 0.0, 0.0, 0.0, 0.0, 72.31, 0.0, 78.21, 72.75, 47.08, 0.0, 0.0, 52.68, 60.51, 0.0, 60.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 26.09], ["music", 12.35], ["hum", 10.52]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.12, 14.5, 0.83, 1.75, 0.47, 0.52, 0.23, 4.41, 1.25, 3.56, 2.24, 2.11, 1.01, 0.81, 2.1, 6.99, 1.63, 6.56, 1.02, 1.19, 0.63, 1.4, 1.13, 1.1, -0.14, 1.09, 16.94, 0.33]} \ No newline at end of file diff --git a/annotations_1/4E55_uKSR40_filtered.json b/annotations_1/4E55_uKSR40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d253c1645c6588a7a5e9716536c6ef72e517199 --- /dev/null +++ b/annotations_1/4E55_uKSR40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.21], [7.0, 7.11], [8.0, 8.77], [10.0, 10.18], [17.0, 21.36], [22.0, 23.43], [24.0, 25.74], [27.0, 28.61], [30.0, 30.54], [32.0, 32.1], [34.0, 34.8], [36.0, 36.66], [38.0, 39.78], [40.0, 48.98], [50.0, 52.12], [53.0, 53.82], [54.0, 54.7], [56.0, 59.37], [60.0, 69.23], [70.0, 93.66], [95.0, 95.69], [100.0, 100.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 41.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.09, 88.28, 0.0, 0.0, 62.58, 46.26, 43.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 63.42], ["foghorn", 7.49], ["scary music", 4.78]], null, null, null, null, null, null, null, null, [["fart", 73.51], ["music", 1.81], ["speech", 1.67]], null, null, null, null, [["speech", 68.74], ["radio", 4.9], ["telephone", 3.79]], [["speech", 50.32], ["fart", 7.88], ["livestock, farm animals, working animals", 3.54]], null, null], "duration": [1.21, 0.11, 0.77, 0.18, 4.36, 1.43, 1.74, 1.61, 0.54, 0.1, 0.8, 0.66, 1.78, 8.98, 2.12, 0.82, 0.7, 3.37, 9.23, 23.66, 0.69, 0.79]} \ No newline at end of file diff --git a/annotations_1/4EF1zYFHbus_filtered.json b/annotations_1/4EF1zYFHbus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f216c9ec0638f71af3088ff374aa5d9cd88398d --- /dev/null +++ b/annotations_1/4EF1zYFHbus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.1], [28.0, 28.86], [33.0, 34.96], [36.0, 36.44], [47.0, 46.74], [53.0, 52.98], [60.0, 60.76], [75.0, 76.38], [83.0, 85.43], [96.0, 96.38], [115.0, 116.21], [133.0, 132.63], [152.0, 158.14], [159.0, 161.45], [164.0, 164.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.58, 0.0, 0.0, 0.0, 35.82, 39.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 76.43], ["radio", 8.13], ["whale vocalization", 1.12]], null, null, null, [["music", 62.35], ["chorus effect", 6.06], ["musical instrument", 5.46]], [["music", 41.53], ["musical instrument", 5.28], ["alarm", 4.28]], null], "duration": [1.1, 0.86, 1.96, 0.44, -0.26, -0.02, 0.76, 1.38, 2.43, 0.38, 1.21, -0.37, 6.14, 2.45, 0.71]} \ No newline at end of file diff --git a/annotations_1/4EWgdeVQzEk_filtered.json b/annotations_1/4EWgdeVQzEk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f44c5956b83f5eeab22e9a9bb4a325ca0ce8322c --- /dev/null +++ b/annotations_1/4EWgdeVQzEk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 41.45], [42.0, 66.66], [67.0, 90.98], [91.0, 91.02], [92.0, 100.28], [102.0, 127.33], [128.0, 154.36]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [0.0, 42.17, 37.1, 0.0, 70.86, 46.75, 31.07], "audiomae_on_audioset": [null, [["music", 31.7], ["whale vocalization", 13.85], ["sonar", 11.35]], [["music", 59.35], ["theremin", 7.16], ["ambient music", 4.13]], null, null, [["music", 58.3], ["singing bowl", 12.04], ["musical instrument", 5.23]], [["music", 47.0], ["sidetone", 37.78], ["speech", 1.85]]], "duration": [35.45, 24.66, 23.98, 0.02, 8.28, 25.33, 26.36]} \ No newline at end of file diff --git a/annotations_1/4F5AGPMRwgw_filtered.json b/annotations_1/4F5AGPMRwgw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..619982fbdd98789868ec556d4963290c3a26540f --- /dev/null +++ b/annotations_1/4F5AGPMRwgw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.02], [10.0, 10.2], [12.0, 12.83], [14.0, 14.62], [16.0, 16.98], [18.0, 20.33], [26.0, 30.25], [32.0, 32.8], [34.0, 36.46], [39.0, 40.78], [47.0, 64.45], [67.0, 72.82], [74.0, 84.87], [88.0, 90.85], [92.0, 93.12], [98.0, 98.73], [109.0, 109.95], [114.0, 115.53], [116.0, 120.19], [124.0, 146.99], [149.0, 152.44], [153.0, 153.94], [155.0, 156.64], [162.0, 163.31], [164.0, 169.21], [170.0, 171.78], [173.0, 173.38], [181.0, 181.2], [183.0, 185.35]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 93.29, 33.89, 0.0, 39.69, 0.0, 58.3, 42.91, 47.66, 62.58, 0.0, 0.0, 0.0, 0.0, 45.49, 47.27, 46.5, 0.0, 0.0, 0.0, 46.9, 0.0, 0.0, 0.0, 62.37], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 40.6], ["fart", 15.35], ["vehicle", 5.12]], null, [["music", 32.13], ["sonar", 17.88], ["hum", 16.8]], null, null, [["music", 31.92], ["singing bowl", 21.15], ["hum", 6.39]], [["music", 33.55], ["hum", 16.09], ["musical instrument", 7.32]], null, null, null, null, null, [["speech", 64.63], ["music", 15.14], ["livestock, farm animals, working animals", 2.33]], [["music", 46.9], ["hum", 10.7], ["musical instrument", 4.42]], [["sidetone", 78.63], ["speech", 13.69], ["telephone", 3.08]], null, null, null, [["sidetone", 56.74], ["speech", 27.32], ["music", 3.5]], null, null, null, null], "duration": [1.02, 0.2, 0.83, 0.62, 0.98, 2.33, 4.25, 0.8, 2.46, 1.78, 17.45, 5.82, 10.87, 2.85, 1.12, 0.73, 0.95, 1.53, 4.19, 22.99, 3.44, 0.94, 1.64, 1.31, 5.21, 1.78, 0.38, 0.2, 2.35]} \ No newline at end of file diff --git a/annotations_1/4F_jLtYFT6Y_filtered.json b/annotations_1/4F_jLtYFT6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b586d297a388611d2b5ee33ec5f1385cbaa230b0 --- /dev/null +++ b/annotations_1/4F_jLtYFT6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.82], [10.0, 18.98], [21.0, 21.44], [23.0, 31.72], [35.0, 47.75], [49.0, 50.03], [51.0, 50.84], [54.0, 55.24], [61.0, 61.3], [64.0, 63.88], [64.0, 77.67], [85.0, 90.91], [92.0, 111.92], [114.0, 114.67], [116.0, 117.09]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [29.62, 29.55, 0.0, 29.33, 29.78, 0.0, 0.0, 0.0, 0.0, 0.0, 29.88, 32.15, 30.74, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 74.53], ["music", 9.56], ["electronic music", 0.98]], [["speech", 29.09], ["music", 19.91], ["breaking", 15.59]], null, [["hum", 30.59], ["mains hum", 17.24], ["speech", 14.95]], [["speech", 53.67], ["music", 14.61], ["hum", 4.47]], null, null, null, null, null, [["speech", 78.22], ["vehicle", 3.47], ["electric shaver, electric razor", 1.86]], [["speech", 77.36], ["music", 2.34], ["beatboxing", 2.05]], [["speech", 22.16], ["fart", 10.09], ["whale vocalization", 9.1]], null, null], "duration": [5.82, 8.98, 0.44, 8.72, 12.75, 1.03, -0.16, 1.24, 0.3, -0.12, 13.67, 5.91, 19.92, 0.67, 1.09]} \ No newline at end of file diff --git a/annotations_1/4Fa5YPKxwRU_filtered.json b/annotations_1/4Fa5YPKxwRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce2b4267955c37f1f3d6a0ae4f9aab9b1ab88ba0 --- /dev/null +++ b/annotations_1/4Fa5YPKxwRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.29], [26.0, 30.81], [32.0, 33.76], [43.0, 43.48], [47.0, 47.55], [59.0, 59.93], [65.0, 65.79], [68.0, 69.89], [74.0, 78.61], [80.0, 81.31], [83.0, 84.47], [86.0, 98.63], [100.0, 100.9], [102.0, 103.13], [105.0, 106.56], [117.0, 117.78], [121.0, 126.79], [129.0, 131.26], [134.0, 133.93], [136.0, 137.07], [146.0, 146.89], [152.0, 153.23], [156.0, 160.42], [172.0, 172.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.0, 0.0, 0.0, 33.73, 0.0, 0.0, 0.0, 0.0, 34.61, 81.71, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 42.71], ["speech", 24.98], ["synthesizer", 13.13]], null, null, [["music", 20.07], ["insect", 13.36], ["hum", 12.3]], null, null, null, null, [["speech", 69.88], ["music", 17.07], ["guitar", 1.85]], null, null, null, null, null, null, null], "duration": [0.29, 4.81, 1.76, 0.48, 0.55, 0.93, 0.79, 1.89, 4.61, 1.31, 1.47, 12.63, 0.9, 1.13, 1.56, 0.78, 5.79, 2.26, -0.07, 1.07, 0.89, 1.23, 4.42, 0.5]} \ No newline at end of file diff --git a/annotations_1/4FkUmPvbDQs_filtered.json b/annotations_1/4FkUmPvbDQs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bbf46cbb7742c6494d22d71768022a5d79b2e3a --- /dev/null +++ b/annotations_1/4FkUmPvbDQs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 9.53], [11.0, 14.57], [16.0, 17.61], [19.0, 23.46], [24.0, 45.91], [46.0, 50.01], [52.0, 54.33], [58.0, 58.36], [63.0, 63.12], [64.0, 70.26], [72.0, 77.65], [79.0, 86.07], [87.0, 96.06], [114.0, 115.38], [117.0, 118.4], [126.0, 127.35], [129.0, 130.62], [132.0, 133.73], [134.0, 134.96], [135.0, 135.92], [145.0, 154.01], [155.0, 159.83], [161.0, 160.84], [161.0, 165.18], [168.0, 169.82], [172.0, 173.67], [175.0, 177.89], [179.0, 184.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [71.29, 72.16, 0.0, 92.8, 58.38, 64.52, 93.13, 0.0, 0.0, 48.95, 87.74, 65.55, 43.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.38, 60.23, 0.0, 39.31, 0.0, 0.0, 63.31, 51.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 64.62], ["sidetone", 19.47], ["hum", 3.71]], null, null, [["gong", 29.22], ["music", 16.62], ["speech", 7.85]], null, null, null, null, null, null, null, null, null, null, [["speech", 55.37], ["music", 18.24], ["ambient music", 3.72]], null, null, null, null], "duration": [9.53, 3.57, 1.61, 4.46, 21.91, 4.01, 2.33, 0.36, 0.12, 6.26, 5.65, 7.07, 9.06, 1.38, 1.4, 1.35, 1.62, 1.73, 0.96, 0.92, 9.01, 4.83, -0.16, 4.18, 1.82, 1.67, 2.89, 5.82]} \ No newline at end of file diff --git a/annotations_1/4FppyDurg7c_filtered.json b/annotations_1/4FppyDurg7c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f967311e1adfb843221fd04cc8b35de2d3be938 --- /dev/null +++ b/annotations_1/4FppyDurg7c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 45.33], [51.0, 53.3], [58.0, 60.35], [62.0, 63.69], [65.0, 82.38], [83.0, 102.93], [103.0, 105.71], [106.0, 136.98], [137.0, 137.02], [137.0, 145.05], [151.0, 152.54], [154.0, 154.41], [155.0, 156.05], [157.0, 159.11], [160.0, 160.81], [162.0, 162.35], [171.0, 171.44], [176.0, 176.35], [178.0, 177.79], [180.0, 180.37], [181.0, 184.13], [190.0, 191.54]], "keep_status": [true, true, true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.12, 30.18, 30.85, 0.0, 30.04, 33.06, 38.64, 0.0, 0.0, 37.64, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.36, 0.0], "audiomae_on_audioset": [[["music", 39.83], ["throbbing", 14.22], ["speech", 13.66]], [["hum", 18.34], ["noise", 18.05], ["throbbing", 13.76]], [["hum", 30.91], ["throbbing", 24.65], ["mains hum", 13.12]], null, [["throbbing", 58.09], ["hum", 23.3], ["music", 8.06]], [["hum", 47.0], ["mains hum", 26.33], ["music", 7.38]], [["groan", 48.82], ["grunt", 9.8], ["whimper", 8.8]], null, null, [["speech", 22.31], ["groan", 9.83], ["outside, rural or natural", 8.41]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.33, 2.3, 2.35, 1.69, 17.38, 19.93, 2.71, 30.98, 0.02, 8.05, 1.54, 0.41, 1.05, 2.11, 0.81, 0.35, 0.44, 0.35, -0.21, 0.37, 3.13, 1.54]} \ No newline at end of file diff --git a/annotations_1/4G6VXPkfDvo_filtered.json b/annotations_1/4G6VXPkfDvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6289862889937a5448002cabe4952ca8b973ea6d --- /dev/null +++ b/annotations_1/4G6VXPkfDvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.41], [8.0, 7.91], [12.0, 11.96], [19.0, 20.75], [29.0, 28.76], [34.0, 37.61], [38.0, 40.51], [47.0, 49.42], [50.0, 51.29], [52.0, 52.37], [54.0, 53.87], [56.0, 56.17], [67.0, 66.97], [68.0, 68.34], [70.0, 70.21], [72.0, 72.0], [77.0, 77.33], [77.0, 78.54], [79.0, 81.38], [82.0, 82.83], [85.0, 88.52], [89.0, 90.02], [91.0, 90.93], [91.0, 91.88], [92.0, 92.99], [100.0, 100.47], [101.0, 101.49], [102.0, 102.51], [111.0, 111.96], [117.0, 119.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 72.6, 65.91, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.02, 0.0, 72.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 64.43], ["buzz", 8.8], ["electric shaver, electric razor", 4.36]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, -0.09, -0.04, 1.75, -0.24, 3.61, 2.51, 2.42, 1.29, 0.37, -0.13, 0.17, -0.03, 0.34, 0.21, 0.0, 0.33, 1.54, 2.38, 0.83, 3.52, 1.02, -0.07, 0.88, 0.99, 0.47, 0.49, 0.51, 0.96, 2.43]} \ No newline at end of file diff --git a/annotations_1/4GRGY20zWkU_filtered.json b/annotations_1/4GRGY20zWkU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c124e3017d26c9fd92652861df5d9ae138cb1943 --- /dev/null +++ b/annotations_1/4GRGY20zWkU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.47], [9.0, 10.96], [12.0, 12.85], [15.0, 17.9], [19.0, 19.01], [21.0, 21.71], [22.0, 27.77], [34.0, 37.44], [39.0, 43.87], [44.0, 45.69], [47.0, 47.43], [48.0, 49.35], [53.0, 54.89], [57.0, 57.86], [58.0, 67.69], [70.0, 71.02], [74.0, 77.36], [81.0, 94.46], [99.0, 101.07], [111.0, 111.65], [115.0, 115.57], [116.0, 116.31], [118.0, 118.86], [121.0, 123.43], [131.0, 131.11], [134.0, 134.69], [136.0, 136.26], [147.0, 146.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 96.77, 84.43, 61.08, 0.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 35.29, 34.35, 93.13, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 10.52], ["livestock, farm animals, working animals", 9.69], ["groan", 9.1]], null, [["cattle, bovinae", 34.39], ["moo", 24.93], ["livestock, farm animals, working animals", 16.76]], [["speech", 30.63], ["ding", 10.53], ["car", 10.01]], null, null, null, null, null, null, null, null, null, null], "duration": [1.47, 1.96, 0.85, 2.9, 0.01, 0.71, 5.77, 3.44, 4.87, 1.69, 0.43, 1.35, 1.89, 0.86, 9.69, 1.02, 3.36, 13.46, 2.07, 0.65, 0.57, 0.31, 0.86, 2.43, 0.11, 0.69, 0.26, -0.35]} \ No newline at end of file diff --git a/annotations_1/4GlXOOYL_5I_filtered.json b/annotations_1/4GlXOOYL_5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0779c877098ab2e0ed0f9eae89ada0e5876d18b6 --- /dev/null +++ b/annotations_1/4GlXOOYL_5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 36.56], [38.0, 168.96], [170.0, 172.35]], "keep_status": [true, false, false], "silence_prob": [32.52, 0.0, 58.72], "audiomae_on_audioset": [[["music", 34.98], ["hum", 11.24], ["noise", 7.49]], null, null], "duration": [25.56, 130.96, 2.35]} \ No newline at end of file diff --git a/annotations_1/4Gs6pBwn5w8_filtered.json b/annotations_1/4Gs6pBwn5w8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6417ffeed04e178bd3205f623ffff544d27f0d9d --- /dev/null +++ b/annotations_1/4Gs6pBwn5w8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.77], [17.0, 19.25], [22.0, 27.92], [33.0, 33.94], [38.0, 40.12], [48.0, 49.11], [54.0, 54.5], [56.0, 56.64], [59.0, 66.18], [67.0, 68.37], [69.0, 70.9], [75.0, 78.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.96, 47.86, 56.7, 0.0, 56.1, 0.0, 0.0, 0.0, 55.6, 0.0, 0.0, 54.1], "audiomae_on_audioset": [null, [["speech", 48.58], ["rumble", 15.41], ["vehicle", 8.88]], null, null, null, null, null, null, null, null, null, null], "duration": [4.77, 2.25, 5.92, 0.94, 2.12, 1.11, 0.5, 0.64, 7.18, 1.37, 1.9, 3.09]} \ No newline at end of file diff --git a/annotations_1/4HB9b-ttI3I_filtered.json b/annotations_1/4HB9b-ttI3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a994c9d46fd35b4489dea3e29022b85ff3c8102 --- /dev/null +++ b/annotations_1/4HB9b-ttI3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.25], [3.0, 3.79], [6.0, 8.97], [10.0, 9.81], [12.0, 11.72], [12.0, 16.93], [20.0, 21.95], [23.0, 23.73], [24.0, 26.1], [27.0, 27.73], [30.0, 30.67], [37.0, 37.69], [40.0, 40.58], [42.0, 42.63], [44.0, 44.79], [49.0, 49.15], [49.0, 50.43], [52.0, 52.52], [63.0, 63.15], [64.0, 64.99], [74.0, 74.51], [77.0, 77.68], [81.0, 81.41], [85.0, 85.78], [86.0, 93.31], [98.0, 98.31], [102.0, 101.88], [103.0, 104.26], [106.0, 107.43], [112.0, 111.79], [114.0, 115.84], [121.0, 121.12], [122.0, 122.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 83.88, 0.0, 0.0, 99.99, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.25, 0.79, 2.97, -0.19, -0.28, 4.93, 1.95, 0.73, 2.1, 0.73, 0.67, 0.69, 0.58, 0.63, 0.79, 0.15, 1.43, 0.52, 0.15, 0.99, 0.51, 0.68, 0.41, 0.78, 7.31, 0.31, -0.12, 1.26, 1.43, -0.21, 1.84, 0.12, 0.99]} \ No newline at end of file diff --git a/annotations_1/4HOgujwklBY_filtered.json b/annotations_1/4HOgujwklBY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44e0bc1e82f3c453a294fffc57b9874f21cd1d1a --- /dev/null +++ b/annotations_1/4HOgujwklBY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.62], [5.0, 9.49], [11.0, 13.14], [14.0, 16.29], [16.0, 18.4], [19.0, 21.95], [22.0, 30.87], [34.0, 34.01], [38.0, 38.23], [39.0, 39.41], [39.0, 39.46], [41.0, 72.93], [73.0, 74.65], [76.0, 76.76], [78.0, 79.61], [82.0, 98.74], [101.0, 100.95], [103.0, 104.58], [107.0, 107.86], [108.0, 134.05], [135.0, 142.86], [144.0, 145.47], [146.0, 151.5], [154.0, 154.21], [157.0, 158.75]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 39.35, 39.8, 39.19, 35.85, 32.06, 31.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.35, 0.0, 0.0, 0.0, 31.4, 31.28, 0.0, 31.42, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 56.93], ["throbbing", 12.88], ["hum", 4.15]], [["music", 54.46], ["throbbing", 17.02], ["hum", 8.78]], [["music", 51.6], ["mains hum", 6.4], ["hum", 6.3]], [["music", 68.31], ["hum", 5.52], ["mains hum", 4.69]], [["music", 69.04], ["explosion", 2.97], ["burst, pop", 2.13]], [["music", 43.55], ["hum", 15.87], ["throbbing", 12.94]], null, null, null, null, null, null, null, null, [["music", 32.1], ["throbbing", 17.65], ["whack, thwack", 9.02]], null, null, null, [["music", 66.98], ["speech", 4.8], ["electronic music", 2.36]], [["speech", 35.83], ["music", 15.53], ["hum", 6.45]], null, [["speech", 36.95], ["music", 28.06], ["electric shaver, electric razor", 4.94]], null, null], "duration": [1.62, 4.49, 2.14, 2.29, 2.4, 2.95, 8.87, 0.01, 0.23, 0.41, 0.46, 31.93, 1.65, 0.76, 1.61, 16.74, -0.05, 1.58, 0.86, 26.05, 7.86, 1.47, 5.5, 0.21, 1.75]} \ No newline at end of file diff --git a/annotations_1/4I9-0dipqo0_filtered.json b/annotations_1/4I9-0dipqo0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..069d4b38fb57a01132061677a8f93962f5ff22e8 --- /dev/null +++ b/annotations_1/4I9-0dipqo0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.77], [5.0, 5.36], [7.0, 7.91], [12.0, 13.47], [15.0, 15.63], [21.0, 21.63], [22.0, 23.6], [32.0, 32.17], [34.0, 35.06], [36.0, 37.02], [39.0, 39.12], [43.0, 43.48], [48.0, 48.25], [49.0, 50.55], [52.0, 52.29], [54.0, 55.29], [61.0, 63.12], [64.0, 64.59], [71.0, 77.33], [103.0, 103.89], [105.0, 104.97], [110.0, 111.47], [114.0, 114.57], [121.0, 121.29], [125.0, 125.71], [131.0, 132.39], [134.0, 135.11], [138.0, 138.15], [141.0, 141.81], [143.0, 144.27], [146.0, 147.28], [149.0, 149.74], [153.0, 162.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.77, 0.36, 0.91, 1.47, 0.63, 0.63, 1.6, 0.17, 1.06, 1.02, 0.12, 0.48, 0.25, 1.55, 0.29, 1.29, 2.12, 0.59, 6.33, 0.89, -0.03, 1.47, 0.57, 0.29, 0.71, 1.39, 1.11, 0.15, 0.81, 1.27, 1.28, 0.74, 9.9]} \ No newline at end of file diff --git a/annotations_1/4IHDSpacpbc_filtered.json b/annotations_1/4IHDSpacpbc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..585e084d04ee62aa86ef8b96577a62dbecdca163 --- /dev/null +++ b/annotations_1/4IHDSpacpbc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 40.95], [42.0, 57.92], [64.0, 65.52], [74.0, 77.82], [79.0, 81.21], [86.0, 96.42], [99.0, 137.12], [140.0, 223.45]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [30.07, 41.32, 0.0, 79.94, 92.31, 79.41, 0.0, 0.0], "audiomae_on_audioset": [[["music", 50.68], ["throbbing", 20.72], ["hum", 7.12]], [["music", 30.67], ["whale vocalization", 20.01], ["theremin", 15.71]], null, null, null, null, null, null], "duration": [29.95, 15.92, 1.52, 3.82, 2.21, 10.42, 38.12, 83.45]} \ No newline at end of file diff --git a/annotations_1/4IbNz68R49c_filtered.json b/annotations_1/4IbNz68R49c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec84edbc0d417a34be48e4d1ba6dfde778668a4c --- /dev/null +++ b/annotations_1/4IbNz68R49c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.94], [18.0, 18.71], [20.0, 19.68], [20.0, 37.61], [40.0, 69.84], [71.0, 83.51], [85.0, 88.4], [89.0, 88.99], [90.0, 97.06], [98.0, 98.88], [101.0, 101.9], [104.0, 106.59], [108.0, 109.7]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.26, 31.28, 31.98, 31.85, 0.0, 36.76, 0.0, 0.0, 85.9, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 29.0], ["speech", 20.08], ["throbbing", 18.78]], [["music", 66.87], ["fart", 5.78], ["speech", 4.69]], [["music", 41.61], ["groan", 13.56], ["whack, thwack", 11.41]], [["music", 56.33], ["didgeridoo", 19.59], ["throbbing", 6.01]], null, [["music", 68.02], ["speech", 13.59], ["hum", 4.07]], null, null, null, null], "duration": [0.94, 0.71, -0.32, 17.61, 29.84, 12.51, 3.4, -0.01, 7.06, 0.88, 0.9, 2.59, 1.7]} \ No newline at end of file diff --git a/annotations_1/4InwO1SSp5o_filtered.json b/annotations_1/4InwO1SSp5o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6cbd566bee6a80a1ae6140ec0ffa6503b649c6c --- /dev/null +++ b/annotations_1/4InwO1SSp5o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.52], [5.0, 6.76], [10.0, 10.71], [16.0, 17.41], [21.0, 22.84], [26.0, 28.49], [30.0, 30.27], [34.0, 35.09], [37.0, 37.13], [39.0, 42.47], [43.0, 45.94], [47.0, 49.64], [51.0, 51.61], [53.0, 55.36], [57.0, 59.93], [62.0, 61.94], [63.0, 74.33], [77.0, 78.27], [93.0, 92.55], [93.0, 94.83], [97.0, 96.97], [99.0, 99.35], [100.0, 101.14], [102.0, 103.13], [109.0, 110.57], [115.0, 128.65], [134.0, 136.07], [138.0, 139.35], [140.0, 141.56], [142.0, 167.63]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 42.46, 0.0, 0.0, 0.0, 43.13, 67.13, 32.58, 0.0, 63.85, 46.15, 0.0, 42.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.53, 56.48, 0.0, 0.0, 40.79], "audiomae_on_audioset": [null, null, null, null, null, [["music", 25.81], ["mains hum", 12.48], ["hum", 8.97]], null, null, null, [["speech", 41.66], ["music", 10.61], ["musical instrument", 2.09]], null, [["music", 19.5], ["cattle, bovinae", 14.19], ["moo", 13.39]], null, null, [["music", 53.98], ["didgeridoo", 15.3], ["cacophony", 3.27]], null, [["music", 52.78], ["speech", 8.11], ["hum", 4.17]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.79], ["throbbing", 6.52], ["frog", 5.38]]], "duration": [1.52, 1.76, 0.71, 1.41, 1.84, 2.49, 0.27, 1.09, 0.13, 3.47, 2.94, 2.64, 0.61, 2.36, 2.93, -0.06, 11.33, 1.27, -0.45, 1.83, -0.03, 0.35, 1.14, 1.13, 1.57, 13.65, 2.07, 1.35, 1.56, 25.63]} \ No newline at end of file diff --git a/annotations_1/4IsISIQpKTc_filtered.json b/annotations_1/4IsISIQpKTc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1244f0645ae243772d07f571855d21a7b90b4591 --- /dev/null +++ b/annotations_1/4IsISIQpKTc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 36.85], [39.0, 43.93], [46.0, 62.19], [63.0, 80.13], [82.0, 100.99]], "keep_status": [false, true, true, true, false], "silence_prob": [0.0, 30.28, 30.12, 28.55, 28.49], "audiomae_on_audioset": [null, [["hum", 22.15], ["mains hum", 20.2], ["music", 18.22]], [["hum", 12.83], ["whale vocalization", 10.88], ["animal", 10.35]], [["speech", 46.42], ["groan", 9.78], ["buzz", 5.87]], [["music", 67.52], ["cacophony", 7.06], ["electronic music", 3.62]]], "duration": [31.85, 4.93, 16.19, 17.13, 18.99]} \ No newline at end of file diff --git a/annotations_1/4JE04So6OqU_filtered.json b/annotations_1/4JE04So6OqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3043f6dd4d25f69d7756dfb29b7d95b66791e3b --- /dev/null +++ b/annotations_1/4JE04So6OqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 18.47], [23.0, 59.43], [60.0, 71.85], [78.0, 89.73], [91.0, 93.31], [97.0, 98.69], [101.0, 102.93], [104.0, 103.94], [106.0, 108.72], [109.0, 110.47], [112.0, 151.8], [152.0, 151.85]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [28.87, 0.0, 31.12, 30.43, 31.91, 0.0, 0.0, 0.0, 33.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 59.12], ["hum", 6.06], ["throbbing", 4.76]], null, [["music", 42.94], ["throbbing", 24.6], ["hum", 14.66]], [["music", 77.64], ["hum", 5.43], ["throbbing", 4.81]], [["throbbing", 23.05], ["speech", 21.8], ["hum", 21.08]], null, null, null, [["throbbing", 47.36], ["music", 23.43], ["hum", 15.79]], null, null, null], "duration": [17.47, 36.43, 11.85, 11.73, 2.31, 1.69, 1.93, -0.06, 2.72, 1.47, 39.8, -0.15]} \ No newline at end of file diff --git a/annotations_1/4JtubCgodCE_filtered.json b/annotations_1/4JtubCgodCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce4647d344fe2bcd370830c25eb4cc25f8a70355 --- /dev/null +++ b/annotations_1/4JtubCgodCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.96], [6.0, 6.42], [14.0, 14.61], [16.0, 16.7], [18.0, 18.01], [20.0, 20.17], [22.0, 23.16], [26.0, 25.98], [30.0, 32.46], [33.0, 33.81], [36.0, 37.17], [38.0, 44.25], [50.0, 52.66], [55.0, 57.92], [59.0, 66.33], [72.0, 78.34], [80.0, 79.98], [81.0, 83.59], [85.0, 85.53], [86.0, 86.73], [88.0, 88.21], [89.0, 93.38], [98.0, 107.52], [108.0, 108.68]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.61, 0.0, 0.0, 36.44, 69.07, 35.61, 35.6, 43.05, 0.0, 83.34, 0.0, 0.0, 0.0, 38.11, 38.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 51.75], ["music", 13.02], ["animal", 1.94]], null, null, [["music", 38.76], ["speech", 37.85], ["hum", 4.05]], null, [["music", 75.02], ["electronic music", 2.28], ["whack, thwack", 1.37]], [["music", 51.57], ["speech", 43.66], ["thunk", 0.69]], [["music", 74.09], ["speech", 3.33], ["boing", 2.06]], null, null, null, null, null, [["music", 66.38], ["thunk", 6.05], ["arrow", 5.85]], [["music", 35.4], ["speech", 34.07], ["boing", 7.14]], null], "duration": [0.96, 0.42, 0.61, 0.7, 0.01, 0.17, 1.16, -0.02, 2.46, 0.81, 1.17, 6.25, 2.66, 2.92, 7.33, 6.34, -0.02, 2.59, 0.53, 0.73, 0.21, 4.38, 9.52, 0.68]} \ No newline at end of file diff --git a/annotations_1/4KICpbB5YQY_filtered.json b/annotations_1/4KICpbB5YQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d484499acb014bd0ee97d0f55cb44288936e119 --- /dev/null +++ b/annotations_1/4KICpbB5YQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.75], [5.0, 6.51], [8.0, 7.89], [11.0, 14.15], [15.0, 16.31], [17.0, 18.6], [21.0, 21.15], [23.0, 25.49], [26.0, 28.12], [30.0, 33.03], [35.0, 35.14], [36.0, 38.5], [41.0, 51.87], [54.0, 55.97], [57.0, 59.39], [64.0, 66.48], [68.0, 69.92], [71.0, 73.31], [79.0, 83.39], [89.0, 91.71], [93.0, 96.99], [98.0, 99.06], [100.0, 101.68], [103.0, 105.8], [107.0, 109.36], [110.0, 124.83], [126.0, 127.8], [130.0, 145.96], [147.0, 148.49], [150.0, 149.86], [150.0, 174.7]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 92.97, 39.46, 63.31, 0.0, 78.21, 63.31, 0.0, 36.21, 82.79, 0.0, 91.13, 60.7, 43.85, 54.83, 0.0, 0.0, 34.51, 31.2, 29.14, 0.0, 28.38, 0.0, 0.0, 28.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 28.08], ["speech", 19.25], ["mains hum", 14.42]], null, null, null, null, null, [["speech", 54.76], ["hum", 7.95], ["rumble", 5.97]], null, null, null, null, [["mains hum", 30.99], ["hum", 27.56], ["speech", 14.9]], null, null, null, [["hum", 18.4], ["mains hum", 18.17], ["music", 14.52]], [["music", 35.09], ["scary music", 11.06], ["vehicle", 4.41]], [["music", 42.26], ["hum", 19.14], ["mains hum", 11.88]], null, [["music", 47.7], ["mains hum", 16.09], ["hum", 14.57]], null, null, [["music", 77.85], ["cacophony", 4.28], ["musical instrument", 2.29]]], "duration": [0.75, 1.51, -0.11, 3.15, 1.31, 1.6, 0.15, 2.49, 2.12, 3.03, 0.14, 2.5, 10.87, 1.97, 2.39, 2.48, 1.92, 2.31, 4.39, 2.71, 3.99, 1.06, 1.68, 2.8, 2.36, 14.83, 1.8, 15.96, 1.49, -0.14, 24.7]} \ No newline at end of file diff --git a/annotations_1/4KkCEjawUHM_filtered.json b/annotations_1/4KkCEjawUHM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5a6dd0d956bddcce98d6e4f21fba33754424217 --- /dev/null +++ b/annotations_1/4KkCEjawUHM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.88], [8.0, 17.91], [21.0, 21.64], [25.0, 27.77], [30.0, 30.72], [38.0, 49.72], [53.0, 57.77], [58.0, 115.5], [117.0, 130.99], [135.0, 169.53], [174.0, 174.11], [179.0, 180.76]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 31.78, 0.0, 47.78, 0.0, 30.19, 31.16, 0.0, 30.74, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 61.93], ["didgeridoo", 16.83], ["throbbing", 6.06]], null, [["music", 57.46], ["throbbing", 19.6], ["hum", 9.52]], null, [["music", 41.92], ["cacophony", 13.88], ["mains hum", 9.68]], [["music", 35.94], ["throbbing", 25.65], ["hum", 18.98]], null, [["music", 47.23], ["noise", 9.8], ["synthesizer", 7.36]], null, null, null], "duration": [-0.12, 9.91, 0.64, 2.77, 0.72, 11.72, 4.77, 57.5, 13.99, 34.53, 0.11, 1.76]} \ No newline at end of file diff --git a/annotations_1/4LvvutsvgrE_filtered.json b/annotations_1/4LvvutsvgrE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24ca63b2fc06f13a6d5a508b476e4d718f3ac693 --- /dev/null +++ b/annotations_1/4LvvutsvgrE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.5], [9.0, 10.18], [11.0, 12.39], [13.0, 15.03], [16.0, 17.69], [18.0, 19.03], [21.0, 22.49], [29.0, 44.78], [45.0, 45.91], [47.0, 51.53], [66.0, 71.42], [72.0, 73.08], [83.0, 83.44], [84.0, 93.87], [100.0, 99.79], [104.0, 105.51], [111.0, 114.24], [115.0, 115.37], [117.0, 122.18], [134.0, 135.06], [143.0, 143.77]], "keep_status": [false, false, false, true, false, false, false, true, false, true, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.44, 0.0, 0.0, 0.0, 30.13, 0.0, 30.29, 44.07, 0.0, 0.0, 40.31, 0.0, 0.0, 54.97, 0.0, 39.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 30.91], ["mains hum", 22.84], ["sidetone", 11.12]], null, null, null, [["music", 28.16], ["hum", 18.42], ["noise", 11.7]], null, [["music", 18.38], ["speech", 8.21], ["electric shaver, electric razor", 6.63]], [["hum", 14.05], ["speech", 12.78], ["music", 10.88]], null, null, [["bee, wasp, etc.", 21.91], ["music", 19.9], ["fly, housefly", 16.2]], null, null, null, null, [["music", 45.87], ["didgeridoo", 39.37], ["musical instrument", 1.8]], null, null], "duration": [1.5, 1.18, 1.39, 2.03, 1.69, 1.03, 1.49, 15.78, 0.91, 4.53, 5.42, 1.08, 0.44, 9.87, -0.21, 1.51, 3.24, 0.37, 5.18, 1.06, 0.77]} \ No newline at end of file diff --git a/annotations_1/4MbRVVP6rPg_filtered.json b/annotations_1/4MbRVVP6rPg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e250772d085af090e2fbbaf9af59466a8b39d214 --- /dev/null +++ b/annotations_1/4MbRVVP6rPg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 1.11], [2.0, 5.98], [10.0, 10.62], [12.0, 16.73], [17.0, 16.77], [17.0, 16.8], [17.0, 17.69], [28.0, 29.13], [38.0, 37.81], [46.0, 45.72], [51.0, 51.63], [52.0, 55.11], [60.0, 61.06], [63.0, 63.61], [65.0, 66.12], [69.0, 71.25], [73.0, 73.2], [75.0, 75.78], [79.0, 80.99], [82.0, 84.62], [86.0, 88.45], [90.0, 91.27], [94.0, 94.49], [96.0, 96.4], [97.0, 104.57], [107.0, 108.99], [114.0, 114.42], [117.0, 116.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.64, 0.0, 37.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.74, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 58.81, 74.92, 0.0, 0.0, 0.0, 47.66, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 80.64], ["inside, small room", 3.66], ["boing", 3.52]], null, [["speech", 67.14], ["sidetone", 27.47], ["chirp tone", 0.95]], null, null, null, null, null, null, null, [["cattle, bovinae", 31.27], ["moo", 27.93], ["livestock, farm animals, working animals", 14.85]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 71.78], ["didgeridoo", 10.6], ["speech", 4.15]], null, null, null], "duration": [0.5, 0.11, 3.98, 0.62, 4.73, -0.23, -0.2, 0.69, 1.13, -0.19, -0.28, 0.63, 3.11, 1.06, 0.61, 1.12, 2.25, 0.2, 0.78, 1.99, 2.62, 2.45, 1.27, 0.49, 0.4, 7.57, 1.99, 0.42, -0.12]} \ No newline at end of file diff --git a/annotations_1/4NGNbrLnvhA_filtered.json b/annotations_1/4NGNbrLnvhA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4940a00071e68fca285e691a0238e364d9849ba6 --- /dev/null +++ b/annotations_1/4NGNbrLnvhA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.0], [2.0, 2.76], [6.0, 44.51], [45.0, 48.78], [49.0, 61.13], [64.0, 74.07], [74.0, 88.57], [89.0, 88.69], [89.0, 88.91], [89.0, 98.0], [101.0, 101.22], [105.0, 110.62], [125.0, 125.24], [127.0, 127.28], [130.0, 138.0], [138.0, 140.63], [142.0, 147.24], [149.0, 151.77], [153.0, 154.77]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.45, 39.49, 43.85, 42.17, 0.0, 0.0, 41.22, 0.0, 54.56, 0.0, 0.0, 42.93, 85.54, 99.98, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 68.22], ["didgeridoo", 10.26], ["musical instrument", 2.85]], [["music", 49.7], ["speech", 9.77], ["hum", 5.55]], [["hum", 36.7], ["music", 31.12], ["throbbing", 10.81]], [["music", 49.94], ["speech", 22.39], ["cattle, bovinae", 2.09]], null, null, [["music", 38.96], ["speech", 20.1], ["foghorn", 6.0]], null, null, null, null, [["speech", 17.2], ["livestock, farm animals, working animals", 15.28], ["cattle, bovinae", 9.52]], null, null, null, null], "duration": [0.0, 0.76, 38.51, 3.78, 12.13, 10.07, 14.57, -0.31, -0.09, 9.0, 0.22, 5.62, 0.24, 0.28, 8.0, 2.63, 5.24, 2.77, 1.77]} \ No newline at end of file diff --git a/annotations_1/4N_0iP8TSRo_filtered.json b/annotations_1/4N_0iP8TSRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9514fc09dcf06b1604bdb855cec516eddb39e324 --- /dev/null +++ b/annotations_1/4N_0iP8TSRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.64], [30.0, 69.5], [72.0, 72.74], [73.0, 74.28], [76.0, 77.09], [78.0, 110.88]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.64, 39.5, 0.74, 1.28, 1.09, 32.88]} \ No newline at end of file diff --git a/annotations_1/4OEhuma-rrY_filtered.json b/annotations_1/4OEhuma-rrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6c77c29308bfed608e4aa70f3af3d8ed0c58594 --- /dev/null +++ b/annotations_1/4OEhuma-rrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.21], [19.0, 19.47], [31.0, 30.94], [36.0, 35.97], [36.0, 36.09], [41.0, 41.57], [42.0, 57.1], [60.0, 62.5], [63.0, 62.6], [64.0, 63.98], [67.0, 67.29], [67.0, 67.46], [82.0, 82.58], [83.0, 84.43], [92.0, 97.9], [99.0, 114.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.2, 64.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.37, 91.64], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 51.69], ["music", 14.62], ["rumble", 10.55]], null, null, null, null, null, null, null, null, null], "duration": [0.21, 0.47, -0.06, -0.03, 0.09, 0.57, 15.1, 2.5, -0.4, -0.02, 0.29, 0.46, 0.58, 1.43, 5.9, 15.44]} \ No newline at end of file diff --git a/annotations_1/4QR_9BehbWc_filtered.json b/annotations_1/4QR_9BehbWc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88e446245c7b8ba756ed43513bb0a621fcfe95a4 --- /dev/null +++ b/annotations_1/4QR_9BehbWc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [4.0, 3.54], [4.0, 5.0], [6.0, 6.88], [8.0, 8.85], [10.0, 14.15], [16.0, 27.99], [32.0, 32.26], [33.0, 33.59], [34.0, 35.83], [37.0, 37.52], [40.0, 41.72], [46.0, 75.14], [76.0, 76.45], [77.0, 89.9], [91.0, 92.38], [93.0, 94.2], [95.0, 97.43], [98.0, 108.5], [109.0, 109.07], [110.0, 111.69], [115.0, 123.42]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 52.86, 35.68, 0.0, 0.0, 0.0, 0.0, 0.0, 40.59, 0.0, 33.43, 0.0, 0.0, 38.32, 38.62, 0.0, 0.0, 45.62], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 46.89], ["hum", 14.78], ["throbbing", 7.97]], null, null, null, null, null, [["hum", 25.28], ["music", 20.48], ["throbbing", 18.34]], null, [["whale vocalization", 41.42], ["music", 19.03], ["speech", 7.38]], null, null, [["music", 60.42], ["animal", 7.71], ["synthesizer", 2.99]], [["music", 46.42], ["theremin", 37.14], ["musical instrument", 3.55]], null, null, [["music", 51.86], ["hum", 14.16], ["mains hum", 5.57]]], "duration": [0.38, -0.46, 1.0, 0.88, 0.85, 4.15, 11.99, 0.26, 0.59, 1.83, 0.52, 1.72, 29.14, 0.45, 12.9, 1.38, 1.2, 2.43, 10.5, 0.07, 1.69, 8.42]} \ No newline at end of file diff --git a/annotations_1/4QYYeDp44H8_filtered.json b/annotations_1/4QYYeDp44H8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d68cb8ff0aa4ffc0b0b2f332f1eb12ff54ec8abd --- /dev/null +++ b/annotations_1/4QYYeDp44H8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[62.0, 70.24], [74.0, 78.75], [81.0, 82.66], [94.0, 94.66], [101.0, 102.24], [106.0, 107.52], [110.0, 111.37], [113.0, 115.13], [116.0, 122.66], [124.0, 126.3], [127.0, 130.44]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.14, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89, 91.47, 87.92, 52.56], "audiomae_on_audioset": [[["mains hum", 24.12], ["hum", 21.26], ["music", 9.37]], null, null, null, null, null, null, null, null, null, null], "duration": [8.24, 4.75, 1.66, 0.66, 1.24, 1.52, 1.37, 2.13, 6.66, 2.3, 3.44]} \ No newline at end of file diff --git a/annotations_1/4RrAmzAYCQY_filtered.json b/annotations_1/4RrAmzAYCQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d76fd2d5ddffd804d1d5b4737815928d5013159 --- /dev/null +++ b/annotations_1/4RrAmzAYCQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 79.12], [91.0, 92.04], [93.0, 93.24], [96.0, 102.47], [104.0, 104.87], [115.0, 118.72], [124.0, 126.71]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [29.71, 0.0, 0.0, 31.07, 0.0, 31.14, 38.98], "audiomae_on_audioset": [[["music", 64.68], ["throbbing", 9.91], ["electronic music", 3.27]], null, null, [["cattle, bovinae", 25.14], ["music", 23.34], ["moo", 20.22]], null, [["throbbing", 39.95], ["music", 27.4], ["hum", 12.14]], [["music", 46.81], ["throbbing", 20.68], ["hum", 8.75]]], "duration": [8.12, 1.04, 0.24, 6.47, 0.87, 3.72, 2.71]} \ No newline at end of file diff --git a/annotations_1/4SDOcUPE1GI_filtered.json b/annotations_1/4SDOcUPE1GI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2619690317f52bccb41292d7f47422dc2228a96 --- /dev/null +++ b/annotations_1/4SDOcUPE1GI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.35], [19.0, 24.58], [28.0, 37.79], [39.0, 49.69], [54.0, 59.24], [61.0, 82.76], [86.0, 101.07]], "keep_status": [true, false, true, true, true, false, false], "silence_prob": [30.98, 32.67, 32.95, 31.24, 30.42, 31.85, 30.72], "audiomae_on_audioset": [[["speech", 50.91], ["music", 5.68], ["explosion", 5.45]], [["music", 62.96], ["speech", 15.91], ["fart", 3.3]], [["music", 34.47], ["throbbing", 14.65], ["fly, housefly", 10.57]], [["music", 29.49], ["speech", 24.02], ["throbbing", 7.86]], [["music", 35.72], ["throbbing", 18.03], ["hum", 14.21]], [["music", 63.61], ["speech", 14.93], ["groan", 2.74]], [["music", 69.59], ["groan", 5.52], ["throbbing", 4.98]]], "duration": [7.35, 5.58, 9.79, 10.69, 5.24, 21.76, 15.07]} \ No newline at end of file diff --git a/annotations_1/4Tb7SrDUXWo_filtered.json b/annotations_1/4Tb7SrDUXWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2daa92ad70b6323894f801940280ea96669af2ca --- /dev/null +++ b/annotations_1/4Tb7SrDUXWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 20.29], [21.0, 21.68], [22.0, 23.58], [24.0, 24.85], [33.0, 33.39], [39.0, 40.95], [44.0, 61.1], [61.0, 63.51], [66.0, 69.04], [71.0, 72.99], [75.0, 76.03], [77.0, 78.07], [79.0, 81.04], [82.0, 84.18], [87.0, 88.96], [92.0, 92.84], [94.0, 95.15], [97.0, 98.32], [99.0, 105.73], [106.0, 108.14], [110.0, 112.02], [113.0, 113.49], [115.0, 123.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [33.65, 0.0, 0.0, 0.0, 0.0, 0.0, 37.5, 34.44, 44.69, 0.0, 0.0, 0.0, 54.56, 43.98, 0.0, 0.0, 0.0, 0.0, 31.94, 31.74, 38.46, 0.0, 32.96], "audiomae_on_audioset": [[["music", 74.12], ["theremin", 5.89], ["musical instrument", 5.49]], null, null, null, null, null, [["music", 53.53], ["speech", 39.76], ["musical instrument", 1.01]], [["sidetone", 27.3], ["music", 18.98], ["didgeridoo", 13.52]], [["music", 54.12], ["theremin", 17.19], ["synthesizer", 6.43]], null, null, null, null, [["music", 46.6], ["foghorn", 19.32], ["speech", 12.61]], null, null, null, null, [["music", 48.19], ["theremin", 21.23], ["effects unit", 13.44]], [["music", 54.86], ["speech", 6.32], ["theremin", 6.02]], [["music", 76.63], ["synthetic singing", 2.2], ["didgeridoo", 2.03]], null, [["music", 74.11], ["brass instrument", 6.37], ["trombone", 5.37]]], "duration": [19.29, 0.68, 1.58, 0.85, 0.39, 1.95, 17.1, 2.51, 3.04, 1.99, 1.03, 1.07, 2.04, 2.18, 1.96, 0.84, 1.15, 1.32, 6.73, 2.14, 2.02, 0.49, 8.94]} \ No newline at end of file diff --git a/annotations_1/4TsgjtL0Qx4_filtered.json b/annotations_1/4TsgjtL0Qx4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13e97b42bb174032c51a42f1726e8b0b7f36dd46 --- /dev/null +++ b/annotations_1/4TsgjtL0Qx4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 19.67], [21.0, 22.94], [24.0, 27.85], [29.0, 43.48], [45.0, 47.01], [48.0, 49.52], [51.0, 53.25], [55.0, 56.86], [58.0, 62.61], [63.0, 67.24], [69.0, 74.43], [75.0, 78.41], [82.0, 83.56], [85.0, 86.93], [88.0, 89.45], [92.0, 93.78], [95.0, 96.31], [100.0, 100.47], [103.0, 117.41], [118.0, 163.09], [165.0, 169.64], [172.0, 177.23]], "keep_status": [true, false, true, true, true, false, true, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [46.4, 0.0, 32.18, 33.08, 35.29, 0.0, 35.19, 0.0, 30.22, 33.37, 34.34, 35.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.78, 0.0, 67.51, 39.28], "audiomae_on_audioset": [[["sine wave", 22.22], ["speech", 15.02], ["hum", 13.47]], null, [["music", 27.72], ["chirp tone", 11.66], ["sine wave", 7.38]], [["hum", 34.39], ["throbbing", 18.43], ["speech", 15.12]], [["music", 17.91], ["chirp tone", 15.47], ["hum", 15.36]], null, [["hum", 30.37], ["throbbing", 16.95], ["music", 9.87]], null, [["speech", 38.68], ["music", 23.73], ["breaking", 8.05]], [["hum", 24.29], ["mains hum", 18.2], ["music", 17.43]], [["music", 31.35], ["hum", 22.35], ["throbbing", 13.22]], [["music", 42.83], ["hum", 10.44], ["electronic music", 7.89]], null, null, null, null, null, null, [["throbbing", 43.57], ["hum", 26.9], ["music", 17.12]], null, null, [["music", 66.15], ["scary music", 8.6], ["sonar", 3.57]]], "duration": [5.67, 1.94, 3.85, 14.48, 2.01, 1.52, 2.25, 1.86, 4.61, 4.24, 5.43, 3.41, 1.56, 1.93, 1.45, 1.78, 1.31, 0.47, 14.41, 45.09, 4.64, 5.23]} \ No newline at end of file diff --git a/annotations_1/4UC_5gXVXUk_filtered.json b/annotations_1/4UC_5gXVXUk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..772df2603beb2d5c56fa32af0996dde74ce8b96e --- /dev/null +++ b/annotations_1/4UC_5gXVXUk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.94], [5.0, 5.0], [10.0, 10.39], [14.0, 14.72], [16.0, 17.78], [18.0, 18.33], [29.0, 30.99], [36.0, 36.58], [75.0, 75.44], [79.0, 85.68]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 27.61], ["music", 13.29], ["gong", 13.06]]], "duration": [1.94, 0.0, 0.39, 0.72, 1.78, 0.33, 1.99, 0.58, 0.44, 6.68]} \ No newline at end of file diff --git a/annotations_1/4UOnDFoEPUQ_filtered.json b/annotations_1/4UOnDFoEPUQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42b82b30195264343de46f813354dc5bb2ecd960 --- /dev/null +++ b/annotations_1/4UOnDFoEPUQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 23.53], [29.0, 69.16], [69.0, 69.7], [70.0, 75.64], [78.0, 79.15], [80.0, 82.71], [84.0, 87.22], [88.0, 89.01], [91.0, 92.47], [94.0, 96.77], [98.0, 99.82], [101.0, 105.65], [107.0, 137.44], [138.0, 139.53]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.26, 0.0, 0.0, 31.44, 0.0, 51.5, 68.54, 0.0, 0.0, 62.47, 0.0, 44.99, 0.0, 0.0], "audiomae_on_audioset": [[["buzz", 58.21], ["music", 10.46], ["insect", 3.49]], null, null, [["music", 24.14], ["hum", 18.43], ["sonar", 17.46]], null, null, null, null, null, null, null, [["music", 35.09], ["speech", 33.93], ["theremin", 12.5]], null, null], "duration": [21.53, 40.16, 0.7, 5.64, 1.15, 2.71, 3.22, 1.01, 1.47, 2.77, 1.82, 4.65, 30.44, 1.53]} \ No newline at end of file diff --git a/annotations_1/4UzVKW_Iqi0_filtered.json b/annotations_1/4UzVKW_Iqi0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3e747d3bcceb7e408820cd59b21a44767aa13f4 --- /dev/null +++ b/annotations_1/4UzVKW_Iqi0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 15.6], [16.0, 16.44], [17.0, 27.9], [31.0, 37.76], [42.0, 46.03], [47.0, 47.63], [49.0, 58.99], [60.0, 62.48], [64.0, 65.55], [71.0, 71.19], [73.0, 72.94], [75.0, 75.9], [80.0, 80.79], [82.0, 82.32], [92.0, 91.96], [98.0, 98.96], [103.0, 103.84], [108.0, 118.59], [120.0, 120.31]], "keep_status": [true, false, false, true, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.33, 0.0, 30.51, 30.15, 31.92, 0.0, 31.94, 36.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.7, 0.0], "audiomae_on_audioset": [[["music", 45.31], ["didgeridoo", 12.23], ["speech", 5.18]], null, [["cowbell", 50.51], ["speech", 13.73], ["music", 10.74]], [["speech", 23.46], ["music", 23.43], ["throbbing", 8.58]], [["music", 39.53], ["throbbing", 11.2], ["coin (dropping)", 6.51]], null, [["music", 29.66], ["speech", 13.3], ["burst, pop", 5.73]], [["music", 20.95], ["synthesizer", 18.69], ["theremin", 12.84]], null, null, null, null, null, null, null, null, null, [["music", 56.32], ["speech", 9.44], ["hum", 7.83]], null], "duration": [10.6, 0.44, 10.9, 6.76, 4.03, 0.63, 9.99, 2.48, 1.55, 0.19, -0.06, 0.9, 0.79, 0.32, -0.04, 0.96, 0.84, 10.59, 0.31]} \ No newline at end of file diff --git a/annotations_1/4V4jhMSJRW8_filtered.json b/annotations_1/4V4jhMSJRW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22a199ca5343dfdc2ab073baa0641224d58db57d --- /dev/null +++ b/annotations_1/4V4jhMSJRW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.4], [9.0, 9.27], [12.0, 13.41], [15.0, 18.6], [23.0, 27.06], [31.0, 31.11], [32.0, 56.62], [60.0, 64.4], [66.0, 77.89], [78.0, 82.0], [85.0, 90.59], [95.0, 120.01], [120.0, 121.8], [122.0, 137.59], [138.0, 147.99], [149.0, 154.45], [157.0, 162.4], [168.0, 168.13], [172.0, 172.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.92, 59.68, 0.0, 37.04, 59.59, 43.51, 48.82, 47.98, 39.66, 0.0, 45.14, 45.08, 79.59, 99.87, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 64.4], ["whale vocalization", 6.82], ["electronic music", 5.52]], null, null, [["music", 68.36], ["whale vocalization", 7.0], ["singing bowl", 3.91]], null, [["music", 47.0], ["singing bowl", 33.18], ["ambient music", 2.45]], [["whale vocalization", 83.83], ["speech", 8.51], ["hum", 1.39]], [["hum", 44.13], ["mains hum", 27.87], ["throbbing", 11.01]], [["whale vocalization", 97.48], ["music", 1.08], ["gurgling", 0.28]], null, [["speech", 48.54], ["music", 25.27], ["boat, water vehicle", 2.64]], [["music", 59.06], ["ambient music", 7.94], ["hum", 6.62]], null, null, null, null], "duration": [1.4, 0.27, 1.41, 3.6, 4.06, 0.11, 24.62, 4.4, 11.89, 4.0, 5.59, 25.01, 1.8, 15.59, 9.99, 5.45, 5.4, 0.13, 0.4]} \ No newline at end of file diff --git a/annotations_1/4V9xYmVeNL4_filtered.json b/annotations_1/4V9xYmVeNL4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64e39ae382299632ac4d3474b07b6fe8c949420b --- /dev/null +++ b/annotations_1/4V9xYmVeNL4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.34], [15.0, 15.5], [18.0, 25.37], [26.0, 31.21], [32.0, 33.44], [35.0, 38.3], [41.0, 42.08], [44.0, 45.59], [48.0, 58.02], [61.0, 62.31], [66.0, 66.95], [70.0, 79.32], [83.0, 85.01], [88.0, 87.83], [91.0, 110.98], [112.0, 113.02], [114.0, 116.26], [117.0, 126.44], [128.0, 130.64], [132.0, 132.63], [134.0, 135.24], [136.0, 138.52], [139.0, 146.5], [151.0, 171.12], [173.0, 173.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 56.25, 51.18, 0.0, 62.99, 0.0, 0.0, 62.99, 0.0, 0.0, 61.47, 56.33, 0.0, 61.08, 0.0, 55.39, 51.94, 56.03, 0.0, 0.0, 50.02, 52.74, 58.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 0.5, 7.37, 5.21, 1.44, 3.3, 1.08, 1.59, 10.02, 1.31, 0.95, 9.32, 2.01, -0.17, 19.98, 1.02, 2.26, 9.44, 2.64, 0.63, 1.24, 2.52, 7.5, 20.12, 0.57]} \ No newline at end of file diff --git a/annotations_1/4VDry9fy8UE_filtered.json b/annotations_1/4VDry9fy8UE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f777777e71d1cde801ebfb93e3abc2314390f520 --- /dev/null +++ b/annotations_1/4VDry9fy8UE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.44], [13.0, 13.54], [15.0, 25.57], [28.0, 95.27], [96.0, 104.7], [120.0, 120.55], [124.0, 125.34], [126.0, 126.47]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [31.43, 0.0, 32.46, 0.0, 30.62, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 57.07], ["didgeridoo", 12.17], ["musical instrument", 4.53]], null, [["music", 53.45], ["trombone", 6.23], ["foghorn", 4.43]], null, [["speech", 39.01], ["horse", 18.71], ["clip-clop", 14.93]], null, null, null], "duration": [2.44, 0.54, 10.57, 67.27, 8.7, 0.55, 1.34, 0.47]} \ No newline at end of file diff --git a/annotations_1/4WNq9Yy9m_g_filtered.json b/annotations_1/4WNq9Yy9m_g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4595dd8d659c251a84df2c9df4348c50cbc795f7 --- /dev/null +++ b/annotations_1/4WNq9Yy9m_g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.7], [10.0, 13.64], [15.0, 17.19], [19.0, 19.87], [21.0, 24.7], [26.0, 27.21], [33.0, 34.79], [36.0, 36.64], [39.0, 62.8], [65.0, 65.52], [69.0, 70.95], [76.0, 78.85], [80.0, 80.89], [88.0, 89.01], [93.0, 94.37], [99.0, 100.2], [103.0, 103.4], [106.0, 116.82], [118.0, 118.56], [126.0, 126.06], [133.0, 132.8], [136.0, 140.09], [141.0, 143.83], [145.0, 149.13], [150.0, 149.94], [150.0, 171.1], [174.0, 178.82], [180.0, 180.15]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, true, true, false, false, false, false], "silence_prob": [48.69, 84.43, 91.47, 0.0, 51.6, 0.0, 0.0, 0.0, 30.43, 0.0, 0.0, 47.58, 0.0, 0.0, 0.0, 0.0, 0.0, 30.58, 0.0, 0.0, 0.0, 32.56, 34.89, 33.97, 0.0, 31.29, 29.81, 0.0], "audiomae_on_audioset": [[["speech", 26.15], ["whale vocalization", 15.86], ["music", 14.26]], null, null, null, null, null, null, null, [["music", 48.21], ["siren", 9.29], ["synthesizer", 8.98]], null, null, [["music", 37.19], ["crushing", 30.12], ["theremin", 7.17]], null, null, null, null, null, [["music", 21.69], ["fly, housefly", 19.94], ["insect", 5.58]], null, null, null, [["buzz", 22.28], ["music", 13.25], ["hum", 8.52]], [["hum", 26.94], ["throbbing", 20.42], ["mains hum", 10.92]], [["music", 36.19], ["hum", 5.07], ["speech", 4.46]], null, [["music", 38.14], ["speech", 30.52], ["outside, rural or natural", 6.65]], [["music", 70.46], ["speech", 3.38], ["foghorn", 2.73]], null], "duration": [4.7, 3.64, 2.19, 0.87, 3.7, 1.21, 1.79, 0.64, 23.8, 0.52, 1.95, 2.85, 0.89, 1.01, 1.37, 1.2, 0.4, 10.82, 0.56, 0.06, -0.2, 4.09, 2.83, 4.13, -0.06, 21.1, 4.82, 0.15]} \ No newline at end of file diff --git a/annotations_1/4WdyyPhh4-k_filtered.json b/annotations_1/4WdyyPhh4-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21381c2e6b20d25b42244d9a4e8877cb0d371c76 --- /dev/null +++ b/annotations_1/4WdyyPhh4-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.33], [5.0, 5.53], [6.0, 7.1], [12.0, 13.66], [16.0, 16.16], [17.0, 17.12], [20.0, 20.55], [22.0, 24.68], [25.0, 25.61], [27.0, 27.16], [31.0, 30.65], [31.0, 30.96], [36.0, 38.2], [43.0, 44.51], [50.0, 50.26], [53.0, 55.93], [59.0, 59.75], [61.0, 61.25], [62.0, 62.95], [64.0, 64.45], [65.0, 66.36], [69.0, 68.96], [70.0, 71.69], [73.0, 73.04], [77.0, 77.13], [79.0, 79.47], [80.0, 80.43], [82.0, 82.26], [85.0, 85.9], [87.0, 99.13], [102.0, 102.86], [116.0, 116.95], [121.0, 120.87], [126.0, 127.18], [129.0, 139.82], [142.0, 142.86], [143.0, 143.85], [145.0, 145.42], [146.0, 149.99], [152.0, 152.41], [158.0, 157.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.16, 0.0, 0.0, 0.0, 0.0, 55.11, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.41, 0.0, 0.0, 0.0, 0.0, 31.36, 0.0, 0.0, 0.0, 32.92, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 34.8], ["speech", 8.31], ["musical instrument", 6.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.4], ["musical instrument", 5.74], ["hum", 5.1]], null, null, null, null, [["music", 79.63], ["sampler", 2.06], ["electronic music", 1.61]], null, null, null, [["music", 63.86], ["sampler", 2.72], ["electronic music", 2.04]], null, null], "duration": [0.33, 0.53, 1.1, 1.66, 0.16, 0.12, 0.55, 2.68, 0.61, 0.16, -0.35, -0.04, 2.2, 1.51, 0.26, 2.93, 0.75, 0.25, 0.95, 0.45, 1.36, -0.04, 1.69, 0.04, 0.13, 0.47, 0.43, 0.26, 0.9, 12.13, 0.86, 0.95, -0.13, 1.18, 10.82, 0.86, 0.85, 0.42, 3.99, 0.41, -0.06]} \ No newline at end of file diff --git a/annotations_1/4WgLRH-FpWQ_filtered.json b/annotations_1/4WgLRH-FpWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72622418bcfb3147a19724a31ca9e40e3199ab39 --- /dev/null +++ b/annotations_1/4WgLRH-FpWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.21], [26.0, 26.72], [27.0, 27.85], [44.0, 47.04], [56.0, 58.31], [70.0, 74.36], [75.0, 75.74], [85.0, 84.79], [117.0, 119.26], [122.0, 123.67], [127.0, 128.22], [129.0, 129.86], [136.0, 140.46]], "keep_status": [false, false, false, true, true, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.93, 29.08, 28.41, 0.0, 0.0, 32.37, 0.0, 0.0, 0.0, 38.95], "audiomae_on_audioset": [null, null, null, [["whip", 25.34], ["throbbing", 15.52], ["music", 15.12]], [["music", 44.99], ["speech", 11.41], ["throbbing", 8.64]], [["speech", 36.88], ["music", 28.42], ["boom", 3.58]], null, null, [["music", 41.16], ["speech", 14.82], ["theremin", 7.51]], null, null, null, [["music", 57.19], ["scary music", 11.52], ["hum", 6.94]]], "duration": [0.21, 0.72, 0.85, 3.04, 2.31, 4.36, 0.74, -0.21, 2.26, 1.67, 1.22, 0.86, 4.46]} \ No newline at end of file diff --git a/annotations_1/4WibEcqn1c8_filtered.json b/annotations_1/4WibEcqn1c8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8cfa8ff185fb6dbc2c526508400b33a5b3bdc672 --- /dev/null +++ b/annotations_1/4WibEcqn1c8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.12], [10.0, 45.74], [51.0, 61.8], [66.0, 66.09], [67.0, 67.42], [68.0, 70.85], [73.0, 81.19], [82.0, 85.94], [86.0, 87.62], [88.0, 91.84], [94.0, 96.67], [105.0, 116.48], [117.0, 119.58], [120.0, 128.9], [131.0, 136.93], [139.0, 141.39], [143.0, 143.6], [145.0, 147.01], [149.0, 152.47], [153.0, 153.91], [155.0, 157.01], [159.0, 160.34], [161.0, 161.05], [161.0, 168.56], [169.0, 169.5], [175.0, 175.56], [177.0, 177.62], [178.0, 178.29], [179.0, 179.68], [181.0, 181.77], [183.0, 183.22], [185.0, 187.44], [188.0, 188.0], [192.0, 194.88], [195.0, 197.34], [200.0, 199.81], [200.0, 200.99], [204.0, 206.31], [209.0, 211.06], [214.0, 214.27], [217.0, 225.54], [228.0, 230.79]], "keep_status": [false, false, false, false, false, true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, true], "silence_prob": [48.39, 0.0, 37.54, 0.0, 0.0, 37.14, 51.07, 48.39, 0.0, 50.02, 33.93, 33.5, 41.46, 44.84, 62.17, 53.04, 0.0, 59.15, 82.79, 0.0, 66.27, 0.0, 0.0, 42.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.55, 0.0, 49.45, 47.62, 0.0, 0.0, 34.12, 71.43, 0.0, 40.95, 38.88], "audiomae_on_audioset": [[["music", 56.51], ["didgeridoo", 15.31], ["theremin", 7.57]], null, [["music", 37.71], ["theremin", 20.59], ["flute", 16.16]], null, null, [["music", 30.12], ["didgeridoo", 16.95], ["hum", 8.64]], null, [["music", 39.7], ["brass instrument", 8.12], ["dog", 4.54]], null, null, [["music", 25.34], ["synthesizer", 7.93], ["musical instrument", 6.98]], [["music", 31.26], ["brass instrument", 30.63], ["trombone", 16.82]], [["music", 32.11], ["brass instrument", 24.16], ["trombone", 23.46]], [["music", 31.58], ["brass instrument", 31.06], ["musical instrument", 8.84]], null, null, null, null, null, null, null, null, null, [["music", 55.56], ["brass instrument", 11.84], ["foghorn", 9.62]], null, null, null, null, null, null, null, null, null, [["music", 42.87], ["theremin", 11.74], ["carnatic music", 9.01]], [["music", 57.9], ["theremin", 5.98], ["musical instrument", 5.64]], null, null, [["music", 28.68], ["trombone", 21.52], ["brass instrument", 20.7]], null, null, [["brass instrument", 47.46], ["trombone", 20.79], ["music", 19.5]], [["music", 51.83], ["musical instrument", 4.48], ["speech", 2.74]]], "duration": [8.12, 35.74, 10.8, 0.09, 0.42, 2.85, 8.19, 3.94, 1.62, 3.84, 2.67, 11.48, 2.58, 8.9, 5.93, 2.39, 0.6, 2.01, 3.47, 0.91, 2.01, 1.34, 0.05, 7.56, 0.5, 0.56, 0.62, 0.29, 0.68, 0.77, 0.22, 2.44, 0.0, 2.88, 2.34, -0.19, 0.99, 2.31, 2.06, 0.27, 8.54, 2.79]} \ No newline at end of file diff --git a/annotations_1/4XK1zU7zhkI_filtered.json b/annotations_1/4XK1zU7zhkI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd676e36d5f997403a2e35e11a1054bd96f73821 --- /dev/null +++ b/annotations_1/4XK1zU7zhkI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.62], [20.0, 21.09], [23.0, 23.57], [26.0, 28.71], [34.0, 35.04], [37.0, 42.9], [44.0, 46.08], [46.0, 47.31], [48.0, 49.08], [50.0, 51.09], [52.0, 53.13], [55.0, 55.43], [57.0, 57.38], [60.0, 61.67], [62.0, 63.07], [70.0, 70.83], [73.0, 73.65], [75.0, 77.31], [78.0, 80.08], [81.0, 82.12], [83.0, 89.72], [90.0, 90.8], [93.0, 93.43], [97.0, 98.34], [99.0, 107.23], [110.0, 115.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 89.19, 52.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.66, 39.07, 0.0, 40.07, 0.0, 0.0, 0.0, 34.91, 34.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 24.91], ["rumble", 16.95], ["whale vocalization", 6.61]], [["music", 10.72], ["gong", 8.83], ["sine wave", 8.25]], null, [["music", 19.66], ["hum", 13.73], ["synthesizer", 12.25]], null, null, null, [["music", 59.6], ["synthesizer", 23.06], ["electronic music", 3.9]], [["music", 64.13], ["synthesizer", 9.77], ["throbbing", 4.2]]], "duration": [0.62, 1.09, 0.57, 2.71, 1.04, 5.9, 2.08, 1.31, 1.08, 1.09, 1.13, 0.43, 0.38, 1.67, 1.07, 0.83, 0.65, 2.31, 2.08, 1.12, 6.72, 0.8, 0.43, 1.34, 8.23, 5.03]} \ No newline at end of file diff --git a/annotations_1/4XKZFS7EoCU_filtered.json b/annotations_1/4XKZFS7EoCU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bad4ea05550b7e6b71a3297318d5d53896db8c82 --- /dev/null +++ b/annotations_1/4XKZFS7EoCU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.51], [19.0, 21.22], [26.0, 28.05], [31.0, 31.11], [39.0, 40.42], [40.0, 40.46], [50.0, 50.08], [53.0, 53.79], [55.0, 56.79], [79.0, 79.76], [83.0, 86.29], [98.0, 98.42], [99.0, 99.86], [101.0, 102.46], [121.0, 121.56], [125.0, 125.95]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 57.97, 38.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.21, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["didgeridoo", 36.05], ["speech", 13.85], ["music", 10.06]], null, null, null, null, null, null, null, [["cattle, bovinae", 34.69], ["livestock, farm animals, working animals", 28.62], ["moo", 26.62]], null, null, null, null, null], "duration": [0.51, 2.22, 2.05, 0.11, 1.42, 0.46, 0.08, 0.79, 1.79, 0.76, 3.29, 0.42, 0.86, 1.46, 0.56, 0.95]} \ No newline at end of file diff --git a/annotations_1/4YPxIpLpLRM_filtered.json b/annotations_1/4YPxIpLpLRM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51888b954bb98fb0e03d3d0a88b9e84f17f7e566 --- /dev/null +++ b/annotations_1/4YPxIpLpLRM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.07], [13.0, 14.35], [18.0, 18.49], [23.0, 23.58], [24.0, 24.85], [26.0, 26.32], [27.0, 26.94], [30.0, 30.69], [31.0, 34.03], [50.0, 50.46], [63.0, 80.64], [96.0, 96.33], [121.0, 129.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.88, 0.0, 35.52, 0.0, 29.63], "audiomae_on_audioset": [[["thunk", 44.12], ["speech", 22.95], ["door", 3.56]], null, null, null, null, null, null, null, [["speech", 67.45], ["sidetone", 14.43], ["sine wave", 2.5]], null, [["throbbing", 39.87], ["hum", 24.33], ["heart sounds, heartbeat", 13.68]], null, [["speech", 73.34], ["music", 11.62], ["outside, urban or manmade", 1.35]]], "duration": [3.07, 1.35, 0.49, 0.58, 0.85, 0.32, -0.06, 0.69, 3.03, 0.46, 17.64, 0.33, 8.83]} \ No newline at end of file diff --git a/annotations_1/4YuwbC-9aDI_filtered.json b/annotations_1/4YuwbC-9aDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b4e8fd58ccf4b470b9a5aa5ee7da8d9418adecb --- /dev/null +++ b/annotations_1/4YuwbC-9aDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.28], [45.0, 45.27], [48.0, 52.95], [65.0, 66.09], [69.0, 69.48], [70.0, 72.23], [92.0, 93.23], [98.0, 99.45], [100.0, 101.51]], "keep_status": [true, false, true, false, false, false, false, false, false], "silence_prob": [46.54, 0.0, 40.75, 0.0, 0.0, 50.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 25.73], ["livestock, farm animals, working animals", 14.41], ["animal", 12.05]], null, [["music", 30.38], ["guitar", 15.82], ["musical instrument", 9.97]], null, null, null, null, null, null], "duration": [2.28, 0.27, 4.95, 1.09, 0.48, 2.23, 1.23, 1.45, 1.51]} \ No newline at end of file diff --git a/annotations_1/4ZCtygwf67Y_filtered.json b/annotations_1/4ZCtygwf67Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83928207ef73af172041374d08456a898c95ef20 --- /dev/null +++ b/annotations_1/4ZCtygwf67Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.24], [8.0, 10.49], [12.0, 13.49], [14.0, 14.5], [15.0, 16.7], [20.0, 21.56], [24.0, 24.43], [26.0, 27.21], [30.0, 31.11], [35.0, 37.29], [39.0, 40.37], [43.0, 44.47], [47.0, 55.85], [60.0, 62.07], [63.0, 83.24], [87.0, 88.89], [91.0, 92.11], [96.0, 96.36], [97.0, 99.28], [102.0, 103.44], [106.0, 141.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [39.67, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 84.43, 88.28, 41.24, 0.0, 0.0, 0.0, 45.3, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 63.24], ["hum", 5.6], ["chirp tone", 2.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 33.85], ["throbbing", 18.6], ["mains hum", 15.69]], null, null, null, [["speech", 33.58], ["music", 32.12], ["hum", 4.13]], null, null], "duration": [3.24, 2.49, 1.49, 0.5, 1.7, 1.56, 0.43, 1.21, 1.11, 2.29, 1.37, 1.47, 8.85, 2.07, 20.24, 1.89, 1.11, 0.36, 2.28, 1.44, 35.96]} \ No newline at end of file diff --git a/annotations_1/4ZiwLxnl_9k_filtered.json b/annotations_1/4ZiwLxnl_9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3d2689021c60ade950cb894612708f909c887c5 --- /dev/null +++ b/annotations_1/4ZiwLxnl_9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.26], [7.0, 7.38], [10.0, 11.57], [13.0, 15.72], [20.0, 23.53], [26.0, 26.82], [27.0, 37.44], [39.0, 44.56], [47.0, 56.93], [58.0, 60.51], [62.0, 64.94], [66.0, 71.49], [74.0, 75.05], [78.0, 82.44], [84.0, 85.16], [88.0, 89.24], [90.0, 98.32], [102.0, 116.43], [123.0, 128.68], [133.0, 144.05]], "keep_status": [false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 60.79, 41.58, 0.0, 52.86, 31.93, 35.85, 39.34, 35.12, 32.63, 0.0, 30.78, 0.0, 0.0, 32.48, 29.5, 31.21, 39.98], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 33.65], ["speech", 21.37], ["hum", 18.44]], null, null, [["hum", 16.84], ["throbbing", 11.35], ["fart", 9.64]], [["speech", 37.79], ["hum", 17.42], ["throbbing", 9.83]], [["fart", 30.07], ["heart sounds, heartbeat", 26.36], ["throbbing", 14.38]], [["noise", 8.51], ["throbbing", 5.69], ["music", 5.48]], [["throbbing", 60.4], ["hum", 27.75], ["heart sounds, heartbeat", 7.73]], null, [["music", 71.92], ["speech", 5.42], ["electronic music", 4.04]], null, null, [["speech", 46.39], ["horse", 19.67], ["neigh, whinny", 9.38]], [["moo", 20.06], ["music", 19.49], ["cattle, bovinae", 18.19]], [["speech", 30.02], ["fart", 18.11], ["noise", 6.01]], [["animal", 25.62], ["grunt", 10.15], ["whale vocalization", 8.15]]], "duration": [0.26, 0.38, 1.57, 2.72, 3.53, 0.82, 10.44, 5.56, 9.93, 2.51, 2.94, 5.49, 1.05, 4.44, 1.16, 1.24, 8.32, 14.43, 5.68, 11.05]} \ No newline at end of file diff --git a/annotations_1/4_SBdgdCwDA_filtered.json b/annotations_1/4_SBdgdCwDA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0bfd1492ef2749fea00d7e49e799b6775caf941 --- /dev/null +++ b/annotations_1/4_SBdgdCwDA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.1], [12.0, 15.42], [16.0, 17.52], [22.0, 23.01], [27.0, 27.09], [28.0, 28.81], [30.0, 32.07], [33.0, 36.32], [45.0, 45.2], [48.0, 52.62], [53.0, 60.2], [62.0, 62.55], [65.0, 66.48], [68.0, 70.01], [74.0, 75.51], [77.0, 77.33], [78.0, 85.16], [87.0, 87.3], [88.0, 116.4], [118.0, 118.07], [119.0, 120.7], [124.0, 126.5], [128.0, 132.11], [133.0, 134.22]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [71.72, 32.0, 0.0, 0.0, 0.0, 0.0, 42.11, 55.6, 0.0, 99.87, 34.39, 0.0, 0.0, 99.99, 0.0, 0.0, 30.65, 0.0, 31.88, 0.0, 0.0, 99.98, 54.23, 0.0], "audiomae_on_audioset": [null, [["speech", 56.98], ["coin (dropping)", 7.01], ["creak", 7.0]], null, null, null, null, [["speech", 22.07], ["crushing", 5.67], ["bouncing", 4.08]], null, null, null, [["sine wave", 25.1], ["speech", 16.86], ["chirp tone", 8.0]], null, null, null, null, null, [["speech", 66.61], ["gunshot, gunfire", 7.08], ["burst, pop", 6.96]], null, [["mosquito", 22.27], ["whack, thwack", 13.41], ["fly, housefly", 10.33]], null, null, null, null, null], "duration": [3.1, 3.42, 1.52, 1.01, 0.09, 0.81, 2.07, 3.32, 0.2, 4.62, 7.2, 0.55, 1.48, 2.01, 1.51, 0.33, 7.16, 0.3, 28.4, 0.07, 1.7, 2.5, 4.11, 1.22]} \ No newline at end of file diff --git a/annotations_1/4_p4EAmMa-M_filtered.json b/annotations_1/4_p4EAmMa-M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83fb6565fb50830ce1ce6ed15327fddfe2f40c63 --- /dev/null +++ b/annotations_1/4_p4EAmMa-M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.58], [12.0, 13.26], [15.0, 18.06], [19.0, 20.88], [23.0, 29.02], [30.0, 33.54], [35.0, 38.06], [40.0, 43.29], [47.0, 47.66], [48.0, 48.68], [50.0, 52.17], [54.0, 55.75], [57.0, 67.2], [68.0, 93.38], [94.0, 98.56], [99.0, 100.25], [102.0, 102.51], [106.0, 106.07], [107.0, 110.39], [111.0, 112.63], [114.0, 119.75], [120.0, 121.61], [123.0, 124.01], [127.0, 128.31], [129.0, 130.18], [131.0, 131.92], [134.0, 134.6], [136.0, 138.74], [139.0, 140.02], [146.0, 146.42], [148.0, 152.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.93, 0.0, 99.16, 99.91, 99.21, 99.4, 0.0, 0.0, 94.22, 0.0, 99.48, 95.09, 97.22, 0.0, 0.0, 0.0, 99.9, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 91.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.58, 1.26, 3.06, 1.88, 6.02, 3.54, 3.06, 3.29, 0.66, 0.68, 2.17, 1.75, 10.2, 25.38, 4.56, 1.25, 0.51, 0.07, 3.39, 1.63, 5.75, 1.61, 1.01, 1.31, 1.18, 0.92, 0.6, 2.74, 1.02, 0.42, 4.19]} \ No newline at end of file diff --git a/annotations_1/4aKmbFnV-mI_filtered.json b/annotations_1/4aKmbFnV-mI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cac6a53eda2dc282d9937c66087c84db92c3156d --- /dev/null +++ b/annotations_1/4aKmbFnV-mI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 95.98], [96.0, 120.34], [121.0, 131.25], [134.0, 143.5], [145.0, 145.74], [146.0, 146.67], [147.0, 149.72], [150.0, 151.39], [152.0, 152.79]], "keep_status": [false, false, true, true, false, false, true, false, false], "silence_prob": [70.86, 59.15, 40.16, 35.67, 0.0, 0.0, 35.94, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 43.43], ["music", 14.56], ["sonar", 11.78]], [["music", 39.64], ["basketball bounce", 16.77], ["speech", 12.54]], null, null, [["speech", 32.13], ["electric shaver, electric razor", 11.21], ["music", 5.61]], null, null], "duration": [28.98, 24.34, 10.25, 9.5, 0.74, 0.67, 2.72, 1.39, 0.79]} \ No newline at end of file diff --git a/annotations_1/4ak8huhsVKc_filtered.json b/annotations_1/4ak8huhsVKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cddfa0fc7663fc9134fb0a8892e8c166a46ece8 --- /dev/null +++ b/annotations_1/4ak8huhsVKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.02], [6.0, 8.24], [9.0, 10.02], [13.0, 16.33], [18.0, 25.95], [26.0, 27.92], [33.0, 33.47], [34.0, 43.16], [45.0, 46.3], [47.0, 47.38], [49.0, 52.32], [52.0, 54.11], [55.0, 55.71], [57.0, 59.43], [61.0, 61.37], [62.0, 62.75], [67.0, 67.31], [68.0, 68.4], [69.0, 69.67], [76.0, 77.62], [78.0, 78.66], [79.0, 81.13], [83.0, 83.89], [90.0, 90.29], [91.0, 91.17], [91.0, 99.52], [103.0, 104.38], [109.0, 110.52], [112.0, 113.54], [115.0, 115.72], [116.0, 117.56], [118.0, 118.59], [119.0, 120.55], [121.0, 121.63], [122.0, 123.77], [126.0, 127.53], [131.0, 131.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 61.08, 0.0, 91.64, 51.77, 0.0, 0.0, 100.0, 0.0, 0.0, 99.99, 74.29, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 0.0, 0.0, 0.0, 49.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 54.53], ["speech", 25.84], ["radio", 14.47]], null, null, null, null, null, null, null, null, null, null, null], "duration": [4.02, 2.24, 1.02, 3.33, 7.95, 1.92, 0.47, 9.16, 1.3, 0.38, 3.32, 2.11, 0.71, 2.43, 0.37, 0.75, 0.31, 0.4, 0.67, 1.62, 0.66, 2.13, 0.89, 0.29, 0.17, 8.52, 1.38, 1.52, 1.54, 0.72, 1.56, 0.59, 1.55, 0.63, 1.77, 1.53, 0.43]} \ No newline at end of file diff --git a/annotations_1/4c_4MGTCgHY_filtered.json b/annotations_1/4c_4MGTCgHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59c965b404613ecdf640ca0cd4bc827768a84cc6 --- /dev/null +++ b/annotations_1/4c_4MGTCgHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 19.67], [29.0, 29.03], [29.0, 30.43], [33.0, 33.12], [42.0, 53.32], [54.0, 54.87], [58.0, 61.8], [68.0, 68.74], [73.0, 76.15]], "keep_status": [true, false, false, false, false, false, false, false, false], "silence_prob": [30.14, 0.0, 0.0, 0.0, 29.9, 0.0, 83.52, 0.0, 53.65], "audiomae_on_audioset": [[["speech", 34.14], ["whack, thwack", 17.23], ["thunk", 14.87]], null, null, null, [["speech", 52.17], ["whack, thwack", 16.92], ["thump, thud", 8.76]], null, null, null, null], "duration": [4.67, 0.03, 1.43, 0.12, 11.32, 0.87, 3.8, 0.74, 3.15]} \ No newline at end of file diff --git a/annotations_1/4cl5cWYmvgc_filtered.json b/annotations_1/4cl5cWYmvgc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d98edbf97a79d1c47fa1553a34bf605474d1b539 --- /dev/null +++ b/annotations_1/4cl5cWYmvgc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.8], [13.0, 16.43], [23.0, 23.77], [32.0, 33.17], [39.0, 40.81], [45.0, 47.98], [54.0, 54.57], [61.0, 61.84], [64.0, 65.45], [68.0, 68.89], [72.0, 72.64], [76.0, 79.66], [81.0, 81.7], [88.0, 89.45], [94.0, 104.23], [115.0, 114.76], [123.0, 123.42], [127.0, 128.26], [130.0, 131.79], [144.0, 145.03], [156.0, 156.02], [160.0, 160.64], [172.0, 173.4], [174.0, 174.61], [181.0, 181.6], [183.0, 184.64], [185.0, 185.6]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.94, 0.0, 0.0, 0.0, 31.2, 0.0, 0.0, 0.0, 0.0, 0.0, 30.39, 0.0, 0.0, 31.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["marimba, xylophone", 26.29], ["music", 17.57], ["glockenspiel", 16.65]], null, null, null, [["livestock, farm animals, working animals", 20.57], ["cattle, bovinae", 17.69], ["music", 16.97]], null, null, null, null, null, [["music", 58.5], ["marimba, xylophone", 6.51], ["vibraphone", 5.72]], null, null, [["music", 38.91], ["didgeridoo", 13.28], ["musical instrument", 11.92]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 3.43, 0.77, 1.17, 1.81, 2.98, 0.57, 0.84, 1.45, 0.89, 0.64, 3.66, 0.7, 1.45, 10.23, -0.24, 0.42, 1.26, 1.79, 1.03, 0.02, 0.64, 1.4, 0.61, 0.6, 1.64, 0.6]} \ No newline at end of file diff --git a/annotations_1/4cyZctbdFik_filtered.json b/annotations_1/4cyZctbdFik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..218f39d00a4530a42a05ed320c2a10b5e4b5d074 --- /dev/null +++ b/annotations_1/4cyZctbdFik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.55], [12.0, 14.5], [16.0, 16.85], [18.0, 18.66], [21.0, 21.93], [25.0, 30.42], [33.0, 33.24], [34.0, 35.23], [37.0, 45.35], [47.0, 50.79], [53.0, 53.76], [54.0, 62.38], [65.0, 67.61], [68.0, 70.23], [71.0, 72.5], [80.0, 81.08], [82.0, 82.49], [83.0, 85.48], [86.0, 87.86], [90.0, 90.85], [98.0, 100.79], [102.0, 104.92], [109.0, 112.95], [116.0, 117.29], [120.0, 120.18], [121.0, 121.69], [131.0, 132.54], [133.0, 135.09], [138.0, 140.54], [143.0, 147.33], [153.0, 162.87], [166.0, 171.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [85.35, 97.73, 0.0, 0.0, 0.0, 99.16, 0.0, 0.0, 100.0, 94.07, 0.0, 66.39, 100.0, 42.96, 0.0, 0.0, 0.0, 97.54, 0.0, 0.0, 99.94, 99.99, 43.87, 0.0, 0.0, 0.0, 0.0, 95.91, 89.54, 81.0, 57.01, 49.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 35.48], ["sidetone", 11.75], ["mains hum", 9.24]], null, null, null, null, null, null, null, null, [["stomach rumble", 24.86], ["ding", 13.24], ["chime", 8.03]], null, null, null, null, null, null, null, null, [["music", 75.04], ["singing bowl", 2.56], ["frog", 2.27]]], "duration": [3.55, 2.5, 0.85, 0.66, 0.93, 5.42, 0.24, 1.23, 8.35, 3.79, 0.76, 8.38, 2.61, 2.23, 1.5, 1.08, 0.49, 2.48, 1.86, 0.85, 2.79, 2.92, 3.95, 1.29, 0.18, 0.69, 1.54, 2.09, 2.54, 4.33, 9.87, 5.69]} \ No newline at end of file diff --git a/annotations_1/4d9fx7umXgg_filtered.json b/annotations_1/4d9fx7umXgg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c571ff688e91c72b79beda5ad21dec2cc07cb03d --- /dev/null +++ b/annotations_1/4d9fx7umXgg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.32], [15.0, 17.24], [19.0, 19.94], [21.0, 24.46], [29.0, 29.91], [33.0, 34.21], [37.0, 40.05], [44.0, 45.1], [46.0, 48.46], [51.0, 52.59], [53.0, 56.05], [58.0, 60.45], [61.0, 62.95], [66.0, 69.85], [74.0, 74.98], [78.0, 80.08], [81.0, 83.96], [86.0, 86.93], [91.0, 92.6], [96.0, 97.87], [102.0, 103.27], [107.0, 108.09], [110.0, 111.55], [114.0, 116.75], [125.0, 125.61], [128.0, 130.27], [133.0, 135.6], [139.0, 142.64], [143.0, 150.01], [151.0, 152.27], [154.0, 162.31], [164.0, 195.34], [204.0, 206.27], [208.0, 210.0], [214.0, 217.51], [219.0, 219.47], [220.0, 250.62], [252.0, 256.14], [259.0, 279.09], [280.0, 281.28], [282.0, 284.03]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, true, false, false, false, true, true, true, false, false, true, true, false, false], "silence_prob": [55.6, 56.7, 0.0, 61.37, 0.0, 0.0, 59.15, 0.0, 45.72, 0.0, 31.29, 44.34, 0.0, 30.93, 0.0, 50.81, 68.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.76, 0.0, 46.29, 42.53, 30.99, 39.33, 0.0, 30.4, 0.0, 49.4, 49.73, 34.32, 0.0, 0.0, 29.32, 44.69, 0.0, 74.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 26.57], ["music", 19.95], ["hum", 6.98]], null, [["hum", 26.05], ["mains hum", 16.35], ["rumble", 9.45]], [["hum", 21.96], ["mains hum", 14.02], ["rumble", 9.79]], null, [["music", 70.33], ["hum", 5.5], ["scary music", 4.06]], null, null, null, null, null, null, null, null, null, [["chirp tone", 25.25], ["hum", 25.03], ["music", 13.69]], null, [["speech", 55.55], ["music", 9.09], ["hum", 6.5]], [["music", 26.74], ["speech", 16.31], ["hum", 13.05]], [["music", 34.76], ["hum", 14.83], ["electronic music", 7.07]], [["hum", 29.81], ["music", 21.75], ["mains hum", 10.46]], null, [["music", 71.83], ["synthesizer", 5.74], ["didgeridoo", 4.59]], null, [["music", 42.21], ["hum", 7.26], ["electronic music", 6.35]], [["music", 45.45], ["synthesizer", 4.23], ["hum", 3.73]], [["music", 39.06], ["hum", 15.64], ["mains hum", 11.44]], null, null, [["music", 43.59], ["gong", 11.88], ["sonar", 8.42]], [["music", 33.18], ["didgeridoo", 10.89], ["throbbing", 4.77]], null, null], "duration": [2.32, 2.24, 0.94, 3.46, 0.91, 1.21, 3.05, 1.1, 2.46, 1.59, 3.05, 2.45, 1.95, 3.85, 0.98, 2.08, 2.96, 0.93, 1.6, 1.87, 1.27, 1.09, 1.55, 2.75, 0.61, 2.27, 2.6, 3.64, 7.01, 1.27, 8.31, 31.34, 2.27, 2.0, 3.51, 0.47, 30.62, 4.14, 20.09, 1.28, 2.03]} \ No newline at end of file diff --git a/annotations_1/4fwQKF64AWY_filtered.json b/annotations_1/4fwQKF64AWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb3da0531bdee44469b6ea69e2569b09e95c245f --- /dev/null +++ b/annotations_1/4fwQKF64AWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.29], [16.0, 16.97], [18.0, 19.65], [24.0, 25.52], [28.0, 29.66], [33.0, 36.8], [38.0, 38.21], [39.0, 44.59], [46.0, 53.84], [56.0, 56.91], [58.0, 59.56], [61.0, 62.41], [63.0, 64.08], [65.0, 67.47], [69.0, 69.97], [72.0, 72.44], [74.0, 77.18], [78.0, 78.24], [79.0, 80.13], [83.0, 83.42], [86.0, 86.48], [87.0, 87.66], [89.0, 89.33], [93.0, 93.95], [96.0, 97.07], [98.0, 98.86], [100.0, 104.48], [109.0, 111.37], [113.0, 114.2], [115.0, 116.51], [118.0, 118.57], [120.0, 121.05], [123.0, 131.3], [134.0, 135.14], [139.0, 138.92], [140.0, 141.34], [145.0, 146.57], [147.0, 153.35], [165.0, 166.48], [169.0, 170.21], [172.0, 172.74], [179.0, 180.15], [182.0, 182.76], [186.0, 186.48], [187.0, 190.63], [192.0, 192.81], [194.0, 194.41], [197.0, 197.85], [200.0, 201.34], [203.0, 206.36], [208.0, 215.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [99.65, 0.0, 0.0, 0.0, 0.0, 82.97, 0.0, 98.86, 99.65, 0.0, 0.0, 0.0, 0.0, 74.29, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 95.78, 0.0, 0.0, 0.0, 0.0, 81.53, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 99.62, 42.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.93], ["theremin", 19.32], ["thunk", 16.67]]], "duration": [2.29, 0.97, 1.65, 1.52, 1.66, 3.8, 0.21, 5.59, 7.84, 0.91, 1.56, 1.41, 1.08, 2.47, 0.97, 0.44, 3.18, 0.24, 1.13, 0.42, 0.48, 0.66, 0.33, 0.95, 1.07, 0.86, 4.48, 2.37, 1.2, 1.51, 0.57, 1.05, 8.3, 1.14, -0.08, 1.34, 1.57, 6.35, 1.48, 1.21, 0.74, 1.15, 0.76, 0.48, 3.63, 0.81, 0.41, 0.85, 1.34, 3.36, 7.52]} \ No newline at end of file diff --git a/annotations_1/4gO9OFumO8U_filtered.json b/annotations_1/4gO9OFumO8U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..faf13a8e54f26b60d0b20ce555967cb85c5f0587 --- /dev/null +++ b/annotations_1/4gO9OFumO8U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.52], [5.0, 5.88], [7.0, 7.65], [9.0, 11.23], [12.0, 14.4], [17.0, 76.2], [80.0, 81.11], [82.0, 82.9], [84.0, 85.87], [89.0, 90.66], [91.0, 93.66], [94.0, 95.49], [96.0, 98.24], [99.0, 99.33], [102.0, 102.73], [104.0, 105.11], [106.0, 107.0], [108.0, 109.83], [111.0, 112.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 55.25, 58.55, 0.0, 0.0, 0.0, 0.0, 0.0, 80.64, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.88, 0.65, 2.23, 2.4, 59.2, 1.11, 0.9, 1.87, 1.66, 2.66, 1.49, 2.24, 0.33, 0.73, 1.11, 1.0, 1.83, 1.41]} \ No newline at end of file diff --git a/annotations_1/4gSkh86zcaU_filtered.json b/annotations_1/4gSkh86zcaU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c33488569db613b5f92316361d73866fb6bc8585 --- /dev/null +++ b/annotations_1/4gSkh86zcaU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.93], [11.0, 11.48], [12.0, 13.09], [14.0, 17.36], [18.0, 18.91], [21.0, 21.2], [22.0, 25.95], [27.0, 26.94], [31.0, 33.57], [36.0, 36.56], [38.0, 40.26], [42.0, 42.2], [52.0, 53.59], [58.0, 59.05], [62.0, 62.88], [65.0, 66.5], [68.0, 68.44], [71.0, 71.51], [72.0, 74.07], [77.0, 77.25], [80.0, 80.38], [87.0, 88.35], [88.0, 88.45], [90.0, 91.84], [94.0, 93.73], [95.0, 95.93], [102.0, 102.59], [107.0, 107.74], [108.0, 107.99], [108.0, 109.54], [114.0, 115.05], [119.0, 119.87], [131.0, 131.52], [134.0, 135.08], [140.0, 145.0], [147.0, 147.06], [148.0, 149.12], [154.0, 154.43], [157.0, 158.21], [162.0, 163.71], [165.0, 165.96], [169.0, 170.16]], "keep_status": [true, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.89, 0.0, 0.0, 63.31, 0.0, 0.0, 34.56, 0.0, 32.52, 0.0, 49.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 26.57], ["cattle, bovinae", 18.85], ["moo", 9.75]], null, null, null, null, null, [["speech", 16.15], ["fly, housefly", 14.48], ["mosquito", 8.03]], null, [["speech", 38.56], ["buzzer", 25.12], ["music", 8.26]], null, [["hum", 35.8], ["mains hum", 20.54], ["whale vocalization", 6.18]], null, null, null, null, null, null, null, [["music", 29.66], ["mains hum", 8.42], ["hum", 7.16]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.41], ["speech", 23.8], ["electronic music", 2.13]], null, null, null, null, null, null, null], "duration": [6.93, 0.48, 1.09, 3.36, 0.91, 0.2, 3.95, -0.06, 2.57, 0.56, 2.26, 0.2, 1.59, 1.05, 0.88, 1.5, 0.44, 0.51, 2.07, 0.25, 0.38, 1.35, 0.45, 1.84, -0.27, 0.93, 0.59, 0.74, -0.01, 1.54, 1.05, 0.87, 0.52, 1.08, 5.0, 0.06, 1.12, 0.43, 1.21, 1.71, 0.96, 1.16]} \ No newline at end of file diff --git a/annotations_1/4g_oMoSgIas_filtered.json b/annotations_1/4g_oMoSgIas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a3ba6b42443ec0ff0e9a6194eb2934e40c06b45 --- /dev/null +++ b/annotations_1/4g_oMoSgIas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.13], [7.0, 12.9], [14.0, 38.04], [40.0, 42.57], [46.0, 56.34], [59.0, 59.61], [62.0, 70.97], [72.0, 72.57], [74.0, 78.54], [79.0, 81.9], [82.0, 81.99], [83.0, 87.61], [89.0, 90.75], [93.0, 95.37], [97.0, 97.68], [100.0, 102.0], [105.0, 106.27], [108.0, 108.48], [108.0, 108.51], [109.0, 118.23], [119.0, 119.7], [121.0, 121.22], [124.0, 127.18], [128.0, 128.53]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.14, 29.86, 29.9, 30.1, 0.0, 31.03, 0.0, 30.06, 29.99, 0.0, 30.29, 0.0, 31.95, 0.0, 31.32, 0.0, 0.0, 0.0, 29.79, 0.0, 0.0, 31.57, 0.0], "audiomae_on_audioset": [null, [["music", 52.5], ["cacophony", 14.44], ["throbbing", 7.14]], [["music", 51.2], ["throbbing", 14.24], ["hum", 7.35]], [["music", 56.74], ["throbbing", 14.94], ["hum", 8.75]], [["music", 76.24], ["throbbing", 5.47], ["hum", 2.5]], null, [["hum", 43.92], ["mains hum", 21.4], ["music", 15.63]], null, [["speech", 26.28], ["music", 13.9], ["noise", 12.27]], [["speech", 23.92], ["sidetone", 19.33], ["music", 10.81]], null, [["speech", 19.02], ["music", 18.5], ["whale vocalization", 16.73]], null, [["mains hum", 12.09], ["hum", 11.99], ["bee, wasp, etc.", 11.21]], null, [["music", 49.77], ["speech", 14.24], ["throbbing", 7.5]], null, null, null, [["speech", 42.03], ["music", 32.64], ["musical instrument", 2.62]], null, null, [["hum", 41.06], ["throbbing", 21.01], ["mains hum", 14.59]], null], "duration": [1.13, 5.9, 24.04, 2.57, 10.34, 0.61, 8.97, 0.57, 4.54, 2.9, -0.01, 4.61, 1.75, 2.37, 0.68, 2.0, 1.27, 0.48, 0.51, 9.23, 0.7, 0.22, 3.18, 0.53]} \ No newline at end of file diff --git a/annotations_1/4gftIIxf7B4_filtered.json b/annotations_1/4gftIIxf7B4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/4gftIIxf7B4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/4hY7f4nOQtU_filtered.json b/annotations_1/4hY7f4nOQtU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4fef1bfb0fc668ac9977c3a25d0c60e6f30da78 --- /dev/null +++ b/annotations_1/4hY7f4nOQtU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.43], [16.0, 16.02], [18.0, 18.62], [21.0, 21.2], [24.0, 24.44], [30.0, 30.5], [31.0, 31.9], [33.0, 33.57], [37.0, 37.59], [49.0, 56.3], [63.0, 63.19], [63.0, 63.29], [63.0, 63.91], [64.0, 64.76], [68.0, 68.57], [73.0, 79.19], [80.0, 80.42], [81.0, 86.76], [96.0, 96.67], [97.0, 97.48], [98.0, 98.71], [101.0, 103.99], [108.0, 112.35], [112.0, 112.94], [119.0, 119.64], [141.0, 141.86], [145.0, 144.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.01, 0.0, 0.0, 0.0, 0.0, 0.0, 35.68, 0.0, 41.74, 0.0, 0.0, 0.0, 35.86, 43.28, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 70.53], ["music", 10.33], ["grunt", 5.0]], null, null, null, null, null, null, null, null, [["speech", 68.23], ["music", 17.76], ["grunt", 6.82]], null, null, null, null, null, [["speech", 43.91], ["groan", 20.13], ["grunt", 18.9]], null, [["grunt", 35.09], ["music", 30.43], ["speech", 23.81]], null, null, null, [["speech", 49.23], ["music", 21.11], ["grunt", 5.85]], [["speech", 31.48], ["music", 25.59], ["grunt", 21.22]], null, null, null, null], "duration": [3.43, 0.02, 0.62, 0.2, 0.44, 0.5, 0.9, 0.57, 0.59, 7.3, 0.19, 0.29, 0.91, 0.76, 0.57, 6.19, 0.42, 5.76, 0.67, 0.48, 0.71, 2.99, 4.35, 0.94, 0.64, 0.86, -0.04]} \ No newline at end of file diff --git a/annotations_1/4k1Vx0equfE_filtered.json b/annotations_1/4k1Vx0equfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58f95d2ed23f2d89fd2bea0fc4ab611d55d6c0a0 --- /dev/null +++ b/annotations_1/4k1Vx0equfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 23.35], [24.0, 29.81], [36.0, 40.61], [42.0, 41.82], [43.0, 43.33], [43.0, 46.67], [50.0, 51.34], [69.0, 69.08], [70.0, 74.43], [84.0, 86.1], [90.0, 90.46], [98.0, 98.68], [103.0, 107.72], [108.0, 109.7], [111.0, 111.54], [112.0, 113.34], [115.0, 118.99], [130.0, 130.3], [153.0, 153.44], [154.0, 153.6], [155.0, 155.76], [160.0, 160.29], [169.0, 170.97], [171.0, 171.0], [172.0, 173.57], [176.0, 177.16]], "keep_status": [true, true, true, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [47.46, 45.33, 47.27, 0.0, 0.0, 45.14, 0.0, 0.0, 61.67, 69.61, 0.0, 0.0, 49.45, 0.0, 0.0, 0.0, 40.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.11], ["speech", 12.2], ["didgeridoo", 5.12]], [["music", 27.37], ["speech", 24.75], ["mains hum", 10.2]], [["music", 28.35], ["speech", 26.14], ["sidetone", 9.58]], null, null, [["speech", 27.63], ["music", 26.82], ["moo", 7.84]], null, null, null, null, null, null, [["music", 27.94], ["didgeridoo", 23.58], ["musical instrument", 6.55]], null, null, null, [["noise", 21.15], ["speech", 20.65], ["music", 11.52]], null, null, null, null, null, null, null, null, null], "duration": [8.35, 5.81, 4.61, -0.18, 0.33, 3.67, 1.34, 0.08, 4.43, 2.1, 0.46, 0.68, 4.72, 1.7, 0.54, 1.34, 3.99, 0.3, 0.44, -0.4, 0.76, 0.29, 1.97, 0.0, 1.57, 1.16]} \ No newline at end of file diff --git a/annotations_1/4kAViGVuLmM_filtered.json b/annotations_1/4kAViGVuLmM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98e14a8e59b1f6d416fb2274d5ec72ed49c51ec7 --- /dev/null +++ b/annotations_1/4kAViGVuLmM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.87], [1.0, 1.65], [2.0, 3.0], [3.0, 3.72], [8.0, 8.8], [9.0, 10.67], [36.0, 36.96], [42.0, 42.65], [43.0, 43.87], [52.0, 60.15], [60.0, 60.44], [60.0, 63.54], [64.0, 70.39], [79.0, 79.34], [81.0, 85.13], [90.0, 92.77], [93.0, 93.36], [99.0, 101.71], [102.0, 105.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.3, 0.0, 42.39, 44.99, 0.0, 63.1, 57.17, 0.0, 37.64, 32.08], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 59.01], ["sidetone", 25.35], ["music", 7.69]], null, [["music", 29.57], ["brass instrument", 14.83], ["speech", 12.0]], [["music", 44.67], ["synthesizer", 13.3], ["keyboard (musical)", 7.87]], null, null, null, null, [["speech", 37.62], ["tubular bells", 13.93], ["bell", 3.58]], [["music", 65.12], ["speech", 14.58], ["foghorn", 5.29]]], "duration": [0.87, 0.65, 1.0, 0.72, 0.8, 1.67, 0.96, 0.65, 0.87, 8.15, 0.44, 3.54, 6.39, 0.34, 4.13, 2.77, 0.36, 2.71, 3.07]} \ No newline at end of file diff --git a/annotations_1/4kIbIjoVakQ_filtered.json b/annotations_1/4kIbIjoVakQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70905d2a8988b9e3abb8c25abcac384e08b85b01 --- /dev/null +++ b/annotations_1/4kIbIjoVakQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.66], [8.0, 11.26], [15.0, 16.85], [19.0, 20.93], [24.0, 24.9], [28.0, 28.97], [32.0, 33.07], [36.0, 37.05], [40.0, 41.27], [44.0, 45.23], [47.0, 46.89], [48.0, 48.05], [48.0, 49.03], [52.0, 53.38], [56.0, 56.19], [56.0, 56.27], [56.0, 59.46], [63.0, 63.51], [66.0, 67.76], [70.0, 70.38], [71.0, 71.88], [73.0, 73.45], [74.0, 75.86], [78.0, 78.53], [79.0, 79.89], [82.0, 83.86], [89.0, 90.04], [93.0, 93.82], [95.0, 98.12], [101.0, 102.12], [109.0, 114.49], [118.0, 119.04]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.53, 36.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.32, 0.0, 31.92, 0.0], "audiomae_on_audioset": [null, [["music", 47.84], ["hum", 10.4], ["throbbing", 9.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.69], ["didgeridoo", 30.83], ["musical instrument", 4.08]], null, null, null, null, null, null, null, null, null, null, null, [["music", 68.87], ["musical instrument", 7.5], ["guitar", 2.99]], null, [["music", 59.5], ["didgeridoo", 15.98], ["musical instrument", 6.31]], null], "duration": [2.66, 3.26, 1.85, 1.93, 0.9, 0.97, 1.07, 1.05, 1.27, 1.23, -0.11, 0.05, 1.03, 1.38, 0.19, 0.27, 3.46, 0.51, 1.76, 0.38, 0.88, 0.45, 1.86, 0.53, 0.89, 1.86, 1.04, 0.82, 3.12, 1.12, 5.49, 1.04]} \ No newline at end of file diff --git a/annotations_1/4kRRDuR7OBM_filtered.json b/annotations_1/4kRRDuR7OBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..645ce03171f8195101eba07ff71282e958194a31 --- /dev/null +++ b/annotations_1/4kRRDuR7OBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.81], [4.0, 3.96], [8.0, 8.33], [14.0, 14.44], [17.0, 17.42], [18.0, 20.19], [21.0, 22.65], [27.0, 28.75], [31.0, 31.51], [35.0, 35.23], [37.0, 37.39], [39.0, 39.95], [40.0, 41.76], [43.0, 43.28], [52.0, 52.56], [55.0, 55.41], [56.0, 56.34], [58.0, 59.29], [62.0, 63.15], [64.0, 64.27], [69.0, 71.96], [73.0, 73.85], [77.0, 79.08], [80.0, 82.81], [87.0, 88.97], [95.0, 94.9], [98.0, 98.44], [102.0, 103.11], [108.0, 108.58], [109.0, 109.76], [111.0, 112.62], [115.0, 127.18], [128.0, 128.88], [131.0, 131.41], [132.0, 132.93], [136.0, 141.49], [143.0, 144.49], [147.0, 150.53], [157.0, 159.24], [162.0, 163.04], [165.0, 165.87], [169.0, 169.4], [170.0, 174.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.99, 0.0, 96.77, 100.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.81, -0.04, 0.33, 0.44, 0.42, 2.19, 1.65, 1.75, 0.51, 0.23, 0.39, 0.95, 1.76, 0.28, 0.56, 0.41, 0.34, 1.29, 1.15, 0.27, 2.96, 0.85, 2.08, 2.81, 1.97, -0.1, 0.44, 1.11, 0.58, 0.76, 1.62, 12.18, 0.88, 0.41, 0.93, 5.49, 1.49, 3.53, 2.24, 1.04, 0.87, 0.4, 4.95]} \ No newline at end of file diff --git a/annotations_1/4kmeixKc9yk_filtered.json b/annotations_1/4kmeixKc9yk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8251d2194b95137008d2f1d66ba902b8c871660 --- /dev/null +++ b/annotations_1/4kmeixKc9yk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 49.32], [50.0, 51.26], [54.0, 70.36], [79.0, 84.08], [87.0, 183.73]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.21, 28.83, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.84], ["musical instrument", 11.66], ["theremin", 8.89]], [["music", 54.79], ["theremin", 13.34], ["musical instrument", 4.04]], null], "duration": [44.32, 1.26, 16.36, 5.08, 96.73]} \ No newline at end of file diff --git a/annotations_1/4koPfEQVo44_filtered.json b/annotations_1/4koPfEQVo44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d6ef2dec0ada17edc69bd8014e336eb77f196c9 --- /dev/null +++ b/annotations_1/4koPfEQVo44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 33.51], [34.0, 109.68], [113.0, 118.72], [121.0, 154.57]], "keep_status": [false, false, false, false], "silence_prob": [31.68, 0.0, 35.71, 0.0], "audiomae_on_audioset": [[["music", 85.13], ["reggae", 2.59], ["drum machine", 1.78]], null, [["music", 68.59], ["didgeridoo", 16.27], ["musical instrument", 6.09]], null], "duration": [24.51, 75.68, 5.72, 33.57]} \ No newline at end of file diff --git a/annotations_1/4m15WAC5khw_filtered.json b/annotations_1/4m15WAC5khw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bc2bc1cbdda63bb1b02d4fd1651508083956a57 --- /dev/null +++ b/annotations_1/4m15WAC5khw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.61], [13.0, 13.93], [16.0, 16.39], [20.0, 23.72], [25.0, 25.91], [27.0, 34.43], [36.0, 36.54], [40.0, 40.51], [41.0, 41.55], [42.0, 42.89], [44.0, 45.44], [46.0, 50.35], [53.0, 55.65], [58.0, 62.45], [68.0, 68.71], [76.0, 118.47], [120.0, 120.23], [121.0, 121.95]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.01, 0.0, 0.0, 36.61, 0.0, 31.76, 0.0, 0.0, 0.0, 0.0, 0.0, 93.29, 60.42, 55.31, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["sidetone", 41.53], ["fly, housefly", 10.02], ["bee, wasp, etc.", 7.07]], null, [["speech", 23.58], ["hum", 21.91], ["mains hum", 9.72]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.61, 0.93, 0.39, 3.72, 0.91, 7.43, 0.54, 0.51, 0.55, 0.89, 1.44, 4.35, 2.65, 4.45, 0.71, 42.47, 0.23, 0.95]} \ No newline at end of file diff --git a/annotations_1/4mMrCXPCZAA_filtered.json b/annotations_1/4mMrCXPCZAA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fea98c523a1bfe9882dde11a9dda003b031d8bf1 --- /dev/null +++ b/annotations_1/4mMrCXPCZAA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.16], [10.0, 10.0], [10.0, 10.64], [14.0, 15.97], [17.0, 18.59], [19.0, 20.48], [21.0, 23.77], [25.0, 26.0], [30.0, 36.85], [38.0, 38.79], [39.0, 39.85], [41.0, 42.09], [44.0, 44.31], [47.0, 48.09], [49.0, 49.59], [51.0, 51.14], [58.0, 59.19], [60.0, 60.51], [63.0, 63.53], [65.0, 65.65], [68.0, 68.82], [71.0, 71.69], [78.0, 78.53], [81.0, 81.57], [83.0, 84.42], [86.0, 86.02], [87.0, 88.5], [90.0, 91.94], [92.0, 93.21], [94.0, 95.18], [98.0, 98.95], [102.0, 103.0], [103.0, 103.94], [106.0, 118.12], [119.0, 120.65]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.09, 0.0, 57.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 46.27], ["music", 8.28], ["foghorn", 5.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 0.0, 0.64, 1.97, 1.59, 1.48, 2.77, 1.0, 6.85, 0.79, 0.85, 1.09, 0.31, 1.09, 0.59, 0.14, 1.19, 0.51, 0.53, 0.65, 0.82, 0.69, 0.53, 0.57, 1.42, 0.02, 1.5, 1.94, 1.21, 1.18, 0.95, 1.0, 0.94, 12.12, 1.65]} \ No newline at end of file diff --git a/annotations_1/4ozs0VI04xI_filtered.json b/annotations_1/4ozs0VI04xI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a897e330d67eb54c8117cebc64c893a3b164f27 --- /dev/null +++ b/annotations_1/4ozs0VI04xI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.51], [11.0, 45.86], [46.0, 69.03], [71.0, 77.85], [78.0, 77.92]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 33.33, 35.65, 0.0], "audiomae_on_audioset": [null, null, [["speech", 14.76], ["animal", 11.38], ["music", 9.42]], [["wail, moan", 70.56], ["speech", 6.0], ["whimper", 3.93]], null], "duration": [1.51, 34.86, 23.03, 6.85, -0.08]} \ No newline at end of file diff --git a/annotations_1/4pSAjI9lOGY_filtered.json b/annotations_1/4pSAjI9lOGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..540819a2b8579f46317f465bb18763b8bc0e0c01 --- /dev/null +++ b/annotations_1/4pSAjI9lOGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.16], [12.0, 13.07], [16.0, 17.71], [22.0, 22.94], [27.0, 28.98], [40.0, 40.02], [49.0, 51.33], [69.0, 69.62]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["wild animals", 41.39], ["roaring cats (lions, tigers)", 24.07], ["animal", 13.15]], null], "duration": [1.16, 1.07, 1.71, 0.94, 1.98, 0.02, 2.33, 0.62]} \ No newline at end of file diff --git a/annotations_1/4qseBKnxIpQ_filtered.json b/annotations_1/4qseBKnxIpQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ac8925a61d2ae346723fedf4a2f87bf4b1de3f2 --- /dev/null +++ b/annotations_1/4qseBKnxIpQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.19], [4.0, 4.72], [7.0, 6.66], [11.0, 11.58], [14.0, 15.6], [16.0, 17.04], [18.0, 18.89], [21.0, 21.3], [22.0, 23.38], [24.0, 24.51], [26.0, 27.28], [28.0, 28.51], [35.0, 35.73], [39.0, 39.63], [43.0, 43.82], [47.0, 47.93], [50.0, 51.51], [54.0, 54.43], [55.0, 56.54], [58.0, 59.49], [61.0, 63.46], [65.0, 66.97], [68.0, 87.45], [90.0, 97.95], [123.0, 124.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.37, 0.0, 99.76, 71.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.19, 0.72, -0.34, 0.58, 1.6, 1.04, 0.89, 0.3, 1.38, 0.51, 1.28, 0.51, 0.73, 0.63, 0.82, 0.93, 1.51, 0.43, 1.54, 1.49, 2.46, 1.97, 19.45, 7.95, 1.73]} \ No newline at end of file diff --git a/annotations_1/4ri_ybNiTPU_filtered.json b/annotations_1/4ri_ybNiTPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..002e52df92178dedfca8458757b86bd9d64c6142 --- /dev/null +++ b/annotations_1/4ri_ybNiTPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.64], [27.0, 27.57], [47.0, 49.77], [51.0, 51.97], [74.0, 74.31]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.44, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 67.86], ["telephone", 5.23], ["sine wave", 2.98]], null, null], "duration": [0.64, 0.57, 2.77, 0.97, 0.31]} \ No newline at end of file diff --git a/annotations_1/4sNyWmYN-rM_filtered.json b/annotations_1/4sNyWmYN-rM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b63fc8a55a2fa9cb69ddefe4f5b046140750e038 --- /dev/null +++ b/annotations_1/4sNyWmYN-rM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.03], [22.0, 25.61], [26.0, 28.58], [30.0, 32.07], [33.0, 34.26], [35.0, 36.78], [38.0, 39.9], [42.0, 43.82], [47.0, 46.75], [48.0, 49.59], [51.0, 52.07], [55.0, 55.63], [57.0, 57.6], [59.0, 59.83], [63.0, 64.29], [67.0, 66.83], [69.0, 69.38], [75.0, 75.22], [77.0, 77.85], [79.0, 84.42], [86.0, 88.67], [89.0, 89.19], [89.0, 89.24], [89.0, 92.91], [98.0, 100.62], [104.0, 105.14], [111.0, 111.59], [112.0, 113.78], [114.0, 115.82], [117.0, 116.94], [118.0, 118.89], [121.0, 121.51], [122.0, 122.98], [124.0, 124.33], [125.0, 125.68], [126.0, 126.89], [129.0, 129.39], [130.0, 130.96], [132.0, 132.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.89, 91.13, 66.76, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.47, 35.23, 0.0, 0.0, 33.21, 45.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.03], ["cattle, bovinae", 11.08], ["moo", 9.5]], [["music", 43.09], ["throbbing", 19.3], ["hum", 6.29]], null, null, [["speech", 26.11], ["music", 25.04], ["hum", 16.74]], [["music", 34.69], ["hum", 27.55], ["throbbing", 16.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.03, 3.61, 2.58, 2.07, 1.26, 1.78, 1.9, 1.82, -0.25, 1.59, 1.07, 0.63, 0.6, 0.83, 1.29, -0.17, 0.38, 0.22, 0.85, 5.42, 2.67, 0.19, 0.24, 3.91, 2.62, 1.14, 0.59, 1.78, 1.82, -0.06, 0.89, 0.51, 0.98, 0.33, 0.68, 0.89, 0.39, 0.96, 0.44]} \ No newline at end of file diff --git a/annotations_1/4sOjksh8vX8_filtered.json b/annotations_1/4sOjksh8vX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9759a4134f6e22e673c67f7806b35cb423e8a056 --- /dev/null +++ b/annotations_1/4sOjksh8vX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 48.73], [49.0, 52.59], [56.0, 56.59], [58.0, 59.91], [68.0, 68.2], [69.0, 70.19], [71.0, 91.12], [93.0, 100.41], [104.0, 113.61], [119.0, 122.69], [124.0, 132.6], [134.0, 134.45], [139.0, 142.6], [145.0, 146.79], [149.0, 150.92], [152.0, 154.5], [156.0, 156.95], [159.0, 161.92], [169.0, 171.59]], "keep_status": [true, true, false, false, false, false, false, true, false, true, true, false, false, false, false, true, false, true, true], "silence_prob": [45.65, 30.97, 0.0, 0.0, 0.0, 0.0, 30.62, 48.65, 30.76, 30.24, 30.86, 0.0, 29.61, 0.0, 0.0, 37.62, 0.0, 33.29, 30.74], "audiomae_on_audioset": [[["music", 20.36], ["hum", 11.81], ["sine wave", 6.4]], [["hum", 40.76], ["mains hum", 14.58], ["speech", 12.24]], null, null, null, null, [["throbbing", 29.33], ["speech", 21.86], ["hum", 21.71]], [["music", 23.53], ["mains hum", 22.43], ["hum", 18.2]], [["music", 65.08], ["whale vocalization", 5.76], ["musical instrument", 2.52]], [["music", 21.3], ["hum", 20.88], ["mains hum", 11.64]], [["mains hum", 18.42], ["speech", 18.39], ["music", 17.25]], null, [["hum", 24.62], ["music", 23.86], ["mains hum", 21.92]], null, null, [["music", 51.52], ["throbbing", 3.15], ["tabla", 2.82]], null, [["noise", 19.93], ["hum", 18.45], ["mains hum", 16.41]], [["music", 24.75], ["hum", 12.97], ["mains hum", 9.28]]], "duration": [2.73, 3.59, 0.59, 1.91, 0.2, 1.19, 20.12, 7.41, 9.61, 3.69, 8.6, 0.45, 3.6, 1.79, 1.92, 2.5, 0.95, 2.92, 2.59]} \ No newline at end of file diff --git a/annotations_1/4t7oXxFAlHM_filtered.json b/annotations_1/4t7oXxFAlHM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40c572d77534b989d4737d0e984e66148c18fe46 --- /dev/null +++ b/annotations_1/4t7oXxFAlHM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.21], [9.0, 20.51], [27.0, 103.18]], "keep_status": [false, false, false], "silence_prob": [45.56, 44.23, 0.0], "audiomae_on_audioset": [[["music", 46.07], ["boing", 38.35], ["musical instrument", 3.99]], [["music", 59.76], ["throbbing", 10.97], ["electronic music", 5.92]], null], "duration": [2.21, 11.51, 76.18]} \ No newline at end of file diff --git a/annotations_1/4tMdFDBXDpk_filtered.json b/annotations_1/4tMdFDBXDpk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3de5207327c2a0a2ebeb7a1f82829fdc254436b2 --- /dev/null +++ b/annotations_1/4tMdFDBXDpk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.49], [13.0, 15.15], [17.0, 18.71], [20.0, 22.49], [30.0, 34.26], [40.0, 41.52], [42.0, 43.82], [52.0, 71.54], [79.0, 79.1], [90.0, 91.61], [95.0, 95.61], [101.0, 101.76], [105.0, 131.19], [134.0, 135.65], [145.0, 145.54], [148.0, 148.58], [155.0, 156.12], [162.0, 171.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [29.06, 30.17, 0.0, 44.57, 31.34, 0.0, 0.0, 30.48, 0.0, 0.0, 0.0, 0.0, 35.67, 0.0, 0.0, 0.0, 0.0, 48.23], "audiomae_on_audioset": [[["music", 64.63], ["musical instrument", 7.17], ["trombone", 6.59]], [["music", 71.03], ["musical instrument", 9.05], ["theremin", 6.68]], null, [["music", 67.8], ["musical instrument", 6.03], ["synthesizer", 2.99]], [["music", 77.78], ["didgeridoo", 3.76], ["synthesizer", 2.43]], null, null, [["music", 78.97], ["didgeridoo", 7.01], ["musical instrument", 2.02]], null, null, null, null, [["music", 38.05], ["ambient music", 19.12], ["gong", 11.63]], null, null, null, null, [["music", 42.07], ["ambient music", 38.32], ["gong", 6.83]]], "duration": [4.49, 2.15, 1.71, 2.49, 4.26, 1.52, 1.82, 19.54, 0.1, 1.61, 0.61, 0.76, 26.19, 1.65, 0.54, 0.58, 1.12, 9.26]} \ No newline at end of file diff --git a/annotations_1/4us4K3KLRM0_filtered.json b/annotations_1/4us4K3KLRM0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fbc871cfbb28cd18d645c0361f9daaae4e9fae4 --- /dev/null +++ b/annotations_1/4us4K3KLRM0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.56], [14.0, 14.23], [16.0, 16.77], [20.0, 21.36], [22.0, 22.13], [22.0, 26.57], [29.0, 42.48], [43.0, 43.82], [44.0, 49.57], [54.0, 54.67], [55.0, 56.1], [60.0, 60.35], [61.0, 62.06], [63.0, 64.0], [65.0, 67.54], [68.0, 69.77], [71.0, 71.22], [72.0, 107.22], [113.0, 115.35], [117.0, 119.87], [121.0, 123.94], [125.0, 126.86]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.5, 47.66, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 38.33, 0.0, 0.0, 0.0, 32.54, 31.26, 29.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 57.29], ["insect", 5.74], ["fly, housefly", 4.5]], [["music", 69.4], ["hum", 4.46], ["theremin", 2.87]], null, null, null, null, null, null, null, [["hum", 27.42], ["crushing", 23.64], ["mains hum", 15.92]], null, null, null, [["music", 52.36], ["throbbing", 6.67], ["electronic music", 3.02]], [["music", 35.28], ["speech", 13.49], ["zipper (clothing)", 6.51]], [["moo", 39.84], ["cattle, bovinae", 38.82], ["livestock, farm animals, working animals", 11.62]], null], "duration": [0.56, 0.23, 0.77, 1.36, 0.13, 4.57, 13.48, 0.82, 5.57, 0.67, 1.1, 0.35, 1.06, 1.0, 2.54, 1.77, 0.22, 35.22, 2.35, 2.87, 2.94, 1.86]} \ No newline at end of file diff --git a/annotations_1/4vJ6xB6ctaA_filtered.json b/annotations_1/4vJ6xB6ctaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4225fb8447df00ca5ef59ccea9eeca7f41924568 --- /dev/null +++ b/annotations_1/4vJ6xB6ctaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.07], [8.0, 13.05], [13.0, 19.65], [21.0, 23.31], [23.0, 28.46], [32.0, 34.16], [35.0, 36.71], [39.0, 39.01], [40.0, 41.27], [45.0, 46.67], [49.0, 49.17], [51.0, 52.0], [63.0, 63.44], [67.0, 67.91], [70.0, 70.66], [75.0, 75.76], [76.0, 78.09], [79.0, 79.79], [83.0, 83.51], [85.0, 85.08], [87.0, 87.72], [92.0, 93.43], [95.0, 96.45], [97.0, 98.71], [100.0, 101.46], [104.0, 104.57], [106.0, 110.17], [112.0, 116.55]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.69, 46.36, 34.55, 73.36, 57.48, 33.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.87, 37.72], "audiomae_on_audioset": [[["music", 29.48], ["theremin", 26.29], ["hum", 8.75]], [["music", 46.76], ["theremin", 28.62], ["hum", 3.33]], [["music", 44.16], ["speech", 21.35], ["hum", 6.75]], null, null, [["music", 11.31], ["ding", 6.78], ["clang", 6.32]], null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 49.19], ["music", 39.58], ["musical instrument", 2.79]], null, null, null, null, null, null, null, null, null, [["music", 41.89], ["theremin", 26.68], ["musical instrument", 4.74]], [["music", 54.13], ["theremin", 19.33], ["musical instrument", 2.73]]], "duration": [6.07, 5.05, 6.65, 2.31, 5.46, 2.16, 1.71, 0.01, 1.27, 1.67, 0.17, 1.0, 0.44, 0.91, 0.66, 0.76, 2.09, 0.79, 0.51, 0.08, 0.72, 1.43, 1.45, 1.71, 1.46, 0.57, 4.17, 4.55]} \ No newline at end of file diff --git a/annotations_1/4vekUOykIvw_filtered.json b/annotations_1/4vekUOykIvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6609d970938cad08ff8d4200b48119803920c04 --- /dev/null +++ b/annotations_1/4vekUOykIvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.38], [18.0, 20.21], [32.0, 32.04], [41.0, 42.77], [43.0, 44.05], [45.0, 45.72], [49.0, 49.33], [50.0, 50.5], [57.0, 56.91], [57.0, 57.87], [66.0, 66.18], [67.0, 66.63], [68.0, 69.16], [107.0, 108.97], [114.0, 115.72], [123.0, 125.25], [134.0, 135.68], [140.0, 140.81], [148.0, 148.2], [159.0, 159.87], [161.0, 161.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.71, 32.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.46, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 80.05], ["fly, housefly", 2.49], ["didgeridoo", 2.24]], [["music", 62.95], ["speech", 10.15], ["boing", 6.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.52], ["music", 21.23], ["synthesizer", 15.16]], null, null, null, null, null], "duration": [3.38, 2.21, 0.04, 1.77, 1.05, 0.72, 0.33, 0.5, -0.09, 0.87, 0.18, -0.37, 1.16, 1.97, 1.72, 2.25, 1.68, 0.81, 0.2, 0.87, 0.0]} \ No newline at end of file diff --git a/annotations_1/4wv_1umbZ-w_filtered.json b/annotations_1/4wv_1umbZ-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7162cc3e372641c2d59bb470b974648e374580d --- /dev/null +++ b/annotations_1/4wv_1umbZ-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.37], [13.0, 13.19], [15.0, 18.28], [20.0, 22.79], [24.0, 30.03], [33.0, 47.48], [49.0, 57.27], [65.0, 65.13], [66.0, 81.03], [87.0, 88.15], [89.0, 99.12], [100.0, 101.02], [102.0, 106.39], [108.0, 108.4], [109.0, 130.42], [131.0, 132.44], [134.0, 135.51], [136.0, 137.52], [139.0, 140.76], [142.0, 143.26], [144.0, 145.0], [146.0, 146.62], [147.0, 148.32], [150.0, 150.45], [152.0, 155.68], [159.0, 159.98], [161.0, 162.4], [163.0, 165.55], [166.0, 169.96], [176.0, 175.93], [177.0, 177.4]], "keep_status": [false, false, true, false, true, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.3, 39.34, 40.33, 37.51, 34.97, 0.0, 44.6, 0.0, 59.86, 0.0, 51.5, 0.0, 59.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.53, 0.0, 0.0, 62.89, 66.03, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 18.5], ["breaking", 13.6], ["rumble", 10.42]], [["music", 40.64], ["gong", 26.65], ["electronic music", 7.57]], [["gong", 27.6], ["music", 21.36], ["singing bowl", 5.73]], [["music", 45.93], ["hum", 12.65], ["musical instrument", 5.46]], [["door", 23.33], ["speech", 15.66], ["arrow", 13.31]], null, [["music", 37.03], ["hum", 14.67], ["throbbing", 8.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.37, 0.19, 3.28, 2.79, 6.03, 14.48, 8.27, 0.13, 15.03, 1.15, 10.12, 1.02, 4.39, 0.4, 21.42, 1.44, 1.51, 1.52, 1.76, 1.26, 1.0, 0.62, 1.32, 0.45, 3.68, 0.98, 1.4, 2.55, 3.96, -0.07, 0.4]} \ No newline at end of file diff --git a/annotations_1/4xg-5TeGvQY_filtered.json b/annotations_1/4xg-5TeGvQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e1e641f990025d666a6207b2b6514f55b9a10b3 --- /dev/null +++ b/annotations_1/4xg-5TeGvQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.91], [7.0, 9.22], [10.0, 10.37], [15.0, 15.21], [22.0, 23.06], [25.0, 25.52], [26.0, 44.96], [46.0, 46.41], [55.0, 68.1], [69.0, 70.8], [73.0, 74.07], [77.0, 81.92], [90.0, 89.9], [93.0, 93.6], [96.0, 96.4], [99.0, 103.27], [104.0, 117.09], [119.0, 126.69]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, true], "silence_prob": [0.0, 31.12, 0.0, 0.0, 0.0, 0.0, 30.53, 0.0, 30.02, 0.0, 0.0, 30.9, 0.0, 0.0, 0.0, 30.49, 31.15, 30.51], "audiomae_on_audioset": [null, [["music", 31.86], ["hum", 11.8], ["throbbing", 9.92]], null, null, null, null, [["music", 49.7], ["hum", 24.43], ["throbbing", 12.3]], null, [["speech", 47.57], ["music", 19.28], ["buzz", 2.92]], null, null, [["hum", 24.25], ["mains hum", 22.73], ["speech", 18.75]], null, null, null, [["music", 23.93], ["speech", 8.18], ["whack, thwack", 7.54]], [["sidetone", 39.39], ["speech", 31.21], ["music", 6.92]], [["music", 22.24], ["throbbing", 19.38], ["hum", 14.62]]], "duration": [0.91, 2.22, 0.37, 0.21, 1.06, 0.52, 18.96, 0.41, 13.1, 1.8, 1.07, 4.92, -0.1, 0.6, 0.4, 4.27, 13.09, 7.69]} \ No newline at end of file diff --git a/annotations_1/4zBMw2XqgWY_filtered.json b/annotations_1/4zBMw2XqgWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7e8d7b9a8b2707e31e9bb4a9c02978abe631ad3 --- /dev/null +++ b/annotations_1/4zBMw2XqgWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 21.03], [22.0, 26.11], [28.0, 30.64], [31.0, 33.51], [35.0, 38.13], [39.0, 41.94], [43.0, 44.49], [45.0, 54.65], [57.0, 62.21], [63.0, 66.26], [67.0, 68.57], [69.0, 72.32]], "keep_status": [true, false, true, true, true, true, false, true, true, true, false, true], "silence_prob": [37.63, 37.55, 44.32, 42.51, 35.71, 41.64, 0.0, 35.96, 47.16, 32.83, 0.0, 33.59], "audiomae_on_audioset": [[["music", 41.88], ["hum", 9.64], ["singing bowl", 4.44]], [["mains hum", 35.87], ["hum", 28.31], ["music", 8.71]], [["fly, housefly", 21.01], ["mains hum", 12.91], ["insect", 12.56]], [["mains hum", 21.06], ["hum", 19.42], ["sizzle", 14.55]], [["music", 45.04], ["hum", 11.26], ["mains hum", 7.76]], [["music", 22.32], ["hum", 9.01], ["mains hum", 6.01]], null, [["music", 22.33], ["hum", 21.94], ["speech", 14.87]], [["music", 13.7], ["insect", 12.35], ["hum", 6.52]], [["speech", 17.62], ["mains hum", 15.4], ["hum", 14.99]], null, [["speech", 18.34], ["music", 13.58], ["fly, housefly", 10.27]]], "duration": [11.03, 4.11, 2.64, 2.51, 3.13, 2.94, 1.49, 9.65, 5.21, 3.26, 1.57, 3.32]} \ No newline at end of file diff --git a/annotations_1/51IaQuowCcA_filtered.json b/annotations_1/51IaQuowCcA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf2587ca979d515e8104fb2d0bb01657362a7a50 --- /dev/null +++ b/annotations_1/51IaQuowCcA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.39], [11.0, 12.83], [15.0, 14.61], [16.0, 17.79], [25.0, 25.25], [28.0, 39.73], [41.0, 42.28], [52.0, 51.7], [68.0, 71.04], [80.0, 92.11], [92.0, 94.39], [95.0, 95.54], [97.0, 103.28], [107.0, 111.33], [113.0, 119.1], [121.0, 154.13], [159.0, 163.93], [164.0, 201.26], [207.0, 209.43], [216.0, 216.28]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.34, 0.0, 0.0, 98.36, 45.08, 56.63, 0.0, 94.95, 48.35, 32.13, 0.0, 33.68, 0.0, 93.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["sine wave", 12.52], ["insect", 8.2], ["groan", 7.37]], null, null, null, [["mosquito", 42.89], ["fly, housefly", 35.59], ["insect", 20.85]], null, null, null, [["animal", 9.11], ["cattle, bovinae", 8.91], ["moo", 8.06]], [["music", 75.63], ["musical instrument", 4.22], ["speech", 3.78]], null, [["music", 54.44], ["speech", 17.12], ["thunk", 8.1]], null, null, null], "duration": [1.39, 1.83, -0.39, 1.79, 0.25, 11.73, 1.28, -0.3, 3.04, 12.11, 2.39, 0.54, 6.28, 4.33, 6.1, 33.13, 4.93, 37.26, 2.43, 0.28]} \ No newline at end of file diff --git a/annotations_1/51reM6wq2XU_filtered.json b/annotations_1/51reM6wq2XU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cf9c65e8ea290c8fd4de706d0ea5329e05fb157 --- /dev/null +++ b/annotations_1/51reM6wq2XU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.09], [9.0, 14.59], [15.0, 17.47], [18.0, 19.67], [21.0, 23.28], [24.0, 27.24], [29.0, 30.91], [32.0, 34.25], [37.0, 38.97], [39.0, 43.55], [45.0, 48.56], [49.0, 51.65], [53.0, 66.65], [69.0, 71.24], [73.0, 75.02], [77.0, 83.73], [84.0, 85.23], [86.0, 87.74], [89.0, 89.36], [93.0, 95.66], [97.0, 98.46], [99.0, 103.96], [105.0, 106.15], [107.0, 110.0], [111.0, 113.04], [114.0, 121.86], [123.0, 126.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.95, 98.51, 0.0, 94.37, 99.93, 0.0, 99.59, 0.0, 81.0, 99.99, 99.99, 93.6, 94.95, 99.16, 91.13, 0.0, 0.0, 0.0, 78.72, 0.0, 82.07, 0.0, 76.7, 81.17, 86.27, 91.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.09, 5.59, 2.47, 1.67, 2.28, 3.24, 1.91, 2.25, 1.97, 4.55, 3.56, 2.65, 13.65, 2.24, 2.02, 6.73, 1.23, 1.74, 0.36, 2.66, 1.46, 4.96, 1.15, 3.0, 2.04, 7.86, 3.72]} \ No newline at end of file diff --git a/annotations_1/530g3-fuGGU_filtered.json b/annotations_1/530g3-fuGGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ee6ed8b053806e343ab0d2b431b70ae3af09a98 --- /dev/null +++ b/annotations_1/530g3-fuGGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [13.0, 14.03], [20.0, 21.27], [22.0, 22.81], [25.0, 28.85], [30.0, 30.43], [39.0, 40.1], [41.0, 41.86], [43.0, 44.47], [47.0, 47.48], [49.0, 49.69], [56.0, 57.25], [62.0, 64.72], [66.0, 68.18], [77.0, 77.72], [78.0, 78.49], [79.0, 80.28], [82.0, 82.07], [84.0, 101.83], [103.0, 116.87], [119.0, 119.65], [122.0, 123.31], [128.0, 128.38], [134.0, 134.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 60.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 56.33, 0.0, 0.0, 0.0, 0.0, 32.61, 34.53, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 18.62], ["mains hum", 13.79], ["speech", 9.16]], [["music", 15.48], ["electric shaver, electric razor", 9.89], ["speech", 9.39]], null, null, null, null], "duration": [0.47, 1.03, 1.27, 0.81, 3.85, 0.43, 1.1, 0.86, 1.47, 0.48, 0.69, 1.25, 2.72, 2.18, 0.72, 0.49, 1.28, 0.07, 17.83, 13.87, 0.65, 1.31, 0.38, 0.43]} \ No newline at end of file diff --git a/annotations_1/536GqWYOHdI_filtered.json b/annotations_1/536GqWYOHdI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0db2fc38064186ee2c95f548db274905c6e14539 --- /dev/null +++ b/annotations_1/536GqWYOHdI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 30.01], [32.0, 36.96], [41.0, 46.79], [51.0, 51.49], [53.0, 60.08], [61.0, 62.5], [63.0, 62.72], [64.0, 66.31], [69.0, 80.49], [82.0, 82.83], [85.0, 90.1], [93.0, 98.47], [101.0, 104.08], [106.0, 113.04], [115.0, 129.24], [134.0, 153.79], [157.0, 157.91], [159.0, 167.27], [169.0, 170.58]], "keep_status": [true, true, false, false, true, false, false, false, false, false, false, false, true, false, false, true, false, true, false], "silence_prob": [48.65, 48.91, 36.09, 0.0, 44.66, 0.0, 0.0, 75.72, 38.45, 0.0, 37.49, 36.06, 33.87, 31.69, 32.04, 32.13, 0.0, 32.56, 0.0], "audiomae_on_audioset": [[["music", 50.27], ["musical instrument", 5.19], ["didgeridoo", 4.91]], [["music", 27.8], ["effects unit", 10.9], ["synthesizer", 9.45]], [["music", 76.35], ["musical instrument", 6.79], ["guitar", 4.06]], null, [["music", 55.6], ["speech", 3.95], ["musical instrument", 3.43]], null, null, null, [["music", 61.64], ["theremin", 6.4], ["musical instrument", 5.76]], null, [["music", 65.0], ["didgeridoo", 7.73], ["musical instrument", 5.59]], [["music", 67.14], ["effects unit", 3.91], ["musical instrument", 3.58]], [["music", 26.25], ["speech", 12.21], ["didgeridoo", 9.37]], [["music", 76.46], ["musical instrument", 3.33], ["didgeridoo", 2.98]], [["music", 82.44], ["didgeridoo", 3.49], ["musical instrument", 2.9]], [["music", 59.46], ["musical instrument", 4.78], ["theremin", 4.77]], null, [["music", 51.45], ["synthesizer", 5.22], ["musical instrument", 4.7]], null], "duration": [4.01, 4.96, 5.79, 0.49, 7.08, 1.5, -0.28, 2.31, 11.49, 0.83, 5.1, 5.47, 3.08, 7.04, 14.24, 19.79, 0.91, 8.27, 1.58]} \ No newline at end of file diff --git a/annotations_1/54x4n4FlV4U_filtered.json b/annotations_1/54x4n4FlV4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdd600c007866a0a78c8f415b38e66550bd31119 --- /dev/null +++ b/annotations_1/54x4n4FlV4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 41.72], [43.0, 48.15], [57.0, 57.72], [59.0, 61.94], [63.0, 64.69], [68.0, 71.93], [77.0, 81.41], [83.0, 89.68], [91.0, 97.33], [100.0, 102.44], [103.0, 105.71], [107.0, 110.37], [112.0, 116.21], [118.0, 122.4], [124.0, 125.81], [129.0, 143.28]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, true, true, false, true], "silence_prob": [73.67, 89.54, 0.0, 55.89, 0.0, 89.54, 54.5, 79.76, 85.54, 35.92, 35.41, 34.62, 30.94, 32.21, 0.0, 30.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["whale vocalization", 35.67], ["music", 8.04], ["sonar", 4.25]], [["music", 19.91], ["speech", 14.0], ["hum", 11.62]], [["music", 21.96], ["effects unit", 16.37], ["musical instrument", 9.88]], [["music", 30.77], ["sonar", 12.35], ["synthesizer", 9.96]], [["music", 43.37], ["electronic music", 8.15], ["musical instrument", 6.34]], null, [["music", 29.89], ["synthesizer", 5.24], ["hum", 5.11]]], "duration": [2.72, 5.15, 0.72, 2.94, 1.69, 3.93, 4.41, 6.68, 6.33, 2.44, 2.71, 3.37, 4.21, 4.4, 1.81, 14.28]} \ No newline at end of file diff --git a/annotations_1/55uK9Lg3TaY_filtered.json b/annotations_1/55uK9Lg3TaY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2990b5a908462fa3e9d113f7f8cb52d6143e5351 --- /dev/null +++ b/annotations_1/55uK9Lg3TaY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.98], [11.0, 11.37], [13.0, 13.42], [15.0, 22.11], [23.0, 23.53], [32.0, 32.58], [39.0, 39.38], [41.0, 41.67], [42.0, 43.29], [46.0, 47.82], [49.0, 50.72], [51.0, 52.0], [53.0, 55.9], [57.0, 58.56], [59.0, 67.44], [75.0, 78.63], [80.0, 84.72], [87.0, 89.67], [91.0, 91.96], [97.0, 97.93], [102.0, 108.8], [110.0, 111.18], [125.0, 126.54], [130.0, 130.13]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 29.37, 29.85, 33.36, 29.76, 0.0, 0.0, 33.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 25.83], ["speech", 20.7], ["sidetone", 14.74]], null, null, null, null, null, null, null, null, null, null, [["music", 82.54], ["hum", 2.97], ["sidetone", 1.76]], [["music", 51.08], ["theremin", 5.45], ["thunk", 4.91]], [["sidetone", 43.25], ["music", 17.82], ["dial tone", 3.89]], [["music", 30.82], ["speech", 12.34], ["fly, housefly", 8.14]], null, null, [["music", 68.02], ["synthesizer", 6.95], ["musical instrument", 4.28]], null, null, null], "duration": [1.98, 0.37, 0.42, 7.11, 0.53, 0.58, 0.38, 0.67, 1.29, 1.82, 1.72, 1.0, 2.9, 1.56, 8.44, 3.63, 4.72, 2.67, 0.96, 0.93, 6.8, 1.18, 1.54, 0.13]} \ No newline at end of file diff --git a/annotations_1/56v74zFOV58_filtered.json b/annotations_1/56v74zFOV58_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..881a4d962393b4b0142b3bc26c36d5443a5df124 --- /dev/null +++ b/annotations_1/56v74zFOV58_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.57], [12.0, 16.77], [18.0, 21.56], [25.0, 26.11], [32.0, 33.78], [35.0, 35.65], [36.0, 39.43], [41.0, 45.59], [54.0, 55.9], [57.0, 58.26], [63.0, 63.49], [66.0, 67.9], [73.0, 75.47], [80.0, 80.74], [83.0, 84.35], [87.0, 87.83], [91.0, 90.86], [93.0, 94.78], [95.0, 97.93], [99.0, 103.18], [106.0, 108.06], [110.0, 112.09], [114.0, 115.6], [116.0, 128.9], [130.0, 133.3], [134.0, 137.73], [139.0, 143.77], [145.0, 147.85], [149.0, 156.91], [159.0, 160.59]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [33.54, 34.58, 32.61, 0.0, 0.0, 0.0, 43.0, 91.47, 0.0, 0.0, 0.0, 0.0, 41.62, 0.0, 0.0, 0.0, 0.0, 0.0, 43.64, 69.2, 38.68, 66.27, 0.0, 42.96, 63.96, 84.43, 46.15, 83.7, 38.5, 0.0], "audiomae_on_audioset": [[["speech", 33.26], ["sheep", 15.15], ["vehicle", 9.12]], [["speech", 46.98], ["hum", 14.35], ["mains hum", 3.82]], [["whale vocalization", 14.09], ["livestock, farm animals, working animals", 9.66], ["sheep", 5.8]], null, null, null, [["speech", 53.36], ["music", 11.14], ["hum", 9.83]], null, null, null, null, null, [["music", 22.97], ["sonar", 17.2], ["synthesizer", 10.21]], null, null, null, null, null, [["hum", 58.52], ["throbbing", 23.29], ["music", 4.85]], null, [["speech", 50.78], ["music", 21.0], ["synthesizer", 4.01]], null, null, [["speech", 42.17], ["music", 21.18], ["sidetone", 9.98]], null, null, [["music", 8.15], ["vehicle", 8.0], ["speech", 7.85]], null, [["music", 64.72], ["musical instrument", 3.63], ["speech", 2.03]], null], "duration": [7.57, 4.77, 3.56, 1.11, 1.78, 0.65, 3.43, 4.59, 1.9, 1.26, 0.49, 1.9, 2.47, 0.74, 1.35, 0.83, -0.14, 1.78, 2.93, 4.18, 2.06, 2.09, 1.6, 12.9, 3.3, 3.73, 4.77, 2.85, 7.91, 1.59]} \ No newline at end of file diff --git a/annotations_1/574oBJ7SR_8_filtered.json b/annotations_1/574oBJ7SR_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..868b892badc036376fb41adcd11f0aca2119aa60 --- /dev/null +++ b/annotations_1/574oBJ7SR_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.58], [32.0, 34.59], [36.0, 36.88], [37.0, 51.44], [52.0, 52.62], [55.0, 56.44], [60.0, 60.78], [62.0, 62.28], [66.0, 66.38], [79.0, 79.83], [83.0, 88.87], [95.0, 95.84], [97.0, 98.31], [99.0, 98.78], [99.0, 108.48], [111.0, 111.82], [112.0, 111.86], [112.0, 112.5], [113.0, 113.75], [115.0, 115.33], [116.0, 116.31], [118.0, 134.0], [134.0, 134.5], [135.0, 135.35], [136.0, 136.17], [138.0, 138.08], [139.0, 141.27], [146.0, 151.65], [155.0, 155.11], [155.0, 155.14], [155.0, 157.06], [157.0, 157.1], [157.0, 157.13], [166.0, 167.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 65.09, 0.0, 31.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.16, 0.0, 0.0, 0.0, 34.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.09, 0.0, 0.0, 0.0, 0.0, 31.74, 30.49, 0.0, 0.0, 29.9, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 68.61], ["noise", 13.31], ["radio", 2.89]], null, null, null, null, null, null, [["speech", 93.34], ["burping, eructation", 1.14], ["male speech, man speaking", 1.08]], null, null, null, [["speech", 54.24], ["noise", 15.5], ["music", 14.01]], null, null, null, null, null, null, [["speech", 86.55], ["noise", 3.73], ["music", 1.48]], null, null, null, null, [["speech", 57.98], ["noise", 5.67], ["hum", 4.08]], [["speech", 85.74], ["radio", 5.04], ["burping, eructation", 2.6]], null, null, [["speech", 36.06], ["music", 16.78], ["reverberation", 6.03]], null, null, null], "duration": [0.58, 2.59, 0.88, 14.44, 0.62, 1.44, 0.78, 0.28, 0.38, 0.83, 5.87, 0.84, 1.31, -0.22, 9.48, 0.82, -0.14, 0.5, 0.75, 0.33, 0.31, 16.0, 0.5, 0.35, 0.17, 0.08, 2.27, 5.65, 0.11, 0.14, 2.06, 0.1, 0.13, 1.31]} \ No newline at end of file diff --git a/annotations_1/57MtQQ5sm24_filtered.json b/annotations_1/57MtQQ5sm24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aafc0e2fec5cc13182fbd3cd28ccdaaa222f783 --- /dev/null +++ b/annotations_1/57MtQQ5sm24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[80.0, 84.38], [85.0, 117.75], [121.0, 121.32], [124.0, 151.16], [154.0, 191.73]], "keep_status": [false, false, false, false, false], "silence_prob": [39.3, 0.0, 0.0, 31.0, 0.0], "audiomae_on_audioset": [[["insect", 42.27], ["fly, housefly", 24.75], ["hum", 6.52]], null, null, [["buzz", 45.12], ["fly, housefly", 14.59], ["insect", 11.96]], null], "duration": [4.38, 32.75, 0.32, 27.16, 37.73]} \ No newline at end of file diff --git a/annotations_1/57eIYneEz7E_filtered.json b/annotations_1/57eIYneEz7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fe3e4f27e7763d384202a5310fbc51040dd4bdb --- /dev/null +++ b/annotations_1/57eIYneEz7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[91.0, 108.53], [110.0, 112.55], [114.0, 114.86], [116.0, 117.42], [118.0, 119.75], [121.0, 123.08], [125.0, 142.99]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [30.42, 46.43, 0.0, 0.0, 0.0, 41.6, 30.7], "audiomae_on_audioset": [[["music", 27.58], ["whack, thwack", 20.86], ["thump, thud", 19.72]], [["fly, housefly", 48.27], ["bee, wasp, etc.", 19.5], ["insect", 17.87]], null, null, null, [["fly, housefly", 44.55], ["bee, wasp, etc.", 28.25], ["insect", 17.69]], [["hum", 39.01], ["music", 16.44], ["throbbing", 15.22]]], "duration": [17.53, 2.55, 0.86, 1.42, 1.75, 2.08, 17.99]} \ No newline at end of file diff --git a/annotations_1/57u_LsqMoys_filtered.json b/annotations_1/57u_LsqMoys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9b461931f16b6c26fb05442994751df829d5266 --- /dev/null +++ b/annotations_1/57u_LsqMoys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.48], [10.0, 9.73], [11.0, 11.96], [18.0, 18.59], [25.0, 26.86], [28.0, 28.07], [30.0, 30.65], [36.0, 36.24], [36.0, 44.71], [48.0, 51.88], [65.0, 65.35], [67.0, 67.83], [82.0, 84.7], [87.0, 106.25], [108.0, 110.49], [113.0, 115.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.39, 35.1, 0.0, 0.0, 41.6, 31.84, 51.12, 49.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 67.78], ["explosion", 7.95], ["music", 6.58]], [["whale vocalization", 71.8], ["groan", 6.65], ["speech", 4.92]], null, null, [["speech", 24.64], ["rumble", 19.59], ["music", 15.71]], [["music", 55.06], ["hiccup", 10.43], ["hum", 7.12]], null, [["music", 46.69], ["speech", 23.41], ["hum", 4.93]]], "duration": [0.48, -0.27, 0.96, 0.59, 1.86, 0.07, 0.65, 0.24, 8.71, 3.88, 0.35, 0.83, 2.7, 19.25, 2.49, 2.26]} \ No newline at end of file diff --git a/annotations_1/585p7sJhiFk_filtered.json b/annotations_1/585p7sJhiFk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2d590cbd3dbc823b451ca936522964dc791aa4b --- /dev/null +++ b/annotations_1/585p7sJhiFk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 79.47], [81.0, 85.08], [85.0, 102.22], [103.0, 107.89], [111.0, 119.38], [120.0, 123.7], [124.0, 129.36]], "keep_status": [false, true, true, false, false, false, false], "silence_prob": [0.0, 31.17, 31.03, 37.1, 55.11, 76.86, 66.03], "audiomae_on_audioset": [null, [["music", 29.76], ["machine gun", 24.14], ["fusillade", 15.75]], [["speech", 40.74], ["music", 12.63], ["machine gun", 12.27]], [["music", 71.51], ["musical instrument", 3.67], ["theremin", 2.92]], null, null, null], "duration": [78.47, 4.08, 17.22, 4.89, 8.38, 3.7, 5.36]} \ No newline at end of file diff --git a/annotations_1/58BDrZH7SX8_filtered.json b/annotations_1/58BDrZH7SX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b164d4a447659889da8167ef1698e25d5c523b12 --- /dev/null +++ b/annotations_1/58BDrZH7SX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.91], [28.0, 28.49], [184.0, 190.27]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 33.52], "audiomae_on_audioset": [null, null, [["music", 58.86], ["bleat", 3.85], ["throbbing", 2.47]]], "duration": [1.91, 0.49, 6.27]} \ No newline at end of file diff --git a/annotations_1/58DPO_8Bd88_filtered.json b/annotations_1/58DPO_8Bd88_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..effe660dbe94aca225e579f23ab89a8fad630ed0 --- /dev/null +++ b/annotations_1/58DPO_8Bd88_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.45], [18.0, 21.51], [23.0, 23.14], [26.0, 26.57], [30.0, 30.11], [31.0, 32.05], [38.0, 37.86], [50.0, 53.2], [56.0, 56.78], [74.0, 74.11], [75.0, 76.03], [76.0, 77.08], [78.0, 78.22], [85.0, 84.94], [88.0, 89.33], [99.0, 100.13], [101.0, 102.12], [106.0, 106.61], [116.0, 116.95], [118.0, 119.55], [121.0, 121.29], [122.0, 122.71], [125.0, 125.91], [128.0, 129.03], [130.0, 132.36], [133.0, 134.11], [135.0, 135.72], [137.0, 141.13], [142.0, 144.05], [145.0, 149.13], [150.0, 149.77], [152.0, 168.44], [169.0, 170.09], [171.0, 173.3]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.79, 0.0, 0.0, 0.0, 0.0, 0.0, 44.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.86, 0.0, 0.0, 65.2, 62.37, 82.61, 0.0, 60.42, 0.0, 52.1], "audiomae_on_audioset": [null, [["speech", 31.66], ["hum", 19.59], ["sidetone", 14.31]], null, null, null, null, null, [["music", 25.67], ["speech", 24.17], ["hum", 11.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 3.51, 0.14, 0.57, 0.11, 1.05, -0.14, 3.2, 0.78, 0.11, 1.03, 1.08, 0.22, -0.06, 1.33, 1.13, 1.12, 0.61, 0.95, 1.55, 0.29, 0.71, 0.91, 1.03, 2.36, 1.11, 0.72, 4.13, 2.05, 4.13, -0.23, 16.44, 1.09, 2.3]} \ No newline at end of file diff --git a/annotations_1/59wvo9e2XQY_filtered.json b/annotations_1/59wvo9e2XQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78d26f2d23402a7209fc4d5abcb87738a174d45b --- /dev/null +++ b/annotations_1/59wvo9e2XQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.65], [19.0, 20.75], [22.0, 22.96], [24.0, 25.74], [40.0, 41.88], [44.0, 46.23], [56.0, 57.54], [58.0, 60.15], [61.0, 64.74], [67.0, 67.31], [68.0, 68.91], [72.0, 73.92], [76.0, 78.98], [80.0, 81.36], [82.0, 83.89], [85.0, 86.88], [90.0, 92.7], [101.0, 102.15], [105.0, 105.41], [119.0, 119.13], [123.0, 122.74], [130.0, 132.53], [134.0, 136.07], [138.0, 138.67], [143.0, 143.46], [145.0, 147.33], [151.0, 151.31], [159.0, 167.61], [200.0, 201.56], [208.0, 208.16], [209.0, 211.65], [213.0, 214.61], [217.0, 218.74], [220.0, 221.09], [222.0, 223.62], [225.0, 225.76], [227.0, 231.89], [232.0, 235.25], [236.0, 247.97]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 0.0, 47.5, 53.47, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 44.29, 0.0, 0.0, 0.0, 0.0, 55.6, 45.62, 0.0, 0.0, 76.53, 0.0, 49.68, 0.0, 0.0, 54.3, 0.0, 0.0, 0.0, 0.0, 0.0, 47.66, 47.74, 55.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 53.57], ["telephone", 10.54], ["busy signal", 4.37]], null, null, null, null, null, null, null, null, [["sidetone", 50.09], ["speech", 31.64], ["music", 3.53]], null, null, null, null, null, [["speech", 44.31], ["hum", 9.23], ["music", 8.39]], null, null, null, null, [["hum", 24.13], ["music", 19.98], ["speech", 19.09]], null, null, null, null, null, null, null, null, [["music", 37.06], ["electronic music", 9.41], ["hum", 8.25]], [["music", 60.19], ["speech", 13.51], ["hum", 3.96]], null], "duration": [0.65, 1.75, 0.96, 1.74, 1.88, 2.23, 1.54, 2.15, 3.74, 0.31, 0.91, 1.92, 2.98, 1.36, 1.89, 1.88, 2.7, 1.15, 0.41, 0.13, -0.26, 2.53, 2.07, 0.67, 0.46, 2.33, 0.31, 8.61, 1.56, 0.16, 2.65, 1.61, 1.74, 1.09, 1.62, 0.76, 4.89, 3.25, 11.97]} \ No newline at end of file diff --git a/annotations_1/5A98txE5nno_filtered.json b/annotations_1/5A98txE5nno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0510fde2953edc81ca836d2b66b312213907ccea --- /dev/null +++ b/annotations_1/5A98txE5nno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [4.0, 5.36], [8.0, 8.85], [10.0, 11.33], [12.0, 13.85], [18.0, 18.62], [30.0, 30.99], [33.0, 33.44], [35.0, 35.99], [38.0, 38.03], [41.0, 41.17], [42.0, 50.41], [54.0, 55.93], [56.0, 93.07], [97.0, 99.62], [101.0, 102.91], [107.0, 110.13], [112.0, 112.58], [113.0, 114.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 61.57, 0.0, 53.1, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 1.36, 0.85, 1.33, 1.85, 0.62, 0.99, 0.44, 0.99, 0.03, 0.17, 8.41, 1.93, 37.07, 2.62, 1.91, 3.13, 0.58, 1.05]} \ No newline at end of file diff --git a/annotations_1/5Ackdv3pgmU_filtered.json b/annotations_1/5Ackdv3pgmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7389eae00959fe2ec3218d546f6b483416c04d93 --- /dev/null +++ b/annotations_1/5Ackdv3pgmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.69], [16.0, 15.75], [16.0, 17.32], [17.0, 17.44], [19.0, 21.61], [23.0, 26.05], [27.0, 27.46], [29.0, 40.22], [41.0, 42.6], [44.0, 58.85], [60.0, 72.17], [72.0, 73.63], [74.0, 74.48], [75.0, 78.22], [80.0, 84.62], [86.0, 91.37], [93.0, 107.03], [109.0, 115.06]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [49.87, 0.0, 0.0, 0.0, 99.91, 99.99, 0.0, 83.52, 0.0, 93.29, 49.36, 0.0, 0.0, 95.78, 66.15, 36.88, 31.45, 33.18], "audiomae_on_audioset": [[["speech", 35.55], ["hum", 15.49], ["sidetone", 15.45]], null, null, null, null, null, null, null, null, null, [["speech", 26.62], ["hum", 25.86], ["mains hum", 10.58]], null, null, null, null, [["music", 27.6], ["hum", 11.34], ["fart", 9.27]], [["speech", 70.21], ["music", 12.48], ["whack, thwack", 2.85]], [["music", 68.61], ["didgeridoo", 7.2], ["throbbing", 6.92]]], "duration": [7.69, -0.25, 1.32, 0.44, 2.61, 3.05, 0.46, 11.22, 1.6, 14.85, 12.17, 1.63, 0.48, 3.22, 4.62, 5.37, 14.03, 6.06]} \ No newline at end of file diff --git a/annotations_1/5BLZxhN2lDE_filtered.json b/annotations_1/5BLZxhN2lDE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45d6fb555db0f07f08be5d309e11413509a8a0a7 --- /dev/null +++ b/annotations_1/5BLZxhN2lDE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.62], [2.0, 7.65], [8.0, 8.73], [9.0, 10.22], [15.0, 20.65], [21.0, 24.27], [28.0, 29.96], [31.0, 31.92], [34.0, 37.3], [38.0, 38.79], [42.0, 44.29], [48.0, 48.84], [50.0, 50.89], [52.0, 57.62], [59.0, 60.22], [62.0, 63.19], [66.0, 70.34], [72.0, 77.18], [78.0, 81.48], [82.0, 84.91], [86.0, 86.49], [88.0, 88.82], [90.0, 93.92], [96.0, 96.3], [97.0, 98.58], [103.0, 105.7], [108.0, 115.47], [117.0, 119.45], [123.0, 122.96], [128.0, 128.21], [138.0, 141.84], [144.0, 144.53], [148.0, 157.27], [158.0, 160.68], [163.0, 164.44], [166.0, 167.75], [169.0, 181.95], [184.0, 188.35], [189.0, 188.67], [189.0, 191.81], [192.0, 193.35], [195.0, 195.15], [196.0, 195.81], [196.0, 199.66], [200.0, 201.16], [202.0, 203.99], [204.0, 206.25], [208.0, 208.87], [209.0, 209.98], [213.0, 212.87], [214.0, 216.16], [217.0, 217.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 69.61, 0.0, 0.0, 57.32, 41.01, 0.0, 0.0, 63.96, 0.0, 53.84, 0.0, 0.0, 78.21, 0.0, 0.0, 99.52, 70.02, 84.43, 78.89, 0.0, 0.0, 46.61, 0.0, 0.0, 49.45, 40.29, 31.89, 0.0, 0.0, 33.13, 0.0, 30.17, 29.42, 0.0, 0.0, 29.58, 33.08, 0.0, 36.55, 0.0, 0.0, 0.0, 41.66, 0.0, 0.0, 44.04, 0.0, 0.0, 0.0, 94.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 41.63], ["throbbing", 18.77], ["speech", 16.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.49], ["speech", 7.57], ["hum", 6.04]], null, null, [["music", 41.92], ["musical instrument", 8.44], ["effects unit", 8.35]], [["music", 49.28], ["hum", 8.83], ["musical instrument", 4.77]], [["music", 71.07], ["lullaby", 2.75], ["guitar", 1.83]], null, null, [["music", 55.56], ["guitar", 3.18], ["plucked string instrument", 3.16]], null, [["music", 63.41], ["didgeridoo", 6.61], ["mantra", 4.6]], [["music", 67.52], ["carnatic music", 11.38], ["didgeridoo", 3.93]], null, null, [["music", 82.69], ["singing", 2.17], ["lullaby", 1.43]], [["didgeridoo", 31.07], ["music", 29.4], ["theremin", 3.75]], null, [["music", 20.3], ["speech", 17.9], ["didgeridoo", 16.74]], null, null, null, [["music", 45.89], ["speech", 13.56], ["musical instrument", 6.65]], null, null, [["speech", 47.32], ["music", 3.79], ["animal", 3.19]], null, null, null, null, null], "duration": [-0.38, 5.65, 0.73, 1.22, 5.65, 3.27, 1.96, 0.92, 3.3, 0.79, 2.29, 0.84, 0.89, 5.62, 1.22, 1.19, 4.34, 5.18, 3.48, 2.91, 0.49, 0.82, 3.92, 0.3, 1.58, 2.7, 7.47, 2.45, -0.04, 0.21, 3.84, 0.53, 9.27, 2.68, 1.44, 1.75, 12.95, 4.35, -0.33, 2.81, 1.35, 0.15, -0.19, 3.66, 1.16, 1.99, 2.25, 0.87, 0.98, -0.13, 2.16, 0.7]} \ No newline at end of file diff --git a/annotations_1/5CO6DsmrIDw_filtered.json b/annotations_1/5CO6DsmrIDw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f63878c40c6fea69c7eb9d26d33ea3e6b4a396a9 --- /dev/null +++ b/annotations_1/5CO6DsmrIDw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 113.26]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [105.26]} \ No newline at end of file diff --git a/annotations_1/5Cv1ENey4yU_filtered.json b/annotations_1/5Cv1ENey4yU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed67e72e098c05e9aee340b8e933b3f40ddb4199 --- /dev/null +++ b/annotations_1/5Cv1ENey4yU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [1.0, 1.78], [5.0, 8.97], [13.0, 13.17], [13.0, 30.33], [35.0, 38.11], [39.0, 40.59], [41.0, 42.18], [43.0, 45.2], [46.0, 48.02], [49.0, 53.91], [58.0, 61.26], [63.0, 73.08], [73.0, 80.62], [82.0, 85.29], [89.0, 97.65], [98.0, 109.9], [113.0, 140.95], [144.0, 151.04], [153.0, 160.64]], "keep_status": [false, false, false, false, true, true, false, false, true, false, true, true, true, true, true, false, true, false, false, true], "silence_prob": [0.0, 0.0, 40.09, 0.0, 31.22, 30.01, 0.0, 0.0, 33.15, 38.4, 30.89, 29.99, 30.74, 32.16, 32.3, 30.28, 30.11, 30.17, 32.33, 32.65], "audiomae_on_audioset": [null, null, [["speech", 53.45], ["music", 18.52], ["rumble", 1.92]], null, [["music", 24.5], ["hum", 14.42], ["throbbing", 8.23]], [["speech", 42.98], ["music", 14.54], ["mains hum", 7.65]], null, null, [["hum", 30.92], ["throbbing", 20.41], ["music", 17.55]], [["music", 50.47], ["throbbing", 10.86], ["hum", 9.22]], [["speech", 43.54], ["music", 17.92], ["throbbing", 7.25]], [["speech", 14.96], ["music", 8.61], ["hum", 7.89]], [["hum", 17.25], ["fly, housefly", 16.74], ["throbbing", 10.74]], [["speech", 37.23], ["music", 14.68], ["sheep", 11.57]], [["livestock, farm animals, working animals", 14.42], ["music", 11.61], ["sheep", 10.33]], [["speech", 48.0], ["music", 25.53], ["hum", 4.21]], [["whack, thwack", 25.46], ["music", 23.38], ["speech", 12.56]], [["music", 61.1], ["hum", 7.08], ["throbbing", 4.74]], [["throbbing", 56.69], ["hum", 20.22], ["music", 14.54]], [["speech", 38.78], ["fly, housefly", 9.77], ["sidetone", 9.05]]], "duration": [0.04, 0.78, 3.97, 0.17, 17.33, 3.11, 1.59, 1.18, 2.2, 2.02, 4.91, 3.26, 10.08, 7.62, 3.29, 8.65, 11.9, 27.95, 7.04, 7.64]} \ No newline at end of file diff --git a/annotations_1/5CxYctMSiw0_filtered.json b/annotations_1/5CxYctMSiw0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7083fe62de9fe2dc325fa8b51a2439f0bb808429 --- /dev/null +++ b/annotations_1/5CxYctMSiw0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.64], [16.0, 16.7], [33.0, 37.88], [39.0, 44.79], [61.0, 72.81], [85.0, 94.73], [95.0, 96.6], [100.0, 119.82], [120.0, 119.94], [120.0, 121.71], [122.0, 127.03], [131.0, 131.94], [134.0, 134.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 29.54, 29.88, 29.56, 32.78, 0.0, 30.0, 0.0, 0.0, 28.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 59.01], ["didgeridoo", 10.59], ["beatboxing", 5.61]], [["music", 65.06], ["didgeridoo", 12.01], ["throbbing", 4.9]], [["music", 75.48], ["didgeridoo", 5.13], ["electronic music", 2.66]], [["music", 50.0], ["throbbing", 22.35], ["hum", 6.14]], null, [["music", 78.98], ["hum", 3.54], ["throbbing", 2.9]], null, null, [["speech", 24.63], ["synthesizer", 9.14], ["whale vocalization", 8.36]], null, null], "duration": [0.64, 0.7, 4.88, 5.79, 11.81, 9.73, 1.6, 19.82, -0.06, 1.71, 5.03, 0.94, 0.55]} \ No newline at end of file diff --git a/annotations_1/5D20G8qe4Qc_filtered.json b/annotations_1/5D20G8qe4Qc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a5143b471fd05703fbf02f17896b17912d813a0 --- /dev/null +++ b/annotations_1/5D20G8qe4Qc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.46], [2.0, 2.0], [9.0, 9.91], [16.0, 16.36], [23.0, 25.15], [30.0, 31.14], [36.0, 36.95], [39.0, 40.96], [44.0, 46.97], [50.0, 51.14], [52.0, 53.69], [55.0, 56.89], [59.0, 60.91], [62.0, 64.69], [65.0, 68.34], [69.0, 71.69], [73.0, 73.89], [77.0, 78.0], [79.0, 80.82], [82.0, 83.71], [86.0, 87.49], [89.0, 112.83], [115.0, 153.77], [155.0, 162.28], [163.0, 166.4], [167.0, 171.36], [172.0, 173.84]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 43.28, 0.0, 0.0, 0.0, 47.05, 0.0, 0.0, 0.0, 0.0, 53.16, 50.71, 46.54, 0.0, 0.0, 0.0, 0.0, 0.0, 29.86, 0.0, 39.41, 46.54, 44.93, 0.0], "audiomae_on_audioset": [null, null, null, null, [["throbbing", 19.26], ["hum", 14.09], ["music", 8.7]], null, null, null, [["music", 32.71], ["synthesizer", 7.96], ["glass", 5.02]], null, null, null, null, null, null, [["music", 32.1], ["throbbing", 23.56], ["hum", 9.84]], null, null, null, null, null, [["music", 64.24], ["hum", 9.42], ["mains hum", 3.21]], null, [["hum", 41.96], ["throbbing", 18.02], ["mains hum", 13.61]], [["hum", 40.89], ["throbbing", 20.23], ["mains hum", 13.99]], [["hum", 28.56], ["music", 21.33], ["throbbing", 12.49]], null], "duration": [0.46, 0.0, 0.91, 0.36, 2.15, 1.14, 0.95, 1.96, 2.97, 1.14, 1.69, 1.89, 1.91, 2.69, 3.34, 2.69, 0.89, 1.0, 1.82, 1.71, 1.49, 23.83, 38.77, 7.28, 3.4, 4.36, 1.84]} \ No newline at end of file diff --git a/annotations_1/5DWrrqP_HNk_filtered.json b/annotations_1/5DWrrqP_HNk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b870acd45b5ce1bb9d41ebc8053ab2e1ea3d5183 --- /dev/null +++ b/annotations_1/5DWrrqP_HNk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.83], [14.0, 17.34], [18.0, 20.06], [22.0, 24.04], [25.0, 27.65], [29.0, 30.42], [31.0, 32.91], [34.0, 33.96], [35.0, 36.07], [37.0, 40.36], [42.0, 44.93], [47.0, 49.79], [52.0, 55.02], [57.0, 58.94], [60.0, 62.07], [64.0, 65.69], [69.0, 70.36], [71.0, 72.98], [74.0, 75.36], [76.0, 79.32], [81.0, 84.13], [85.0, 86.66], [89.0, 92.72], [94.0, 94.81], [96.0, 103.0], [104.0, 112.89], [114.0, 114.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 90.08, 60.98, 43.85, 99.92, 0.0, 0.0, 0.0, 0.0, 52.22, 92.8, 70.44, 98.86, 0.0, 40.52, 0.0, 0.0, 0.0, 0.0, 98.01, 90.78, 0.0, 85.9, 0.0, 54.7, 34.26, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 56.95], ["sine wave", 12.04], ["hum", 6.11]], null, null, null, null, null, null, null, null, null, null, [["speech", 20.23], ["mains hum", 17.03], ["hum", 13.1]], null, null, null, null, null, null, null, null, null, null, [["speech", 45.49], ["music", 10.16], ["explosion", 9.97]], null], "duration": [1.83, 3.34, 2.06, 2.04, 2.65, 1.42, 1.91, -0.04, 1.07, 3.36, 2.93, 2.79, 3.02, 1.94, 2.07, 1.69, 1.36, 1.98, 1.36, 3.32, 3.13, 1.66, 3.72, 0.81, 7.0, 8.89, 0.94]} \ No newline at end of file diff --git a/annotations_1/5EN4MulDX_A_filtered.json b/annotations_1/5EN4MulDX_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f8c41ae72f2a151ae1abe6037d391cbd14d303a --- /dev/null +++ b/annotations_1/5EN4MulDX_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.72], [10.0, 11.53], [13.0, 16.38], [19.0, 19.85], [22.0, 22.54], [23.0, 25.68], [30.0, 30.81], [32.0, 32.59], [33.0, 33.1], [33.0, 34.11], [34.0, 36.39], [42.0, 43.17], [47.0, 57.92], [59.0, 64.89], [79.0, 81.7], [83.0, 84.33], [85.0, 85.63], [87.0, 88.1], [89.0, 90.56], [92.0, 93.33], [97.0, 102.91], [103.0, 103.25], [106.0, 116.51], [117.0, 118.5], [125.0, 128.49], [135.0, 135.57], [139.0, 144.41]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [75.72, 0.0, 95.64, 0.0, 0.0, 38.72, 0.0, 0.0, 0.0, 0.0, 47.7, 0.0, 30.67, 30.16, 38.91, 0.0, 0.0, 0.0, 0.0, 0.0, 31.42, 0.0, 30.28, 0.0, 30.01, 0.0, 30.11], "audiomae_on_audioset": [null, null, null, null, null, [["music", 34.94], ["boing", 13.73], ["animal", 6.64]], null, null, null, null, [["music", 24.32], ["speech", 18.25], ["musical instrument", 11.51]], null, [["noise", 31.62], ["music", 24.1], ["hum", 15.7]], [["music", 74.54], ["musical instrument", 5.01], ["didgeridoo", 3.8]], [["music", 15.34], ["livestock, farm animals, working animals", 8.88], ["cattle, bovinae", 7.94]], null, null, null, null, null, [["music", 63.37], ["guitar", 3.69], ["musical instrument", 3.12]], null, [["music", 48.15], ["bass guitar", 9.99], ["musical instrument", 7.55]], null, [["music", 66.48], ["musical instrument", 4.04], ["guitar", 2.66]], null, [["music", 68.86], ["didgeridoo", 3.22], ["musical instrument", 2.46]]], "duration": [2.72, 1.53, 3.38, 0.85, 0.54, 2.68, 0.81, 0.59, 0.1, 1.11, 2.39, 1.17, 10.92, 5.89, 2.7, 1.33, 0.63, 1.1, 1.56, 1.33, 5.91, 0.25, 10.51, 1.5, 3.49, 0.57, 5.41]} \ No newline at end of file diff --git a/annotations_1/5Ehdu6XTlBc_filtered.json b/annotations_1/5Ehdu6XTlBc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49c2dafdb6f0a1fe36342c7a8be6169ee76f7c12 --- /dev/null +++ b/annotations_1/5Ehdu6XTlBc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.46], [3.0, 4.48], [5.0, 6.02], [12.0, 13.69], [15.0, 15.69], [19.0, 19.75], [21.0, 22.22], [23.0, 25.05], [29.0, 30.5], [31.0, 33.45], [36.0, 37.61], [44.0, 44.76], [46.0, 46.6], [50.0, 51.39], [52.0, 56.13], [57.0, 57.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.16, 0.0, 37.52, 0.0, 0.0, 0.0, 0.0, 41.3, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 84.2], ["quack", 4.99], ["speech", 1.59]], null, null, null, null, [["music", 88.47], ["speech", 3.98], ["music of latin america", 1.05]], null], "duration": [1.46, 1.48, 1.02, 1.69, 0.69, 0.75, 1.22, 2.05, 1.5, 2.45, 1.61, 0.76, 0.6, 1.39, 4.13, 0.2]} \ No newline at end of file diff --git a/annotations_1/5Fa3enGmEfA_filtered.json b/annotations_1/5Fa3enGmEfA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58f63cdde9daf915d0f30ad3d758b14db25e5b15 --- /dev/null +++ b/annotations_1/5Fa3enGmEfA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 23.13], [29.0, 59.86], [61.0, 85.19], [87.0, 133.32], [136.0, 136.09]], "keep_status": [false, false, false, false, false], "silence_prob": [28.24, 0.0, 28.53, 0.0, 0.0], "audiomae_on_audioset": [[["music", 59.38], ["hum", 11.76], ["throbbing", 9.61]], null, [["music", 68.06], ["noise", 4.79], ["reverberation", 2.33]], null, null], "duration": [19.13, 30.86, 24.19, 46.32, 0.09]} \ No newline at end of file diff --git a/annotations_1/5H7YGAM9Na0_filtered.json b/annotations_1/5H7YGAM9Na0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af7d1164009b6732ebb19dfb2a71d3cd86e00fe7 --- /dev/null +++ b/annotations_1/5H7YGAM9Na0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.91], [24.0, 27.46], [28.0, 30.15], [34.0, 36.66], [40.0, 40.29], [42.0, 42.94], [45.0, 61.21], [63.0, 63.48], [69.0, 70.61], [73.0, 73.4], [75.0, 77.35], [78.0, 79.27], [81.0, 81.38], [85.0, 86.27], [91.0, 91.35], [93.0, 94.46], [101.0, 102.19], [105.0, 105.27], [108.0, 108.97], [111.0, 111.79], [113.0, 114.71], [117.0, 118.86], [119.0, 122.05], [129.0, 130.47], [145.0, 146.43], [149.0, 151.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 99.85, 58.64, 57.48, 0.0, 0.0, 72.75, 0.0, 0.0, 0.0, 56.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.18, 0.0, 0.0, 40.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 23.39], ["speech", 15.85], ["hum", 8.11]]], "duration": [0.91, 3.46, 2.15, 2.66, 0.29, 0.94, 16.21, 0.48, 1.61, 0.4, 2.35, 1.27, 0.38, 1.27, 0.35, 1.46, 1.19, 0.27, 0.97, 0.79, 1.71, 1.86, 3.05, 1.47, 1.43, 2.31]} \ No newline at end of file diff --git a/annotations_1/5H_MyLSpRSs_filtered.json b/annotations_1/5H_MyLSpRSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecd310b92b87eb88e82dece73e5b1ed78eeb2c3c --- /dev/null +++ b/annotations_1/5H_MyLSpRSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.95], [8.0, 21.3], [22.0, 27.31], [28.0, 39.09], [42.0, 75.64], [78.0, 110.0], [112.0, 113.98]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [0.0, 33.56, 29.54, 30.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["arrow", 15.7], ["tubular bells", 15.44], ["tuning fork", 13.07]], [["livestock, farm animals, working animals", 50.21], ["cattle, bovinae", 20.01], ["moo", 9.45]], [["music", 54.06], ["whale vocalization", 13.31], ["noise", 6.33]], null, null, null], "duration": [0.95, 13.3, 5.31, 11.09, 33.64, 32.0, 1.98]} \ No newline at end of file diff --git a/annotations_1/5Ii0_2kAYlU_filtered.json b/annotations_1/5Ii0_2kAYlU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea4f28ab102f80668c99776581aaf8a2460d5750 --- /dev/null +++ b/annotations_1/5Ii0_2kAYlU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [6.0, 7.03], [13.0, 12.87], [22.0, 27.89], [47.0, 47.76], [52.0, 52.42], [53.0, 57.74], [59.0, 63.63], [71.0, 74.17], [78.0, 83.78], [88.0, 88.52], [90.0, 90.61], [91.0, 91.35], [93.0, 93.6], [98.0, 98.49], [102.0, 106.49], [110.0, 112.99], [114.0, 115.6], [117.0, 125.83], [127.0, 131.92], [142.0, 142.72]], "keep_status": [false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.63, 0.0, 0.0, 30.0, 32.41, 95.09, 62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 62.58, 0.0, 91.47, 97.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 50.51], ["whack, thwack", 8.37], ["explosion", 7.0]], null, null, [["speech", 39.52], ["groan", 11.73], ["screaming", 10.34]], [["wail, moan", 29.35], ["fart", 13.0], ["speech", 11.97]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.03, -0.13, 5.89, 0.76, 0.42, 4.74, 4.63, 3.17, 5.78, 0.52, 0.61, 0.35, 0.6, 0.49, 4.49, 2.99, 1.6, 8.83, 4.92, 0.72]} \ No newline at end of file diff --git a/annotations_1/5Io8n3JYNUY_filtered.json b/annotations_1/5Io8n3JYNUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e52a800f4cd38f6eb5ada03bda26a4ee4389d32 --- /dev/null +++ b/annotations_1/5Io8n3JYNUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [6.0, 6.93], [9.0, 9.44], [18.0, 23.84], [25.0, 25.56], [29.0, 29.88], [32.0, 32.34], [38.0, 38.43], [45.0, 45.94], [47.0, 47.66], [50.0, 50.41], [51.0, 51.71], [53.0, 54.14], [59.0, 59.63], [60.0, 68.13], [69.0, 70.58], [71.0, 82.24], [89.0, 90.02], [93.0, 94.69], [97.0, 154.4], [155.0, 155.31], [158.0, 158.77], [159.0, 162.36], [164.0, 167.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 32.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.72, 0.0, 32.01, 0.0, 0.0, 0.0, 0.0, 0.0, 35.96, 41.12], "audiomae_on_audioset": [null, null, null, [["music", 74.22], ["didgeridoo", 3.8], ["synthesizer", 2.85]], null, null, null, null, null, null, null, null, null, null, [["music", 45.05], ["synthesizer", 6.66], ["theremin", 5.4]], null, [["cowbell", 46.45], ["livestock, farm animals, working animals", 28.21], ["cattle, bovinae", 13.57]], null, null, null, null, null, [["speech", 48.75], ["singing bowl", 9.48], ["music", 4.34]], [["music", 30.25], ["speech", 29.89], ["groan", 7.23]]], "duration": [1.04, 0.93, 0.44, 5.84, 0.56, 0.88, 0.34, 0.43, 0.94, 0.66, 0.41, 0.71, 1.14, 0.63, 8.13, 1.58, 11.24, 1.02, 1.69, 57.4, 0.31, 0.77, 3.36, 3.02]} \ No newline at end of file diff --git a/annotations_1/5IzNXdsZUHk_filtered.json b/annotations_1/5IzNXdsZUHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8abf87079502301d239d73d803954386446ef7ad --- /dev/null +++ b/annotations_1/5IzNXdsZUHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.49], [12.0, 21.57], [24.0, 24.49], [25.0, 31.5], [34.0, 33.96], [34.0, 35.01], [40.0, 40.15], [44.0, 44.81], [46.0, 46.13], [58.0, 58.8], [59.0, 60.45], [64.0, 65.74], [68.0, 70.55], [72.0, 88.89], [91.0, 91.57], [93.0, 93.66], [98.0, 98.19], [104.0, 104.36], [105.0, 106.37], [123.0, 123.55], [124.0, 124.51]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.8, 0.0, 35.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.45, 43.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 25.22], ["fart", 18.86], ["fly, housefly", 9.0]], null, null, null, null, null, null, null, null, [["sidetone", 51.1], ["speech", 27.25], ["hum", 7.72]], [["hum", 44.72], ["mains hum", 18.9], ["whack, thwack", 4.7]], null, null, null, null, null, null, null], "duration": [0.49, 9.57, 0.49, 6.5, -0.04, 1.01, 0.15, 0.81, 0.13, 0.8, 1.45, 1.74, 2.55, 16.89, 0.57, 0.66, 0.19, 0.36, 1.37, 0.55, 0.51]} \ No newline at end of file diff --git a/annotations_1/5JCbdlUra28_filtered.json b/annotations_1/5JCbdlUra28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99ccf701ff531f74348521d2b3d685f3b4c0e2eb --- /dev/null +++ b/annotations_1/5JCbdlUra28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 32.41], [34.0, 36.05], [38.0, 45.06], [47.0, 48.29], [50.0, 50.48], [51.0, 50.94], [52.0, 53.52], [55.0, 56.96], [58.0, 58.45], [60.0, 62.67], [63.0, 67.53], [70.0, 70.43], [71.0, 72.42], [74.0, 74.49], [76.0, 76.82], [79.0, 80.62], [81.0, 84.67], [89.0, 103.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.35, 90.25, 88.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 89.19, 0.0, 0.0, 0.0, 0.0, 0.0, 89.36, 62.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.41, 2.05, 7.06, 1.29, 0.48, -0.06, 1.52, 1.96, 0.45, 2.67, 4.53, 0.43, 1.42, 0.49, 0.82, 1.62, 3.67, 14.67]} \ No newline at end of file diff --git a/annotations_1/5K6sh7HZri4_filtered.json b/annotations_1/5K6sh7HZri4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6794e8e1314643f8e74d37d0d2825fe2fda0624d --- /dev/null +++ b/annotations_1/5K6sh7HZri4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.3], [8.0, 8.72], [9.0, 10.39], [12.0, 12.9], [15.0, 15.75], [18.0, 18.47], [19.0, 19.8], [23.0, 24.04], [24.0, 25.39], [27.0, 27.45], [28.0, 29.13], [32.0, 32.53], [33.0, 35.75], [37.0, 37.83], [39.0, 39.01], [40.0, 40.95], [43.0, 43.73], [45.0, 46.21], [51.0, 53.72], [54.0, 54.46], [57.0, 57.47], [59.0, 60.17], [63.0, 63.85], [68.0, 69.01], [72.0, 73.67], [77.0, 76.82], [84.0, 85.85], [90.0, 92.15], [93.0, 93.23], [105.0, 105.53], [111.0, 112.16], [118.0, 118.83], [121.0, 121.26], [126.0, 127.8]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [41.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 21.14], ["fly, housefly", 13.28], ["insect", 6.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 15.74], ["noise", 6.82], ["thunk", 6.4]], null, null, null, null, null, null], "duration": [4.3, 0.72, 1.39, 0.9, 0.75, 0.47, 0.8, 1.04, 1.39, 0.45, 1.13, 0.53, 2.75, 0.83, 0.01, 0.95, 0.73, 1.21, 2.72, 0.46, 0.47, 1.17, 0.85, 1.01, 1.67, -0.18, 1.85, 2.15, 0.23, 0.53, 1.16, 0.83, 0.26, 1.8]} \ No newline at end of file diff --git a/annotations_1/5LX01_nSeZU_filtered.json b/annotations_1/5LX01_nSeZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cb4323aad4f9b5c2c696d11832e81140cafebe2 --- /dev/null +++ b/annotations_1/5LX01_nSeZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.49], [15.0, 16.26], [17.0, 18.05], [20.0, 20.93], [22.0, 29.32], [32.0, 49.62], [51.0, 60.49], [62.0, 63.59], [64.0, 79.1], [95.0, 95.52], [96.0, 96.55], [98.0, 99.67], [100.0, 100.7], [101.0, 107.37], [108.0, 109.48], [110.0, 127.35], [128.0, 129.84], [132.0, 132.12], [135.0, 135.26], [137.0, 137.22], [138.0, 140.32]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.39, 39.15, 99.52, 0.0, 57.17, 0.0, 0.0, 0.0, 0.0, 30.04, 0.0, 30.93, 0.0, 0.0, 0.0, 0.0, 75.39], "audiomae_on_audioset": [null, null, null, null, [["creak", 15.17], ["hum", 10.92], ["whack, thwack", 7.56]], [["music", 28.58], ["thunk", 12.02], ["gong", 11.34]], null, null, null, null, null, null, null, [["speech", 49.18], ["music", 13.94], ["hum", 7.81]], null, [["speech", 49.61], ["music", 18.69], ["thump, thud", 6.47]], null, null, null, null, null], "duration": [1.49, 1.26, 1.05, 0.93, 7.32, 17.62, 9.49, 1.59, 15.1, 0.52, 0.55, 1.67, 0.7, 6.37, 1.48, 17.35, 1.84, 0.12, 0.26, 0.22, 2.32]} \ No newline at end of file diff --git a/annotations_1/5Le4OlAvuME_filtered.json b/annotations_1/5Le4OlAvuME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84466168f925f85e9816a598257c7ba0840db719 --- /dev/null +++ b/annotations_1/5Le4OlAvuME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.45], [8.0, 13.8], [17.0, 18.12], [20.0, 22.35], [23.0, 25.74], [27.0, 27.23], [29.0, 29.17], [31.0, 31.94], [33.0, 34.65], [37.0, 38.97], [39.0, 42.92], [44.0, 49.72], [51.0, 51.61], [52.0, 52.3], [55.0, 56.19], [57.0, 64.88], [66.0, 69.08], [70.0, 71.98], [73.0, 108.09], [109.0, 111.2], [113.0, 114.78], [117.0, 117.96], [119.0, 120.23], [121.0, 122.05], [123.0, 126.03], [128.0, 128.56], [129.0, 131.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.76, 65.91, 0.0, 69.2, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 56.93, 30.65, 0.0, 0.0, 0.0, 33.05, 54.76, 0.0, 0.0, 37.18, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 59.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.43], ["machine gun", 22.41], ["whack, thwack", 4.63]], null, null, null, [["speech", 49.54], ["hum", 8.57], ["mains hum", 7.73]], null, null, null, [["music", 62.02], ["chorus effect", 5.46], ["effects unit", 2.54]], null, null, null, null, null, null, null], "duration": [3.45, 5.8, 1.12, 2.35, 2.74, 0.23, 0.17, 0.94, 1.65, 1.97, 3.92, 5.72, 0.61, 0.3, 1.19, 7.88, 3.08, 1.98, 35.09, 2.2, 1.78, 0.96, 1.23, 1.05, 3.03, 0.56, 2.06]} \ No newline at end of file diff --git a/annotations_1/5LvcBgWzjwc_filtered.json b/annotations_1/5LvcBgWzjwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..456fd8ca711e0bacb3cce15b3e14525e47cef984 --- /dev/null +++ b/annotations_1/5LvcBgWzjwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 182.71]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [119.71]} \ No newline at end of file diff --git a/annotations_1/5M4VIDlRYjQ_filtered.json b/annotations_1/5M4VIDlRYjQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56f3e91cc3fab4d1d133ac1d09688d4fddd64496 --- /dev/null +++ b/annotations_1/5M4VIDlRYjQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 18.4], [31.0, 40.93], [42.0, 44.09], [48.0, 48.84], [50.0, 52.0], [54.0, 54.24], [62.0, 62.72], [68.0, 67.96], [85.0, 85.6], [90.0, 91.12], [93.0, 127.67], [129.0, 130.03]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [46.79, 32.28, 48.44, 0.0, 37.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 27.07], ["fly, housefly", 26.66], ["insect", 16.71]], [["speech", 34.34], ["busy signal", 18.01], ["sidetone", 17.31]], [["speech", 40.45], ["music", 11.93], ["telephone", 11.28]], null, [["sidetone", 42.89], ["speech", 26.02], ["music", 11.05]], null, null, null, null, null, null, null], "duration": [6.4, 9.93, 2.09, 0.84, 2.0, 0.24, 0.72, -0.04, 0.6, 1.12, 34.67, 1.03]} \ No newline at end of file diff --git a/annotations_1/5NTDlhH174M_filtered.json b/annotations_1/5NTDlhH174M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10e2f40a0ad3a726c1d19d22566a9192299bfda4 --- /dev/null +++ b/annotations_1/5NTDlhH174M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [8.0, 8.94], [19.0, 20.75], [21.0, 23.43], [37.0, 36.85], [39.0, 39.33], [40.0, 40.61], [68.0, 69.15], [81.0, 80.72], [85.0, 85.77], [97.0, 97.58], [103.0, 103.69], [108.0, 108.9], [114.0, 114.99]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 23.74], ["speech", 20.75], ["animal", 8.39]], null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.94, 1.75, 2.43, -0.15, 0.33, 0.61, 1.15, -0.28, 0.77, 0.58, 0.69, 0.9, 0.99]} \ No newline at end of file diff --git a/annotations_1/5NY_8ulSutc_filtered.json b/annotations_1/5NY_8ulSutc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29a7161ae8428fb59d2c6e713383fc54e9a44d4e --- /dev/null +++ b/annotations_1/5NY_8ulSutc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.21], [6.0, 7.42], [9.0, 41.77], [43.0, 44.19], [46.0, 46.62], [53.0, 52.56], [55.0, 58.26], [59.0, 65.47], [68.0, 78.6], [83.0, 85.33], [93.0, 98.69], [102.0, 110.88], [113.0, 121.51], [123.0, 131.94], [133.0, 133.0], [136.0, 136.07], [138.0, 142.84], [151.0, 151.51]], "keep_status": [false, false, false, false, false, false, true, true, false, true, true, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.45, 29.8, 33.63, 29.86, 29.82, 30.45, 46.61, 44.37, 0.0, 0.0, 37.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 50.4], ["boing", 9.58], ["groan", 6.1]], [["mains hum", 26.32], ["music", 21.37], ["hum", 19.26]], [["music", 49.61], ["speech", 33.76], ["sine wave", 2.42]], [["livestock, farm animals, working animals", 29.92], ["music", 24.94], ["cattle, bovinae", 10.79]], [["mosquito", 17.36], ["music", 13.55], ["buzz", 7.7]], [["music", 64.51], ["throbbing", 10.69], ["hum", 5.88]], [["hum", 28.62], ["speech", 27.83], ["mains hum", 12.09]], [["speech", 70.8], ["fly, housefly", 7.07], ["bee, wasp, etc.", 4.94]], null, null, [["speech", 28.89], ["hum", 11.4], ["music", 8.92]], null], "duration": [0.21, 1.42, 32.77, 1.19, 0.62, -0.44, 3.26, 6.47, 10.6, 2.33, 5.69, 8.88, 8.51, 8.94, 0.0, 0.07, 4.84, 0.51]} \ No newline at end of file diff --git a/annotations_1/5NlQiQfC4zQ_filtered.json b/annotations_1/5NlQiQfC4zQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0ecd9a5b1a9400c74d966aca259ff813f88a722 --- /dev/null +++ b/annotations_1/5NlQiQfC4zQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.53], [10.0, 10.59], [12.0, 11.75], [13.0, 13.36], [17.0, 18.13], [19.0, 19.85], [20.0, 24.19], [27.0, 28.9], [30.0, 30.74], [31.0, 32.39], [34.0, 33.94], [35.0, 35.6], [37.0, 36.88], [38.0, 38.89], [41.0, 41.42], [46.0, 45.79], [46.0, 49.81], [50.0, 50.9], [52.0, 59.19], [61.0, 62.46], [64.0, 65.65]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.99, 0.0, 0.0, 0.0, 0.0, 0.0, 41.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.2, 0.0, 31.21, 0.0, 0.0], "audiomae_on_audioset": [[["moo", 26.14], ["livestock, farm animals, working animals", 23.36], ["cattle, bovinae", 20.25]], null, null, null, null, null, [["music", 41.7], ["speech", 17.21], ["effects unit", 4.73]], null, null, null, null, null, null, null, null, null, [["music", 58.5], ["didgeridoo", 19.15], ["musical instrument", 5.83]], null, [["didgeridoo", 62.35], ["music", 16.05], ["theremin", 3.87]], null, null], "duration": [2.53, 0.59, -0.25, 0.36, 1.13, 0.85, 4.19, 1.9, 0.74, 1.39, -0.06, 0.6, -0.12, 0.89, 0.42, -0.21, 3.81, 0.9, 7.19, 1.46, 1.65]} \ No newline at end of file diff --git a/annotations_1/5ODDHpmqyWE_filtered.json b/annotations_1/5ODDHpmqyWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3a8820991a78ad4448640c58f6f07113b1eb5d4 --- /dev/null +++ b/annotations_1/5ODDHpmqyWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 20.06], [21.0, 23.23], [24.0, 25.56], [33.0, 34.96], [37.0, 37.54], [40.0, 40.81], [42.0, 43.44], [45.0, 45.44], [47.0, 48.15], [49.0, 50.45], [53.0, 54.04], [62.0, 62.6], [70.0, 69.79], [74.0, 75.46], [77.0, 77.82], [79.0, 79.64], [83.0, 83.73], [84.0, 87.59], [90.0, 91.32], [94.0, 95.17], [103.0, 103.33], [105.0, 105.65], [107.0, 109.11], [114.0, 119.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true], "silence_prob": [75.55, 58.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.11, 0.0, 0.0, 0.0, 0.0, 47.94, 43.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hiccup", 14.82], ["hum", 8.72], ["laughter", 8.37]], null, null, null, null, [["music", 38.1], ["burping, eructation", 11.32], ["whale vocalization", 8.21]], [["music", 26.84], ["mains hum", 23.19], ["synthesizer", 11.8]]], "duration": [17.06, 2.23, 1.56, 1.96, 0.54, 0.81, 1.44, 0.44, 1.15, 1.45, 1.04, 0.6, -0.21, 1.46, 0.82, 0.64, 0.73, 3.59, 1.32, 1.17, 0.33, 0.65, 2.11, 5.4]} \ No newline at end of file diff --git a/annotations_1/5OfAMHeIr7k_filtered.json b/annotations_1/5OfAMHeIr7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce138c3bad93dd1f9c4363bcf787af9db9e7be34 --- /dev/null +++ b/annotations_1/5OfAMHeIr7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [3.0, 8.51], [11.0, 31.73], [33.0, 50.01], [50.0, 50.53], [65.0, 65.42], [65.0, 65.8], [69.0, 69.36], [70.0, 72.99], [76.0, 78.44], [82.0, 87.35], [89.0, 92.4], [94.0, 98.95], [103.0, 104.7], [107.0, 125.85], [126.0, 127.5], [133.0, 146.85], [148.0, 152.51]], "keep_status": [false, true, true, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 29.52, 29.07, 29.31, 0.0, 0.0, 0.0, 0.0, 32.83, 42.65, 38.03, 35.28, 31.05, 0.0, 30.44, 0.0, 29.9, 38.2], "audiomae_on_audioset": [null, [["music", 44.15], ["throbbing", 11.19], ["speech", 9.66]], [["vehicle", 31.82], ["car", 18.42], ["race car, auto racing", 12.15]], [["speech", 54.59], ["vehicle", 13.83], ["car", 3.67]], null, null, null, null, [["fly, housefly", 33.65], ["insect", 27.84], ["mosquito", 12.4]], [["radio", 37.51], ["speech", 16.04], ["sidetone", 14.24]], [["whale vocalization", 32.04], ["fly, housefly", 10.7], ["insect", 9.87]], [["speech", 34.5], ["music", 22.59], ["hum", 4.89]], [["speech", 69.36], ["music", 15.2], ["clang", 4.48]], null, [["theremin", 43.55], ["music", 32.89], ["musical instrument", 2.95]], null, [["cattle, bovinae", 42.82], ["livestock, farm animals, working animals", 30.08], ["moo", 24.91]], [["music", 61.36], ["throbbing", 5.63], ["hum", 5.16]]], "duration": [0.84, 5.51, 20.73, 17.01, 0.53, 0.42, 0.8, 0.36, 2.99, 2.44, 5.35, 3.4, 4.95, 1.7, 18.85, 1.5, 13.85, 4.51]} \ No newline at end of file diff --git a/annotations_1/5OkvZ-y_dgI_filtered.json b/annotations_1/5OkvZ-y_dgI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fdb0ee00db276f0ae7ccfc17610839dd40e2a2f --- /dev/null +++ b/annotations_1/5OkvZ-y_dgI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 26.97], [29.0, 67.42], [69.0, 88.28], [90.0, 92.48]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 29.04, 28.05], "audiomae_on_audioset": [null, null, [["hum", 27.41], ["throbbing", 15.43], ["music", 11.25]], [["explosion", 56.44], ["burst, pop", 16.18], ["eruption", 7.09]]], "duration": [-0.03, 38.42, 19.28, 2.48]} \ No newline at end of file diff --git a/annotations_1/5PaUTnk9k9Y_filtered.json b/annotations_1/5PaUTnk9k9Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c431d941d71980f7570b003b5ee4ebb0dfaa7960 --- /dev/null +++ b/annotations_1/5PaUTnk9k9Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.49], [22.0, 45.49], [48.0, 55.66], [57.0, 70.12], [75.0, 75.61], [78.0, 83.73], [85.0, 97.48], [99.0, 100.7], [103.0, 103.06], [107.0, 109.24], [111.0, 111.69]], "keep_status": [true, false, true, false, false, true, false, false, false, false, false], "silence_prob": [31.05, 30.25, 30.36, 29.76, 0.0, 29.76, 29.76, 0.0, 0.0, 31.31, 0.0], "audiomae_on_audioset": [[["music", 50.67], ["electronic music", 7.0], ["foghorn", 5.15]], [["music", 60.34], ["hum", 5.49], ["mains hum", 5.16]], [["music", 49.6], ["throbbing", 12.84], ["hum", 6.73]], [["music", 67.09], ["electronic music", 5.89], ["throbbing", 5.85]], null, [["music", 35.02], ["throbbing", 13.9], ["cacophony", 10.92]], [["music", 73.26], ["throbbing", 8.92], ["musical instrument", 2.68]], null, null, [["music", 42.29], ["throbbing", 20.22], ["hum", 8.48]], null], "duration": [4.49, 23.49, 7.66, 13.12, 0.61, 5.73, 12.48, 1.7, 0.06, 2.24, 0.69]} \ No newline at end of file diff --git a/annotations_1/5PsKwqiRjEM_filtered.json b/annotations_1/5PsKwqiRjEM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7bb82602861b78c17d9c8b1bffede26a75e30fd --- /dev/null +++ b/annotations_1/5PsKwqiRjEM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [5.0, 5.09], [8.0, 8.82], [13.0, 13.51], [15.0, 34.7], [40.0, 64.35], [70.0, 70.5], [74.0, 76.13], [78.0, 80.94], [83.0, 86.44], [90.0, 100.18], [102.0, 102.84], [107.0, 110.61], [112.0, 116.34], [117.0, 119.33], [120.0, 123.62]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.67, 34.23, 0.0, 94.95, 69.61, 43.0, 94.81, 0.0, 83.52, 90.08, 81.71, 43.4], "audiomae_on_audioset": [null, null, null, null, [["hum", 42.14], ["mains hum", 18.08], ["music", 17.32]], [["speech", 47.01], ["vehicle", 7.56], ["door", 6.53]], null, null, null, [["speech", 26.0], ["hum", 8.24], ["sidetone", 7.84]], null, null, null, null, null, [["domestic animals, pets", 27.79], ["animal", 20.99], ["dog", 18.91]]], "duration": [0.24, 0.09, 0.82, 0.51, 19.7, 24.35, 0.5, 2.13, 2.94, 3.44, 10.18, 0.84, 3.61, 4.34, 2.33, 3.62]} \ No newline at end of file diff --git a/annotations_1/5Q52XfZ9no0_filtered.json b/annotations_1/5Q52XfZ9no0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3596a574537a5d04b749061d0f81542e6f54497 --- /dev/null +++ b/annotations_1/5Q52XfZ9no0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [4.0, 5.17], [10.0, 9.95], [11.0, 11.2], [13.0, 13.69], [18.0, 18.86], [21.0, 21.0], [24.0, 27.99], [29.0, 29.39], [37.0, 37.74], [39.0, 39.43], [51.0, 51.98], [52.0, 53.0], [55.0, 56.02], [65.0, 66.65], [68.0, 68.42], [82.0, 83.0], [85.0, 85.46], [89.0, 89.09], [101.0, 106.0], [107.0, 107.23], [112.0, 121.41], [124.0, 139.06], [142.0, 145.17], [149.0, 151.44], [152.0, 152.51], [153.0, 153.64], [155.0, 162.55]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.48, 0.0, 29.17, 31.63, 28.42, 37.45, 0.0, 0.0, 49.45], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 21.49], ["owl", 10.57], ["hoot", 7.69]], null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 51.1], ["whale vocalization", 8.77], ["dial tone", 4.41]], null, [["speech", 45.06], ["dial tone", 18.24], ["music", 5.2]], [["music", 39.88], ["dial tone", 13.19], ["busy signal", 11.34]], [["animal", 22.09], ["whale vocalization", 14.19], ["dog", 10.7]], [["chirp tone", 52.61], ["sine wave", 18.06], ["dial tone", 10.51]], null, null, [["music", 28.74], ["whale vocalization", 22.95], ["sonar", 15.61]]], "duration": [0.67, 1.17, -0.05, 0.2, 0.69, 0.86, 0.0, 3.99, 0.39, 0.74, 0.43, 0.98, 1.0, 1.02, 1.65, 0.42, 1.0, 0.46, 0.09, 5.0, 0.23, 9.41, 15.06, 3.17, 2.44, 0.51, 0.64, 7.55]} \ No newline at end of file diff --git a/annotations_1/5QFZ_Kh7vP0_filtered.json b/annotations_1/5QFZ_Kh7vP0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4733de42dfe17a69c50fb70fd814405d7ce0f9a7 --- /dev/null +++ b/annotations_1/5QFZ_Kh7vP0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 28.43], [30.0, 31.99], [40.0, 43.38], [47.0, 48.49], [52.0, 57.79], [61.0, 96.04], [97.0, 123.96], [124.0, 123.99], [124.0, 124.07], [138.0, 149.13], [150.0, 151.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 84.98, 0.0, 67.25, 0.0, 40.75, 0.0, 0.0, 42.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 63.69], ["throbbing", 12.33], ["hum", 6.23]], null, null, [["music", 54.28], ["grunt", 15.44], ["throbbing", 6.33]], null], "duration": [1.43, 1.99, 3.38, 1.49, 5.79, 35.04, 26.96, -0.01, 0.07, 11.13, 1.61]} \ No newline at end of file diff --git a/annotations_1/5QJGkxbb0wE_filtered.json b/annotations_1/5QJGkxbb0wE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da98f0ec6d7af20c0a4369acdb898c5442395188 --- /dev/null +++ b/annotations_1/5QJGkxbb0wE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.79], [13.0, 18.99], [20.0, 30.81], [32.0, 44.86], [49.0, 57.21], [60.0, 70.04], [71.0, 78.34], [81.0, 82.78], [84.0, 86.19], [87.0, 94.53], [95.0, 101.9]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 61.47, 35.24, 35.8, 33.93, 34.91, 63.74, 0.0, 50.16, 33.53, 29.89], "audiomae_on_audioset": [null, null, [["whale vocalization", 53.27], ["hum", 13.49], ["throbbing", 4.44]], [["whale vocalization", 40.06], ["speech", 31.04], ["hum", 5.89]], [["hum", 43.57], ["throbbing", 24.45], ["heart sounds, heartbeat", 10.24]], [["whale vocalization", 26.9], ["hum", 7.79], ["stomach rumble", 6.31]], null, null, null, [["speech", 38.81], ["rumble", 9.39], ["whale vocalization", 9.22]], [["speech", 42.56], ["throbbing", 15.48], ["hum", 15.33]]], "duration": [1.79, 5.99, 10.81, 12.86, 8.21, 10.04, 7.34, 1.78, 2.19, 7.53, 6.9]} \ No newline at end of file diff --git a/annotations_1/5QMsr3UxzPk_filtered.json b/annotations_1/5QMsr3UxzPk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b96ecf47e56900a847700ff54ed3db25b988b260 --- /dev/null +++ b/annotations_1/5QMsr3UxzPk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 92.57], [96.0, 114.76], [115.0, 115.15], [116.0, 118.18]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 31.09, 0.0, 34.61], "audiomae_on_audioset": [null, [["speech", 60.96], ["music", 13.36], ["vehicle", 3.28]], null, [["music", 33.75], ["drum", 10.33], ["musical instrument", 8.61]]], "duration": [50.57, 18.76, 0.15, 2.18]} \ No newline at end of file diff --git a/annotations_1/5RGxUKhhRWA_filtered.json b/annotations_1/5RGxUKhhRWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b6e199c46d9e5b680b658a386e63efb3f4f52f8 --- /dev/null +++ b/annotations_1/5RGxUKhhRWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.97], [3.0, 5.48], [8.0, 14.98], [16.0, 17.95], [19.0, 21.19], [22.0, 25.91], [27.0, 29.81], [31.0, 31.56], [33.0, 35.09], [36.0, 40.36], [41.0, 45.96], [47.0, 83.19], [86.0, 89.26], [90.0, 102.52], [104.0, 115.82], [117.0, 119.25], [121.0, 122.79], [125.0, 125.58], [127.0, 127.79], [128.0, 131.67], [134.0, 136.12], [139.0, 147.73], [148.0, 150.3], [152.0, 155.93], [158.0, 162.11], [164.0, 164.94], [165.0, 168.08], [169.0, 180.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 95.78, 0.0, 99.21, 99.97, 99.95, 0.0, 100.0, 99.94, 99.99, 0.0, 75.23, 91.13, 99.26, 99.65, 0.0, 0.0, 0.0, 94.66, 99.95, 59.33, 82.61, 98.27, 58.05, 0.0, 76.2, 60.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 2.48, 6.98, 1.95, 2.19, 3.91, 2.81, 0.56, 2.09, 4.36, 4.96, 36.19, 3.26, 12.52, 11.82, 2.25, 1.79, 0.58, 0.79, 3.67, 2.12, 8.73, 2.3, 3.93, 4.11, 0.94, 3.08, 11.86]} \ No newline at end of file diff --git a/annotations_1/5RKld6BGJA4_filtered.json b/annotations_1/5RKld6BGJA4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcf1efdecffe48b308e4a27e537b62b4edda3547 --- /dev/null +++ b/annotations_1/5RKld6BGJA4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 36.61], [58.0, 66.41], [96.0, 96.7], [102.0, 102.59], [103.0, 104.26], [106.0, 106.91], [114.0, 114.96], [117.0, 117.24], [119.0, 119.47], [124.0, 125.58], [127.0, 127.45], [132.0, 132.58], [134.0, 134.5], [137.0, 137.67], [140.0, 140.37], [143.0, 144.17], [152.0, 151.97], [153.0, 153.59], [162.0, 162.31], [170.0, 170.6], [177.0, 179.54], [182.0, 184.65], [190.0, 192.38], [192.0, 192.45], [193.0, 192.59], [193.0, 201.78], [203.0, 204.72], [205.0, 205.39], [206.0, 206.73], [207.0, 207.66], [209.0, 209.14]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.44, 35.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.3, 74.44, 81.53, 0.0, 0.0, 40.66, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 77.53], ["boing", 4.52], ["synthetic singing", 3.94]], [["music", 17.69], ["speech", 15.79], ["boing", 9.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["boing", 31.06], ["speech", 21.14], ["whack, thwack", 12.37]], null, null, null, null, [["thunk", 33.06], ["music", 29.81], ["whack, thwack", 8.45]], null, null, null, null, null], "duration": [24.61, 8.41, 0.7, 0.59, 1.26, 0.91, 0.96, 0.24, 0.47, 1.58, 0.45, 0.58, 0.5, 0.67, 0.37, 1.17, -0.03, 0.59, 0.31, 0.6, 2.54, 2.65, 2.38, 0.45, -0.41, 8.78, 1.72, 0.39, 0.73, 0.66, 0.14]} \ No newline at end of file diff --git a/annotations_1/5RUWalajNYE_filtered.json b/annotations_1/5RUWalajNYE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07746304e5632f15b2c72d8c0139bcda6c18cbbc --- /dev/null +++ b/annotations_1/5RUWalajNYE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.88], [20.0, 20.71], [23.0, 23.97], [27.0, 30.87], [33.0, 41.61], [42.0, 41.94], [42.0, 43.31], [48.0, 49.49], [50.0, 53.22], [54.0, 54.53], [58.0, 59.58], [64.0, 64.54], [69.0, 69.25], [70.0, 70.38], [71.0, 71.02], [72.0, 72.35], [73.0, 73.82], [74.0, 100.89], [103.0, 120.09], [123.0, 125.12], [128.0, 130.23], [135.0, 135.33], [142.0, 154.52], [162.0, 168.0], [170.0, 180.82]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [34.34, 0.0, 0.0, 33.28, 33.25, 0.0, 0.0, 0.0, 38.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.26, 29.54, 29.8, 30.1, 0.0, 29.16, 29.9, 31.38], "audiomae_on_audioset": [[["music", 58.81], ["musical instrument", 10.61], ["effects unit", 6.41]], null, null, [["music", 28.5], ["musical instrument", 11.29], ["harmonica", 5.29]], [["music", 42.34], ["theremin", 29.31], ["musical instrument", 3.89]], null, null, null, [["speech", 45.84], ["music", 37.36], ["musical instrument", 2.73]], null, null, null, null, null, null, null, null, [["music", 67.8], ["didgeridoo", 23.87], ["echo", 0.66]], [["didgeridoo", 66.15], ["music", 31.07], ["musical instrument", 0.58]], [["music", 77.35], ["didgeridoo", 4.58], ["musical instrument", 2.22]], [["music", 70.72], ["didgeridoo", 15.03], ["musical instrument", 2.92]], null, [["music", 72.08], ["carnatic music", 6.2], ["didgeridoo", 4.88]], [["didgeridoo", 59.41], ["music", 23.77], ["throbbing", 2.74]], [["music", 21.23], ["whale vocalization", 11.54], ["theremin", 10.44]]], "duration": [3.88, 0.71, 0.97, 3.87, 8.61, -0.06, 1.31, 1.49, 3.22, 0.53, 1.58, 0.54, 0.25, 0.38, 0.02, 0.35, 0.82, 26.89, 17.09, 2.12, 2.23, 0.33, 12.52, 6.0, 10.82]} \ No newline at end of file diff --git a/annotations_1/5SRxYONb12I_filtered.json b/annotations_1/5SRxYONb12I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8410d5862547932bd3ba95404ae1da6321517792 --- /dev/null +++ b/annotations_1/5SRxYONb12I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [4.0, 5.12], [8.0, 8.51], [12.0, 12.63], [16.0, 16.71], [18.0, 17.86], [21.0, 21.42], [23.0, 23.65], [24.0, 24.85], [29.0, 29.86], [36.0, 37.02], [39.0, 39.53], [44.0, 45.03], [49.0, 50.26], [55.0, 56.84], [58.0, 58.85], [61.0, 61.05], [63.0, 63.1], [64.0, 64.45], [66.0, 67.54], [72.0, 72.64], [75.0, 75.24], [77.0, 79.46], [81.0, 81.33], [82.0, 83.13], [86.0, 86.91], [90.0, 90.68], [94.0, 96.33], [98.0, 97.97], [99.0, 100.87], [103.0, 106.73], [109.0, 109.81], [112.0, 112.21], [115.0, 116.01], [117.0, 118.3], [119.0, 120.12], [121.0, 122.49], [124.0, 124.66], [127.0, 126.98], [128.0, 128.88], [133.0, 133.59], [136.0, 137.46], [139.0, 140.76], [143.0, 143.56], [145.0, 145.86], [148.0, 148.31], [152.0, 153.32], [157.0, 157.25], [159.0, 159.07], [160.0, 160.89], [162.0, 163.29], [166.0, 166.18], [167.0, 169.55], [172.0, 173.77], [175.0, 179.85], [182.0, 183.05], [185.0, 185.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.8, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 98.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 1.12, 0.51, 0.63, 0.71, -0.14, 0.42, 0.65, 0.85, 0.86, 1.02, 0.53, 1.03, 1.26, 1.84, 0.85, 0.05, 0.1, 0.45, 1.54, 0.64, 0.24, 2.46, 0.33, 1.13, 0.91, 0.68, 2.33, -0.03, 1.87, 3.73, 0.81, 0.21, 1.01, 1.3, 1.12, 1.49, 0.66, -0.02, 0.88, 0.59, 1.46, 1.76, 0.56, 0.86, 0.31, 1.32, 0.25, 0.07, 0.89, 1.29, 0.18, 2.55, 1.77, 4.85, 1.05, 0.31]} \ No newline at end of file diff --git a/annotations_1/5SkzHjQrCXk_filtered.json b/annotations_1/5SkzHjQrCXk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e30c617d504b7dcac3cad4cf9b64d41df7d71ec --- /dev/null +++ b/annotations_1/5SkzHjQrCXk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.62], [6.0, 6.34], [9.0, 9.44], [12.0, 12.5], [15.0, 16.21], [18.0, 18.22], [21.0, 21.39], [22.0, 22.49], [23.0, 23.97], [26.0, 28.11], [30.0, 30.79], [35.0, 35.58], [38.0, 38.3], [39.0, 39.88], [41.0, 41.45], [43.0, 44.91], [46.0, 47.33], [51.0, 51.27], [53.0, 54.18], [58.0, 63.24], [66.0, 66.63], [67.0, 67.85], [69.0, 77.77], [79.0, 80.7], [82.0, 82.22], [87.0, 94.61], [97.0, 97.04], [98.0, 98.15], [98.0, 99.91], [100.0, 101.46], [102.0, 103.59], [107.0, 109.73], [110.0, 111.62], [113.0, 113.83], [115.0, 115.01], [124.0, 125.07], [126.0, 126.96], [130.0, 130.86], [132.0, 132.78], [134.0, 137.62], [141.0, 142.01], [143.0, 146.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 100.0, 0.0, 0.0, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.34, 0.44, 0.5, 1.21, 0.22, 0.39, 0.49, 0.97, 2.11, 0.79, 0.58, 0.3, 0.88, 0.45, 1.91, 1.33, 0.27, 1.18, 5.24, 0.63, 0.85, 8.77, 1.7, 0.22, 7.61, 0.04, 0.15, 1.91, 1.46, 1.59, 2.73, 1.62, 0.83, 0.01, 1.07, 0.96, 0.86, 0.78, 3.62, 1.01, 3.31]} \ No newline at end of file diff --git a/annotations_1/5Svd15hqUfs_filtered.json b/annotations_1/5Svd15hqUfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b1136a0641ed1ffdcc67722fb93baa217ff3041 --- /dev/null +++ b/annotations_1/5Svd15hqUfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 34.99], [36.0, 55.46], [58.0, 68.94], [70.0, 70.63], [71.0, 111.01], [112.0, 120.87], [123.0, 141.78], [143.0, 147.43]], "keep_status": [false, false, false, false, false, false, true, true], "silence_prob": [28.51, 28.53, 29.27, 0.0, 0.0, 29.03, 33.62, 38.31], "audiomae_on_audioset": [[["music", 46.84], ["throbbing", 14.91], ["hum", 11.92]], [["music", 42.8], ["throbbing", 22.43], ["hum", 16.21]], [["mains hum", 31.66], ["hum", 25.27], ["music", 23.7]], null, null, [["music", 53.72], ["speech", 17.38], ["fart", 3.31]], [["music", 50.53], ["didgeridoo", 13.33], ["hum", 4.59]], [["music", 33.68], ["breaking", 13.03], ["hum", 9.85]]], "duration": [21.99, 19.46, 10.94, 0.63, 40.01, 8.87, 18.78, 4.43]} \ No newline at end of file diff --git a/annotations_1/5T17qRlPIiA_filtered.json b/annotations_1/5T17qRlPIiA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c695337a3bdd9621286c55da6b368682b506dcf3 --- /dev/null +++ b/annotations_1/5T17qRlPIiA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.32], [9.0, 17.98], [18.0, 19.45], [25.0, 33.15], [34.0, 212.14]], "keep_status": [false, false, false, false, false], "silence_prob": [31.4, 31.65, 0.0, 32.95, 0.0], "audiomae_on_audioset": [[["music", 40.11], ["brass instrument", 20.16], ["foghorn", 14.86]], [["music", 80.39], ["musical instrument", 2.62], ["brass instrument", 2.31]], null, [["music", 58.34], ["brass instrument", 9.54], ["french horn", 4.97]], null], "duration": [6.32, 8.98, 1.45, 8.15, 178.14]} \ No newline at end of file diff --git a/annotations_1/5TG1Wh04D1g_filtered.json b/annotations_1/5TG1Wh04D1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3acdde5752418e5163a70cc55dacf035e4889167 --- /dev/null +++ b/annotations_1/5TG1Wh04D1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.31], [7.0, 11.25], [13.0, 14.15], [14.0, 14.18], [26.0, 30.74], [34.0, 36.0], [37.0, 38.87], [41.0, 42.7], [45.0, 46.48], [54.0, 56.25], [65.0, 65.87], [74.0, 77.87], [85.0, 89.45], [91.0, 96.04], [107.0, 117.34], [123.0, 130.65]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 59.59, 0.0, 0.0, 30.5, 30.62, 0.0, 0.0, 0.0, 31.49, 0.0, 29.64, 29.57, 29.75, 30.45, 30.45], "audiomae_on_audioset": [null, null, null, null, [["speech", 19.11], ["groan", 19.08], ["screaming", 13.45]], [["music", 85.11], ["singing", 0.74], ["ska", 0.6]], null, null, null, [["music", 73.16], ["speech", 4.36], ["singing", 1.58]], null, [["music", 72.83], ["electronic music", 3.7], ["speech", 3.09]], [["music", 73.55], ["electronic music", 5.34], ["speech", 3.59]], [["music", 65.21], ["speech", 10.32], ["drum machine", 8.71]], [["music", 72.19], ["speech", 7.39], ["electronic music", 4.7]], [["music", 37.47], ["livestock, farm animals, working animals", 6.57], ["sound effect", 4.29]]], "duration": [0.31, 4.25, 1.15, 0.18, 4.74, 2.0, 1.87, 1.7, 1.48, 2.25, 0.87, 3.87, 4.45, 5.04, 10.34, 7.65]} \ No newline at end of file diff --git a/annotations_1/5Tqsh3b_lb4_filtered.json b/annotations_1/5Tqsh3b_lb4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51b3e6f9f858a64766aca4934867605d4c7f9a93 --- /dev/null +++ b/annotations_1/5Tqsh3b_lb4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [11.0, 11.85], [15.0, 15.58], [22.0, 23.63], [28.0, 28.95], [38.0, 45.05], [46.0, 51.12], [53.0, 53.96], [56.0, 56.94], [59.0, 61.06], [68.0, 70.38], [76.0, 90.73], [95.0, 98.73], [105.0, 108.18], [113.0, 126.4], [129.0, 129.2], [131.0, 134.35], [134.0, 135.16], [139.0, 150.42], [152.0, 153.59], [154.0, 160.25], [162.0, 172.15]], "keep_status": [false, false, false, false, false, true, true, false, false, false, true, false, false, true, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 41.81, 46.09, 0.0, 0.0, 52.51, 43.77, 33.54, 37.72, 35.41, 30.63, 0.0, 31.01, 0.0, 31.39, 0.0, 62.07, 95.23], "audiomae_on_audioset": [null, null, null, null, null, [["music", 36.41], ["theremin", 28.54], ["synthesizer", 5.01]], [["music", 20.5], ["theremin", 12.93], ["whale vocalization", 12.37]], null, null, null, [["music", 27.9], ["synthesizer", 18.33], ["hum", 9.93]], [["hum", 29.79], ["mains hum", 23.83], ["music", 17.03]], [["music", 49.16], ["theremin", 29.22], ["foghorn", 5.26]], [["speech", 40.07], ["music", 14.55], ["boing", 6.53]], [["hum", 23.44], ["fly, housefly", 15.65], ["mains hum", 12.0]], null, [["cattle, bovinae", 28.44], ["livestock, farm animals, working animals", 15.77], ["moo", 13.91]], null, [["music", 34.92], ["buzz", 14.15], ["speech", 7.66]], null, null, null], "duration": [1.56, 0.85, 0.58, 1.63, 0.95, 7.05, 5.12, 0.96, 0.94, 2.06, 2.38, 14.73, 3.73, 3.18, 13.4, 0.2, 3.35, 1.16, 11.42, 1.59, 6.25, 10.15]} \ No newline at end of file diff --git a/annotations_1/5U72xvlbn-k_filtered.json b/annotations_1/5U72xvlbn-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cab2a516c73c94464f12a3d403e3c461ab116a89 --- /dev/null +++ b/annotations_1/5U72xvlbn-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.34], [10.0, 9.98], [13.0, 13.44], [15.0, 16.06], [17.0, 18.49], [19.0, 19.57], [24.0, 23.75], [26.0, 26.49], [27.0, 27.19], [29.0, 30.64], [31.0, 32.48], [36.0, 36.66], [37.0, 41.71], [46.0, 50.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.11, 57.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.32], ["explosion", 27.3], ["burst, pop", 8.23]], null], "duration": [0.34, -0.02, 0.44, 1.06, 1.49, 0.57, -0.25, 0.49, 0.19, 1.64, 1.48, 0.66, 4.71, 4.25]} \ No newline at end of file diff --git a/annotations_1/5U8scp5J9Is_filtered.json b/annotations_1/5U8scp5J9Is_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5566bde0936fa1626e6f61a4e5de4a3bb01a195a --- /dev/null +++ b/annotations_1/5U8scp5J9Is_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 17.76], [19.0, 21.19], [23.0, 25.07], [26.0, 27.99], [31.0, 31.02], [32.0, 32.76], [36.0, 36.86], [38.0, 38.57], [39.0, 40.22], [42.0, 45.22], [46.0, 49.33], [50.0, 51.21], [52.0, 58.92], [60.0, 60.12], [61.0, 61.33], [62.0, 72.55], [75.0, 75.57], [76.0, 88.94], [89.0, 109.63], [112.0, 112.33], [113.0, 121.49], [123.0, 126.05]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true, false, true, true], "silence_prob": [49.31, 48.27, 52.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.4, 57.56, 0.0, 33.57, 0.0, 0.0, 32.04, 0.0, 29.3, 28.79, 0.0, 42.53, 37.84], "audiomae_on_audioset": [[["hum", 29.0], ["speech", 19.84], ["mains hum", 11.2]], [["hum", 43.24], ["mains hum", 22.69], ["throbbing", 13.7]], null, null, null, null, null, null, null, null, null, null, [["mains hum", 28.6], ["hum", 22.77], ["speech", 18.0]], null, null, [["hum", 16.66], ["whack, thwack", 7.03], ["speech", 6.7]], null, [["speech", 66.29], ["thump, thud", 12.89], ["whack, thwack", 3.04]], [["speech", 13.58], ["livestock, farm animals, working animals", 8.55], ["fly, housefly", 7.0]], null, [["speech", 16.65], ["hum", 14.14], ["mains hum", 11.44]], [["speech", 13.86], ["whale vocalization", 6.92], ["noise", 5.05]]], "duration": [7.76, 2.19, 2.07, 1.99, 0.02, 0.76, 0.86, 0.57, 1.22, 3.22, 3.33, 1.21, 6.92, 0.12, 0.33, 10.55, 0.57, 12.94, 20.63, 0.33, 8.49, 3.05]} \ No newline at end of file diff --git a/annotations_1/5Ugqj1RATYE_filtered.json b/annotations_1/5Ugqj1RATYE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f72bdbded88131adbfe36cc26e6fd4de869844d --- /dev/null +++ b/annotations_1/5Ugqj1RATYE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.73], [15.0, 15.89], [16.0, 16.33], [24.0, 25.41], [30.0, 29.86], [38.0, 39.7], [45.0, 47.53], [49.0, 58.46], [59.0, 60.74], [71.0, 71.56], [72.0, 73.58], [75.0, 76.1], [79.0, 82.58], [85.0, 85.94], [87.0, 86.9], [89.0, 89.5], [90.0, 94.49], [96.0, 97.36], [98.0, 99.28], [105.0, 107.37], [108.0, 109.17], [110.0, 110.62], [121.0, 121.51], [122.0, 123.16], [123.0, 123.48]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.82, 42.88, 0.0, 0.0, 0.0, 0.0, 70.16, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 62.89, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 29.42], ["animal", 12.77], ["music", 8.78]], [["speech", 28.43], ["music", 24.99], ["sidetone", 8.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.73, 0.89, 0.33, 1.41, -0.14, 1.7, 2.53, 9.46, 1.74, 0.56, 1.58, 1.1, 3.58, 0.94, -0.1, 0.5, 4.49, 1.36, 1.28, 2.37, 1.17, 0.62, 0.51, 1.16, 0.48]} \ No newline at end of file diff --git a/annotations_1/5UjmbtIRvLY_filtered.json b/annotations_1/5UjmbtIRvLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9651129c5ab8cfd77490b7898e55e357cb096b61 --- /dev/null +++ b/annotations_1/5UjmbtIRvLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.1], [15.0, 15.57], [18.0, 18.87], [20.0, 20.88], [22.0, 22.71], [33.0, 32.75], [33.0, 33.88], [35.0, 34.6], [35.0, 46.4], [61.0, 63.21], [77.0, 77.9], [81.0, 81.73], [86.0, 86.64], [95.0, 96.72], [99.0, 99.84], [100.0, 101.17], [102.0, 102.63], [103.0, 103.65], [107.0, 108.4], [114.0, 115.03], [117.0, 117.9], [119.0, 119.77], [120.0, 120.53], [125.0, 125.98], [138.0, 138.54], [139.0, 139.92], [158.0, 163.02], [164.0, 164.69], [174.0, 174.56], [176.0, 184.01], [184.0, 185.08], [187.0, 186.81]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.51, 32.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.19, 0.0, 0.0, 29.74, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 54.5], ["whack, thwack", 16.42], ["thunk", 5.45]], null, null, null, null, null, null, null, [["speech", 82.65], ["boing", 6.85], ["fart", 1.98]], [["music", 39.2], ["speech", 6.44], ["theremin", 6.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 53.44], ["sidetone", 21.56], ["mains hum", 3.76]], null, null, [["music", 45.67], ["speech", 26.42], ["sidetone", 10.84]], null, null], "duration": [6.1, 0.57, 0.87, 0.88, 0.71, -0.25, 0.88, -0.4, 11.4, 2.21, 0.9, 0.73, 0.64, 1.72, 0.84, 1.17, 0.63, 0.65, 1.4, 1.03, 0.9, 0.77, 0.53, 0.98, 0.54, 0.92, 5.02, 0.69, 0.56, 8.01, 1.08, -0.19]} \ No newline at end of file diff --git a/annotations_1/5UnmqCr95HI_filtered.json b/annotations_1/5UnmqCr95HI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6712848e38fe1172b7dae7623094032c43fc4c6 --- /dev/null +++ b/annotations_1/5UnmqCr95HI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.6], [18.0, 31.02], [32.0, 33.25], [34.0, 39.38], [41.0, 41.72], [43.0, 44.34], [45.0, 47.73], [49.0, 53.33], [55.0, 59.64], [61.0, 133.08], [134.0, 133.95]], "keep_status": [false, false, false, true, false, false, true, true, true, false, false], "silence_prob": [40.45, 32.48, 0.0, 35.39, 0.0, 0.0, 38.43, 34.88, 32.55, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 59.18], ["insect", 17.85], ["bee, wasp, etc.", 6.16]], [["music", 49.08], ["fly, housefly", 15.46], ["insect", 7.6]], null, [["music", 39.67], ["throbbing", 10.33], ["hum", 6.75]], null, null, [["hum", 27.4], ["mains hum", 20.52], ["throbbing", 14.82]], [["music", 35.64], ["mechanisms", 6.05], ["musical instrument", 4.43]], [["speech", 27.76], ["gong", 16.08], ["music", 14.13]], null, null], "duration": [5.6, 13.02, 1.25, 5.38, 0.72, 1.34, 2.73, 4.33, 4.64, 72.08, -0.05]} \ No newline at end of file diff --git a/annotations_1/5V-C6ziFKMA_filtered.json b/annotations_1/5V-C6ziFKMA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..126bb5da39f47cbf3bb8b31f4e5cd621515116ae --- /dev/null +++ b/annotations_1/5V-C6ziFKMA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 22.11], [22.0, 24.51], [27.0, 30.21], [31.0, 32.17], [33.0, 35.26], [39.0, 43.53], [46.0, 46.92]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [54.63, 50.11, 57.32, 0.0, 73.97, 65.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [2.11, 2.51, 3.21, 1.17, 2.26, 4.53, 0.92]} \ No newline at end of file diff --git a/annotations_1/5VSg6c8TKNc_filtered.json b/annotations_1/5VSg6c8TKNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37d702598422858ca3f76034e44e7251e664a7a9 --- /dev/null +++ b/annotations_1/5VSg6c8TKNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.56], [14.0, 13.58], [19.0, 22.35], [27.0, 31.53], [33.0, 34.38], [36.0, 43.71], [45.0, 63.29], [65.0, 69.75], [70.0, 72.0], [81.0, 146.23], [166.0, 167.95], [168.0, 168.02], [169.0, 171.42], [172.0, 171.53]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 93.13, 92.48, 0.0, 52.68, 46.47, 41.3, 30.95, 0.0, 0.0, 0.0, 61.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 51.68], ["theremin", 17.15], ["whale vocalization", 8.66]], [["speech", 33.92], ["hum", 20.51], ["throbbing", 8.41]], [["mosquito", 9.69], ["animal", 9.18], ["music", 8.15]], null, null, null, null, null], "duration": [0.56, -0.42, 3.35, 4.53, 1.38, 7.71, 18.29, 4.75, 2.0, 65.23, 1.95, 0.02, 2.42, -0.47]} \ No newline at end of file diff --git a/annotations_1/5VgRuLQgeSE_filtered.json b/annotations_1/5VgRuLQgeSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c2af9b1f5b5596ad16a397d2d2b6399cfad5836 --- /dev/null +++ b/annotations_1/5VgRuLQgeSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.02], [8.0, 15.67], [17.0, 18.72], [22.0, 23.4], [32.0, 35.83], [36.0, 38.58], [40.0, 41.72], [45.0, 46.5], [55.0, 56.44], [58.0, 59.14], [64.0, 66.43], [75.0, 86.27], [87.0, 88.52], [92.0, 91.81], [94.0, 95.05], [97.0, 97.97], [101.0, 101.49], [102.0, 102.74], [104.0, 104.4], [105.0, 106.71], [114.0, 114.2], [117.0, 117.58], [131.0, 132.92], [149.0, 150.99], [155.0, 157.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.31, 88.46, 0.0, 0.0, 99.8, 97.83, 0.0, 0.0, 0.0, 0.0, 72.75, 82.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.02, 7.67, 1.72, 1.4, 3.83, 2.58, 1.72, 1.5, 1.44, 1.14, 2.43, 11.27, 1.52, -0.19, 1.05, 0.97, 0.49, 0.74, 0.4, 1.71, 0.2, 0.58, 1.92, 1.99, 2.6]} \ No newline at end of file diff --git a/annotations_1/5VmWe3LyUDM_filtered.json b/annotations_1/5VmWe3LyUDM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa9b55abc086135b309407d7cd61d9f1e73db83e --- /dev/null +++ b/annotations_1/5VmWe3LyUDM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [7.0, 7.2], [9.0, 14.4], [15.0, 14.81], [15.0, 14.84], [15.0, 14.94], [20.0, 22.77], [25.0, 25.25], [27.0, 27.84], [31.0, 31.26], [33.0, 32.93], [39.0, 40.32], [54.0, 60.51], [68.0, 68.57], [75.0, 76.98], [78.0, 81.33], [87.0, 89.02], [93.0, 99.27], [100.0, 101.01], [103.0, 103.11], [106.0, 106.52], [118.0, 119.15], [120.0, 120.38], [126.0, 126.13], [126.0, 126.52], [135.0, 135.19], [136.0, 141.0], [143.0, 144.12], [149.0, 150.2], [154.0, 154.67], [155.0, 157.08], [157.0, 158.28], [163.0, 163.61], [168.0, 168.4]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.17, 0.0, 0.0, 0.0, 33.55, 0.0, 0.0, 0.0, 0.0, 0.0, 29.2, 0.0, 0.0, 30.07, 30.01, 30.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 31.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 51.23], ["groan", 11.97], ["insect", 5.51]], null, null, null, [["explosion", 9.53], ["whack, thwack", 9.18], ["speech", 8.73]], null, null, null, null, null, [["music", 68.56], ["speech", 7.57], ["electronic music", 3.33]], null, null, [["music", 29.5], ["speech", 25.2], ["moo", 5.43]], [["speech", 26.08], ["music", 18.11], ["livestock, farm animals, working animals", 3.95]], [["mosquito", 30.14], ["music", 18.75], ["fly, housefly", 17.68]], null, null, null, null, null, null, null, null, [["music", 53.44], ["speech", 13.12], ["boing", 3.31]], null, null, null, [["music", 79.52], ["boing", 1.09], ["musical instrument", 0.81]], null, null, null], "duration": [0.54, 0.2, 5.4, -0.19, -0.16, -0.06, 2.77, 0.25, 0.84, 0.26, -0.07, 1.32, 6.51, 0.57, 1.98, 3.33, 2.02, 6.27, 1.01, 0.11, 0.52, 1.15, 0.38, 0.13, 0.52, 0.19, 5.0, 1.12, 1.2, 0.67, 2.08, 1.28, 0.61, 0.4]} \ No newline at end of file diff --git a/annotations_1/5W19mLb-9JM_filtered.json b/annotations_1/5W19mLb-9JM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba4f584472b384f430d8d9742c1c8e43c6247c8c --- /dev/null +++ b/annotations_1/5W19mLb-9JM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 46.52], [48.0, 49.0], [50.0, 89.26], [90.0, 116.82], [118.0, 127.68], [130.0, 155.78], [163.0, 164.57], [165.0, 166.19], [167.0, 167.59], [170.0, 172.29], [174.0, 188.03], [201.0, 202.07], [206.0, 208.16]], "keep_status": [false, false, false, false, true, true, false, false, false, false, true, false, false], "silence_prob": [34.21, 0.0, 0.0, 35.22, 30.96, 30.95, 0.0, 0.0, 0.0, 31.43, 29.87, 0.0, 64.97], "audiomae_on_audioset": [[["music", 56.42], ["throbbing", 20.47], ["hum", 13.75]], null, null, [["music", 54.8], ["throbbing", 23.37], ["hum", 6.3]], [["music", 44.3], ["hum", 8.76], ["speech", 8.15]], [["speech", 55.98], ["whack, thwack", 10.41], ["hum", 3.45]], null, null, null, [["music", 77.46], ["throbbing", 3.23], ["didgeridoo", 1.75]], [["music", 37.04], ["speech", 25.71], ["musical instrument", 4.56]], null, null], "duration": [21.52, 1.0, 39.26, 26.82, 9.68, 25.78, 1.57, 1.19, 0.59, 2.29, 14.03, 1.07, 2.16]} \ No newline at end of file diff --git a/annotations_1/5WT1QRZ2z6A_filtered.json b/annotations_1/5WT1QRZ2z6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..432e0c195c4759970a921e2b1884a91cd020f1df --- /dev/null +++ b/annotations_1/5WT1QRZ2z6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.05], [8.0, 18.87], [20.0, 20.87], [23.0, 22.84], [24.0, 24.56], [26.0, 27.63], [28.0, 32.71], [34.0, 34.59], [35.0, 96.96], [98.0, 100.21], [100.0, 100.45], [100.0, 101.33], [103.0, 103.59], [106.0, 110.52], [111.0, 111.87], [113.0, 113.07], [115.0, 120.97], [126.0, 125.95]], "keep_status": [false, true, false, false, false, false, true, false, false, true, false, false, false, true, false, false, true, false], "silence_prob": [30.84, 31.3, 0.0, 0.0, 0.0, 0.0, 33.89, 0.0, 0.0, 37.55, 0.0, 0.0, 0.0, 33.05, 0.0, 0.0, 39.99, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 39.89], ["moo", 34.94], ["livestock, farm animals, working animals", 25.04]], [["speech", 26.26], ["music", 10.6], ["buzz", 7.84]], null, null, null, null, [["hum", 33.15], ["mains hum", 25.16], ["music", 10.42]], null, null, [["cattle, bovinae", 25.87], ["livestock, farm animals, working animals", 19.84], ["moo", 17.44]], null, null, null, [["speech", 40.73], ["mains hum", 10.19], ["hum", 10.09]], null, null, [["music", 55.55], ["whale vocalization", 6.56], ["theremin", 5.91]], null], "duration": [2.05, 10.87, 0.87, -0.16, 0.56, 1.63, 4.71, 0.59, 61.96, 2.21, 0.45, 1.33, 0.59, 4.52, 0.87, 0.07, 5.97, -0.05]} \ No newline at end of file diff --git a/annotations_1/5W_sktmZuzI_filtered.json b/annotations_1/5W_sktmZuzI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0086fae7becbcf51770889823e7bed35ff788424 --- /dev/null +++ b/annotations_1/5W_sktmZuzI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [13.0, 13.95], [15.0, 15.96], [22.0, 22.38], [25.0, 25.03], [28.0, 28.11], [34.0, 33.99], [37.0, 37.83], [40.0, 40.27]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.89, 0.95, 0.96, 0.38, 0.03, 0.11, -0.01, 0.83, 0.27]} \ No newline at end of file diff --git a/annotations_1/5WvXdaXIbYw_filtered.json b/annotations_1/5WvXdaXIbYw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/5WvXdaXIbYw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/5XQqslDEoeI_filtered.json b/annotations_1/5XQqslDEoeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..891a7fae5fda75cbc2b8b3e2d36afccccab10242 --- /dev/null +++ b/annotations_1/5XQqslDEoeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.74], [14.0, 20.29], [21.0, 24.66], [27.0, 27.73], [29.0, 29.17], [31.0, 61.52], [62.0, 92.06], [95.0, 96.82], [98.0, 100.58], [104.0, 105.31], [105.0, 106.61], [108.0, 111.43], [114.0, 129.07], [130.0, 130.55], [134.0, 144.68], [145.0, 150.15], [151.0, 170.97], [177.0, 184.72]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, true, true, false, true], "silence_prob": [50.16, 53.34, 61.67, 0.0, 0.0, 0.0, 0.0, 0.0, 31.96, 0.0, 0.0, 29.19, 28.82, 0.0, 29.12, 42.69, 28.37, 43.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["mains hum", 22.17], ["music", 14.83], ["pulse", 13.03]], null, null, [["music", 23.8], ["dog", 15.58], ["didgeridoo", 14.21]], [["animal", 78.28], ["dog", 3.79], ["domestic animals, pets", 3.29]], null, [["animal", 31.38], ["dog", 19.89], ["music", 15.1]], [["stomach rumble", 9.92], ["whale vocalization", 9.67], ["animal", 8.29]], [["speech", 48.14], ["music", 20.92], ["animal", 4.62]], [["speech", 20.34], ["music", 19.83], ["effects unit", 9.3]]], "duration": [7.74, 6.29, 3.66, 0.73, 0.17, 30.52, 30.06, 1.82, 2.58, 1.31, 1.61, 3.43, 15.07, 0.55, 10.68, 5.15, 19.97, 7.72]} \ No newline at end of file diff --git a/annotations_1/5XZcn9qR5SE_filtered.json b/annotations_1/5XZcn9qR5SE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..399967855b43f1dc468adb46e07d884ea34bddc7 --- /dev/null +++ b/annotations_1/5XZcn9qR5SE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 63.24], [64.0, 84.1], [86.0, 87.1], [88.0, 88.87], [90.0, 91.59], [93.0, 94.1]], "keep_status": [true, true, false, false, false, false], "silence_prob": [38.02, 32.77, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 13.14], ["rumble", 11.59], ["fly, housefly", 11.3]], [["throbbing", 23.52], ["hum", 15.2], ["music", 12.07]], null, null, null, null], "duration": [9.24, 20.1, 1.1, 0.87, 1.59, 1.1]} \ No newline at end of file diff --git a/annotations_1/5X_ZiFC5RMg_filtered.json b/annotations_1/5X_ZiFC5RMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45c4b6273415398e3e6ac92246110cdb4d526e23 --- /dev/null +++ b/annotations_1/5X_ZiFC5RMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.23], [16.0, 19.13], [20.0, 26.0], [27.0, 41.1], [43.0, 44.74], [47.0, 51.53], [52.0, 53.1], [61.0, 67.88], [72.0, 73.14], [81.0, 117.04], [123.0, 124.01]], "keep_status": [true, true, true, true, false, true, false, true, false, false, false], "silence_prob": [34.88, 32.46, 36.15, 33.11, 0.0, 33.79, 0.0, 32.74, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 59.14], ["buzz", 4.38], ["musical instrument", 3.07]], [["music", 39.82], ["mains hum", 6.43], ["hum", 5.76]], [["music", 25.5], ["speech", 24.31], ["foghorn", 10.17]], [["music", 29.71], ["speech", 15.93], ["hum", 6.79]], null, [["trombone", 16.79], ["music", 10.92], ["brass instrument", 10.2]], null, [["music", 34.65], ["noise", 5.61], ["musical instrument", 3.79]], null, null, null], "duration": [10.23, 3.13, 6.0, 14.1, 1.74, 4.53, 1.1, 6.88, 1.14, 36.04, 1.01]} \ No newline at end of file diff --git a/annotations_1/5XnGKA75dtI_filtered.json b/annotations_1/5XnGKA75dtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfc5e40f4045e31eb828d89e8cef30ecefff6e7d --- /dev/null +++ b/annotations_1/5XnGKA75dtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.67], [20.0, 26.0], [28.0, 30.62], [32.0, 50.48], [51.0, 52.93], [53.0, 57.5], [58.0, 58.99]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 29.16, 41.32, 29.09, 0.0, 42.65, 0.0], "audiomae_on_audioset": [null, [["music", 39.35], ["theremin", 16.6], ["chirp tone", 15.98]], [["music", 25.67], ["sonar", 19.76], ["chirp tone", 8.75]], [["music", 48.64], ["speech", 37.68], ["sound effect", 1.1]], null, [["music", 64.85], ["throbbing", 4.72], ["synthesizer", 3.34]], null], "duration": [0.67, 6.0, 2.62, 18.48, 1.93, 4.5, 0.99]} \ No newline at end of file diff --git a/annotations_1/5Y7gOcsg0Xk_filtered.json b/annotations_1/5Y7gOcsg0Xk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..169da3d9fb7becd18a165c0f5d44443f0f0056ca --- /dev/null +++ b/annotations_1/5Y7gOcsg0Xk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.59], [9.0, 9.24], [12.0, 20.44], [23.0, 25.27], [32.0, 32.31], [34.0, 34.96], [41.0, 41.3], [48.0, 48.73], [51.0, 51.8], [54.0, 55.11], [56.0, 58.78], [60.0, 61.86], [65.0, 66.53], [69.0, 69.11], [70.0, 71.02], [73.0, 76.76], [83.0, 83.1], [89.0, 89.21], [90.0, 95.0], [96.0, 97.34], [100.0, 102.15], [112.0, 114.86], [118.0, 123.08], [126.0, 139.46], [147.0, 147.92], [150.0, 150.26], [151.0, 153.82], [158.0, 159.93], [164.0, 164.1]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 35.78, 34.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.02, 0.0, 0.0, 0.0, 0.0, 35.49, 0.0, 0.0, 29.93, 0.0, 47.58, 34.78, 39.31, 34.62, 0.0, 0.0, 44.34, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 22.41], ["music", 11.52], ["vehicle", 7.61]], [["music", 26.9], ["hum", 14.06], ["mains hum", 8.13]], null, null, null, null, null, null, [["music", 58.07], ["hum", 8.31], ["throbbing", 5.12]], null, null, null, null, [["hum", 40.1], ["music", 16.75], ["mains hum", 12.25]], null, null, [["throbbing", 13.93], ["hum", 13.39], ["music", 8.27]], null, [["hum", 32.99], ["music", 20.76], ["throbbing", 17.89]], [["speech", 32.21], ["music", 25.54], ["throbbing", 16.58]], [["music", 32.14], ["throbbing", 24.34], ["hum", 6.28]], [["speech", 22.98], ["rumble", 20.39], ["hum", 14.5]], null, null, [["hum", 25.76], ["speech", 21.51], ["whale vocalization", 21.25]], null, null], "duration": [0.59, 0.24, 8.44, 2.27, 0.31, 0.96, 0.3, 0.73, 0.8, 1.11, 2.78, 1.86, 1.53, 0.11, 1.02, 3.76, 0.1, 0.21, 5.0, 1.34, 2.15, 2.86, 5.08, 13.46, 0.92, 0.26, 2.82, 1.93, 0.1]} \ No newline at end of file diff --git a/annotations_1/5YEw7F6ri_0_filtered.json b/annotations_1/5YEw7F6ri_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8d825e7372ab95a66f9acf95421dad3933a0d0e --- /dev/null +++ b/annotations_1/5YEw7F6ri_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 18.69], [26.0, 26.67], [29.0, 28.76], [33.0, 33.96], [38.0, 39.95], [43.0, 43.87], [47.0, 48.84], [51.0, 51.31], [54.0, 54.01], [57.0, 58.16], [68.0, 69.23], [71.0, 72.81], [74.0, 75.25], [76.0, 78.31], [81.0, 81.55], [83.0, 90.61], [100.0, 104.89], [106.0, 107.35], [108.0, 109.12], [110.0, 111.67], [116.0, 116.26], [117.0, 117.39], [120.0, 122.28], [123.0, 125.36], [126.0, 127.68], [129.0, 129.69], [131.0, 133.47], [135.0, 136.17], [139.0, 140.63], [145.0, 146.35], [148.0, 148.34], [151.0, 154.3], [155.0, 156.69], [157.0, 158.62], [160.0, 166.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.44, 0.0, 49.82, 79.94, 0.0, 0.0, 0.0, 0.0, 0.0, 48.44, 90.78, 0.0, 0.0, 75.23, 0.0, 0.0, 0.0, 0.0, 84.25, 0.0, 0.0, 44.12], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.86], ["sidetone", 29.64], ["sine wave", 10.8]], null, null, null, null, null, null, [["music", 64.39], ["guitar", 7.6], ["didgeridoo", 7.16]], null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 51.68], ["music", 27.8], ["musical instrument", 3.2]]], "duration": [-0.31, 0.67, -0.24, 0.96, 1.95, 0.87, 1.84, 0.31, 0.01, 1.16, 1.23, 1.81, 1.25, 2.31, 0.55, 7.61, 4.89, 1.35, 1.12, 1.67, 0.26, 0.39, 2.28, 2.36, 1.68, 0.69, 2.47, 1.17, 1.63, 1.35, 0.34, 3.3, 1.69, 1.62, 6.14]} \ No newline at end of file diff --git a/annotations_1/5YgMl4JQxKw_filtered.json b/annotations_1/5YgMl4JQxKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebe20c2f5932392e016718ae9fbb00d966e9c014 --- /dev/null +++ b/annotations_1/5YgMl4JQxKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.44], [11.0, 12.82], [20.0, 20.88], [26.0, 25.83], [30.0, 31.31], [38.0, 40.9], [41.0, 41.59], [44.0, 47.06], [48.0, 51.38], [53.0, 55.48], [57.0, 60.07], [61.0, 61.55], [63.0, 63.22], [65.0, 68.69], [74.0, 79.54], [81.0, 88.1], [92.0, 92.7], [95.0, 95.37], [98.0, 99.0], [100.0, 101.49], [103.0, 107.22], [107.0, 112.45], [115.0, 118.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [99.78, 0.0, 0.0, 0.0, 0.0, 53.65, 0.0, 46.64, 45.21, 94.81, 81.35, 0.0, 0.0, 73.21, 35.13, 40.34, 0.0, 0.0, 0.0, 0.0, 60.05, 55.31, 74.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["theremin", 60.86], ["music", 24.88], ["musical instrument", 2.75]], [["theremin", 35.05], ["music", 34.33], ["didgeridoo", 5.28]], null, null, null, null, null, [["music", 31.96], ["foghorn", 17.53], ["speech", 7.4]], [["music", 49.98], ["fart", 6.64], ["didgeridoo", 4.67]], null, null, null, null, null, null, null], "duration": [5.44, 1.82, 0.88, -0.17, 1.31, 2.9, 0.59, 3.06, 3.38, 2.48, 3.07, 0.55, 0.22, 3.69, 5.54, 7.1, 0.7, 0.37, 1.0, 1.49, 4.22, 5.45, 3.59]} \ No newline at end of file diff --git a/annotations_1/5ZCaXimXaxo_filtered.json b/annotations_1/5ZCaXimXaxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..813eb30a94ad3044792c5961deb978a4fe9b8bce --- /dev/null +++ b/annotations_1/5ZCaXimXaxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 21.39], [23.0, 23.63], [25.0, 25.64], [26.0, 26.87], [27.0, 28.09], [30.0, 30.67], [32.0, 36.26], [38.0, 38.55], [40.0, 45.67], [47.0, 52.78], [54.0, 55.16], [56.0, 57.75], [60.0, 60.74], [63.0, 64.08], [65.0, 65.65], [68.0, 69.11]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [37.72, 0.0, 0.0, 0.0, 0.0, 0.0, 54.76, 0.0, 44.9, 47.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["theremin", 62.63], ["music", 21.48], ["synthesizer", 4.61]], null, null, null, null, null, null, null, [["music", 41.44], ["mains hum", 5.59], ["musical instrument", 5.28]], [["theremin", 34.67], ["music", 20.72], ["chirp tone", 13.31]], null, null, null, null, null, null], "duration": [14.39, 0.63, 0.64, 0.87, 1.09, 0.67, 4.26, 0.55, 5.67, 5.78, 1.16, 1.75, 0.74, 1.08, 0.65, 1.11]} \ No newline at end of file diff --git a/annotations_1/5ZUgU9CsjDc_filtered.json b/annotations_1/5ZUgU9CsjDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2195df91dd119c31e5341fc407786c0a3b7b9d5a --- /dev/null +++ b/annotations_1/5ZUgU9CsjDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 82.78], [85.0, 86.09], [94.0, 98.69]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 29.76], "audiomae_on_audioset": [null, null, [["speech", 36.65], ["vehicle", 10.4], ["car", 10.01]]], "duration": [47.78, 1.09, 4.69]} \ No newline at end of file diff --git a/annotations_1/5_j3NrcDiS4_filtered.json b/annotations_1/5_j3NrcDiS4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c393046017de2fb62db93dbb51e7da382d84bfe --- /dev/null +++ b/annotations_1/5_j3NrcDiS4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 26.69], [27.0, 29.22], [31.0, 31.48], [33.0, 32.78], [39.0, 39.8], [49.0, 49.5], [50.0, 50.23], [50.0, 50.73], [51.0, 51.63], [53.0, 53.08], [54.0, 54.19], [55.0, 54.84], [55.0, 55.53], [56.0, 56.66], [57.0, 65.18], [66.0, 69.08], [84.0, 98.19], [99.0, 99.39], [105.0, 105.41], [106.0, 106.35], [107.0, 109.11], [110.0, 110.49], [116.0, 115.92], [118.0, 118.72], [120.0, 120.97], [123.0, 124.28], [125.0, 125.51], [128.0, 129.34], [132.0, 132.48], [135.0, 138.25], [142.0, 142.33], [147.0, 147.75], [149.0, 150.31], [153.0, 153.08], [155.0, 155.16], [157.0, 157.71], [159.0, 170.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.82, 47.35, 40.09, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25], "audiomae_on_audioset": [null, [["music", 74.22], ["musical instrument", 1.43], ["speech", 1.21]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.42], ["mains hum", 8.51], ["hum", 7.37]], [["music", 44.04], ["speech", 24.39], ["effects unit", 3.02]], [["music", 62.9], ["musical instrument", 6.39], ["cello", 3.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.31, 2.22, 0.48, -0.22, 0.8, 0.5, 0.23, 0.73, 0.63, 0.08, 0.19, -0.16, 0.53, 0.66, 8.18, 3.08, 14.19, 0.39, 0.41, 0.35, 2.11, 0.49, -0.08, 0.72, 0.97, 1.28, 0.51, 1.34, 0.48, 3.25, 0.33, 0.75, 1.31, 0.08, 0.16, 0.71, 11.45]} \ No newline at end of file diff --git a/annotations_1/5aY5jTL60pA_filtered.json b/annotations_1/5aY5jTL60pA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de5c85ffefdb07d4f2398cd469c10e1322c983a2 --- /dev/null +++ b/annotations_1/5aY5jTL60pA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.64], [15.0, 19.2], [27.0, 33.32], [36.0, 41.69], [45.0, 65.5], [67.0, 68.47], [72.0, 72.79], [79.0, 81.26], [83.0, 85.36], [87.0, 88.75], [90.0, 90.22], [92.0, 92.2], [93.0, 94.36], [95.0, 95.23], [95.0, 96.13], [99.0, 100.11], [103.0, 103.03], [122.0, 123.26], [126.0, 126.94], [136.0, 136.36], [137.0, 138.65], [139.0, 139.73], [143.0, 143.29], [146.0, 146.06], [149.0, 148.69], [149.0, 151.77], [164.0, 167.39], [168.0, 168.32], [169.0, 169.47], [170.0, 170.65], [174.0, 176.23], [177.0, 177.55], [178.0, 179.04]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [30.62, 30.26, 31.84, 29.61, 30.65, 0.0, 0.0, 60.23, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.83, 35.47, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 65.13], ["throbbing", 7.49], ["musical instrument", 4.64]], [["speech", 38.15], ["music", 27.9], ["boing", 17.69]], [["music", 42.86], ["speech", 15.26], ["hum", 12.99]], [["music", 42.17], ["boing", 20.97], ["throbbing", 7.92]], [["hum", 35.95], ["throbbing", 16.19], ["sidetone", 11.04]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 31.7], ["speech", 12.41], ["insect", 9.19]], [["speech", 31.86], ["boing", 27.0], ["thunk", 11.72]], null, null, null, null, null, null], "duration": [4.64, 4.2, 6.32, 5.69, 20.5, 1.47, 0.79, 2.26, 2.36, 1.75, 0.22, 0.2, 1.36, 0.23, 1.13, 1.11, 0.03, 1.26, 0.94, 0.36, 1.65, 0.73, 0.29, 0.06, -0.31, 2.77, 3.39, 0.32, 0.47, 0.65, 2.23, 0.55, 1.04]} \ No newline at end of file diff --git a/annotations_1/5asGTRoIqCw_filtered.json b/annotations_1/5asGTRoIqCw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/5asGTRoIqCw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/5bWanpZTnSQ_filtered.json b/annotations_1/5bWanpZTnSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75d8312de7b39a5fe55a2d0e9a68d1eedfef6cb8 --- /dev/null +++ b/annotations_1/5bWanpZTnSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 23.5], [25.0, 35.31], [39.0, 49.57], [53.0, 54.84], [63.0, 66.73], [68.0, 78.8], [82.0, 82.86], [85.0, 87.54], [93.0, 95.69], [98.0, 98.15], [101.0, 112.23], [113.0, 112.73], [113.0, 119.58], [120.0, 123.85], [126.0, 134.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.07, 80.29, 82.07, 0.0, 59.15, 54.97, 0.0, 50.51, 43.82, 0.0, 32.6, 0.0, 33.14, 32.44, 33.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["cello", 27.93], ["double bass", 25.84], ["music", 23.89]], null, [["music", 45.67], ["hum", 15.11], ["mains hum", 12.98]], null, [["music", 62.54], ["scary music", 7.99], ["ambient music", 4.65]], [["music", 62.76], ["theremin", 4.46], ["musical instrument", 3.88]], [["foghorn", 51.39], ["music", 33.07], ["brass instrument", 2.96]]], "duration": [6.5, 10.31, 10.57, 1.84, 3.73, 10.8, 0.86, 2.54, 2.69, 0.15, 11.23, -0.27, 6.58, 3.85, 8.5]} \ No newline at end of file diff --git a/annotations_1/5c1qYWHkPEc_filtered.json b/annotations_1/5c1qYWHkPEc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..965d1d6c20441aa67fa5ead7f4a9c32e7cc58126 --- /dev/null +++ b/annotations_1/5c1qYWHkPEc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.52], [12.0, 12.18], [25.0, 25.3], [28.0, 28.75], [30.0, 33.3], [35.0, 36.39], [37.0, 37.34], [43.0, 52.98], [54.0, 54.75], [57.0, 58.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 67.0, 0.0, 0.0, 54.63, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.18, 0.3, 0.75, 3.3, 1.39, 0.34, 9.98, 0.75, 1.04]} \ No newline at end of file diff --git a/annotations_1/5c3tOFFEcU4_filtered.json b/annotations_1/5c3tOFFEcU4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a9764d97d062e9b3582f8427aa1c04d058ef2d8 --- /dev/null +++ b/annotations_1/5c3tOFFEcU4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[107.0, 109.34], [109.0, 116.51], [117.0, 116.55]], "keep_status": [true, true, false], "silence_prob": [42.04, 39.5, 0.0], "audiomae_on_audioset": [[["music", 43.31], ["sidetone", 6.06], ["noise", 5.52]], [["speech", 23.63], ["music", 21.97], ["hum", 10.41]], null], "duration": [2.34, 7.51, -0.45]} \ No newline at end of file diff --git a/annotations_1/5cbim7n9ARs_filtered.json b/annotations_1/5cbim7n9ARs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e17c447e2f84ac3f8ce8170b6713b0a863ea4fad --- /dev/null +++ b/annotations_1/5cbim7n9ARs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 28.7], [31.0, 42.3], [45.0, 47.55], [48.0, 48.66], [51.0, 52.25], [57.0, 58.68], [66.0, 71.36], [74.0, 79.44], [85.0, 88.01], [96.0, 97.73], [99.0, 100.26], [102.0, 109.81], [110.0, 111.77], [116.0, 120.45], [126.0, 127.36], [131.0, 131.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.61, 64.97, 65.79, 0.0, 0.0, 0.0, 70.58, 69.88, 90.25, 0.0, 0.0, 64.29, 0.0, 43.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.01], ["speech", 33.4], ["didgeridoo", 3.71]], null, null], "duration": [8.7, 11.3, 2.55, 0.66, 1.25, 1.68, 5.36, 5.44, 3.01, 1.73, 1.26, 7.81, 1.77, 4.45, 1.36, 0.9]} \ No newline at end of file diff --git a/annotations_1/5ckqhebte9o_filtered.json b/annotations_1/5ckqhebte9o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4677f6502acf757196bdfa923bca943991142ab --- /dev/null +++ b/annotations_1/5ckqhebte9o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 139.21], [140.0, 139.99], [140.0, 140.02], [141.0, 145.96], [147.0, 148.1], [150.0, 151.23], [153.0, 152.98], [153.0, 153.01], [154.0, 154.5], [155.0, 155.38], [155.0, 155.56], [156.0, 157.65], [158.0, 159.76], [161.0, 162.26], [164.0, 168.76], [171.0, 172.32], [173.0, 176.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 30.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.86, 0.0, 33.35], "audiomae_on_audioset": [null, null, null, [["music", 66.52], ["musical instrument", 6.84], ["brass instrument", 6.4]], null, null, null, null, null, null, null, null, null, null, [["music", 48.36], ["synthesizer", 17.16], ["musical instrument", 7.83]], null, [["music", 48.29], ["didgeridoo", 7.62], ["musical instrument", 7.27]]], "duration": [133.21, -0.01, 0.02, 4.96, 1.1, 1.23, -0.02, 0.01, 0.5, 0.38, 0.56, 1.65, 1.76, 1.26, 4.76, 1.32, 3.49]} \ No newline at end of file diff --git a/annotations_1/5d1P50L28LU_filtered.json b/annotations_1/5d1P50L28LU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b59959fb69ccbb7ebf834012f80fbe2025befa2 --- /dev/null +++ b/annotations_1/5d1P50L28LU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.49], [12.0, 13.12], [14.0, 29.44], [32.0, 39.53], [42.0, 43.78], [45.0, 56.54], [57.0, 72.03], [75.0, 79.37], [81.0, 92.38], [94.0, 101.58], [103.0, 104.14], [108.0, 120.14], [121.0, 150.5], [154.0, 166.83]], "keep_status": [true, false, true, true, false, true, true, true, false, false, false, false, false, true], "silence_prob": [30.27, 0.0, 30.01, 30.47, 0.0, 29.81, 30.31, 29.01, 30.61, 30.59, 0.0, 30.08, 30.04, 32.67], "audiomae_on_audioset": [[["music", 44.4], ["noise", 11.78], ["cacophony", 6.69]], null, [["music", 21.16], ["machine gun", 19.69], ["sonar", 7.57]], [["vehicle", 28.31], ["buzz", 13.35], ["motorcycle", 11.1]], null, [["speech", 29.27], ["music", 26.56], ["mains hum", 6.5]], [["music", 41.64], ["speech", 13.85], ["synthesizer", 5.47]], [["music", 37.82], ["hum", 9.85], ["gong", 6.77]], [["speech", 55.39], ["music", 15.18], ["vehicle", 3.4]], [["throbbing", 50.54], ["hum", 22.08], ["music", 14.42]], null, [["music", 74.62], ["speech", 4.13], ["hum", 2.88]], [["music", 75.27], ["speech", 4.4], ["throbbing", 3.67]], [["hum", 28.72], ["mains hum", 27.27], ["music", 7.34]]], "duration": [6.49, 1.12, 15.44, 7.53, 1.78, 11.54, 15.03, 4.37, 11.38, 7.58, 1.14, 12.14, 29.5, 12.83]} \ No newline at end of file diff --git a/annotations_1/5dE-JjnKznQ_filtered.json b/annotations_1/5dE-JjnKznQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2977f323db21c1ed313390dc3ea0fbe8b4845646 --- /dev/null +++ b/annotations_1/5dE-JjnKznQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.94], [10.0, 11.21], [13.0, 33.02], [34.0, 53.86], [55.0, 61.38], [62.0, 62.5], [63.0, 62.95], [63.0, 63.41], [64.0, 63.73], [64.0, 75.78], [79.0, 82.85], [87.0, 91.47], [94.0, 95.39], [97.0, 97.58], [100.0, 102.9]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.27, 42.93, 38.52, 0.0, 0.0, 0.0, 0.0, 36.62, 100.0, 98.8, 0.0, 0.0, 54.9], "audiomae_on_audioset": [null, null, [["music", 40.39], ["speech", 14.51], ["wind instrument, woodwind instrument", 4.98]], [["music", 54.41], ["theremin", 21.13], ["animal", 4.72]], [["music", 37.6], ["speech", 33.0], ["hum", 5.29]], null, null, null, null, [["music", 69.89], ["chant", 3.6], ["speech", 2.42]], null, null, null, null, null], "duration": [1.94, 1.21, 20.02, 19.86, 6.38, 0.5, -0.05, 0.41, -0.27, 11.78, 3.85, 4.47, 1.39, 0.58, 2.9]} \ No newline at end of file diff --git a/annotations_1/5enqrVvjxg0_filtered.json b/annotations_1/5enqrVvjxg0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fcb431de7703540763e025cd89bbdf73405011b4 --- /dev/null +++ b/annotations_1/5enqrVvjxg0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.53], [9.0, 9.44], [12.0, 13.02], [16.0, 19.2], [21.0, 21.51], [23.0, 24.92], [26.0, 26.92], [28.0, 28.49], [31.0, 35.99], [38.0, 40.32], [42.0, 43.21], [46.0, 46.06], [47.0, 83.49], [88.0, 93.48], [101.0, 102.19], [103.0, 145.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.28, 0.0, 0.0, 0.0, 0.0, 44.29, 52.27, 0.0, 0.0, 0.0, 54.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 49.83], ["speech", 20.8], ["throbbing", 7.11]], null, null, null, null, null, null, null], "duration": [0.53, 0.44, 1.02, 3.2, 0.51, 1.92, 0.92, 0.49, 4.99, 2.32, 1.21, 0.06, 36.49, 5.48, 1.19, 42.37]} \ No newline at end of file diff --git a/annotations_1/5gOfKFlEJvo_filtered.json b/annotations_1/5gOfKFlEJvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c8acb77bf1c5be069c2644ec6f6b70f21e33880 --- /dev/null +++ b/annotations_1/5gOfKFlEJvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.7], [11.0, 14.07], [22.0, 24.22], [25.0, 26.16], [27.0, 28.12], [32.0, 33.34], [34.0, 34.74], [38.0, 55.39], [56.0, 69.31], [69.0, 69.38], [70.0, 70.39], [77.0, 77.21], [78.0, 88.87], [90.0, 91.34], [92.0, 93.28], [95.0, 95.91], [96.0, 96.99], [99.0, 100.45], [110.0, 111.74], [116.0, 115.96], [118.0, 117.95], [120.0, 120.9], [121.0, 122.54], [128.0, 143.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.43, 62.37, 67.25, 0.0, 0.0, 0.0, 0.0, 38.17, 60.51, 0.0, 0.0, 0.0, 73.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["thunk", 53.34], ["speech", 12.95], ["crushing", 12.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.7, 3.07, 2.22, 1.16, 1.12, 1.34, 0.74, 17.39, 13.31, 0.38, 0.39, 0.21, 10.87, 1.34, 1.28, 0.91, 0.99, 1.45, 1.74, -0.04, -0.05, 0.9, 1.54, 15.29]} \ No newline at end of file diff --git a/annotations_1/5gtFQegr2xA_filtered.json b/annotations_1/5gtFQegr2xA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7df81428d59fc29d91b7748d5044b95ba42d5fc --- /dev/null +++ b/annotations_1/5gtFQegr2xA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.5], [19.0, 20.68], [21.0, 21.66], [39.0, 39.99], [42.0, 42.48], [44.0, 52.37], [53.0, 56.05], [57.0, 57.54], [58.0, 59.02], [60.0, 62.87], [64.0, 64.84], [72.0, 72.99], [79.0, 79.52], [81.0, 82.19], [84.0, 84.89], [89.0, 89.87], [93.0, 95.88], [98.0, 98.0], [101.0, 102.57], [105.0, 106.54], [107.0, 108.33], [117.0, 117.58], [121.0, 122.2], [127.0, 127.95], [130.0, 130.0], [137.0, 136.86], [138.0, 141.51], [143.0, 142.97], [150.0, 150.72], [154.0, 155.19], [159.0, 160.56], [163.0, 163.53], [169.0, 170.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.89, 0.0, 0.0, 0.0, 0.0, 71.72, 94.66, 0.0, 0.0, 96.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.5, 1.68, 0.66, 0.99, 0.48, 8.37, 3.05, 0.54, 1.02, 2.87, 0.84, 0.99, 0.52, 1.19, 0.89, 0.87, 2.88, 0.0, 1.57, 1.54, 1.33, 0.58, 1.2, 0.95, 0.0, -0.14, 3.51, -0.03, 0.72, 1.19, 1.56, 0.53, 1.34]} \ No newline at end of file diff --git a/annotations_1/5h2uLkqpVV8_filtered.json b/annotations_1/5h2uLkqpVV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..791d191f8ded5db07f7d61a4c3e82e9d724f1fff --- /dev/null +++ b/annotations_1/5h2uLkqpVV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [2.0, 2.46], [3.0, 3.65], [5.0, 5.9], [10.0, 10.05], [13.0, 13.24], [14.0, 15.6], [19.0, 20.87], [26.0, 26.72], [27.0, 32.61], [43.0, 47.02], [48.0, 49.49], [53.0, 52.84], [59.0, 62.85], [66.0, 65.89], [68.0, 68.23], [69.0, 72.69], [79.0, 79.51], [80.0, 80.7], [81.0, 81.87], [90.0, 91.66]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.41, 74.44, 0.0, 0.0, 92.97, 0.0, 0.0, 64.18, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 42.87], ["speech", 17.45], ["drum machine", 9.44]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 0.46, 0.65, 0.9, 0.05, 0.24, 1.6, 1.87, 0.72, 5.61, 4.02, 1.49, -0.16, 3.85, -0.11, 0.23, 3.69, 0.51, 0.7, 0.87, 1.66]} \ No newline at end of file diff --git a/annotations_1/5h9E5SmLCVM_filtered.json b/annotations_1/5h9E5SmLCVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a097a30699780ea7c3aab22d4a196e8969ec0154 --- /dev/null +++ b/annotations_1/5h9E5SmLCVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[64.0, 64.12], [66.0, 130.38]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.12, 64.38]} \ No newline at end of file diff --git a/annotations_1/5hriUO428pw_filtered.json b/annotations_1/5hriUO428pw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0a67609de7b8975b5ff822c85de515fc5fbfeb9 --- /dev/null +++ b/annotations_1/5hriUO428pw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 36.81], [38.0, 38.52], [39.0, 38.58], [39.0, 44.95], [46.0, 51.75], [52.0, 53.99], [54.0, 54.03], [55.0, 63.95], [65.0, 66.19], [68.0, 86.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.81, 0.0, 0.0, 36.2, 56.63, 0.0, 0.0, 50.11, 0.0, 47.86], "audiomae_on_audioset": [[["fly, housefly", 36.07], ["sidetone", 28.89], ["insect", 13.4]], null, null, [["speech", 57.96], ["siren", 9.35], ["frog", 4.74]], null, null, null, null, null, [["frog", 30.92], ["sneeze", 23.94], ["whale vocalization", 19.3]]], "duration": [12.81, 0.52, -0.42, 5.95, 5.75, 1.99, 0.03, 8.95, 1.19, 18.34]} \ No newline at end of file diff --git a/annotations_1/5jv7TlhbjAQ_filtered.json b/annotations_1/5jv7TlhbjAQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..294b090ef852ef8733e6665bf4efc95a7177f40a --- /dev/null +++ b/annotations_1/5jv7TlhbjAQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 90.1], [91.0, 113.68], [115.0, 116.41], [118.0, 119.53], [124.0, 135.13], [137.0, 136.95]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 71.72, 0.0, 0.0, 40.84, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 62.61], ["music", 4.75], ["buzz", 3.96]], null], "duration": [69.1, 22.68, 1.41, 1.53, 11.13, -0.05]} \ No newline at end of file diff --git a/annotations_1/5kQCpsPnnew_filtered.json b/annotations_1/5kQCpsPnnew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..395319afee4de5e9d343bc796d8467b4b2a3f451 --- /dev/null +++ b/annotations_1/5kQCpsPnnew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.31], [8.0, 10.88], [11.0, 13.71], [14.0, 14.82], [16.0, 17.04], [21.0, 32.88], [35.0, 42.58], [46.0, 51.58], [53.0, 65.4], [69.0, 70.34], [74.0, 77.8], [80.0, 87.62], [88.0, 87.86], [88.0, 98.85], [101.0, 104.04], [105.0, 121.8], [124.0, 140.83], [142.0, 174.6]], "keep_status": [false, false, true, false, false, false, false, true, false, false, true, true, false, false, true, false, false, false], "silence_prob": [0.0, 66.27, 45.59, 0.0, 0.0, 36.45, 30.99, 29.76, 31.65, 0.0, 44.69, 36.22, 0.0, 33.4, 29.01, 28.91, 28.97, 0.0], "audiomae_on_audioset": [null, null, [["speech", 40.87], ["whack, thwack", 10.1], ["thunk", 6.05]], null, null, [["music", 33.88], ["mains hum", 22.61], ["hum", 19.84]], [["music", 64.4], ["screaming", 8.39], ["groan", 4.36]], [["music", 24.74], ["whack, thwack", 18.99], ["speech", 13.19]], [["music", 54.18], ["clang", 8.72], ["ding", 7.59]], null, [["music", 17.53], ["speech", 15.14], ["hum", 14.79]], [["speech", 38.09], ["whack, thwack", 9.94], ["music", 8.61]], null, [["music", 69.22], ["synthesizer", 6.74], ["theremin", 4.02]], [["music", 26.03], ["boing", 10.48], ["hum", 5.45]], [["music", 65.44], ["cacophony", 10.8], ["mains hum", 3.65]], [["music", 70.54], ["musical instrument", 6.37], ["theremin", 5.76]], null], "duration": [1.31, 2.88, 2.71, 0.82, 1.04, 11.88, 7.58, 5.58, 12.4, 1.34, 3.8, 7.62, -0.14, 10.85, 3.04, 16.8, 16.83, 32.6]} \ No newline at end of file diff --git a/annotations_1/5lPGiKG9VI8_filtered.json b/annotations_1/5lPGiKG9VI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..972f9e59892002eeb1c9ff2fd496cc5304866f54 --- /dev/null +++ b/annotations_1/5lPGiKG9VI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[73.0, 75.3]], "keep_status": [true], "silence_prob": [29.44], "audiomae_on_audioset": [[["music", 23.26], ["hum", 12.69], ["mains hum", 9.42]]], "duration": [2.3]} \ No newline at end of file diff --git a/annotations_1/5lekLtatLl0_filtered.json b/annotations_1/5lekLtatLl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc33d881fbd5b9a653cd01b04d584859c7a52b67 --- /dev/null +++ b/annotations_1/5lekLtatLl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.65], [13.0, 15.3], [15.0, 29.83], [31.0, 31.78], [32.0, 34.86], [36.0, 38.03], [39.0, 50.45], [52.0, 56.74], [57.0, 57.92], [59.0, 76.25], [77.0, 83.02], [83.0, 84.35], [85.0, 106.98], [110.0, 111.5]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 41.2, 28.77, 0.0, 51.12, 55.96, 30.11, 58.64, 0.0, 43.96, 65.2, 0.0, 31.04, 0.0], "audiomae_on_audioset": [null, [["mains hum", 39.71], ["hum", 31.43], ["music", 7.47]], [["speech", 64.63], ["music", 12.52], ["foghorn", 4.09]], null, null, null, [["theremin", 53.83], ["music", 27.72], ["whale vocalization", 4.46]], null, null, [["music", 50.18], ["theremin", 11.45], ["musical instrument", 4.59]], null, null, [["buzz", 14.77], ["mains hum", 13.75], ["hum", 11.47]], null], "duration": [1.65, 2.3, 14.83, 0.78, 2.86, 2.03, 11.45, 4.74, 0.92, 17.25, 6.02, 1.35, 21.98, 1.5]} \ No newline at end of file diff --git a/annotations_1/5lgCxWubUnU_filtered.json b/annotations_1/5lgCxWubUnU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6449b0fd81935ad2268a2555aff9660caff835e4 --- /dev/null +++ b/annotations_1/5lgCxWubUnU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.37], [9.0, 10.57], [12.0, 22.67], [23.0, 23.92], [26.0, 35.06], [38.0, 39.09], [43.0, 43.41], [43.0, 48.63], [55.0, 69.36], [74.0, 79.69], [87.0, 93.48], [95.0, 99.6]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 30.91, 0.0, 29.84, 0.0, 0.0, 29.3, 29.64, 29.74, 30.71, 30.11], "audiomae_on_audioset": [null, null, [["music", 73.03], ["speech", 5.17], ["musical instrument", 2.0]], null, [["music", 48.25], ["moo", 9.47], ["cattle, bovinae", 7.8]], null, null, [["music", 61.17], ["didgeridoo", 24.76], ["speech", 1.28]], [["music", 87.4], ["electronic music", 1.69], ["didgeridoo", 1.31]], [["music", 59.39], ["speech", 15.3], ["throbbing", 4.99]], [["music", 58.08], ["cattle, bovinae", 3.64], ["speech", 3.44]], [["music", 42.33], ["cattle, bovinae", 15.94], ["moo", 14.19]]], "duration": [1.37, 1.57, 10.67, 0.92, 9.06, 1.09, 0.41, 5.63, 14.36, 5.69, 6.48, 4.6]} \ No newline at end of file diff --git a/annotations_1/5m9Bf48pWc0_filtered.json b/annotations_1/5m9Bf48pWc0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad79928db21fa316573c16bced99ab103d347085 --- /dev/null +++ b/annotations_1/5m9Bf48pWc0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.89], [8.0, 8.53], [17.0, 17.37], [20.0, 20.17], [30.0, 30.16], [33.0, 33.62], [34.0, 34.7], [35.0, 35.16], [38.0, 39.87], [45.0, 44.88], [48.0, 48.12], [53.0, 54.03], [55.0, 54.85], [56.0, 57.35], [59.0, 59.78], [62.0, 63.63], [65.0, 66.55], [74.0, 75.25], [78.0, 81.43], [96.0, 96.08], [98.0, 98.51], [99.0, 98.78], [112.0, 114.94], [117.0, 118.67], [120.0, 132.09], [134.0, 136.32], [137.0, 137.64], [139.0, 141.08], [144.0, 145.98], [149.0, 153.1], [154.0, 156.39], [159.0, 160.59], [165.0, 165.06], [167.0, 167.59], [171.0, 175.68], [177.0, 179.12], [182.0, 183.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 63.1, 0.0, 35.63, 95.23, 0.0, 82.79, 0.0, 94.22, 72.9, 0.0, 0.0, 0.0, 95.64, 81.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.1], ["brass instrument", 11.65], ["trombone", 6.61]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.11, 0.53, 0.37, 0.17, 0.16, 0.62, 0.7, 0.16, 1.87, -0.12, 0.12, 1.03, -0.15, 1.35, 0.78, 1.63, 1.55, 1.25, 3.43, 0.08, 0.51, -0.22, 2.94, 1.67, 12.09, 2.32, 0.64, 2.08, 1.98, 4.1, 2.39, 1.59, 0.06, 0.59, 4.68, 2.12, 1.54]} \ No newline at end of file diff --git a/annotations_1/5mcjt53aqlE_filtered.json b/annotations_1/5mcjt53aqlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..460e4a2c34378100ad5481e3a1141ac07329c9cf --- /dev/null +++ b/annotations_1/5mcjt53aqlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 42.35]], "keep_status": [false], "silence_prob": [74.44], "audiomae_on_audioset": [null], "duration": [24.35]} \ No newline at end of file diff --git a/annotations_1/5noS6qGxcbM_filtered.json b/annotations_1/5noS6qGxcbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d5d2bd947ca5d8a9c326cad646129c2b4f36b2f --- /dev/null +++ b/annotations_1/5noS6qGxcbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [15.0, 17.0], [19.0, 19.68], [22.0, 23.23], [28.0, 28.93], [30.0, 31.45], [37.0, 36.86], [38.0, 38.13], [43.0, 44.27], [47.0, 47.58], [50.0, 50.36], [59.0, 58.95], [60.0, 62.99], [63.0, 64.86], [66.0, 66.68], [69.0, 70.39], [73.0, 73.7], [76.0, 76.57], [80.0, 83.86], [85.0, 86.81], [91.0, 103.01], [104.0, 104.35], [105.0, 129.0], [131.0, 133.35], [134.0, 134.86]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.39, 0.0, 0.0, 0.0, 0.0, 0.0, 38.37, 0.0, 28.92, 0.0, 28.96, 35.2, 0.0], "audiomae_on_audioset": [null, [["music", 46.31], ["frog", 11.82], ["whale vocalization", 5.33]], null, null, null, null, null, null, null, null, null, null, [["music", 25.5], ["hum", 21.72], ["throbbing", 11.07]], null, null, null, null, null, [["music", 26.96], ["hum", 26.14], ["throbbing", 19.43]], null, [["speech", 62.14], ["music", 17.2], ["breaking", 2.76]], null, [["music", 51.93], ["theremin", 13.43], ["gong", 6.99]], [["hum", 42.97], ["throbbing", 16.15], ["music", 13.0]], null], "duration": [0.42, 2.0, 0.68, 1.23, 0.93, 1.45, -0.14, 0.13, 1.27, 0.58, 0.36, -0.05, 2.99, 1.86, 0.68, 1.39, 0.7, 0.57, 3.86, 1.81, 12.01, 0.35, 24.0, 2.35, 0.86]} \ No newline at end of file diff --git a/annotations_1/5oHNA8muC4I_filtered.json b/annotations_1/5oHNA8muC4I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5980c9f73fab7f03c2dbe1bf290515bd301d10f1 --- /dev/null +++ b/annotations_1/5oHNA8muC4I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 63.24], [64.0, 73.95], [74.0, 80.35], [82.0, 84.23], [87.0, 89.51], [94.0, 94.8], [102.0, 103.71], [106.0, 107.13], [108.0, 109.92], [112.0, 114.62], [117.0, 122.44], [123.0, 123.23], [123.0, 123.7], [124.0, 127.4], [129.0, 130.82], [132.0, 133.54], [138.0, 139.65], [141.0, 143.8], [145.0, 147.97], [149.0, 150.53], [154.0, 157.6], [159.0, 164.66], [167.0, 167.78], [168.0, 173.47], [174.0, 180.2]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [35.33, 42.76, 48.69, 89.01, 99.99, 0.0, 0.0, 0.0, 0.0, 90.78, 80.46, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 95.78, 68.93, 0.0, 45.78, 99.82, 0.0, 97.92, 99.65], "audiomae_on_audioset": [[["music", 41.91], ["ambient music", 9.49], ["hum", 6.33]], [["music", 31.03], ["speech", 10.66], ["didgeridoo", 9.23]], [["speech", 18.96], ["music", 13.76], ["hum", 10.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 26.18], ["music", 24.41], ["guitar", 7.13]], null, null, null, null], "duration": [18.24, 9.95, 6.35, 2.23, 2.51, 0.8, 1.71, 1.13, 1.92, 2.62, 5.44, 0.23, 0.7, 3.4, 1.82, 1.54, 1.65, 2.8, 2.97, 1.53, 3.6, 5.66, 0.78, 5.47, 6.2]} \ No newline at end of file diff --git a/annotations_1/5qKySTAWpiY_filtered.json b/annotations_1/5qKySTAWpiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..355da132359cd89747418fcca833aaa06861ed02 --- /dev/null +++ b/annotations_1/5qKySTAWpiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.95], [10.0, 11.31], [12.0, 14.44], [16.0, 18.44], [19.0, 18.94], [23.0, 24.61], [25.0, 29.61], [31.0, 33.2], [39.0, 41.66], [43.0, 44.9], [47.0, 47.71], [48.0, 51.66], [54.0, 64.27], [65.0, 65.57], [66.0, 67.37], [68.0, 70.34], [71.0, 75.02], [75.0, 76.67], [80.0, 82.56], [83.0, 84.87], [86.0, 91.13], [93.0, 97.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 81.89, 92.48, 0.0, 0.0, 90.25, 97.83, 79.24, 0.0, 0.0, 56.25, 99.52, 0.0, 0.0, 62.58, 99.92, 0.0, 99.91, 0.0, 99.05, 99.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.95, 1.31, 2.44, 2.44, -0.06, 1.61, 4.61, 2.2, 2.66, 1.9, 0.71, 3.66, 10.27, 0.57, 1.37, 2.34, 4.02, 1.67, 2.56, 1.87, 5.13, 4.88]} \ No newline at end of file diff --git a/annotations_1/5rGPKIgdV6A_filtered.json b/annotations_1/5rGPKIgdV6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0eaa7e6b628a844944109a51572ba3ffe81d52c4 --- /dev/null +++ b/annotations_1/5rGPKIgdV6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.21], [8.0, 9.05], [11.0, 20.87], [24.0, 24.71], [26.0, 27.36], [28.0, 33.83], [38.0, 65.45], [71.0, 88.52], [91.0, 91.62], [92.0, 98.74], [99.0, 98.98], [101.0, 182.33], [184.0, 184.81]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [57.4, 0.0, 35.33, 0.0, 0.0, 32.24, 30.01, 30.36, 0.0, 29.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["mains hum", 35.86], ["hum", 32.51], ["music", 9.81]], null, null, [["fly, housefly", 31.49], ["speech", 14.83], ["mosquito", 11.32]], [["music", 74.06], ["speech", 6.58], ["throbbing", 6.05]], [["music", 83.37], ["scratching (performance technique)", 3.15], ["electronic music", 3.12]], null, [["music", 50.92], ["throbbing", 16.68], ["hum", 7.95]], null, null, null], "duration": [3.21, 1.05, 9.87, 0.71, 1.36, 5.83, 27.45, 17.52, 0.62, 6.74, -0.02, 81.33, 0.81]} \ No newline at end of file diff --git a/annotations_1/5rOdGpkURD8_filtered.json b/annotations_1/5rOdGpkURD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55522ebb5708db8f4e5f6d9069de2d5006825e9c --- /dev/null +++ b/annotations_1/5rOdGpkURD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.32], [26.0, 29.54], [30.0, 30.55], [31.0, 31.62], [32.0, 33.79], [35.0, 42.57], [49.0, 63.81], [67.0, 71.56], [72.0, 72.2], [73.0, 91.89], [101.0, 110.35], [114.0, 123.87], [129.0, 131.36], [131.0, 135.08], [136.0, 137.47], [138.0, 138.86], [140.0, 140.48], [141.0, 141.39], [144.0, 146.23], [147.0, 147.24], [149.0, 149.69]], "keep_status": [false, true, false, false, false, true, false, false, false, true, true, true, true, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 46.75, 0.0, 0.0, 0.0, 46.94, 53.34, 61.27, 0.0, 36.24, 36.44, 33.8, 34.67, 33.3, 0.0, 0.0, 0.0, 0.0, 36.72, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 33.65], ["sidetone", 17.27], ["hum", 6.33]], null, null, null, [["rain", 24.49], ["rain on surface", 19.14], ["fly, housefly", 12.08]], null, null, null, [["hum", 39.84], ["mains hum", 17.14], ["white noise", 8.05]], [["speech", 35.82], ["rain on surface", 8.8], ["rain", 6.3]], [["speech", 19.73], ["music", 17.75], ["fly, housefly", 12.23]], [["speech", 52.0], ["static", 6.45], ["eruption", 4.95]], [["livestock, farm animals, working animals", 18.22], ["noise", 16.98], ["speech", 13.16]], null, null, null, null, [["frog", 6.46], ["speech", 5.03], ["rain", 4.55]], null, null], "duration": [0.32, 3.54, 0.55, 0.62, 1.79, 7.57, 14.81, 4.56, 0.2, 18.89, 9.35, 9.87, 2.36, 4.08, 1.47, 0.86, 0.48, 0.39, 2.23, 0.24, 0.69]} \ No newline at end of file diff --git a/annotations_1/5sMFxEL3zhw_filtered.json b/annotations_1/5sMFxEL3zhw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad60cd64bea0128133a42593d5846fb345a87571 --- /dev/null +++ b/annotations_1/5sMFxEL3zhw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.58], [14.0, 16.31], [18.0, 24.46], [26.0, 30.01], [32.0, 35.72], [37.0, 41.49], [43.0, 48.93], [51.0, 50.82], [57.0, 57.15], [58.0, 61.3], [65.0, 67.8], [68.0, 75.9], [80.0, 79.61], [84.0, 96.31], [98.0, 99.94], [102.0, 102.95], [109.0, 109.66], [110.0, 114.45], [116.0, 116.9], [117.0, 118.0], [118.0, 121.1], [133.0, 134.22], [137.0, 138.64], [139.0, 147.33], [148.0, 150.62], [153.0, 156.79], [159.0, 160.03], [165.0, 166.35], [173.0, 174.19], [176.0, 177.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 87.0, 98.19, 85.17, 98.19, 99.36, 70.02, 0.0, 0.0, 78.72, 99.56, 57.56, 0.0, 64.63, 0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 52.98, 0.0, 0.0, 76.7, 72.6, 76.7, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.58, 2.31, 6.46, 4.01, 3.72, 4.49, 5.93, -0.18, 0.15, 3.3, 2.8, 7.9, -0.39, 12.31, 1.94, 0.95, 0.66, 4.45, 0.9, 1.0, 3.1, 1.22, 1.64, 8.33, 2.62, 3.79, 1.03, 1.35, 1.19, 1.89]} \ No newline at end of file diff --git a/annotations_1/5sNY4Rn7bYI_filtered.json b/annotations_1/5sNY4Rn7bYI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc0ccfaa1bc6d846bf92938ab34db364515ecbeb --- /dev/null +++ b/annotations_1/5sNY4Rn7bYI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.01], [21.0, 21.71], [22.0, 34.72], [40.0, 40.42], [44.0, 58.14], [62.0, 74.06], [77.0, 78.26]], "keep_status": [false, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 30.16, 0.0, 30.28, 30.07, 0.0], "audiomae_on_audioset": [null, null, [["music", 51.98], ["speech", 10.61], ["vehicle", 4.84]], null, [["music", 43.82], ["skidding", 10.58], ["vehicle", 9.11]], [["music", 35.92], ["vehicle", 13.75], ["race car, auto racing", 10.24]], null], "duration": [0.01, 0.71, 12.72, 0.42, 14.14, 12.06, 1.26]} \ No newline at end of file diff --git a/annotations_1/5tz8013avVU_filtered.json b/annotations_1/5tz8013avVU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae64eb26e57d4587c603a9696cf9a881fa8ce5b6 --- /dev/null +++ b/annotations_1/5tz8013avVU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.71], [3.0, 3.5], [4.0, 5.49], [11.0, 32.07], [34.0, 36.31], [38.0, 40.58], [42.0, 43.73], [48.0, 50.06], [50.0, 50.82], [60.0, 60.2], [60.0, 60.29], [60.0, 65.79], [69.0, 69.03], [73.0, 81.36], [85.0, 90.34]], "keep_status": [false, false, false, true, false, true, false, true, false, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 36.72, 36.2, 36.38, 0.0, 38.43, 0.0, 0.0, 0.0, 33.76, 0.0, 33.23, 32.55], "audiomae_on_audioset": [null, null, null, [["music", 28.81], ["speech", 17.61], ["hum", 11.28]], [["hum", 46.45], ["mains hum", 28.54], ["music", 6.14]], [["music", 24.14], ["speech", 20.4], ["hum", 11.96]], null, [["vehicle", 22.54], ["speech", 12.36], ["car", 10.2]], null, null, null, [["speech", 40.33], ["fly, housefly", 7.15], ["insect", 6.51]], null, [["hum", 41.25], ["music", 15.2], ["throbbing", 9.99]], [["music", 26.28], ["hum", 14.43], ["throbbing", 10.56]]], "duration": [-0.29, 0.5, 1.49, 21.07, 2.31, 2.58, 1.73, 2.06, 0.82, 0.2, 0.29, 5.79, 0.03, 8.36, 5.34]} \ No newline at end of file diff --git a/annotations_1/5uEViMQGON4_filtered.json b/annotations_1/5uEViMQGON4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f95471dcf12c0daa0f893bc666f78df2a30f8e44 --- /dev/null +++ b/annotations_1/5uEViMQGON4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.34], [35.0, 35.92], [41.0, 43.12], [47.0, 47.63], [55.0, 55.36], [66.0, 68.91], [76.0, 85.06], [91.0, 91.07], [101.0, 103.64], [109.0, 111.11], [113.0, 115.96], [127.0, 130.18], [136.0, 136.09], [142.0, 145.77], [152.0, 153.55], [165.0, 165.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.69, 0.0, 30.28, 0.0, 0.0, 29.92, 30.2, 0.0, 29.57, 29.89, 30.04, 29.56, 0.0, 30.17, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.53], ["bass guitar", 5.21], ["musical instrument", 4.04]], null, [["music", 58.71], ["bass guitar", 8.47], ["guitar", 5.09]], null, null, [["music", 65.96], ["musical instrument", 5.25], ["guitar", 2.43]], [["music", 70.11], ["funk", 3.83], ["bass guitar", 3.72]], null, [["music", 62.14], ["bass guitar", 5.94], ["musical instrument", 5.44]], [["music", 67.11], ["synthesizer", 4.69], ["theremin", 3.55]], [["music", 69.23], ["throbbing", 4.8], ["hum", 2.0]], [["music", 68.68], ["psychedelic rock", 7.32], ["musical instrument", 1.98]], null, [["music", 53.43], ["quack", 14.74], ["frog", 6.75]], null, null], "duration": [5.34, 0.92, 2.12, 0.63, 0.36, 2.91, 9.06, 0.07, 2.64, 2.11, 2.96, 3.18, 0.09, 3.77, 1.55, 0.1]} \ No newline at end of file diff --git a/annotations_1/5uvhg1AtZlQ_filtered.json b/annotations_1/5uvhg1AtZlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98e845243e856bc443473b8f6a74e2fcfe5211b7 --- /dev/null +++ b/annotations_1/5uvhg1AtZlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.97], [28.0, 62.16], [65.0, 65.15], [72.0, 72.47], [75.0, 74.66], [76.0, 76.03], [76.0, 88.16], [91.0, 98.47], [102.0, 109.32], [111.0, 123.33], [124.0, 156.1], [159.0, 158.57], [161.0, 168.94], [169.0, 180.59], [182.0, 183.63]], "keep_status": [false, false, false, false, false, false, true, true, true, true, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.19, 31.11, 29.29, 32.24, 0.0, 0.0, 28.71, 29.84, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 21.26], ["music", 12.02], ["hum", 6.16]], [["hum", 28.74], ["throbbing", 19.73], ["music", 16.99]], [["speech", 26.48], ["mains hum", 18.44], ["hum", 16.63]], [["music", 49.15], ["buzz", 7.37], ["livestock, farm animals, working animals", 6.86]], null, null, [["grunt", 28.96], ["livestock, farm animals, working animals", 11.93], ["animal", 10.61]], [["whack, thwack", 17.41], ["music", 11.11], ["breaking", 7.62]], null], "duration": [0.97, 34.16, 0.15, 0.47, -0.34, 0.03, 12.16, 7.47, 7.32, 12.33, 32.1, -0.43, 7.94, 11.59, 1.63]} \ No newline at end of file diff --git a/annotations_1/5vFi7gu-g-w_filtered.json b/annotations_1/5vFi7gu-g-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f9e004c6c80380c9181a965e0d1d34fdb77be9d --- /dev/null +++ b/annotations_1/5vFi7gu-g-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.67], [7.0, 7.37], [18.0, 34.91], [36.0, 36.68], [40.0, 51.24], [53.0, 53.57], [66.0, 66.51], [68.0, 67.81], [69.0, 69.52], [71.0, 71.29], [73.0, 73.63], [91.0, 91.67], [95.0, 95.42], [102.0, 102.56], [107.0, 107.6], [109.0, 109.76], [114.0, 114.02], [115.0, 115.84]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.44, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["synthesizer", 27.83], ["music", 20.04], ["hum", 10.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.33, 0.37, 16.91, 0.68, 11.24, 0.57, 0.51, -0.19, 0.52, 0.29, 0.63, 0.67, 0.42, 0.56, 0.6, 0.76, 0.02, 0.84]} \ No newline at end of file diff --git a/annotations_1/5vY-zNTuq8E_filtered.json b/annotations_1/5vY-zNTuq8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aec65c65d6a6c34864f9753c7934e12784682432 --- /dev/null +++ b/annotations_1/5vY-zNTuq8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 23.68], [39.0, 39.66], [52.0, 53.42], [61.0, 61.82], [68.0, 106.25], [110.0, 123.99], [125.0, 125.91], [128.0, 142.25], [147.0, 150.57], [152.0, 152.25]], "keep_status": [true, false, false, false, false, true, false, false, true, false], "silence_prob": [30.56, 0.0, 0.0, 0.0, 0.0, 29.88, 0.0, 29.22, 29.74, 0.0], "audiomae_on_audioset": [[["speech", 38.24], ["grunt", 14.73], ["whale vocalization", 5.88]], null, null, null, null, [["animal", 21.7], ["wild animals", 20.93], ["music", 16.64]], null, [["music", 56.43], ["wild animals", 14.38], ["roaring cats (lions, tigers)", 11.54]], [["vehicle", 32.9], ["car", 16.1], ["race car, auto racing", 6.22]], null], "duration": [21.68, 0.66, 1.42, 0.82, 38.25, 13.99, 0.91, 14.25, 3.57, 0.25]} \ No newline at end of file diff --git a/annotations_1/5ve2E8iEbSQ_filtered.json b/annotations_1/5ve2E8iEbSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4322ebf1688bce1fe75284d12dfd7c492bcd289c --- /dev/null +++ b/annotations_1/5ve2E8iEbSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 25.88], [27.0, 27.62], [29.0, 36.8], [77.0, 79.35], [86.0, 87.81], [92.0, 92.87], [99.0, 103.92], [106.0, 113.27], [116.0, 116.28], [132.0, 132.83], [133.0, 132.93], [136.0, 150.77], [158.0, 161.69], [169.0, 173.18], [174.0, 174.46]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 30.94, 33.2, 0.0, 0.0, 38.75, 38.45, 0.0, 0.0, 0.0, 30.92, 32.42, 33.09, 0.0], "audiomae_on_audioset": [null, null, [["music", 84.76], ["electronic music", 1.66], ["musical instrument", 1.05]], [["music", 46.89], ["speech", 26.22], ["electronic music", 1.36]], null, null, [["music", 56.23], ["throbbing", 9.92], ["speech", 6.74]], [["music", 36.38], ["hum", 18.16], ["throbbing", 10.87]], null, null, null, [["music", 60.36], ["sidetone", 11.08], ["speech", 10.72]], [["sidetone", 41.59], ["music", 30.04], ["speech", 8.44]], [["music", 30.77], ["hum", 17.54], ["mains hum", 13.99]], null], "duration": [-0.12, 0.62, 7.8, 2.35, 1.81, 0.87, 4.92, 7.27, 0.28, 0.83, -0.07, 14.77, 3.69, 4.18, 0.46]} \ No newline at end of file diff --git a/annotations_1/5wAlQf4WdiE_filtered.json b/annotations_1/5wAlQf4WdiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30984a452b0e849a591c43da21a0e3d04eec9704 --- /dev/null +++ b/annotations_1/5wAlQf4WdiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.84], [16.0, 16.14], [21.0, 21.69], [24.0, 24.46], [49.0, 49.27], [70.0, 71.52], [74.0, 73.97], [81.0, 85.08], [96.0, 96.38], [100.0, 109.46], [118.0, 119.23], [127.0, 127.87], [129.0, 131.23], [133.0, 135.78], [137.0, 137.66], [138.0, 138.97], [140.0, 140.44], [151.0, 152.42], [158.0, 158.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.27, 0.0, 34.09, 0.0, 0.0, 38.19, 87.92, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 62.41], ["vibraphone", 10.62], ["marimba, xylophone", 4.69]], null, [["music", 63.25], ["livestock, farm animals, working animals", 5.61], ["bleat", 5.51]], null, null, [["howl", 24.05], ["canidae, dogs, wolves", 20.02], ["siren", 10.78]], null, null, null, null, null, null], "duration": [0.84, 0.14, 0.69, 0.46, 0.27, 1.52, -0.03, 4.08, 0.38, 9.46, 1.23, 0.87, 2.23, 2.78, 0.66, 0.97, 0.44, 1.42, 0.57]} \ No newline at end of file diff --git a/annotations_1/5wErjt1ukFE_filtered.json b/annotations_1/5wErjt1ukFE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbb5d1024a774e9ee91d0ef392f0a8b4e93a3518 --- /dev/null +++ b/annotations_1/5wErjt1ukFE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.92], [14.0, 18.52], [21.0, 22.18], [24.0, 23.72], [27.0, 27.38], [30.0, 30.62], [33.0, 34.5], [36.0, 37.34], [38.0, 39.01], [44.0, 43.92], [44.0, 45.12], [48.0, 48.29], [50.0, 51.16], [54.0, 55.49], [65.0, 65.99], [67.0, 68.2], [70.0, 76.1], [77.0, 81.11], [82.0, 83.51], [84.0, 85.55], [87.0, 87.51], [89.0, 89.34], [91.0, 91.32], [93.0, 93.06], [105.0, 107.27], [108.0, 108.9], [114.0, 115.08], [117.0, 117.58], [122.0, 127.01], [129.0, 129.91], [133.0, 134.7], [136.0, 137.62], [140.0, 141.86], [145.0, 145.69], [147.0, 149.25], [150.0, 150.75], [154.0, 157.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.47, 62.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 67.38, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11, 0.0, 84.07], "audiomae_on_audioset": [null, [["speech", 63.72], ["vehicle", 18.23], ["car", 2.22]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 4.52, 1.18, -0.28, 0.38, 0.62, 1.5, 1.34, 1.01, -0.08, 1.12, 0.29, 1.16, 1.49, 0.99, 1.2, 6.1, 4.11, 1.51, 1.55, 0.51, 0.34, 0.32, 0.06, 2.27, 0.9, 1.08, 0.58, 5.01, 0.91, 1.7, 1.62, 1.86, 0.69, 2.25, 0.75, 3.08]} \ No newline at end of file diff --git a/annotations_1/5wcg-4j9CZ0_filtered.json b/annotations_1/5wcg-4j9CZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eeb830f06700848c0cc39505279c133b3c2b8919 --- /dev/null +++ b/annotations_1/5wcg-4j9CZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.44], [6.0, 9.09], [10.0, 14.32], [15.0, 21.47], [26.0, 39.16], [41.0, 63.64], [65.0, 65.04], [66.0, 68.64], [79.0, 79.88], [82.0, 86.86], [90.0, 94.15], [97.0, 110.54], [113.0, 114.27], [116.0, 118.47], [122.0, 123.45], [125.0, 128.76], [130.0, 135.14], [136.0, 138.89]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [32.45, 33.08, 32.13, 32.44, 32.71, 30.48, 0.0, 49.64, 0.0, 49.04, 54.36, 46.33, 0.0, 46.75, 0.0, 51.02, 45.46, 51.82], "audiomae_on_audioset": [[["music", 59.93], ["throbbing", 8.59], ["hum", 8.06]], [["music", 58.32], ["speech", 6.28], ["throbbing", 5.77]], [["music", 32.42], ["throbbing", 22.68], ["hum", 11.1]], [["music", 45.0], ["throbbing", 24.44], ["hum", 6.69]], [["music", 67.26], ["throbbing", 6.64], ["didgeridoo", 5.93]], [["music", 71.95], ["throbbing", 6.39], ["electronic music", 1.84]], null, [["throbbing", 38.05], ["hum", 35.16], ["mains hum", 5.25]], null, [["hum", 31.81], ["throbbing", 28.89], ["mains hum", 13.93]], null, [["throbbing", 43.21], ["hum", 29.78], ["heart sounds, heartbeat", 6.3]], null, [["hum", 27.19], ["music", 15.0], ["heart sounds, heartbeat", 12.88]], null, null, [["sonar", 44.42], ["music", 23.35], ["hum", 3.05]], null], "duration": [3.44, 3.09, 4.32, 6.47, 13.16, 22.64, 0.04, 2.64, 0.88, 4.86, 4.15, 13.54, 1.27, 2.47, 1.45, 3.76, 5.14, 2.89]} \ No newline at end of file diff --git a/annotations_1/5x1FeyWYp9s_filtered.json b/annotations_1/5x1FeyWYp9s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..731cbba10e474307e5d64da4f548f2b59419e9e6 --- /dev/null +++ b/annotations_1/5x1FeyWYp9s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.43], [7.0, 9.21], [20.0, 21.56], [34.0, 44.1], [46.0, 49.47], [68.0, 71.12], [71.0, 72.18], [86.0, 87.2], [97.0, 98.86], [107.0, 119.52], [121.0, 125.05], [130.0, 130.23], [135.0, 136.31], [138.0, 139.65]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 56.63, 0.0, 30.82, 30.8, 29.43, 0.0, 0.0, 0.0, 29.31, 29.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 90.81], ["folk music", 1.08], ["carnatic music", 1.04]], [["carnatic music", 43.37], ["music", 32.06], ["folk music", 2.21]], [["music", 61.71], ["middle eastern music", 3.4], ["singing", 2.61]], null, null, null, [["music", 81.3], ["singing", 2.92], ["folk music", 2.86]], [["music", 54.15], ["carnatic music", 7.58], ["musical instrument", 5.69]], null, null, null], "duration": [0.43, 2.21, 1.56, 10.1, 3.47, 3.12, 1.18, 1.2, 1.86, 12.52, 4.05, 0.23, 1.31, 1.65]} \ No newline at end of file diff --git a/annotations_1/5xnSzPHjw10_filtered.json b/annotations_1/5xnSzPHjw10_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..786059ef0a69eb23028dc51aa2f49ced8d53fe23 --- /dev/null +++ b/annotations_1/5xnSzPHjw10_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.47], [23.0, 23.06], [25.0, 25.78], [30.0, 30.37], [39.0, 39.8], [43.0, 44.56], [45.0, 49.18], [53.0, 54.94], [58.0, 65.47], [67.0, 70.02], [71.0, 78.04], [82.0, 82.02], [87.0, 88.38], [94.0, 94.51], [99.0, 99.5], [113.0, 113.39], [116.0, 116.8], [118.0, 118.27], [119.0, 119.84], [120.0, 120.78], [124.0, 126.93], [136.0, 136.61], [146.0, 148.64], [150.0, 149.98], [161.0, 162.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.28, 0.0, 36.62, 51.82, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 0.0, 99.1, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["whale vocalization", 95.05], ["animal", 1.23], ["frog", 0.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.06, 0.78, 0.37, 0.8, 1.56, 4.18, 1.94, 7.47, 3.02, 7.04, 0.02, 1.38, 0.51, 0.5, 0.39, 0.8, 0.27, 0.84, 0.78, 2.93, 0.61, 2.64, -0.02, 1.51]} \ No newline at end of file diff --git a/annotations_1/5zileWIEgoQ_filtered.json b/annotations_1/5zileWIEgoQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d311e868a739b2b36ac6cf74ed1343b44b1ecfb7 --- /dev/null +++ b/annotations_1/5zileWIEgoQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[55.0, 97.63], [100.0, 108.06], [109.0, 109.61], [111.0, 111.3], [112.0, 112.55], [114.0, 113.59], [114.0, 114.45], [117.0, 117.29], [123.0, 123.06], [124.0, 124.87], [128.0, 128.71], [130.0, 132.02], [138.0, 139.08], [146.0, 146.89], [152.0, 159.76]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 36.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.54, 0.0, 0.0, 43.98], "audiomae_on_audioset": [null, [["music", 42.92], ["explosion", 13.32], ["synthesizer", 4.15]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.72], ["whale vocalization", 16.15], ["gurgling", 9.46]]], "duration": [42.63, 8.06, 0.61, 0.3, 0.55, -0.41, 0.45, 0.29, 0.06, 0.87, 0.71, 2.02, 1.08, 0.89, 7.76]} \ No newline at end of file diff --git a/annotations_1/6-IGOKWYCDc_filtered.json b/annotations_1/6-IGOKWYCDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddad7b70ad248fcea1fe7b63c1e6bb7615454c99 --- /dev/null +++ b/annotations_1/6-IGOKWYCDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.36], [9.0, 11.31], [12.0, 26.16], [28.0, 32.02], [33.0, 61.4], [63.0, 65.28], [66.0, 66.99], [69.0, 69.35], [70.0, 72.13], [73.0, 75.71], [78.0, 85.02], [86.0, 99.79], [101.0, 105.07], [106.0, 107.03], [107.0, 127.38]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.95, 83.52, 52.45, 48.14, 44.12, 79.59, 0.0, 0.0, 64.52, 75.55, 54.5, 55.31, 59.68, 0.0, 44.09], "audiomae_on_audioset": [[["sidetone", 30.44], ["singing bowl", 14.18], ["speech", 11.73]], null, null, [["music", 34.65], ["singing bowl", 20.21], ["ambient music", 18.44]], [["music", 52.57], ["ambient music", 14.29], ["synthesizer", 6.28]], null, null, null, null, null, null, null, null, null, [["music", 56.5], ["speech", 14.01], ["whale vocalization", 4.18]]], "duration": [4.36, 2.31, 14.16, 4.02, 28.4, 2.28, 0.99, 0.35, 2.13, 2.71, 7.02, 13.79, 4.07, 1.03, 20.38]} \ No newline at end of file diff --git a/annotations_1/6-_tIPShuwQ_filtered.json b/annotations_1/6-_tIPShuwQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6eb02392c3eafd0775b049eb59873571234585e6 --- /dev/null +++ b/annotations_1/6-_tIPShuwQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.12], [21.0, 21.56], [29.0, 29.88], [57.0, 62.02], [62.0, 62.16], [62.0, 62.29], [62.0, 62.41], [74.0, 74.19], [74.0, 78.46], [84.0, 84.77], [111.0, 111.82], [116.0, 116.51], [128.0, 128.26], [133.0, 134.64], [135.0, 136.58], [138.0, 138.77], [142.0, 142.84], [148.0, 148.51], [150.0, 150.3], [160.0, 160.84], [164.0, 164.08], [173.0, 174.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 91.13, 0.0, 0.0, 0.0, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.12, 0.56, 0.88, 5.02, 0.16, 0.29, 0.41, 0.19, 4.46, 0.77, 0.82, 0.51, 0.26, 1.64, 1.58, 0.77, 0.84, 0.51, 0.3, 0.84, 0.08, 1.87]} \ No newline at end of file diff --git a/annotations_1/60V3JFUPvIE_filtered.json b/annotations_1/60V3JFUPvIE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..735bc5d1ee0ad50056f80a094d93c68e6416550f --- /dev/null +++ b/annotations_1/60V3JFUPvIE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.43], [10.0, 10.18], [11.0, 11.79], [20.0, 25.51], [26.0, 79.02], [84.0, 86.17], [87.0, 117.26], [118.0, 118.02], [120.0, 121.49], [123.0, 125.59], [128.0, 129.56], [130.0, 133.22], [137.0, 140.49], [143.0, 144.73], [148.0, 168.03], [171.0, 171.73], [174.0, 175.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [44.46, 0.0, 0.0, 34.78, 0.0, 35.12, 0.0, 0.0, 0.0, 97.64, 0.0, 97.64, 77.2, 0.0, 43.08, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 43.93], ["mains hum", 22.88], ["throbbing", 15.51]], null, null, [["hum", 49.8], ["mains hum", 18.01], ["throbbing", 8.73]], null, [["mains hum", 31.38], ["music", 21.33], ["hum", 17.84]], null, null, null, null, null, null, null, null, [["sonar", 45.5], ["music", 15.75], ["whale vocalization", 6.86]], null, null], "duration": [2.43, 0.18, 0.79, 5.51, 53.02, 2.17, 30.26, 0.02, 1.49, 2.59, 1.56, 3.22, 3.49, 1.73, 20.03, 0.73, 1.02]} \ No newline at end of file diff --git a/annotations_1/61cBscxr69E_filtered.json b/annotations_1/61cBscxr69E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7fc37c628c4940dac6a8bce7df90b63fd45a6b5 --- /dev/null +++ b/annotations_1/61cBscxr69E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 39.95], [49.0, 56.37], [62.0, 66.28], [67.0, 67.64], [69.0, 69.99], [73.0, 73.18], [76.0, 76.6], [84.0, 83.91], [90.0, 90.36], [91.0, 91.64], [93.0, 93.65], [94.0, 95.1], [96.0, 97.01], [98.0, 98.81], [107.0, 109.66], [119.0, 175.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 32.71, 44.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.41, 0.0], "audiomae_on_audioset": [null, [["music", 64.65], ["throbbing", 4.67], ["electronic music", 4.66]], [["music", 62.4], ["throbbing", 8.93], ["hum", 5.41]], null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 17.06], ["music", 16.09], ["speech", 14.91]], null], "duration": [0.95, 7.37, 4.28, 0.64, 0.99, 0.18, 0.6, -0.09, 0.36, 0.64, 0.65, 1.1, 1.01, 0.81, 2.66, 56.98]} \ No newline at end of file diff --git a/annotations_1/61nCIyBCmjg_filtered.json b/annotations_1/61nCIyBCmjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..020c758441857e57a4dfa7f35a3d5c416d6e6a16 --- /dev/null +++ b/annotations_1/61nCIyBCmjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.71], [12.0, 13.58], [14.0, 19.63], [22.0, 23.63], [25.0, 26.72], [27.0, 29.76], [35.0, 35.73], [36.0, 37.81], [39.0, 42.08], [44.0, 63.63], [67.0, 71.51], [74.0, 88.26], [89.0, 92.31], [94.0, 95.69], [97.0, 107.13], [109.0, 108.63], [110.0, 110.35], [112.0, 112.55], [114.0, 115.33], [117.0, 117.21], [118.0, 118.96], [120.0, 120.99], [122.0, 122.12], [123.0, 124.14], [125.0, 125.15], [126.0, 126.5], [127.0, 128.02], [128.0, 136.66], [138.0, 138.82]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.28, 0.0, 0.0, 47.39, 0.0, 0.0, 52.56, 43.85, 98.86, 99.82, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 17.38], ["foghorn", 13.28], ["speech", 10.84]], null, null, null, [["music", 35.79], ["ambient music", 14.26], ["theremin", 13.16]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.01], ["speech", 24.2], ["quack", 11.12]], null], "duration": [1.71, 1.58, 5.63, 1.63, 1.72, 2.76, 0.73, 1.81, 3.08, 19.63, 4.51, 14.26, 3.31, 1.69, 10.13, -0.37, 0.35, 0.55, 1.33, 0.21, 0.96, 0.99, 0.12, 1.14, 0.15, 0.5, 1.02, 8.66, 0.82]} \ No newline at end of file diff --git a/annotations_1/63Lf9kwyWd4_filtered.json b/annotations_1/63Lf9kwyWd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a068a86d405e36268c273605e61bfa381b5e9b9 --- /dev/null +++ b/annotations_1/63Lf9kwyWd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.47], [6.0, 22.76], [23.0, 29.0], [30.0, 30.27], [30.0, 30.32], [32.0, 33.57], [35.0, 35.8], [36.0, 36.1], [36.0, 52.57], [55.0, 80.08], [83.0, 83.76], [89.0, 90.85]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [91.13, 48.78, 58.55, 0.0, 0.0, 0.0, 0.0, 0.0, 32.56, 56.4, 0.0, 0.0], "audiomae_on_audioset": [null, [["sonar", 45.13], ["music", 29.26], ["thunk", 4.46]], null, null, null, null, null, null, [["music", 23.22], ["hum", 19.77], ["speech", 18.71]], null, null, null], "duration": [2.47, 16.76, 6.0, 0.27, 0.32, 1.57, 0.8, 0.1, 16.57, 25.08, 0.76, 1.85]} \ No newline at end of file diff --git a/annotations_1/64tSUb_LTdI_filtered.json b/annotations_1/64tSUb_LTdI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfc09fae1243fe579986f11fefcf84ac42f3a463 --- /dev/null +++ b/annotations_1/64tSUb_LTdI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.32], [10.0, 9.85], [11.0, 12.95], [24.0, 25.56], [29.0, 30.32], [31.0, 33.0], [38.0, 38.38], [49.0, 74.75], [85.0, 86.29], [90.0, 91.03], [93.0, 93.78], [95.0, 99.03], [102.0, 105.48], [109.0, 118.67], [120.0, 121.86], [126.0, 130.98], [133.0, 143.55]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.01, 0.0, 29.59, 0.0, 0.0, 0.0, 29.88, 30.83, 32.18, 0.0, 39.69, 38.06], "audiomae_on_audioset": [null, null, null, null, null, [["music", 47.59], ["musical instrument", 3.13], ["drum machine", 2.63]], null, [["music", 77.21], ["didgeridoo", 1.26], ["throbbing", 1.22]], null, null, null, [["music", 74.59], ["synthesizer", 3.44], ["hum", 2.32]], [["music", 38.94], ["didgeridoo", 21.8], ["theremin", 6.27]], [["music", 54.22], ["didgeridoo", 6.89], ["synthesizer", 4.66]], null, [["music", 48.29], ["vocal music", 3.73], ["musical instrument", 3.42]], [["music", 44.63], ["speech", 10.46], ["hum", 9.79]]], "duration": [1.32, -0.15, 1.95, 1.56, 1.32, 2.0, 0.38, 25.75, 1.29, 1.03, 0.78, 4.03, 3.48, 9.67, 1.86, 4.98, 10.55]} \ No newline at end of file diff --git a/annotations_1/65pGOp7qa_s_filtered.json b/annotations_1/65pGOp7qa_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0350281c707d8f40c5e0150d8094be4e7df4f27 --- /dev/null +++ b/annotations_1/65pGOp7qa_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.62], [9.0, 11.4], [21.0, 22.62], [30.0, 31.01], [40.0, 41.23], [49.0, 57.15], [58.0, 92.6], [93.0, 96.97], [99.0, 107.57], [109.0, 138.62], [141.0, 164.25]], "keep_status": [false, true, false, false, false, true, false, true, false, true, true], "silence_prob": [0.0, 33.64, 0.0, 0.0, 0.0, 31.69, 0.0, 29.88, 31.08, 30.75, 29.58], "audiomae_on_audioset": [null, [["music", 9.86], ["animal", 7.51], ["hum", 5.15]], null, null, null, [["music", 30.27], ["hum", 15.03], ["throbbing", 7.73]], null, [["music", 16.51], ["fly, housefly", 13.67], ["moo", 9.91]], [["speech", 44.26], ["music", 32.18], ["vehicle", 1.9]], [["music", 24.03], ["cattle, bovinae", 10.65], ["buzz", 9.21]], [["music", 22.5], ["speech", 10.8], ["outside, rural or natural", 6.79]]], "duration": [1.62, 2.4, 1.62, 1.01, 1.23, 8.15, 34.6, 3.97, 8.57, 29.62, 23.25]} \ No newline at end of file diff --git a/annotations_1/67dyb52zKRs_filtered.json b/annotations_1/67dyb52zKRs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5213a3a126ec01744c344c4e5c3072252373da55 --- /dev/null +++ b/annotations_1/67dyb52zKRs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 45.1], [49.0, 49.55], [52.0, 53.0], [54.0, 54.24], [55.0, 61.15]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.81], "audiomae_on_audioset": [null, null, null, null, [["cattle, bovinae", 19.73], ["music", 18.33], ["moo", 13.91]]], "duration": [37.1, 0.55, 1.0, 0.24, 6.15]} \ No newline at end of file diff --git a/annotations_1/688uSEwvYnQ_filtered.json b/annotations_1/688uSEwvYnQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74344d9499564a178214ac36a91dfbcb7c601352 --- /dev/null +++ b/annotations_1/688uSEwvYnQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.52], [12.0, 13.81], [15.0, 15.35], [16.0, 17.32], [18.0, 25.47], [26.0, 26.4], [28.0, 36.1], [37.0, 40.2], [41.0, 41.18], [42.0, 43.26], [47.0, 47.78], [48.0, 54.26], [55.0, 56.0], [58.0, 59.64], [60.0, 60.69], [62.0, 62.28], [63.0, 63.71], [65.0, 65.45], [66.0, 67.02], [68.0, 69.75], [70.0, 72.6], [74.0, 74.63], [77.0, 77.7], [79.0, 79.1], [81.0, 82.68], [86.0, 91.52], [93.0, 93.19], [96.0, 96.8], [98.0, 99.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 72.01, 0.0, 57.64, 78.21, 0.0, 0.0, 0.0, 65.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.18, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 84.36], ["speech synthesizer", 5.08], ["sidetone", 2.92]], null, null, null, null, null, null, null, null], "duration": [0.52, 1.81, 0.35, 1.32, 7.47, 0.4, 8.1, 3.2, 0.18, 1.26, 0.78, 6.26, 1.0, 1.64, 0.69, 0.28, 0.71, 0.45, 1.02, 1.75, 2.6, 0.63, 0.7, 0.1, 1.68, 5.52, 0.19, 0.8, 1.72]} \ No newline at end of file diff --git a/annotations_1/68CXG6t1mxU_filtered.json b/annotations_1/68CXG6t1mxU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2284f6b29c010512238ba129b8df2b9573d0b66 --- /dev/null +++ b/annotations_1/68CXG6t1mxU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.42], [6.0, 5.73], [7.0, 7.65], [10.0, 11.72], [28.0, 30.81], [36.0, 36.68], [38.0, 38.94], [42.0, 43.21], [48.0, 49.71], [67.0, 67.32], [84.0, 85.5], [90.0, 90.46], [95.0, 95.0], [101.0, 102.29], [103.0, 103.05], [103.0, 103.18], [103.0, 111.5], [112.0, 113.41], [116.0, 116.7], [120.0, 131.35], [133.0, 134.52], [141.0, 141.88], [143.0, 142.86], [159.0, 160.76], [164.0, 167.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 0.0, 67.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 25.83], ["hum", 13.81], ["animal", 9.32]], null, null, null, null, null, null, null, null], "duration": [0.42, -0.27, 0.65, 1.72, 2.81, 0.68, 0.94, 1.21, 1.71, 0.32, 1.5, 0.46, 0.0, 1.29, 0.05, 0.18, 8.5, 1.41, 0.7, 11.35, 1.52, 0.88, -0.14, 1.76, 3.27]} \ No newline at end of file diff --git a/annotations_1/68SlAT125f8_filtered.json b/annotations_1/68SlAT125f8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41ed9011b51da761cf6adc4bddeaf641c0886be7 --- /dev/null +++ b/annotations_1/68SlAT125f8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.03], [6.0, 6.61], [8.0, 11.03], [17.0, 31.67], [34.0, 43.29], [46.0, 49.03], [50.0, 55.95], [57.0, 56.61]], "keep_status": [false, false, true, true, true, false, true, false], "silence_prob": [30.76, 0.0, 29.45, 29.5, 29.21, 28.44, 28.53, 0.0], "audiomae_on_audioset": [[["music", 36.51], ["throbbing", 27.18], ["hum", 14.24]], null, [["speech", 40.85], ["music", 10.29], ["explosion", 5.65]], [["music", 36.58], ["hum", 18.03], ["speech", 11.83]], [["buzz", 26.45], ["mains hum", 17.54], ["hum", 16.69]], [["music", 62.19], ["speech", 4.92], ["scary music", 4.08]], [["music", 36.63], ["speech", 12.08], ["explosion", 6.92]], null], "duration": [2.03, 0.61, 3.03, 14.67, 9.29, 3.03, 5.95, -0.39]} \ No newline at end of file diff --git a/annotations_1/68av2-Ti-GU_filtered.json b/annotations_1/68av2-Ti-GU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a386935100ea2810adeefc7285c519d00b53a75 --- /dev/null +++ b/annotations_1/68av2-Ti-GU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.0], [9.0, 14.27], [15.0, 14.98], [15.0, 16.24], [17.0, 28.26], [30.0, 33.86], [35.0, 35.78], [37.0, 57.0], [58.0, 83.61], [85.0, 88.8], [89.0, 98.19], [100.0, 102.81]], "keep_status": [true, true, false, false, true, false, false, true, true, false, false, true], "silence_prob": [46.5, 37.28, 0.0, 0.0, 40.14, 69.88, 0.0, 37.19, 42.55, 91.47, 54.9, 38.37], "audiomae_on_audioset": [[["music", 30.58], ["hum", 18.88], ["mains hum", 10.49]], [["speech", 52.54], ["sidetone", 9.64], ["hum", 7.0]], null, null, [["hum", 35.1], ["throbbing", 14.89], ["noise", 12.28]], null, null, [["music", 27.54], ["hum", 20.32], ["throbbing", 13.99]], [["music", 25.58], ["speech", 18.86], ["thunk", 13.11]], null, null, [["music", 39.39], ["hum", 9.15], ["mains hum", 6.22]]], "duration": [3.0, 5.27, -0.02, 1.24, 11.26, 3.86, 0.78, 20.0, 25.61, 3.8, 9.19, 2.81]} \ No newline at end of file diff --git a/annotations_1/68igl3sbzFI_filtered.json b/annotations_1/68igl3sbzFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1c22ed12937b8646047b33c59d144dad8d5ee7f --- /dev/null +++ b/annotations_1/68igl3sbzFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 29.02], [30.0, 45.69], [46.0, 51.34]], "keep_status": [false, false, false], "silence_prob": [0.0, 58.55, 54.04], "audiomae_on_audioset": [null, null, null], "duration": [1.02, 15.69, 5.34]} \ No newline at end of file diff --git a/annotations_1/69v1tcsG6nc_filtered.json b/annotations_1/69v1tcsG6nc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3503c6b6b4b4ea8797af9b4d092f0ac0a02f5318 --- /dev/null +++ b/annotations_1/69v1tcsG6nc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.43], [7.0, 7.6], [9.0, 9.59], [12.0, 14.59], [16.0, 17.0], [20.0, 21.19], [24.0, 25.15], [30.0, 29.64], [31.0, 32.17], [34.0, 35.31], [36.0, 38.13], [39.0, 39.7], [41.0, 42.25], [44.0, 44.95], [45.0, 46.57], [48.0, 48.57], [54.0, 56.46], [58.0, 59.07], [59.0, 61.94], [67.0, 67.56], [73.0, 73.41], [77.0, 77.8], [83.0, 87.07], [91.0, 94.05], [97.0, 98.25], [99.0, 99.45], [101.0, 102.86], [108.0, 108.58], [111.0, 111.79], [116.0, 116.58], [117.0, 119.85], [125.0, 126.01], [131.0, 131.08], [141.0, 140.88], [143.0, 143.88], [145.0, 150.89], [151.0, 151.63], [153.0, 153.5], [155.0, 155.63], [167.0, 168.78], [170.0, 184.94], [185.0, 186.76], [189.0, 189.75], [191.0, 191.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 89.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 0.0, 96.66, 0.0, 0.0, 0.0, 100.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 46.19, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 19.83], ["sidetone", 17.86], ["speech", 9.78]], null, null, null], "duration": [0.43, 0.6, 0.59, 2.59, 1.0, 1.19, 1.15, -0.36, 1.17, 1.31, 2.13, 0.7, 1.25, 0.95, 1.57, 0.57, 2.46, 1.07, 2.94, 0.56, 0.41, 0.8, 4.07, 3.05, 1.25, 0.45, 1.86, 0.58, 0.79, 0.58, 2.85, 1.01, 0.08, -0.12, 0.88, 5.89, 0.63, 0.5, 0.63, 1.78, 14.94, 1.76, 0.75, 0.84]} \ No newline at end of file diff --git a/annotations_1/6AE1I5edCfQ_filtered.json b/annotations_1/6AE1I5edCfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25c8f09b471c46dd49e7cd6bee21f54abf4e4e69 --- /dev/null +++ b/annotations_1/6AE1I5edCfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.73], [5.0, 5.63], [7.0, 9.14], [11.0, 12.11], [13.0, 14.01], [15.0, 16.19], [21.0, 22.03], [30.0, 31.35], [33.0, 33.52], [35.0, 36.56], [38.0, 38.87], [41.0, 41.15], [41.0, 41.32], [41.0, 41.35], [42.0, 41.86], [45.0, 45.96], [49.0, 49.25], [66.0, 65.7], [67.0, 67.27], [72.0, 71.71], [74.0, 74.07], [74.0, 75.98], [85.0, 85.53]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 46.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 30.5], ["moo", 15.48], ["whale vocalization", 11.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.73, 0.63, 2.14, 1.11, 1.01, 1.19, 1.03, 1.35, 0.52, 1.56, 0.87, 0.15, 0.32, 0.35, -0.14, 0.96, 0.25, -0.3, 0.27, -0.29, 0.07, 1.98, 0.53]} \ No newline at end of file diff --git a/annotations_1/6AJH6b91rF8_filtered.json b/annotations_1/6AJH6b91rF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70c77158639cbf0a32a3fa7cb48cda55bd9ef76f --- /dev/null +++ b/annotations_1/6AJH6b91rF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.99], [7.0, 7.94], [12.0, 12.77], [14.0, 15.89], [16.0, 17.46], [21.0, 22.38], [25.0, 26.38], [37.0, 38.48], [49.0, 52.96], [54.0, 54.87], [57.0, 57.77], [59.0, 59.91], [61.0, 61.94], [72.0, 72.81], [89.0, 89.73], [91.0, 92.53], [94.0, 94.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.01, 0.94, 0.77, 1.89, 1.46, 1.38, 1.38, 1.48, 3.96, 0.87, 0.77, 0.91, 0.94, 0.81, 0.73, 1.53, 0.1]} \ No newline at end of file diff --git a/annotations_1/6AWMlRhBN5U_filtered.json b/annotations_1/6AWMlRhBN5U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c882b024fee641e64cde273325f2414fbb7bd5b8 --- /dev/null +++ b/annotations_1/6AWMlRhBN5U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 1.39], [15.0, 15.55], [18.0, 18.93], [22.0, 22.6], [26.0, 34.47], [36.0, 36.1], [38.0, 38.67], [42.0, 42.92], [52.0, 51.85], [62.0, 62.4], [64.0, 64.61], [67.0, 68.17], [69.0, 70.56], [71.0, 76.06], [82.0, 83.03], [87.0, 88.32], [91.0, 92.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.39, 0.55, 0.93, 0.6, 8.47, 0.1, 0.67, 0.92, -0.15, 0.4, 0.61, 1.17, 1.56, 5.06, 1.03, 1.32, 1.37]} \ No newline at end of file diff --git a/annotations_1/6BBGO5M_2A0_filtered.json b/annotations_1/6BBGO5M_2A0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f26a5866f34b97a76e59c3f5a54de5e3b00157d --- /dev/null +++ b/annotations_1/6BBGO5M_2A0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 10.49], [13.0, 87.37], [89.0, 98.88], [100.0, 99.77], [100.0, 104.63], [105.0, 106.62]], "keep_status": [false, false, false, false, true, false], "silence_prob": [98.01, 0.0, 32.17, 0.0, 35.42, 0.0], "audiomae_on_audioset": [null, null, [["speech", 65.71], ["fly, housefly", 5.68], ["bee, wasp, etc.", 3.48]], null, [["groan", 41.41], ["music", 13.0], ["speech", 12.5]], null], "duration": [9.49, 74.37, 9.88, -0.23, 4.63, 1.62]} \ No newline at end of file diff --git a/annotations_1/6CBfg5X9Z3Y_filtered.json b/annotations_1/6CBfg5X9Z3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1f1755f49006e08a5544e7150ed9b82e8418b10 --- /dev/null +++ b/annotations_1/6CBfg5X9Z3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.89], [4.0, 5.71], [6.0, 8.36], [12.0, 11.97], [17.0, 16.73], [17.0, 17.41], [18.0, 18.57], [19.0, 21.42], [24.0, 24.16], [40.0, 41.15], [55.0, 55.39], [68.0, 68.27], [79.0, 80.16], [81.0, 81.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 91.81, 0.0, 0.0, 0.0, 0.0, 63.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.89, 1.71, 2.36, -0.03, -0.27, 0.41, 0.57, 2.42, 0.16, 1.15, 0.39, 0.27, 1.16, 0.26]} \ No newline at end of file diff --git a/annotations_1/6CmxSs6Mmx4_filtered.json b/annotations_1/6CmxSs6Mmx4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cbd2a0f4bcc35f129420816a0cfd64eaaf66c4e --- /dev/null +++ b/annotations_1/6CmxSs6Mmx4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.45]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.45]} \ No newline at end of file diff --git a/annotations_1/6D64t1trSRs_filtered.json b/annotations_1/6D64t1trSRs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8d942ad064de3d620c7fb1efbd365c518ab786c --- /dev/null +++ b/annotations_1/6D64t1trSRs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.91], [8.0, 35.38], [38.0, 114.22], [115.0, 117.02], [119.0, 119.7], [122.0, 134.45], [138.0, 140.61], [143.0, 144.19], [146.0, 149.27], [150.0, 152.24], [153.0, 154.99], [158.0, 158.73], [161.0, 161.27], [164.0, 164.61], [166.0, 166.95]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [46.75, 36.28, 0.0, 74.29, 0.0, 71.72, 87.0, 0.0, 92.64, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 10.39], ["hum", 6.23], ["sine wave", 5.67]], [["speech", 34.22], ["breaking", 16.39], ["music", 13.07]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.91, 27.38, 76.22, 2.02, 0.7, 12.45, 2.61, 1.19, 3.27, 2.24, 1.99, 0.73, 0.27, 0.61, 0.95]} \ No newline at end of file diff --git a/annotations_1/6Dg0qouE5Zo_filtered.json b/annotations_1/6Dg0qouE5Zo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..607cfb239bf3fd9c53c4c1884cd8112a34453460 --- /dev/null +++ b/annotations_1/6Dg0qouE5Zo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.86], [12.0, 13.59], [15.0, 20.11], [21.0, 23.79], [27.0, 45.74], [49.0, 49.28], [52.0, 51.71], [54.0, 54.41], [71.0, 71.37], [81.0, 81.58], [84.0, 84.3], [85.0, 86.78], [96.0, 96.62], [97.0, 97.02], [97.0, 97.43], [120.0, 120.83], [122.0, 122.96], [128.0, 130.33], [132.0, 132.54], [133.0, 135.55], [139.0, 139.78], [141.0, 141.17], [142.0, 142.91], [161.0, 165.92]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [96.04, 0.0, 56.48, 47.35, 31.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.63, 0.0, 44.9, 0.0, 0.0, 0.0, 34.0], "audiomae_on_audioset": [null, null, null, [["cattle, bovinae", 14.05], ["speech", 13.41], ["livestock, farm animals, working animals", 10.76]], [["music", 66.6], ["speech", 6.45], ["didgeridoo", 3.44]], null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 24.97], ["cattle, bovinae", 20.06], ["moo", 18.08]], null, [["speech", 21.77], ["sidetone", 6.99], ["music", 6.26]], null, null, null, [["speech", 32.3], ["music", 9.22], ["explosion", 6.94]]], "duration": [3.86, 1.59, 5.11, 2.79, 18.74, 0.28, -0.29, 0.41, 0.37, 0.58, 0.3, 1.78, 0.62, 0.02, 0.43, 0.83, 0.96, 2.33, 0.54, 2.55, 0.78, 0.17, 0.91, 4.92]} \ No newline at end of file diff --git a/annotations_1/6DlOr1PP0Fc_filtered.json b/annotations_1/6DlOr1PP0Fc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34f2a687d2568b962ff463a850af17119cce4943 --- /dev/null +++ b/annotations_1/6DlOr1PP0Fc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [4.0, 5.93], [8.0, 8.38], [10.0, 19.13], [20.0, 21.46], [22.0, 33.81], [35.0, 61.94], [64.0, 88.6], [90.0, 95.88], [96.0, 106.49], [108.0, 153.52], [154.0, 155.8], [157.0, 180.54], [182.0, 182.09], [183.0, 184.0], [185.0, 185.36], [186.0, 202.71], [204.0, 204.5], [206.0, 206.14], [207.0, 208.67], [213.0, 216.21]], "keep_status": [false, false, false, false, false, true, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.16, 0.0, 37.52, 39.54, 32.76, 40.71, 32.92, 0.0, 0.0, 32.72, 0.0, 0.0, 0.0, 31.65, 0.0, 0.0, 0.0, 31.6], "audiomae_on_audioset": [null, null, null, null, null, [["music", 30.34], ["whack, thwack", 10.98], ["speech", 8.24]], [["music", 64.33], ["speech", 6.5], ["didgeridoo", 6.25]], [["music", 49.97], ["fly, housefly", 8.96], ["mosquito", 5.26]], [["music", 32.27], ["throbbing", 18.61], ["speech", 16.87]], [["speech", 50.11], ["music", 24.63], ["noise", 3.26]], null, null, [["music", 47.7], ["throbbing", 7.49], ["didgeridoo", 6.19]], null, null, null, [["music", 56.16], ["speech", 14.33], ["breaking", 5.18]], null, null, null, [["music", 66.56], ["throbbing", 4.6], ["musical instrument", 2.61]]], "duration": [0.72, 1.93, 0.38, 9.13, 1.46, 11.81, 26.94, 24.6, 5.88, 10.49, 45.52, 1.8, 23.54, 0.09, 1.0, 0.36, 16.71, 0.5, 0.14, 1.67, 3.21]} \ No newline at end of file diff --git a/annotations_1/6DmSVYtMoyQ_filtered.json b/annotations_1/6DmSVYtMoyQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bf1585851bb5670ab38d7c33b6f90cc20debe2b --- /dev/null +++ b/annotations_1/6DmSVYtMoyQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.03], [13.0, 13.86], [16.0, 16.66], [20.0, 22.06], [23.0, 43.83], [45.0, 61.28], [65.0, 68.01], [69.0, 79.59], [81.0, 80.91], [82.0, 112.04], [115.0, 116.43], [119.0, 143.09], [145.0, 149.44]], "keep_status": [false, false, false, true, false, true, true, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 43.25, 30.05, 32.59, 35.39, 29.23, 0.0, 0.0, 0.0, 35.56, 46.83], "audiomae_on_audioset": [null, null, null, [["music", 40.87], ["throbbing", 9.95], ["hum", 9.03]], [["music", 75.38], ["hum", 6.9], ["throbbing", 4.56]], [["music", 62.44], ["throbbing", 4.19], ["theremin", 3.33]], [["hum", 28.47], ["mains hum", 20.49], ["speech", 19.56]], [["speech", 31.63], ["music", 21.8], ["hum", 11.57]], null, null, null, [["music", 51.48], ["quack", 5.41], ["scary music", 2.61]], [["music", 61.56], ["theremin", 14.06], ["ambient music", 2.68]]], "duration": [1.03, 0.86, 0.66, 2.06, 20.83, 16.28, 3.01, 10.59, -0.09, 30.04, 1.43, 24.09, 4.44]} \ No newline at end of file diff --git a/annotations_1/6EfYYxmfABk_filtered.json b/annotations_1/6EfYYxmfABk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e404f96c01e0d4465c41852f0ef11df67487ad8 --- /dev/null +++ b/annotations_1/6EfYYxmfABk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.87], [5.0, 19.43], [20.0, 35.83], [37.0, 37.96], [40.0, 41.13], [42.0, 42.47], [42.0, 42.5], [43.0, 44.52], [49.0, 60.99], [63.0, 63.88], [65.0, 66.26], [68.0, 71.46], [73.0, 74.9], [79.0, 79.42], [84.0, 84.79], [86.0, 89.72], [90.0, 91.18], [95.0, 96.43], [98.0, 98.83], [101.0, 102.05], [104.0, 104.79], [107.0, 107.27], [111.0, 110.83], [113.0, 114.76], [118.0, 118.72], [122.0, 122.54], [125.0, 125.88], [130.0, 131.21], [134.0, 135.03], [139.0, 144.31], [145.0, 146.35], [147.0, 158.58], [159.0, 166.62], [168.0, 169.48], [170.0, 172.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.71, 69.2, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 44.04, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.78, 0.0, 87.37, 52.56, 0.0, 92.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 76.04], ["radio", 6.49], ["speech synthesizer", 4.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 14.43, 15.83, 0.96, 1.13, 0.47, 0.5, 1.52, 11.99, 0.88, 1.26, 3.46, 1.9, 0.42, 0.79, 3.72, 1.18, 1.43, 0.83, 1.05, 0.79, 0.27, -0.17, 1.76, 0.72, 0.54, 0.88, 1.21, 1.03, 5.31, 1.35, 11.58, 7.62, 1.48, 2.27]} \ No newline at end of file diff --git a/annotations_1/6F_Wp3IlryI_filtered.json b/annotations_1/6F_Wp3IlryI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2390636c42a760fe560781db0ec08493f22e17e7 --- /dev/null +++ b/annotations_1/6F_Wp3IlryI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.72], [7.0, 8.26], [8.0, 9.41], [10.0, 11.53], [24.0, 25.24], [27.0, 30.2], [31.0, 31.7], [33.0, 35.06], [36.0, 36.83], [37.0, 37.89], [39.0, 40.0], [43.0, 45.96], [47.0, 49.52], [50.0, 51.71], [53.0, 54.68], [58.0, 57.96], [66.0, 66.09], [67.0, 67.88], [72.0, 74.44], [75.0, 77.5], [83.0, 84.23], [86.0, 86.56], [88.0, 89.82], [92.0, 91.94], [94.0, 95.64], [96.0, 98.69], [104.0, 104.45], [113.0, 113.85], [114.0, 115.74], [120.0, 122.2], [123.0, 123.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 49.04, 0.0, 61.67, 0.0, 0.0, 0.0, 70.44, 53.4, 0.0, 0.0, 0.0, 0.0, 0.0, 43.58, 51.77, 0.0, 0.0, 0.0, 0.0, 0.0, 50.71, 0.0, 0.0, 0.0, 61.87, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 45.71], ["music", 31.08], ["singing bowl", 3.54]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 74.09], ["speech", 6.44], ["effects unit", 5.47]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 1.26, 1.41, 1.53, 1.24, 3.2, 0.7, 2.06, 0.83, 0.89, 1.0, 2.96, 2.52, 1.71, 1.68, -0.04, 0.09, 0.88, 2.44, 2.5, 1.23, 0.56, 1.82, -0.06, 1.64, 2.69, 0.45, 0.85, 1.74, 2.2, 0.62]} \ No newline at end of file diff --git a/annotations_1/6Gd4JbJxaf4_filtered.json b/annotations_1/6Gd4JbJxaf4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c81038ee0d385b8e0b83c0f8769d8300a0ca9bd3 --- /dev/null +++ b/annotations_1/6Gd4JbJxaf4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 55.36], [58.0, 81.36], [82.0, 83.57], [85.0, 91.83], [92.0, 93.07], [96.0, 105.81], [107.0, 127.53], [130.0, 134.96], [135.0, 137.57], [138.0, 149.2], [154.0, 154.58], [156.0, 156.3]], "keep_status": [true, true, false, false, false, false, true, true, true, true, false, false], "silence_prob": [29.62, 32.04, 0.0, 49.68, 0.0, 37.76, 29.7, 37.85, 40.06, 40.75, 0.0, 0.0], "audiomae_on_audioset": [[["music", 21.27], ["buzz", 8.17], ["fly, housefly", 6.87]], [["music", 47.66], ["fly, housefly", 6.91], ["speech", 4.37]], null, [["theremin", 35.04], ["music", 19.74], ["whale vocalization", 17.31]], null, [["music", 43.71], ["speech", 16.89], ["theremin", 11.41]], [["music", 26.23], ["mains hum", 24.63], ["hum", 13.81]], [["hum", 32.66], ["mains hum", 21.78], ["throbbing", 8.29]], [["hum", 19.2], ["mains hum", 17.3], ["speech", 14.99]], [["music", 52.13], ["speech", 9.71], ["shofar", 4.33]], null, null], "duration": [19.36, 23.36, 1.57, 6.83, 1.07, 9.81, 20.53, 4.96, 2.57, 11.2, 0.58, 0.3]} \ No newline at end of file diff --git a/annotations_1/6GhSM3Gu9VU_filtered.json b/annotations_1/6GhSM3Gu9VU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d9969ded1822d1d8256e9cbef3adc6922db074c --- /dev/null +++ b/annotations_1/6GhSM3Gu9VU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.95], [13.0, 16.07], [19.0, 19.6], [21.0, 21.29], [28.0, 28.14], [32.0, 32.9], [36.0, 36.98], [39.0, 45.93], [49.0, 54.43], [55.0, 56.35], [57.0, 66.9], [72.0, 73.16], [75.0, 75.47], [85.0, 85.35], [87.0, 92.01], [95.0, 139.5], [140.0, 175.83]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.82, 0.0, 0.0, 0.0, 0.0, 0.0, 31.03, 34.14, 0.0, 32.32, 0.0, 0.0, 0.0, 31.5, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 28.47], ["music", 15.45], ["rumble", 7.77]], null, null, null, null, null, [["hum", 46.02], ["mains hum", 21.37], ["throbbing", 8.48]], [["speech", 43.53], ["electric shaver, electric razor", 37.18], ["hum", 5.87]], null, [["electric shaver, electric razor", 58.65], ["hum", 14.96], ["mains hum", 9.27]], null, null, null, [["speech", 42.56], ["hum", 17.35], ["vehicle", 11.62]], null, null], "duration": [-0.05, 3.07, 0.6, 0.29, 0.14, 0.9, 0.98, 6.93, 5.43, 1.35, 9.9, 1.16, 0.47, 0.35, 5.01, 44.5, 35.83]} \ No newline at end of file diff --git a/annotations_1/6GpeTJqqtG4_filtered.json b/annotations_1/6GpeTJqqtG4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab41818aae226d89f3e8f3639ab60affa7964a20 --- /dev/null +++ b/annotations_1/6GpeTJqqtG4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.89], [12.0, 13.32], [20.0, 20.65], [21.0, 24.63], [30.0, 31.51], [34.0, 37.12], [42.0, 52.56], [54.0, 55.44], [56.0, 56.42], [57.0, 57.08], [73.0, 75.9], [83.0, 83.08], [84.0, 84.38], [85.0, 85.8], [87.0, 87.51], [114.0, 113.9], [115.0, 118.35]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [52.39, 0.0, 0.0, 45.24, 0.0, 57.81, 84.8, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 0.0, 35.1], "audiomae_on_audioset": [null, null, null, [["theremin", 28.69], ["singing bowl", 23.71], ["music", 8.2]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.37], ["creak", 23.68], ["fart", 5.43]]], "duration": [4.89, 1.32, 0.65, 3.63, 1.51, 3.12, 10.56, 1.44, 0.42, 0.08, 2.9, 0.08, 0.38, 0.8, 0.51, -0.1, 3.35]} \ No newline at end of file diff --git a/annotations_1/6H6RGCBUcf4_filtered.json b/annotations_1/6H6RGCBUcf4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17e93523ffe314bb8310b23c28d4d89bc5958829 --- /dev/null +++ b/annotations_1/6H6RGCBUcf4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 63.88], [64.0, 70.36], [71.0, 89.73], [90.0, 91.54], [92.0, 147.11], [148.0, 148.58]], "keep_status": [false, true, true, false, false, false], "silence_prob": [33.84, 39.43, 32.83, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 64.88], ["hum", 7.25], ["throbbing", 6.74]], [["speech", 23.79], ["music", 22.05], ["hum", 12.14]], [["music", 27.05], ["speech", 14.82], ["breaking", 11.86]], null, null, null], "duration": [10.88, 6.36, 18.73, 1.54, 55.11, 0.58]} \ No newline at end of file diff --git a/annotations_1/6I5B0jyLBUg_filtered.json b/annotations_1/6I5B0jyLBUg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7be962cf41f06148983040870338e85d40aa564a --- /dev/null +++ b/annotations_1/6I5B0jyLBUg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [7.0, 7.52], [20.0, 20.12], [25.0, 25.76], [31.0, 31.62], [42.0, 41.77], [59.0, 59.51], [66.0, 66.38], [67.0, 69.04], [75.0, 75.37], [76.0, 76.42], [93.0, 93.55], [121.0, 144.1], [148.0, 149.23], [150.0, 150.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0, 0.0, 29.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 25.27], ["music", 10.93], ["vehicle", 4.66]], null, null], "duration": [0.6, 0.52, 0.12, 0.76, 0.62, -0.23, 0.51, 0.38, 2.04, 0.37, 0.42, 0.55, 23.1, 1.23, 0.15]} \ No newline at end of file diff --git a/annotations_1/6IJ8LfJnJvQ_filtered.json b/annotations_1/6IJ8LfJnJvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43445195df6770e54e4a8052e101c85d88010f26 --- /dev/null +++ b/annotations_1/6IJ8LfJnJvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.78], [6.0, 6.88], [8.0, 10.39], [15.0, 17.12], [19.0, 37.84], [39.0, 39.9], [42.0, 56.86], [57.0, 60.69], [61.0, 62.53], [64.0, 87.62], [89.0, 95.94], [96.0, 95.99], [100.0, 115.57], [117.0, 122.74], [126.0, 126.12], [131.0, 132.11], [135.0, 135.6], [140.0, 144.15], [146.0, 146.58], [147.0, 148.29], [150.0, 156.46], [156.0, 156.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.31, 0.0, 98.44, 98.66, 95.91, 0.0, 92.31, 84.25, 0.0, 89.01, 87.92, 0.0, 73.06, 74.44, 0.0, 0.0, 0.0, 78.89, 0.0, 0.0, 98.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.78, 0.88, 2.39, 2.12, 18.84, 0.9, 14.86, 3.69, 1.53, 23.62, 6.94, -0.01, 15.57, 5.74, 0.12, 1.11, 0.6, 4.15, 0.58, 1.29, 6.46, 0.57]} \ No newline at end of file diff --git a/annotations_1/6IM3wUpXVfA_filtered.json b/annotations_1/6IM3wUpXVfA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3945cb27e605d0bbb434de7a9286948ddf82569 --- /dev/null +++ b/annotations_1/6IM3wUpXVfA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[86.0, 104.43], [112.0, 116.45], [117.0, 119.69], [122.0, 124.56], [125.0, 126.79]], "keep_status": [true, true, false, false, false], "silence_prob": [30.66, 37.09, 59.42, 66.03, 0.0], "audiomae_on_audioset": [[["speech", 39.37], ["moo", 10.38], ["cattle, bovinae", 9.24]], [["noise", 27.97], ["music", 15.22], ["hum", 8.45]], null, null, null], "duration": [18.43, 4.45, 2.69, 2.56, 1.79]} \ No newline at end of file diff --git a/annotations_1/6IXjYpPtjWk_filtered.json b/annotations_1/6IXjYpPtjWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28e60b1e64973a216c3155e1f743afe07be61466 --- /dev/null +++ b/annotations_1/6IXjYpPtjWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.72], [12.0, 12.45], [12.0, 12.82], [14.0, 17.14], [19.0, 22.15], [46.0, 48.07], [57.0, 58.18], [63.0, 64.54], [68.0, 69.11], [70.0, 70.83], [74.0, 74.95], [75.0, 75.1], [81.0, 82.58], [85.0, 86.39], [89.0, 90.96], [93.0, 98.56], [104.0, 106.83], [120.0, 120.31], [122.0, 123.48], [124.0, 125.34], [127.0, 128.24], [130.0, 130.42], [132.0, 132.21]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.4, 33.46, 49.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.25, 50.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 27.2], ["insect", 19.51], ["moo", 11.11]], [["speech", 49.43], ["music", 25.5], ["hum", 1.87]], [["cattle, bovinae", 16.37], ["music", 13.95], ["livestock, farm animals, working animals", 11.84]], null, null, null, null, null, null, null, null, null, [["music", 47.94], ["cattle, bovinae", 6.48], ["livestock, farm animals, working animals", 6.3]], null, null, null, null, null, null, null], "duration": [-0.28, 0.45, 0.82, 3.14, 3.15, 2.07, 1.18, 1.54, 1.11, 0.83, 0.95, 0.1, 1.58, 1.39, 1.96, 5.56, 2.83, 0.31, 1.48, 1.34, 1.24, 0.42, 0.21]} \ No newline at end of file diff --git a/annotations_1/6JIY7mRvsRE_filtered.json b/annotations_1/6JIY7mRvsRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bbb2c5e692348069f10f8d04c09ae4f92fc1d68 --- /dev/null +++ b/annotations_1/6JIY7mRvsRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[92.0, 101.95], [103.0, 108.24], [109.0, 109.58], [113.0, 125.63]], "keep_status": [false, false, false, true], "silence_prob": [30.39, 67.13, 0.0, 35.12], "audiomae_on_audioset": [[["music", 67.28], ["speech", 8.38], ["synthesizer", 2.55]], null, null, [["music", 23.43], ["hum", 13.44], ["noise", 13.33]]], "duration": [9.95, 5.24, 0.58, 12.63]} \ No newline at end of file diff --git a/annotations_1/6JfQ82WowC8_filtered.json b/annotations_1/6JfQ82WowC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c660cae8110e491f9bdac5dfd014a286f35a06f --- /dev/null +++ b/annotations_1/6JfQ82WowC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.48], [16.0, 25.29], [28.0, 49.64], [51.0, 72.42], [75.0, 79.51], [81.0, 83.59], [84.0, 86.64], [87.0, 91.25], [92.0, 97.58], [98.0, 99.42], [100.0, 101.6], [102.0, 105.88]], "keep_status": [true, false, false, true, false, false, false, true, true, false, false, true], "silence_prob": [33.79, 34.24, 28.69, 28.21, 35.43, 60.79, 54.63, 44.29, 33.57, 0.0, 0.0, 34.95], "audiomae_on_audioset": [[["mains hum", 18.88], ["music", 13.45], ["insect", 12.21]], [["mains hum", 63.3], ["hum", 30.02], ["noise", 3.25]], [["speech", 66.76], ["explosion", 4.36], ["music", 3.82]], [["speech", 46.79], ["groan", 6.24], ["music", 5.48]], [["mains hum", 39.76], ["hum", 18.84], ["music", 18.19]], null, null, [["speech", 46.39], ["sidetone", 11.47], ["hum", 9.32]], [["livestock, farm animals, working animals", 23.37], ["cattle, bovinae", 22.95], ["moo", 11.21]], null, null, [["radio", 21.98], ["speech", 19.09], ["sidetone", 8.13]]], "duration": [8.48, 9.29, 21.64, 21.42, 4.51, 2.59, 2.64, 4.25, 5.58, 1.42, 1.6, 3.88]} \ No newline at end of file diff --git a/annotations_1/6KHyMISpE18_filtered.json b/annotations_1/6KHyMISpE18_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28eb56851a02cd88f495b28e461c6e07e727921d --- /dev/null +++ b/annotations_1/6KHyMISpE18_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 9.44], [44.0, 46.33], [49.0, 51.43], [53.0, 53.55], [57.0, 57.72], [65.0, 65.69], [85.0, 85.51], [104.0, 107.92], [109.0, 121.68], [131.0, 130.84], [131.0, 130.87], [135.0, 135.35], [137.0, 141.98], [144.0, 158.77], [165.0, 165.11], [166.0, 176.32]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [28.51, 29.06, 30.45, 0.0, 0.0, 0.0, 0.0, 28.58, 28.57, 0.0, 0.0, 0.0, 28.55, 28.52, 0.0, 28.63], "audiomae_on_audioset": [[["music", 57.33], ["speech", 12.99], ["electronic music", 9.79]], [["mains hum", 36.71], ["music", 20.21], ["hum", 17.38]], [["music", 54.4], ["mains hum", 10.0], ["hum", 9.68]], null, null, null, null, [["music", 47.59], ["speech", 16.62], ["electronic music", 5.17]], [["music", 66.29], ["speech", 15.31], ["electronic music", 7.06]], null, null, null, [["music", 60.56], ["speech", 12.05], ["electronic music", 5.05]], [["music", 68.9], ["speech", 12.65], ["techno", 4.48]], null, [["music", 78.32], ["speech", 5.94], ["electronic music", 5.28]]], "duration": [9.44, 2.33, 2.43, 0.55, 0.72, 0.69, 0.51, 3.92, 12.68, -0.16, -0.13, 0.35, 4.98, 14.77, 0.11, 10.32]} \ No newline at end of file diff --git a/annotations_1/6KYxDFGC2hE_filtered.json b/annotations_1/6KYxDFGC2hE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f74995e298b78b728d43c18605d6ed8d56720b2e --- /dev/null +++ b/annotations_1/6KYxDFGC2hE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.78], [4.0, 7.26], [13.0, 14.34], [15.0, 15.28], [16.0, 18.98], [21.0, 25.78], [27.0, 28.61], [32.0, 33.93], [35.0, 36.02], [37.0, 43.26], [47.0, 48.24], [52.0, 52.68], [55.0, 56.32], [57.0, 57.5], [58.0, 58.28], [59.0, 60.74], [61.0, 63.27], [64.0, 67.58], [70.0, 75.74], [83.0, 84.16], [85.0, 92.11], [95.0, 99.23], [102.0, 105.48], [108.0, 109.22], [111.0, 111.5], [114.0, 113.76], [115.0, 115.55], [116.0, 117.19], [121.0, 125.85]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 44.12, 0.0, 0.0, 39.08, 61.18, 0.0, 0.0, 0.0, 43.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.59, 47.16, 35.07, 0.0, 34.37, 57.32, 59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 45.49], "audiomae_on_audioset": [null, [["hum", 16.05], ["mains hum", 7.75], ["cattle, bovinae", 6.33]], null, null, [["burping, eructation", 68.32], ["animal", 2.88], ["speech", 2.72]], null, null, null, null, [["cattle, bovinae", 58.99], ["moo", 22.35], ["livestock, farm animals, working animals", 18.03]], null, null, null, null, null, null, [["mains hum", 20.49], ["hum", 19.78], ["wood", 8.35]], [["speech", 18.64], ["rain on surface", 11.97], ["rain", 8.99]], [["speech", 32.86], ["rain on surface", 11.33], ["radio", 11.27]], null, [["animal", 19.22], ["fart", 7.3], ["speech", 7.1]], null, null, null, null, null, null, null, [["fly, housefly", 19.43], ["crushing", 15.63], ["bee, wasp, etc.", 8.22]]], "duration": [0.78, 3.26, 1.34, 0.28, 2.98, 4.78, 1.61, 1.93, 1.02, 6.26, 1.24, 0.68, 1.32, 0.5, 0.28, 1.74, 2.27, 3.58, 5.74, 1.16, 7.11, 4.23, 3.48, 1.22, 0.5, -0.24, 0.55, 1.19, 4.85]} \ No newline at end of file diff --git a/annotations_1/6Kfqy-8C3o0_filtered.json b/annotations_1/6Kfqy-8C3o0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c6c85e1ac196acea546a9f19c0554bd361e4693 --- /dev/null +++ b/annotations_1/6Kfqy-8C3o0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 24.85], [25.0, 26.08], [27.0, 40.81], [42.0, 50.26], [52.0, 88.57], [89.0, 90.98], [93.0, 165.18]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [49.45, 0.0, 40.04, 39.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 68.86], ["hum", 13.56], ["throbbing", 5.14]], null, [["hum", 39.65], ["music", 25.54], ["mains hum", 13.64]], [["music", 84.98], ["synthesizer", 3.32], ["electronic music", 2.13]], null, null, null], "duration": [15.85, 1.08, 13.81, 8.26, 36.57, 1.98, 72.18]} \ No newline at end of file diff --git a/annotations_1/6La5YCYlMZY_filtered.json b/annotations_1/6La5YCYlMZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2aa217a8c4b1baab7538e88dc0cc24fd42c12592 --- /dev/null +++ b/annotations_1/6La5YCYlMZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.37], [9.0, 12.51], [13.0, 13.91], [15.0, 15.82], [22.0, 24.73], [25.0, 35.78], [37.0, 37.54], [41.0, 41.99], [43.0, 44.14], [45.0, 45.82], [46.0, 47.73], [48.0, 49.76], [53.0, 53.32], [64.0, 65.55], [69.0, 72.0], [72.0, 72.66], [74.0, 74.39], [75.0, 75.47], [76.0, 77.11], [78.0, 78.36], [80.0, 80.72], [82.0, 82.71], [87.0, 91.12], [92.0, 95.2], [99.0, 111.55], [113.0, 116.72], [119.0, 125.9], [129.0, 134.3], [136.0, 146.4]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 32.15, 0.0, 0.0, 38.22, 56.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.36, 61.08, 44.26, 81.17, 73.67, 82.79, 86.45], "audiomae_on_audioset": [null, [["speech", 41.35], ["didgeridoo", 9.75], ["animal", 7.13]], null, null, [["speech", 44.53], ["whale vocalization", 7.81], ["animal", 4.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 32.15], ["hum", 17.5], ["heart sounds, heartbeat", 6.76]], null, null, null, null], "duration": [0.37, 3.51, 0.91, 0.82, 2.73, 10.78, 0.54, 0.99, 1.14, 0.82, 1.73, 1.76, 0.32, 1.55, 3.0, 0.66, 0.39, 0.47, 1.11, 0.36, 0.72, 0.71, 4.12, 3.2, 12.55, 3.72, 6.9, 5.3, 10.4]} \ No newline at end of file diff --git a/annotations_1/6LyYxpkxILE_filtered.json b/annotations_1/6LyYxpkxILE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91939a4f80ce4b2484a09adfe3e0225618cb33d5 --- /dev/null +++ b/annotations_1/6LyYxpkxILE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.31], [9.0, 10.39], [15.0, 16.6], [19.0, 20.7], [23.0, 24.43], [26.0, 26.76], [30.0, 31.62], [32.0, 36.29], [38.0, 38.37], [50.0, 51.61], [55.0, 55.38], [57.0, 56.89], [60.0, 59.88], [62.0, 62.07], [64.0, 65.82], [69.0, 69.3], [70.0, 70.6], [77.0, 79.34]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [46.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.27], "audiomae_on_audioset": [[["music", 49.57], ["gong", 4.99], ["musical instrument", 4.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sound effect", 17.66], ["music", 13.99], ["boing", 10.61]]], "duration": [2.31, 1.39, 1.6, 1.7, 1.43, 0.76, 1.62, 4.29, 0.37, 1.61, 0.38, -0.11, -0.12, 0.07, 1.82, 0.3, 0.6, 2.34]} \ No newline at end of file diff --git a/annotations_1/6MJJXdBz1q0_filtered.json b/annotations_1/6MJJXdBz1q0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..722d0862a88d1a63a795b9595c65c97044d17ce8 --- /dev/null +++ b/annotations_1/6MJJXdBz1q0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 0.84], [1.0, 1.04], [1.0, 17.07], [21.0, 39.48], [41.0, 42.4], [44.0, 46.75], [47.0, 47.8], [49.0, 50.57], [54.0, 57.38], [68.0, 68.93], [74.0, 74.06], [82.0, 81.62], [83.0, 82.93], [86.0, 93.66], [100.0, 104.72], [108.0, 109.21], [114.0, 115.47], [116.0, 115.65], [116.0, 123.97]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.56, 30.59, 0.0, 39.22, 0.0, 0.0, 48.27, 0.0, 0.0, 0.0, 0.0, 30.06, 35.42, 0.0, 0.0, 0.0, 31.06], "audiomae_on_audioset": [null, null, null, [["music", 52.03], ["speech", 13.67], ["animal", 3.07]], [["music", 46.7], ["speech", 38.9], ["hum", 3.4]], null, [["throbbing", 32.45], ["hum", 27.87], ["music", 24.08]], null, null, [["music", 55.03], ["hum", 11.35], ["synthesizer", 5.0]], null, null, null, null, [["speech", 44.48], ["music", 32.0], ["animal", 2.15]], [["hum", 41.75], ["mains hum", 10.14], ["throbbing", 6.61]], null, null, null, [["music", 53.54], ["speech", 21.05], ["throbbing", 5.89]]], "duration": [0.5, -0.16, 0.04, 16.07, 18.48, 1.4, 2.75, 0.8, 1.57, 3.38, 0.93, 0.06, -0.38, -0.07, 7.66, 4.72, 1.21, 1.47, -0.35, 7.97]} \ No newline at end of file diff --git a/annotations_1/6MaOE8YiJy8_filtered.json b/annotations_1/6MaOE8YiJy8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2556d951cb325511f37b0cf11c172cf8981a74f3 --- /dev/null +++ b/annotations_1/6MaOE8YiJy8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 28.7], [32.0, 33.83], [37.0, 40.1], [45.0, 68.74], [70.0, 73.95], [75.0, 75.39], [78.0, 86.68], [88.0, 88.42], [90.0, 91.02], [94.0, 96.11], [97.0, 141.03], [142.0, 150.36], [152.0, 164.37]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, true], "silence_prob": [38.88, 0.0, 64.52, 41.24, 70.02, 0.0, 35.26, 0.0, 0.0, 95.09, 0.0, 32.38, 28.45], "audiomae_on_audioset": [[["speech", 64.47], ["sidetone", 22.26], ["electric shaver, electric razor", 2.65]], null, null, [["music", 27.35], ["hum", 27.3], ["throbbing", 15.3]], null, null, [["music", 19.48], ["speech", 13.51], ["didgeridoo", 8.33]], null, null, null, null, [["music", 27.02], ["hum", 24.52], ["mains hum", 23.84]], [["hum", 30.85], ["throbbing", 18.32], ["mains hum", 12.1]]], "duration": [5.7, 1.83, 3.1, 23.74, 3.95, 0.39, 8.68, 0.42, 1.02, 2.11, 44.03, 8.36, 12.37]} \ No newline at end of file diff --git a/annotations_1/6Mr9bQJEuN0_filtered.json b/annotations_1/6Mr9bQJEuN0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8cc5615e71031c280b298d6b435b7c9224e14049 --- /dev/null +++ b/annotations_1/6Mr9bQJEuN0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.06], [12.0, 12.6], [13.0, 15.57], [17.0, 17.32], [19.0, 19.77], [21.0, 21.17], [21.0, 23.25], [26.0, 27.35], [32.0, 39.92], [41.0, 42.06], [47.0, 48.57], [50.0, 50.19], [54.0, 55.44], [56.0, 57.87], [60.0, 61.8], [62.0, 66.48], [67.0, 69.23], [71.0, 70.8], [74.0, 75.44], [76.0, 78.06], [79.0, 81.35], [82.0, 83.08], [85.0, 89.13], [90.0, 92.06], [94.0, 96.65], [99.0, 99.84], [102.0, 105.66], [106.0, 107.06], [109.0, 109.97], [112.0, 112.11], [114.0, 114.34], [118.0, 120.34], [122.0, 124.71], [126.0, 129.63], [133.0, 142.33], [143.0, 148.02], [149.0, 150.52], [155.0, 156.32], [158.0, 179.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [99.21, 0.0, 97.73, 0.0, 0.0, 0.0, 90.78, 0.0, 65.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.04, 74.13, 0.0, 0.0, 71.57, 95.51, 0.0, 87.55, 64.63, 77.03, 0.0, 47.62, 0.0, 0.0, 0.0, 0.0, 83.7, 90.25, 76.53, 78.04, 48.23, 0.0, 0.0, 57.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.18], ["music", 20.31], ["radio", 5.23]], null, null, null, null, null, null, null, null, [["music", 27.72], ["mains hum", 11.19], ["speech", 8.85]], null, null, null], "duration": [3.06, 0.6, 2.57, 0.32, 0.77, 0.17, 2.25, 1.35, 7.92, 1.06, 1.57, 0.19, 1.44, 1.87, 1.8, 4.48, 2.23, -0.2, 1.44, 2.06, 2.35, 1.08, 4.13, 2.06, 2.65, 0.84, 3.66, 1.06, 0.97, 0.11, 0.34, 2.34, 2.71, 3.63, 9.33, 5.02, 1.52, 1.32, 21.52]} \ No newline at end of file diff --git a/annotations_1/6Nb7rSggCns_filtered.json b/annotations_1/6Nb7rSggCns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d37e8357a0f9789c69f6b2502b593b4804a828d7 --- /dev/null +++ b/annotations_1/6Nb7rSggCns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [7.0, 12.45], [15.0, 27.16], [32.0, 35.02], [39.0, 41.05], [42.0, 80.2], [84.0, 100.62], [102.0, 104.16], [111.0, 112.16], [113.0, 117.48], [118.0, 119.08], [120.0, 126.28], [128.0, 130.91], [131.0, 138.79], [139.0, 140.76], [142.0, 142.57], [146.0, 149.82], [150.0, 149.86], [150.0, 151.33], [152.0, 159.76], [161.0, 162.72], [164.0, 168.37], [169.0, 169.64], [171.0, 173.72], [175.0, 175.42]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 38.26, 38.3, 40.43, 51.5, 0.0, 34.8, 41.91, 0.0, 30.58, 0.0, 31.07, 34.94, 33.03, 0.0, 0.0, 39.83, 0.0, 0.0, 32.23, 0.0, 32.37, 0.0, 41.3, 0.0], "audiomae_on_audioset": [null, [["speech", 26.32], ["music", 19.39], ["rumble", 9.14]], [["speech", 25.13], ["rumble", 18.03], ["whale vocalization", 13.87]], [["music", 63.62], ["ambient music", 4.36], ["musical instrument", 4.17]], null, null, [["singing bowl", 48.03], ["music", 28.64], ["electronic music", 6.61]], [["music", 30.5], ["whale vocalization", 20.24], ["electronic music", 8.36]], null, [["speech", 61.18], ["music", 9.74], ["hum", 7.77]], null, [["hum", 37.52], ["sonar", 19.51], ["music", 13.46]], [["speech", 59.94], ["rumble", 9.49], ["music", 8.0]], [["speech", 85.11], ["rumble", 4.77], ["speech synthesizer", 1.1]], null, null, [["speech", 47.82], ["dial tone", 9.51], ["music", 9.17]], null, null, [["whale vocalization", 23.63], ["speech", 9.72], ["music", 8.45]], null, [["speech", 37.63], ["music", 28.29], ["throbbing", 6.59]], null, [["hum", 23.76], ["rumble", 18.78], ["throbbing", 10.07]], null], "duration": [0.56, 5.45, 12.16, 3.02, 2.05, 38.2, 16.62, 2.16, 1.16, 4.48, 1.08, 6.28, 2.91, 7.79, 1.76, 0.57, 3.82, -0.14, 1.33, 7.76, 1.72, 4.37, 0.64, 2.72, 0.42]} \ No newline at end of file diff --git a/annotations_1/6O554p-ovsI_filtered.json b/annotations_1/6O554p-ovsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07ab2716c9d5a7f5b06c7c07ca7416537d915c80 --- /dev/null +++ b/annotations_1/6O554p-ovsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.37], [4.0, 3.87], [7.0, 7.16], [9.0, 9.24], [10.0, 12.5], [13.0, 16.5], [17.0, 20.33], [21.0, 21.34], [26.0, 26.7], [28.0, 28.11], [29.0, 30.0], [35.0, 35.53], [37.0, 41.44], [43.0, 43.55], [44.0, 45.96], [50.0, 50.53], [55.0, 55.48], [58.0, 59.1], [73.0, 73.89], [75.0, 75.96], [80.0, 81.45], [82.0, 82.68], [83.0, 83.83], [86.0, 90.26], [95.0, 95.12], [96.0, 96.8], [98.0, 98.51], [101.0, 102.71], [105.0, 105.29], [108.0, 108.67], [115.0, 115.75], [116.0, 119.72], [121.0, 121.0], [121.0, 121.93], [124.0, 124.7], [126.0, 126.35], [127.0, 127.97], [132.0, 132.04], [138.0, 140.1], [142.0, 143.95], [145.0, 144.9], [146.0, 147.73], [151.0, 152.12], [153.0, 166.29], [169.0, 169.6], [170.0, 170.82], [171.0, 172.76], [174.0, 174.88]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.4, 43.18, 60.51, 0.0, 0.0, 0.0, 0.0, 0.0, 44.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.74, 0.0, 0.0, 0.0, 0.0, 67.63, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["mains hum", 29.07], ["hum", 17.7], ["fly, housefly", 9.0]], null, null, null, null, null, null, [["speech", 22.74], ["hum", 8.81], ["throbbing", 5.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.37, -0.13, 0.16, 0.24, 2.5, 3.5, 3.33, 0.34, 0.7, 0.11, 1.0, 0.53, 4.44, 0.55, 1.96, 0.53, 0.48, 1.1, 0.89, 0.96, 1.45, 0.68, 0.83, 4.26, 0.12, 0.8, 0.51, 1.71, 0.29, 0.67, 0.75, 3.72, 0.0, 0.93, 0.7, 0.35, 0.97, 0.04, 2.1, 1.95, -0.1, 1.73, 1.12, 13.29, 0.6, 0.82, 1.76, 0.88]} \ No newline at end of file diff --git a/annotations_1/6OKt2CZ4ULE_filtered.json b/annotations_1/6OKt2CZ4ULE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3408936f7c9ca38b3999516322486ce33c22b06 --- /dev/null +++ b/annotations_1/6OKt2CZ4ULE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [3.0, 3.82], [7.0, 12.93], [15.0, 26.28], [27.0, 34.5], [36.0, 36.37], [40.0, 40.36], [41.0, 41.22], [42.0, 42.5], [43.0, 44.29], [45.0, 45.37], [46.0, 46.6], [47.0, 47.14], [48.0, 48.09], [52.0, 62.06]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 65.2, 81.0, 34.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.84], "audiomae_on_audioset": [null, null, null, null, [["speech", 20.06], ["noise", 8.6], ["fly, housefly", 7.34]], null, null, null, null, null, null, null, null, null, [["speech", 34.7], ["mosquito", 12.32], ["livestock, farm animals, working animals", 6.27]]], "duration": [0.42, 0.82, 5.93, 11.28, 7.5, 0.37, 0.36, 0.22, 0.5, 1.29, 0.37, 0.6, 0.14, 0.09, 10.06]} \ No newline at end of file diff --git a/annotations_1/6O_dprt5rts_filtered.json b/annotations_1/6O_dprt5rts_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06593bd0aa7a1ff113461a3322e9afa9b1283c52 --- /dev/null +++ b/annotations_1/6O_dprt5rts_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.42], [9.0, 12.77], [15.0, 15.6], [17.0, 27.41], [28.0, 30.3], [32.0, 32.83], [35.0, 41.72], [43.0, 79.3], [81.0, 96.84], [98.0, 154.74], [156.0, 157.06], [158.0, 179.51]], "keep_status": [true, true, false, false, true, false, true, false, false, false, false, false], "silence_prob": [37.58, 34.66, 0.0, 51.66, 37.35, 0.0, 28.76, 0.0, 31.59, 0.0, 0.0, 61.77], "audiomae_on_audioset": [[["music", 35.0], ["hum", 15.65], ["mains hum", 14.85]], [["music", 32.15], ["speech", 18.43], ["hum", 10.11]], null, null, [["music", 23.2], ["speech", 20.02], ["whale vocalization", 13.47]], null, [["music", 37.93], ["cacophony", 10.38], ["rumble", 4.33]], null, [["music", 37.15], ["hum", 24.29], ["throbbing", 13.29]], null, null, null], "duration": [4.42, 3.77, 0.6, 10.41, 2.3, 0.83, 6.72, 36.3, 15.84, 56.74, 1.06, 21.51]} \ No newline at end of file diff --git a/annotations_1/6PAMZYS1Fqk_filtered.json b/annotations_1/6PAMZYS1Fqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a31b004765c359fa4392a46d887b1b17920e2249 --- /dev/null +++ b/annotations_1/6PAMZYS1Fqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.99], [8.0, 11.6], [21.0, 23.33], [26.0, 32.78], [39.0, 42.11], [50.0, 55.48], [60.0, 61.2], [67.0, 67.15], [114.0, 114.42], [117.0, 117.85], [123.0, 123.06], [123.0, 123.79], [130.0, 131.43], [136.0, 136.56], [145.0, 145.35], [147.0, 147.34], [148.0, 147.7], [148.0, 152.05], [154.0, 155.73], [159.0, 160.73], [161.0, 164.54], [165.0, 166.5], [167.0, 167.04], [167.0, 170.16]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.54, 55.25, 40.54, 39.41, 55.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 0.0, 74.44, 0.0, 0.0, 61.37], "audiomae_on_audioset": [null, [["speech", 37.67], ["music", 27.6], ["thunk", 7.96]], null, [["cattle, bovinae", 23.2], ["music", 17.59], ["moo", 16.91]], [["music", 65.49], ["speech", 7.06], ["throbbing", 3.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.99, 3.6, 2.33, 6.78, 3.11, 5.48, 1.2, 0.15, 0.42, 0.85, 0.06, 0.79, 1.43, 0.56, 0.35, 0.34, -0.3, 4.05, 1.73, 1.73, 3.54, 1.5, 0.04, 3.16]} \ No newline at end of file diff --git a/annotations_1/6PEQcK6G_4M_filtered.json b/annotations_1/6PEQcK6G_4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61283201a215fb40b9f14e449106487cd4da216f --- /dev/null +++ b/annotations_1/6PEQcK6G_4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.62], [16.0, 17.63], [20.0, 21.44], [22.0, 24.81], [26.0, 27.73], [29.0, 30.42], [33.0, 34.06], [38.0, 55.61], [58.0, 58.48], [61.0, 85.48], [101.0, 112.09], [116.0, 117.46], [118.0, 118.25], [118.0, 118.94], [133.0, 133.3], [141.0, 142.86], [143.0, 147.73], [150.0, 156.73], [159.0, 160.03], [171.0, 171.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 0.0, 32.36, 0.0, 31.94, 40.95, 0.0, 0.0, 0.0, 0.0, 0.0, 56.63, 65.55, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 67.84], ["throbbing", 16.9], ["electronic music", 3.24]], null, [["music", 47.22], ["throbbing", 26.22], ["hum", 8.54]], [["music", 78.18], ["telephone dialing, dtmf", 4.5], ["sidetone", 3.3]], null, null, null, null, null, null, null, null, null], "duration": [1.62, 1.63, 1.44, 2.81, 1.73, 1.42, 1.06, 17.61, 0.48, 24.48, 11.09, 1.46, 0.25, 0.94, 0.3, 1.86, 4.73, 6.73, 1.03, 0.8]} \ No newline at end of file diff --git a/annotations_1/6PrFocPT-Rs_filtered.json b/annotations_1/6PrFocPT-Rs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a814ac6eb465be4c2fb56a48be4de68bd4735ce7 --- /dev/null +++ b/annotations_1/6PrFocPT-Rs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.8], [10.0, 22.15], [23.0, 23.95], [26.0, 26.06], [29.0, 30.1], [31.0, 32.1], [38.0, 42.06], [43.0, 43.93], [51.0, 53.32], [57.0, 70.07], [70.0, 72.18], [76.0, 79.93], [82.0, 87.94], [88.0, 91.13], [95.0, 100.09], [101.0, 103.06], [104.0, 112.9], [114.0, 114.84], [121.0, 125.24], [126.0, 129.29], [130.0, 135.77], [139.0, 145.89], [147.0, 148.53], [149.0, 150.36], [152.0, 153.3], [154.0, 155.6], [157.0, 157.49], [159.0, 160.02], [163.0, 164.46], [170.0, 170.58], [172.0, 171.75], [173.0, 173.2]], "keep_status": [false, true, false, false, false, false, true, false, true, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.45, 0.0, 0.0, 0.0, 0.0, 33.13, 0.0, 44.26, 30.72, 32.55, 31.27, 31.73, 31.39, 32.86, 40.07, 32.08, 0.0, 66.88, 62.99, 61.67, 34.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 30.0], ["throbbing", 22.93], ["hum", 11.6]], null, null, null, null, [["hum", 16.11], ["music", 15.15], ["noise", 14.38]], null, [["music", 32.82], ["hum", 11.96], ["throbbing", 8.19]], [["speech", 33.3], ["groan", 8.49], ["fly, housefly", 7.58]], [["cattle, bovinae", 44.36], ["moo", 29.14], ["livestock, farm animals, working animals", 13.05]], [["music", 51.33], ["speech", 11.93], ["hum", 8.8]], [["music", 33.43], ["hum", 32.63], ["throbbing", 14.4]], [["music", 37.47], ["speech", 35.46], ["hum", 8.54]], [["speech", 38.96], ["music", 29.92], ["throbbing", 11.57]], [["cattle, bovinae", 31.41], ["moo", 18.19], ["livestock, farm animals, working animals", 15.59]], [["whale vocalization", 26.26], ["speech", 17.7], ["hum", 8.82]], null, null, null, null, [["theremin", 31.34], ["music", 21.28], ["hum", 19.81]], null, null, null, null, null, null, null, null, null, null], "duration": [-0.2, 12.15, 0.95, 0.06, 1.1, 1.1, 4.06, 0.93, 2.32, 13.07, 2.18, 3.93, 5.94, 3.13, 5.09, 2.06, 8.9, 0.84, 4.24, 3.29, 5.77, 6.89, 1.53, 1.36, 1.3, 1.6, 0.49, 1.02, 1.46, 0.58, -0.25, 0.2]} \ No newline at end of file diff --git a/annotations_1/6QB5kS_JcuU_filtered.json b/annotations_1/6QB5kS_JcuU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7477a24deadcba3d2ddeb749814f8b75943f60fd --- /dev/null +++ b/annotations_1/6QB5kS_JcuU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.13], [30.0, 59.29], [64.0, 141.98], [142.0, 144.0], [144.0, 144.81], [145.0, 146.11]], "keep_status": [false, true, false, true, false, false], "silence_prob": [54.43, 29.1, 0.0, 35.2, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 33.44], ["throbbing", 18.79], ["skidding", 9.48]], null, [["stomach rumble", 22.1], ["hum", 19.59], ["throbbing", 10.44]], null, null], "duration": [3.13, 29.29, 77.98, 2.0, 0.81, 1.11]} \ No newline at end of file diff --git a/annotations_1/6QYw68kf4sI_filtered.json b/annotations_1/6QYw68kf4sI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..226e026c0c570d959313f6c8ee51dea4e2f3b36b --- /dev/null +++ b/annotations_1/6QYw68kf4sI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.71], [12.0, 15.08], [17.0, 18.62], [20.0, 20.95], [25.0, 26.06], [29.0, 29.62], [32.0, 32.29], [40.0, 40.68], [52.0, 53.79], [63.0, 63.27], [67.0, 81.75], [85.0, 89.87], [93.0, 108.35], [109.0, 110.86], [114.0, 114.52], [119.0, 121.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 37.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.35, 28.77, 29.55, 0.0, 0.0, 67.25], "audiomae_on_audioset": [null, [["speech", 36.6], ["radio", 32.75], ["noise", 5.15]], null, null, null, null, null, null, null, null, [["speech", 47.04], ["vehicle", 16.21], ["car", 4.81]], [["vehicle", 45.61], ["speech", 33.72], ["car", 7.24]], [["vehicle", 34.47], ["car", 20.92], ["motorcycle", 6.02]], null, null, null], "duration": [0.71, 3.08, 1.62, 0.95, 1.06, 0.62, 0.29, 0.68, 1.79, 0.27, 14.75, 4.87, 15.35, 1.86, 0.52, 2.54]} \ No newline at end of file diff --git a/annotations_1/6QfunXjWCpc_filtered.json b/annotations_1/6QfunXjWCpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/6QfunXjWCpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/6R3tTi_m8VQ_filtered.json b/annotations_1/6R3tTi_m8VQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04a075fff7e3cce667c2074be08a68f2a9fd013a --- /dev/null +++ b/annotations_1/6R3tTi_m8VQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 28.43], [29.0, 30.79], [32.0, 33.07], [39.0, 39.92], [43.0, 44.42], [46.0, 47.34], [49.0, 50.45], [53.0, 62.09], [64.0, 64.17], [65.0, 69.89], [71.0, 72.82], [73.0, 74.06], [76.0, 76.96], [80.0, 81.63], [84.0, 85.09], [86.0, 88.47], [90.0, 99.3], [101.0, 102.91], [105.0, 111.05], [112.0, 112.99]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [33.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.87, 0.0, 50.36, 0.0, 0.0, 0.0, 0.0, 0.0, 62.78, 43.18, 0.0, 43.53, 0.0], "audiomae_on_audioset": [[["hum", 39.68], ["mains hum", 15.61], ["throbbing", 13.81]], null, null, null, null, null, null, [["speech", 29.89], ["hum", 25.69], ["throbbing", 14.76]], null, null, null, null, null, null, null, null, [["music", 53.42], ["hum", 3.82], ["throbbing", 2.66]], null, [["music", 33.03], ["throbbing", 24.06], ["hum", 17.44]], null], "duration": [7.43, 1.79, 1.07, 0.92, 1.42, 1.34, 1.45, 9.09, 0.17, 4.89, 1.82, 1.06, 0.96, 1.63, 1.09, 2.47, 9.3, 1.91, 6.05, 0.99]} \ No newline at end of file diff --git a/annotations_1/6RbMqRpNqmY_filtered.json b/annotations_1/6RbMqRpNqmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36acc62bda309c816dd315f4a3283c9808bbf3ac --- /dev/null +++ b/annotations_1/6RbMqRpNqmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.52], [4.0, 5.21], [6.0, 7.97], [10.0, 10.35], [11.0, 12.01], [13.0, 14.15], [15.0, 15.96], [19.0, 20.53], [21.0, 24.56], [26.0, 26.69], [30.0, 30.35], [32.0, 34.4], [35.0, 36.93], [38.0, 39.07], [43.0, 43.36], [48.0, 61.08], [67.0, 69.43], [74.0, 78.34], [79.0, 80.15], [81.0, 82.88], [85.0, 85.46], [90.0, 93.93], [95.0, 95.07], [96.0, 96.35], [98.0, 98.73], [101.0, 101.17], [103.0, 103.57], [104.0, 106.49], [109.0, 111.16], [112.0, 112.53], [114.0, 113.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 68.28, 31.44, 72.6, 0.0, 0.0, 0.0, 41.87, 0.0, 0.0, 0.0, 0.0, 0.0, 45.46, 31.63, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 12.09], ["music", 7.98], ["noise", 7.07]], null, null, null, null, [["hum", 45.18], ["speech", 11.53], ["mains hum", 7.69]], null, null, null, null, null, [["radio", 25.99], ["speech", 19.63], ["croak", 8.47]], [["speech", 49.72], ["inside, small room", 5.99], ["radio", 3.3]], null, null], "duration": [1.52, 1.21, 1.97, 0.35, 1.01, 1.15, 0.96, 1.53, 3.56, 0.69, 0.35, 2.4, 1.93, 1.07, 0.36, 13.08, 2.43, 4.34, 1.15, 1.88, 0.46, 3.93, 0.07, 0.35, 0.73, 0.17, 0.57, 2.49, 2.16, 0.53, -0.07]} \ No newline at end of file diff --git a/annotations_1/6TOx7qsyaxU_filtered.json b/annotations_1/6TOx7qsyaxU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6275d4fb4bd372c05ee2c62e806d71862ca6edde --- /dev/null +++ b/annotations_1/6TOx7qsyaxU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.22], [18.0, 19.48], [20.0, 23.14], [26.0, 36.17], [38.0, 42.82], [46.0, 46.52], [48.0, 48.15], [52.0, 53.18], [55.0, 54.95], [59.0, 59.34], [70.0, 71.12], [72.0, 72.57], [78.0, 78.41], [80.0, 80.96], [82.0, 84.43], [86.0, 89.24], [91.0, 91.35], [93.0, 93.23], [97.0, 97.75], [100.0, 100.7], [106.0, 106.73], [110.0, 114.39], [117.0, 117.1], [120.0, 120.68], [122.0, 123.47], [126.0, 172.0], [172.0, 174.11], [177.0, 179.15], [183.0, 188.79], [189.0, 190.44], [192.0, 195.13], [198.0, 198.24], [200.0, 202.59], [204.0, 222.44], [224.0, 225.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 37.26, 33.59, 65.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.78, 99.82, 0.0, 0.0, 0.0, 0.0, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 51.39, 77.2, 54.43, 0.0, 33.18, 0.0, 38.58, 33.67, 0.0], "audiomae_on_audioset": [null, null, [["moo", 32.75], ["livestock, farm animals, working animals", 22.95], ["cattle, bovinae", 22.04]], [["music", 61.79], ["fart", 7.95], ["didgeridoo", 6.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["bee, wasp, etc.", 13.33], ["throbbing", 9.79], ["fly, housefly", 9.27]], null, [["music", 48.24], ["theremin", 14.86], ["synthesizer", 4.58]], [["music", 60.05], ["speech", 16.01], ["theremin", 5.85]], null], "duration": [0.22, 1.48, 3.14, 10.17, 4.82, 0.52, 0.15, 1.18, -0.05, 0.34, 1.12, 0.57, 0.41, 0.96, 2.43, 3.24, 0.35, 0.23, 0.75, 0.7, 0.73, 4.39, 0.1, 0.68, 1.47, 46.0, 2.11, 2.15, 5.79, 1.44, 3.13, 0.24, 2.59, 18.44, 1.22]} \ No newline at end of file diff --git a/annotations_1/6TVik8mYxrY_filtered.json b/annotations_1/6TVik8mYxrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..775ddaca86a1a44383e2e75e063a5a6599e8bbba --- /dev/null +++ b/annotations_1/6TVik8mYxrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[143.0, 144.91], [146.0, 148.41]], "keep_status": [false, true], "silence_prob": [0.0, 43.18], "audiomae_on_audioset": [null, [["music", 41.54], ["synthesizer", 12.27], ["noise", 8.81]]], "duration": [1.91, 2.41]} \ No newline at end of file diff --git a/annotations_1/6T_01swH-OY_filtered.json b/annotations_1/6T_01swH-OY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1afb8e060759cb913c7dc7f99e3651b8fd34a732 --- /dev/null +++ b/annotations_1/6T_01swH-OY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.99], [7.0, 8.11], [9.0, 9.66], [11.0, 11.33], [13.0, 16.71], [17.0, 17.37], [23.0, 46.48], [48.0, 48.1], [49.0, 50.35], [52.0, 53.3], [56.0, 56.07], [59.0, 59.46], [61.0, 61.59], [69.0, 69.52], [70.0, 70.61], [82.0, 82.34], [88.0, 89.19], [91.0, 91.99], [94.0, 98.22], [99.0, 101.88], [103.0, 103.96], [106.0, 107.86], [109.0, 111.03], [112.0, 123.38], [124.0, 124.39], [125.0, 125.19], [128.0, 128.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.1, 0.0, 56.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.1, 68.54, 0.0, 0.0, 81.0, 96.42, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 1.11, 0.66, 0.33, 3.71, 0.37, 23.48, 0.1, 1.35, 1.3, 0.07, 0.46, 0.59, 0.52, 0.61, 0.34, 1.19, 0.99, 4.22, 2.88, 0.96, 1.86, 2.03, 11.38, 0.39, 0.19, 0.85]} \ No newline at end of file diff --git a/annotations_1/6Tax5ajZYsY_filtered.json b/annotations_1/6Tax5ajZYsY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..727a94d218ef2693e238fe7493d5c48e44b0ba72 --- /dev/null +++ b/annotations_1/6Tax5ajZYsY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.4], [5.0, 5.81], [11.0, 11.57], [15.0, 14.84], [15.0, 16.55], [17.0, 18.12], [20.0, 25.44], [27.0, 29.25], [35.0, 35.53], [36.0, 36.91], [41.0, 44.25], [53.0, 53.59], [55.0, 55.56], [57.0, 57.08], [62.0, 62.19], [69.0, 69.94], [73.0, 72.62], [78.0, 78.39], [81.0, 81.87], [83.0, 83.61], [85.0, 86.41], [87.0, 87.54], [89.0, 89.68], [90.0, 90.96], [93.0, 100.53], [102.0, 104.65], [107.0, 112.35], [115.0, 120.23], [124.0, 123.62], [126.0, 131.55], [132.0, 132.81], [134.0, 134.0], [135.0, 135.19], [136.0, 147.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 99.88, 0.0, 0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 86.27, 39.19, 53.28, 0.0, 31.8, 0.0, 0.0, 0.0, 42.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 17.02], ["noise", 16.58], ["music", 9.58]], null, null, [["breaking", 21.87], ["speech", 20.84], ["gunshot, gunfire", 18.55]], null, null, null, [["speech", 48.97], ["electric shaver, electric razor", 14.88], ["fart", 4.92]]], "duration": [0.4, 0.81, 0.57, -0.16, 1.55, 1.12, 5.44, 2.25, 0.53, 0.91, 3.25, 0.59, 0.56, 0.08, 0.19, 0.94, -0.38, 0.39, 0.87, 0.61, 1.41, 0.54, 0.68, 0.96, 7.53, 2.65, 5.35, 5.23, -0.38, 5.55, 0.81, 0.0, 0.19, 11.61]} \ No newline at end of file diff --git a/annotations_1/6Tz9krF1K68_filtered.json b/annotations_1/6Tz9krF1K68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4af68d82504d48d43c3585af1606e640b9582c3a --- /dev/null +++ b/annotations_1/6Tz9krF1K68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.97], [17.0, 17.47], [25.0, 25.08], [27.0, 29.42], [33.0, 33.47], [39.0, 39.31], [44.0, 43.82], [46.0, 47.49], [51.0, 50.94], [52.0, 92.67], [95.0, 95.28], [97.0, 96.69], [97.0, 104.75], [108.0, 107.91], [112.0, 111.74], [114.0, 114.25], [116.0, 116.18], [119.0, 119.7], [121.0, 121.61], [123.0, 123.15], [124.0, 124.43], [125.0, 125.78], [129.0, 129.52], [133.0, 133.39], [138.0, 139.45], [141.0, 140.91], [141.0, 141.69], [144.0, 144.31], [148.0, 147.9], [150.0, 150.08], [153.0, 153.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 79.61], ["radio", 4.53], ["sidetone", 3.72]], null, null, null, null, null, null, null, null, [["noise", 38.62], ["speech", 14.6], ["fart", 8.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.03, 0.47, 0.08, 2.42, 0.47, 0.31, -0.18, 1.49, -0.06, 40.67, 0.28, -0.31, 7.75, -0.09, -0.26, 0.25, 0.18, 0.7, 0.61, 0.15, 0.43, 0.78, 0.52, 0.39, 1.45, -0.09, 0.69, 0.31, -0.1, 0.08, 0.5]} \ No newline at end of file diff --git a/annotations_1/6Ua_T32yaic_filtered.json b/annotations_1/6Ua_T32yaic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0e1bf503dd1ea9c9ff98475466c1e1bb672aefe --- /dev/null +++ b/annotations_1/6Ua_T32yaic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.87], [5.0, 5.7], [6.0, 6.99], [10.0, 10.2], [15.0, 14.94], [15.0, 15.7], [16.0, 18.06], [21.0, 21.1], [23.0, 23.16], [27.0, 30.84], [31.0, 31.43], [32.0, 32.83], [35.0, 35.82], [37.0, 37.66], [40.0, 40.36], [41.0, 42.11], [44.0, 44.34], [45.0, 45.84], [46.0, 46.92], [53.0, 53.67], [55.0, 55.21], [58.0, 59.97], [66.0, 66.78], [67.0, 67.59], [71.0, 71.52], [72.0, 74.76], [75.0, 85.82], [87.0, 89.75], [90.0, 91.47], [92.0, 92.8], [93.0, 94.71], [97.0, 97.8], [99.0, 99.12], [102.0, 103.01], [103.0, 107.97], [110.0, 110.42], [119.0, 120.11], [121.0, 121.44], [125.0, 125.85], [126.0, 128.83], [138.0, 141.07], [141.0, 142.8], [152.0, 153.0], [161.0, 162.18], [162.0, 164.1], [165.0, 165.43], [166.0, 166.65], [168.0, 168.45], [186.0, 186.33], [187.0, 187.54], [188.0, 188.97], [191.0, 191.34], [192.0, 192.7], [194.0, 194.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 85.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.98, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 72.9, 100.0, 0.0, 0.0, 0.0, 84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.13, 0.7, 0.99, 0.2, -0.06, 0.7, 2.06, 0.1, 0.16, 3.84, 0.43, 0.83, 0.82, 0.66, 0.36, 1.11, 0.34, 0.84, 0.92, 0.67, 0.21, 1.97, 0.78, 0.59, 0.52, 2.76, 10.82, 2.75, 1.47, 0.8, 1.71, 0.8, 0.12, 1.01, 4.97, 0.42, 1.11, 0.44, 0.85, 2.83, 3.07, 1.8, 1.0, 1.18, 2.1, 0.43, 0.65, 0.45, 0.33, 0.54, 0.97, 0.34, 0.7, 0.37]} \ No newline at end of file diff --git a/annotations_1/6V22uyjiMpw_filtered.json b/annotations_1/6V22uyjiMpw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88b20bbd1a42f29347b87c3dbcec9778ae30f9c0 --- /dev/null +++ b/annotations_1/6V22uyjiMpw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [4.0, 8.01], [8.0, 8.51], [13.0, 14.61], [19.0, 19.58], [28.0, 31.5], [34.0, 41.76], [56.0, 56.39], [58.0, 59.54], [62.0, 74.07], [75.0, 76.91], [80.0, 89.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 59.86, 0.0, 0.0, 0.0, 94.66, 85.9, 0.0, 0.0, 51.77, 0.0, 68.41], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.42, 4.01, 0.51, 1.61, 0.58, 3.5, 7.76, 0.39, 1.54, 12.07, 1.91, 9.72]} \ No newline at end of file diff --git a/annotations_1/6VhCGQODB5U_filtered.json b/annotations_1/6VhCGQODB5U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66fe1f4ae6c2505d12239389c5869a27b8806bb3 --- /dev/null +++ b/annotations_1/6VhCGQODB5U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.47], [4.0, 4.97], [10.0, 10.45], [12.0, 12.88], [13.0, 13.42], [15.0, 17.27], [19.0, 18.94], [20.0, 20.87], [25.0, 25.2], [25.0, 26.42], [27.0, 27.72], [29.0, 29.76], [31.0, 32.39], [33.0, 33.98], [36.0, 36.53], [37.0, 38.87], [43.0, 43.31], [64.0, 64.29], [69.0, 70.63], [73.0, 73.26], [75.0, 77.33], [87.0, 88.47], [92.0, 92.8], [95.0, 95.91], [96.0, 99.01], [101.0, 101.63], [110.0, 110.64], [115.0, 116.02], [120.0, 129.86], [131.0, 131.04], [132.0, 133.59], [136.0, 137.3], [139.0, 139.24], [141.0, 142.42], [143.0, 144.64], [146.0, 147.06], [148.0, 148.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 81.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0, 0.0, 31.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 58.42], ["speech", 21.35], ["electric shaver, electric razor", 3.85]], null, null, null, null, null, null, null, null], "duration": [1.47, 0.97, 0.45, 0.88, 0.42, 2.27, -0.06, 0.87, 0.2, 1.42, 0.72, 0.76, 1.39, 0.98, 0.53, 1.87, 0.31, 0.29, 1.63, 0.26, 2.33, 1.47, 0.8, 0.91, 3.01, 0.63, 0.64, 1.02, 9.86, 0.04, 1.59, 1.3, 0.24, 1.42, 1.64, 1.06, 0.66]} \ No newline at end of file diff --git a/annotations_1/6VvluTE_w14_filtered.json b/annotations_1/6VvluTE_w14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecb06c4630c134ba19bcba7b438b3b6042eec062 --- /dev/null +++ b/annotations_1/6VvluTE_w14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.53], [4.0, 5.27], [7.0, 7.5], [10.0, 10.62], [13.0, 16.51], [25.0, 26.84], [29.0, 29.74], [36.0, 37.42], [39.0, 41.4], [43.0, 73.35]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 28.97, 0.0, 0.0, 0.0, 31.38, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 42.53], ["mains hum", 19.45], ["music", 11.18]], null, null, null, [["music", 36.17], ["speech", 23.1], ["hum", 7.91]], null], "duration": [0.53, 1.27, 0.5, 0.62, 3.51, 1.84, 0.74, 1.42, 2.4, 30.35]} \ No newline at end of file diff --git a/annotations_1/6WX8Ct4xMvE_filtered.json b/annotations_1/6WX8Ct4xMvE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90a0d122eb141876720e65c61b4407cced3bed32 --- /dev/null +++ b/annotations_1/6WX8Ct4xMvE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.15], [14.0, 14.18], [23.0, 24.39], [28.0, 28.68], [32.0, 33.12], [34.0, 37.03], [38.0, 39.93], [42.0, 42.82], [52.0, 54.78], [57.0, 59.14], [63.0, 63.8], [70.0, 70.61], [76.0, 76.57], [77.0, 78.14], [81.0, 80.86], [81.0, 82.86], [87.0, 88.35], [91.0, 93.24], [94.0, 94.91], [96.0, 96.63], [98.0, 98.22], [103.0, 104.04], [104.0, 105.9], [106.0, 107.99], [110.0, 111.1], [113.0, 113.26], [118.0, 119.75], [123.0, 124.85], [126.0, 126.45], [128.0, 131.18], [140.0, 140.83], [155.0, 155.93], [164.0, 165.96], [173.0, 174.48], [177.0, 178.11], [179.0, 180.12]], "keep_status": [false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 48.91, 0.0, 0.0, 34.05, 32.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 44.22], ["whale vocalization", 12.5], ["hum", 4.82]], null, null, [["music", 29.11], ["ping", 6.15], ["gong", 5.4]], [["mains hum", 30.17], ["hum", 16.07], ["speech", 11.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.15, 0.18, 1.39, 0.68, 1.12, 3.03, 1.93, 0.82, 2.78, 2.14, 0.8, 0.61, 0.57, 1.14, -0.14, 1.86, 1.35, 2.24, 0.91, 0.63, 0.22, 1.04, 1.9, 1.99, 1.1, 0.26, 1.75, 1.85, 0.45, 3.18, 0.83, 0.93, 1.96, 1.48, 1.11, 1.12]} \ No newline at end of file diff --git a/annotations_1/6XRJuEv5Ya4_filtered.json b/annotations_1/6XRJuEv5Ya4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41e09595fa74b47db4688b551ee2d392a632441f --- /dev/null +++ b/annotations_1/6XRJuEv5Ya4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.88], [6.0, 8.19], [9.0, 10.47], [12.0, 12.41], [13.0, 13.53], [15.0, 15.28], [16.0, 17.0], [18.0, 19.03], [20.0, 21.03], [26.0, 27.35], [27.0, 28.75], [30.0, 31.01], [33.0, 33.67], [34.0, 45.84], [53.0, 54.7], [56.0, 63.31], [68.0, 68.17], [75.0, 75.47], [78.0, 78.29], [79.0, 79.22], [81.0, 80.91], [82.0, 82.93], [84.0, 84.89], [86.0, 87.02], [91.0, 95.69], [97.0, 97.51], [103.0, 104.9], [107.0, 112.55], [116.0, 115.97], [118.0, 119.92], [120.0, 121.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [59.59, 60.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.53, 0.0, 49.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.52, 0.0, 0.0, 50.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.16], ["brass instrument", 25.19], ["trombone", 11.31]], null, [["hum", 42.95], ["mains hum", 32.74], ["throbbing", 7.13]], null, null, null, null, null, null, null, null, [["horse", 36.21], ["clip-clop", 29.09], ["speech", 4.0]], null, null, null, null, null, null], "duration": [2.88, 2.19, 1.47, 0.41, 0.53, 0.28, 1.0, 1.03, 1.03, 1.35, 1.75, 1.01, 0.67, 11.84, 1.7, 7.31, 0.17, 0.47, 0.29, 0.22, -0.09, 0.93, 0.89, 1.02, 4.69, 0.51, 1.9, 5.55, -0.03, 1.92, 1.05]} \ No newline at end of file diff --git a/annotations_1/6Xn4tr2grtc_filtered.json b/annotations_1/6Xn4tr2grtc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df5877c92d9f75a535fb447703dbe675936455df --- /dev/null +++ b/annotations_1/6Xn4tr2grtc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [9.0, 9.26], [14.0, 18.23], [18.0, 29.86], [36.0, 41.44], [46.0, 59.0], [61.0, 62.85], [64.0, 64.84], [66.0, 66.01], [66.0, 68.08], [74.0, 75.63]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 30.11, 29.28, 29.82, 30.7, 0.0, 0.0, 0.0, 30.81, 0.0], "audiomae_on_audioset": [null, null, [["music", 54.53], ["speech", 18.15], ["electronic music", 2.99]], [["music", 51.23], ["speech", 10.38], ["boing", 9.16]], [["music", 31.05], ["speech", 21.72], ["sheep", 7.33]], [["music", 51.99], ["speech", 31.39], ["electronic music", 2.46]], null, null, null, [["whip", 52.62], ["mosquito", 6.62], ["fart", 5.84]], null], "duration": [0.04, 0.26, 4.23, 11.86, 5.44, 13.0, 1.85, 0.84, 0.01, 2.08, 1.63]} \ No newline at end of file diff --git a/annotations_1/6ZgWwouKUXg_filtered.json b/annotations_1/6ZgWwouKUXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5472f4dbfa4267c922bc2f47838b52541f247e40 --- /dev/null +++ b/annotations_1/6ZgWwouKUXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.18], [5.0, 5.41], [17.0, 17.12], [22.0, 22.3], [24.0, 24.81], [30.0, 30.2], [33.0, 32.9], [34.0, 34.3], [36.0, 36.12], [41.0, 41.62], [48.0, 48.98], [51.0, 56.42], [57.0, 57.84], [60.0, 60.03], [61.0, 61.5], [62.0, 64.12], [77.0, 77.95], [84.0, 84.08], [93.0, 93.58], [100.0, 102.12], [108.0, 110.81], [112.0, 115.11], [118.0, 120.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.35, 0.0, 0.0, 0.0, 38.67, 0.0, 0.0, 0.0, 33.43, 37.66, 34.42, 36.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 63.11], ["musical instrument", 5.26], ["hum", 4.98]], null, null, null, [["cowbell", 46.13], ["livestock, farm animals, working animals", 30.79], ["cattle, bovinae", 9.58]], null, null, null, [["music", 53.56], ["musical instrument", 7.06], ["synthesizer", 3.51]], [["music", 30.08], ["hum", 18.0], ["mains hum", 12.0]], [["speech", 36.91], ["mains hum", 16.96], ["hum", 11.64]], [["music", 57.41], ["hum", 6.71], ["synthesizer", 6.65]]], "duration": [0.18, 0.41, 0.12, 0.3, 0.81, 0.2, -0.1, 0.3, 0.12, 0.62, 0.98, 5.42, 0.84, 0.03, 0.5, 2.12, 0.95, 0.08, 0.58, 2.12, 2.81, 3.11, 2.78]} \ No newline at end of file diff --git a/annotations_1/6ZygVYbMrfc_filtered.json b/annotations_1/6ZygVYbMrfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbb82a6b514c1db7e1f8f0cedd225a8e392c583a --- /dev/null +++ b/annotations_1/6ZygVYbMrfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 33.3], [34.0, 51.98], [56.0, 59.07], [61.0, 74.41], [76.0, 75.91], [79.0, 97.92], [100.0, 101.43], [103.0, 104.43], [106.0, 109.97], [114.0, 121.04]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [29.96, 29.93, 30.04, 31.27, 0.0, 30.04, 0.0, 0.0, 30.26, 29.85], "audiomae_on_audioset": [[["music", 73.05], ["throbbing", 11.28], ["hum", 5.06]], [["mains hum", 37.03], ["hum", 34.76], ["throbbing", 8.02]], [["music", 60.45], ["throbbing", 5.37], ["musical instrument", 3.99]], [["music", 73.46], ["throbbing", 6.3], ["electronic music", 4.34]], null, [["speech", 49.74], ["music", 12.34], ["buzz", 9.14]], null, null, [["fly, housefly", 48.68], ["insect", 15.57], ["buzz", 7.73]], [["music", 34.38], ["hum", 27.87], ["mains hum", 13.08]]], "duration": [23.3, 17.98, 3.07, 13.41, -0.09, 18.92, 1.43, 1.43, 3.97, 7.04]} \ No newline at end of file diff --git a/annotations_1/6_Ed23ettio_filtered.json b/annotations_1/6_Ed23ettio_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cddacfdb9992d1f6034f81a7fc0b25f1efd144b0 --- /dev/null +++ b/annotations_1/6_Ed23ettio_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.97], [7.0, 7.74], [9.0, 30.35], [31.0, 37.35], [41.0, 113.43]], "keep_status": [false, false, true, true, false], "silence_prob": [0.0, 0.0, 39.3, 32.06, 0.0], "audiomae_on_audioset": [null, null, [["hum", 28.42], ["throbbing", 15.64], ["music", 10.81]], [["music", 25.98], ["livestock, farm animals, working animals", 7.58], ["grunt", 6.69]], null], "duration": [0.97, 0.74, 21.35, 6.35, 72.43]} \ No newline at end of file diff --git a/annotations_1/6_eBGV71X0w_filtered.json b/annotations_1/6_eBGV71X0w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38ed979e3bbeda8eb9a6c69c5178640a2fa768aa --- /dev/null +++ b/annotations_1/6_eBGV71X0w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.43], [32.0, 40.53], [44.0, 45.59], [49.0, 50.53], [51.0, 50.9], [51.0, 52.12], [56.0, 56.89], [67.0, 70.44], [72.0, 72.76], [73.0, 73.41], [73.0, 73.92], [79.0, 79.08], [80.0, 83.15], [85.0, 89.78], [97.0, 100.95], [103.0, 104.62], [105.0, 104.65], [107.0, 107.91], [109.0, 109.27], [110.0, 111.84], [127.0, 127.06], [128.0, 131.45], [136.0, 136.73], [141.0, 141.76], [145.0, 145.35], [148.0, 149.64], [150.0, 151.06], [156.0, 156.05], [158.0, 157.74], [160.0, 160.54], [164.0, 164.89], [175.0, 180.74], [181.0, 181.74], [187.0, 187.05], [187.0, 187.91], [189.0, 189.67], [191.0, 191.2], [196.0, 197.07], [204.0, 205.02]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.93, 0.0, 0.0, 0.0, 0.0, 0.0, 46.86, 0.0, 0.0, 0.0, 0.0, 38.36, 38.75, 36.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["whale vocalization", 31.02], ["music", 26.44], ["hum", 6.42]], null, null, null, null, null, [["music", 37.72], ["synthesizer", 7.73], ["hiccup", 3.65]], null, null, null, null, [["music", 26.72], ["speech", 19.76], ["hum", 18.17]], [["mains hum", 22.01], ["hum", 18.71], ["music", 14.19]], [["speech", 37.56], ["music", 20.39], ["groan", 4.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 44.62], ["music", 27.09], ["theremin", 7.89]], null, null, null, null, null, null, null], "duration": [0.43, 8.53, 1.59, 1.53, -0.1, 1.12, 0.89, 3.44, 0.76, 0.41, 0.92, 0.08, 3.15, 4.78, 3.95, 1.62, -0.35, 0.91, 0.27, 1.84, 0.06, 3.45, 0.73, 0.76, 0.35, 1.64, 1.06, 0.05, -0.26, 0.54, 0.89, 5.74, 0.74, 0.05, 0.91, 0.67, 0.2, 1.07, 1.02]} \ No newline at end of file diff --git a/annotations_1/6_u456zQtkY_filtered.json b/annotations_1/6_u456zQtkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47a842e15aeed8413a7c3a7edb0e44848d0ca2d7 --- /dev/null +++ b/annotations_1/6_u456zQtkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[111.0, 113.17]], "keep_status": [false], "silence_prob": [72.6], "audiomae_on_audioset": [null], "duration": [2.17]} \ No newline at end of file diff --git a/annotations_1/6_yYxTkdIk8_filtered.json b/annotations_1/6_yYxTkdIk8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cab8d8d67df6f05d9184828f76401c8535c54a59 --- /dev/null +++ b/annotations_1/6_yYxTkdIk8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.2], [12.0, 12.21], [15.0, 15.89], [18.0, 21.54], [43.0, 46.21], [54.0, 69.26], [73.0, 101.09], [101.0, 105.48], [106.0, 114.17], [117.0, 121.34], [125.0, 125.41], [127.0, 129.24], [130.0, 130.76], [132.0, 135.3], [136.0, 137.3], [138.0, 139.08], [139.0, 143.33], [145.0, 149.25], [150.0, 151.14], [152.0, 155.53], [158.0, 162.89], [164.0, 166.43], [167.0, 169.28]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.96, 0.0, 0.0, 81.17, 55.25, 40.7, 43.15, 47.01, 46.12, 80.11, 0.0, 94.07, 0.0, 92.64, 0.0, 0.0, 99.9, 92.64, 0.0, 82.07, 78.38, 84.43, 82.43], "audiomae_on_audioset": [null, null, null, null, null, [["music", 37.59], ["speech", 30.8], ["groan", 6.24]], [["music", 49.7], ["didgeridoo", 15.11], ["musical instrument", 5.8]], [["music", 47.87], ["theremin", 8.16], ["scary music", 4.87]], [["music", 70.72], ["scary music", 6.18], ["grunt", 2.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.2, 0.21, 0.89, 3.54, 3.21, 15.26, 28.09, 4.48, 8.17, 4.34, 0.41, 2.24, 0.76, 3.3, 1.3, 1.08, 4.33, 4.25, 1.14, 3.53, 4.89, 2.43, 2.28]} \ No newline at end of file diff --git a/annotations_1/6bO4ZsAMowI_filtered.json b/annotations_1/6bO4ZsAMowI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6b671249d55d7a69b48e3d7857af8eb6425c9bb --- /dev/null +++ b/annotations_1/6bO4ZsAMowI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 21.1], [23.0, 24.14], [28.0, 34.03], [35.0, 46.25], [47.0, 49.55], [51.0, 52.91], [54.0, 54.01], [55.0, 55.46], [58.0, 60.69]], "keep_status": [false, false, false, true, true, false, false, false, true], "silence_prob": [29.79, 0.0, 97.54, 32.06, 39.4, 0.0, 0.0, 0.0, 32.17], "audiomae_on_audioset": [[["music", 48.2], ["speech", 20.08], ["sidetone", 12.25]], null, null, [["speech", 55.52], ["explosion", 9.65], ["whack, thwack", 3.96]], [["music", 28.17], ["crushing", 22.64], ["chirp tone", 12.18]], null, null, null, [["music", 46.61], ["scary music", 8.77], ["theremin", 6.4]]], "duration": [11.1, 1.14, 6.03, 11.25, 2.55, 1.91, 0.01, 0.46, 2.69]} \ No newline at end of file diff --git a/annotations_1/6dA4C1NKChE_filtered.json b/annotations_1/6dA4C1NKChE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9dfbbf37ecf0333978d72d08ead2ab8f03c5395 --- /dev/null +++ b/annotations_1/6dA4C1NKChE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 23.01], [24.0, 25.68], [35.0, 36.83], [41.0, 41.99], [44.0, 44.37], [46.0, 46.82], [47.0, 47.58], [50.0, 49.89], [51.0, 53.05], [53.0, 55.38], [61.0, 61.64], [62.0, 62.73], [63.0, 63.73], [67.0, 67.51], [68.0, 69.6], [75.0, 74.83], [77.0, 78.39], [83.0, 84.28], [85.0, 88.65], [93.0, 94.15], [96.0, 96.96], [97.0, 97.87], [99.0, 99.84], [103.0, 103.87], [117.0, 117.71], [122.0, 123.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [76.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.0, 75.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 71.04], ["sine wave", 4.26], ["sidetone", 2.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [13.01, 1.68, 1.83, 0.99, 0.37, 0.82, 0.58, -0.11, 2.05, 2.38, 0.64, 0.73, 0.73, 0.51, 1.6, -0.17, 1.39, 1.28, 3.65, 1.15, 0.96, 0.87, 0.84, 0.87, 0.71, 1.06]} \ No newline at end of file diff --git a/annotations_1/6dDbnwQlCek_filtered.json b/annotations_1/6dDbnwQlCek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22ed299df9c944516b94433d4df63e6a6e5df59b --- /dev/null +++ b/annotations_1/6dDbnwQlCek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.64], [16.0, 23.03], [25.0, 25.76], [27.0, 27.36], [29.0, 38.08], [41.0, 42.33], [44.0, 50.38], [52.0, 64.17], [68.0, 69.15], [71.0, 73.94], [80.0, 81.23], [84.0, 84.89], [95.0, 102.79], [105.0, 106.46], [108.0, 111.18], [113.0, 114.39], [118.0, 133.2], [133.0, 133.44], [135.0, 136.71], [138.0, 145.37], [147.0, 148.04], [151.0, 151.87], [161.0, 169.2], [172.0, 173.52], [175.0, 178.01], [181.0, 206.46], [209.0, 217.83]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 31.14, 0.0, 0.0, 30.39, 0.0, 29.92, 30.31, 0.0, 30.65, 0.0, 0.0, 29.49, 0.0, 29.21, 0.0, 30.03, 0.0, 0.0, 29.6, 0.0, 0.0, 29.4, 0.0, 29.17, 29.41, 29.02], "audiomae_on_audioset": [null, [["music", 71.69], ["singing", 1.95], ["carnatic music", 1.53]], null, null, [["music", 64.45], ["carnatic music", 8.0], ["wind instrument, woodwind instrument", 3.12]], null, [["music", 32.99], ["reggae", 4.45], ["swing music", 3.43]], [["music", 54.71], ["carnatic music", 20.32], ["sitar", 4.99]], null, [["music", 65.28], ["musical instrument", 4.02], ["guitar", 2.54]], null, null, [["music", 53.57], ["carnatic music", 26.57], ["chant", 2.43]], null, [["music", 49.28], ["foghorn", 11.7], ["middle eastern music", 4.58]], null, [["music", 48.42], ["didgeridoo", 8.28], ["carnatic music", 3.91]], null, null, [["music", 66.35], ["carnatic music", 2.3], ["musical instrument", 2.14]], null, null, [["music", 57.02], ["middle eastern music", 5.28], ["carnatic music", 4.84]], null, [["music", 45.57], ["wind instrument, woodwind instrument", 5.09], ["harmonica", 5.04]], [["music", 95.97], ["musical instrument", 0.42], ["harmonica", 0.24]], [["music", 67.63], ["sitar", 7.04], ["middle eastern music", 5.16]]], "duration": [1.64, 7.03, 0.76, 0.36, 9.08, 1.33, 6.38, 12.17, 1.15, 2.94, 1.23, 0.89, 7.79, 1.46, 3.18, 1.39, 15.2, 0.44, 1.71, 7.37, 1.04, 0.87, 8.2, 1.52, 3.01, 25.46, 8.83]} \ No newline at end of file diff --git a/annotations_1/6e4xlcfKHxY_filtered.json b/annotations_1/6e4xlcfKHxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..878e791846a63767df5f9bf3a3183699dc2b0bd4 --- /dev/null +++ b/annotations_1/6e4xlcfKHxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.35], [4.0, 4.06], [4.0, 5.12], [6.0, 6.78], [7.0, 7.87], [11.0, 12.88], [15.0, 17.52], [20.0, 20.51], [22.0, 22.13], [23.0, 23.4], [24.0, 26.0], [27.0, 27.95], [29.0, 30.69], [34.0, 34.65], [35.0, 36.04], [36.0, 37.17], [38.0, 38.94], [47.0, 47.56], [48.0, 49.28], [52.0, 52.69], [54.0, 55.81], [60.0, 63.42], [71.0, 76.11], [77.0, 77.28], [78.0, 79.42], [80.0, 81.87], [84.0, 84.5], [85.0, 88.16], [90.0, 90.9], [94.0, 94.49], [95.0, 104.25], [105.0, 106.47], [110.0, 116.68], [119.0, 131.87], [136.0, 136.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 41.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.95, 34.9, 0.0, 0.0, 0.0, 0.0, 42.55, 0.0, 0.0, 37.09, 0.0, 40.31, 33.12, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 70.45], ["telephone", 2.94], ["inside, small room", 2.85]], null, null, null, null, null, null, null, null, null, null, null, [["music", 28.03], ["speech", 22.3], ["synthesizer", 12.1]], null, null, null, null, [["music", 40.85], ["theremin", 10.32], ["ice cream truck, ice cream van", 9.4]], null, null, [["music", 61.01], ["insect", 7.39], ["mosquito", 5.99]], null, [["music", 40.22], ["fly, housefly", 6.43], ["insect", 6.03]], [["music", 79.07], ["theremin", 5.83], ["didgeridoo", 2.8]], null], "duration": [1.35, 0.06, 1.12, 0.78, 0.87, 1.88, 2.52, 0.51, 0.13, 0.4, 2.0, 0.95, 1.69, 0.65, 1.04, 1.17, 0.94, 0.56, 1.28, 0.69, 1.81, 3.42, 5.11, 0.28, 1.42, 1.87, 0.5, 3.16, 0.9, 0.49, 9.25, 1.47, 6.68, 12.87, 0.31]} \ No newline at end of file diff --git a/annotations_1/6eW1ht2HbtQ_filtered.json b/annotations_1/6eW1ht2HbtQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..630f78e82f02a24800ba2c034b5d7e596c83d6f3 --- /dev/null +++ b/annotations_1/6eW1ht2HbtQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.76], [6.0, 6.05], [9.0, 9.78], [12.0, 13.68], [23.0, 24.44], [26.0, 43.04], [44.0, 47.97], [49.0, 50.25], [52.0, 52.3], [57.0, 63.36], [64.0, 65.69], [66.0, 67.74], [68.0, 80.97], [84.0, 112.62], [113.0, 115.43], [118.0, 128.33], [131.0, 136.48], [138.0, 139.36], [141.0, 143.9], [147.0, 156.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 76.7, 58.22, 0.0, 0.0, 47.35, 0.0, 0.0, 51.94, 45.14, 49.78, 46.26, 71.43, 0.0, 65.09, 52.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 63.95], ["ambient music", 8.43], ["hum", 5.41]], null, null, null, [["music", 62.09], ["ambient music", 9.47], ["singing bowl", 7.22]], [["music", 63.6], ["throbbing", 4.17], ["hum", 2.21]], [["hum", 29.82], ["throbbing", 25.6], ["music", 19.17]], null, null, null, null], "duration": [-0.24, 0.05, 0.78, 1.68, 1.44, 17.04, 3.97, 1.25, 0.3, 6.36, 1.69, 1.74, 12.97, 28.62, 2.43, 10.33, 5.48, 1.36, 2.9, 9.79]} \ No newline at end of file diff --git a/annotations_1/6fJNyx7kI6w_filtered.json b/annotations_1/6fJNyx7kI6w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..592073d4512da9caecdad50b906c5b4826402e26 --- /dev/null +++ b/annotations_1/6fJNyx7kI6w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.59], [24.0, 23.89], [28.0, 31.18], [37.0, 38.08], [39.0, 39.77], [44.0, 46.47], [56.0, 56.25], [59.0, 61.21], [75.0, 76.91], [79.0, 79.83], [98.0, 98.96], [121.0, 122.0], [125.0, 125.2], [126.0, 126.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 85.54, 0.0, 0.0, 74.29, 0.0, 65.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.59, -0.11, 3.18, 1.08, 0.77, 2.47, 0.25, 2.21, 1.91, 0.83, 0.96, 1.0, 0.2, 0.47]} \ No newline at end of file diff --git a/annotations_1/6hT5xOszncI_filtered.json b/annotations_1/6hT5xOszncI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7776d07bb93604f97cbcefc1532d8df174c0c79a --- /dev/null +++ b/annotations_1/6hT5xOszncI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 36.42], [39.0, 43.55], [45.0, 48.39], [49.0, 68.66], [70.0, 98.64], [100.0, 103.98], [105.0, 117.14], [121.0, 133.88], [135.0, 137.51]], "keep_status": [false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 31.59, 31.44, 28.85, 31.57, 32.83, 32.68, 31.92, 36.52], "audiomae_on_audioset": [null, [["throbbing", 41.14], ["hum", 36.02], ["music", 4.35]], [["hum", 51.86], ["throbbing", 33.08], ["mains hum", 5.15]], [["speech", 52.63], ["hum", 17.34], ["music", 7.77]], [["throbbing", 37.2], ["hum", 31.82], ["music", 14.89]], [["speech", 17.71], ["frog", 17.07], ["rumble", 4.95]], [["hum", 50.04], ["mains hum", 20.44], ["throbbing", 11.03]], [["throbbing", 46.68], ["hum", 35.62], ["music", 6.81]], [["hum", 25.05], ["throbbing", 12.88], ["white noise", 9.59]]], "duration": [1.42, 4.55, 3.39, 19.66, 28.64, 3.98, 12.14, 12.88, 2.51]} \ No newline at end of file diff --git a/annotations_1/6hUiaXXj_Hg_filtered.json b/annotations_1/6hUiaXXj_Hg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..899cbde39463d4cdb69cf23144e04b899f2197e9 --- /dev/null +++ b/annotations_1/6hUiaXXj_Hg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 67.63], [69.0, 110.73], [113.0, 114.93], [116.0, 121.44], [123.0, 123.62]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.1, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 29.91], ["speech", 23.74], ["throbbing", 12.67]], null], "duration": [32.63, 41.73, 1.93, 5.44, 0.62]} \ No newline at end of file diff --git a/annotations_1/6i7cWj1WqDU_filtered.json b/annotations_1/6i7cWj1WqDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b3a1606dac7bb377b00ac25b551cd4c76ac8116 --- /dev/null +++ b/annotations_1/6i7cWj1WqDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 67.59], [69.0, 69.99], [70.0, 82.31], [85.0, 85.11], [86.0, 88.99], [91.0, 131.48]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 63.64, 0.0, 73.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.59, 0.99, 12.31, 0.11, 2.99, 40.48]} \ No newline at end of file diff --git a/annotations_1/6ikH1EFDm6A_filtered.json b/annotations_1/6ikH1EFDm6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..008a3b8a7d64731cbc7592b0fd3cc87a6b167e3b --- /dev/null +++ b/annotations_1/6ikH1EFDm6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.99], [20.0, 23.36], [27.0, 28.76], [31.0, 32.97], [37.0, 37.05], [38.0, 40.42], [67.0, 67.71], [75.0, 75.02], [77.0, 84.15], [90.0, 103.79], [105.0, 106.44], [109.0, 110.0], [111.0, 112.29], [112.0, 112.78], [117.0, 118.18], [120.0, 120.75], [127.0, 127.3], [130.0, 131.62]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 48.82, 0.0, 0.0, 0.0, 30.95, 0.0, 0.0, 31.53, 35.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["burping, eructation", 68.71], ["speech", 3.91], ["hum", 1.64]], null, null, null, [["speech", 34.9], ["music", 25.07], ["quack", 5.78]], null, null, [["speech", 73.11], ["thunk", 3.43], ["hum", 2.0]], [["thunk", 22.34], ["whack, thwack", 19.99], ["music", 11.88]], null, null, null, null, null, null, null, null], "duration": [0.99, 3.36, 1.76, 1.97, 0.05, 2.42, 0.71, 0.02, 7.15, 13.79, 1.44, 1.0, 1.29, 0.78, 1.18, 0.75, 0.3, 1.62]} \ No newline at end of file diff --git a/annotations_1/6j-vjtJ7PRI_filtered.json b/annotations_1/6j-vjtJ7PRI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d1d8dc17ec7191052c68696a29361c3a164eaa1 --- /dev/null +++ b/annotations_1/6j-vjtJ7PRI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.56], [12.0, 12.46], [13.0, 14.05], [15.0, 17.95], [23.0, 40.24], [42.0, 48.83], [51.0, 54.77], [61.0, 61.59], [62.0, 75.88], [77.0, 85.6], [86.0, 92.85], [93.0, 100.9], [104.0, 104.55], [105.0, 105.49], [108.0, 131.9], [133.0, 134.6], [136.0, 136.26], [138.0, 145.32]], "keep_status": [false, false, false, false, true, false, true, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.28, 31.46, 33.83, 32.98, 0.0, 33.4, 39.19, 63.42, 37.65, 0.0, 0.0, 31.28, 0.0, 0.0, 34.6], "audiomae_on_audioset": [null, null, null, [["speech", 53.89], ["music", 21.78], ["hum", 6.3]], [["rumble", 26.39], ["hum", 17.08], ["music", 12.01]], [["speech", 44.91], ["music", 15.86], ["didgeridoo", 12.87]], [["burping, eructation", 23.4], ["buzz", 22.91], ["speech", 6.85]], null, [["music", 40.79], ["hum", 16.97], ["throbbing", 13.29]], [["music", 49.37], ["arrow", 11.05], ["thump, thud", 3.42]], null, [["speech", 44.56], ["sonar", 12.02], ["hum", 9.13]], null, null, [["speech", 50.17], ["music", 20.32], ["hum", 4.7]], null, null, [["throbbing", 42.1], ["music", 25.61], ["hum", 15.3]]], "duration": [0.56, 0.46, 1.05, 2.95, 17.24, 6.83, 3.77, 0.59, 13.88, 8.6, 6.85, 7.9, 0.55, 0.49, 23.9, 1.6, 0.26, 7.32]} \ No newline at end of file diff --git a/annotations_1/6kN5IkXFwcQ_filtered.json b/annotations_1/6kN5IkXFwcQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..365b5b4f7024c9686fdaa8466e418f6e9cf2cd21 --- /dev/null +++ b/annotations_1/6kN5IkXFwcQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 29.88], [30.0, 31.06]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.88, 1.06]} \ No newline at end of file diff --git a/annotations_1/6kktAYxwo7M_filtered.json b/annotations_1/6kktAYxwo7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d137ddabc905109c4ac72cd5e2d44a81be48025 --- /dev/null +++ b/annotations_1/6kktAYxwo7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.5], [14.0, 15.01], [18.0, 37.37], [39.0, 40.78], [43.0, 43.88], [44.0, 52.56], [53.0, 53.03], [53.0, 53.43], [54.0, 56.35], [59.0, 72.87], [75.0, 76.77], [77.0, 87.3], [89.0, 89.09], [90.0, 92.16], [95.0, 94.91], [97.0, 98.85], [100.0, 100.99], [101.0, 102.79], [105.0, 106.25], [106.0, 112.46], [114.0, 114.0], [117.0, 117.69], [122.0, 128.71]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.48, 0.0, 36.21, 0.0, 0.0, 45.65, 0.0, 0.0, 59.86, 48.65, 0.0, 41.74, 0.0, 42.44, 0.0, 0.0, 0.0, 0.0, 0.0, 77.53, 0.0, 0.0, 44.69], "audiomae_on_audioset": [[["whack, thwack", 17.65], ["speech", 11.23], ["thump, thud", 5.92]], null, [["speech", 14.23], ["animal", 9.0], ["whack, thwack", 7.56]], null, null, [["noise", 64.34], ["speech", 7.64], ["whale vocalization", 4.37]], null, null, null, [["insect", 31.34], ["fly, housefly", 30.85], ["mosquito", 11.47]], null, [["speech", 20.88], ["electric shaver, electric razor", 12.6], ["livestock, farm animals, working animals", 10.42]], null, [["radio", 26.9], ["speech", 24.07], ["whale vocalization", 19.06]], null, null, null, null, null, null, null, null, [["noise", 55.27], ["wild animals", 9.79], ["insect", 5.46]]], "duration": [4.5, 1.01, 19.37, 1.78, 0.88, 8.56, 0.03, 0.43, 2.35, 13.87, 1.77, 10.3, 0.09, 2.16, -0.09, 1.85, 0.99, 1.79, 1.25, 6.46, 0.0, 0.69, 6.71]} \ No newline at end of file diff --git a/annotations_1/6l0tsxNujWA_filtered.json b/annotations_1/6l0tsxNujWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..258802b323c6a1cca0307188df7c33f95579b222 --- /dev/null +++ b/annotations_1/6l0tsxNujWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.83], [15.0, 15.47], [17.0, 18.39], [21.0, 22.42], [23.0, 34.86], [37.0, 37.62], [40.0, 40.96], [41.0, 42.31], [50.0, 51.27], [52.0, 53.0], [58.0, 58.75]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["fly, housefly", 29.68], ["buzz", 21.58], ["insect", 18.36]], null, null, null, null, null, null], "duration": [0.83, 0.47, 1.39, 1.42, 11.86, 0.62, 0.96, 1.31, 1.27, 1.0, 0.75]} \ No newline at end of file diff --git a/annotations_1/6ldKc6yXTyg_filtered.json b/annotations_1/6ldKc6yXTyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df7150cc7e455a7cba670c7b1a570e1f3563c857 --- /dev/null +++ b/annotations_1/6ldKc6yXTyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.8], [17.0, 17.76], [20.0, 20.78], [21.0, 24.48], [29.0, 31.99], [36.0, 38.74], [40.0, 40.8], [42.0, 43.48], [45.0, 45.23], [47.0, 48.37], [49.0, 49.64], [55.0, 78.73], [80.0, 80.7], [83.0, 87.91], [92.0, 92.38], [95.0, 94.93], [96.0, 97.29], [98.0, 98.32], [101.0, 101.01], [104.0, 105.44], [107.0, 107.0], [112.0, 114.51], [119.0, 120.97], [122.0, 124.58], [129.0, 130.22], [135.0, 137.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 74.6, 98.51, 38.3, 0.0, 0.0, 0.0, 0.0, 0.0, 32.06, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.07, 0.0, 90.95, 0.0, 92.8], "audiomae_on_audioset": [null, null, null, null, null, [["music", 59.09], ["speech", 16.65], ["electronic music", 3.08]], null, null, null, null, null, [["music", 80.91], ["sampler", 3.0], ["drum machine", 2.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 0.76, 0.78, 3.48, 2.99, 2.74, 0.8, 1.48, 0.23, 1.37, 0.64, 23.73, 0.7, 4.91, 0.38, -0.07, 1.29, 0.32, 0.01, 1.44, 0.0, 2.51, 1.97, 2.58, 1.22, 2.51]} \ No newline at end of file diff --git a/annotations_1/6loInvUSYEM_filtered.json b/annotations_1/6loInvUSYEM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf2fcac77a4a89fe5342ab48e97f8a7a4884b8d5 --- /dev/null +++ b/annotations_1/6loInvUSYEM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 34.38], [36.0, 71.95], [78.0, 94.49], [98.0, 107.37]], "keep_status": [false, false, false, false], "silence_prob": [57.56, 0.0, 39.28, 83.52], "audiomae_on_audioset": [null, null, [["music", 79.2], ["soundtrack music", 4.93], ["electronic music", 2.13]], null], "duration": [21.38, 35.95, 16.49, 9.37]} \ No newline at end of file diff --git a/annotations_1/6moZJqA4iuc_filtered.json b/annotations_1/6moZJqA4iuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..495a142f9c23408bff6d0d613a2e6c70265c3804 --- /dev/null +++ b/annotations_1/6moZJqA4iuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.4], [16.0, 17.19], [19.0, 25.66], [28.0, 29.39], [31.0, 50.5], [51.0, 55.93], [58.0, 70.36], [72.0, 73.35], [75.0, 76.05], [78.0, 78.22], [79.0, 79.78], [80.0, 80.54], [82.0, 83.42], [84.0, 99.76], [101.0, 101.46], [103.0, 104.26], [105.0, 108.23], [108.0, 109.75], [112.0, 114.57], [116.0, 117.63], [118.0, 121.12], [122.0, 130.55], [132.0, 134.16], [135.0, 139.01], [140.0, 140.02], [141.0, 142.32], [143.0, 144.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 68.41, 0.0, 53.65, 57.01, 53.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 40.57, 0.0, 58.72, 0.0, 52.62, 55.46, 51.44, 59.15, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.18], ["rumble", 6.83], ["musical instrument", 6.05]], null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 1.19, 6.66, 1.39, 19.5, 4.93, 12.36, 1.35, 1.05, 0.22, 0.78, 0.54, 1.42, 15.76, 0.46, 1.26, 3.23, 1.75, 2.57, 1.63, 3.12, 8.55, 2.16, 4.01, 0.02, 1.32, 1.64]} \ No newline at end of file diff --git a/annotations_1/6mooNp4aWBo_filtered.json b/annotations_1/6mooNp4aWBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58da7f97ead3cda044c6dbf8be1a5baebaea9d10 --- /dev/null +++ b/annotations_1/6mooNp4aWBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.17], [14.0, 15.67], [21.0, 23.35], [25.0, 29.62], [31.0, 33.88], [34.0, 38.64], [40.0, 41.42], [44.0, 48.05], [50.0, 50.5], [51.0, 53.42], [56.0, 61.97], [65.0, 65.28], [65.0, 68.34], [69.0, 76.91], [78.0, 78.98], [81.0, 81.9], [82.0, 84.25], [86.0, 87.29], [91.0, 91.27], [92.0, 92.3], [99.0, 99.67], [101.0, 101.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [72.46, 0.0, 87.37, 84.07, 88.46, 68.28, 0.0, 82.79, 0.0, 70.02, 62.89, 0.0, 45.59, 48.23, 0.0, 0.0, 40.59, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 77.2], ["sidetone", 5.57], ["radio", 2.77]], [["speech", 44.87], ["rumble", 30.44], ["hum", 4.37]], null, null, [["speech", 46.48], ["music", 25.83], ["synthesizer", 2.53]], null, null, null, null, null], "duration": [5.17, 1.67, 2.35, 4.62, 2.88, 4.64, 1.42, 4.05, 0.5, 2.42, 5.97, 0.28, 3.34, 7.91, 0.98, 0.9, 2.25, 1.29, 0.27, 0.3, 0.67, 0.68]} \ No newline at end of file diff --git a/annotations_1/6nSu2qhTmNU_filtered.json b/annotations_1/6nSu2qhTmNU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44f778041a8794af4eb5693ac101e4438dc346e5 --- /dev/null +++ b/annotations_1/6nSu2qhTmNU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 34.77], [38.0, 67.17], [70.0, 70.51], [71.0, 81.03], [82.0, 83.15], [85.0, 88.99], [89.0, 91.94], [94.0, 116.45], [121.0, 121.24]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 35.36, 0.0, 43.98, 0.0, 36.87, 38.6, 32.84, 0.0], "audiomae_on_audioset": [null, [["theremin", 61.96], ["music", 21.26], ["synthesizer", 3.04]], null, [["music", 38.41], ["hum", 23.28], ["mains hum", 15.58]], null, [["music", 60.46], ["synthesizer", 4.48], ["electronic music", 4.21]], [["music", 50.46], ["theremin", 27.75], ["ambient music", 3.04]], [["music", 77.59], ["synthesizer", 5.49], ["musical instrument", 3.87]], null], "duration": [30.77, 29.17, 0.51, 10.03, 1.15, 3.99, 2.94, 22.45, 0.24]} \ No newline at end of file diff --git a/annotations_1/6nZJPF_VgIQ_filtered.json b/annotations_1/6nZJPF_VgIQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0714af8679ff51dcb711ce4690dfda23a7d2343d --- /dev/null +++ b/annotations_1/6nZJPF_VgIQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 26.7], [27.0, 26.99], [33.0, 33.0], [33.0, 33.12], [33.0, 34.59], [39.0, 39.93], [42.0, 44.04], [45.0, 48.46], [50.0, 50.92], [52.0, 52.25], [53.0, 53.84], [57.0, 57.77], [59.0, 59.54], [65.0, 65.1], [67.0, 68.44], [73.0, 72.69], [75.0, 74.97], [76.0, 76.99], [80.0, 80.32], [81.0, 81.06], [82.0, 82.49], [83.0, 83.64], [86.0, 87.18], [89.0, 90.1], [92.0, 94.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.33, 34.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 74.4], ["music", 5.67], ["speech synthesizer", 3.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.63], ["hum", 10.02], ["gong", 8.82]]], "duration": [-0.3, -0.01, 0.0, 0.12, 1.59, 0.93, 2.04, 3.46, 0.92, 0.25, 0.84, 0.77, 0.54, 0.1, 1.44, -0.31, -0.03, 0.99, 0.32, 0.06, 0.49, 0.64, 1.18, 1.1, 2.53]} \ No newline at end of file diff --git a/annotations_1/6nfXJd8nV9E_filtered.json b/annotations_1/6nfXJd8nV9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b596a549e58126a1174210a680af3593e217ddd5 --- /dev/null +++ b/annotations_1/6nfXJd8nV9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.07], [6.0, 6.86], [9.0, 8.8], [9.0, 9.53], [10.0, 13.95], [17.0, 17.14], [17.0, 20.22], [25.0, 25.96], [32.0, 32.16], [32.0, 33.35], [36.0, 37.5], [39.0, 41.12], [42.0, 45.84], [50.0, 55.19], [56.0, 56.42], [57.0, 59.1], [64.0, 64.39], [65.0, 71.2], [79.0, 80.97], [83.0, 83.37], [89.0, 89.45], [92.0, 130.77]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.61, 0.0, 56.1, 0.0, 0.0, 0.0, 0.0, 88.1, 94.52, 59.07, 0.0, 47.23, 0.0, 51.12, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 60.79], ["funny music", 3.87], ["electric piano", 3.18]], null, null, null, null, null, null, null, null, null, null, [["music", 55.23], ["ambient music", 4.49], ["musical instrument", 2.63]], null, null, null, null, null, null], "duration": [0.07, 0.86, -0.2, 0.53, 3.95, 0.14, 3.22, 0.96, 0.16, 1.35, 1.5, 2.12, 3.84, 5.19, 0.42, 2.1, 0.39, 6.2, 1.97, 0.37, 0.45, 38.77]} \ No newline at end of file diff --git a/annotations_1/6o8Eq0LEpf0_filtered.json b/annotations_1/6o8Eq0LEpf0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae7e2da17a45f0a9e98f399430539273f8e3d705 --- /dev/null +++ b/annotations_1/6o8Eq0LEpf0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.98], [10.0, 10.88], [12.0, 12.85], [15.0, 17.69], [19.0, 20.33], [21.0, 38.89], [39.0, 42.62], [44.0, 48.29], [49.0, 51.39], [52.0, 53.18], [54.0, 55.95], [58.0, 59.71], [64.0, 64.13], [64.0, 64.42], [65.0, 65.31], [68.0, 68.5], [69.0, 70.01], [71.0, 72.98], [74.0, 74.29], [75.0, 76.72], [82.0, 85.31], [89.0, 90.78], [93.0, 96.36], [97.0, 99.6], [100.0, 100.79], [103.0, 102.95], [104.0, 104.75], [105.0, 105.95], [107.0, 107.37], [109.0, 111.64], [112.0, 113.17], [116.0, 117.04], [118.0, 118.5], [119.0, 119.48], [122.0, 122.1], [123.0, 123.48], [125.0, 125.07], [126.0, 130.67], [131.0, 133.86], [136.0, 137.27], [138.0, 138.5], [142.0, 147.65], [152.0, 151.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 80.82, 0.0, 98.44, 83.88, 82.07, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.87, 0.0, 44.6, 58.05, 0.0, 0.0, 0.0, 0.0, 0.0, 57.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 49.45, 0.0, 0.0, 94.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 22.61], ["effects unit", 17.36], ["echo", 11.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 13.34], ["hum", 9.99], ["radio", 8.23]], null, null, null, null], "duration": [0.98, 0.88, 0.85, 2.69, 1.33, 17.89, 3.62, 4.29, 2.39, 1.18, 1.95, 1.71, 0.13, 0.42, 0.31, 0.5, 1.01, 1.98, 0.29, 1.72, 3.31, 1.78, 3.36, 2.6, 0.79, -0.05, 0.75, 0.95, 0.37, 2.64, 1.17, 1.04, 0.5, 0.48, 0.1, 0.48, 0.07, 4.67, 2.86, 1.27, 0.5, 5.65, -0.12]} \ No newline at end of file diff --git a/annotations_1/6oUzjN26DoM_filtered.json b/annotations_1/6oUzjN26DoM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d054394880f8040a9a2a7ea1876b6366755e3a9 --- /dev/null +++ b/annotations_1/6oUzjN26DoM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.16], [22.0, 22.98], [24.0, 24.21], [31.0, 32.36], [37.0, 37.08], [38.0, 38.47], [42.0, 42.42], [44.0, 45.52], [51.0, 52.12], [53.0, 55.44], [65.0, 65.52], [69.0, 69.75], [77.0, 78.24], [87.0, 87.35], [88.0, 90.86], [94.0, 97.11], [104.0, 105.24], [112.0, 112.28], [114.0, 114.15], [124.0, 125.47], [127.0, 128.38], [133.0, 134.64], [143.0, 144.78], [150.0, 152.27], [168.0, 172.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.64, 0.0, 0.0, 0.0, 0.0, 90.95, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 31.69], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 13.2], ["sine wave", 12.16], ["chirp tone", 8.02]]], "duration": [1.16, 0.98, 0.21, 1.36, 0.08, 0.47, 0.42, 1.52, 1.12, 2.44, 0.52, 0.75, 1.24, 0.35, 2.86, 3.11, 1.24, 0.28, 0.15, 1.47, 1.38, 1.64, 1.78, 2.27, 4.62]} \ No newline at end of file diff --git a/annotations_1/6oqDO7aHVFo_filtered.json b/annotations_1/6oqDO7aHVFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c2695a809716fda149ecc913eb18b0cc03ded1b --- /dev/null +++ b/annotations_1/6oqDO7aHVFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.6], [13.0, 14.34], [15.0, 15.45], [16.0, 16.23], [17.0, 17.96], [18.0, 19.04], [22.0, 22.25], [41.0, 41.03], [42.0, 42.63], [45.0, 47.68], [53.0, 53.11], [57.0, 58.72], [60.0, 61.32], [70.0, 71.15], [73.0, 73.5], [82.0, 82.75], [92.0, 92.03], [93.0, 93.65], [107.0, 107.5], [113.0, 113.97], [116.0, 116.88], [119.0, 119.4], [122.0, 124.55], [125.0, 126.42], [128.0, 131.6], [132.0, 134.65], [135.0, 137.64], [138.0, 139.46], [142.0, 144.69]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [39.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 100.0, 67.51, 49.04, 0.0, 61.47], "audiomae_on_audioset": [[["speech", 15.91], ["horse", 10.97], ["fly, housefly", 8.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.95], ["livestock, farm animals, working animals", 10.89], ["animal", 6.7]], null, null], "duration": [7.6, 1.34, 0.45, 0.23, 0.96, 1.04, 0.25, 0.03, 0.63, 2.68, 0.11, 1.72, 1.32, 1.15, 0.5, 0.75, 0.03, 0.65, 0.5, 0.97, 0.88, 0.4, 2.55, 1.42, 3.6, 2.65, 2.64, 1.46, 2.69]} \ No newline at end of file diff --git a/annotations_1/6oxCZ2CyGII_filtered.json b/annotations_1/6oxCZ2CyGII_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16aa4c26b1d7a7f7d10c4b2faa5c3b709a08a85b --- /dev/null +++ b/annotations_1/6oxCZ2CyGII_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.99], [11.0, 11.23], [21.0, 22.11], [26.0, 26.08], [30.0, 30.38], [31.0, 31.63], [34.0, 34.06], [37.0, 41.4], [44.0, 43.82], [49.0, 51.53], [53.0, 52.95], [53.0, 61.16], [64.0, 64.4], [66.0, 66.5], [70.0, 70.75], [73.0, 73.6], [76.0, 76.13], [87.0, 86.95], [88.0, 88.87], [90.0, 90.91], [93.0, 93.92], [96.0, 97.01], [98.0, 98.69], [101.0, 101.61], [102.0, 104.92], [108.0, 108.82], [109.0, 109.8], [111.0, 121.29], [122.0, 122.91], [123.0, 123.8]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.69, 0.0, 39.27, 0.0, 36.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.96, 0.0, 0.0, 91.98, 0.0, 0.0], "audiomae_on_audioset": [[["music", 46.3], ["musical instrument", 10.85], ["wind instrument, woodwind instrument", 6.63]], null, null, null, null, null, null, [["music", 58.9], ["musical instrument", 6.78], ["theremin", 6.11]], null, [["music", 34.24], ["musical instrument", 10.31], ["theremin", 5.46]], null, [["music", 58.04], ["musical instrument", 5.0], ["theremin", 4.59]], null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 39.18], ["speech", 27.53], ["radio", 13.98]], null, null, null, null, null], "duration": [4.99, 0.23, 1.11, 0.08, 0.38, 0.63, 0.06, 4.4, -0.18, 2.53, -0.05, 8.16, 0.4, 0.5, 0.75, 0.6, 0.13, -0.05, 0.87, 0.91, 0.92, 1.01, 0.69, 0.61, 2.92, 0.82, 0.8, 10.29, 0.91, 0.8]} \ No newline at end of file diff --git a/annotations_1/6p-S9nS21Wc_filtered.json b/annotations_1/6p-S9nS21Wc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de83e5e0f094b5edc4a6be7cb6c5dbf5d247b11e --- /dev/null +++ b/annotations_1/6p-S9nS21Wc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.08], [2.0, 3.57], [7.0, 14.52], [19.0, 19.35], [20.0, 20.98], [21.0, 23.75], [24.0, 26.15], [28.0, 29.24], [30.0, 32.16], [35.0, 38.21], [58.0, 61.18], [62.0, 62.56], [68.0, 69.4], [73.0, 75.03], [83.0, 85.35], [86.0, 86.88], [88.0, 88.45], [88.0, 89.46], [102.0, 108.3], [110.0, 110.49], [113.0, 113.98]], "keep_status": [false, false, true, false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 39.05, 0.0, 0.0, 37.9, 34.82, 0.0, 47.9, 49.92, 55.89, 0.0, 0.0, 31.78, 33.04, 0.0, 0.0, 0.0, 34.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 40.81], ["speech", 15.06], ["musical instrument", 3.85]], null, null, [["music", 57.27], ["speech", 13.25], ["musical instrument", 2.92]], [["music", 41.53], ["cattle, bovinae", 10.96], ["moo", 9.04]], null, [["music", 58.96], ["guitar", 5.03], ["musical instrument", 3.89]], [["music", 75.23], ["speech", 5.85], ["musical instrument", 1.98]], null, null, null, [["music", 68.38], ["boing", 5.8], ["quack", 5.75]], [["music", 53.12], ["throbbing", 6.76], ["speech", 4.85]], null, null, null, [["music", 23.14], ["livestock, farm animals, working animals", 15.21], ["cattle, bovinae", 13.43]], null, null], "duration": [0.08, 1.57, 7.52, 0.35, 0.98, 2.75, 2.15, 1.24, 2.16, 3.21, 3.18, 0.56, 1.4, 2.03, 2.35, 0.88, 0.45, 1.46, 6.3, 0.49, 0.98]} \ No newline at end of file diff --git a/annotations_1/6pUt6xlMorQ_filtered.json b/annotations_1/6pUt6xlMorQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50d5bfe36392ea96211a3035f02a9db2981215ce --- /dev/null +++ b/annotations_1/6pUt6xlMorQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 25.07], [30.0, 76.72], [80.0, 93.61], [94.0, 94.85], [96.0, 96.31], [96.0, 96.35], [96.0, 96.38], [96.0, 99.91], [101.0, 115.1], [116.0, 120.38], [124.0, 156.29], [157.0, 157.6], [158.0, 159.26], [161.0, 161.96], [162.0, 162.45], [166.0, 166.04]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [29.6, 0.0, 36.92, 0.0, 0.0, 0.0, 0.0, 33.41, 35.38, 33.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 67.94], ["musical instrument", 3.65], ["electronic music", 2.7]], null, [["speech", 50.55], ["horse", 11.68], ["clip-clop", 5.14]], null, null, null, null, [["speech", 32.82], ["music", 9.26], ["cattle, bovinae", 7.97]], [["speech", 76.27], ["vehicle", 2.75], ["eruption", 2.46]], [["speech", 55.36], ["music", 10.91], ["explosion", 4.23]], null, null, null, null, null, null], "duration": [20.07, 46.72, 13.61, 0.85, 0.31, 0.35, 0.38, 3.91, 14.1, 4.38, 32.29, 0.6, 1.26, 0.96, 0.45, 0.04]} \ No newline at end of file diff --git a/annotations_1/6puVCaR2E7M_filtered.json b/annotations_1/6puVCaR2E7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c4199ce6327c00a943d541baf22c1e844acaec7 --- /dev/null +++ b/annotations_1/6puVCaR2E7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 32.81], [33.0, 33.25], [36.0, 46.26], [47.0, 49.59], [51.0, 51.83], [53.0, 54.77], [57.0, 58.28], [60.0, 61.37], [62.0, 62.26], [63.0, 71.0], [71.0, 73.47], [74.0, 75.81], [76.0, 75.84], [78.0, 79.64], [81.0, 81.41], [83.0, 86.22], [88.0, 89.19], [90.0, 92.3], [93.0, 93.39], [94.0, 96.6], [100.0, 100.95], [102.0, 103.71], [104.0, 104.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.35, 72.46, 0.0, 0.0, 0.0, 0.0, 0.0, 56.48, 63.31, 0.0, 0.0, 0.0, 0.0, 68.41, 0.0, 65.79, 0.0, 34.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 35.62], ["hum", 22.48], ["mains hum", 16.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.54], ["rumble", 13.09], ["gasp", 5.83]], null, null, null], "duration": [-0.19, 0.25, 10.26, 2.59, 0.83, 1.77, 1.28, 1.37, 0.26, 8.0, 2.47, 1.81, -0.16, 1.64, 0.41, 3.22, 1.19, 2.3, 0.39, 2.6, 0.95, 1.71, 0.9]} \ No newline at end of file diff --git a/annotations_1/6q2aPotJP7w_filtered.json b/annotations_1/6q2aPotJP7w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f58182731261e60a7bef838b58d157377c35c19e --- /dev/null +++ b/annotations_1/6q2aPotJP7w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.05], [6.0, 10.77], [12.0, 48.0], [51.0, 50.85], [58.0, 59.27], [63.0, 67.02], [68.0, 68.47], [70.0, 81.08], [85.0, 86.04], [114.0, 115.69], [117.0, 118.0], [129.0, 136.71], [138.0, 139.92], [145.0, 145.4], [148.0, 149.4], [149.0, 149.47], [150.0, 150.63], [151.0, 151.11], [151.0, 151.26], [152.0, 151.87], [154.0, 153.69]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.22, 0.0, 0.0, 0.0, 34.09, 0.0, 31.39, 0.0, 0.0, 0.0, 31.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 28.32], ["speech", 21.16], ["boing", 13.56]], null, null, null, [["sidetone", 49.94], ["speech", 14.07], ["noise", 8.1]], null, [["music", 27.94], ["cattle, bovinae", 16.56], ["moo", 15.68]], null, null, null, [["music", 40.45], ["speech", 12.4], ["electronic music", 7.84]], null, null, null, null, null, null, null, null, null], "duration": [0.05, 4.77, 36.0, -0.15, 1.27, 4.02, 0.47, 11.08, 1.04, 1.69, 1.0, 7.71, 1.92, 0.4, 1.4, 0.47, 0.63, 0.11, 0.26, -0.13, -0.31]} \ No newline at end of file diff --git a/annotations_1/6qZZWAScCn8_filtered.json b/annotations_1/6qZZWAScCn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d88a55efebf9b7d5cf0b6f3f968bba81d0259150 --- /dev/null +++ b/annotations_1/6qZZWAScCn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.44], [4.0, 8.06], [9.0, 11.26], [13.0, 15.26], [26.0, 26.5], [28.0, 30.03], [33.0, 35.88], [37.0, 38.69], [40.0, 44.32], [52.0, 53.13], [57.0, 59.44], [60.0, 60.61], [62.0, 62.9], [64.0, 65.87], [68.0, 68.71], [77.0, 86.17], [88.0, 89.28], [96.0, 97.04], [102.0, 109.66], [120.0, 120.58], [125.0, 133.12], [140.0, 141.47], [143.0, 149.03], [151.0, 151.48], [158.0, 159.24], [161.0, 161.62], [162.0, 165.2], [168.0, 169.03], [173.0, 173.84], [177.0, 182.85], [183.0, 186.16], [187.0, 188.92], [194.0, 200.06], [200.0, 200.16], [200.0, 201.65], [205.0, 207.79], [212.0, 213.43], [217.0, 218.83], [221.0, 223.03], [225.0, 227.35], [228.0, 236.36], [239.0, 241.76], [254.0, 255.61], [259.0, 260.07], [267.0, 267.33], [285.0, 289.36], [290.0, 290.98]], "keep_status": [false, true, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 30.3, 29.58, 29.68, 0.0, 29.78, 30.22, 0.0, 29.96, 0.0, 31.66, 0.0, 0.0, 0.0, 0.0, 30.44, 0.0, 0.0, 28.83, 0.0, 29.37, 0.0, 35.47, 0.0, 0.0, 0.0, 38.02, 0.0, 0.0, 30.03, 29.95, 0.0, 30.43, 0.0, 0.0, 29.85, 0.0, 0.0, 32.05, 34.2, 31.02, 34.36, 0.0, 0.0, 0.0, 28.33, 0.0], "audiomae_on_audioset": [null, [["music", 41.07], ["hum", 7.9], ["throbbing", 7.25]], [["music", 22.11], ["fly, housefly", 16.59], ["insect", 9.79]], [["music", 78.08], ["throbbing", 4.53], ["didgeridoo", 2.14]], null, [["music", 61.38], ["speech", 4.45], ["angry music", 3.44]], [["music", 46.95], ["throbbing", 18.44], ["hum", 12.28]], null, [["music", 72.02], ["throbbing", 5.66], ["didgeridoo", 1.62]], null, [["music", 56.23], ["vehicle", 2.33], ["soundtrack music", 1.82]], null, null, null, null, [["hum", 37.02], ["mains hum", 22.45], ["music", 16.39]], null, null, [["hum", 20.44], ["buzz", 17.54], ["mains hum", 15.84]], null, [["music", 21.36], ["hum", 12.6], ["fly, housefly", 10.63]], null, [["fly, housefly", 12.15], ["bee, wasp, etc.", 11.29], ["buzz", 8.41]], null, null, null, [["speech", 30.45], ["bee, wasp, etc.", 20.6], ["fly, housefly", 18.21]], null, null, [["music", 76.9], ["ambient music", 10.74], ["synthesizer", 2.17]], [["music", 64.56], ["ambient music", 19.86], ["new-age music", 3.51]], null, [["music", 79.59], ["ambient music", 5.84], ["scary music", 4.59]], null, null, [["music", 58.53], ["scary music", 9.9], ["ambient music", 8.14]], null, null, [["music", 47.57], ["ambient music", 30.37], ["new-age music", 2.85]], [["music", 59.69], ["ambient music", 9.93], ["synthesizer", 7.29]], [["music", 48.59], ["fly, housefly", 9.48], ["insect", 4.12]], [["applause", 37.28], ["speech", 24.79], ["crowd", 19.27]], null, null, null, [["crowd", 33.46], ["cheering", 26.02], ["music", 5.86]], null], "duration": [1.44, 4.06, 2.26, 2.26, 0.5, 2.03, 2.88, 1.69, 4.32, 1.13, 2.44, 0.61, 0.9, 1.87, 0.71, 9.17, 1.28, 1.04, 7.66, 0.58, 8.12, 1.47, 6.03, 0.48, 1.24, 0.62, 3.2, 1.03, 0.84, 5.85, 3.16, 1.92, 6.06, 0.16, 1.65, 2.79, 1.43, 1.83, 2.03, 2.35, 8.36, 2.76, 1.61, 1.07, 0.33, 4.36, 0.98]} \ No newline at end of file diff --git a/annotations_1/6qxQ2l1DC6Y_filtered.json b/annotations_1/6qxQ2l1DC6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52c765228d51cfaf3757b2433c9451f31cc2901a --- /dev/null +++ b/annotations_1/6qxQ2l1DC6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.27], [11.0, 13.42], [18.0, 19.52], [23.0, 24.27], [26.0, 26.5], [28.0, 49.5], [54.0, 54.16], [56.0, 82.95], [87.0, 89.04], [96.0, 120.09], [121.0, 123.21], [124.0, 126.62], [127.0, 129.83], [131.0, 134.03], [137.0, 138.03], [143.0, 145.81], [148.0, 148.22], [149.0, 151.12], [152.0, 154.58], [156.0, 157.64], [159.0, 159.83], [161.0, 165.59], [168.0, 168.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.62, 99.95, 0.0, 0.0, 0.0, 87.92, 0.0, 73.97, 75.07, 99.16, 99.88, 99.4, 92.15, 98.01, 0.0, 93.6, 0.0, 97.83, 98.86, 0.0, 0.0, 88.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.27, 2.42, 1.52, 1.27, 0.5, 21.5, 0.16, 26.95, 2.04, 24.09, 2.21, 2.62, 2.83, 3.03, 1.03, 2.81, 0.22, 2.12, 2.58, 1.64, 0.83, 4.59, 0.51]} \ No newline at end of file diff --git a/annotations_1/6rDCHgWk7dI_filtered.json b/annotations_1/6rDCHgWk7dI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4ba863656608158cf979439763c53ca6578fa1a --- /dev/null +++ b/annotations_1/6rDCHgWk7dI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 42.65], [43.0, 64.1], [65.0, 69.04], [71.0, 119.38], [120.0, 130.69], [132.0, 171.98]], "keep_status": [false, false, false, false, false, false], "silence_prob": [77.7, 77.7, 83.16, 0.0, 64.75, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [13.65, 21.1, 4.04, 48.38, 10.69, 39.98]} \ No newline at end of file diff --git a/annotations_1/6rGBqovePfY_filtered.json b/annotations_1/6rGBqovePfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e7eaf99be348adc5b3fd852fd79ab5d2d15c4f4 --- /dev/null +++ b/annotations_1/6rGBqovePfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 20.24], [21.0, 23.09], [25.0, 24.88], [26.0, 28.61], [31.0, 32.44], [33.0, 43.93], [46.0, 63.75], [65.0, 85.85], [87.0, 87.56], [89.0, 96.26], [97.0, 99.52], [101.0, 105.71], [106.0, 113.19], [118.0, 133.96], [135.0, 137.15], [138.0, 138.23], [139.0, 140.39], [147.0, 148.54], [153.0, 154.84], [160.0, 163.56], [164.0, 168.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 99.98, 0.0, 100.0, 0.0, 100.0, 100.0, 90.43, 0.0, 53.34, 100.0, 100.0, 99.91, 89.01, 100.0, 0.0, 0.0, 0.0, 0.0, 90.25, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.24, 2.09, -0.12, 2.61, 1.44, 10.93, 17.75, 20.85, 0.56, 7.26, 2.52, 4.71, 7.19, 15.96, 2.15, 0.23, 1.39, 1.54, 1.84, 3.56, 4.07]} \ No newline at end of file diff --git a/annotations_1/6rHHZ3hiwcQ_filtered.json b/annotations_1/6rHHZ3hiwcQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5c88088b2f3b9c3375084a5e54a6951c5500748 --- /dev/null +++ b/annotations_1/6rHHZ3hiwcQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.15], [10.0, 14.94], [20.0, 20.26], [24.0, 26.62], [37.0, 37.34], [41.0, 42.43], [46.0, 47.53], [49.0, 52.02], [55.0, 56.07], [69.0, 69.72], [73.0, 73.28], [75.0, 79.68], [82.0, 82.95], [84.0, 86.14], [110.0, 111.67], [115.0, 115.48], [116.0, 119.11], [120.0, 121.14], [123.0, 123.15], [124.0, 124.44], [125.0, 124.75], [126.0, 128.04], [134.0, 135.36], [140.0, 141.54], [143.0, 144.15], [145.0, 146.21], [151.0, 151.71], [152.0, 153.72], [154.0, 156.49], [180.0, 180.25]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.89, 0.0, 29.61, 0.0, 0.0, 0.0, 50.31, 0.0, 0.0, 0.0, 42.08, 0.0, 38.72, 0.0, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0, 34.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.74, 0.0], "audiomae_on_audioset": [null, [["music", 53.35], ["didgeridoo", 25.91], ["singing", 3.47]], null, [["music", 39.36], ["didgeridoo", 20.94], ["musical instrument", 8.98]], null, null, null, null, null, null, null, [["music", 68.27], ["didgeridoo", 5.08], ["singing", 3.37]], null, [["speech", 34.86], ["music", 31.42], ["didgeridoo", 6.72]], null, null, null, null, null, null, null, [["music", 31.99], ["speech", 25.19], ["didgeridoo", 2.51]], null, null, null, null, null, null, [["music", 45.22], ["speech", 19.42], ["didgeridoo", 10.36]], null], "duration": [0.15, 4.94, 0.26, 2.62, 0.34, 1.43, 1.53, 3.02, 1.07, 0.72, 0.28, 4.68, 0.95, 2.14, 1.67, 0.48, 3.11, 1.14, 0.15, 0.44, -0.25, 2.04, 1.36, 1.54, 1.15, 1.21, 0.71, 1.72, 2.49, 0.25]} \ No newline at end of file diff --git a/annotations_1/6rVFFaIyfH0_filtered.json b/annotations_1/6rVFFaIyfH0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b980215e5b0963524dee9395c7fa0f898c1d260 --- /dev/null +++ b/annotations_1/6rVFFaIyfH0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.3], [4.0, 6.03], [8.0, 8.26], [9.0, 10.57], [15.0, 17.14], [26.0, 26.35], [34.0, 34.86], [39.0, 40.27], [43.0, 43.61], [50.0, 50.72], [53.0, 53.87], [56.0, 60.84], [62.0, 63.41], [65.0, 67.2], [69.0, 74.06], [75.0, 77.89], [79.0, 80.84], [81.0, 83.57], [92.0, 93.72], [95.0, 98.93], [102.0, 103.94], [104.0, 109.58], [111.0, 120.56], [123.0, 126.27], [129.0, 138.54], [142.0, 143.09], [148.0, 149.18], [151.0, 152.29], [154.0, 159.11], [160.0, 167.1], [168.0, 170.01], [172.0, 177.84], [180.0, 180.76]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 75.72, 0.0, 0.0, 42.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.47, 0.0, 95.37, 80.64, 90.25, 0.0, 50.36, 0.0, 89.54, 0.0, 75.72, 37.95, 64.63, 45.75, 0.0, 0.0, 0.0, 76.86, 62.37, 49.82, 73.67, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 36.16], ["music", 19.35], ["hum", 8.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.82], ["theremin", 5.03], ["scary music", 4.25]], null, [["music", 61.39], ["theremin", 13.3], ["synthesizer", 4.37]], null, null, null, null, null, [["music", 48.48], ["speech", 19.45], ["singing bowl", 4.58]], null, null], "duration": [1.3, 2.03, 0.26, 1.57, 2.14, 0.35, 0.86, 1.27, 0.61, 0.72, 0.87, 4.84, 1.41, 2.2, 5.06, 2.89, 1.84, 2.57, 1.72, 3.93, 1.94, 5.58, 9.56, 3.27, 9.54, 1.09, 1.18, 1.29, 5.11, 7.1, 2.01, 5.84, 0.76]} \ No newline at end of file diff --git a/annotations_1/6sfgXGPtVQk_filtered.json b/annotations_1/6sfgXGPtVQk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b434c3fa1ce2a61809d5e62c84b8556279a8a197 --- /dev/null +++ b/annotations_1/6sfgXGPtVQk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 41.28], [43.0, 43.97], [45.0, 45.69], [46.0, 47.14], [50.0, 50.04], [51.0, 59.58], [64.0, 66.87], [68.0, 68.59], [69.0, 69.53], [70.0, 70.16], [71.0, 71.85], [75.0, 78.53], [81.0, 81.65], [82.0, 82.9], [84.0, 84.62], [86.0, 86.75], [87.0, 88.05], [89.0, 89.53], [92.0, 98.69], [101.0, 101.73]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 45.24, 96.89, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 27.31], ["speech", 24.51], ["clip-clop", 4.2]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.12], ["fart", 5.89], ["noise", 3.51]], null], "duration": [0.28, 0.97, 0.69, 1.14, 0.04, 8.58, 2.87, 0.59, 0.53, 0.16, 0.85, 3.53, 0.65, 0.9, 0.62, 0.75, 1.05, 0.53, 6.69, 0.73]} \ No newline at end of file diff --git a/annotations_1/6tVC53rH37g_filtered.json b/annotations_1/6tVC53rH37g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fab140c9a25a26a222be6de6875a922d50bf00cc --- /dev/null +++ b/annotations_1/6tVC53rH37g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.44], [3.0, 4.24], [6.0, 6.49], [36.0, 36.69], [47.0, 48.69], [58.0, 58.99], [66.0, 66.53], [78.0, 77.8], [84.0, 85.06], [94.0, 94.15], [106.0, 110.13], [112.0, 112.63], [118.0, 118.67], [121.0, 120.88], [125.0, 125.09], [128.0, 128.63], [133.0, 133.56], [142.0, 142.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 42.85], ["livestock, farm animals, working animals", 35.47], ["moo", 17.58]], null, null, null, null, null, null, null], "duration": [0.44, 1.24, 0.49, 0.69, 1.69, 0.99, 0.53, -0.2, 1.06, 0.15, 4.13, 0.63, 0.67, -0.12, 0.09, 0.63, 0.56, 0.48]} \ No newline at end of file diff --git a/annotations_1/6vAYIYN2Iac_filtered.json b/annotations_1/6vAYIYN2Iac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22e53e5f45469346d45852727e529da30d6ec43e --- /dev/null +++ b/annotations_1/6vAYIYN2Iac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[103.0, 139.53], [143.0, 186.93], [189.0, 190.66]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [36.53, 43.93, 1.66]} \ No newline at end of file diff --git a/annotations_1/6w4Chzgna0c_filtered.json b/annotations_1/6w4Chzgna0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8ae7bda059de8f526c99dbe0841844c5ed4d195 --- /dev/null +++ b/annotations_1/6w4Chzgna0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.66], [7.0, 37.3], [39.0, 40.74], [45.0, 130.94], [131.0, 131.01], [132.0, 141.83]], "keep_status": [false, false, false, false, false, true], "silence_prob": [72.9, 0.0, 0.0, 0.0, 0.0, 34.52], "audiomae_on_audioset": [null, null, null, null, null, [["music", 33.2], ["hum", 11.66], ["throbbing", 5.06]]], "duration": [4.66, 30.3, 1.74, 85.94, 0.01, 9.83]} \ No newline at end of file diff --git a/annotations_1/6w5n1TfIFjk_filtered.json b/annotations_1/6w5n1TfIFjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b94e3d3051593662e772b925814a023e5d74cc33 --- /dev/null +++ b/annotations_1/6w5n1TfIFjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.54], [6.0, 7.16], [8.0, 10.25], [13.0, 14.22], [16.0, 16.12], [22.0, 23.43], [27.0, 29.03], [32.0, 48.07], [53.0, 75.54], [76.0, 78.0], [79.0, 80.35], [81.0, 92.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.97, 52.39, 45.46, 38.78, 0.0, 39.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 54.07], ["theremin", 29.73], ["musical instrument", 1.47]], [["music", 57.73], ["theremin", 9.4], ["speech", 5.71]], null, [["music", 41.13], ["speech", 16.47], ["theremin", 6.32]]], "duration": [1.54, 1.16, 2.25, 1.22, 0.12, 1.43, 2.03, 16.07, 22.54, 2.0, 1.35, 11.69]} \ No newline at end of file diff --git a/annotations_1/6wXeUrZ6p5E_filtered.json b/annotations_1/6wXeUrZ6p5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f47ae422a87c1f4230980150a33ef175e2f13b81 --- /dev/null +++ b/annotations_1/6wXeUrZ6p5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.81], [15.0, 15.84], [22.0, 27.24], [30.0, 30.33], [31.0, 38.01], [39.0, 64.64], [67.0, 76.32], [83.0, 101.83], [102.0, 109.75], [111.0, 126.42], [131.0, 131.48], [132.0, 140.27], [143.0, 178.38]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.02, 0.0, 32.14, 30.02, 29.93, 30.65, 31.73, 30.26, 0.0, 30.51, 0.0], "audiomae_on_audioset": [null, null, [["whack, thwack", 52.25], ["speech", 15.87], ["breaking", 13.23]], null, [["speech", 73.75], ["whack, thwack", 7.78], ["fart", 4.64]], [["breaking", 50.66], ["smash, crash", 13.99], ["speech", 11.21]], [["breaking", 31.38], ["whack, thwack", 16.2], ["smash, crash", 10.37]], [["breaking", 31.85], ["whack, thwack", 26.94], ["smash, crash", 14.9]], [["whack, thwack", 74.48], ["speech", 5.18], ["slap, smack", 4.71]], [["speech", 37.98], ["breaking", 25.78], ["whack, thwack", 21.82]], null, [["speech", 47.89], ["breaking", 20.23], ["whack, thwack", 4.86]], null], "duration": [-0.19, 0.84, 5.24, 0.33, 7.01, 25.64, 9.32, 18.83, 7.75, 15.42, 0.48, 8.27, 35.38]} \ No newline at end of file diff --git a/annotations_1/6wyRTKGY2Tw_filtered.json b/annotations_1/6wyRTKGY2Tw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1f0a5215a07a0e68a4bd785a1b94578aae24e2b --- /dev/null +++ b/annotations_1/6wyRTKGY2Tw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.47], [7.0, 18.5], [19.0, 37.96], [38.0, 42.72], [43.0, 43.29], [45.0, 46.01], [47.0, 49.76], [53.0, 53.45], [55.0, 54.75], [55.0, 60.42], [66.0, 67.73], [68.0, 88.47], [91.0, 92.03], [95.0, 96.77], [104.0, 106.25], [108.0, 110.42], [113.0, 117.32], [120.0, 128.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 100.0, 99.26, 0.0, 0.0, 99.84, 0.0, 0.0, 100.0, 0.0, 99.97, 0.0, 0.0, 99.59, 99.36, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.47, 11.5, 18.96, 4.72, 0.29, 1.01, 2.76, 0.45, -0.25, 5.42, 1.73, 20.47, 1.03, 1.77, 2.25, 2.42, 4.32, 8.61]} \ No newline at end of file diff --git a/annotations_1/6x0i-FfeA44_filtered.json b/annotations_1/6x0i-FfeA44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b58e7d613738de33fe5444987323ffe363bbcb3 --- /dev/null +++ b/annotations_1/6x0i-FfeA44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.23], [7.0, 12.12], [13.0, 14.12], [16.0, 24.9], [26.0, 26.64], [30.0, 30.69], [32.0, 32.24], [35.0, 35.53], [36.0, 36.98], [46.0, 45.86], [50.0, 50.36], [52.0, 53.96], [55.0, 54.89], [58.0, 58.35], [61.0, 61.11], [63.0, 63.54], [68.0, 68.66], [70.0, 70.36], [74.0, 73.85], [79.0, 78.7], [80.0, 80.23], [81.0, 83.19], [84.0, 84.42], [87.0, 88.21], [88.0, 88.97], [89.0, 90.58], [94.0, 95.77], [97.0, 97.8], [99.0, 99.44], [102.0, 105.49], [106.0, 105.95], [106.0, 110.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.18, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.63, 0.0, 50.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 5.12, 1.12, 8.9, 0.64, 0.69, 0.24, 0.53, 0.98, -0.14, 0.36, 1.96, -0.11, 0.35, 0.11, 0.54, 0.66, 0.36, -0.15, -0.3, 0.23, 2.19, 0.42, 1.21, 0.97, 1.58, 1.77, 0.8, 0.44, 3.49, -0.05, 4.05]} \ No newline at end of file diff --git a/annotations_1/6xCIhFtDtx0_filtered.json b/annotations_1/6xCIhFtDtx0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d40aa0c5fc9302f4c905382275f342e4646ef0e0 --- /dev/null +++ b/annotations_1/6xCIhFtDtx0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.97], [12.0, 12.02], [13.0, 13.41], [13.0, 17.15], [18.0, 21.44], [26.0, 27.28], [28.0, 29.08], [31.0, 39.29], [40.0, 42.55], [43.0, 45.28], [48.0, 52.22], [54.0, 54.04], [55.0, 62.28], [63.0, 67.26], [73.0, 74.63], [75.0, 77.31], [78.0, 86.66], [89.0, 90.64], [92.0, 93.73], [97.0, 101.02], [101.0, 101.55], [106.0, 109.9], [115.0, 120.43], [126.0, 127.79], [128.0, 134.81], [140.0, 143.99], [146.0, 149.34], [151.0, 153.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [80.46, 0.0, 0.0, 37.96, 59.86, 0.0, 0.0, 97.92, 81.53, 76.2, 93.91, 0.0, 86.09, 85.35, 0.0, 91.13, 92.64, 0.0, 0.0, 53.59, 0.0, 66.15, 92.48, 0.0, 60.98, 79.41, 79.07, 65.91], "audiomae_on_audioset": [null, null, null, [["music", 48.19], ["gong", 16.75], ["electronic music", 11.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.97, 0.02, 0.41, 4.15, 3.44, 1.28, 1.08, 8.29, 2.55, 2.28, 4.22, 0.04, 7.28, 4.26, 1.63, 2.31, 8.66, 1.64, 1.73, 4.02, 0.55, 3.9, 5.43, 1.79, 6.81, 3.99, 3.34, 2.99]} \ No newline at end of file diff --git a/annotations_1/6xmaoTphmLY_filtered.json b/annotations_1/6xmaoTphmLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8e5f642504008e0eb26d4105c701a834d82dd69 --- /dev/null +++ b/annotations_1/6xmaoTphmLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.36], [35.0, 36.07], [42.0, 42.82], [44.0, 48.41], [50.0, 52.95], [57.0, 57.47], [59.0, 61.05], [62.0, 63.24], [64.0, 128.14], [129.0, 129.51]], "keep_status": [false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.44, 36.56, 0.0, 78.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 20.8], ["music", 14.49], ["vehicle", 4.27]], [["music", 25.9], ["noise", 16.48], ["hum", 13.06]], null, null, null, null, null], "duration": [0.36, 1.07, 0.82, 4.41, 2.95, 0.47, 2.05, 1.24, 64.14, 0.51]} \ No newline at end of file diff --git a/annotations_1/6ya9GVSPiXs_filtered.json b/annotations_1/6ya9GVSPiXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00ea5cf5471b7b02384fa43bc5390eaf24e6c2de --- /dev/null +++ b/annotations_1/6ya9GVSPiXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[102.0, 102.61], [105.0, 106.56], [112.0, 112.77], [121.0, 123.6], [127.0, 128.97], [129.0, 130.91], [136.0, 137.35], [138.0, 140.51], [143.0, 146.94], [152.0, 152.42], [153.0, 164.94], [170.0, 171.68], [174.0, 174.93]], "keep_status": [false, false, false, true, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.62, 0.0, 0.0, 0.0, 41.83, 45.11, 0.0, 32.51, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 30.6], ["hum", 13.45], ["mains hum", 6.84]], null, null, null, [["mains hum", 14.21], ["hum", 10.68], ["music", 7.51]], [["music", 59.84], ["electronic music", 4.88], ["synthesizer", 4.8]], null, [["music", 49.39], ["throbbing", 15.47], ["hum", 11.93]], null, null], "duration": [0.61, 1.56, 0.77, 2.6, 1.97, 1.91, 1.35, 2.51, 3.94, 0.42, 11.94, 1.68, 0.93]} \ No newline at end of file diff --git a/annotations_1/6zfXkQ5QkrE_filtered.json b/annotations_1/6zfXkQ5QkrE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70ee7d51c1890869bb18dbfe5f0d546babbd8f8d --- /dev/null +++ b/annotations_1/6zfXkQ5QkrE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.39], [7.0, 7.92], [9.0, 9.66], [12.0, 12.04], [13.0, 13.91], [17.0, 18.96], [23.0, 23.95], [25.0, 26.28], [28.0, 28.26], [31.0, 31.21], [32.0, 33.13], [34.0, 34.25], [38.0, 38.97], [41.0, 43.46], [46.0, 45.98], [47.0, 47.88], [50.0, 50.36], [52.0, 52.74], [56.0, 56.02], [63.0, 62.95], [64.0, 64.39], [66.0, 66.83], [68.0, 68.52], [69.0, 69.65], [74.0, 74.73], [76.0, 76.08], [80.0, 79.93], [83.0, 83.78], [85.0, 85.56], [88.0, 88.48], [90.0, 90.85], [93.0, 93.9], [95.0, 96.16], [98.0, 98.31], [102.0, 102.05], [107.0, 108.97], [112.0, 113.09], [114.0, 114.56], [116.0, 116.65], [118.0, 118.64], [119.0, 119.8], [121.0, 122.23], [126.0, 126.66], [131.0, 131.6], [133.0, 133.96], [150.0, 150.65], [153.0, 152.86], [154.0, 158.06], [159.0, 174.87], [176.0, 178.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.99, 99.65], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 0.92, 0.66, 0.04, 0.91, 1.96, 0.95, 1.28, 0.26, 0.21, 1.13, 0.25, 0.97, 2.46, -0.02, 0.88, 0.36, 0.74, 0.02, -0.05, 0.39, 0.83, 0.52, 0.65, 0.73, 0.08, -0.07, 0.78, 0.56, 0.48, 0.85, 0.9, 1.16, 0.31, 0.05, 1.97, 1.09, 0.56, 0.65, 0.64, 0.8, 1.23, 0.66, 0.6, 0.96, 0.65, -0.14, 4.06, 15.87, 2.66]} \ No newline at end of file diff --git a/annotations_1/6zx4HGKU2E4_filtered.json b/annotations_1/6zx4HGKU2E4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33b1c015975008bc59aa710b6a1484754300b869 --- /dev/null +++ b/annotations_1/6zx4HGKU2E4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 45.39], [46.0, 47.6], [48.0, 73.14], [75.0, 76.92]], "keep_status": [false, false, false, false], "silence_prob": [42.79, 0.0, 70.86, 0.0], "audiomae_on_audioset": [[["music", 40.46], ["didgeridoo", 17.92], ["theremin", 11.84]], null, null, null], "duration": [2.39, 1.6, 25.14, 1.92]} \ No newline at end of file diff --git a/annotations_1/7-5kYQLJnFw_filtered.json b/annotations_1/7-5kYQLJnFw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5711e03ab373bd505c5cf7f55c3ecbeb4285cae --- /dev/null +++ b/annotations_1/7-5kYQLJnFw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.21], [9.0, 13.26], [17.0, 20.02], [21.0, 22.15], [23.0, 24.34], [28.0, 29.61], [31.0, 32.46], [38.0, 38.77], [39.0, 39.83], [49.0, 49.22], [55.0, 54.85], [68.0, 68.17], [69.0, 70.14], [71.0, 73.67], [75.0, 78.12], [82.0, 82.38], [84.0, 84.5], [85.0, 84.54], [88.0, 99.06], [101.0, 102.0], [104.0, 110.81], [120.0, 120.04], [126.0, 128.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 70.86, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 63.85, 0.0, 0.0, 0.0, 30.78, 0.0, 33.4, 0.0, 51.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.99], ["musical instrument", 5.98], ["theremin", 3.49]], null, [["music", 38.95], ["didgeridoo", 35.63], ["musical instrument", 8.58]], null, null], "duration": [1.21, 4.26, 3.02, 1.15, 1.34, 1.61, 1.46, 0.77, 0.83, 0.22, -0.15, 0.17, 1.14, 2.67, 3.12, 0.38, 0.5, -0.46, 11.06, 1.0, 6.81, 0.04, 2.36]} \ No newline at end of file diff --git a/annotations_1/7-H5Yu3_Py8_filtered.json b/annotations_1/7-H5Yu3_Py8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d86fc8a5e2629d7a4bf065b03e428aa3dfca116 --- /dev/null +++ b/annotations_1/7-H5Yu3_Py8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [1.0, 1.0], [1.0, 1.11], [27.0, 27.13], [38.0, 38.18], [45.0, 45.06], [48.0, 48.19], [72.0, 78.71], [91.0, 91.47], [93.0, 93.55], [94.0, 94.9], [97.0, 103.11], [105.0, 105.68], [108.0, 107.97], [113.0, 112.78], [119.0, 120.11], [123.0, 124.34], [126.0, 126.45], [131.0, 137.19], [138.0, 165.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.27, 0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 52.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.0, 0.11, 0.13, 0.18, 0.06, 0.19, 6.71, 0.47, 0.55, 0.9, 6.11, 0.68, -0.03, -0.22, 1.11, 1.34, 0.45, 6.19, 27.72]} \ No newline at end of file diff --git a/annotations_1/7-TZCEyok_o_filtered.json b/annotations_1/7-TZCEyok_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1a30744ce325414cb7d789370d341c86b58d17c --- /dev/null +++ b/annotations_1/7-TZCEyok_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[78.0, 78.24], [79.0, 90.39], [94.0, 173.52]], "keep_status": [false, false, false], "silence_prob": [0.0, 33.48, 0.0], "audiomae_on_audioset": [null, [["hum", 52.85], ["mains hum", 17.4], ["throbbing", 11.9]], null], "duration": [0.24, 11.39, 79.52]} \ No newline at end of file diff --git a/annotations_1/7014C_6ABAg_filtered.json b/annotations_1/7014C_6ABAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77bc6c7d303c1525056962aa2a701fe95c8469e7 --- /dev/null +++ b/annotations_1/7014C_6ABAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.82], [26.0, 26.37], [29.0, 30.79], [33.0, 33.32], [35.0, 35.8], [42.0, 42.58], [44.0, 44.04], [47.0, 48.03], [54.0, 54.26], [63.0, 67.66], [69.0, 69.31], [72.0, 73.97], [75.0, 75.81], [78.0, 79.62], [81.0, 81.3], [83.0, 82.95], [85.0, 86.32], [97.0, 98.46], [103.0, 104.57], [107.0, 108.03], [110.0, 113.98], [117.0, 118.15], [120.0, 120.5], [122.0, 122.35], [125.0, 125.29], [128.0, 130.35], [131.0, 133.3], [134.0, 137.19], [139.0, 143.85], [144.0, 153.59], [155.0, 166.21], [167.0, 173.47], [177.0, 178.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 83.34, 32.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.9], ["foghorn", 14.07], ["musical instrument", 4.15]], null], "duration": [0.82, 0.37, 1.79, 0.32, 0.8, 0.58, 0.04, 1.03, 0.26, 4.66, 0.31, 1.97, 0.81, 1.62, 0.3, -0.05, 1.32, 1.46, 1.57, 1.03, 3.98, 1.15, 0.5, 0.35, 0.29, 2.35, 2.3, 3.19, 4.85, 9.59, 11.21, 6.47, 1.73]} \ No newline at end of file diff --git a/annotations_1/70eKt79PSQw_filtered.json b/annotations_1/70eKt79PSQw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7f6e68af7c5a0bcbfde918aee06dc820be54a9d --- /dev/null +++ b/annotations_1/70eKt79PSQw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.21], [9.0, 8.72], [13.0, 13.71], [22.0, 23.01], [23.0, 23.77], [24.0, 25.37], [26.0, 30.59], [32.0, 40.41], [42.0, 45.35], [46.0, 47.31], [50.0, 56.02], [56.0, 56.24], [56.0, 66.48], [67.0, 71.98], [74.0, 75.81], [77.0, 82.81], [84.0, 87.25], [88.0, 89.29], [91.0, 120.9], [122.0, 122.74], [124.0, 125.05], [127.0, 127.48], [128.0, 127.75], [128.0, 129.46], [130.0, 130.4]], "keep_status": [false, false, false, false, false, false, false, true, true, false, true, false, true, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.39, 49.04, 46.75, 0.0, 36.11, 0.0, 49.54, 51.94, 0.0, 53.91, 66.27, 0.0, 33.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 27.98], ["music", 10.76], ["mains hum", 9.11]], [["speech", 24.26], ["music", 23.14], ["hum", 15.23]], null, [["music", 28.83], ["hum", 17.96], ["speech", 10.55]], null, [["hum", 32.6], ["music", 16.53], ["throbbing", 11.3]], null, null, null, null, null, [["music", 27.38], ["didgeridoo", 25.33], ["buzz", 7.77]], null, null, null, null, null, null], "duration": [0.21, -0.28, 0.71, 1.01, 0.77, 1.37, 4.59, 8.41, 3.35, 1.31, 6.02, 0.24, 10.48, 4.98, 1.81, 5.81, 3.25, 1.29, 29.9, 0.74, 1.05, 0.48, -0.25, 1.46, 0.4]} \ No newline at end of file diff --git a/annotations_1/70tY44WxygM_filtered.json b/annotations_1/70tY44WxygM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8343f2d1a53ca4482662eb3786e87b6f7894960 --- /dev/null +++ b/annotations_1/70tY44WxygM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.6], [6.0, 10.4], [10.0, 10.44], [12.0, 15.33], [16.0, 20.21], [28.0, 28.92], [31.0, 33.94], [45.0, 45.59], [57.0, 59.64], [60.0, 60.17], [66.0, 69.38], [86.0, 86.31], [90.0, 91.56], [92.0, 93.07], [96.0, 97.77], [99.0, 104.28], [105.0, 110.52], [113.0, 114.05], [120.0, 121.41], [129.0, 132.44], [141.0, 148.46], [149.0, 149.47], [152.0, 159.44], [164.0, 166.43], [167.0, 175.95], [177.0, 178.04]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 31.41, 0.0, 32.78, 81.0, 0.0, 33.23, 0.0, 36.61, 0.0, 42.42, 0.0, 0.0, 0.0, 0.0, 35.87, 32.02, 0.0, 0.0, 32.75, 36.34, 0.0, 29.81, 34.16, 32.14, 0.0], "audiomae_on_audioset": [null, [["speech", 82.95], ["sidetone", 7.06], ["radio", 2.1]], null, [["speech", 90.86], ["speech synthesizer", 3.1], ["male speech, man speaking", 1.19]], null, null, [["speech", 67.35], ["sidetone", 8.43], ["radio", 7.41]], null, [["frog", 45.35], ["croak", 12.1], ["burping, eructation", 4.33]], null, [["speech", 15.16], ["gong", 10.9], ["hum", 10.28]], null, null, null, null, [["speech", 21.73], ["grunt", 17.99], ["hum", 16.85]], [["noise", 53.73], ["speech", 21.28], ["sidetone", 4.21]], null, null, [["speech", 88.32], ["speech synthesizer", 3.14], ["male speech, man speaking", 1.47]], [["music", 42.45], ["speech", 19.97], ["synthesizer", 6.33]], null, [["music", 29.2], ["speech", 13.85], ["whack, thwack", 11.67]], [["music", 54.9], ["quack", 9.57], ["didgeridoo", 3.32]], [["music", 64.38], ["synthesizer", 8.31], ["musical instrument", 3.24]], null], "duration": [-0.4, 4.4, 0.44, 3.33, 4.21, 0.92, 2.94, 0.59, 2.64, 0.17, 3.38, 0.31, 1.56, 1.07, 1.77, 5.28, 5.52, 1.05, 1.41, 3.44, 7.46, 0.47, 7.44, 2.43, 8.95, 1.04]} \ No newline at end of file diff --git a/annotations_1/71Nmq8VOKnY_filtered.json b/annotations_1/71Nmq8VOKnY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c55104a3ff73973727ad0b130f5171d94614b9b --- /dev/null +++ b/annotations_1/71Nmq8VOKnY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.33], [6.0, 8.8], [10.0, 10.81], [12.0, 12.93], [13.0, 14.0], [14.0, 16.01], [17.0, 29.37], [30.0, 44.51], [45.0, 48.17], [49.0, 51.12], [52.0, 70.44], [73.0, 74.04], [79.0, 117.58], [119.0, 119.18], [120.0, 131.52], [134.0, 134.59], [136.0, 137.42], [140.0, 140.8], [141.0, 143.36], [146.0, 149.81]], "keep_status": [false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [44.63, 46.72, 0.0, 0.0, 0.0, 36.72, 35.24, 33.56, 39.61, 45.11, 36.9, 0.0, 0.0, 0.0, 31.71, 0.0, 0.0, 0.0, 36.76, 34.05], "audiomae_on_audioset": [[["music", 30.35], ["hum", 30.13], ["mains hum", 12.96]], [["mains hum", 49.88], ["hum", 45.31], ["throbbing", 1.3]], null, null, null, [["music", 38.62], ["foghorn", 12.3], ["theremin", 9.52]], [["music", 39.14], ["theremin", 14.22], ["speech", 6.71]], [["singing bowl", 33.42], ["music", 20.84], ["wind instrument, woodwind instrument", 18.38]], [["music", 42.68], ["speech", 16.26], ["domestic animals, pets", 1.94]], [["music", 69.45], ["theremin", 3.84], ["electronic music", 3.76]], [["theremin", 83.66], ["music", 9.2], ["singing bowl", 2.07]], null, null, null, [["music", 69.35], ["synthesizer", 7.74], ["musical instrument", 4.11]], null, null, null, [["music", 42.17], ["mains hum", 10.72], ["hum", 8.83]], [["music", 49.87], ["musical instrument", 8.24], ["didgeridoo", 4.56]]], "duration": [3.33, 2.8, 0.81, 0.93, 1.0, 2.01, 12.37, 14.51, 3.17, 2.12, 18.44, 1.04, 38.58, 0.18, 11.52, 0.59, 1.42, 0.8, 2.36, 3.81]} \ No newline at end of file diff --git a/annotations_1/71pIZ76YvR4_filtered.json b/annotations_1/71pIZ76YvR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49e7f949bdd56482174353f4b8519e6f0bbb2eed --- /dev/null +++ b/annotations_1/71pIZ76YvR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 20.16], [21.0, 24.07], [25.0, 25.95], [28.0, 28.86], [30.0, 30.65], [36.0, 37.07], [38.0, 39.02], [47.0, 48.36], [55.0, 56.12], [57.0, 58.24], [61.0, 62.23], [64.0, 64.91], [66.0, 66.95], [68.0, 69.92], [72.0, 75.09], [76.0, 77.41], [78.0, 78.63], [80.0, 81.14], [82.0, 82.24], [83.0, 84.11], [86.0, 88.97], [90.0, 90.61], [95.0, 98.24], [99.0, 102.02], [104.0, 109.49], [111.0, 113.39], [114.0, 114.51], [115.0, 116.78], [117.0, 119.3], [120.0, 120.75], [123.0, 124.09], [132.0, 133.07]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.0, 48.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 59.24, 0.0, 69.88, 97.33, 86.09, 77.36, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 59.57], ["fart", 14.05], ["music", 5.61]], [["throbbing", 37.99], ["hum", 13.06], ["music", 10.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.16, 3.07, 0.95, 0.86, 0.65, 1.07, 1.02, 1.36, 1.12, 1.24, 1.23, 0.91, 0.95, 1.92, 3.09, 1.41, 0.63, 1.14, 0.24, 1.11, 2.97, 0.61, 3.24, 3.02, 5.49, 2.39, 0.51, 1.78, 2.3, 0.75, 1.09, 1.07]} \ No newline at end of file diff --git a/annotations_1/73Pm3rkTzb0_filtered.json b/annotations_1/73Pm3rkTzb0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cbd019fb25f9ed28b4ffa17c5020cc268cde9a8 --- /dev/null +++ b/annotations_1/73Pm3rkTzb0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.1], [13.0, 34.18], [36.0, 36.76], [40.0, 40.22], [41.0, 41.96], [44.0, 45.59], [47.0, 48.68], [54.0, 54.5], [59.0, 59.7], [65.0, 65.74], [67.0, 67.64], [69.0, 69.97], [71.0, 73.47], [74.0, 74.33], [75.0, 77.35], [78.0, 80.7], [82.0, 84.28], [85.0, 85.26], [87.0, 87.45], [88.0, 88.42], [91.0, 92.1], [94.0, 94.96], [96.0, 103.08], [105.0, 105.95], [108.0, 108.97], [110.0, 111.64], [112.0, 113.68], [123.0, 123.3], [125.0, 126.27], [129.0, 134.89], [140.0, 141.61], [143.0, 144.04]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.57, 0.0, 49.73, 54.83, 47.5, 0.0, 0.0, 0.0, 0.0, 0.0, 33.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.29, 0.0, 0.0], "audiomae_on_audioset": [null, [["explosion", 22.24], ["hum", 21.17], ["fire", 12.89]], null, null, null, null, null, null, null, null, null, null, [["music", 41.66], ["brass instrument", 8.95], ["musical instrument", 7.84]], null, [["music", 37.2], ["theremin", 10.38], ["musical instrument", 6.42]], null, [["music", 21.32], ["insect", 8.33], ["whale vocalization", 6.42]], null, null, null, null, null, [["music", 73.63], ["boing", 4.5], ["didgeridoo", 2.59]], null, null, null, null, null, null, [["music", 68.41], ["marimba, xylophone", 2.71], ["theremin", 2.54]], null, null], "duration": [0.1, 21.18, 0.76, 0.22, 0.96, 1.59, 1.68, 0.5, 0.7, 0.74, 0.64, 0.97, 2.47, 0.33, 2.35, 2.7, 2.28, 0.26, 0.45, 0.42, 1.1, 0.96, 7.08, 0.95, 0.97, 1.64, 1.68, 0.3, 1.27, 5.89, 1.61, 1.04]} \ No newline at end of file diff --git a/annotations_1/74DUcGnFH8g_filtered.json b/annotations_1/74DUcGnFH8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b52e76dcbc06bdd7583ee5cec8b66eef386431c --- /dev/null +++ b/annotations_1/74DUcGnFH8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.02], [21.0, 21.93], [23.0, 23.73], [25.0, 26.27], [27.0, 56.25], [59.0, 58.95], [61.0, 90.56], [92.0, 91.71], [92.0, 91.74], [92.0, 91.77], [92.0, 97.31], [98.0, 98.22], [99.0, 115.48], [121.0, 145.83], [150.0, 150.55], [151.0, 172.0], [177.0, 189.62], [193.0, 203.49], [205.0, 221.26], [223.0, 263.82], [266.0, 265.87]], "keep_status": [true, false, false, false, false, false, true, false, false, false, true, false, true, false, false, true, true, true, true, false, false], "silence_prob": [49.27, 0.0, 0.0, 0.0, 29.16, 0.0, 28.98, 0.0, 0.0, 0.0, 28.38, 0.0, 28.3, 28.42, 0.0, 28.66, 28.69, 28.57, 28.4, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.4], ["hum", 3.46], ["ambient music", 2.93]], null, null, null, [["speech", 26.03], ["hum", 24.39], ["mains hum", 20.93]], null, [["music", 42.11], ["didgeridoo", 9.54], ["throbbing", 7.9]], null, null, null, [["music", 17.0], ["groan", 12.57], ["roaring cats (lions, tigers)", 10.46]], null, [["music", 31.87], ["speech", 7.86], ["animal", 6.24]], [["music", 63.8], ["speech", 4.82], ["musical instrument", 3.33]], null, [["fart", 23.42], ["electric shaver, electric razor", 13.75], ["music", 11.17]], [["music", 35.62], ["buzz", 11.63], ["speech", 4.92]], [["music", 42.33], ["speech", 8.69], ["throbbing", 5.03]], [["vehicle", 24.25], ["music", 12.03], ["race car, auto racing", 6.61]], null, null], "duration": [2.02, 0.93, 0.73, 1.27, 29.25, -0.05, 29.56, -0.29, -0.26, -0.23, 5.31, 0.22, 16.48, 24.83, 0.55, 21.0, 12.62, 10.49, 16.26, 40.82, -0.13]} \ No newline at end of file diff --git a/annotations_1/74Od5-Fmf60_filtered.json b/annotations_1/74Od5-Fmf60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..620205bb7420a0d9dad7ffe3228c223dcf5587dd --- /dev/null +++ b/annotations_1/74Od5-Fmf60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.35], [6.0, 8.95], [12.0, 16.29], [18.0, 17.93], [19.0, 21.73], [42.0, 44.22], [46.0, 47.48], [63.0, 63.56], [75.0, 77.38], [83.0, 91.71], [94.0, 95.12], [109.0, 109.11], [114.0, 114.94], [119.0, 119.3], [121.0, 123.6], [126.0, 128.87], [130.0, 138.21], [141.0, 148.66]], "keep_status": [false, true, false, false, true, false, false, false, true, true, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 32.37, 31.14, 0.0, 43.08, 90.6, 0.0, 0.0, 30.04, 30.81, 0.0, 0.0, 0.0, 0.0, 30.6, 29.67, 30.13, 29.34], "audiomae_on_audioset": [null, [["music", 21.48], ["a capella", 12.24], ["vocal music", 11.97]], [["music", 82.75], ["singing", 2.3], ["electronic music", 1.25]], null, [["speech", 39.77], ["noise", 19.42], ["music", 5.88]], null, null, null, [["cattle, bovinae", 28.08], ["speech", 16.09], ["animal", 13.93]], [["breaking", 33.88], ["whack, thwack", 16.26], ["smash, crash", 15.93]], null, null, null, null, [["music", 51.61], ["cacophony", 5.83], ["speech", 3.23]], [["music", 60.65], ["speech", 24.3], ["didgeridoo", 2.21]], [["music", 63.49], ["speech", 13.63], ["hum", 3.44]], [["music", 36.24], ["whack, thwack", 9.25], ["fart", 6.91]]], "duration": [0.35, 2.95, 4.29, -0.07, 2.73, 2.22, 1.48, 0.56, 2.38, 8.71, 1.12, 0.11, 0.94, 0.3, 2.6, 2.87, 8.21, 7.66]} \ No newline at end of file diff --git a/annotations_1/74PUHyVj4BQ_filtered.json b/annotations_1/74PUHyVj4BQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b534ec16b116942c4becf98301a414be5abf549c --- /dev/null +++ b/annotations_1/74PUHyVj4BQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 17.9], [20.0, 21.15], [24.0, 26.37], [30.0, 31.06], [31.0, 33.32], [35.0, 36.71], [41.0, 40.74], [49.0, 55.39], [57.0, 93.6], [94.0, 94.51], [99.0, 100.82], [105.0, 104.99], [107.0, 107.35], [110.0, 111.13], [115.0, 115.6], [118.0, 118.66], [124.0, 135.53], [137.0, 138.64], [149.0, 153.86], [158.0, 160.59], [161.0, 161.81], [162.0, 162.92], [165.0, 165.32], [166.0, 173.18]], "keep_status": [true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true], "silence_prob": [43.96, 0.0, 40.57, 0.0, 44.32, 0.0, 0.0, 30.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.95, 0.0, 32.09, 58.98, 0.0, 0.0, 0.0, 39.44], "audiomae_on_audioset": [[["animal", 16.75], ["grunt", 16.5], ["burping, eructation", 8.46]], null, [["whale vocalization", 33.72], ["speech", 21.71], ["livestock, farm animals, working animals", 2.73]], null, [["speech", 24.98], ["livestock, farm animals, working animals", 19.63], ["cattle, bovinae", 18.31]], null, null, [["music", 61.51], ["didgeridoo", 6.76], ["throbbing", 5.58]], null, null, null, null, null, null, null, null, [["hum", 17.74], ["throbbing", 13.02], ["grunt", 8.94]], null, [["music", 19.11], ["speech", 15.73], ["gunshot, gunfire", 11.27]], null, null, null, null, [["music", 23.65], ["speech", 17.25], ["sidetone", 11.07]]], "duration": [12.9, 1.15, 2.37, 1.06, 2.32, 1.71, -0.26, 6.39, 36.6, 0.51, 1.82, -0.01, 0.35, 1.13, 0.6, 0.66, 11.53, 1.64, 4.86, 2.59, 0.81, 0.92, 0.32, 7.18]} \ No newline at end of file diff --git a/annotations_1/74ZjOVz3gs4_filtered.json b/annotations_1/74ZjOVz3gs4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dda65d634bb56b1b893174fe5b7fd031e4735cb7 --- /dev/null +++ b/annotations_1/74ZjOVz3gs4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.97], [15.0, 15.26], [22.0, 23.4], [34.0, 38.7], [42.0, 45.28], [46.0, 46.74], [47.0, 47.9], [50.0, 51.6], [57.0, 63.66], [66.0, 69.55], [71.0, 72.23], [74.0, 74.06], [75.0, 75.84], [76.0, 77.43], [79.0, 79.05], [80.0, 82.92], [88.0, 88.97], [89.0, 89.7], [124.0, 127.18], [134.0, 134.59], [137.0, 137.57]], "keep_status": [false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.26, 32.37, 0.0, 0.0, 0.0, 34.21, 33.99, 0.0, 0.0, 0.0, 0.0, 0.0, 33.67, 0.0, 0.0, 53.65, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 44.89], ["didgeridoo", 12.1], ["throbbing", 3.83]], [["boing", 25.24], ["whack, thwack", 20.21], ["ding", 12.55]], null, null, null, [["speech", 58.77], ["music", 23.14], ["noise", 2.32]], [["noise", 34.69], ["music", 15.56], ["speech", 8.74]], null, null, null, null, null, [["speech", 38.77], ["music", 10.87], ["fart", 4.69]], null, null, null, null, null], "duration": [-0.03, 0.26, 1.4, 4.7, 3.28, 0.74, 0.9, 1.6, 6.66, 3.55, 1.23, 0.06, 0.84, 1.43, 0.05, 2.92, 0.97, 0.7, 3.18, 0.59, 0.57]} \ No newline at end of file diff --git a/annotations_1/757qJxO5D6Y_filtered.json b/annotations_1/757qJxO5D6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3fefd418cbeee702d45f5fba2b8221b2b9d3b1d3 --- /dev/null +++ b/annotations_1/757qJxO5D6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.4], [12.0, 15.06], [17.0, 18.08], [20.0, 20.65], [22.0, 22.52], [24.0, 24.6], [26.0, 26.35], [29.0, 29.93], [30.0, 32.97], [34.0, 34.5], [38.0, 40.59], [43.0, 43.51], [45.0, 66.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [82.43, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.7, 0.0, 99.1, 0.0, 30.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["insect", 45.43], ["fly, housefly", 43.81], ["mosquito", 8.09]], null, null, null, [["speech", 41.54], ["fart", 11.33], ["whack, thwack", 6.27]]], "duration": [3.4, 3.06, 1.08, 0.65, 0.52, 0.6, 0.35, 0.93, 2.97, 0.5, 2.59, 0.51, 21.45]} \ No newline at end of file diff --git a/annotations_1/75EThT2il7k_filtered.json b/annotations_1/75EThT2il7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..118994282e17ca8337067465907640d4fa4f6ad3 --- /dev/null +++ b/annotations_1/75EThT2il7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.34], [20.0, 21.51], [28.0, 76.71], [78.0, 79.95], [82.0, 83.84], [86.0, 89.46]], "keep_status": [true, false, false, false, false, true], "silence_prob": [37.77, 0.0, 0.0, 0.0, 0.0, 31.58], "audiomae_on_audioset": [[["music", 46.68], ["carnatic music", 11.41], ["sitar", 8.03]], null, null, null, null, [["insect", 29.53], ["fly, housefly", 22.15], ["speech", 8.02]]], "duration": [2.34, 1.51, 48.71, 1.95, 1.84, 3.46]} \ No newline at end of file diff --git a/annotations_1/75k4CoAyT4I_filtered.json b/annotations_1/75k4CoAyT4I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d41a63b8eaf24fa7cf74f327f320be6a16b3d4e --- /dev/null +++ b/annotations_1/75k4CoAyT4I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.37], [12.0, 13.37], [18.0, 18.67], [20.0, 20.73], [22.0, 29.51], [33.0, 37.61], [43.0, 43.53], [46.0, 46.36], [51.0, 51.93], [53.0, 53.49], [54.0, 58.46], [61.0, 62.87], [64.0, 64.4], [65.0, 68.57], [70.0, 69.96], [71.0, 71.9], [72.0, 73.9], [74.0, 75.19], [79.0, 84.5], [103.0, 122.89]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.74, 0.0, 0.0, 0.0, 32.33, 34.2, 0.0, 0.0, 0.0, 0.0, 45.14, 0.0, 0.0, 56.18, 0.0, 0.0, 0.0, 0.0, 61.27, 31.28], "audiomae_on_audioset": [[["music", 44.21], ["speech", 21.64], ["throbbing", 11.12]], null, null, null, [["music", 47.47], ["didgeridoo", 18.18], ["speech", 15.44]], [["speech", 39.47], ["music", 26.93], ["didgeridoo", 3.33]], null, null, null, null, [["music", 73.36], ["throbbing", 3.61], ["musical instrument", 2.08]], null, null, null, null, null, null, null, null, [["music", 80.69], ["hip hop music", 2.48], ["funk", 2.05]]], "duration": [7.37, 1.37, 0.67, 0.73, 7.51, 4.61, 0.53, 0.36, 0.93, 0.49, 4.46, 1.87, 0.4, 3.57, -0.04, 0.9, 1.9, 1.19, 5.5, 19.89]} \ No newline at end of file diff --git a/annotations_1/76pNjmVp58w_filtered.json b/annotations_1/76pNjmVp58w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/76pNjmVp58w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/79WfcpXDbg4_filtered.json b/annotations_1/79WfcpXDbg4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43fe111f7eb221fa447ccc174fc3035e625966f0 --- /dev/null +++ b/annotations_1/79WfcpXDbg4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.5], [22.0, 57.86], [61.0, 74.29], [75.0, 77.03], [79.0, 79.59], [84.0, 91.52], [95.0, 95.96], [98.0, 101.41], [104.0, 117.44], [119.0, 119.87], [120.0, 119.92], [120.0, 123.94], [126.0, 138.96], [141.0, 142.45]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [32.71, 0.0, 32.92, 51.34, 0.0, 29.42, 0.0, 40.45, 34.91, 0.0, 0.0, 33.99, 35.23, 0.0], "audiomae_on_audioset": [[["music", 56.76], ["speech", 20.85], ["didgeridoo", 4.18]], null, [["telephone bell ringing", 44.16], ["music", 35.89], ["speech", 13.58]], null, null, [["speech", 42.19], ["whack, thwack", 5.98], ["rumble", 5.76]], null, [["music", 56.79], ["didgeridoo", 30.47], ["hum", 1.96]], [["music", 60.85], ["sidetone", 11.89], ["speech", 5.76]], null, null, [["speech", 33.13], ["bee, wasp, etc.", 4.68], ["male speech, man speaking", 4.13]], [["music", 63.76], ["speech", 8.98], ["scary music", 5.75]], null], "duration": [10.5, 35.86, 13.29, 2.03, 0.59, 7.52, 0.96, 3.41, 13.44, 0.87, -0.08, 3.94, 12.96, 1.45]} \ No newline at end of file diff --git a/annotations_1/7A6HQOrRDiw_filtered.json b/annotations_1/7A6HQOrRDiw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd84e65684875f3f9ca8e460b776fa2ff399cd9c --- /dev/null +++ b/annotations_1/7A6HQOrRDiw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [3.0, 3.62], [4.0, 4.95], [5.0, 6.44], [8.0, 8.38], [10.0, 10.77], [12.0, 12.41], [15.0, 16.06], [17.0, 18.03], [19.0, 20.09], [21.0, 22.49], [24.0, 25.73], [26.0, 26.97], [27.0, 28.05], [28.0, 28.92], [31.0, 32.31], [33.0, 34.2], [36.0, 37.83], [40.0, 39.78], [41.0, 41.96], [42.0, 43.01], [43.0, 44.66], [46.0, 47.11], [49.0, 50.65], [51.0, 51.46], [52.0, 52.56], [53.0, 54.23], [56.0, 57.62], [58.0, 59.12], [60.0, 60.44], [61.0, 63.27], [65.0, 68.59], [71.0, 73.36], [74.0, 80.59], [81.0, 82.17], [86.0, 87.62], [88.0, 89.83], [95.0, 95.76], [98.0, 98.37], [101.0, 102.27], [106.0, 108.36], [110.0, 111.11], [113.0, 114.18], [115.0, 116.24], [118.0, 124.12], [125.0, 125.27], [126.0, 128.61], [129.0, 129.69], [131.0, 133.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 88.28, 56.25, 38.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 61.18, 0.0, 70.58, 0.0, 62.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 47.27], ["music", 32.27], ["musical instrument", 2.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 0.62, 0.95, 1.44, 0.38, 0.77, 0.41, 1.06, 1.03, 1.09, 1.49, 1.73, 0.97, 1.05, 0.92, 1.31, 1.2, 1.83, -0.22, 0.96, 1.01, 1.66, 1.11, 1.65, 0.46, 0.56, 1.23, 1.62, 1.12, 0.44, 2.27, 3.59, 2.36, 6.59, 1.17, 1.62, 1.83, 0.76, 0.37, 1.27, 2.36, 1.11, 1.18, 1.24, 6.12, 0.27, 2.61, 0.69, 2.32]} \ No newline at end of file diff --git a/annotations_1/7AB4ab4LtFo_filtered.json b/annotations_1/7AB4ab4LtFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0a5d26a5caa413abb1f1a6b02dff2d719d3024a --- /dev/null +++ b/annotations_1/7AB4ab4LtFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.67], [10.0, 10.49], [11.0, 12.31], [14.0, 15.6], [16.0, 19.55], [20.0, 24.34], [25.0, 26.43], [28.0, 64.79], [73.0, 100.55], [104.0, 136.46], [139.0, 139.04], [142.0, 141.96], [142.0, 171.69]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 46.86, 54.7, 0.0, 0.0, 33.01, 0.0, 0.0, 0.0, 36.86], "audiomae_on_audioset": [null, null, null, null, [["cattle, bovinae", 32.34], ["livestock, farm animals, working animals", 21.45], ["moo", 10.7]], null, null, null, [["whale vocalization", 14.35], ["animal", 12.94], ["cattle, bovinae", 12.82]], null, null, null, [["music", 34.38], ["speech", 14.33], ["theremin", 6.74]]], "duration": [0.67, 0.49, 1.31, 1.6, 3.55, 4.34, 1.43, 36.79, 27.55, 32.46, 0.04, -0.04, 29.69]} \ No newline at end of file diff --git a/annotations_1/7AajEaNH7g4_filtered.json b/annotations_1/7AajEaNH7g4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed864f8c624245e25b138148fdebda1c4ae0cd49 --- /dev/null +++ b/annotations_1/7AajEaNH7g4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.98], [17.0, 18.57], [27.0, 27.58], [32.0, 32.49], [34.0, 34.33], [35.0, 36.86], [39.0, 39.82], [43.0, 44.19], [45.0, 45.13], [51.0, 51.75], [56.0, 56.59], [62.0, 62.01], [65.0, 65.21], [73.0, 73.47], [83.0, 83.69], [91.0, 91.98], [98.0, 98.17], [103.0, 105.93], [108.0, 108.03], [112.0, 112.28], [117.0, 117.9], [121.0, 121.26], [125.0, 125.09], [129.0, 129.41], [136.0, 136.49], [141.0, 141.37], [147.0, 148.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.98, 1.57, 0.58, 0.49, 0.33, 1.86, 0.82, 1.19, 0.13, 0.75, 0.59, 0.01, 0.21, 0.47, 0.69, 0.98, 0.17, 2.93, 0.03, 0.28, 0.9, 0.26, 0.09, 0.41, 0.49, 0.37, 1.83]} \ No newline at end of file diff --git a/annotations_1/7AnDGdVit4w_filtered.json b/annotations_1/7AnDGdVit4w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ead3d1f9acfc7f171b763042843de6b5388a9680 --- /dev/null +++ b/annotations_1/7AnDGdVit4w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.06], [4.0, 6.81], [8.0, 8.4], [10.0, 11.64], [14.0, 14.69], [15.0, 15.45], [26.0, 25.86], [31.0, 31.14], [59.0, 60.22], [61.0, 61.69], [62.0, 61.99], [63.0, 67.24], [69.0, 70.01], [75.0, 75.37], [80.0, 80.87], [82.0, 82.9], [85.0, 93.56], [95.0, 101.88], [104.0, 104.31], [105.0, 105.58], [109.0, 110.24], [112.0, 119.01], [120.0, 133.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 54.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67, 0.0, 0.0, 0.0, 0.0, 90.78, 89.72, 0.0, 0.0, 0.0, 89.36, 44.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 53.04], ["electric shaver, electric razor", 13.16], ["microwave oven", 7.49]]], "duration": [0.06, 2.81, 0.4, 1.64, 0.69, 0.45, -0.14, 0.14, 1.22, 0.69, -0.01, 4.24, 1.01, 0.37, 0.87, 0.9, 8.56, 6.88, 0.31, 0.58, 1.24, 7.01, 13.98]} \ No newline at end of file diff --git a/annotations_1/7C-aB09i30E_filtered.json b/annotations_1/7C-aB09i30E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d1e1c03ffb90c83f3ee3369786c24e670f2151b --- /dev/null +++ b/annotations_1/7C-aB09i30E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.5], [14.0, 16.6], [28.0, 27.8], [29.0, 29.64], [30.0, 38.84], [41.0, 44.95], [47.0, 48.34], [57.0, 57.96], [62.0, 63.41], [66.0, 67.63]], "keep_status": [false, false, false, false, true, false, false, false, false, false], "silence_prob": [57.25, 58.55, 0.0, 0.0, 32.82, 36.99, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["fly, housefly", 39.83], ["insect", 11.8], ["speech", 9.83]], [["fly, housefly", 41.56], ["insect", 26.03], ["bee, wasp, etc.", 10.02]], null, null, null, null], "duration": [3.5, 2.6, -0.2, 0.64, 8.84, 3.95, 1.34, 0.96, 1.41, 1.63]} \ No newline at end of file diff --git a/annotations_1/7CVfTd-_qbc_filtered.json b/annotations_1/7CVfTd-_qbc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cf4dd92ab6dc9c3a0660859f728bcf0a2f10065 --- /dev/null +++ b/annotations_1/7CVfTd-_qbc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.93], [21.0, 21.34], [43.0, 43.58], [44.0, 43.9], [44.0, 44.17], [63.0, 69.53], [71.0, 77.45], [78.0, 78.07], [113.0, 159.24]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.28, 31.7, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 81.28], ["throbbing", 3.23], ["hum", 2.05]], [["music", 56.08], ["sidetone", 4.45], ["throbbing", 3.55]], null, null], "duration": [0.93, 0.34, 0.58, -0.1, 0.17, 6.53, 6.45, 0.07, 46.24]} \ No newline at end of file diff --git a/annotations_1/7DP-JKwZrA0_filtered.json b/annotations_1/7DP-JKwZrA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae7f28c148fc9cc8aac8bc9de8d9e912959749bc --- /dev/null +++ b/annotations_1/7DP-JKwZrA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.08], [27.0, 28.41], [30.0, 30.35], [31.0, 32.37], [37.0, 37.42], [39.0, 38.94], [40.0, 40.51], [44.0, 49.69], [53.0, 54.45], [62.0, 62.13], [65.0, 67.2], [68.0, 68.89], [73.0, 76.77], [82.0, 82.85], [84.0, 85.11], [86.0, 86.91], [90.0, 91.77], [94.0, 98.31], [99.0, 99.47], [105.0, 108.21], [112.0, 113.22], [119.0, 121.37], [123.0, 123.52], [125.0, 127.77]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.72, 0.0, 0.0, 28.33, 0.0, 28.45, 0.0, 0.0, 0.0, 0.0, 29.18, 0.0, 29.71, 0.0, 28.48, 0.0, 29.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 31.56], ["speech", 13.99], ["hum", 13.21]], null, null, [["speech", 48.06], ["explosion", 8.88], ["burst, pop", 7.98]], null, [["music", 18.19], ["explosion", 15.43], ["whack, thwack", 6.4]], null, null, null, null, [["explosion", 37.91], ["speech", 24.32], ["burst, pop", 10.46]], null, [["cattle, bovinae", 26.82], ["moo", 11.85], ["livestock, farm animals, working animals", 11.02]], null, [["explosion", 40.62], ["speech", 7.47], ["eruption", 6.59]], null, [["explosion", 30.12], ["speech", 12.51], ["music", 12.41]]], "duration": [0.08, 1.41, 0.35, 1.37, 0.42, -0.06, 0.51, 5.69, 1.45, 0.13, 2.2, 0.89, 3.77, 0.85, 1.11, 0.91, 1.77, 4.31, 0.47, 3.21, 1.22, 2.37, 0.52, 2.77]} \ No newline at end of file diff --git a/annotations_1/7D_6z1EnSik_filtered.json b/annotations_1/7D_6z1EnSik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc70265652a6b6a4c71a90fed93662e74273c6d3 --- /dev/null +++ b/annotations_1/7D_6z1EnSik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.94], [17.0, 17.88], [19.0, 19.43], [24.0, 24.98], [25.0, 33.66], [38.0, 46.09], [46.0, 46.13], [49.0, 70.07], [70.0, 73.84], [74.0, 76.23], [77.0, 77.8], [81.0, 80.81], [86.0, 86.59], [87.0, 88.08], [91.0, 93.26], [94.0, 95.61], [101.0, 101.6], [103.0, 103.03], [107.0, 109.76], [114.0, 114.03], [117.0, 138.28], [139.0, 139.95], [141.0, 141.79], [142.0, 142.97]], "keep_status": [true, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [43.56, 0.0, 0.0, 0.0, 65.91, 54.97, 0.0, 32.7, 42.98, 43.05, 0.0, 0.0, 0.0, 0.0, 56.78, 0.0, 0.0, 0.0, 40.26, 0.0, 32.49, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 27.43], ["music", 18.97], ["mains hum", 15.99]], null, null, null, null, null, null, [["animal", 26.21], ["speech", 19.22], ["domestic animals, pets", 8.38]], [["livestock, farm animals, working animals", 26.17], ["speech", 19.25], ["animal", 14.12]], [["speech", 30.27], ["livestock, farm animals, working animals", 3.57], ["animal", 2.75]], null, null, null, null, null, null, null, null, [["speech", 52.26], ["buzz", 3.02], ["noise", 2.79]], null, [["speech", 48.5], ["music", 26.04], ["sidetone", 3.7]], null, null, null], "duration": [9.94, 0.88, 0.43, 0.98, 8.66, 8.09, 0.13, 21.07, 3.84, 2.23, 0.8, -0.19, 0.59, 1.08, 2.26, 1.61, 0.6, 0.03, 2.76, 0.03, 21.28, 0.95, 0.79, 0.97]} \ No newline at end of file diff --git a/annotations_1/7EcK-LuhzAA_filtered.json b/annotations_1/7EcK-LuhzAA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a690c41543940362eb903ebf4a669ff30ed9e71e --- /dev/null +++ b/annotations_1/7EcK-LuhzAA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.17], [9.0, 10.44], [15.0, 16.48], [17.0, 19.33], [22.0, 22.37], [24.0, 25.51], [29.0, 30.74], [32.0, 33.13], [35.0, 37.77], [40.0, 42.85], [48.0, 50.06], [54.0, 55.53], [61.0, 62.16], [67.0, 68.34], [71.0, 75.49], [76.0, 77.16], [78.0, 78.24], [78.0, 78.27], [78.0, 82.26], [84.0, 84.72], [86.0, 87.24], [88.0, 87.96], [88.0, 88.03], [90.0, 94.05], [97.0, 102.44], [103.0, 107.06], [112.0, 113.44], [116.0, 118.25], [123.0, 133.08], [137.0, 137.57], [139.0, 140.68], [142.0, 145.17], [146.0, 146.6], [148.0, 149.01], [150.0, 151.44], [154.0, 155.85], [159.0, 162.03], [164.0, 170.75], [177.0, 195.61]], "keep_status": [false, false, false, true, false, false, false, false, true, false, true, false, false, false, true, false, false, false, true, false, false, false, false, true, true, false, false, true, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [54.76, 0.0, 0.0, 39.09, 0.0, 0.0, 0.0, 0.0, 35.36, 51.12, 35.22, 0.0, 0.0, 0.0, 46.09, 0.0, 0.0, 0.0, 47.62, 0.0, 0.0, 0.0, 0.0, 33.15, 33.87, 33.03, 0.0, 33.07, 30.94, 0.0, 0.0, 37.85, 0.0, 0.0, 0.0, 0.0, 36.81, 30.47, 31.28], "audiomae_on_audioset": [null, null, null, [["speech", 17.02], ["insect", 9.89], ["fly, housefly", 6.64]], null, null, null, null, [["livestock, farm animals, working animals", 19.65], ["cattle, bovinae", 15.21], ["moo", 11.79]], null, [["music", 51.94], ["frog", 4.82], ["electronic music", 4.15]], null, null, null, [["music", 25.32], ["bleat", 10.7], ["animal", 6.2]], null, null, null, [["music", 59.75], ["musical instrument", 2.41], ["throbbing", 1.92]], null, null, null, null, [["music", 50.47], ["cattle, bovinae", 6.94], ["moo", 6.63]], [["music", 55.84], ["musical instrument", 7.09], ["guitar", 3.88]], [["music", 60.1], ["didgeridoo", 12.52], ["electronic music", 1.98]], null, [["mosquito", 22.03], ["fly, housefly", 9.01], ["speech", 8.97]], [["music", 46.14], ["speech", 33.25], ["electric shaver, electric razor", 5.65]], null, null, [["music", 19.77], ["fly, housefly", 16.5], ["mosquito", 9.29]], null, null, null, null, [["fly, housefly", 61.94], ["insect", 29.0], ["mosquito", 6.15]], [["music", 35.5], ["boing", 14.75], ["whack, thwack", 10.27]], [["music", 75.31], ["groan", 2.14], ["wail, moan", 1.93]]], "duration": [5.17, 1.44, 1.48, 2.33, 0.37, 1.51, 1.74, 1.13, 2.77, 2.85, 2.06, 1.53, 1.16, 1.34, 4.49, 1.16, 0.24, 0.27, 4.26, 0.72, 1.24, -0.04, 0.03, 4.05, 5.44, 4.06, 1.44, 2.25, 10.08, 0.57, 1.68, 3.17, 0.6, 1.01, 1.44, 1.85, 3.03, 6.75, 18.61]} \ No newline at end of file diff --git a/annotations_1/7EmNSHq1mh0_filtered.json b/annotations_1/7EmNSHq1mh0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5815e55067acf3ccff7dbbf95ca6b10ee1cc1ef1 --- /dev/null +++ b/annotations_1/7EmNSHq1mh0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.06], [18.0, 19.6], [21.0, 37.03], [39.0, 47.53], [48.0, 49.89], [51.0, 53.06], [57.0, 67.14], [71.0, 94.12], [127.0, 127.41], [129.0, 130.03]], "keep_status": [true, false, false, false, false, true, false, true, false, false], "silence_prob": [47.9, 0.0, 32.41, 54.04, 0.0, 36.67, 31.18, 30.22, 0.0, 0.0], "audiomae_on_audioset": [[["music", 32.56], ["hum", 14.87], ["throbbing", 11.3]], null, [["music", 70.46], ["soundtrack music", 4.54], ["hum", 4.24]], null, null, [["music", 23.67], ["hum", 11.32], ["mains hum", 6.19]], [["music", 52.03], ["speech", 11.16], ["didgeridoo", 8.41]], [["music", 23.41], ["hum", 20.38], ["buzz", 8.37]], null, null], "duration": [2.06, 1.6, 16.03, 8.53, 1.89, 2.06, 10.14, 23.12, 0.41, 1.03]} \ No newline at end of file diff --git a/annotations_1/7Fj5JAYfWVc_filtered.json b/annotations_1/7Fj5JAYfWVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f42a4917d39c56409eaf938aaa8d2b33b52db739 --- /dev/null +++ b/annotations_1/7Fj5JAYfWVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.17], [14.0, 19.52], [23.0, 24.93], [33.0, 35.45], [37.0, 36.91], [41.0, 44.12], [45.0, 46.47], [55.0, 57.97], [63.0, 76.45], [77.0, 81.97], [82.0, 82.0], [84.0, 85.33], [88.0, 92.65], [93.0, 112.45], [113.0, 114.61], [115.0, 114.64], [117.0, 122.74], [128.0, 135.6], [146.0, 146.16], [150.0, 161.52], [163.0, 163.22], [164.0, 166.41]], "keep_status": [false, false, false, true, false, false, false, false, true, true, false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [33.39, 33.05, 0.0, 36.6, 0.0, 34.13, 0.0, 32.51, 37.34, 39.72, 0.0, 0.0, 46.4, 32.13, 0.0, 0.0, 31.29, 36.39, 0.0, 33.2, 0.0, 51.6], "audiomae_on_audioset": [[["whale vocalization", 67.51], ["moo", 11.03], ["cattle, bovinae", 10.28]], [["cattle, bovinae", 45.12], ["moo", 38.74], ["livestock, farm animals, working animals", 9.95]], null, [["speech", 22.09], ["vehicle", 7.61], ["cattle, bovinae", 6.12]], null, [["livestock, farm animals, working animals", 38.82], ["cattle, bovinae", 30.56], ["moo", 23.04]], null, [["cattle, bovinae", 34.73], ["moo", 22.21], ["livestock, farm animals, working animals", 17.35]], [["mosquito", 16.58], ["whack, thwack", 12.47], ["noise", 11.29]], [["creak", 38.76], ["livestock, farm animals, working animals", 10.77], ["cattle, bovinae", 9.18]], null, null, [["music", 43.71], ["whale vocalization", 12.82], ["buzz", 5.12]], [["music", 83.43], ["didgeridoo", 3.67], ["grunt", 2.35]], null, null, [["music", 48.28], ["groan", 16.22], ["boing", 10.49]], [["music", 20.8], ["cattle, bovinae", 20.66], ["livestock, farm animals, working animals", 15.61]], null, [["throbbing", 39.04], ["music", 25.07], ["hum", 22.03]], null, null], "duration": [6.17, 5.52, 1.93, 2.45, -0.09, 3.12, 1.47, 2.97, 13.45, 4.97, 0.0, 1.33, 4.65, 19.45, 1.61, -0.36, 5.74, 7.6, 0.16, 11.52, 0.22, 2.41]} \ No newline at end of file diff --git a/annotations_1/7GrURVFAC2I_filtered.json b/annotations_1/7GrURVFAC2I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6de977edb8b74e64e88c5fe97e922002ee477ab8 --- /dev/null +++ b/annotations_1/7GrURVFAC2I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.88], [6.0, 5.86], [10.0, 10.74], [11.0, 11.99], [14.0, 16.12], [16.0, 16.58], [17.0, 17.51], [20.0, 19.7], [21.0, 21.32], [22.0, 24.06], [28.0, 28.41], [29.0, 29.89], [32.0, 33.17], [37.0, 36.88], [50.0, 50.43], [57.0, 58.21], [60.0, 60.39], [73.0, 77.75], [79.0, 79.27], [80.0, 81.13], [87.0, 87.98], [89.0, 89.72], [91.0, 93.21], [98.0, 97.93], [105.0, 106.34], [111.0, 111.54], [112.0, 113.53], [114.0, 114.61], [115.0, 116.06], [117.0, 116.68], [117.0, 119.01], [121.0, 124.06], [124.0, 125.44], [127.0, 131.6], [136.0, 136.63], [137.0, 136.83], [138.0, 138.16], [142.0, 143.09], [144.0, 144.46], [149.0, 149.23], [154.0, 155.16], [163.0, 163.49], [173.0, 175.0]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.37, 0.0, 0.0, 0.0, 0.0, 43.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.42, 0.0, 0.0, 0.0, 0.0, 34.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.64, 32.98, 0.0, 33.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.52], "audiomae_on_audioset": [null, null, null, null, [["speech", 32.73], ["cattle, bovinae", 15.19], ["crowd", 10.75]], null, null, null, null, [["speech", 28.29], ["siren", 7.25], ["hum", 6.98]], null, null, null, null, null, null, null, [["speech", 68.22], ["vehicle", 13.49], ["race car, auto racing", 2.98]], null, null, null, null, [["speech", 33.13], ["applause", 11.29], ["crowd", 8.94]], null, null, null, null, null, null, null, [["speech", 40.35], ["vehicle", 14.71], ["car", 7.14]], [["speech", 45.07], ["foghorn", 12.45], ["vehicle", 7.4]], null, [["speech", 34.4], ["sheep", 26.59], ["bleat", 11.68]], null, null, null, null, null, null, null, null, [["hum", 28.57], ["mains hum", 24.6], ["music", 12.96]]], "duration": [-0.12, -0.14, 0.74, 0.99, 2.12, 0.58, 0.51, -0.3, 0.32, 2.06, 0.41, 0.89, 1.17, -0.12, 0.43, 1.21, 0.39, 4.75, 0.27, 1.13, 0.98, 0.72, 2.21, -0.07, 1.34, 0.54, 1.53, 0.61, 1.06, -0.32, 2.01, 3.06, 1.44, 4.6, 0.63, -0.17, 0.16, 1.09, 0.46, 0.23, 1.16, 0.49, 2.0]} \ No newline at end of file diff --git a/annotations_1/7H3XPETdtmc_filtered.json b/annotations_1/7H3XPETdtmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8afa49d3c27103b89917e2eba07218a36b133e9 --- /dev/null +++ b/annotations_1/7H3XPETdtmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 43.07], [44.0, 47.71], [49.0, 79.57], [81.0, 86.12], [89.0, 95.74]], "keep_status": [true, true, false, true, true], "silence_prob": [31.47, 29.73, 0.0, 29.11, 29.64], "audiomae_on_audioset": [[["boat, water vehicle", 13.4], ["vehicle", 11.04], ["hum", 10.01]], [["music", 42.28], ["speech", 21.19], ["didgeridoo", 6.46]], null, [["music", 32.29], ["field recording", 9.05], ["speech", 7.38]], [["noise", 15.63], ["music", 9.99], ["didgeridoo", 5.52]]], "duration": [2.07, 3.71, 30.57, 5.12, 6.74]} \ No newline at end of file diff --git a/annotations_1/7HEi1kmCzEY_filtered.json b/annotations_1/7HEi1kmCzEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8e979f2aab2c37d774cfc88397e03fa83de155a --- /dev/null +++ b/annotations_1/7HEi1kmCzEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.7], [14.0, 15.31], [16.0, 17.61], [19.0, 19.47], [22.0, 23.82], [24.0, 25.57], [27.0, 30.74], [34.0, 34.94], [47.0, 47.7], [49.0, 49.45], [50.0, 50.9], [52.0, 53.15], [53.0, 55.14], [56.0, 56.66], [57.0, 60.39], [62.0, 62.92], [69.0, 71.07], [72.0, 77.21], [77.0, 77.57], [80.0, 81.33], [97.0, 97.36], [98.0, 99.5], [102.0, 105.21], [106.0, 107.43], [108.0, 109.24], [115.0, 115.72], [118.0, 118.3], [120.0, 120.88], [123.0, 126.06], [127.0, 135.23], [136.0, 139.85], [141.0, 147.9], [149.0, 151.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.05, 0.0, 0.0, 0.0, 0.0, 0.0, 51.66, 0.0, 62.27, 0.0, 63.53, 46.5, 0.0, 0.0, 0.0, 0.0, 43.15, 0.0, 0.0, 0.0, 0.0, 0.0, 89.9, 93.29, 46.09, 95.37, 49.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.49], ["music", 11.98], ["didgeridoo", 7.0]], null, null, null, null, [["gong", 35.01], ["music", 18.06], ["singing bowl", 15.42]], null, null, null, null, null, null, null, [["speech", 41.76], ["music", 10.6], ["chirp tone", 5.34]], null, [["music", 23.34], ["speech", 20.01], ["hum", 11.05]]], "duration": [0.7, 1.31, 1.61, 0.47, 1.82, 1.57, 3.74, 0.94, 0.7, 0.45, 0.9, 1.15, 2.14, 0.66, 3.39, 0.92, 2.07, 5.21, 0.57, 1.33, 0.36, 1.5, 3.21, 1.43, 1.24, 0.72, 0.3, 0.88, 3.06, 8.23, 3.85, 6.9, 2.36]} \ No newline at end of file diff --git a/annotations_1/7HWfwLBqSQ4_filtered.json b/annotations_1/7HWfwLBqSQ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed642574e32e871dac484d0b386c389f978210ba --- /dev/null +++ b/annotations_1/7HWfwLBqSQ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 29.76], [31.0, 33.18]], "keep_status": [false, false], "silence_prob": [54.36, 59.24], "audiomae_on_audioset": [null, null], "duration": [13.76, 2.18]} \ No newline at end of file diff --git a/annotations_1/7HlSKPTYZhs_filtered.json b/annotations_1/7HlSKPTYZhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ae2c84d7be615f0dce8a8d1955c20ee1ded349b --- /dev/null +++ b/annotations_1/7HlSKPTYZhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 34.18], [36.0, 36.96], [38.0, 39.72], [41.0, 41.1], [43.0, 45.27], [50.0, 51.58], [53.0, 54.75], [58.0, 60.0], [61.0, 72.12], [76.0, 82.36], [83.0, 93.51], [94.0, 95.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [66.03, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 100.0, 97.54, 100.0, 98.01, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.18, 0.96, 1.72, 0.1, 2.27, 1.58, 1.75, 2.0, 11.12, 6.36, 10.51, 1.2]} \ No newline at end of file diff --git a/annotations_1/7I6z51iYFg8_filtered.json b/annotations_1/7I6z51iYFg8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c82189ad051da179ef5f760768039bffe3968f0 --- /dev/null +++ b/annotations_1/7I6z51iYFg8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.09], [5.0, 6.76], [10.0, 10.72], [13.0, 13.61], [20.0, 19.99], [40.0, 40.34], [43.0, 42.92], [47.0, 47.44], [48.0, 49.22], [52.0, 53.94], [66.0, 67.37], [71.0, 75.73], [92.0, 99.71], [101.0, 100.74], [102.0, 101.97], [104.0, 106.07], [108.0, 117.09], [118.0, 119.15], [121.0, 121.37], [124.0, 125.51], [127.0, 128.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.09, 33.46, 0.0, 0.0, 44.46, 60.05, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.89], ["explosion", 6.72], ["burst, pop", 4.88]], [["speech", 34.75], ["music", 14.74], ["gunshot, gunfire", 10.25]], null, null, [["music", 50.04], ["hum", 7.76], ["didgeridoo", 7.75]], null, null, null, null, null], "duration": [1.09, 1.76, 0.72, 0.61, -0.01, 0.34, -0.08, 0.44, 1.22, 1.94, 1.37, 4.73, 7.71, -0.26, -0.03, 2.07, 9.09, 1.15, 0.37, 1.51, 1.11]} \ No newline at end of file diff --git a/annotations_1/7KF4iJzBVWM_filtered.json b/annotations_1/7KF4iJzBVWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..111ca6de72cdc135a9e38677b6cd51a985e7f734 --- /dev/null +++ b/annotations_1/7KF4iJzBVWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.96], [14.0, 19.7], [40.0, 41.0], [43.0, 43.46], [44.0, 49.64], [50.0, 76.52], [78.0, 79.0], [82.0, 82.09], [85.0, 85.45], [88.0, 96.23], [97.0, 102.79], [106.0, 107.01], [108.0, 108.01], [108.0, 109.32], [110.0, 110.51], [114.0, 114.69]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 33.12, 0.0, 0.0, 47.82, 33.39, 0.0, 0.0, 0.0, 30.51, 58.55, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 44.43], ["fart", 28.78], ["creak", 3.35]], null, null, [["music", 41.43], ["hum", 9.01], ["theremin", 8.77]], [["mains hum", 38.08], ["music", 20.89], ["hum", 11.2]], null, null, null, [["cattle, bovinae", 25.48], ["moo", 23.72], ["livestock, farm animals, working animals", 18.83]], null, null, null, null, null, null], "duration": [1.96, 5.7, 1.0, 0.46, 5.64, 26.52, 1.0, 0.09, 0.45, 8.23, 5.79, 1.01, 0.01, 1.32, 0.51, 0.69]} \ No newline at end of file diff --git a/annotations_1/7LraDj4Pjgk_filtered.json b/annotations_1/7LraDj4Pjgk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ec38ebe52db8ae04c10ca9d96cb659f74ac482b --- /dev/null +++ b/annotations_1/7LraDj4Pjgk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.21], [10.0, 16.19], [19.0, 19.7], [21.0, 21.79], [23.0, 33.45], [34.0, 35.38], [37.0, 41.55], [43.0, 45.27], [47.0, 47.83], [53.0, 53.22], [55.0, 55.14], [60.0, 60.05], [62.0, 62.43], [63.0, 64.76], [66.0, 66.55], [67.0, 71.29], [72.0, 72.39], [76.0, 78.44], [79.0, 81.75], [82.0, 87.24], [88.0, 89.6], [94.0, 94.24], [95.0, 113.93], [114.0, 117.95], [118.0, 141.24], [142.0, 144.59], [146.0, 155.07], [157.0, 160.61], [162.0, 164.07], [166.0, 166.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [78.04, 85.54, 0.0, 0.0, 78.55, 0.0, 82.07, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 73.36, 56.18, 66.51, 0.0, 0.0, 68.41, 67.38, 61.47, 96.04, 96.89, 95.37, 84.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.21, 6.19, 0.7, 0.79, 10.45, 1.38, 4.55, 2.27, 0.83, 0.22, 0.14, 0.05, 0.43, 1.76, 0.55, 4.29, 0.39, 2.44, 2.75, 5.24, 1.6, 0.24, 18.93, 3.95, 23.24, 2.59, 9.07, 3.61, 2.07, 0.58]} \ No newline at end of file diff --git a/annotations_1/7LxG9WBUbf8_filtered.json b/annotations_1/7LxG9WBUbf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b90850a99f0e903cce32bcd85fc1f751ea0aef4 --- /dev/null +++ b/annotations_1/7LxG9WBUbf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.2], [12.0, 15.58], [16.0, 19.63], [23.0, 29.44], [31.0, 31.94], [33.0, 37.17], [38.0, 39.77], [40.0, 56.69], [57.0, 66.38], [68.0, 72.69], [73.0, 84.15], [85.0, 88.91], [90.0, 91.54], [93.0, 96.31], [102.0, 106.05], [107.0, 111.62], [112.0, 121.69], [123.0, 123.65], [128.0, 129.78], [131.0, 144.32], [145.0, 148.88], [150.0, 153.54], [155.0, 155.7], [163.0, 164.32], [166.0, 170.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [71.57, 71.87, 53.72, 75.55, 0.0, 55.6, 0.0, 71.0, 54.04, 71.14, 83.34, 88.46, 0.0, 58.05, 53.78, 54.3, 48.56, 0.0, 0.0, 41.28, 45.3, 51.6, 0.0, 0.0, 50.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.6], ["hum", 18.1], ["music", 12.39]], null, null, [["music", 40.7], ["hum", 17.23], ["ambient music", 13.87]], [["music", 35.48], ["hum", 21.62], ["ambient music", 11.18]], null, null, null, null], "duration": [2.2, 3.58, 3.63, 6.44, 0.94, 4.17, 1.77, 16.69, 9.38, 4.69, 11.15, 3.91, 1.54, 3.31, 4.05, 4.62, 9.69, 0.65, 1.78, 13.32, 3.88, 3.54, 0.7, 1.32, 4.72]} \ No newline at end of file diff --git a/annotations_1/7ML-9r4M_qk_filtered.json b/annotations_1/7ML-9r4M_qk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d47a876fd517d1801a7f490245f018bdc954053 --- /dev/null +++ b/annotations_1/7ML-9r4M_qk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.93], [15.0, 17.36], [25.0, 26.3], [29.0, 33.24], [34.0, 34.43], [35.0, 37.86], [40.0, 46.85]], "keep_status": [false, false, false, true, false, true, false], "silence_prob": [0.0, 31.48, 0.0, 38.6, 0.0, 29.79, 29.23], "audiomae_on_audioset": [null, [["music", 41.36], ["speech", 28.69], ["trance music", 4.49]], null, [["music", 33.38], ["speech", 12.98], ["electronic music", 8.07]], null, [["moo", 32.41], ["cattle, bovinae", 19.02], ["speech", 9.13]], [["music", 61.36], ["electronic music", 4.34], ["beatboxing", 4.32]]], "duration": [0.93, 2.36, 1.3, 4.24, 0.43, 2.86, 6.85]} \ No newline at end of file diff --git a/annotations_1/7MWts8-_LUo_filtered.json b/annotations_1/7MWts8-_LUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c2aac67049fe501ed0dcd149fc734a8250e0e33 --- /dev/null +++ b/annotations_1/7MWts8-_LUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.67], [10.0, 46.67], [49.0, 54.45], [59.0, 59.97], [66.0, 66.18], [67.0, 67.78], [68.0, 69.5], [79.0, 80.86], [84.0, 87.1], [88.0, 90.36], [94.0, 94.2], [101.0, 103.99], [110.0, 111.86], [119.0, 119.01], [127.0, 127.87]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.6, 0.0, 0.0, 0.0, 0.0, 0.0, 45.78, 87.0, 0.0, 99.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["arrow", 13.8], ["fly, housefly", 13.27], ["insect", 9.85]], null, null, null, null, null, null], "duration": [1.67, 36.67, 5.45, 0.97, 0.18, 0.78, 1.5, 1.86, 3.1, 2.36, 0.2, 2.99, 1.86, 0.01, 0.87]} \ No newline at end of file diff --git a/annotations_1/7OIn2KFDWjM_filtered.json b/annotations_1/7OIn2KFDWjM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef21e9d3c70e8f51a78b52cd820558653e91f6c7 --- /dev/null +++ b/annotations_1/7OIn2KFDWjM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 18.44], [20.0, 23.14], [33.0, 39.68], [47.0, 47.61], [56.0, 58.02], [64.0, 76.72], [84.0, 91.03], [95.0, 100.38]], "keep_status": [true, false, false, false, true, true, false, true], "silence_prob": [45.3, 40.77, 38.93, 0.0, 39.25, 38.88, 37.57, 37.57], "audiomae_on_audioset": [[["music", 46.74], ["boing", 7.14], ["didgeridoo", 2.76]], [["music", 79.17], ["didgeridoo", 3.86], ["musical instrument", 2.8]], [["music", 75.8], ["musical instrument", 3.35], ["swing music", 2.13]], null, [["music", 64.52], ["musical instrument", 2.14], ["speech", 1.57]], [["music", 50.63], ["musical instrument", 5.15], ["speech", 4.92]], [["music", 73.12], ["musical instrument", 3.21], ["singing", 2.37]], [["music", 42.04], ["speech", 9.06], ["musical instrument", 8.39]]], "duration": [13.44, 3.14, 6.68, 0.61, 2.02, 12.72, 7.03, 5.38]} \ No newline at end of file diff --git a/annotations_1/7PI0v2ZWDl0_filtered.json b/annotations_1/7PI0v2ZWDl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..875b6c418a322a1692d835a29b4de36283c280db --- /dev/null +++ b/annotations_1/7PI0v2ZWDl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.87], [6.0, 6.59], [12.0, 12.01], [14.0, 13.9], [16.0, 16.41], [18.0, 18.44], [21.0, 21.46], [24.0, 24.46], [26.0, 29.13], [30.0, 31.53], [33.0, 33.62], [34.0, 35.43], [36.0, 37.42], [39.0, 40.22], [41.0, 41.77], [42.0, 43.48], [47.0, 48.71], [50.0, 52.1], [55.0, 56.4], [61.0, 62.75], [64.0, 67.68], [68.0, 70.23], [72.0, 72.77], [76.0, 76.47], [79.0, 80.84], [81.0, 82.44], [89.0, 88.6], [91.0, 91.02], [93.0, 96.6], [97.0, 97.93], [100.0, 100.62], [104.0, 104.48], [116.0, 116.31], [123.0, 123.09], [125.0, 126.82], [128.0, 129.9], [132.0, 132.04], [138.0, 138.06], [143.0, 143.19], [144.0, 145.0], [147.0, 146.87], [150.0, 151.24], [153.0, 153.87], [159.0, 160.0], [161.0, 161.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 99.56, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 0.59, 0.01, -0.1, 0.41, 0.44, 0.46, 0.46, 3.13, 1.53, 0.62, 1.43, 1.42, 1.22, 0.77, 1.48, 1.71, 2.1, 1.4, 1.75, 3.68, 2.23, 0.77, 0.47, 1.84, 1.44, -0.4, 0.02, 3.6, 0.93, 0.62, 0.48, 0.31, 0.09, 1.82, 1.9, 0.04, 0.06, 0.19, 1.0, -0.13, 1.24, 0.87, 1.0, 0.65]} \ No newline at end of file diff --git a/annotations_1/7R9gbSQenqg_filtered.json b/annotations_1/7R9gbSQenqg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aac6cfa70e863b9420f3704b0ba9bfbd47bf0c2b --- /dev/null +++ b/annotations_1/7R9gbSQenqg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.87], [12.0, 13.59], [18.0, 19.4], [25.0, 25.2], [30.0, 32.29], [33.0, 33.32], [35.0, 36.26], [39.0, 40.54], [41.0, 42.4], [44.0, 49.59], [52.0, 57.91], [59.0, 61.3], [62.0, 72.28], [75.0, 77.26], [79.0, 99.64], [103.0, 104.4]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, true, true, true, false, false], "silence_prob": [33.44, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 0.0, 0.0, 29.79, 30.3, 43.43, 29.3, 49.4, 30.76, 0.0], "audiomae_on_audioset": [[["music", 29.28], ["hum", 10.88], ["mains hum", 5.31]], null, null, null, null, null, null, null, null, [["hum", 31.06], ["mains hum", 25.0], ["music", 18.5]], [["electric shaver, electric razor", 19.02], ["music", 18.7], ["mains hum", 12.4]], [["music", 44.53], ["theremin", 22.32], ["electronic music", 3.06]], [["music", 58.24], ["sound effect", 4.19], ["hum", 3.84]], [["speech", 38.0], ["music", 15.47], ["rumble", 7.64]], [["hum", 40.25], ["music", 19.08], ["mains hum", 11.57]], null], "duration": [7.87, 1.59, 1.4, 0.2, 2.29, 0.32, 1.26, 1.54, 1.4, 5.59, 5.91, 2.3, 10.28, 2.26, 20.64, 1.4]} \ No newline at end of file diff --git a/annotations_1/7RBqyBb-MlU_filtered.json b/annotations_1/7RBqyBb-MlU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ace0b74aa9783e1a395f9a82f27f56e35a624d95 --- /dev/null +++ b/annotations_1/7RBqyBb-MlU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.28], [32.0, 32.36], [50.0, 50.35], [53.0, 54.58], [59.0, 59.26], [60.0, 60.94], [62.0, 66.33], [68.0, 67.95], [75.0, 75.54], [79.0, 81.13], [82.0, 84.38], [85.0, 88.25], [89.0, 90.93], [91.0, 93.45], [94.0, 96.8], [98.0, 100.38], [103.0, 102.88], [111.0, 111.2]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.04, 0.0, 0.0, 81.89, 99.1, 70.44, 0.0, 53.22, 35.77, 33.75, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["noise", 18.94], ["hum", 18.36], ["buzz", 13.97]], null, null, null, null, null, null, null, [["moo", 27.25], ["cattle, bovinae", 26.5], ["livestock, farm animals, working animals", 13.59]], [["speech", 41.71], ["radio", 21.73], ["moo", 6.16]], null, null], "duration": [1.28, 0.36, 0.35, 1.58, 0.26, 0.94, 4.33, -0.05, 0.54, 2.13, 2.38, 3.25, 1.93, 2.45, 2.8, 2.38, -0.12, 0.2]} \ No newline at end of file diff --git a/annotations_1/7RJnMME0XAw_filtered.json b/annotations_1/7RJnMME0XAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4219cce7dd97149fcef22b6b42db349a33295f0 --- /dev/null +++ b/annotations_1/7RJnMME0XAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.77], [6.0, 6.39], [9.0, 12.18], [15.0, 14.67], [19.0, 20.24], [21.0, 24.68], [27.0, 26.94], [29.0, 29.81], [30.0, 37.0], [42.0, 41.99], [43.0, 43.66], [45.0, 46.03], [51.0, 51.31], [56.0, 56.49], [57.0, 56.54], [57.0, 56.62], [57.0, 57.7], [59.0, 59.07], [59.0, 59.12], [59.0, 59.16], [59.0, 59.19], [59.0, 60.94], [62.0, 65.67], [66.0, 68.0], [70.0, 73.7], [76.0, 76.17], [77.0, 81.04], [82.0, 84.37], [89.0, 91.3], [93.0, 94.68], [96.0, 96.28], [98.0, 98.88], [100.0, 101.09], [102.0, 102.91], [105.0, 108.7], [110.0, 110.83], [113.0, 113.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 82.07, 0.0, 0.0, 89.72, 0.0, 0.0, 50.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.8, 99.99, 92.8, 0.0, 99.96, 71.29, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.23, 0.39, 3.18, -0.33, 1.24, 3.68, -0.06, 0.81, 7.0, -0.01, 0.66, 1.03, 0.31, 0.49, -0.46, -0.38, 0.7, 0.07, 0.12, 0.16, 0.19, 1.94, 3.67, 2.0, 3.7, 0.17, 4.04, 2.37, 2.3, 1.68, 0.28, 0.88, 1.09, 0.91, 3.7, 0.83, 0.91]} \ No newline at end of file diff --git a/annotations_1/7RSJehegfZw_filtered.json b/annotations_1/7RSJehegfZw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70fa2c74b8e05d35c45d81fae788ab894e7de793 --- /dev/null +++ b/annotations_1/7RSJehegfZw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 30.96], [31.0, 32.54], [33.0, 49.57]], "keep_status": [true, false, true], "silence_prob": [28.41, 0.0, 28.51], "audiomae_on_audioset": [[["hum", 19.04], ["music", 18.49], ["speech", 14.9]], null, [["animal", 19.24], ["music", 13.38], ["speech", 10.26]]], "duration": [5.96, 1.54, 16.57]} \ No newline at end of file diff --git a/annotations_1/7S2ffMUk7iI_filtered.json b/annotations_1/7S2ffMUk7iI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1224f81f22ba4c6ff5fae856108b9cfba0e3128a --- /dev/null +++ b/annotations_1/7S2ffMUk7iI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [7.0, 8.55], [10.0, 10.88], [13.0, 13.73], [16.0, 16.04], [19.0, 22.06], [35.0, 35.16], [37.0, 41.03], [42.0, 42.69], [46.0, 46.9], [58.0, 58.19], [61.0, 61.89], [63.0, 65.03], [67.0, 67.91], [69.0, 70.65], [73.0, 73.25], [74.0, 75.17], [76.0, 81.04], [82.0, 90.29], [93.0, 94.2], [96.0, 96.94], [102.0, 103.28], [105.0, 105.51], [118.0, 124.97], [128.0, 128.53], [131.0, 133.15], [144.0, 144.02], [145.0, 147.93], [153.0, 153.6], [156.0, 155.82], [160.0, 160.59], [163.0, 163.95]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 49.04, 0.0, 54.63, 0.0, 0.0, 0.0, 0.0, 50.46, 0.0, 0.0, 0.0, 0.0, 49.45, 41.62, 0.0, 0.0, 0.0, 0.0, 34.53, 0.0, 74.44, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 46.64], ["synthesizer", 7.6], ["hum", 5.54]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.68], ["music", 21.28], ["theremin", 4.83]], [["noise", 57.38], ["music", 25.22], ["fart", 2.68]], null, null, null, null, [["music", 25.52], ["effects unit", 11.39], ["fly, housefly", 5.59]], null, null, null, null, null, null, null, null], "duration": [0.36, 1.55, 0.88, 0.73, 0.04, 3.06, 0.16, 4.03, 0.69, 0.9, 0.19, 0.89, 2.03, 0.91, 1.65, 0.25, 1.17, 5.04, 8.29, 1.2, 0.94, 1.28, 0.51, 6.97, 0.53, 2.15, 0.02, 2.93, 0.6, -0.18, 0.59, 0.95]} \ No newline at end of file diff --git a/annotations_1/7S3biRDwbAc_filtered.json b/annotations_1/7S3biRDwbAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d346c721d0afcd1d958f4db0d2205e04abc660ec --- /dev/null +++ b/annotations_1/7S3biRDwbAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.37], [3.0, 7.57], [8.0, 9.29], [11.0, 12.21], [14.0, 14.84], [15.0, 16.8], [18.0, 23.55], [25.0, 28.58], [32.0, 33.15], [35.0, 35.16], [37.0, 38.67], [42.0, 43.09], [47.0, 48.73], [55.0, 57.69], [59.0, 59.97], [61.0, 62.38], [64.0, 101.66], [105.0, 112.68], [114.0, 157.94], [160.0, 163.36], [165.0, 166.51]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 72.75, 0.0, 0.0, 0.0, 0.0, 67.0, 49.22, 0.0, 0.0, 0.0, 0.0, 0.0, 45.62, 0.0, 0.0, 0.0, 29.53, 0.0, 29.1, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["mains hum", 31.31], ["hum", 18.97], ["music", 10.56]], null, null, null, null, null, [["music", 22.08], ["speech", 12.03], ["hum", 7.9]], null, null, null, [["hum", 36.82], ["mains hum", 29.43], ["music", 11.55]], null, [["music", 44.75], ["mains hum", 5.35], ["hum", 5.24]], null], "duration": [0.37, 4.57, 1.29, 1.21, 0.84, 1.8, 5.55, 3.58, 1.15, 0.16, 1.67, 1.09, 1.73, 2.69, 0.97, 1.38, 37.66, 7.68, 43.94, 3.36, 1.51]} \ No newline at end of file diff --git a/annotations_1/7SZcDW_1o8g_filtered.json b/annotations_1/7SZcDW_1o8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d637a2628c4c312f336a1229e6d1c74aa765814 --- /dev/null +++ b/annotations_1/7SZcDW_1o8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.37], [3.0, 5.75], [8.0, 8.48], [11.0, 11.57], [14.0, 16.65], [18.0, 18.82], [22.0, 23.13], [26.0, 26.33], [27.0, 28.0], [30.0, 31.51], [37.0, 39.07], [40.0, 42.35], [45.0, 47.04], [48.0, 49.2], [51.0, 52.93], [55.0, 56.39], [57.0, 65.92], [70.0, 70.11], [71.0, 82.29], [84.0, 91.4], [92.0, 93.97], [96.0, 98.41], [99.0, 101.16], [104.0, 105.33], [112.0, 112.72], [116.0, 121.04], [124.0, 128.22], [129.0, 130.76], [136.0, 140.48], [143.0, 142.72], [143.0, 142.84], [144.0, 145.72], [150.0, 149.61], [150.0, 155.85], [158.0, 158.73], [165.0, 169.01], [170.0, 172.52], [176.0, 177.45], [179.0, 180.0], [181.0, 183.71], [185.0, 186.66], [187.0, 188.43], [189.0, 196.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 91.64, 0.0, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 100.0, 100.0, 0.0, 0.0, 0.0, 99.88, 0.0, 73.82, 100.0, 0.0, 100.0, 62.47, 0.0, 0.0, 41.81, 82.07, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 41.24, 0.0, 82.61, 99.95, 0.0, 0.0, 49.68, 0.0, 0.0, 57.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.19], ["sidetone", 7.81], ["music", 7.18]], null, null, null, null, null, null, null, [["speech", 79.29], ["sidetone", 2.77], ["busy signal", 2.23]], null, null, null, null, null, [["speech", 71.24], ["dial tone", 17.52], ["sine wave", 2.87]], null, null, null], "duration": [0.37, 2.75, 0.48, 0.57, 2.65, 0.82, 1.13, 0.33, 1.0, 1.51, 2.07, 2.35, 2.04, 1.2, 1.93, 1.39, 8.92, 0.11, 11.29, 7.4, 1.97, 2.41, 2.16, 1.33, 0.72, 5.04, 4.22, 1.76, 4.48, -0.28, -0.16, 1.72, -0.39, 5.85, 0.73, 4.01, 2.52, 1.45, 1.0, 2.71, 1.66, 1.43, 7.77]} \ No newline at end of file diff --git a/annotations_1/7SojZ1TuMsk_filtered.json b/annotations_1/7SojZ1TuMsk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aca1e5f5ae41a8434271cf4d5b9e59d7cfe868e --- /dev/null +++ b/annotations_1/7SojZ1TuMsk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.08], [4.0, 4.19], [5.0, 5.51], [7.0, 18.3], [20.0, 22.69], [23.0, 22.74], [23.0, 23.48], [24.0, 72.32], [74.0, 143.87], [144.0, 201.58], [207.0, 220.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.64, 32.77, 0.0, 0.0, 0.0, 0.0, 0.0, 33.73], "audiomae_on_audioset": [null, null, null, [["music", 55.14], ["speech", 13.92], ["breaking", 9.0]], [["speech", 38.96], ["music", 23.79], ["boing", 9.44]], null, null, null, null, null, [["hum", 52.8], ["music", 18.69], ["throbbing", 15.76]]], "duration": [0.08, 0.19, 0.51, 11.3, 2.69, -0.26, 0.48, 48.32, 69.87, 57.58, 13.14]} \ No newline at end of file diff --git a/annotations_1/7T5KMMZfc_U_filtered.json b/annotations_1/7T5KMMZfc_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f8c758528d0895ea9d1163cde9d752e0cde85ac --- /dev/null +++ b/annotations_1/7T5KMMZfc_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.22], [7.0, 7.4], [8.0, 9.14], [19.0, 18.96], [26.0, 26.54], [29.0, 29.27], [33.0, 33.44], [34.0, 35.33], [37.0, 38.18], [39.0, 42.13], [51.0, 51.14], [54.0, 56.76], [62.0, 63.68], [66.0, 65.77], [69.0, 69.96], [71.0, 71.58], [80.0, 83.0], [91.0, 91.96], [103.0, 104.3], [105.0, 105.63], [108.0, 109.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.47, 0.0, 49.54, 0.0, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 47.7], ["hum", 4.06], ["synthesizer", 3.9]], null, null, null, null, null, null, null, null, null], "duration": [1.22, 0.4, 1.14, -0.04, 0.54, 0.27, 0.44, 1.33, 1.18, 3.13, 0.14, 2.76, 1.68, -0.23, 0.96, 0.58, 3.0, 0.96, 1.3, 0.63, 1.88]} \ No newline at end of file diff --git a/annotations_1/7URRIBRCm8E_filtered.json b/annotations_1/7URRIBRCm8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd9d34db8887d6f60b31b4f9f3837c25c0aaa6d1 --- /dev/null +++ b/annotations_1/7URRIBRCm8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.77], [24.0, 24.6], [25.0, 28.51], [30.0, 63.8], [73.0, 76.42], [78.0, 78.6], [80.0, 82.22], [97.0, 98.1], [100.0, 100.43], [104.0, 104.85], [105.0, 109.44], [116.0, 117.49], [122.0, 128.19], [131.0, 136.83]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [31.19, 0.0, 94.37, 0.0, 34.28, 0.0, 37.47, 0.0, 0.0, 0.0, 35.26, 0.0, 30.28, 32.34], "audiomae_on_audioset": [[["howl", 22.45], ["whack, thwack", 7.64], ["thump, thud", 6.59]], null, null, null, [["music", 41.65], ["musical instrument", 9.73], ["speech", 9.23]], null, [["music", 66.65], ["musical instrument", 7.52], ["guitar", 6.46]], null, null, null, [["music", 72.75], ["speech", 5.52], ["bass guitar", 3.52]], null, [["music", 30.68], ["speech", 24.5], ["thunk", 12.18]], [["speech", 40.4], ["music", 36.48], ["thunk", 6.28]]], "duration": [3.77, 0.6, 3.51, 33.8, 3.42, 0.6, 2.22, 1.1, 0.43, 0.85, 4.44, 1.49, 6.19, 5.83]} \ No newline at end of file diff --git a/annotations_1/7UnKOlleCCw_filtered.json b/annotations_1/7UnKOlleCCw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54d13ffeb519a45ef7575d7dd82326bc58f01fa9 --- /dev/null +++ b/annotations_1/7UnKOlleCCw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.32], [2.0, 3.75], [4.0, 3.94], [4.0, 12.18], [15.0, 21.14], [23.0, 25.44], [28.0, 68.55], [69.0, 77.65], [79.0, 91.35], [92.0, 106.84], [109.0, 111.75], [113.0, 112.97], [118.0, 123.84]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.94, 96.04, 98.27, 0.0, 97.33, 84.07, 41.5, 100.0, 0.0, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 39.84], ["music", 12.5], ["gong", 9.04]], null, null, null], "duration": [0.32, 1.75, -0.06, 8.18, 6.14, 2.44, 40.55, 8.65, 12.35, 14.84, 2.75, -0.03, 5.84]} \ No newline at end of file diff --git a/annotations_1/7VOpGn2RTP4_filtered.json b/annotations_1/7VOpGn2RTP4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffc0a1e5356659e0484cef90750b67823aab88c0 --- /dev/null +++ b/annotations_1/7VOpGn2RTP4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.74], [20.0, 27.19], [30.0, 35.02], [46.0, 48.32], [51.0, 53.81], [60.0, 62.14], [71.0, 78.78], [95.0, 96.35], [98.0, 98.19], [101.0, 103.11], [125.0, 129.79], [145.0, 156.22], [159.0, 164.08]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 29.78, 30.27, 40.81, 31.74, 31.34, 30.76, 0.0, 0.0, 31.32, 29.44, 30.09, 30.2], "audiomae_on_audioset": [null, [["music", 62.19], ["didgeridoo", 6.25], ["music of latin america", 3.19]], [["music", 84.59], ["male singing", 1.52], ["synthetic singing", 1.04]], [["music", 48.16], ["guitar", 11.81], ["musical instrument", 10.54]], [["music", 61.62], ["synthesizer", 5.84], ["sampler", 4.84]], [["music", 40.01], ["music of latin america", 10.91], ["musical instrument", 9.19]], [["music", 73.17], ["boing", 11.87], ["music of latin america", 1.89]], null, null, [["music", 68.91], ["theremin", 4.32], ["musical instrument", 4.02]], [["music", 42.12], ["foghorn", 7.7], ["carnatic music", 5.67]], [["music", 85.43], ["singing", 3.32], ["song", 1.79]], [["music", 87.13], ["singing", 0.87], ["male singing", 0.63]]], "duration": [0.74, 7.19, 5.02, 2.32, 2.81, 2.14, 7.78, 1.35, 0.19, 2.11, 4.79, 11.22, 5.08]} \ No newline at end of file diff --git a/annotations_1/7WkMxJKKITM_filtered.json b/annotations_1/7WkMxJKKITM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..562777c96ef6bd954e3a5bed75540fa62e563938 --- /dev/null +++ b/annotations_1/7WkMxJKKITM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.82], [13.0, 16.23], [24.0, 55.58], [61.0, 61.53], [63.0, 64.52], [67.0, 73.45], [75.0, 75.86], [77.0, 77.63], [79.0, 79.0], [81.0, 88.6], [89.0, 89.8], [93.0, 94.22], [102.0, 107.57], [141.0, 143.21], [149.0, 149.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.21, 0.0, 0.0, 0.0, 34.41, 0.0, 0.0, 0.0, 38.36, 0.0, 0.0, 34.04, 30.33, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 56.13], ["beatboxing", 10.67], ["thunk", 5.81]], null, null, null, [["speech", 82.72], ["music", 3.14], ["synthesizer", 1.29]], null, null, [["speech", 77.91], ["fart", 4.89], ["boing", 2.6]], [["speech", 80.2], ["radio", 6.51], ["inside, small room", 2.25]], null], "duration": [0.82, 3.23, 31.58, 0.53, 1.52, 6.45, 0.86, 0.63, 0.0, 7.6, 0.8, 1.22, 5.57, 2.21, 0.32]} \ No newline at end of file diff --git a/annotations_1/7Wyjo_hrIbM_filtered.json b/annotations_1/7Wyjo_hrIbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38fc5ecc3c60d27d5c639ec895dbe5e72a7d8df3 --- /dev/null +++ b/annotations_1/7Wyjo_hrIbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.16], [24.0, 30.16], [32.0, 38.72], [41.0, 40.86], [44.0, 44.2], [45.0, 45.35], [46.0, 46.99], [48.0, 48.41], [50.0, 52.71], [54.0, 57.38], [63.0, 63.86], [65.0, 80.32], [84.0, 91.88], [101.0, 101.43], [105.0, 105.73], [107.0, 114.54], [116.0, 116.21], [121.0, 154.87]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.58, 29.68, 0.0, 0.0, 0.0, 0.0, 0.0, 29.32, 30.19, 0.0, 29.4, 29.59, 0.0, 0.0, 30.53, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 82.47], ["electronic music", 2.58], ["techno", 1.85]], [["music", 72.79], ["electronic music", 4.46], ["drum machine", 1.82]], null, null, null, null, null, [["music", 75.31], ["speech", 4.39], ["electronic music", 1.89]], [["music", 38.48], ["speech", 18.3], ["radio", 12.75]], null, [["music", 58.66], ["speech", 18.29], ["throbbing", 5.14]], [["throbbing", 33.25], ["hum", 28.57], ["music", 15.35]], null, null, [["music", 85.48], ["didgeridoo", 6.08], ["musical instrument", 3.09]], null, null], "duration": [0.16, 6.16, 6.72, -0.14, 0.2, 0.35, 0.99, 0.41, 2.71, 3.38, 0.86, 15.32, 7.88, 0.43, 0.73, 7.54, 0.21, 33.87]} \ No newline at end of file diff --git a/annotations_1/7XBizI9jArU_filtered.json b/annotations_1/7XBizI9jArU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..824897a7b33550b3a97af475533a92a65a86b66f --- /dev/null +++ b/annotations_1/7XBizI9jArU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 35.65], [43.0, 46.77], [48.0, 52.42], [69.0, 71.02], [75.0, 76.5], [78.0, 78.53], [83.0, 84.45], [85.0, 84.59], [85.0, 84.96], [86.0, 86.78], [102.0, 102.74], [104.0, 117.14], [125.0, 130.25], [140.0, 145.54], [156.0, 161.82], [167.0, 214.24], [216.0, 219.82]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.7, 41.14, 29.76, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.91, 29.95, 29.75, 29.53, 0.0, 37.18], "audiomae_on_audioset": [[["music", 24.19], ["breaking", 14.5], ["sidetone", 7.45]], [["music", 31.87], ["speech", 11.53], ["synthesizer", 3.75]], [["music", 45.91], ["speech", 24.14], ["hum", 4.67]], null, null, null, null, null, null, null, null, [["music", 82.1], ["boing", 7.6], ["speech", 2.32]], [["music", 84.53], ["speech", 4.9], ["boing", 2.24]], [["music", 82.2], ["rattle (instrument)", 6.61], ["didgeridoo", 1.64]], [["music", 82.49], ["didgeridoo", 3.5], ["speech", 1.99]], null, [["chirp tone", 34.72], ["speech", 23.5], ["sine wave", 20.7]]], "duration": [16.65, 3.77, 4.42, 2.02, 1.5, 0.53, 1.45, -0.41, -0.04, 0.78, 0.74, 13.14, 5.25, 5.54, 5.82, 47.24, 3.82]} \ No newline at end of file diff --git a/annotations_1/7XaThsXXj_M_filtered.json b/annotations_1/7XaThsXXj_M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a6c168759c50fcce16c4e3d7713f854e63aa1cb8 --- /dev/null +++ b/annotations_1/7XaThsXXj_M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[62.0, 62.19], [65.0, 68.2], [69.0, 123.53], [126.0, 126.74], [127.0, 132.12], [132.0, 137.51], [139.0, 146.8], [148.0, 148.15], [149.0, 149.81], [151.0, 151.5], [152.0, 152.37], [157.0, 157.71], [159.0, 160.14], [161.0, 162.68], [164.0, 170.19]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.5, 0.0, 0.0, 34.44, 33.66, 37.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.67], "audiomae_on_audioset": [null, [["mains hum", 43.69], ["hum", 29.41], ["throbbing", 5.52]], null, null, [["cattle, bovinae", 46.39], ["livestock, farm animals, working animals", 28.24], ["moo", 17.79]], [["music", 29.07], ["hum", 9.1], ["thunk", 8.38]], [["music", 49.84], ["speech", 20.1], ["hum", 3.07]], null, null, null, null, null, null, null, [["hum", 33.41], ["music", 23.38], ["throbbing", 21.86]]], "duration": [0.19, 3.2, 54.53, 0.74, 5.12, 5.51, 7.8, 0.15, 0.81, 0.5, 0.37, 0.71, 1.14, 1.68, 6.19]} \ No newline at end of file diff --git a/annotations_1/7ZEqMqBLOOI_filtered.json b/annotations_1/7ZEqMqBLOOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d50a31e135208dd4a596918d81b749a250b600d --- /dev/null +++ b/annotations_1/7ZEqMqBLOOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 81.55], [82.0, 83.12], [85.0, 84.67], [85.0, 84.7], [85.0, 84.74], [85.0, 85.62], [86.0, 85.72], [86.0, 85.78], [86.0, 87.3], [90.0, 91.15], [95.0, 98.24], [100.0, 101.98], [103.0, 113.51], [116.0, 125.73], [127.0, 134.7], [135.0, 135.72], [137.0, 138.7], [140.0, 139.7], [140.0, 146.75], [147.0, 150.36], [151.0, 152.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 92.97, 99.98, 99.4, 0.0, 0.0, 0.0, 95.51, 99.48, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.55, 1.12, -0.33, -0.3, -0.26, 0.62, -0.28, -0.22, 1.3, 1.15, 3.24, 1.98, 10.51, 9.73, 7.7, 0.72, 1.7, -0.3, 6.75, 3.36, 1.25]} \ No newline at end of file diff --git a/annotations_1/7ZUVMim8ebM_filtered.json b/annotations_1/7ZUVMim8ebM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb9e1250791cb185585e4c284057050a772d8567 --- /dev/null +++ b/annotations_1/7ZUVMim8ebM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.9], [7.0, 34.57], [35.0, 35.65], [38.0, 38.31], [38.0, 38.65], [39.0, 40.47], [42.0, 71.49], [72.0, 73.28], [74.0, 74.93], [76.0, 76.91], [80.0, 85.94], [88.0, 90.09], [91.0, 94.07], [95.0, 96.28], [97.0, 98.49], [106.0, 109.59], [115.0, 115.77], [117.0, 118.74], [119.0, 121.14], [122.0, 122.69], [124.0, 124.73], [126.0, 127.99], [131.0, 131.4], [133.0, 133.24], [136.0, 140.54], [141.0, 144.17], [144.0, 152.51]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.58, 0.0, 0.0, 0.0, 0.0, 36.3, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 100.0, 99.05], "audiomae_on_audioset": [null, [["mains hum", 32.66], ["hum", 30.77], ["thunk", 8.66]], null, null, null, null, [["whale vocalization", 37.2], ["music", 14.99], ["hum", 6.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.9, 27.57, 0.65, 0.31, 0.65, 1.47, 29.49, 1.28, 0.93, 0.91, 5.94, 2.09, 3.07, 1.28, 1.49, 3.59, 0.77, 1.74, 2.14, 0.69, 0.73, 1.99, 0.4, 0.24, 4.54, 3.17, 8.51]} \ No newline at end of file diff --git a/annotations_1/7ZzaLI6n1pU_filtered.json b/annotations_1/7ZzaLI6n1pU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0297b6908d0a3ff25eb5d6f60fb6d4cd944c419f --- /dev/null +++ b/annotations_1/7ZzaLI6n1pU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.95], [27.0, 28.29], [32.0, 32.46], [34.0, 35.02], [37.0, 37.03], [37.0, 39.12], [42.0, 46.18], [47.0, 50.7], [51.0, 51.65], [88.0, 90.9], [93.0, 94.71], [124.0, 127.84], [130.0, 133.08], [134.0, 135.77], [139.0, 140.32], [141.0, 142.57], [145.0, 144.71], [146.0, 148.1], [149.0, 151.65], [153.0, 154.57], [156.0, 155.9], [157.0, 157.64], [161.0, 161.35]], "keep_status": [true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [30.29, 0.0, 0.0, 0.0, 0.0, 30.43, 44.52, 32.88, 0.0, 30.38, 0.0, 63.85, 52.05, 0.0, 0.0, 0.0, 0.0, 38.09, 36.73, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 18.94], ["throbbing", 17.79], ["echo", 6.46]], null, null, null, null, [["speech", 56.59], ["explosion", 9.92], ["burst, pop", 5.99]], [["noise", 19.71], ["hum", 15.79], ["eruption", 9.66]], [["livestock, farm animals, working animals", 66.72], ["cattle, bovinae", 18.36], ["moo", 8.4]], null, [["wild animals", 33.22], ["roaring cats (lions, tigers)", 12.87], ["animal", 10.6]], null, null, null, null, null, null, null, [["speech", 17.23], ["music", 11.26], ["hum", 7.48]], [["hum", 35.08], ["mains hum", 33.2], ["music", 11.92]], null, null, null, null], "duration": [2.95, 1.29, 0.46, 1.02, 0.03, 2.12, 4.18, 3.7, 0.65, 2.9, 1.71, 3.84, 3.08, 1.77, 1.32, 1.57, -0.29, 2.1, 2.65, 1.57, -0.1, 0.64, 0.35]} \ No newline at end of file diff --git a/annotations_1/7a3vbSR4qWU_filtered.json b/annotations_1/7a3vbSR4qWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6871f924f495e95208a7d225c16562686b6aaf50 --- /dev/null +++ b/annotations_1/7a3vbSR4qWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.85], [7.0, 16.53], [17.0, 20.17], [23.0, 44.71], [47.0, 62.63]], "keep_status": [false, true, true, false, true], "silence_prob": [0.0, 36.45, 34.98, 33.07, 32.78], "audiomae_on_audioset": [null, [["music", 38.14], ["brass instrument", 16.27], ["musical instrument", 10.15]], [["music", 45.84], ["didgeridoo", 11.94], ["brass instrument", 4.61]], [["music", 54.19], ["trombone", 15.09], ["brass instrument", 9.41]], [["music", 39.7], ["speech", 16.04], ["brass instrument", 6.49]]], "duration": [0.85, 9.53, 3.17, 21.71, 15.63]} \ No newline at end of file diff --git a/annotations_1/7aYOGUPabd8_filtered.json b/annotations_1/7aYOGUPabd8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95aa3e175fd575e97b75af8545f58ea88892d934 --- /dev/null +++ b/annotations_1/7aYOGUPabd8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.51], [23.0, 35.77], [42.0, 50.3], [57.0, 103.71], [106.0, 118.89], [127.0, 164.74], [171.0, 173.16], [174.0, 175.81]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [0.0, 33.09, 36.61, 0.0, 31.55, 0.0, 99.26, 0.0], "audiomae_on_audioset": [null, [["music", 78.08], ["singing", 1.71], ["static", 1.23]], [["sound effect", 17.9], ["animal", 13.34], ["grunt", 9.85]], null, [["music", 78.88], ["afrobeat", 2.06], ["reggae", 1.82]], null, null, null], "duration": [0.51, 12.77, 8.3, 46.71, 12.89, 37.74, 2.16, 1.81]} \ No newline at end of file diff --git a/annotations_1/7bCca1RYtao_filtered.json b/annotations_1/7bCca1RYtao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88c5d869e093309162899f1f2a1e7edbb30ff972 --- /dev/null +++ b/annotations_1/7bCca1RYtao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 31.7], [37.0, 102.15], [108.0, 112.92], [115.0, 117.76], [120.0, 123.43], [127.0, 137.94]], "keep_status": [true, false, true, true, true, false], "silence_prob": [31.29, 0.0, 35.46, 36.2, 35.03, 30.87], "audiomae_on_audioset": [[["music", 31.19], ["musical instrument", 11.15], ["cacophony", 7.92]], null, [["music", 21.18], ["speech", 14.37], ["fly, housefly", 10.8]], [["didgeridoo", 21.73], ["music", 16.76], ["sidetone", 14.86]], [["music", 40.85], ["theremin", 9.14], ["bowed string instrument", 8.4]], [["theremin", 84.23], ["music", 11.1], ["didgeridoo", 1.59]]], "duration": [11.7, 65.15, 4.92, 2.76, 3.43, 10.94]} \ No newline at end of file diff --git a/annotations_1/7bCqTdKJPFo_filtered.json b/annotations_1/7bCqTdKJPFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a60f9999d6a4dea42ba92388947f3ab58a1c21f --- /dev/null +++ b/annotations_1/7bCqTdKJPFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.21], [3.0, 3.0], [5.0, 7.4], [10.0, 12.63], [13.0, 13.96], [16.0, 16.41], [20.0, 21.76], [24.0, 26.67], [28.0, 28.75], [31.0, 31.83], [33.0, 33.81], [36.0, 35.65], [36.0, 35.75], [37.0, 37.3], [39.0, 40.46], [42.0, 43.61], [45.0, 45.23], [46.0, 47.8], [49.0, 49.98], [51.0, 53.23], [54.0, 54.73], [56.0, 57.27], [62.0, 62.58], [64.0, 65.94], [68.0, 68.99], [71.0, 71.47], [73.0, 73.04], [74.0, 76.28], [80.0, 81.63], [85.0, 85.9], [88.0, 88.57], [90.0, 91.67], [94.0, 94.51], [95.0, 97.33], [98.0, 100.13], [103.0, 103.82], [106.0, 107.69], [109.0, 109.11], [111.0, 111.55], [115.0, 116.63], [119.0, 120.61], [122.0, 123.4], [125.0, 126.69], [128.0, 130.6], [132.0, 133.15], [134.0, 135.92], [138.0, 140.53], [142.0, 144.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 0.0, 0.0, 98.86, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.21, 0.0, 2.4, 2.63, 0.96, 0.41, 1.76, 2.67, 0.75, 0.83, 0.81, -0.35, -0.25, 0.3, 1.46, 1.61, 0.23, 1.8, 0.98, 2.23, 0.73, 1.27, 0.58, 1.94, 0.99, 0.47, 0.04, 2.28, 1.63, 0.9, 0.57, 1.67, 0.51, 2.33, 2.13, 0.82, 1.69, 0.11, 0.55, 1.63, 1.61, 1.4, 1.69, 2.6, 1.15, 1.92, 2.53, 2.63]} \ No newline at end of file diff --git a/annotations_1/7bFIUJ_voCs_filtered.json b/annotations_1/7bFIUJ_voCs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e269290168e56e6d100871be5e9ce90ce28eb63 --- /dev/null +++ b/annotations_1/7bFIUJ_voCs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 20.73], [26.0, 28.9], [32.0, 39.23], [41.0, 45.74], [47.0, 47.61], [48.0, 48.52], [51.0, 61.06], [61.0, 63.41], [65.0, 70.51], [84.0, 89.9], [98.0, 101.36], [118.0, 118.02]], "keep_status": [true, true, false, true, false, false, false, true, true, false, true, false], "silence_prob": [32.35, 30.37, 30.63, 30.42, 0.0, 0.0, 30.76, 29.88, 30.76, 31.48, 36.15, 0.0], "audiomae_on_audioset": [[["music", 32.91], ["bow-wow", 11.75], ["dog", 9.74]], [["music", 48.21], ["musical instrument", 11.68], ["theremin", 8.2]], [["music", 37.64], ["throbbing", 28.94], ["hum", 12.43]], [["music", 34.06], ["speech", 13.7], ["theremin", 4.95]], null, null, [["music", 61.46], ["speech", 18.02], ["musical instrument", 1.28]], [["music", 39.92], ["speech", 4.83], ["cattle, bovinae", 4.74]], [["music", 54.48], ["didgeridoo", 6.33], ["throbbing", 5.34]], [["music", 61.93], ["musical instrument", 6.01], ["didgeridoo", 4.75]], [["speech", 44.67], ["livestock, farm animals, working animals", 8.35], ["boing", 8.1]], null], "duration": [15.73, 2.9, 7.23, 4.74, 0.61, 0.52, 10.06, 2.41, 5.51, 5.9, 3.36, 0.02]} \ No newline at end of file diff --git a/annotations_1/7cZ3I9Bn9Rg_filtered.json b/annotations_1/7cZ3I9Bn9Rg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c9cb47ba0e86fd2378a46c27774d77a75e955c5 --- /dev/null +++ b/annotations_1/7cZ3I9Bn9Rg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 23.82], [25.0, 25.14], [32.0, 43.58], [44.0, 48.22], [50.0, 70.65], [75.0, 76.13], [77.0, 82.0], [83.0, 84.05], [86.0, 91.13], [93.0, 96.01], [98.0, 105.19], [108.0, 108.41], [109.0, 109.71], [112.0, 118.44], [122.0, 122.52], [125.0, 125.32], [126.0, 127.4], [131.0, 131.4]], "keep_status": [true, false, false, false, false, false, true, false, true, false, true, false, false, true, false, false, false, false], "silence_prob": [29.77, 0.0, 30.76, 33.54, 30.68, 0.0, 38.8, 0.0, 37.38, 51.77, 33.49, 0.0, 0.0, 31.51, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 14.65], ["livestock, farm animals, working animals", 14.16], ["cattle, bovinae", 10.83]], null, [["music", 48.34], ["speech", 12.58], ["animal", 9.35]], [["music", 58.85], ["hum", 15.67], ["mains hum", 5.09]], [["music", 43.49], ["speech", 25.92], ["hum", 8.06]], null, [["hum", 27.04], ["music", 26.36], ["throbbing", 9.23]], null, [["hum", 22.28], ["mains hum", 17.05], ["livestock, farm animals, working animals", 15.7]], null, [["music", 43.24], ["explosion", 7.03], ["static", 4.6]], null, null, [["speech", 46.43], ["music", 15.15], ["hum", 5.54]], null, null, null, null], "duration": [7.82, 0.14, 11.58, 4.22, 20.65, 1.13, 5.0, 1.05, 5.13, 3.01, 7.19, 0.41, 0.71, 6.44, 0.52, 0.32, 1.4, 0.4]} \ No newline at end of file diff --git a/annotations_1/7dgOcvrxxac_filtered.json b/annotations_1/7dgOcvrxxac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a453321434da8cba18d59be0724146113b0484a3 --- /dev/null +++ b/annotations_1/7dgOcvrxxac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.29], [7.0, 7.64], [10.0, 11.75], [14.0, 14.52], [17.0, 17.25], [19.0, 19.75], [25.0, 25.07], [26.0, 35.77], [45.0, 46.41], [47.0, 48.07], [60.0, 60.35], [62.0, 62.13], [63.0, 63.76], [71.0, 71.52], [75.0, 75.34], [78.0, 78.78], [83.0, 84.1], [86.0, 85.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["theremin", 72.46], ["music", 19.83], ["musical instrument", 1.82]], null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 0.64, 1.75, 0.52, 0.25, 0.75, 0.07, 9.77, 1.41, 1.07, 0.35, 0.13, 0.76, 0.52, 0.34, 0.78, 1.1, -0.06]} \ No newline at end of file diff --git a/annotations_1/7doKgPFilPg_filtered.json b/annotations_1/7doKgPFilPg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5e6f09cbb9279e768b33de18357cfbdc89c2bee --- /dev/null +++ b/annotations_1/7doKgPFilPg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.85], [6.0, 6.1], [16.0, 16.87], [18.0, 18.72], [20.0, 21.29], [22.0, 23.26], [30.0, 75.88], [80.0, 86.73], [87.0, 162.73], [163.0, 168.4], [172.0, 178.8], [181.0, 181.36], [185.0, 184.72], [186.0, 186.12], [188.0, 188.57]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.69, 0.0, 34.12, 38.71, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 67.09], ["didgeridoo", 23.6], ["musical instrument", 2.61]], null, [["speech", 40.69], ["whale vocalization", 11.61], ["music", 5.07]], [["music", 50.96], ["fly, housefly", 10.35], ["insect", 6.13]], null, null, null, null], "duration": [1.85, 0.1, 0.87, 0.72, 1.29, 1.26, 45.88, 6.73, 75.73, 5.4, 6.8, 0.36, -0.28, 0.12, 0.57]} \ No newline at end of file diff --git a/annotations_1/7dtQiqaxf_o_filtered.json b/annotations_1/7dtQiqaxf_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9fee103512b8f653a6160bf8cf1822201e07624 --- /dev/null +++ b/annotations_1/7dtQiqaxf_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.63], [13.0, 23.48], [24.0, 23.82], [25.0, 38.04], [38.0, 39.36], [44.0, 44.73], [45.0, 46.97], [48.0, 49.79], [50.0, 53.45], [54.0, 54.01], [54.0, 54.97], [58.0, 59.34], [61.0, 73.2], [75.0, 74.85], [77.0, 98.95]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [30.04, 59.24, 0.0, 39.55, 0.0, 0.0, 0.0, 0.0, 37.91, 0.0, 0.0, 0.0, 34.96, 0.0, 32.61], "audiomae_on_audioset": [[["fart", 27.48], ["music", 20.32], ["grunt", 18.24]], null, null, [["music", 21.24], ["fly, housefly", 20.58], ["insect", 13.42]], null, null, null, null, [["sidetone", 61.07], ["speech", 9.53], ["hum", 4.49]], null, null, null, [["music", 37.97], ["speech", 35.15], ["breaking", 11.7]], null, [["music", 23.72], ["hum", 20.02], ["mains hum", 12.88]]], "duration": [8.63, 10.48, -0.18, 13.04, 1.36, 0.73, 1.97, 1.79, 3.45, 0.01, 0.97, 1.34, 12.2, -0.15, 21.95]} \ No newline at end of file diff --git a/annotations_1/7ezYV1mOdh0_filtered.json b/annotations_1/7ezYV1mOdh0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e8523b0eef807f8440fc836c7beb21a36066761 --- /dev/null +++ b/annotations_1/7ezYV1mOdh0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.57], [1.0, 9.31], [9.0, 9.44], [10.0, 19.87], [22.0, 39.72], [41.0, 52.61], [53.0, 53.15], [53.0, 74.12], [75.0, 75.0], [76.0, 77.08], [87.0, 96.03], [101.0, 104.9], [107.0, 111.84], [114.0, 129.14], [130.0, 142.64], [144.0, 165.42], [166.0, 171.95]], "keep_status": [false, true, false, true, false, true, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 29.6, 0.0, 28.74, 29.01, 30.06, 0.0, 30.0, 0.0, 0.0, 29.49, 28.5, 30.19, 28.97, 29.07, 28.68, 28.27], "audiomae_on_audioset": [null, [["speech", 48.12], ["music", 12.38], ["hum", 4.54]], null, [["explosion", 32.67], ["music", 20.7], ["burst, pop", 10.48]], [["music", 44.77], ["speech", 17.54], ["throbbing", 8.75]], [["machine gun", 35.82], ["music", 19.23], ["hum", 10.68]], null, [["music", 48.37], ["smash, crash", 15.82], ["breaking", 8.9]], null, null, [["music", 33.6], ["throbbing", 25.26], ["hum", 23.02]], [["speech", 46.69], ["vehicle", 22.54], ["car", 7.38]], [["music", 44.88], ["throbbing", 24.19], ["hum", 10.65]], [["music", 34.71], ["speech", 15.46], ["explosion", 9.16]], [["music", 51.69], ["hum", 19.62], ["throbbing", 12.58]], [["music", 66.75], ["throbbing", 5.58], ["electronic music", 4.58]], [["mains hum", 40.43], ["hum", 19.79], ["music", 7.45]]], "duration": [0.57, 8.31, 0.44, 9.87, 17.72, 11.61, 0.15, 21.12, 0.0, 1.08, 9.03, 3.9, 4.84, 15.14, 12.64, 21.42, 5.95]} \ No newline at end of file diff --git a/annotations_1/7fduMinwJZ8_filtered.json b/annotations_1/7fduMinwJZ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4f81f3a73ae7f1f78d088da1f67f086a2d49d08 --- /dev/null +++ b/annotations_1/7fduMinwJZ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [12.0, 11.72], [22.0, 23.57], [24.0, 29.05], [62.0, 62.99], [73.0, 73.48], [85.0, 86.02], [99.0, 99.05], [114.0, 114.79], [115.0, 115.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 46.35], ["speech", 22.15], ["didgeridoo", 5.17]], null, null, null, null, null, null], "duration": [0.35, -0.28, 1.57, 5.05, 0.99, 0.48, 1.02, 0.05, 0.79, 0.26]} \ No newline at end of file diff --git a/annotations_1/7g5k1qwVLjw_filtered.json b/annotations_1/7g5k1qwVLjw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fac35d7d523dd83e1e5e1f5a4f86b797904895c --- /dev/null +++ b/annotations_1/7g5k1qwVLjw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 20.28], [28.0, 28.22], [34.0, 34.06], [34.0, 41.62], [46.0, 50.77], [63.0, 65.42], [69.0, 69.5], [75.0, 75.1], [80.0, 81.99], [90.0, 90.46], [92.0, 92.48], [96.0, 96.11], [97.0, 98.09], [100.0, 105.53], [106.0, 116.58], [120.0, 120.99], [125.0, 125.52]], "keep_status": [true, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.72, 0.0, 0.0, 41.78, 45.33, 44.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.41, 100.0, 0.0, 0.0], "audiomae_on_audioset": [[["animal", 20.53], ["speech", 10.89], ["dog", 9.51]], null, null, [["speech", 29.02], ["music", 26.19], ["knock", 5.21]], [["bleat", 10.72], ["sheep", 9.84], ["music", 9.32]], [["speech", 19.03], ["sheep", 12.95], ["crying, sobbing", 11.45]], null, null, null, null, null, null, null, [["speech", 61.97], ["screaming", 8.92], ["groan", 2.75]], null, null, null], "duration": [11.28, 0.22, 0.06, 7.62, 4.77, 2.42, 0.5, 0.1, 1.99, 0.46, 0.48, 0.11, 1.09, 5.53, 10.58, 0.99, 0.52]} \ No newline at end of file diff --git a/annotations_1/7h-q7bXYD1c_filtered.json b/annotations_1/7h-q7bXYD1c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96deee59b5ecf7c1ce8b991764ca711ba2a59904 --- /dev/null +++ b/annotations_1/7h-q7bXYD1c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.45], [28.0, 30.1], [34.0, 57.32], [62.0, 84.74], [89.0, 94.81], [103.0, 104.09], [124.0, 126.99], [145.0, 145.5], [147.0, 161.97], [166.0, 179.04]], "keep_status": [false, true, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 35.88, 31.91, 34.68, 31.83, 0.0, 32.31, 0.0, 31.33, 33.64], "audiomae_on_audioset": [null, [["whale vocalization", 23.56], ["frog", 16.77], ["mosquito", 8.87]], [["music", 42.16], ["throbbing", 20.26], ["buzz", 8.8]], [["music", 54.16], ["didgeridoo", 20.2], ["musical instrument", 3.73]], [["livestock, farm animals, working animals", 35.95], ["cattle, bovinae", 20.06], ["moo", 15.47]], null, [["speech", 32.59], ["sidetone", 14.26], ["music", 9.03]], null, [["speech", 50.96], ["music", 20.13], ["vehicle", 1.83]], [["music", 42.42], ["groan", 14.66], ["speech", 8.08]]], "duration": [0.45, 2.1, 23.32, 22.74, 5.81, 1.09, 2.99, 0.5, 14.97, 13.04]} \ No newline at end of file diff --git a/annotations_1/7hacgmRbdMM_filtered.json b/annotations_1/7hacgmRbdMM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0927bbf6cf977670690ef3deb717f2bafe429ff9 --- /dev/null +++ b/annotations_1/7hacgmRbdMM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.55], [2.0, 2.52], [7.0, 8.94], [10.0, 10.64], [16.0, 16.7], [21.0, 22.27], [27.0, 27.45], [28.0, 32.29], [33.0, 34.15], [38.0, 39.21], [43.0, 43.17], [45.0, 45.17], [52.0, 51.78], [60.0, 60.08], [61.0, 61.33], [67.0, 72.82], [74.0, 74.55], [75.0, 75.36], [76.0, 77.3], [80.0, 84.3], [86.0, 87.29], [90.0, 91.0], [91.0, 91.56], [93.0, 93.68], [95.0, 101.83], [104.0, 108.57], [109.0, 108.94], [109.0, 115.59], [117.0, 118.52], [122.0, 123.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 96.42, 99.56, 0.0, 99.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 0.52, 1.94, 0.64, 0.7, 1.27, 0.45, 4.29, 1.15, 1.21, 0.17, 0.17, -0.22, 0.08, 0.33, 5.82, 0.55, 0.36, 1.3, 4.3, 1.29, 1.0, 0.56, 0.68, 6.83, 4.57, -0.06, 6.59, 1.52, 1.5]} \ No newline at end of file diff --git a/annotations_1/7iajsLA5MKM_filtered.json b/annotations_1/7iajsLA5MKM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..222575d48fedf87b628fe116cdb7ecf30ba648b1 --- /dev/null +++ b/annotations_1/7iajsLA5MKM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.74], [19.0, 22.33], [24.0, 24.61], [41.0, 41.54], [42.0, 42.65], [55.0, 82.14], [129.0, 129.64]], "keep_status": [false, true, false, false, false, true, false], "silence_prob": [0.0, 35.25, 0.0, 0.0, 0.0, 28.93, 0.0], "audiomae_on_audioset": [null, [["music", 28.91], ["fly, housefly", 22.45], ["mosquito", 10.62]], null, null, null, [["music", 46.81], ["speech", 10.21], ["cattle, bovinae", 7.06]], null], "duration": [0.74, 3.33, 0.61, 0.54, 0.65, 27.14, 0.64]} \ No newline at end of file diff --git a/annotations_1/7jz_uA1dv9w_filtered.json b/annotations_1/7jz_uA1dv9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ee864af1fddb4780a4653936f168d79a496a768 --- /dev/null +++ b/annotations_1/7jz_uA1dv9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 21.09], [33.0, 43.33], [46.0, 61.28], [64.0, 72.27], [78.0, 90.95], [107.0, 147.45], [149.0, 153.62]], "keep_status": [false, true, true, false, true, false, false], "silence_prob": [73.82, 28.44, 28.75, 28.55, 29.24, 0.0, 28.8], "audiomae_on_audioset": [null, [["speech", 27.5], ["whack, thwack", 7.62], ["vehicle", 5.37]], [["animal", 15.33], ["speech", 12.61], ["vehicle", 10.05]], [["speech", 48.18], ["music", 11.53], ["machine gun", 10.91]], [["machine gun", 23.38], ["speech", 23.11], ["music", 15.98]], null, [["speech", 70.19], ["vehicle", 5.84], ["hubbub, speech noise, speech babble", 4.39]]], "duration": [13.09, 10.33, 15.28, 8.27, 12.95, 40.45, 4.62]} \ No newline at end of file diff --git a/annotations_1/7l79p5apaqQ_filtered.json b/annotations_1/7l79p5apaqQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7525f211fff402c0718de074fe77cbc5f67f2d9c --- /dev/null +++ b/annotations_1/7l79p5apaqQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.89], [6.0, 8.68], [12.0, 17.95], [21.0, 23.89], [25.0, 46.65], [49.0, 50.09], [51.0, 54.24], [56.0, 59.86], [60.0, 70.82], [71.0, 89.5], [93.0, 103.0], [110.0, 111.2], [112.0, 117.64], [118.0, 120.5], [121.0, 124.9], [129.0, 130.32], [132.0, 134.32], [138.0, 140.64], [142.0, 148.8], [151.0, 154.26], [155.0, 161.11], [162.0, 162.11]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 60.98, 77.87, 45.27, 40.66, 0.0, 47.39, 90.95, 49.92, 45.59, 33.15, 0.0, 36.72, 38.9, 62.47, 0.0, 94.07, 95.64, 76.86, 98.44, 86.09, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 35.04], ["didgeridoo", 16.89], ["singing bowl", 8.23]], [["music", 36.09], ["hum", 27.14], ["throbbing", 8.63]], null, [["coin (dropping)", 86.82], ["telephone", 1.75], ["cash register", 1.75]], null, [["fly, housefly", 22.04], ["mosquito", 14.31], ["speech", 11.84]], [["speech", 41.4], ["electric shaver, electric razor", 20.0], ["buzz", 10.74]], [["livestock, farm animals, working animals", 46.58], ["cattle, bovinae", 13.99], ["moo", 11.73]], null, [["speech", 42.39], ["music", 12.39], ["noise", 7.6]], [["speech", 70.82], ["hum", 4.61], ["male speech, man speaking", 3.01]], null, null, null, null, null, null, null, null], "duration": [0.89, 2.68, 5.95, 2.89, 21.65, 1.09, 3.24, 3.86, 10.82, 18.5, 10.0, 1.2, 5.64, 2.5, 3.9, 1.32, 2.32, 2.64, 6.8, 3.26, 6.11, 0.11]} \ No newline at end of file diff --git a/annotations_1/7mm8aQCp_oc_filtered.json b/annotations_1/7mm8aQCp_oc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfb9c8104aabe7daeae2b310ddba77d21d895c01 --- /dev/null +++ b/annotations_1/7mm8aQCp_oc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.46], [14.0, 13.88], [20.0, 22.67], [24.0, 26.86], [30.0, 38.62], [39.0, 38.7], [39.0, 72.06], [75.0, 82.12], [83.0, 83.79], [85.0, 85.21], [86.0, 86.1], [94.0, 95.07], [95.0, 95.81], [96.0, 96.74], [98.0, 98.58], [99.0, 98.98], [99.0, 105.44], [106.0, 106.86], [107.0, 107.69], [108.0, 108.53], [109.0, 110.05]], "keep_status": [true, false, true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.67, 0.0, 30.07, 30.83, 29.78, 0.0, 0.0, 29.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.41, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 54.69], ["speech", 7.66], ["electronic music", 4.02]], null, [["buzz", 18.04], ["speech", 17.21], ["frog", 15.68]], [["electric shaver, electric razor", 78.47], ["speech", 9.54], ["buzz", 2.46]], [["music", 28.66], ["buzz", 16.7], ["speech", 10.44]], null, null, [["throbbing", 23.27], ["music", 16.21], ["hum", 16.07]], null, null, null, null, null, null, null, null, [["hum", 42.88], ["mains hum", 36.45], ["throbbing", 11.32]], null, null, null, null], "duration": [7.46, -0.12, 2.67, 2.86, 8.62, -0.3, 33.06, 7.12, 0.79, 0.21, 0.1, 1.07, 0.81, 0.74, 0.58, -0.02, 6.44, 0.86, 0.69, 0.53, 1.05]} \ No newline at end of file diff --git a/annotations_1/7nWfsF7ThLw_filtered.json b/annotations_1/7nWfsF7ThLw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dba9f8beb3c890b34ad1b5840e5f580c4ed73f53 --- /dev/null +++ b/annotations_1/7nWfsF7ThLw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 66.5], [69.0, 81.3], [86.0, 123.03]], "keep_status": [true, true, false], "silence_prob": [37.78, 33.12, 0.0], "audiomae_on_audioset": [[["music", 36.07], ["synthesizer", 19.7], ["hum", 9.72]], [["music", 31.31], ["musical instrument", 9.63], ["guitar", 8.19]], null], "duration": [9.5, 12.3, 37.03]} \ No newline at end of file diff --git a/annotations_1/7oDSPSwMw5k_filtered.json b/annotations_1/7oDSPSwMw5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bfae7808653e18229b0ae6a8fc1ef5e3577ddd1 --- /dev/null +++ b/annotations_1/7oDSPSwMw5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 64.27]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [48.27]} \ No newline at end of file diff --git a/annotations_1/7oczRhQvSlE_filtered.json b/annotations_1/7oczRhQvSlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7157acd63864ead205a8fcd3ccc5787ed22c5b3c --- /dev/null +++ b/annotations_1/7oczRhQvSlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.67], [10.0, 10.54], [12.0, 22.94], [24.0, 27.94], [29.0, 33.98], [35.0, 34.97], [39.0, 38.87], [39.0, 39.11], [57.0, 60.27], [61.0, 61.75], [63.0, 64.93], [66.0, 68.72], [70.0, 71.32], [72.0, 72.37], [73.0, 74.22], [76.0, 81.9], [83.0, 82.97], [84.0, 84.75], [85.0, 86.32], [89.0, 91.57], [95.0, 96.23], [100.0, 103.2], [104.0, 105.34], [109.0, 111.69], [112.0, 121.59], [123.0, 123.52], [125.0, 125.17]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.11, 30.82, 52.86, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 94.07, 0.0, 0.0, 0.0, 77.36, 0.0, 80.11, 0.0, 95.78, 44.32, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 50.85], ["hum", 21.89], ["mains hum", 8.51]], [["music", 57.7], ["electronic music", 5.19], ["soundtrack music", 2.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.57], ["speech", 21.87], ["theremin", 7.0]], null, null], "duration": [0.67, 0.54, 10.94, 3.94, 4.98, -0.03, -0.13, 0.11, 3.27, 0.75, 1.93, 2.72, 1.32, 0.37, 1.22, 5.9, -0.03, 0.75, 1.32, 2.57, 1.23, 3.2, 1.34, 2.69, 9.59, 0.52, 0.17]} \ No newline at end of file diff --git a/annotations_1/7oi0cS5tNRg_filtered.json b/annotations_1/7oi0cS5tNRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..343a9bad90e968ff163888a864821acf59d14a88 --- /dev/null +++ b/annotations_1/7oi0cS5tNRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.36], [10.0, 10.61], [11.0, 11.53], [15.0, 19.35], [20.0, 19.63], [20.0, 19.68], [20.0, 20.56], [23.0, 23.14], [26.0, 26.45], [27.0, 30.2], [33.0, 33.54], [35.0, 34.91], [44.0, 43.9], [46.0, 46.4], [47.0, 48.19], [49.0, 49.49], [53.0, 54.24], [55.0, 56.0], [56.0, 59.48], [61.0, 61.67], [63.0, 63.53], [65.0, 66.12], [78.0, 78.83], [85.0, 85.13], [90.0, 90.98], [95.0, 95.86], [100.0, 108.09], [125.0, 124.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.22, 0.0, 0.0, 0.0, 0.0, 0.0, 41.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 84.55], ["sidetone", 5.54], ["boing", 2.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.61, 0.53, 4.35, -0.37, -0.32, 0.56, 0.14, 0.45, 3.2, 0.54, -0.09, -0.1, 0.4, 1.19, 0.49, 1.24, 1.0, 3.48, 0.67, 0.53, 1.12, 0.83, 0.13, 0.98, 0.86, 8.09, -0.18]} \ No newline at end of file diff --git a/annotations_1/7oqRCOYvOS4_filtered.json b/annotations_1/7oqRCOYvOS4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe2d915e8c95cc6a712b38410a53229b12a93a76 --- /dev/null +++ b/annotations_1/7oqRCOYvOS4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.39], [14.0, 20.16], [21.0, 23.03], [24.0, 25.24], [25.0, 30.64], [31.0, 35.21], [36.0, 43.09], [44.0, 46.47], [48.0, 48.61], [50.0, 51.17], [53.0, 55.46], [56.0, 58.08], [60.0, 65.33], [66.0, 67.8], [71.0, 71.85], [74.0, 75.39], [77.0, 78.48], [79.0, 80.87]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 48.02, 100.0, 0.0, 98.93, 98.59, 98.01, 99.84, 0.0, 0.0, 99.97, 99.85, 79.07, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 14.55], ["thunk", 12.71], ["bouncing", 10.89]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 6.16, 2.03, 1.24, 5.64, 4.21, 7.09, 2.47, 0.61, 1.17, 2.46, 2.08, 5.33, 1.8, 0.85, 1.39, 1.48, 1.87]} \ No newline at end of file diff --git a/annotations_1/7p0J9wVGwZ0_filtered.json b/annotations_1/7p0J9wVGwZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7529eb8b66487c73005874e04d5d6e6ceb1b9893 --- /dev/null +++ b/annotations_1/7p0J9wVGwZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 30.55], [32.0, 33.99], [37.0, 37.05], [37.0, 37.54], [39.0, 40.56], [41.0, 48.79], [52.0, 51.97], [57.0, 57.25], [58.0, 59.02], [59.0, 59.98], [80.0, 81.87], [83.0, 84.03], [86.0, 94.59], [97.0, 97.11], [102.0, 102.42], [103.0, 103.69], [105.0, 105.6], [106.0, 107.23], [109.0, 111.81], [114.0, 114.35]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [32.55, 0.0, 0.0, 0.0, 0.0, 29.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.36, 0.0, 0.0, 0.0, 0.0, 0.0, 29.26, 0.0], "audiomae_on_audioset": [[["music", 19.82], ["speech", 18.73], ["keyboard (musical)", 10.93]], null, null, null, null, [["music", 71.48], ["trombone", 2.57], ["brass instrument", 2.43]], null, null, null, null, null, null, [["music", 29.94], ["speech", 27.35], ["whack, thwack", 9.07]], null, null, null, null, null, [["speech", 24.82], ["fart", 21.85], ["music", 14.51]], null], "duration": [15.55, 1.99, 0.05, 0.54, 1.56, 7.79, -0.03, 0.25, 1.02, 0.98, 1.87, 1.03, 8.59, 0.11, 0.42, 0.69, 0.6, 1.23, 2.81, 0.35]} \ No newline at end of file diff --git a/annotations_1/7qhNVDPZ-0I_filtered.json b/annotations_1/7qhNVDPZ-0I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..315b1c7d5e566f3bc88f79c5da90210cde8adb0f --- /dev/null +++ b/annotations_1/7qhNVDPZ-0I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.1], [16.0, 16.77], [18.0, 18.27], [23.0, 23.21], [28.0, 29.56], [31.0, 32.49], [36.0, 35.73], [44.0, 46.72], [49.0, 50.5], [52.0, 52.51], [55.0, 57.72], [58.0, 60.78], [61.0, 62.99], [65.0, 68.57], [69.0, 71.98], [73.0, 75.25], [79.0, 80.69], [82.0, 83.74], [85.0, 86.66], [88.0, 91.71], [93.0, 95.22], [97.0, 113.68], [116.0, 138.15], [140.0, 145.64], [147.0, 149.27], [152.0, 157.82], [159.0, 160.81], [162.0, 162.63], [163.0, 163.48], [164.0, 164.86], [165.0, 167.17], [172.0, 173.99], [175.0, 177.13], [184.0, 185.04], [186.0, 187.14], [188.0, 198.12], [200.0, 200.74], [202.0, 202.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 0.0, 0.0, 91.64, 42.46, 0.0, 75.39, 73.82, 53.53, 0.0, 0.0, 0.0, 60.23, 48.65, 54.5, 55.25, 52.56, 53.4, 40.36, 0.0, 0.0, 0.0, 0.0, 33.43, 0.0, 33.06, 0.0, 0.0, 29.12, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.36], ["music", 10.76], ["whale vocalization", 2.91]], null, null, null, null, null, null, null, null, [["music", 46.53], ["whale vocalization", 9.53], ["musical instrument", 7.27]], null, null, null, null, [["music", 18.05], ["speech", 11.02], ["animal", 10.68]], null, null, null, null, [["livestock, farm animals, working animals", 37.27], ["cowbell", 32.69], ["cattle, bovinae", 11.89]], null, [["hum", 27.01], ["mains hum", 18.06], ["music", 14.44]], null, null, [["buzzer", 64.14], ["speech", 7.54], ["buzz", 6.4]], null, null], "duration": [2.1, 0.77, 0.27, 0.21, 1.56, 1.49, -0.27, 2.72, 1.5, 0.51, 2.72, 2.78, 1.99, 3.57, 2.98, 2.25, 1.69, 1.74, 1.66, 3.71, 2.22, 16.68, 22.15, 5.64, 2.27, 5.82, 1.81, 0.63, 0.48, 0.86, 2.17, 1.99, 2.13, 1.04, 1.14, 10.12, 0.74, 0.56]} \ No newline at end of file diff --git a/annotations_1/7qi8llEviYY_filtered.json b/annotations_1/7qi8llEviYY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..641430d67a13ba7f523931343ff960060901edd7 --- /dev/null +++ b/annotations_1/7qi8llEviYY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.14], [14.0, 15.63], [21.0, 24.22], [28.0, 28.71], [32.0, 32.68], [36.0, 36.63], [39.0, 45.5], [48.0, 48.36], [49.0, 57.67], [58.0, 93.51], [94.0, 95.05], [100.0, 101.07], [103.0, 117.05], [122.0, 122.98], [123.0, 135.14], [137.0, 137.74]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 61.77, 0.0, 0.0, 0.0, 49.73, 0.0, 39.72, 0.0, 0.0, 0.0, 37.77, 0.0, 36.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 69.11], ["throbbing", 6.73], ["hum", 3.9]], null, [["music", 27.92], ["ding", 23.27], ["chink, clink", 14.0]], null, null, null, [["music", 46.45], ["speech", 15.76], ["hum", 4.81]], null, [["music", 25.79], ["speech", 20.47], ["hum", 14.74]], null], "duration": [0.14, 1.63, 3.22, 0.71, 0.68, 0.63, 6.5, 0.36, 8.67, 35.51, 1.05, 1.07, 14.05, 0.98, 12.14, 0.74]} \ No newline at end of file diff --git a/annotations_1/7rJZx_l_h1w_filtered.json b/annotations_1/7rJZx_l_h1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7667bbb59ce5d4d422adf22472cdf474f1faa3f7 --- /dev/null +++ b/annotations_1/7rJZx_l_h1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.21], [5.0, 4.92], [5.0, 6.4], [7.0, 9.54], [12.0, 13.56], [16.0, 16.85], [19.0, 19.62], [21.0, 21.78], [23.0, 25.19], [27.0, 30.42], [33.0, 33.96], [36.0, 37.67], [42.0, 42.8], [43.0, 46.2], [47.0, 47.87], [51.0, 50.84], [52.0, 52.73], [60.0, 61.05], [65.0, 75.69], [77.0, 78.92], [82.0, 82.05], [89.0, 92.91], [95.0, 95.89], [99.0, 99.23], [100.0, 102.2], [103.0, 114.81], [116.0, 129.83], [131.0, 133.57], [135.0, 150.82], [153.0, 154.85], [155.0, 158.09]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 53.53, 0.0, 0.0, 0.0, 0.0, 34.77, 98.44, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 39.18, 0.0, 0.0, 62.27, 0.0, 0.0, 62.58, 47.62, 76.7, 98.51, 38.88, 0.0, 49.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 35.26], ["speech", 13.89], ["sidetone", 7.18]], null, null, null, null, null, null, null, null, null, [["music", 41.13], ["singing bowl", 12.65], ["glockenspiel", 4.46]], null, null, null, null, null, null, [["hum", 19.77], ["music", 19.39], ["mains hum", 13.92]], null, null, [["mains hum", 32.18], ["hum", 29.2], ["music", 16.03]], null, [["music", 23.21], ["fly, housefly", 17.95], ["mosquito", 7.3]]], "duration": [0.21, -0.08, 1.4, 2.54, 1.56, 0.85, 0.62, 0.78, 2.19, 3.42, 0.96, 1.67, 0.8, 3.2, 0.87, -0.16, 0.73, 1.05, 10.69, 1.92, 0.05, 3.91, 0.89, 0.23, 2.2, 11.81, 13.83, 2.57, 15.82, 1.85, 3.09]} \ No newline at end of file diff --git a/annotations_1/7rYqBdJdnqo_filtered.json b/annotations_1/7rYqBdJdnqo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb3d432bac96bb0ed580df5ac525f795ee1d6658 --- /dev/null +++ b/annotations_1/7rYqBdJdnqo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.3], [19.0, 19.45], [21.0, 23.13], [24.0, 24.34], [26.0, 27.67], [28.0, 30.11], [30.0, 33.81], [37.0, 37.2], [38.0, 38.72], [41.0, 42.7], [43.0, 43.65], [46.0, 49.64], [52.0, 52.42], [57.0, 58.82], [61.0, 62.9], [63.0, 91.25], [92.0, 92.6], [93.0, 95.07], [97.0, 99.17], [100.0, 109.71], [110.0, 114.24], [117.0, 118.39], [119.0, 119.57], [120.0, 120.95], [123.0, 123.06], [124.0, 124.58], [125.0, 126.71], [128.0, 128.33], [129.0, 133.32], [136.0, 147.02], [148.0, 158.25], [160.0, 160.64], [161.0, 164.44], [165.0, 165.77], [167.0, 171.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, true, true, false, false, true, false, true], "silence_prob": [34.63, 0.0, 71.87, 0.0, 0.0, 51.66, 90.25, 0.0, 0.0, 0.0, 0.0, 56.33, 0.0, 0.0, 0.0, 42.86, 0.0, 38.91, 38.9, 33.29, 54.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.08, 30.23, 30.61, 0.0, 30.71, 0.0, 28.49], "audiomae_on_audioset": [[["music", 32.32], ["throbbing", 24.46], ["hum", 16.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 27.92], ["speech", 27.3], ["music", 20.87]], null, [["hum", 29.46], ["music", 17.24], ["mains hum", 9.21]], [["music", 38.23], ["hum", 9.22], ["sonar", 7.0]], [["hum", 34.14], ["single-lens reflex camera", 15.38], ["music", 13.72]], null, null, null, null, null, null, null, null, [["music", 39.21], ["speech", 12.08], ["didgeridoo", 6.81]], [["speech", 30.16], ["music", 22.07], ["hum", 14.74]], [["hum", 30.36], ["mains hum", 29.41], ["music", 16.08]], null, [["music", 30.04], ["speech", 29.29], ["didgeridoo", 3.39]], null, [["music", 46.98], ["throbbing", 7.02], ["hum", 5.72]]], "duration": [5.3, 0.45, 2.13, 0.34, 1.67, 2.11, 3.81, 0.2, 0.72, 1.7, 0.65, 3.64, 0.42, 1.82, 1.9, 28.25, 0.6, 2.07, 2.17, 9.71, 4.24, 1.39, 0.57, 0.95, 0.06, 0.58, 1.71, 0.33, 4.32, 11.02, 10.25, 0.64, 3.44, 0.77, 4.0]} \ No newline at end of file diff --git a/annotations_1/7sXlyaQ_ZHs_filtered.json b/annotations_1/7sXlyaQ_ZHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c27c2b32e99b296f6c3392910dcdd73f631448f --- /dev/null +++ b/annotations_1/7sXlyaQ_ZHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.24], [11.0, 12.85], [15.0, 16.14], [18.0, 18.82], [19.0, 20.02], [21.0, 22.18], [23.0, 24.33], [25.0, 64.3], [65.0, 96.69], [98.0, 131.01], [134.0, 137.47], [138.0, 141.76], [144.0, 150.7]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [40.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.26, 35.4, 42.81], "audiomae_on_audioset": [[["music", 23.48], ["hum", 22.2], ["throbbing", 16.81]], null, null, null, null, null, null, null, null, null, [["mains hum", 32.28], ["hum", 25.92], ["speech", 8.71]], [["hum", 25.05], ["buzz", 14.17], ["electric shaver, electric razor", 12.48]], [["hum", 38.89], ["mains hum", 11.25], ["throbbing", 9.03]]], "duration": [2.24, 1.85, 1.14, 0.82, 1.02, 1.18, 1.33, 39.3, 31.69, 33.01, 3.47, 3.76, 6.7]} \ No newline at end of file diff --git a/annotations_1/7szH-UZx2JU_filtered.json b/annotations_1/7szH-UZx2JU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95bf539509ee25e38f9429c359b62c95ab512f85 --- /dev/null +++ b/annotations_1/7szH-UZx2JU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 17.22], [18.0, 17.79], [19.0, 20.61], [35.0, 35.77], [37.0, 37.76], [39.0, 39.26], [41.0, 42.03], [43.0, 43.77], [45.0, 45.15], [46.0, 47.02], [48.0, 48.61], [49.0, 50.84], [52.0, 52.52], [57.0, 57.89], [59.0, 67.46], [70.0, 72.84], [75.0, 77.5], [79.0, 79.32], [89.0, 90.19], [92.0, 93.11], [94.0, 95.15], [96.0, 96.92], [102.0, 102.1], [106.0, 105.93], [108.0, 108.92], [115.0, 133.89], [135.0, 136.65], [139.0, 139.51], [150.0, 150.92], [152.0, 152.29], [157.0, 157.5], [161.0, 161.91], [167.0, 168.94], [170.0, 171.58], [177.0, 177.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [30.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.02, 30.35, 30.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 47.44], ["mains hum", 17.76], ["throbbing", 8.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 42.37], ["hum", 11.82], ["music", 8.13]], [["hum", 18.45], ["music", 14.88], ["throbbing", 7.47]], [["rumble", 17.65], ["hum", 13.68], ["mains hum", 12.18]], null, null, null, null, null, null, null, null, [["hum", 32.15], ["music", 20.55], ["mains hum", 13.08]], null, null, null, null, null, null, null, null, null], "duration": [5.22, -0.21, 1.61, 0.77, 0.76, 0.26, 1.03, 0.77, 0.15, 1.02, 0.61, 1.84, 0.52, 0.89, 8.46, 2.84, 2.5, 0.32, 1.19, 1.11, 1.15, 0.92, 0.1, -0.07, 0.92, 18.89, 1.65, 0.51, 0.92, 0.29, 0.5, 0.91, 1.94, 1.58, 0.38]} \ No newline at end of file diff --git a/annotations_1/7tXcQ8BBqXs_filtered.json b/annotations_1/7tXcQ8BBqXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e1b5cfb061b6fc1b2d96c2bf3c9feedc43ef9c7 --- /dev/null +++ b/annotations_1/7tXcQ8BBqXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.91], [12.0, 12.88], [16.0, 16.85], [19.0, 22.81], [25.0, 37.25], [38.0, 63.12], [64.0, 70.09], [74.0, 74.97], [79.0, 79.59], [87.0, 90.24], [92.0, 93.53], [94.0, 96.52], [99.0, 98.81], [103.0, 102.69], [107.0, 108.46], [109.0, 111.03], [112.0, 117.59], [119.0, 121.86], [125.0, 130.23], [132.0, 137.27], [138.0, 138.43], [144.0, 143.68], [145.0, 144.8], [145.0, 145.91], [147.0, 148.63], [150.0, 157.47], [158.0, 160.91], [165.0, 171.04], [173.0, 173.47], [176.0, 176.82]], "keep_status": [false, false, false, true, false, true, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 48.48, 87.55, 44.07, 64.18, 0.0, 0.0, 49.09, 0.0, 54.43, 0.0, 0.0, 0.0, 55.6, 44.75, 66.76, 76.2, 61.77, 0.0, 0.0, 0.0, 0.0, 0.0, 40.38, 37.9, 36.71, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 43.28], ["didgeridoo", 7.89], ["hum", 6.99]], null, [["speech", 37.08], ["music", 19.65], ["hum", 5.49]], null, null, null, [["speech", 36.09], ["fart", 17.32], ["hum", 4.62]], null, null, null, null, null, null, [["music", 52.03], ["speech", 8.44], ["hum", 4.53]], null, null, null, null, null, null, null, null, [["music", 41.21], ["speech", 14.9], ["didgeridoo", 11.75]], [["music", 29.28], ["didgeridoo", 15.98], ["speech", 6.14]], [["speech", 21.45], ["hum", 16.93], ["music", 15.95]], null, null], "duration": [-0.09, 0.88, 0.85, 3.81, 12.25, 25.12, 6.09, 0.97, 0.59, 3.24, 1.53, 2.52, -0.19, -0.31, 1.46, 2.03, 5.59, 2.86, 5.23, 5.27, 0.43, -0.32, -0.2, 0.91, 1.63, 7.47, 2.91, 6.04, 0.47, 0.82]} \ No newline at end of file diff --git a/annotations_1/7uOhTRONUbY_filtered.json b/annotations_1/7uOhTRONUbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fc1c8dd9ddfaaa7175c2771b35716bd9bd1a2e5 --- /dev/null +++ b/annotations_1/7uOhTRONUbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.93], [11.0, 11.23], [11.0, 11.37], [11.0, 13.95], [18.0, 22.4], [23.0, 24.11], [25.0, 26.0], [28.0, 27.8], [29.0, 30.99], [33.0, 34.3], [36.0, 36.9], [38.0, 37.86], [38.0, 41.08], [44.0, 55.17], [56.0, 57.86], [59.0, 60.51], [66.0, 69.89], [73.0, 72.96], [73.0, 73.06], [73.0, 73.16], [74.0, 73.94], [75.0, 76.65], [77.0, 79.74], [81.0, 83.13], [86.0, 87.61], [88.0, 88.96], [90.0, 171.83]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 44.69, 35.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.26, 37.69, 0.0, 0.0, 38.74, 0.0, 0.0, 0.0, 0.0, 0.0, 31.97, 32.39, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 35.07], ["speech", 16.31], ["whale vocalization", 3.02]], [["speech", 38.69], ["music", 14.73], ["mains hum", 10.16]], null, null, null, null, null, null, null, [["speech", 46.98], ["music", 22.69], ["synthesizer", 3.95]], [["music", 30.14], ["speech", 25.66], ["hum", 6.33]], null, null, [["music", 59.04], ["hum", 5.76], ["duck", 3.25]], null, null, null, null, null, [["music", 48.74], ["didgeridoo", 7.67], ["theremin", 4.13]], [["music", 41.29], ["croak", 16.11], ["frog", 12.49]], null, null, null], "duration": [0.93, 0.23, 0.37, 2.95, 4.4, 1.11, 1.0, -0.2, 1.99, 1.3, 0.9, -0.14, 3.08, 11.17, 1.86, 1.51, 3.89, -0.04, 0.06, 0.16, -0.06, 1.65, 2.74, 2.13, 1.61, 0.96, 81.83]} \ No newline at end of file diff --git a/annotations_1/7uYoJwMuN_8_filtered.json b/annotations_1/7uYoJwMuN_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94a98917161f5f0a909b93dab69e79ef38987a95 --- /dev/null +++ b/annotations_1/7uYoJwMuN_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.03], [8.0, 38.52], [39.0, 39.95], [41.0, 78.11], [82.0, 90.22], [91.0, 110.42], [111.0, 113.44], [119.0, 120.24], [121.0, 121.17]], "keep_status": [true, false, false, false, true, false, true, false, false], "silence_prob": [32.86, 0.0, 0.0, 0.0, 32.87, 29.62, 29.98, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 29.7], ["mains hum", 22.64], ["music", 5.67]], null, null, null, [["music", 42.23], ["hum", 8.58], ["rumble", 7.14]], [["speech", 48.14], ["music", 18.71], ["machine gun", 8.84]], [["music", 43.65], ["breaking", 10.9], ["crack", 5.65]], null, null], "duration": [2.03, 30.52, 0.95, 37.11, 8.22, 19.42, 2.44, 1.24, 0.17]} \ No newline at end of file diff --git a/annotations_1/7vWLiI04VCw_filtered.json b/annotations_1/7vWLiI04VCw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..531e50b767533cc91d6fd00eccabee85ab3b6b77 --- /dev/null +++ b/annotations_1/7vWLiI04VCw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.51], [25.0, 53.08], [55.0, 74.78], [77.0, 76.91]], "keep_status": [false, true, true, false], "silence_prob": [0.0, 31.26, 33.45, 0.0], "audiomae_on_audioset": [null, [["music", 25.86], ["effects unit", 17.0], ["musical instrument", 9.34]], [["music", 19.34], ["effects unit", 15.24], ["gong", 7.97]], null], "duration": [0.51, 28.08, 19.78, -0.09]} \ No newline at end of file diff --git a/annotations_1/7wZdMPB-O6Y_filtered.json b/annotations_1/7wZdMPB-O6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a08fd5e4541fd7887b5bb1bf7a7a3c3fab25b62 --- /dev/null +++ b/annotations_1/7wZdMPB-O6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 5.41], [6.0, 7.5], [12.0, 13.81], [20.0, 20.38], [34.0, 34.43], [39.0, 40.26], [57.0, 57.48], [62.0, 62.31], [76.0, 75.68], [84.0, 84.55], [85.0, 93.09], [95.0, 95.35], [97.0, 97.46], [100.0, 100.09], [105.0, 105.36], [107.0, 107.28], [112.0, 113.81], [115.0, 116.7], [118.0, 120.45], [123.0, 124.53], [127.0, 134.82], [146.0, 146.5], [152.0, 152.51], [163.0, 180.35], [186.0, 186.39]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [40.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.75, 0.0, 44.32, 0.0, 0.0, 29.31, 0.0], "audiomae_on_audioset": [[["music", 41.91], ["whale vocalization", 14.22], ["theremin", 12.2]], null, null, null, null, null, null, null, null, null, [["music", 28.97], ["hum", 8.61], ["sound effect", 4.95]], null, null, null, null, null, null, null, [["explosion", 33.42], ["music", 29.73], ["eruption", 6.65]], null, [["music", 50.61], ["ambient music", 17.05], ["synthesizer", 7.89]], null, null, [["speech", 65.68], ["music", 6.58], ["explosion", 4.78]], null], "duration": [5.41, 1.5, 1.81, 0.38, 0.43, 1.26, 0.48, 0.31, -0.32, 0.55, 8.09, 0.35, 0.46, 0.09, 0.36, 0.28, 1.81, 1.7, 2.45, 1.53, 7.82, 0.5, 0.51, 17.35, 0.39]} \ No newline at end of file diff --git a/annotations_1/7wgLb8Ykb24_filtered.json b/annotations_1/7wgLb8Ykb24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ad49f9b60da733c8e99d1f7f72cf3d3ec7d2c5f --- /dev/null +++ b/annotations_1/7wgLb8Ykb24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.15], [3.0, 4.02], [5.0, 5.53], [9.0, 9.73], [17.0, 16.9], [18.0, 23.3], [30.0, 30.35], [31.0, 31.8], [33.0, 34.52], [43.0, 43.44], [45.0, 45.03], [53.0, 53.4], [53.0, 53.5], [54.0, 53.54], [56.0, 56.66], [60.0, 59.98], [61.0, 62.02], [73.0, 74.04], [75.0, 76.45], [77.0, 85.46], [91.0, 90.9], [93.0, 94.32], [101.0, 103.86], [104.0, 103.98], [104.0, 110.39], [112.0, 114.1], [115.0, 116.28], [121.0, 122.05], [124.0, 124.95], [127.0, 130.99], [132.0, 132.41], [134.0, 134.94], [142.0, 142.91], [145.0, 150.16], [152.0, 153.81], [156.0, 157.4], [158.0, 159.63], [160.0, 168.81], [169.0, 170.04], [171.0, 172.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.52, 0.0, 0.0, 99.98, 0.0, 99.97, 88.83, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 47.7, 0.0, 0.0, 0.0, 77.53, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["mains hum", 34.21], ["hum", 26.19], ["music", 22.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.18], ["hum", 20.33], ["throbbing", 5.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.81], ["synthesizer", 7.78], ["musical instrument", 3.36]], null, null, null, null, null, null], "duration": [0.15, 1.02, 0.53, 0.73, -0.1, 5.3, 0.35, 0.8, 1.52, 0.44, 0.03, 0.4, 0.5, -0.46, 0.66, -0.02, 1.02, 1.04, 1.45, 8.46, -0.1, 1.32, 2.86, -0.02, 6.39, 2.1, 1.28, 1.05, 0.95, 3.99, 0.41, 0.94, 0.91, 5.16, 1.81, 1.4, 1.63, 8.81, 1.04, 1.22]} \ No newline at end of file diff --git a/annotations_1/7wniAznxp08_filtered.json b/annotations_1/7wniAznxp08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..585348db1833f49e25f06c2df2df0d6495d71765 --- /dev/null +++ b/annotations_1/7wniAznxp08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.93], [5.0, 7.3], [9.0, 9.78], [11.0, 11.15], [12.0, 12.73], [20.0, 20.98], [24.0, 25.03], [37.0, 37.56], [39.0, 38.99], [40.0, 40.0], [47.0, 47.58], [49.0, 49.4], [50.0, 53.18], [64.0, 64.89], [65.0, 67.14], [72.0, 74.83], [79.0, 80.76], [84.0, 85.38], [91.0, 92.38], [106.0, 106.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 69.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 37.41, 42.06, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 27.72], ["boing", 22.93], ["didgeridoo", 9.18]], [["music", 46.45], ["musical instrument", 10.79], ["brass instrument", 3.06]], null, null, null, null], "duration": [0.93, 2.3, 0.78, 0.15, 0.73, 0.98, 1.03, 0.56, -0.01, 0.0, 0.58, 0.4, 3.18, 0.89, 2.14, 2.83, 1.76, 1.38, 1.38, 0.68]} \ No newline at end of file diff --git a/annotations_1/7yBBNmR1CLg_filtered.json b/annotations_1/7yBBNmR1CLg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3dcfedf5a81912e6cc00a58dc26953279844a65 --- /dev/null +++ b/annotations_1/7yBBNmR1CLg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.16], [8.0, 8.67], [10.0, 10.71], [12.0, 16.78], [18.0, 19.41], [21.0, 22.89], [24.0, 39.04], [40.0, 41.35], [42.0, 45.67], [47.0, 58.23], [85.0, 103.5], [105.0, 107.55], [108.0, 109.65], [112.0, 113.88], [115.0, 116.19], [117.0, 117.83], [119.0, 119.45], [120.0, 120.8], [123.0, 122.77], [124.0, 124.43], [125.0, 130.44], [132.0, 133.39], [134.0, 134.62], [143.0, 144.31], [149.0, 149.5], [150.0, 160.27], [163.0, 165.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 33.28, 0.0, 0.0, 34.01, 0.0, 53.22, 33.69, 37.83, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 38.51, 60.32], "audiomae_on_audioset": [null, null, null, [["speech", 44.88], ["music", 43.91], ["whale vocalization", 2.64]], null, null, [["speech", 52.43], ["music", 27.34], ["sidetone", 5.11]], null, null, [["music", 47.58], ["speech", 35.05], ["slosh", 1.69]], [["music", 61.57], ["guitar", 15.48], ["plucked string instrument", 5.11]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.28], ["gurgling", 7.03], ["effects unit", 5.02]], null], "duration": [1.16, 0.67, 0.71, 4.78, 1.41, 1.89, 15.04, 1.35, 3.67, 11.23, 18.5, 2.55, 1.65, 1.88, 1.19, 0.83, 0.45, 0.8, -0.23, 0.43, 5.44, 1.39, 0.62, 1.31, 0.5, 10.27, 2.01]} \ No newline at end of file diff --git a/annotations_1/7ycVIGqnLO8_filtered.json b/annotations_1/7ycVIGqnLO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a94cf469add45dadb843cca68cf1b87312f482fd --- /dev/null +++ b/annotations_1/7ycVIGqnLO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 26.06], [32.0, 37.23], [42.0, 50.57], [58.0, 81.08], [84.0, 114.66], [116.0, 116.33]], "keep_status": [true, true, false, true, false, false], "silence_prob": [33.34, 36.15, 33.23, 29.87, 0.0, 0.0], "audiomae_on_audioset": [[["music", 50.59], ["hum", 8.95], ["throbbing", 6.51]], [["music", 36.44], ["wind instrument, woodwind instrument", 23.33], ["shofar", 7.83]], [["music", 77.53], ["wind instrument, woodwind instrument", 3.26], ["musical instrument", 2.07]], [["music", 48.22], ["hum", 11.41], ["throbbing", 5.33]], null, null], "duration": [19.06, 5.23, 8.57, 23.08, 30.66, 0.33]} \ No newline at end of file diff --git a/annotations_1/7ygAdJYS9m0_filtered.json b/annotations_1/7ygAdJYS9m0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7b27d8f97d22a484f7ac2a307049c163bea64ba --- /dev/null +++ b/annotations_1/7ygAdJYS9m0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.6], [18.0, 22.11], [28.0, 30.16], [31.0, 31.68], [50.0, 53.91], [54.0, 59.0], [63.0, 63.0], [63.0, 64.96], [78.0, 80.89], [85.0, 85.33], [87.0, 87.02], [90.0, 90.12], [110.0, 114.4], [116.0, 115.84], [119.0, 122.77], [123.0, 123.84], [125.0, 125.37], [130.0, 130.62], [133.0, 132.8], [138.0, 139.09], [140.0, 140.54], [147.0, 148.83], [150.0, 150.75], [158.0, 158.94], [161.0, 163.43], [164.0, 165.25]], "keep_status": [false, false, true, false, true, true, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 42.58, 47.01, 0.0, 30.35, 30.14, 0.0, 0.0, 37.68, 0.0, 0.0, 0.0, 30.9, 0.0, 41.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.05, 0.0], "audiomae_on_audioset": [null, [["music", 56.53], ["chirp tone", 17.56], ["sine wave", 1.76]], [["speech", 10.61], ["cacophony", 7.4], ["radio", 6.02]], null, [["music", 20.42], ["cattle, bovinae", 14.96], ["moo", 13.74]], [["sheep", 13.92], ["bleat", 13.8], ["livestock, farm animals, working animals", 13.05]], null, null, [["music", 39.68], ["hum", 13.06], ["throbbing", 10.89]], null, null, null, [["music", 22.65], ["livestock, farm animals, working animals", 15.26], ["moo", 11.39]], null, [["speech", 12.57], ["music", 11.68], ["electric shaver, electric razor", 8.95]], null, null, null, null, null, null, null, null, null, [["speech", 29.24], ["music", 25.35], ["splash, splatter", 8.17]], null], "duration": [1.6, 4.11, 2.16, 0.68, 3.91, 5.0, 0.0, 1.96, 2.89, 0.33, 0.02, 0.12, 4.4, -0.16, 3.77, 0.84, 0.37, 0.62, -0.2, 1.09, 0.54, 1.83, 0.75, 0.94, 2.43, 1.25]} \ No newline at end of file diff --git a/annotations_1/801rBxBY-5w_filtered.json b/annotations_1/801rBxBY-5w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5f02d9d896993054c36fd67a804d3e8b39f1ead --- /dev/null +++ b/annotations_1/801rBxBY-5w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.91], [4.0, 8.18], [9.0, 10.49], [12.0, 32.14], [32.0, 73.45], [75.0, 75.34], [81.0, 81.58], [95.0, 106.79], [108.0, 108.99], [109.0, 114.94], [117.0, 117.51], [123.0, 128.48], [129.0, 129.2], [131.0, 131.09], [133.0, 133.74]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.71, 0.0, 30.32, 0.0, 0.0, 0.0, 53.47, 0.0, 50.91, 0.0, 51.07, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 37.49], ["music", 17.37], ["mains hum", 12.7]], null, [["music", 69.16], ["breaking", 4.59], ["machine gun", 3.38]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.91, 4.18, 1.49, 20.14, 41.45, 0.34, 0.58, 11.79, 0.99, 5.94, 0.51, 5.48, 0.2, 0.09, 0.74]} \ No newline at end of file diff --git a/annotations_1/80fHUAW_up0_filtered.json b/annotations_1/80fHUAW_up0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..894edd15651f8379a7f2a4b509fa162c42872262 --- /dev/null +++ b/annotations_1/80fHUAW_up0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.0], [15.0, 16.21], [17.0, 17.05], [24.0, 25.95], [26.0, 27.77], [28.0, 28.39], [28.0, 28.98], [40.0, 41.86], [44.0, 47.43], [53.0, 55.75], [58.0, 62.53], [66.0, 66.06], [67.0, 68.64], [74.0, 88.16], [98.0, 100.5], [110.0, 111.89]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [57.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.91, 30.0, 32.03, 0.0, 0.0, 30.01, 30.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 45.03], ["speech", 17.89], ["electronic music", 2.25]], [["music", 66.93], ["synthetic singing", 3.0], ["echo", 2.05]], [["music", 52.29], ["didgeridoo", 20.46], ["sidetone", 7.26]], null, null, [["music", 88.39], ["country", 1.03], ["musical instrument", 0.62]], [["music", 57.23], ["yodeling", 7.2], ["song", 3.38]], null], "duration": [3.0, 1.21, 0.05, 1.95, 1.77, 0.39, 0.98, 1.86, 3.43, 2.75, 4.53, 0.06, 1.64, 14.16, 2.5, 1.89]} \ No newline at end of file diff --git a/annotations_1/81MNbVi5a64_filtered.json b/annotations_1/81MNbVi5a64_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..070a3c25c1d1c882b6af8b28e0696805e6d57702 --- /dev/null +++ b/annotations_1/81MNbVi5a64_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 13.96], [17.0, 21.29], [28.0, 28.78], [31.0, 32.05], [32.0, 49.82], [52.0, 52.47], [54.0, 58.62], [63.0, 84.84], [85.0, 95.96], [98.0, 108.85], [109.0, 113.31], [114.0, 114.59], [118.0, 119.35], [121.0, 121.51], [124.0, 126.27], [126.0, 126.71], [127.0, 127.52], [129.0, 129.63], [135.0, 149.71], [152.0, 180.49], [182.0, 209.26], [210.0, 210.95], [212.0, 211.82]], "keep_status": [true, false, false, false, true, false, true, false, false, true, true, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [31.43, 31.18, 0.0, 0.0, 31.15, 0.0, 35.74, 29.7, 31.17, 31.44, 33.26, 0.0, 0.0, 0.0, 28.79, 0.0, 0.0, 0.0, 30.1, 30.39, 29.73, 0.0, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 24.0], ["cattle, bovinae", 21.64], ["moo", 17.33]], [["cattle, bovinae", 40.59], ["moo", 27.48], ["livestock, farm animals, working animals", 16.2]], null, null, [["speech", 43.91], ["music", 12.17], ["electric shaver, electric razor", 5.34]], null, [["music", 45.62], ["speech", 18.94], ["didgeridoo", 4.09]], [["music", 66.83], ["speech", 13.75], ["ice cream truck, ice cream van", 10.53]], [["speech", 38.99], ["music", 32.36], ["boing", 3.7]], [["music", 27.48], ["livestock, farm animals, working animals", 23.64], ["sheep", 16.22]], [["speech", 27.21], ["thump, thud", 11.68], ["crack", 11.04]], null, null, null, [["music", 67.48], ["speech", 8.96], ["hum", 3.49]], null, null, null, [["throbbing", 19.31], ["cattle, bovinae", 13.49], ["livestock, farm animals, working animals", 12.65]], [["music", 33.41], ["buzz", 9.75], ["sound effect", 7.49]], [["music", 62.46], ["sound effect", 7.09], ["cacophony", 5.36]], null, null], "duration": [12.96, 4.29, 0.78, 1.05, 17.82, 0.47, 4.62, 21.84, 10.96, 10.85, 4.31, 0.59, 1.35, 0.51, 2.27, 0.71, 0.52, 0.63, 14.71, 28.49, 27.26, 0.95, -0.18]} \ No newline at end of file diff --git a/annotations_1/81XTZOlNHEU_filtered.json b/annotations_1/81XTZOlNHEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..239fa13573b9dee4ec4ea671394be8307cb29ea9 --- /dev/null +++ b/annotations_1/81XTZOlNHEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.32], [7.0, 17.71], [19.0, 20.75], [27.0, 27.09], [33.0, 33.08], [33.0, 34.5], [35.0, 41.05], [54.0, 58.85], [61.0, 63.15], [66.0, 69.48], [71.0, 73.48], [86.0, 86.63], [89.0, 88.92], [94.0, 94.12], [97.0, 97.66], [101.0, 103.99], [105.0, 106.59], [108.0, 109.17], [111.0, 111.42], [115.0, 116.01], [118.0, 125.19], [126.0, 127.26], [129.0, 129.78], [132.0, 132.75], [134.0, 136.66]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 33.36, 0.0, 0.0, 0.0, 0.0, 78.55, 99.36, 70.86, 82.97, 99.68, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 46.26], "audiomae_on_audioset": [null, [["music", 29.53], ["cattle, bovinae", 14.88], ["speech", 12.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.84], ["speech", 11.96], ["musical instrument", 7.37]]], "duration": [1.32, 10.71, 1.75, 0.09, 0.08, 1.5, 6.05, 4.85, 2.15, 3.48, 2.48, 0.63, -0.08, 0.12, 0.66, 2.99, 1.59, 1.17, 0.42, 1.01, 7.19, 1.26, 0.78, 0.75, 2.66]} \ No newline at end of file diff --git a/annotations_1/81YXRcpQSpE_filtered.json b/annotations_1/81YXRcpQSpE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8d302602a9c4bf0ff39df12040f6c2f59fdd32c --- /dev/null +++ b/annotations_1/81YXRcpQSpE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.68], [13.0, 15.11], [21.0, 22.03], [23.0, 24.16], [29.0, 29.71], [32.0, 43.48], [45.0, 47.65], [53.0, 54.24], [58.0, 59.71], [60.0, 64.84], [66.0, 67.53], [68.0, 69.85], [72.0, 73.53], [76.0, 76.96], [80.0, 82.26], [84.0, 85.26], [87.0, 89.85], [93.0, 93.58], [97.0, 98.51], [103.0, 103.25], [107.0, 107.87], [112.0, 114.17], [118.0, 120.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.59, 0.0, 0.0, 0.0, 38.47, 91.47, 0.0, 0.0, 39.41, 0.0, 0.0, 0.0, 0.0, 72.31, 0.0, 87.92, 0.0, 0.0, 0.0, 0.0, 84.43, 100.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 72.29], ["explosion", 5.5], ["eruption", 4.31]], null, null, null, [["speech", 72.5], ["sidetone", 5.8], ["music", 3.07]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.68, 2.11, 1.03, 1.16, 0.71, 11.48, 2.65, 1.24, 1.71, 4.84, 1.53, 1.85, 1.53, 0.96, 2.26, 1.26, 2.85, 0.58, 1.51, 0.25, 0.87, 2.17, 2.68]} \ No newline at end of file diff --git a/annotations_1/81oozSLS2CM_filtered.json b/annotations_1/81oozSLS2CM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab2d901e1af451a2118e4eae44ab9f7424a2df7b --- /dev/null +++ b/annotations_1/81oozSLS2CM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.88], [26.0, 27.43], [45.0, 45.64], [46.0, 46.14], [51.0, 51.65], [55.0, 56.74], [58.0, 59.75], [60.0, 97.12], [99.0, 100.43], [102.0, 102.64], [104.0, 107.47], [118.0, 118.77], [123.0, 123.16], [125.0, 125.31], [128.0, 128.85], [132.0, 132.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.31, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["grunt", 59.31], ["speech", 8.93], ["groan", 3.32]], null, null, null, null, null], "duration": [0.88, 1.43, 0.64, 0.14, 0.65, 1.74, 1.75, 37.12, 1.43, 0.64, 3.47, 0.77, 0.16, 0.31, 0.85, 0.61]} \ No newline at end of file diff --git a/annotations_1/836TMubeCfo_filtered.json b/annotations_1/836TMubeCfo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65505312b18746d5db4a5cb1a2cc2a286ec53ccb --- /dev/null +++ b/annotations_1/836TMubeCfo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.46], [13.0, 14.17], [16.0, 18.62], [22.0, 22.47], [24.0, 69.53], [73.0, 90.05], [90.0, 109.09], [112.0, 114.78], [115.0, 118.1]], "keep_status": [true, false, false, false, false, false, true, true, true], "silence_prob": [39.12, 0.0, 60.7, 0.0, 0.0, 30.37, 30.18, 33.9, 40.54], "audiomae_on_audioset": [[["speech", 57.24], ["rumble", 7.58], ["hum", 4.82]], null, null, null, null, [["music", 48.42], ["synthesizer", 17.2], ["ambient music", 5.07]], [["music", 42.9], ["didgeridoo", 14.82], ["guitar", 9.64]], [["music", 28.6], ["hum", 15.9], ["throbbing", 7.52]], [["speech", 38.31], ["hum", 12.8], ["bee, wasp, etc.", 8.67]]], "duration": [2.46, 1.17, 2.62, 0.47, 45.53, 17.05, 19.09, 2.78, 3.1]} \ No newline at end of file diff --git a/annotations_1/836dGO4v65I_filtered.json b/annotations_1/836dGO4v65I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..244ad3e238a1fb2cc0643cf37a440e662eef7c79 --- /dev/null +++ b/annotations_1/836dGO4v65I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [22.0, 22.81], [26.0, 28.26], [33.0, 34.6], [36.0, 41.59], [43.0, 55.58], [59.0, 74.29], [77.0, 77.6], [82.0, 82.85], [91.0, 121.58], [138.0, 138.35], [143.0, 142.99], [149.0, 152.32], [159.0, 159.26], [163.0, 172.84], [174.0, 188.32], [189.0, 190.05]], "keep_status": [false, false, true, false, true, true, true, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 45.46, 0.0, 30.44, 30.53, 30.22, 0.0, 0.0, 0.0, 0.0, 0.0, 29.98, 0.0, 29.86, 30.41, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.12], ["hum", 6.17], ["mains hum", 5.26]], null, [["music", 44.49], ["cacophony", 13.33], ["mains hum", 7.52]], [["music", 56.87], ["hum", 5.11], ["smash, crash", 4.29]], [["music", 28.31], ["hum", 13.21], ["throbbing", 11.16]], null, null, null, null, null, [["music", 52.62], ["throbbing", 6.75], ["musical instrument", 6.48]], null, [["speech", 49.57], ["music", 28.7], ["eruption", 1.72]], [["speech", 34.57], ["music", 16.28], ["sidetone", 13.07]], null], "duration": [0.56, 0.81, 2.26, 1.6, 5.59, 12.58, 15.29, 0.6, 0.85, 30.58, 0.35, -0.01, 3.32, 0.26, 9.84, 14.32, 1.05]} \ No newline at end of file diff --git a/annotations_1/83Lfw7BxsQE_filtered.json b/annotations_1/83Lfw7BxsQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..374427bae4fb8811009590d8fe98f34beef54e9e --- /dev/null +++ b/annotations_1/83Lfw7BxsQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 15.47], [17.0, 17.29], [18.0, 18.18], [19.0, 23.13], [24.0, 29.51], [32.0, 31.63], [33.0, 33.66], [36.0, 37.44], [41.0, 43.14], [48.0, 49.52], [52.0, 54.35], [56.0, 64.79], [65.0, 69.45], [71.0, 78.07], [82.0, 87.71], [89.0, 89.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.4, 0.0, 0.0, 100.0, 99.62, 0.0, 0.0, 0.0, 100.0, 0.0, 99.99, 100.0, 92.64, 38.08, 46.15, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 27.7], ["music", 25.23], ["gong", 24.91]], [["music", 60.84], ["soundtrack music", 6.03], ["whale vocalization", 4.83]], null], "duration": [11.47, 0.29, 0.18, 4.13, 5.51, -0.37, 0.66, 1.44, 2.14, 1.52, 2.35, 8.79, 4.45, 7.07, 5.71, 0.04]} \ No newline at end of file diff --git a/annotations_1/84gYIl6Zjks_filtered.json b/annotations_1/84gYIl6Zjks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6b124bedab2c2eb8d0a2b1561f27dded4002705 --- /dev/null +++ b/annotations_1/84gYIl6Zjks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.21], [19.0, 19.23], [21.0, 22.18], [25.0, 31.62], [33.0, 35.41], [36.0, 39.46], [42.0, 43.31], [45.0, 44.95], [48.0, 54.94], [56.0, 58.02], [61.0, 63.41], [65.0, 65.8], [67.0, 86.66], [90.0, 90.86], [92.0, 93.29], [94.0, 94.64], [99.0, 100.55], [104.0, 104.7], [106.0, 106.91], [112.0, 112.08], [114.0, 114.02], [115.0, 115.18], [117.0, 118.02], [118.0, 119.03], [122.0, 122.23], [124.0, 125.1], [126.0, 130.05], [131.0, 131.57], [132.0, 133.14], [134.0, 137.88], [138.0, 139.8], [144.0, 145.93], [149.0, 149.07], [157.0, 157.71], [163.0, 164.29], [169.0, 169.38], [170.0, 170.77], [174.0, 173.94], [179.0, 180.47], [181.0, 181.72], [184.0, 184.86], [185.0, 185.55], [186.0, 186.76]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.75, 86.09, 45.49, 0.0, 0.0, 40.62, 63.1, 50.81, 0.0, 43.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.67, 0.0, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["snicker", 10.23], ["laughter", 6.89], ["noise", 6.45]], null, [["speech", 59.95], ["stomach rumble", 6.61], ["hum", 4.95]], null, null, [["speech", 40.42], ["fart", 16.23], ["fly, housefly", 10.14]], null, null, null, [["speech", 68.55], ["creak", 5.11], ["electric shaver, electric razor", 4.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.21, 0.23, 1.18, 6.62, 2.41, 3.46, 1.31, -0.05, 6.94, 2.02, 2.41, 0.8, 19.66, 0.86, 1.29, 0.64, 1.55, 0.7, 0.91, 0.08, 0.02, 0.18, 1.02, 1.03, 0.23, 1.1, 4.05, 0.57, 1.14, 3.88, 1.8, 1.93, 0.07, 0.71, 1.29, 0.38, 0.77, -0.06, 1.47, 0.72, 0.86, 0.55, 0.76]} \ No newline at end of file diff --git a/annotations_1/85A2rWA5O3o_filtered.json b/annotations_1/85A2rWA5O3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c9c428ab5259914dc435b94cc49cc67f3525edc --- /dev/null +++ b/annotations_1/85A2rWA5O3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 40.63], [42.0, 54.65], [56.0, 56.91], [59.0, 61.28], [63.0, 63.51], [64.0, 66.65], [71.0, 71.46], [74.0, 75.2], [77.0, 88.18], [91.0, 93.21], [97.0, 97.65], [102.0, 130.3], [131.0, 133.14], [134.0, 142.37], [146.0, 151.95], [166.0, 166.28]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 49.13, 0.0, 53.28, 0.0, 84.8, 0.0, 0.0, 52.05, 38.71, 0.0, 34.32, 63.96, 39.6, 64.29, 0.0], "audiomae_on_audioset": [null, [["music", 52.57], ["theremin", 9.2], ["musical instrument", 4.91]], null, null, null, null, null, null, null, [["music", 46.15], ["synthesizer", 9.06], ["theremin", 8.19]], null, [["speech", 55.74], ["music", 27.5], ["synthesizer", 4.28]], null, [["speech", 46.59], ["hum", 4.65], ["music", 4.56]], null, null], "duration": [36.63, 12.65, 0.91, 2.28, 0.51, 2.65, 0.46, 1.2, 11.18, 2.21, 0.65, 28.3, 2.14, 8.37, 5.95, 0.28]} \ No newline at end of file diff --git a/annotations_1/85O_vS9vSCA_filtered.json b/annotations_1/85O_vS9vSCA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/85O_vS9vSCA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/85cnCW_4LIc_filtered.json b/annotations_1/85cnCW_4LIc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ee550aebfe11c460ef1dacb320df7fa5ded1d82 --- /dev/null +++ b/annotations_1/85cnCW_4LIc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.34], [10.0, 10.32], [11.0, 11.1], [12.0, 13.27], [14.0, 16.68], [18.0, 19.52], [23.0, 22.91], [25.0, 25.95], [33.0, 36.53], [39.0, 40.09], [41.0, 42.69], [52.0, 52.68], [55.0, 56.29], [72.0, 75.36], [77.0, 79.49], [81.0, 83.44], [85.0, 85.67], [87.0, 88.01], [88.0, 92.2], [92.0, 92.85], [104.0, 108.31], [116.0, 116.45], [117.0, 122.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 97.54, 0.0, 0.0, 95.64, 0.0, 82.79, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 0.32, 0.1, 1.27, 2.68, 1.52, -0.09, 0.95, 3.53, 1.09, 1.69, 0.68, 1.29, 3.36, 2.49, 2.44, 0.67, 1.01, 4.2, 0.85, 4.31, 0.45, 5.37]} \ No newline at end of file diff --git a/annotations_1/86Vd7XFiYZA_filtered.json b/annotations_1/86Vd7XFiYZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0344fb45c0d3d4bc359fc152175f5d986a5df88c --- /dev/null +++ b/annotations_1/86Vd7XFiYZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 20.06], [22.0, 22.92], [24.0, 27.23], [28.0, 52.68], [54.0, 61.05], [62.0, 67.24], [74.0, 82.68]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [59.42, 0.0, 67.13, 52.27, 59.33, 72.16, 98.1], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [16.06, 0.92, 3.23, 24.68, 7.05, 5.24, 8.68]} \ No newline at end of file diff --git a/annotations_1/86sXLVakflE_filtered.json b/annotations_1/86sXLVakflE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09960fb58def946f961a61d4daa88d13ad7ecc03 --- /dev/null +++ b/annotations_1/86sXLVakflE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.07], [21.0, 22.64], [24.0, 24.63], [26.0, 27.24], [29.0, 31.23], [32.0, 37.94], [38.0, 38.33], [39.0, 39.43], [40.0, 41.82], [43.0, 44.09], [46.0, 47.29], [52.0, 52.1], [53.0, 54.51], [55.0, 56.4], [58.0, 59.29], [60.0, 60.2], [61.0, 63.0], [64.0, 67.37], [68.0, 69.38], [75.0, 75.19], [77.0, 80.15], [81.0, 82.92], [84.0, 85.5], [96.0, 96.28], [99.0, 99.47], [100.0, 101.46], [103.0, 103.25], [104.0, 104.84], [117.0, 123.04], [126.0, 135.57], [138.0, 140.37], [141.0, 141.88], [143.0, 144.69], [145.0, 146.28], [148.0, 149.86], [151.0, 151.7], [154.0, 154.28], [155.0, 156.27], [157.0, 158.5], [159.0, 160.56], [161.0, 164.27], [165.0, 167.37], [169.0, 170.19], [171.0, 171.85], [174.0, 174.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.54, 0.0, 0.0, 0.0, 91.47, 55.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.56, 99.71, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 94.37, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 97.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.07, 1.64, 0.63, 1.24, 2.23, 5.94, 0.33, 0.43, 1.82, 1.09, 1.29, 0.1, 1.51, 1.4, 1.29, 0.2, 2.0, 3.37, 1.38, 0.19, 3.15, 1.92, 1.5, 0.28, 0.47, 1.46, 0.25, 0.84, 6.04, 9.57, 2.37, 0.88, 1.69, 1.28, 1.86, 0.7, 0.28, 1.27, 1.5, 1.56, 3.27, 2.37, 1.19, 0.85, 0.51]} \ No newline at end of file diff --git a/annotations_1/86xtQC4rp98_filtered.json b/annotations_1/86xtQC4rp98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ccfb551165d6a3326812f994af9211f4abfe0c57 --- /dev/null +++ b/annotations_1/86xtQC4rp98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.63], [9.0, 10.2], [12.0, 13.39], [16.0, 16.73], [24.0, 25.35], [28.0, 28.12], [30.0, 30.45], [31.0, 32.02], [34.0, 34.33], [38.0, 38.99], [42.0, 57.13], [58.0, 57.84], [59.0, 59.66], [66.0, 68.86], [78.0, 78.78], [81.0, 92.2], [93.0, 93.82], [95.0, 96.09], [97.0, 98.63], [99.0, 101.8], [104.0, 105.17], [107.0, 107.45], [108.0, 109.39], [111.0, 116.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.76, 0.0, 0.0, 73.82, 0.0, 78.04, 0.0, 0.0, 0.0, 59.07, 0.0, 0.0, 0.0, 81.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 38.0], ["sidetone", 22.54], ["speech", 12.32]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.63, 1.2, 1.39, 0.73, 1.35, 0.12, 0.45, 1.02, 0.33, 0.99, 15.13, -0.16, 0.66, 2.86, 0.78, 11.2, 0.82, 1.09, 1.63, 2.8, 1.17, 0.45, 1.39, 5.75]} \ No newline at end of file diff --git a/annotations_1/87IqS4kQqgE_filtered.json b/annotations_1/87IqS4kQqgE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f37203be4f4ec72a186b27a8a5736d65a7e5e82e --- /dev/null +++ b/annotations_1/87IqS4kQqgE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.94], [16.0, 17.73], [20.0, 21.32], [22.0, 35.43], [38.0, 42.72], [43.0, 49.86], [55.0, 54.97], [56.0, 60.34], [62.0, 62.41], [63.0, 63.26], [63.0, 63.49], [64.0, 63.53], [64.0, 63.96], [64.0, 65.67], [67.0, 67.85], [85.0, 99.98], [102.0, 110.73], [114.0, 122.59], [129.0, 135.9], [142.0, 146.89], [149.0, 150.25], [153.0, 156.47], [161.0, 164.89], [168.0, 172.67], [176.0, 185.73], [187.0, 190.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false], "silence_prob": [47.35, 0.0, 0.0, 50.71, 67.89, 87.0, 0.0, 36.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.91, 43.85, 40.99, 42.91, 33.95, 0.0, 43.64, 38.41, 38.88, 47.86, 52.51], "audiomae_on_audioset": [[["music", 38.95], ["singing bowl", 24.36], ["musical instrument", 7.68]], null, null, null, null, null, null, [["music", 30.91], ["livestock, farm animals, working animals", 29.47], ["cattle, bovinae", 14.49]], null, null, null, null, null, null, null, [["music", 72.47], ["didgeridoo", 8.27], ["electric shaver, electric razor", 2.06]], [["music", 80.99], ["whale vocalization", 3.87], ["throbbing", 1.81]], [["music", 69.99], ["whale vocalization", 4.83], ["stomach rumble", 2.47]], [["music", 46.4], ["didgeridoo", 10.11], ["theremin", 5.08]], [["theremin", 62.39], ["music", 26.69], ["wind instrument, woodwind instrument", 3.2]], null, [["music", 64.66], ["guitar", 3.6], ["speech", 3.15]], [["music", 44.55], ["musical instrument", 5.87], ["maraca", 4.97]], [["music", 40.79], ["speech", 40.16], ["guitar", 2.29]], [["music", 37.89], ["speech", 11.89], ["theremin", 11.1]], null], "duration": [3.94, 1.73, 1.32, 13.43, 4.72, 6.86, -0.03, 4.34, 0.41, 0.26, 0.49, -0.47, -0.04, 1.67, 0.85, 14.98, 8.73, 8.59, 6.9, 4.89, 1.25, 3.47, 3.89, 4.67, 9.73, 3.78]} \ No newline at end of file diff --git a/annotations_1/880-MqUhhEk_filtered.json b/annotations_1/880-MqUhhEk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43b324c8c26a1432f1e37ec7e4096e5ecfa5f3f4 --- /dev/null +++ b/annotations_1/880-MqUhhEk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.74], [10.0, 26.27], [28.0, 28.75], [30.0, 30.65], [34.0, 41.42], [42.0, 42.63], [47.0, 92.42], [100.0, 110.27]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [39.54, 33.86, 0.0, 0.0, 32.2, 0.0, 0.0, 30.68], "audiomae_on_audioset": [[["music", 66.12], ["theremin", 9.97], ["carnatic music", 3.92]], [["music", 58.96], ["didgeridoo", 18.51], ["theremin", 13.63]], null, null, [["music", 64.95], ["theremin", 14.14], ["carnatic music", 5.19]], null, null, [["music", 78.08], ["theremin", 2.92], ["musical instrument", 1.82]]], "duration": [3.74, 16.27, 0.75, 0.65, 7.42, 0.63, 45.42, 10.27]} \ No newline at end of file diff --git a/annotations_1/88T3elu2wfE_filtered.json b/annotations_1/88T3elu2wfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..701484da6e8f9d80a5b2b26fdfb0f10c87500707 --- /dev/null +++ b/annotations_1/88T3elu2wfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.28], [8.0, 11.75], [13.0, 14.45], [17.0, 20.98], [22.0, 23.94], [27.0, 28.56], [31.0, 32.46], [34.0, 35.29], [36.0, 38.08], [44.0, 44.24], [46.0, 47.58], [51.0, 56.32], [67.0, 67.36], [68.0, 69.33], [70.0, 73.48], [80.0, 80.43], [82.0, 83.25], [84.0, 84.33], [91.0, 92.23], [95.0, 95.4], [100.0, 101.04], [106.0, 106.83], [112.0, 112.9], [127.0, 127.65], [131.0, 132.16], [136.0, 137.81], [155.0, 155.26], [160.0, 163.75], [172.0, 180.0], [195.0, 198.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 87.0, 0.0, 80.82, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 47.43, 0.0, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.93, 30.95, 30.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 40.16], ["speech", 11.47], ["animal", 3.6]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.14], ["didgeridoo", 25.33], ["musical instrument", 4.87]], [["music", 42.12], ["didgeridoo", 26.85], ["musical instrument", 3.22]], [["music", 43.02], ["didgeridoo", 20.43], ["musical instrument", 5.31]]], "duration": [1.28, 3.75, 1.45, 3.98, 1.94, 1.56, 1.46, 1.29, 2.08, 0.24, 1.58, 5.32, 0.36, 1.33, 3.48, 0.43, 1.25, 0.33, 1.23, 0.4, 1.04, 0.83, 0.9, 0.65, 1.16, 1.81, 0.26, 3.75, 8.0, 3.53]} \ No newline at end of file diff --git a/annotations_1/88dS92rgWhA_filtered.json b/annotations_1/88dS92rgWhA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2475a7704a4007826bd241cd2c27b36c08dc9631 --- /dev/null +++ b/annotations_1/88dS92rgWhA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 62.6], [69.0, 76.45], [83.0, 83.74], [86.0, 93.04], [97.0, 101.51], [111.0, 111.45], [112.0, 112.24], [113.0, 115.6], [117.0, 119.01], [124.0, 129.03], [130.0, 130.08], [132.0, 132.7]], "keep_status": [false, false, false, true, true, false, false, false, true, true, false, false], "silence_prob": [30.2, 29.95, 0.0, 30.11, 29.43, 0.0, 0.0, 30.53, 30.35, 29.61, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.37], ["speech", 23.8], ["machine gun", 10.62]], [["speech", 38.29], ["music", 34.88], ["hum", 2.88]], null, [["speech", 53.13], ["music", 8.86], ["vehicle", 5.01]], [["music", 29.92], ["vehicle", 14.59], ["car", 11.36]], null, null, [["hum", 33.99], ["mains hum", 24.53], ["throbbing", 11.76]], [["music", 30.88], ["hum", 6.24], ["electronic music", 4.17]], [["hum", 32.12], ["throbbing", 20.67], ["speech", 16.44]], null, null], "duration": [9.6, 7.45, 0.74, 7.04, 4.51, 0.45, 0.24, 2.6, 2.01, 5.03, 0.08, 0.7]} \ No newline at end of file diff --git a/annotations_1/891-YR-fgsk_filtered.json b/annotations_1/891-YR-fgsk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69c43eb05a2aa8cd8cacbac03710c9bb9e9b128f --- /dev/null +++ b/annotations_1/891-YR-fgsk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.17], [9.0, 52.54], [53.0, 58.13], [59.0, 63.48], [64.0, 86.22], [87.0, 92.35], [94.0, 100.95], [101.0, 103.44], [106.0, 107.42], [108.0, 109.71], [111.0, 112.35], [114.0, 119.65], [120.0, 123.33], [124.0, 125.58], [127.0, 130.03], [131.0, 187.62], [188.0, 198.96], [200.0, 213.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 59.68, 95.78, 98.1, 55.04, 51.66, 71.43, 0.0, 0.0, 0.0, 71.72, 41.03, 0.0, 54.5, 0.0, 58.81, 35.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.01], ["music", 5.9], ["whale vocalization", 5.22]], null, null, null, null, [["music", 26.8], ["throbbing", 17.52], ["speech", 14.2]]], "duration": [0.17, 43.54, 5.13, 4.48, 22.22, 5.35, 6.95, 2.44, 1.42, 1.71, 1.35, 5.65, 3.33, 1.58, 3.03, 56.62, 10.96, 13.16]} \ No newline at end of file diff --git a/annotations_1/89FuExOuBbI_filtered.json b/annotations_1/89FuExOuBbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7c5c7a8c56ffbbda19d53061452068ffcf79dae --- /dev/null +++ b/annotations_1/89FuExOuBbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.24], [19.0, 19.47], [21.0, 21.46], [26.0, 28.43], [49.0, 49.72], [51.0, 52.78], [55.0, 58.35], [59.0, 60.1], [63.0, 62.72], [65.0, 69.36], [71.0, 71.31], [73.0, 73.75], [75.0, 75.32], [75.0, 75.36], [75.0, 80.37], [82.0, 91.07], [105.0, 106.73], [108.0, 109.26], [118.0, 117.81], [119.0, 118.94], [119.0, 120.09], [130.0, 130.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.15, 0.0, 0.0, 38.88, 0.0, 0.0, 35.89, 0.0, 0.0, 0.0, 0.0, 34.23, 30.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 61.5], ["throbbing", 9.91], ["hum", 6.0]], null, null, [["speech", 38.29], ["mains hum", 21.33], ["hum", 16.08]], null, null, [["music", 37.77], ["throbbing", 26.07], ["hum", 16.14]], null, null, null, null, [["music", 62.65], ["speech", 7.18], ["hum", 5.69]], [["speech", 31.73], ["explosion", 22.23], ["burst, pop", 11.4]], null, null, null, null, null, null], "duration": [0.24, 0.47, 0.46, 2.43, 0.72, 1.78, 3.35, 1.1, -0.28, 4.36, 0.31, 0.75, 0.32, 0.36, 5.37, 9.07, 1.73, 1.26, -0.19, -0.06, 1.09, 0.15]} \ No newline at end of file diff --git a/annotations_1/89OqkIyNnfQ_filtered.json b/annotations_1/89OqkIyNnfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79ea4845c62e5878edeb14d25194e2213f23c991 --- /dev/null +++ b/annotations_1/89OqkIyNnfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 50.75], [53.0, 78.88], [89.0, 91.35], [92.0, 94.78], [102.0, 111.57], [112.0, 136.51], [142.0, 142.06], [142.0, 151.19]], "keep_status": [false, false, true, true, true, true, false, true], "silence_prob": [0.0, 28.66, 28.42, 28.48, 28.6, 29.0, 0.0, 29.04], "audiomae_on_audioset": [null, [["music", 62.67], ["buzz", 7.23], ["mains hum", 4.76]], [["music", 28.91], ["static", 5.82], ["musical instrument", 5.41]], [["music", 34.75], ["cacophony", 13.98], ["hum", 4.79]], [["music", 36.63], ["throbbing", 17.96], ["hum", 9.35]], [["music", 37.86], ["hum", 12.07], ["mains hum", 10.45]], null, [["music", 45.54], ["didgeridoo", 5.79], ["speech", 5.01]]], "duration": [36.75, 25.88, 2.35, 2.78, 9.57, 24.51, 0.06, 9.19]} \ No newline at end of file diff --git a/annotations_1/89RJwGDFpC4_filtered.json b/annotations_1/89RJwGDFpC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5814a0b591d81d42cf52e8c5418eb869801e82b0 --- /dev/null +++ b/annotations_1/89RJwGDFpC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.49], [15.0, 16.33], [17.0, 18.01], [21.0, 22.25], [25.0, 25.29], [27.0, 28.59], [33.0, 35.4], [36.0, 41.25], [52.0, 53.97], [55.0, 54.73], [55.0, 54.8], [55.0, 54.9], [56.0, 57.74], [62.0, 63.75], [64.0, 64.45], [69.0, 68.74], [70.0, 70.12], [72.0, 78.83], [80.0, 83.22], [85.0, 86.16], [91.0, 92.74], [101.0, 106.79], [111.0, 111.42], [112.0, 134.3], [135.0, 139.77], [143.0, 145.22]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [36.85, 0.0, 0.0, 0.0, 0.0, 0.0, 49.27, 32.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.4, 32.85, 0.0, 0.0, 34.05, 0.0, 32.37, 32.85, 55.67], "audiomae_on_audioset": [[["speech", 43.82], ["music", 31.34], ["moo", 1.29]], null, null, null, null, null, [["music", 52.1], ["buzz", 14.14], ["insect", 2.04]], [["music", 69.09], ["speech", 7.48], ["frog", 4.51]], null, null, null, null, null, null, null, null, null, [["music", 55.6], ["boing", 22.44], ["ding", 3.71]], [["music", 60.88], ["foghorn", 11.0], ["brass instrument", 2.17]], null, null, [["music", 43.79], ["boing", 7.83], ["musical instrument", 7.04]], null, [["music", 69.63], ["animal", 4.9], ["quack", 4.18]], [["music", 49.67], ["fart", 6.94], ["groan", 5.01]], null], "duration": [2.49, 1.33, 1.01, 1.25, 0.29, 1.59, 2.4, 5.25, 1.97, -0.27, -0.2, -0.1, 1.74, 1.75, 0.45, -0.26, 0.12, 6.83, 3.22, 1.16, 1.74, 5.79, 0.42, 22.3, 4.77, 2.22]} \ No newline at end of file diff --git a/annotations_1/8CZcZ_b-Cmg_filtered.json b/annotations_1/8CZcZ_b-Cmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7688129e0900a7ff18a4d639147a5de670e13788 --- /dev/null +++ b/annotations_1/8CZcZ_b-Cmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 22.87], [25.0, 25.42], [29.0, 30.91], [32.0, 34.28], [36.0, 45.05], [45.0, 68.13], [73.0, 81.97]], "keep_status": [false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 45.88, 44.84, 39.38, 33.55], "audiomae_on_audioset": [null, null, null, [["hum", 29.98], ["throbbing", 14.13], ["mains hum", 13.09]], [["hum", 29.0], ["music", 23.41], ["mains hum", 7.28]], [["music", 53.5], ["speech", 21.35], ["wind instrument, woodwind instrument", 8.5]], [["music", 53.64], ["musical instrument", 7.54], ["orchestra", 4.95]]], "duration": [-0.13, 0.42, 1.91, 2.28, 9.05, 23.13, 8.97]} \ No newline at end of file diff --git a/annotations_1/8CcVO0mQ1go_filtered.json b/annotations_1/8CcVO0mQ1go_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6f0fb987b07cc786c9ef2e20e80079b36cbfb79 --- /dev/null +++ b/annotations_1/8CcVO0mQ1go_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.89], [5.0, 6.35], [11.0, 10.98], [30.0, 39.02], [43.0, 44.79], [50.0, 52.96], [53.0, 65.62], [67.0, 66.9], [71.0, 72.77], [74.0, 74.61], [77.0, 77.72], [82.0, 83.37], [84.0, 93.19], [101.0, 100.87], [104.0, 105.7], [112.0, 113.98], [118.0, 120.95], [125.0, 127.11], [129.0, 131.04], [132.0, 133.64], [135.0, 146.13], [147.0, 146.94], [148.0, 149.07], [150.0, 152.44], [153.0, 153.79], [155.0, 158.08], [165.0, 167.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 50.86, 0.0, 43.66, 38.05, 0.0, 0.0, 0.0, 0.0, 0.0, 34.51, 0.0, 0.0, 0.0, 34.77, 48.52, 52.86, 0.0, 30.48, 0.0, 0.0, 31.71, 0.0, 31.22, 31.61], "audiomae_on_audioset": [null, null, null, null, null, [["music", 44.58], ["throbbing", 28.62], ["hum", 8.14]], [["music", 50.36], ["hum", 14.8], ["throbbing", 9.09]], null, null, null, null, null, [["music", 50.26], ["hum", 16.25], ["ambient music", 6.15]], null, null, null, [["music", 30.2], ["hum", 12.83], ["gong", 10.68]], [["music", 71.99], ["hum", 5.76], ["electronic music", 3.97]], null, null, [["music", 54.53], ["didgeridoo", 12.9], ["theremin", 6.64]], null, null, [["music", 50.68], ["theremin", 12.8], ["hum", 3.06]], null, [["music", 66.45], ["whale vocalization", 8.91], ["theremin", 4.81]], [["foghorn", 27.77], ["music", 22.42], ["speech", 8.15]]], "duration": [0.89, 1.35, -0.02, 9.02, 1.79, 2.96, 12.62, -0.1, 1.77, 0.61, 0.72, 1.37, 9.19, -0.13, 1.7, 1.98, 2.95, 2.11, 2.04, 1.64, 11.13, -0.06, 1.07, 2.44, 0.79, 3.08, 2.78]} \ No newline at end of file diff --git a/annotations_1/8CouO6czPic_filtered.json b/annotations_1/8CouO6czPic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5710b9aeebe81cbd7f7895346cc67be3d09b8305 --- /dev/null +++ b/annotations_1/8CouO6czPic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.86], [3.0, 2.93], [5.0, 11.92], [13.0, 15.55], [16.0, 18.71], [23.0, 27.28], [28.0, 28.93], [29.0, 30.18], [42.0, 54.01], [57.0, 57.81], [62.0, 62.58], [65.0, 71.52], [75.0, 103.69], [106.0, 107.49], [110.0, 110.46], [114.0, 114.67], [117.0, 117.93], [122.0, 123.58], [127.0, 140.83], [142.0, 141.91], [143.0, 145.4], [148.0, 149.28], [151.0, 153.23]], "keep_status": [false, false, true, true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 31.75, 30.19, 31.05, 29.39, 0.0, 0.0, 30.14, 0.0, 0.0, 37.62, 31.79, 0.0, 0.0, 0.0, 0.0, 0.0, 50.41, 0.0, 47.39, 0.0, 40.79], "audiomae_on_audioset": [null, null, [["music", 48.84], ["theremin", 13.51], ["didgeridoo", 5.7]], [["music", 15.31], ["foghorn", 10.26], ["didgeridoo", 6.87]], [["music", 61.8], ["musical instrument", 7.04], ["strum", 2.21]], [["foghorn", 36.67], ["electric shaver, electric razor", 7.04], ["music", 6.7]], null, null, [["music", 41.08], ["brass instrument", 18.2], ["trombone", 9.93]], null, null, [["music", 62.34], ["musical instrument", 5.94], ["foghorn", 4.64]], [["music", 56.48], ["brass instrument", 10.93], ["musical instrument", 8.31]], null, null, null, null, null, null, null, [["music", 28.3], ["speech", 19.31], ["didgeridoo", 17.46]], null, [["music", 29.66], ["hum", 7.93], ["mains hum", 6.23]]], "duration": [-0.14, -0.07, 6.92, 2.55, 2.71, 4.28, 0.93, 1.18, 12.01, 0.81, 0.58, 6.52, 28.69, 1.49, 0.46, 0.67, 0.93, 1.58, 13.83, -0.09, 2.4, 1.28, 2.23]} \ No newline at end of file diff --git a/annotations_1/8Cyv7f65bbY_filtered.json b/annotations_1/8Cyv7f65bbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cd39751ffdd5f960bd3798fdd33bf6902f2a4d1 --- /dev/null +++ b/annotations_1/8Cyv7f65bbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.45], [7.0, 10.79], [11.0, 11.92], [13.0, 19.09], [21.0, 32.95], [34.0, 36.05], [37.0, 45.33], [46.0, 46.63], [48.0, 60.29], [61.0, 66.97], [68.0, 70.58], [72.0, 74.12], [75.0, 85.72], [87.0, 87.12], [87.0, 88.23], [90.0, 91.49], [95.0, 95.74], [97.0, 100.04], [101.0, 102.34], [103.0, 109.11], [109.0, 121.71]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [78.55, 72.01, 0.0, 61.18, 44.6, 90.78, 85.17, 0.0, 51.5, 40.88, 98.86, 100.0, 79.24, 0.0, 0.0, 0.0, 0.0, 92.8, 0.0, 78.89, 43.05], "audiomae_on_audioset": [null, null, null, null, [["music", 27.26], ["mains hum", 23.7], ["hum", 20.39]], null, null, null, null, [["speech", 41.17], ["sine wave", 8.38], ["hum", 7.38]], null, null, null, null, null, null, null, null, null, null, [["hum", 20.69], ["speech", 11.99], ["sine wave", 11.62]]], "duration": [2.45, 3.79, 0.92, 6.09, 11.95, 2.05, 8.33, 0.63, 12.29, 5.97, 2.58, 2.12, 10.72, 0.12, 1.23, 1.49, 0.74, 3.04, 1.34, 6.11, 12.71]} \ No newline at end of file diff --git a/annotations_1/8D7EY0zKevM_filtered.json b/annotations_1/8D7EY0zKevM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aa4873381417a33d5e0b4370ccf44928527701f --- /dev/null +++ b/annotations_1/8D7EY0zKevM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.75], [16.0, 18.12], [26.0, 33.37], [34.0, 34.37], [37.0, 38.53], [39.0, 41.72], [47.0, 47.7], [58.0, 57.79], [59.0, 61.53], [67.0, 67.39], [69.0, 69.35], [71.0, 71.04], [72.0, 73.25], [78.0, 78.21], [83.0, 83.69], [87.0, 87.52], [89.0, 89.11], [93.0, 96.48], [100.0, 100.84], [105.0, 107.67], [110.0, 124.68], [127.0, 127.14], [129.0, 134.57], [138.0, 141.37], [145.0, 145.2]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, true, true, false], "silence_prob": [0.0, 31.03, 76.53, 0.0, 0.0, 48.19, 0.0, 0.0, 40.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.02, 0.0, 36.25, 30.83, 0.0, 29.5, 29.57, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 37.77], ["mosquito", 21.63], ["insect", 10.97]], null, null, null, [["hum", 24.92], ["speech", 14.08], ["music", 13.94]], null, null, [["music", 18.98], ["speech", 11.13], ["beatboxing", 10.82]], null, null, null, null, null, null, null, null, [["roar", 17.93], ["wild animals", 13.29], ["speech", 11.56]], null, [["music", 50.62], ["throbbing", 9.45], ["electronic music", 6.15]], [["music", 49.9], ["speech", 23.45], ["buzz", 2.82]], null, [["music", 49.44], ["sidetone", 9.81], ["speech", 8.79]], [["music", 40.01], ["groan", 4.88], ["electronic music", 4.44]], null], "duration": [1.75, 2.12, 7.37, 0.37, 1.53, 2.72, 0.7, -0.21, 2.53, 0.39, 0.35, 0.04, 1.25, 0.21, 0.69, 0.52, 0.11, 3.48, 0.84, 2.67, 14.68, 0.14, 5.57, 3.37, 0.2]} \ No newline at end of file diff --git a/annotations_1/8DkbFJ3uz54_filtered.json b/annotations_1/8DkbFJ3uz54_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cca6a0176ea56358b1489471c1b4987f3ef0505 --- /dev/null +++ b/annotations_1/8DkbFJ3uz54_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [5.0, 8.13], [10.0, 10.03], [12.0, 12.85], [16.0, 15.97], [18.0, 19.18], [20.0, 20.73], [21.0, 21.63], [22.0, 22.47], [26.0, 25.83], [39.0, 40.09], [43.0, 46.14], [48.0, 55.44], [59.0, 62.82], [65.0, 67.68], [70.0, 76.3], [77.0, 81.94], [85.0, 94.71], [97.0, 97.78], [99.0, 99.81], [100.0, 102.76], [103.0, 111.23], [111.0, 113.43], [116.0, 117.31], [120.0, 128.31], [132.0, 131.72], [144.0, 144.46], [149.0, 150.38], [151.0, 155.04]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 39.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.4, 35.71, 50.56, 60.14, 39.93, 78.72, 31.01, 0.0, 0.0, 33.9, 32.25, 36.07, 0.0, 47.2, 0.0, 0.0, 0.0, 99.96], "audiomae_on_audioset": [null, [["speech", 29.69], ["frog", 21.64], ["animal", 9.14]], null, null, null, null, null, null, null, null, null, [["music", 23.41], ["breaking", 12.19], ["hum", 8.3]], [["music", 57.0], ["throbbing", 9.23], ["hum", 6.51]], null, null, [["music", 56.69], ["speech", 19.1], ["musical instrument", 8.86]], null, [["music", 63.48], ["speech", 12.31], ["boing", 2.23]], null, null, [["music", 48.3], ["sheep", 17.31], ["bleat", 15.9]], [["music", 43.91], ["groan", 33.0], ["speech", 4.21]], [["speech", 24.56], ["sine wave", 13.11], ["chirp tone", 12.29]], null, [["speech", 46.09], ["clang", 12.57], ["throbbing", 7.39]], null, null, null, null], "duration": [0.51, 3.13, 0.03, 0.85, -0.03, 1.18, 0.73, 0.63, 0.47, -0.17, 1.09, 3.14, 7.44, 3.82, 2.68, 6.3, 4.94, 9.71, 0.78, 0.81, 2.76, 8.23, 2.43, 1.31, 8.31, -0.28, 0.46, 1.38, 4.04]} \ No newline at end of file diff --git a/annotations_1/8DrF70mcr38_filtered.json b/annotations_1/8DrF70mcr38_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c66285f10343ff207df7e94a27b03f4bc0d95ca --- /dev/null +++ b/annotations_1/8DrF70mcr38_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.43], [7.0, 8.23], [12.0, 14.22], [16.0, 20.8], [23.0, 23.75], [25.0, 28.29], [30.0, 30.2], [32.0, 33.12], [34.0, 34.74], [36.0, 36.68], [41.0, 41.5], [45.0, 46.74], [48.0, 50.08], [56.0, 56.66], [58.0, 58.4], [61.0, 61.67], [66.0, 66.72], [70.0, 71.34], [77.0, 77.65], [81.0, 80.82], [83.0, 83.83], [87.0, 87.29], [88.0, 92.3], [93.0, 93.95], [96.0, 96.92], [99.0, 106.95], [107.0, 110.35], [114.0, 114.99], [123.0, 123.6], [132.0, 132.02], [133.0, 133.1], [134.0, 134.55], [135.0, 141.72], [143.0, 142.99], [143.0, 144.12], [147.0, 148.73]], "keep_status": [false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 47.58, 45.65, 0.0, 42.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.36, 0.0, 0.0, 69.07, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 45.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["whistling", 20.16], ["radio", 5.59], ["speech", 4.92]], [["glass", 10.88], ["music", 9.96], ["hum", 6.61]], null, [["speech", 12.29], ["animal", 5.78], ["noise", 4.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fowl", 28.79], ["fly, housefly", 14.71], ["speech", 14.35]], null, null, null], "duration": [0.43, 1.23, 2.22, 4.8, 0.75, 3.29, 0.2, 1.12, 0.74, 0.68, 0.5, 1.74, 2.08, 0.66, 0.4, 0.67, 0.72, 1.34, 0.65, -0.18, 0.83, 0.29, 4.3, 0.95, 0.92, 7.95, 3.35, 0.99, 0.6, 0.02, 0.1, 0.55, 6.72, -0.01, 1.12, 1.73]} \ No newline at end of file diff --git a/annotations_1/8Ds9R9puftI_filtered.json b/annotations_1/8Ds9R9puftI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..721c75f2f35cf787c24f4c4dbe22b2daf3c30590 --- /dev/null +++ b/annotations_1/8Ds9R9puftI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.12], [13.0, 12.78], [15.0, 14.96], [16.0, 16.36], [22.0, 22.94], [47.0, 49.01], [52.0, 57.7], [58.0, 58.01], [58.0, 65.89], [67.0, 66.9], [67.0, 67.8], [69.0, 69.6], [71.0, 77.45], [78.0, 79.03], [80.0, 80.42], [84.0, 85.83], [88.0, 88.32], [89.0, 89.7], [90.0, 92.97], [94.0, 94.86], [96.0, 99.52], [107.0, 106.68], [107.0, 107.91], [109.0, 108.7], [121.0, 125.49], [127.0, 139.04], [146.0, 146.99], [151.0, 152.04], [154.0, 154.74], [158.0, 158.38], [160.0, 160.14], [161.0, 161.82], [164.0, 164.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 75.07, 48.14, 0.0, 70.58, 0.0, 0.0, 0.0, 34.28, 0.0, 0.0, 0.0, 0.0, 0.0, 34.88, 0.0, 33.05, 0.0, 0.0, 0.0, 33.48, 28.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 46.7], ["guitar", 18.17], ["musical instrument", 9.06]], null, null, null, null, null, [["music", 51.06], ["didgeridoo", 11.56], ["speech", 8.64]], null, null, null, null, null, [["sidetone", 27.12], ["music", 26.54], ["speech", 16.53]], null, [["music", 28.4], ["throbbing", 15.12], ["hum", 10.47]], null, null, null, [["music", 64.21], ["thunk", 18.39], ["musical instrument", 1.63]], [["music", 64.17], ["speech", 5.48], ["groan", 4.8]], null, null, null, null, null, null, null], "duration": [1.12, -0.22, -0.04, 0.36, 0.94, 2.01, 5.7, 0.01, 7.89, -0.1, 0.8, 0.6, 6.45, 1.03, 0.42, 1.83, 0.32, 0.7, 2.97, 0.86, 3.52, -0.32, 0.91, -0.3, 4.49, 12.04, 0.99, 1.04, 0.74, 0.38, 0.14, 0.82, 0.03]} \ No newline at end of file diff --git a/annotations_1/8FHO7Ry4_Jc_filtered.json b/annotations_1/8FHO7Ry4_Jc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2144cb86734c1c1acd24c5446de82f9fded79f09 --- /dev/null +++ b/annotations_1/8FHO7Ry4_Jc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.78], [6.0, 6.45], [18.0, 18.37], [22.0, 23.4], [23.0, 23.46], [24.0, 25.03], [26.0, 26.03], [28.0, 31.67], [33.0, 33.32], [34.0, 35.33], [38.0, 38.01], [42.0, 42.97], [73.0, 73.74], [79.0, 82.05], [84.0, 89.94], [92.0, 94.9]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 51.82, 68.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["noise", 17.45], ["theremin", 6.16], ["telephone", 4.82]], null, null, null, null, null, null, null, null], "duration": [-0.22, 0.45, 0.37, 1.4, 0.46, 1.03, 0.03, 3.67, 0.32, 1.33, 0.01, 0.97, 0.74, 3.05, 5.94, 2.9]} \ No newline at end of file diff --git a/annotations_1/8H_aePfIMzQ_filtered.json b/annotations_1/8H_aePfIMzQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a6b656990f87225ec0fac25d8b3b84b7054dc05 --- /dev/null +++ b/annotations_1/8H_aePfIMzQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.42], [18.0, 23.87], [25.0, 25.71], [27.0, 31.06], [33.0, 37.69], [40.0, 40.8], [45.0, 47.68], [48.0, 47.71], [48.0, 48.2], [48.0, 52.69], [58.0, 60.13], [61.0, 76.52], [83.0, 82.88], [86.0, 89.75], [94.0, 95.35], [98.0, 99.01], [105.0, 105.97], [112.0, 112.53]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [38.75, 44.2, 0.0, 42.88, 42.86, 0.0, 34.17, 0.0, 0.0, 36.35, 35.62, 34.29, 0.0, 40.19, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 79.3], ["speech", 3.41], ["musical instrument", 1.5]], [["music", 65.85], ["speech", 6.06], ["musical instrument", 4.7]], null, [["music", 48.97], ["speech", 10.93], ["musical instrument", 3.94]], [["music", 55.69], ["speech", 17.42], ["electric shaver, electric razor", 3.35]], null, [["cattle, bovinae", 41.07], ["moo", 26.42], ["livestock, farm animals, working animals", 6.99]], null, null, [["music", 60.55], ["speech", 9.58], ["sidetone", 8.51]], [["music", 37.33], ["speech", 29.52], ["boing", 4.67]], [["music", 40.86], ["speech", 11.45], ["cattle, bovinae", 9.78]], null, [["music", 74.63], ["musical instrument", 4.15], ["didgeridoo", 2.93]], null, null, null, null], "duration": [9.42, 5.87, 0.71, 4.06, 4.69, 0.8, 2.68, -0.29, 0.2, 4.69, 2.13, 15.52, -0.12, 3.75, 1.35, 1.01, 0.97, 0.53]} \ No newline at end of file diff --git a/annotations_1/8IJEqeoPPs8_filtered.json b/annotations_1/8IJEqeoPPs8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42b6b60d9465cf395f1249874233697b6963d7b8 --- /dev/null +++ b/annotations_1/8IJEqeoPPs8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.38], [13.0, 14.82], [16.0, 16.92], [18.0, 19.09], [21.0, 20.98], [22.0, 22.33], [24.0, 52.59], [58.0, 67.05], [68.0, 69.63], [71.0, 101.82], [102.0, 101.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.09, 32.71, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 42.22], ["speech", 26.31], ["buzz", 2.08]], [["music", 60.71], ["mains hum", 13.2], ["hum", 7.88]], null, null, null], "duration": [1.38, 1.82, 0.92, 1.09, -0.02, 0.33, 28.59, 9.05, 1.63, 30.82, -0.1]} \ No newline at end of file diff --git a/annotations_1/8ILiVgno0_0_filtered.json b/annotations_1/8ILiVgno0_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c2cb5d3b64b6d7deaf7e8f60af09f1dfb3dcad8 --- /dev/null +++ b/annotations_1/8ILiVgno0_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.94], [3.0, 3.5], [8.0, 11.47], [12.0, 12.5], [13.0, 13.73], [16.0, 25.88], [26.0, 27.24], [30.0, 30.7], [32.0, 32.22], [41.0, 65.96], [67.0, 67.76], [68.0, 67.8], [68.0, 69.15], [69.0, 69.18], [69.0, 69.21], [69.0, 69.25], [73.0, 73.45], [74.0, 79.44], [80.0, 83.1], [84.0, 85.33], [89.0, 118.27], [119.0, 120.26], [122.0, 122.79], [125.0, 125.22], [130.0, 131.09], [133.0, 134.23], [137.0, 138.52], [144.0, 144.71], [148.0, 149.59]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 38.52, 0.0, 0.0, 37.84, 0.0, 0.0, 0.0, 31.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.6, 30.42, 0.0, 31.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 13.06], ["electric shaver, electric razor", 10.62], ["sheep", 8.01]], null, null, [["grunt", 80.76], ["speech", 15.24], ["buzz", 0.38]], null, null, null, [["music", 31.26], ["hum", 28.18], ["throbbing", 14.22]], null, null, null, null, null, null, null, [["music", 77.24], ["musical instrument", 2.75], ["singing", 2.01]], [["music", 57.15], ["moo", 7.32], ["cattle, bovinae", 5.86]], null, [["music", 85.65], ["theremin", 1.96], ["psychedelic rock", 1.42]], null, null, null, null, null, null, null, null], "duration": [-0.06, 0.5, 3.47, 0.5, 0.73, 9.88, 1.24, 0.7, 0.22, 24.96, 0.76, -0.2, 1.15, 0.18, 0.21, 0.25, 0.45, 5.44, 3.1, 1.33, 29.27, 1.26, 0.79, 0.22, 1.09, 1.23, 1.52, 0.71, 1.59]} \ No newline at end of file diff --git a/annotations_1/8INjmc-WWSY_filtered.json b/annotations_1/8INjmc-WWSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45036b43ed8cd5c72d9d2e62b90e84a873bb1c6d --- /dev/null +++ b/annotations_1/8INjmc-WWSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [4.0, 4.95], [6.0, 6.07], [14.0, 14.64], [15.0, 21.69], [30.0, 31.08], [34.0, 38.45], [39.0, 41.72], [42.0, 44.91], [45.0, 47.06], [53.0, 54.41], [56.0, 57.45], [58.0, 60.49], [61.0, 62.8], [63.0, 67.27], [68.0, 68.2], [69.0, 73.65], [74.0, 80.87], [81.0, 82.7], [84.0, 85.11], [87.0, 91.81], [93.0, 97.73], [98.0, 100.14], [101.0, 103.87], [105.0, 107.5], [108.0, 109.98], [111.0, 114.56], [115.0, 116.97], [118.0, 120.5], [121.0, 122.89], [123.0, 125.93], [126.0, 128.82], [130.0, 131.48], [132.0, 134.1], [136.0, 136.81], [137.0, 148.26], [149.0, 150.47], [152.0, 152.79], [154.0, 165.86], [167.0, 167.54], [168.0, 169.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 80.29, 93.6, 69.34, 98.19, 0.0, 0.0, 99.92, 0.0, 61.77, 0.0, 99.8, 99.1, 0.0, 0.0, 89.19, 99.93, 53.91, 99.52, 99.96, 0.0, 97.0, 0.0, 98.27, 0.0, 65.32, 66.63, 0.0, 73.82, 0.0, 59.07, 0.0, 0.0, 50.16, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 0.95, 0.07, 0.64, 6.69, 1.08, 4.45, 2.72, 2.91, 2.06, 1.41, 1.45, 2.49, 1.8, 4.27, 0.2, 4.65, 6.87, 1.7, 1.11, 4.81, 4.73, 2.14, 2.87, 2.5, 1.98, 3.56, 1.97, 2.5, 1.89, 2.93, 2.82, 1.48, 2.1, 0.81, 11.26, 1.47, 0.79, 11.86, 0.54, 1.77]} \ No newline at end of file diff --git a/annotations_1/8ISsNLwwmXg_filtered.json b/annotations_1/8ISsNLwwmXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea168f20a0c95a19130ae23666aa1b16e4d7d960 --- /dev/null +++ b/annotations_1/8ISsNLwwmXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.31], [2.0, 1.98], [3.0, 4.21], [5.0, 8.16], [9.0, 10.64], [13.0, 14.3], [17.0, 18.99], [21.0, 21.79], [27.0, 27.18], [32.0, 31.92], [34.0, 33.69], [35.0, 35.06], [36.0, 39.07], [40.0, 40.19], [41.0, 41.35], [43.0, 43.85], [48.0, 49.64], [52.0, 52.3], [55.0, 55.46], [57.0, 57.54], [63.0, 66.77], [67.0, 68.23], [69.0, 79.24], [81.0, 89.31], [90.0, 91.07], [95.0, 95.3], [104.0, 105.27], [106.0, 106.84], [107.0, 111.08], [112.0, 112.51], [113.0, 113.8], [115.0, 115.37]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 54.04, 57.56, 0.0, 0.0, 0.0, 0.0, 37.71, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 41.36], ["sidetone", 19.16], ["fly, housefly", 8.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.96], ["speech", 11.23], ["trombone", 7.9]], null, null, null], "duration": [0.31, -0.02, 1.21, 3.16, 1.64, 1.3, 1.99, 0.79, 0.18, -0.08, -0.31, 0.06, 3.07, 0.19, 0.35, 0.85, 1.64, 0.3, 0.46, 0.54, 3.77, 1.23, 10.24, 8.31, 1.07, 0.3, 1.27, 0.84, 4.08, 0.51, 0.8, 0.37]} \ No newline at end of file diff --git a/annotations_1/8ITOvb7Des0_filtered.json b/annotations_1/8ITOvb7Des0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b332d0e514db5e9e689f986251c9c3d37f5ef39e --- /dev/null +++ b/annotations_1/8ITOvb7Des0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.58], [23.0, 25.22], [26.0, 35.8], [36.0, 36.48], [45.0, 45.69], [47.0, 48.46], [53.0, 53.0], [53.0, 53.28], [63.0, 63.42], [68.0, 72.18], [74.0, 75.88], [79.0, 79.69], [83.0, 84.84], [89.0, 89.6], [91.0, 91.94], [92.0, 92.62], [95.0, 95.1], [96.0, 97.04]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.36, 69.61, 44.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.18], ["speech", 17.5], ["sidetone", 6.68]], null, [["speech", 43.29], ["music", 28.13], ["synthesizer", 6.87]], null, null, null, null, null, null, [["speech", 85.72], ["dial tone", 5.19], ["sidetone", 2.77]], null, null, null, null, null, null, null, null], "duration": [3.58, 2.22, 9.8, 0.48, 0.69, 1.46, 0.0, 0.28, 0.42, 4.18, 1.88, 0.69, 1.84, 0.6, 0.94, 0.62, 0.1, 1.04]} \ No newline at end of file diff --git a/annotations_1/8JhRzlsZPas_filtered.json b/annotations_1/8JhRzlsZPas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1634a1e57a508328a563ec737d962d31186e1c0 --- /dev/null +++ b/annotations_1/8JhRzlsZPas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.01], [9.0, 11.06], [12.0, 13.09], [15.0, 16.87], [18.0, 18.82], [21.0, 21.88], [24.0, 26.27], [28.0, 29.67], [31.0, 33.64], [35.0, 35.58], [36.0, 37.02], [38.0, 39.19], [40.0, 44.64], [45.0, 45.98], [47.0, 48.29], [50.0, 51.81], [53.0, 54.4], [56.0, 57.81], [58.0, 58.46], [60.0, 62.21], [63.0, 64.79], [66.0, 68.25], [69.0, 70.98], [73.0, 73.75], [76.0, 77.68], [78.0, 80.32], [82.0, 83.94], [86.0, 86.31], [89.0, 92.6], [94.0, 95.77], [98.0, 99.12], [104.0, 104.65], [106.0, 106.51], [108.0, 108.16], [109.0, 110.84], [112.0, 111.89], [113.0, 114.89], [117.0, 122.52], [123.0, 127.74], [129.0, 131.36], [132.0, 141.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 54.1, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 50.71, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 51.23, 87.92, 80.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 2.06, 1.09, 1.87, 0.82, 0.88, 2.27, 1.67, 2.64, 0.58, 1.02, 1.19, 4.64, 0.98, 1.29, 1.81, 1.4, 1.81, 0.46, 2.21, 1.79, 2.25, 1.98, 0.75, 1.68, 2.32, 1.94, 0.31, 3.6, 1.77, 1.12, 0.65, 0.51, 0.16, 1.84, -0.11, 1.89, 5.52, 4.74, 2.36, 9.78]} \ No newline at end of file diff --git a/annotations_1/8Lv0BuXTgoY_filtered.json b/annotations_1/8Lv0BuXTgoY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb7106e5bf5c78cb6bacc18b6476799c6c6fa06f --- /dev/null +++ b/annotations_1/8Lv0BuXTgoY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 17.37], [18.0, 18.33], [21.0, 21.51], [22.0, 36.15], [37.0, 56.34], [57.0, 68.93], [72.0, 73.89], [80.0, 107.5], [115.0, 130.23]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [29.36, 0.0, 0.0, 29.43, 29.29, 29.32, 0.0, 29.55, 29.68], "audiomae_on_audioset": [[["speech", 40.8], ["music", 27.12], ["hum", 8.65]], null, null, [["music", 36.75], ["speech", 35.97], ["throbbing", 6.07]], [["speech", 48.2], ["music", 25.74], ["vehicle", 6.44]], [["speech", 29.63], ["throbbing", 23.2], ["hum", 18.6]], null, [["speech", 38.88], ["music", 23.06], ["vehicle", 13.29]], [["music", 39.99], ["speech", 31.23], ["hum", 8.39]]], "duration": [11.37, 0.33, 0.51, 14.15, 19.34, 11.93, 1.89, 27.5, 15.23]} \ No newline at end of file diff --git a/annotations_1/8M1kdeDluRE_filtered.json b/annotations_1/8M1kdeDluRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/8M1kdeDluRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/8N9oQUJJstQ_filtered.json b/annotations_1/8N9oQUJJstQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ba8862fd14b96bab886e86ceb106f870c2521de --- /dev/null +++ b/annotations_1/8N9oQUJJstQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 72.3], [73.0, 73.43], [74.0, 151.83], [156.0, 174.45]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 32.67], "audiomae_on_audioset": [null, null, null, [["music", 40.77], ["didgeridoo", 11.61], ["hum", 7.92]]], "duration": [1.3, 0.43, 77.83, 18.45]} \ No newline at end of file diff --git a/annotations_1/8NZ9CLszc_g_filtered.json b/annotations_1/8NZ9CLszc_g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/8NZ9CLszc_g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/8O9FIRPJRXc_filtered.json b/annotations_1/8O9FIRPJRXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c25f0e59bff3feb94f02047f6bdb0fe011a3e1d5 --- /dev/null +++ b/annotations_1/8O9FIRPJRXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 23.31], [25.0, 109.31], [112.0, 122.94], [123.0, 137.59], [140.0, 141.37], [142.0, 142.18]], "keep_status": [false, false, false, false, false, false], "silence_prob": [30.88, 0.0, 30.35, 30.87, 0.0, 0.0], "audiomae_on_audioset": [[["music", 75.41], ["musical instrument", 3.22], ["guitar", 3.06]], null, [["music", 75.1], ["trombone", 2.65], ["musical instrument", 2.61]], [["music", 70.39], ["trombone", 9.01], ["brass instrument", 4.83]], null, null], "duration": [10.31, 84.31, 10.94, 14.59, 1.37, 0.18]} \ No newline at end of file diff --git a/annotations_1/8OS1xorvbAs_filtered.json b/annotations_1/8OS1xorvbAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..868569484a38a5411d616747f4b861c2d72166a3 --- /dev/null +++ b/annotations_1/8OS1xorvbAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.42], [13.0, 12.7], [13.0, 21.96], [23.0, 23.57], [36.0, 39.33], [53.0, 54.36], [59.0, 60.88], [69.0, 72.32], [75.0, 74.88], [76.0, 81.84], [82.0, 84.57], [88.0, 89.13], [89.0, 92.06], [96.0, 96.35], [98.0, 98.91], [107.0, 109.05], [120.0, 121.47], [122.0, 123.63], [127.0, 129.56]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 38.58, 0.0, 57.4, 0.0, 0.0, 41.07, 0.0, 30.9, 36.19, 0.0, 30.59, 0.0, 0.0, 52.8, 0.0, 0.0, 41.72], "audiomae_on_audioset": [null, null, [["speech", 39.93], ["sidetone", 14.5], ["radio", 6.53]], null, null, null, null, [["speech", 15.96], ["hiccup", 11.93], ["frog", 11.62]], null, [["speech", 32.32], ["explosion", 28.82], ["burst, pop", 20.67]], [["speech", 55.26], ["busy signal", 20.39], ["sine wave", 6.76]], null, [["speech", 50.39], ["thunk", 6.34], ["whack, thwack", 5.01]], null, null, null, null, null, [["speech", 27.06], ["fart", 11.53], ["electric shaver, electric razor", 7.32]]], "duration": [0.42, -0.3, 8.96, 0.57, 3.33, 1.36, 1.88, 3.32, -0.12, 5.84, 2.57, 1.13, 3.06, 0.35, 0.91, 2.05, 1.47, 1.63, 2.56]} \ No newline at end of file diff --git a/annotations_1/8OilisaAv0I_filtered.json b/annotations_1/8OilisaAv0I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8a4aa618ae17da4a7911fa4caa508d102a47bb7 --- /dev/null +++ b/annotations_1/8OilisaAv0I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.3], [15.0, 15.28], [18.0, 18.35], [20.0, 20.75], [27.0, 32.22], [33.0, 34.67], [35.0, 37.47], [40.0, 42.33], [43.0, 46.7], [47.0, 48.84], [50.0, 51.93], [53.0, 54.48], [55.0, 57.7], [60.0, 62.97], [64.0, 67.68], [69.0, 75.25], [76.0, 96.09], [98.0, 117.83]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 50.86, 0.0, 46.26, 79.59, 46.43, 0.0, 0.0, 0.0, 40.4, 49.09, 51.66, 51.99, 33.38, 32.14], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 39.44], ["speech", 17.5], ["throbbing", 12.96]], null, [["hum", 45.57], ["throbbing", 38.51], ["mains hum", 2.79]], null, null, null, [["speech", 34.89], ["whale vocalization", 22.44], ["music", 18.51]], [["hum", 29.13], ["music", 20.85], ["rumble", 15.96]], null, null, [["hum", 60.71], ["mains hum", 16.95], ["throbbing", 14.23]], [["hum", 18.79], ["speech", 16.46], ["throbbing", 15.58]]], "duration": [1.3, 0.28, 0.35, 0.75, 5.22, 1.67, 2.47, 2.33, 3.7, 1.84, 1.93, 1.48, 2.7, 2.97, 3.68, 6.25, 20.09, 19.83]} \ No newline at end of file diff --git a/annotations_1/8Ojsvc_KsDY_filtered.json b/annotations_1/8Ojsvc_KsDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37ad204378f379c086456e5f6534ce810d3a28ba --- /dev/null +++ b/annotations_1/8Ojsvc_KsDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.78], [3.0, 3.57], [5.0, 6.1], [7.0, 8.61], [10.0, 10.84], [12.0, 13.27], [14.0, 14.84], [16.0, 18.18], [19.0, 19.47], [22.0, 22.4], [24.0, 25.0], [28.0, 29.56], [30.0, 30.92], [31.0, 31.41], [39.0, 39.21], [41.0, 47.34], [49.0, 49.5], [51.0, 56.46], [57.0, 58.53], [62.0, 64.13], [66.0, 68.3], [69.0, 75.86], [78.0, 82.22], [96.0, 96.69], [98.0, 98.61], [101.0, 101.75], [111.0, 111.57], [118.0, 117.98], [119.0, 119.11], [127.0, 127.68], [130.0, 131.14], [132.0, 134.84], [136.0, 136.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.71, 0.0, 75.39, 0.0, 89.54, 99.98, 81.17, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 0.57, 1.1, 1.61, 0.84, 1.27, 0.84, 2.18, 0.47, 0.4, 1.0, 1.56, 0.92, 0.41, 0.21, 6.34, 0.5, 5.46, 1.53, 2.13, 2.3, 6.86, 4.22, 0.69, 0.61, 0.75, 0.57, -0.02, 0.11, 0.68, 1.14, 2.84, 0.88]} \ No newline at end of file diff --git a/annotations_1/8PALGqaFoFI_filtered.json b/annotations_1/8PALGqaFoFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01331b3839ef3da3cc4aeb729203c338d2133ff6 --- /dev/null +++ b/annotations_1/8PALGqaFoFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.45], [21.0, 45.39], [47.0, 88.99], [92.0, 92.37], [96.0, 96.25], [97.0, 99.06], [102.0, 101.61], [105.0, 151.58]], "keep_status": [false, true, false, false, false, true, false, false], "silence_prob": [0.0, 34.04, 0.0, 0.0, 0.0, 36.52, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 36.26], ["hum", 19.27], ["mains hum", 12.31]], null, null, null, [["sidetone", 23.04], ["music", 16.84], ["boing", 9.54]], null, null], "duration": [0.45, 24.39, 41.99, 0.37, 0.25, 2.06, -0.39, 46.58]} \ No newline at end of file diff --git a/annotations_1/8Pd2fpoD0Xg_filtered.json b/annotations_1/8Pd2fpoD0Xg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67f4a6c30299ae105438b7d0b694cf6785ea55de --- /dev/null +++ b/annotations_1/8Pd2fpoD0Xg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.32], [8.0, 8.46], [14.0, 14.4], [15.0, 15.85], [17.0, 17.83], [28.0, 28.56], [29.0, 28.93], [29.0, 30.96], [34.0, 34.64], [37.0, 37.4], [43.0, 43.51], [47.0, 47.21], [48.0, 49.44], [52.0, 61.37], [64.0, 64.34], [77.0, 78.26], [84.0, 84.13], [91.0, 91.93], [93.0, 94.83], [96.0, 96.57], [100.0, 99.98], [100.0, 101.93], [105.0, 107.96], [111.0, 111.38], [113.0, 113.16], [115.0, 115.48], [118.0, 118.71], [120.0, 119.85], [122.0, 122.66], [127.0, 130.57], [135.0, 136.05], [138.0, 141.32], [141.0, 142.03], [144.0, 143.94], [145.0, 145.37], [149.0, 149.69], [161.0, 165.48], [167.0, 167.54], [169.0, 169.47], [175.0, 180.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 51.71, 0.0, 0.0, 0.0, 0.0, 43.25, 0.0, 0.0, 50.41], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.99], ["hum", 11.52], ["sidetone", 7.48]], null, null, null], "duration": [1.32, 0.46, 0.4, 0.85, 0.83, 0.56, -0.07, 1.96, 0.64, 0.4, 0.51, 0.21, 1.44, 9.37, 0.34, 1.26, 0.13, 0.93, 1.83, 0.57, -0.02, 1.93, 2.96, 0.38, 0.16, 0.48, 0.71, -0.15, 0.66, 3.57, 1.05, 3.32, 1.03, -0.06, 0.37, 0.69, 4.48, 0.54, 0.47, 5.01]} \ No newline at end of file diff --git a/annotations_1/8Q0KYSXhKMU_filtered.json b/annotations_1/8Q0KYSXhKMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c13fd83af0b576c6666847bb725fc2082fff3e1a --- /dev/null +++ b/annotations_1/8Q0KYSXhKMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[78.0, 81.63], [83.0, 92.74], [93.0, 93.6], [96.0, 113.9], [116.0, 123.45], [125.0, 132.46], [134.0, 152.61], [155.0, 179.83]], "keep_status": [false, false, false, true, true, true, true, false], "silence_prob": [29.11, 30.24, 0.0, 29.83, 29.61, 29.62, 31.34, 28.98], "audiomae_on_audioset": [[["speech", 66.46], ["sound effect", 3.26], ["roar", 3.12]], [["music", 37.21], ["hum", 18.22], ["throbbing", 14.98]], null, [["grunt", 33.69], ["breaking", 15.18], ["sound effect", 10.5]], [["music", 38.94], ["hum", 11.76], ["mains hum", 11.06]], [["music", 53.05], ["rumble", 7.39], ["hum", 4.85]], [["music", 26.75], ["hum", 11.05], ["synthesizer", 8.42]], [["music", 28.3], ["mains hum", 28.02], ["hum", 19.75]]], "duration": [3.63, 9.74, 0.6, 17.9, 7.45, 7.46, 18.61, 24.83]} \ No newline at end of file diff --git a/annotations_1/8Q2WgdOSfms_filtered.json b/annotations_1/8Q2WgdOSfms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8166d2e1ba174847969d3e65aa790c7168956db --- /dev/null +++ b/annotations_1/8Q2WgdOSfms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.69], [12.0, 13.15], [14.0, 14.45], [15.0, 15.62], [18.0, 18.49], [22.0, 22.67], [25.0, 25.05], [32.0, 33.3], [34.0, 36.12], [36.0, 36.59], [55.0, 55.53], [56.0, 59.56], [67.0, 68.01], [80.0, 80.81], [82.0, 82.68], [84.0, 93.19], [95.0, 96.74], [100.0, 100.85], [103.0, 103.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.1, 0.0, 0.0, 70.44, 0.0, 0.0, 0.0, 52.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 1.15, 0.45, 0.62, 0.49, 0.67, 0.05, 1.3, 2.12, 0.59, 0.53, 3.56, 1.01, 0.81, 0.68, 9.19, 1.74, 0.85, 0.33]} \ No newline at end of file diff --git a/annotations_1/8QzFJA3QM7E_filtered.json b/annotations_1/8QzFJA3QM7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a92424e8f309df4913f86101cd01a30d6bb2cf3e --- /dev/null +++ b/annotations_1/8QzFJA3QM7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.52], [21.0, 20.95], [29.0, 33.24], [48.0, 47.93], [57.0, 59.68], [60.0, 61.52], [64.0, 64.22], [65.0, 66.36], [67.0, 68.15], [77.0, 81.43], [82.0, 82.34], [84.0, 84.16], [85.0, 87.35], [93.0, 94.86], [95.0, 96.52], [101.0, 101.55], [103.0, 106.42], [107.0, 108.65], [112.0, 112.38], [113.0, 118.61], [123.0, 127.35], [129.0, 130.76], [133.0, 133.51], [137.0, 138.89], [143.0, 143.36], [151.0, 151.7], [153.0, 156.32], [157.0, 158.72], [161.0, 170.53], [172.0, 173.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.62, 0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 89.9, 0.0, 0.0, 47.54, 0.0, 0.0, 0.0, 80.46, 0.0, 0.0, 82.97, 74.29, 0.0, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 87.55, 0.0], "audiomae_on_audioset": [null, null, [["speech", 83.31], ["whale vocalization", 1.91], ["hum", 0.84]], null, null, null, null, null, null, null, null, null, [["speech", 22.15], ["glass", 21.93], ["tuning fork", 16.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, -0.05, 4.24, -0.07, 2.68, 1.52, 0.22, 1.36, 1.15, 4.43, 0.34, 0.16, 2.35, 1.86, 1.52, 0.55, 3.42, 1.65, 0.38, 5.61, 4.35, 1.76, 0.51, 1.89, 0.36, 0.7, 3.32, 1.72, 9.53, 1.1]} \ No newline at end of file diff --git a/annotations_1/8R8mxS2E_UQ_filtered.json b/annotations_1/8R8mxS2E_UQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0286d6252c7651a2cb2de2c84df68307db6f0654 --- /dev/null +++ b/annotations_1/8R8mxS2E_UQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.87], [13.0, 13.96], [16.0, 17.22], [20.0, 21.49], [27.0, 30.08]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 46.47], "audiomae_on_audioset": [null, null, null, null, [["speech", 23.0], ["sidetone", 14.13], ["insect", 9.98]]], "duration": [0.87, 0.96, 1.22, 1.49, 3.08]} \ No newline at end of file diff --git a/annotations_1/8RGjds-aK00_filtered.json b/annotations_1/8RGjds-aK00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee74dc92dade9fd2856f882bec8973bc4dd05b9b --- /dev/null +++ b/annotations_1/8RGjds-aK00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.49], [5.0, 5.29], [11.0, 11.72], [15.0, 15.7], [19.0, 19.52], [22.0, 22.64], [26.0, 26.23], [48.0, 48.29], [49.0, 49.62], [55.0, 55.38], [61.0, 62.06], [65.0, 65.87], [66.0, 66.68], [67.0, 67.81], [68.0, 69.65], [74.0, 76.06], [77.0, 77.99], [80.0, 80.03], [81.0, 82.7], [83.0, 84.06], [88.0, 88.79], [89.0, 90.32], [98.0, 98.37], [100.0, 100.45], [106.0, 107.03], [109.0, 109.56], [111.0, 110.96], [112.0, 112.14], [113.0, 113.8], [122.0, 122.89], [126.0, 126.99], [128.0, 128.07], [129.0, 129.19], [129.0, 130.11], [132.0, 132.07], [134.0, 134.89], [142.0, 142.69], [145.0, 145.08], [150.0, 150.53], [156.0, 156.54], [166.0, 166.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.49, 0.29, 0.72, 0.7, 0.52, 0.64, 0.23, 0.29, 0.62, 0.38, 1.06, 0.87, 0.68, 0.81, 1.65, 2.06, 0.99, 0.03, 1.7, 1.06, 0.79, 1.32, 0.37, 0.45, 1.03, 0.56, -0.04, 0.14, 0.8, 0.89, 0.99, 0.07, 0.19, 1.11, 0.07, 0.89, 0.69, 0.08, 0.53, 0.54, 0.24]} \ No newline at end of file diff --git a/annotations_1/8RuMflmyF9k_filtered.json b/annotations_1/8RuMflmyF9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db621efc72798e22228a0a75cfbc9a86b0eacdd1 --- /dev/null +++ b/annotations_1/8RuMflmyF9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.1], [9.0, 9.78], [12.0, 14.74], [19.0, 20.97], [24.0, 24.73], [27.0, 38.62], [48.0, 48.71], [49.0, 49.42], [50.0, 49.52], [59.0, 59.51], [60.0, 60.2], [60.0, 65.82], [66.0, 77.75], [85.0, 90.05], [93.0, 100.3], [120.0, 124.85], [127.0, 128.97], [130.0, 130.92], [132.0, 133.44], [146.0, 147.16], [154.0, 154.43], [156.0, 160.76], [161.0, 162.68], [165.0, 165.5]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.28, 0.0, 0.0, 33.17, 0.0, 0.0, 0.0, 0.0, 0.0, 48.23, 49.97, 37.02, 30.47, 35.28, 0.0, 0.0, 0.0, 0.0, 0.0, 30.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 26.58], ["whip", 10.92], ["fart", 5.61]], null, null, [["hum", 40.74], ["throbbing", 7.13], ["mains hum", 5.96]], null, null, null, null, null, [["speech", 33.78], ["music", 20.7], ["fart", 6.23]], [["music", 44.84], ["speech", 16.14], ["fart", 6.21]], [["moo", 33.2], ["cattle, bovinae", 29.77], ["livestock, farm animals, working animals", 27.25]], [["speech", 43.37], ["music", 40.42], ["whack, thwack", 1.11]], [["speech", 18.18], ["explosion", 12.25], ["fireworks", 11.03]], null, null, null, null, null, [["speech", 64.19], ["fart", 6.94], ["whack, thwack", 3.68]], null, null], "duration": [1.1, 0.78, 2.74, 1.97, 0.73, 11.62, 0.71, 0.42, -0.48, 0.51, 0.2, 5.82, 11.75, 5.05, 7.3, 4.85, 1.97, 0.92, 1.44, 1.16, 0.43, 4.76, 1.68, 0.5]} \ No newline at end of file diff --git a/annotations_1/8TbUl9dhTRg_filtered.json b/annotations_1/8TbUl9dhTRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0380f3e134e285cd3468b41cd42f352c18f2f6e --- /dev/null +++ b/annotations_1/8TbUl9dhTRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 31.55], [36.0, 41.23], [45.0, 45.93], [47.0, 52.37], [62.0, 63.75], [68.0, 71.71], [76.0, 76.67], [78.0, 88.2], [93.0, 97.66], [101.0, 102.78], [106.0, 106.51], [111.0, 111.81], [116.0, 121.05], [126.0, 132.44], [134.0, 136.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.81, 57.89, 0.0, 44.99, 0.0, 50.76, 0.0, 34.95, 36.98, 0.0, 0.0, 0.0, 34.24, 32.77, 42.62], "audiomae_on_audioset": [null, null, null, [["music", 60.54], ["carnatic music", 17.54], ["musical instrument", 3.64]], null, null, null, [["music", 92.13], ["singing", 1.02], ["male singing", 0.8]], [["music", 87.73], ["singing", 1.48], ["male singing", 0.72]], null, null, null, [["music", 66.18], ["musical instrument", 4.16], ["saxophone", 3.84]], [["music", 61.98], ["carnatic music", 20.54], ["singing", 2.99]], [["music", 63.32], ["foghorn", 8.09], ["musical instrument", 4.31]]], "duration": [2.55, 5.23, 0.93, 5.37, 1.75, 3.71, 0.67, 10.2, 4.66, 1.78, 0.51, 0.81, 5.05, 6.44, 2.24]} \ No newline at end of file diff --git a/annotations_1/8TcZDzWEVDM_filtered.json b/annotations_1/8TcZDzWEVDM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6468c0867f48ab14f446af9b8294a2ddbb989780 --- /dev/null +++ b/annotations_1/8TcZDzWEVDM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.09], [13.0, 15.89], [20.0, 23.33], [33.0, 40.44], [41.0, 57.05], [58.0, 84.45], [85.0, 108.35], [110.0, 129.15], [131.0, 132.38]], "keep_status": [false, false, false, false, true, false, false, true, false], "silence_prob": [30.47, 30.0, 30.25, 29.91, 30.2, 30.31, 30.1, 42.98, 0.0], "audiomae_on_audioset": [[["speech", 58.25], ["music", 10.52], ["outside, rural or natural", 5.55]], [["speech", 44.02], ["music", 31.44], ["electronic music", 2.59]], [["speech", 63.22], ["music", 12.12], ["vehicle", 6.05]], [["hum", 32.59], ["mains hum", 31.43], ["music", 16.04]], [["music", 50.01], ["hum", 11.19], ["mains hum", 8.55]], [["music", 53.3], ["hum", 18.1], ["throbbing", 15.04]], [["music", 43.99], ["throbbing", 30.23], ["hum", 6.42]], [["music", 33.79], ["breaking", 7.64], ["single-lens reflex camera", 6.76]], null], "duration": [6.09, 2.89, 3.33, 7.44, 16.05, 26.45, 23.35, 19.15, 1.38]} \ No newline at end of file diff --git a/annotations_1/8UscACJkVxY_filtered.json b/annotations_1/8UscACJkVxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..906e88fd35f24a4f7a46a0182d23c511244ab8e0 --- /dev/null +++ b/annotations_1/8UscACJkVxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.23], [16.0, 16.95], [19.0, 20.65], [23.0, 24.88], [33.0, 33.45], [34.0, 35.4], [37.0, 38.48], [42.0, 42.45], [47.0, 47.92], [48.0, 50.77], [54.0, 60.18], [63.0, 63.1], [64.0, 65.85], [68.0, 70.31], [73.0, 73.06], [74.0, 74.58], [76.0, 77.35], [79.0, 79.98], [81.0, 81.82], [83.0, 83.35], [88.0, 90.93], [94.0, 94.39], [97.0, 96.9], [100.0, 100.68], [104.0, 106.52], [107.0, 107.06], [110.0, 111.45], [113.0, 114.61], [117.0, 119.91], [121.0, 122.03], [128.0, 128.65], [129.0, 131.4], [132.0, 132.68], [135.0, 135.24], [153.0, 156.0], [159.0, 159.07], [161.0, 162.38], [166.0, 171.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.86, 53.53, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 89.54, 0.0, 0.0, 58.38, 0.0, 0.0, 55.6, 0.0, 0.0, 69.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 61.38], ["speech", 10.55], ["scary music", 4.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 0.95, 1.65, 1.88, 0.45, 1.4, 1.48, 0.45, 0.92, 2.77, 6.18, 0.1, 1.85, 2.31, 0.06, 0.58, 1.35, 0.98, 0.82, 0.35, 2.93, 0.39, -0.1, 0.68, 2.52, 0.06, 1.45, 1.61, 2.91, 1.03, 0.65, 2.4, 0.68, 0.24, 3.0, 0.07, 1.38, 5.64]} \ No newline at end of file diff --git a/annotations_1/8VZctic_uTI_filtered.json b/annotations_1/8VZctic_uTI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a85364b0e8afc908e6a3701e384e07b7ecdf1ecf --- /dev/null +++ b/annotations_1/8VZctic_uTI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.02], [6.0, 7.57], [11.0, 12.23], [16.0, 18.33], [21.0, 20.75], [23.0, 25.35], [27.0, 29.0], [31.0, 35.33], [39.0, 40.74], [42.0, 51.73], [53.0, 54.94], [58.0, 58.62], [60.0, 63.86], [65.0, 66.31], [68.0, 70.01], [71.0, 72.5], [74.0, 75.51], [77.0, 78.09], [79.0, 81.13], [83.0, 84.33], [86.0, 87.47], [90.0, 90.44], [96.0, 97.33], [99.0, 102.05], [109.0, 109.9], [113.0, 113.9], [115.0, 123.42], [124.0, 125.29], [126.0, 127.85], [129.0, 130.03], [135.0, 136.68], [139.0, 140.21], [142.0, 143.31], [147.0, 147.9], [150.0, 150.3], [151.0, 156.03], [158.0, 160.1], [161.0, 162.55], [163.0, 165.11], [166.0, 169.62], [171.0, 174.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [87.55, 0.0, 0.0, 38.25, 0.0, 83.7, 88.64, 53.28, 0.0, 63.21, 0.0, 0.0, 80.64, 0.0, 91.64, 0.0, 0.0, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 55.89, 0.0, 0.0, 74.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.27, 88.46, 0.0, 35.84, 51.34, 81.53], "audiomae_on_audioset": [null, null, null, [["speech", 76.32], ["dial tone", 7.5], ["sidetone", 6.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 19.26], ["hum", 11.05], ["moo", 9.05]], null, null], "duration": [3.02, 1.57, 1.23, 2.33, -0.25, 2.35, 2.0, 4.33, 1.74, 9.73, 1.94, 0.62, 3.86, 1.31, 2.01, 1.5, 1.51, 1.09, 2.13, 1.33, 1.47, 0.44, 1.33, 3.05, 0.9, 0.9, 8.42, 1.29, 1.85, 1.03, 1.68, 1.21, 1.31, 0.9, 0.3, 5.03, 2.1, 1.55, 2.11, 3.62, 3.39]} \ No newline at end of file diff --git a/annotations_1/8VhgYX8xRuw_filtered.json b/annotations_1/8VhgYX8xRuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c16eea455bd8c4725d32c1dac1243c7265232e9e --- /dev/null +++ b/annotations_1/8VhgYX8xRuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.13], [20.0, 31.43], [32.0, 37.08], [49.0, 59.98], [62.0, 67.64], [78.0, 79.32], [105.0, 112.46], [119.0, 137.93], [154.0, 164.94]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.53, 29.61, 29.47, 29.84, 0.0, 29.48, 29.89, 29.64], "audiomae_on_audioset": [null, [["music", 62.84], ["middle eastern music", 8.11], ["carnatic music", 3.34]], [["music", 61.31], ["drum", 6.01], ["carnatic music", 5.73]], [["music", 74.96], ["synthesizer", 4.27], ["boing", 3.08]], [["music", 83.65], ["drum machine", 1.6], ["synthesizer", 1.27]], null, [["music", 69.18], ["dog", 3.83], ["animal", 3.45]], [["music", 84.55], ["speech", 3.86], ["boing", 2.89]], [["speech", 48.44], ["music", 26.94], ["boing", 14.27]]], "duration": [1.13, 11.43, 5.08, 10.98, 5.64, 1.32, 7.46, 18.93, 10.94]} \ No newline at end of file diff --git a/annotations_1/8Wgkpfa5HMw_filtered.json b/annotations_1/8Wgkpfa5HMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcaa59ee4575a09441726c835b95eccd13f929b0 --- /dev/null +++ b/annotations_1/8Wgkpfa5HMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 24.83], [30.0, 30.05], [40.0, 41.2], [42.0, 42.53], [44.0, 45.03], [50.0, 55.92], [57.0, 57.94], [59.0, 67.86], [69.0, 71.24], [81.0, 86.64], [89.0, 90.44], [95.0, 102.24], [104.0, 115.75], [124.0, 140.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [35.92, 0.0, 0.0, 0.0, 0.0, 59.68, 0.0, 65.55, 97.73, 62.99, 0.0, 30.38, 33.63, 33.59], "audiomae_on_audioset": [[["screaming", 50.08], ["speech", 22.69], ["fart", 3.03]], null, null, null, null, null, null, null, null, null, null, [["hum", 20.63], ["music", 19.06], ["noise", 9.33]], [["music", 42.33], ["speech", 32.29], ["synthesizer", 2.73]], [["speech", 45.71], ["music", 17.49], ["brass instrument", 4.98]]], "duration": [21.83, 0.05, 1.2, 0.53, 1.03, 5.92, 0.94, 8.86, 2.24, 5.64, 1.44, 7.24, 11.75, 16.9]} \ No newline at end of file diff --git a/annotations_1/8YQZMbgpmIo_filtered.json b/annotations_1/8YQZMbgpmIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2bc975489b97194697c55aa692a6e3c69432a9a --- /dev/null +++ b/annotations_1/8YQZMbgpmIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.85], [3.0, 2.91], [37.0, 37.93], [42.0, 42.4], [43.0, 44.74], [49.0, 49.01], [52.0, 52.37], [55.0, 55.8], [58.0, 58.36], [69.0, 69.42], [76.0, 76.25], [86.0, 86.53], [91.0, 92.3], [96.0, 96.89], [98.0, 98.05], [98.0, 99.22], [112.0, 113.21], [120.0, 121.17], [124.0, 124.51], [129.0, 129.57], [135.0, 135.77], [137.0, 138.55], [144.0, 144.68], [150.0, 149.66], [151.0, 151.17], [161.0, 161.96], [163.0, 164.86], [168.0, 171.48], [174.0, 173.82], [174.0, 175.53], [178.0, 179.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.15, -0.09, 0.93, 0.4, 1.74, 0.01, 0.37, 0.8, 0.36, 0.42, 0.25, 0.53, 1.3, 0.89, 0.05, 1.22, 1.21, 1.17, 0.51, 0.57, 0.77, 1.55, 0.68, -0.34, 0.17, 0.96, 1.86, 3.48, -0.18, 1.53, 1.41]} \ No newline at end of file diff --git a/annotations_1/8YUnOHihAU0_filtered.json b/annotations_1/8YUnOHihAU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..661ef47bf27a082e329441e06a763b5f226e0761 --- /dev/null +++ b/annotations_1/8YUnOHihAU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.62], [7.0, 8.83], [10.0, 10.4], [15.0, 16.01], [18.0, 18.67], [21.0, 22.62], [28.0, 27.89], [39.0, 40.1], [49.0, 50.45], [58.0, 58.6], [61.0, 61.55], [64.0, 64.91], [70.0, 70.51], [80.0, 80.1], [81.0, 82.98], [85.0, 86.1], [88.0, 88.32], [90.0, 90.37], [92.0, 93.02], [94.0, 94.8], [98.0, 98.63], [104.0, 107.54], [114.0, 114.42], [117.0, 117.0], [121.0, 121.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.23, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 1.83, 0.4, 1.01, 0.67, 1.62, -0.11, 1.1, 1.45, 0.6, 0.55, 0.91, 0.51, 0.1, 1.98, 1.1, 0.32, 0.37, 1.02, 0.8, 0.63, 3.54, 0.42, 0.0, 0.09]} \ No newline at end of file diff --git a/annotations_1/8Yqw_f26SvM_filtered.json b/annotations_1/8Yqw_f26SvM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d41c6ee226f96b3d021a6ebd020b4d6bcc1bed18 --- /dev/null +++ b/annotations_1/8Yqw_f26SvM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.25], [27.0, 27.63], [41.0, 41.3], [48.0, 48.9], [74.0, 74.97], [77.0, 76.72], [78.0, 78.75], [80.0, 80.92], [95.0, 96.35], [101.0, 101.41], [106.0, 106.68], [113.0, 117.29], [123.0, 123.2], [143.0, 144.19], [146.0, 151.39], [156.0, 156.78], [162.0, 167.19], [170.0, 170.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.12, 0.0, 0.0, 34.54, 0.0, 33.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 74.34], ["didgeridoo", 3.96], ["musical instrument", 3.02]], null, null, [["music", 60.65], ["musical instrument", 8.3], ["brass instrument", 4.52]], null, [["music", 37.96], ["brass instrument", 13.58], ["saxophone", 10.12]], null], "duration": [0.25, 0.63, 0.3, 0.9, 0.97, -0.28, 0.75, 0.92, 1.35, 0.41, 0.68, 4.29, 0.2, 1.19, 5.39, 0.78, 5.19, 0.6]} \ No newline at end of file diff --git a/annotations_1/8a2aEHT7v54_filtered.json b/annotations_1/8a2aEHT7v54_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b15f0287b54f1aae810148058e929cdcc8ce548 --- /dev/null +++ b/annotations_1/8a2aEHT7v54_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.53], [10.0, 13.14], [15.0, 17.22], [18.0, 18.45], [19.0, 20.61], [24.0, 25.42], [29.0, 33.56], [34.0, 35.63], [37.0, 46.06], [47.0, 48.42], [49.0, 49.47], [51.0, 66.95], [70.0, 70.63]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [47.9, 41.01, 71.87, 0.0, 0.0, 0.0, 63.85, 0.0, 30.92, 0.0, 0.0, 30.47, 0.0], "audiomae_on_audioset": [[["sidetone", 28.42], ["music", 14.16], ["speech", 12.11]], [["frog", 27.78], ["speech", 23.69], ["croak", 20.54]], null, null, null, null, null, null, [["speech", 40.14], ["music", 25.27], ["beatboxing", 3.77]], null, null, [["music", 61.7], ["speech", 17.44], ["groan", 3.34]], null], "duration": [3.53, 3.14, 2.22, 0.45, 1.61, 1.42, 4.56, 1.63, 9.06, 1.42, 0.47, 15.95, 0.63]} \ No newline at end of file diff --git a/annotations_1/8aK7LsC0G-4_filtered.json b/annotations_1/8aK7LsC0G-4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..860da13ab8a7057ef1c4018490f1ed511b8f2914 --- /dev/null +++ b/annotations_1/8aK7LsC0G-4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.92], [18.0, 18.81], [21.0, 21.32], [29.0, 29.52], [30.0, 30.77], [35.0, 36.0], [39.0, 43.06], [47.0, 47.21], [47.0, 50.4], [58.0, 58.24], [77.0, 78.26], [103.0, 104.08], [105.0, 106.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.18, 0.0, 58.89, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 0.81, 0.32, 0.52, 0.77, 1.0, 4.06, 0.21, 3.4, 0.24, 1.26, 1.08, 1.29]} \ No newline at end of file diff --git a/annotations_1/8bJzLt9AYqc_filtered.json b/annotations_1/8bJzLt9AYqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fece5949f7b94dbfec53f73209bb393b39010cd --- /dev/null +++ b/annotations_1/8bJzLt9AYqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 21.27], [24.0, 24.9], [25.0, 26.91], [39.0, 39.66], [42.0, 42.92], [45.0, 48.64], [61.0, 61.7], [64.0, 66.01], [72.0, 73.16], [76.0, 86.44], [87.0, 87.54], [88.0, 90.21], [102.0, 103.23], [105.0, 105.95], [110.0, 117.29], [149.0, 155.16], [163.0, 163.12]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [34.67, 0.0, 0.0, 0.0, 0.0, 37.35, 0.0, 67.76, 0.0, 86.82, 0.0, 83.7, 0.0, 0.0, 29.85, 30.68, 0.0], "audiomae_on_audioset": [[["music", 56.5], ["speech", 6.69], ["musical instrument", 4.32]], null, null, null, null, [["music", 43.57], ["timpani", 16.34], ["trombone", 4.32]], null, null, null, null, null, null, null, null, [["crowd", 21.46], ["music", 20.3], ["speech", 16.96]], [["speech", 40.9], ["music", 14.85], ["vehicle", 7.54]], null], "duration": [17.27, 0.9, 1.91, 0.66, 0.92, 3.64, 0.7, 2.01, 1.16, 10.44, 0.54, 2.21, 1.23, 0.95, 7.29, 6.16, 0.12]} \ No newline at end of file diff --git a/annotations_1/8cGUULb2K-0_filtered.json b/annotations_1/8cGUULb2K-0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7a8154ec8ca0b3d063fd5cb66ccaffe3fe50532 --- /dev/null +++ b/annotations_1/8cGUULb2K-0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 18.72], [19.0, 19.75], [21.0, 52.68], [57.0, 63.49], [65.0, 69.72], [72.0, 72.55], [73.0, 78.21], [83.0, 82.78], [86.0, 86.54], [89.0, 94.2], [104.0, 104.85], [106.0, 106.42], [115.0, 115.97], [121.0, 121.86], [123.0, 128.92], [131.0, 131.36]], "keep_status": [true, false, false, false, true, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [41.85, 0.0, 0.0, 37.61, 38.7, 0.0, 35.69, 0.0, 0.0, 39.04, 0.0, 0.0, 0.0, 0.0, 38.09, 0.0], "audiomae_on_audioset": [[["hum", 21.8], ["insect", 18.73], ["fly, housefly", 18.58]], null, null, [["theremin", 50.71], ["music", 20.21], ["speech", 13.29]], [["speech", 46.09], ["music", 9.21], ["vehicle", 4.19]], null, [["speech", 75.23], ["music", 10.06], ["run", 3.49]], null, null, [["theremin", 15.08], ["dog", 10.84], ["speech", 9.52]], null, null, null, null, [["whale vocalization", 35.32], ["radio", 13.62], ["speech", 7.34]], null], "duration": [17.72, 0.75, 31.68, 6.49, 4.72, 0.55, 5.21, -0.22, 0.54, 5.2, 0.85, 0.42, 0.97, 0.86, 5.92, 0.36]} \ No newline at end of file diff --git a/annotations_1/8coCtKWysGk_filtered.json b/annotations_1/8coCtKWysGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc46a7ecc4f6a38bd2fd51665b415edcfe6365e5 --- /dev/null +++ b/annotations_1/8coCtKWysGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.7], [16.0, 18.52], [19.0, 53.77], [56.0, 79.59], [81.0, 84.1], [89.0, 95.23], [95.0, 95.54], [96.0, 100.85], [102.0, 104.33], [107.0, 108.41], [110.0, 111.86], [114.0, 127.75], [130.0, 134.52], [138.0, 145.74], [153.0, 164.15], [166.0, 168.89]], "keep_status": [false, false, false, false, true, true, false, false, true, false, false, true, true, true, false, false], "silence_prob": [0.0, 30.13, 0.0, 30.1, 31.57, 33.64, 0.0, 43.48, 46.54, 0.0, 0.0, 41.42, 30.84, 28.95, 28.97, 30.97], "audiomae_on_audioset": [null, [["speech", 58.44], ["music", 9.93], ["noise", 4.49]], null, [["music", 60.67], ["fart", 8.6], ["speech", 7.95]], [["speech", 13.23], ["whack, thwack", 12.57], ["music", 8.65]], [["music", 32.51], ["thunk", 17.17], ["speech", 14.91]], null, [["speech", 45.92], ["music", 17.59], ["whale vocalization", 9.92]], [["music", 34.04], ["didgeridoo", 5.15], ["theremin", 3.8]], null, null, [["music", 53.65], ["hum", 4.87], ["didgeridoo", 4.86]], [["whale vocalization", 25.01], ["music", 19.58], ["rumble", 16.39]], [["music", 29.79], ["animal", 18.91], ["boing", 9.74]], [["livestock, farm animals, working animals", 36.46], ["moo", 30.85], ["cattle, bovinae", 26.65]], [["music", 69.54], ["mosquito", 3.5], ["speech", 3.5]]], "duration": [0.7, 2.52, 34.77, 23.59, 3.1, 6.23, 0.54, 4.85, 2.33, 1.41, 1.86, 13.75, 4.52, 7.74, 11.15, 2.89]} \ No newline at end of file diff --git a/annotations_1/8d3LDYM0GF4_filtered.json b/annotations_1/8d3LDYM0GF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d95b51b0c6ffa3fe5dc26516daa9eda5cfc85e65 --- /dev/null +++ b/annotations_1/8d3LDYM0GF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 29.24], [30.0, 30.65], [35.0, 54.67], [57.0, 58.65], [59.0, 65.04], [68.0, 75.73], [78.0, 84.94], [85.0, 111.52]], "keep_status": [false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 32.56, 0.0, 63.64, 73.82, 50.41, 43.66], "audiomae_on_audioset": [null, null, [["music", 50.7], ["synthesizer", 7.12], ["hum", 3.8]], null, null, null, null, [["noise", 35.11], ["speech", 15.2], ["mains hum", 9.88]]], "duration": [1.24, 0.65, 19.67, 1.65, 6.04, 7.73, 6.94, 26.52]} \ No newline at end of file diff --git a/annotations_1/8e5fzbsfGCI_filtered.json b/annotations_1/8e5fzbsfGCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..821d8972a96b683fca90b1c77cd1889ea3a172f7 --- /dev/null +++ b/annotations_1/8e5fzbsfGCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.4], [16.0, 17.52], [20.0, 22.33], [25.0, 27.31], [28.0, 32.85], [35.0, 36.15], [37.0, 38.28], [39.0, 40.63], [42.0, 44.22], [46.0, 46.21], [48.0, 49.32], [50.0, 50.55], [51.0, 52.12], [53.0, 54.33], [56.0, 56.61], [57.0, 58.18], [59.0, 61.35], [63.0, 67.59], [74.0, 74.97], [81.0, 83.66], [86.0, 86.32], [86.0, 87.44], [88.0, 88.47], [91.0, 92.64], [101.0, 106.96], [108.0, 111.96], [113.0, 114.08]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [56.7, 0.0, 38.78, 50.11, 80.46, 0.0, 0.0, 0.0, 98.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.75, 37.2, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 60.79, 53.34, 0.0], "audiomae_on_audioset": [null, null, [["music", 20.99], ["noise", 19.81], ["throbbing", 11.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 59.97], ["music", 5.91], ["sidetone", 3.39]], null, null, null, null, null, null, null, null, null], "duration": [2.4, 1.52, 2.33, 2.31, 4.85, 1.15, 1.28, 1.63, 2.22, 0.21, 1.32, 0.55, 1.12, 1.33, 0.61, 1.18, 2.35, 4.59, 0.97, 2.66, 0.32, 1.44, 0.47, 1.64, 5.96, 3.96, 1.08]} \ No newline at end of file diff --git a/annotations_1/8fHMMPXUE5I_filtered.json b/annotations_1/8fHMMPXUE5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2281b45d4963d24da6072df167a76abcf9c89f24 --- /dev/null +++ b/annotations_1/8fHMMPXUE5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 37.42], [38.0, 39.8], [41.0, 48.98], [50.0, 51.09], [51.0, 52.54], [53.0, 55.16], [56.0, 66.99], [71.0, 101.46], [102.0, 119.04], [121.0, 149.71], [151.0, 162.72]], "keep_status": [false, false, false, false, false, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 99.26, 0.0, 0.0, 88.1, 49.22, 0.0, 29.84, 59.86, 28.94], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 46.87], ["speech", 13.67], ["gong", 7.73]], null, [["music", 54.64], ["musical instrument", 6.96], ["trombone", 4.53]], null, [["music", 28.25], ["theremin", 22.24], ["musical instrument", 9.36]]], "duration": [0.42, 1.8, 7.98, 1.09, 1.54, 2.16, 10.99, 30.46, 17.04, 28.71, 11.72]} \ No newline at end of file diff --git a/annotations_1/8fizKw4z9fI_filtered.json b/annotations_1/8fizKw4z9fI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..251e1bfb24eb14228a1acfe3f3774889ab7a3ce3 --- /dev/null +++ b/annotations_1/8fizKw4z9fI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.99], [17.0, 17.1], [39.0, 39.18], [39.0, 39.63], [52.0, 52.3], [61.0, 62.6], [81.0, 81.36], [92.0, 91.99], [108.0, 108.48], [129.0, 129.03], [149.0, 151.73], [154.0, 154.36], [160.0, 160.25], [162.0, 164.15], [166.0, 166.6], [167.0, 167.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.27, 0.0, 0.0, 30.69, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 53.77], ["ambient music", 11.77], ["synthesizer", 8.56]], null, null, [["music", 23.97], ["speech", 22.35], ["synthesizer", 4.75]], null, null], "duration": [0.99, 0.1, 0.18, 0.63, 0.3, 1.6, 0.36, -0.01, 0.48, 0.03, 2.73, 0.36, 0.25, 2.15, 0.6, 0.44]} \ No newline at end of file diff --git a/annotations_1/8fzGR29bKjY_filtered.json b/annotations_1/8fzGR29bKjY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd67e1b10ff046e07d3f425ea4ee142ddb068169 --- /dev/null +++ b/annotations_1/8fzGR29bKjY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.48], [9.0, 10.79], [15.0, 15.63], [18.0, 21.0], [28.0, 32.31], [44.0, 54.8], [57.0, 58.87], [59.0, 58.99], [59.0, 60.2], [61.0, 64.1], [65.0, 90.81], [93.0, 94.69], [95.0, 103.62], [109.0, 110.69], [114.0, 115.86], [123.0, 124.33], [125.0, 127.26], [128.0, 128.43], [129.0, 129.42]], "keep_status": [false, false, false, false, true, false, false, false, false, true, true, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.5, 33.42, 32.59, 0.0, 0.0, 0.0, 30.38, 34.67, 0.0, 33.42, 0.0, 0.0, 0.0, 33.58, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 47.51], ["didgeridoo", 24.58], ["sound effect", 1.97]], [["music", 35.28], ["foghorn", 8.03], ["theremin", 5.41]], [["cattle, bovinae", 30.27], ["livestock, farm animals, working animals", 26.12], ["moo", 17.64]], null, null, null, [["speech", 25.67], ["vehicle", 13.35], ["music", 12.29]], [["music", 32.59], ["throbbing", 15.04], ["hum", 12.25]], null, [["music", 25.7], ["hum", 20.75], ["throbbing", 19.1]], null, null, null, [["speech", 41.68], ["vehicle", 7.54], ["music", 6.67]], null, null], "duration": [0.48, 1.79, 0.63, 3.0, 4.31, 10.8, 1.87, -0.01, 1.2, 3.1, 25.81, 1.69, 8.62, 1.69, 1.86, 1.33, 2.26, 0.43, 0.42]} \ No newline at end of file diff --git a/annotations_1/8gLOoFW3ke0_filtered.json b/annotations_1/8gLOoFW3ke0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb8c70f7e2c6e1c1dea62cd4793f3006508629f1 --- /dev/null +++ b/annotations_1/8gLOoFW3ke0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 44.39], [45.0, 67.61], [69.0, 70.12], [71.0, 91.03]], "keep_status": [true, true, false, false], "silence_prob": [29.97, 29.33, 0.0, 28.98], "audiomae_on_audioset": [[["artillery fire", 45.29], ["explosion", 11.06], ["burst, pop", 7.65]], [["whack, thwack", 28.34], ["smash, crash", 23.13], ["music", 15.77]], null, [["speech", 68.19], ["music", 21.58], ["breaking", 2.86]]], "duration": [13.39, 22.61, 1.12, 20.03]} \ No newline at end of file diff --git a/annotations_1/8gvuU-U64d0_filtered.json b/annotations_1/8gvuU-U64d0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82a0f5700c0cd974955ae47fd11d7246a02b6d2d --- /dev/null +++ b/annotations_1/8gvuU-U64d0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.29], [7.0, 7.52], [12.0, 11.75], [13.0, 13.63], [14.0, 18.6], [19.0, 19.4], [20.0, 22.76], [23.0, 25.2], [27.0, 29.66], [33.0, 33.25], [35.0, 36.21], [39.0, 39.78], [45.0, 47.38], [54.0, 56.79], [60.0, 60.81], [64.0, 64.67], [68.0, 74.43], [76.0, 77.09], [78.0, 82.12], [84.0, 85.99], [87.0, 88.79], [91.0, 91.45], [93.0, 93.51], [95.0, 95.77], [97.0, 97.65], [99.0, 99.96], [103.0, 103.84], [105.0, 104.92], [106.0, 111.15], [112.0, 112.46], [113.0, 114.62], [116.0, 117.09], [122.0, 122.76], [123.0, 124.06], [124.0, 126.01], [127.0, 128.66]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.88, 0.0, 40.33, 71.14, 87.55, 0.0, 0.0, 0.0, 47.43, 89.54, 0.0, 0.0, 99.93, 0.0, 64.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 64.86, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 37.51], ["zipper (clothing)", 11.39], ["fly, housefly", 6.13]], null, [["speech", 39.37], ["fly, housefly", 11.43], ["insect", 4.97]], null, null, null, null, null, [["speech", 47.21], ["sidetone", 10.67], ["music", 5.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 0.52, -0.25, 0.63, 4.6, 0.4, 2.76, 2.2, 2.66, 0.25, 1.21, 0.78, 2.38, 2.79, 0.81, 0.67, 6.43, 1.09, 4.12, 1.99, 1.79, 0.45, 0.51, 0.77, 0.65, 0.96, 0.84, -0.08, 5.15, 0.46, 1.62, 1.09, 0.76, 1.06, 2.01, 1.66]} \ No newline at end of file diff --git a/annotations_1/8hWbptEarkA_filtered.json b/annotations_1/8hWbptEarkA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d7b4fa111e4f38221da89aa31d7dbcda6af42d2 --- /dev/null +++ b/annotations_1/8hWbptEarkA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 36.44], [37.0, 47.02], [48.0, 51.17], [52.0, 81.68], [82.0, 130.47], [132.0, 134.33], [135.0, 141.71]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [65.67, 49.73, 68.93, 31.47, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, [["music", 47.15], ["fart", 7.27], ["musical instrument", 5.02]], null, [["music", 79.65], ["theremin", 6.61], ["electronic music", 2.01]], null, null, null], "duration": [24.44, 10.02, 3.17, 29.68, 48.47, 2.33, 6.71]} \ No newline at end of file diff --git a/annotations_1/8i7z8cEA4IM_filtered.json b/annotations_1/8i7z8cEA4IM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47e7cd4cb0554d7159d0348b01a6ba47d8980dea --- /dev/null +++ b/annotations_1/8i7z8cEA4IM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.3], [3.0, 4.62], [5.0, 7.59], [9.0, 9.91], [12.0, 21.66], [23.0, 24.17], [25.0, 27.45], [29.0, 39.66], [40.0, 45.0], [46.0, 51.56], [53.0, 53.33], [53.0, 59.98], [66.0, 68.23]], "keep_status": [false, false, true, false, true, false, true, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 36.92, 0.0, 34.7, 0.0, 41.18, 33.34, 33.09, 32.43, 0.0, 30.81, 30.25], "audiomae_on_audioset": [null, null, [["music", 19.16], ["speech", 12.96], ["animal", 3.84]], null, [["music", 27.36], ["speech", 19.48], ["didgeridoo", 12.17]], null, [["fly, housefly", 18.33], ["hum", 11.35], ["mains hum", 11.34]], [["music", 26.27], ["hum", 25.78], ["throbbing", 20.9]], [["speech", 42.62], ["bee, wasp, etc.", 11.91], ["sidetone", 9.21]], [["mains hum", 42.24], ["hum", 31.43], ["music", 10.5]], null, [["music", 33.28], ["speech", 16.76], ["hum", 12.44]], [["music", 40.69], ["speech", 22.59], ["hum", 5.02]]], "duration": [1.3, 1.62, 2.59, 0.91, 9.66, 1.17, 2.45, 10.66, 5.0, 5.56, 0.33, 6.98, 2.23]} \ No newline at end of file diff --git a/annotations_1/8jyiXMPl6EU_filtered.json b/annotations_1/8jyiXMPl6EU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1e87a2839847c1f5be3300722f1e315f8bdf546 --- /dev/null +++ b/annotations_1/8jyiXMPl6EU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.46], [10.0, 12.92], [14.0, 14.91], [15.0, 17.44], [19.0, 30.25], [31.0, 37.93], [39.0, 43.61], [44.0, 43.65], [44.0, 44.37], [45.0, 46.75], [47.0, 48.15], [49.0, 50.45], [55.0, 59.58], [61.0, 62.5], [64.0, 65.18], [66.0, 65.94], [70.0, 85.06], [85.0, 86.48], [87.0, 88.91], [89.0, 102.66], [103.0, 105.38], [106.0, 109.73], [110.0, 110.91], [114.0, 115.4], [117.0, 117.73], [119.0, 120.06], [124.0, 140.12], [141.0, 148.93], [149.0, 148.96], [152.0, 162.45], [164.0, 165.94], [166.0, 167.44]], "keep_status": [false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [50.41, 68.15, 0.0, 49.45, 42.69, 62.37, 47.9, 0.0, 0.0, 0.0, 0.0, 0.0, 89.36, 0.0, 0.0, 0.0, 36.82, 0.0, 0.0, 46.68, 46.72, 54.17, 0.0, 0.0, 0.0, 0.0, 48.39, 35.97, 0.0, 32.84, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 41.61], ["hum", 7.46], ["music", 7.41]], [["music", 46.63], ["sheep", 10.53], ["bleat", 10.31]], null, [["music", 21.42], ["mains hum", 20.19], ["hum", 14.67]], null, null, null, null, null, null, null, null, null, [["mains hum", 38.32], ["music", 23.9], ["hum", 22.51]], null, null, [["music", 39.3], ["hum", 26.37], ["speech", 14.53]], [["music", 41.35], ["singing bowl", 23.19], ["speech", 4.55]], null, null, null, null, null, [["speech", 40.27], ["music", 19.02], ["synthesizer", 3.06]], [["music", 70.72], ["synthesizer", 4.91], ["musical instrument", 3.07]], null, [["music", 24.93], ["mains hum", 24.23], ["hum", 17.49]], null, null], "duration": [6.46, 2.92, 0.91, 2.44, 11.25, 6.93, 4.61, -0.35, 0.37, 1.75, 1.15, 1.45, 4.58, 1.5, 1.18, -0.06, 15.06, 1.48, 1.91, 13.66, 2.38, 3.73, 0.91, 1.4, 0.73, 1.06, 16.12, 7.93, -0.04, 10.45, 1.94, 1.44]} \ No newline at end of file diff --git a/annotations_1/8kzZwPsHkfo_filtered.json b/annotations_1/8kzZwPsHkfo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47c5db78c150ecc56b221d00eb6c968a935c5559 --- /dev/null +++ b/annotations_1/8kzZwPsHkfo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.94], [11.0, 14.12], [14.0, 14.88], [19.0, 19.28], [20.0, 20.06], [20.0, 20.88], [22.0, 22.03], [47.0, 48.83], [50.0, 51.06], [53.0, 52.88], [53.0, 53.65], [59.0, 60.07], [60.0, 61.21], [62.0, 63.04], [67.0, 67.74], [71.0, 72.0], [73.0, 73.18], [83.0, 83.69], [84.0, 85.28], [97.0, 97.38], [100.0, 100.5], [101.0, 101.41], [103.0, 103.55], [104.0, 104.58], [106.0, 106.29], [107.0, 108.51], [109.0, 111.94], [114.0, 117.66], [118.0, 119.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 33.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.73, 70.72, 0.0], "audiomae_on_audioset": [null, [["speech", 71.02], ["music", 11.7], ["musical instrument", 3.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 22.03], ["stomach rumble", 14.05], ["hum", 11.19]], null, null], "duration": [-0.06, 3.12, 0.88, 0.28, 0.06, 0.88, 0.03, 1.83, 1.06, -0.12, 0.65, 1.07, 1.21, 1.04, 0.74, 1.0, 0.18, 0.69, 1.28, 0.38, 0.5, 0.41, 0.55, 0.58, 0.29, 1.51, 2.94, 3.66, 1.37]} \ No newline at end of file diff --git a/annotations_1/8le-4mOgJco_filtered.json b/annotations_1/8le-4mOgJco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca1d08222f71ff3544a4576f27831ee77b9408cc --- /dev/null +++ b/annotations_1/8le-4mOgJco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[123.0, 129.81], [130.0, 131.38], [132.0, 131.92], [133.0, 135.57], [136.0, 143.45], [143.0, 150.08]], "keep_status": [true, false, false, false, false, true], "silence_prob": [35.3, 0.0, 0.0, 44.12, 39.86, 31.1], "audiomae_on_audioset": [[["speech", 22.14], ["music", 21.05], ["glass", 10.05]], null, null, [["didgeridoo", 34.68], ["music", 30.3], ["speech", 7.33]], [["music", 45.93], ["didgeridoo", 27.84], ["hum", 3.06]], [["groan", 27.12], ["animal", 12.21], ["grunt", 8.63]]], "duration": [6.81, 1.38, -0.08, 2.57, 7.45, 7.08]} \ No newline at end of file diff --git a/annotations_1/8lsl4cNrpzI_filtered.json b/annotations_1/8lsl4cNrpzI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18b65149c0b2fdae4d8dbd5491bbe4490999d788 --- /dev/null +++ b/annotations_1/8lsl4cNrpzI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.79], [20.0, 20.88], [22.0, 22.1], [25.0, 25.62], [28.0, 28.97], [30.0, 30.7], [32.0, 33.17], [35.0, 35.33], [38.0, 37.88], [39.0, 39.87], [44.0, 43.71], [47.0, 47.28], [49.0, 49.94], [51.0, 51.68], [54.0, 55.0], [56.0, 57.38], [58.0, 59.31], [60.0, 60.89], [63.0, 97.93], [100.0, 101.36], [112.0, 112.72], [114.0, 119.74], [129.0, 129.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.41, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 0.88, 0.1, 0.62, 0.97, 0.7, 1.17, 0.33, -0.12, 0.87, -0.29, 0.28, 0.94, 0.68, 1.0, 1.38, 1.31, 0.89, 34.93, 1.36, 0.72, 5.74, 0.07]} \ No newline at end of file diff --git a/annotations_1/8m3HqHIpcWU_filtered.json b/annotations_1/8m3HqHIpcWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2343b1403092de2c14c0fa6795761365a60777a8 --- /dev/null +++ b/annotations_1/8m3HqHIpcWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.43], [15.0, 16.61], [20.0, 26.6], [28.0, 29.1], [30.0, 56.94], [63.0, 64.77], [66.0, 66.93], [69.0, 69.47], [79.0, 79.86], [81.0, 83.27], [84.0, 84.77], [93.0, 93.56], [94.0, 94.81], [96.0, 99.06], [101.0, 101.92], [104.0, 105.83], [108.0, 108.28], [110.0, 112.01], [119.0, 119.04], [122.0, 121.88], [125.0, 126.32], [127.0, 132.09], [133.0, 137.98], [140.0, 141.79], [146.0, 147.5], [151.0, 154.11], [155.0, 158.08]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, true, false, false, false, true, true, false, false, true, true], "silence_prob": [40.61, 0.0, 34.69, 0.0, 31.96, 0.0, 0.0, 0.0, 0.0, 42.02, 0.0, 0.0, 0.0, 42.53, 0.0, 0.0, 0.0, 43.66, 0.0, 0.0, 0.0, 39.74, 37.88, 0.0, 0.0, 41.36, 45.95], "audiomae_on_audioset": [[["insect", 21.68], ["single-lens reflex camera", 20.59], ["fly, housefly", 13.83]], null, [["mains hum", 44.19], ["hum", 26.85], ["speech", 3.58]], null, [["hum", 33.23], ["throbbing", 24.92], ["music", 13.16]], null, null, null, null, [["sidetone", 22.3], ["music", 20.01], ["speech", 12.49]], null, null, null, [["music", 25.05], ["hum", 10.98], ["gong", 6.31]], null, null, null, [["music", 17.96], ["speech", 15.03], ["gong", 9.78]], null, null, null, [["hum", 19.47], ["music", 11.72], ["rumble", 10.58]], [["music", 26.18], ["hum", 15.32], ["speech", 14.85]], null, null, [["speech", 42.43], ["hum", 7.53], ["sheep", 5.67]], [["music", 12.44], ["singing bowl", 11.53], ["livestock, farm animals, working animals", 10.89]]], "duration": [4.43, 1.61, 6.6, 1.1, 26.94, 1.77, 0.93, 0.47, 0.86, 2.27, 0.77, 0.56, 0.81, 3.06, 0.92, 1.83, 0.28, 2.01, 0.04, -0.12, 1.32, 5.09, 4.98, 1.79, 1.5, 3.11, 3.08]} \ No newline at end of file diff --git a/annotations_1/8mDtsn0yrsA_filtered.json b/annotations_1/8mDtsn0yrsA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64be46bd30a1dfa57871130129c118574ed53ae8 --- /dev/null +++ b/annotations_1/8mDtsn0yrsA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.43], [24.0, 23.55], [24.0, 25.32], [27.0, 27.28], [28.0, 29.0], [36.0, 38.57], [42.0, 42.82], [54.0, 58.35], [70.0, 69.84], [77.0, 82.17], [84.0, 85.23], [86.0, 89.85], [93.0, 93.16], [95.0, 95.64], [98.0, 108.89]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, true, false, false, true], "silence_prob": [43.35, 0.0, 0.0, 0.0, 0.0, 32.96, 0.0, 32.5, 0.0, 31.46, 0.0, 31.95, 0.0, 0.0, 31.83], "audiomae_on_audioset": [[["music", 47.54], ["hum", 10.38], ["synthesizer", 6.19]], null, null, null, null, [["music", 59.94], ["speech", 15.38], ["boing", 3.82]], null, [["boing", 58.94], ["music", 23.08], ["speech", 10.4]], null, [["music", 35.73], ["livestock, farm animals, working animals", 14.55], ["cattle, bovinae", 5.66]], null, [["music", 40.13], ["groan", 7.27], ["bleat", 5.42]], null, null, [["music", 20.03], ["livestock, farm animals, working animals", 18.65], ["speech", 12.11]]], "duration": [2.43, -0.45, 1.32, 0.28, 1.0, 2.57, 0.82, 4.35, -0.16, 5.17, 1.23, 3.85, 0.16, 0.64, 10.89]} \ No newline at end of file diff --git a/annotations_1/8myhALdcfvI_filtered.json b/annotations_1/8myhALdcfvI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02eba856bc3004f2ff4171fdd87eb9a7f3109a2f --- /dev/null +++ b/annotations_1/8myhALdcfvI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.41], [14.0, 13.98], [18.0, 18.08], [21.0, 21.44], [23.0, 24.95], [31.0, 31.01], [34.0, 35.97], [38.0, 40.39], [42.0, 42.74], [45.0, 46.01], [52.0, 52.0], [56.0, 57.16], [60.0, 60.52], [62.0, 63.75], [64.0, 64.99], [69.0, 70.66], [83.0, 84.01], [86.0, 87.88], [89.0, 91.15], [103.0, 105.11], [106.0, 114.29], [117.0, 119.31], [125.0, 129.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 85.54, 50.46, 63.64, 83.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.41, -0.02, 0.08, 0.44, 1.95, 0.01, 1.97, 2.39, 0.74, 1.01, 0.0, 1.16, 0.52, 1.75, 0.99, 1.66, 1.01, 1.88, 2.15, 2.11, 8.29, 2.31, 4.41]} \ No newline at end of file diff --git a/annotations_1/8n6mcd5Odj8_filtered.json b/annotations_1/8n6mcd5Odj8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fd52794a68b5867d8868a4d659ad11b15e05c34 --- /dev/null +++ b/annotations_1/8n6mcd5Odj8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 33.13], [34.0, 34.32], [36.0, 38.38], [39.0, 79.76], [82.0, 83.91], [90.0, 92.2], [93.0, 93.56], [95.0, 96.42], [100.0, 101.75], [102.0, 106.0], [109.0, 110.59], [117.0, 117.21], [120.0, 120.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.97, 0.0, 32.45, 0.0, 0.0, 42.08, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 78.37], ["electronic music", 4.88], ["throbbing", 3.65]], null, [["music", 62.62], ["throbbing", 21.24], ["hum", 5.83]], null, null, [["speech", 63.58], ["music", 5.85], ["vehicle", 2.58]], null, null, null, null, null, null, null], "duration": [6.13, 0.32, 2.38, 40.76, 1.91, 2.2, 0.56, 1.42, 1.75, 4.0, 1.59, 0.21, 0.77]} \ No newline at end of file diff --git a/annotations_1/8oq28m4uqe8_filtered.json b/annotations_1/8oq28m4uqe8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d927423e72bb317b25e7b9e9b17397979067d45 --- /dev/null +++ b/annotations_1/8oq28m4uqe8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [7.0, 12.45], [15.0, 14.61], [16.0, 16.53], [18.0, 17.81], [19.0, 19.33], [20.0, 24.61], [27.0, 38.82], [40.0, 42.9], [45.0, 46.43], [48.0, 79.86], [80.0, 81.85], [84.0, 113.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 53.22, 0.0, 0.0, 0.0, 0.0, 81.17, 56.63, 72.9, 0.0, 0.0, 0.0, 31.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 59.85], ["music", 13.23], ["buzz", 5.83]]], "duration": [0.44, 5.45, -0.39, 0.53, -0.19, 0.33, 4.61, 11.82, 2.9, 1.43, 31.86, 1.85, 29.43]} \ No newline at end of file diff --git a/annotations_1/8osP7KRacWk_filtered.json b/annotations_1/8osP7KRacWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2ef4bd6f699db9d2092df0d8c693dda7fa349e3 --- /dev/null +++ b/annotations_1/8osP7KRacWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 35.43], [37.0, 37.61], [39.0, 48.14], [49.0, 50.11], [51.0, 51.49], [53.0, 53.6], [57.0, 58.21], [59.0, 60.05], [63.0, 78.06], [78.0, 79.64], [81.0, 84.94], [86.0, 88.01], [89.0, 89.51], [90.0, 91.03], [93.0, 95.32], [102.0, 103.57], [105.0, 104.92], [107.0, 107.18], [112.0, 112.11], [120.0, 121.15], [122.0, 123.82], [124.0, 130.11], [131.0, 131.62], [134.0, 136.19], [137.0, 139.62]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 39.74, 0.0, 0.0, 0.0, 0.0, 0.0, 30.75, 0.0, 44.49, 52.27, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.67, 0.0, 46.15, 37.3], "audiomae_on_audioset": [null, null, [["music", 50.08], ["fart", 11.09], ["speech", 7.97]], null, null, null, null, null, [["music", 44.26], ["theremin", 27.52], ["musical instrument", 3.78]], null, [["music", 45.41], ["speech", 13.24], ["musical instrument", 3.97]], null, null, null, null, null, null, null, null, null, null, [["speech", 42.21], ["music", 13.47], ["burst, pop", 11.65]], null, [["music", 26.95], ["speech", 26.15], ["brass instrument", 6.07]], [["speech", 33.34], ["foghorn", 13.07], ["music", 5.82]]], "duration": [0.43, 0.61, 9.14, 1.11, 0.49, 0.6, 1.21, 1.05, 15.06, 1.64, 3.94, 2.01, 0.51, 1.03, 2.32, 1.57, -0.08, 0.18, 0.11, 1.15, 1.82, 6.11, 0.62, 2.19, 2.62]} \ No newline at end of file diff --git a/annotations_1/8p1gevM0y-I_filtered.json b/annotations_1/8p1gevM0y-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0e7fcd18ccc18dd3c8cb9dcdcfdb94832595c80 --- /dev/null +++ b/annotations_1/8p1gevM0y-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.73], [6.0, 6.2], [7.0, 7.59], [10.0, 10.61], [17.0, 17.78], [24.0, 25.62], [29.0, 29.96], [33.0, 33.74], [34.0, 35.09], [36.0, 36.63], [37.0, 37.61], [39.0, 39.53], [40.0, 41.4], [42.0, 42.21], [43.0, 44.34], [46.0, 47.29], [49.0, 50.03], [56.0, 56.54], [58.0, 57.67], [58.0, 58.82], [62.0, 63.53], [64.0, 65.84], [67.0, 67.66], [69.0, 69.96], [73.0, 73.23], [86.0, 89.46], [92.0, 94.27], [101.0, 102.34], [104.0, 104.52], [108.0, 108.38], [112.0, 113.73], [117.0, 116.9], [121.0, 121.95], [123.0, 122.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [57.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.74, 51.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.17], ["radio", 11.94], ["sidetone", 8.19]], null, null, null, null, null, null, null, null], "duration": [2.73, 0.2, 0.59, 0.61, 0.78, 1.62, 0.96, 0.74, 1.09, 0.63, 0.61, 0.53, 1.4, 0.21, 1.34, 1.29, 1.03, 0.54, -0.33, 0.82, 1.53, 1.84, 0.66, 0.96, 0.23, 3.46, 2.27, 1.34, 0.52, 0.38, 1.73, -0.1, 0.95, -0.06]} \ No newline at end of file diff --git a/annotations_1/8p6L3Vl8ezA_filtered.json b/annotations_1/8p6L3Vl8ezA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dafcb9ffcfa7408a6c82dc67a6aca6901650e19 --- /dev/null +++ b/annotations_1/8p6L3Vl8ezA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.16], [8.0, 11.42], [12.0, 13.42], [15.0, 16.68], [18.0, 20.66], [22.0, 41.0], [45.0, 48.34], [53.0, 53.76], [55.0, 59.64], [62.0, 65.25], [68.0, 71.04], [72.0, 72.91], [74.0, 76.72], [80.0, 92.38], [94.0, 99.12], [99.0, 99.89], [100.0, 102.83], [105.0, 147.23], [153.0, 172.2]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [78.04, 47.05, 0.0, 0.0, 81.71, 53.47, 42.11, 0.0, 92.97, 95.37, 96.42, 0.0, 99.1, 70.86, 47.86, 0.0, 37.86, 0.0, 35.53], "audiomae_on_audioset": [null, [["speech", 28.99], ["didgeridoo", 11.08], ["hum", 8.31]], null, null, null, null, [["speech", 20.98], ["music", 19.79], ["didgeridoo", 18.12]], null, null, null, null, null, null, null, [["speech", 68.96], ["sidetone", 15.21], ["music", 2.97]], null, [["speech", 45.66], ["hum", 10.2], ["chirp tone", 4.78]], null, [["beatboxing", 34.03], ["speech", 14.55], ["whack, thwack", 10.36]]], "duration": [2.16, 3.42, 1.42, 1.68, 2.66, 19.0, 3.34, 0.76, 4.64, 3.25, 3.04, 0.91, 2.72, 12.38, 5.12, 0.89, 2.83, 42.23, 19.2]} \ No newline at end of file diff --git a/annotations_1/8pDCGWKvBlk_filtered.json b/annotations_1/8pDCGWKvBlk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21ab353501a894ee72b87b9235536cf1ce2330db --- /dev/null +++ b/annotations_1/8pDCGWKvBlk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 81.33], [82.0, 100.55], [101.0, 105.06], [106.0, 106.95], [108.0, 108.53], [111.0, 112.13], [114.0, 117.05], [119.0, 123.9], [124.0, 124.55], [126.0, 126.18], [127.0, 150.18], [151.0, 153.5], [155.0, 156.3]], "keep_status": [false, true, true, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 40.09, 33.7, 0.0, 0.0, 0.0, 43.61, 33.67, 0.0, 0.0, 53.28, 72.01, 0.0], "audiomae_on_audioset": [null, [["music", 42.75], ["speech", 17.22], ["electronic music", 4.4]], [["speech", 14.13], ["music", 9.48], ["didgeridoo", 8.84]], null, null, null, [["speech", 12.28], ["animal", 5.36], ["sound effect", 4.57]], [["hum", 27.91], ["mains hum", 19.05], ["speech", 6.74]], null, null, null, null, null], "duration": [67.33, 18.55, 4.06, 0.95, 0.53, 1.13, 3.05, 4.9, 0.55, 0.18, 23.18, 2.5, 1.3]} \ No newline at end of file diff --git a/annotations_1/8qkahQVFzMI_filtered.json b/annotations_1/8qkahQVFzMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26efd2195c5712fccbc947697dde842717e93e16 --- /dev/null +++ b/annotations_1/8qkahQVFzMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.83], [14.0, 14.47], [16.0, 25.44], [29.0, 48.3], [52.0, 62.51], [65.0, 117.56], [119.0, 143.68], [144.0, 144.61]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 34.54, 33.75, 32.55, 0.0, 31.99, 0.0], "audiomae_on_audioset": [null, null, [["speech", 37.31], ["music", 23.14], ["sidetone", 15.21]], [["music", 51.42], ["trombone", 15.29], ["brass instrument", 10.09]], [["music", 65.8], ["musical instrument", 10.03], ["synthesizer", 4.26]], null, [["music", 32.49], ["distortion", 7.95], ["effects unit", 7.88]], null], "duration": [1.83, 0.47, 9.44, 19.3, 10.51, 52.56, 24.68, 0.61]} \ No newline at end of file diff --git a/annotations_1/8rX7fkDLEx0_filtered.json b/annotations_1/8rX7fkDLEx0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d49f81dfd5fd01c25f4b9d4b94007960fc52eab --- /dev/null +++ b/annotations_1/8rX7fkDLEx0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.92], [12.0, 15.92], [18.0, 21.66], [25.0, 25.0], [26.0, 29.25], [38.0, 40.73], [41.0, 41.08], [41.0, 41.32], [45.0, 46.57], [47.0, 50.38], [51.0, 56.3], [68.0, 67.96], [70.0, 82.65], [84.0, 88.79], [93.0, 93.99], [98.0, 97.8], [99.0, 100.99], [103.0, 110.94], [113.0, 115.8], [123.0, 127.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false], "silence_prob": [0.0, 35.56, 36.27, 0.0, 35.93, 37.21, 0.0, 0.0, 0.0, 34.59, 31.36, 0.0, 30.95, 32.27, 0.0, 0.0, 0.0, 28.55, 28.51, 29.39], "audiomae_on_audioset": [null, [["music", 52.45], ["boing", 23.79], ["frog", 2.46]], [["music", 50.02], ["speech", 14.57], ["radio", 14.1]], null, [["music", 69.97], ["musical instrument", 6.07], ["guitar", 5.62]], [["music", 74.63], ["musical instrument", 6.11], ["synthesizer", 5.91]], null, null, null, [["music", 50.25], ["beatboxing", 14.16], ["musical instrument", 6.38]], [["speech", 42.06], ["fart", 24.94], ["fly, housefly", 4.18]], null, [["music", 60.26], ["throbbing", 15.92], ["hum", 8.06]], [["music", 31.25], ["speech", 16.23], ["hum", 15.4]], null, null, null, [["music", 33.66], ["speech", 13.63], ["throbbing", 10.11]], [["throbbing", 13.54], ["music", 13.37], ["vehicle", 10.73]], [["hum", 36.69], ["throbbing", 35.63], ["music", 10.32]]], "duration": [0.92, 3.92, 3.66, 0.0, 3.25, 2.73, 0.08, 0.32, 1.57, 3.38, 5.3, -0.04, 12.65, 4.79, 0.99, -0.2, 1.99, 7.94, 2.8, 4.65]} \ No newline at end of file diff --git a/annotations_1/8rlAQ3q4RDk_filtered.json b/annotations_1/8rlAQ3q4RDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db340b7499a305f82f97fae4838c2b32736f292a --- /dev/null +++ b/annotations_1/8rlAQ3q4RDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.58], [10.0, 11.04], [15.0, 24.51], [25.0, 39.63], [40.0, 51.87], [54.0, 66.14], [67.0, 80.6], [90.0, 94.59], [99.0, 103.96], [105.0, 109.16], [110.0, 113.68], [114.0, 128.29], [129.0, 132.65]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [92.15, 0.0, 85.9, 59.15, 98.59, 63.42, 69.61, 43.93, 100.0, 100.0, 99.05, 35.44, 98.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["noise", 15.32], ["speech", 10.86], ["music", 7.74]], null, null, null, [["animal", 15.91], ["rumble", 10.53], ["speech", 8.13]], null], "duration": [6.58, 1.04, 9.51, 14.63, 11.87, 12.14, 13.6, 4.59, 4.96, 4.16, 3.68, 14.29, 3.65]} \ No newline at end of file diff --git a/annotations_1/8sURhgulh7E_filtered.json b/annotations_1/8sURhgulh7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4f73081e793e1cc145843d72901207fb96017c4 --- /dev/null +++ b/annotations_1/8sURhgulh7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 44.76], [53.0, 52.57], [56.0, 56.12], [58.0, 59.22], [64.0, 80.23], [82.0, 86.0], [86.0, 87.62], [93.0, 93.55], [95.0, 95.37], [96.0, 104.06], [113.0, 113.1], [114.0, 128.31], [130.0, 130.96], [132.0, 133.83], [136.0, 136.26], [140.0, 141.3], [143.0, 143.87], [146.0, 146.58], [148.0, 150.89], [153.0, 153.6], [156.0, 157.35], [160.0, 159.78]], "keep_status": [true, false, false, false, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.18, 0.0, 0.0, 0.0, 28.98, 31.1, 0.0, 0.0, 0.0, 29.17, 0.0, 31.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 58.75], ["speech", 6.83], ["hum", 3.99]], null, null, null, [["music", 22.47], ["speech", 15.59], ["throbbing", 14.38]], [["music", 37.3], ["speech", 23.28], ["boing", 4.47]], null, null, null, [["music", 44.12], ["whack, thwack", 25.69], ["speech", 8.22]], null, [["fly, housefly", 29.06], ["mosquito", 23.18], ["speech", 14.39]], null, null, null, null, null, null, null, null, null, null], "duration": [23.76, -0.43, 0.12, 1.22, 16.23, 4.0, 1.62, 0.55, 0.37, 8.06, 0.1, 14.31, 0.96, 1.83, 0.26, 1.3, 0.87, 0.58, 2.89, 0.6, 1.35, -0.22]} \ No newline at end of file diff --git a/annotations_1/8tFrGaU6p5U_filtered.json b/annotations_1/8tFrGaU6p5U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbe453a434b7a2c42070e83e2817aa3918579c63 --- /dev/null +++ b/annotations_1/8tFrGaU6p5U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.18], [22.0, 23.16], [26.0, 27.11], [30.0, 30.54], [34.0, 34.91], [37.0, 58.04], [63.0, 64.86], [68.0, 69.01], [70.0, 72.54], [73.0, 77.41], [79.0, 81.23], [83.0, 83.98], [86.0, 86.31], [88.0, 88.47], [98.0, 98.17], [100.0, 100.67], [104.0, 104.21], [105.0, 105.19], [106.0, 106.64], [117.0, 117.22], [119.0, 120.9], [122.0, 122.5], [129.0, 129.24], [131.0, 133.78], [135.0, 137.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 44.01, 0.0, 0.0, 100.0, 82.07, 94.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.33, 79.07], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 48.26], ["telephone bell ringing", 27.7], ["telephone", 22.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 19.08], ["gunshot, gunfire", 16.77], ["artillery fire", 10.22]], null], "duration": [1.18, 1.16, 1.11, 0.54, 0.91, 21.04, 1.86, 1.01, 2.54, 4.41, 2.23, 0.98, 0.31, 0.47, 0.17, 0.67, 0.21, 0.19, 0.64, 0.22, 1.9, 0.5, 0.24, 2.78, 2.57]} \ No newline at end of file diff --git a/annotations_1/8tLhtdDVqzg_filtered.json b/annotations_1/8tLhtdDVqzg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d604f99b29279d99838f30e0b114476a7cf24d8e --- /dev/null +++ b/annotations_1/8tLhtdDVqzg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.59], [6.0, 7.25], [9.0, 19.92], [24.0, 24.49], [26.0, 31.53], [36.0, 36.17], [36.0, 38.03], [44.0, 45.69], [55.0, 56.91], [61.0, 66.87], [69.0, 72.3], [73.0, 83.83], [98.0, 99.18], [101.0, 106.07], [111.0, 110.78], [116.0, 116.7], [118.0, 118.08], [119.0, 119.6], [125.0, 125.59], [130.0, 130.52], [131.0, 130.76], [131.0, 131.82], [135.0, 136.24], [137.0, 138.47], [144.0, 144.48], [148.0, 148.88], [153.0, 154.75], [155.0, 155.24], [156.0, 157.37], [159.0, 159.48], [161.0, 165.15], [166.0, 166.06], [167.0, 182.04], [182.0, 183.95]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 32.21, 0.0, 30.9, 0.0, 31.68, 0.0, 0.0, 28.81, 29.24, 29.92, 0.0, 39.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.04, 0.0, 78.89, 0.0], "audiomae_on_audioset": [null, null, [["music", 59.74], ["didgeridoo", 12.77], ["theremin", 10.83]], null, [["music", 75.39], ["country", 5.73], ["musical instrument", 2.5]], null, [["music", 50.1], ["musical instrument", 7.52], ["plucked string instrument", 6.79]], null, null, [["music", 66.59], ["singing", 4.12], ["yodeling", 2.72]], [["music", 76.03], ["country", 3.32], ["singing", 2.66]], [["music", 61.24], ["didgeridoo", 4.86], ["speech", 4.47]], null, [["thunk", 45.3], ["fly, housefly", 10.46], ["whack, thwack", 5.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 20.37], ["noise", 18.28], ["thunk", 9.44]], null, null, null], "duration": [0.59, 1.25, 10.92, 0.49, 5.53, 0.17, 2.03, 1.69, 1.91, 5.87, 3.3, 10.83, 1.18, 5.07, -0.22, 0.7, 0.08, 0.6, 0.59, 0.52, -0.24, 0.82, 1.24, 1.47, 0.48, 0.88, 1.75, 0.24, 1.37, 0.48, 4.15, 0.06, 15.04, 1.95]} \ No newline at end of file diff --git a/annotations_1/8ty1025m6XQ_filtered.json b/annotations_1/8ty1025m6XQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ada83ac214cb3d352a513dd3939178b663f6c9b8 --- /dev/null +++ b/annotations_1/8ty1025m6XQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.62], [28.0, 28.54], [29.0, 30.32], [31.0, 30.81], [49.0, 49.79], [52.0, 53.94], [62.0, 69.16], [74.0, 79.93], [82.0, 84.01], [92.0, 98.79], [105.0, 105.41], [111.0, 111.52], [119.0, 119.08], [134.0, 140.7], [141.0, 144.8], [145.0, 145.94], [152.0, 159.22], [161.0, 168.34], [171.0, 174.24], [182.0, 182.09], [205.0, 205.06], [217.0, 218.37]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.13, 95.37, 45.27, 34.94, 0.0, 0.0, 0.0, 34.15, 30.73, 0.0, 34.98, 35.94, 35.07, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["fly, housefly", 33.95], ["mosquito", 23.43], ["insect", 15.94]], null, [["speech", 23.66], ["sheep", 11.06], ["animal", 7.99]], [["speech", 40.07], ["grunt", 34.92], ["groan", 21.29]], null, null, null, [["speech", 24.15], ["livestock, farm animals, working animals", 13.52], ["sheep", 13.06]], [["music", 35.25], ["theremin", 19.76], ["musical instrument", 9.94]], null, [["whale vocalization", 29.33], ["livestock, farm animals, working animals", 10.41], ["sound effect", 4.39]], [["whale vocalization", 14.17], ["speech", 13.22], ["animal", 10.65]], [["moo", 26.72], ["livestock, farm animals, working animals", 25.72], ["cattle, bovinae", 22.04]], null, null, null], "duration": [-0.38, 0.54, 1.32, -0.19, 0.79, 1.94, 7.16, 5.93, 2.01, 6.79, 0.41, 0.52, 0.08, 6.7, 3.8, 0.94, 7.22, 7.34, 3.24, 0.09, 0.06, 1.37]} \ No newline at end of file diff --git a/annotations_1/8v7xHt-CJZg_filtered.json b/annotations_1/8v7xHt-CJZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75882d861287f513c6298bb0f087bdb44dd309ef --- /dev/null +++ b/annotations_1/8v7xHt-CJZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.84], [5.0, 11.1], [11.0, 12.12], [14.0, 13.8], [15.0, 16.12], [20.0, 21.47], [26.0, 26.52], [44.0, 44.37], [57.0, 57.94], [105.0, 105.7], [109.0, 109.9], [114.0, 114.18], [126.0, 126.67]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 46.7], ["music", 9.45], ["hum", 5.52]], null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.16, 6.1, 1.12, -0.2, 1.12, 1.47, 0.52, 0.37, 0.94, 0.7, 0.9, 0.18, 0.67]} \ No newline at end of file diff --git a/annotations_1/8wY9r2cpbxQ_filtered.json b/annotations_1/8wY9r2cpbxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..504217a9b89f7591bb3e4b42361eda48d18ffd5e --- /dev/null +++ b/annotations_1/8wY9r2cpbxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 21.76], [25.0, 54.36], [56.0, 60.51], [62.0, 64.23], [65.0, 66.33], [68.0, 72.96], [74.0, 80.59], [83.0, 92.53]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [86.82, 59.15, 50.26, 48.19, 0.0, 50.86, 59.86, 54.7], "audiomae_on_audioset": [null, null, null, [["music", 16.2], ["singing bowl", 13.82], ["mains hum", 7.79]], null, null, null, null], "duration": [5.76, 29.36, 4.51, 2.23, 1.33, 4.96, 6.59, 9.53]} \ No newline at end of file diff --git a/annotations_1/8wduU3eU6XQ_filtered.json b/annotations_1/8wduU3eU6XQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a77ed751bdb7952eefa63dddd9339c66ff13807 --- /dev/null +++ b/annotations_1/8wduU3eU6XQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[149.0, 149.69], [150.0, 151.44], [153.0, 159.29], [160.0, 160.15], [161.0, 176.44], [177.0, 185.87], [186.0, 186.31], [186.0, 186.44]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 65.55, 0.0, 67.38, 80.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.69, 1.44, 6.29, 0.15, 15.44, 8.87, 0.31, 0.44]} \ No newline at end of file diff --git a/annotations_1/8xZ0jOhAHMk_filtered.json b/annotations_1/8xZ0jOhAHMk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f290c215a33b9749dbede55f40a6ec8628b1d4c --- /dev/null +++ b/annotations_1/8xZ0jOhAHMk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [5.0, 6.66], [16.0, 15.92], [16.0, 16.01], [23.0, 25.93], [34.0, 34.48], [38.0, 38.4], [40.0, 41.39], [45.0, 45.69], [48.0, 53.22], [56.0, 67.29], [68.0, 75.39], [80.0, 80.28], [83.0, 87.13], [91.0, 91.61], [94.0, 93.85], [97.0, 101.58], [103.0, 104.14], [107.0, 108.04], [111.0, 111.16], [114.0, 126.84], [143.0, 148.26], [149.0, 149.67]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.85, 0.0, 0.0, 0.0, 0.0, 31.04, 30.09, 29.92, 0.0, 30.01, 0.0, 0.0, 31.76, 0.0, 0.0, 0.0, 29.31, 29.03, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 38.72], ["speech", 16.54], ["laughter", 4.56]], null, null, null, null, [["music", 60.93], ["speech", 11.49], ["hum", 3.58]], [["music", 36.96], ["skidding", 18.3], ["vehicle", 6.37]], [["hum", 22.13], ["music", 11.72], ["throbbing", 11.06]], null, [["speech", 24.3], ["music", 18.7], ["hum", 7.5]], null, null, [["music", 69.93], ["hum", 3.71], ["theremin", 2.72]], null, null, null, [["music", 63.41], ["hum", 7.44], ["electronic music", 6.54]], [["speech", 58.96], ["music", 14.27], ["explosion", 2.54]], null], "duration": [0.35, 1.66, -0.08, 0.01, 2.93, 0.48, 0.4, 1.39, 0.69, 5.22, 11.29, 7.39, 0.28, 4.13, 0.61, -0.15, 4.58, 1.14, 1.04, 0.16, 12.84, 5.26, 0.67]} \ No newline at end of file diff --git a/annotations_1/8xgUm0plA8w_filtered.json b/annotations_1/8xgUm0plA8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a1b34e1f050426739015be02ffed64553a0e466 --- /dev/null +++ b/annotations_1/8xgUm0plA8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.41], [16.0, 22.13], [26.0, 27.16], [28.0, 35.55], [37.0, 38.91], [43.0, 47.04], [48.0, 50.8], [51.0, 61.03], [67.0, 68.86], [69.0, 73.57], [78.0, 83.98], [88.0, 88.82], [98.0, 100.31], [106.0, 106.83]], "keep_status": [false, true, false, true, false, false, true, true, false, true, true, false, true, false], "silence_prob": [33.03, 31.3, 0.0, 31.52, 0.0, 68.28, 30.94, 30.89, 0.0, 31.47, 31.15, 0.0, 31.82, 0.0], "audiomae_on_audioset": [[["hum", 39.27], ["throbbing", 18.36], ["music", 14.29]], [["music", 29.1], ["speech", 27.78], ["buzz", 4.08]], null, [["music", 28.16], ["hum", 20.28], ["buzz", 16.16]], null, null, [["livestock, farm animals, working animals", 18.45], ["music", 14.14], ["cattle, bovinae", 12.89]], [["fly, housefly", 27.49], ["speech", 24.36], ["insect", 10.61]], null, [["speech", 23.74], ["music", 22.7], ["theremin", 12.87]], [["music", 32.49], ["speech", 13.91], ["brass instrument", 13.57]], null, [["speech", 23.65], ["sheep", 16.36], ["crowd", 6.37]], null], "duration": [2.41, 6.13, 1.16, 7.55, 1.91, 4.04, 2.8, 10.03, 1.86, 4.57, 5.98, 0.82, 2.31, 0.83]} \ No newline at end of file diff --git a/annotations_1/8xorDb45ajE_filtered.json b/annotations_1/8xorDb45ajE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e7e9419c36f070f34882a3dfa416ff6f6f9c039 --- /dev/null +++ b/annotations_1/8xorDb45ajE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.55], [5.0, 6.13], [10.0, 48.0], [50.0, 50.85], [54.0, 54.85], [59.0, 61.06]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 53.4], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.55, 1.13, 38.0, 0.85, 0.85, 2.06]} \ No newline at end of file diff --git a/annotations_1/8yACSHANED0_filtered.json b/annotations_1/8yACSHANED0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc982af7b955d080ce8bff3cddb692e852f101f4 --- /dev/null +++ b/annotations_1/8yACSHANED0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.91], [11.0, 12.07], [12.0, 31.51], [32.0, 36.24], [37.0, 42.47], [47.0, 52.02], [55.0, 58.7], [63.0, 67.24], [68.0, 80.45], [81.0, 81.41], [85.0, 107.84], [110.0, 110.24], [111.0, 119.15], [120.0, 120.41], [122.0, 134.77], [135.0, 142.57], [145.0, 145.42], [147.0, 147.53], [152.0, 152.71], [153.0, 158.73]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [62.17, 0.0, 79.41, 96.66, 42.24, 36.25, 32.89, 31.88, 31.3, 0.0, 36.03, 0.0, 34.63, 0.0, 33.75, 34.3, 0.0, 0.0, 0.0, 32.51], "audiomae_on_audioset": [null, null, null, null, [["music", 60.82], ["musical instrument", 3.64], ["cello", 2.51]], [["music", 69.6], ["ice cream truck, ice cream van", 8.91], ["vehicle", 2.4]], [["music", 79.16], ["electronic music", 3.51], ["musical instrument", 0.79]], [["music", 70.21], ["synthesizer", 6.65], ["electronic music", 4.94]], [["marimba, xylophone", 32.21], ["music", 31.63], ["percussion", 9.83]], null, [["music", 86.44], ["ice cream truck, ice cream van", 2.28], ["middle eastern music", 1.53]], null, [["gong", 37.12], ["music", 25.03], ["ambient music", 7.51]], null, [["music", 92.8], ["musical instrument", 0.91], ["music of latin america", 0.62]], [["music", 72.08], ["theremin", 6.81], ["musical instrument", 2.14]], null, null, null, [["music", 72.58], ["gong", 4.65], ["musical instrument", 2.54]]], "duration": [3.91, 1.07, 19.51, 4.24, 5.47, 5.02, 3.7, 4.24, 12.45, 0.41, 22.84, 0.24, 8.15, 0.41, 12.77, 7.57, 0.42, 0.53, 0.71, 5.73]} \ No newline at end of file diff --git a/annotations_1/8zMlPNdRRLY_filtered.json b/annotations_1/8zMlPNdRRLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4df73ddd3eb0936428697d47ac7aa5e7014e57da --- /dev/null +++ b/annotations_1/8zMlPNdRRLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.47], [8.0, 9.44], [15.0, 17.46], [21.0, 22.86], [24.0, 24.12], [25.0, 29.83], [31.0, 33.2], [36.0, 36.71], [37.0, 38.18], [45.0, 46.53], [48.0, 48.61], [51.0, 54.16], [60.0, 62.24], [68.0, 68.5], [73.0, 74.16], [75.0, 75.12], [77.0, 77.85], [84.0, 87.89], [94.0, 96.75], [98.0, 101.6], [103.0, 104.13], [105.0, 110.78], [112.0, 113.85], [132.0, 132.63], [150.0, 158.14], [159.0, 161.45]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [40.88, 0.0, 94.37, 0.0, 0.0, 85.9, 96.89, 0.0, 0.0, 0.0, 0.0, 57.09, 91.3, 0.0, 0.0, 0.0, 0.0, 70.86, 61.97, 80.64, 0.0, 90.08, 0.0, 0.0, 52.8, 47.9], "audiomae_on_audioset": [[["hum", 24.99], ["speech", 17.92], ["music", 17.08]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.48], ["music", 13.61], ["rumble", 9.53]]], "duration": [2.47, 1.44, 2.46, 1.86, 0.12, 4.83, 2.2, 0.71, 1.18, 1.53, 0.61, 3.16, 2.24, 0.5, 1.16, 0.12, 0.85, 3.89, 2.75, 3.6, 1.13, 5.78, 1.85, 0.63, 8.14, 2.45]} \ No newline at end of file diff --git a/annotations_1/8zYGzyIpue8_filtered.json b/annotations_1/8zYGzyIpue8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e86fe8e43d3bdf5d149c9a0d0867aa95e7baca12 --- /dev/null +++ b/annotations_1/8zYGzyIpue8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 42.47], [44.0, 64.02], [65.0, 76.13], [77.0, 84.65], [89.0, 93.87], [98.0, 99.15], [100.0, 108.13], [109.0, 115.42]], "keep_status": [false, false, true, true, false, false, true, false], "silence_prob": [0.0, 28.53, 28.15, 28.45, 28.83, 0.0, 28.59, 29.15], "audiomae_on_audioset": [null, [["speech", 49.5], ["music", 19.86], ["hum", 10.78]], [["music", 40.04], ["throbbing", 11.9], ["hum", 9.5]], [["music", 27.96], ["whack, thwack", 21.38], ["sound effect", 5.76]], [["music", 58.97], ["fly, housefly", 7.97], ["insect", 6.25]], null, [["vehicle", 20.29], ["music", 6.96], ["sound effect", 6.22]], [["music", 30.96], ["vehicle", 27.85], ["car", 12.64]]], "duration": [1.47, 20.02, 11.13, 7.65, 4.87, 1.15, 8.13, 6.42]} \ No newline at end of file diff --git a/annotations_1/90j6V8EjSuI_filtered.json b/annotations_1/90j6V8EjSuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b22f11d4fa693caf6ff6a02311ba591cdd41c950 --- /dev/null +++ b/annotations_1/90j6V8EjSuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.37], [3.0, 2.84], [8.0, 8.87], [10.0, 10.77], [14.0, 14.66], [17.0, 17.52], [19.0, 20.34], [26.0, 26.64], [28.0, 29.93], [31.0, 43.41], [47.0, 48.07], [49.0, 49.52], [50.0, 50.58], [54.0, 56.49], [59.0, 59.95], [61.0, 66.63], [67.0, 68.89], [70.0, 72.91], [74.0, 75.14], [77.0, 81.68], [82.0, 89.43], [91.0, 90.93], [95.0, 112.5], [113.0, 113.49], [116.0, 118.4], [122.0, 125.52], [131.0, 135.57], [137.0, 137.71], [142.0, 144.29]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.23, 0.0, 0.0, 0.0, 57.32, 0.0, 37.56, 0.0, 47.5, 0.0, 54.5, 45.49, 0.0, 33.5, 0.0, 42.65, 33.77, 36.61, 0.0, 91.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 33.03], ["throbbing", 15.25], ["hum", 13.61]], null, null, null, null, null, [["crushing", 25.69], ["fly, housefly", 16.08], ["hum", 14.56]], null, [["speech", 42.99], ["music", 22.86], ["musical instrument", 3.12]], null, null, [["speech", 27.08], ["hum", 23.94], ["mains hum", 15.58]], null, [["music", 60.34], ["musical instrument", 11.51], ["drum", 4.47]], null, [["speech", 22.94], ["music", 15.37], ["hum", 9.68]], [["music", 45.85], ["musical instrument", 16.77], ["plucked string instrument", 9.05]], [["music", 49.53], ["musical instrument", 15.52], ["plucked string instrument", 9.67]], null, null], "duration": [0.37, -0.16, 0.87, 0.77, 0.66, 0.52, 1.34, 0.64, 1.93, 12.41, 1.07, 0.52, 0.58, 2.49, 0.95, 5.63, 1.89, 2.91, 1.14, 4.68, 7.43, -0.07, 17.5, 0.49, 2.4, 3.52, 4.57, 0.71, 2.29]} \ No newline at end of file diff --git a/annotations_1/912ib1YghJ4_filtered.json b/annotations_1/912ib1YghJ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18b3831eed5f53ac2ad8d85c033afe3d8681e061 --- /dev/null +++ b/annotations_1/912ib1YghJ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.69], [14.0, 17.68], [24.0, 26.18], [34.0, 34.72], [38.0, 38.3], [40.0, 40.76], [47.0, 47.09], [47.0, 49.33], [51.0, 52.29], [57.0, 57.82], [58.0, 59.59], [60.0, 63.09], [63.0, 65.18], [65.0, 73.09], [73.0, 74.49], [75.0, 75.52], [76.0, 78.22], [79.0, 80.43], [81.0, 82.48], [83.0, 86.98], [87.0, 87.78], [92.0, 93.93], [96.0, 96.8], [100.0, 100.97], [105.0, 105.07], [133.0, 133.84], [134.0, 136.48], [137.0, 142.43], [143.0, 144.24], [145.0, 146.45], [147.0, 149.2], [151.0, 153.03], [167.0, 167.04]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, true, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 32.88, 38.59, 0.0, 0.0, 0.0, 0.0, 35.07, 0.0, 0.0, 0.0, 28.96, 31.69, 32.58, 0.0, 0.0, 37.92, 0.0, 0.0, 33.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.17, 32.72, 0.0, 0.0, 32.13, 37.97, 0.0], "audiomae_on_audioset": [null, [["moo", 11.97], ["sidetone", 9.92], ["cattle, bovinae", 8.04]], [["speech", 8.52], ["belly laugh", 6.83], ["whimper", 6.72]], null, null, null, null, [["baby laughter", 21.58], ["inside, small room", 17.33], ["laughter", 14.2]], null, null, null, [["music", 45.22], ["synthesizer", 8.16], ["electronic music", 5.33]], [["music", 48.18], ["speech", 8.36], ["boing", 4.58]], [["music", 32.42], ["speech", 31.18], ["livestock, farm animals, working animals", 4.37]], null, null, [["music", 47.78], ["speech", 11.25], ["sidetone", 6.8]], null, null, [["sidetone", 41.53], ["music", 30.69], ["speech", 16.65]], null, null, null, null, null, null, [["speech", 65.86], ["music", 7.6], ["whale vocalization", 3.44]], [["music", 58.46], ["hum", 8.77], ["throbbing", 4.43]], null, null, [["music", 34.41], ["hum", 24.47], ["mains hum", 18.19]], [["sidetone", 39.89], ["speech", 12.78], ["music", 11.91]], null], "duration": [0.69, 3.68, 2.18, 0.72, 0.3, 0.76, 0.09, 2.33, 1.29, 0.82, 1.59, 3.09, 2.18, 8.09, 1.49, 0.52, 2.22, 1.43, 1.48, 3.98, 0.78, 1.93, 0.8, 0.97, 0.07, 0.84, 2.48, 5.43, 1.24, 1.45, 2.2, 2.03, 0.04]} \ No newline at end of file diff --git a/annotations_1/91Z-_ujQGik_filtered.json b/annotations_1/91Z-_ujQGik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9365e444571adc647e854bcf802068c2729676c7 --- /dev/null +++ b/annotations_1/91Z-_ujQGik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.54], [16.0, 17.79], [20.0, 20.68], [33.0, 33.81], [35.0, 37.47], [40.0, 40.66], [41.0, 44.41], [58.0, 60.32], [73.0, 73.5], [76.0, 76.81], [79.0, 81.21], [82.0, 83.24], [85.0, 85.51], [90.0, 91.08], [93.0, 93.66], [96.0, 97.83], [104.0, 105.16], [106.0, 106.76], [109.0, 109.53], [112.0, 114.64]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.43, 0.0, 0.0, 0.0, 48.31, 0.0, 46.83, 51.23, 0.0, 0.0, 45.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.16], "audiomae_on_audioset": [null, null, null, null, [["speech", 44.9], ["crowd", 14.69], ["cheering", 8.69]], null, [["speech", 61.82], ["applause", 2.36], ["hum", 1.98]], null, null, null, [["speech", 41.07], ["fly, housefly", 24.1], ["insect", 14.06]], null, null, null, null, null, null, null, null, null], "duration": [2.54, 1.79, 0.68, 0.81, 2.47, 0.66, 3.41, 2.32, 0.5, 0.81, 2.21, 1.24, 0.51, 1.08, 0.66, 1.83, 1.16, 0.76, 0.53, 2.64]} \ No newline at end of file diff --git a/annotations_1/91nX46JsnlU_filtered.json b/annotations_1/91nX46JsnlU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af5c832f68c180f93c459f35552a5f42ec82fb4a --- /dev/null +++ b/annotations_1/91nX46JsnlU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.02], [23.0, 22.92], [32.0, 32.8], [34.0, 35.31], [52.0, 51.81], [60.0, 61.59], [68.0, 78.85], [81.0, 81.6], [89.0, 90.68], [104.0, 105.17], [106.0, 107.35], [125.0, 136.56], [150.0, 150.35], [154.0, 153.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.42, 0.0, 0.0, 0.0, 0.0, 35.11, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 58.03], ["speech", 17.23], ["boing", 2.98]], null, null], "duration": [0.02, -0.08, 0.8, 1.31, -0.19, 1.59, 10.85, 0.6, 1.68, 1.17, 1.35, 11.56, 0.35, -0.26]} \ No newline at end of file diff --git a/annotations_1/92lO2Bum7v4_filtered.json b/annotations_1/92lO2Bum7v4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4da9fd9f72804e66d62fc04e2c3efcc5840dddba --- /dev/null +++ b/annotations_1/92lO2Bum7v4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 50.08], [53.0, 53.32], [55.0, 60.61], [68.0, 68.44], [69.0, 69.79], [73.0, 76.45], [77.0, 77.31], [77.0, 84.45], [100.0, 109.16], [109.0, 114.56], [115.0, 115.3], [122.0, 126.23], [132.0, 135.78]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [30.15, 0.0, 30.12, 0.0, 0.0, 29.41, 0.0, 30.57, 30.63, 30.12, 0.0, 29.6, 29.74], "audiomae_on_audioset": [[["music", 58.46], ["electronic music", 4.0], ["house music", 3.81]], null, [["music", 75.48], ["electronic music", 2.6], ["dubstep", 1.37]], null, null, [["music", 68.88], ["singing", 2.42], ["electronic music", 2.33]], null, [["music", 91.43], ["jingle, tinkle", 0.73], ["singing", 0.47]], [["music", 75.52], ["theremin", 1.8], ["didgeridoo", 1.72]], [["music", 72.95], ["funny music", 3.49], ["soundtrack music", 2.5]], null, [["music", 61.21], ["throbbing", 5.18], ["electronic music", 4.52]], [["music", 51.56], ["rattle (instrument)", 3.57], ["fly, housefly", 3.16]]], "duration": [3.08, 0.32, 5.61, 0.44, 0.79, 3.45, 0.31, 7.45, 9.16, 5.56, 0.3, 4.23, 3.78]} \ No newline at end of file diff --git a/annotations_1/93U_80mhzVk_filtered.json b/annotations_1/93U_80mhzVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0e696d5f8cf50ad1f3a0b953d20d19bc38fbb20 --- /dev/null +++ b/annotations_1/93U_80mhzVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.52], [23.0, 23.58], [25.0, 60.15], [61.0, 81.72], [82.0, 82.44]], "keep_status": [false, false, false, false, false], "silence_prob": [29.81, 0.0, 0.0, 30.07, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 35.92], ["cattle, bovinae", 31.99], ["moo", 29.2]], null, null, [["sheep", 40.74], ["music", 20.58], ["bleat", 18.44]], null], "duration": [5.52, 0.58, 35.15, 20.72, 0.44]} \ No newline at end of file diff --git a/annotations_1/93qTzU2bNh8_filtered.json b/annotations_1/93qTzU2bNh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c3de0551b41a1d03c8126a34a92aefd417eae88 --- /dev/null +++ b/annotations_1/93qTzU2bNh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.75], [7.0, 7.57], [9.0, 10.29], [42.0, 43.36], [44.0, 44.31], [45.0, 45.79], [47.0, 48.07], [80.0, 80.59], [85.0, 85.23], [90.0, 90.64], [92.0, 91.86], [125.0, 124.98], [133.0, 133.0], [139.0, 156.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 69.42], ["musical instrument", 3.59], ["boing", 3.11]]], "duration": [0.75, 0.57, 1.29, 1.36, 0.31, 0.79, 1.07, 0.59, 0.23, 0.64, -0.14, -0.02, 0.0, 17.36]} \ No newline at end of file diff --git a/annotations_1/944BOVL_y_U_filtered.json b/annotations_1/944BOVL_y_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bed756d5b5c1b2f9436eb00edea2f96a35662e15 --- /dev/null +++ b/annotations_1/944BOVL_y_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.37], [14.0, 15.28], [18.0, 18.94], [29.0, 29.96], [35.0, 37.47], [51.0, 51.66], [58.0, 58.73], [59.0, 61.26], [64.0, 67.19], [74.0, 74.93], [98.0, 99.45], [101.0, 102.64], [104.0, 105.8], [107.0, 108.28], [112.0, 112.9], [121.0, 123.33], [125.0, 127.53], [128.0, 129.27], [130.0, 129.52], [135.0, 137.76], [139.0, 140.0], [141.0, 150.9], [156.0, 159.16], [167.0, 178.78], [183.0, 187.73], [188.0, 187.76]], "keep_status": [true, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [31.48, 0.0, 0.0, 0.0, 45.4, 0.0, 0.0, 36.75, 32.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.32, 31.88, 0.0, 0.0, 33.38, 0.0, 28.56, 28.24, 28.23, 28.46, 0.0], "audiomae_on_audioset": [[["hum", 23.03], ["whale vocalization", 15.99], ["sidetone", 13.19]], null, null, null, [["music", 22.54], ["hum", 8.12], ["gong", 7.72]], null, null, [["speech", 53.85], ["music", 7.51], ["hum", 6.81]], [["hum", 28.99], ["music", 20.97], ["throbbing", 16.71]], null, null, null, null, null, null, [["music", 66.51], ["synthesizer", 7.39], ["musical instrument", 4.83]], [["music", 61.78], ["musical instrument", 10.11], ["guitar", 7.21]], null, null, [["music", 61.83], ["synthesizer", 2.7], ["musical instrument", 2.53]], null, [["music", 56.02], ["hum", 15.54], ["mains hum", 7.94]], [["music", 41.32], ["hum", 6.54], ["vocal music", 4.86]], [["music", 41.94], ["didgeridoo", 19.95], ["hum", 10.21]], [["music", 67.25], ["theremin", 7.3], ["musical instrument", 5.2]], null], "duration": [3.37, 1.28, 0.94, 0.96, 2.47, 0.66, 0.73, 2.26, 3.19, 0.93, 1.45, 1.64, 1.8, 1.28, 0.9, 2.33, 2.53, 1.27, -0.48, 2.76, 1.0, 9.9, 3.16, 11.78, 4.73, -0.24]} \ No newline at end of file diff --git a/annotations_1/94J4AzRTLE8_filtered.json b/annotations_1/94J4AzRTLE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f0e006a68b3fb681a6f288a047e2503e55d8e0b --- /dev/null +++ b/annotations_1/94J4AzRTLE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.62], [10.0, 18.13], [19.0, 21.78], [23.0, 24.31], [25.0, 31.89], [33.0, 33.32], [35.0, 35.65], [37.0, 38.1], [40.0, 45.96], [50.0, 53.74], [56.0, 57.96], [60.0, 105.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.68, 58.47, 63.64, 0.0, 62.68, 0.0, 0.0, 0.0, 68.93, 63.31, 0.0, 0.0], "audiomae_on_audioset": [[["singing bowl", 52.42], ["chirp tone", 14.13], ["sine wave", 10.36]], null, null, null, null, null, null, null, null, null, null, null], "duration": [3.62, 8.13, 2.78, 1.31, 6.89, 0.32, 0.65, 1.1, 5.96, 3.74, 1.96, 45.12]} \ No newline at end of file diff --git a/annotations_1/94k4a1GI9rY_filtered.json b/annotations_1/94k4a1GI9rY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55740826abe93c0d02f456980524ea52f7d97024 --- /dev/null +++ b/annotations_1/94k4a1GI9rY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.75], [4.0, 4.55], [6.0, 6.0], [7.0, 7.77], [9.0, 9.41], [11.0, 12.8], [15.0, 15.11], [17.0, 18.08], [20.0, 20.43], [26.0, 28.34], [31.0, 34.92], [36.0, 37.34], [39.0, 39.51], [42.0, 42.31], [43.0, 43.93], [46.0, 46.06], [56.0, 56.1], [59.0, 61.37], [63.0, 62.78], [67.0, 66.77], [68.0, 68.96], [74.0, 75.54], [79.0, 81.4], [82.0, 82.54], [84.0, 85.83], [89.0, 90.56], [91.0, 93.01], [95.0, 96.08], [98.0, 98.25], [99.0, 102.1], [104.0, 104.26], [106.0, 111.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 76.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 60.14, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 48.87, 0.0, 59.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 20.92], ["throbbing", 9.08], ["noise", 8.85]], null, null], "duration": [0.75, 0.55, 0.0, 0.77, 0.41, 1.8, 0.11, 1.08, 0.43, 2.34, 3.92, 1.34, 0.51, 0.31, 0.93, 0.06, 0.1, 2.37, -0.22, -0.23, 0.96, 1.54, 2.4, 0.54, 1.83, 1.56, 2.01, 1.08, 0.25, 3.1, 0.26, 5.0]} \ No newline at end of file diff --git a/annotations_1/95FV_p0Rivo_filtered.json b/annotations_1/95FV_p0Rivo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d56b7481f83c90d2387824f11192af4e64a417ad --- /dev/null +++ b/annotations_1/95FV_p0Rivo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 37.29], [38.0, 41.12], [42.0, 43.28], [44.0, 44.86], [47.0, 48.09], [52.0, 64.27], [65.0, 66.23], [70.0, 69.85], [71.0, 71.27], [72.0, 72.59], [73.0, 77.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.1, 63.42, 0.0, 0.0, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0, 71.14], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [20.29, 3.12, 1.28, 0.86, 1.09, 12.27, 1.23, -0.15, 0.27, 0.59, 4.23]} \ No newline at end of file diff --git a/annotations_1/95N85bGdzw4_filtered.json b/annotations_1/95N85bGdzw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05d4d9aba0f5c03fb3dfd9cb2e8e183ce9ec3c23 --- /dev/null +++ b/annotations_1/95N85bGdzw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 17.95], [20.0, 23.89], [26.0, 35.06], [37.0, 40.86], [42.0, 44.39], [46.0, 54.65], [56.0, 58.7], [61.0, 63.31], [65.0, 65.62], [67.0, 69.58], [72.0, 79.89], [80.0, 90.93], [94.0, 95.34], [98.0, 98.85], [103.0, 103.25], [107.0, 108.94], [112.0, 112.99], [116.0, 119.99], [123.0, 124.77], [126.0, 142.82], [146.0, 147.97], [150.0, 153.27], [154.0, 157.54]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [33.34, 60.51, 99.8, 99.91, 86.64, 100.0, 99.99, 99.99, 0.0, 100.0, 99.97, 57.32, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 39.89, 0.0, 75.07, 84.43], "audiomae_on_audioset": [[["fly, housefly", 23.89], ["buzz", 21.75], ["insect", 19.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.02], ["musical instrument", 5.86], ["hum", 4.42]], null, null, null], "duration": [15.95, 3.89, 9.06, 3.86, 2.39, 8.65, 2.7, 2.31, 0.62, 2.58, 7.89, 10.93, 1.34, 0.85, 0.25, 1.94, 0.99, 3.99, 1.77, 16.82, 1.97, 3.27, 3.54]} \ No newline at end of file diff --git a/annotations_1/95fAKnIgqmM_filtered.json b/annotations_1/95fAKnIgqmM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44d5a0077e62ef474e1764e529a2b81a2328996d --- /dev/null +++ b/annotations_1/95fAKnIgqmM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.45], [13.0, 15.45], [17.0, 17.27], [40.0, 40.44], [42.0, 42.85], [44.0, 44.76], [51.0, 51.66], [53.0, 53.99], [56.0, 57.52], [69.0, 69.11], [74.0, 74.55], [81.0, 81.95], [84.0, 85.75], [106.0, 106.27], [108.0, 111.32], [112.0, 113.37], [125.0, 127.72], [138.0, 141.35], [145.0, 145.57], [147.0, 151.21], [153.0, 156.74], [159.0, 159.31], [160.0, 166.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, false, true], "silence_prob": [0.0, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 39.64, 41.3, 0.0, 33.05, 31.18, 0.0, 34.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["effects unit", 15.07], ["distortion", 13.94], ["reverberation", 10.74]], [["ding", 15.42], ["speech", 10.56], ["boing", 10.12]], null, [["music", 30.64], ["boing", 9.46], ["busy signal", 7.01]], [["music", 38.31], ["hum", 9.06], ["bleat", 4.58]], null, [["speech", 26.3], ["livestock, farm animals, working animals", 17.8], ["cattle, bovinae", 17.19]]], "duration": [0.45, 2.45, 0.27, 0.44, 0.85, 0.76, 0.66, 0.99, 1.52, 0.11, 0.55, 0.95, 1.75, 0.27, 3.32, 1.37, 2.72, 3.35, 0.57, 4.21, 3.74, 0.31, 6.63]} \ No newline at end of file diff --git a/annotations_1/961QhyKlg34_filtered.json b/annotations_1/961QhyKlg34_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29cf87a0a9483b5b498e4e00630624a2155184ca --- /dev/null +++ b/annotations_1/961QhyKlg34_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[90.0, 90.41], [92.0, 127.67], [128.0, 128.49], [132.0, 134.5]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 27.99], "audiomae_on_audioset": [null, null, null, [["zipper (clothing)", 31.25], ["sound effect", 19.22], ["vehicle", 7.82]]], "duration": [0.41, 35.67, 0.49, 2.5]} \ No newline at end of file diff --git a/annotations_1/96IU0EisCes_filtered.json b/annotations_1/96IU0EisCes_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a9160dc257049af418babeb286f3bc0b3d7fd59 --- /dev/null +++ b/annotations_1/96IU0EisCes_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.55], [10.0, 16.7], [19.0, 19.26], [22.0, 22.28], [23.0, 23.46], [27.0, 26.87], [28.0, 28.61], [29.0, 35.97], [42.0, 42.77], [48.0, 50.9], [52.0, 52.68], [55.0, 55.16], [59.0, 58.9], [61.0, 61.13], [70.0, 70.29], [72.0, 94.07], [95.0, 101.21], [105.0, 149.77], [151.0, 165.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 29.99, 29.77, 0.0, 43.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.23], ["sidetone", 21.39], ["speech", 14.07]], [["music", 34.52], ["didgeridoo", 32.98], ["musical instrument", 13.21]], null, [["music", 59.46], ["theremin", 12.44], ["musical instrument", 2.85]]], "duration": [0.55, 6.7, 0.26, 0.28, 0.46, -0.13, 0.61, 6.97, 0.77, 2.9, 0.68, 0.16, -0.1, 0.13, 0.29, 22.07, 6.21, 44.77, 14.92]} \ No newline at end of file diff --git a/annotations_1/96dlvQbYEds_filtered.json b/annotations_1/96dlvQbYEds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58c6a77baa1e0f35cee6b558edb6006634275d2e --- /dev/null +++ b/annotations_1/96dlvQbYEds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.39], [19.0, 20.41], [22.0, 22.37], [24.0, 24.78], [27.0, 28.22], [29.0, 30.03], [30.0, 35.72], [36.0, 37.37], [40.0, 40.09], [41.0, 43.8]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 0.0, 0.0, 47.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["fly, housefly", 30.07], ["insect", 17.42], ["bee, wasp, etc.", 12.06]]], "duration": [0.39, 1.41, 0.37, 0.78, 1.22, 1.03, 5.72, 1.37, 0.09, 2.8]} \ No newline at end of file diff --git a/annotations_1/96pSGRvBg3I_filtered.json b/annotations_1/96pSGRvBg3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea5593a8b5baf79444645d4c3e95cb8899c3e688 --- /dev/null +++ b/annotations_1/96pSGRvBg3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.99], [5.0, 16.95], [24.0, 25.95], [31.0, 32.61], [41.0, 49.81], [53.0, 60.47], [64.0, 84.1], [87.0, 89.63], [94.0, 95.55], [105.0, 123.9], [125.0, 144.58]], "keep_status": [false, true, false, false, false, true, true, true, false, true, false], "silence_prob": [0.0, 30.79, 0.0, 0.0, 29.25, 28.9, 28.6, 28.68, 0.0, 34.53, 56.03], "audiomae_on_audioset": [null, [["music", 43.97], ["clang", 10.2], ["ding", 8.17]], null, null, [["speech", 36.92], ["music", 31.12], ["didgeridoo", 5.79]], [["music", 40.93], ["speech", 12.55], ["animal", 5.6]], [["music", 34.44], ["livestock, farm animals, working animals", 9.39], ["electronic music", 5.38]], [["speech", 32.7], ["music", 15.59], ["whoosh, swoosh, swish", 8.9]], null, [["music", 25.54], ["synthesizer", 14.23], ["mosquito", 11.25]], null], "duration": [0.99, 11.95, 1.95, 1.61, 8.81, 7.47, 20.1, 2.63, 1.55, 18.9, 19.58]} \ No newline at end of file diff --git a/annotations_1/97qWmPkODZA_filtered.json b/annotations_1/97qWmPkODZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98f85bae6f95cc52f64e65b80eaa721a02674dbb --- /dev/null +++ b/annotations_1/97qWmPkODZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.61], [6.0, 7.23], [8.0, 9.12], [16.0, 16.33], [21.0, 23.16], [24.0, 28.19], [29.0, 32.76], [34.0, 36.41], [40.0, 40.53], [44.0, 44.27], [48.0, 48.03], [49.0, 49.71], [63.0, 65.45], [66.0, 66.5], [70.0, 72.23], [78.0, 78.66], [80.0, 82.31], [83.0, 84.86], [87.0, 88.5], [89.0, 89.07], [89.0, 90.51], [102.0, 103.72], [107.0, 107.7], [111.0, 112.11], [114.0, 114.79], [117.0, 117.63], [118.0, 119.52], [121.0, 122.3], [123.0, 125.63], [133.0, 133.46], [135.0, 136.63], [137.0, 139.11], [140.0, 140.66], [141.0, 142.74], [146.0, 147.97], [150.0, 152.07], [154.0, 154.72], [155.0, 155.56], [158.0, 160.93], [166.0, 167.21]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 59.24, 47.01, 66.15, 51.94, 0.0, 0.0, 0.0, 0.0, 96.54, 0.0, 46.79, 0.0, 90.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 39.3, 0.0, 0.0, 0.0, 84.8, 0.0, 0.0, 55.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 28.05], ["throbbing", 13.57], ["music", 8.25]], null, null, null, null, null, null, null, null, [["hiccup", 41.63], ["burping, eructation", 25.78], ["speech", 11.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 22.93], ["hum", 20.04], ["mains hum", 13.85]], null, null, null, null, null, null, null, null], "duration": [1.61, 1.23, 1.12, 0.33, 2.16, 4.19, 3.76, 2.41, 0.53, 0.27, 0.03, 0.71, 2.45, 0.5, 2.23, 0.66, 2.31, 1.86, 1.5, 0.07, 1.51, 1.72, 0.7, 1.11, 0.79, 0.63, 1.52, 1.3, 2.63, 0.46, 1.63, 2.11, 0.66, 1.74, 1.97, 2.07, 0.72, 0.56, 2.93, 1.21]} \ No newline at end of file diff --git a/annotations_1/99IRJoGX238_filtered.json b/annotations_1/99IRJoGX238_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e0df393ce3aed6587ed4823f7f03457d5b6f69a --- /dev/null +++ b/annotations_1/99IRJoGX238_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 21.09], [23.0, 40.26], [46.0, 45.96], [46.0, 47.93], [50.0, 50.03], [51.0, 54.33], [58.0, 59.93], [61.0, 61.8], [63.0, 63.83], [67.0, 67.41], [68.0, 68.67], [77.0, 79.29], [87.0, 88.26], [89.0, 89.7], [95.0, 95.61], [97.0, 97.5], [99.0, 100.14], [112.0, 112.35], [121.0, 122.0], [124.0, 124.31], [127.0, 127.18], [130.0, 131.08], [133.0, 136.04], [138.0, 139.11], [140.0, 140.26], [142.0, 142.2], [146.0, 146.77], [150.0, 157.92]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.64, 39.82, 0.0, 0.0, 0.0, 37.32, 0.0, 0.0, 0.0, 0.0, 0.0, 40.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 96.54], "audiomae_on_audioset": [null, [["hum", 21.17], ["mains hum", 12.8], ["arrow", 9.95]], null, null, null, [["speech", 56.43], ["sidetone", 4.84], ["hum", 3.31]], null, null, null, null, null, [["speech", 25.44], ["radio", 13.2], ["creak", 8.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.09, 17.26, -0.04, 1.93, 0.03, 3.33, 1.93, 0.8, 0.83, 0.41, 0.67, 2.29, 1.26, 0.7, 0.61, 0.5, 1.14, 0.35, 1.0, 0.31, 0.18, 1.08, 3.04, 1.11, 0.26, 0.2, 0.77, 7.92]} \ No newline at end of file diff --git a/annotations_1/99IsS-uXJzQ_filtered.json b/annotations_1/99IsS-uXJzQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83873f7187188464723ffa61429294d2f783344a --- /dev/null +++ b/annotations_1/99IsS-uXJzQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.77], [7.0, 7.94], [11.0, 24.11], [29.0, 46.43], [48.0, 51.02], [53.0, 54.68], [56.0, 58.29], [60.0, 61.69], [67.0, 71.95], [73.0, 76.25], [78.0, 82.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.1, 49.97, 99.1, 0.0, 99.76, 0.0, 99.98, 83.34, 96.54], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 37.8], ["mosquito", 23.16], ["insect", 22.47]], null, null, null, null, null, null, null], "duration": [1.77, 0.94, 13.11, 17.43, 3.02, 1.68, 2.29, 1.69, 4.95, 3.25, 4.48]} \ No newline at end of file diff --git a/annotations_1/99qifKCGPfA_filtered.json b/annotations_1/99qifKCGPfA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bc4c70e0a480956c34f71c41c64d0cf858f7035 --- /dev/null +++ b/annotations_1/99qifKCGPfA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.75], [17.0, 17.81], [18.0, 19.11], [23.0, 26.96], [31.0, 31.87], [34.0, 34.82], [53.0, 54.5], [60.0, 66.48], [68.0, 70.73], [76.0, 76.49], [80.0, 80.81], [92.0, 95.08], [105.0, 106.83]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.59, 0.0, 0.0, 0.0, 41.7, 45.27, 0.0, 0.0, 34.2, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 34.17], ["didgeridoo", 19.14], ["noise", 12.65]], null, null, null, [["speech", 82.53], ["noise", 6.13], ["white noise", 1.68]], [["noise", 28.66], ["music", 21.96], ["sidetone", 12.97]], null, null, [["sidetone", 86.49], ["speech", 4.15], ["frog", 3.56]], null], "duration": [1.75, 0.81, 1.11, 3.96, 0.87, 0.82, 1.5, 6.48, 2.73, 0.49, 0.81, 3.08, 1.83]} \ No newline at end of file diff --git a/annotations_1/99wezqewopU_filtered.json b/annotations_1/99wezqewopU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02a0d0174660d2d6397f1361d88766975a9375c1 --- /dev/null +++ b/annotations_1/99wezqewopU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 47.7], [49.0, 55.29], [61.0, 82.17], [83.0, 87.76], [91.0, 106.32], [107.0, 108.9], [110.0, 111.64], [113.0, 116.67]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [0.0, 29.83, 30.6, 33.55, 31.96, 0.0, 0.0, 34.59], "audiomae_on_audioset": [null, [["speech", 53.41], ["vehicle", 12.47], ["aircraft", 11.78]], [["helicopter", 29.78], ["speech", 23.81], ["vehicle", 11.34]], [["music", 57.09], ["synthesizer", 13.48], ["musical instrument", 8.08]], [["speech", 62.98], ["sidetone", 11.01], ["music", 5.05]], null, null, [["speech", 64.16], ["cacophony", 4.01], ["music", 3.91]]], "duration": [0.7, 6.29, 21.17, 4.76, 15.32, 1.9, 1.64, 3.67]} \ No newline at end of file diff --git a/annotations_1/99ziSsaLUpU_filtered.json b/annotations_1/99ziSsaLUpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abdb546758b368e3e297fcbd9158971209deb9fc --- /dev/null +++ b/annotations_1/99ziSsaLUpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.07], [3.0, 91.5], [94.0, 204.92], [205.0, 204.96], [205.0, 204.99], [205.0, 212.9], [217.0, 229.47]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.19, 32.63], "audiomae_on_audioset": [null, null, null, null, null, [["music", 30.25], ["vehicle", 8.03], ["throbbing", 6.83]], [["music", 63.31], ["synthesizer", 6.39], ["speech", 6.32]]], "duration": [1.07, 88.5, 110.92, -0.04, -0.01, 7.9, 12.47]} \ No newline at end of file diff --git a/annotations_1/9BdW5LHQvjM_filtered.json b/annotations_1/9BdW5LHQvjM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c59cc060587a3725e9bcf9ef6d7981b03bd7f59 --- /dev/null +++ b/annotations_1/9BdW5LHQvjM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.69], [19.0, 25.37], [29.0, 29.96], [31.0, 40.19], [42.0, 43.8], [44.0, 61.92], [64.0, 69.92], [71.0, 70.71], [71.0, 76.25], [77.0, 78.54], [85.0, 106.19], [107.0, 107.94], [111.0, 111.82], [117.0, 117.81]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 32.55, 0.0, 32.43, 0.0, 32.09, 32.19, 0.0, 33.95, 0.0, 52.62, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 35.98], ["speech", 29.38], ["musical instrument", 5.05]], null, [["music", 66.43], ["speech", 10.94], ["boing", 5.19]], null, [["music", 59.18], ["boing", 22.61], ["breaking", 5.0]], [["music", 44.17], ["speech", 18.93], ["breaking", 16.28]], null, [["hum", 33.58], ["music", 22.29], ["mains hum", 10.19]], null, null, null, null, null], "duration": [0.69, 6.37, 0.96, 9.19, 1.8, 17.92, 5.92, -0.29, 5.25, 1.54, 21.19, 0.94, 0.82, 0.81]} \ No newline at end of file diff --git a/annotations_1/9C0B94fFZkQ_filtered.json b/annotations_1/9C0B94fFZkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..daa6760000d05a5ce428e87e73736e00e0b652f2 --- /dev/null +++ b/annotations_1/9C0B94fFZkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.73], [4.0, 4.31], [16.0, 17.32], [18.0, 18.25], [26.0, 26.79], [28.0, 33.3], [36.0, 36.88], [45.0, 57.79], [58.0, 59.26], [60.0, 61.47], [67.0, 77.08], [82.0, 105.06], [113.0, 115.77], [120.0, 119.92], [125.0, 125.78], [126.0, 127.45], [129.0, 130.89], [135.0, 134.57], [144.0, 147.92], [148.0, 147.97], [150.0, 153.94]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.32, 0.0, 29.31, 0.0, 0.0, 30.06, 31.0, 28.9, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 82.79], "audiomae_on_audioset": [null, null, null, null, null, [["music", 10.58], ["buzz", 8.11], ["livestock, farm animals, working animals", 7.99]], null, [["speech", 38.67], ["music", 34.5], ["breaking", 5.18]], null, null, [["speech", 37.53], ["music", 12.56], ["moo", 6.44]], [["speech", 46.54], ["electric shaver, electric razor", 16.0], ["buzz", 5.43]], [["music", 47.4], ["boing", 27.52], ["didgeridoo", 8.64]], null, null, null, null, null, null, null, null], "duration": [0.73, 0.31, 1.32, 0.25, 0.79, 5.3, 0.88, 12.79, 1.26, 1.47, 10.08, 23.06, 2.77, -0.08, 0.78, 1.45, 1.89, -0.43, 3.92, -0.03, 3.94]} \ No newline at end of file diff --git a/annotations_1/9C6DANHgdrE_filtered.json b/annotations_1/9C6DANHgdrE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45f049b12bb1eb01d9a95dfedce1afd10f6bd791 --- /dev/null +++ b/annotations_1/9C6DANHgdrE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.04], [20.0, 26.82], [31.0, 31.7], [40.0, 50.5], [51.0, 50.7], [51.0, 51.53], [53.0, 53.33], [54.0, 76.72], [78.0, 87.99], [88.0, 90.34], [93.0, 99.15], [100.0, 110.12], [114.0, 114.98], [116.0, 115.94], [116.0, 117.54], [120.0, 120.61], [126.0, 132.02], [133.0, 142.69], [145.0, 148.95], [150.0, 151.39], [153.0, 165.3]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [98.44, 57.97, 0.0, 87.74, 0.0, 0.0, 0.0, 71.72, 47.74, 59.24, 99.16, 51.6, 0.0, 0.0, 0.0, 0.0, 98.1, 46.83, 64.18, 0.0, 53.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 57.01], ["fart", 8.24], ["bee, wasp, etc.", 3.68]], null, null, null, null, null, null, null, null, [["speech", 52.68], ["hum", 11.65], ["gong", 4.6]], null, null, null], "duration": [2.04, 6.82, 0.7, 10.5, -0.3, 0.53, 0.33, 22.72, 9.99, 2.34, 6.15, 10.12, 0.98, -0.06, 1.54, 0.61, 6.02, 9.69, 3.95, 1.39, 12.3]} \ No newline at end of file diff --git a/annotations_1/9D5WsQNIAcE_filtered.json b/annotations_1/9D5WsQNIAcE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bcb6fd24ff65debedefdf4141dffc7735cbf41a --- /dev/null +++ b/annotations_1/9D5WsQNIAcE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [3.0, 4.01], [5.0, 8.95], [12.0, 12.53], [14.0, 14.94], [16.0, 16.85], [20.0, 20.43], [21.0, 21.86], [23.0, 23.68], [25.0, 25.89], [27.0, 28.63], [30.0, 31.04], [33.0, 33.3], [36.0, 36.58], [38.0, 41.03], [44.0, 59.09], [61.0, 62.8], [64.0, 65.7], [66.0, 68.0], [69.0, 70.34], [72.0, 72.87], [75.0, 76.62], [77.0, 79.74], [80.0, 80.81], [82.0, 96.45], [96.0, 97.5], [98.0, 98.22], [99.0, 99.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 96.04, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 99.94, 0.0, 33.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.41], ["foghorn", 14.37], ["theremin", 13.41]], null, null, null], "duration": [0.36, 1.01, 3.95, 0.53, 0.94, 0.85, 0.43, 0.86, 0.68, 0.89, 1.63, 1.04, 0.3, 0.58, 3.03, 15.09, 1.8, 1.7, 2.0, 1.34, 0.87, 1.62, 2.74, 0.81, 14.45, 1.5, 0.22, 0.22]} \ No newline at end of file diff --git a/annotations_1/9EFxRx8EbDk_filtered.json b/annotations_1/9EFxRx8EbDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9de96b3d98df28f7159c9e1ccc205ba3fe20495 --- /dev/null +++ b/annotations_1/9EFxRx8EbDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.26], [21.0, 22.45], [25.0, 26.18], [30.0, 30.01], [41.0, 41.77], [58.0, 59.04], [60.0, 59.9], [61.0, 63.39], [72.0, 76.32], [79.0, 80.32], [86.0, 97.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.47, 31.15, 0.0, 29.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 67.13], ["speech", 5.01], ["cacophony", 4.17]], [["music", 73.81], ["cacophony", 3.69], ["speech", 3.57]], null, [["music", 48.64], ["speech", 12.62], ["cacophony", 5.76]]], "duration": [0.26, 1.45, 1.18, 0.01, 0.77, 1.04, -0.1, 2.39, 4.32, 1.32, 11.48]} \ No newline at end of file diff --git a/annotations_1/9EOazpvA7-U_filtered.json b/annotations_1/9EOazpvA7-U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03e7eaa5bfb20e05b1d02522432ac6ada3f9f88f --- /dev/null +++ b/annotations_1/9EOazpvA7-U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 48.51], [51.0, 55.49], [56.0, 56.3], [58.0, 62.31], [63.0, 73.41], [74.0, 81.75], [83.0, 91.66], [93.0, 93.77], [98.0, 110.2], [114.0, 114.12], [114.0, 115.4], [117.0, 117.09], [120.0, 120.12], [124.0, 126.91], [133.0, 134.05], [149.0, 150.09], [153.0, 153.45], [157.0, 157.94], [160.0, 160.57], [161.0, 163.05]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [30.81, 30.56, 0.0, 32.02, 31.19, 31.2, 30.29, 0.0, 29.89, 0.0, 0.0, 0.0, 0.0, 34.52, 0.0, 0.0, 0.0, 0.0, 0.0, 34.63], "audiomae_on_audioset": [[["hum", 33.87], ["throbbing", 19.43], ["music", 16.15]], [["speech", 43.98], ["music", 38.02], ["hum", 2.74]], null, [["music", 29.33], ["hum", 28.34], ["throbbing", 25.36]], [["speech", 51.82], ["music", 27.31], ["hum", 6.95]], [["hum", 28.21], ["music", 23.18], ["scary music", 12.95]], [["mains hum", 46.83], ["hum", 17.43], ["speech", 13.51]], null, [["music", 74.65], ["scary music", 5.64], ["speech", 5.37]], null, null, null, null, [["music", 58.04], ["didgeridoo", 12.34], ["musical instrument", 6.89]], null, null, null, null, null, [["music", 38.98], ["hum", 14.86], ["mains hum", 11.45]]], "duration": [19.51, 4.49, 0.3, 4.31, 10.41, 7.75, 8.66, 0.77, 12.2, 0.12, 1.4, 0.09, 0.12, 2.91, 1.05, 1.09, 0.45, 0.94, 0.57, 2.05]} \ No newline at end of file diff --git a/annotations_1/9Eont_yEGZs_filtered.json b/annotations_1/9Eont_yEGZs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5912d2814d161a564913d2d855dd0d7539ea3909 --- /dev/null +++ b/annotations_1/9Eont_yEGZs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.37], [10.0, 13.34], [15.0, 17.58], [25.0, 26.4], [29.0, 31.11], [35.0, 42.6], [47.0, 48.07], [49.0, 50.19], [51.0, 53.37]], "keep_status": [true, true, true, false, true, true, false, false, false], "silence_prob": [47.01, 37.17, 29.19, 0.0, 30.75, 29.45, 0.0, 0.0, 53.34], "audiomae_on_audioset": [[["music", 46.82], ["didgeridoo", 15.87], ["theremin", 6.71]], [["music", 42.51], ["theremin", 6.44], ["didgeridoo", 5.88]], [["breaking", 43.93], ["music", 8.28], ["smash, crash", 3.89]], null, [["music", 49.36], ["theremin", 4.16], ["mosquito", 2.97]], [["music", 14.16], ["buzz", 6.57], ["fly, housefly", 6.07]], null, null, null], "duration": [4.37, 3.34, 2.58, 1.4, 2.11, 7.6, 1.07, 1.19, 2.37]} \ No newline at end of file diff --git a/annotations_1/9F3iBMYvQOs_filtered.json b/annotations_1/9F3iBMYvQOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c91395981e463b9dffe39e5d3c2307ecf39c6712 --- /dev/null +++ b/annotations_1/9F3iBMYvQOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.16], [24.0, 24.22], [30.0, 30.33], [39.0, 39.73], [46.0, 47.11], [50.0, 50.45], [51.0, 52.69], [63.0, 66.31], [71.0, 73.45], [77.0, 77.84], [80.0, 80.35], [89.0, 91.98], [98.0, 109.21], [114.0, 118.2], [143.0, 150.69], [155.0, 155.16], [156.0, 167.19], [172.0, 175.71], [176.0, 178.5], [184.0, 185.85], [186.0, 191.76], [198.0, 203.96], [209.0, 209.56], [213.0, 224.45]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, true, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.5, 47.46, 0.0, 0.0, 31.59, 30.67, 32.05, 46.75, 0.0, 30.25, 31.6, 33.38, 0.0, 30.92, 31.09, 0.0, 45.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 45.93], ["breaking", 19.71], ["shatter", 7.53]], [["music", 47.95], ["throbbing", 8.54], ["hum", 6.54]], null, null, [["music", 65.07], ["brass instrument", 5.11], ["trombone", 4.57]], [["music", 36.41], ["livestock, farm animals, working animals", 18.27], ["animal", 9.34]], [["speech", 71.35], ["music", 6.71], ["boing", 3.58]], [["speech", 59.01], ["burping, eructation", 23.84], ["grunt", 8.13]], null, [["livestock, farm animals, working animals", 22.48], ["music", 18.69], ["cattle, bovinae", 13.49]], [["music", 45.39], ["speech", 9.66], ["throbbing", 7.69]], [["cattle, bovinae", 27.01], ["moo", 23.0], ["music", 10.97]], null, [["music", 37.14], ["speech", 14.38], ["fly, housefly", 12.97]], [["groan", 21.55], ["livestock, farm animals, working animals", 10.68], ["sound effect", 10.05]], null, [["music", 59.57], ["fart", 10.41], ["crushing", 4.84]]], "duration": [0.16, 0.22, 0.33, 0.73, 1.11, 0.45, 1.69, 3.31, 2.45, 0.84, 0.35, 2.98, 11.21, 4.2, 7.69, 0.16, 11.19, 3.71, 2.5, 1.85, 5.76, 5.96, 0.56, 11.45]} \ No newline at end of file diff --git a/annotations_1/9FAeJgWLKRo_filtered.json b/annotations_1/9FAeJgWLKRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66dfcb50f57c9d64e012881f57185107cfdd9829 --- /dev/null +++ b/annotations_1/9FAeJgWLKRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.41], [2.0, 2.34], [3.0, 3.13], [10.0, 12.14], [12.0, 12.18], [14.0, 14.22], [21.0, 22.65], [33.0, 38.45], [39.0, 44.69], [52.0, 52.51], [56.0, 56.52], [61.0, 61.94], [64.0, 65.18], [66.0, 67.83], [78.0, 89.99], [96.0, 105.12], [110.0, 112.14], [124.0, 124.33]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.48, 0.0, 0.0, 0.0, 29.53, 30.18, 0.0, 0.0, 0.0, 0.0, 0.0, 29.1, 29.14, 31.37, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 59.83], ["didgeridoo", 5.99], ["carnatic music", 3.22]], null, null, null, [["didgeridoo", 64.73], ["music", 29.88], ["musical instrument", 0.73]], [["didgeridoo", 48.76], ["music", 29.95], ["fly, housefly", 3.66]], null, null, null, null, null, [["music", 70.55], ["didgeridoo", 18.01], ["electronic music", 1.69]], [["music", 62.46], ["theremin", 10.6], ["throbbing", 3.66]], [["didgeridoo", 37.34], ["music", 32.77], ["musical instrument", 2.7]], null], "duration": [0.41, 0.34, 0.13, 2.14, 0.18, 0.22, 1.65, 5.45, 5.69, 0.51, 0.52, 0.94, 1.18, 1.83, 11.99, 9.12, 2.14, 0.33]} \ No newline at end of file diff --git a/annotations_1/9GBxXdJBSPU_filtered.json b/annotations_1/9GBxXdJBSPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b67b91a3e76fa2b54a31ec2549fd1e6710fac998 --- /dev/null +++ b/annotations_1/9GBxXdJBSPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [5.0, 8.28], [10.0, 11.35], [15.0, 18.87], [21.0, 29.73], [34.0, 36.53]], "keep_status": [false, true, false, true, false, false], "silence_prob": [0.0, 31.41, 0.0, 30.68, 28.62, 32.76], "audiomae_on_audioset": [null, [["music", 31.61], ["throbbing", 24.32], ["hum", 12.16]], null, [["music", 20.88], ["hum", 13.2], ["throbbing", 13.01]], [["speech", 59.95], ["music", 12.72], ["vehicle", 5.52]], [["music", 57.25], ["throbbing", 18.49], ["hum", 5.41]]], "duration": [1.17, 3.28, 1.35, 3.87, 8.73, 2.53]} \ No newline at end of file diff --git a/annotations_1/9HRIGCog9UQ_filtered.json b/annotations_1/9HRIGCog9UQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48809149445cd1902dcf214cbe371f9fae5209e0 --- /dev/null +++ b/annotations_1/9HRIGCog9UQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.44], [14.0, 26.81], [33.0, 41.72], [42.0, 57.57], [60.0, 64.54], [65.0, 65.74], [68.0, 69.53], [74.0, 74.85], [79.0, 79.14], [82.0, 83.3], [88.0, 88.11], [95.0, 95.37]], "keep_status": [true, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [34.39, 32.19, 32.18, 31.6, 42.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.58], ["guitar", 6.27], ["musical instrument", 4.82]], [["music", 73.36], ["musical instrument", 5.39], ["guitar", 4.44]], [["music", 76.58], ["musical instrument", 3.28], ["guitar", 3.18]], [["music", 25.36], ["speech", 22.11], ["breaking", 15.55]], [["fly, housefly", 17.4], ["speech", 11.89], ["mosquito", 11.64]], null, null, null, null, null, null, null], "duration": [3.44, 12.81, 8.72, 15.57, 4.54, 0.74, 1.53, 0.85, 0.14, 1.3, 0.11, 0.37]} \ No newline at end of file diff --git a/annotations_1/9I-FCJRX2Cc_filtered.json b/annotations_1/9I-FCJRX2Cc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47d3d42bf999cd25d742568280f56972102ea7f7 --- /dev/null +++ b/annotations_1/9I-FCJRX2Cc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.14], [3.0, 3.32], [4.0, 5.0], [6.0, 6.76], [7.0, 9.26], [10.0, 13.66], [15.0, 17.09], [19.0, 19.72], [23.0, 23.31], [24.0, 25.12], [28.0, 30.84], [33.0, 37.35], [39.0, 40.85], [42.0, 43.11], [44.0, 46.01], [47.0, 49.06], [50.0, 50.87], [54.0, 56.25], [58.0, 59.19], [60.0, 62.7], [64.0, 65.13], [66.0, 68.74], [70.0, 74.02], [76.0, 80.79], [87.0, 88.1], [89.0, 90.91], [95.0, 96.52], [98.0, 100.01], [102.0, 102.57], [107.0, 107.79], [109.0, 109.75], [110.0, 112.9], [114.0, 114.67], [118.0, 119.52], [126.0, 128.39], [130.0, 130.35], [132.0, 133.69], [135.0, 140.53], [143.0, 143.78], [145.0, 148.46], [149.0, 151.83], [153.0, 154.03], [156.0, 158.57], [163.0, 165.23], [166.0, 166.41], [167.0, 167.93], [171.0, 172.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 52.22, 90.6, 55.67, 0.0, 0.0, 0.0, 91.3, 80.11, 0.0, 0.0, 75.55, 62.17, 0.0, 89.19, 0.0, 70.3, 0.0, 96.42, 71.0, 55.96, 0.0, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 55.81, 0.0, 0.0, 50.61, 0.0, 0.0, 96.29, 0.0, 94.81, 100.0, 0.0, 90.25, 89.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.14, 0.32, 1.0, 0.76, 2.26, 3.66, 2.09, 0.72, 0.31, 1.12, 2.84, 4.35, 1.85, 1.11, 2.01, 2.06, 0.87, 2.25, 1.19, 2.7, 1.13, 2.74, 4.02, 4.79, 1.1, 1.91, 1.52, 2.01, 0.57, 0.79, 0.75, 2.9, 0.67, 1.52, 2.39, 0.35, 1.69, 5.53, 0.78, 3.46, 2.83, 1.03, 2.57, 2.23, 0.41, 0.93, 1.96]} \ No newline at end of file diff --git a/annotations_1/9IYFHAnqOKM_filtered.json b/annotations_1/9IYFHAnqOKM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de1c3d409b37ab9fbb5ff1d4fbe8c77ffda57fb5 --- /dev/null +++ b/annotations_1/9IYFHAnqOKM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 45.87], [46.0, 50.84], [57.0, 66.99], [68.0, 72.15], [74.0, 74.56], [75.0, 78.19], [79.0, 80.55], [81.0, 87.99], [91.0, 96.53], [98.0, 98.91], [102.0, 102.19], [126.0, 130.96], [149.0, 149.17], [150.0, 151.21], [154.0, 155.29], [156.0, 156.69], [164.0, 163.76], [166.0, 166.35], [169.0, 170.99], [173.0, 173.84], [177.0, 177.15], [177.0, 178.11], [179.0, 178.97], [188.0, 188.72], [190.0, 190.24], [193.0, 193.24]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.84, 38.72, 83.34, 0.0, 35.18, 0.0, 35.87, 74.92, 0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 37.36], ["whack, thwack", 19.61], ["music", 10.9]], [["music", 21.99], ["buzz", 16.74], ["glockenspiel", 3.12]], null, null, [["speech", 56.35], ["music", 12.85], ["busy signal", 9.3]], null, [["music", 76.59], ["musical instrument", 3.79], ["sitar", 2.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 4.84, 9.99, 4.15, 0.56, 3.19, 1.55, 6.99, 5.53, 0.91, 0.19, 4.96, 0.17, 1.21, 1.29, 0.69, -0.24, 0.35, 1.99, 0.84, 0.15, 1.11, -0.03, 0.72, 0.24, 0.24]} \ No newline at end of file diff --git a/annotations_1/9JQEbj0uh0k_filtered.json b/annotations_1/9JQEbj0uh0k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e359488534d5ede8d4b6181546ec6195ab423b5 --- /dev/null +++ b/annotations_1/9JQEbj0uh0k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 21.34], [23.0, 30.77], [32.0, 31.82], [34.0, 36.34], [44.0, 48.05], [50.0, 50.85], [52.0, 68.94], [79.0, 87.47], [88.0, 99.35], [100.0, 100.92], [103.0, 105.07], [106.0, 108.01], [110.0, 110.64], [116.0, 119.8], [121.0, 122.72], [123.0, 132.24], [133.0, 134.87], [136.0, 142.03], [144.0, 146.37], [147.0, 162.87]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [94.37, 36.12, 0.0, 81.53, 83.16, 0.0, 47.23, 35.52, 41.3, 0.0, 32.12, 98.44, 0.0, 44.15, 0.0, 34.03, 0.0, 98.73, 98.99, 29.74], "audiomae_on_audioset": [null, [["whale vocalization", 56.12], ["music", 15.53], ["hum", 7.3]], null, null, null, null, [["music", 54.32], ["theremin", 18.09], ["didgeridoo", 7.85]], [["music", 74.78], ["scary music", 6.48], ["throbbing", 2.38]], [["music", 40.34], ["didgeridoo", 16.88], ["foghorn", 5.97]], null, [["music", 64.21], ["synthesizer", 8.73], ["musical instrument", 4.71]], null, null, [["music", 41.16], ["synthesizer", 8.9], ["musical instrument", 8.54]], null, [["music", 56.16], ["theremin", 25.35], ["animal", 2.81]], null, null, null, [["music", 56.2], ["theremin", 6.72], ["synthesizer", 5.54]]], "duration": [10.34, 7.77, -0.18, 2.34, 4.05, 0.85, 16.94, 8.47, 11.35, 0.92, 2.07, 2.01, 0.64, 3.8, 1.72, 9.24, 1.87, 6.03, 2.37, 15.87]} \ No newline at end of file diff --git a/annotations_1/9JTGNwLdSDA_filtered.json b/annotations_1/9JTGNwLdSDA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adcc929d125ef7f4b19b9879bfccb7a034f73c96 --- /dev/null +++ b/annotations_1/9JTGNwLdSDA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 18.3], [24.0, 24.58], [28.0, 28.65], [30.0, 30.06], [32.0, 33.99], [41.0, 43.38], [68.0, 70.34], [77.0, 83.96], [84.0, 85.13], [90.0, 95.49], [98.0, 98.52], [100.0, 100.35], [104.0, 105.43], [106.0, 107.55], [108.0, 110.03], [113.0, 115.03], [116.0, 117.26], [119.0, 119.55], [121.0, 122.05], [125.0, 125.14], [125.0, 126.15], [131.0, 131.62], [137.0, 137.02], [142.0, 143.18], [144.0, 144.37], [145.0, 146.08], [147.0, 148.61]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.1, 0.0, 0.0, 0.0, 0.0, 49.09, 32.34, 32.67, 0.0, 42.37, 0.0, 0.0, 0.0, 0.0, 99.95, 56.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["beatboxing", 19.59], ["cough", 8.97], ["music", 7.36]], [["speech", 78.53], ["explosion", 1.47], ["door", 1.2]], [["hum", 40.62], ["music", 19.28], ["mains hum", 17.16]], null, [["music", 26.28], ["hum", 25.85], ["mains hum", 14.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.3, 0.58, 0.65, 0.06, 1.99, 2.38, 2.34, 6.96, 1.13, 5.49, 0.52, 0.35, 1.43, 1.55, 2.03, 2.03, 1.26, 0.55, 1.05, 0.14, 1.15, 0.62, 0.02, 1.18, 0.37, 1.08, 1.61]} \ No newline at end of file diff --git a/annotations_1/9KYrqmQdvsI_filtered.json b/annotations_1/9KYrqmQdvsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64fbfedaa505a1bf37e8444f5b8c46a56988bd7e --- /dev/null +++ b/annotations_1/9KYrqmQdvsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.65], [8.0, 14.3], [17.0, 24.39], [27.0, 30.06], [31.0, 32.36], [34.0, 34.1], [38.0, 41.18], [42.0, 43.39], [46.0, 49.22], [50.0, 66.65], [67.0, 70.14], [70.0, 76.11], [79.0, 82.7], [84.0, 86.37], [87.0, 87.39], [88.0, 90.44], [91.0, 97.19], [98.0, 98.69], [99.0, 102.83], [105.0, 107.92], [109.0, 109.53], [112.0, 113.81], [119.0, 121.96], [126.0, 146.8], [148.0, 148.04], [150.0, 152.64], [154.0, 154.82], [157.0, 159.17], [161.0, 163.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, true, false, false, true, true, false, false, true, true, false, true, false, true, true], "silence_prob": [36.77, 50.97, 72.16, 54.56, 0.0, 0.0, 48.87, 0.0, 42.37, 35.33, 45.78, 34.8, 37.35, 48.06, 0.0, 36.2, 34.96, 0.0, 35.29, 31.86, 0.0, 0.0, 31.73, 31.36, 0.0, 29.59, 0.0, 30.84, 30.08], "audiomae_on_audioset": [[["music", 62.23], ["boing", 16.11], ["quack", 9.7]], null, null, null, null, null, [["hum", 32.94], ["music", 29.32], ["throbbing", 11.33]], null, [["music", 66.86], ["fly, housefly", 3.75], ["frog", 3.61]], [["music", 72.89], ["speech", 17.97], ["burping, eructation", 1.37]], [["music", 43.35], ["didgeridoo", 16.89], ["speech", 15.02]], [["fart", 18.57], ["fly, housefly", 18.07], ["insect", 7.37]], [["music", 49.68], ["synthesizer", 6.97], ["speech", 5.35]], [["music", 48.53], ["fly, housefly", 9.73], ["sidetone", 7.94]], null, [["music", 46.83], ["electronic music", 6.62], ["musical instrument", 6.59]], [["music", 55.81], ["trombone", 11.43], ["brass instrument", 9.08]], null, [["music", 41.7], ["saxophone", 10.54], ["musical instrument", 7.07]], [["speech", 24.88], ["music", 22.69], ["vehicle", 3.08]], null, null, [["music", 32.23], ["cacophony", 14.85], ["white noise", 4.66]], [["music", 22.11], ["whale vocalization", 15.91], ["speech", 15.89]], null, [["speech", 28.25], ["bleat", 9.52], ["sheep", 9.33]], null, [["music", 34.11], ["speech", 9.13], ["animal", 7.02]], [["music", 29.05], ["hum", 4.45], ["didgeridoo", 4.36]]], "duration": [5.65, 6.3, 7.39, 3.06, 1.36, 0.1, 3.18, 1.39, 3.22, 16.65, 3.14, 6.11, 3.7, 2.37, 0.39, 2.44, 6.19, 0.69, 3.83, 2.92, 0.53, 1.81, 2.96, 20.8, 0.04, 2.64, 0.82, 2.17, 2.11]} \ No newline at end of file diff --git a/annotations_1/9KkV_swvE2Q_filtered.json b/annotations_1/9KkV_swvE2Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af55b910c34d8d7b6ca1bbb6682f7d806406cbd0 --- /dev/null +++ b/annotations_1/9KkV_swvE2Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.7], [10.0, 13.9], [16.0, 21.86], [24.0, 26.81], [28.0, 44.34], [47.0, 51.24], [51.0, 51.27], [55.0, 57.91], [60.0, 61.25], [69.0, 70.8], [74.0, 80.03], [87.0, 90.41], [90.0, 90.44], [90.0, 90.49], [91.0, 91.0], [93.0, 106.41], [111.0, 115.97], [122.0, 134.79], [136.0, 140.14], [150.0, 163.36]], "keep_status": [false, false, false, false, false, true, false, true, false, false, true, false, false, false, false, true, true, false, true, false], "silence_prob": [0.0, 73.97, 65.2, 99.1, 48.39, 33.53, 0.0, 33.08, 0.0, 0.0, 47.86, 35.44, 0.0, 0.0, 0.0, 33.22, 32.36, 32.55, 32.17, 36.4], "audiomae_on_audioset": [null, null, null, null, [["hum", 36.48], ["mains hum", 29.04], ["music", 13.33]], [["music", 32.78], ["speech", 24.26], ["whack, thwack", 7.79]], null, [["hum", 34.63], ["throbbing", 22.68], ["heart sounds, heartbeat", 6.51]], null, null, [["hum", 11.27], ["speech", 10.86], ["music", 9.76]], [["music", 71.21], ["musical instrument", 4.88], ["didgeridoo", 3.25]], null, null, null, [["music", 46.72], ["clang", 7.73], ["ding", 5.92]], [["music", 30.21], ["mains hum", 15.29], ["hum", 13.86]], [["music", 68.8], ["throbbing", 4.99], ["sidetone", 4.5]], [["music", 31.95], ["speech", 24.66], ["electronic music", 4.06]], [["music", 66.52], ["speech", 11.34], ["boing", 2.99]]], "duration": [1.7, 3.9, 5.86, 2.81, 16.34, 4.24, 0.27, 2.91, 1.25, 1.8, 6.03, 3.41, 0.44, 0.49, 0.0, 13.41, 4.97, 12.79, 4.14, 13.36]} \ No newline at end of file diff --git a/annotations_1/9L-HJ7BVR6A_filtered.json b/annotations_1/9L-HJ7BVR6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..419fb3471b1458956b525f3ab60099e8ae88efc8 --- /dev/null +++ b/annotations_1/9L-HJ7BVR6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 33.71], [60.0, 65.45], [67.0, 77.97], [79.0, 79.73], [85.0, 91.54], [95.0, 94.68], [112.0, 111.79], [116.0, 116.06], [118.0, 119.3], [119.0, 119.4], [119.0, 119.58], [120.0, 119.62], [120.0, 119.65], [120.0, 122.66], [123.0, 126.84], [132.0, 141.22], [184.0, 200.08], [201.0, 216.62], [231.0, 245.89], [248.0, 250.6]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, true], "silence_prob": [29.9, 30.47, 29.67, 0.0, 29.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.75, 30.56, 32.18, 30.12, 28.53, 28.11, 29.61], "audiomae_on_audioset": [[["music", 53.26], ["speech", 23.84], ["boing", 3.12]], [["music", 61.99], ["didgeridoo", 5.84], ["hum", 5.67]], [["speech", 33.81], ["vehicle", 21.39], ["music", 8.16]], null, [["music", 77.01], ["musical instrument", 3.52], ["theremin", 2.7]], null, null, null, null, null, null, null, null, [["music", 25.66], ["speech", 13.86], ["musical instrument", 6.05]], [["speech", 35.17], ["music", 18.3], ["theremin", 18.13]], [["music", 55.37], ["speech", 16.95], ["fart", 4.89]], [["music", 55.04], ["speech", 18.94], ["boing", 4.28]], [["music", 22.63], ["whip", 15.65], ["speech", 12.4]], [["music", 44.23], ["didgeridoo", 6.35], ["sound effect", 5.82]], [["music", 24.56], ["sound effect", 10.25], ["static", 4.84]]], "duration": [21.71, 5.45, 10.97, 0.73, 6.54, -0.32, -0.21, 0.06, 1.3, 0.4, 0.58, -0.38, -0.35, 2.66, 3.84, 9.22, 16.08, 15.62, 14.89, 2.6]} \ No newline at end of file diff --git a/annotations_1/9LvgzVmAFxo_filtered.json b/annotations_1/9LvgzVmAFxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..928656f2927e02ca191676b782859b03073210b0 --- /dev/null +++ b/annotations_1/9LvgzVmAFxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.24], [13.0, 22.37], [26.0, 25.91], [29.0, 32.34], [33.0, 40.32], [43.0, 43.98], [45.0, 45.4], [48.0, 59.36], [60.0, 60.61], [65.0, 73.77], [84.0, 86.7], [94.0, 94.14]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 40.01, 0.0, 30.24, 30.67, 0.0, 0.0, 41.12, 0.0, 32.78, 43.69, 0.0], "audiomae_on_audioset": [null, [["mains hum", 41.76], ["hum", 41.66], ["throbbing", 3.35]], null, [["speech", 39.18], ["boing", 11.3], ["livestock, farm animals, working animals", 8.25]], [["speech", 47.13], ["music", 21.24], ["groan", 6.25]], null, null, [["speech", 82.27], ["busy signal", 5.86], ["music", 2.64]], null, [["grunt", 89.0], ["animal", 5.28], ["music", 1.29]], [["boing", 15.9], ["speech", 12.25], ["music", 4.36]], null], "duration": [0.24, 9.37, -0.09, 3.34, 7.32, 0.98, 0.4, 11.36, 0.61, 8.77, 2.7, 0.14]} \ No newline at end of file diff --git a/annotations_1/9MSGSOjdViQ_filtered.json b/annotations_1/9MSGSOjdViQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c08d5de38456852b4188cd52d7dfd24eab264764 --- /dev/null +++ b/annotations_1/9MSGSOjdViQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.49], [9.0, 8.94], [12.0, 14.52], [21.0, 21.24], [40.0, 39.66], [43.0, 44.15], [44.0, 50.18], [56.0, 56.61]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.02, 0.0, 0.0, 0.0, 29.25, 0.0], "audiomae_on_audioset": [null, null, [["gong", 64.79], ["music", 14.06], ["musical instrument", 3.25]], null, null, null, [["gong", 55.22], ["music", 23.77], ["speech", 4.28]], null], "duration": [1.49, -0.06, 2.52, 0.24, -0.34, 1.15, 6.18, 0.61]} \ No newline at end of file diff --git a/annotations_1/9MhRoo23Wak_filtered.json b/annotations_1/9MhRoo23Wak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6bf22d573e6e3df64900dee3a3dc18a11c58bf7 --- /dev/null +++ b/annotations_1/9MhRoo23Wak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.5], [13.0, 14.88], [17.0, 17.49], [27.0, 27.68], [40.0, 41.18], [44.0, 44.14], [68.0, 68.4], [68.0, 68.49], [69.0, 70.11], [79.0, 79.2], [80.0, 80.33], [82.0, 82.66], [89.0, 90.68], [99.0, 100.09], [106.0, 121.26], [122.0, 122.25], [124.0, 124.51], [134.0, 136.65], [138.0, 147.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.52, 0.0, 0.0, 28.43, 28.83], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.76], ["mains hum", 28.81], ["hum", 8.47]], null, null, [["music", 38.74], ["cattle, bovinae", 14.0], ["speech", 12.79]], [["speech", 40.77], ["music", 30.28], ["fart", 3.6]]], "duration": [0.5, 1.88, 0.49, 0.68, 1.18, 0.14, 0.4, 0.49, 1.11, 0.2, 0.33, 0.66, 1.68, 1.09, 15.26, 0.25, 0.51, 2.65, 9.41]} \ No newline at end of file diff --git a/annotations_1/9NTvToplMlw_filtered.json b/annotations_1/9NTvToplMlw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eff9229727b12aadb4faea7678a13c8a473b48a3 --- /dev/null +++ b/annotations_1/9NTvToplMlw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.01], [4.0, 4.04], [6.0, 7.05], [10.0, 11.38], [12.0, 13.93], [16.0, 17.15], [18.0, 17.98], [19.0, 18.96], [21.0, 21.47], [32.0, 34.79], [36.0, 36.54], [37.0, 37.62], [38.0, 39.29], [40.0, 41.34], [42.0, 49.11], [51.0, 50.75], [52.0, 52.61], [57.0, 62.82], [66.0, 71.49], [79.0, 79.64], [85.0, 85.23], [87.0, 87.15], [87.0, 87.84], [93.0, 93.65], [97.0, 97.46], [114.0, 118.72], [122.0, 123.11], [129.0, 130.4], [131.0, 132.22], [141.0, 141.86], [143.0, 144.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 34.23, 0.0, 0.0, 61.97, 55.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.18, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.99], ["groan", 14.07], ["glockenspiel", 8.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.01, 0.04, 1.05, 1.38, 1.93, 1.15, -0.02, -0.04, 0.47, 2.79, 0.54, 0.62, 1.29, 1.34, 7.11, -0.25, 0.61, 5.82, 5.49, 0.64, 0.23, 0.15, 0.84, 0.65, 0.46, 4.72, 1.11, 1.4, 1.22, 0.86, 1.37]} \ No newline at end of file diff --git a/annotations_1/9O-NfAWrkDM_filtered.json b/annotations_1/9O-NfAWrkDM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb69a5ce579088015b2414892ebda9ad7e10395a --- /dev/null +++ b/annotations_1/9O-NfAWrkDM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 54.26], [57.0, 57.99], [59.0, 59.8], [61.0, 60.76], [62.0, 62.6], [63.0, 67.41], [68.0, 68.99], [70.0, 69.74], [73.0, 111.48], [112.0, 113.17], [114.0, 114.22], [115.0, 115.96], [117.0, 131.68], [133.0, 148.17], [149.0, 177.63], [178.0, 179.02], [181.0, 181.84], [185.0, 185.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 48.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.93, 34.58, 31.35, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["mains hum", 37.2], ["hum", 25.16], ["speech", 9.43]], null, null, null, null, null, null, [["music", 41.11], ["hum", 19.84], ["mains hum", 10.63]], [["mains hum", 32.12], ["hum", 29.21], ["music", 16.05]], [["music", 51.51], ["hum", 8.25], ["theremin", 5.72]], null, null, null], "duration": [44.26, 0.99, 0.8, -0.24, 0.6, 4.41, 0.99, -0.26, 38.48, 1.17, 0.22, 0.96, 14.68, 15.17, 28.63, 1.02, 0.84, 0.97]} \ No newline at end of file diff --git a/annotations_1/9OlXAy0L0yI_filtered.json b/annotations_1/9OlXAy0L0yI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ef53998b13700b7e6d37b27ef963934bb2a0472 --- /dev/null +++ b/annotations_1/9OlXAy0L0yI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.18], [4.0, 4.48], [5.0, 7.79], [8.0, 9.58], [10.0, 11.06], [12.0, 12.39], [13.0, 14.64], [15.0, 16.34], [18.0, 27.94], [32.0, 32.32], [34.0, 34.33], [36.0, 37.79], [38.0, 39.72], [40.0, 42.15], [46.0, 46.21], [50.0, 51.61], [56.0, 56.93], [59.0, 65.42], [66.0, 67.12], [68.0, 68.76], [69.0, 70.53], [72.0, 72.67], [76.0, 76.27], [78.0, 78.95], [80.0, 81.4], [82.0, 82.32], [85.0, 86.29], [88.0, 89.36], [99.0, 99.98], [105.0, 105.58], [108.0, 109.16], [110.0, 112.6], [113.0, 115.4], [116.0, 117.93], [119.0, 121.73], [122.0, 122.03], [122.0, 123.5], [125.0, 125.31], [132.0, 132.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 0.0, 59.96, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 55.25, 0.0, 39.67, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 84.47], ["speech", 7.95], ["sine wave", 1.4]], null, null, null, null], "duration": [0.18, 0.48, 2.79, 1.58, 1.06, 0.39, 1.64, 1.34, 9.94, 0.32, 0.33, 1.79, 1.72, 2.15, 0.21, 1.61, 0.93, 6.42, 1.12, 0.76, 1.53, 0.67, 0.27, 0.95, 1.4, 0.32, 1.29, 1.36, 0.98, 0.58, 1.16, 2.6, 2.4, 1.93, 2.73, 0.03, 1.5, 0.31, 0.19]} \ No newline at end of file diff --git a/annotations_1/9Pn6NgaX8I0_filtered.json b/annotations_1/9Pn6NgaX8I0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7026b0b4c7655b8a9a77c042f96a85d920616af0 --- /dev/null +++ b/annotations_1/9Pn6NgaX8I0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.86], [7.0, 11.31], [15.0, 15.92], [18.0, 18.86], [21.0, 22.1], [24.0, 75.68], [83.0, 83.59], [91.0, 92.64], [95.0, 94.91], [97.0, 122.35], [124.0, 123.94], [126.0, 126.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.14, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 32.68], ["music", 26.77], ["mains hum", 10.74]], null, null, null, null, null, null, null, [["electric shaver, electric razor", 28.53], ["music", 21.79], ["speech", 19.92]], null, null], "duration": [-0.14, 4.31, 0.92, 0.86, 1.1, 51.68, 0.59, 1.64, -0.09, 25.35, -0.06, 0.25]} \ No newline at end of file diff --git a/annotations_1/9QJ2mqXdr5I_filtered.json b/annotations_1/9QJ2mqXdr5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eccdab2490e08ccd26c59852fdba2f288cfe0dd --- /dev/null +++ b/annotations_1/9QJ2mqXdr5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 25.03], [26.0, 32.81], [34.0, 34.84], [36.0, 68.35], [69.0, 69.94], [73.0, 73.99], [82.0, 83.35], [90.0, 91.83], [93.0, 96.6], [108.0, 123.84], [126.0, 135.28], [137.0, 149.55], [151.0, 167.95], [171.0, 175.9]], "keep_status": [true, true, false, false, false, false, false, false, true, false, true, true, true, false], "silence_prob": [31.05, 31.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.14, 29.21, 29.45, 29.33, 29.27, 35.76], "audiomae_on_audioset": [[["music", 38.15], ["speech", 23.41], ["throbbing", 6.23]], [["speech", 31.06], ["music", 15.51], ["crowd", 12.95]], null, null, null, null, null, null, [["fly, housefly", 20.37], ["mains hum", 7.48], ["boing", 6.29]], [["music", 63.31], ["explosion", 3.63], ["theremin", 3.12]], [["music", 38.67], ["whack, thwack", 9.44], ["didgeridoo", 7.4]], [["music", 36.88], ["hum", 8.06], ["smash, crash", 7.64]], [["music", 38.29], ["didgeridoo", 15.96], ["speech", 8.04]], [["music", 37.17], ["throbbing", 33.24], ["hum", 17.06]]], "duration": [13.03, 6.81, 0.84, 32.35, 0.94, 0.99, 1.35, 1.83, 3.6, 15.84, 9.28, 12.55, 16.95, 4.9]} \ No newline at end of file diff --git a/annotations_1/9SYhu10qJ-o_filtered.json b/annotations_1/9SYhu10qJ-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de397f65f8cc808f4f24380336b3e36d32a3a239 --- /dev/null +++ b/annotations_1/9SYhu10qJ-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.08], [11.0, 11.16], [23.0, 26.2], [26.0, 27.06], [29.0, 35.92], [38.0, 52.47], [53.0, 53.74], [56.0, 59.36], [62.0, 71.54], [73.0, 78.38], [79.0, 84.13], [85.0, 85.28], [86.0, 87.34], [89.0, 89.73], [90.0, 90.36], [91.0, 91.23], [92.0, 92.03], [93.0, 93.73], [99.0, 100.23], [102.0, 101.78], [108.0, 109.02], [109.0, 110.34], [112.0, 112.55], [113.0, 116.99], [122.0, 121.93], [126.0, 127.43], [128.0, 128.83], [129.0, 133.73], [138.0, 138.87], [141.0, 150.96]], "keep_status": [false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 38.26, 0.0, 32.94, 37.73, 0.0, 37.34, 39.54, 69.88, 48.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.42, 0.0, 0.0, 0.0, 39.14, 0.0, 49.31], "audiomae_on_audioset": [null, null, [["music", 34.33], ["carnatic music", 7.72], ["musical instrument", 5.89]], null, [["speech", 47.03], ["music", 24.67], ["theremin", 6.19]], [["livestock, farm animals, working animals", 16.48], ["music", 13.55], ["moo", 12.31]], null, [["speech", 49.35], ["music", 25.9], ["didgeridoo", 4.63]], [["animal", 50.33], ["speech", 23.37], ["livestock, farm animals, working animals", 3.9]], null, [["burping, eructation", 20.13], ["fart", 12.76], ["speech", 12.08]], null, null, null, null, null, null, null, null, null, null, null, null, [["owl", 26.57], ["frog", 21.06], ["hoot", 18.59]], null, null, null, [["music", 51.48], ["didgeridoo", 12.57], ["speech", 11.82]], null, [["music", 23.38], ["electric shaver, electric razor", 17.93], ["didgeridoo", 8.3]]], "duration": [0.08, 0.16, 3.2, 1.06, 6.92, 14.47, 0.74, 3.36, 9.54, 5.38, 5.13, 0.28, 1.34, 0.73, 0.36, 0.23, 0.03, 0.73, 1.23, -0.22, 1.02, 1.34, 0.55, 3.99, -0.07, 1.43, 0.83, 4.73, 0.87, 9.96]} \ No newline at end of file diff --git a/annotations_1/9T4kKk7zH34_filtered.json b/annotations_1/9T4kKk7zH34_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a5a5c2d58206312e08ed8fe97919539ad994fd0 --- /dev/null +++ b/annotations_1/9T4kKk7zH34_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.78], [14.0, 17.31], [18.0, 18.6], [20.0, 24.27], [25.0, 24.88], [26.0, 27.26], [28.0, 30.2], [33.0, 33.88], [36.0, 41.3], [44.0, 44.79], [46.0, 46.41], [48.0, 48.19], [49.0, 49.49], [51.0, 52.0], [53.0, 54.19], [55.0, 55.53], [57.0, 57.99], [63.0, 64.29], [67.0, 67.88], [72.0, 72.01], [73.0, 74.55], [75.0, 81.73], [84.0, 85.67], [87.0, 89.07], [90.0, 90.98], [93.0, 95.05], [99.0, 99.82], [102.0, 102.78], [106.0, 109.58], [112.0, 117.07], [118.0, 119.45], [121.0, 123.63], [125.0, 126.69], [129.0, 135.13], [136.0, 136.66], [137.0, 137.29], [138.0, 138.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 99.96, 0.0, 0.0, 100.0, 0.0, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 91.13, 100.0, 0.0, 99.48, 0.0, 61.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 3.31, 0.6, 4.27, -0.12, 1.26, 2.2, 0.88, 5.3, 0.79, 0.41, 0.19, 0.49, 1.0, 1.19, 0.53, 0.99, 1.29, 0.88, 0.01, 1.55, 6.73, 1.67, 2.07, 0.98, 2.05, 0.82, 0.78, 3.58, 5.07, 1.45, 2.63, 1.69, 6.13, 0.66, 0.29, 0.65]} \ No newline at end of file diff --git a/annotations_1/9T7zP4Ui9VE_filtered.json b/annotations_1/9T7zP4Ui9VE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29d7b20c2d48c9cb4f6fd92f549eda7acd57e4bc --- /dev/null +++ b/annotations_1/9T7zP4Ui9VE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.67], [5.0, 5.07], [12.0, 11.91], [13.0, 13.24], [20.0, 21.0], [22.0, 22.08], [26.0, 27.7], [30.0, 30.23], [35.0, 36.44], [53.0, 54.09], [58.0, 58.02], [63.0, 65.2], [67.0, 66.95], [67.0, 67.98], [73.0, 73.48], [75.0, 78.41], [82.0, 83.78], [87.0, 93.48], [95.0, 97.83], [99.0, 99.81], [101.0, 101.68], [102.0, 103.23], [104.0, 114.54], [119.0, 122.2], [125.0, 125.49], [132.0, 132.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 76.37, 0.0, 31.27, 33.41, 0.0, 0.0, 0.0, 30.18, 30.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 27.29], ["throbbing", 21.74], ["hum", 17.85]], [["hum", 42.22], ["mains hum", 24.78], ["throbbing", 9.77]], null, null, null, [["music", 35.0], ["boing", 11.0], ["whack, thwack", 9.32]], [["speech", 73.78], ["music", 8.13], ["explosion", 3.6]], null, null], "duration": [0.67, 0.07, -0.09, 0.24, 1.0, 0.08, 1.7, 0.23, 1.44, 1.09, 0.02, 2.2, -0.05, 0.98, 0.48, 3.41, 1.78, 6.48, 2.83, 0.81, 0.68, 1.23, 10.54, 3.2, 0.49, 0.66]} \ No newline at end of file diff --git a/annotations_1/9UrJ60MVNao_filtered.json b/annotations_1/9UrJ60MVNao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85ee936b1f4b6590b8154828cc94bde556915ae8 --- /dev/null +++ b/annotations_1/9UrJ60MVNao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 91.47], [95.0, 96.28], [98.0, 98.47], [99.0, 108.62], [109.0, 110.61], [111.0, 111.77], [112.0, 114.02], [115.0, 115.94], [118.0, 123.13], [124.0, 128.63], [130.0, 131.62], [135.0, 138.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [72.16, 0.0, 0.0, 78.21, 0.0, 0.0, 100.0, 0.0, 100.0, 90.43, 0.0, 99.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.47, 1.28, 0.47, 9.62, 1.61, 0.77, 2.02, 0.94, 5.13, 4.63, 1.62, 3.15]} \ No newline at end of file diff --git a/annotations_1/9VY3OKScxP4_filtered.json b/annotations_1/9VY3OKScxP4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba63c91683ab2cbc2c7d2820c1d55ec6fe3735df --- /dev/null +++ b/annotations_1/9VY3OKScxP4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.05], [22.0, 22.5], [40.0, 40.85], [52.0, 52.59], [54.0, 54.36], [56.0, 58.08], [62.0, 61.84], [65.0, 66.04], [69.0, 69.33], [78.0, 78.02], [89.0, 93.45], [96.0, 96.47], [101.0, 101.75], [102.0, 102.74], [103.0, 103.84], [105.0, 105.51], [110.0, 110.08], [111.0, 112.41], [114.0, 120.8], [123.0, 123.42], [127.0, 132.02], [135.0, 135.18], [138.0, 140.34], [144.0, 149.88], [153.0, 157.79], [160.0, 160.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [84.43, 0.0, 0.0, 0.0, 0.0, 59.42, 0.0, 0.0, 0.0, 0.0, 45.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.16, 0.0, 56.03, 0.0, 47.9, 31.41, 32.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 37.65], ["music", 22.17], ["whale vocalization", 15.07]], null, null, null, null, null, null, null, [["hum", 33.41], ["music", 27.39], ["mains hum", 8.14]], null, null, null, [["mains hum", 35.28], ["hum", 21.42], ["music", 4.58]], [["speech", 56.43], ["music", 13.96], ["thunk", 1.8]], [["speech", 53.86], ["music", 15.07], ["throbbing", 6.78]], null], "duration": [2.05, 0.5, 0.85, 0.59, 0.36, 2.08, -0.16, 1.04, 0.33, 0.02, 4.45, 0.47, 0.75, 0.74, 0.84, 0.51, 0.08, 1.41, 6.8, 0.42, 5.02, 0.18, 2.34, 5.88, 4.79, 0.74]} \ No newline at end of file diff --git a/annotations_1/9V_GlFhNX2g_filtered.json b/annotations_1/9V_GlFhNX2g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1fe12184c1ffac15c34f67887f1116924aa0b165 --- /dev/null +++ b/annotations_1/9V_GlFhNX2g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.38], [3.0, 4.09], [6.0, 8.9], [10.0, 12.9], [16.0, 18.94], [20.0, 22.28], [26.0, 28.88], [30.0, 34.35], [37.0, 39.36], [41.0, 45.25], [48.0, 49.5], [52.0, 54.19], [55.0, 55.68], [56.0, 58.62], [60.0, 61.92], [63.0, 63.95], [65.0, 70.92], [76.0, 78.98], [80.0, 80.47], [83.0, 83.24], [84.0, 85.26], [86.0, 86.39], [87.0, 89.97], [92.0, 92.45], [93.0, 94.58], [96.0, 97.71], [99.0, 100.85], [102.0, 103.23], [106.0, 107.55], [109.0, 109.7], [111.0, 111.55], [112.0, 113.36], [117.0, 118.1], [122.0, 122.3], [125.0, 126.52], [129.0, 132.16], [133.0, 135.46], [137.0, 141.1], [143.0, 145.08], [148.0, 147.93], [149.0, 149.4], [151.0, 156.07], [156.0, 158.9], [161.0, 162.01], [163.0, 169.5], [171.0, 173.62], [180.0, 181.03], [182.0, 183.78], [186.0, 186.26], [187.0, 188.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 77.87, 99.44, 90.43, 96.42, 98.99, 99.16, 99.95, 99.97, 0.0, 78.89, 0.0, 74.44, 0.0, 0.0, 98.36, 97.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 99.95, 98.51, 97.92, 0.0, 0.0, 65.09, 39.21, 0.0, 86.82, 99.59, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.36], ["music", 8.75], ["singing bowl", 1.66]], null, null, null, null, null, null, null], "duration": [0.38, 1.09, 2.9, 2.9, 2.94, 2.28, 2.88, 4.35, 2.36, 4.25, 1.5, 2.19, 0.68, 2.62, 1.92, 0.95, 5.92, 2.98, 0.47, 0.24, 1.26, 0.39, 2.97, 0.45, 1.58, 1.71, 1.85, 1.23, 1.55, 0.7, 0.55, 1.36, 1.1, 0.3, 1.52, 3.16, 2.46, 4.1, 2.08, -0.07, 0.4, 5.07, 2.9, 1.01, 6.5, 2.62, 1.03, 1.78, 0.26, 1.25]} \ No newline at end of file diff --git a/annotations_1/9VsHtn_RSHY_filtered.json b/annotations_1/9VsHtn_RSHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1260b517cf15bfa002d77c1d79c0ced3eacfa27f --- /dev/null +++ b/annotations_1/9VsHtn_RSHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.2], [17.0, 41.69], [43.0, 73.18], [74.0, 74.38], [75.0, 80.89]], "keep_status": [false, true, false, false, true], "silence_prob": [0.0, 31.29, 0.0, 0.0, 32.74], "audiomae_on_audioset": [null, [["music", 30.43], ["hum", 22.08], ["mains hum", 11.15]], null, null, [["speech", 46.86], ["vehicle", 16.71], ["buzz", 5.3]]], "duration": [1.2, 24.69, 30.18, 0.38, 5.89]} \ No newline at end of file diff --git a/annotations_1/9VwWPnHZMrs_filtered.json b/annotations_1/9VwWPnHZMrs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3ef1c873e196e6b7fcdd98ae222afa75809eef7 --- /dev/null +++ b/annotations_1/9VwWPnHZMrs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 31.23], [34.0, 34.87], [38.0, 39.46], [41.0, 41.32], [42.0, 41.77], [42.0, 43.36], [46.0, 47.41], [50.0, 49.55], [50.0, 52.84], [60.0, 60.96], [63.0, 68.17], [77.0, 77.43], [78.0, 78.71], [84.0, 85.65], [96.0, 114.84], [116.0, 116.58]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false], "silence_prob": [29.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.78, 0.0, 30.63, 0.0, 0.0, 0.0, 32.54, 0.0], "audiomae_on_audioset": [[["mosquito", 34.58], ["fly, housefly", 29.61], ["insect", 6.34]], null, null, null, null, null, null, null, [["synthesizer", 23.29], ["music", 22.93], ["throbbing", 5.23]], null, [["music", 59.06], ["boing", 5.51], ["synthesizer", 3.82]], null, null, null, [["music", 40.32], ["speech", 17.61], ["didgeridoo", 12.02]], null], "duration": [2.23, 0.87, 1.46, 0.32, -0.23, 1.36, 1.41, -0.45, 2.84, 0.96, 5.17, 0.43, 0.71, 1.65, 18.84, 0.58]} \ No newline at end of file diff --git a/annotations_1/9We9JImjg-c_filtered.json b/annotations_1/9We9JImjg-c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5ea226b69fed3c100ade9401380cf71dd34b5aa --- /dev/null +++ b/annotations_1/9We9JImjg-c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.61], [14.0, 15.52], [17.0, 18.27], [21.0, 21.0], [24.0, 24.56], [26.0, 28.24], [29.0, 29.3], [34.0, 54.31], [55.0, 60.42], [63.0, 71.36], [75.0, 76.54], [77.0, 80.22], [84.0, 84.45], [88.0, 89.72], [91.0, 90.93], [92.0, 92.25], [94.0, 94.07], [99.0, 100.99], [104.0, 104.79], [107.0, 108.92], [117.0, 129.05], [140.0, 141.03], [144.0, 144.41], [146.0, 146.31], [148.0, 157.15], [159.0, 158.55]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [45.75, 0.0, 0.0, 0.0, 0.0, 76.04, 0.0, 35.95, 34.62, 49.13, 0.0, 38.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.52, 0.0, 0.0, 0.0, 41.05, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 37.73], ["cattle, bovinae", 32.18], ["moo", 27.81]], null, null, null, null, null, null, [["music", 39.33], ["speech", 31.25], ["hum", 5.56]], [["speech", 23.42], ["gong", 18.2], ["music", 14.19]], [["gong", 66.67], ["music", 9.7], ["hum", 7.72]], null, [["quack", 14.98], ["hum", 10.28], ["music", 9.59]], null, null, null, null, null, null, null, null, [["cattle, bovinae", 20.84], ["livestock, farm animals, working animals", 12.51], ["music", 12.35]], null, null, null, [["music", 62.66], ["didgeridoo", 15.23], ["hum", 3.25]], null], "duration": [2.61, 1.52, 1.27, 0.0, 0.56, 2.24, 0.3, 20.31, 5.42, 8.36, 1.54, 3.22, 0.45, 1.72, -0.07, 0.25, 0.07, 1.99, 0.79, 1.92, 12.05, 1.03, 0.41, 0.31, 9.15, -0.45]} \ No newline at end of file diff --git a/annotations_1/9Wfswn2lkAo_filtered.json b/annotations_1/9Wfswn2lkAo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40cef380f70f515f583b7f00d70bf0f1310670cf --- /dev/null +++ b/annotations_1/9Wfswn2lkAo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.12], [9.0, 9.68], [10.0, 11.11], [12.0, 13.85], [17.0, 18.32], [20.0, 25.83], [27.0, 53.59], [55.0, 55.0], [57.0, 57.5], [60.0, 61.52], [63.0, 65.55], [66.0, 68.44], [70.0, 72.22], [83.0, 86.24], [88.0, 91.34], [92.0, 94.02], [97.0, 97.87], [99.0, 101.83], [103.0, 105.17], [106.0, 109.39], [110.0, 110.98], [112.0, 112.99], [113.0, 114.98], [126.0, 127.65], [132.0, 137.93], [139.0, 144.64], [146.0, 150.18], [151.0, 154.43], [155.0, 155.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, true, true, false, false, false, false, true, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.64, 39.85, 0.0, 0.0, 0.0, 36.94, 41.72, 43.3, 37.62, 39.93, 45.33, 0.0, 47.01, 49.78, 48.95, 0.0, 0.0, 0.0, 0.0, 42.11, 32.73, 29.75, 30.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 59.16], ["mains hum", 17.22], ["music", 7.23]], [["speech", 31.12], ["hum", 25.16], ["mains hum", 20.62]], null, null, null, [["hum", 46.16], ["throbbing", 17.35], ["mains hum", 12.65]], [["music", 55.32], ["didgeridoo", 11.6], ["musical instrument", 4.07]], [["music", 63.58], ["musical instrument", 3.56], ["percussion", 3.22]], [["music", 41.14], ["hum", 9.85], ["throbbing", 7.72]], [["hum", 28.07], ["music", 20.62], ["throbbing", 19.23]], [["music", 45.91], ["speech", 14.85], ["hum", 7.13]], null, [["music", 73.33], ["musical instrument", 5.39], ["speech", 4.04]], [["music", 29.03], ["throbbing", 12.3], ["hum", 10.03]], [["music", 38.07], ["throbbing", 7.34], ["hum", 6.51]], null, null, null, null, [["music", 53.11], ["hum", 9.1], ["speech", 6.83]], [["hum", 21.29], ["music", 19.21], ["speech", 15.51]], [["speech", 25.02], ["hum", 20.34], ["explosion", 14.17]], [["groan", 44.39], ["whale vocalization", 15.76], ["screaming", 3.67]], null], "duration": [1.12, 0.68, 1.11, 1.85, 1.32, 5.83, 26.59, 0.0, 0.5, 1.52, 2.55, 2.44, 2.22, 3.24, 3.34, 2.02, 0.87, 2.83, 2.17, 3.39, 0.98, 0.99, 1.98, 1.65, 5.93, 5.64, 4.18, 3.43, 0.63]} \ No newline at end of file diff --git a/annotations_1/9WpO5zPo8Dg_filtered.json b/annotations_1/9WpO5zPo8Dg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..423ca5a1305c663234f3d82e8db330ded1c91b8e --- /dev/null +++ b/annotations_1/9WpO5zPo8Dg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.73], [12.0, 12.29], [13.0, 56.19], [58.0, 60.25], [65.0, 65.69], [67.0, 69.45], [87.0, 87.15], [89.0, 89.26], [96.0, 97.65], [101.0, 102.41], [107.0, 108.9], [115.0, 116.97], [119.0, 119.21], [120.0, 120.14], [122.0, 125.07], [131.0, 132.33], [134.0, 137.32], [139.0, 139.09], [143.0, 143.45], [148.0, 151.28], [158.0, 160.39], [161.0, 174.34], [176.0, 181.52], [183.0, 190.63], [196.0, 198.31]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [31.86, 0.0, 0.0, 44.75, 0.0, 29.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.95, 0.0, 32.27, 0.0, 0.0, 33.06, 40.54, 31.78, 33.39, 35.37, 35.37], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 30.46], ["music", 22.75], ["cattle, bovinae", 5.81]], null, null, [["music", 35.95], ["synthesizer", 19.93], ["ambient music", 12.86]], null, [["animal", 57.22], ["howl", 14.18], ["wild animals", 5.66]], null, null, null, null, null, null, null, null, [["cattle, bovinae", 18.36], ["music", 17.75], ["moo", 15.45]], null, [["speech", 72.19], ["fart", 3.59], ["music", 3.52]], null, null, [["music", 55.78], ["speech", 25.52], ["thunk", 6.0]], [["music", 62.39], ["theremin", 5.77], ["speech", 2.02]], [["music", 73.37], ["synthesizer", 5.32], ["theremin", 3.3]], [["music", 74.0], ["musical instrument", 4.51], ["piano", 0.94]], [["whale vocalization", 58.2], ["music", 32.86], ["speech", 2.74]], [["speech", 33.2], ["music", 12.62], ["animal", 2.74]]], "duration": [3.73, 0.29, 43.19, 2.25, 0.69, 2.45, 0.15, 0.26, 1.65, 1.41, 1.9, 1.97, 0.21, 0.14, 3.07, 1.33, 3.32, 0.09, 0.45, 3.28, 2.39, 13.34, 5.52, 7.63, 2.31]} \ No newline at end of file diff --git a/annotations_1/9YgorDRKoEo_filtered.json b/annotations_1/9YgorDRKoEo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a016e92ebb287f643a5fa23add91b57d181727b --- /dev/null +++ b/annotations_1/9YgorDRKoEo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.35], [7.0, 9.63], [13.0, 21.0], [22.0, 22.82], [24.0, 32.07], [33.0, 38.87], [39.0, 59.34], [62.0, 66.9], [68.0, 91.52], [93.0, 107.81]], "keep_status": [true, false, true, false, true, true, false, false, true, true], "silence_prob": [31.92, 32.0, 32.81, 0.0, 33.1, 31.49, 79.41, 86.82, 34.21, 42.17], "audiomae_on_audioset": [[["music", 12.59], ["frog", 7.31], ["cattle, bovinae", 6.59]], [["sheep", 42.46], ["bleat", 31.62], ["music", 13.56]], [["speech", 37.95], ["music", 21.03], ["fart", 7.7]], null, [["fly, housefly", 16.46], ["music", 15.6], ["mosquito", 11.82]], [["hum", 22.48], ["mains hum", 19.54], ["fly, housefly", 9.23]], null, null, [["music", 32.98], ["theremin", 14.95], ["speech", 12.3]], [["speech", 33.33], ["music", 19.99], ["foghorn", 4.99]]], "duration": [2.35, 2.63, 8.0, 0.82, 8.07, 5.87, 20.34, 4.9, 23.52, 14.81]} \ No newline at end of file diff --git a/annotations_1/9ZBPZ4b5LRw_filtered.json b/annotations_1/9ZBPZ4b5LRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..221a4d5e7361288f4174988d9736e67f58f30f8c --- /dev/null +++ b/annotations_1/9ZBPZ4b5LRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.4], [5.0, 8.38], [9.0, 10.81], [12.0, 14.23], [15.0, 28.85], [29.0, 29.34], [30.0, 46.18], [47.0, 47.8], [48.0, 48.57], [49.0, 105.09], [106.0, 106.81], [107.0, 137.98], [138.0, 138.52], [139.0, 140.85]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 84.25, 0.0, 96.04, 38.95, 0.0, 41.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hiccup", 26.27], ["cough", 10.99], ["hum", 6.56]], null, [["speech", 56.0], ["fart", 12.38], ["frog", 4.62]], null, null, null, null, null, null, null], "duration": [1.4, 3.38, 1.81, 2.23, 13.85, 0.34, 16.18, 0.8, 0.57, 56.09, 0.81, 30.98, 0.52, 1.85]} \ No newline at end of file diff --git a/annotations_1/9ZEUnzRzvGg_filtered.json b/annotations_1/9ZEUnzRzvGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20be665e84b76e92a696165b4b17b2cf56f1fb47 --- /dev/null +++ b/annotations_1/9ZEUnzRzvGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [5.0, 9.66], [12.0, 14.2], [14.0, 15.48], [19.0, 20.04], [22.0, 25.91], [27.0, 30.33], [31.0, 38.62], [40.0, 43.51], [47.0, 47.75], [49.0, 50.73], [56.0, 57.87], [62.0, 62.23], [64.0, 64.59], [67.0, 67.96], [71.0, 75.39], [82.0, 83.57], [87.0, 88.65], [91.0, 93.55], [96.0, 98.68], [100.0, 101.12], [108.0, 108.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.52, 69.07, 0.0, 0.0, 99.98, 98.59, 97.0, 77.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.66, 0.0, 0.0, 97.83, 97.64, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 40.26], ["throbbing", 19.01], ["noise", 12.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 67.43], ["radio", 11.81], ["sidetone", 6.11]], null, null, null, null, null, null], "duration": [0.5, 4.66, 2.2, 1.48, 1.04, 3.91, 3.33, 7.62, 3.51, 0.75, 1.73, 1.87, 0.23, 0.59, 0.96, 4.39, 1.57, 1.65, 2.55, 2.68, 1.12, 0.75]} \ No newline at end of file diff --git a/annotations_1/9_LX8b0kmiI_filtered.json b/annotations_1/9_LX8b0kmiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09b55f29ff4bf3644c8ea92635b5a634a18ca032 --- /dev/null +++ b/annotations_1/9_LX8b0kmiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 21.09], [22.0, 22.59], [30.0, 30.45], [32.0, 33.57], [34.0, 34.38], [37.0, 38.58], [40.0, 41.74], [44.0, 45.81], [46.0, 47.97], [49.0, 51.12], [54.0, 57.25], [57.0, 58.16], [68.0, 78.73], [81.0, 82.31], [83.0, 103.38], [107.0, 110.24], [112.0, 112.13], [116.0, 118.57], [119.0, 118.62], [125.0, 125.78], [140.0, 140.43], [146.0, 146.94], [150.0, 152.73], [155.0, 156.2], [158.0, 158.63], [161.0, 162.58], [166.0, 166.51], [168.0, 171.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 69.07, 0.0, 33.29, 0.0, 34.22, 58.55, 0.0, 51.18, 0.0, 0.0, 0.0, 0.0, 57.17, 0.0, 0.0, 0.0, 0.0, 37.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 27.49], ["whack, thwack", 10.12], ["screaming", 8.37]], null, [["music", 41.89], ["speech", 18.84], ["hum", 6.53]], null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 29.32], ["moo", 16.98], ["speech", 13.02]]], "duration": [10.09, 0.59, 0.45, 1.57, 0.38, 1.58, 1.74, 1.81, 1.97, 2.12, 3.25, 1.16, 10.73, 1.31, 20.38, 3.24, 0.13, 2.57, -0.38, 0.78, 0.43, 0.94, 2.73, 1.2, 0.63, 1.58, 0.51, 3.21]} \ No newline at end of file diff --git a/annotations_1/9_T2VQgL2XY_filtered.json b/annotations_1/9_T2VQgL2XY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9520d10e080aa215bd00930a17de295408d77019 --- /dev/null +++ b/annotations_1/9_T2VQgL2XY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[86.0, 98.37], [103.0, 111.23], [112.0, 144.68], [147.0, 168.03], [169.0, 172.74], [173.0, 173.62]], "keep_status": [false, true, false, false, false, false], "silence_prob": [37.43, 33.22, 0.0, 46.97, 50.16, 0.0], "audiomae_on_audioset": [[["music", 59.55], ["hum", 13.93], ["mains hum", 7.6]], [["gunshot, gunfire", 33.93], ["music", 18.13], ["speech", 17.49]], null, [["music", 75.14], ["scary music", 6.33], ["ambient music", 3.26]], null, null], "duration": [12.37, 8.23, 32.68, 21.03, 3.74, 0.62]} \ No newline at end of file diff --git a/annotations_1/9_yf1HCH5CY_filtered.json b/annotations_1/9_yf1HCH5CY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9838ebbce703a3d27880ef557402888e75ad7660 --- /dev/null +++ b/annotations_1/9_yf1HCH5CY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.12], [9.0, 9.68], [12.0, 12.63], [16.0, 16.51], [20.0, 20.44], [23.0, 24.66], [29.0, 29.59], [32.0, 32.43], [33.0, 35.73], [42.0, 42.72], [44.0, 44.66], [46.0, 47.88], [53.0, 54.28], [57.0, 58.87], [60.0, 61.69], [64.0, 66.45], [71.0, 71.63], [73.0, 74.07], [75.0, 75.83], [77.0, 77.82], [79.0, 79.83], [80.0, 82.51], [87.0, 87.91], [93.0, 94.26], [102.0, 103.44], [121.0, 120.97], [128.0, 127.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 0.68, 0.63, 0.51, 0.44, 1.66, 0.59, 0.43, 2.73, 0.72, 0.66, 1.88, 1.28, 1.87, 1.69, 2.45, 0.63, 1.07, 0.83, 0.82, 0.83, 2.51, 0.91, 1.26, 1.44, -0.03, -0.15]} \ No newline at end of file diff --git a/annotations_1/9ccE4YIG76Y_filtered.json b/annotations_1/9ccE4YIG76Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0399344f6399ac00ad238a6a39fec3141c95d39a --- /dev/null +++ b/annotations_1/9ccE4YIG76Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.52], [10.0, 12.02], [15.0, 17.19], [20.0, 28.11], [29.0, 29.61], [37.0, 38.96], [54.0, 57.25], [76.0, 82.07], [90.0, 95.17], [116.0, 117.12], [125.0, 127.45], [129.0, 130.11]], "keep_status": [false, true, false, true, false, false, true, false, true, false, true, false], "silence_prob": [0.0, 28.63, 33.6, 28.72, 0.0, 0.0, 28.74, 28.8, 29.05, 0.0, 28.89, 0.0], "audiomae_on_audioset": [null, [["speech", 50.61], ["eruption", 9.9], ["horse", 6.45]], [["livestock, farm animals, working animals", 47.7], ["cattle, bovinae", 18.49], ["moo", 18.0]], [["speech", 27.52], ["noise", 17.41], ["music", 17.4]], null, null, [["livestock, farm animals, working animals", 19.35], ["rumble", 17.09], ["speech", 14.33]], [["speech", 61.6], ["aircraft", 11.14], ["vehicle", 9.1]], [["music", 12.31], ["rumble", 11.14], ["aircraft", 8.18]], null, [["throbbing", 27.58], ["hum", 20.88], ["mains hum", 12.72]], null], "duration": [0.52, 2.02, 2.19, 8.11, 0.61, 1.96, 3.25, 6.07, 5.17, 1.12, 2.45, 1.11]} \ No newline at end of file diff --git a/annotations_1/9dN7jGSbsVE_filtered.json b/annotations_1/9dN7jGSbsVE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35e42584ebe764f3d31992481c6ab4aff500568d --- /dev/null +++ b/annotations_1/9dN7jGSbsVE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.59], [13.0, 12.88], [23.0, 23.5], [31.0, 31.08], [40.0, 40.73], [47.0, 47.41], [57.0, 58.45], [65.0, 65.08]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.59, -0.12, 0.5, 0.08, 0.73, 0.41, 1.45, 0.08]} \ No newline at end of file diff --git a/annotations_1/9di5MvVZb1k_filtered.json b/annotations_1/9di5MvVZb1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b43d5a3e5f37b382ba83a93322f4e8ddf2929a6a --- /dev/null +++ b/annotations_1/9di5MvVZb1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 65.58], [69.0, 68.67], [69.0, 68.72], [69.0, 71.1], [73.0, 96.63], [97.0, 98.02], [100.0, 100.28], [102.0, 102.17], [104.0, 105.46]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [32.01, 0.0, 0.0, 85.54, 52.51, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 84.29], ["musical instrument", 1.98], ["electric shaver, electric razor", 1.48]], null, null, null, null, null, null, null, null], "duration": [16.58, -0.33, -0.28, 2.1, 23.63, 1.02, 0.28, 0.17, 1.46]} \ No newline at end of file diff --git a/annotations_1/9dmlcGZta9E_filtered.json b/annotations_1/9dmlcGZta9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71d0f56f4558b7228acf8c3651dc3de573084982 --- /dev/null +++ b/annotations_1/9dmlcGZta9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.34], [4.0, 4.41], [24.0, 24.51], [25.0, 29.74], [36.0, 36.91], [38.0, 39.78], [45.0, 46.82], [48.0, 49.0], [50.0, 51.27], [53.0, 53.79], [55.0, 54.84], [59.0, 59.29], [68.0, 68.42], [72.0, 71.83], [75.0, 74.8], [80.0, 80.35], [85.0, 85.19], [86.0, 87.72], [90.0, 91.61], [93.0, 95.32], [97.0, 98.36], [102.0, 104.14], [105.0, 107.52], [108.0, 108.87], [118.0, 118.27], [119.0, 122.35], [122.0, 124.44], [126.0, 126.89], [152.0, 156.91], [163.0, 163.73], [164.0, 166.06], [166.0, 167.37]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 64.86, 43.3, 0.0, 0.0, 42.79, 47.7, 0.0, 51.94, 0.0, 56.1, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 45.15], ["boing", 11.78], ["cowbell", 7.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.48], ["music", 25.85], ["doorbell", 3.65]], null, null, [["music", 45.08], ["speech", 36.32], ["thunk", 3.01]], [["music", 49.91], ["speech", 11.58], ["theremin", 4.98]], null, null, null, null, null], "duration": [1.34, 0.41, 0.51, 4.74, 0.91, 1.78, 1.82, 1.0, 1.27, 0.79, -0.16, 0.29, 0.42, -0.17, -0.2, 0.35, 0.19, 1.72, 1.61, 2.32, 1.36, 2.14, 2.52, 0.87, 0.27, 3.35, 2.44, 0.89, 4.91, 0.73, 2.06, 1.37]} \ No newline at end of file diff --git a/annotations_1/9dqOdoFtNcM_filtered.json b/annotations_1/9dqOdoFtNcM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e5d418be741b8ee88d57be2d11e7ffd9b4b87c9 --- /dev/null +++ b/annotations_1/9dqOdoFtNcM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.62], [7.0, 7.48], [15.0, 17.02], [18.0, 18.47], [19.0, 21.9], [27.0, 27.36], [28.0, 28.54], [29.0, 30.25], [31.0, 33.35], [34.0, 34.84], [35.0, 36.63], [38.0, 39.31], [43.0, 43.87], [45.0, 45.22], [47.0, 47.31], [48.0, 51.85], [58.0, 59.0], [63.0, 63.32], [68.0, 68.54], [70.0, 70.24], [73.0, 73.82], [74.0, 75.47], [86.0, 86.24], [96.0, 97.73], [105.0, 105.65], [106.0, 106.93], [108.0, 108.87], [109.0, 112.67], [123.0, 123.11], [124.0, 129.15], [137.0, 136.54], [137.0, 137.73], [138.0, 137.83], [138.0, 140.93], [162.0, 163.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 99.59, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.19, 0.0, 33.12, 0.0, 0.0, 0.0, 37.68, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.65], ["noise", 21.9], ["whale vocalization", 6.68]], null, [["music", 47.26], ["speech", 18.19], ["sidetone", 5.49]], null, null, null, [["music", 33.78], ["speech", 28.87], ["sidetone", 3.21]], null], "duration": [1.62, 0.48, 2.02, 0.47, 2.9, 0.36, 0.54, 1.25, 2.35, 0.84, 1.63, 1.31, 0.87, 0.22, 0.31, 3.85, 1.0, 0.32, 0.54, 0.24, 0.82, 1.47, 0.24, 1.73, 0.65, 0.93, 0.87, 3.67, 0.11, 5.15, -0.46, 0.73, -0.17, 2.93, 1.44]} \ No newline at end of file diff --git a/annotations_1/9eI4mt_lKTw_filtered.json b/annotations_1/9eI4mt_lKTw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ff9a745b4003c300da8776fa683241d54b477f7 --- /dev/null +++ b/annotations_1/9eI4mt_lKTw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.59], [32.0, 32.32], [36.0, 37.4], [38.0, 40.98], [42.0, 45.82], [50.0, 55.58], [56.0, 79.59], [80.0, 82.46], [84.0, 88.62], [91.0, 96.33], [107.0, 107.37], [110.0, 110.49], [113.0, 113.75], [116.0, 129.09], [130.0, 131.23], [135.0, 136.76], [158.0, 159.09], [160.0, 160.56]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 46.12, 51.28, 31.4, 38.7, 91.81, 58.89, 30.52, 0.0, 0.0, 0.0, 70.02, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 50.1], ["speech", 18.63], ["throbbing", 10.13]], null, [["whale vocalization", 22.09], ["music", 16.39], ["hum", 13.0]], [["hum", 26.13], ["whale vocalization", 22.59], ["mains hum", 9.74]], null, null, [["speech", 18.88], ["whip", 17.58], ["noise", 15.9]], null, null, null, null, null, null, null, null], "duration": [1.59, 0.32, 1.4, 2.98, 3.82, 5.58, 23.59, 2.46, 4.62, 5.33, 0.37, 0.49, 0.75, 13.09, 1.23, 1.76, 1.09, 0.56]} \ No newline at end of file diff --git a/annotations_1/9ecrIMjE4GQ_filtered.json b/annotations_1/9ecrIMjE4GQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91d218d25c7c2da43ffed9b1e7758ec85f028b89 --- /dev/null +++ b/annotations_1/9ecrIMjE4GQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.82], [25.0, 25.62], [28.0, 31.48], [39.0, 51.02], [54.0, 67.78], [72.0, 77.23], [78.0, 125.58], [128.0, 128.65]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.68, 29.64, 30.51, 29.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 48.52], ["hum", 4.16], ["throbbing", 2.73]], [["mains hum", 40.14], ["hum", 35.29], ["music", 8.64]], [["music", 63.52], ["throbbing", 7.54], ["hum", 5.29]], [["speech", 59.45], ["music", 9.82], ["hum", 7.28]], null, null], "duration": [0.82, 0.62, 3.48, 12.02, 13.78, 5.23, 47.58, 0.65]} \ No newline at end of file diff --git a/annotations_1/9eosfNwMpMs_filtered.json b/annotations_1/9eosfNwMpMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f8822ebfd341cd5321a05ccd1847acb2fed04e0 --- /dev/null +++ b/annotations_1/9eosfNwMpMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.12], [14.0, 18.62], [22.0, 24.75], [29.0, 76.62], [77.0, 80.99], [84.0, 89.58], [92.0, 98.34], [100.0, 103.86], [105.0, 107.06], [109.0, 113.53]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [99.73, 99.31, 79.59, 0.0, 52.39, 58.47, 92.8, 67.89, 43.4, 40.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 46.61], ["sonar", 10.88], ["echo", 3.85]], [["music", 56.12], ["hum", 8.58], ["ambient music", 5.62]]], "duration": [6.12, 4.62, 2.75, 47.62, 3.99, 5.58, 6.34, 3.86, 2.06, 4.53]} \ No newline at end of file diff --git a/annotations_1/9f1adgpyRjM_filtered.json b/annotations_1/9f1adgpyRjM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03d46afe143d7dae4ed615b535cd5f55a33c942d --- /dev/null +++ b/annotations_1/9f1adgpyRjM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.91], [3.0, 3.4], [4.0, 4.36], [7.0, 7.62], [9.0, 11.82], [15.0, 16.36], [18.0, 18.47], [20.0, 20.85], [22.0, 43.48], [48.0, 48.12], [52.0, 52.51], [56.0, 56.46], [62.0, 62.14], [63.0, 63.98], [66.0, 66.93], [68.0, 69.03], [69.0, 69.7], [70.0, 70.92], [71.0, 72.0], [75.0, 76.35], [78.0, 88.06], [98.0, 98.12], [99.0, 98.91], [101.0, 108.6], [121.0, 120.66], [123.0, 123.9], [124.0, 125.47], [126.0, 126.79], [127.0, 128.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 69.88, 0.0, 0.0, 0.0, 35.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.05, 0.0, 0.0, 35.65, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 69.38], ["wind instrument, woodwind instrument", 3.24], ["musical instrument", 3.17]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.95], ["animal", 26.55], ["dog", 9.42]], null, null, null, null, null], "duration": [-0.09, 0.4, 0.36, 0.62, 2.82, 1.36, 0.47, 0.85, 21.48, 0.12, 0.51, 0.46, 0.14, 0.98, 0.93, 1.03, 0.7, 0.92, 1.0, 1.35, 10.06, 0.12, -0.09, 7.6, -0.34, 0.9, 1.47, 0.79, 1.8]} \ No newline at end of file diff --git a/annotations_1/9fEMKGFr-Sk_filtered.json b/annotations_1/9fEMKGFr-Sk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52cc7855397be6618abcc3e207d769bb00605b88 --- /dev/null +++ b/annotations_1/9fEMKGFr-Sk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 21.56], [22.0, 23.16], [26.0, 27.09], [35.0, 34.97], [36.0, 36.9], [43.0, 44.04], [51.0, 51.61], [53.0, 53.79], [55.0, 55.16], [69.0, 70.71], [73.0, 72.66], [82.0, 97.24], [98.0, 98.85], [100.0, 100.82], [101.0, 111.96], [115.0, 115.37], [116.0, 142.57], [147.0, 151.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 0.0, 0.0, 93.45, 0.0, 51.6, 88.64], "audiomae_on_audioset": [[["speech", 42.81], ["music", 41.93], ["hum", 3.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.56, 1.16, 1.09, -0.03, 0.9, 1.04, 0.61, 0.79, 0.16, 1.71, -0.34, 15.24, 0.85, 0.82, 10.96, 0.37, 26.57, 4.36]} \ No newline at end of file diff --git a/annotations_1/9fFbDzUOD5o_filtered.json b/annotations_1/9fFbDzUOD5o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f00e6d69c5d3d470eb496fb27544118a999b0f33 --- /dev/null +++ b/annotations_1/9fFbDzUOD5o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 20.01], [32.0, 33.94], [41.0, 42.15], [44.0, 43.85], [45.0, 45.64], [57.0, 61.33], [67.0, 67.49], [69.0, 70.71], [72.0, 72.23], [74.0, 82.41], [83.0, 89.24], [91.0, 97.61], [99.0, 102.84], [103.0, 103.77], [105.0, 116.51]], "keep_status": [true, false, false, false, false, true, false, false, false, true, true, false, true, false, true], "silence_prob": [29.81, 0.0, 0.0, 0.0, 0.0, 31.3, 0.0, 0.0, 0.0, 34.08, 33.59, 29.65, 29.67, 0.0, 30.1], "audiomae_on_audioset": [[["crowd", 13.24], ["explosion", 12.58], ["fireworks", 8.79]], null, null, null, null, [["whale vocalization", 25.6], ["music", 22.95], ["moo", 4.82]], null, null, null, [["music", 31.55], ["livestock, farm animals, working animals", 12.58], ["cattle, bovinae", 9.93]], [["music", 36.31], ["scary music", 16.4], ["hum", 7.28]], [["music", 44.02], ["livestock, farm animals, working animals", 21.24], ["bleat", 7.7]], [["music", 50.52], ["speech", 12.9], ["didgeridoo", 4.81]], null, [["music", 31.04], ["hum", 10.68], ["speech", 10.19]]], "duration": [6.01, 1.94, 1.15, -0.15, 0.64, 4.33, 0.49, 1.71, 0.23, 8.41, 6.24, 6.61, 3.84, 0.77, 11.51]} \ No newline at end of file diff --git a/annotations_1/9fUtcVIlocI_filtered.json b/annotations_1/9fUtcVIlocI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18baa5cfa7920ea1030756310897e7592a595b14 --- /dev/null +++ b/annotations_1/9fUtcVIlocI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.78], [22.0, 22.3], [29.0, 30.0], [30.0, 30.65], [33.0, 33.76], [40.0, 40.9], [44.0, 64.1], [67.0, 68.67], [72.0, 74.9], [76.0, 76.22], [88.0, 88.79], [90.0, 92.01], [93.0, 93.34], [94.0, 94.66], [99.0, 99.01], [108.0, 136.19], [137.0, 142.84], [146.0, 146.92]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.84, 0.0, 30.76, 0.0, 0.0, 29.19, 0.0, 0.0, 0.0, 36.75, 44.69, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 79.66], ["speech", 4.88], ["electronic music", 2.68]], null, [["music", 51.86], ["sidetone", 4.77], ["civil defense siren", 3.86]], null, null, [["moo", 43.15], ["cattle, bovinae", 40.59], ["livestock, farm animals, working animals", 11.7]], null, null, null, [["music", 46.46], ["effects unit", 6.93], ["guitar", 6.57]], [["music", 35.21], ["guitar", 11.85], ["plucked string instrument", 9.11]], null], "duration": [0.78, 0.3, 1.0, 0.65, 0.76, 0.9, 20.1, 1.67, 2.9, 0.22, 0.79, 2.01, 0.34, 0.66, 0.01, 28.19, 5.84, 0.92]} \ No newline at end of file diff --git a/annotations_1/9g5pe-B6uL8_filtered.json b/annotations_1/9g5pe-B6uL8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/9g5pe-B6uL8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/9hMrzEWpZM0_filtered.json b/annotations_1/9hMrzEWpZM0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..557d690e9371846610dc425453ad4dce81ad7272 --- /dev/null +++ b/annotations_1/9hMrzEWpZM0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.8], [5.0, 6.13], [8.0, 8.92], [10.0, 13.04], [17.0, 17.14], [23.0, 24.29], [25.0, 28.27], [30.0, 31.36], [33.0, 33.47], [35.0, 34.97], [36.0, 36.64], [38.0, 38.82], [42.0, 43.75], [45.0, 47.56], [49.0, 49.37], [53.0, 54.14], [59.0, 64.18], [66.0, 71.81], [75.0, 76.96], [78.0, 79.76], [82.0, 82.51], [84.0, 85.68], [87.0, 88.06], [94.0, 96.3], [97.0, 98.36], [100.0, 100.4], [101.0, 101.06], [103.0, 103.52], [104.0, 104.87], [108.0, 109.29], [110.0, 111.55], [118.0, 118.32], [119.0, 124.33], [124.0, 124.36], [126.0, 125.78], [129.0, 129.66], [130.0, 131.7], [133.0, 137.62], [140.0, 145.35], [146.0, 160.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 84.25, 0.0, 0.0, 82.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.61, 0.0, 0.0, 98.8, 50.31, 0.0, 0.0, 0.0, 0.0, 0.0, 66.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.65, 0.0, 0.0, 0.0, 0.0, 98.59, 99.85, 41.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 67.96], ["sidetone", 14.93], ["breaking", 2.3]], null, null, null, null, null, null, [["speech", 62.08], ["music", 14.15], ["thunk", 12.74]]], "duration": [1.8, 1.13, 0.92, 3.04, 0.14, 1.29, 3.27, 1.36, 0.47, -0.03, 0.64, 0.82, 1.75, 2.56, 0.37, 1.14, 5.18, 5.81, 1.96, 1.76, 0.51, 1.68, 1.06, 2.3, 1.36, 0.4, 0.06, 0.52, 0.87, 1.29, 1.55, 0.32, 5.33, 0.36, -0.22, 0.66, 1.7, 4.62, 5.35, 14.14]} \ No newline at end of file diff --git a/annotations_1/9hNNrKNPGVo_filtered.json b/annotations_1/9hNNrKNPGVo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ea1453c1b67b50034d47a80249dd01878af6b93 --- /dev/null +++ b/annotations_1/9hNNrKNPGVo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[154.0, 155.28], [156.0, 166.65]], "keep_status": [false, false], "silence_prob": [0.0, 100.0], "audiomae_on_audioset": [null, null], "duration": [1.28, 10.65]} \ No newline at end of file diff --git a/annotations_1/9hPgjW2ou9E_filtered.json b/annotations_1/9hPgjW2ou9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e47d46deb505225076075b396d6d19f4e3fd03ec --- /dev/null +++ b/annotations_1/9hPgjW2ou9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.54], [66.0, 166.62], [167.0, 177.94], [181.0, 191.3], [196.0, 195.88], [199.0, 199.07], [200.0, 207.96]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 30.32, 29.13, 0.0, 0.0, 39.91], "audiomae_on_audioset": [null, null, [["music", 33.7], ["buzz", 21.83], ["synthesizer", 6.83]], [["music", 64.07], ["throbbing", 10.55], ["hum", 9.97]], null, null, [["music", 84.29], ["drum machine", 3.42], ["sampler", 3.18]]], "duration": [0.54, 100.62, 10.94, 10.3, -0.12, 0.07, 7.96]} \ No newline at end of file diff --git a/annotations_1/9j3KAnX0Nhk_filtered.json b/annotations_1/9j3KAnX0Nhk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7fda6be6cc77e8abf49355a7383cb2800d05543 --- /dev/null +++ b/annotations_1/9j3KAnX0Nhk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 50.25], [50.0, 51.61], [55.0, 58.95], [61.0, 64.29], [66.0, 72.69], [74.0, 80.22], [87.0, 111.84], [116.0, 126.77], [129.0, 142.6], [144.0, 145.23], [146.0, 152.12], [155.0, 158.38]], "keep_status": [false, false, false, true, false, true, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 29.89, 36.09, 30.81, 30.47, 30.3, 31.91, 30.42, 0.0, 31.64, 32.45], "audiomae_on_audioset": [null, null, [["music", 43.14], ["speech", 35.73], ["cacophony", 2.33]], [["throbbing", 21.61], ["speech", 17.89], ["music", 17.08]], [["music", 68.29], ["hum", 4.33], ["didgeridoo", 3.41]], [["music", 33.74], ["throbbing", 8.61], ["fly, housefly", 8.12]], [["music", 41.27], ["speech", 25.12], ["sidetone", 11.52]], [["speech", 39.3], ["music", 27.38], ["sidetone", 10.49]], [["speech", 53.91], ["music", 9.48], ["buzz", 4.24]], null, [["mains hum", 34.85], ["hum", 30.71], ["speech", 13.57]], [["hum", 19.35], ["sidetone", 14.36], ["music", 14.13]]], "duration": [34.25, 1.61, 3.95, 3.29, 6.69, 6.22, 24.84, 10.77, 13.6, 1.23, 6.12, 3.38]} \ No newline at end of file diff --git a/annotations_1/9j3y-J8IzYo_filtered.json b/annotations_1/9j3y-J8IzYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae950d2d55557895a8c340a5d77a543b7260e7b0 --- /dev/null +++ b/annotations_1/9j3y-J8IzYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 61.01], [62.0, 63.04], [64.0, 65.04], [67.0, 68.44], [71.0, 72.59], [74.0, 73.9], [79.0, 86.63], [88.0, 94.41], [96.0, 98.27], [100.0, 102.51], [103.0, 105.53], [106.0, 114.3], [116.0, 116.75], [119.0, 123.58], [125.0, 125.49], [128.0, 135.18], [137.0, 138.45], [140.0, 167.9], [169.0, 170.68], [174.0, 177.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [52.45, 0.0, 0.0, 0.0, 0.0, 0.0, 38.55, 100.0, 100.0, 100.0, 99.62, 99.78, 0.0, 50.66, 0.0, 31.61, 0.0, 30.88, 0.0, 79.76], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 45.01], ["fart", 28.59], ["creak", 18.35]], null, null, null, null, null, null, null, null, [["hum", 17.19], ["music", 16.27], ["throbbing", 7.65]], null, [["sidetone", 51.69], ["music", 21.47], ["speech", 10.82]], null, null], "duration": [28.01, 1.04, 1.04, 1.44, 1.59, -0.1, 7.63, 6.41, 2.27, 2.51, 2.53, 8.3, 0.75, 4.58, 0.49, 7.18, 1.45, 27.9, 1.68, 3.48]} \ No newline at end of file diff --git a/annotations_1/9jL7oaQAPMI_filtered.json b/annotations_1/9jL7oaQAPMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e2af0cd214d041310f23a808c3e9b3d0a0b4f07 --- /dev/null +++ b/annotations_1/9jL7oaQAPMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[87.0, 87.61], [88.0, 92.26], [93.0, 108.75], [110.0, 114.57], [118.0, 123.11]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 75.72, 41.74, 90.08, 87.37], "audiomae_on_audioset": [null, null, [["speech", 39.06], ["hum", 16.81], ["mains hum", 12.91]], null, null], "duration": [0.61, 4.26, 15.75, 4.57, 5.11]} \ No newline at end of file diff --git a/annotations_1/9jfRE_FljrE_filtered.json b/annotations_1/9jfRE_FljrE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0086017bbd3eb4d4907ecd2e94a642700088e045 --- /dev/null +++ b/annotations_1/9jfRE_FljrE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.53], [19.0, 19.4], [22.0, 22.49], [27.0, 28.48], [38.0, 40.64], [54.0, 54.62], [56.0, 58.23]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.8, 0.0, 31.87], "audiomae_on_audioset": [null, null, null, null, [["music", 43.86], ["boing", 31.86], ["effects unit", 1.53]], null, [["music", 51.74], ["didgeridoo", 22.36], ["theremin", 8.22]]], "duration": [0.53, 0.4, 0.49, 1.48, 2.64, 0.62, 2.23]} \ No newline at end of file diff --git a/annotations_1/9lqv-q15y1c_filtered.json b/annotations_1/9lqv-q15y1c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8455c3c72bef8176e9621012eb7bbdfca69bbf2 --- /dev/null +++ b/annotations_1/9lqv-q15y1c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.55], [4.0, 4.18], [5.0, 5.48], [7.0, 7.37], [10.0, 10.42], [12.0, 12.36], [13.0, 15.92], [18.0, 18.44], [23.0, 28.51], [29.0, 29.98], [32.0, 32.56], [35.0, 35.51], [38.0, 38.5], [39.0, 39.6], [42.0, 42.6], [47.0, 51.65], [54.0, 55.12], [56.0, 56.62], [58.0, 62.38], [71.0, 71.56], [73.0, 75.19], [76.0, 76.5], [86.0, 87.13], [115.0, 115.59], [118.0, 118.77], [122.0, 123.65], [124.0, 127.82], [129.0, 130.92], [134.0, 139.82], [141.0, 141.56], [142.0, 142.43]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.28, 0.0, 46.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.71, 0.0, 0.0, 79.76, 0.0, 30.6, 0.0, 0.0, 0.0, 0.0, 0.0, 45.95, 0.0, 29.66, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["radio", 25.26], ["speech", 21.21], ["hum", 7.02]], null, [["hum", 39.22], ["mains hum", 16.19], ["throbbing", 10.65]], null, null, null, null, null, null, [["speech", 19.94], ["noise", 15.61], ["hum", 10.05]], null, null, null, null, [["speech", 76.71], ["dog", 5.18], ["animal", 3.96]], null, null, null, null, null, [["speech", 26.94], ["telephone", 14.42], ["hum", 12.06]], null, [["snicker", 62.92], ["chuckle, chortle", 16.65], ["laughter", 6.79]], null, null], "duration": [1.55, 0.18, 0.48, 0.37, 0.42, 0.36, 2.92, 0.44, 5.51, 0.98, 0.56, 0.51, 0.5, 0.6, 0.6, 4.65, 1.12, 0.62, 4.38, 0.56, 2.19, 0.5, 1.13, 0.59, 0.77, 1.65, 3.82, 1.92, 5.82, 0.56, 0.43]} \ No newline at end of file diff --git a/annotations_1/9ltpGvaDfBM_filtered.json b/annotations_1/9ltpGvaDfBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5f804fa54f8fc9d3ad66a742efd241c56b880af --- /dev/null +++ b/annotations_1/9ltpGvaDfBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.38], [14.0, 66.01], [68.0, 75.02], [77.0, 79.83], [80.0, 85.8], [88.0, 92.43], [95.0, 95.62], [96.0, 97.61], [98.0, 99.17], [100.0, 100.26], [104.0, 104.57], [105.0, 105.48], [107.0, 107.15], [110.0, 117.26], [119.0, 120.02], [124.0, 135.38], [137.0, 137.13], [142.0, 144.95], [145.0, 147.39], [148.0, 148.51], [150.0, 151.6], [153.0, 153.62], [159.0, 159.73], [162.0, 162.87], [169.0, 170.67], [175.0, 176.03], [177.0, 177.84]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [34.7, 0.0, 30.45, 34.1, 31.29, 35.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.44, 0.0, 32.2, 0.0, 36.13, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.21], ["hum", 20.15], ["speech", 14.04]], null, [["music", 57.6], ["speech", 13.49], ["throbbing", 6.45]], [["speech", 18.64], ["music", 18.08], ["hum", 17.94]], [["music", 52.41], ["hum", 17.89], ["speech", 6.09]], [["hum", 24.84], ["music", 19.1], ["throbbing", 14.84]], null, null, null, null, null, null, null, [["music", 26.58], ["hum", 17.05], ["mains hum", 11.86]], null, [["hum", 23.52], ["mains hum", 19.86], ["speech", 14.36]], null, [["didgeridoo", 20.34], ["music", 13.44], ["mains hum", 7.83]], null, null, null, null, null, null, null, null, null], "duration": [11.38, 52.01, 7.02, 2.83, 5.8, 4.43, 0.62, 1.61, 1.17, 0.26, 0.57, 0.48, 0.15, 7.26, 1.02, 11.38, 0.13, 2.95, 2.39, 0.51, 1.6, 0.62, 0.73, 0.87, 1.67, 1.03, 0.84]} \ No newline at end of file diff --git a/annotations_1/9n23ISvkbFQ_filtered.json b/annotations_1/9n23ISvkbFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72f21c8c827adbe19c54101a898760cc3748bc57 --- /dev/null +++ b/annotations_1/9n23ISvkbFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.1], [8.0, 16.12], [19.0, 29.64], [30.0, 30.2], [31.0, 31.78], [33.0, 36.88], [38.0, 39.58], [43.0, 44.58], [45.0, 48.86], [49.0, 51.38], [52.0, 58.58], [59.0, 61.86], [62.0, 65.3], [66.0, 71.05], [72.0, 88.33], [89.0, 91.1], [93.0, 96.45], [97.0, 98.41], [100.0, 104.63], [106.0, 110.05], [112.0, 140.8], [142.0, 142.75], [143.0, 144.83], [146.0, 146.08], [147.0, 147.36], [149.0, 165.15], [165.0, 165.45]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, false], "silence_prob": [100.0, 100.0, 96.29, 0.0, 0.0, 46.72, 0.0, 0.0, 99.59, 90.78, 100.0, 99.21, 96.04, 100.0, 100.0, 100.0, 46.86, 0.0, 94.07, 41.76, 95.64, 0.0, 0.0, 0.0, 0.0, 37.41, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["applause", 26.04], ["speech", 25.66], ["music", 11.19]], null, null, null, null, null, null, null, null, null, null, [["speech", 50.53], ["cheering", 8.43], ["crowd", 7.62]], null, null, [["speech", 38.04], ["applause", 23.77], ["crowd", 6.75]], null, null, null, null, null, [["music", 55.63], ["speech", 7.9], ["musical instrument", 4.15]], null], "duration": [3.1, 8.12, 10.64, 0.2, 0.78, 3.88, 1.58, 1.58, 3.86, 2.38, 6.58, 2.86, 3.3, 5.05, 16.33, 2.1, 3.45, 1.41, 4.63, 4.05, 28.8, 0.75, 1.83, 0.08, 0.36, 16.15, 0.45]} \ No newline at end of file diff --git a/annotations_1/9nOc2GqCQ2Y_filtered.json b/annotations_1/9nOc2GqCQ2Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..607f0c33538627df1ee97463f9c2cf15112e95c1 --- /dev/null +++ b/annotations_1/9nOc2GqCQ2Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.01], [8.0, 9.17], [27.0, 28.07], [40.0, 41.47], [46.0, 46.31], [51.0, 52.14], [54.0, 65.72], [67.0, 78.09], [101.0, 100.84], [101.0, 120.72], [125.0, 126.84], [129.0, 132.14], [133.0, 140.36], [141.0, 141.24], [142.0, 144.17], [146.0, 172.2], [172.0, 173.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.57, 32.37, 0.0, 31.7, 0.0, 34.11, 32.57, 0.0, 33.08, 32.05, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 61.16], ["speech", 11.88], ["drum machine", 3.78]], [["music", 74.36], ["funk", 3.44], ["sampler", 1.56]], null, [["music", 65.14], ["speech", 14.59], ["boing", 6.07]], null, [["music", 42.87], ["throbbing", 8.26], ["ding", 7.61]], [["music", 38.97], ["scratching (performance technique)", 6.82], ["drum machine", 6.12]], null, [["music", 53.7], ["throbbing", 9.03], ["hum", 5.34]], [["music", 50.03], ["singing", 5.54], ["song", 5.36]], null], "duration": [0.01, 1.17, 1.07, 1.47, 0.31, 1.14, 11.72, 11.09, -0.16, 19.72, 1.84, 3.14, 7.36, 0.24, 2.17, 26.2, 1.6]} \ No newline at end of file diff --git a/annotations_1/9nc12yOA4jM_filtered.json b/annotations_1/9nc12yOA4jM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51f322c58481c2bea4aa72a23f490c61a986f84b --- /dev/null +++ b/annotations_1/9nc12yOA4jM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.26], [5.0, 9.04], [10.0, 11.92], [13.0, 13.78], [15.0, 16.65], [17.0, 18.94], [23.0, 25.42], [28.0, 30.52], [31.0, 37.03], [37.0, 39.82], [40.0, 41.84], [43.0, 45.52], [46.0, 47.58], [48.0, 51.93], [53.0, 56.78], [59.0, 74.29], [78.0, 81.18], [83.0, 84.32], [84.0, 90.48], [93.0, 102.66], [107.0, 110.84], [115.0, 119.69], [121.0, 121.04], [123.0, 124.73], [127.0, 128.26], [129.0, 129.76], [135.0, 136.0], [141.0, 141.57], [143.0, 143.19], [148.0, 148.34], [162.0, 163.11], [171.0, 172.17], [173.0, 175.04], [175.0, 176.32], [178.0, 180.69], [181.0, 187.62], [188.0, 189.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [100.0, 91.98, 0.0, 0.0, 0.0, 0.0, 99.96, 100.0, 79.59, 71.43, 0.0, 97.83, 0.0, 74.92, 35.98, 33.58, 100.0, 0.0, 82.79, 36.5, 32.78, 32.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 56.63, 39.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.55], ["whale vocalization", 9.87], ["hum", 6.19]], [["music", 52.11], ["throbbing", 15.62], ["hum", 15.12]], null, null, null, [["music", 62.23], ["sidetone", 11.45], ["boing", 8.33]], [["music", 21.08], ["speech", 15.96], ["fly, housefly", 10.11]], [["speech", 51.3], ["music", 7.18], ["didgeridoo", 5.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.09], ["hum", 16.72], ["throbbing", 13.14]], null], "duration": [2.26, 4.04, 1.92, 0.78, 1.65, 1.94, 2.42, 2.52, 6.03, 2.82, 1.84, 2.52, 1.58, 3.93, 3.78, 15.29, 3.18, 1.32, 6.48, 9.66, 3.84, 4.69, 0.04, 1.73, 1.26, 0.76, 1.0, 0.57, 0.19, 0.34, 1.11, 1.17, 2.04, 1.32, 2.69, 6.62, 1.11]} \ No newline at end of file diff --git a/annotations_1/9nwSOUvKyys_filtered.json b/annotations_1/9nwSOUvKyys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fba546f7070867982f9bd3490799cb3376845622 --- /dev/null +++ b/annotations_1/9nwSOUvKyys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.77], [17.0, 18.6], [24.0, 25.39], [33.0, 34.1], [35.0, 36.21], [45.0, 58.35], [59.0, 59.0], [60.0, 60.27], [61.0, 61.91], [63.0, 67.15], [69.0, 69.58], [71.0, 71.64], [74.0, 74.7], [77.0, 79.3], [80.0, 80.92], [82.0, 82.98], [83.0, 86.17], [87.0, 87.81], [89.0, 89.8], [91.0, 91.57], [93.0, 96.04], [99.0, 100.25], [101.0, 101.16], [102.0, 107.84], [108.0, 109.73], [115.0, 116.38]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 42.17, 0.0, 0.0, 0.0, 87.19, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 73.51, 0.0, 0.0, 56.03, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 15.64], ["animal", 12.4], ["roar", 8.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.77, 1.6, 1.39, 1.1, 1.21, 13.35, 0.0, 0.27, 0.91, 4.15, 0.58, 0.64, 0.7, 2.3, 0.92, 0.98, 3.17, 0.81, 0.8, 0.57, 3.04, 1.25, 0.16, 5.84, 1.73, 1.38]} \ No newline at end of file diff --git a/annotations_1/9oS260wm-UM_filtered.json b/annotations_1/9oS260wm-UM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b18667305629751f94b0c0a87e823d82ed284c4 --- /dev/null +++ b/annotations_1/9oS260wm-UM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.46], [11.0, 11.4], [18.0, 18.49], [20.0, 21.25], [33.0, 36.95], [46.0, 46.94], [49.0, 48.88], [58.0, 58.67], [61.0, 77.8], [81.0, 81.01], [83.0, 94.73], [95.0, 102.63], [104.0, 108.01], [111.0, 115.69], [117.0, 119.57], [122.0, 129.37], [137.0, 137.66], [139.0, 139.73], [141.0, 144.75]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, true, true, false, false, false, false, false], "silence_prob": [44.6, 0.0, 0.0, 0.0, 34.65, 0.0, 0.0, 0.0, 31.82, 0.0, 31.17, 29.58, 30.26, 30.27, 70.3, 28.96, 0.0, 0.0, 67.76], "audiomae_on_audioset": [[["speech", 44.92], ["music", 33.72], ["brass instrument", 4.14]], null, null, null, [["music", 40.83], ["throbbing", 25.06], ["speech", 7.65]], null, null, null, [["music", 26.04], ["speech", 22.04], ["groan", 21.03]], null, [["speech", 28.32], ["music", 27.71], ["hum", 8.87]], [["sidetone", 44.88], ["music", 25.96], ["speech", 12.76]], [["music", 27.22], ["chirp tone", 5.19], ["tuning fork", 5.15]], [["music", 11.6], ["explosion", 10.78], ["noise", 8.97]], null, [["explosion", 35.63], ["speech", 33.08], ["eruption", 16.88]], null, null, null], "duration": [2.46, 0.4, 0.49, 1.25, 3.95, 0.94, -0.12, 0.67, 16.8, 0.01, 11.73, 7.63, 4.01, 4.69, 2.57, 7.37, 0.66, 0.73, 3.75]} \ No newline at end of file diff --git a/annotations_1/9oiFkoROlu0_filtered.json b/annotations_1/9oiFkoROlu0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a99a0b2c2efbc333b92d7fe9ca064a1626ff469 --- /dev/null +++ b/annotations_1/9oiFkoROlu0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.72], [22.0, 22.4], [28.0, 28.75], [30.0, 33.94], [36.0, 36.21], [37.0, 46.47], [47.0, 50.38], [51.0, 51.9], [53.0, 53.87], [55.0, 56.73], [57.0, 59.86], [61.0, 63.8], [65.0, 65.75], [67.0, 72.17], [73.0, 75.93], [77.0, 79.64], [81.0, 83.08], [84.0, 84.1], [86.0, 90.29], [91.0, 97.78], [108.0, 108.19], [109.0, 117.85], [122.0, 136.34], [140.0, 150.26], [150.0, 154.04], [154.0, 156.03], [157.0, 159.46], [160.0, 173.04], [175.0, 177.25], [178.0, 177.94]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, true, true, false, false, false], "silence_prob": [50.31, 0.0, 0.0, 37.74, 0.0, 29.87, 29.56, 0.0, 0.0, 0.0, 54.7, 97.43, 0.0, 84.98, 58.47, 75.07, 64.41, 0.0, 29.24, 46.68, 0.0, 37.2, 31.16, 32.71, 31.59, 32.75, 33.11, 28.84, 32.16, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 21.61], ["hum", 13.92], ["electronic music", 12.03]], null, [["music", 21.92], ["rumble", 19.48], ["hum", 8.27]], [["throbbing", 44.91], ["hum", 18.09], ["mains hum", 11.65]], null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 28.63], ["hum", 17.61], ["music", 17.12]], [["hum", 36.72], ["music", 11.73], ["mains hum", 10.12]], null, [["hum", 47.88], ["mains hum", 20.17], ["speech", 12.14]], [["hum", 32.58], ["mains hum", 20.6], ["music", 17.97]], [["throbbing", 31.26], ["hum", 25.29], ["music", 15.3]], [["music", 24.91], ["speech", 20.16], ["throbbing", 19.26]], [["music", 36.44], ["throbbing", 22.46], ["hum", 9.47]], [["music", 44.96], ["speech", 9.81], ["throbbing", 8.05]], [["speech", 57.76], ["music", 14.91], ["mains hum", 7.31]], [["music", 47.78], ["throbbing", 21.45], ["hum", 10.44]], null], "duration": [2.72, 0.4, 0.75, 3.94, 0.21, 9.47, 3.38, 0.9, 0.87, 1.73, 2.86, 2.8, 0.75, 5.17, 2.93, 2.64, 2.08, 0.1, 4.29, 6.78, 0.19, 8.85, 14.34, 10.26, 4.04, 2.03, 2.46, 13.04, 2.25, -0.06]} \ No newline at end of file diff --git a/annotations_1/9pF_vfzjbpY_filtered.json b/annotations_1/9pF_vfzjbpY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..515dd3658385355ddb3a2ee8deb54e9140c119e9 --- /dev/null +++ b/annotations_1/9pF_vfzjbpY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[159.0, 161.25], [162.0, 162.18], [165.0, 165.96], [168.0, 175.49]], "keep_status": [false, false, false, true], "silence_prob": [44.49, 0.0, 0.0, 38.26], "audiomae_on_audioset": [[["coin (dropping)", 39.88], ["speech", 30.63], ["glass", 5.48]], null, null, [["hum", 21.69], ["speech", 16.17], ["mains hum", 15.12]]], "duration": [2.25, 0.18, 0.96, 7.49]} \ No newline at end of file diff --git a/annotations_1/9qdMVMCGr48_filtered.json b/annotations_1/9qdMVMCGr48_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20e2ed9f1e00574e432c52b4af2d16b0f0d08304 --- /dev/null +++ b/annotations_1/9qdMVMCGr48_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.21], [12.0, 34.7], [36.0, 38.5], [39.0, 39.45], [39.0, 39.48], [39.0, 39.51], [40.0, 39.68], [42.0, 45.71], [48.0, 60.69], [62.0, 63.75], [66.0, 82.97], [84.0, 85.09], [86.0, 87.12], [88.0, 88.94], [92.0, 93.34], [96.0, 98.41], [100.0, 101.09], [103.0, 103.87], [105.0, 106.03]], "keep_status": [false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [51.99, 48.69, 42.88, 0.0, 0.0, 0.0, 0.0, 34.15, 31.03, 0.0, 36.78, 0.0, 0.0, 0.0, 0.0, 49.04, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["water", 29.25], ["slosh", 19.59], ["splash, splatter", 14.09]], [["throbbing", 12.25], ["frog", 10.27], ["music", 7.07]], null, null, null, null, [["throbbing", 41.65], ["hum", 39.35], ["music", 7.37]], [["music", 61.45], ["speech", 16.35], ["sidetone", 1.62]], null, [["cattle, bovinae", 24.33], ["livestock, farm animals, working animals", 24.01], ["moo", 16.81]], null, null, null, null, [["music", 31.76], ["musical instrument", 16.0], ["singing bowl", 6.46]], null, null, null], "duration": [6.21, 22.7, 2.5, 0.45, 0.48, 0.51, -0.32, 3.71, 12.69, 1.75, 16.97, 1.09, 1.12, 0.94, 1.34, 2.41, 1.09, 0.87, 1.03]} \ No newline at end of file diff --git a/annotations_1/9qorxa6iMm4_filtered.json b/annotations_1/9qorxa6iMm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0dd1d5004657ef8877ed6d925b796956f2c154b0 --- /dev/null +++ b/annotations_1/9qorxa6iMm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 24.19], [31.0, 32.17], [34.0, 34.52], [36.0, 36.31], [37.0, 44.29], [45.0, 44.95], [47.0, 52.71], [54.0, 95.2], [96.0, 98.64], [101.0, 119.31], [122.0, 122.52]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [37.34, 0.0, 0.0, 0.0, 31.91, 0.0, 39.96, 0.0, 38.37, 35.31, 0.0], "audiomae_on_audioset": [[["music", 48.57], ["theremin", 24.8], ["musical instrument", 8.42]], null, null, null, [["music", 52.4], ["theremin", 8.32], ["musical instrument", 6.75]], null, [["music", 40.43], ["theremin", 27.2], ["musical instrument", 6.4]], null, [["music", 37.94], ["foghorn", 12.41], ["ambient music", 4.35]], [["music", 68.1], ["musical instrument", 6.32], ["synthesizer", 4.52]], null], "duration": [16.19, 1.17, 0.52, 0.31, 7.29, -0.05, 5.71, 41.2, 2.64, 18.31, 0.52]} \ No newline at end of file diff --git a/annotations_1/9riBff-h-hM_filtered.json b/annotations_1/9riBff-h-hM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a46559118bfe26f114433482d27ffa51b151d238 --- /dev/null +++ b/annotations_1/9riBff-h-hM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.07], [12.0, 12.34], [20.0, 20.58], [25.0, 25.34], [27.0, 28.83], [29.0, 29.24], [33.0, 46.72], [48.0, 56.83], [65.0, 74.22], [75.0, 76.55], [82.0, 87.03], [89.0, 89.13], [90.0, 91.07], [98.0, 116.16], [117.0, 117.44], [119.0, 136.98], [137.0, 137.02], [138.0, 149.98]], "keep_status": [true, false, false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [30.64, 0.0, 0.0, 0.0, 0.0, 0.0, 30.22, 31.18, 31.34, 0.0, 30.85, 0.0, 0.0, 32.32, 0.0, 30.64, 0.0, 30.59], "audiomae_on_audioset": [[["music", 43.46], ["speech", 10.56], ["throbbing", 6.36]], null, null, null, null, null, [["music", 35.26], ["speech", 12.01], ["explosion", 6.54]], [["music", 76.54], ["didgeridoo", 3.86], ["throbbing", 3.03]], [["cattle, bovinae", 28.67], ["moo", 16.97], ["livestock, farm animals, working animals", 13.68]], null, [["music", 19.03], ["animal", 8.47], ["livestock, farm animals, working animals", 8.41]], null, null, [["music", 54.83], ["speech", 11.8], ["synthesizer", 4.11]], null, [["music", 63.05], ["speech", 9.53], ["throbbing", 3.31]], null, [["speech", 46.04], ["music", 25.68], ["vehicle", 3.08]]], "duration": [3.07, 0.34, 0.58, 0.34, 1.83, 0.24, 13.72, 8.83, 9.22, 1.55, 5.03, 0.13, 1.07, 18.16, 0.44, 17.98, 0.02, 11.98]} \ No newline at end of file diff --git a/annotations_1/9smHLhj75CU_filtered.json b/annotations_1/9smHLhj75CU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d64cadc9982041ac3195c1ebbfa4ce1708348cbd --- /dev/null +++ b/annotations_1/9smHLhj75CU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.2], [7.0, 8.46], [9.0, 10.49], [12.0, 19.87], [21.0, 22.4], [26.0, 52.66], [55.0, 58.92], [60.0, 64.03], [66.0, 100.33]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [79.07, 0.0, 0.0, 99.92, 0.0, 99.52, 99.91, 99.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [3.2, 1.46, 1.49, 7.87, 1.4, 26.66, 3.92, 4.03, 34.33]} \ No newline at end of file diff --git a/annotations_1/9svQ60inP0g_filtered.json b/annotations_1/9svQ60inP0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1abca72f38a83dff808950145600d8c4e4b6a2eb --- /dev/null +++ b/annotations_1/9svQ60inP0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.62], [9.0, 9.29], [10.0, 10.39], [11.0, 13.29], [15.0, 15.82], [16.0, 18.89], [20.0, 27.51], [31.0, 31.38], [33.0, 34.5], [35.0, 36.29], [37.0, 38.94], [39.0, 41.28], [42.0, 43.53], [45.0, 47.19], [48.0, 51.24], [54.0, 67.12], [68.0, 114.79], [116.0, 117.98], [118.0, 146.55]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 37.22, 0.0, 34.44, 32.13, 0.0, 0.0, 0.0, 0.0, 37.82, 0.0, 37.57, 36.47, 34.78, 0.0, 0.0, 28.66], "audiomae_on_audioset": [null, null, null, [["music", 17.86], ["hum", 9.57], ["sine wave", 6.01]], null, [["speech", 30.27], ["mains hum", 19.43], ["hum", 7.58]], [["speech", 83.5], ["music", 2.99], ["crumpling, crinkling", 1.4]], null, null, null, null, [["didgeridoo", 74.11], ["music", 15.51], ["speech", 2.02]], null, [["gong", 28.39], ["music", 22.96], ["singing bowl", 12.42]], [["rumble", 11.12], ["moo", 4.21], ["music", 4.02]], [["hum", 65.8], ["throbbing", 13.58], ["mains hum", 13.08]], null, null, [["speech", 37.84], ["music", 7.88], ["ding", 6.08]]], "duration": [0.62, 0.29, 0.39, 2.29, 0.82, 2.89, 7.51, 0.38, 1.5, 1.29, 1.94, 2.28, 1.53, 2.19, 3.24, 13.12, 46.79, 1.98, 28.55]} \ No newline at end of file diff --git a/annotations_1/9tHwS5Ymvag_filtered.json b/annotations_1/9tHwS5Ymvag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d8ac8fa0825aef2cc9a70b9e4088a09dd14ea6a --- /dev/null +++ b/annotations_1/9tHwS5Ymvag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.14], [9.0, 9.1], [10.0, 10.57], [16.0, 16.56], [19.0, 19.06], [27.0, 28.51], [29.0, 30.0], [32.0, 32.66], [35.0, 35.83], [37.0, 37.17], [41.0, 41.52], [43.0, 43.6], [62.0, 62.29], [64.0, 63.93], [70.0, 70.09], [70.0, 71.88], [73.0, 74.28], [76.0, 77.01], [81.0, 82.02], [83.0, 83.71], [85.0, 85.62], [89.0, 89.8], [90.0, 90.31], [92.0, 92.48], [105.0, 105.85], [106.0, 106.68], [107.0, 107.57], [112.0, 112.11], [116.0, 116.67], [118.0, 118.76], [121.0, 121.91], [127.0, 127.57], [128.0, 128.92], [131.0, 131.21], [138.0, 138.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [63.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.14, 0.1, 0.57, 0.56, 0.06, 1.51, 1.0, 0.66, 0.83, 0.17, 0.52, 0.6, 0.29, -0.07, 0.09, 1.88, 1.28, 1.01, 1.02, 0.71, 0.62, 0.8, 0.31, 0.48, 0.85, 0.68, 0.57, 0.11, 0.67, 0.76, 0.91, 0.57, 0.92, 0.21, 0.11]} \ No newline at end of file diff --git a/annotations_1/9tli2kwH5mY_filtered.json b/annotations_1/9tli2kwH5mY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..751ce00dad6f7b7ba78c35ed199c47de8ffaaaac --- /dev/null +++ b/annotations_1/9tli2kwH5mY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.63], [7.0, 6.84], [13.0, 14.37], [17.0, 18.13], [33.0, 33.24], [36.0, 36.04], [43.0, 43.9], [45.0, 53.7], [64.0, 66.55], [68.0, 68.15], [74.0, 78.78], [89.0, 89.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.87, 87.74, 0.0, 86.82, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.63, -0.16, 1.37, 1.13, 0.24, 0.04, 0.9, 8.7, 2.55, 0.15, 4.78, 0.29]} \ No newline at end of file diff --git a/annotations_1/9tx1z5_iVeo_filtered.json b/annotations_1/9tx1z5_iVeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45c9e8f56d31a8af54de95513e5017778f8419b5 --- /dev/null +++ b/annotations_1/9tx1z5_iVeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.28], [12.0, 16.19], [16.0, 16.85], [17.0, 25.05], [27.0, 28.02], [34.0, 34.94], [43.0, 46.04], [55.0, 55.76], [57.0, 57.57], [59.0, 59.32], [60.0, 60.2], [62.0, 61.94], [70.0, 70.01], [71.0, 73.84], [74.0, 75.47], [76.0, 76.86], [85.0, 85.21], [88.0, 88.75], [93.0, 92.85], [93.0, 93.11], [96.0, 99.27], [101.0, 101.87], [102.0, 103.54], [104.0, 105.04], [107.0, 107.2], [110.0, 110.27], [113.0, 113.27], [115.0, 115.64], [118.0, 118.72], [124.0, 125.02], [126.0, 126.52], [129.0, 129.68], [131.0, 131.58], [132.0, 140.71], [141.0, 148.31], [152.0, 153.17], [155.0, 156.19], [158.0, 159.73], [166.0, 166.41], [167.0, 167.56], [175.0, 175.44], [179.0, 179.66], [180.0, 181.16], [183.0, 183.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.07, 60.51, 0.0, 53.22, 0.0, 0.0, 55.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.89, 59.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.28, 4.19, 0.85, 8.05, 1.02, 0.94, 3.04, 0.76, 0.57, 0.32, 0.2, -0.06, 0.01, 2.84, 1.47, 0.86, 0.21, 0.75, -0.15, 0.11, 3.27, 0.87, 1.54, 1.04, 0.2, 0.27, 0.27, 0.64, 0.72, 1.02, 0.52, 0.68, 0.58, 8.71, 7.31, 1.17, 1.19, 1.73, 0.41, 0.56, 0.44, 0.66, 1.16, 0.88]} \ No newline at end of file diff --git a/annotations_1/9u6xaK00otk_filtered.json b/annotations_1/9u6xaK00otk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1321623754883cb59e554580e4d57e37900588ac --- /dev/null +++ b/annotations_1/9u6xaK00otk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.19], [14.0, 15.48], [17.0, 18.08], [19.0, 20.75], [22.0, 23.11], [24.0, 26.94], [28.0, 38.62], [41.0, 43.38], [52.0, 52.52], [62.0, 62.36], [67.0, 67.54], [68.0, 69.74], [72.0, 73.63], [77.0, 81.75], [82.0, 84.35], [85.0, 87.89], [89.0, 91.18], [98.0, 109.73], [113.0, 114.52], [118.0, 119.55], [122.0, 123.33], [124.0, 130.94], [132.0, 132.9], [134.0, 135.31], [136.0, 140.37], [141.0, 144.51], [146.0, 149.07], [151.0, 153.79], [156.0, 157.59], [159.0, 159.46], [161.0, 163.63], [165.0, 167.71], [170.0, 172.02], [174.0, 173.92], [175.0, 175.44], [176.0, 177.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 76.86, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 76.86, 96.29, 58.81, 80.82, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 93.91, 78.21, 88.64, 87.55, 0.0, 0.0, 91.64, 91.64, 90.43, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 1.48, 1.08, 1.75, 1.11, 2.94, 10.62, 2.38, 0.52, 0.36, 0.54, 1.74, 1.63, 4.75, 2.35, 2.89, 2.18, 11.73, 1.52, 1.55, 1.33, 6.94, 0.9, 1.31, 4.37, 3.51, 3.07, 2.79, 1.59, 0.46, 2.63, 2.71, 2.02, -0.08, 0.44, 1.33]} \ No newline at end of file diff --git a/annotations_1/9uXRIrNj_z4_filtered.json b/annotations_1/9uXRIrNj_z4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10911a0ef805d74dff8276b961e82e0fb2094093 --- /dev/null +++ b/annotations_1/9uXRIrNj_z4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 84.86]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [44.86]} \ No newline at end of file diff --git a/annotations_1/9ukjNhwdbGY_filtered.json b/annotations_1/9ukjNhwdbGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2a7e79f8b5672d2d8695519d859c3ab9797929e --- /dev/null +++ b/annotations_1/9ukjNhwdbGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.04], [10.0, 14.61], [16.0, 18.93], [40.0, 40.19], [48.0, 48.56], [51.0, 51.34], [65.0, 65.43], [67.0, 68.35], [73.0, 80.87], [81.0, 84.45], [85.0, 85.4], [87.0, 91.81], [92.0, 92.74], [96.0, 121.34]], "keep_status": [true, true, false, false, false, false, false, false, true, true, false, true, false, false], "silence_prob": [29.85, 30.13, 29.7, 0.0, 0.0, 0.0, 0.0, 0.0, 32.03, 34.12, 0.0, 33.42, 0.0, 33.78], "audiomae_on_audioset": [[["speech", 39.77], ["music", 13.66], ["animal", 3.89]], [["music", 32.98], ["speech", 32.96], ["outside, urban or manmade", 3.3]], [["cattle, bovinae", 37.57], ["moo", 28.94], ["livestock, farm animals, working animals", 19.36]], null, null, null, null, null, [["music", 26.74], ["speech", 26.66], ["crowd", 5.18]], [["music", 49.7], ["speech", 9.86], ["wind instrument, woodwind instrument", 6.29]], null, [["music", 34.97], ["speech", 24.41], ["bagpipes", 6.44]], null, [["music", 41.02], ["fart", 26.72], ["musical instrument", 9.32]]], "duration": [8.04, 4.61, 2.93, 0.19, 0.56, 0.34, 0.43, 1.35, 7.87, 3.45, 0.4, 4.81, 0.74, 25.34]} \ No newline at end of file diff --git a/annotations_1/9v-2_YOVxGw_filtered.json b/annotations_1/9v-2_YOVxGw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f3291a5a6bbef8981c1c712e6eee96906d00396 --- /dev/null +++ b/annotations_1/9v-2_YOVxGw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.06], [9.0, 9.68], [15.0, 16.46], [20.0, 21.96], [23.0, 25.44], [27.0, 47.14], [55.0, 72.93], [74.0, 74.22], [74.0, 79.22], [83.0, 83.15], [86.0, 113.44], [117.0, 120.16], [120.0, 120.23], [124.0, 130.13], [130.0, 130.33], [131.0, 132.07]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 52.8, 33.47, 30.4, 0.0, 34.53, 0.0, 32.15, 34.39, 0.0, 32.89, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 47.01], ["hum", 19.76], ["throbbing", 15.95]], [["ding", 21.23], ["livestock, farm animals, working animals", 13.91], ["tuning fork", 11.79]], null, [["cattle, bovinae", 12.57], ["livestock, farm animals, working animals", 10.46], ["moo", 8.98]], null, [["music", 75.32], ["theremin", 8.04], ["synthesizer", 3.03]], [["music", 67.79], ["musical instrument", 10.89], ["guitar", 3.38]], null, [["music", 63.64], ["beatboxing", 19.63], ["boing", 2.99]], null, null], "duration": [0.06, 0.68, 1.46, 1.96, 2.44, 20.14, 17.93, 0.22, 5.22, 0.15, 27.44, 3.16, 0.23, 6.13, 0.33, 1.07]} \ No newline at end of file diff --git a/annotations_1/9wCiCJ7KDs8_filtered.json b/annotations_1/9wCiCJ7KDs8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31e840c5e4e616617aa90de73a113011e79dcf6c --- /dev/null +++ b/annotations_1/9wCiCJ7KDs8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.28], [11.0, 15.26], [17.0, 25.17], [34.0, 33.93], [35.0, 35.67], [41.0, 45.67], [52.0, 52.25], [52.0, 53.49], [54.0, 53.52], [54.0, 57.64], [65.0, 66.09], [69.0, 70.39], [78.0, 78.09], [80.0, 80.35]], "keep_status": [false, true, true, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 30.76, 31.34, 0.0, 0.0, 29.88, 0.0, 0.0, 0.0, 32.03, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 23.25], ["music", 14.44], ["hum", 9.9]], [["hum", 23.87], ["sidetone", 23.5], ["speech", 22.16]], null, null, [["speech", 25.44], ["music", 11.28], ["throbbing", 7.2]], null, null, null, [["speech", 59.31], ["fly, housefly", 4.11], ["animal", 3.61]], null, null, null, null], "duration": [1.28, 4.26, 8.17, -0.07, 0.67, 4.67, 0.25, 1.49, -0.48, 3.64, 1.09, 1.39, 0.09, 0.35]} \ No newline at end of file diff --git a/annotations_1/9yDL0AKUCKo_filtered.json b/annotations_1/9yDL0AKUCKo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15cbd55bb50e16d991ee665d3b782adf205a78a3 --- /dev/null +++ b/annotations_1/9yDL0AKUCKo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 51.71], [55.0, 67.51], [70.0, 70.85], [72.0, 73.06], [75.0, 75.27], [77.0, 77.55], [80.0, 81.43], [83.0, 83.17], [86.0, 86.66], [88.0, 88.23], [91.0, 91.74], [95.0, 95.39], [97.0, 97.6], [99.0, 99.64], [101.0, 124.07], [127.0, 128.21], [129.0, 130.57], [133.0, 134.54], [136.0, 136.78], [138.0, 141.39], [143.0, 145.45], [148.0, 149.23], [154.0, 164.79], [165.0, 164.83], [165.0, 164.86], [165.0, 164.89], [172.0, 172.1], [175.0, 176.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [34.66, 35.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.26, 0.0, 0.0, 0.0, 0.0, 98.01, 74.92, 0.0, 32.88, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 60.98], ["didgeridoo", 4.78], ["electronic music", 4.53]], [["music", 73.81], ["musical instrument", 3.48], ["electronic music", 2.29]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.43], ["frog", 11.02], ["sidetone", 7.24]], null, null, null, null, null, null, null, [["buzz", 20.93], ["music", 19.01], ["hum", 9.87]], null, null, null, null, null], "duration": [9.71, 12.51, 0.85, 1.06, 0.27, 0.55, 1.43, 0.17, 0.66, 0.23, 0.74, 0.39, 0.6, 0.64, 23.07, 1.21, 1.57, 1.54, 0.78, 3.39, 2.45, 1.23, 10.79, -0.17, -0.14, -0.11, 0.1, 1.96]} \ No newline at end of file diff --git a/annotations_1/9ykMeXdU_Ng_filtered.json b/annotations_1/9ykMeXdU_Ng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bf2934c0d2103d84d095fdf2781918327419719 --- /dev/null +++ b/annotations_1/9ykMeXdU_Ng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.44], [6.0, 7.08], [9.0, 10.49], [12.0, 12.68], [13.0, 18.23], [19.0, 19.7], [20.0, 21.3], [24.0, 24.46], [25.0, 24.98], [25.0, 25.91], [26.0, 26.87], [27.0, 28.29], [30.0, 30.57], [31.0, 32.14], [33.0, 34.13], [38.0, 38.8], [47.0, 47.87], [57.0, 58.04], [62.0, 62.36], [67.0, 68.55], [80.0, 81.16], [85.0, 85.24], [90.0, 90.68], [94.0, 94.91], [98.0, 98.59], [101.0, 103.06], [105.0, 107.97], [110.0, 120.43], [121.0, 122.81], [124.0, 126.69], [128.0, 129.51], [130.0, 135.51], [138.0, 142.91], [143.0, 145.0], [147.0, 148.07], [151.0, 151.63], [155.0, 155.56], [159.0, 160.51], [163.0, 163.71], [166.0, 167.58], [168.0, 170.19], [171.0, 174.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 89.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.53, 100.0, 44.93, 0.0, 99.82, 0.0, 42.28, 52.33, 55.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 94.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["burping, eructation", 74.11], ["crushing", 9.2], ["telephone bell ringing", 4.81]], null, null, null, [["speech", 67.87], ["telephone", 14.62], ["busy signal", 7.11]], null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 1.08, 1.49, 0.68, 5.23, 0.7, 1.3, 0.46, -0.02, 0.91, 0.87, 1.29, 0.57, 1.14, 1.13, 0.8, 0.87, 1.04, 0.36, 1.55, 1.16, 0.24, 0.68, 0.91, 0.59, 2.06, 2.97, 10.43, 1.81, 2.69, 1.51, 5.51, 4.91, 2.0, 1.07, 0.63, 0.56, 1.51, 0.71, 1.58, 2.19, 3.53]} \ No newline at end of file diff --git a/annotations_1/9z8uqVHf39M_filtered.json b/annotations_1/9z8uqVHf39M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5db7fa8a606972f94ccd5b97927c38c5d15404ff --- /dev/null +++ b/annotations_1/9z8uqVHf39M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [4.0, 5.86], [7.0, 7.01], [35.0, 35.16], [56.0, 60.3], [83.0, 88.13], [92.0, 93.51], [95.0, 95.37], [98.0, 99.6], [100.0, 101.24], [105.0, 105.61], [126.0, 126.82], [135.0, 135.23], [135.0, 139.51], [140.0, 140.59], [142.0, 143.31], [146.0, 146.91]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.27, 33.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.9, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 29.85], ["music", 23.61], ["throbbing", 3.97]], [["hum", 34.2], ["throbbing", 27.11], ["speech", 17.17]], null, null, null, null, null, null, null, [["hum", 36.46], ["throbbing", 22.85], ["mains hum", 16.97]], null, null, null], "duration": [0.66, 1.86, 0.01, 0.16, 4.3, 5.13, 1.51, 0.37, 1.6, 1.24, 0.61, 0.82, 0.23, 4.51, 0.59, 1.31, 0.91]} \ No newline at end of file diff --git a/annotations_1/9zZLmOA4OsA_filtered.json b/annotations_1/9zZLmOA4OsA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2184db22620c0228e1ea87645f75a020208a9af4 --- /dev/null +++ b/annotations_1/9zZLmOA4OsA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [10.0, 11.01], [18.0, 18.54], [19.0, 18.99], [22.0, 23.9], [26.0, 27.68], [29.0, 32.32], [33.0, 36.91], [60.0, 60.13], [61.0, 61.45], [63.0, 63.8], [65.0, 65.13], [67.0, 67.61], [71.0, 71.41], [72.0, 73.6], [74.0, 73.67], [75.0, 77.68], [78.0, 80.54], [83.0, 83.69], [86.0, 87.0], [87.0, 88.05], [90.0, 93.6], [94.0, 105.53], [108.0, 111.52], [113.0, 119.06], [120.0, 121.42], [123.0, 124.36], [126.0, 126.86], [128.0, 129.03], [133.0, 134.23], [136.0, 137.47], [141.0, 154.7], [156.0, 191.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 34.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.85, 34.29, 0.0, 0.0, 0.0, 56.55, 95.51, 99.56, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 72.99], ["wild animals", 2.06], ["animal", 2.06]], null, null, null, null, null, null, null, null, [["speech", 45.21], ["music", 8.86], ["didgeridoo", 8.63]], [["grunt", 18.68], ["music", 16.59], ["didgeridoo", 10.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.42, 1.01, 0.54, -0.01, 1.9, 1.68, 3.32, 3.91, 0.13, 0.45, 0.8, 0.13, 0.61, 0.41, 1.6, -0.33, 2.68, 2.54, 0.69, 1.0, 1.05, 3.6, 11.53, 3.52, 6.06, 1.42, 1.36, 0.86, 1.03, 1.23, 1.47, 13.7, 35.69]} \ No newline at end of file diff --git a/annotations_1/9zbF578--dE_filtered.json b/annotations_1/9zbF578--dE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3a935be759afb07a587c820950f755e2f8e8099 --- /dev/null +++ b/annotations_1/9zbF578--dE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [5.0, 5.59], [8.0, 11.94], [14.0, 23.62], [24.0, 27.01], [32.0, 32.41], [39.0, 40.54], [42.0, 43.9], [46.0, 48.98], [50.0, 51.06], [53.0, 53.5], [55.0, 56.71], [59.0, 60.22], [67.0, 67.36], [69.0, 72.05], [75.0, 76.32], [78.0, 78.93], [80.0, 80.54], [81.0, 82.81], [88.0, 89.61], [92.0, 92.58], [100.0, 101.01], [101.0, 101.22], [104.0, 108.53], [109.0, 108.57], [114.0, 114.0], [117.0, 117.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 74.13, 40.79, 36.42, 0.0, 0.0, 0.0, 77.36, 0.0, 0.0, 0.0, 0.0, 0.0, 46.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.14, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 57.06], ["speech", 22.8], ["sidetone", 4.19]], [["music", 52.28], ["hiccup", 12.52], ["zipper (clothing)", 7.96]], null, null, null, null, null, null, null, null, null, [["music", 76.27], ["speech", 4.83], ["electronic music", 2.47]], null, null, null, null, null, null, null, null, [["music", 48.68], ["sidetone", 24.72], ["speech", 17.03]], null, null, null], "duration": [0.51, 0.59, 3.94, 9.62, 3.01, 0.41, 1.54, 1.9, 2.98, 1.06, 0.5, 1.71, 1.22, 0.36, 3.05, 1.32, 0.93, 0.54, 1.81, 1.61, 0.58, 1.01, 0.22, 4.53, -0.43, 0.0, 0.48]} \ No newline at end of file diff --git a/annotations_1/A-Ckh0slywY_filtered.json b/annotations_1/A-Ckh0slywY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34d0a2d8446664fb93f14b03b71cfeddc5457d1e --- /dev/null +++ b/annotations_1/A-Ckh0slywY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 59.83], [60.0, 76.47], [77.0, 107.23], [109.0, 112.87], [114.0, 114.25], [114.0, 153.84], [155.0, 173.33], [175.0, 180.4]], "keep_status": [false, true, false, true, false, false, false, false], "silence_prob": [0.0, 29.07, 0.0, 29.12, 0.0, 0.0, 67.63, 58.13], "audiomae_on_audioset": [null, [["music", 32.21], ["didgeridoo", 8.99], ["sound effect", 4.49]], null, [["music", 29.41], ["electronic music", 13.54], ["helicopter", 12.93]], null, null, null, null], "duration": [-0.17, 16.47, 30.23, 3.87, 0.25, 39.84, 18.33, 5.4]} \ No newline at end of file diff --git a/annotations_1/A-rs-kWL5-s_filtered.json b/annotations_1/A-rs-kWL5-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47067fea308cd2388be2fe5b5fe649b30c626fda --- /dev/null +++ b/annotations_1/A-rs-kWL5-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.67], [16.0, 19.23], [21.0, 22.2], [27.0, 33.12], [34.0, 34.84], [37.0, 41.13], [42.0, 43.44], [51.0, 51.7], [55.0, 55.85], [57.0, 57.92], [59.0, 60.05], [61.0, 66.28], [69.0, 69.4], [71.0, 72.05], [73.0, 74.07], [76.0, 76.28], [77.0, 78.83], [80.0, 81.84], [89.0, 89.92], [91.0, 92.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.83, 0.0, 96.77, 0.0, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 88.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 3.23, 1.2, 6.12, 0.84, 4.13, 1.44, 0.7, 0.85, 0.92, 1.05, 5.28, 0.4, 1.05, 1.07, 0.28, 1.83, 1.84, 0.92, 1.69]} \ No newline at end of file diff --git a/annotations_1/A0FwoprE1cQ_filtered.json b/annotations_1/A0FwoprE1cQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a9bfdda45fa8b6b943e019f6e94a6e5ef9ee5e0 --- /dev/null +++ b/annotations_1/A0FwoprE1cQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.19], [5.0, 6.02], [14.0, 15.33], [17.0, 17.09], [18.0, 19.99], [21.0, 26.15], [33.0, 33.67], [37.0, 38.47], [40.0, 42.15], [43.0, 43.75], [45.0, 46.47], [56.0, 57.03], [63.0, 64.47], [71.0, 72.06], [73.0, 74.34], [77.0, 77.92], [82.0, 84.54], [86.0, 86.91], [93.0, 94.07], [97.0, 96.9], [99.0, 99.66], [112.0, 114.67], [125.0, 125.02], [132.0, 132.53], [134.0, 134.94], [141.0, 142.06], [147.0, 147.93], [151.0, 154.65], [157.0, 157.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 0.0, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.45, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 1.02, 1.33, 0.09, 1.99, 5.15, 0.67, 1.47, 2.15, 0.75, 1.47, 1.03, 1.47, 1.06, 1.34, 0.92, 2.54, 0.91, 1.07, -0.1, 0.66, 2.67, 0.02, 0.53, 0.94, 1.06, 0.93, 3.65, 0.44]} \ No newline at end of file diff --git a/annotations_1/A1-XFXX8rU4_filtered.json b/annotations_1/A1-XFXX8rU4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..942802e0af26b6032b7997e772fca61c5e803ad4 --- /dev/null +++ b/annotations_1/A1-XFXX8rU4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.74], [5.0, 7.43], [8.0, 10.76], [14.0, 15.94], [17.0, 21.71], [24.0, 25.22], [30.0, 30.35], [44.0, 44.32], [48.0, 49.84], [54.0, 58.31], [63.0, 63.51], [64.0, 64.44], [70.0, 71.46], [74.0, 82.43], [84.0, 85.8], [96.0, 101.68], [104.0, 104.94], [110.0, 114.89], [118.0, 120.07], [123.0, 123.38], [131.0, 131.16], [136.0, 137.15], [141.0, 142.43], [144.0, 145.3], [149.0, 149.4], [151.0, 158.33], [160.0, 159.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 67.13, 84.07, 0.0, 78.89, 0.0, 0.0, 0.0, 0.0, 89.54, 0.0, 0.0, 0.0, 53.53, 0.0, 47.74, 0.0, 63.64, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.28], ["theremin", 17.2], ["violin, fiddle", 11.08]], null, null, null, null, null, null, null, null, null, [["music", 43.35], ["musical instrument", 9.16], ["violin, fiddle", 8.13]], null], "duration": [1.74, 2.43, 2.76, 1.94, 4.71, 1.22, 0.35, 0.32, 1.84, 4.31, 0.51, 0.44, 1.46, 8.43, 1.8, 5.68, 0.94, 4.89, 2.07, 0.38, 0.16, 1.15, 1.43, 1.3, 0.4, 7.33, -0.15]} \ No newline at end of file diff --git a/annotations_1/A1GJyyJzpCo_filtered.json b/annotations_1/A1GJyyJzpCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64bfeeab1d8857202efd1652305a33726304d885 --- /dev/null +++ b/annotations_1/A1GJyyJzpCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.73], [13.0, 13.15], [21.0, 21.88], [25.0, 28.31], [33.0, 35.85], [37.0, 38.35], [40.0, 40.95], [44.0, 45.45], [47.0, 49.2], [52.0, 52.14], [53.0, 53.97], [55.0, 54.84], [56.0, 57.28], [58.0, 59.68], [65.0, 69.3], [91.0, 91.52], [96.0, 97.98], [100.0, 102.22], [112.0, 116.18], [122.0, 123.09], [135.0, 136.31], [138.0, 138.25], [143.0, 154.7]], "keep_status": [false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.78, 35.26, 0.0, 0.0, 0.0, 39.21, 0.0, 0.0, 0.0, 0.0, 0.0, 35.8, 0.0, 0.0, 44.07, 48.44, 0.0, 0.0, 0.0, 28.73], "audiomae_on_audioset": [null, null, null, [["speech", 28.86], ["hum", 11.77], ["whack, thwack", 11.45]], [["music", 27.77], ["percussion", 9.42], ["speech", 6.74]], null, null, null, [["speech", 15.17], ["grunt", 11.35], ["fart", 8.22]], null, null, null, null, null, [["insect", 36.04], ["fly, housefly", 32.35], ["fart", 11.22]], null, null, [["music", 35.28], ["chirp tone", 9.54], ["effects unit", 5.92]], [["music", 57.45], ["synthesizer", 8.41], ["hum", 4.19]], null, null, null, [["throbbing", 59.94], ["music", 23.31], ["hum", 7.81]]], "duration": [1.73, 0.15, 0.88, 3.31, 2.85, 1.35, 0.95, 1.45, 2.2, 0.14, 0.97, -0.16, 1.28, 1.68, 4.3, 0.52, 1.98, 2.22, 4.18, 1.09, 1.31, 0.25, 11.7]} \ No newline at end of file diff --git a/annotations_1/A2yqIm58ULo_filtered.json b/annotations_1/A2yqIm58ULo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82249fefcc51ae0b47d53d08e422429948c0286c --- /dev/null +++ b/annotations_1/A2yqIm58ULo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.08], [6.0, 6.83], [10.0, 10.81], [12.0, 12.88], [16.0, 16.85], [18.0, 18.32], [21.0, 22.54], [23.0, 24.33], [25.0, 25.37], [26.0, 26.45], [28.0, 29.51], [32.0, 32.7], [34.0, 34.92], [39.0, 40.85], [42.0, 43.04], [44.0, 45.6], [48.0, 49.35], [54.0, 56.74], [57.0, 58.14], [62.0, 63.12], [66.0, 66.95], [70.0, 70.65], [74.0, 74.24], [78.0, 78.75], [79.0, 79.59], [80.0, 82.97], [85.0, 86.34], [88.0, 90.75], [94.0, 97.8], [99.0, 100.58], [103.0, 103.2], [104.0, 108.06], [111.0, 112.08], [128.0, 127.9], [135.0, 136.73], [142.0, 142.92], [145.0, 146.79], [150.0, 150.2], [151.0, 151.51], [152.0, 153.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 0.0, 68.93, 99.82, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.08, 0.83, 0.81, 0.88, 0.85, 0.32, 1.54, 1.33, 0.37, 0.45, 1.51, 0.7, 0.92, 1.85, 1.04, 1.6, 1.35, 2.74, 1.14, 1.12, 0.95, 0.65, 0.24, 0.75, 0.59, 2.97, 1.34, 2.75, 3.8, 1.58, 0.2, 4.06, 1.08, -0.1, 1.73, 0.92, 1.79, 0.2, 0.51, 1.28]} \ No newline at end of file diff --git a/annotations_1/A3Vm7zSOm7M_filtered.json b/annotations_1/A3Vm7zSOm7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a5d6c50af8c385e4aa57c7e6abfc825676c882e --- /dev/null +++ b/annotations_1/A3Vm7zSOm7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [4.0, 5.02], [6.0, 7.01], [10.0, 15.74], [19.0, 21.76], [22.0, 27.31], [29.0, 39.75], [41.0, 40.71], [41.0, 55.66], [59.0, 60.13], [61.0, 68.42], [70.0, 70.34], [71.0, 72.67], [75.0, 85.21], [88.0, 90.27], [92.0, 92.58], [95.0, 96.43], [97.0, 97.87], [99.0, 109.85], [112.0, 113.88], [121.0, 130.69], [131.0, 135.78], [151.0, 150.77], [156.0, 156.74], [161.0, 161.82]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 41.48, 86.64, 38.71, 71.43, 0.0, 75.72, 0.0, 99.98, 0.0, 0.0, 33.98, 60.42, 0.0, 0.0, 0.0, 63.53, 0.0, 91.64, 35.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 40.32], ["rowboat, canoe, kayak", 21.09], ["boat, water vehicle", 6.49]], null, [["speech", 70.11], ["beatboxing", 13.34], ["fart", 1.58]], null, null, null, null, null, null, null, [["speech", 58.58], ["fart", 5.3], ["animal", 4.45]], null, null, null, null, null, null, null, [["music", 43.92], ["keyboard (musical)", 13.09], ["piano", 9.31]], null, null, null], "duration": [0.5, 1.02, 1.01, 5.74, 2.76, 5.31, 10.75, -0.29, 14.66, 1.13, 7.42, 0.34, 1.67, 10.21, 2.27, 0.58, 1.43, 0.87, 10.85, 1.88, 9.69, 4.78, -0.23, 0.74, 0.82]} \ No newline at end of file diff --git a/annotations_1/A5CndWt2xrY_filtered.json b/annotations_1/A5CndWt2xrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61576e7205af80ad7d647ef9ad4647776681bbaf --- /dev/null +++ b/annotations_1/A5CndWt2xrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.91], [9.0, 12.88], [15.0, 21.9], [33.0, 34.4], [38.0, 38.35], [39.0, 41.91], [42.0, 43.01], [49.0, 50.21], [52.0, 53.47], [55.0, 55.26], [56.0, 56.59], [63.0, 63.34], [64.0, 67.34], [68.0, 68.82], [70.0, 71.91]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 58.22, 29.99, 0.0, 0.0, 36.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 65.35], ["music", 16.23], ["sidetone", 2.65]], null, null, [["music", 27.04], ["speech", 17.11], ["caw", 5.89]], null, null, null, null, null, null, null, null, null], "duration": [0.91, 3.88, 6.9, 1.4, 0.35, 2.91, 1.01, 1.21, 1.47, 0.26, 0.59, 0.34, 3.34, 0.82, 1.91]} \ No newline at end of file diff --git a/annotations_1/A6PpUgfZcRU_filtered.json b/annotations_1/A6PpUgfZcRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97bb0912b1fdf29db345db4b5062770a09abb53b --- /dev/null +++ b/annotations_1/A6PpUgfZcRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 37.37], [44.0, 44.41], [45.0, 74.36], [76.0, 85.65], [88.0, 90.78], [95.0, 95.5], [96.0, 102.14], [103.0, 104.82], [108.0, 112.63], [116.0, 133.95]], "keep_status": [false, false, false, true, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 28.39, 30.58, 30.03, 0.0, 31.01, 0.0, 28.09, 28.09], "audiomae_on_audioset": [null, null, [["music", 64.22], ["smash, crash", 5.45], ["breaking", 4.09]], [["hum", 31.08], ["mains hum", 19.44], ["rumble", 10.03]], [["mains hum", 39.06], ["hum", 37.6], ["music", 3.97]], null, [["music", 32.89], ["static", 16.03], ["buzz", 9.26]], null, [["music", 27.1], ["noise", 15.31], ["rumble", 12.4]], [["music", 13.05], ["cacophony", 12.72], ["buzz", 8.2]]], "duration": [36.37, 0.41, 29.36, 9.65, 2.78, 0.5, 6.14, 1.82, 4.63, 17.95]} \ No newline at end of file diff --git a/annotations_1/A6d0qIZY3Hg_filtered.json b/annotations_1/A6d0qIZY3Hg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7810e663a454c86b4c31c48f07ebc56cfe437967 --- /dev/null +++ b/annotations_1/A6d0qIZY3Hg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [4.0, 4.29], [6.0, 7.3], [9.0, 10.34], [14.0, 15.96], [18.0, 19.23], [19.0, 19.77], [21.0, 25.17], [32.0, 49.2], [50.0, 58.55], [59.0, 63.22], [65.0, 65.85], [66.0, 67.74], [72.0, 72.12], [76.0, 98.2], [99.0, 102.51], [119.0, 119.03], [122.0, 122.79], [129.0, 135.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.03, 31.28, 31.12, 30.43, 0.0, 0.0, 0.0, 32.79, 31.16, 0.0, 0.0, 30.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 66.53], ["throbbing", 16.04], ["hum", 2.09]], [["speech", 43.45], ["music", 40.39], ["whack, thwack", 2.29]], [["music", 45.41], ["speech", 27.07], ["explosion", 3.14]], [["music", 42.85], ["speech", 37.19], ["explosion", 3.1]], null, null, null, [["boing", 53.45], ["music", 15.74], ["cowbell", 7.33]], [["music", 40.77], ["throbbing", 17.65], ["speech", 5.11]], null, null, [["music", 37.46], ["speech", 28.16], ["throbbing", 4.5]]], "duration": [0.5, 0.29, 1.3, 1.34, 1.96, 1.23, 0.77, 4.17, 17.2, 8.55, 4.22, 0.85, 1.74, 0.12, 22.2, 3.51, 0.03, 0.79, 6.09]} \ No newline at end of file diff --git a/annotations_1/A6oAEu3DbKk_filtered.json b/annotations_1/A6oAEu3DbKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d79f9775b08748fb416ffa03118bd7ba6a733a84 --- /dev/null +++ b/annotations_1/A6oAEu3DbKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.57], [9.0, 52.95], [61.0, 92.72], [94.0, 95.49], [97.0, 97.06], [100.0, 103.81], [104.0, 109.05], [111.0, 167.27], [168.0, 168.52], [169.0, 170.7], [172.0, 175.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.23, 30.55, 0.0, 0.0, 0.0, 39.67], "audiomae_on_audioset": [null, null, null, null, null, [["music", 61.17], ["cattle, bovinae", 8.52], ["moo", 5.96]], [["music", 36.79], ["throbbing", 20.37], ["hum", 13.81]], null, null, null, [["speech", 45.73], ["electric shaver, electric razor", 14.09], ["music", 6.7]]], "duration": [0.57, 43.95, 31.72, 1.49, 0.06, 3.81, 5.05, 56.27, 0.52, 1.7, 3.73]} \ No newline at end of file diff --git a/annotations_1/A7HmqwyZ3oA_filtered.json b/annotations_1/A7HmqwyZ3oA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d97c068d7bc57c6d28c366717940722296f5f30 --- /dev/null +++ b/annotations_1/A7HmqwyZ3oA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.37], [23.0, 22.6], [23.0, 23.55], [24.0, 63.88], [66.0, 84.67], [87.0, 99.18], [100.0, 106.88], [108.0, 118.22], [122.0, 144.59]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 28.06, 28.08, 28.21, 28.18, 33.24], "audiomae_on_audioset": [null, null, null, null, [["music", 51.38], ["electronic music", 14.12], ["throbbing", 8.82]], [["music", 89.58], ["throbbing", 2.28], ["electronic music", 1.66]], [["music", 57.39], ["cacophony", 7.14], ["throbbing", 5.96]], [["music", 70.5], ["echo", 3.33], ["throbbing", 3.31]], [["music", 80.65], ["scary music", 5.02], ["ambient music", 3.49]]], "duration": [0.37, -0.4, 0.55, 39.88, 18.67, 12.18, 6.88, 10.22, 22.59]} \ No newline at end of file diff --git a/annotations_1/A7gKFleV_JU_filtered.json b/annotations_1/A7gKFleV_JU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5644ef9c8d579d0543d94e7379272969288b4d80 --- /dev/null +++ b/annotations_1/A7gKFleV_JU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.41], [7.0, 10.94], [13.0, 13.1], [14.0, 15.31], [19.0, 19.04], [22.0, 23.19], [25.0, 25.25], [28.0, 28.68], [29.0, 29.73], [30.0, 31.5], [38.0, 37.86], [39.0, 40.14], [41.0, 42.15], [43.0, 44.36], [47.0, 46.94], [48.0, 48.17], [49.0, 53.42], [56.0, 56.57], [57.0, 58.77], [63.0, 64.39], [68.0, 68.22], [71.0, 70.95], [73.0, 73.41], [75.0, 75.54], [77.0, 77.94], [80.0, 80.13], [83.0, 84.15], [86.0, 86.22], [88.0, 88.8], [92.0, 92.08], [94.0, 95.5], [98.0, 111.1], [116.0, 117.02], [120.0, 132.43], [134.0, 133.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.57, 0.0, 31.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 59.52], ["music", 20.6], ["wind instrument, woodwind instrument", 4.63]], null, [["music", 60.17], ["theremin", 22.86], ["musical instrument", 4.06]], null], "duration": [0.41, 3.94, 0.1, 1.31, 0.04, 1.19, 0.25, 0.68, 0.73, 1.5, -0.14, 1.14, 1.15, 1.36, -0.06, 0.17, 4.42, 0.57, 1.77, 1.39, 0.22, -0.05, 0.41, 0.54, 0.94, 0.13, 1.15, 0.22, 0.8, 0.08, 1.5, 13.1, 1.02, 12.43, -0.11]} \ No newline at end of file diff --git a/annotations_1/A7mWnsrRu6w_filtered.json b/annotations_1/A7mWnsrRu6w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03dac4b90578ee324293dd839e8f0687f6c5ae4c --- /dev/null +++ b/annotations_1/A7mWnsrRu6w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.5], [20.0, 20.82], [26.0, 29.25], [32.0, 38.43], [41.0, 42.33], [44.0, 70.11], [72.0, 74.93], [77.0, 82.75], [85.0, 87.78], [91.0, 92.82], [93.0, 120.51], [121.0, 125.51], [130.0, 137.29], [139.0, 145.32], [149.0, 149.67], [155.0, 166.53], [169.0, 174.34], [177.0, 180.74], [189.0, 189.65], [191.0, 192.4], [195.0, 198.07], [207.0, 208.85], [209.0, 213.97], [217.0, 217.38], [218.0, 219.03], [220.0, 221.54], [222.0, 222.39], [223.0, 225.96], [227.0, 235.09], [238.0, 240.6]], "keep_status": [false, false, true, true, false, false, true, true, false, false, true, true, true, false, false, true, true, true, false, false, true, false, true, false, false, false, false, true, true, true], "silence_prob": [31.34, 0.0, 31.49, 30.9, 0.0, 31.54, 32.36, 32.73, 32.18, 0.0, 32.56, 32.76, 37.45, 31.42, 0.0, 32.82, 32.4, 31.91, 0.0, 0.0, 31.0, 0.0, 30.74, 0.0, 0.0, 0.0, 0.0, 36.02, 32.03, 35.22], "audiomae_on_audioset": [[["music", 36.38], ["throbbing", 29.46], ["hum", 13.37]], null, [["music", 43.32], ["boing", 7.18], ["hum", 4.29]], [["music", 49.35], ["synthesizer", 4.78], ["smash, crash", 3.98]], null, [["fly, housefly", 45.48], ["music", 17.25], ["insect", 16.95]], [["music", 28.36], ["electronic music", 8.75], ["dubstep", 5.77]], [["music", 22.12], ["cattle, bovinae", 18.03], ["moo", 11.11]], [["speech", 51.31], ["theremin", 15.11], ["synthesizer", 5.63]], null, [["speech", 28.55], ["fly, housefly", 25.34], ["insect", 10.19]], [["fly, housefly", 46.72], ["insect", 11.11], ["fart", 10.12]], [["speech", 23.55], ["music", 21.21], ["foghorn", 20.07]], [["speech", 30.27], ["music", 28.71], ["hum", 16.04]], null, [["music", 35.53], ["throbbing", 19.85], ["hum", 8.57]], [["music", 29.15], ["speech", 20.91], ["throbbing", 5.97]], [["throbbing", 34.31], ["music", 17.83], ["speech", 9.54]], null, null, [["eruption", 11.56], ["boing", 6.14], ["music", 5.99]], null, [["noise", 10.5], ["cattle, bovinae", 9.5], ["livestock, farm animals, working animals", 9.15]], null, null, null, null, [["fly, housefly", 10.21], ["mosquito", 9.96], ["insect", 7.69]], [["fly, housefly", 19.14], ["mosquito", 12.83], ["speech", 11.73]], [["music", 48.34], ["speech", 7.32], ["electronic music", 2.52]]], "duration": [4.5, 0.82, 3.25, 6.43, 1.33, 26.11, 2.93, 5.75, 2.78, 1.82, 27.51, 4.51, 7.29, 6.32, 0.67, 11.53, 5.34, 3.74, 0.65, 1.4, 3.07, 1.85, 4.97, 0.38, 1.03, 1.54, 0.39, 2.96, 8.09, 2.6]} \ No newline at end of file diff --git a/annotations_1/A83gS4JJXXE_filtered.json b/annotations_1/A83gS4JJXXE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a403bf291a7618b37c720e80098a3ae2a1a0e7c8 --- /dev/null +++ b/annotations_1/A83gS4JJXXE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [4.0, 4.67], [6.0, 8.06], [9.0, 9.73], [13.0, 14.08], [16.0, 18.0], [20.0, 20.56], [22.0, 23.79], [25.0, 26.54], [27.0, 28.98], [30.0, 31.41], [33.0, 33.98], [35.0, 35.75], [37.0, 39.9], [41.0, 42.55], [45.0, 45.4], [48.0, 52.95], [53.0, 59.1], [59.0, 82.44], [84.0, 88.55], [89.0, 90.56], [92.0, 93.48], [97.0, 98.25], [100.0, 101.12], [102.0, 115.37], [123.0, 123.26], [126.0, 126.64], [127.0, 127.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.95, 99.68, 68.67, 71.0, 0.0, 0.0, 0.0, 0.0, 42.96, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.99], ["music", 18.48], ["thunk", 8.07]], null, null, null], "duration": [1.3, 0.67, 2.06, 0.73, 1.08, 2.0, 0.56, 1.79, 1.54, 1.98, 1.41, 0.98, 0.75, 2.9, 1.55, 0.4, 4.95, 6.1, 23.44, 4.55, 1.56, 1.48, 1.25, 1.12, 13.37, 0.26, 0.64, 0.82]} \ No newline at end of file diff --git a/annotations_1/A8BfSnbFxj4_filtered.json b/annotations_1/A8BfSnbFxj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db78905cbc29f80702c9c9b036a9f251cccc680a --- /dev/null +++ b/annotations_1/A8BfSnbFxj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 22.25], [23.0, 25.2], [26.0, 30.65], [33.0, 34.74], [36.0, 52.22], [54.0, 55.44], [56.0, 82.0], [85.0, 106.98], [109.0, 121.24], [131.0, 134.25], [135.0, 141.47], [145.0, 158.45]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [66.03, 100.0, 75.39, 0.0, 100.0, 0.0, 57.17, 58.13, 83.16, 33.55, 34.67, 33.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 38.95], ["didgeridoo", 21.49], ["wind instrument, woodwind instrument", 6.37]], [["music", 40.61], ["didgeridoo", 15.5], ["sidetone", 7.94]], [["speech", 34.58], ["music", 22.2], ["didgeridoo", 12.12]]], "duration": [2.25, 2.2, 4.65, 1.74, 16.22, 1.44, 26.0, 21.98, 12.24, 3.25, 6.47, 13.45]} \ No newline at end of file diff --git a/annotations_1/A8xy9h5olhQ_filtered.json b/annotations_1/A8xy9h5olhQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e20b970fb14833a85ba0458a9debd7c8e670ae1f --- /dev/null +++ b/annotations_1/A8xy9h5olhQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 49.03], [50.0, 69.57], [78.0, 78.98], [83.0, 101.68], [103.0, 103.62], [105.0, 105.71], [107.0, 108.08], [111.0, 112.11], [113.0, 113.1], [114.0, 115.37], [116.0, 143.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.9, 0.0, 31.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.37], "audiomae_on_audioset": [null, [["music", 57.71], ["hum", 9.03], ["throbbing", 6.2]], null, [["music", 77.57], ["musical instrument", 3.92], ["guitar", 2.74]], null, null, null, null, null, null, [["music", 60.35], ["speech", 13.61], ["hum", 2.78]]], "duration": [48.03, 19.57, 0.98, 18.68, 0.62, 0.71, 1.08, 1.11, 0.1, 1.37, 27.68]} \ No newline at end of file diff --git a/annotations_1/A949a8j5Boo_filtered.json b/annotations_1/A949a8j5Boo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4af6e60f42e0ae1334012e094c7964d930fc272 --- /dev/null +++ b/annotations_1/A949a8j5Boo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.32], [11.0, 11.52], [12.0, 13.86], [16.0, 29.79], [31.0, 34.42], [36.0, 42.21], [43.0, 43.02], [43.0, 43.06], [46.0, 46.65], [47.0, 48.76], [49.0, 51.73], [53.0, 57.82], [59.0, 77.25], [78.0, 79.35], [80.0, 82.49], [83.0, 87.1]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, true, true, false, true, true], "silence_prob": [32.94, 0.0, 0.0, 34.21, 92.97, 44.29, 0.0, 0.0, 0.0, 0.0, 80.82, 35.07, 37.91, 0.0, 38.16, 35.18], "audiomae_on_audioset": [[["throbbing", 32.59], ["music", 22.34], ["hum", 21.42]], null, null, [["music", 31.5], ["cat", 13.43], ["didgeridoo", 8.71]], null, [["fly, housefly", 22.85], ["sidetone", 19.48], ["frog", 11.08]], null, null, null, null, null, [["noise", 47.7], ["sidetone", 13.65], ["whale vocalization", 5.76]], [["animal", 16.2], ["cat", 10.3], ["roaring cats (lions, tigers)", 9.37]], null, [["hum", 28.42], ["music", 28.36], ["noise", 8.92]], [["music", 36.26], ["speech", 13.92], ["synthesizer", 10.34]]], "duration": [5.32, 0.52, 1.86, 13.79, 3.42, 6.21, 0.02, 0.06, 0.65, 1.76, 2.73, 4.82, 18.25, 1.35, 2.49, 4.1]} \ No newline at end of file diff --git a/annotations_1/A9QknjLLso4_filtered.json b/annotations_1/A9QknjLLso4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0c15753fc922993592a4eb8c81090ecb5244ae4 --- /dev/null +++ b/annotations_1/A9QknjLLso4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.06], [8.0, 64.27], [65.0, 75.66]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 63.85], "audiomae_on_audioset": [null, null, null], "duration": [1.06, 56.27, 10.66]} \ No newline at end of file diff --git a/annotations_1/A9sd10CHAP8_filtered.json b/annotations_1/A9sd10CHAP8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a116c3040591a7cee1513730bd301fc45a099f31 --- /dev/null +++ b/annotations_1/A9sd10CHAP8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.66], [8.0, 8.56], [18.0, 23.95], [31.0, 33.27], [36.0, 37.49], [42.0, 42.45], [44.0, 43.83], [46.0, 46.18], [49.0, 49.27], [51.0, 50.72], [56.0, 55.66], [60.0, 60.67], [64.0, 65.77], [68.0, 69.87], [70.0, 70.17], [73.0, 77.95], [78.0, 78.17], [104.0, 105.63], [106.0, 105.66], [106.0, 108.67]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.12, 39.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.2, 0.0, 0.0, 0.0, 36.02], "audiomae_on_audioset": [null, null, [["music", 47.75], ["throbbing", 17.21], ["hum", 15.32]], [["chant", 20.81], ["choir", 20.56], ["singing", 11.8]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 50.17], ["fart", 28.37], ["zipper (clothing)", 2.06]], null, null, null, [["cattle, bovinae", 51.1], ["moo", 32.7], ["livestock, farm animals, working animals", 15.99]]], "duration": [0.66, 0.56, 5.95, 2.27, 1.49, 0.45, -0.17, 0.18, 0.27, -0.28, -0.34, 0.67, 1.77, 1.87, 0.17, 4.95, 0.17, 1.63, -0.34, 2.67]} \ No newline at end of file diff --git a/annotations_1/AAByjopE2GE_filtered.json b/annotations_1/AAByjopE2GE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef3e1bc6d0967ef557ce3c9a24e13398025a31f1 --- /dev/null +++ b/annotations_1/AAByjopE2GE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.25], [19.0, 19.03], [31.0, 31.8], [44.0, 49.44], [50.0, 62.75], [64.0, 66.53], [67.0, 90.12], [92.0, 102.36]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.03, 33.82, 57.09, 34.19, 33.15], "audiomae_on_audioset": [null, null, null, [["music", 65.65], ["speech", 5.54], ["ding", 3.58]], [["music", 49.19], ["speech", 17.23], ["drum machine", 2.9]], null, [["music", 69.32], ["drum machine", 6.07], ["speech", 5.33]], [["music", 54.96], ["speech", 17.45], ["musical instrument", 3.55]]], "duration": [1.25, 0.03, 0.8, 5.44, 12.75, 2.53, 23.12, 10.36]} \ No newline at end of file diff --git a/annotations_1/AALREbJZEZk_filtered.json b/annotations_1/AALREbJZEZk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb11d97c30c43ef41b5f6bcc5b8287f131b60b41 --- /dev/null +++ b/annotations_1/AALREbJZEZk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.6], [8.0, 8.46], [13.0, 13.86], [15.0, 16.04], [17.0, 18.47], [25.0, 26.2], [27.0, 28.43], [34.0, 34.25], [36.0, 36.49], [38.0, 39.99], [44.0, 45.37], [52.0, 54.51], [62.0, 61.74], [68.0, 72.2], [80.0, 81.5], [91.0, 91.02], [92.0, 92.92], [106.0, 106.27], [110.0, 115.72], [120.0, 120.92], [151.0, 151.88], [157.0, 169.08], [171.0, 171.63], [172.0, 173.8], [179.0, 179.39], [182.0, 183.46], [190.0, 190.7], [192.0, 193.04], [197.0, 200.5], [206.0, 206.79], [208.0, 211.77], [215.0, 214.95], [215.0, 215.05], [216.0, 218.59], [237.0, 241.95], [244.0, 252.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.4, 0.0, 33.03, 0.0, 0.0, 0.0, 0.0, 33.09, 0.0, 0.0, 32.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.83, 0.0, 32.34, 0.0, 0.0, 30.95, 30.43, 30.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 45.16], ["sampler", 6.3], ["synthesizer", 5.48]], null, [["music", 73.75], ["throbbing", 6.25], ["sidetone", 2.84]], null, null, null, null, [["music", 56.08], ["speech", 15.44], ["sidetone", 6.2]], null, null, [["music", 60.37], ["brass instrument", 10.89], ["didgeridoo", 4.7]], null, null, null, null, null, null, [["music", 63.59], ["musical instrument", 6.75], ["foghorn", 6.11]], null, [["music", 84.26], ["synthesizer", 3.4], ["musical instrument", 2.6]], null, null, [["music", 52.4], ["synthesizer", 8.19], ["musical instrument", 4.16]], [["music", 57.96], ["musical instrument", 5.22], ["brass instrument", 3.81]], [["music", 46.18], ["trombone", 17.92], ["brass instrument", 9.65]]], "duration": [1.6, 0.46, 0.86, 1.04, 1.47, 1.2, 1.43, 0.25, 0.49, 1.99, 1.37, 2.51, -0.26, 4.2, 1.5, 0.02, 0.92, 0.27, 5.72, 0.92, 0.88, 12.08, 0.63, 1.8, 0.39, 1.46, 0.7, 1.04, 3.5, 0.79, 3.77, -0.05, 0.05, 2.59, 4.95, 8.44]} \ No newline at end of file diff --git a/annotations_1/AAN85u-udis_filtered.json b/annotations_1/AAN85u-udis_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..001a1c7d87ec4a4d627ebe93049c70ab1be82ade --- /dev/null +++ b/annotations_1/AAN85u-udis_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.31], [29.0, 30.48], [35.0, 34.86], [36.0, 37.89], [46.0, 47.46], [51.0, 53.62], [68.0, 79.47], [80.0, 80.91], [81.0, 93.68], [95.0, 94.88], [105.0, 105.12], [106.0, 107.64]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 44.72, 29.7, 0.0, 30.19, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 26.84], ["didgeridoo", 16.51], ["speech", 14.54]], [["music", 58.56], ["didgeridoo", 12.28], ["throbbing", 11.76]], null, [["music", 56.26], ["throbbing", 19.8], ["hum", 8.11]], null, null, null], "duration": [0.31, 1.48, -0.14, 1.89, 1.46, 2.62, 11.47, 0.91, 12.68, -0.12, 0.12, 1.64]} \ No newline at end of file diff --git a/annotations_1/AC9URVogG3g_filtered.json b/annotations_1/AC9URVogG3g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64dce71c5abb21c7776ebf807bba65c4aa6dc0f6 --- /dev/null +++ b/annotations_1/AC9URVogG3g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 17.36], [20.0, 44.63], [48.0, 53.08], [55.0, 77.25], [78.0, 81.31], [82.0, 83.81], [85.0, 85.99], [87.0, 87.02], [87.0, 87.44], [88.0, 100.62], [102.0, 104.03], [105.0, 106.89], [109.0, 113.75], [115.0, 130.2], [130.0, 140.59]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, true, true, true], "silence_prob": [35.87, 29.37, 29.45, 29.37, 39.57, 0.0, 0.0, 0.0, 0.0, 30.5, 65.2, 0.0, 46.94, 30.22, 30.96], "audiomae_on_audioset": [[["music", 64.46], ["inside, large room or hall", 3.34], ["chirp tone", 2.59]], [["livestock, farm animals, working animals", 34.54], ["cattle, bovinae", 25.61], ["moo", 10.28]], [["music", 37.21], ["groan", 6.88], ["cacophony", 6.56]], [["music", 71.9], ["theremin", 6.27], ["throbbing", 4.58]], [["gong", 51.45], ["music", 22.54], ["ambient music", 5.18]], null, null, null, null, [["hum", 17.52], ["sound effect", 15.73], ["music", 12.41]], null, null, [["speech", 30.64], ["noise", 12.17], ["music", 9.49]], [["music", 33.47], ["speech", 18.63], ["throbbing", 17.84]], [["music", 35.85], ["throbbing", 14.56], ["synthesizer", 13.81]]], "duration": [10.36, 24.63, 5.08, 22.25, 3.31, 1.81, 0.99, 0.02, 0.44, 12.62, 2.03, 1.89, 4.75, 15.2, 10.59]} \ No newline at end of file diff --git a/annotations_1/ACcJF4BpXXU_filtered.json b/annotations_1/ACcJF4BpXXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ac37f8571d869c4fbb7b95a9864b95b509465c9 --- /dev/null +++ b/annotations_1/ACcJF4BpXXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 19.63], [20.0, 21.0], [22.0, 23.21], [24.0, 28.21], [29.0, 30.59], [31.0, 32.64], [33.0, 34.65], [36.0, 40.37], [42.0, 44.85], [46.0, 48.09], [49.0, 50.36], [51.0, 67.71], [69.0, 71.27], [73.0, 73.57], [74.0, 75.03], [80.0, 81.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 91.81, 100.0, 100.0, 0.0, 100.0, 99.96, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.63, 1.0, 1.21, 4.21, 1.59, 1.64, 1.65, 4.37, 2.85, 2.09, 1.36, 16.71, 2.27, 0.57, 1.03, 1.16]} \ No newline at end of file diff --git a/annotations_1/AD26OcrFQOY_filtered.json b/annotations_1/AD26OcrFQOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c33b96f84b0aeea2adb1eda787aff07efd18331 --- /dev/null +++ b/annotations_1/AD26OcrFQOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.74], [3.0, 4.46], [5.0, 7.35], [9.0, 10.3], [12.0, 14.37], [15.0, 15.45], [17.0, 17.02], [40.0, 40.68], [42.0, 42.55], [44.0, 45.18], [49.0, 56.44], [57.0, 59.88], [61.0, 64.45], [66.0, 69.74], [70.0, 73.38], [75.0, 74.97], [76.0, 75.86], [78.0, 83.32], [89.0, 96.42], [97.0, 96.79], [97.0, 99.08], [100.0, 101.36], [103.0, 105.76], [107.0, 108.26], [110.0, 114.91], [117.0, 125.29], [127.0, 154.21], [155.0, 155.02], [158.0, 161.54], [163.0, 164.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.66, 0.0, 98.73, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 86.45, 48.91, 95.51, 51.07, 0.0, 0.0, 84.43, 88.64, 0.0, 53.34, 0.0, 75.88, 0.0, 91.47, 88.46, 69.74, 0.0, 73.06, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.1], ["music", 6.93], ["singing bowl", 5.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.74, 1.46, 2.35, 1.3, 2.37, 0.45, 0.02, 0.68, 0.55, 1.18, 7.44, 2.88, 3.45, 3.74, 3.38, -0.03, -0.14, 5.32, 7.42, -0.21, 2.08, 1.36, 2.76, 1.26, 4.91, 8.29, 27.21, 0.02, 3.54, 1.35]} \ No newline at end of file diff --git a/annotations_1/AD3baa_nijI_filtered.json b/annotations_1/AD3baa_nijI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c820ff81caceedeb8565f3774722dac79316c812 --- /dev/null +++ b/annotations_1/AD3baa_nijI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.2], [16.0, 16.01], [26.0, 26.57], [33.0, 35.78], [39.0, 40.85], [43.0, 58.06], [64.0, 64.67], [67.0, 72.17], [84.0, 85.01], [86.0, 85.7], [87.0, 87.35], [88.0, 89.31], [91.0, 91.25], [92.0, 95.94], [97.0, 124.66], [126.0, 126.94], [129.0, 129.2], [131.0, 132.34], [133.0, 148.1], [151.0, 169.64], [178.0, 196.4]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 32.8, 0.0, 33.0, 0.0, 33.38, 0.0, 0.0, 0.0, 0.0, 0.0, 33.7, 33.03, 0.0, 0.0, 0.0, 33.43, 33.38, 33.39], "audiomae_on_audioset": [null, null, null, [["music", 62.58], ["synthesizer", 7.36], ["mains hum", 5.41]], null, [["music", 45.04], ["speech", 21.13], ["electronic music", 3.07]], null, [["boing", 43.36], ["music", 33.58], ["throbbing", 5.83]], null, null, null, null, null, [["music", 55.5], ["speech", 17.72], ["synthesizer", 2.96]], [["music", 26.27], ["livestock, farm animals, working animals", 14.94], ["bleat", 10.5]], null, null, null, [["music", 65.78], ["boing", 8.5], ["synthesizer", 2.88]], [["speech", 50.39], ["music", 31.46], ["boing", 4.66]], [["music", 45.94], ["hum", 9.27], ["throbbing", 7.6]]], "duration": [0.2, 0.01, 0.57, 2.78, 1.85, 15.06, 0.67, 5.17, 1.01, -0.3, 0.35, 1.31, 0.25, 3.94, 27.66, 0.94, 0.2, 1.34, 15.1, 18.64, 18.4]} \ No newline at end of file diff --git a/annotations_1/ADqmUtPjP0Q_filtered.json b/annotations_1/ADqmUtPjP0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9701a1224a31988b3b29018d3ff6dc414437569 --- /dev/null +++ b/annotations_1/ADqmUtPjP0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.92], [7.0, 8.48], [14.0, 27.31], [31.0, 35.21], [39.0, 40.51], [43.0, 45.1], [45.0, 46.82], [47.0, 51.41], [53.0, 56.44], [58.0, 58.38], [60.0, 59.97], [64.0, 64.29], [66.0, 67.24], [93.0, 93.95], [96.0, 97.07], [103.0, 103.71], [105.0, 106.39], [113.0, 114.18], [133.0, 133.78], [138.0, 139.24]], "keep_status": [true, false, true, true, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [28.63, 0.0, 29.32, 29.43, 0.0, 29.78, 0.0, 30.02, 30.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 49.44], ["music", 7.08], ["vehicle", 4.76]], null, [["hum", 30.2], ["music", 19.93], ["throbbing", 14.73]], [["hum", 26.26], ["mains hum", 16.3], ["throbbing", 12.35]], null, [["speech", 26.66], ["microwave oven", 11.53], ["hum", 11.32]], null, [["hum", 24.07], ["mains hum", 23.11], ["speech", 19.65]], [["music", 27.62], ["hum", 21.0], ["throbbing", 11.05]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.92, 1.48, 13.31, 4.21, 1.51, 2.1, 1.82, 4.41, 3.44, 0.38, -0.03, 0.29, 1.24, 0.95, 1.07, 0.71, 1.39, 1.18, 0.78, 1.24]} \ No newline at end of file diff --git a/annotations_1/AE4RhPMAtp0_filtered.json b/annotations_1/AE4RhPMAtp0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b72aef92ff874b8f742b008aa0b05c7e72a05623 --- /dev/null +++ b/annotations_1/AE4RhPMAtp0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.37], [12.0, 15.48], [17.0, 28.0], [33.0, 60.51], [61.0, 61.42], [63.0, 62.95], [63.0, 63.21], [66.0, 67.26], [70.0, 71.63], [74.0, 87.44], [88.0, 90.95], [92.0, 94.37], [98.0, 98.66]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [98.99, 97.43, 99.99, 50.97, 0.0, 0.0, 0.0, 0.0, 0.0, 40.73, 56.1, 82.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["animal", 19.83], ["speech", 15.53], ["grunt", 8.61]], null, null, null], "duration": [2.37, 3.48, 11.0, 27.51, 0.42, -0.05, 0.21, 1.26, 1.63, 13.44, 2.95, 2.37, 0.66]} \ No newline at end of file diff --git a/annotations_1/AEBd24_Uxfk_filtered.json b/annotations_1/AEBd24_Uxfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f270eef218e1f03258237cc5e698025a9cb00af --- /dev/null +++ b/annotations_1/AEBd24_Uxfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.56], [11.0, 12.19], [13.0, 16.6], [19.0, 19.89], [21.0, 21.96], [23.0, 24.71], [29.0, 37.22], [39.0, 61.06], [70.0, 76.87], [79.0, 85.83], [87.0, 87.52], [88.0, 103.69], [105.0, 114.72]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 52.74, 0.0, 0.0, 0.0, 52.68, 32.19, 30.77, 30.33, 0.0, 30.27, 31.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 50.0], ["speech", 11.27], ["whack, thwack", 7.46]], [["music", 31.46], ["clang", 15.32], ["hum", 10.65]], [["music", 43.9], ["speech", 35.95], ["hum", 3.71]], null, [["hum", 31.39], ["mains hum", 30.92], ["music", 14.47]], [["music", 42.09], ["ding", 11.17], ["throbbing", 10.83]]], "duration": [0.56, 1.19, 3.6, 0.89, 0.96, 1.71, 8.22, 22.06, 6.87, 6.83, 0.52, 15.69, 9.72]} \ No newline at end of file diff --git a/annotations_1/AEYh9Sh6kk8_filtered.json b/annotations_1/AEYh9Sh6kk8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1735c1d4a0ab5fbc8172e68bf4372faa62bbefe0 --- /dev/null +++ b/annotations_1/AEYh9Sh6kk8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.86], [4.0, 6.3], [7.0, 7.89], [20.0, 20.55], [21.0, 21.69], [24.0, 24.17], [25.0, 25.47], [26.0, 27.46], [31.0, 31.82], [61.0, 61.57], [62.0, 77.67], [80.0, 82.46], [86.0, 89.83], [95.0, 96.58], [102.0, 102.34], [104.0, 105.78], [107.0, 107.62], [109.0, 114.24], [118.0, 118.62], [127.0, 128.55], [129.0, 135.16]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.22, 29.92, 29.16, 0.0, 0.0, 0.0, 0.0, 32.51, 0.0, 0.0, 87.92], "audiomae_on_audioset": [null, [["speech", 26.13], ["animal", 15.94], ["domestic animals, pets", 5.48]], null, null, null, null, null, null, null, null, [["music", 67.69], ["static", 3.24], ["sampler", 2.42]], [["music", 63.31], ["synthesizer", 7.77], ["drum machine", 5.34]], [["music", 72.56], ["boing", 5.46], ["zipper (clothing)", 3.5]], null, null, null, null, [["speech", 77.88], ["music", 5.67], ["scratching (performance technique)", 5.08]], null, null, null], "duration": [0.86, 2.3, 0.89, 0.55, 0.69, 0.17, 0.47, 1.46, 0.82, 0.57, 15.67, 2.46, 3.83, 1.58, 0.34, 1.78, 0.62, 5.24, 0.62, 1.55, 6.16]} \ No newline at end of file diff --git a/annotations_1/AGY5gNpoPfI_filtered.json b/annotations_1/AGY5gNpoPfI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16e8be17f3a6c8c0018a20ca608e559738bd3a41 --- /dev/null +++ b/annotations_1/AGY5gNpoPfI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.7], [18.0, 18.33], [25.0, 41.67], [43.0, 46.6], [48.0, 48.96], [50.0, 51.66], [52.0, 52.46], [53.0, 57.03], [66.0, 66.43], [69.0, 69.06], [70.0, 70.53], [71.0, 71.19], [73.0, 73.38], [76.0, 78.92], [80.0, 81.65], [95.0, 95.4], [118.0, 118.42], [120.0, 123.3], [127.0, 127.25], [128.0, 128.82], [134.0, 134.06], [136.0, 136.44], [137.0, 140.41], [141.0, 145.07], [145.0, 145.52], [148.0, 148.19], [149.0, 149.61], [156.0, 157.99], [161.0, 162.01], [174.0, 174.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.88, 69.74, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 55.04, 0.0, 0.0, 0.0, 0.0, 42.79, 42.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 69.84], ["thunk", 23.14], ["boing", 0.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["tuning fork", 53.6], ["speech", 24.89], ["thunk", 4.71]], [["speech", 71.23], ["inside, small room", 4.69], ["radio", 4.17]], null, null, null, null, null, null], "duration": [0.7, 0.33, 16.67, 3.6, 0.96, 1.66, 0.46, 4.03, 0.43, 0.06, 0.53, 0.19, 0.38, 2.92, 1.65, 0.4, 0.42, 3.3, 0.25, 0.82, 0.06, 0.44, 3.41, 4.07, 0.52, 0.19, 0.61, 1.99, 1.01, 0.34]} \ No newline at end of file diff --git a/annotations_1/AHLo7Vs6drM_filtered.json b/annotations_1/AHLo7Vs6drM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df9ecd42bee584a8d02876412ffc3181e6161356 --- /dev/null +++ b/annotations_1/AHLo7Vs6drM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.46], [11.0, 11.58], [13.0, 14.54], [16.0, 17.64], [19.0, 23.43], [24.0, 24.76], [58.0, 59.54], [62.0, 63.07], [64.0, 64.4], [65.0, 64.86], [66.0, 65.64], [66.0, 66.39], [69.0, 71.46], [77.0, 78.56], [85.0, 85.67], [88.0, 87.99], [88.0, 89.04], [94.0, 99.25], [101.0, 101.55], [106.0, 107.05], [109.0, 109.71], [110.0, 112.6], [115.0, 115.7], [117.0, 117.04]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.88, 0.0, 0.0, 0.0, 0.0, 39.11, 0.0, 0.0, 0.0, 46.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 29.8], ["sine wave", 18.68], ["chirp tone", 14.38]], null, null, null, null, null, null, null, [["hum", 32.68], ["mains hum", 29.23], ["throbbing", 13.81]], null, null, null, null, [["music", 17.77], ["hum", 11.84], ["speech", 8.47]], null, null, null, [["hum", 23.53], ["music", 22.74], ["mains hum", 11.29]], null, null], "duration": [0.46, 0.58, 1.54, 1.64, 4.43, 0.76, 1.54, 1.07, 0.4, -0.14, -0.36, 0.39, 2.46, 1.56, 0.67, -0.01, 1.04, 5.25, 0.55, 1.05, 0.71, 2.6, 0.7, 0.04]} \ No newline at end of file diff --git a/annotations_1/AHV1LepZ2KM_filtered.json b/annotations_1/AHV1LepZ2KM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25be3104206d49ff34d49640eca224888286917f --- /dev/null +++ b/annotations_1/AHV1LepZ2KM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.19], [20.0, 20.33], [22.0, 23.08], [26.0, 25.84], [27.0, 28.31], [35.0, 35.7], [37.0, 37.69], [48.0, 47.92], [49.0, 50.94], [54.0, 54.41], [72.0, 72.86], [74.0, 75.0], [78.0, 78.8], [81.0, 81.67], [85.0, 93.8], [95.0, 96.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.97], ["music", 19.98], ["crowd", 11.21]], null], "duration": [0.19, 0.33, 1.08, -0.16, 1.31, 0.7, 0.69, -0.08, 1.94, 0.41, 0.86, 1.0, 0.8, 0.67, 8.8, 1.69]} \ No newline at end of file diff --git a/annotations_1/AHjOZLikqoM_filtered.json b/annotations_1/AHjOZLikqoM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e68150558ffbd54cbb1c035097e5da1162fccd1 --- /dev/null +++ b/annotations_1/AHjOZLikqoM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.13], [13.0, 15.74], [21.0, 20.85], [23.0, 23.26], [26.0, 26.64], [33.0, 35.99], [37.0, 46.33], [48.0, 49.25], [50.0, 50.04], [51.0, 52.02], [58.0, 59.31], [65.0, 65.13], [69.0, 70.17], [71.0, 71.36], [75.0, 74.95], [77.0, 78.26], [81.0, 81.14], [91.0, 90.95], [93.0, 93.45], [94.0, 95.91], [97.0, 96.65], [97.0, 98.71], [109.0, 109.14], [110.0, 111.0], [111.0, 118.27], [120.0, 120.18], [122.0, 123.11], [124.0, 132.87], [135.0, 135.09], [137.0, 137.17], [139.0, 139.26], [143.0, 143.4], [155.0, 156.74], [158.0, 160.56], [161.0, 161.92], [167.0, 167.04], [168.0, 168.71], [171.0, 171.78], [175.0, 176.61], [179.0, 182.07], [183.0, 184.69], [188.0, 188.54], [190.0, 193.63]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.91, 88.64, 0.0, 0.0, 0.0, 32.35, 30.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.39, 0.0, 0.0, 48.31, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 94.37], "audiomae_on_audioset": [[["speech", 53.86], ["applause", 8.69], ["male speech, man speaking", 8.62]], null, null, null, null, [["throbbing", 40.21], ["hum", 29.41], ["music", 14.39]], [["cattle, bovinae", 19.89], ["livestock, farm animals, working animals", 17.98], ["moo", 12.89]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.04], ["hum", 15.2], ["thunk", 4.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.13, 2.74, -0.15, 0.26, 0.64, 2.99, 9.33, 1.25, 0.04, 1.02, 1.31, 0.13, 1.17, 0.36, -0.05, 1.26, 0.14, -0.05, 0.45, 1.91, -0.35, 1.71, 0.14, 1.0, 7.27, 0.18, 1.11, 8.87, 0.09, 0.17, 0.26, 0.4, 1.74, 2.56, 0.92, 0.04, 0.71, 0.78, 1.61, 3.07, 1.69, 0.54, 3.63]} \ No newline at end of file diff --git a/annotations_1/AIQHqvG9Ql8_filtered.json b/annotations_1/AIQHqvG9Ql8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..477167fdee6e8a8f61a8163e64d14a4a7fbf7e45 --- /dev/null +++ b/annotations_1/AIQHqvG9Ql8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.61], [15.0, 16.29], [18.0, 18.2], [24.0, 24.0], [24.0, 24.56], [25.0, 27.51], [28.0, 28.65], [32.0, 32.8], [45.0, 65.45], [73.0, 76.5], [82.0, 94.51], [97.0, 120.11], [121.0, 125.66], [128.0, 135.58], [137.0, 150.42], [153.0, 157.28], [159.0, 163.95], [174.0, 175.66]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.4, 0.0, 0.0, 29.01, 29.25, 28.71, 29.32, 32.11, 29.72, 29.97, 30.16, 30.69, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 46.81], ["speech", 41.14], ["radio", 1.07]], null, null, [["music", 39.86], ["speech", 39.56], ["machine gun", 3.78]], [["music", 37.53], ["speech", 24.32], ["gunshot, gunfire", 5.14]], [["music", 39.8], ["smash, crash", 21.91], ["whack, thwack", 4.55]], [["speech", 71.86], ["breaking", 7.98], ["music", 6.11]], [["music", 46.88], ["speech", 14.31], ["boing", 7.21]], [["breaking", 64.95], ["smash, crash", 7.1], ["music", 6.97]], [["music", 60.53], ["speech", 11.55], ["whack, thwack", 8.58]], [["music", 63.55], ["speech", 10.78], ["sidetone", 4.94]], [["breaking", 52.1], ["music", 13.13], ["smash, crash", 8.18]], null], "duration": [0.61, 1.29, 0.2, 0.0, 0.56, 2.51, 0.65, 0.8, 20.45, 3.5, 12.51, 23.11, 4.66, 7.58, 13.42, 4.28, 4.95, 1.66]} \ No newline at end of file diff --git a/annotations_1/AJQd_pt3-pk_filtered.json b/annotations_1/AJQd_pt3-pk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..981d8790bc34cd631bff52aff697430e0230fb7d --- /dev/null +++ b/annotations_1/AJQd_pt3-pk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.13], [5.0, 20.39], [21.0, 31.72], [32.0, 32.64], [36.0, 37.5], [39.0, 39.23], [40.0, 41.08], [43.0, 51.17], [55.0, 63.53], [69.0, 69.57], [71.0, 74.58], [79.0, 79.51], [82.0, 81.8], [82.0, 83.86], [84.0, 87.3], [88.0, 89.61], [90.0, 100.45], [105.0, 105.63], [107.0, 116.45], [118.0, 120.29], [121.0, 130.5], [132.0, 151.31], [152.0, 156.34]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, true, true, true, true, true], "silence_prob": [94.52, 56.55, 30.51, 0.0, 0.0, 0.0, 0.0, 31.36, 31.84, 0.0, 40.93, 0.0, 0.0, 0.0, 39.33, 0.0, 32.58, 0.0, 30.97, 31.71, 34.71, 33.02, 39.66], "audiomae_on_audioset": [null, null, [["speech", 34.49], ["explosion", 17.19], ["music", 7.56]], null, null, null, null, [["speech", 45.86], ["music", 16.43], ["cattle, bovinae", 3.81]], [["speech", 61.44], ["explosion", 12.87], ["music", 6.92]], null, [["fly, housefly", 32.76], ["mosquito", 21.31], ["insect", 20.62]], null, null, null, [["speech", 6.69], ["cattle, bovinae", 5.56], ["animal", 4.71]], null, [["speech", 39.25], ["hum", 20.7], ["mains hum", 6.57]], null, [["fly, housefly", 23.59], ["insect", 15.83], ["buzz", 13.62]], [["vehicle", 22.68], ["car", 7.64], ["race car, auto racing", 6.12]], [["hum", 34.51], ["throbbing", 13.72], ["mains hum", 12.25]], [["livestock, farm animals, working animals", 28.49], ["animal", 17.12], ["music", 8.02]], [["hum", 29.96], ["mains hum", 15.52], ["noise", 13.81]]], "duration": [3.13, 15.39, 10.72, 0.64, 1.5, 0.23, 1.08, 8.17, 8.53, 0.57, 3.58, 0.51, -0.2, 1.86, 3.3, 1.61, 10.45, 0.63, 9.45, 2.29, 9.5, 19.31, 4.34]} \ No newline at end of file diff --git a/annotations_1/AKXKkeLQWac_filtered.json b/annotations_1/AKXKkeLQWac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..269805d7898dee202f2e47209c14bce6a660c723 --- /dev/null +++ b/annotations_1/AKXKkeLQWac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.96], [11.0, 11.45], [36.0, 36.58], [38.0, 38.4], [39.0, 39.66], [42.0, 44.0], [44.0, 44.66], [54.0, 55.26], [56.0, 56.69], [57.0, 57.86], [64.0, 64.91], [67.0, 67.58], [71.0, 71.44], [74.0, 74.24], [78.0, 78.06], [79.0, 79.57], [81.0, 83.61], [87.0, 86.91], [88.0, 88.37], [91.0, 92.15], [93.0, 93.99], [96.0, 97.01], [108.0, 112.13]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [56.48, 0.0, 0.0, 0.0, 0.0, 39.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.27, 0.0, 0.0, 0.0, 0.0, 0.0, 39.93], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 48.92], ["sidetone", 13.02], ["telephone", 3.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 22.77], ["sidetone", 9.96], ["hum", 7.35]]], "duration": [6.96, 0.45, 0.58, 0.4, 0.66, 2.0, 0.66, 1.26, 0.69, 0.86, 0.91, 0.58, 0.44, 0.24, 0.06, 0.57, 2.61, -0.09, 0.37, 1.15, 0.99, 1.01, 4.13]} \ No newline at end of file diff --git a/annotations_1/ALO5aag-ZIo_filtered.json b/annotations_1/ALO5aag-ZIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..781bf2b641c15029f7097e9e935aabfba428b21e --- /dev/null +++ b/annotations_1/ALO5aag-ZIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 30.62], [33.0, 34.4], [40.0, 42.7], [45.0, 47.16], [53.0, 54.65], [61.0, 60.93], [62.0, 62.63], [68.0, 69.25], [75.0, 76.38], [83.0, 87.2], [94.0, 111.05], [112.0, 118.3], [122.0, 122.99], [125.0, 125.86]], "keep_status": [false, false, false, true, false, false, false, false, false, true, true, true, false, false], "silence_prob": [0.0, 0.0, 36.56, 33.23, 0.0, 0.0, 0.0, 0.0, 0.0, 31.8, 44.63, 38.87, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 40.82], ["whale vocalization", 26.43], ["speech", 12.52]], [["speech", 6.83], ["hubbub, speech noise, speech babble", 5.34], ["whale vocalization", 4.91]], null, null, null, null, null, [["hum", 18.6], ["music", 9.92], ["throbbing", 6.84]], [["music", 42.61], ["wind instrument, woodwind instrument", 3.46], ["brass instrument", 2.98]], [["music", 38.67], ["quack", 18.53], ["duck", 8.37]], null, null], "duration": [1.62, 1.4, 2.7, 2.16, 1.65, -0.07, 0.63, 1.25, 1.38, 4.2, 17.05, 6.3, 0.99, 0.86]} \ No newline at end of file diff --git a/annotations_1/ALSUu2CSBOg_filtered.json b/annotations_1/ALSUu2CSBOg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad963cdc4e4ee50881551a0d1f1dfd2e721ba057 --- /dev/null +++ b/annotations_1/ALSUu2CSBOg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.87], [7.0, 7.47], [8.0, 8.29], [9.0, 11.01], [12.0, 12.5], [13.0, 14.28], [16.0, 16.29], [17.0, 17.24], [19.0, 19.53], [22.0, 22.94], [24.0, 24.95], [26.0, 45.06], [46.0, 47.21], [51.0, 54.24], [55.0, 55.39], [57.0, 57.25], [59.0, 70.92], [72.0, 72.18], [73.0, 73.28], [74.0, 74.83], [76.0, 76.65], [78.0, 78.53], [80.0, 87.93], [88.0, 89.36], [90.0, 91.79], [94.0, 95.55], [96.0, 96.82], [104.0, 104.58], [118.0, 118.13], [126.0, 127.43], [132.0, 133.14], [134.0, 134.57], [140.0, 140.49], [142.0, 142.94], [145.0, 147.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.94, 0.0, 34.18, 0.0, 0.0, 31.26, 0.0, 0.0, 0.0, 0.0, 0.0, 48.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.33], ["explosion", 24.58], ["noise", 18.42]], null, [["frog", 54.81], ["fly, housefly", 9.1], ["speech", 6.86]], null, null, [["speech", 20.28], ["music", 18.4], ["whistling", 13.87]], null, null, null, null, null, [["wheeze", 16.59], ["hum", 9.92], ["noise", 6.6]], null, null, null, null, null, null, null, null, null, null, null, [["frog", 52.4], ["radio", 16.26], ["sidetone", 4.76]]], "duration": [0.87, 0.47, 0.29, 2.01, 0.5, 1.28, 0.29, 0.24, 0.53, 0.94, 0.95, 19.06, 1.21, 3.24, 0.39, 0.25, 11.92, 0.18, 0.28, 0.83, 0.65, 0.53, 7.93, 1.36, 1.79, 1.55, 0.82, 0.58, 0.13, 1.43, 1.14, 0.57, 0.49, 0.94, 2.34]} \ No newline at end of file diff --git a/annotations_1/ALWV_EA6x8I_filtered.json b/annotations_1/ALWV_EA6x8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9dbd7b87ef2fd6bf3fc28e5b9f195e3ff3016071 --- /dev/null +++ b/annotations_1/ALWV_EA6x8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 75.49], [85.0, 85.04], [94.0, 136.39]], "keep_status": [true, false, false], "silence_prob": [30.16, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.41], ["speech", 11.55], ["musical instrument", 6.04]], null, null], "duration": [4.49, 0.04, 42.39]} \ No newline at end of file diff --git a/annotations_1/ALYPTuyCxqI_filtered.json b/annotations_1/ALYPTuyCxqI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfc77fd7a1b0e1320575866fd04fe281613082d2 --- /dev/null +++ b/annotations_1/ALYPTuyCxqI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 24.75], [29.0, 30.21], [31.0, 32.29], [35.0, 36.0], [36.0, 36.58], [39.0, 54.3], [57.0, 62.5], [63.0, 64.15], [67.0, 72.69], [74.0, 76.81], [78.0, 80.49], [84.0, 93.78], [95.0, 95.66], [101.0, 101.6], [102.0, 103.2], [105.0, 106.37], [107.0, 110.0], [113.0, 114.39], [115.0, 128.73], [130.0, 130.65], [133.0, 135.55], [136.0, 135.58], [136.0, 135.62], [136.0, 135.65], [136.0, 135.72], [136.0, 135.75], [136.0, 135.78], [136.0, 140.17], [142.0, 143.94], [146.0, 147.93], [150.0, 151.44], [152.0, 152.81], [159.0, 160.57]], "keep_status": [true, false, false, false, false, true, true, false, true, true, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [33.63, 0.0, 0.0, 0.0, 0.0, 32.39, 35.37, 0.0, 37.3, 37.56, 36.98, 39.78, 0.0, 0.0, 0.0, 0.0, 49.36, 0.0, 35.19, 0.0, 44.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.12, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 36.74], ["effects unit", 9.29], ["hum", 7.97]], null, null, null, null, [["music", 32.62], ["effects unit", 29.59], ["reverberation", 6.58]], [["music", 19.77], ["animal", 16.04], ["hum", 10.47]], null, [["mains hum", 27.02], ["hum", 24.86], ["noise", 13.19]], [["music", 44.71], ["hum", 6.12], ["static", 3.71]], [["hum", 43.88], ["mains hum", 12.74], ["music", 12.73]], [["speech", 34.57], ["hum", 16.34], ["mains hum", 12.67]], null, null, null, null, [["speech", 23.76], ["sidetone", 19.52], ["hum", 18.1]], null, [["speech", 44.23], ["hum", 13.68], ["throbbing", 13.34]], null, [["hum", 55.52], ["throbbing", 14.0], ["mains hum", 10.19]], null, null, null, null, null, null, [["speech", 32.84], ["hum", 25.77], ["throbbing", 8.97]], null, null, null, null, null], "duration": [18.75, 1.21, 1.29, 1.0, 0.58, 15.3, 5.5, 1.15, 5.69, 2.81, 2.49, 9.78, 0.66, 0.6, 1.2, 1.37, 3.0, 1.39, 13.73, 0.65, 2.55, -0.42, -0.38, -0.35, -0.28, -0.25, -0.22, 4.17, 1.94, 1.93, 1.44, 0.81, 1.57]} \ No newline at end of file diff --git a/annotations_1/ALfuWSv9YVc_filtered.json b/annotations_1/ALfuWSv9YVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16fd46830e7e6b73ced82db2cda1429ef2d3b90d --- /dev/null +++ b/annotations_1/ALfuWSv9YVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.71], [9.0, 9.81], [11.0, 11.85], [13.0, 15.43], [18.0, 19.14], [24.0, 24.38], [28.0, 29.08], [31.0, 31.38], [33.0, 33.91], [36.0, 36.29], [40.0, 40.69], [42.0, 42.42], [47.0, 51.76], [53.0, 54.4], [56.0, 57.74], [60.0, 61.3], [66.0, 66.8], [68.0, 69.18], [72.0, 72.74], [76.0, 76.11], [77.0, 78.46], [79.0, 80.5], [81.0, 81.73], [82.0, 83.2], [89.0, 92.87], [94.0, 95.13], [96.0, 96.65], [100.0, 100.45], [106.0, 107.81], [111.0, 112.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.71, 0.81, 0.85, 2.43, 1.14, 0.38, 1.08, 0.38, 0.91, 0.29, 0.69, 0.42, 4.76, 1.4, 1.74, 1.3, 0.8, 1.18, 0.74, 0.11, 1.46, 1.5, 0.73, 1.2, 3.87, 1.13, 0.65, 0.45, 1.81, 1.95]} \ No newline at end of file diff --git a/annotations_1/ALhR_LDm5Is_filtered.json b/annotations_1/ALhR_LDm5Is_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4acfa7d2aea7e271023d34b4461ad376cfbbe32 --- /dev/null +++ b/annotations_1/ALhR_LDm5Is_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.86], [7.0, 8.43], [11.0, 15.35], [23.0, 24.31], [34.0, 34.8], [46.0, 46.97], [49.0, 49.84], [66.0, 67.54], [68.0, 68.77], [69.0, 74.38], [74.0, 74.41], [74.0, 74.44], [74.0, 74.51], [75.0, 74.55], [75.0, 75.69], [76.0, 76.2], [76.0, 76.37], [76.0, 80.64], [81.0, 80.67], [81.0, 80.7], [81.0, 81.28], [82.0, 82.58], [96.0, 101.22], [101.0, 101.43], [107.0, 118.45], [120.0, 122.93]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.04, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 98.8, 99.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 35.93], ["speech", 24.47], ["insect", 4.68]], null, null, null, null, null, null, null, [["music", 21.38], ["speech", 17.83], ["didgeridoo", 16.06]], null, null, null, null, null, null, null, null], "duration": [0.86, 1.43, 4.35, 1.31, 0.8, 0.97, 0.84, 1.54, 0.77, 5.38, 0.41, 0.44, 0.51, -0.45, 0.69, 0.2, 0.37, 4.64, -0.33, -0.3, 0.28, 0.58, 5.22, 0.43, 11.45, 2.93]} \ No newline at end of file diff --git a/annotations_1/ALw553euzsc_filtered.json b/annotations_1/ALw553euzsc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bf8ec08dd0bfd74a711250865d39cf9616839a4 --- /dev/null +++ b/annotations_1/ALw553euzsc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 80.97], [81.0, 81.89], [86.0, 87.79], [89.0, 89.31], [91.0, 91.52], [94.0, 97.33], [104.0, 104.95], [106.0, 108.06], [109.0, 113.95], [115.0, 115.48], [119.0, 123.2], [125.0, 134.16], [137.0, 136.81]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 48.19, 0.0, 65.32, 58.22, 0.0, 48.65, 45.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 29.78], ["speech", 26.08], ["throbbing", 13.18]], null, null, null, null, [["hum", 39.41], ["speech", 23.35], ["mains hum", 19.81]], [["music", 59.26], ["ambient music", 9.82], ["synthesizer", 4.39]], null], "duration": [43.97, 0.89, 1.79, 0.31, 0.52, 3.33, 0.95, 2.06, 4.95, 0.48, 4.2, 9.16, -0.19]} \ No newline at end of file diff --git a/annotations_1/ANAUjvgYxjQ_filtered.json b/annotations_1/ANAUjvgYxjQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d052dde3100fff2e7509959285ae8465bdd1e97 --- /dev/null +++ b/annotations_1/ANAUjvgYxjQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.04], [21.0, 21.39], [24.0, 25.17], [26.0, 28.17], [32.0, 32.17], [39.0, 38.99], [43.0, 43.31], [49.0, 49.71], [56.0, 55.61], [58.0, 57.74], [60.0, 60.13], [63.0, 62.94], [75.0, 75.51], [77.0, 76.96], [77.0, 78.09], [78.0, 79.27], [96.0, 95.81], [96.0, 96.18], [131.0, 130.99], [131.0, 131.6], [184.0, 184.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 64.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.39, 1.17, 2.17, 0.17, -0.01, 0.31, 0.71, -0.39, -0.26, 0.13, -0.06, 0.51, -0.04, 1.09, 1.27, -0.19, 0.18, -0.01, 0.6, 0.22]} \ No newline at end of file diff --git a/annotations_1/ANTOMowTXZU_filtered.json b/annotations_1/ANTOMowTXZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b938b3a09aed15f9ffbeb73c5efb2f55831451d6 --- /dev/null +++ b/annotations_1/ANTOMowTXZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.46], [17.0, 17.19], [29.0, 46.13], [48.0, 52.0], [52.0, 53.99], [54.0, 54.65], [57.0, 57.16], [58.0, 62.63], [64.0, 67.59], [75.0, 80.42], [83.0, 83.83], [85.0, 85.46], [86.0, 111.25], [116.0, 122.61], [128.0, 129.63], [132.0, 131.97]], "keep_status": [true, false, false, true, false, false, false, true, false, false, false, false, true, true, false, false], "silence_prob": [29.89, 0.0, 29.37, 29.3, 0.0, 0.0, 0.0, 29.33, 31.67, 29.82, 0.0, 0.0, 29.57, 29.98, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 50.44], ["speech", 8.53], ["music", 4.09]], null, [["music", 40.46], ["speech", 30.47], ["animal", 3.66]], [["music", 24.98], ["speech", 14.83], ["boing", 10.1]], null, null, null, [["livestock, farm animals, working animals", 24.18], ["cattle, bovinae", 21.06], ["moo", 17.0]], [["music", 51.4], ["theremin", 25.51], ["throbbing", 4.04]], [["music", 67.01], ["sound effect", 3.61], ["noise", 2.64]], null, null, [["music", 51.89], ["cacophony", 10.67], ["musical instrument", 4.43]], [["music", 46.68], ["hum", 12.33], ["throbbing", 5.83]], null, null], "duration": [3.46, 0.19, 17.13, 4.0, 1.99, 0.65, 0.16, 4.63, 3.59, 5.42, 0.83, 0.46, 25.25, 6.61, 1.63, -0.03]} \ No newline at end of file diff --git a/annotations_1/ANXSdv-KaCQ_filtered.json b/annotations_1/ANXSdv-KaCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e93d6c3207ece631fed7d73fc2b0b86e1c6ccf08 --- /dev/null +++ b/annotations_1/ANXSdv-KaCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.53], [13.0, 14.5], [17.0, 17.81], [19.0, 19.63], [22.0, 22.84], [27.0, 28.97], [33.0, 34.52], [37.0, 38.3], [41.0, 42.48], [43.0, 51.44], [65.0, 65.99], [72.0, 72.18], [86.0, 88.99], [90.0, 93.88], [96.0, 109.24], [111.0, 114.89], [120.0, 120.04], [127.0, 128.09], [130.0, 130.59], [132.0, 134.69], [137.0, 137.0], [138.0, 138.03], [146.0, 146.4], [150.0, 150.72], [153.0, 154.36], [157.0, 157.92], [162.0, 166.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [65.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 41.16, 49.78, 55.25, 84.43, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.83], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.16], ["mantra", 20.58], ["vocal music", 5.26]], [["music", 38.26], ["effects unit", 8.06], ["musical instrument", 4.9]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.53, 1.5, 0.81, 0.63, 0.84, 1.97, 1.52, 1.3, 1.48, 8.44, 0.99, 0.18, 2.99, 3.88, 13.24, 3.89, 0.04, 1.09, 0.59, 2.69, 0.0, 0.03, 0.4, 0.72, 1.36, 0.92, 4.5]} \ No newline at end of file diff --git a/annotations_1/ANigqhwwafs_filtered.json b/annotations_1/ANigqhwwafs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d094536fd6fb48aa2f67edbf3e3d8092a8ced664 --- /dev/null +++ b/annotations_1/ANigqhwwafs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 21.34], [22.0, 40.9], [46.0, 62.94], [67.0, 66.8], [68.0, 72.0], [75.0, 84.55], [86.0, 111.99], [113.0, 113.02], [114.0, 114.49], [116.0, 116.94], [123.0, 124.23], [125.0, 125.64], [130.0, 131.41], [135.0, 135.04], [135.0, 136.05], [137.0, 140.16], [143.0, 150.11]], "keep_status": [false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [28.89, 29.49, 28.65, 0.0, 29.02, 31.53, 29.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.27, 29.6], "audiomae_on_audioset": [[["mains hum", 41.33], ["hum", 33.03], ["throbbing", 8.54]], [["music", 58.27], ["synthesizer", 8.53], ["noise", 5.33]], [["music", 48.29], ["speech", 6.16], ["explosion", 5.57]], null, [["music", 34.87], ["speech", 10.72], ["whale vocalization", 6.9]], [["music", 37.93], ["hum", 16.35], ["mains hum", 7.95]], [["music", 39.6], ["speech", 37.32], ["throbbing", 2.31]], null, null, null, null, null, null, null, null, [["music", 77.56], ["musical instrument", 5.09], ["speech", 4.54]], [["music", 48.03], ["livestock, farm animals, working animals", 6.57], ["speech", 5.98]]], "duration": [18.34, 18.9, 16.94, -0.2, 4.0, 9.55, 25.99, 0.02, 0.49, 0.94, 1.23, 0.64, 1.41, 0.04, 1.05, 3.16, 7.11]} \ No newline at end of file diff --git a/annotations_1/AONuDilRd5k_filtered.json b/annotations_1/AONuDilRd5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..065a2a90d892d7a682f1e46ef6c812cd4edebc7f --- /dev/null +++ b/annotations_1/AONuDilRd5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 0.9], [2.0, 3.01], [6.0, 6.32], [6.0, 14.89], [17.0, 27.35], [39.0, 39.02], [43.0, 42.85], [45.0, 54.06], [55.0, 60.47], [61.0, 63.15], [68.0, 68.74], [69.0, 108.41], [109.0, 111.37], [112.0, 116.99], [119.0, 123.11], [126.0, 127.45], [128.0, 129.68], [131.0, 133.08], [137.0, 139.45]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.37, 29.53, 0.0, 0.0, 29.33, 32.85, 33.41, 0.0, 0.0, 29.5, 29.19, 33.33, 0.0, 0.0, 35.46, 28.32], "audiomae_on_audioset": [null, null, null, null, [["speech", 47.73], ["music", 16.59], ["rumble", 7.68]], [["music", 32.74], ["hum", 27.9], ["mains hum", 9.15]], null, null, [["music", 38.85], ["hum", 26.82], ["mains hum", 10.98]], [["music", 41.99], ["foghorn", 5.03], ["hum", 3.31]], [["mains hum", 35.24], ["speech", 16.15], ["hum", 13.24]], null, null, [["music", 36.69], ["musical instrument", 16.11], ["theremin", 13.03]], [["theremin", 37.31], ["music", 33.47], ["synthesizer", 7.48]], [["music", 63.13], ["electronic music", 6.0], ["didgeridoo", 4.08]], null, null, [["music", 38.87], ["theremin", 23.37], ["didgeridoo", 9.61]], [["music", 45.83], ["explosion", 18.59], ["boom", 10.4]]], "duration": [0.5, -0.1, 1.01, 0.32, 8.89, 10.35, 0.02, -0.15, 9.06, 5.47, 2.15, 0.74, 39.41, 2.37, 4.99, 4.11, 1.45, 1.68, 2.08, 2.45]} \ No newline at end of file diff --git a/annotations_1/AOVHdyazjWM_filtered.json b/annotations_1/AOVHdyazjWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..214df24aec0a7bce8d6e8b1ea67d41ddc6d539a5 --- /dev/null +++ b/annotations_1/AOVHdyazjWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.32], [14.0, 15.03], [18.0, 23.58], [27.0, 31.62], [35.0, 36.21], [42.0, 74.71], [78.0, 80.6], [81.0, 81.24], [82.0, 99.22], [103.0, 103.67], [110.0, 131.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.67, 0.0, 29.9, 29.74, 0.0, 0.0, 55.46, 0.0, 28.52, 0.0, 31.85], "audiomae_on_audioset": [[["music", 78.52], ["electronic music", 2.33], ["house music", 1.79]], null, [["music", 79.54], ["electronica", 2.52], ["electronic music", 2.41]], [["hum", 38.78], ["throbbing", 25.49], ["music", 14.68]], null, null, null, null, [["music", 78.21], ["electronic music", 3.31], ["throbbing", 3.2]], null, [["music", 69.42], ["effects unit", 4.32], ["ambient music", 2.51]]], "duration": [2.32, 1.03, 5.58, 4.62, 1.21, 32.71, 2.6, 0.24, 17.22, 0.67, 21.4]} \ No newline at end of file diff --git a/annotations_1/AOv5WvKX57s_filtered.json b/annotations_1/AOv5WvKX57s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8ba8f3b552dbe032cf521dda869bd8f772efaad --- /dev/null +++ b/annotations_1/AOv5WvKX57s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.76], [7.0, 8.14], [8.0, 9.34], [10.0, 10.23], [15.0, 15.23], [19.0, 20.02], [21.0, 22.05], [25.0, 25.74], [27.0, 27.28], [40.0, 40.61], [42.0, 43.01], [43.0, 44.42], [48.0, 48.83], [52.0, 52.88], [58.0, 58.89], [62.0, 62.46], [65.0, 64.96], [71.0, 72.45], [75.0, 75.88], [77.0, 78.38], [80.0, 81.16], [82.0, 83.4], [85.0, 86.46], [87.0, 88.26], [89.0, 90.69], [92.0, 94.05], [98.0, 99.15], [101.0, 102.37], [105.0, 105.9], [108.0, 110.0], [114.0, 115.91], [117.0, 120.34], [124.0, 124.83], [127.0, 129.15], [130.0, 130.81], [134.0, 137.03], [138.0, 140.37], [141.0, 143.28], [144.0, 147.75], [151.0, 155.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 98.44, 0.0, 100.0, 100.0, 69.07, 92.31, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.76, 1.14, 1.34, 0.23, 0.23, 1.02, 1.05, 0.74, 0.28, 0.61, 1.01, 1.42, 0.83, 0.88, 0.89, 0.46, -0.04, 1.45, 0.88, 1.38, 1.16, 1.4, 1.46, 1.26, 1.69, 2.05, 1.15, 1.37, 0.9, 2.0, 1.91, 3.34, 0.83, 2.15, 0.81, 3.03, 2.37, 2.28, 3.75, 4.63]} \ No newline at end of file diff --git a/annotations_1/AQfWibFXtO4_filtered.json b/annotations_1/AQfWibFXtO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2521e36796761395e2d5a956648f4c55dc97ec42 --- /dev/null +++ b/annotations_1/AQfWibFXtO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 58.9], [61.0, 63.1], [64.0, 64.86], [65.0, 67.27], [68.0, 71.56], [72.0, 74.75], [76.0, 77.57]], "keep_status": [false, true, false, true, true, true, false], "silence_prob": [0.0, 38.51, 0.0, 33.41, 36.35, 38.4, 0.0], "audiomae_on_audioset": [null, [["speech", 53.87], ["music", 9.52], ["foghorn", 6.14]], null, [["speech", 27.42], ["music", 25.47], ["radio", 2.25]], [["music", 58.65], ["theremin", 5.44], ["animal", 2.29]], [["music", 17.67], ["speech", 16.88], ["theremin", 16.4]], null], "duration": [31.9, 2.1, 0.86, 2.27, 3.56, 2.75, 1.57]} \ No newline at end of file diff --git a/annotations_1/AQpPxTYahZo_filtered.json b/annotations_1/AQpPxTYahZo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb48b02d86ef04e1a4ec71b5d54889231dbd1199 --- /dev/null +++ b/annotations_1/AQpPxTYahZo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.76], [8.0, 8.85], [11.0, 11.16], [19.0, 18.76], [21.0, 21.3], [23.0, 28.46], [30.0, 31.01], [32.0, 63.32], [65.0, 66.14], [69.0, 118.03], [122.0, 125.59], [127.0, 127.53], [130.0, 135.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 58.72, 0.0, 0.0, 0.0, 0.0, 32.52, 0.0, 31.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 21.91], ["whack, thwack", 18.36], ["throbbing", 5.17]], null, [["music", 52.91], ["throbbing", 7.42], ["hum", 5.92]]], "duration": [0.76, 0.85, 0.16, -0.24, 0.3, 5.46, 1.01, 31.32, 1.14, 49.03, 3.59, 0.53, 5.19]} \ No newline at end of file diff --git a/annotations_1/ARgghWSmq7Q_filtered.json b/annotations_1/ARgghWSmq7Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7551d112d8e35e5399de940ad5d764eb2ceec6ea --- /dev/null +++ b/annotations_1/ARgghWSmq7Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.13], [12.0, 13.69], [15.0, 15.77], [20.0, 20.65], [21.0, 22.11], [35.0, 35.61], [36.0, 37.5], [39.0, 40.02], [54.0, 54.38], [55.0, 57.55], [71.0, 72.35], [75.0, 75.44], [77.0, 77.04], [78.0, 78.85], [80.0, 80.89], [82.0, 82.26]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 33.39], ["speech", 28.05], ["theremin", 4.23]], null, null, null, null, null, null, null, null, [["speech", 78.36], ["radio", 3.08], ["telephone", 1.81]], null, null, null, null, null, null], "duration": [6.13, 1.69, 0.77, 0.65, 1.11, 0.61, 1.5, 1.02, 0.38, 2.55, 1.35, 0.44, 0.04, 0.85, 0.89, 0.26]} \ No newline at end of file diff --git a/annotations_1/ATNjQgr7LXc_filtered.json b/annotations_1/ATNjQgr7LXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..667b86244058a15d5ba6c6076b448f5b894624c5 --- /dev/null +++ b/annotations_1/ATNjQgr7LXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.85], [7.0, 7.2], [7.0, 8.09], [10.0, 9.93], [15.0, 15.2], [19.0, 20.16], [20.0, 20.66], [21.0, 24.07], [26.0, 26.87], [27.0, 29.34], [30.0, 33.54], [34.0, 34.94], [36.0, 36.68], [37.0, 37.76], [46.0, 46.45], [47.0, 47.7], [51.0, 52.32], [57.0, 59.81], [60.0, 64.57], [66.0, 66.58], [67.0, 67.9], [69.0, 74.46], [77.0, 77.75], [79.0, 81.06], [82.0, 83.4], [86.0, 86.63], [92.0, 93.78], [94.0, 98.22], [99.0, 100.41], [101.0, 101.8], [106.0, 107.35], [110.0, 114.81], [117.0, 117.78], [119.0, 121.54], [123.0, 123.84], [124.0, 124.85], [127.0, 131.04], [132.0, 132.83], [134.0, 134.81]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.18, 0.0, 50.91, 46.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 59.15, 0.0, 0.0, 73.82, 0.0, 66.51, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 0.0, 63.74, 0.0, 76.2, 0.0, 0.0, 73.06, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 24.28], ["doorbell", 13.52], ["radio", 9.36]], null, null, [["squish", 9.47], ["hum", 8.76], ["sidetone", 6.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.85, 0.2, 1.09, -0.07, 0.2, 1.16, 0.66, 3.07, 0.87, 2.34, 3.54, 0.94, 0.68, 0.76, 0.45, 0.7, 1.32, 2.81, 4.57, 0.58, 0.9, 5.46, 0.75, 2.06, 1.4, 0.63, 1.78, 4.22, 1.41, 0.8, 1.35, 4.81, 0.78, 2.54, 0.84, 0.85, 4.04, 0.83, 0.81]} \ No newline at end of file diff --git a/annotations_1/ATU0Znam5Pw_filtered.json b/annotations_1/ATU0Znam5Pw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..acbdaf4ed452fd87aa2d143cfb4b4cd8b1357344 --- /dev/null +++ b/annotations_1/ATU0Znam5Pw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [6.0, 8.04], [9.0, 10.39], [11.0, 13.96], [17.0, 18.4], [22.0, 30.35], [32.0, 32.97], [34.0, 35.38], [36.0, 37.62], [38.0, 40.0], [41.0, 43.68], [44.0, 45.96], [46.0, 48.05], [49.0, 51.04], [52.0, 55.53], [57.0, 59.59], [65.0, 65.96], [70.0, 71.58], [73.0, 74.9], [78.0, 85.58], [86.0, 88.4], [89.0, 90.73], [94.0, 95.76], [100.0, 100.48], [104.0, 116.34], [119.0, 127.36], [128.0, 130.28], [131.0, 132.68]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 96.54, 0.0, 32.11, 0.0, 0.0, 0.0, 86.64, 81.35, 0.0, 99.84, 99.99, 100.0, 100.0, 0.0, 0.0, 0.0, 98.66, 99.91, 0.0, 0.0, 0.0, 57.56, 57.17, 83.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 42.06], ["explosion", 10.5], ["whack, thwack", 5.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 2.04, 1.39, 2.96, 1.4, 8.35, 0.97, 1.38, 1.62, 2.0, 2.68, 1.96, 2.05, 2.04, 3.53, 2.59, 0.96, 1.58, 1.9, 7.58, 2.4, 1.73, 1.76, 0.48, 12.34, 8.36, 2.28, 1.68]} \ No newline at end of file diff --git a/annotations_1/ATid397QdsY_filtered.json b/annotations_1/ATid397QdsY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea319aadf3e8d7feeb015714f9112f65b1a0ad9a --- /dev/null +++ b/annotations_1/ATid397QdsY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 48.64], [49.0, 51.31], [53.0, 58.99], [60.0, 63.02], [63.0, 91.79], [93.0, 94.64], [95.0, 101.04], [101.0, 103.33]], "keep_status": [true, true, true, false, false, false, true, true], "silence_prob": [33.18, 35.22, 30.21, 28.99, 30.99, 0.0, 30.86, 32.31], "audiomae_on_audioset": [[["music", 27.28], ["hum", 24.11], ["mains hum", 11.16]], [["speech", 36.84], ["brass instrument", 17.72], ["music", 12.28]], [["music", 58.96], ["clarinet", 4.23], ["electronic music", 2.21]], [["hum", 60.08], ["throbbing", 14.47], ["mains hum", 12.41]], [["hum", 55.88], ["mains hum", 20.02], ["throbbing", 12.21]], null, [["speech", 24.62], ["hum", 16.43], ["music", 13.59]], [["speech", 26.44], ["fly, housefly", 15.71], ["bee, wasp, etc.", 9.08]]], "duration": [26.64, 2.31, 5.99, 3.02, 28.79, 1.64, 6.04, 2.33]} \ No newline at end of file diff --git a/annotations_1/AUPdPriOg6I_filtered.json b/annotations_1/AUPdPriOg6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e9085f05c04742e4061499da038015880783ec7 --- /dev/null +++ b/annotations_1/AUPdPriOg6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.96], [23.0, 26.06], [29.0, 31.13], [35.0, 35.77], [39.0, 45.44], [46.0, 47.16], [48.0, 55.19], [56.0, 58.26], [60.0, 61.13], [63.0, 63.04], [68.0, 68.72], [73.0, 74.19], [76.0, 76.99], [78.0, 79.56], [82.0, 82.7], [94.0, 95.12], [97.0, 99.39], [102.0, 103.65], [108.0, 110.94], [112.0, 113.91], [114.0, 114.66], [121.0, 121.14], [122.0, 127.58], [128.0, 129.52], [131.0, 136.31], [144.0, 149.5], [151.0, 159.49], [161.0, 162.21], [164.0, 164.84], [168.0, 168.66], [170.0, 172.13]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 59.96, 97.22, 0.0, 34.52, 0.0, 39.88, 35.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.41, 0.0, 65.55, 0.0, 0.0, 0.0, 74.6, 0.0, 78.55, 54.83, 56.1, 0.0, 0.0, 0.0, 90.78], "audiomae_on_audioset": [null, null, null, null, [["speech", 55.37], ["hum", 5.93], ["ding", 3.92]], null, [["music", 31.62], ["ambient music", 24.44], ["hum", 16.2]], [["music", 21.27], ["hum", 12.7], ["mains hum", 8.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 3.06, 2.13, 0.77, 6.44, 1.16, 7.19, 2.26, 1.13, 0.04, 0.72, 1.19, 0.99, 1.56, 0.7, 1.12, 2.39, 1.65, 2.94, 1.91, 0.66, 0.14, 5.58, 1.52, 5.31, 5.5, 8.49, 1.21, 0.84, 0.66, 2.13]} \ No newline at end of file diff --git a/annotations_1/AUbfGwY4Fco_filtered.json b/annotations_1/AUbfGwY4Fco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9148af652c45821cbceaa123c01998332ee194c4 --- /dev/null +++ b/annotations_1/AUbfGwY4Fco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.63], [2.0, 1.73], [2.0, 1.8], [2.0, 1.85], [2.0, 1.88], [2.0, 1.95], [2.0, 1.98], [2.0, 2.05], [2.0, 4.63], [6.0, 6.86], [10.0, 9.53], [10.0, 9.58], [10.0, 10.71], [12.0, 13.59], [15.0, 17.02], [18.0, 21.83], [23.0, 24.41], [26.0, 31.9], [33.0, 35.5], [37.0, 38.91], [43.0, 45.45], [48.0, 49.06], [51.0, 52.52], [54.0, 55.12], [57.0, 61.89], [63.0, 64.54], [69.0, 71.0], [73.0, 75.88], [78.0, 106.88], [108.0, 109.02], [110.0, 115.52], [117.0, 117.68], [119.0, 125.31], [126.0, 128.71], [130.0, 130.99], [132.0, 133.95], [135.0, 136.7], [138.0, 138.57], [139.0, 141.07], [142.0, 142.84], [143.0, 144.64], [145.0, 187.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 92.8, 0.0, 94.37, 44.96, 0.0, 56.86, 0.0, 0.0, 0.0, 76.37, 0.0, 91.64, 97.54, 49.18, 0.0, 37.76, 0.0, 36.9, 40.01, 0.0, 0.0, 0.0, 0.0, 36.26, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.77], ["speech", 32.38], ["sidetone", 3.18]], null, null, null, null, null, null, null, null, null, [["gong", 39.66], ["hum", 15.68], ["music", 12.45]], null, [["speech", 55.3], ["sidetone", 16.7], ["whale vocalization", 4.16]], null, [["whale vocalization", 29.16], ["throbbing", 9.35], ["music", 8.69]], [["hum", 40.73], ["throbbing", 9.66], ["music", 7.73]], null, null, null, null, [["music", 43.96], ["synthesizer", 7.61], ["sonar", 6.21]], null, null, null], "duration": [-0.37, -0.27, -0.2, -0.15, -0.12, -0.05, -0.02, 0.05, 2.63, 0.86, -0.47, -0.42, 0.71, 1.59, 2.02, 3.83, 1.41, 5.9, 2.5, 1.91, 2.45, 1.06, 1.52, 1.12, 4.89, 1.54, 2.0, 2.88, 28.88, 1.02, 5.52, 0.68, 6.31, 2.71, 0.99, 1.95, 1.7, 0.57, 2.07, 0.84, 1.64, 42.81]} \ No newline at end of file diff --git a/annotations_1/AV3CrPe-1q0_filtered.json b/annotations_1/AV3CrPe-1q0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4de898841b6958f11c08744853ff0b6273fde49b --- /dev/null +++ b/annotations_1/AV3CrPe-1q0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 18.98], [19.0, 19.01], [20.0, 26.11], [26.0, 26.52], [29.0, 31.63], [38.0, 41.37], [44.0, 57.62], [59.0, 63.54], [66.0, 65.75], [71.0, 82.68], [84.0, 157.2]], "keep_status": [true, false, false, false, true, true, false, true, false, false, false], "silence_prob": [31.57, 0.0, 31.67, 0.0, 36.96, 39.89, 31.16, 36.02, 0.0, 38.4, 0.0], "audiomae_on_audioset": [[["hum", 36.86], ["mains hum", 18.05], ["music", 13.66]], null, [["explosion", 31.28], ["speech", 30.2], ["eruption", 10.81]], null, [["speech", 20.86], ["whale vocalization", 20.48], ["fly, housefly", 4.91]], [["speech", 21.69], ["fly, housefly", 14.86], ["insect", 6.39]], [["speech", 60.25], ["music", 13.62], ["hum", 6.78]], [["whale vocalization", 24.74], ["music", 17.13], ["gurgling", 4.5]], null, [["music", 72.13], ["whale vocalization", 6.22], ["synthesizer", 4.47]], null], "duration": [13.98, 0.01, 6.11, 0.52, 2.63, 3.37, 13.62, 4.54, -0.25, 11.68, 73.2]} \ No newline at end of file diff --git a/annotations_1/AVHPmsWZnb4_filtered.json b/annotations_1/AVHPmsWZnb4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/AVHPmsWZnb4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/AVzJme0mGY8_filtered.json b/annotations_1/AVzJme0mGY8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/AVzJme0mGY8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/AWi8x9ctlps_filtered.json b/annotations_1/AWi8x9ctlps_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec735ca2f3d6bdb5e8d21edf3e071c4d73153917 --- /dev/null +++ b/annotations_1/AWi8x9ctlps_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.86], [9.0, 10.05], [12.0, 17.51], [19.0, 20.19], [23.0, 23.95], [26.0, 30.28], [35.0, 35.38], [36.0, 36.42], [37.0, 37.83], [39.0, 39.75], [45.0, 48.19], [50.0, 50.5], [52.0, 52.37], [54.0, 54.11], [54.0, 93.04], [93.0, 94.31], [96.0, 96.13], [98.0, 109.68], [110.0, 116.24], [117.0, 120.28], [122.0, 148.37], [150.0, 150.72], [153.0, 159.56], [160.0, 161.13], [162.0, 170.01], [171.0, 172.32], [174.0, 178.04]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 48.06, 0.0, 0.0, 44.29, 0.0, 0.0, 0.0, 0.0, 41.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.26, 36.49, 49.64, 58.05, 0.0, 99.78, 0.0, 88.83, 0.0, 99.99], "audiomae_on_audioset": [null, null, [["speech", 74.89], ["radio", 8.95], ["whale vocalization", 3.49]], null, null, [["speech", 20.19], ["music", 14.97], ["burst, pop", 8.85]], null, null, null, null, [["arrow", 9.67], ["mosquito", 8.46], ["croak", 7.64]], null, null, null, null, null, null, [["frog", 66.49], ["fly, housefly", 6.15], ["croak", 6.14]], [["speech", 79.73], ["radio", 9.42], ["sidetone", 3.63]], [["speech", 30.82], ["radio", 29.58], ["sidetone", 8.83]], null, null, null, null, null, null, null], "duration": [0.86, 1.05, 5.51, 1.19, 0.95, 4.28, 0.38, 0.42, 0.83, 0.75, 3.19, 0.5, 0.37, 0.11, 39.04, 1.31, 0.13, 11.68, 6.24, 3.28, 26.37, 0.72, 6.56, 1.13, 8.01, 1.32, 4.04]} \ No newline at end of file diff --git a/annotations_1/AWvRcWDr5y8_filtered.json b/annotations_1/AWvRcWDr5y8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a60c6512fe8638006eb96cd34ed411530e7021d --- /dev/null +++ b/annotations_1/AWvRcWDr5y8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[68.0, 71.74], [74.0, 74.46], [75.0, 76.6], [78.0, 82.97], [84.0, 84.23], [87.0, 88.08], [90.0, 93.16], [94.0, 104.18], [106.0, 107.23], [109.0, 112.21]], "keep_status": [true, false, false, true, false, false, true, true, false, true], "silence_prob": [30.44, 0.0, 0.0, 38.71, 0.0, 0.0, 35.65, 32.42, 0.0, 33.07], "audiomae_on_audioset": [[["music", 30.74], ["hum", 15.7], ["electronic music", 10.22]], null, null, [["hum", 36.78], ["mains hum", 18.68], ["throbbing", 10.31]], null, null, [["hum", 19.11], ["rumble", 14.98], ["music", 9.61]], [["rumble", 33.21], ["music", 17.96], ["hum", 11.19]], null, [["hum", 27.52], ["music", 13.8], ["mains hum", 6.04]]], "duration": [3.74, 0.46, 1.6, 4.97, 0.23, 1.08, 3.16, 10.18, 1.23, 3.21]} \ No newline at end of file diff --git a/annotations_1/AX-qpuOuDVg_filtered.json b/annotations_1/AX-qpuOuDVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..419030d6aaf7a1815103bd338b33beac599cb3af --- /dev/null +++ b/annotations_1/AX-qpuOuDVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 32.83], [36.0, 37.56], [39.0, 45.18], [46.0, 47.9], [49.0, 50.16], [52.0, 71.02], [72.0, 97.31], [99.0, 100.67]], "keep_status": [false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 33.94, 0.0, 0.0, 28.99, 29.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.47], ["hum", 13.69], ["electronic music", 9.38]], null, null, [["music", 32.18], ["gong", 12.4], ["synthesizer", 8.2]], [["music", 61.44], ["hum", 5.69], ["electronic music", 5.17]], null], "duration": [30.83, 1.56, 6.18, 1.9, 1.16, 19.02, 25.31, 1.67]} \ No newline at end of file diff --git a/annotations_1/AX4i2YZqE14_filtered.json b/annotations_1/AX4i2YZqE14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b13803fd1c75a9cacb97436041b86bb50ee8120 --- /dev/null +++ b/annotations_1/AX4i2YZqE14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.34], [3.0, 3.65], [5.0, 5.22], [8.0, 26.74], [31.0, 47.95], [49.0, 58.02], [59.0, 59.9], [60.0, 66.31], [71.0, 71.83], [74.0, 74.11], [74.0, 75.25], [77.0, 77.45], [80.0, 80.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.25, 28.32, 30.23, 0.0, 28.62, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 79.53], ["musical instrument", 2.63], ["synthesizer", 1.7]], [["music", 68.19], ["throbbing", 5.85], ["synthesizer", 5.64]], [["music", 36.45], ["throbbing", 22.37], ["hum", 11.34]], null, [["mains hum", 30.91], ["hum", 27.97], ["music", 16.46]], null, null, null, null, null], "duration": [0.34, 0.65, 0.22, 18.74, 16.95, 9.02, 0.9, 6.31, 0.83, 0.11, 1.25, 0.45, 0.77]} \ No newline at end of file diff --git a/annotations_1/AYQjmj7cSM0_filtered.json b/annotations_1/AYQjmj7cSM0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..240de2cbbaed3462ab86a7ab989fa72de29997bb --- /dev/null +++ b/annotations_1/AYQjmj7cSM0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 12.31], [15.0, 68.03], [72.0, 74.97], [77.0, 145.44], [149.0, 149.77]], "keep_status": [false, false, true, false, false], "silence_prob": [27.87, 0.0, 28.59, 0.0, 0.0], "audiomae_on_audioset": [[["music", 70.89], ["vehicle", 3.89], ["car", 1.94]], null, [["music", 51.77], ["mosquito", 6.33], ["noise", 3.7]], null, null], "duration": [12.31, 53.03, 2.97, 68.44, 0.77]} \ No newline at end of file diff --git a/annotations_1/AZ0AsuZu4ds_filtered.json b/annotations_1/AZ0AsuZu4ds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4741e0b5132e2716db7545421a159a5dea90ebc --- /dev/null +++ b/annotations_1/AZ0AsuZu4ds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.92], [15.0, 15.67], [18.0, 18.86], [20.0, 22.47], [24.0, 24.98], [26.0, 26.55], [30.0, 30.48], [31.0, 32.07], [48.0, 48.14], [55.0, 55.76], [58.0, 59.21], [61.0, 61.89], [64.0, 64.0], [65.0, 65.62], [73.0, 73.58], [76.0, 76.44], [78.0, 77.97], [79.0, 79.25], [80.0, 80.94], [82.0, 83.22], [84.0, 85.02], [91.0, 92.28], [93.0, 95.67], [106.0, 107.27], [112.0, 112.51], [121.0, 122.25], [124.0, 125.86], [132.0, 132.56], [135.0, 135.63], [147.0, 150.13], [151.0, 153.12], [154.0, 158.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.43, 100.0, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.08, 0.67, 0.86, 2.47, 0.98, 0.55, 0.48, 1.07, 0.14, 0.76, 1.21, 0.89, 0.0, 0.62, 0.58, 0.44, -0.03, 0.25, 0.94, 1.22, 1.02, 1.28, 2.67, 1.27, 0.51, 1.25, 1.86, 0.56, 0.63, 3.13, 2.12, 4.94]} \ No newline at end of file diff --git a/annotations_1/AZfCHDSJc8c_filtered.json b/annotations_1/AZfCHDSJc8c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65e3666f47bf6912bc440983e360e2959d374d72 --- /dev/null +++ b/annotations_1/AZfCHDSJc8c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [4.0, 9.73], [11.0, 14.23], [15.0, 16.16], [18.0, 30.79], [31.0, 32.0], [32.0, 33.69], [34.0, 34.05], [34.0, 37.39], [38.0, 38.52], [39.0, 42.08], [44.0, 45.82], [47.0, 48.9], [51.0, 51.92], [59.0, 62.87], [66.0, 65.74], [70.0, 70.93], [72.0, 73.47], [74.0, 91.02], [93.0, 93.7], [94.0, 95.84], [103.0, 104.14], [105.0, 106.34], [109.0, 131.36]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 36.93, 61.27, 0.0, 52.98, 0.0, 0.0, 0.0, 51.5, 0.0, 36.76, 0.0, 0.0, 0.0, 91.81, 0.0, 0.0, 0.0, 49.04, 0.0, 0.0, 0.0, 0.0, 30.39], "audiomae_on_audioset": [null, [["music", 56.88], ["sonar", 5.98], ["echo", 5.89]], null, null, null, null, null, null, null, null, [["whale vocalization", 56.81], ["animal", 12.12], ["livestock, farm animals, working animals", 5.89]], null, null, null, null, null, null, null, [["music", 45.17], ["hum", 5.61], ["musical instrument", 3.97]], null, null, null, null, [["music", 23.77], ["speech", 17.2], ["buzz", 7.67]]], "duration": [0.83, 5.73, 3.23, 1.16, 12.79, 1.0, 1.69, 0.05, 3.39, 0.52, 3.08, 1.82, 1.9, 0.92, 3.87, -0.26, 0.93, 1.47, 17.02, 0.7, 1.84, 1.14, 1.34, 22.36]} \ No newline at end of file diff --git a/annotations_1/AZxn9md_aZI_filtered.json b/annotations_1/AZxn9md_aZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..366848578d490fa349e433ba8f467780cccbae85 --- /dev/null +++ b/annotations_1/AZxn9md_aZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 12.11], [14.0, 18.42], [19.0, 20.24], [22.0, 43.01], [45.0, 45.71], [46.0, 48.2], [53.0, 57.62], [58.0, 60.56], [62.0, 62.72], [65.0, 67.42], [72.0, 85.4], [89.0, 101.58], [108.0, 109.58], [112.0, 117.14], [123.0, 123.28], [127.0, 135.57], [139.0, 144.09], [144.0, 155.22], [158.0, 159.75], [164.0, 165.3], [169.0, 169.91], [172.0, 182.65]], "keep_status": [true, false, false, false, false, false, false, true, false, true, false, true, false, true, false, false, false, true, false, false, false, false], "silence_prob": [45.11, 52.8, 0.0, 31.13, 0.0, 31.29, 29.97, 36.74, 0.0, 31.23, 29.93, 30.39, 0.0, 29.95, 0.0, 31.39, 78.72, 38.9, 0.0, 0.0, 0.0, 92.8], "audiomae_on_audioset": [[["crushing", 34.75], ["music", 13.52], ["mains hum", 6.41]], null, null, [["speech", 50.05], ["music", 15.76], ["breaking", 7.37]], null, [["speech", 53.83], ["grunt", 13.63], ["whale vocalization", 6.85]], [["music", 38.33], ["speech", 28.62], ["hum", 5.22]], [["creak", 33.86], ["music", 10.25], ["speech", 4.29]], null, [["speech", 43.17], ["hum", 8.88], ["sidetone", 4.2]], [["music", 62.41], ["speech", 15.56], ["whack, thwack", 5.67]], [["speech", 32.54], ["smash, crash", 18.13], ["breaking", 16.13]], null, [["music", 53.12], ["speech", 5.71], ["throbbing", 4.8]], null, [["crack", 81.19], ["breaking", 2.5], ["music", 2.15]], null, [["speech", 30.34], ["music", 17.3], ["sidetone", 9.51]], null, null, null, null], "duration": [10.11, 4.42, 1.24, 21.01, 0.71, 2.2, 4.62, 2.56, 0.72, 2.42, 13.4, 12.58, 1.58, 5.14, 0.28, 8.57, 5.09, 11.22, 1.75, 1.3, 0.91, 10.65]} \ No newline at end of file diff --git a/annotations_1/A_CGtuDwl-A_filtered.json b/annotations_1/A_CGtuDwl-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fe67856145227e8554e4a1370e9bae23aeea8ea --- /dev/null +++ b/annotations_1/A_CGtuDwl-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.28], [32.0, 34.97], [40.0, 41.12], [44.0, 45.17], [46.0, 48.42], [55.0, 83.47], [84.0, 85.31], [85.0, 97.38], [100.0, 100.68], [102.0, 102.09], [102.0, 116.55], [118.0, 119.45], [123.0, 123.65], [136.0, 140.78], [158.0, 160.03], [162.0, 166.5], [173.0, 175.24], [181.0, 181.97], [184.0, 185.85], [187.0, 189.01], [190.0, 190.93], [192.0, 194.51]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, true, true, true, true, false, false, true, false, false], "silence_prob": [0.0, 32.48, 0.0, 0.0, 32.42, 31.02, 0.0, 31.39, 0.0, 0.0, 31.13, 0.0, 0.0, 31.78, 29.71, 29.55, 30.79, 0.0, 0.0, 31.24, 0.0, 30.31], "audiomae_on_audioset": [null, [["music", 35.95], ["boing", 9.36], ["fly, housefly", 6.79]], null, null, [["music", 21.0], ["throbbing", 10.51], ["croak", 9.37]], [["music", 43.68], ["speech", 26.56], ["boing", 8.63]], null, [["music", 42.79], ["boing", 15.66], ["speech", 15.17]], null, null, [["livestock, farm animals, working animals", 34.58], ["cattle, bovinae", 22.27], ["moo", 19.65]], null, null, [["music", 27.39], ["speech", 16.38], ["mains hum", 8.81]], [["music", 51.4], ["musical instrument", 5.88], ["pulse", 4.0]], [["music", 56.79], ["throbbing", 8.02], ["hum", 4.67]], [["speech", 40.68], ["music", 10.01], ["vehicle", 9.14]], null, null, [["music", 49.93], ["cacophony", 14.38], ["speech", 5.29]], null, [["throbbing", 43.08], ["music", 32.67], ["hum", 14.84]]], "duration": [0.28, 2.97, 1.12, 1.17, 2.42, 28.47, 1.31, 12.38, 0.68, 0.09, 14.55, 1.45, 0.65, 4.78, 2.03, 4.5, 2.24, 0.97, 1.85, 2.01, 0.93, 2.51]} \ No newline at end of file diff --git a/annotations_1/A_HjMIjzyMU_filtered.json b/annotations_1/A_HjMIjzyMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e5c306de0c732e0db0e568451ba4d69e8ef28e6 --- /dev/null +++ b/annotations_1/A_HjMIjzyMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.75], [5.0, 7.82], [10.0, 10.83], [14.0, 15.33], [19.0, 20.29], [24.0, 24.92], [27.0, 28.98], [36.0, 38.23], [39.0, 39.45], [54.0, 57.62], [59.0, 86.44], [88.0, 103.4], [106.0, 107.1], [109.0, 117.69], [119.0, 119.42], [123.0, 125.95], [126.0, 127.47], [130.0, 220.04], [222.0, 245.13], [248.0, 248.29]], "keep_status": [false, true, false, false, false, false, false, false, false, true, true, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 47.66, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 43.71, 30.74, 31.01, 0.0, 30.8, 0.0, 30.52, 0.0, 0.0, 33.45, 0.0], "audiomae_on_audioset": [null, [["music", 48.87], ["theremin", 4.43], ["musical instrument", 3.73]], null, null, null, null, null, null, null, [["music", 42.97], ["musical instrument", 11.96], ["speech", 4.79]], [["music", 41.34], ["speech", 9.37], ["moo", 6.12]], [["music", 50.42], ["speech", 4.23], ["throbbing", 3.62]], null, [["music", 39.52], ["hum", 13.58], ["throbbing", 7.62]], null, [["cattle, bovinae", 37.61], ["moo", 32.42], ["livestock, farm animals, working animals", 14.93]], null, null, [["music", 49.33], ["speech", 25.95], ["electronic music", 3.54]], null], "duration": [1.75, 2.82, 0.83, 1.33, 1.29, 0.92, 1.98, 2.23, 0.45, 3.62, 27.44, 15.4, 1.1, 8.69, 0.42, 2.95, 1.47, 90.04, 23.13, 0.29]} \ No newline at end of file diff --git a/annotations_1/A_R76lKU0DI_filtered.json b/annotations_1/A_R76lKU0DI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57c051ad5068eb44ca73140e5cf8eeff3a5d7453 --- /dev/null +++ b/annotations_1/A_R76lKU0DI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.92], [7.0, 7.52], [9.0, 9.86], [11.0, 12.07], [14.0, 14.17], [15.0, 16.73], [19.0, 19.35], [21.0, 21.47], [34.0, 34.94], [41.0, 42.58], [45.0, 46.85], [52.0, 52.03], [54.0, 55.54], [61.0, 66.73], [70.0, 71.15], [74.0, 76.22], [79.0, 79.03], [81.0, 81.01], [83.0, 83.44], [87.0, 87.89], [93.0, 94.66], [97.0, 97.44], [106.0, 106.49], [119.0, 119.57], [122.0, 122.3], [124.0, 125.42], [125.0, 126.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.65, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 70.68], ["music", 8.72], ["speech", 6.71]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.92, 0.52, 0.86, 1.07, 0.17, 1.73, 0.35, 0.47, 0.94, 1.58, 1.85, 0.03, 1.54, 5.73, 1.15, 2.22, 0.03, 0.01, 0.44, 0.89, 1.66, 0.44, 0.49, 0.57, 0.3, 1.42, 1.45]} \ No newline at end of file diff --git a/annotations_1/A_bC8fF6WZE_filtered.json b/annotations_1/A_bC8fF6WZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c401f41223528078daba9bf3e0d9c6f372554d8 --- /dev/null +++ b/annotations_1/A_bC8fF6WZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.89], [5.0, 9.37], [10.0, 10.94], [15.0, 15.28], [18.0, 18.99], [20.0, 22.91], [24.0, 26.94], [32.0, 33.49], [35.0, 35.28], [37.0, 37.83], [41.0, 45.59], [46.0, 45.62], [46.0, 46.11], [48.0, 53.6], [56.0, 57.62], [59.0, 63.96], [65.0, 65.65], [67.0, 71.42], [76.0, 95.76], [98.0, 98.22], [100.0, 100.14], [102.0, 103.08], [106.0, 109.92], [111.0, 114.45], [120.0, 123.99], [126.0, 127.16]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, true, false, false, false, false, true, true, false], "silence_prob": [0.0, 34.28, 0.0, 0.0, 0.0, 81.17, 99.71, 0.0, 0.0, 0.0, 32.83, 0.0, 0.0, 30.87, 0.0, 40.04, 0.0, 44.23, 36.48, 0.0, 0.0, 0.0, 35.22, 29.36, 30.45, 0.0], "audiomae_on_audioset": [null, [["music", 29.29], ["mains hum", 18.08], ["hum", 17.12]], null, null, null, null, null, null, null, null, [["music", 28.16], ["hum", 26.35], ["mains hum", 14.18]], null, null, [["animal", 39.78], ["livestock, farm animals, working animals", 27.58], ["cowbell", 9.06]], null, [["speech", 33.74], ["music", 18.74], ["noise", 10.22]], null, [["whale vocalization", 14.75], ["music", 11.66], ["animal", 5.61]], [["speech", 37.35], ["hum", 23.7], ["mains hum", 6.57]], null, null, null, [["music", 56.25], ["speech", 17.69], ["mosquito", 2.16]], [["speech", 14.3], ["cattle, bovinae", 10.65], ["livestock, farm animals, working animals", 8.45]], [["speech", 37.33], ["music", 27.87], ["vehicle", 4.19]], null], "duration": [1.89, 4.37, 0.94, 0.28, 0.99, 2.91, 2.94, 1.49, 0.28, 0.83, 4.59, -0.38, 0.11, 5.6, 1.62, 4.96, 0.65, 4.42, 19.76, 0.22, 0.14, 1.08, 3.92, 3.45, 3.99, 1.16]} \ No newline at end of file diff --git a/annotations_1/A_n2FjVMiVY_filtered.json b/annotations_1/A_n2FjVMiVY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc044221d7ef8e532f6e0e208836452fb81f9b38 --- /dev/null +++ b/annotations_1/A_n2FjVMiVY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.59], [10.0, 21.1], [23.0, 23.01], [23.0, 99.42]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 40.4, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 43.32], ["throbbing", 15.54], ["mains hum", 11.39]], null, null], "duration": [-0.41, 11.1, 0.01, 76.42]} \ No newline at end of file diff --git a/annotations_1/AaMkmiZ9bMM_filtered.json b/annotations_1/AaMkmiZ9bMM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db21c770d5cd256764d770a1de5379155936fc01 --- /dev/null +++ b/annotations_1/AaMkmiZ9bMM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.86], [8.0, 18.69], [20.0, 20.22], [22.0, 23.36], [24.0, 27.01], [31.0, 31.31], [32.0, 33.08], [35.0, 35.68], [36.0, 36.83], [39.0, 41.1], [45.0, 45.5], [46.0, 47.44], [48.0, 49.08], [51.0, 52.81], [53.0, 53.0], [54.0, 54.73], [55.0, 72.06], [76.0, 78.73], [80.0, 81.38], [90.0, 90.56], [92.0, 93.73], [95.0, 96.25], [108.0, 108.9], [112.0, 119.06], [133.0, 134.3], [143.0, 148.36], [155.0, 157.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, true], "silence_prob": [91.3, 64.75, 0.0, 0.0, 37.01, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.51, 31.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.02, 0.0, 30.91, 35.28], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 39.68], ["fly, housefly", 17.77], ["speech", 14.28]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.79], ["groan", 8.38], ["animal", 6.71]], [["music", 17.05], ["frog", 10.45], ["moo", 8.4]], null, null, null, null, null, [["speech", 45.21], ["rowboat, canoe, kayak", 17.02], ["splash, splatter", 11.02]], null, [["frog", 20.83], ["music", 12.99], ["croak", 6.75]], [["fly, housefly", 20.84], ["whale vocalization", 16.34], ["insect", 13.17]]], "duration": [2.86, 10.69, 0.22, 1.36, 3.01, 0.31, 1.08, 0.68, 0.83, 2.1, 0.5, 1.44, 1.08, 1.81, 0.0, 0.73, 17.06, 2.73, 1.38, 0.56, 1.73, 1.25, 0.9, 7.06, 1.3, 5.36, 2.82]} \ No newline at end of file diff --git a/annotations_1/AcSDeQhGGFM_filtered.json b/annotations_1/AcSDeQhGGFM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7598c7f5d9c6600fdc58547f813702668d551618 --- /dev/null +++ b/annotations_1/AcSDeQhGGFM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.58], [6.0, 7.52], [8.0, 8.9], [9.0, 10.05], [11.0, 15.06], [18.0, 19.03], [19.0, 19.47], [24.0, 24.12], [24.0, 24.49], [25.0, 26.32], [28.0, 28.46], [29.0, 30.01], [32.0, 35.55], [37.0, 41.08], [44.0, 45.6], [46.0, 52.68], [54.0, 55.32], [57.0, 57.89], [59.0, 59.58], [60.0, 60.17], [65.0, 66.29], [71.0, 71.25], [72.0, 86.14], [87.0, 88.7], [89.0, 90.98], [93.0, 95.25], [97.0, 98.34], [101.0, 102.76], [103.0, 111.82], [113.0, 115.53], [133.0, 157.69], [161.0, 164.15], [169.0, 171.04], [180.0, 180.71], [181.0, 182.76], [188.0, 188.7], [189.0, 190.8], [193.0, 194.27], [199.0, 200.94], [204.0, 205.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 85.72, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.73, 0.0, 0.0, 100.0, 0.0, 0.0, 86.82, 100.0, 93.6, 62.58, 66.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.58, 1.52, 0.9, 1.05, 4.06, 1.03, 0.47, 0.12, 0.49, 1.32, 0.46, 1.01, 3.55, 4.08, 1.6, 6.68, 1.32, 0.89, 0.58, 0.17, 1.29, 0.25, 14.14, 1.7, 1.98, 2.25, 1.34, 1.76, 8.82, 2.53, 24.69, 3.15, 2.04, 0.71, 1.76, 0.7, 1.8, 1.27, 1.94, 1.36]} \ No newline at end of file diff --git a/annotations_1/AcvWJ8bgA8w_filtered.json b/annotations_1/AcvWJ8bgA8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..552945209c6c2552ae0e49ba3f04162cd0cf18cc --- /dev/null +++ b/annotations_1/AcvWJ8bgA8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.35], [8.0, 11.53], [12.0, 13.02], [15.0, 24.22], [25.0, 27.5], [29.0, 33.27], [34.0, 34.33], [38.0, 39.38], [40.0, 41.47], [42.0, 42.72], [45.0, 45.67], [48.0, 49.79], [51.0, 53.16], [55.0, 54.97], [57.0, 59.73], [60.0, 60.72], [64.0, 75.57], [78.0, 77.99], [80.0, 79.96], [83.0, 82.71], [87.0, 88.28], [89.0, 95.98], [96.0, 97.55], [99.0, 100.82], [102.0, 104.8], [108.0, 110.02], [111.0, 110.98], [112.0, 117.64], [122.0, 125.17], [126.0, 129.52], [130.0, 137.3], [138.0, 139.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.95, 0.0, 72.01, 65.67, 68.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 51.39, 0.0, 52.56, 0.0, 0.0, 0.0, 0.0, 95.51, 0.0, 0.0, 88.64, 89.72, 0.0, 83.16, 96.77, 91.64, 61.18, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.35, 3.53, 1.02, 9.22, 2.5, 4.27, 0.33, 1.38, 1.47, 0.72, 0.67, 1.79, 2.16, -0.03, 2.73, 0.72, 11.57, -0.01, -0.04, -0.29, 1.28, 6.98, 1.55, 1.82, 2.8, 2.02, -0.02, 5.64, 3.17, 3.52, 7.3, 1.73]} \ No newline at end of file diff --git a/annotations_1/Ad2-FiCzJxc_filtered.json b/annotations_1/Ad2-FiCzJxc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cef4386f45ca1385c0de2527bd25059d41f4229a --- /dev/null +++ b/annotations_1/Ad2-FiCzJxc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 19.65], [27.0, 28.02], [30.0, 31.55], [37.0, 37.5], [46.0, 47.33], [50.0, 51.27], [57.0, 57.37], [102.0, 102.07], [140.0, 140.41], [147.0, 147.6], [168.0, 167.88], [180.0, 181.79], [223.0, 223.32], [232.0, 232.29], [240.0, 240.68], [259.0, 259.16], [289.0, 290.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 60.01], ["musical instrument", 10.75], ["piano", 5.91]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [16.65, 1.02, 1.55, 0.5, 1.33, 1.27, 0.37, 0.07, 0.41, 0.6, -0.12, 1.79, 0.32, 0.29, 0.68, 0.16, 1.87]} \ No newline at end of file diff --git a/annotations_1/Af-N8CLLoqU_filtered.json b/annotations_1/Af-N8CLLoqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7557e28df5bc757ee29a32608adde4b5ce1de52 --- /dev/null +++ b/annotations_1/Af-N8CLLoqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.6], [3.0, 4.55], [8.0, 7.74], [13.0, 13.2], [14.0, 15.31], [18.0, 19.47], [20.0, 21.17], [22.0, 22.33], [24.0, 24.26], [28.0, 27.95], [33.0, 33.61], [35.0, 69.16], [72.0, 110.46], [118.0, 119.47], [121.0, 144.98], [147.0, 147.88], [148.0, 149.81], [152.0, 151.7], [154.0, 154.21], [157.0, 157.22], [158.0, 159.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.63], ["horse", 7.96], ["animal", 7.42]], null, null, null, null, null, null], "duration": [0.6, 1.55, -0.26, 0.2, 1.31, 1.47, 1.17, 0.33, 0.26, -0.05, 0.61, 34.16, 38.46, 1.47, 23.98, 0.88, 1.81, -0.3, 0.21, 0.22, 1.17]} \ No newline at end of file diff --git a/annotations_1/Afwy5S9__0E_filtered.json b/annotations_1/Afwy5S9__0E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce4088e2029e39ae120092fba984dab85fc4de01 --- /dev/null +++ b/annotations_1/Afwy5S9__0E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 18.08], [32.0, 32.44], [54.0, 54.55], [60.0, 59.81], [65.0, 65.23], [75.0, 75.88], [94.0, 94.27], [103.0, 104.09]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [31.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 78.04], ["musical instrument", 4.57], ["banjo", 3.6]], null, null, null, null, null, null, null], "duration": [6.08, 0.44, 0.55, -0.19, 0.23, 0.88, 0.27, 1.09]} \ No newline at end of file diff --git a/annotations_1/AgNH9Ktkrqk_filtered.json b/annotations_1/AgNH9Ktkrqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad8c7f74a6b98637ec217d49c32316fd07138272 --- /dev/null +++ b/annotations_1/AgNH9Ktkrqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.99], [12.0, 12.16], [16.0, 16.46], [17.0, 17.69], [21.0, 22.52], [24.0, 25.39], [35.0, 35.46], [37.0, 37.67], [45.0, 45.27], [46.0, 53.6], [55.0, 56.3], [60.0, 62.24], [66.0, 66.39], [67.0, 68.18], [70.0, 71.79], [75.0, 79.51], [80.0, 80.89], [82.0, 83.78], [85.0, 90.44], [94.0, 94.64], [96.0, 96.65], [98.0, 100.87], [102.0, 108.28], [110.0, 110.19], [112.0, 114.84], [116.0, 119.31], [123.0, 123.43], [125.0, 125.63], [135.0, 136.27], [137.0, 138.25], [140.0, 140.27], [142.0, 142.38], [144.0, 151.44], [153.0, 154.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.68, 0.0, 38.19, 0.0, 0.0, 0.0, 32.3, 0.0, 0.0, 32.46, 0.0, 0.0, 31.94, 31.59, 0.0, 30.58, 29.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.48, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 63.71], ["synthesizer", 5.26], ["musical instrument", 4.7]], null, [["music", 27.78], ["synthesizer", 20.49], ["keyboard (musical)", 6.92]], null, null, null, [["music", 60.6], ["speech", 8.33], ["firecracker", 2.77]], null, null, [["music", 61.91], ["swing music", 4.67], ["trombone", 3.96]], null, null, [["music", 53.94], ["reggae", 4.05], ["swing music", 3.3]], [["music", 55.42], ["mains hum", 7.22], ["hum", 6.34]], null, [["music", 48.66], ["didgeridoo", 10.23], ["musical instrument", 5.16]], [["livestock, farm animals, working animals", 49.67], ["cattle, bovinae", 28.47], ["moo", 14.32]], null, null, null, null, null, null, [["music", 41.77], ["skateboard", 21.61], ["groan", 2.95]], null], "duration": [1.99, 0.16, 0.46, 0.69, 1.52, 1.39, 0.46, 0.67, 0.27, 7.6, 1.3, 2.24, 0.39, 1.18, 1.79, 4.51, 0.89, 1.78, 5.44, 0.64, 0.65, 2.87, 6.28, 0.19, 2.84, 3.31, 0.43, 0.63, 1.27, 1.25, 0.27, 0.38, 7.44, 1.13]} \ No newline at end of file diff --git a/annotations_1/AhZw2QXKT1A_filtered.json b/annotations_1/AhZw2QXKT1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0c3b70654ac37069ae83e03aea4f2324654c778 --- /dev/null +++ b/annotations_1/AhZw2QXKT1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 18.59], [19.0, 29.34], [32.0, 32.02], [35.0, 35.83], [38.0, 40.42], [47.0, 55.36], [57.0, 61.37], [65.0, 113.1], [114.0, 114.15], [115.0, 125.73], [127.0, 133.08], [134.0, 139.55], [141.0, 145.05], [145.0, 145.94], [148.0, 148.78], [151.0, 154.87], [156.0, 157.89], [158.0, 158.85], [160.0, 161.82], [163.0, 165.18], [166.0, 167.61], [168.0, 170.53], [175.0, 176.03]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, true, true, false, false, true, false, false, false, false, false, true, false], "silence_prob": [41.42, 62.68, 0.0, 0.0, 45.52, 30.89, 31.94, 0.0, 0.0, 28.96, 68.02, 33.86, 31.43, 0.0, 0.0, 30.12, 0.0, 0.0, 0.0, 42.74, 0.0, 41.4, 0.0], "audiomae_on_audioset": [[["music", 26.21], ["hum", 18.5], ["speech", 7.57]], null, null, null, [["music", 30.56], ["creak", 6.97], ["foghorn", 3.57]], [["music", 48.71], ["didgeridoo", 15.18], ["mains hum", 7.77]], [["music", 54.55], ["didgeridoo", 4.58], ["musical instrument", 2.72]], null, null, [["music", 63.74], ["groan", 4.21], ["theremin", 3.03]], null, [["music", 21.83], ["grunt", 15.22], ["didgeridoo", 9.11]], [["mains hum", 19.01], ["explosion", 18.86], ["speech", 16.07]], null, null, [["whale vocalization", 29.48], ["music", 12.32], ["animal", 9.31]], null, null, null, [["music", 38.86], ["didgeridoo", 27.49], ["speech", 7.92]], null, [["didgeridoo", 21.97], ["frog", 20.67], ["croak", 13.09]], null], "duration": [8.59, 10.34, 0.02, 0.83, 2.42, 8.36, 4.37, 48.1, 0.15, 10.73, 6.08, 5.55, 4.05, 0.94, 0.78, 3.87, 1.89, 0.85, 1.82, 2.18, 1.61, 2.53, 1.03]} \ No newline at end of file diff --git a/annotations_1/AhbCYVILusc_filtered.json b/annotations_1/AhbCYVILusc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e572c8335480a940aa8292bbfd3ff03fa6b3b555 --- /dev/null +++ b/annotations_1/AhbCYVILusc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.76], [7.0, 8.83], [11.0, 10.72], [13.0, 12.88], [14.0, 14.49], [17.0, 18.05], [19.0, 20.48], [21.0, 22.49], [28.0, 28.76], [35.0, 34.74], [38.0, 105.48], [106.0, 110.2], [111.0, 119.26], [121.0, 147.09], [149.0, 156.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.42, 34.39, 31.98, 34.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["thunk", 28.49], ["music", 24.76], ["speech", 11.7]], [["music", 47.98], ["boing", 14.86], ["hum", 2.48]], [["speech", 35.72], ["music", 29.59], ["percussion", 4.67]], [["music", 78.08], ["synthesizer", 3.56], ["electronic music", 2.64]]], "duration": [0.76, 1.83, -0.28, -0.12, 0.49, 1.05, 1.48, 1.49, 0.76, -0.26, 67.48, 4.2, 8.26, 26.09, 7.96]} \ No newline at end of file diff --git a/annotations_1/AhcxeUrWTRc_filtered.json b/annotations_1/AhcxeUrWTRc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..faff9cf643646a0526d7fea6f90778e24d988884 --- /dev/null +++ b/annotations_1/AhcxeUrWTRc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 17.96], [19.0, 19.67], [38.0, 39.46], [42.0, 49.59], [53.0, 53.33], [55.0, 65.65], [80.0, 80.18], [82.0, 85.68], [97.0, 116.09], [117.0, 141.24], [147.0, 153.27], [158.0, 190.34], [194.0, 194.17]], "keep_status": [false, false, false, true, false, false, false, false, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.65, 0.0, 32.64, 0.0, 37.41, 30.8, 29.45, 30.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 15.86], ["speech", 9.91], ["livestock, farm animals, working animals", 6.09]], null, [["speech", 34.98], ["music", 30.41], ["foghorn", 11.43]], null, [["music", 57.74], ["speech", 25.39], ["boing", 2.57]], [["foghorn", 42.36], ["speech", 18.52], ["vehicle", 6.88]], [["music", 33.76], ["speech", 11.12], ["foghorn", 7.35]], [["music", 55.25], ["hum", 7.7], ["throbbing", 6.78]], null, null], "duration": [-0.04, 0.67, 1.46, 7.59, 0.33, 10.65, 0.18, 3.68, 19.09, 24.24, 6.27, 32.34, 0.17]} \ No newline at end of file diff --git a/annotations_1/Ai5tZ8_dQUU_filtered.json b/annotations_1/Ai5tZ8_dQUU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a150c8e840a3eb527f8f4a99d8b95c714e73e574 --- /dev/null +++ b/annotations_1/Ai5tZ8_dQUU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.18], [14.0, 14.13], [19.0, 23.79], [25.0, 25.66], [32.0, 48.78], [51.0, 51.75], [53.0, 56.2], [58.0, 58.51], [70.0, 70.19], [71.0, 73.48], [78.0, 89.8], [90.0, 96.7], [98.0, 104.53], [105.0, 105.95], [107.0, 106.93], [113.0, 113.19], [125.0, 126.13], [127.0, 126.96], [128.0, 127.79], [141.0, 141.54], [142.0, 149.01], [150.0, 150.84]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.52, 0.0, 91.13, 0.0, 39.6, 0.0, 33.48, 0.0, 0.0, 38.4, 43.77, 100.0, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.84, 0.0], "audiomae_on_audioset": [[["speech", 47.3], ["stomach rumble", 18.57], ["sidetone", 8.57]], null, null, null, [["fly, housefly", 32.23], ["mosquito", 13.96], ["insect", 12.59]], null, [["speech", 73.15], ["door", 2.51], ["ping", 2.05]], null, null, [["speech", 56.66], ["music", 13.77], ["boing", 3.06]], [["speech", 73.82], ["electric shaver, electric razor", 6.66], ["livestock, farm animals, working animals", 2.59]], null, null, null, null, null, null, null, null, null, [["speech", 75.74], ["telephone", 3.67], ["whack, thwack", 3.34]], null], "duration": [11.18, 0.13, 4.79, 0.66, 16.78, 0.75, 3.2, 0.51, 0.19, 2.48, 11.8, 6.7, 6.53, 0.95, -0.07, 0.19, 1.13, -0.04, -0.21, 0.54, 7.01, 0.84]} \ No newline at end of file diff --git a/annotations_1/Ajh84X59SH4_filtered.json b/annotations_1/Ajh84X59SH4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc8ceab2a0fdd03487ebd7a664020113af5a5a56 --- /dev/null +++ b/annotations_1/Ajh84X59SH4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.77], [18.0, 19.21], [28.0, 48.86], [57.0, 57.03], [62.0, 82.83], [84.0, 96.7], [97.0, 112.65]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [30.12, 0.0, 30.79, 0.0, 30.48, 30.16, 29.63], "audiomae_on_audioset": [[["music", 69.51], ["whale vocalization", 8.22], ["electronic music", 3.37]], null, [["music", 77.86], ["theremin", 3.47], ["brass instrument", 1.51]], null, [["music", 50.5], ["whale vocalization", 34.4], ["gurgling", 2.62]], [["music", 73.54], ["throbbing", 6.5], ["hum", 2.41]], [["speech", 48.61], ["music", 10.51], ["hum", 6.41]]], "duration": [9.77, 1.21, 20.86, 0.03, 20.83, 12.7, 15.65]} \ No newline at end of file diff --git a/annotations_1/Ak8uiLVkpy4_filtered.json b/annotations_1/Ak8uiLVkpy4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..715d132d81d4ae02269391236990fa0e037fbfb8 --- /dev/null +++ b/annotations_1/Ak8uiLVkpy4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.96], [4.0, 4.56], [5.0, 5.63], [6.0, 7.52], [9.0, 9.29], [11.0, 14.55], [17.0, 17.76], [21.0, 23.3], [25.0, 28.09], [29.0, 30.89], [32.0, 32.44], [34.0, 36.02], [38.0, 40.07], [41.0, 48.81], [50.0, 51.8], [54.0, 55.68], [57.0, 59.22], [62.0, 65.53], [68.0, 70.28], [71.0, 74.76], [76.0, 77.04], [81.0, 82.56], [85.0, 92.5], [96.0, 98.39], [100.0, 100.23], [103.0, 103.49], [107.0, 107.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 85.54, 99.05, 0.0, 0.0, 92.8, 64.63, 50.66, 0.0, 0.0, 58.38, 58.89, 60.6, 52.92, 0.0, 0.0, 47.5, 46.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.47], ["speech", 15.75], ["hum", 11.16]], [["music", 65.32], ["theremin", 2.88], ["foghorn", 2.74]], null, null, null], "duration": [-0.04, 0.56, 0.63, 1.52, 0.29, 3.55, 0.76, 2.3, 3.09, 1.89, 0.44, 2.02, 2.07, 7.81, 1.8, 1.68, 2.22, 3.53, 2.28, 3.76, 1.04, 1.56, 7.5, 2.39, 0.23, 0.49, 0.86]} \ No newline at end of file diff --git a/annotations_1/AkaPD_qTmok_filtered.json b/annotations_1/AkaPD_qTmok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecfc728dd5448546b648617e00237bc60f421f6a --- /dev/null +++ b/annotations_1/AkaPD_qTmok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.71], [7.0, 7.53], [9.0, 9.58], [13.0, 13.91], [16.0, 16.31], [23.0, 23.9], [28.0, 38.01], [39.0, 40.22], [43.0, 42.75], [43.0, 61.96], [63.0, 70.46], [76.0, 99.74], [102.0, 105.16], [111.0, 110.62], [111.0, 115.52], [117.0, 117.07], [122.0, 122.1], [128.0, 128.97], [130.0, 148.49], [149.0, 151.28], [158.0, 157.98], [171.0, 171.8], [173.0, 174.58], [176.0, 176.77], [178.0, 178.19], [182.0, 182.22], [184.0, 184.42], [189.0, 189.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.66, 0.0, 0.0, 48.39, 64.86, 37.91, 30.01, 0.0, 32.85, 0.0, 0.0, 0.0, 100.0, 82.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 56.38], ["grunt", 11.58], ["throbbing", 11.28]], null, null, [["music", 43.43], ["speech", 33.65], ["bouncing", 3.73]], null, [["speech", 25.66], ["whack, thwack", 12.65], ["music", 10.17]], [["animal", 13.27], ["music", 12.49], ["synthesizer", 9.75]], null, [["speech", 79.11], ["thunk", 7.97], ["inside, small room", 2.02]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.71, 0.53, 0.58, 0.91, 0.31, 0.9, 10.01, 1.22, -0.25, 18.96, 7.46, 23.74, 3.16, -0.38, 4.52, 0.07, 0.1, 0.97, 18.49, 2.28, -0.02, 0.8, 1.58, 0.77, 0.19, 0.22, 0.42, 0.51]} \ No newline at end of file diff --git a/annotations_1/AkjImI2Qpew_filtered.json b/annotations_1/AkjImI2Qpew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54f389b864f555087ffcf252f0c9a650e3cde303 --- /dev/null +++ b/annotations_1/AkjImI2Qpew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.61], [9.0, 12.11], [21.0, 25.02], [26.0, 35.28], [42.0, 43.26], [45.0, 45.91], [47.0, 50.13], [52.0, 52.73], [53.0, 59.37], [63.0, 65.65], [71.0, 76.01], [78.0, 81.11], [82.0, 82.07], [85.0, 87.13], [88.0, 89.5], [110.0, 110.17], [111.0, 115.8], [119.0, 125.56], [130.0, 130.22], [132.0, 132.27], [134.0, 136.65], [138.0, 138.55], [141.0, 142.7], [147.0, 147.14], [150.0, 150.42], [153.0, 153.62], [156.0, 157.11], [161.0, 163.17], [165.0, 164.81]], "keep_status": [false, true, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.69, 46.19, 48.95, 0.0, 0.0, 47.62, 0.0, 39.85, 49.64, 37.15, 42.81, 0.0, 52.33, 0.0, 0.0, 48.61, 45.85, 0.0, 0.0, 48.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.36, 0.0], "audiomae_on_audioset": [null, [["music", 31.51], ["brass instrument", 17.32], ["trombone", 16.75]], [["hum", 34.12], ["rumble", 22.83], ["music", 17.91]], [["hum", 50.73], ["music", 14.46], ["mains hum", 13.89]], null, null, [["music", 36.8], ["hum", 9.43], ["throbbing", 6.25]], null, [["music", 38.64], ["hum", 21.77], ["mains hum", 14.4]], [["music", 43.8], ["rumble", 5.9], ["ambient music", 5.83]], [["mains hum", 18.94], ["hum", 15.93], ["breaking", 12.76]], [["music", 68.59], ["ambient music", 4.14], ["electronic music", 2.88]], null, null, null, null, [["music", 74.74], ["hum", 3.88], ["synthesizer", 2.16]], [["hum", 51.99], ["throbbing", 15.8], ["music", 10.95]], null, null, [["hum", 65.03], ["throbbing", 18.49], ["mains hum", 12.93]], null, null, null, null, null, null, null, null], "duration": [0.61, 3.11, 4.02, 9.28, 1.26, 0.91, 3.13, 0.73, 6.37, 2.65, 5.01, 3.11, 0.07, 2.13, 1.5, 0.17, 4.8, 6.56, 0.22, 0.27, 2.65, 0.55, 1.7, 0.14, 0.42, 0.62, 1.11, 2.17, -0.19]} \ No newline at end of file diff --git a/annotations_1/Aks95ziAQXU_filtered.json b/annotations_1/Aks95ziAQXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bde22b07ed769730a6412d6326f9fc331103c97d --- /dev/null +++ b/annotations_1/Aks95ziAQXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.4], [0.0, 1.73], [4.0, 3.69], [6.0, 5.97], [6.0, 6.49], [9.0, 10.17], [15.0, 15.33], [25.0, 25.41], [33.0, 35.18], [37.0, 39.58], [41.0, 43.12], [47.0, 47.65], [52.0, 53.97], [55.0, 55.88], [59.0, 59.78], [60.0, 60.56], [67.0, 67.53], [71.0, 71.51], [80.0, 80.28], [81.0, 81.63], [82.0, 82.88], [85.0, 85.58], [93.0, 95.49], [96.0, 97.23], [109.0, 109.88], [119.0, 119.31], [121.0, 121.81], [136.0, 136.54], [148.0, 148.83], [163.0, 163.63], [169.0, 169.28], [171.0, 173.31], [174.0, 178.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.98, 96.66, 40.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13, 76.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["sine wave", 42.92], ["speech", 19.24], ["chirp tone", 18.68]], null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 57.02], ["speech", 27.92], ["music", 2.68]], null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 1.73, -0.31, -0.03, 0.49, 1.17, 0.33, 0.41, 2.18, 2.58, 2.12, 0.65, 1.97, 0.88, 0.78, 0.56, 0.53, 0.51, 0.28, 0.63, 0.88, 0.58, 2.49, 1.23, 0.88, 0.31, 0.81, 0.54, 0.83, 0.63, 0.28, 2.31, 4.55]} \ No newline at end of file diff --git a/annotations_1/AmCR7Owu6R8_filtered.json b/annotations_1/AmCR7Owu6R8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5761691439adf22a18bba1a67e4496c20c232d4f --- /dev/null +++ b/annotations_1/AmCR7Owu6R8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.16], [9.0, 10.4], [12.0, 14.13], [16.0, 15.9], [18.0, 22.01], [26.0, 28.97], [32.0, 33.3], [38.0, 39.93], [44.0, 44.93], [47.0, 48.12], [50.0, 51.31], [53.0, 54.31], [56.0, 58.75], [64.0, 65.62], [67.0, 68.61], [70.0, 70.63], [72.0, 74.48], [81.0, 83.24], [88.0, 89.46], [94.0, 96.5], [99.0, 100.85], [103.0, 105.04], [107.0, 108.35], [111.0, 113.63], [115.0, 116.45], [117.0, 119.74], [121.0, 122.45], [124.0, 126.12], [127.0, 128.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [77.87, 0.0, 74.6, 0.0, 71.87, 53.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.28, 0.0, 0.0, 0.0, 47.74, 57.56, 0.0, 49.31, 0.0, 82.97, 0.0, 61.67, 0.0, 43.28, 0.0, 59.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.45], ["music", 24.66], ["hum", 6.72]], null, null, [["music", 35.68], ["speech", 30.44], ["hum", 4.15]], null, null, null, null, null, [["music", 31.76], ["speech", 25.7], ["hum", 3.05]], null, null, null], "duration": [2.16, 1.4, 2.13, -0.1, 4.01, 2.97, 1.3, 1.93, 0.93, 1.12, 1.31, 1.31, 2.75, 1.62, 1.61, 0.63, 2.48, 2.24, 1.46, 2.5, 1.85, 2.04, 1.35, 2.63, 1.45, 2.74, 1.45, 2.12, 1.98]} \ No newline at end of file diff --git a/annotations_1/AnGVJ8Gv8aU_filtered.json b/annotations_1/AnGVJ8Gv8aU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93c3be64743781f66d69df2c83ef3a04add820e7 --- /dev/null +++ b/annotations_1/AnGVJ8Gv8aU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 41.01], [44.0, 68.4], [70.0, 73.48], [75.0, 82.71], [88.0, 92.2], [94.0, 99.6], [102.0, 102.91], [104.0, 106.57], [108.0, 137.19], [137.0, 138.47], [139.0, 139.7], [142.0, 143.4], [147.0, 147.5], [149.0, 149.35], [152.0, 156.93], [157.0, 156.96], [157.0, 157.72], [163.0, 163.88], [166.0, 167.19], [169.0, 174.02], [174.0, 179.93], [182.0, 192.16], [193.0, 201.97], [203.0, 202.96], [205.0, 205.83]], "keep_status": [false, true, true, true, true, false, false, true, true, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 32.52, 32.8, 30.08, 29.37, 30.23, 0.0, 30.94, 29.15, 0.0, 0.0, 0.0, 0.0, 0.0, 30.32, 0.0, 0.0, 0.0, 0.0, 44.37, 29.16, 38.91, 34.9, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 39.08], ["throbbing", 16.09], ["static", 7.17]], [["music", 29.07], ["throbbing", 14.26], ["hum", 14.16]], [["music", 26.96], ["foghorn", 16.09], ["theremin", 10.61]], [["music", 51.81], ["theremin", 9.38], ["explosion", 3.85]], [["music", 67.04], ["musical instrument", 3.72], ["percussion", 2.22]], null, [["music", 28.95], ["theremin", 8.65], ["throbbing", 7.65]], [["music", 50.49], ["groan", 11.38], ["hum", 4.94]], null, null, null, null, null, [["music", 21.18], ["hum", 20.58], ["groan", 11.55]], null, null, null, null, [["speech", 14.69], ["crow", 9.66], ["hum", 8.69]], [["speech", 41.65], ["explosion", 31.38], ["burst, pop", 5.43]], [["throbbing", 36.17], ["hum", 34.35], ["mains hum", 3.83]], [["speech", 19.07], ["sidetone", 11.11], ["cattle, bovinae", 10.99]], null, null], "duration": [38.01, 24.4, 3.48, 7.71, 4.2, 5.6, 0.91, 2.57, 29.19, 1.47, 0.7, 1.4, 0.5, 0.35, 4.93, -0.04, 0.72, 0.88, 1.19, 5.02, 5.93, 10.16, 8.97, -0.04, 0.83]} \ No newline at end of file diff --git a/annotations_1/AnJm-acXQCo_filtered.json b/annotations_1/AnJm-acXQCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86adf02c6ab32fa5bbba1018fb153474bfe0f086 --- /dev/null +++ b/annotations_1/AnJm-acXQCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.89], [11.0, 10.94], [11.0, 11.01], [11.0, 11.04], [11.0, 18.32], [24.0, 26.55], [27.0, 67.86], [69.0, 69.53], [70.0, 70.46], [75.0, 84.21], [85.0, 99.1], [99.0, 109.7], [111.0, 111.91], [113.0, 114.78], [115.0, 118.12], [120.0, 121.73], [123.0, 125.95], [127.0, 128.75], [131.0, 136.86], [141.0, 141.61], [142.0, 148.98], [150.0, 161.1]], "keep_status": [true, false, false, false, false, true, false, false, false, true, false, false, false, false, true, false, true, false, false, false, true, false], "silence_prob": [29.85, 0.0, 0.0, 0.0, 30.18, 31.22, 0.0, 0.0, 0.0, 35.4, 33.67, 31.37, 0.0, 0.0, 36.12, 0.0, 41.6, 0.0, 36.58, 0.0, 35.97, 32.19], "audiomae_on_audioset": [[["music", 32.37], ["speech", 22.78], ["hum", 13.8]], null, null, null, [["speech", 37.92], ["music", 34.68], ["electronic music", 3.83]], [["music", 39.27], ["electronic music", 10.93], ["sidetone", 9.47]], null, null, null, [["hum", 28.78], ["mains hum", 23.96], ["speech", 10.89]], [["insect", 50.24], ["fly, housefly", 30.75], ["bee, wasp, etc.", 7.33]], [["speech", 51.96], ["vehicle", 20.95], ["buzz", 4.81]], null, null, [["mains hum", 28.69], ["hum", 24.36], ["music", 16.04]], null, [["music", 35.08], ["hum", 18.43], ["throbbing", 14.49]], null, [["hum", 37.37], ["mains hum", 31.34], ["music", 14.12]], null, [["music", 29.7], ["throbbing", 12.72], ["hum", 12.18]], [["hum", 44.2], ["throbbing", 22.77], ["mains hum", 20.2]]], "duration": [6.89, -0.06, 0.01, 0.04, 7.32, 2.55, 40.86, 0.53, 0.46, 9.21, 14.1, 10.7, 0.91, 1.78, 3.12, 1.73, 2.95, 1.75, 5.86, 0.61, 6.98, 11.1]} \ No newline at end of file diff --git a/annotations_1/AoB_mdZxNlY_filtered.json b/annotations_1/AoB_mdZxNlY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce685118f493e5a7024368ed40a18861bc175c7f --- /dev/null +++ b/annotations_1/AoB_mdZxNlY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 35.13], [36.0, 36.8], [39.0, 41.17], [45.0, 65.64], [71.0, 79.42], [80.0, 94.22], [103.0, 131.43], [135.0, 147.73], [151.0, 193.41]], "keep_status": [false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 34.38, 29.84, 30.01, 29.83, 30.0, 31.95, 0.0], "audiomae_on_audioset": [null, null, [["mains hum", 31.33], ["hum", 19.02], ["music", 13.26]], [["boing", 57.93], ["music", 26.4], ["speech", 5.53]], [["music", 65.91], ["speech", 9.8], ["musical instrument", 2.74]], [["music", 71.02], ["smash, crash", 3.78], ["cacophony", 2.67]], [["music", 46.79], ["speech", 16.55], ["electronic music", 6.51]], [["music", 74.58], ["electronic music", 1.99], ["vehicle", 1.85]], null], "duration": [30.13, 0.8, 2.17, 20.64, 8.42, 14.22, 28.43, 12.73, 42.41]} \ No newline at end of file diff --git a/annotations_1/AoKtg7t1Y0M_filtered.json b/annotations_1/AoKtg7t1Y0M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3229558f57bb4256842a2a25a52698288d672a25 --- /dev/null +++ b/annotations_1/AoKtg7t1Y0M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.16], [18.0, 19.36], [20.0, 19.99], [21.0, 21.09], [27.0, 26.89], [27.0, 29.96], [31.0, 32.61], [34.0, 35.95], [38.0, 38.8], [41.0, 45.32], [47.0, 53.16], [55.0, 58.01], [63.0, 65.65], [68.0, 68.91], [71.0, 71.51], [74.0, 75.07], [76.0, 79.47], [82.0, 83.29], [85.0, 87.49], [88.0, 92.48], [98.0, 98.36], [99.0, 120.45], [121.0, 122.94], [126.0, 126.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.16, 0.0, 0.0, 0.0, 0.0, 99.1, 0.0, 0.0, 0.0, 98.99, 99.52, 97.54, 96.89, 0.0, 0.0, 0.0, 95.51, 0.0, 91.13, 94.07, 0.0, 82.79, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.16, 1.36, -0.01, 0.09, -0.11, 2.96, 1.61, 1.95, 0.8, 4.32, 6.16, 3.01, 2.65, 0.91, 0.51, 1.07, 3.47, 1.29, 2.49, 4.48, 0.36, 21.45, 1.94, 0.05]} \ No newline at end of file diff --git a/annotations_1/AoPqvTGZv6g_filtered.json b/annotations_1/AoPqvTGZv6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fb334a9a9f3d10cdb18bbd002f49904db118755 --- /dev/null +++ b/annotations_1/AoPqvTGZv6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [4.0, 8.53], [9.0, 11.77], [15.0, 16.9], [18.0, 20.24], [23.0, 24.97], [27.0, 28.27], [31.0, 31.51], [32.0, 33.08], [34.0, 39.16], [42.0, 45.87], [47.0, 51.26], [53.0, 54.21], [56.0, 58.38], [63.0, 69.08], [75.0, 77.73], [80.0, 85.26], [86.0, 87.74], [88.0, 90.64], [92.0, 92.4], [99.0, 100.99], [103.0, 103.38], [106.0, 106.96], [110.0, 110.59], [112.0, 113.1], [114.0, 114.96], [116.0, 116.87], [119.0, 121.51], [124.0, 125.46], [126.0, 129.86], [131.0, 132.41], [134.0, 136.39], [138.0, 141.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 57.72, 59.24, 0.0, 83.7, 0.0, 0.0, 0.0, 0.0, 65.09, 91.98, 86.09, 0.0, 98.66, 94.81, 75.88, 70.3, 0.0, 58.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 0.0, 45.36, 0.0, 45.3, 47.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.01], ["music", 15.27], ["hum", 8.12]], null, [["music", 46.01], ["effects unit", 5.31], ["squish", 3.49]], [["hum", 16.67], ["mains hum", 14.7], ["music", 12.32]]], "duration": [0.54, 4.53, 2.77, 1.9, 2.24, 1.97, 1.27, 0.51, 1.08, 5.16, 3.87, 4.26, 1.21, 2.38, 6.08, 2.73, 5.26, 1.74, 2.64, 0.4, 1.99, 0.38, 0.96, 0.59, 1.1, 0.96, 0.87, 2.51, 1.46, 3.86, 1.41, 2.39, 3.51]} \ No newline at end of file diff --git a/annotations_1/Ap8p92HCAbg_filtered.json b/annotations_1/Ap8p92HCAbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebbc63500e1d7feb3a54be3d9d8445a74f4fa36 --- /dev/null +++ b/annotations_1/Ap8p92HCAbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.88], [16.0, 17.22], [22.0, 34.42], [36.0, 38.55], [43.0, 44.12], [45.0, 44.83], [45.0, 48.05], [55.0, 55.76], [65.0, 65.57], [66.0, 66.6], [69.0, 78.19], [81.0, 84.11], [92.0, 92.94], [102.0, 102.36], [113.0, 113.81], [117.0, 117.8], [120.0, 119.77], [123.0, 130.64], [132.0, 131.97], [133.0, 133.0], [135.0, 136.97], [137.0, 140.39], [143.0, 143.21]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [34.75, 0.0, 37.45, 58.64, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 62.78, 49.22, 0.0, 0.0, 0.0, 0.0, 0.0, 46.4, 0.0, 0.0, 0.0, 39.05, 0.0], "audiomae_on_audioset": [[["speech", 36.48], ["explosion", 9.44], ["cattle, bovinae", 5.39]], null, [["livestock, farm animals, working animals", 31.42], ["cattle, bovinae", 17.91], ["music", 17.39]], null, null, null, null, null, null, null, null, [["fly, housefly", 35.18], ["insect", 14.13], ["speech", 8.88]], null, null, null, null, null, [["fly, housefly", 43.61], ["insect", 13.75], ["mosquito", 12.11]], null, null, null, [["speech", 51.04], ["livestock, farm animals, working animals", 9.34], ["sheep", 8.43]], null], "duration": [6.88, 1.22, 12.42, 2.55, 1.12, -0.17, 3.05, 0.76, 0.57, 0.6, 9.19, 3.11, 0.94, 0.36, 0.81, 0.8, -0.23, 7.64, -0.03, 0.0, 1.97, 3.39, 0.21]} \ No newline at end of file diff --git a/annotations_1/ApANYuSl7A0_filtered.json b/annotations_1/ApANYuSl7A0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2eccb917735fdec6944551ee65b2b613c29ed4e9 --- /dev/null +++ b/annotations_1/ApANYuSl7A0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.18], [9.0, 13.96], [17.0, 18.18], [19.0, 25.02], [26.0, 31.92], [32.0, 33.76], [34.0, 35.82], [37.0, 37.98], [38.0, 39.82], [41.0, 53.84], [57.0, 58.4], [60.0, 60.72], [62.0, 62.77], [65.0, 65.3], [67.0, 67.36], [73.0, 75.02], [77.0, 78.95], [82.0, 84.45], [85.0, 88.42], [89.0, 89.73], [92.0, 92.91], [95.0, 95.47], [97.0, 98.04], [99.0, 104.3], [107.0, 107.57], [108.0, 108.5], [110.0, 110.39], [112.0, 112.82], [114.0, 114.24], [116.0, 120.68], [128.0, 128.34], [129.0, 130.11], [132.0, 133.35], [135.0, 137.12], [143.0, 143.38], [147.0, 147.06], [148.0, 148.98], [152.0, 154.95], [156.0, 158.45], [160.0, 162.87], [164.0, 165.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.77, 83.88, 0.0, 99.16, 93.13, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 99.16, 0.0, 100.0, 99.44, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 62.68, 0.0, 0.0, 0.0, 100.0, 100.0, 99.62, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.18, 4.96, 1.18, 6.02, 5.92, 1.76, 1.82, 0.98, 1.82, 12.84, 1.4, 0.72, 0.77, 0.3, 0.36, 2.02, 1.95, 2.45, 3.42, 0.73, 0.91, 0.47, 1.04, 5.3, 0.57, 0.5, 0.39, 0.82, 0.24, 4.68, 0.34, 1.11, 1.35, 2.12, 0.38, 0.06, 0.98, 2.95, 2.45, 2.87, 1.4]} \ No newline at end of file diff --git a/annotations_1/ApuFuuCJc3s_filtered.json b/annotations_1/ApuFuuCJc3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e28c268a4f1d987f3a378ccded00f8bae68f6235 --- /dev/null +++ b/annotations_1/ApuFuuCJc3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.22], [13.0, 13.64], [16.0, 23.5], [28.0, 28.85], [31.0, 31.28], [39.0, 40.12], [46.0, 52.24], [57.0, 57.16], [65.0, 66.24], [75.0, 80.57], [82.0, 87.15], [88.0, 88.35], [95.0, 95.62], [100.0, 106.84], [113.0, 113.66], [118.0, 120.43], [143.0, 145.67], [149.0, 153.57], [154.0, 154.82]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.24, 0.0, 0.0, 0.0, 33.07, 0.0, 0.0, 34.91, 36.48, 0.0, 0.0, 33.4, 0.0, 56.78, 33.51, 35.23, 0.0], "audiomae_on_audioset": [null, null, [["music", 43.58], ["throbbing", 20.95], ["hum", 4.29]], null, null, null, [["music", 67.25], ["electronic music", 6.55], ["techno", 5.7]], null, null, [["music", 52.47], ["electronic music", 9.78], ["house music", 8.29]], [["music", 49.38], ["speech", 26.56], ["techno", 5.18]], null, null, [["moo", 36.02], ["cattle, bovinae", 33.03], ["livestock, farm animals, working animals", 23.16]], null, null, [["speech", 64.45], ["groan", 21.47], ["screaming", 4.05]], [["speech", 67.71], ["music", 5.2], ["radio", 2.68]], null], "duration": [1.22, 0.64, 7.5, 0.85, 0.28, 1.12, 6.24, 0.16, 1.24, 5.57, 5.15, 0.35, 0.62, 6.84, 0.66, 2.43, 2.67, 4.57, 0.82]} \ No newline at end of file diff --git a/annotations_1/ArGWpUHkEmc_filtered.json b/annotations_1/ArGWpUHkEmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddc740b7fb41322838d287c09a681b32b5ead6e8 --- /dev/null +++ b/annotations_1/ArGWpUHkEmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 27.08], [32.0, 53.64], [55.0, 55.86], [60.0, 79.95], [80.0, 128.61], [129.0, 129.86], [131.0, 131.18], [133.0, 168.89]], "keep_status": [false, true, false, true, false, false, false, false], "silence_prob": [33.72, 29.04, 0.0, 28.8, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 47.73], ["whale vocalization", 31.9], ["music", 4.93]], [["whack, thwack", 32.87], ["music", 12.01], ["whip", 7.15]], null, [["hum", 51.88], ["throbbing", 7.3], ["mains hum", 4.55]], null, null, null, null], "duration": [25.08, 21.64, 0.86, 19.95, 48.61, 0.86, 0.18, 35.89]} \ No newline at end of file diff --git a/annotations_1/AryZBe8C69U_filtered.json b/annotations_1/AryZBe8C69U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cba5aac1c8debb252a3872f33f84cd278a969c9 --- /dev/null +++ b/annotations_1/AryZBe8C69U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.72], [4.0, 5.34], [12.0, 15.99], [25.0, 29.84], [32.0, 33.32], [35.0, 35.26], [36.0, 38.06], [39.0, 39.23], [41.0, 41.17], [43.0, 44.09], [44.0, 44.36], [52.0, 54.45], [62.0, 66.55], [73.0, 80.79], [87.0, 93.5], [97.0, 97.97], [98.0, 98.74], [100.0, 101.71], [102.0, 103.25], [105.0, 105.87], [112.0, 113.83], [119.0, 123.74], [125.0, 125.52], [126.0, 126.94], [129.0, 129.25], [134.0, 134.38], [135.0, 135.63], [136.0, 137.15], [139.0, 139.29], [140.0, 141.15], [142.0, 143.38], [144.0, 152.0], [163.0, 163.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.16, 54.63, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 39.17, 35.45, 31.71, 34.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.14, 0.0], "audiomae_on_audioset": [null, null, [["music", 68.81], ["guitar", 6.59], ["musical instrument", 5.97]], null, null, null, null, null, null, null, null, [["music", 73.96], ["boing", 3.04], ["musical instrument", 2.85]], [["music", 30.92], ["animal", 8.28], ["livestock, farm animals, working animals", 7.98]], [["boing", 62.7], ["music", 30.96], ["groan", 1.13]], [["music", 35.42], ["boing", 17.53], ["speech", 9.62]], null, null, null, null, null, null, [["boing", 40.74], ["music", 25.36], ["speech", 12.31]], null, null, null, null, null, null, null, null, null, [["music", 72.09], ["speech", 2.86], ["quack", 2.3]], null], "duration": [-0.28, 1.34, 3.99, 4.84, 1.32, 0.26, 2.06, 0.23, 0.17, 1.09, 0.36, 2.45, 4.55, 7.79, 6.5, 0.97, 0.74, 1.71, 1.25, 0.87, 1.83, 4.74, 0.52, 0.94, 0.25, 0.38, 0.63, 1.15, 0.29, 1.15, 1.38, 8.0, 0.34]} \ No newline at end of file diff --git a/annotations_1/AsR-WnELodI_filtered.json b/annotations_1/AsR-WnELodI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e50c5a56e78dd5c77cc89292f21152e7964a4b2a --- /dev/null +++ b/annotations_1/AsR-WnELodI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.18], [9.0, 9.48], [22.0, 21.9], [25.0, 25.41], [28.0, 29.32], [39.0, 40.85], [41.0, 42.08], [51.0, 51.58], [55.0, 55.54], [61.0, 61.55], [63.0, 64.45], [68.0, 70.83], [72.0, 72.81], [74.0, 87.39], [94.0, 94.76], [111.0, 122.23], [123.0, 123.47], [129.0, 129.86], [131.0, 131.5], [134.0, 135.01], [136.0, 137.66], [138.0, 142.55], [145.0, 146.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 47.78, 0.0, 41.5, 0.0, 0.0, 0.0, 0.0, 0.0, 47.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 14.37], ["hands", 12.39], ["synthesizer", 8.81]], null, [["hands", 26.12], ["speech", 10.22], ["music", 9.92]], null, null, null, null, null, [["speech", 56.32], ["music", 9.94], ["inside, small room", 4.72]], null], "duration": [1.18, 0.48, -0.1, 0.41, 1.32, 1.85, 1.08, 0.58, 0.54, 0.55, 1.45, 2.83, 0.81, 13.39, 0.76, 11.23, 0.47, 0.86, 0.5, 1.01, 1.66, 4.55, 1.33]} \ No newline at end of file diff --git a/annotations_1/AsfxK5fWMu8_filtered.json b/annotations_1/AsfxK5fWMu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..366bdacf0904a51bdceb215756fa5c32537542e2 --- /dev/null +++ b/annotations_1/AsfxK5fWMu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.1], [7.0, 28.73], [31.0, 31.92], [36.0, 35.85], [37.0, 67.15], [71.0, 72.74], [74.0, 80.38], [81.0, 82.11], [83.0, 99.99], [102.0, 103.64], [105.0, 106.83], [124.0, 174.43], [175.0, 178.04]], "keep_status": [false, true, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 30.73, 0.0, 0.0, 0.0, 0.0, 29.97, 0.0, 32.06, 0.0, 0.0, 0.0, 30.22], "audiomae_on_audioset": [null, [["whale vocalization", 37.22], ["noise", 18.61], ["fart", 6.86]], null, null, null, null, [["sidetone", 30.37], ["music", 23.46], ["musical instrument", 6.72]], null, [["music", 58.61], ["fly, housefly", 6.14], ["explosion", 4.44]], null, null, null, [["vehicle", 26.29], ["speech", 12.07], ["motorboat, speedboat", 6.27]]], "duration": [0.1, 21.73, 0.92, -0.15, 30.15, 1.74, 6.38, 1.11, 16.99, 1.64, 1.83, 50.43, 3.04]} \ No newline at end of file diff --git a/annotations_1/AszdXufdl3E_filtered.json b/annotations_1/AszdXufdl3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c0d251fba58eb709678521f0d91c3eb88f84509 --- /dev/null +++ b/annotations_1/AszdXufdl3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 44.54], [46.0, 46.45], [49.0, 49.6], [80.0, 82.73], [92.0, 92.64], [107.0, 109.16], [111.0, 112.18], [115.0, 116.7]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 95.78, 0.0, 50.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.54, 0.45, 0.6, 2.73, 0.64, 2.16, 1.18, 1.7]} \ No newline at end of file diff --git a/annotations_1/AtWL0iQxE7U_filtered.json b/annotations_1/AtWL0iQxE7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3155404b228bde9d86cb7b49ad2e9daa3cab8486 --- /dev/null +++ b/annotations_1/AtWL0iQxE7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 36.96], [37.0, 66.06], [69.0, 94.26], [96.0, 103.94], [104.0, 112.46], [115.0, 115.7], [118.0, 151.17]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [78.21, 42.74, 36.07, 37.8, 32.41, 0.0, 0.0], "audiomae_on_audioset": [null, [["didgeridoo", 61.29], ["music", 15.22], ["hum", 4.55]], [["music", 33.74], ["hum", 23.01], ["throbbing", 12.17]], [["music", 55.56], ["speech", 23.17], ["explosion", 1.75]], [["music", 45.53], ["speech", 15.62], ["whack, thwack", 13.38]], null, null], "duration": [12.96, 29.06, 25.26, 7.94, 8.46, 0.7, 33.17]} \ No newline at end of file diff --git a/annotations_1/AutuCkT54KI_filtered.json b/annotations_1/AutuCkT54KI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a509289ef456101670376d7301e6480b0bc085d --- /dev/null +++ b/annotations_1/AutuCkT54KI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.94], [9.0, 11.7], [15.0, 17.66], [24.0, 28.71], [35.0, 48.3], [50.0, 51.11], [55.0, 79.47], [81.0, 95.89], [98.0, 108.46], [110.0, 110.07], [111.0, 111.38], [113.0, 147.68], [150.0, 152.39], [153.0, 154.77], [156.0, 159.95]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 48.23, 46.15, 70.02, 39.96, 0.0, 30.62, 35.45, 30.12, 0.0, 0.0, 0.0, 30.03, 0.0, 29.72], "audiomae_on_audioset": [null, [["hum", 25.16], ["throbbing", 25.1], ["music", 19.66]], [["music", 44.78], ["electronic music", 8.81], ["throbbing", 8.58]], null, [["music", 45.02], ["throbbing", 21.18], ["hum", 11.0]], null, [["music", 62.71], ["throbbing", 7.79], ["electronic music", 3.68]], [["music", 60.49], ["didgeridoo", 8.89], ["speech", 5.81]], [["music", 56.86], ["speech", 12.71], ["explosion", 3.31]], null, null, null, [["explosion", 36.92], ["music", 17.22], ["eruption", 9.33]], null, [["civil defense siren", 40.26], ["speech", 32.35], ["siren", 12.29]]], "duration": [0.94, 2.7, 2.66, 4.71, 13.3, 1.11, 24.47, 14.89, 10.46, 0.07, 0.38, 34.68, 2.39, 1.77, 3.95]} \ No newline at end of file diff --git a/annotations_1/AvDUQXknug8_filtered.json b/annotations_1/AvDUQXknug8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3901aedcfd21387408ea7bd6099e151bd0d9a53b --- /dev/null +++ b/annotations_1/AvDUQXknug8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.24], [9.0, 9.41], [10.0, 10.56], [24.0, 24.43], [26.0, 26.87], [35.0, 35.33], [51.0, 51.34], [53.0, 52.93], [54.0, 58.01], [59.0, 73.45], [76.0, 76.92], [79.0, 81.95], [83.0, 86.76], [88.0, 88.94], [91.0, 91.5], [92.0, 93.6], [95.0, 116.01], [117.0, 121.42], [123.0, 125.86], [126.0, 128.16], [129.0, 130.76], [132.0, 137.57], [138.0, 139.77], [141.0, 149.2], [153.0, 153.52], [155.0, 157.42], [158.0, 167.85], [173.0, 173.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 83.52, 0.0, 94.95, 99.8, 0.0, 0.0, 0.0, 95.64, 95.09, 99.52, 81.71, 0.0, 94.37, 0.0, 88.83, 0.0, 98.19, 85.35, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.41, 0.56, 0.43, 0.87, 0.33, 0.34, -0.07, 4.01, 14.45, 0.92, 2.95, 3.76, 0.94, 0.5, 1.6, 21.01, 4.42, 2.86, 2.16, 1.76, 5.57, 1.77, 8.2, 0.52, 2.42, 9.85, 0.53]} \ No newline at end of file diff --git a/annotations_1/AvPVexWamGg_filtered.json b/annotations_1/AvPVexWamGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f26c7714eaca7dc5010aab1f4d1a1a109e2672a --- /dev/null +++ b/annotations_1/AvPVexWamGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.39], [6.0, 22.74], [23.0, 25.03], [31.0, 31.24], [32.0, 32.91], [35.0, 37.17], [43.0, 42.94], [46.0, 62.85], [64.0, 70.61], [72.0, 72.12], [74.0, 78.27], [79.0, 108.94], [113.0, 118.84]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 54.9, 59.33, 0.0, 0.0, 77.87, 0.0, 29.33, 29.25, 0.0, 49.59, 29.51, 32.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 48.9], ["electric shaver, electric razor", 7.44], ["hum", 3.74]], [["speech", 48.84], ["music", 20.07], ["gunshot, gunfire", 4.86]], null, [["hum", 41.2], ["mains hum", 19.55], ["whale vocalization", 10.21]], [["speech", 44.17], ["hum", 20.94], ["music", 4.3]], [["music", 40.41], ["throbbing", 14.1], ["hum", 12.35]]], "duration": [0.39, 16.74, 2.03, 0.24, 0.91, 2.17, -0.06, 16.85, 6.61, 0.12, 4.27, 29.94, 5.84]} \ No newline at end of file diff --git a/annotations_1/AwR1RawiBU0_filtered.json b/annotations_1/AwR1RawiBU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e80e41205e59e0991361e30d1edcd942dda231cc --- /dev/null +++ b/annotations_1/AwR1RawiBU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [3.0, 3.57], [5.0, 20.41], [25.0, 25.46], [26.0, 27.14], [29.0, 50.53], [52.0, 52.51], [53.0, 53.6], [55.0, 55.12], [57.0, 58.02], [60.0, 60.62], [63.0, 63.85], [65.0, 65.23], [66.0, 66.88], [67.0, 67.49], [74.0, 75.59], [81.0, 81.41], [82.0, 83.17], [88.0, 90.46], [99.0, 98.81], [99.0, 102.15], [105.0, 107.59], [123.0, 124.6], [134.0, 140.09], [142.0, 147.38], [150.0, 152.41], [155.0, 154.94], [155.0, 166.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 54.7, 0.0, 0.0, 29.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0, 37.52, 51.71, 0.0, 55.89, 66.51, 56.18, 0.0, 91.3], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 55.34], ["explosion", 18.48], ["music", 4.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.92], ["throbbing", 12.13], ["music", 7.11]], null, null, null, null, null, null, null], "duration": [0.34, 0.57, 15.41, 0.46, 1.14, 21.53, 0.51, 0.6, 0.12, 1.02, 0.62, 0.85, 0.23, 0.88, 0.49, 1.59, 0.41, 1.17, 2.46, -0.19, 3.15, 2.59, 1.6, 6.09, 5.38, 2.41, -0.06, 11.68]} \ No newline at end of file diff --git a/annotations_1/AwtSK1gLBBk_filtered.json b/annotations_1/AwtSK1gLBBk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80d22f28ba78da4fdc669cd94a44301184d185b7 --- /dev/null +++ b/annotations_1/AwtSK1gLBBk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 18.59], [23.0, 23.28], [26.0, 29.25], [32.0, 38.87], [39.0, 46.62], [47.0, 73.82], [82.0, 81.82], [87.0, 110.66], [112.0, 113.26], [115.0, 114.86], [116.0, 118.29], [119.0, 120.18], [121.0, 122.0], [123.0, 122.71], [124.0, 162.14], [162.0, 162.3], [162.0, 185.57]], "keep_status": [false, false, true, true, false, false, false, true, false, false, true, false, false, false, false, false, true], "silence_prob": [32.5, 0.0, 34.99, 34.67, 31.85, 38.31, 0.0, 31.03, 0.0, 0.0, 34.52, 0.0, 0.0, 0.0, 0.0, 0.0, 30.39], "audiomae_on_audioset": [[["speech", 53.34], ["music", 23.95], ["breaking", 4.3]], null, [["music", 50.38], ["hum", 12.79], ["mains hum", 5.21]], [["speech", 26.19], ["music", 21.43], ["fly, housefly", 5.99]], [["music", 62.42], ["speech", 6.12], ["groan", 5.01]], [["music", 43.39], ["scary music", 28.01], ["hiccup", 12.57]], null, [["hum", 21.74], ["mains hum", 17.81], ["speech", 14.17]], null, null, [["music", 27.24], ["speech", 6.28], ["hum", 4.51]], null, null, null, null, null, [["music", 24.92], ["whack, thwack", 9.52], ["whip", 8.19]]], "duration": [17.59, 0.28, 3.25, 6.87, 7.62, 26.82, -0.18, 23.66, 1.26, -0.14, 2.29, 1.18, 1.0, -0.29, 38.14, 0.3, 23.57]} \ No newline at end of file diff --git a/annotations_1/Ax-iwIoIxjY_filtered.json b/annotations_1/Ax-iwIoIxjY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8886f708d27223dc4b3ed4850be2736a23934ec8 --- /dev/null +++ b/annotations_1/Ax-iwIoIxjY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.02], [9.0, 16.34], [21.0, 22.69], [24.0, 24.65], [26.0, 46.58], [48.0, 54.35], [59.0, 88.47], [90.0, 89.68], [90.0, 90.86], [91.0, 92.03], [95.0, 95.57], [97.0, 97.48], [99.0, 99.47], [101.0, 100.67], [103.0, 108.9], [110.0, 111.62], [113.0, 113.86], [115.0, 123.67], [125.0, 128.56]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, true, true], "silence_prob": [0.0, 55.89, 0.0, 0.0, 33.22, 31.81, 34.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.13, 0.0, 0.0, 34.64, 36.41], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 41.73], ["electric shaver, electric razor", 30.48], ["hum", 21.3]], [["speech", 42.29], ["fart", 37.9], ["noise", 2.66]], [["speech", 58.58], ["electric shaver, electric razor", 5.17], ["cattle, bovinae", 3.77]], null, null, null, null, null, null, null, [["music", 19.61], ["machine gun", 11.21], ["gunshot, gunfire", 9.35]], null, null, [["speech", 45.69], ["hum", 7.28], ["vehicle", 5.3]], [["civil defense siren", 28.29], ["mains hum", 9.57], ["hum", 9.11]]], "duration": [1.02, 7.34, 1.69, 0.65, 20.58, 6.35, 29.47, -0.32, 0.86, 1.03, 0.57, 0.48, 0.47, -0.33, 5.9, 1.62, 0.86, 8.67, 3.56]} \ No newline at end of file diff --git a/annotations_1/Ax83IEcbUwU_filtered.json b/annotations_1/Ax83IEcbUwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cfb7cd23c19dfccdcb14a36a4c114b19c0e37d8 --- /dev/null +++ b/annotations_1/Ax83IEcbUwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 120.58], [123.0, 136.07], [137.0, 153.01], [154.0, 158.9], [160.0, 160.52], [162.0, 163.05], [165.0, 166.94]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 30.87, 36.33, 32.9, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 67.42], ["electronic music", 4.29], ["breaking", 3.29]], [["music", 31.3], ["hum", 24.83], ["didgeridoo", 12.95]], [["music", 44.76], ["hum", 20.23], ["mains hum", 10.08]], null, null, null], "duration": [104.58, 13.07, 16.01, 4.9, 0.52, 1.05, 1.94]} \ No newline at end of file diff --git a/annotations_1/AxBkurGlhHg_filtered.json b/annotations_1/AxBkurGlhHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e4e8ad405be6e4ba5f6f5fa2406990f33f54f5c --- /dev/null +++ b/annotations_1/AxBkurGlhHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [5.0, 6.24], [8.0, 10.96], [13.0, 16.98], [19.0, 64.98], [70.0, 76.06], [77.0, 92.35], [93.0, 92.94]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.47, 34.49, 0.0, 30.06, 30.04, 0.0], "audiomae_on_audioset": [null, null, [["speech", 29.16], ["vehicle", 16.47], ["boat, water vehicle", 7.09]], [["speech", 68.6], ["sidetone", 7.25], ["vehicle", 6.51]], null, [["livestock, farm animals, working animals", 31.76], ["cattle, bovinae", 27.41], ["moo", 26.71]], [["music", 54.9], ["didgeridoo", 21.24], ["musical instrument", 2.76]], null], "duration": [0.22, 1.24, 2.96, 3.98, 45.98, 6.06, 15.35, -0.06]} \ No newline at end of file diff --git a/annotations_1/AxGMySJ6ySc_filtered.json b/annotations_1/AxGMySJ6ySc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d74044b22d3cb0f6b32164e911e0589f2ad4589 --- /dev/null +++ b/annotations_1/AxGMySJ6ySc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 21.14], [24.0, 24.48], [32.0, 36.49], [39.0, 54.09], [62.0, 64.52], [66.0, 77.99], [80.0, 92.57], [94.0, 96.79]], "keep_status": [true, false, false, false, false, false, false, true], "silence_prob": [34.33, 0.0, 33.98, 42.15, 37.23, 35.37, 35.7, 33.02], "audiomae_on_audioset": [[["music", 40.59], ["glockenspiel", 19.35], ["marimba, xylophone", 9.73]], null, [["music", 58.56], ["glockenspiel", 11.12], ["mallet percussion", 5.35]], [["music", 76.18], ["ding-dong", 4.4], ["glockenspiel", 2.75]], [["music", 69.62], ["music for children", 11.32], ["boing", 3.39]], [["music", 55.07], ["sheep", 17.11], ["bleat", 14.53]], [["music", 61.08], ["sheep", 7.86], ["music for children", 6.29]], [["music", 42.38], ["synthesizer", 5.79], ["baby cry, infant cry", 3.15]]], "duration": [8.14, 0.48, 4.49, 15.09, 2.52, 11.99, 12.57, 2.79]} \ No newline at end of file diff --git a/annotations_1/AxGXZOLn-U0_filtered.json b/annotations_1/AxGXZOLn-U0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7abded8d88cdc0df99967677f5c1f39e8f8dde2b --- /dev/null +++ b/annotations_1/AxGXZOLn-U0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.76], [6.0, 6.54], [9.0, 10.59], [11.0, 11.69], [14.0, 14.27], [15.0, 16.04], [19.0, 19.33], [22.0, 25.88], [27.0, 28.63], [29.0, 31.73], [41.0, 41.07], [59.0, 59.49], [61.0, 64.62], [78.0, 81.67], [102.0, 109.16], [110.0, 110.59], [111.0, 110.62], [111.0, 110.66], [111.0, 126.81], [130.0, 140.76], [142.0, 144.51]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 0.0, 45.82, 0.0, 0.0, 51.28, 34.88, 35.96, 0.0, 0.0, 0.0, 32.94, 34.09, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 54.49], ["cattle, bovinae", 7.55], ["moo", 7.19]], null, null, null, [["music", 84.91], ["video game music", 1.0], ["musical instrument", 0.82]], [["boing", 27.52], ["sound effect", 10.49], ["whack, thwack", 10.39]], null, null, null, [["music", 42.06], ["speech", 16.94], ["whack, thwack", 15.45]], [["music", 64.28], ["speech", 9.03], ["animal", 4.73]], null], "duration": [-0.24, 0.54, 1.59, 0.69, 0.27, 1.04, 0.33, 3.88, 1.63, 2.73, 0.07, 0.49, 3.62, 3.67, 7.16, 0.59, -0.38, -0.34, 15.81, 10.76, 2.51]} \ No newline at end of file diff --git a/annotations_1/AxhQq_-31FY_filtered.json b/annotations_1/AxhQq_-31FY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8db0937d19e78950ad8f370b9eaa0e77f0ee627 --- /dev/null +++ b/annotations_1/AxhQq_-31FY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.73], [6.0, 7.97], [9.0, 9.8], [14.0, 18.17], [22.0, 46.25], [47.0, 77.58], [79.0, 80.97], [84.0, 85.55], [86.0, 87.25], [89.0, 96.45], [98.0, 99.15], [100.0, 105.9], [108.0, 108.01], [110.0, 110.25], [114.0, 119.79], [121.0, 125.32]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 45.11, 30.02, 0.0, 0.0, 0.0, 0.0, 30.53, 0.0, 37.38, 0.0, 0.0, 35.96, 29.65], "audiomae_on_audioset": [null, null, null, [["music", 48.08], ["throbbing", 12.77], ["hum", 10.74]], [["whack, thwack", 47.72], ["music", 19.1], ["thunk", 5.82]], null, null, null, null, [["speech", 24.87], ["music", 18.14], ["explosion", 8.23]], null, [["mains hum", 40.7], ["hum", 32.9], ["music", 5.77]], null, null, [["mains hum", 61.04], ["hum", 19.95], ["music", 6.68]], [["music", 22.16], ["breaking", 14.66], ["cowbell", 6.72]]], "duration": [1.73, 1.97, 0.8, 4.17, 24.25, 30.58, 1.97, 1.55, 1.25, 7.45, 1.15, 5.9, 0.01, 0.25, 5.79, 4.32]} \ No newline at end of file diff --git a/annotations_1/AxrQtWFF91k_filtered.json b/annotations_1/AxrQtWFF91k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11fcf5381ed962fc34aa89c716d8413f47f0c957 --- /dev/null +++ b/annotations_1/AxrQtWFF91k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [2.0, 2.32], [3.0, 2.76], [3.0, 3.82], [5.0, 5.9], [15.0, 17.93], [28.0, 28.19], [36.0, 40.93], [42.0, 42.08], [45.0, 44.79], [67.0, 67.24], [70.0, 71.17], [72.0, 72.94], [75.0, 76.11], [84.0, 84.52], [98.0, 100.03], [104.0, 104.43], [113.0, 120.04], [121.0, 130.62], [131.0, 130.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 69.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 34.2, 39.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.73], ["fly, housefly", 16.34], ["insect", 7.74]], [["fly, housefly", 26.48], ["mosquito", 24.72], ["insect", 8.94]], null], "duration": [0.53, 0.32, -0.24, 0.82, 0.9, 2.93, 0.19, 4.93, 0.08, -0.21, 0.24, 1.17, 0.94, 1.11, 0.52, 2.03, 0.43, 7.04, 9.62, -0.11]} \ No newline at end of file diff --git a/annotations_1/AxxKJ2QgPtY_filtered.json b/annotations_1/AxxKJ2QgPtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c11842613be0dcd4f368ff3b71befb2e859c283 --- /dev/null +++ b/annotations_1/AxxKJ2QgPtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.07], [6.0, 7.96], [10.0, 12.14], [13.0, 14.61], [16.0, 35.43], [36.0, 40.95], [43.0, 49.45], [52.0, 52.49], [54.0, 54.84], [61.0, 61.65], [62.0, 66.65], [67.0, 66.97], [72.0, 73.63], [89.0, 96.87], [97.0, 98.69], [100.0, 117.81], [122.0, 149.32], [153.0, 154.41], [155.0, 161.97]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 51.28, 0.0, 32.19, 30.43, 31.41, 0.0, 0.0, 0.0, 39.86, 0.0, 0.0, 30.91, 0.0, 30.04, 30.11, 0.0, 33.69], "audiomae_on_audioset": [null, null, null, null, [["music", 37.45], ["speech", 35.92], ["musical instrument", 2.63]], [["cattle, bovinae", 48.76], ["moo", 34.55], ["livestock, farm animals, working animals", 14.59]], [["music", 39.83], ["speech", 24.24], ["musical instrument", 3.2]], null, null, null, [["music", 49.53], ["speech", 33.5], ["didgeridoo", 4.3]], null, null, [["music", 48.15], ["speech", 29.49], ["crowd", 2.8]], null, [["music", 18.99], ["crowd", 10.67], ["speech", 7.29]], [["cattle, bovinae", 28.06], ["livestock, farm animals, working animals", 22.31], ["moo", 16.06]], null, [["music", 35.27], ["didgeridoo", 32.42], ["speech", 6.12]]], "duration": [1.07, 1.96, 2.14, 1.61, 19.43, 4.95, 6.45, 0.49, 0.84, 0.65, 4.65, -0.03, 1.63, 7.87, 1.69, 17.81, 27.32, 1.41, 6.97]} \ No newline at end of file diff --git a/annotations_1/AyYlJ6YQp3I_filtered.json b/annotations_1/AyYlJ6YQp3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddae81f961c5d2e2364f71c050918cbe61e2dd5e --- /dev/null +++ b/annotations_1/AyYlJ6YQp3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.81], [5.0, 8.53], [9.0, 9.95], [12.0, 12.88], [13.0, 13.68], [21.0, 21.03], [27.0, 28.73], [30.0, 30.43], [33.0, 33.74], [37.0, 44.17], [45.0, 48.34], [60.0, 60.57], [66.0, 66.33], [74.0, 74.58], [77.0, 80.18], [83.0, 83.88], [85.0, 90.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 87.37, 0.0, 0.0, 0.0, 38.49, 0.0, 30.69], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.36], ["musical instrument", 5.05], ["synthesizer", 4.74]], null, [["music", 74.54], ["ding-dong", 3.63], ["synthesizer", 3.57]]], "duration": [-0.19, 3.53, 0.95, 0.88, 0.68, 0.03, 1.73, 0.43, 0.74, 7.17, 3.34, 0.57, 0.33, 0.58, 3.18, 0.88, 5.07]} \ No newline at end of file diff --git a/annotations_1/B-S7jkgEC8Y_filtered.json b/annotations_1/B-S7jkgEC8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd41f668910110fa1b14d551924435d73357aff8 --- /dev/null +++ b/annotations_1/B-S7jkgEC8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.54], [16.0, 15.94], [17.0, 23.36], [32.0, 33.0], [34.0, 33.99], [35.0, 35.61], [37.0, 39.68], [46.0, 51.07], [51.0, 55.63], [56.0, 57.65], [62.0, 66.06], [80.0, 82.17], [89.0, 92.85], [93.0, 97.09], [98.0, 98.86], [99.0, 100.41], [101.0, 103.5], [105.0, 109.07], [116.0, 116.01], [116.0, 118.34], [133.0, 137.59]], "keep_status": [true, false, true, false, false, false, true, true, true, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [35.28, 0.0, 35.98, 0.0, 0.0, 0.0, 31.13, 38.5, 39.31, 0.0, 34.68, 58.05, 45.52, 56.03, 0.0, 0.0, 58.13, 63.42, 0.0, 47.86, 83.88], "audiomae_on_audioset": [[["speech", 31.13], ["music", 19.34], ["boing", 9.11]], null, [["speech", 39.1], ["noise", 19.09], ["animal", 6.27]], null, null, null, [["music", 30.3], ["wild animals", 12.15], ["animal", 8.1]], [["music", 34.29], ["speech", 21.68], ["sidetone", 9.91]], [["music", 42.35], ["speech", 20.82], ["sidetone", 6.19]], null, [["music", 57.04], ["musical instrument", 4.76], ["speech", 3.45]], null, [["speech", 49.33], ["music", 8.69], ["glass", 7.18]], null, null, null, null, null, null, [["sidetone", 32.72], ["music", 27.9], ["speech", 18.66]], null], "duration": [2.54, -0.06, 6.36, 1.0, -0.01, 0.61, 2.68, 5.07, 4.63, 1.65, 4.06, 2.17, 3.85, 4.09, 0.86, 1.41, 2.5, 4.07, 0.01, 2.34, 4.59]} \ No newline at end of file diff --git a/annotations_1/B-Wf5QOHPxw_filtered.json b/annotations_1/B-Wf5QOHPxw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2a9430b94233af60d966ee2a1e12459b6b42a4a --- /dev/null +++ b/annotations_1/B-Wf5QOHPxw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 36.1], [42.0, 42.82], [61.0, 66.26], [67.0, 103.82], [111.0, 115.06], [115.0, 117.12], [118.0, 118.86], [120.0, 138.91], [141.0, 162.09], [169.0, 190.85]], "keep_status": [false, false, false, false, true, true, false, true, true, true], "silence_prob": [28.63, 0.0, 29.92, 0.0, 28.34, 30.6, 0.0, 28.22, 28.37, 28.43], "audiomae_on_audioset": [[["music", 50.93], ["speech", 13.25], ["electronic music", 6.51]], null, [["speech", 42.4], ["vehicle", 24.06], ["car", 7.83]], null, [["music", 37.68], ["synthesizer", 9.77], ["musical instrument", 6.56]], [["speech", 24.77], ["music", 16.83], ["hum", 7.47]], null, [["hum", 22.44], ["mains hum", 14.44], ["music", 10.11]], [["music", 24.17], ["speech", 19.22], ["hum", 14.19]], [["hum", 13.73], ["music", 13.38], ["vehicle", 9.82]]], "duration": [4.1, 0.82, 5.26, 36.82, 4.06, 2.12, 0.86, 18.91, 21.09, 21.85]} \ No newline at end of file diff --git a/annotations_1/B0nhCPv8VB8_filtered.json b/annotations_1/B0nhCPv8VB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d517b1f4774a643206c284d6b3960c77a4fc7f6 --- /dev/null +++ b/annotations_1/B0nhCPv8VB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.76], [12.0, 15.2], [17.0, 23.65], [25.0, 52.64], [54.0, 67.54], [69.0, 69.87], [74.0, 76.27], [79.0, 104.55], [106.0, 133.44]], "keep_status": [false, false, true, false, false, false, true, true, false], "silence_prob": [0.0, 36.52, 34.63, 29.36, 30.22, 0.0, 28.08, 28.62, 29.13], "audiomae_on_audioset": [null, [["mains hum", 60.69], ["hum", 29.12], ["throbbing", 3.27]], [["hum", 35.49], ["mains hum", 21.89], ["speech", 11.97]], [["music", 75.94], ["electronic music", 6.4], ["throbbing", 2.95]], [["music", 42.8], ["throbbing", 40.11], ["hum", 7.94]], null, [["music", 43.21], ["mains hum", 4.16], ["explosion", 4.03]], [["music", 31.62], ["hum", 25.23], ["mains hum", 10.47]], [["music", 53.95], ["speech", 18.34], ["throbbing", 3.82]]], "duration": [1.76, 3.2, 6.65, 27.64, 13.54, 0.87, 2.27, 25.55, 27.44]} \ No newline at end of file diff --git a/annotations_1/B2KSjVAskxM_filtered.json b/annotations_1/B2KSjVAskxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a87d72675c79e5d39919e62af0ced8aff7f09dc0 --- /dev/null +++ b/annotations_1/B2KSjVAskxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.32], [16.0, 16.38], [19.0, 22.65], [25.0, 32.46], [34.0, 38.37], [43.0, 46.16], [48.0, 49.18], [55.0, 73.43], [77.0, 79.2]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 54.76, 41.38, 37.54, 80.29, 0.0, 30.52, 30.67], "audiomae_on_audioset": [null, null, null, [["music", 52.1], ["speech", 17.03], ["synthesizer", 4.4]], [["music", 80.56], ["musical instrument", 1.76], ["electronic music", 1.75]], null, null, [["music", 76.44], ["speech", 7.04], ["electronic music", 2.38]], [["music", 64.85], ["speech", 11.11], ["musical instrument", 2.84]]], "duration": [0.32, 0.38, 3.65, 7.46, 4.37, 3.16, 1.18, 18.43, 2.2]} \ No newline at end of file diff --git a/annotations_1/B2zzhcU9f9U_filtered.json b/annotations_1/B2zzhcU9f9U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b40e8d5bb67d15f451dd3edcd1e548a95907189 --- /dev/null +++ b/annotations_1/B2zzhcU9f9U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.34], [15.0, 15.58], [22.0, 24.46], [29.0, 32.54], [38.0, 46.84], [48.0, 53.42], [56.0, 60.61], [61.0, 61.6], [62.0, 81.04], [81.0, 81.46], [82.0, 93.73], [96.0, 98.98], [101.0, 104.72], [108.0, 110.66], [113.0, 123.01], [123.0, 132.29], [134.0, 137.44], [138.0, 142.45], [146.0, 153.39], [162.0, 167.32], [168.0, 169.75]], "keep_status": [false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [34.93, 0.0, 32.86, 34.11, 42.51, 40.12, 36.03, 0.0, 87.55, 0.0, 68.02, 97.33, 45.65, 72.75, 96.29, 80.64, 100.0, 98.59, 34.75, 31.85, 0.0], "audiomae_on_audioset": [[["speech", 62.81], ["wail, moan", 9.5], ["baby cry, infant cry", 3.16]], null, [["speech", 54.18], ["whimper", 13.63], ["wail, moan", 9.53]], [["baby laughter", 21.99], ["speech", 16.13], ["laughter", 13.11]], [["speech", 29.58], ["sheep", 17.97], ["crying, sobbing", 6.64]], [["speech", 48.73], ["baby laughter", 17.76], ["laughter", 8.14]], [["whack, thwack", 27.55], ["speech", 14.35], ["frog", 11.76]], null, null, null, null, null, [["speech", 91.21], ["inside, small room", 1.36], ["fart", 0.64]], null, null, null, null, null, [["burping, eructation", 6.78], ["mosquito", 5.46], ["stomach rumble", 4.9]], [["breaking", 25.16], ["thunk", 22.05], ["whack, thwack", 17.26]], null], "duration": [4.34, 0.58, 2.46, 3.54, 8.84, 5.42, 4.61, 0.6, 19.04, 0.46, 11.73, 2.98, 3.72, 2.66, 10.01, 9.29, 3.44, 4.45, 7.39, 5.32, 1.75]} \ No newline at end of file diff --git a/annotations_1/B3thiUpvzKo_filtered.json b/annotations_1/B3thiUpvzKo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49dbac3093f0bb224f9f1e7968053f14881f7d58 --- /dev/null +++ b/annotations_1/B3thiUpvzKo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.62], [16.0, 16.8], [19.0, 22.11], [24.0, 24.6], [34.0, 34.96], [75.0, 79.64], [83.0, 83.56], [87.0, 87.39]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 90.08, 0.0, 0.0, 46.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 51.11], ["hum", 13.25], ["inside, small room", 2.51]], null, null], "duration": [0.62, 0.8, 3.11, 0.6, 0.96, 4.64, 0.56, 0.39]} \ No newline at end of file diff --git a/annotations_1/B46nugc-4c4_filtered.json b/annotations_1/B46nugc-4c4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c16810888e2b0b6f9fb72c9892f3b5c1c80c2af5 --- /dev/null +++ b/annotations_1/B46nugc-4c4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.24], [7.0, 7.33], [10.0, 12.39], [13.0, 15.36], [28.0, 29.37], [36.0, 38.52], [42.0, 42.6], [47.0, 47.92], [51.0, 54.5], [57.0, 57.99], [62.0, 66.5], [68.0, 67.88], [69.0, 70.98], [72.0, 72.2], [73.0, 73.33], [77.0, 77.67], [88.0, 88.84], [90.0, 93.33], [96.0, 96.04], [96.0, 99.55], [100.0, 102.25], [104.0, 161.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 84.98, 79.24, 0.0, 78.38, 0.0, 0.0, 43.96, 0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 0.0, 46.79, 74.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["whale vocalization", 87.61], ["music", 2.28], ["didgeridoo", 1.41]], null, null, null, null, null, null, null, null, null, null, [["speech", 41.78], ["hum", 18.19], ["mains hum", 9.79]], null, null], "duration": [1.24, 0.33, 2.39, 2.36, 1.37, 2.52, 0.6, 0.92, 3.5, 0.99, 4.5, -0.12, 1.98, 0.2, 0.33, 0.67, 0.84, 3.33, 0.04, 3.55, 2.25, 57.06]} \ No newline at end of file diff --git a/annotations_1/B5goHV7tFnE_filtered.json b/annotations_1/B5goHV7tFnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f29ddd5ea628b4e35b4b71d90523a4a2f111e54 --- /dev/null +++ b/annotations_1/B5goHV7tFnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.91], [25.0, 25.62], [27.0, 28.9], [32.0, 33.2], [34.0, 34.43], [36.0, 36.04], [43.0, 43.63], [46.0, 46.8], [49.0, 50.36], [51.0, 51.83], [55.0, 56.67], [64.0, 64.91], [70.0, 71.74], [74.0, 74.44], [76.0, 78.16], [81.0, 93.41], [99.0, 99.84], [104.0, 117.12], [125.0, 126.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [33.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.5, 31.74, 0.0, 31.09, 0.0], "audiomae_on_audioset": [[["speech", 43.46], ["music", 25.19], ["electric shaver, electric razor", 5.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.78], ["boing", 19.88], ["music", 11.11]], [["music", 64.43], ["throbbing", 11.22], ["hum", 9.85]], null, [["music", 76.4], ["synthesizer", 3.37], ["cattle, bovinae", 2.75]], null], "duration": [5.91, 0.62, 1.9, 1.2, 0.43, 0.04, 0.63, 0.8, 1.36, 0.83, 1.67, 0.91, 1.74, 0.44, 2.16, 12.41, 0.84, 13.12, 1.77]} \ No newline at end of file diff --git a/annotations_1/B5uw3qZ04NY_filtered.json b/annotations_1/B5uw3qZ04NY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38160a1e701778e5e6d42b78bcc85a6afbf205e1 --- /dev/null +++ b/annotations_1/B5uw3qZ04NY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.03], [8.0, 12.77], [16.0, 18.15], [24.0, 26.96], [29.0, 29.13], [31.0, 33.42], [35.0, 36.93], [39.0, 39.06], [40.0, 42.43], [43.0, 45.67], [46.0, 58.01], [59.0, 61.26], [62.0, 73.72], [76.0, 82.44]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [49.78, 90.08, 99.84, 75.72, 0.0, 87.19, 0.0, 0.0, 82.07, 76.2, 29.06, 60.42, 29.63, 33.1], "audiomae_on_audioset": [[["speech", 34.2], ["hum", 18.69], ["sidetone", 10.65]], null, null, null, null, null, null, null, null, null, [["speech", 28.95], ["sidetone", 13.15], ["music", 8.57]], null, [["speech", 30.22], ["sonar", 26.69], ["music", 14.92]], [["music", 27.65], ["speech", 24.32], ["musical instrument", 11.15]]], "duration": [2.03, 4.77, 2.15, 2.96, 0.13, 2.42, 1.93, 0.06, 2.43, 2.67, 12.01, 2.26, 11.72, 6.44]} \ No newline at end of file diff --git a/annotations_1/B8dPQzwGcZI_filtered.json b/annotations_1/B8dPQzwGcZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e402f3a4faba3367eaab13fb80ed9d3ccfd1e6cb --- /dev/null +++ b/annotations_1/B8dPQzwGcZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [7.0, 6.79], [8.0, 10.15], [11.0, 11.91], [21.0, 22.77], [27.0, 27.48], [29.0, 30.59], [32.0, 33.34], [34.0, 36.66], [42.0, 43.01], [50.0, 51.04], [55.0, 59.93], [68.0, 68.22], [73.0, 76.64], [78.0, 78.43], [90.0, 90.22], [92.0, 94.07], [98.0, 101.01], [104.0, 104.77], [109.0, 111.42], [113.0, 113.44], [118.0, 118.22], [120.0, 120.31], [126.0, 126.39], [128.0, 130.87], [132.0, 132.63], [133.0, 133.49], [135.0, 135.89], [138.0, 139.21], [140.0, 144.66], [147.0, 147.16], [148.0, 149.4], [153.0, 154.47], [158.0, 161.67], [164.0, 164.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 52.27, 0.0, 36.37, 0.0, 0.0, 99.88, 70.3, 0.0, 96.29, 0.0, 0.0, 0.0, 0.0, 36.72, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 84.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.34], ["throbbing", 17.57], ["hum", 6.79]], null, null, null, null, null, null, null, null, null, null, [["speech", 77.66], ["tap", 4.17], ["thump, thud", 4.11]], null, null, null, null, null, null, null, null, null, null], "duration": [0.43, -0.21, 2.15, 0.91, 1.77, 0.48, 1.59, 1.34, 2.66, 1.01, 1.04, 4.93, 0.22, 3.64, 0.43, 0.22, 2.07, 3.01, 0.77, 2.42, 0.44, 0.22, 0.31, 0.39, 2.87, 0.63, 0.49, 0.89, 1.21, 4.66, 0.16, 1.4, 1.47, 3.67, 0.27]} \ No newline at end of file diff --git a/annotations_1/B9SkWFyq-EQ_filtered.json b/annotations_1/B9SkWFyq-EQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d07e6a69cc78ab20dea591ff9ad371fd1ce7ff6d --- /dev/null +++ b/annotations_1/B9SkWFyq-EQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 61.8], [64.0, 68.82], [70.0, 75.41], [77.0, 77.94]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 46.22, 96.04, 0.0], "audiomae_on_audioset": [null, [["throbbing", 21.72], ["music", 21.52], ["hum", 21.15]], null, null], "duration": [53.8, 4.82, 5.41, 0.94]} \ No newline at end of file diff --git a/annotations_1/B9r99FImuSc_filtered.json b/annotations_1/B9r99FImuSc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99ed1bf64f8ced50919061366ed159ac6fbdcbf1 --- /dev/null +++ b/annotations_1/B9r99FImuSc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.09], [12.0, 12.19], [13.0, 15.53], [29.0, 29.89], [33.0, 33.34], [39.0, 39.46], [42.0, 42.75], [57.0, 57.2], [60.0, 63.05], [63.0, 63.09], [63.0, 63.41], [81.0, 82.38], [90.0, 100.58], [104.0, 104.82], [105.0, 105.49], [107.0, 107.84], [117.0, 127.67], [134.0, 136.92], [139.0, 140.49], [153.0, 154.84]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 36.29, 0.0, 0.0, 0.0, 0.0, 0.0, 30.24, 0.0, 0.0, 0.0, 28.5, 0.0, 0.0, 0.0, 30.31, 99.96, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.78], ["throbbing", 21.59], ["hum", 6.1]], null, null, null, null, null, [["music", 53.11], ["musical instrument", 8.42], ["didgeridoo", 6.22]], null, null, null, [["music", 51.03], ["didgeridoo", 39.75], ["musical instrument", 1.85]], null, null, null, [["music", 55.12], ["effects unit", 6.3], ["echo", 5.52]], null, null, null], "duration": [0.09, 0.19, 2.53, 0.89, 0.34, 0.46, 0.75, 0.2, 3.05, 0.09, 0.41, 1.38, 10.58, 0.82, 0.49, 0.84, 10.67, 2.92, 1.49, 1.84]} \ No newline at end of file diff --git a/annotations_1/BANrqTBnEy4_filtered.json b/annotations_1/BANrqTBnEy4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..565943a2181f324a5163b221ec464226979e832b --- /dev/null +++ b/annotations_1/BANrqTBnEy4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.29], [7.0, 9.49], [11.0, 16.28], [19.0, 33.27], [35.0, 35.26], [36.0, 43.04], [44.0, 52.29], [53.0, 60.64], [63.0, 65.35], [68.0, 70.41], [71.0, 78.66], [79.0, 91.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.92, 100.0, 99.31, 99.94, 0.0, 82.25, 91.3, 88.1, 93.6, 97.43, 95.64, 90.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.29, 2.49, 5.28, 14.27, 0.26, 7.04, 8.29, 7.64, 2.35, 2.41, 7.66, 12.29]} \ No newline at end of file diff --git a/annotations_1/BB3VbfL6Xyg_filtered.json b/annotations_1/BB3VbfL6Xyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4f2688a19b9cfa7376dfcd770e707eabb53b021 --- /dev/null +++ b/annotations_1/BB3VbfL6Xyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.17], [17.0, 20.12], [30.0, 44.61], [46.0, 48.12], [51.0, 52.96], [54.0, 82.21], [84.0, 84.84], [86.0, 87.1]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [93.91, 96.42, 93.45, 53.34, 0.0, 39.83, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 30.08], ["music", 16.09], ["noise", 6.35]], null, null], "duration": [2.17, 3.12, 14.61, 2.12, 1.96, 28.21, 0.84, 1.1]} \ No newline at end of file diff --git a/annotations_1/BCC8LOkisAI_filtered.json b/annotations_1/BCC8LOkisAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ca49b72cb21836197c4790c0b5cf6157f4cea6a --- /dev/null +++ b/annotations_1/BCC8LOkisAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.62], [5.0, 5.73], [9.0, 9.78], [11.0, 11.57], [13.0, 13.41], [14.0, 14.71], [16.0, 16.58], [28.0, 28.05], [30.0, 30.1], [50.0, 51.19], [52.0, 52.57], [54.0, 54.85], [60.0, 60.17], [61.0, 61.48], [62.0, 62.48], [63.0, 64.39], [66.0, 67.02], [69.0, 70.24], [71.0, 71.81], [73.0, 75.61], [77.0, 79.79], [82.0, 82.7], [93.0, 94.07], [102.0, 102.1], [104.0, 104.01], [108.0, 108.58], [118.0, 119.79], [120.0, 120.43], [121.0, 123.03], [123.0, 124.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.16, 51.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.7], ["radio", 9.37], ["sidetone", 4.98]], null], "duration": [1.62, 0.73, 0.78, 0.57, 0.41, 0.71, 0.58, 0.05, 0.1, 1.19, 0.57, 0.85, 0.17, 0.48, 0.48, 1.39, 1.02, 1.24, 0.81, 2.61, 2.79, 0.7, 1.07, 0.1, 0.01, 0.58, 1.79, 0.43, 2.03, 1.16]} \ No newline at end of file diff --git a/annotations_1/BCGzM3s9-1o_filtered.json b/annotations_1/BCGzM3s9-1o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bc910d2737a129235c4ed123450394518e89217 --- /dev/null +++ b/annotations_1/BCGzM3s9-1o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [6.0, 6.96], [7.0, 8.41], [11.0, 13.66], [17.0, 18.59], [25.0, 37.1], [39.0, 53.2], [54.0, 56.49], [58.0, 58.62], [61.0, 64.64], [65.0, 67.81], [69.0, 71.79], [73.0, 76.17], [77.0, 78.09], [81.0, 84.84], [98.0, 101.26], [103.0, 109.53], [113.0, 123.45], [124.0, 127.3], [128.0, 129.96], [132.0, 132.46], [135.0, 136.59], [137.0, 145.94], [148.0, 159.29]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.47, 0.0, 34.12, 33.92, 35.2, 0.0, 97.83, 66.27, 84.98, 70.86, 0.0, 32.27, 49.59, 72.75, 96.42, 76.37, 0.0, 0.0, 0.0, 65.44, 58.72], "audiomae_on_audioset": [null, null, null, [["music", 34.2], ["speech", 24.56], ["musical instrument", 10.95]], null, [["music", 69.1], ["animal", 4.1], ["piano", 2.12]], [["music", 77.03], ["musical instrument", 3.44], ["keyboard (musical)", 2.45]], [["music", 43.23], ["speech", 28.17], ["musical instrument", 5.96]], null, null, null, null, null, null, [["music", 47.22], ["throbbing", 16.16], ["hum", 7.68]], [["hum", 29.7], ["mains hum", 27.42], ["speech", 16.37]], null, null, null, null, null, null, null, null], "duration": [1.13, 0.96, 1.41, 2.66, 1.59, 12.1, 14.2, 2.49, 0.62, 3.64, 2.81, 2.79, 3.17, 1.09, 3.84, 3.26, 6.53, 10.45, 3.3, 1.96, 0.46, 1.59, 8.94, 11.29]} \ No newline at end of file diff --git a/annotations_1/BCSe_CsI75w_filtered.json b/annotations_1/BCSe_CsI75w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73325adec71cfcce96d01f9ffe9ffdd23623dc91 --- /dev/null +++ b/annotations_1/BCSe_CsI75w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.72], [28.0, 29.74], [40.0, 39.61], [40.0, 41.27], [60.0, 61.2], [66.0, 68.77], [75.0, 79.93], [81.0, 81.46], [82.0, 81.65], [84.0, 86.91], [91.0, 93.58], [99.0, 100.7], [101.0, 100.97], [101.0, 101.01], [101.0, 101.56], [107.0, 108.03], [116.0, 116.85]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.34, 31.57, 0.0, 0.0, 37.53, 34.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 81.78], ["synthesizer", 5.1], ["musical instrument", 3.09]], [["music", 42.22], ["musical instrument", 8.06], ["theremin", 7.81]], null, null, [["music", 65.35], ["synthesizer", 4.69], ["sampler", 3.3]], [["music", 56.21], ["boing", 8.16], ["speech", 5.05]], null, null, null, null, null, null], "duration": [0.72, 1.74, -0.39, 1.27, 1.2, 2.77, 4.93, 0.46, -0.35, 2.91, 2.58, 1.7, -0.03, 0.01, 0.56, 1.03, 0.85]} \ No newline at end of file diff --git a/annotations_1/BCcw2q6KbbI_filtered.json b/annotations_1/BCcw2q6KbbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7aa3a41670e83be056920cfb659e2462625d184 --- /dev/null +++ b/annotations_1/BCcw2q6KbbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.99], [4.0, 4.87], [14.0, 15.38], [37.0, 38.01], [49.0, 49.67], [55.0, 55.54], [60.0, 60.83], [63.0, 64.0], [74.0, 73.87], [77.0, 76.98], [82.0, 91.12], [96.0, 96.11], [102.0, 102.56], [106.0, 112.18], [113.0, 113.53], [118.0, 119.03], [135.0, 138.33], [144.0, 145.03], [154.0, 154.3], [159.0, 159.95], [165.0, 165.35], [168.0, 168.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.46, 0.0, 0.0, 32.57, 0.0, 0.0, 37.92, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 39.05], ["sidetone", 23.77], ["synthesizer", 11.14]], null, null, [["music", 67.96], ["musical instrument", 7.86], ["synthesizer", 6.45]], null, null, [["music", 62.49], ["synthesizer", 15.7], ["musical instrument", 3.64]], null, null, null, null, null], "duration": [-0.01, 0.87, 1.38, 1.01, 0.67, 0.54, 0.83, 1.0, -0.13, -0.02, 9.12, 0.11, 0.56, 6.18, 0.53, 1.03, 3.33, 1.03, 0.3, 0.95, 0.35, 0.42]} \ No newline at end of file diff --git a/annotations_1/BCyz82L_61E_filtered.json b/annotations_1/BCyz82L_61E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9968f0f6ba4d85c51cda17ad9122fc22b1c728b0 --- /dev/null +++ b/annotations_1/BCyz82L_61E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.17], [11.0, 11.91], [19.0, 19.75], [26.0, 26.38], [27.0, 27.53], [28.0, 28.71], [32.0, 32.53], [39.0, 41.86], [45.0, 47.33], [49.0, 50.41], [67.0, 71.9], [74.0, 83.22], [84.0, 88.32], [89.0, 110.3], [116.0, 128.16], [133.0, 136.43], [137.0, 138.45], [140.0, 140.63], [148.0, 148.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.57, 97.43, 0.0, 95.09, 92.48, 68.28, 31.47, 31.35, 65.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.67], ["speech", 9.22], ["whack, thwack", 7.92]], [["music", 53.34], ["speech", 12.45], ["whack, thwack", 5.03]], null, null, null, null], "duration": [3.17, 0.91, 0.75, 0.38, 0.53, 0.71, 0.53, 2.86, 2.33, 1.41, 4.9, 9.22, 4.32, 21.3, 12.16, 3.43, 1.45, 0.63, 0.58]} \ No newline at end of file diff --git a/annotations_1/BDZK9B4Gu6g_filtered.json b/annotations_1/BDZK9B4Gu6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a05a2cf1cc51abf6dbc502fae6169c00b98a821 --- /dev/null +++ b/annotations_1/BDZK9B4Gu6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.54], [11.0, 11.52], [16.0, 17.98], [19.0, 20.38], [23.0, 24.31], [25.0, 28.12], [31.0, 31.13], [33.0, 33.3], [35.0, 35.78], [38.0, 38.85], [41.0, 43.01], [44.0, 73.4], [74.0, 98.63], [101.0, 126.67], [128.0, 142.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.38, 0.0, 0.0, 0.0, 0.0, 35.5, 29.96, 31.43, 29.87, 30.6], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 72.99], ["sine wave", 3.74], ["hum", 2.44]], null, null, null, null, [["music", 23.05], ["speech", 18.96], ["didgeridoo", 6.55]], [["buzz", 39.43], ["music", 23.36], ["fly, housefly", 10.24]], [["music", 41.74], ["theremin", 21.08], ["speech", 10.46]], [["music", 61.71], ["carnatic music", 5.39], ["tabla", 3.51]], [["music", 28.64], ["cowbell", 16.92], ["cacophony", 16.4]]], "duration": [1.54, 0.52, 1.98, 1.38, 1.31, 3.12, 0.13, 0.3, 0.78, 0.85, 2.01, 29.4, 24.63, 25.67, 14.75]} \ No newline at end of file diff --git a/annotations_1/BDvjjQvM498_filtered.json b/annotations_1/BDvjjQvM498_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88ae4b861f455f427446e7ba02081e5e81086ab4 --- /dev/null +++ b/annotations_1/BDvjjQvM498_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 18.05], [19.0, 91.5], [93.0, 97.68], [102.0, 103.86], [105.0, 107.5], [111.0, 111.94], [115.0, 114.74], [117.0, 117.95], [120.0, 124.16], [125.0, 126.28], [131.0, 134.16], [135.0, 140.63], [142.0, 143.41], [147.0, 150.45], [151.0, 153.55], [155.0, 157.17], [158.0, 159.39], [160.0, 164.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [92.48, 0.0, 69.88, 0.0, 54.17, 0.0, 0.0, 0.0, 65.09, 0.0, 51.88, 48.19, 0.0, 37.42, 69.47, 79.24, 0.0, 40.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.56], ["music", 15.82], ["didgeridoo", 8.22]], null, [["speech", 65.49], ["music", 22.57], ["radio", 0.91]], null, null, null, [["speech", 33.37], ["music", 23.37], ["sidetone", 23.02]]], "duration": [12.05, 72.5, 4.68, 1.86, 2.5, 0.94, -0.26, 0.95, 4.16, 1.28, 3.16, 5.63, 1.41, 3.45, 2.55, 2.17, 1.39, 4.12]} \ No newline at end of file diff --git a/annotations_1/BEKzJzaZ0Fk_filtered.json b/annotations_1/BEKzJzaZ0Fk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0a48eb0c34702d7f8676c871aed8212c477d3d5 --- /dev/null +++ b/annotations_1/BEKzJzaZ0Fk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.8], [8.0, 8.65], [11.0, 11.06], [14.0, 14.96], [17.0, 17.09], [21.0, 24.04], [27.0, 27.21], [30.0, 30.0], [33.0, 32.88], [34.0, 34.38], [35.0, 42.06], [45.0, 44.9], [48.0, 48.24], [52.0, 53.65], [57.0, 57.55], [61.0, 61.47], [62.0, 63.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 42.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 62.59], ["radio", 20.87], ["sidetone", 7.97]], null, null, null, null, null, null], "duration": [-0.2, 0.65, 0.06, 0.96, 0.09, 3.04, 0.21, 0.0, -0.12, 0.38, 7.06, -0.1, 0.24, 1.65, 0.55, 0.47, 1.19]} \ No newline at end of file diff --git a/annotations_1/BEsaqfzc6wQ_filtered.json b/annotations_1/BEsaqfzc6wQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7dc76bfed3f5ac7b34e591592990bcddbb387d5c --- /dev/null +++ b/annotations_1/BEsaqfzc6wQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 25.08], [31.0, 33.83], [36.0, 37.25], [49.0, 49.79], [53.0, 54.01], [57.0, 57.87], [61.0, 61.84], [65.0, 84.55], [87.0, 88.37], [91.0, 92.45], [95.0, 96.47], [99.0, 100.41], [103.0, 105.19], [108.0, 108.77], [115.0, 118.07]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.38, 43.38, 0.0, 0.0, 0.0, 0.0, 0.0, 66.15, 0.0, 0.0, 0.0, 0.0, 89.54, 0.0, 95.91], "audiomae_on_audioset": [[["hum", 43.16], ["mains hum", 17.38], ["noise", 8.05]], [["hum", 22.67], ["mains hum", 20.75], ["arrow", 8.42]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.08, 2.83, 1.25, 0.79, 1.01, 0.87, 0.84, 19.55, 1.37, 1.45, 1.47, 1.41, 2.19, 0.77, 3.07]} \ No newline at end of file diff --git a/annotations_1/BFAfiz1daR4_filtered.json b/annotations_1/BFAfiz1daR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1096427ff7cef9bf03a98509469ba7b8811443dc --- /dev/null +++ b/annotations_1/BFAfiz1daR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.4], [25.0, 25.86], [26.0, 30.0], [32.0, 32.85], [35.0, 38.3], [43.0, 60.44], [63.0, 63.44], [65.0, 64.99], [65.0, 65.53], [68.0, 70.58], [71.0, 71.61]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.9, 0.0, 99.48, 29.54, 0.0, 0.0, 0.0, 83.7, 0.0], "audiomae_on_audioset": [null, null, [["speech", 58.8], ["sidetone", 14.7], ["noise", 9.96]], null, null, [["music", 26.68], ["machine gun", 19.54], ["speech", 16.97]], null, null, null, null, null], "duration": [0.4, 0.86, 4.0, 0.85, 3.3, 17.44, 0.44, -0.01, 0.53, 2.58, 0.61]} \ No newline at end of file diff --git a/annotations_1/BFSjHBVx-xk_filtered.json b/annotations_1/BFSjHBVx-xk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39dc33fb3ac8b45f46ec7042667eccd454ad689c --- /dev/null +++ b/annotations_1/BFSjHBVx-xk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 48.0], [50.0, 141.44]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [45.0, 91.44]} \ No newline at end of file diff --git a/annotations_1/BG3bNlh0qiU_filtered.json b/annotations_1/BG3bNlh0qiU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9f8835d706c22b5d912997cff24a565ebe730bc --- /dev/null +++ b/annotations_1/BG3bNlh0qiU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 47.39], [50.0, 55.86], [59.0, 84.27], [85.0, 85.33], [86.0, 98.29], [100.0, 100.77], [102.0, 104.14], [105.0, 110.56], [114.0, 114.59]], "keep_status": [false, true, true, false, true, false, true, false, false], "silence_prob": [0.0, 30.3, 29.96, 0.0, 30.24, 0.0, 31.56, 29.43, 0.0], "audiomae_on_audioset": [null, [["music", 24.43], ["hum", 15.14], ["mains hum", 10.63]], [["music", 33.89], ["noise", 20.81], ["hum", 7.54]], null, [["music", 31.46], ["hum", 17.22], ["cacophony", 10.04]], null, [["speech", 41.58], ["hum", 8.86], ["mains hum", 7.26]], [["speech", 59.96], ["music", 7.06], ["hum", 3.55]], null], "duration": [0.39, 5.86, 25.27, 0.33, 12.29, 0.77, 2.14, 5.56, 0.59]} \ No newline at end of file diff --git a/annotations_1/BGEFW4kc5EQ_filtered.json b/annotations_1/BGEFW4kc5EQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4d0a0b0ca8b603b1db2ac6bf5d00a7d83e9f137 --- /dev/null +++ b/annotations_1/BGEFW4kc5EQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.24], [35.0, 35.95], [73.0, 78.63], [80.0, 80.5], [83.0, 83.56], [86.0, 86.43], [96.0, 99.23], [114.0, 114.88], [122.0, 123.11], [135.0, 143.77], [147.0, 148.15], [149.0, 149.23], [152.0, 157.18]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 31.78, 0.0, 0.0, 0.0, 29.24, 0.0, 0.0, 32.65, 0.0, 0.0, 33.21], "audiomae_on_audioset": [null, null, [["music", 34.66], ["hum", 9.9], ["throbbing", 8.04]], null, null, null, [["music", 53.03], ["throbbing", 14.94], ["didgeridoo", 11.28]], null, null, [["music", 30.12], ["animal", 8.29], ["livestock, farm animals, working animals", 8.0]], null, null, [["music", 21.55], ["mosquito", 17.83], ["fly, housefly", 16.59]]], "duration": [1.24, 0.95, 5.63, 0.5, 0.56, 0.43, 3.23, 0.88, 1.11, 8.77, 1.15, 0.23, 5.18]} \ No newline at end of file diff --git a/annotations_1/BGGyUpO3W-A_filtered.json b/annotations_1/BGGyUpO3W-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f85b24aac03dc3ad1b01b4c6c893cf9b89bba9ee --- /dev/null +++ b/annotations_1/BGGyUpO3W-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.5], [17.0, 16.9], [19.0, 20.98], [23.0, 25.79], [27.0, 29.22], [31.0, 35.29], [37.0, 43.88], [49.0, 51.6], [56.0, 58.99], [72.0, 104.7]], "keep_status": [false, false, false, false, true, false, false, false, false, false], "silence_prob": [32.4, 0.0, 0.0, 32.59, 48.61, 35.43, 29.48, 29.4, 29.49, 0.0], "audiomae_on_audioset": [[["music", 47.03], ["musical instrument", 12.22], ["guitar", 10.83]], null, null, [["music", 67.34], ["musical instrument", 16.09], ["guitar", 6.29]], [["music", 45.07], ["speech", 4.84], ["chorus effect", 3.59]], [["music", 62.57], ["musical instrument", 10.25], ["synthesizer", 10.04]], [["music", 72.86], ["electronic music", 1.94], ["sampler", 1.5]], [["music", 75.52], ["sampler", 1.78], ["singing", 1.48]], [["music", 47.9], ["speech", 21.08], ["electronic music", 3.24]], null], "duration": [3.5, -0.1, 1.98, 2.79, 2.22, 4.29, 6.88, 2.6, 2.99, 32.7]} \ No newline at end of file diff --git a/annotations_1/BGOL5YmTrAY_filtered.json b/annotations_1/BGOL5YmTrAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19e685bbbb6fb37c8ecf85c7f04baebab77a0b4d --- /dev/null +++ b/annotations_1/BGOL5YmTrAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.89], [22.0, 22.71], [27.0, 27.63], [31.0, 36.9], [39.0, 40.9], [42.0, 42.7], [44.0, 45.05], [47.0, 57.23], [63.0, 70.85], [73.0, 74.19], [77.0, 77.85], [82.0, 82.27], [85.0, 86.61], [87.0, 89.51], [91.0, 95.28], [96.0, 96.72], [102.0, 110.35], [115.0, 128.8], [130.0, 135.4], [136.0, 140.19], [142.0, 144.9], [147.0, 150.74], [151.0, 153.82], [157.0, 157.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, true, false, false], "silence_prob": [33.96, 0.0, 0.0, 37.56, 0.0, 0.0, 0.0, 31.64, 37.26, 0.0, 0.0, 0.0, 0.0, 30.7, 32.87, 0.0, 30.79, 31.29, 30.35, 31.87, 31.83, 31.02, 30.63, 0.0], "audiomae_on_audioset": [[["throbbing", 43.51], ["music", 32.46], ["speech", 7.61]], null, null, [["music", 59.38], ["theremin", 10.82], ["didgeridoo", 7.87]], null, null, null, [["music", 52.73], ["throbbing", 14.76], ["hum", 5.49]], [["music", 65.28], ["speech", 9.57], ["musical instrument", 2.94]], null, null, null, null, [["music", 60.69], ["speech", 17.52], ["boing", 3.76]], [["music", 71.02], ["speech", 5.39], ["throbbing", 3.66]], null, [["music", 55.87], ["speech", 5.2], ["musical instrument", 4.84]], [["music", 37.17], ["bleat", 19.18], ["sheep", 10.32]], [["music", 45.84], ["speech", 21.64], ["synthesizer", 3.89]], [["music", 52.11], ["speech", 7.17], ["musical instrument", 5.91]], [["music", 50.3], ["speech", 14.08], ["throbbing", 5.36]], [["speech", 24.11], ["cattle, bovinae", 12.12], ["moo", 10.33]], [["cattle, bovinae", 50.07], ["moo", 29.28], ["livestock, farm animals, working animals", 17.38]], null], "duration": [4.89, 0.71, 0.63, 5.9, 1.9, 0.7, 1.05, 10.23, 7.85, 1.19, 0.85, 0.27, 1.61, 2.51, 4.28, 0.72, 8.35, 13.8, 5.4, 4.19, 2.9, 3.74, 2.82, 0.86]} \ No newline at end of file diff --git a/annotations_1/BGZN_6xPw64_filtered.json b/annotations_1/BGZN_6xPw64_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86daacb036394612153919ffd4d7476644769be2 --- /dev/null +++ b/annotations_1/BGZN_6xPw64_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 33.44], [38.0, 42.99], [44.0, 48.69], [51.0, 56.94], [64.0, 70.65], [76.0, 81.36], [82.0, 88.08], [89.0, 90.26], [92.0, 92.79], [94.0, 95.3], [102.0, 103.77], [105.0, 109.58]], "keep_status": [true, false, false, false, false, true, true, false, false, false, false, true], "silence_prob": [29.38, 44.4, 30.48, 29.45, 29.55, 28.42, 32.69, 0.0, 0.0, 0.0, 0.0, 46.4], "audiomae_on_audioset": [[["speech", 19.24], ["music", 17.87], ["cattle, bovinae", 15.22]], [["speech", 42.11], ["music", 25.67], ["singing bowl", 6.61]], [["music", 78.03], ["mains hum", 3.71], ["hum", 3.64]], [["music", 46.36], ["speech", 29.7], ["didgeridoo", 4.86]], [["speech", 37.01], ["explosion", 27.11], ["burst, pop", 9.42]], [["explosion", 26.4], ["eruption", 16.86], ["burst, pop", 11.1]], [["explosion", 44.46], ["speech", 11.53], ["burst, pop", 8.54]], null, null, null, null, [["music", 47.97], ["hum", 8.47], ["theremin", 7.51]]], "duration": [6.44, 4.99, 4.69, 5.94, 6.65, 5.36, 6.08, 1.26, 0.79, 1.3, 1.77, 4.58]} \ No newline at end of file diff --git a/annotations_1/BGlWalxUId0_filtered.json b/annotations_1/BGlWalxUId0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..646a36e7028351be2c6c7a2595ddea7d33c54bb1 --- /dev/null +++ b/annotations_1/BGlWalxUId0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.21], [8.0, 8.72], [10.0, 11.53], [12.0, 14.66], [17.0, 18.33], [19.0, 19.87], [21.0, 23.19], [24.0, 29.52], [32.0, 33.12], [35.0, 38.47], [39.0, 41.62], [42.0, 43.09], [43.0, 44.56], [47.0, 48.42], [50.0, 51.16], [52.0, 52.89], [58.0, 62.01], [63.0, 63.0], [65.0, 66.14], [67.0, 68.54], [69.0, 70.95], [73.0, 73.16], [75.0, 75.03], [76.0, 95.72], [97.0, 99.55], [100.0, 101.04], [103.0, 106.44], [112.0, 112.6], [113.0, 113.81], [115.0, 115.23], [116.0, 116.5], [120.0, 120.93], [122.0, 123.03], [124.0, 126.66], [127.0, 127.13], [129.0, 129.81], [131.0, 131.26], [132.0, 132.98], [134.0, 134.77]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.27, 0.0, 0.0, 47.12, 0.0, 0.0, 100.0, 31.03, 0.0, 60.32, 56.86, 0.0, 0.0, 0.0, 0.0, 0.0, 45.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.99, 78.38, 0.0, 45.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["sidetone", 89.97], ["speech", 4.62], ["hum", 0.99]], null, null, null, [["fly, housefly", 21.79], ["mosquito", 15.25], ["explosion", 14.34]], null, null, null, null, null, null, null, null, [["music", 43.52], ["speech", 31.59], ["synthesizer", 4.67]], null, null, null, null, null, null, [["saxophone", 44.67], ["music", 28.32], ["brass instrument", 7.79]], null, null, [["boing", 36.41], ["speech", 25.42], ["music", 9.58]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.21, 0.72, 1.53, 2.66, 1.33, 0.87, 2.19, 5.52, 1.12, 3.47, 2.62, 1.09, 1.56, 1.42, 1.16, 0.89, 4.01, 0.0, 1.14, 1.54, 1.95, 0.16, 0.03, 19.72, 2.55, 1.04, 3.44, 0.6, 0.81, 0.23, 0.5, 0.93, 1.03, 2.66, 0.13, 0.81, 0.26, 0.98, 0.77]} \ No newline at end of file diff --git a/annotations_1/BGmXnidRtoA_filtered.json b/annotations_1/BGmXnidRtoA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62299687d580413aa8eb5f7f43f11e7325c68d6b --- /dev/null +++ b/annotations_1/BGmXnidRtoA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [7.0, 7.65], [9.0, 10.12], [11.0, 11.48], [13.0, 14.12], [21.0, 22.47], [23.0, 24.68], [25.0, 25.47], [30.0, 36.02], [37.0, 37.72], [39.0, 40.74], [42.0, 42.13], [43.0, 43.31], [45.0, 45.06], [49.0, 49.44], [51.0, 50.9], [60.0, 59.86], [61.0, 62.68], [68.0, 68.99], [72.0, 73.55], [74.0, 76.81], [79.0, 79.3], [83.0, 87.51], [88.0, 90.26], [91.0, 99.59], [100.0, 100.97], [101.0, 103.15], [106.0, 107.33], [108.0, 108.78], [110.0, 110.73], [113.0, 114.39], [122.0, 122.32], [125.0, 126.2], [129.0, 141.61], [142.0, 149.22], [150.0, 151.38], [152.0, 155.55], [156.0, 157.89], [159.0, 160.64], [163.0, 165.45], [166.0, 166.75], [168.0, 177.45], [179.0, 180.2], [182.0, 184.45], [185.0, 188.62], [189.0, 190.07], [192.0, 192.67], [194.0, 195.35], [197.0, 199.52], [200.0, 207.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 0.0, 100.0, 67.0, 98.73, 0.0, 59.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.22, 76.2, 0.0, 79.41, 0.0, 0.0, 99.56, 0.0, 43.28, 0.0, 69.2, 99.95, 0.0, 0.0, 0.0, 100.0, 92.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.17], ["sidetone", 24.4], ["noise", 5.3]], null, null, null, null, null, null, null, null], "duration": [1.56, 0.65, 1.12, 0.48, 1.12, 1.47, 1.68, 0.47, 6.02, 0.72, 1.74, 0.13, 0.31, 0.06, 0.44, -0.1, -0.14, 1.68, 0.99, 1.55, 2.81, 0.3, 4.51, 2.26, 8.59, 0.97, 2.15, 1.33, 0.78, 0.73, 1.39, 0.32, 1.2, 12.61, 7.22, 1.38, 3.55, 1.89, 1.64, 2.45, 0.75, 9.45, 1.2, 2.45, 3.62, 1.07, 0.67, 1.35, 2.52, 7.05]} \ No newline at end of file diff --git a/annotations_1/BH-EprDz8wI_filtered.json b/annotations_1/BH-EprDz8wI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6236b9ed90d9b60ac84216ab82c7235651331eb5 --- /dev/null +++ b/annotations_1/BH-EprDz8wI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 55.95], [57.0, 57.82], [58.0, 69.06], [70.0, 106.46]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 44.09, 0.0], "audiomae_on_audioset": [null, null, [["music", 71.76], ["singing bowl", 4.02], ["synthesizer", 3.03]], null], "duration": [51.95, 0.82, 11.06, 36.46]} \ No newline at end of file diff --git a/annotations_1/BICqcEvzhVw_filtered.json b/annotations_1/BICqcEvzhVw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ad419c118453495475175efd7fd2f85c101363d --- /dev/null +++ b/annotations_1/BICqcEvzhVw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.23], [10.0, 11.03], [18.0, 18.87], [21.0, 22.59], [25.0, 25.02], [30.0, 30.08], [31.0, 31.65], [34.0, 35.21], [36.0, 37.54], [38.0, 39.14], [41.0, 41.52], [44.0, 47.71], [48.0, 48.64], [49.0, 49.5], [51.0, 51.93], [53.0, 53.99], [55.0, 54.9], [57.0, 57.65], [58.0, 58.53], [59.0, 59.75], [61.0, 61.5], [63.0, 63.14], [64.0, 64.54], [66.0, 66.39], [69.0, 70.07], [72.0, 73.11], [73.0, 74.56], [75.0, 76.38], [83.0, 83.34], [85.0, 87.35], [88.0, 91.02], [93.0, 94.58], [95.0, 96.43], [99.0, 99.72], [101.0, 102.37], [103.0, 103.77], [107.0, 107.18], [114.0, 114.56], [118.0, 119.2], [120.0, 123.36], [127.0, 127.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 49.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 77.45], ["hum", 3.9], ["noise", 2.28]], null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 1.03, 0.87, 1.59, 0.02, 0.08, 0.65, 1.21, 1.54, 1.14, 0.52, 3.71, 0.64, 0.5, 0.93, 0.99, -0.1, 0.65, 0.53, 0.75, 0.5, 0.14, 0.54, 0.39, 1.07, 1.11, 1.56, 1.38, 0.34, 2.35, 3.02, 1.58, 1.43, 0.72, 1.37, 0.77, 0.18, 0.56, 1.2, 3.36, 0.08]} \ No newline at end of file diff --git a/annotations_1/BIdtUDoR5A0_filtered.json b/annotations_1/BIdtUDoR5A0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c878c6430bca4f044978914420326577b44382dd --- /dev/null +++ b/annotations_1/BIdtUDoR5A0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 39.6], [41.0, 41.94], [43.0, 48.57], [53.0, 53.43], [57.0, 59.8], [62.0, 72.22], [75.0, 99.33], [103.0, 103.27], [104.0, 104.25], [106.0, 106.54], [107.0, 110.98], [113.0, 142.42], [148.0, 148.39], [150.0, 150.92], [152.0, 173.25]], "keep_status": [false, false, true, false, true, false, true, false, false, false, true, true, false, false, false], "silence_prob": [28.38, 0.0, 28.41, 0.0, 28.4, 28.38, 28.24, 0.0, 0.0, 0.0, 29.1, 28.18, 0.0, 0.0, 28.16], "audiomae_on_audioset": [[["speech", 67.48], ["music", 13.12], ["cacophony", 2.76]], null, [["rumble", 13.34], ["mains hum", 12.57], ["speech", 11.91]], null, [["explosion", 21.8], ["zipper (clothing)", 14.96], ["fart", 8.96]], [["music", 48.3], ["breaking", 14.81], ["smash, crash", 7.35]], [["music", 37.9], ["boom", 7.37], ["whack, thwack", 3.69]], null, null, null, [["music", 50.11], ["rumble", 14.61], ["mains hum", 4.68]], [["whack, thwack", 16.61], ["boom", 9.91], ["explosion", 6.48]], null, null, [["music", 74.88], ["cacophony", 3.64], ["electronic music", 3.17]]], "duration": [24.6, 0.94, 5.57, 0.43, 2.8, 10.22, 24.33, 0.27, 0.25, 0.54, 3.98, 29.42, 0.39, 0.92, 21.25]} \ No newline at end of file diff --git a/annotations_1/BIg5_09Tcf8_filtered.json b/annotations_1/BIg5_09Tcf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed33f32284821be1d585fda86d947afc3360ff97 --- /dev/null +++ b/annotations_1/BIg5_09Tcf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[87.0, 106.42], [108.0, 111.25], [114.0, 117.96], [119.0, 132.24]], "keep_status": [true, true, true, true], "silence_prob": [30.62, 33.29, 31.41, 29.76], "audiomae_on_audioset": [[["buzz", 27.82], ["music", 25.51], ["hum", 8.6]], [["hum", 22.92], ["throbbing", 11.77], ["music", 9.5]], [["hum", 26.17], ["mains hum", 24.12], ["music", 11.76]], [["music", 17.41], ["mains hum", 15.12], ["hum", 13.61]]], "duration": [19.42, 3.25, 3.96, 13.24]} \ No newline at end of file diff --git a/annotations_1/BJWR0io_SuE_filtered.json b/annotations_1/BJWR0io_SuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bba85bb9bc195fd046915ae045236c1daa9d0d8 --- /dev/null +++ b/annotations_1/BJWR0io_SuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.07], [15.0, 24.53], [25.0, 29.3], [30.0, 33.15], [34.0, 37.44], [38.0, 39.11], [40.0, 40.47], [41.0, 43.5], [47.0, 48.61], [49.0, 49.6], [53.0, 53.32], [54.0, 58.23], [59.0, 61.82], [63.0, 64.35], [65.0, 65.7], [66.0, 67.05], [68.0, 69.26], [71.0, 72.28], [76.0, 75.96], [77.0, 80.27], [83.0, 90.83], [91.0, 92.01], [93.0, 93.26], [94.0, 95.12], [97.0, 97.83], [104.0, 115.16], [116.0, 118.18], [119.0, 124.09], [128.0, 128.65], [130.0, 132.8], [136.0, 137.12], [142.0, 145.42], [153.0, 156.57], [159.0, 160.54], [164.0, 164.96], [170.0, 170.78], [173.0, 176.44], [177.0, 178.82]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, true, false], "silence_prob": [49.78, 78.89, 76.53, 85.9, 50.91, 0.0, 0.0, 48.39, 0.0, 0.0, 0.0, 52.39, 50.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.34, 52.1, 0.0, 0.0, 0.0, 0.0, 35.13, 32.82, 39.11, 0.0, 30.61, 0.0, 31.09, 38.3, 0.0, 0.0, 0.0, 44.99, 0.0], "audiomae_on_audioset": [[["music", 63.56], ["hum", 11.15], ["mains hum", 3.72]], null, null, null, null, null, null, [["music", 34.81], ["sidetone", 17.83], ["speech", 16.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 23.13], ["sonar", 20.45], ["hum", 15.01]], [["speech", 57.52], ["sidetone", 29.02], ["dial tone", 2.24]], [["music", 16.0], ["gong", 13.18], ["hum", 12.79]], null, [["music", 59.84], ["synthesizer", 8.57], ["throbbing", 7.25]], null, [["throbbing", 35.97], ["hum", 20.55], ["music", 19.84]], [["speech", 19.71], ["music", 14.81], ["hum", 12.22]], null, null, null, [["hum", 44.53], ["mains hum", 13.67], ["whale vocalization", 7.86]], null], "duration": [6.07, 9.53, 4.3, 3.15, 3.44, 1.11, 0.47, 2.5, 1.61, 0.6, 0.32, 4.23, 2.82, 1.35, 0.7, 1.05, 1.26, 1.28, -0.04, 3.27, 7.83, 1.01, 0.26, 1.12, 0.83, 11.16, 2.18, 5.09, 0.65, 2.8, 1.12, 3.42, 3.57, 1.54, 0.96, 0.78, 3.44, 1.82]} \ No newline at end of file diff --git a/annotations_1/BKYpzJIAkeo_filtered.json b/annotations_1/BKYpzJIAkeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab5d8f05d4107f39789e7569334c1f03684b9eec --- /dev/null +++ b/annotations_1/BKYpzJIAkeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.3], [12.0, 13.05], [29.0, 28.97], [36.0, 37.5], [45.0, 45.54], [72.0, 79.46], [82.0, 83.27], [88.0, 88.67], [90.0, 91.13], [93.0, 94.1], [100.0, 100.99], [109.0, 110.05], [122.0, 122.5], [124.0, 124.58], [127.0, 127.79], [130.0, 130.57], [134.0, 134.43], [139.0, 139.62], [145.0, 145.57], [150.0, 150.62], [153.0, 154.25], [156.0, 158.31], [161.0, 161.69], [165.0, 165.55], [169.0, 170.36], [171.0, 172.49]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 28.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.55, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 25.72], ["mains hum", 19.49], ["music", 18.7]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 26.32], ["music", 25.37], ["mains hum", 17.22]], null, null, null, null], "duration": [0.3, 1.05, -0.03, 1.5, 0.54, 7.46, 1.27, 0.67, 1.13, 1.1, 0.99, 1.05, 0.5, 0.58, 0.79, 0.57, 0.43, 0.62, 0.57, 0.62, 1.25, 2.31, 0.69, 0.55, 1.36, 1.49]} \ No newline at end of file diff --git a/annotations_1/BKgd8Q3X0AA_filtered.json b/annotations_1/BKgd8Q3X0AA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb6677d4f0ce8fa6f3f4f41b0c07a3a0a3e2b6e8 --- /dev/null +++ b/annotations_1/BKgd8Q3X0AA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.31], [2.0, 1.71], [4.0, 7.43], [15.0, 16.39], [18.0, 26.38], [32.0, 33.3], [34.0, 35.02], [36.0, 36.73], [46.0, 46.95], [48.0, 48.78], [52.0, 53.28], [56.0, 56.2], [57.0, 57.47], [61.0, 66.18], [69.0, 73.68], [75.0, 94.12], [94.0, 114.24]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 31.56, 0.0, 30.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.62, 31.49, 28.66, 29.31], "audiomae_on_audioset": [null, null, [["music", 27.53], ["noise", 19.29], ["hum", 13.38]], null, [["music", 27.37], ["hum", 11.54], ["rumble", 9.41]], null, null, null, null, null, null, null, null, [["hum", 19.38], ["music", 17.36], ["throbbing", 11.93]], [["speech", 27.12], ["music", 23.01], ["hum", 9.49]], [["music", 23.08], ["smash, crash", 17.48], ["thump, thud", 10.9]], [["didgeridoo", 36.97], ["music", 33.8], ["whack, thwack", 4.49]]], "duration": [0.31, -0.29, 3.43, 1.39, 8.38, 1.3, 1.02, 0.73, 0.95, 0.78, 1.28, 0.2, 0.47, 5.18, 4.68, 19.12, 20.24]} \ No newline at end of file diff --git a/annotations_1/BLElh2JGufs_filtered.json b/annotations_1/BLElh2JGufs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb33330700da75e62e4a063fc07c8fe09183dc5a --- /dev/null +++ b/annotations_1/BLElh2JGufs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.79], [13.0, 14.12], [16.0, 18.87], [28.0, 27.55], [31.0, 31.26], [40.0, 40.34], [42.0, 42.01], [44.0, 44.41], [54.0, 54.62], [70.0, 70.34], [73.0, 73.28], [81.0, 80.65], [84.0, 84.16], [85.0, 85.75], [88.0, 88.72], [90.0, 91.02], [92.0, 95.71], [106.0, 106.32], [108.0, 111.47], [114.0, 115.48], [129.0, 130.27], [131.0, 131.79], [135.0, 140.0], [144.0, 143.97], [148.0, 149.32], [156.0, 159.39], [174.0, 175.83], [179.0, 179.44], [181.0, 188.77], [190.0, 191.15], [192.0, 193.38], [200.0, 201.39], [202.0, 205.83], [209.0, 211.65], [213.0, 214.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 69.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.15, 0.0, 56.63, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 70.58, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 93.91, 87.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 1.12, 2.87, -0.45, 0.26, 0.34, 0.01, 0.41, 0.62, 0.34, 0.28, -0.35, 0.16, 0.75, 0.72, 1.02, 3.71, 0.32, 3.47, 1.48, 1.27, 0.79, 5.0, -0.03, 1.32, 3.39, 1.83, 0.44, 7.77, 1.15, 1.38, 1.39, 3.83, 2.65, 1.22]} \ No newline at end of file diff --git a/annotations_1/BLSFQUjyBQo_filtered.json b/annotations_1/BLSFQUjyBQo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..107cc0ddbdef3eed0ae48a30d9b6c6789274ec63 --- /dev/null +++ b/annotations_1/BLSFQUjyBQo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 65.96], [67.0, 179.02]], "keep_status": [false, false], "silence_prob": [28.85, 0.0], "audiomae_on_audioset": [[["hum", 40.39], ["mains hum", 36.76], ["throbbing", 13.11]], null], "duration": [24.96, 112.02]} \ No newline at end of file diff --git a/annotations_1/BLgX2oB_qn4_filtered.json b/annotations_1/BLgX2oB_qn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74b07296ea7d9cdd098840404c527295b328d381 --- /dev/null +++ b/annotations_1/BLgX2oB_qn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[100.0, 100.47], [101.0, 106.05], [107.0, 108.31], [110.0, 113.59], [115.0, 118.94], [120.0, 121.1], [122.0, 121.95]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 51.77, 0.0, 80.11, 36.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 71.23], ["fart", 4.97], ["hum", 4.77]], null, null], "duration": [0.47, 5.05, 1.31, 3.59, 3.94, 1.1, -0.05]} \ No newline at end of file diff --git a/annotations_1/BM29Ze3d_cs_filtered.json b/annotations_1/BM29Ze3d_cs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..209658739d520a9be5a6c1fe96cbfe0f153b2405 --- /dev/null +++ b/annotations_1/BM29Ze3d_cs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.98], [5.0, 4.82], [6.0, 6.84], [8.0, 12.56], [14.0, 17.69], [18.0, 23.84], [24.0, 25.78], [29.0, 29.08], [30.0, 33.74], [35.0, 37.5], [40.0, 40.68], [41.0, 41.37], [42.0, 42.26], [46.0, 50.6], [51.0, 51.51], [52.0, 57.18], [68.0, 68.42], [74.0, 74.95], [83.0, 87.17], [87.0, 87.96], [88.0, 89.07], [91.0, 91.27], [94.0, 94.74], [108.0, 112.73], [116.0, 150.74], [156.0, 155.78], [157.0, 157.62], [159.0, 161.37], [163.0, 204.43], [207.0, 206.9]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.34, 43.33, 31.64, 0.0, 0.0, 62.58, 39.24, 0.0, 0.0, 0.0, 45.56, 0.0, 34.51, 0.0, 0.0, 41.66, 0.0, 0.0, 0.0, 0.0, 37.62, 0.0, 0.0, 0.0, 31.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 48.67], ["electronic music", 10.78], ["synthesizer", 4.81]], [["music", 40.13], ["thunk", 29.31], ["theremin", 4.25]], [["speech", 39.3], ["music", 8.38], ["cattle, bovinae", 7.17]], null, null, null, [["music", 36.72], ["noise", 22.06], ["whale vocalization", 12.54]], null, null, null, [["music", 66.68], ["boing", 7.22], ["plop", 2.42]], null, [["music", 42.62], ["screaming", 36.09], ["speech", 9.61]], null, null, [["hum", 18.66], ["throbbing", 8.98], ["speech", 7.83]], null, null, null, null, [["boing", 41.08], ["music", 39.91], ["speech", 6.3]], null, null, null, [["music", 54.22], ["animal", 5.68], ["grunt", 3.91]], null, null], "duration": [0.98, -0.18, 0.84, 4.56, 3.69, 5.84, 1.78, 0.08, 3.74, 2.5, 0.68, 0.37, 0.26, 4.6, 0.51, 5.18, 0.42, 0.95, 4.17, 0.96, 1.07, 0.27, 0.74, 4.73, 34.74, -0.22, 0.62, 2.37, 41.43, -0.1]} \ No newline at end of file diff --git a/annotations_1/BMlHiDzHkSk_filtered.json b/annotations_1/BMlHiDzHkSk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d212a3ef222828f8e7e106c1e61209684f25eec8 --- /dev/null +++ b/annotations_1/BMlHiDzHkSk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.7], [12.0, 12.5], [15.0, 19.55], [20.0, 20.83], [23.0, 79.83]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 45.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 27.65], ["speech", 17.6], ["synthesizer", 9.67]], null, null], "duration": [-0.3, 0.5, 4.55, 0.83, 56.83]} \ No newline at end of file diff --git a/annotations_1/BN77UGYk5tg_filtered.json b/annotations_1/BN77UGYk5tg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39b3258a1a5deccb6476f3ad9df39deb2f4c6f81 --- /dev/null +++ b/annotations_1/BN77UGYk5tg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.56], [10.0, 10.12], [11.0, 11.26], [12.0, 12.26], [16.0, 16.12], [17.0, 17.52], [18.0, 18.62], [19.0, 19.55], [20.0, 22.3], [24.0, 25.2], [26.0, 27.06], [29.0, 30.89], [32.0, 34.06], [35.0, 36.36], [37.0, 39.19], [40.0, 40.64], [42.0, 42.08], [43.0, 43.77], [45.0, 46.95], [48.0, 49.2], [50.0, 52.78], [55.0, 56.61], [59.0, 59.68], [60.0, 61.67], [63.0, 63.51], [66.0, 66.66], [68.0, 69.99], [72.0, 75.79], [79.0, 80.79], [83.0, 89.51], [90.0, 91.96], [93.0, 94.31], [95.0, 98.31], [99.0, 99.71], [102.0, 104.68], [105.0, 105.92], [107.0, 108.26], [111.0, 112.28], [114.0, 115.65], [117.0, 123.58], [131.0, 135.63], [138.0, 143.8], [144.0, 145.12], [148.0, 149.98], [151.0, 152.76], [154.0, 154.84], [156.0, 156.64], [158.0, 161.57], [163.0, 164.17], [165.0, 165.62], [167.0, 167.8], [168.0, 175.05], [176.0, 177.52], [179.0, 178.71], [179.0, 179.47], [180.0, 183.07], [184.0, 184.84], [185.0, 185.7], [186.0, 195.1], [195.0, 195.78], [197.0, 207.66], [208.0, 209.76], [211.0, 215.22], [218.0, 219.6], [220.0, 221.12], [225.0, 225.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.92, 0.0, 0.0, 0.0, 99.71, 0.0, 70.72, 0.0, 0.0, 0.0, 0.0, 0.0, 35.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 88.46, 0.0, 0.0, 80.11, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 39.47, 35.1, 47.2, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 39.28, 0.0, 0.0, 0.0, 35.81, 0.0, 0.0, 41.18, 0.0, 36.0, 0.0, 92.31, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 66.16], ["dial tone", 20.01], ["telephone", 4.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["radio", 26.76], ["speech", 20.28], ["arrow", 12.57]], [["radio", 37.58], ["creak", 31.13], ["speech", 15.78]], [["insect", 24.28], ["sidetone", 14.46], ["radio", 11.43]], null, null, null, null, null, null, null, null, null, [["animal", 15.77], ["horse", 12.93], ["clip-clop", 5.98]], null, null, null, [["cattle, bovinae", 52.67], ["moo", 32.85], ["livestock, farm animals, working animals", 12.39]], null, null, [["hum", 35.65], ["speech", 12.59], ["stomach rumble", 5.89]], null, [["horse", 8.7], ["burst, pop", 7.09], ["whack, thwack", 5.85]], null, null, null, null, null], "duration": [1.56, 0.12, 0.26, 0.26, 0.12, 0.52, 0.62, 0.55, 2.3, 1.2, 1.06, 1.89, 2.06, 1.36, 2.19, 0.64, 0.08, 0.77, 1.95, 1.2, 2.78, 1.61, 0.68, 1.67, 0.51, 0.66, 1.99, 3.79, 1.79, 6.51, 1.96, 1.31, 3.31, 0.71, 2.68, 0.92, 1.26, 1.28, 1.65, 6.58, 4.63, 5.8, 1.12, 1.98, 1.76, 0.84, 0.64, 3.57, 1.17, 0.62, 0.8, 7.05, 1.52, -0.29, 0.47, 3.07, 0.84, 0.7, 9.1, 0.78, 10.66, 1.76, 4.22, 1.6, 1.12, 0.95]} \ No newline at end of file diff --git a/annotations_1/BN8VnFVqRRI_filtered.json b/annotations_1/BN8VnFVqRRI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04d59700d09207cf233e35f86d160b0932e91285 --- /dev/null +++ b/annotations_1/BN8VnFVqRRI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 68.91], [72.0, 96.06], [102.0, 102.84]], "keep_status": [false, false, false], "silence_prob": [0.0, 29.81, 0.0], "audiomae_on_audioset": [null, [["music", 63.82], ["cacophony", 4.6], ["hum", 4.21]], null], "duration": [43.91, 24.06, 0.84]} \ No newline at end of file diff --git a/annotations_1/BPuGsFSTy0Y_filtered.json b/annotations_1/BPuGsFSTy0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac499b0ee04f29542eb38c7b4f5440f95c231071 --- /dev/null +++ b/annotations_1/BPuGsFSTy0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 13.42], [19.0, 30.3], [34.0, 35.46], [38.0, 39.72], [41.0, 41.91], [43.0, 46.62], [51.0, 52.42], [63.0, 63.73], [74.0, 74.11], [81.0, 82.86], [84.0, 90.46], [91.0, 96.7], [98.0, 98.73], [103.0, 107.67], [112.0, 112.87], [121.0, 122.96], [133.0, 153.52], [155.0, 157.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [31.26, 30.66, 0.0, 0.0, 0.0, 32.16, 0.0, 0.0, 0.0, 0.0, 30.47, 30.07, 0.0, 29.17, 0.0, 0.0, 30.95, 38.58], "audiomae_on_audioset": [[["music", 55.71], ["speech", 18.57], ["throbbing", 6.9]], [["music", 76.6], ["throbbing", 4.12], ["vehicle", 3.32]], null, null, null, [["music", 38.75], ["boing", 29.45], ["speech", 4.38]], null, null, null, null, [["music", 31.06], ["throbbing", 30.08], ["hum", 17.65]], [["cattle, bovinae", 25.16], ["livestock, farm animals, working animals", 24.45], ["moo", 16.38]], null, [["music", 34.22], ["buzz", 20.5], ["smash, crash", 5.5]], null, null, [["music", 88.07], ["didgeridoo", 6.19], ["electronic music", 0.75]], [["livestock, farm animals, working animals", 23.05], ["cattle, bovinae", 12.78], ["music", 10.88]]], "duration": [9.42, 11.3, 1.46, 1.72, 0.91, 3.62, 1.42, 0.73, 0.11, 1.86, 6.46, 5.7, 0.73, 4.67, 0.87, 1.96, 20.52, 2.49]} \ No newline at end of file diff --git a/annotations_1/BQl4CNHsgvc_filtered.json b/annotations_1/BQl4CNHsgvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d2805cc68a9291bca1f234470a9dce15503a3b3 --- /dev/null +++ b/annotations_1/BQl4CNHsgvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.07], [18.0, 43.23], [44.0, 54.4], [55.0, 56.98], [60.0, 64.91], [67.0, 71.14]], "keep_status": [false, false, false, false, false, false], "silence_prob": [46.57, 56.03, 56.18, 0.0, 70.86, 81.0], "audiomae_on_audioset": [[["music", 61.4], ["ambient music", 5.73], ["hum", 5.46]], null, null, null, null, null], "duration": [4.07, 25.23, 10.4, 1.98, 4.91, 4.14]} \ No newline at end of file diff --git a/annotations_1/BR-kA4Jnn8M_filtered.json b/annotations_1/BR-kA4Jnn8M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd52394c3919beb005a908f0d6e4baa138a70d07 --- /dev/null +++ b/annotations_1/BR-kA4Jnn8M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.21], [5.0, 6.37], [20.0, 19.87], [21.0, 21.95], [24.0, 30.35], [31.0, 32.44], [37.0, 37.88], [38.0, 41.07], [43.0, 43.61], [52.0, 52.41], [57.0, 57.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [65.44, 0.0, 0.0, 0.0, 72.75, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [2.21, 1.37, -0.13, 0.95, 6.35, 1.44, 0.88, 3.07, 0.61, 0.41, 0.6]} \ No newline at end of file diff --git a/annotations_1/BRBSfKmp3vs_filtered.json b/annotations_1/BRBSfKmp3vs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5d8bb8a5551bb81fecdd7a12e6092492e348f19 --- /dev/null +++ b/annotations_1/BRBSfKmp3vs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.8], [4.0, 4.09], [5.0, 6.52], [10.0, 10.86], [12.0, 12.73], [13.0, 15.3], [18.0, 19.94], [21.0, 21.79], [23.0, 23.25], [25.0, 25.3], [26.0, 32.41], [33.0, 39.58], [41.0, 47.95], [59.0, 61.74], [63.0, 66.43], [68.0, 69.16], [70.0, 70.78], [76.0, 86.54], [92.0, 97.36], [99.0, 105.14], [106.0, 107.0], [109.0, 109.43], [112.0, 117.68], [119.0, 120.23], [129.0, 130.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 63.1, 35.94, 32.68, 100.0, 99.99, 0.0, 0.0, 41.32, 76.86, 65.44, 0.0, 0.0, 32.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["crushing", 69.55], ["fly, housefly", 6.52], ["glass", 3.94]], [["music", 19.08], ["synthesizer", 11.9], ["effects unit", 9.84]], null, null, null, null, [["music", 61.02], ["throbbing", 16.84], ["hum", 5.73]], null, null, null, null, [["speech", 54.85], ["music", 7.63], ["vehicle", 5.86]], null, null], "duration": [-0.2, 0.09, 1.52, 0.86, 0.73, 2.3, 1.94, 0.79, 0.25, 0.3, 6.41, 6.58, 6.95, 2.74, 3.43, 1.16, 0.78, 10.54, 5.36, 6.14, 1.0, 0.43, 5.68, 1.23, 1.05]} \ No newline at end of file diff --git a/annotations_1/BSQeVY2fdL8_filtered.json b/annotations_1/BSQeVY2fdL8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c37286a17a4a6314c9523bd8d7d96b2f5e77a23a --- /dev/null +++ b/annotations_1/BSQeVY2fdL8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.24], [15.0, 15.26], [17.0, 17.78], [22.0, 23.01], [24.0, 27.36], [30.0, 54.21], [56.0, 56.84], [59.0, 58.83], [62.0, 62.87], [67.0, 68.22], [78.0, 78.54], [80.0, 85.08], [88.0, 146.08], [156.0, 157.59]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 89.01, 32.07, 0.0, 0.0, 0.0, 0.0, 0.0, 30.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 28.59], ["music", 18.0], ["rumble", 8.16]], null, null, null, null, null, [["moo", 23.88], ["livestock, farm animals, working animals", 20.77], ["cattle, bovinae", 16.49]], null, null], "duration": [0.24, 0.26, 0.78, 1.01, 3.36, 24.21, 0.84, -0.17, 0.87, 1.22, 0.54, 5.08, 58.08, 1.59]} \ No newline at end of file diff --git a/annotations_1/BSWKnZ4-2eE_filtered.json b/annotations_1/BSWKnZ4-2eE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30322ba1c866cba0210acf3b4c01597f28d06c80 --- /dev/null +++ b/annotations_1/BSWKnZ4-2eE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 34.03], [34.0, 38.13], [40.0, 44.34], [48.0, 55.71], [62.0, 63.41], [70.0, 74.68], [85.0, 89.63], [90.0, 90.64], [91.0, 91.94], [94.0, 98.07], [104.0, 113.61], [114.0, 137.69]], "keep_status": [false, true, false, false, false, true, false, false, false, true, false, false], "silence_prob": [29.05, 29.27, 29.41, 28.99, 0.0, 30.81, 30.27, 0.0, 0.0, 32.23, 31.2, 30.53], "audiomae_on_audioset": [[["music", 74.0], ["musical instrument", 4.46], ["trombone", 4.22]], [["music", 34.82], ["throbbing", 11.55], ["musical instrument", 9.03]], [["moo", 28.26], ["music", 26.33], ["cattle, bovinae", 24.82]], [["music", 59.16], ["speech", 9.73], ["carnatic music", 9.3]], null, [["music", 50.71], ["musical instrument", 6.55], ["guitar", 6.21]], [["music", 75.91], ["musical instrument", 2.56], ["brass instrument", 1.47]], null, null, [["music", 33.11], ["speech", 19.72], ["foghorn", 12.23]], [["music", 69.25], ["swing music", 6.5], ["trombone", 3.59]], [["music", 60.83], ["musical instrument", 6.15], ["trombone", 5.57]]], "duration": [29.03, 4.13, 4.34, 7.71, 1.41, 4.68, 4.63, 0.64, 0.94, 4.07, 9.61, 23.69]} \ No newline at end of file diff --git a/annotations_1/BTJ-smMan7Y_filtered.json b/annotations_1/BTJ-smMan7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb37364a742cc2d2d643c16c1ba3e5f1221fe876 --- /dev/null +++ b/annotations_1/BTJ-smMan7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 34.94], [36.0, 45.99], [46.0, 46.03], [46.0, 46.06], [46.0, 46.09], [46.0, 46.13], [50.0, 49.91], [50.0, 105.93], [108.0, 111.18], [118.0, 126.44], [130.0, 149.39], [160.0, 168.08], [174.0, 179.73], [180.0, 193.4], [201.0, 203.64], [207.0, 207.18], [210.0, 224.4], [226.0, 229.88], [230.0, 235.52]], "keep_status": [false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 32.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.95, 34.22, 31.51, 36.79, 34.24, 31.56, 33.82, 0.0, 32.14, 32.4, 33.43], "audiomae_on_audioset": [null, [["speech", 59.87], ["music", 23.84], ["shatter", 2.72]], null, null, null, null, null, null, [["speech", 34.43], ["fart", 10.35], ["sound effect", 6.11]], [["music", 21.52], ["groan", 15.76], ["fart", 6.38]], [["speech", 40.7], ["music", 20.16], ["explosion", 7.91]], [["livestock, farm animals, working animals", 29.0], ["cattle, bovinae", 28.3], ["moo", 20.99]], [["cattle, bovinae", 42.76], ["moo", 29.09], ["livestock, farm animals, working animals", 24.9]], [["music", 59.16], ["speech", 11.52], ["sidetone", 6.15]], [["music", 58.66], ["speech", 14.91], ["electronic music", 3.1]], null, [["speech", 37.23], ["music", 25.81], ["vehicle", 12.82]], [["music", 53.63], ["speech", 20.07], ["didgeridoo", 1.75]], [["music", 35.12], ["speech", 5.78], ["didgeridoo", 4.97]]], "duration": [31.94, 9.99, 0.03, 0.06, 0.09, 0.13, -0.09, 55.93, 3.18, 8.44, 19.39, 8.08, 5.73, 13.4, 2.64, 0.18, 14.4, 3.88, 5.52]} \ No newline at end of file diff --git a/annotations_1/BT_QpciXdcI_filtered.json b/annotations_1/BT_QpciXdcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc943b53d147c52a62cd3e96e24cc479c5abcf2e --- /dev/null +++ b/annotations_1/BT_QpciXdcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.94], [24.0, 61.21], [61.0, 63.51], [66.0, 67.26], [69.0, 68.93], [70.0, 71.49], [72.0, 74.01], [78.0, 82.24], [87.0, 87.2], [88.0, 88.57], [90.0, 90.05], [92.0, 95.74], [97.0, 97.23], [98.0, 98.73], [101.0, 104.03], [106.0, 106.07], [107.0, 106.91], [107.0, 108.03], [111.0, 111.91], [113.0, 113.31], [118.0, 121.36], [123.0, 123.42], [123.0, 123.94]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.06, 0.0, 41.64, 0.0, 0.0, 0.0, 99.99, 99.99, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 46.96], ["music", 12.77], ["echo", 8.7]], null, [["music", 54.89], ["musical instrument", 6.94], ["guitar", 3.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.94, 37.21, 2.51, 1.26, -0.07, 1.49, 2.01, 4.24, 0.2, 0.57, 0.05, 3.74, 0.23, 0.73, 3.03, 0.07, -0.09, 1.03, 0.91, 0.31, 3.36, 0.42, 0.94]} \ No newline at end of file diff --git a/annotations_1/BTeAQ_QLObc_filtered.json b/annotations_1/BTeAQ_QLObc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21188dd3faf2bbb8788fb103bbf2cdf3abcde09f --- /dev/null +++ b/annotations_1/BTeAQ_QLObc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.47], [23.0, 23.79], [25.0, 26.05], [43.0, 43.61], [49.0, 49.62], [51.0, 50.99], [55.0, 54.89], [55.0, 55.48], [56.0, 56.4], [58.0, 62.23], [66.0, 66.51], [70.0, 69.74], [72.0, 73.43], [79.0, 78.78], [80.0, 80.96], [82.0, 83.05], [93.0, 92.7], [93.0, 95.0], [98.0, 101.7], [104.0, 107.55], [109.0, 109.66], [110.0, 111.75], [120.0, 120.29], [120.0, 124.61], [125.0, 126.59], [128.0, 129.39], [130.0, 130.67], [133.0, 141.27]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false], "silence_prob": [42.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.91, 44.37, 34.04, 0.0, 0.0, 0.0, 31.4, 0.0, 0.0, 0.0, 32.78], "audiomae_on_audioset": [[["didgeridoo", 58.45], ["music", 24.75], ["throbbing", 3.18]], null, null, null, null, null, null, null, null, [["music", 37.84], ["beatboxing", 8.24], ["synthesizer", 6.48]], null, null, null, null, null, null, null, [["music", 35.84], ["frog", 21.46], ["croak", 8.27]], [["music", 36.22], ["owl", 16.6], ["hoot", 9.21]], [["music", 44.9], ["electronic music", 9.47], ["trance music", 7.64]], null, null, null, [["speech", 53.27], ["music", 24.78], ["hum", 4.46]], null, null, null, [["music", 31.97], ["hum", 31.45], ["throbbing", 24.56]]], "duration": [6.47, 0.79, 1.05, 0.61, 0.62, -0.01, -0.11, 0.48, 0.4, 4.23, 0.51, -0.26, 1.43, -0.22, 0.96, 1.05, -0.3, 2.0, 3.7, 3.55, 0.66, 1.75, 0.29, 4.61, 1.59, 1.39, 0.67, 8.27]} \ No newline at end of file diff --git a/annotations_1/BUB6TUH7N0A_filtered.json b/annotations_1/BUB6TUH7N0A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..565cedef28ffce1d5ad01314643c47851dfb55e2 --- /dev/null +++ b/annotations_1/BUB6TUH7N0A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.99], [5.0, 5.51], [8.0, 8.07], [8.0, 9.95], [16.0, 17.68], [21.0, 29.44], [30.0, 30.84], [31.0, 34.4], [42.0, 42.87], [48.0, 48.93], [55.0, 57.59], [60.0, 60.88], [64.0, 66.07], [69.0, 69.09], [69.0, 69.3], [69.0, 69.33], [69.0, 69.36], [69.0, 69.4], [69.0, 74.14], [76.0, 78.63], [81.0, 82.53], [84.0, 85.11], [87.0, 87.0], [89.0, 93.82], [99.0, 99.94], [113.0, 115.13], [130.0, 131.82], [159.0, 161.3]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.08, 0.0, 30.81, 0.0, 0.0, 30.24, 0.0, 32.07, 0.0, 0.0, 0.0, 0.0, 0.0, 30.83, 32.19, 0.0, 0.0, 0.0, 30.71, 0.0, 31.42, 0.0, 30.14], "audiomae_on_audioset": [null, null, null, null, null, [["music", 69.45], ["musical instrument", 11.11], ["guitar", 5.1]], null, [["music", 58.48], ["musical instrument", 5.01], ["plucked string instrument", 3.05]], null, null, [["music", 74.3], ["guitar", 7.81], ["musical instrument", 6.26]], null, [["music", 54.56], ["musical instrument", 12.44], ["guitar", 9.51]], null, null, null, null, null, [["music", 85.91], ["musical instrument", 2.07], ["singing", 1.28]], [["music", 59.63], ["guitar", 6.73], ["musical instrument", 5.61]], null, null, null, [["music", 65.73], ["didgeridoo", 4.38], ["synthesizer", 2.99]], null, [["music", 69.17], ["musical instrument", 6.45], ["bass guitar", 3.13]], null, [["music", 56.05], ["musical instrument", 8.34], ["guitar", 6.03]]], "duration": [0.99, 0.51, 0.07, 1.95, 1.68, 8.44, 0.84, 3.4, 0.87, 0.93, 2.59, 0.88, 2.07, 0.09, 0.3, 0.33, 0.36, 0.4, 5.14, 2.63, 1.53, 1.11, 0.0, 4.82, 0.94, 2.13, 1.82, 2.3]} \ No newline at end of file diff --git a/annotations_1/BUqJMPAtmdY_filtered.json b/annotations_1/BUqJMPAtmdY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27c41e791eb08b69751463a16b9e80383e805533 --- /dev/null +++ b/annotations_1/BUqJMPAtmdY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 41.34], [42.0, 132.81], [135.0, 161.32], [163.0, 162.9]], "keep_status": [false, false, false, false], "silence_prob": [29.97, 0.0, 31.15, 0.0], "audiomae_on_audioset": [[["music", 60.61], ["speech", 8.43], ["trance music", 3.69]], null, [["music", 76.38], ["speech", 3.99], ["hum", 2.47]], null], "duration": [21.34, 90.81, 26.32, -0.1]} \ No newline at end of file diff --git a/annotations_1/BVrhwsgCuFU_filtered.json b/annotations_1/BVrhwsgCuFU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7a0f2c3287e2342ec3e7c8afb1783a00ff07ddb --- /dev/null +++ b/annotations_1/BVrhwsgCuFU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.1], [19.0, 20.58], [22.0, 24.22], [24.0, 27.45], [28.0, 35.55], [36.0, 40.26], [41.0, 47.9], [49.0, 49.74], [52.0, 57.28], [59.0, 61.77], [63.0, 65.3], [66.0, 67.36], [68.0, 77.7], [78.0, 78.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [73.21, 0.0, 98.66, 68.02, 84.62, 92.48, 99.05, 0.0, 97.73, 98.8, 98.27, 0.0, 31.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.69], ["theremin", 15.08], ["speech", 5.28]], null], "duration": [3.1, 1.58, 2.22, 3.45, 7.55, 4.26, 6.9, 0.74, 5.28, 2.77, 2.3, 1.36, 9.7, 0.73]} \ No newline at end of file diff --git a/annotations_1/BW1kpbOz5Eo_filtered.json b/annotations_1/BW1kpbOz5Eo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42c65ab81b8ceb00241c6710c8e7408638047a1e --- /dev/null +++ b/annotations_1/BW1kpbOz5Eo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 10.17], [14.0, 14.52], [24.0, 23.85], [24.0, 24.68], [33.0, 33.3], [39.0, 39.34]], "keep_status": [true, false, false, false, false, false], "silence_prob": [34.95, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["buzz", 32.15], ["noise", 11.27], ["music", 8.67]], null, null, null, null, null], "duration": [10.17, 0.52, -0.15, 0.68, 0.3, 0.34]} \ No newline at end of file diff --git a/annotations_1/BWR9aK0vAAY_filtered.json b/annotations_1/BWR9aK0vAAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb11dbb3be6bea217d0dadbeaf73410054eec9b0 --- /dev/null +++ b/annotations_1/BWR9aK0vAAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [5.0, 8.72], [10.0, 13.68], [14.0, 14.96], [17.0, 17.44], [19.0, 36.09], [38.0, 39.33], [41.0, 43.14], [45.0, 45.96], [47.0, 48.47], [51.0, 51.71], [53.0, 60.15], [61.0, 80.35], [81.0, 81.09], [82.0, 82.54], [85.0, 86.58], [89.0, 93.24], [94.0, 94.54], [99.0, 98.83], [102.0, 102.74], [106.0, 107.35], [110.0, 112.7], [116.0, 146.62]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 72.01, 62.27, 0.0, 0.0, 43.96, 0.0, 51.02, 0.0, 0.0, 0.0, 34.34, 44.15, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 34.26, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 50.27], ["speech", 7.95], ["ambient music", 7.93]], null, null, null, null, null, [["music", 39.68], ["hum", 24.97], ["mains hum", 15.6]], [["mains hum", 66.43], ["hum", 29.0], ["music", 1.5]], null, null, null, null, null, null, null, null, [["music", 76.5], ["hum", 3.03], ["electronic music", 2.3]], null], "duration": [1.42, 3.72, 3.68, 0.96, 0.44, 17.09, 1.33, 2.14, 0.96, 1.47, 0.71, 7.15, 19.35, 0.09, 0.54, 1.58, 4.24, 0.54, -0.17, 0.74, 1.35, 2.7, 30.62]} \ No newline at end of file diff --git a/annotations_1/BWT3i-fgw0s_filtered.json b/annotations_1/BWT3i-fgw0s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c4a10aa0046fbce0475e9bd1ea4edf09cd8fd97 --- /dev/null +++ b/annotations_1/BWT3i-fgw0s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.35], [30.0, 30.82], [34.0, 34.06], [43.0, 43.33], [55.0, 55.46], [63.0, 63.15], [69.0, 81.13], [87.0, 106.46], [112.0, 128.76], [133.0, 133.41], [141.0, 141.42], [142.0, 156.79], [158.0, 159.43], [164.0, 166.82]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.39, 30.77, 32.03, 0.0, 0.0, 30.1, 0.0, 31.88], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 68.15], ["throbbing", 9.33], ["hum", 7.68]], [["music", 89.04], ["electronic music", 1.25], ["throbbing", 0.78]], [["music", 25.59], ["speech", 21.06], ["throbbing", 10.46]], null, null, [["speech", 61.23], ["vehicle", 5.58], ["outside, rural or natural", 3.58]], null, [["speech", 49.57], ["eruption", 5.19], ["vehicle", 3.98]]], "duration": [0.35, 0.82, 0.06, 0.33, 0.46, 0.15, 12.13, 19.46, 16.76, 0.41, 0.42, 14.79, 1.43, 2.82]} \ No newline at end of file diff --git a/annotations_1/BX-hxkRsaT4_filtered.json b/annotations_1/BX-hxkRsaT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad24372a70a6b8fb6615fc1bc33783315c2d1525 --- /dev/null +++ b/annotations_1/BX-hxkRsaT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.03], [15.0, 16.23], [22.0, 25.61], [26.0, 27.58], [28.0, 35.85], [36.0, 37.37], [42.0, 42.08], [57.0, 61.94], [72.0, 75.88], [78.0, 81.95], [90.0, 90.48], [94.0, 109.78], [110.0, 111.38], [112.0, 112.92], [118.0, 120.41], [124.0, 124.63], [126.0, 126.23], [128.0, 129.88], [135.0, 135.19], [136.0, 139.51], [140.0, 139.55]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [48.82, 0.0, 41.36, 0.0, 50.81, 0.0, 0.0, 48.39, 45.14, 89.01, 0.0, 33.76, 0.0, 0.0, 37.19, 0.0, 0.0, 0.0, 0.0, 33.85, 0.0], "audiomae_on_audioset": [[["music", 39.71], ["speech", 9.45], ["musical instrument", 5.96]], null, [["music", 73.72], ["musical instrument", 3.56], ["marimba, xylophone", 2.44]], null, null, null, null, [["speech", 89.92], ["tap", 1.36], ["telephone", 0.66]], [["speech", 67.88], ["tap", 16.69], ["music", 4.56]], null, null, [["music", 59.34], ["harp", 8.13], ["keyboard (musical)", 6.65]], null, null, [["speech", 63.57], ["music", 5.66], ["inside, small room", 3.57]], null, null, null, null, [["speech", 23.03], ["horse", 17.27], ["music", 11.53]], null], "duration": [3.03, 1.23, 3.61, 1.58, 7.85, 1.37, 0.08, 4.94, 3.88, 3.95, 0.48, 15.78, 1.38, 0.92, 2.41, 0.63, 0.23, 1.88, 0.19, 3.51, -0.45]} \ No newline at end of file diff --git a/annotations_1/BXNuNJhLWyw_filtered.json b/annotations_1/BXNuNJhLWyw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab5713d6d4eb9f0c95c7e25b44d281c910fb47bc --- /dev/null +++ b/annotations_1/BXNuNJhLWyw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.9], [16.0, 22.89], [25.0, 25.25], [27.0, 27.31], [30.0, 31.6], [33.0, 38.52], [41.0, 41.88], [43.0, 52.83], [54.0, 57.06], [60.0, 59.75], [62.0, 65.33], [71.0, 72.05], [73.0, 75.73], [77.0, 81.68]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.16, 0.0, 0.0, 0.0, 46.68, 0.0, 55.6, 75.72, 0.0, 58.22, 0.0, 77.36, 71.29], "audiomae_on_audioset": [null, [["music", 58.91], ["effects unit", 9.97], ["guitar", 6.29]], null, null, null, [["music", 49.47], ["hum", 6.78], ["mains hum", 3.65]], null, null, null, null, null, null, null, null], "duration": [-0.1, 6.89, 0.25, 0.31, 1.6, 5.52, 0.88, 9.83, 3.06, -0.25, 3.33, 1.05, 2.73, 4.68]} \ No newline at end of file diff --git a/annotations_1/BXXY48jjLtw_filtered.json b/annotations_1/BXXY48jjLtw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c68ad4a5067a5cf4699f1cf0bb5cbd5c82a02332 --- /dev/null +++ b/annotations_1/BXXY48jjLtw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.31], [25.0, 28.75], [31.0, 60.13], [61.0, 93.09], [95.0, 97.87]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 28.9, 36.75, 0.0, 86.45], "audiomae_on_audioset": [null, [["music", 47.07], ["speech", 24.34], ["noise", 4.36]], [["hum", 31.37], ["music", 29.75], ["mains hum", 11.19]], null, null], "duration": [1.31, 3.75, 29.13, 32.09, 2.87]} \ No newline at end of file diff --git a/annotations_1/BXlYuaycRbU_filtered.json b/annotations_1/BXlYuaycRbU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db0b4407484aec2ad2656570b918dcf26c9504a9 --- /dev/null +++ b/annotations_1/BXlYuaycRbU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 16.98], [43.0, 44.12], [58.0, 60.44], [88.0, 87.79], [90.0, 90.39], [98.0, 98.79], [107.0, 107.89], [109.0, 110.1], [114.0, 115.65], [128.0, 133.39], [138.0, 139.53], [142.0, 144.44], [147.0, 149.35], [152.0, 154.25], [157.0, 159.16], [162.0, 165.37], [166.0, 167.59], [168.0, 169.01]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.72, 0.0, 33.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.3, 0.0, 32.63, 31.98, 32.55, 31.74, 31.22, 0.0, 0.0], "audiomae_on_audioset": [[["music", 61.11], ["boing", 4.85], ["musical instrument", 3.78]], null, [["music", 69.49], ["electronic music", 3.14], ["sampler", 2.04]], null, null, null, null, null, null, [["music", 65.34], ["boing", 10.43], ["throbbing", 3.93]], null, [["throbbing", 49.1], ["music", 19.51], ["hum", 18.24]], [["music", 38.58], ["throbbing", 32.69], ["hum", 10.6]], [["throbbing", 32.62], ["music", 32.39], ["hum", 14.49]], [["throbbing", 33.44], ["music", 24.98], ["hum", 13.49]], [["throbbing", 48.63], ["hum", 21.36], ["music", 15.54]], null, null], "duration": [11.98, 1.12, 2.44, -0.21, 0.39, 0.79, 0.89, 1.1, 1.65, 5.39, 1.53, 2.44, 2.35, 2.25, 2.16, 3.37, 1.59, 1.01]} \ No newline at end of file diff --git a/annotations_1/BYmHra1d_Nw_filtered.json b/annotations_1/BYmHra1d_Nw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..acf00b0bc7107c26af4534ac3df76065562ccf5f --- /dev/null +++ b/annotations_1/BYmHra1d_Nw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [3.0, 4.48], [6.0, 6.59], [7.0, 7.55], [8.0, 9.93], [12.0, 13.32], [14.0, 17.91], [22.0, 23.36], [25.0, 26.2], [29.0, 31.23], [35.0, 36.39], [37.0, 38.31], [45.0, 44.88], [48.0, 48.63], [50.0, 51.38], [52.0, 53.97], [55.0, 58.13], [59.0, 61.28], [62.0, 63.51], [64.0, 66.95], [68.0, 69.55], [70.0, 71.68], [73.0, 75.07], [76.0, 81.62], [85.0, 93.55], [95.0, 96.82], [98.0, 99.52], [100.0, 100.74], [101.0, 110.4], [112.0, 112.82], [115.0, 115.32], [116.0, 117.81], [124.0, 124.02], [125.0, 126.81], [136.0, 137.54], [139.0, 141.18], [143.0, 145.17], [147.0, 152.88], [153.0, 156.73], [158.0, 158.84], [160.0, 160.91], [162.0, 166.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.89, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.38, 99.48, 0.0, 99.85, 0.0, 0.0, 85.9, 98.66, 87.37, 0.0, 0.0, 0.0, 54.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.15, 99.98, 99.99, 98.93, 0.0, 0.0, 51.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 1.48, 0.59, 0.55, 1.93, 1.32, 3.91, 1.36, 1.2, 2.23, 1.39, 1.31, -0.12, 0.63, 1.38, 1.97, 3.13, 2.28, 1.51, 2.95, 1.55, 1.68, 2.07, 5.62, 8.55, 1.82, 1.52, 0.74, 9.4, 0.82, 0.32, 1.81, 0.02, 1.81, 1.54, 2.18, 2.17, 5.88, 3.73, 0.84, 0.91, 4.43]} \ No newline at end of file diff --git a/annotations_1/BYrS2k5nPbw_filtered.json b/annotations_1/BYrS2k5nPbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d968290ac9155ac33cf2f1b8229def2c8301169 --- /dev/null +++ b/annotations_1/BYrS2k5nPbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.52], [12.0, 18.28], [20.0, 20.38], [21.0, 25.83], [27.0, 28.56], [34.0, 34.23], [35.0, 36.29], [37.0, 38.74], [39.0, 78.51], [81.0, 84.38], [85.0, 97.33], [100.0, 100.11], [102.0, 115.67], [117.0, 125.64], [127.0, 132.29], [134.0, 135.7], [136.0, 154.53], [157.0, 157.32], [158.0, 158.5], [159.0, 160.12], [161.0, 162.18], [163.0, 164.66], [170.0, 176.17], [180.0, 181.99], [185.0, 186.88], [188.0, 188.15], [192.0, 203.59]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.95, 0.0, 36.43, 0.0, 0.0, 0.0, 0.0, 0.0, 33.15, 29.39, 0.0, 29.37, 29.47, 28.73, 0.0, 29.03, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 31.93], "audiomae_on_audioset": [null, [["throbbing", 47.5], ["music", 31.65], ["hum", 6.28]], null, [["throbbing", 61.52], ["hum", 14.18], ["music", 12.85]], null, null, null, null, null, [["music", 23.23], ["didgeridoo", 9.29], ["mechanisms", 8.86]], [["music", 54.95], ["smash, crash", 6.27], ["cacophony", 5.75]], null, [["music", 55.42], ["hum", 11.05], ["throbbing", 5.24]], [["music", 36.4], ["speech", 24.17], ["thump, thud", 5.46]], [["music", 28.47], ["noise", 11.58], ["throbbing", 7.2]], null, [["music", 28.81], ["fly, housefly", 14.12], ["mosquito", 8.35]], null, null, null, null, null, [["music", 61.63], ["didgeridoo", 8.0], ["buzz", 6.09]], null, null, null, [["music", 83.24], ["crack", 4.0], ["synthesizer", 1.92]]], "duration": [0.52, 6.28, 0.38, 4.83, 1.56, 0.23, 1.29, 1.74, 39.51, 3.38, 12.33, 0.11, 13.67, 8.64, 5.29, 1.7, 18.53, 0.32, 0.5, 1.12, 1.18, 1.66, 6.17, 1.99, 1.88, 0.15, 11.59]} \ No newline at end of file diff --git a/annotations_1/B_JVGEptSOw_filtered.json b/annotations_1/B_JVGEptSOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59145861a06da813232e75459c43d0886c119f80 --- /dev/null +++ b/annotations_1/B_JVGEptSOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.05], [18.0, 19.16], [19.0, 25.35], [32.0, 32.36], [34.0, 34.94], [37.0, 39.83], [42.0, 50.99], [54.0, 66.65], [69.0, 72.74], [75.0, 75.49], [80.0, 80.69], [81.0, 82.07], [83.0, 85.23], [87.0, 87.51], [88.0, 88.33], [90.0, 93.77], [95.0, 95.88], [98.0, 101.88], [107.0, 108.46], [111.0, 115.01], [120.0, 121.39], [122.0, 122.18], [124.0, 126.64], [128.0, 132.98], [136.0, 145.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [46.26, 0.0, 51.99, 0.0, 0.0, 48.61, 46.9, 51.71, 54.9, 0.0, 0.0, 0.0, 58.22, 0.0, 0.0, 71.72, 0.0, 46.68, 0.0, 44.26, 0.0, 0.0, 46.19, 39.3, 47.43], "audiomae_on_audioset": [[["sidetone", 57.78], ["music", 22.96], ["speech", 3.21]], null, null, null, null, [["speech", 42.09], ["music", 22.68], ["guitar", 7.87]], [["music", 39.63], ["speech", 26.96], ["hum", 4.65]], null, null, null, null, null, null, null, null, null, null, [["music", 40.66], ["speech", 28.25], ["guitar", 3.07]], null, [["music", 51.96], ["gong", 9.9], ["harmonic", 5.04]], null, null, [["music", 63.91], ["musical instrument", 8.1], ["gong", 5.77]], [["music", 26.89], ["mains hum", 12.88], ["hum", 12.84]], [["music", 74.57], ["synthesizer", 3.66], ["musical instrument", 3.01]]], "duration": [2.05, 1.16, 6.35, 0.36, 0.94, 2.83, 8.99, 12.65, 3.74, 0.49, 0.69, 1.07, 2.23, 0.51, 0.33, 3.77, 0.88, 3.88, 1.46, 4.01, 1.39, 0.18, 2.64, 4.98, 9.91]} \ No newline at end of file diff --git a/annotations_1/BbHxQ77anjQ_filtered.json b/annotations_1/BbHxQ77anjQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38d669669e34cb95d435319152104d471614ec89 --- /dev/null +++ b/annotations_1/BbHxQ77anjQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[101.0, 106.56], [110.0, 110.12], [111.0, 111.15]], "keep_status": [true, false, false], "silence_prob": [31.16, 0.0, 0.0], "audiomae_on_audioset": [[["music", 28.02], ["cattle, bovinae", 22.26], ["moo", 14.22]], null, null], "duration": [5.56, 0.12, 0.15]} \ No newline at end of file diff --git a/annotations_1/BbbXgjwlOpI_filtered.json b/annotations_1/BbbXgjwlOpI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..855a26a15617c14723f105f47c62d5d2d37a1ef4 --- /dev/null +++ b/annotations_1/BbbXgjwlOpI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 33.74], [37.0, 56.78], [59.0, 81.18], [81.0, 90.78], [91.0, 91.77], [93.0, 94.02], [95.0, 100.41], [101.0, 106.29], [108.0, 119.3], [120.0, 124.07], [126.0, 152.81], [154.0, 156.41]], "keep_status": [false, false, false, true, false, false, false, true, false, true, false, false], "silence_prob": [31.29, 33.06, 30.61, 31.53, 0.0, 0.0, 40.41, 33.06, 32.0, 41.95, 30.9, 44.99], "audiomae_on_audioset": [[["music", 66.09], ["hum", 9.31], ["throbbing", 7.74]], [["music", 71.78], ["throbbing", 8.66], ["hum", 3.86]], [["music", 75.95], ["hum", 2.16], ["breaking", 2.11]], [["whale vocalization", 48.19], ["speech", 11.14], ["boat, water vehicle", 9.5]], null, null, [["fly, housefly", 54.8], ["insect", 23.81], ["mosquito", 18.8]], [["fly, housefly", 27.49], ["speech", 9.66], ["insect", 9.42]], [["music", 72.56], ["mains hum", 2.71], ["gong", 2.53]], [["music", 55.7], ["ambient music", 5.47], ["musical instrument", 4.49]], [["music", 46.08], ["hum", 19.96], ["mains hum", 11.47]], [["hum", 37.12], ["mains hum", 22.53], ["music", 15.42]]], "duration": [10.74, 19.78, 22.18, 9.78, 0.77, 1.02, 5.41, 5.29, 11.3, 4.07, 26.81, 2.41]} \ No newline at end of file diff --git a/annotations_1/BbyMGiPjDOw_filtered.json b/annotations_1/BbyMGiPjDOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..720ccea961bc38845ed089361241e44fb560fe9d --- /dev/null +++ b/annotations_1/BbyMGiPjDOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.61], [10.0, 10.89], [21.0, 22.59], [33.0, 33.94], [39.0, 39.68], [51.0, 53.11], [55.0, 56.1], [57.0, 58.89], [62.0, 63.0], [65.0, 65.21], [67.0, 67.96], [82.0, 81.99], [84.0, 84.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 27.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 74.85], ["music", 2.33], ["mechanisms", 2.13]], null, null, null, null, null, null, null], "duration": [0.61, 0.89, 1.59, 0.94, 0.68, 2.11, 1.1, 1.89, 1.0, 0.21, 0.96, -0.01, 0.4]} \ No newline at end of file diff --git a/annotations_1/Bc3PB049HQc_filtered.json b/annotations_1/Bc3PB049HQc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61d86f7da2381ba249cc36dcf5e5505cccb252c2 --- /dev/null +++ b/annotations_1/Bc3PB049HQc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 20.43], [22.0, 53.65], [54.0, 54.5], [58.0, 62.61], [63.0, 62.95], [63.0, 63.32], [64.0, 65.52], [68.0, 69.16], [72.0, 91.5]], "keep_status": [true, false, false, false, false, false, false, false, true], "silence_prob": [45.78, 0.0, 0.0, 30.26, 0.0, 0.0, 0.0, 0.0, 33.95], "audiomae_on_audioset": [[["speech", 33.34], ["hum", 10.73], ["animal", 10.03]], null, null, [["music", 62.49], ["didgeridoo", 5.32], ["throbbing", 4.25]], null, null, null, null, [["explosion", 12.49], ["speech", 10.0], ["burst, pop", 8.62]]], "duration": [10.43, 31.65, 0.5, 4.61, -0.05, 0.32, 1.52, 1.16, 19.5]} \ No newline at end of file diff --git a/annotations_1/BdZN3EJVjo8_filtered.json b/annotations_1/BdZN3EJVjo8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8dccb616b1994f24658bd2cc170b35e8fa489e1 --- /dev/null +++ b/annotations_1/BdZN3EJVjo8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 43.97], [47.0, 50.48], [53.0, 55.68]], "keep_status": [false, false, false], "silence_prob": [99.99, 96.17, 100.0], "audiomae_on_audioset": [null, null, null], "duration": [5.97, 3.48, 2.68]} \ No newline at end of file diff --git a/annotations_1/BdZgC84uYUo_filtered.json b/annotations_1/BdZgC84uYUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bc597a9443c95a9ae21ff6f82d6e36458e14d5b --- /dev/null +++ b/annotations_1/BdZgC84uYUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.93], [13.0, 18.0], [19.0, 23.62], [26.0, 27.94], [29.0, 29.74], [31.0, 31.16], [36.0, 38.85], [40.0, 49.01], [50.0, 52.17], [58.0, 58.24], [58.0, 58.78], [59.0, 60.54], [61.0, 64.66], [67.0, 86.68], [89.0, 89.28], [90.0, 109.17], [110.0, 111.65], [114.0, 130.06], [133.0, 134.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 41.09, 96.89, 0.0, 0.0, 0.0, 55.18, 43.43, 34.67, 0.0, 0.0, 0.0, 32.77, 28.89, 0.0, 29.35, 0.0, 28.83, 0.0], "audiomae_on_audioset": [null, [["sidetone", 43.88], ["speech", 27.08], ["hum", 5.02]], null, null, null, null, null, [["music", 33.26], ["hum", 28.74], ["throbbing", 21.37]], [["music", 62.28], ["throbbing", 8.4], ["synthesizer", 4.29]], null, null, null, [["music", 72.54], ["electronic music", 4.6], ["throbbing", 4.11]], [["music", 53.33], ["hum", 5.86], ["electronic music", 4.94]], null, [["hum", 47.33], ["throbbing", 38.58], ["mains hum", 10.49]], null, [["throbbing", 45.43], ["music", 24.67], ["hum", 17.03]], null], "duration": [0.93, 5.0, 4.62, 1.94, 0.74, 0.16, 2.85, 9.01, 2.17, 0.24, 0.78, 1.54, 3.66, 19.68, 0.28, 19.17, 1.65, 16.06, 1.76]} \ No newline at end of file diff --git a/annotations_1/BefYI15la84_filtered.json b/annotations_1/BefYI15la84_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..beed3fa7bcd7b114227e6a968e1055c30a341eae --- /dev/null +++ b/annotations_1/BefYI15la84_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.33], [12.0, 13.51], [18.0, 18.45], [19.0, 22.57], [24.0, 63.26], [65.0, 107.57], [109.0, 131.7], [133.0, 135.18]], "keep_status": [false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 34.72, 0.0, 0.0, 34.33, 56.4], "audiomae_on_audioset": [null, null, null, [["speech", 23.75], ["hum", 20.14], ["mains hum", 17.56]], null, null, [["speech", 53.7], ["basketball bounce", 9.45], ["mains hum", 5.97]], null], "duration": [1.33, 1.51, 0.45, 3.57, 39.26, 42.57, 22.7, 2.18]} \ No newline at end of file diff --git a/annotations_1/Bf6FD5UbSns_filtered.json b/annotations_1/Bf6FD5UbSns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec64538dfbc933b6f90b413a387ba0240454eaa7 --- /dev/null +++ b/annotations_1/Bf6FD5UbSns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 28.22], [29.0, 30.45], [32.0, 32.44], [33.0, 33.47], [34.0, 36.19], [40.0, 41.17], [42.0, 42.89], [44.0, 50.55], [52.0, 53.06], [54.0, 54.57], [56.0, 57.97], [61.0, 65.25], [72.0, 79.03], [81.0, 83.34], [84.0, 85.21], [86.0, 86.54], [88.0, 116.68], [117.0, 139.75]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [28.82, 0.0, 0.0, 0.0, 31.6, 0.0, 0.0, 28.5, 0.0, 0.0, 0.0, 28.81, 28.27, 30.29, 0.0, 0.0, 28.6, 28.71], "audiomae_on_audioset": [[["music", 63.36], ["throbbing", 13.09], ["hum", 6.67]], null, null, null, [["hum", 26.41], ["music", 18.06], ["mains hum", 15.68]], null, null, [["music", 39.73], ["hum", 22.24], ["throbbing", 17.54]], null, null, null, [["music", 42.98], ["throbbing", 25.42], ["hum", 17.26]], [["music", 68.37], ["mains hum", 7.62], ["hum", 7.4]], [["music", 43.61], ["speech", 14.49], ["rumble", 5.85]], null, null, [["music", 63.66], ["speech", 7.74], ["electronic music", 5.53]], [["music", 18.84], ["ambulance (siren)", 18.69], ["speech", 13.64]]], "duration": [16.22, 1.45, 0.44, 0.47, 2.19, 1.17, 0.89, 6.55, 1.06, 0.57, 1.97, 4.25, 7.03, 2.34, 1.21, 0.54, 28.68, 22.75]} \ No newline at end of file diff --git a/annotations_1/Bf6I7N-DC7g_filtered.json b/annotations_1/Bf6I7N-DC7g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e787d101d385e2df41a12aeb43993977305f10e --- /dev/null +++ b/annotations_1/Bf6I7N-DC7g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.86], [10.0, 10.37], [18.0, 18.49], [19.0, 20.65], [22.0, 25.51], [27.0, 30.05], [31.0, 33.88], [46.0, 47.31], [50.0, 50.03], [66.0, 66.77], [75.0, 75.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 95.23, 89.54, 80.64, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.14, 0.37, 0.49, 1.65, 3.51, 3.05, 2.88, 1.31, 0.03, 0.77, 0.2]} \ No newline at end of file diff --git a/annotations_1/BfF5J0uSC3E_filtered.json b/annotations_1/BfF5J0uSC3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4625a205cecba6b410a1a1f2c2aebd32a79e52aa --- /dev/null +++ b/annotations_1/BfF5J0uSC3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.0], [20.0, 30.79], [38.0, 44.2], [44.0, 57.67], [61.0, 154.57], [165.0, 165.42], [167.0, 198.91], [203.0, 203.07]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 32.79, 31.72, 34.01, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.33], ["whale vocalization", 6.74], ["electric shaver, electric razor", 4.36]], [["music", 49.56], ["hum", 15.58], ["throbbing", 11.48]], [["music", 40.17], ["throbbing", 27.5], ["hum", 15.8]], null, null, null, null], "duration": [0.0, 10.79, 6.2, 13.67, 93.57, 0.42, 31.91, 0.07]} \ No newline at end of file diff --git a/annotations_1/BfRUV4g8sYw_filtered.json b/annotations_1/BfRUV4g8sYw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..210474e9ff59647ab512f3c0a836b8fd70a3993e --- /dev/null +++ b/annotations_1/BfRUV4g8sYw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.95], [2.0, 5.86], [7.0, 8.4], [10.0, 10.23], [11.0, 12.36], [13.0, 15.94], [16.0, 20.36], [27.0, 27.5], [28.0, 28.93], [30.0, 67.93], [69.0, 69.87], [81.0, 83.93], [87.0, 94.68], [96.0, 96.9], [100.0, 104.4], [107.0, 138.91], [140.0, 140.37], [141.0, 143.53]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [0.0, 50.61, 0.0, 0.0, 0.0, 34.21, 53.53, 0.0, 0.0, 0.0, 0.0, 29.81, 32.2, 0.0, 29.8, 0.0, 0.0, 35.61], "audiomae_on_audioset": [null, null, null, null, null, [["music", 43.33], ["sonar", 11.73], ["gong", 7.29]], null, null, null, null, null, [["speech", 28.98], ["electric shaver, electric razor", 10.74], ["buzz", 10.21]], [["music", 36.98], ["speech", 27.16], ["tabla", 12.61]], null, [["music", 26.75], ["fart", 11.9], ["speech", 8.62]], null, null, [["music", 38.95], ["throbbing", 11.63], ["hum", 7.43]]], "duration": [0.95, 3.86, 1.4, 0.23, 1.36, 2.94, 4.36, 0.5, 0.93, 37.93, 0.87, 2.93, 7.68, 0.9, 4.4, 31.91, 0.37, 2.53]} \ No newline at end of file diff --git a/annotations_1/Bfj5GHwgXno_filtered.json b/annotations_1/Bfj5GHwgXno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aca279ad0fcfaf37bc1b8d855f3f47b95e4bd34a --- /dev/null +++ b/annotations_1/Bfj5GHwgXno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.85], [20.0, 20.66], [23.0, 31.68], [32.0, 41.54], [48.0, 50.21], [51.0, 52.32], [54.0, 55.46], [57.0, 58.26], [59.0, 59.1], [59.0, 71.17], [73.0, 75.41], [86.0, 87.02], [89.0, 96.38], [97.0, 97.95], [101.0, 100.9], [106.0, 106.35], [111.0, 111.74], [113.0, 113.1], [118.0, 117.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [80.29, 0.0, 66.03, 80.46, 65.2, 0.0, 0.0, 0.0, 0.0, 58.38, 97.92, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.85, 0.66, 8.68, 9.54, 2.21, 1.32, 1.46, 1.26, 0.1, 12.17, 2.41, 1.02, 7.38, 0.95, -0.1, 0.35, 0.74, 0.1, -0.05]} \ No newline at end of file diff --git a/annotations_1/BgCgiRitEmM_filtered.json b/annotations_1/BgCgiRitEmM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a2449049e563b06113e6fa79d91035b226d10fa --- /dev/null +++ b/annotations_1/BgCgiRitEmM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[116.0, 117.8], [119.0, 144.46]], "keep_status": [false, true], "silence_prob": [0.0, 31.4], "audiomae_on_audioset": [null, [["music", 46.26], ["hum", 10.29], ["didgeridoo", 5.41]]], "duration": [1.8, 25.46]} \ No newline at end of file diff --git a/annotations_1/BgxPmLpvxzc_filtered.json b/annotations_1/BgxPmLpvxzc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/BgxPmLpvxzc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/BhHv3Yxcuro_filtered.json b/annotations_1/BhHv3Yxcuro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4fdfa14d571dd61efab436afbd17015e9a3b89e --- /dev/null +++ b/annotations_1/BhHv3Yxcuro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.87], [5.0, 9.1], [9.0, 12.7], [14.0, 19.16], [20.0, 28.76], [30.0, 30.67], [32.0, 34.21], [35.0, 38.65], [40.0, 40.2], [41.0, 54.35], [56.0, 61.99], [65.0, 64.93], [69.0, 69.72], [70.0, 72.6], [73.0, 78.46], [79.0, 87.25], [90.0, 108.95], [109.0, 116.48], [118.0, 135.65], [136.0, 141.02], [144.0, 143.87], [145.0, 146.42], [148.0, 150.18], [151.0, 151.98], [154.0, 155.78], [157.0, 157.86], [163.0, 163.78], [166.0, 166.82], [170.0, 171.91]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, true, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.92, 34.34, 90.95, 35.62, 0.0, 33.33, 33.48, 0.0, 31.91, 51.07, 0.0, 0.0, 36.97, 37.04, 36.94, 38.31, 42.42, 35.12, 38.5, 0.0, 0.0, 81.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["animal", 53.63], ["dog", 11.5], ["bow-wow", 10.8]], null, [["animal", 36.84], ["music", 21.46], ["dog", 12.14]], null, [["animal", 28.7], ["dog", 21.21], ["domestic animals, pets", 15.78]], [["music", 39.38], ["didgeridoo", 24.14], ["speech", 10.67]], null, [["music", 67.97], ["theremin", 5.82], ["didgeridoo", 4.61]], null, null, null, [["speech", 43.09], ["animal", 5.23], ["hum", 4.93]], [["music", 15.18], ["speech", 11.82], ["animal", 11.03]], [["music", 32.41], ["speech", 26.9], ["theremin", 13.38]], [["music", 47.53], ["singing bowl", 9.56], ["animal", 7.83]], [["music", 39.89], ["theremin", 5.88], ["animal", 4.05]], [["music", 62.24], ["quack", 13.3], ["theremin", 4.29]], [["music", 37.42], ["speech", 8.78], ["foghorn", 5.84]], null, null, null, null, null, null, null, null, null], "duration": [-0.13, 4.1, 3.7, 5.16, 8.76, 0.67, 2.21, 3.65, 0.2, 13.35, 5.99, -0.07, 0.72, 2.6, 5.46, 8.25, 18.95, 7.48, 17.65, 5.02, -0.13, 1.42, 2.18, 0.98, 1.78, 0.86, 0.78, 0.82, 1.91]} \ No newline at end of file diff --git a/annotations_1/Bi8Spey13uY_filtered.json b/annotations_1/Bi8Spey13uY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..175b8d7a6127bb217dfcdfbd8590bd8095ece96b --- /dev/null +++ b/annotations_1/Bi8Spey13uY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.74], [18.0, 18.42], [19.0, 19.67], [20.0, 20.88], [21.0, 22.4], [23.0, 23.95], [25.0, 41.42], [42.0, 44.09], [47.0, 57.5], [61.0, 94.46], [96.0, 97.75], [100.0, 100.26], [102.0, 102.63], [105.0, 105.93], [108.0, 109.88], [112.0, 114.74], [115.0, 116.75], [118.0, 118.59], [119.0, 119.58], [120.0, 121.95], [123.0, 124.88], [125.0, 127.11], [128.0, 128.61], [133.0, 133.59], [135.0, 136.8], [139.0, 139.06], [140.0, 144.34], [145.0, 147.11], [149.0, 149.4], [151.0, 151.78], [153.0, 152.9], [153.0, 153.86], [155.0, 155.17], [156.0, 156.9], [159.0, 159.36], [160.0, 160.56], [162.0, 162.58], [164.0, 164.42], [165.0, 165.6], [166.0, 167.02], [169.0, 168.91], [169.0, 170.01], [172.0, 199.29]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.82, 53.91, 46.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.56, 0.0, 0.0, 0.0, 0.0, 0.0, 41.42, 0.0, 0.0, 0.0, 0.0, 42.88, 32.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.12], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 34.89], ["mains hum", 28.16], ["music", 5.06]], null, [["speech", 71.8], ["radio", 4.11], ["sidetone", 3.66]], null, null, null, null, null, null, [["whale vocalization", 25.03], ["speech", 10.71], ["animal", 10.53]], null, null, null, null, null, [["roaring cats (lions, tigers)", 18.01], ["livestock, farm animals, working animals", 9.07], ["animal", 9.0]], null, null, null, null, [["stomach rumble", 16.33], ["whack, thwack", 6.65], ["groan", 4.07]], [["speech", 26.24], ["music", 7.97], ["radio", 6.62]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 17.59], ["mechanisms", 8.81], ["music", 8.43]]], "duration": [0.74, 0.42, 0.67, 0.88, 1.4, 0.95, 16.42, 2.09, 10.5, 33.46, 1.75, 0.26, 0.63, 0.93, 1.88, 2.74, 1.75, 0.59, 0.58, 1.95, 1.88, 2.11, 0.61, 0.59, 1.8, 0.06, 4.34, 2.11, 0.4, 0.78, -0.1, 0.86, 0.17, 0.9, 0.36, 0.56, 0.58, 0.42, 0.6, 1.02, -0.09, 1.01, 27.29]} \ No newline at end of file diff --git a/annotations_1/BiPY5_H9EIw_filtered.json b/annotations_1/BiPY5_H9EIw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef7f421a8f5eaab720409d6ddf5f2b0f934f767c --- /dev/null +++ b/annotations_1/BiPY5_H9EIw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [4.0, 20.46], [27.0, 27.94], [30.0, 32.36], [33.0, 37.66], [38.0, 37.69], [39.0, 40.0], [40.0, 40.19], [42.0, 60.51], [62.0, 80.03], [86.0, 88.94], [93.0, 100.68], [103.0, 128.93], [129.0, 129.47], [136.0, 140.37]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, true, true, false, true], "silence_prob": [0.0, 35.33, 0.0, 30.1, 35.68, 0.0, 0.0, 0.0, 32.83, 29.56, 29.88, 29.9, 35.2, 0.0, 42.81], "audiomae_on_audioset": [null, [["speech", 58.58], ["music", 26.06], ["bleat", 0.99]], null, [["speech", 68.24], ["music", 19.98], ["radio", 4.64]], [["music", 27.64], ["fly, housefly", 9.37], ["insect", 5.78]], null, null, null, [["music", 79.16], ["a capella", 4.42], ["vocal music", 2.35]], [["music", 50.93], ["echo", 6.21], ["sound effect", 3.68]], [["music", 61.68], ["didgeridoo", 9.15], ["singing", 3.87]], [["music", 28.07], ["cattle, bovinae", 16.63], ["livestock, farm animals, working animals", 13.26]], [["music", 48.93], ["outside, rural or natural", 2.82], ["explosion", 2.53]], null, [["speech", 47.07], ["music", 17.75], ["didgeridoo", 4.59]]], "duration": [0.38, 16.46, 0.94, 2.36, 4.66, -0.31, 1.0, 0.19, 18.51, 18.03, 2.94, 7.68, 25.93, 0.47, 4.37]} \ No newline at end of file diff --git a/annotations_1/BiuCpXg_jgU_filtered.json b/annotations_1/BiuCpXg_jgU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5894e38582fb35bed3d96c9e485c98c4ede4d05 --- /dev/null +++ b/annotations_1/BiuCpXg_jgU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 51.71], [53.0, 61.43], [64.0, 74.14], [77.0, 78.21], [81.0, 87.42], [91.0, 94.63], [104.0, 105.51], [108.0, 113.32], [118.0, 122.55], [124.0, 145.89], [146.0, 147.21], [148.0, 150.38], [151.0, 152.2], [153.0, 153.59], [154.0, 155.38]], "keep_status": [true, false, true, false, true, true, false, true, true, false, false, true, false, false, false], "silence_prob": [28.71, 27.96, 28.03, 0.0, 27.82, 27.95, 0.0, 27.82, 27.83, 28.51, 0.0, 40.31, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 35.2], ["civil defense siren", 4.79], ["electric shaver, electric razor", 4.6]], [["music", 77.39], ["buzz", 3.92], ["theremin", 2.86]], [["music", 39.76], ["electronic music", 6.88], ["sound effect", 6.69]], null, [["speech", 27.17], ["mains hum", 19.5], ["music", 16.62]], [["explosion", 24.93], ["rumble", 17.1], ["burst, pop", 8.81]], null, [["vehicle", 26.19], ["mains hum", 6.57], ["accelerating, revving, vroom", 5.51]], [["explosion", 20.86], ["breaking", 16.81], ["burst, pop", 8.86]], [["hum", 56.02], ["mains hum", 32.99], ["throbbing", 4.31]], null, [["music", 47.28], ["buzz", 5.53], ["hum", 2.98]], null, null, null], "duration": [2.71, 8.43, 10.14, 1.21, 6.42, 3.63, 1.51, 5.32, 4.55, 21.89, 1.21, 2.38, 1.2, 0.59, 1.38]} \ No newline at end of file diff --git a/annotations_1/BjPUO_4HJeo_filtered.json b/annotations_1/BjPUO_4HJeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce4a4de2c9b14b22256391d67330c9e8ec595556 --- /dev/null +++ b/annotations_1/BjPUO_4HJeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.26], [12.0, 13.02], [14.0, 14.86], [16.0, 17.1], [18.0, 19.26], [23.0, 23.23], [29.0, 29.03], [29.0, 30.32], [33.0, 33.22], [39.0, 39.43], [43.0, 43.33], [50.0, 51.07], [56.0, 55.85], [64.0, 64.99], [68.0, 68.4], [69.0, 70.28], [84.0, 84.77], [88.0, 88.75], [91.0, 92.15], [95.0, 96.23], [101.0, 101.29], [104.0, 110.39], [111.0, 112.62], [115.0, 115.37], [134.0, 135.55], [139.0, 139.24], [143.0, 142.86], [148.0, 148.2], [157.0, 158.55], [159.0, 159.7], [161.0, 161.42], [163.0, 162.85], [167.0, 167.31], [172.0, 174.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.3], ["speech", 20.16], ["hum", 8.24]]], "duration": [1.26, 1.02, 0.86, 1.1, 1.26, 0.23, 0.03, 1.32, 0.22, 0.43, 0.33, 1.07, -0.15, 0.99, 0.4, 1.28, 0.77, 0.75, 1.15, 1.23, 0.29, 6.39, 1.62, 0.37, 1.55, 0.24, -0.14, 0.2, 1.55, 0.7, 0.42, -0.15, 0.31, 2.23]} \ No newline at end of file diff --git a/annotations_1/BjsuTimPBAM_filtered.json b/annotations_1/BjsuTimPBAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88b63655e66344f0a26fcdd29d5ab4ed371d1917 --- /dev/null +++ b/annotations_1/BjsuTimPBAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.24], [4.0, 4.36], [13.0, 13.32], [14.0, 15.58], [20.0, 20.63], [50.0, 50.57], [55.0, 56.17], [66.0, 67.17], [69.0, 70.97], [72.0, 81.04], [82.0, 97.06], [98.0, 99.06], [100.0, 103.6], [105.0, 105.22], [106.0, 107.01], [108.0, 111.23], [114.0, 117.83], [118.0, 119.96], [121.0, 123.65], [124.0, 126.81], [128.0, 130.18], [133.0, 133.56], [134.0, 137.35], [138.0, 141.07], [149.0, 151.29], [152.0, 152.27], [156.0, 156.59], [159.0, 161.35], [163.0, 164.0], [165.0, 167.44], [169.0, 169.38], [171.0, 171.76], [174.0, 174.99], [189.0, 189.62], [198.0, 198.51], [202.0, 202.53], [203.0, 203.47], [204.0, 204.43], [215.0, 215.92], [217.0, 217.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 99.36, 0.0, 0.0, 99.97, 99.96, 0.0, 98.99, 97.83, 96.66, 0.0, 99.97, 99.94, 98.8, 0.0, 0.0, 99.93, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.36, 0.32, 1.58, 0.63, 0.57, 1.17, 1.17, 1.97, 9.04, 15.06, 1.06, 3.6, 0.22, 1.01, 3.23, 3.83, 1.96, 2.65, 2.81, 2.18, 0.56, 3.35, 3.07, 2.29, 0.27, 0.59, 2.35, 1.0, 2.44, 0.38, 0.76, 0.99, 0.62, 0.51, 0.53, 0.47, 0.43, 0.92, 0.71]} \ No newline at end of file diff --git a/annotations_1/BkNCfTfR6fQ_filtered.json b/annotations_1/BkNCfTfR6fQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af28bf76dc35a29e748adf3bca0b4f96f0f72b3b --- /dev/null +++ b/annotations_1/BkNCfTfR6fQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.23], [11.0, 14.79], [16.0, 16.77], [18.0, 23.94], [32.0, 33.07], [33.0, 36.56], [38.0, 47.85], [52.0, 53.16], [59.0, 60.88], [64.0, 64.08], [66.0, 93.33], [95.0, 103.99], [112.0, 117.24], [123.0, 127.47], [129.0, 129.36]], "keep_status": [true, true, false, true, false, true, true, false, false, false, true, true, true, true, false], "silence_prob": [42.98, 41.95, 0.0, 41.6, 0.0, 41.87, 39.24, 0.0, 0.0, 0.0, 33.26, 30.36, 45.46, 45.36, 0.0], "audiomae_on_audioset": [[["music", 34.69], ["mosquito", 9.37], ["fly, housefly", 7.28]], [["music", 14.0], ["fly, housefly", 8.19], ["frog", 5.76]], null, [["music", 31.53], ["hum", 8.46], ["mains hum", 5.84]], null, [["speech", 14.88], ["frog", 14.04], ["fly, housefly", 10.25]], [["music", 28.28], ["speech", 22.61], ["buzz", 9.43]], null, null, null, [["music", 22.58], ["fly, housefly", 11.42], ["hum", 11.3]], [["music", 50.01], ["sidetone", 10.02], ["speech", 8.54]], [["music", 29.86], ["hum", 21.32], ["throbbing", 11.41]], [["fly, housefly", 39.99], ["music", 9.92], ["insect", 9.34]], null], "duration": [6.23, 3.79, 0.77, 5.94, 1.07, 3.56, 9.85, 1.16, 1.88, 0.08, 27.33, 8.99, 5.24, 4.47, 0.36]} \ No newline at end of file diff --git a/annotations_1/BkZ6lFCzAwM_filtered.json b/annotations_1/BkZ6lFCzAwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d66617004b2837419aba9735136794f196d2cbdb --- /dev/null +++ b/annotations_1/BkZ6lFCzAwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.03], [26.0, 26.45], [58.0, 96.62]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [1.03, 0.45, 38.62]} \ No newline at end of file diff --git a/annotations_1/BnnkcdH5v14_filtered.json b/annotations_1/BnnkcdH5v14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d484b718d37c89e9e1e4b1146471accf886fbd0 --- /dev/null +++ b/annotations_1/BnnkcdH5v14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.33], [12.0, 11.72], [17.0, 17.56], [41.0, 41.05], [42.0, 42.23], [47.0, 48.15], [49.0, 49.25], [55.0, 55.49], [66.0, 71.1], [76.0, 76.1], [80.0, 80.72], [111.0, 114.07], [115.0, 115.62], [117.0, 117.66], [120.0, 120.46], [122.0, 123.11], [126.0, 126.77], [127.0, 127.82], [129.0, 129.24], [138.0, 138.57], [139.0, 140.54], [142.0, 142.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.48, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 35.0], ["music", 19.98], ["trombone", 16.5]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, -0.28, 0.56, 0.05, 0.23, 1.15, 0.25, 0.49, 5.1, 0.1, 0.72, 3.07, 0.62, 0.66, 0.46, 1.11, 0.77, 0.82, 0.24, 0.57, 1.54, 0.82]} \ No newline at end of file diff --git a/annotations_1/Bo-2-sJi7Uk_filtered.json b/annotations_1/Bo-2-sJi7Uk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d76f4ec21a4bb72ff194da7ffff50f5c02d882e2 --- /dev/null +++ b/annotations_1/Bo-2-sJi7Uk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.39], [5.0, 5.97], [8.0, 7.72], [9.0, 14.32], [20.0, 22.22], [22.0, 24.17], [27.0, 35.48], [36.0, 38.11], [40.0, 40.26], [46.0, 46.48], [47.0, 48.24], [50.0, 50.4], [51.0, 52.1], [54.0, 55.58], [71.0, 71.71], [76.0, 77.09], [82.0, 81.85], [85.0, 86.53], [88.0, 93.16], [98.0, 101.11], [103.0, 104.5], [107.0, 107.27], [110.0, 111.38], [113.0, 114.71], [116.0, 118.74], [119.0, 121.41], [123.0, 125.93], [127.0, 136.59], [138.0, 139.14], [140.0, 144.15], [145.0, 147.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.83, 100.0, 79.76, 99.88, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 99.96, 0.0, 0.0, 0.0, 0.0, 99.8, 97.43, 99.98, 98.44, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 0.97, -0.28, 5.32, 2.22, 2.17, 8.48, 2.11, 0.26, 0.48, 1.24, 0.4, 1.1, 1.58, 0.71, 1.09, -0.15, 1.53, 5.16, 3.11, 1.5, 0.27, 1.38, 1.71, 2.74, 2.41, 2.93, 9.59, 1.14, 4.15, 2.36]} \ No newline at end of file diff --git a/annotations_1/Boona4-qLSE_filtered.json b/annotations_1/Boona4-qLSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffe525432c90adffb500584866ad8f8c9784b54a --- /dev/null +++ b/annotations_1/Boona4-qLSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.09], [10.0, 16.8], [20.0, 21.0], [22.0, 27.68], [44.0, 45.98], [47.0, 48.44], [49.0, 57.08], [58.0, 59.63], [63.0, 64.39], [67.0, 67.49], [68.0, 72.91], [77.0, 77.77], [78.0, 80.5], [85.0, 86.63], [88.0, 109.93], [112.0, 137.39], [138.0, 151.04], [151.0, 151.36], [153.0, 153.57], [154.0, 158.46], [159.0, 165.67], [166.0, 170.55], [171.0, 171.22], [178.0, 178.21], [181.0, 182.14]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, true, false, false, false, false], "silence_prob": [32.45, 36.99, 0.0, 40.11, 0.0, 0.0, 50.41, 0.0, 0.0, 0.0, 35.67, 0.0, 40.81, 0.0, 30.19, 35.33, 41.74, 0.0, 0.0, 38.15, 45.33, 68.93, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 19.3], ["music", 16.38], ["mains hum", 5.93]], [["music", 37.03], ["speech", 22.15], ["hum", 17.51]], null, [["music", 51.52], ["pour", 10.56], ["whale vocalization", 4.45]], null, null, null, null, null, null, [["fly, housefly", 52.23], ["mosquito", 24.77], ["insect", 19.95]], null, [["mosquito", 53.01], ["whale vocalization", 28.58], ["fly, housefly", 6.64]], null, [["music", 39.95], ["hum", 17.11], ["throbbing", 8.48]], [["music", 75.11], ["brass instrument", 4.64], ["grunt", 4.48]], [["whale vocalization", 21.91], ["animal", 20.97], ["cattle, bovinae", 15.31]], null, null, [["fill (with liquid)", 19.48], ["liquid", 18.53], ["water", 10.24]], [["livestock, farm animals, working animals", 29.9], ["animal", 16.31], ["sheep", 8.76]], null, null, null, null], "duration": [2.09, 6.8, 1.0, 5.68, 1.98, 1.44, 8.08, 1.63, 1.39, 0.49, 4.91, 0.77, 2.5, 1.63, 21.93, 25.39, 13.04, 0.36, 0.57, 4.46, 6.67, 4.55, 0.22, 0.21, 1.14]} \ No newline at end of file diff --git a/annotations_1/BpAvVBwO8J0_filtered.json b/annotations_1/BpAvVBwO8J0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f4e008ce333b929c1595d62a0ec294d254cf202 --- /dev/null +++ b/annotations_1/BpAvVBwO8J0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 24.07], [39.0, 40.0], [41.0, 42.9], [48.0, 52.74], [56.0, 56.3], [59.0, 60.15], [63.0, 63.14], [65.0, 65.84], [66.0, 67.44], [68.0, 69.62], [73.0, 72.77], [87.0, 87.02], [89.0, 90.27], [94.0, 94.47], [96.0, 96.72], [97.0, 97.58], [99.0, 109.41], [111.0, 112.67], [113.0, 116.06], [117.0, 119.03], [121.0, 121.12], [122.0, 122.91], [130.0, 130.47], [131.0, 131.28], [133.0, 137.86], [141.0, 141.64], [143.0, 143.73], [146.0, 148.42], [152.0, 152.42], [153.0, 153.77], [156.0, 156.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [29.86, 0.0, 0.0, 34.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.78, 0.0, 54.1, 54.97, 0.0, 0.0, 0.0, 0.0, 36.42, 0.0, 0.0, 38.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 74.45], ["speech", 5.93], ["didgeridoo", 2.44]], null, null, [["music", 72.73], ["speech", 5.56], ["sidetone", 3.57]], null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 24.48], ["throbbing", 19.47], ["music", 12.79]], null, null, null, null, null, null, null, [["throbbing", 58.16], ["hum", 23.39], ["mains hum", 3.49]], null, null, [["music", 16.5], ["sheep", 11.76], ["hum", 9.3]], null, null, null], "duration": [9.07, 1.0, 1.9, 4.74, 0.3, 1.15, 0.14, 0.84, 1.44, 1.62, -0.23, 0.02, 1.27, 0.47, 0.72, 0.58, 10.41, 1.67, 3.06, 2.03, 0.12, 0.91, 0.47, 0.28, 4.86, 0.64, 0.73, 2.42, 0.42, 0.77, 0.86]} \ No newline at end of file diff --git a/annotations_1/BpnlB0ILpWw_filtered.json b/annotations_1/BpnlB0ILpWw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc3e18a11c6fa591d5fcf31faba3090f06a7bb44 --- /dev/null +++ b/annotations_1/BpnlB0ILpWw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.82], [5.0, 8.61], [10.0, 16.02], [17.0, 18.77], [20.0, 21.34], [25.0, 25.71], [26.0, 26.92], [32.0, 37.98], [39.0, 40.69], [42.0, 42.52], [44.0, 46.63], [51.0, 52.93], [54.0, 56.74], [59.0, 59.8], [64.0, 64.79], [65.0, 65.91], [67.0, 68.59], [81.0, 82.48], [89.0, 89.06], [90.0, 91.25], [92.0, 92.79], [94.0, 96.82], [98.0, 97.97], [99.0, 100.87], [102.0, 104.18], [105.0, 110.94], [114.0, 114.39], [116.0, 116.45], [118.0, 134.97], [138.0, 139.51], [140.0, 141.52], [143.0, 143.83], [145.0, 147.51], [148.0, 148.63], [149.0, 157.2], [158.0, 174.56], [175.0, 182.56], [186.0, 188.27], [189.0, 192.13]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 46.54, 98.01, 0.0, 0.0, 0.0, 0.0, 30.39, 0.0, 0.0, 99.85, 0.0, 96.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 79.07, 41.85, 0.0, 0.0, 63.85, 0.0, 0.0, 0.0, 35.39, 0.0, 30.9, 53.84, 86.45, 100.0, 100.0], "audiomae_on_audioset": [null, [["music", 30.92], ["speech", 14.65], ["whale vocalization", 13.76]], null, null, null, null, null, [["speech", 29.47], ["sidetone", 18.2], ["music", 9.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.2], ["gong", 4.8], ["domestic animals, pets", 2.36]], null, null, null, null, null, null, [["speech", 28.72], ["didgeridoo", 9.27], ["music", 8.6]], null, [["groan", 23.51], ["fly, housefly", 19.26], ["mosquito", 12.45]], null, null, null, null], "duration": [0.82, 3.61, 6.02, 1.77, 1.34, 0.71, 0.92, 5.98, 1.69, 0.52, 2.63, 1.93, 2.74, 0.8, 0.79, 0.91, 1.59, 1.48, 0.06, 1.25, 0.79, 2.82, -0.03, 1.87, 2.18, 5.94, 0.39, 0.45, 16.97, 1.51, 1.52, 0.83, 2.51, 0.63, 8.2, 16.56, 7.56, 2.27, 3.13]} \ No newline at end of file diff --git a/annotations_1/Br9zd0KkFTU_filtered.json b/annotations_1/Br9zd0KkFTU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c64b20af0839c1412dcf2b9e49c27a527b6d1028 --- /dev/null +++ b/annotations_1/Br9zd0KkFTU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.15], [18.0, 21.32], [52.0, 54.09], [69.0, 70.02], [72.0, 75.46], [77.0, 79.59], [80.0, 80.28], [86.0, 86.76], [88.0, 88.67], [91.0, 105.26], [110.0, 113.97], [115.0, 117.26], [118.0, 119.2], [120.0, 136.31], [137.0, 137.05], [138.0, 138.7], [139.0, 141.69], [143.0, 151.44], [152.0, 160.47]], "keep_status": [false, true, true, false, false, true, false, false, false, true, true, true, false, true, false, false, true, false, true], "silence_prob": [0.0, 31.64, 29.55, 0.0, 50.26, 39.57, 0.0, 0.0, 0.0, 30.09, 30.87, 33.45, 0.0, 30.21, 0.0, 0.0, 30.7, 29.57, 40.11], "audiomae_on_audioset": [null, [["music", 30.52], ["rain on surface", 6.01], ["rain", 5.31]], [["music", 23.47], ["bang", 6.52], ["whack, thwack", 6.06]], null, null, [["music", 24.24], ["hum", 12.13], ["rain on surface", 11.91]], null, null, null, [["buzz", 27.52], ["music", 18.9], ["mains hum", 14.84]], [["speech", 49.39], ["music", 17.31], ["vehicle", 2.39]], [["music", 20.03], ["rain", 11.01], ["rain on surface", 10.61]], null, [["hum", 38.49], ["mains hum", 21.98], ["speech", 5.75]], null, null, [["speech", 24.1], ["buzzer", 23.37], ["electric shaver, electric razor", 9.08]], [["hum", 41.53], ["mains hum", 32.53], ["throbbing", 6.22]], [["music", 20.35], ["hum", 16.32], ["mains hum", 5.7]]], "duration": [0.15, 3.32, 2.09, 1.02, 3.46, 2.59, 0.28, 0.76, 0.67, 14.26, 3.97, 2.26, 1.2, 16.31, 0.05, 0.7, 2.69, 8.44, 8.47]} \ No newline at end of file diff --git a/annotations_1/BrLcbi68R_A_filtered.json b/annotations_1/BrLcbi68R_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0f23a4ae2f483d84d2660e839a20bb9a05d2a26 --- /dev/null +++ b/annotations_1/BrLcbi68R_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 32.54], [37.0, 38.53], [42.0, 42.63], [44.0, 45.87], [50.0, 49.94], [64.0, 65.11], [67.0, 69.28], [71.0, 78.65], [79.0, 79.44], [80.0, 80.37], [84.0, 89.19], [92.0, 98.34], [111.0, 114.79], [117.0, 118.4], [121.0, 134.89], [135.0, 136.51], [137.0, 141.93], [142.0, 143.72], [148.0, 149.57], [156.0, 156.61], [163.0, 164.32], [167.0, 167.07], [167.0, 171.27], [173.0, 177.79]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.21, 0.0, 0.0, 0.0, 0.0, 0.0, 40.45, 35.42, 0.0, 0.0, 35.62, 37.16, 30.14, 0.0, 30.6, 0.0, 31.24, 0.0, 0.0, 0.0, 0.0, 0.0, 30.75, 29.6], "audiomae_on_audioset": [[["music", 40.0], ["wind instrument, woodwind instrument", 9.14], ["shofar", 8.85]], null, null, null, null, null, [["music", 70.81], ["swing music", 3.85], ["funny music", 1.91]], [["music", 78.55], ["synthesizer", 2.57], ["theremin", 2.42]], null, null, [["music", 58.81], ["funk", 6.71], ["reggae", 4.98]], [["music", 79.18], ["musical instrument", 4.13], ["synthesizer", 2.55]], [["music", 69.12], ["vocal music", 2.77], ["singing", 2.71]], null, [["music", 76.44], ["funk", 1.83], ["singing", 1.51]], null, [["music", 65.9], ["jingle (music)", 8.13], ["christmas music", 4.05]], null, null, null, null, null, [["music", 67.83], ["electronic music", 3.06], ["didgeridoo", 2.68]], [["music", 63.25], ["christian music", 3.76], ["singing", 3.44]]], "duration": [3.54, 1.53, 0.63, 1.87, -0.06, 1.11, 2.28, 7.65, 0.44, 0.37, 5.19, 6.34, 3.79, 1.4, 13.89, 1.51, 4.93, 1.72, 1.57, 0.61, 1.32, 0.07, 4.27, 4.79]} \ No newline at end of file diff --git a/annotations_1/BrWwVhnztcg_filtered.json b/annotations_1/BrWwVhnztcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a11a0fab75a6bc1b1b3311d909cc78e1275e605 --- /dev/null +++ b/annotations_1/BrWwVhnztcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.78], [12.0, 12.87], [15.0, 16.41], [18.0, 19.18], [25.0, 27.06], [34.0, 34.38], [37.0, 38.75], [40.0, 41.94], [44.0, 65.45], [67.0, 67.9], [69.0, 69.63], [70.0, 71.47], [76.0, 79.03], [80.0, 82.59], [84.0, 85.36], [87.0, 88.96], [90.0, 92.45], [94.0, 96.8], [100.0, 100.58], [101.0, 103.22], [104.0, 105.71], [106.0, 111.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 96.04, 94.95, 0.0, 0.0, 86.27, 93.13, 0.0, 88.1, 0.0, 97.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 0.87, 1.41, 1.18, 2.06, 0.38, 1.75, 1.94, 21.45, 0.9, 0.63, 1.47, 3.03, 2.59, 1.36, 1.96, 2.45, 2.8, 0.58, 2.22, 1.71, 5.52]} \ No newline at end of file diff --git a/annotations_1/BshBOgRLN28_filtered.json b/annotations_1/BshBOgRLN28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a3e51fc58c14c9654289175e9f708796786add2 --- /dev/null +++ b/annotations_1/BshBOgRLN28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.68], [9.0, 9.69], [16.0, 16.83], [18.0, 18.79], [20.0, 22.49], [25.0, 25.42], [26.0, 27.73], [34.0, 86.71], [88.0, 147.85], [149.0, 164.67]], "keep_status": [false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.22, 0.0, 0.0, 0.0, 0.0, 34.12], "audiomae_on_audioset": [null, null, null, null, [["speech", 20.93], ["music", 17.5], ["hum", 17.47]], null, null, null, null, [["hum", 41.58], ["music", 23.68], ["throbbing", 10.53]]], "duration": [0.68, 0.69, 0.83, 0.79, 2.49, 0.42, 1.73, 52.71, 59.85, 15.67]} \ No newline at end of file diff --git a/annotations_1/Btywn5TiBNQ_filtered.json b/annotations_1/Btywn5TiBNQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9519d0c09b8016c39bc04478294a128f22eaf0fd --- /dev/null +++ b/annotations_1/Btywn5TiBNQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.83], [18.0, 37.52], [39.0, 59.76], [62.0, 63.61], [66.0, 66.72], [69.0, 70.78], [71.0, 75.17], [75.0, 112.48], [115.0, 119.28], [123.0, 123.89], [124.0, 124.16], [124.0, 124.6]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [33.67, 51.77, 30.33, 0.0, 0.0, 0.0, 29.26, 0.0, 28.55, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["didgeridoo", 26.07], ["music", 25.29], ["foghorn", 15.39]], null, [["music", 75.76], ["musical instrument", 3.98], ["electronic music", 2.91]], null, null, null, [["music", 48.97], ["clarinet", 13.44], ["musical instrument", 10.15]], null, [["speech", 38.81], ["foghorn", 13.88], ["music", 12.91]], null, null, null], "duration": [9.83, 19.52, 20.76, 1.61, 0.72, 1.78, 4.17, 37.48, 4.28, 0.89, 0.16, 0.6]} \ No newline at end of file diff --git a/annotations_1/BuN4WOVbk7s_filtered.json b/annotations_1/BuN4WOVbk7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c043bc6e12be400651158b9b0251e852256d016 --- /dev/null +++ b/annotations_1/BuN4WOVbk7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.15], [26.0, 25.91], [31.0, 33.86], [37.0, 37.5], [38.0, 37.57], [51.0, 53.87], [54.0, 57.37], [61.0, 61.79], [64.0, 64.84], [73.0, 73.95], [81.0, 81.58], [83.0, 86.97]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.9, 0.0, 0.0, 30.42, 31.95, 0.0, 0.0, 0.0, 0.0, 31.36], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 22.86], ["radio", 20.09], ["speech", 12.33]], null, null, [["speech", 68.78], ["radio", 14.39], ["sidetone", 5.26]], [["speech", 78.23], ["sidetone", 11.78], ["radio", 2.64]], null, null, null, null, [["speech", 52.24], ["hum", 9.77], ["radio", 8.55]]], "duration": [0.15, -0.09, 2.86, 0.5, -0.43, 2.87, 3.37, 0.79, 0.84, 0.95, 0.58, 3.97]} \ No newline at end of file diff --git a/annotations_1/BuPdA_CDITw_filtered.json b/annotations_1/BuPdA_CDITw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c89aa533325d59d02fadde6872836c5786275cd8 --- /dev/null +++ b/annotations_1/BuPdA_CDITw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.45], [9.0, 10.37], [12.0, 14.39], [15.0, 17.9], [19.0, 19.3], [21.0, 21.29], [22.0, 23.8], [27.0, 28.07], [30.0, 31.87], [35.0, 35.83], [38.0, 38.79], [39.0, 39.6], [42.0, 44.88], [45.0, 47.41], [52.0, 52.25], [53.0, 55.86], [58.0, 59.53], [60.0, 61.28], [62.0, 64.98], [67.0, 68.35], [73.0, 73.77], [75.0, 76.33], [77.0, 77.53], [78.0, 78.8], [79.0, 80.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 61.97, 57.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.74, 47.12, 0.0, 65.44, 0.0, 0.0, 48.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.37], ["didgeridoo", 12.48], ["music", 7.05]], [["fly, housefly", 20.44], ["bee, wasp, etc.", 14.31], ["speech", 12.21]], null, null, null, null, [["hum", 30.7], ["mains hum", 28.61], ["radio", 4.42]], null, null, null, null, null, null], "duration": [1.45, 1.37, 2.39, 2.9, 0.3, 0.29, 1.8, 1.07, 1.87, 0.83, 0.79, 0.6, 2.88, 2.41, 0.25, 2.86, 1.53, 1.28, 2.98, 1.35, 0.77, 1.33, 0.53, 0.8, 1.4]} \ No newline at end of file diff --git a/annotations_1/BvcBo3De8Hc_filtered.json b/annotations_1/BvcBo3De8Hc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cf93c00eb108fae86c4c4d014291117afecb96c --- /dev/null +++ b/annotations_1/BvcBo3De8Hc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 47.17], [48.0, 57.62], [60.0, 67.24], [69.0, 74.31], [76.0, 80.84], [82.0, 83.51], [88.0, 90.58], [91.0, 94.93], [97.0, 97.58], [101.0, 101.31], [102.0, 103.08], [104.0, 104.99], [106.0, 107.81], [108.0, 109.29], [111.0, 113.98], [114.0, 115.3], [116.0, 119.99], [122.0, 123.16], [130.0, 129.9], [132.0, 146.55], [148.0, 149.49]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.51, 31.98, 30.22, 37.28, 0.0, 69.07, 74.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 39.58, 0.0, 0.0, 32.58, 0.0], "audiomae_on_audioset": [null, [["music", 71.91], ["didgeridoo", 3.54], ["electronic music", 3.17]], [["fly, housefly", 25.39], ["insect", 14.38], ["sine wave", 10.2]], [["speech", 54.43], ["music", 17.83], ["throbbing", 5.21]], [["music", 34.58], ["brass instrument", 11.73], ["trombone", 5.19]], null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 46.94], ["speech", 44.19], ["radio", 1.35]], null, null, [["music", 80.55], ["synthesizer", 6.11], ["electronic music", 1.89]], null], "duration": [34.17, 9.62, 7.24, 5.31, 4.84, 1.51, 2.58, 3.93, 0.58, 0.31, 1.08, 0.99, 1.81, 1.29, 2.98, 1.3, 3.99, 1.16, -0.1, 14.55, 1.49]} \ No newline at end of file diff --git a/annotations_1/BwWzZtG_6fA_filtered.json b/annotations_1/BwWzZtG_6fA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6d019a9f77fff895a2401e999d7b8dd41dbb473 --- /dev/null +++ b/annotations_1/BwWzZtG_6fA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.21], [6.0, 6.24], [9.0, 10.88], [13.0, 16.75], [18.0, 20.11], [21.0, 27.58], [36.0, 37.54], [40.0, 41.25], [44.0, 44.37], [46.0, 48.3], [50.0, 53.86], [60.0, 83.22], [86.0, 90.19], [90.0, 90.53], [91.0, 91.99], [93.0, 93.28], [94.0, 102.27], [103.0, 109.73], [110.0, 113.83], [119.0, 127.09], [128.0, 133.35], [135.0, 142.82], [143.0, 147.53], [153.0, 153.33], [155.0, 155.16], [156.0, 157.65], [164.0, 164.19], [166.0, 166.29], [168.0, 169.4], [171.0, 170.95], [171.0, 171.9], [176.0, 177.53]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [85.9, 0.0, 0.0, 93.6, 45.59, 42.46, 0.0, 0.0, 0.0, 42.91, 54.04, 34.32, 70.86, 0.0, 0.0, 0.0, 45.69, 39.46, 39.28, 68.41, 69.07, 41.26, 32.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 38.21], ["cacophony", 19.03], ["noise", 13.39]], [["speech", 24.58], ["music", 16.23], ["fly, housefly", 10.99]], null, null, null, [["whale vocalization", 33.38], ["sonar", 13.95], ["hum", 9.89]], null, [["speech", 23.52], ["music", 22.29], ["hum", 14.71]], null, null, null, null, [["music", 59.57], ["speech", 12.37], ["electronic music", 5.12]], [["music", 28.1], ["hum", 15.3], ["mains hum", 7.46]], [["music", 40.0], ["speech", 34.72], ["fart", 5.52]], null, null, [["music", 55.29], ["synthesizer", 13.62], ["speech", 4.64]], [["music", 37.91], ["fly, housefly", 8.38], ["hum", 6.73]], null, null, null, null, null, null, null, null, null], "duration": [3.21, 0.24, 1.88, 3.75, 2.11, 6.58, 1.54, 1.25, 0.37, 2.3, 3.86, 23.22, 4.19, 0.53, 0.99, 0.28, 8.27, 6.73, 3.83, 8.09, 5.35, 7.82, 4.53, 0.33, 0.16, 1.65, 0.19, 0.29, 1.4, -0.05, 0.9, 1.53]} \ No newline at end of file diff --git a/annotations_1/Bwpvq4JhqY4_filtered.json b/annotations_1/Bwpvq4JhqY4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..019b55c5c598c4298371fdf525156d2b9bdbbfec --- /dev/null +++ b/annotations_1/Bwpvq4JhqY4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [13.0, 14.88], [21.0, 22.4], [24.0, 25.12], [32.0, 33.37], [39.0, 39.51], [46.0, 46.85], [49.0, 49.84], [52.0, 59.21], [60.0, 65.84], [66.0, 69.35], [70.0, 73.67], [75.0, 77.38], [79.0, 81.19], [82.0, 83.83], [87.0, 88.05], [90.0, 91.72], [95.0, 96.5], [97.0, 97.98], [103.0, 105.17], [109.0, 109.54], [110.0, 112.21], [112.0, 114.81], [116.0, 121.31], [122.0, 125.79], [129.0, 130.1], [131.0, 132.58], [133.0, 133.71], [140.0, 141.42], [144.0, 146.35], [150.0, 151.26], [152.0, 151.88], [157.0, 169.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 79.41, 56.33, 90.08, 51.77, 82.97, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 65.2, 70.44, 83.52, 42.28, 0.0, 0.0, 0.0, 0.0, 47.08, 0.0, 0.0, 53.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 22.77], ["frog", 9.64], ["mains hum", 8.85]], null, null, null, null, [["didgeridoo", 13.12], ["music", 12.82], ["fly, housefly", 7.65]], null, null, null], "duration": [0.51, 1.88, 1.4, 1.12, 1.37, 0.51, 0.85, 0.84, 7.21, 5.84, 3.35, 3.67, 2.38, 2.19, 1.83, 1.05, 1.72, 1.5, 0.98, 2.17, 0.54, 2.21, 2.81, 5.31, 3.79, 1.1, 1.58, 0.71, 1.42, 2.35, 1.26, -0.12, 12.01]} \ No newline at end of file diff --git a/annotations_1/Bx9JRDKjrwA_filtered.json b/annotations_1/Bx9JRDKjrwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a95987912b6eab27f41f2469c7de13c97b8fddee --- /dev/null +++ b/annotations_1/Bx9JRDKjrwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.13], [9.0, 9.05], [10.0, 10.2], [11.0, 10.79], [12.0, 12.28], [14.0, 15.77], [27.0, 27.73], [28.0, 28.56], [31.0, 31.33], [32.0, 32.49], [34.0, 40.31], [41.0, 41.93], [51.0, 51.39], [52.0, 55.98], [63.0, 63.78], [66.0, 69.15], [72.0, 77.18], [80.0, 80.89], [85.0, 87.17], [89.0, 90.12], [91.0, 93.14], [100.0, 100.47], [108.0, 107.92], [114.0, 115.43], [116.0, 117.34], [122.0, 133.08], [134.0, 134.08], [135.0, 135.41], [140.0, 140.22], [141.0, 141.27], [142.0, 142.28], [151.0, 151.19], [156.0, 157.01], [161.0, 163.7]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.22, 0.0, 0.0, 44.49, 0.0, 33.57, 35.36, 0.0, 37.59, 0.0, 52.74, 0.0, 0.0, 0.0, 0.0, 38.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89], "audiomae_on_audioset": [[["speech", 25.39], ["sidetone", 23.4], ["fly, housefly", 7.72]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.54], ["music", 13.76], ["grunt", 6.48]], null, [["fart", 18.27], ["speech", 14.56], ["fly, housefly", 10.99]], [["fart", 26.13], ["speech", 23.63], ["music", 12.66]], null, [["speech", 22.77], ["livestock, farm animals, working animals", 8.12], ["roar", 7.87]], null, null, null, null, null, null, [["speech", 43.49], ["sidetone", 36.15], ["fly, housefly", 4.24]], null, null, null, null, null, null, null, null], "duration": [2.13, 0.05, 0.2, -0.21, 0.28, 1.77, 0.73, 0.56, 0.33, 0.49, 6.31, 0.93, 0.39, 3.98, 0.78, 3.15, 5.18, 0.89, 2.17, 1.12, 2.14, 0.47, -0.08, 1.43, 1.34, 11.08, 0.08, 0.41, 0.22, 0.27, 0.28, 0.19, 1.01, 2.7]} \ No newline at end of file diff --git a/annotations_1/BxB1Mpj8NiM_filtered.json b/annotations_1/BxB1Mpj8NiM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..484759a65f54d121ccc4f809ca46fdc2ecdb948f --- /dev/null +++ b/annotations_1/BxB1Mpj8NiM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 55.68], [59.0, 66.14], [70.0, 71.15], [72.0, 72.67], [76.0, 76.82], [80.0, 80.77], [91.0, 91.49], [99.0, 101.22], [102.0, 102.17], [103.0, 103.84], [106.0, 106.08], [107.0, 108.19], [109.0, 109.86], [113.0, 113.12], [115.0, 118.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [33.36, 48.44, 0.0, 0.0, 0.0, 0.0, 0.0, 35.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.89], "audiomae_on_audioset": [[["music", 62.11], ["speech", 13.32], ["boing", 3.07]], [["music", 66.41], ["throbbing", 5.08], ["electronic music", 2.57]], null, null, null, null, null, [["music", 60.05], ["whack, thwack", 6.04], ["electronic music", 3.58]], null, null, null, null, null, null, [["speech", 38.1], ["music", 37.94], ["sidetone", 5.82]]], "duration": [13.68, 7.14, 1.15, 0.67, 0.82, 0.77, 0.49, 2.22, 0.17, 0.84, 0.08, 1.19, 0.86, 0.12, 3.94]} \ No newline at end of file diff --git a/annotations_1/BxIcBWi4ETk_filtered.json b/annotations_1/BxIcBWi4ETk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..796d83e91375a9caf313d6da15166a329d769599 --- /dev/null +++ b/annotations_1/BxIcBWi4ETk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 27.21], [29.0, 30.7], [39.0, 39.63], [44.0, 45.03], [48.0, 72.18], [76.0, 101.58], [103.0, 114.99]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [32.99, 0.0, 0.0, 0.0, 30.02, 30.92, 29.53], "audiomae_on_audioset": [[["throbbing", 56.0], ["hum", 19.07], ["speech", 11.62]], null, null, null, [["speech", 44.77], ["music", 26.5], ["thump, thud", 5.96]], [["music", 49.82], ["whack, thwack", 11.36], ["speech", 10.65]], [["whack, thwack", 43.04], ["music", 8.45], ["hum", 7.11]]], "duration": [20.21, 1.7, 0.63, 1.03, 24.18, 25.58, 11.99]} \ No newline at end of file diff --git a/annotations_1/By05PXEvGWA_filtered.json b/annotations_1/By05PXEvGWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3bb063c66cc0959c432bfd2423792e219a73c03 --- /dev/null +++ b/annotations_1/By05PXEvGWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.85], [7.0, 8.65], [17.0, 17.34], [21.0, 21.98], [24.0, 25.57], [29.0, 29.57], [34.0, 34.2], [36.0, 37.27], [41.0, 41.12], [43.0, 44.12], [48.0, 50.7], [51.0, 53.1], [54.0, 55.32], [56.0, 60.66], [62.0, 61.57], [64.0, 97.63], [98.0, 100.13], [101.0, 104.46], [105.0, 106.27], [107.0, 108.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 62.27, 0.0, 78.55, 0.0, 0.0, 39.69, 37.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["foghorn", 60.85], ["double bass", 12.26], ["music", 8.65]], [["music", 53.98], ["double bass", 11.09], ["cello", 8.42]], null, null], "duration": [1.85, 1.65, 0.34, 0.98, 1.57, 0.57, 0.2, 1.27, 0.12, 1.12, 2.7, 2.1, 1.32, 4.66, -0.43, 33.63, 2.13, 3.46, 1.27, 1.11]} \ No newline at end of file diff --git a/annotations_1/ByPtVBI4_MI_filtered.json b/annotations_1/ByPtVBI4_MI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55ee8dc02818ab93034a223ba07f2b73a5e9d9e9 --- /dev/null +++ b/annotations_1/ByPtVBI4_MI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 39.24], [40.0, 48.81], [50.0, 51.17], [52.0, 53.23], [88.0, 94.83]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 32.8, 0.0, 0.0, 31.52], "audiomae_on_audioset": [null, [["music", 20.08], ["throbbing", 17.36], ["speech", 10.92]], null, null, [["music", 67.09], ["synthesizer", 8.55], ["musical instrument", 5.37]]], "duration": [1.24, 8.81, 1.17, 1.23, 6.83]} \ No newline at end of file diff --git a/annotations_1/ByRUwa_QiaE_filtered.json b/annotations_1/ByRUwa_QiaE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..911085ea7a916ceca53e3135c13221f2e776ab7c --- /dev/null +++ b/annotations_1/ByRUwa_QiaE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.79], [27.0, 28.56], [32.0, 43.95], [51.0, 53.67], [67.0, 78.49], [79.0, 78.61], [91.0, 104.13], [106.0, 110.32], [120.0, 120.7], [122.0, 123.75], [126.0, 126.72], [129.0, 128.71], [130.0, 131.62], [134.0, 135.9], [152.0, 152.88]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [71.14, 0.0, 40.02, 73.97, 38.31, 0.0, 58.89, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 55.44], ["sidetone", 15.02], ["speech", 6.08]], null, [["music", 44.13], ["speech", 15.4], ["animal", 2.73]], null, null, null, null, null, null, null, null, null, null], "duration": [3.79, 1.56, 11.95, 2.67, 11.49, -0.39, 13.13, 4.32, 0.7, 1.75, 0.72, -0.29, 1.62, 1.9, 0.88]} \ No newline at end of file diff --git a/annotations_1/ByRXX8KHS5o_filtered.json b/annotations_1/ByRXX8KHS5o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3fb4ada6814e90b5ca44a916fcf71423221f7f55 --- /dev/null +++ b/annotations_1/ByRXX8KHS5o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.03], [18.0, 21.0], [25.0, 27.43], [29.0, 28.97], [32.0, 35.73], [38.0, 37.98], [40.0, 42.82], [44.0, 47.29], [49.0, 49.71], [51.0, 52.69], [53.0, 54.78], [56.0, 85.26], [86.0, 85.89], [87.0, 89.97], [97.0, 99.86], [101.0, 111.94], [115.0, 121.61], [128.0, 128.01], [131.0, 133.73], [136.0, 136.48], [137.0, 139.51], [142.0, 142.6], [147.0, 153.57], [165.0, 165.7], [171.0, 171.53]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, true, true, true, true, false, true, false, true, false, true, false, false], "silence_prob": [83.88, 82.25, 80.82, 0.0, 32.05, 0.0, 91.13, 40.34, 0.0, 0.0, 0.0, 35.57, 0.0, 34.9, 46.5, 41.85, 49.04, 0.0, 41.07, 0.0, 33.7, 0.0, 43.77, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["livestock, farm animals, working animals", 36.14], ["cattle, bovinae", 13.85], ["moo", 12.7]], null, null, [["fly, housefly", 29.42], ["insect", 20.93], ["mosquito", 10.52]], null, null, null, [["music", 78.56], ["speech", 6.67], ["thunk", 1.88]], null, [["thunk", 15.55], ["music", 10.36], ["ding", 8.92]], [["speech", 29.97], ["music", 23.87], ["didgeridoo", 9.36]], [["speech", 29.65], ["music", 19.82], ["hum", 4.6]], [["fly, housefly", 11.2], ["speech", 9.31], ["music", 8.09]], null, [["music", 44.36], ["throbbing", 11.12], ["synthesizer", 6.08]], null, [["speech", 36.15], ["mains hum", 10.31], ["hum", 9.73]], null, [["hum", 22.82], ["music", 18.82], ["mains hum", 12.07]], null, null], "duration": [3.03, 3.0, 2.43, -0.03, 3.73, -0.02, 2.82, 3.29, 0.71, 1.69, 1.78, 29.26, -0.11, 2.97, 2.86, 10.94, 6.61, 0.01, 2.73, 0.48, 2.51, 0.6, 6.57, 0.7, 0.53]} \ No newline at end of file diff --git a/annotations_1/BznPcrTUYvg_filtered.json b/annotations_1/BznPcrTUYvg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff494e2577a5221b32cd5b1f42f8f98d11cbff0c --- /dev/null +++ b/annotations_1/BznPcrTUYvg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.54], [7.0, 8.31], [9.0, 10.84], [15.0, 17.51], [19.0, 21.03], [23.0, 24.24], [25.0, 27.18], [28.0, 31.5], [32.0, 32.86], [34.0, 36.36], [37.0, 42.63], [43.0, 45.27], [47.0, 48.46], [49.0, 52.22], [54.0, 55.95], [59.0, 64.37], [66.0, 67.9], [70.0, 71.2], [72.0, 72.54], [73.0, 76.18], [78.0, 84.25], [85.0, 100.31], [101.0, 102.63], [103.0, 107.3], [108.0, 111.42], [113.0, 123.18], [126.0, 126.49], [128.0, 129.24], [130.0, 131.31], [133.0, 134.5], [136.0, 137.76], [141.0, 141.66], [145.0, 145.32], [149.0, 173.55], [175.0, 177.25], [179.0, 185.95], [187.0, 189.48], [190.0, 192.54], [194.0, 195.35], [196.0, 199.76], [201.0, 202.07], [202.0, 206.07], [207.0, 209.31], [210.0, 225.88], [228.0, 230.37], [232.0, 236.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.65, 65.32, 0.0, 76.53, 90.43, 0.0, 91.47, 75.23, 87.0, 0.0, 47.39, 0.0, 86.82, 0.0, 0.0, 0.0, 80.82, 97.73, 76.37, 0.0, 75.88, 61.47, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 71.14, 87.0, 86.82, 71.29, 0.0, 89.9, 0.0, 80.64, 71.72, 91.81, 62.47, 71.57], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 63.15], ["speech", 14.94], ["music", 5.6]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.54, 1.31, 1.84, 2.51, 2.03, 1.24, 2.18, 3.5, 0.86, 2.36, 5.63, 2.27, 1.46, 3.22, 1.95, 5.37, 1.9, 1.2, 0.54, 3.18, 6.25, 15.31, 1.63, 4.3, 3.42, 10.18, 0.49, 1.24, 1.31, 1.5, 1.76, 0.66, 0.32, 24.55, 2.25, 6.95, 2.48, 2.54, 1.35, 3.76, 1.07, 4.07, 2.31, 15.88, 2.37, 4.49]} \ No newline at end of file diff --git a/annotations_1/C-FH-TOuFpQ_filtered.json b/annotations_1/C-FH-TOuFpQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22f93fc5154273540c5e7c51afd51eea4bed46a3 --- /dev/null +++ b/annotations_1/C-FH-TOuFpQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 89.87], [91.0, 97.31], [98.0, 101.12], [102.0, 107.13], [112.0, 113.56], [114.0, 114.71], [121.0, 120.93], [122.0, 122.49], [123.0, 131.3], [132.0, 135.16], [139.0, 140.21], [145.0, 147.01], [151.0, 152.02], [153.0, 153.35], [154.0, 155.87], [157.0, 160.41], [163.0, 164.84], [166.0, 168.05], [169.0, 171.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 87.19, 100.0, 63.42, 0.0, 0.0, 0.0, 0.0, 59.59, 65.67, 0.0, 55.31, 0.0, 0.0, 0.0, 75.55, 0.0, 40.88, 99.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 19.48], ["sidetone", 16.16], ["guitar", 8.66]], null], "duration": [42.87, 6.31, 3.12, 5.13, 1.56, 0.71, -0.07, 0.49, 8.3, 3.16, 1.21, 2.01, 1.02, 0.35, 1.87, 3.41, 1.84, 2.05, 2.42]} \ No newline at end of file diff --git a/annotations_1/C-uCzmnXn-g_filtered.json b/annotations_1/C-uCzmnXn-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f848a49b8cd885356f5daeed925f76d109ffea9 --- /dev/null +++ b/annotations_1/C-uCzmnXn-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.54], [2.0, 1.63], [2.0, 2.69], [5.0, 6.08], [8.0, 8.68], [10.0, 12.31], [13.0, 13.76], [18.0, 18.74], [19.0, 22.82], [23.0, 24.11], [26.0, 26.7], [29.0, 30.08], [33.0, 34.05], [35.0, 35.72], [42.0, 45.13], [46.0, 49.38], [50.0, 51.53], [53.0, 54.3], [61.0, 62.04], [63.0, 64.3], [71.0, 75.95], [76.0, 77.21], [81.0, 82.9], [93.0, 93.85], [96.0, 97.46], [100.0, 101.98], [104.0, 107.57], [111.0, 117.78], [123.0, 124.16], [129.0, 143.23], [144.0, 145.59], [147.0, 164.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 44.9, 0.0, 0.0, 52.98, 0.0, 0.0, 0.0, 0.0, 0.0, 40.5, 36.02, 0.0, 0.0, 0.0, 0.0, 40.5, 0.0, 0.0, 0.0, 0.0, 0.0, 33.91, 33.51, 0.0, 38.19, 0.0, 29.81], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 33.14], ["mains hum", 30.38], ["music", 7.59]], null, null, null, null, null, null, null, null, [["music", 47.37], ["mains hum", 12.73], ["hum", 11.78]], [["music", 60.49], ["ambient music", 8.83], ["hum", 5.79]], null, null, null, null, [["music", 37.05], ["mains hum", 20.18], ["hum", 14.12]], null, null, null, null, null, [["music", 59.68], ["hum", 7.44], ["didgeridoo", 5.84]], [["music", 66.89], ["hum", 7.86], ["electronic music", 3.19]], null, [["music", 48.07], ["hum", 8.93], ["scary music", 4.75]], null, [["buzz", 25.39], ["music", 24.19], ["speech", 6.61]]], "duration": [0.54, -0.37, 0.69, 1.08, 0.68, 2.31, 0.76, 0.74, 3.82, 1.11, 0.7, 1.08, 1.05, 0.72, 3.13, 3.38, 1.53, 1.3, 1.04, 1.3, 4.95, 1.21, 1.9, 0.85, 1.46, 1.98, 3.57, 6.78, 1.16, 14.23, 1.59, 17.1]} \ No newline at end of file diff --git a/annotations_1/C05qUz1ukWo_filtered.json b/annotations_1/C05qUz1ukWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1cb344e4a19b390f2da6d0fe5b697a19f219089 --- /dev/null +++ b/annotations_1/C05qUz1ukWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [22.0, 29.44], [31.0, 47.21], [70.0, 71.81], [79.0, 80.32], [82.0, 87.44], [94.0, 95.03], [96.0, 96.84], [98.0, 101.19], [102.0, 102.17], [107.0, 109.58], [112.0, 121.81], [123.0, 124.48]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 73.97, 43.03, 0.0, 0.0, 43.77, 0.0, 0.0, 45.27, 0.0, 43.13, 32.73, 0.0], "audiomae_on_audioset": [null, null, [["speech", 83.73], ["sidetone", 3.61], ["hum", 2.36]], null, null, [["music", 40.2], ["speech", 24.83], ["noise", 4.18]], null, null, [["speech", 40.47], ["music", 5.64], ["beatboxing", 4.8]], null, [["speech", 68.01], ["music", 17.72], ["inside, small room", 1.79]], [["music", 64.85], ["synthesizer", 10.06], ["musical instrument", 5.64]], null], "duration": [0.48, 7.44, 16.21, 1.81, 1.32, 5.44, 1.03, 0.84, 3.19, 0.17, 2.58, 9.81, 1.48]} \ No newline at end of file diff --git a/annotations_1/C0H2SnzitoM_filtered.json b/annotations_1/C0H2SnzitoM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..727c8692f8dd94f15f4057300afab51acc3a87b4 --- /dev/null +++ b/annotations_1/C0H2SnzitoM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.3], [8.0, 8.83], [10.0, 11.25], [11.0, 11.35], [11.0, 12.09], [13.0, 15.53], [16.0, 22.01], [22.0, 22.45], [23.0, 27.13], [28.0, 28.92], [31.0, 39.16], [40.0, 40.74], [43.0, 42.85], [44.0, 46.57], [47.0, 69.99], [76.0, 86.41], [87.0, 98.93]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false], "silence_prob": [42.72, 0.0, 0.0, 0.0, 0.0, 31.04, 32.42, 0.0, 30.98, 0.0, 31.17, 0.0, 0.0, 32.07, 45.08, 49.78, 59.51], "audiomae_on_audioset": [[["music", 57.92], ["thunk", 7.21], ["singing", 2.57]], null, null, null, null, [["music", 51.87], ["speech", 25.57], ["boing", 4.72]], [["music", 69.01], ["speech", 4.91], ["singing", 3.72]], null, [["music", 57.08], ["boing", 5.09], ["sampler", 1.79]], null, [["music", 87.67], ["electronic music", 1.07], ["sampler", 0.87]], null, null, [["speech", 36.55], ["cattle, bovinae", 11.86], ["groan", 8.59]], [["music", 65.5], ["speech", 7.31], ["animal", 1.71]], [["music", 36.23], ["speech", 11.19], ["fly, housefly", 8.76]], null], "duration": [2.3, 0.83, 1.25, 0.35, 1.09, 2.53, 6.01, 0.45, 4.13, 0.92, 8.16, 0.74, -0.15, 2.57, 22.99, 10.41, 11.93]} \ No newline at end of file diff --git a/annotations_1/C0KLb_v50-k_filtered.json b/annotations_1/C0KLb_v50-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1adc6c05ee7115f55c13101019148d615f960b0 --- /dev/null +++ b/annotations_1/C0KLb_v50-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.43], [17.0, 18.22], [21.0, 25.74], [26.0, 36.69], [40.0, 40.27], [41.0, 48.32], [50.0, 51.31], [59.0, 58.89], [62.0, 63.96], [67.0, 67.32], [70.0, 70.04], [71.0, 72.6], [78.0, 78.75], [80.0, 80.99], [81.0, 87.29], [91.0, 91.57], [99.0, 100.38], [101.0, 101.17], [106.0, 106.46], [107.0, 113.46], [115.0, 115.13], [121.0, 122.71], [127.0, 127.45], [128.0, 129.2], [134.0, 134.76], [138.0, 139.68], [140.0, 141.67], [143.0, 143.78], [144.0, 145.72], [147.0, 147.97], [149.0, 153.13], [157.0, 158.11], [158.0, 160.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 45.27, 39.28, 0.0, 32.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.56, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.51, 0.0, 40.61], "audiomae_on_audioset": [null, null, [["music", 66.75], ["synthesizer", 3.71], ["hum", 3.51]], [["music", 48.06], ["thunk", 36.69], ["musical instrument", 1.79]], null, [["speech", 72.66], ["knock", 9.77], ["hum", 1.37]], null, null, null, null, null, null, null, null, [["speech", 61.35], ["sine wave", 12.0], ["chirp tone", 5.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.58], ["music", 22.56], ["singing bowl", 3.14]]], "duration": [1.43, 1.22, 4.74, 10.69, 0.27, 7.32, 1.31, -0.11, 1.96, 0.32, 0.04, 1.6, 0.75, 0.99, 6.29, 0.57, 1.38, 0.17, 0.46, 6.46, 0.13, 1.71, 0.45, 1.2, 0.76, 1.68, 1.67, 0.78, 1.72, 0.97, 4.13, 1.11, 2.62]} \ No newline at end of file diff --git a/annotations_1/C0NVo07t9UI_filtered.json b/annotations_1/C0NVo07t9UI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2521529ecb19a6321149aa415d23b90212748f9e --- /dev/null +++ b/annotations_1/C0NVo07t9UI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.72], [26.0, 34.08], [35.0, 46.2], [49.0, 53.97], [54.0, 67.14], [67.0, 70.55], [71.0, 72.98], [75.0, 77.33], [79.0, 81.58], [82.0, 84.18], [93.0, 93.34], [95.0, 101.88], [102.0, 102.96], [106.0, 106.76], [108.0, 108.16], [110.0, 110.89], [112.0, 114.15], [115.0, 116.61], [118.0, 122.61], [123.0, 123.97], [124.0, 125.27], [127.0, 128.17], [129.0, 130.86], [138.0, 139.06], [147.0, 146.87], [148.0, 154.48], [163.0, 163.81], [164.0, 165.65], [167.0, 166.99], [168.0, 169.53], [175.0, 175.2], [179.0, 180.64], [189.0, 189.23], [191.0, 192.11], [193.0, 196.21], [197.0, 198.05], [199.0, 203.08]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.73, 97.22, 29.46, 38.52, 56.7, 0.0, 74.6, 48.31, 46.68, 0.0, 41.6, 0.0, 0.0, 0.0, 0.0, 52.8, 0.0, 57.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.4, 0.0, 72.16], "audiomae_on_audioset": [null, null, null, [["heart sounds, heartbeat", 14.62], ["groan", 12.56], ["speech", 10.81]], [["cattle, bovinae", 27.76], ["livestock, farm animals, working animals", 25.68], ["moo", 19.83]], null, null, null, [["hum", 26.86], ["music", 20.66], ["whale vocalization", 11.73]], [["fly, housefly", 59.35], ["insect", 13.77], ["bee, wasp, etc.", 12.31]], null, [["speech", 40.89], ["music", 9.93], ["livestock, farm animals, working animals", 6.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.52], ["theremin", 14.25], ["didgeridoo", 12.97]], null, null], "duration": [1.72, 8.08, 11.2, 4.97, 13.14, 3.55, 1.98, 2.33, 2.58, 2.18, 0.34, 6.88, 0.96, 0.76, 0.16, 0.89, 2.15, 1.61, 4.61, 0.97, 1.27, 1.17, 1.86, 1.06, -0.13, 6.48, 0.81, 1.65, -0.01, 1.53, 0.2, 1.64, 0.23, 1.11, 3.21, 1.05, 4.08]} \ No newline at end of file diff --git a/annotations_1/C0vM89y4088_filtered.json b/annotations_1/C0vM89y4088_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6366f6cbca2d8289e8870f306b9720bbe6838b40 --- /dev/null +++ b/annotations_1/C0vM89y4088_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.13], [8.0, 11.28], [12.0, 14.13], [20.0, 20.76], [26.0, 30.16], [33.0, 40.32], [49.0, 65.25], [71.0, 91.18], [92.0, 92.99], [94.0, 94.53], [97.0, 96.97], [105.0, 105.39], [107.0, 116.92], [118.0, 128.76], [130.0, 130.81], [132.0, 132.93], [135.0, 135.19], [141.0, 144.71], [148.0, 148.59], [150.0, 149.88], [151.0, 152.17], [153.0, 153.3], [160.0, 160.57], [161.0, 161.52], [165.0, 168.69], [171.0, 172.99], [174.0, 176.39], [178.0, 178.29], [183.0, 183.39], [184.0, 184.64]], "keep_status": [false, false, true, false, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.73, 35.52, 0.0, 50.81, 29.0, 30.15, 28.35, 0.0, 0.0, 0.0, 0.0, 29.94, 48.23, 0.0, 0.0, 0.0, 30.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 72.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 59.72], ["sidetone", 6.25], ["boing", 6.25]], [["music", 22.47], ["whale vocalization", 14.34], ["hum", 12.75]], null, null, [["music", 18.26], ["hum", 18.01], ["explosion", 14.15]], [["music", 35.15], ["speech", 15.19], ["throbbing", 14.63]], [["speech", 53.11], ["explosion", 10.32], ["music", 8.57]], null, null, null, null, [["speech", 69.08], ["music", 8.24], ["hum", 6.08]], [["speech", 43.85], ["music", 19.03], ["mains hum", 6.32]], null, null, null, [["cattle, bovinae", 44.47], ["moo", 27.8], ["livestock, farm animals, working animals", 18.77]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, 3.28, 2.13, 0.76, 4.16, 7.32, 16.25, 20.18, 0.99, 0.53, -0.03, 0.39, 9.92, 10.76, 0.81, 0.93, 0.19, 3.71, 0.59, -0.12, 1.17, 0.3, 0.57, 0.52, 3.69, 1.99, 2.39, 0.29, 0.39, 0.64]} \ No newline at end of file diff --git a/annotations_1/C1PilkENI-k_filtered.json b/annotations_1/C1PilkENI-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c198d98c44e5049683c087eb638ad19230747c2 --- /dev/null +++ b/annotations_1/C1PilkENI-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.88], [21.0, 23.21], [37.0, 46.72], [47.0, 48.49]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 99.62, 94.66, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.88, 2.21, 9.72, 1.49]} \ No newline at end of file diff --git a/annotations_1/C2KN6BHuPWA_filtered.json b/annotations_1/C2KN6BHuPWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23cf5d7749849172d4938238428d77d62fb34c2b --- /dev/null +++ b/annotations_1/C2KN6BHuPWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.17], [7.0, 7.72], [8.0, 9.76], [18.0, 17.64], [28.0, 28.05], [29.0, 29.42], [31.0, 31.23], [35.0, 36.37], [39.0, 39.85], [42.0, 42.21], [43.0, 43.04], [54.0, 54.63], [59.0, 59.73], [63.0, 64.25], [66.0, 66.39], [71.0, 71.73], [72.0, 73.68], [77.0, 77.48], [78.0, 78.66], [80.0, 81.92], [84.0, 84.67], [97.0, 97.33], [98.0, 98.78], [100.0, 100.08], [102.0, 102.95], [104.0, 106.39], [108.0, 109.9], [113.0, 114.56], [119.0, 120.29], [121.0, 122.47], [123.0, 122.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [51.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.17, 0.72, 1.76, -0.36, 0.05, 0.42, 0.23, 1.37, 0.85, 0.21, 0.04, 0.63, 0.73, 1.25, 0.39, 0.73, 1.68, 0.48, 0.66, 1.92, 0.67, 0.33, 0.78, 0.08, 0.95, 2.39, 1.9, 1.56, 1.29, 1.47, -0.02]} \ No newline at end of file diff --git a/annotations_1/C3J1AO9z0tA_filtered.json b/annotations_1/C3J1AO9z0tA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ce048ff5d7e179a70a275b2ca541cfb19321651 --- /dev/null +++ b/annotations_1/C3J1AO9z0tA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.85], [8.0, 10.08], [11.0, 11.67], [22.0, 26.91], [31.0, 31.6], [32.0, 44.79], [51.0, 66.06], [68.0, 69.87], [72.0, 72.12], [73.0, 73.99], [75.0, 77.38], [82.0, 83.57], [86.0, 86.31], [105.0, 108.19], [109.0, 109.48], [119.0, 122.64], [127.0, 126.99], [150.0, 151.98], [156.0, 156.05], [163.0, 162.94]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 59.68, 0.0, 67.89, 0.0, 43.96, 29.97, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 29.55, 0.0, 34.85, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["throbbing", 28.35], ["hum", 25.48], ["music", 11.04]], [["music", 73.94], ["hum", 3.88], ["electronic music", 2.32]], null, null, null, null, null, null, [["music", 34.21], ["hum", 26.95], ["throbbing", 14.4]], null, [["music", 36.87], ["speech", 22.13], ["throbbing", 6.63]], null, null, null, null], "duration": [0.85, 2.08, 0.67, 4.91, 0.6, 12.79, 15.06, 1.87, 0.12, 0.99, 2.38, 1.57, 0.31, 3.19, 0.48, 3.64, -0.01, 1.98, 0.05, -0.06]} \ No newline at end of file diff --git a/annotations_1/C3TAMx8Gqro_filtered.json b/annotations_1/C3TAMx8Gqro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..990715e6600def039ab8b349eca4738ed02ae3de --- /dev/null +++ b/annotations_1/C3TAMx8Gqro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 34.64], [37.0, 38.67], [40.0, 44.86], [47.0, 50.19], [51.0, 55.36], [56.0, 58.35], [59.0, 60.54], [61.0, 69.58], [70.0, 83.86], [88.0, 89.16], [90.0, 91.12], [92.0, 94.22], [97.0, 101.09]], "keep_status": [true, false, false, true, true, false, false, true, false, false, false, false, false], "silence_prob": [31.49, 0.0, 71.87, 37.38, 37.37, 62.17, 0.0, 30.53, 38.74, 0.0, 0.0, 56.33, 80.82], "audiomae_on_audioset": [[["hum", 23.81], ["music", 21.01], ["mains hum", 18.59]], null, null, [["music", 21.91], ["sine wave", 19.25], ["chirp tone", 15.09]], [["speech", 53.12], ["clang", 12.18], ["arrow", 4.16]], null, null, [["gunshot, gunfire", 31.11], ["speech", 24.59], ["machine gun", 6.73]], [["whale vocalization", 53.24], ["speech", 11.74], ["rumble", 7.92]], null, null, null, null], "duration": [29.64, 1.67, 4.86, 3.19, 4.36, 2.35, 1.54, 8.58, 13.86, 1.16, 1.12, 2.22, 4.09]} \ No newline at end of file diff --git a/annotations_1/C3rDWENRI7c_filtered.json b/annotations_1/C3rDWENRI7c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8af2f8b6d710c88fd13ba6e0650e215a3eb4c2 --- /dev/null +++ b/annotations_1/C3rDWENRI7c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.26], [7.0, 8.43], [13.0, 14.01], [15.0, 19.13], [21.0, 36.39], [39.0, 45.4], [48.0, 48.73], [51.0, 55.12], [56.0, 70.6], [77.0, 78.92], [80.0, 92.18], [95.0, 95.76], [96.0, 99.82], [100.0, 101.29], [103.0, 104.31], [106.0, 105.8], [110.0, 112.55], [116.0, 117.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.33, 0.0, 0.0, 99.92, 98.36, 93.6, 0.0, 88.1, 83.7, 0.0, 69.07, 0.0, 59.77, 0.0, 0.0, 0.0, 79.41, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.26, 1.43, 1.01, 4.13, 15.39, 6.4, 0.73, 4.12, 14.6, 1.92, 12.18, 0.76, 3.82, 1.29, 1.31, -0.2, 2.55, 1.59]} \ No newline at end of file diff --git a/annotations_1/C41s4A5Wq1Y_filtered.json b/annotations_1/C41s4A5Wq1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecc2692d7420b58a09e8915c59b1d59e9494fa62 --- /dev/null +++ b/annotations_1/C41s4A5Wq1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.43], [21.0, 21.1], [21.0, 49.52], [52.0, 57.42], [58.0, 58.21], [59.0, 59.78], [62.0, 64.93], [73.0, 75.42], [76.0, 76.6], [81.0, 82.48], [83.0, 84.05], [84.0, 84.77], [86.0, 87.93], [89.0, 92.47], [95.0, 95.98], [99.0, 99.0], [101.0, 101.26], [104.0, 104.38], [107.0, 127.11], [130.0, 146.58], [150.0, 150.42]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 36.37, 44.87, 0.0, 0.0, 60.6, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 53.91, 0.0, 0.0, 0.0, 0.0, 30.57, 32.26, 0.0], "audiomae_on_audioset": [null, null, [["hum", 45.11], ["speech", 19.48], ["mains hum", 13.66]], [["speech", 44.42], ["hum", 10.01], ["sidetone", 8.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.2], ["explosion", 4.42], ["burst, pop", 3.89]], [["music", 49.27], ["hum", 15.77], ["throbbing", 14.22]], null], "duration": [1.43, 0.1, 28.52, 5.42, 0.21, 0.78, 2.93, 2.42, 0.6, 1.48, 1.05, 0.77, 1.93, 3.47, 0.98, 0.0, 0.26, 0.38, 20.11, 16.58, 0.42]} \ No newline at end of file diff --git a/annotations_1/C4DPvNXtOzA_filtered.json b/annotations_1/C4DPvNXtOzA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b473901afd48bbebeb0d466248847037309b453 --- /dev/null +++ b/annotations_1/C4DPvNXtOzA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.86], [17.0, 21.78], [24.0, 28.19], [29.0, 30.28], [34.0, 34.32], [35.0, 37.23], [39.0, 40.88], [43.0, 51.97], [59.0, 59.68], [67.0, 67.78], [69.0, 69.84], [75.0, 76.72], [78.0, 81.89], [83.0, 85.11], [87.0, 89.09], [92.0, 94.96], [95.0, 95.62], [96.0, 98.29], [99.0, 99.87], [101.0, 100.94], [101.0, 101.61], [102.0, 102.86], [104.0, 127.72], [128.0, 132.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 0.0, 0.0, 79.07, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 82.07, 99.98, 42.11, 31.75, 0.0, 98.27, 0.0, 0.0, 0.0, 0.0, 98.27, 36.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 13.24], ["throbbing", 6.84], ["speech", 6.72]], [["speech", 43.41], ["thunk", 42.25], ["crackle", 2.04]], null, null, null, null, null, null, null, [["music", 59.68], ["musical instrument", 8.51], ["guitar", 5.96]]], "duration": [-0.14, 4.78, 4.19, 1.28, 0.32, 2.23, 1.88, 8.97, 0.68, 0.78, 0.84, 1.72, 3.89, 2.11, 2.09, 2.96, 0.62, 2.29, 0.87, -0.06, 0.61, 0.86, 23.72, 4.65]} \ No newline at end of file diff --git a/annotations_1/C58_gjlogWY_filtered.json b/annotations_1/C58_gjlogWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42294b56e9ba1b481e78d6d24c9761eb4579f20f --- /dev/null +++ b/annotations_1/C58_gjlogWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.12], [10.0, 12.97], [19.0, 19.55], [26.0, 27.57], [28.0, 32.05], [32.0, 32.58], [51.0, 51.06], [53.0, 71.34], [72.0, 73.94], [77.0, 78.14], [79.0, 79.84], [83.0, 84.23], [102.0, 104.62], [105.0, 107.15], [108.0, 109.86], [110.0, 111.0], [112.0, 112.97], [114.0, 114.47], [115.0, 115.8], [118.0, 119.26], [120.0, 121.32], [123.0, 124.65], [135.0, 135.46], [141.0, 142.13], [143.0, 146.91], [148.0, 148.09], [159.0, 158.95], [159.0, 160.24], [163.0, 164.29], [165.0, 166.55], [167.0, 169.35], [171.0, 171.53], [172.0, 173.77], [174.0, 175.12]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 40.45, 0.0, 0.0, 48.87, 0.0, 0.0, 43.2, 0.0, 0.0, 0.0, 0.0, 92.64, 57.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.66, 0.0, 0.0, 0.0, 0.0, 0.0, 39.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 66.15], ["vehicle", 7.65], ["car", 3.03]], null, null, [["speech", 45.3], ["sidetone", 12.45], ["hum", 3.95]], null, null, [["music", 41.61], ["cattle, bovinae", 10.12], ["speech", 8.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 67.81], ["electric shaver, electric razor", 10.79], ["outside, rural or natural", 2.67]], null, null, null, null, null, [["speech", 43.97], ["music", 12.9], ["whip", 4.81]], null, null, null], "duration": [0.12, 2.97, 0.55, 1.57, 4.05, 0.58, 0.06, 18.34, 1.94, 1.14, 0.84, 1.23, 2.62, 2.15, 1.86, 1.0, 0.97, 0.47, 0.8, 1.26, 1.32, 1.65, 0.46, 1.13, 3.91, 0.09, -0.05, 1.24, 1.29, 1.55, 2.35, 0.53, 1.77, 1.12]} \ No newline at end of file diff --git a/annotations_1/C5UD270jxfs_filtered.json b/annotations_1/C5UD270jxfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e795d17cc1f4e3da10f5a61445dc11638adc5c9b --- /dev/null +++ b/annotations_1/C5UD270jxfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [5.0, 5.51], [7.0, 7.35], [12.0, 14.57], [25.0, 24.88], [25.0, 25.34], [36.0, 43.46], [48.0, 48.98], [53.0, 54.28], [56.0, 59.68], [61.0, 60.96], [72.0, 81.67], [83.0, 83.47], [87.0, 87.2], [88.0, 91.91], [95.0, 104.94], [109.0, 113.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 95.09, 0.0, 0.0, 81.53, 0.0, 0.0, 62.68, 0.0, 56.78, 0.0, 0.0, 36.63, 42.88, 38.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 54.17], ["insect", 22.88], ["mosquito", 11.0]], [["music", 73.63], ["speech", 4.55], ["quack", 1.03]], [["hum", 28.57], ["music", 26.63], ["throbbing", 18.99]]], "duration": [0.53, 0.51, 0.35, 2.57, -0.12, 0.34, 7.46, 0.98, 1.28, 3.68, -0.04, 9.67, 0.47, 0.2, 3.91, 9.94, 4.53]} \ No newline at end of file diff --git a/annotations_1/C5lMZZxrewE_filtered.json b/annotations_1/C5lMZZxrewE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb5c416182ad383cb320fe977edc66853082e9a7 --- /dev/null +++ b/annotations_1/C5lMZZxrewE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 3.89], [7.0, 7.18], [10.0, 14.28], [17.0, 17.79], [18.0, 20.39], [22.0, 22.57], [26.0, 34.99], [35.0, 36.44], [38.0, 39.04], [40.0, 45.72], [46.0, 47.04], [49.0, 49.15], [50.0, 50.87], [53.0, 58.6], [63.0, 68.25], [71.0, 71.32], [74.0, 103.45], [104.0, 104.89], [105.0, 112.04], [113.0, 116.78], [121.0, 121.24], [124.0, 123.84], [128.0, 130.72], [132.0, 131.97], [134.0, 133.95]], "keep_status": [true, false, true, false, true, false, true, false, false, false, false, false, false, true, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [45.3, 0.0, 38.64, 0.0, 35.77, 0.0, 37.49, 0.0, 0.0, 34.75, 0.0, 0.0, 0.0, 30.16, 30.91, 0.0, 30.92, 0.0, 30.93, 31.72, 0.0, 0.0, 87.92, 0.0, 0.0], "audiomae_on_audioset": [[["music", 41.64], ["speech", 17.21], ["fly, housefly", 7.05]], null, [["music", 12.32], ["speech", 10.82], ["fly, housefly", 8.22]], null, [["speech", 9.43], ["whale vocalization", 6.79], ["vehicle", 3.09]], null, [["speech", 22.75], ["music", 21.15], ["mains hum", 13.06]], null, null, [["insect", 41.44], ["fly, housefly", 39.1], ["mosquito", 9.84]], null, null, null, [["music", 56.59], ["speech", 9.74], ["electronic music", 3.47]], [["music", 69.3], ["electronic music", 3.3], ["synthesizer", 2.87]], null, [["music", 37.26], ["speech", 19.4], ["hum", 4.91]], null, [["music", 34.85], ["speech", 21.28], ["hum", 19.91]], [["music", 55.49], ["mains hum", 4.04], ["hum", 3.96]], null, null, null, null, null], "duration": [3.89, 0.18, 4.28, 0.79, 2.39, 0.57, 8.99, 1.44, 1.04, 5.72, 1.04, 0.15, 0.87, 5.6, 5.25, 0.32, 29.45, 0.89, 7.04, 3.78, 0.24, -0.16, 2.72, -0.03, -0.05]} \ No newline at end of file diff --git a/annotations_1/C83hfoyHHHk_filtered.json b/annotations_1/C83hfoyHHHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b98df68541a09354847090bc058905f51ec2842 --- /dev/null +++ b/annotations_1/C83hfoyHHHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 49.94], [50.0, 74.7], [76.0, 76.89], [81.0, 81.48], [82.0, 86.64], [90.0, 94.86], [97.0, 123.5], [125.0, 126.1], [129.0, 139.23], [140.0, 141.13], [142.0, 143.63], [146.0, 163.16], [164.0, 164.32], [166.0, 166.73], [168.0, 168.56], [170.0, 173.58], [176.0, 176.69]], "keep_status": [false, true, false, false, false, false, true, false, true, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 28.73, 0.0, 0.0, 29.08, 29.0, 29.36, 0.0, 29.97, 0.0, 0.0, 33.28, 0.0, 0.0, 0.0, 30.25, 0.0], "audiomae_on_audioset": [null, [["speech", 46.57], ["music", 10.35], ["fart", 3.69]], null, null, [["hum", 47.37], ["throbbing", 27.32], ["mains hum", 18.68]], [["hum", 36.22], ["throbbing", 20.21], ["mains hum", 15.5]], [["music", 31.89], ["hum", 15.63], ["throbbing", 15.55]], null, [["music", 16.4], ["explosion", 11.29], ["hum", 10.72]], null, null, [["music", 25.38], ["speech", 7.5], ["crow", 5.59]], null, null, null, [["hum", 36.64], ["mains hum", 17.68], ["music", 6.18]], null], "duration": [0.94, 24.7, 0.89, 0.48, 4.64, 4.86, 26.5, 1.1, 10.23, 1.13, 1.63, 17.16, 0.32, 0.73, 0.56, 3.58, 0.69]} \ No newline at end of file diff --git a/annotations_1/C9PYzGyIfF8_filtered.json b/annotations_1/C9PYzGyIfF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0519422496538cda85afd0de15e5ec524e659767 --- /dev/null +++ b/annotations_1/C9PYzGyIfF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.07], [14.0, 14.44], [25.0, 28.98], [48.0, 53.08], [56.0, 61.37], [72.0, 76.0], [80.0, 81.06], [81.0, 81.65], [97.0, 98.2]], "keep_status": [false, false, false, true, false, false, false, false, false], "silence_prob": [33.36, 0.0, 32.25, 31.3, 31.66, 31.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 84.86], ["didgeridoo", 3.39], ["synthesizer", 1.14]], null, [["music", 63.74], ["speech", 6.82], ["electronic music", 4.0]], [["music", 53.31], ["cacophony", 6.2], ["boing", 5.18]], [["music", 64.35], ["drum and bass", 6.29], ["didgeridoo", 3.92]], [["music", 59.43], ["throbbing", 14.76], ["hum", 3.17]], null, null, null], "duration": [8.07, 0.44, 3.98, 5.08, 5.37, 4.0, 1.06, 0.65, 1.2]} \ No newline at end of file diff --git a/annotations_1/C9rUREflwDI_filtered.json b/annotations_1/C9rUREflwDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d3f9858b38b29f812d3f9a80c5e259a969684ab --- /dev/null +++ b/annotations_1/C9rUREflwDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 130.5], [133.0, 133.69], [134.0, 133.89]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [117.5, 0.69, -0.11]} \ No newline at end of file diff --git a/annotations_1/CARc1uUq1lA_filtered.json b/annotations_1/CARc1uUq1lA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..deff2ef424cebd6fa24b6c17c2d63b398de37074 --- /dev/null +++ b/annotations_1/CARc1uUq1lA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.25], [10.0, 11.06], [14.0, 25.86], [34.0, 34.77], [35.0, 36.48], [39.0, 39.85], [40.0, 40.8], [42.0, 42.63], [45.0, 47.66], [51.0, 51.58], [52.0, 55.05], [57.0, 64.89], [66.0, 67.0], [68.0, 75.9], [79.0, 80.81], [81.0, 87.37], [93.0, 96.99], [101.0, 107.45], [110.0, 110.57], [112.0, 111.91], [115.0, 116.21], [117.0, 117.27], [120.0, 120.26], [123.0, 124.36], [127.0, 128.21], [129.0, 131.28], [133.0, 133.66], [137.0, 137.76], [138.0, 138.45], [138.0, 138.55], [140.0, 140.09], [143.0, 143.02], [144.0, 144.81], [146.0, 146.64]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 38.11, 0.0, 0.0, 0.0, 0.0, 0.0, 37.56, 0.0, 42.81, 31.8, 0.0, 40.21, 0.0, 32.44, 44.18, 36.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["theremin", 83.65], ["music", 9.12], ["musical instrument", 1.25]], null, null, null, null, null, [["hum", 28.23], ["mains hum", 25.12], ["music", 8.08]], null, [["music", 57.45], ["didgeridoo", 21.24], ["musical instrument", 6.82]], [["music", 55.85], ["didgeridoo", 22.65], ["beatboxing", 5.48]], null, [["music", 37.02], ["speech", 23.5], ["radio", 17.39]], null, [["speech", 48.84], ["music", 29.97], ["bow-wow", 6.61]], [["mosquito", 34.63], ["fly, housefly", 17.27], ["frog", 15.19]], [["mosquito", 29.29], ["fly, housefly", 24.04], ["speech", 20.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 1.06, 11.86, 0.77, 1.48, 0.85, 0.8, 0.63, 2.66, 0.58, 3.05, 7.89, 1.0, 7.9, 1.81, 6.37, 3.99, 6.45, 0.57, -0.09, 1.21, 0.27, 0.26, 1.36, 1.21, 2.28, 0.66, 0.76, 0.45, 0.55, 0.09, 0.02, 0.81, 0.64]} \ No newline at end of file diff --git a/annotations_1/CB5qzQrDnZE_filtered.json b/annotations_1/CB5qzQrDnZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..faf09e0f0db8384cc155ecea0c45aa48345d0476 --- /dev/null +++ b/annotations_1/CB5qzQrDnZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 67.71], [73.0, 73.94], [77.0, 78.49], [83.0, 83.84], [86.0, 86.76], [88.0, 89.34], [91.0, 91.66], [95.0, 94.83], [97.0, 122.81], [125.0, 131.84], [136.0, 146.4], [152.0, 152.32], [156.0, 157.47], [159.0, 159.93], [161.0, 161.76], [162.0, 185.73], [187.0, 187.91]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.3, 98.66, 74.44, 0.0, 0.0, 0.0, 0.0, 54.7, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["fly, housefly", 22.08], ["buzz", 18.92], ["insect", 11.76]], null, null, null, null, null, null, null, null], "duration": [0.71, 0.94, 1.49, 0.84, 0.76, 1.34, 0.66, -0.17, 25.81, 6.84, 10.4, 0.32, 1.47, 0.93, 0.76, 23.73, 0.91]} \ No newline at end of file diff --git a/annotations_1/CBUtXwZNA8Y_filtered.json b/annotations_1/CBUtXwZNA8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e222392fe66035e522868502f5a8a6f310e73c9 --- /dev/null +++ b/annotations_1/CBUtXwZNA8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.97], [8.0, 10.72], [19.0, 19.58], [23.0, 29.32], [32.0, 33.51], [34.0, 36.15], [36.0, 36.78], [37.0, 36.81], [40.0, 41.69], [55.0, 55.27], [67.0, 69.23], [80.0, 80.69], [82.0, 86.64], [92.0, 93.92], [110.0, 111.23], [111.0, 111.27], [113.0, 113.61], [114.0, 114.88], [118.0, 119.5], [121.0, 121.56], [128.0, 135.19], [139.0, 141.0], [156.0, 156.69]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 31.11, 0.0, 34.58, 0.0, 31.61, 0.0, 0.0, 0.0, 0.0, 39.66, 0.0, 34.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.86, 32.68, 0.0], "audiomae_on_audioset": [null, [["speech", 59.7], ["fart", 5.6], ["music", 3.41]], null, [["moo", 36.63], ["cattle, bovinae", 34.98], ["livestock, farm animals, working animals", 25.85]], null, [["speech", 28.5], ["boing", 17.2], ["fireworks", 9.75]], null, null, null, null, [["music", 57.27], ["grunt", 13.87], ["music for children", 6.42]], null, [["speech", 54.49], ["music", 17.17], ["thunk", 12.09]], null, null, null, null, null, null, null, [["music", 25.31], ["speech", 18.45], ["whack, thwack", 8.78]], [["music", 36.95], ["sigh", 13.64], ["groan", 10.82]], null], "duration": [-0.03, 2.72, 0.58, 6.32, 1.51, 2.15, 0.78, -0.19, 1.69, 0.27, 2.23, 0.69, 4.64, 1.92, 1.23, 0.27, 0.61, 0.88, 1.5, 0.56, 7.19, 2.0, 0.69]} \ No newline at end of file diff --git a/annotations_1/CBbH4CVp1S0_filtered.json b/annotations_1/CBbH4CVp1S0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f3a7ceabade2bed10456b41fc875a6df2be0e0a --- /dev/null +++ b/annotations_1/CBbH4CVp1S0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 25.42], [28.0, 43.53], [47.0, 47.17], [50.0, 59.32], [61.0, 74.16], [75.0, 75.66], [78.0, 81.84], [85.0, 87.44]], "keep_status": [false, false, false, true, true, false, true, false], "silence_prob": [34.8, 34.58, 0.0, 31.31, 32.08, 0.0, 35.36, 38.09], "audiomae_on_audioset": [[["hum", 50.86], ["mains hum", 29.09], ["music", 6.4]], [["music", 64.69], ["theremin", 6.67], ["hum", 4.6]], null, [["music", 32.83], ["hum", 23.09], ["throbbing", 8.64]], [["livestock, farm animals, working animals", 31.44], ["cattle, bovinae", 24.7], ["moo", 8.83]], null, [["music", 34.37], ["didgeridoo", 21.24], ["hum", 7.17]], [["music", 37.72], ["throbbing", 20.77], ["hum", 20.08]]], "duration": [2.42, 15.53, 0.17, 9.32, 13.16, 0.66, 3.84, 2.44]} \ No newline at end of file diff --git a/annotations_1/CDQw1Ez9yOs_filtered.json b/annotations_1/CDQw1Ez9yOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2ebce0bdcc78a839eee192a7903b1f0ddb09a66 --- /dev/null +++ b/annotations_1/CDQw1Ez9yOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.31], [5.0, 4.92], [6.0, 14.34], [17.0, 21.12], [23.0, 26.15], [28.0, 29.3], [31.0, 32.75], [34.0, 36.17], [41.0, 48.91], [51.0, 50.87], [52.0, 53.27], [59.0, 59.51], [63.0, 63.49], [65.0, 65.79], [68.0, 68.01], [69.0, 70.44], [72.0, 76.45], [80.0, 81.26], [82.0, 82.9], [91.0, 91.08], [94.0, 98.37], [103.0, 110.12], [111.0, 116.65], [122.0, 121.96], [125.0, 126.22], [127.0, 131.9], [133.0, 135.53], [136.0, 166.89], [167.0, 167.46], [167.0, 167.49], [169.0, 169.47], [170.0, 170.78]], "keep_status": [false, false, false, true, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 47.62, 40.77, 34.04, 0.0, 0.0, 37.47, 35.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.33, 0.0, 0.0, 0.0, 35.76, 36.65, 36.52, 0.0, 0.0, 35.16, 36.74, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.7], ["hum", 20.85], ["throbbing", 19.5]], [["music", 24.99], ["theremin", 12.3], ["hum", 9.68]], [["music", 49.71], ["hum", 10.33], ["throbbing", 6.1]], null, null, [["music", 21.65], ["hum", 17.27], ["electronic music", 10.65]], [["speech", 24.93], ["music", 18.38], ["hum", 16.09]], null, null, null, null, null, null, null, [["music", 57.53], ["speech", 18.97], ["burping, eructation", 2.9]], null, null, null, [["music", 34.62], ["speech", 9.51], ["hum", 8.96]], [["music", 41.81], ["hum", 14.43], ["throbbing", 11.43]], [["music", 65.09], ["throbbing", 17.05], ["hum", 4.37]], null, null, [["music", 66.19], ["throbbing", 5.02], ["bell", 2.42]], [["music", 78.81], ["throbbing", 3.75], ["electronic music", 2.0]], null, null, null, null, null], "duration": [1.31, -0.08, 8.34, 4.12, 3.15, 1.3, 1.75, 2.17, 7.91, -0.13, 1.27, 0.51, 0.49, 0.79, 0.01, 1.44, 4.45, 1.26, 0.9, 0.08, 4.37, 7.12, 5.65, -0.04, 1.22, 4.9, 2.53, 30.89, 0.46, 0.49, 0.47, 0.78]} \ No newline at end of file diff --git a/annotations_1/CDTnjLPgMKM_filtered.json b/annotations_1/CDTnjLPgMKM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aabf9966d37555d6324a3809ad18c2cbb70db5f1 --- /dev/null +++ b/annotations_1/CDTnjLPgMKM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 18.67], [44.0, 44.51], [47.0, 48.0], [69.0, 70.98], [72.0, 72.5], [75.0, 75.81], [78.0, 77.97], [79.0, 78.87], [83.0, 83.66], [96.0, 96.77], [103.0, 103.59], [109.0, 110.46], [116.0, 116.68], [118.0, 118.08], [125.0, 127.08], [129.0, 129.05]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [40.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.52, 0.0], "audiomae_on_audioset": [[["music", 33.98], ["hum", 18.46], ["throbbing", 15.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 16.49], ["roaring cats (lions, tigers)", 11.46], ["whale vocalization", 8.71]], null], "duration": [12.67, 0.51, 1.0, 1.98, 0.5, 0.81, -0.03, -0.13, 0.66, 0.77, 0.59, 1.46, 0.68, 0.08, 2.08, 0.05]} \ No newline at end of file diff --git a/annotations_1/CDwnIJ5ohu4_filtered.json b/annotations_1/CDwnIJ5ohu4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb5d059df0cf9d2c274a42c7dcab710e1510efc1 --- /dev/null +++ b/annotations_1/CDwnIJ5ohu4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.51], [3.0, 3.89], [5.0, 6.99], [11.0, 11.21], [17.0, 18.54], [21.0, 22.99], [27.0, 28.61], [31.0, 31.6], [38.0, 40.47], [41.0, 44.83], [45.0, 47.04], [50.0, 54.46], [56.0, 56.39], [59.0, 59.66], [62.0, 63.95], [66.0, 68.05], [71.0, 71.64], [75.0, 75.19], [80.0, 80.89], [86.0, 87.54], [88.0, 89.87], [94.0, 95.28], [100.0, 101.98], [104.0, 104.55], [106.0, 106.86], [111.0, 113.85], [115.0, 117.59], [120.0, 121.34], [123.0, 123.94], [128.0, 128.53], [131.0, 132.75], [134.0, 136.73], [139.0, 141.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 81.89, 45.4, 99.95, 0.0, 0.0, 0.0, 60.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 66.27, 90.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["busy signal", 50.37], ["speech", 37.88], ["dial tone", 2.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 0.89, 1.99, 0.21, 1.54, 1.99, 1.61, 0.6, 2.47, 3.83, 2.04, 4.46, 0.39, 0.66, 1.95, 2.05, 0.64, 0.19, 0.89, 1.54, 1.87, 1.28, 1.98, 0.55, 0.86, 2.85, 2.59, 1.34, 0.94, 0.53, 1.75, 2.73, 2.54]} \ No newline at end of file diff --git a/annotations_1/CE8VRLW8Zw4_filtered.json b/annotations_1/CE8VRLW8Zw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64171ce3fed65bc56c3044dfe7dc70d2a3f21dc0 --- /dev/null +++ b/annotations_1/CE8VRLW8Zw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.55], [16.0, 16.83], [18.0, 18.67], [19.0, 21.42], [23.0, 23.77], [25.0, 25.17], [26.0, 27.62], [31.0, 33.12], [35.0, 36.83], [40.0, 43.34], [44.0, 55.41], [58.0, 80.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 36.14, 0.0, 0.0, 0.0, 51.5, 0.0, 52.16, 31.91, 33.88], "audiomae_on_audioset": [null, null, null, [["sidetone", 69.52], ["music", 9.8], ["radio", 5.95]], null, null, null, null, null, null, [["music", 51.53], ["fly, housefly", 9.35], ["mosquito", 4.01]], [["music", 47.79], ["speech", 32.02], ["electric shaver, electric razor", 2.85]]], "duration": [0.55, 0.83, 0.67, 2.42, 0.77, 0.17, 1.62, 2.12, 1.83, 3.34, 11.41, 22.23]} \ No newline at end of file diff --git a/annotations_1/CECosJ9_6MI_filtered.json b/annotations_1/CECosJ9_6MI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1de4fa9dc16350ed6becd57df414f66191b7a25 --- /dev/null +++ b/annotations_1/CECosJ9_6MI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.49], [6.0, 6.78], [7.0, 7.6], [22.0, 22.82], [34.0, 34.06], [35.0, 37.0], [39.0, 39.92], [41.0, 41.35], [43.0, 44.15], [52.0, 52.54], [54.0, 54.24], [58.0, 58.55], [63.0, 63.24], [66.0, 66.39], [67.0, 68.2], [69.0, 69.04], [70.0, 71.79], [73.0, 76.3], [79.0, 79.44], [81.0, 81.68], [83.0, 83.08], [84.0, 84.57], [90.0, 90.76], [92.0, 93.01], [94.0, 95.12], [97.0, 97.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 67.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.8], ["theremin", 19.0], ["musical instrument", 7.63]], null, null, null, null, null, null, null, null], "duration": [0.49, 0.78, 0.6, 0.82, 0.06, 2.0, 0.92, 0.35, 1.15, 0.54, 0.24, 0.55, 0.24, 0.39, 1.2, 0.04, 1.79, 3.3, 0.44, 0.68, 0.08, 0.57, 0.76, 1.01, 1.12, 0.71]} \ No newline at end of file diff --git a/annotations_1/CEO9YAsxMfI_filtered.json b/annotations_1/CEO9YAsxMfI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ab89611c71c528e215cb658ac2fe466b2c7db08 --- /dev/null +++ b/annotations_1/CEO9YAsxMfI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.33], [5.0, 6.61], [7.0, 7.4], [9.0, 9.36], [11.0, 11.72], [24.0, 24.27], [26.0, 26.16], [42.0, 44.64], [46.0, 47.63], [51.0, 51.61], [52.0, 54.95], [56.0, 59.1], [64.0, 66.06], [69.0, 74.22], [75.0, 80.49], [81.0, 89.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 61.77, 48.19, 96.17, 63.74, 69.47, 52.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["synthesizer", 10.52], ["chirp tone", 8.27], ["hum", 8.16]], null, null, null, null], "duration": [0.33, 1.61, 0.4, 0.36, 0.72, 0.27, 0.16, 2.64, 1.63, 0.61, 2.95, 3.1, 2.06, 5.22, 5.49, 8.41]} \ No newline at end of file diff --git a/annotations_1/CEwyZcmwNiQ_filtered.json b/annotations_1/CEwyZcmwNiQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfbfb0f43f52623de35f386eecde44edeafc9e31 --- /dev/null +++ b/annotations_1/CEwyZcmwNiQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.95], [7.0, 10.74], [39.0, 39.56], [51.0, 51.29], [54.0, 53.7], [59.0, 60.39]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 40.19, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 16.44], ["mains hum", 14.28], ["hum", 12.71]], null, null, null, null], "duration": [-0.05, 3.74, 0.56, 0.29, -0.3, 1.39]} \ No newline at end of file diff --git a/annotations_1/CFOC-_DYKXk_filtered.json b/annotations_1/CFOC-_DYKXk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fe06f5086c471dd85c4b3c3e801486de919bd55 --- /dev/null +++ b/annotations_1/CFOC-_DYKXk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.64], [12.0, 12.12], [13.0, 14.89], [16.0, 17.49], [20.0, 19.97], [22.0, 23.35], [24.0, 24.87], [26.0, 26.52], [28.0, 30.99], [34.0, 35.73], [38.0, 39.55], [40.0, 40.42], [42.0, 42.45], [50.0, 51.93], [53.0, 53.92], [58.0, 58.43], [67.0, 67.54], [69.0, 68.81], [75.0, 75.83], [86.0, 86.58], [89.0, 89.11], [89.0, 91.79], [92.0, 104.77], [107.0, 115.3], [116.0, 132.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 89.36, 98.1, 92.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.64, 0.12, 1.89, 1.49, -0.03, 1.35, 0.87, 0.52, 2.99, 1.73, 1.55, 0.42, 0.45, 1.93, 0.92, 0.43, 0.54, -0.19, 0.83, 0.58, 0.11, 2.79, 12.77, 8.3, 16.85]} \ No newline at end of file diff --git a/annotations_1/CFqO1y01qjs_filtered.json b/annotations_1/CFqO1y01qjs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91412833855c7c6935f63da76a198943be141e0a --- /dev/null +++ b/annotations_1/CFqO1y01qjs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.83], [3.0, 5.56], [7.0, 7.15], [8.0, 10.47], [13.0, 15.03], [16.0, 18.27], [20.0, 22.01], [23.0, 26.22], [27.0, 36.24], [44.0, 50.57], [52.0, 76.55], [77.0, 79.37], [80.0, 109.48], [113.0, 153.03], [157.0, 171.54], [175.0, 178.95], [179.0, 179.44]], "keep_status": [false, false, false, false, false, false, false, true, false, true, true, true, false, false, true, true, false], "silence_prob": [0.0, 100.0, 0.0, 99.21, 100.0, 66.27, 100.0, 33.26, 34.85, 32.13, 30.2, 34.92, 30.37, 0.0, 30.65, 36.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["grunt", 29.08], ["groan", 7.31], ["wild animals", 6.97]], [["music", 59.8], ["synthesizer", 16.17], ["sidetone", 3.58]], [["music", 43.19], ["throbbing", 9.77], ["hum", 9.49]], [["music", 44.93], ["throbbing", 12.81], ["synthesizer", 11.6]], [["fly, housefly", 20.0], ["cattle, bovinae", 15.62], ["moo", 15.52]], [["music", 67.57], ["speech", 5.55], ["throbbing", 3.74]], null, [["music", 36.82], ["musical instrument", 8.51], ["speech", 8.17]], [["speech", 53.49], ["animal", 6.49], ["wild animals", 4.47]], null], "duration": [0.83, 2.56, 0.15, 2.47, 2.03, 2.27, 2.01, 3.22, 9.24, 6.57, 24.55, 2.37, 29.48, 40.03, 14.54, 3.95, 0.44]} \ No newline at end of file diff --git a/annotations_1/CG2YRWPhfiA_filtered.json b/annotations_1/CG2YRWPhfiA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59fe0d85ebb55936497309d07e5610ebb332f0fe --- /dev/null +++ b/annotations_1/CG2YRWPhfiA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 57.21], [58.0, 58.65], [59.0, 60.45], [62.0, 62.72], [67.0, 67.64], [69.0, 70.16], [73.0, 72.84], [74.0, 74.56], [76.0, 76.15], [77.0, 107.49], [109.0, 109.93], [113.0, 113.46], [114.0, 114.44], [116.0, 116.99], [118.0, 120.21], [121.0, 122.77], [125.0, 125.66], [127.0, 127.41], [130.0, 131.79], [134.0, 134.99], [136.0, 176.03], [178.0, 178.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.72], ["hum", 15.32], ["sidetone", 10.53]], null, null, null, null, null, null, null], "duration": [1.21, 0.65, 1.45, 0.72, 0.64, 1.16, -0.16, 0.56, 0.15, 30.49, 0.93, 0.46, 0.44, 0.99, 2.21, 1.77, 0.66, 0.41, 1.79, 0.99, 40.03, 0.12]} \ No newline at end of file diff --git a/annotations_1/CGwzaIS-tLk_filtered.json b/annotations_1/CGwzaIS-tLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d8de24d401e7f06d6573b8601a4b34b9e1a031c --- /dev/null +++ b/annotations_1/CGwzaIS-tLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[76.0, 99.45]], "keep_status": [true], "silence_prob": [36.7], "audiomae_on_audioset": [[["mains hum", 29.1], ["music", 17.9], ["hum", 15.37]]], "duration": [23.45]} \ No newline at end of file diff --git a/annotations_1/CHBydX2-I50_filtered.json b/annotations_1/CHBydX2-I50_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65d6169ff8a01eccc537f2b9550cc32c7a86e65e --- /dev/null +++ b/annotations_1/CHBydX2-I50_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.32], [14.0, 14.91], [16.0, 18.54], [22.0, 23.06], [25.0, 25.15], [28.0, 32.51], [34.0, 39.8], [41.0, 45.5], [46.0, 50.23], [54.0, 56.35], [57.0, 57.43], [61.0, 62.28], [64.0, 65.79], [67.0, 67.63], [71.0, 71.78], [73.0, 74.98], [77.0, 77.14], [78.0, 78.16], [80.0, 83.76], [84.0, 96.25], [106.0, 112.75], [114.0, 114.86], [116.0, 116.99], [120.0, 166.08]], "keep_status": [false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 36.56, 0.0, 0.0, 36.25, 37.04, 44.18, 36.56, 74.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.94, 38.14, 45.78, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 61.31], ["sine wave", 8.53], ["speech", 7.12]], null, null, [["hum", 31.73], ["throbbing", 16.08], ["rumble", 11.66]], [["hum", 27.63], ["throbbing", 25.81], ["rumble", 17.6]], [["speech", 25.36], ["hum", 23.24], ["throbbing", 14.36]], [["speech", 10.41], ["hum", 6.79], ["fly, housefly", 5.32]], null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 22.73], ["speech", 11.4], ["sidetone", 8.21]], [["noise", 10.8], ["thunk", 9.73], ["animal", 8.9]], null, null, null], "duration": [0.32, 0.91, 2.54, 1.06, 0.15, 4.51, 5.8, 4.5, 4.23, 2.35, 0.43, 1.28, 1.79, 0.63, 0.78, 1.98, 0.14, 0.16, 3.76, 12.25, 6.75, 0.86, 0.99, 46.08]} \ No newline at end of file diff --git a/annotations_1/CHOpoOnkRJE_filtered.json b/annotations_1/CHOpoOnkRJE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9723b199fb89b6bd3d9fa1ab57b9324ad1925d0d --- /dev/null +++ b/annotations_1/CHOpoOnkRJE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 48.12], [51.0, 50.97], [54.0, 55.12], [56.0, 56.91], [64.0, 68.96], [69.0, 70.48], [75.0, 76.71], [78.0, 78.53], [83.0, 84.01], [94.0, 96.5], [102.0, 102.74], [110.0, 110.73], [116.0, 116.23]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 35.77], ["speech", 14.36], ["electric shaver, electric razor", 6.64]], null, null, null, null, null, null, null, null], "duration": [1.12, -0.03, 1.12, 0.91, 4.96, 1.48, 1.71, 0.53, 1.01, 2.5, 0.74, 0.73, 0.23]} \ No newline at end of file diff --git a/annotations_1/CHs36bNm7xk_filtered.json b/annotations_1/CHs36bNm7xk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3b3e6ec34d961275d840135eef9823267746251 --- /dev/null +++ b/annotations_1/CHs36bNm7xk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.47], [7.0, 7.75], [12.0, 14.18], [24.0, 25.2], [28.0, 29.32], [31.0, 31.23], [38.0, 38.11], [42.0, 44.54], [47.0, 47.19], [49.0, 51.88], [55.0, 55.44], [64.0, 64.37], [67.0, 67.98], [72.0, 72.6], [73.0, 74.43], [77.0, 77.13], [78.0, 78.6], [79.0, 80.49], [83.0, 82.78], [86.0, 87.2], [89.0, 89.36], [95.0, 95.13], [97.0, 102.19], [103.0, 105.83], [112.0, 112.62], [114.0, 120.48], [123.0, 122.76], [124.0, 128.09], [129.0, 129.76], [131.0, 133.79], [138.0, 138.38], [162.0, 167.91]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.44, 0.0, 0.0, 0.0, 0.0, 32.56, 0.0, 82.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 95.78, 0.0, 63.85, 0.0, 68.28, 0.0, 57.72, 0.0, 61.08], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 26.76], ["music", 9.23], ["thunk", 8.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.75, 2.18, 1.2, 1.32, 0.23, 0.11, 2.54, 0.19, 2.88, 0.44, 0.37, 0.98, 0.6, 1.43, 0.13, 0.6, 1.49, -0.22, 1.2, 0.36, 0.13, 5.19, 2.83, 0.62, 6.48, -0.24, 4.09, 0.76, 2.79, 0.38, 5.91]} \ No newline at end of file diff --git a/annotations_1/CKIh_vKo7Fg_filtered.json b/annotations_1/CKIh_vKo7Fg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41cde97fbd0f7ef7308047eb4912aa8986d96d55 --- /dev/null +++ b/annotations_1/CKIh_vKo7Fg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.49], [3.0, 4.45], [7.0, 7.42], [25.0, 25.51], [26.0, 30.96], [38.0, 37.57], [45.0, 45.54], [46.0, 46.23], [51.0, 53.3], [55.0, 56.07], [58.0, 59.27], [60.0, 61.37], [64.0, 69.28], [70.0, 69.63], [72.0, 78.83], [83.0, 83.39], [90.0, 90.39], [95.0, 94.76], [95.0, 94.83], [95.0, 101.31], [107.0, 108.13], [109.0, 109.31], [110.0, 114.4], [115.0, 116.46], [117.0, 118.44], [121.0, 121.37], [126.0, 125.96], [128.0, 128.75], [141.0, 141.2], [148.0, 149.37], [152.0, 152.22], [153.0, 154.23], [155.0, 157.08], [161.0, 177.65], [183.0, 183.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.22, 0.0, 0.0, 0.0, 49.82, 0.0, 0.0, 0.0, 37.61, 0.0, 44.78, 0.0, 0.0, 0.0, 0.0, 30.08, 0.0, 0.0, 50.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.51, 33.98, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 80.09], ["music", 2.71], ["inside, small room", 1.77]], null, null, null, [["thunk", 73.86], ["music", 3.61], ["door", 3.58]], null, null, null, [["speech", 68.72], ["fart", 3.09], ["whack, thwack", 3.03]], null, [["music", 47.84], ["singing bowl", 5.85], ["didgeridoo", 3.98]], null, null, null, null, [["speech", 49.28], ["music", 18.71], ["boing", 10.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 72.63], ["throbbing", 4.53], ["hum", 4.09]], null], "duration": [1.49, 1.45, 0.42, 0.51, 4.96, -0.43, 0.54, 0.23, 2.3, 1.07, 1.27, 1.37, 5.28, -0.37, 6.83, 0.39, 0.39, -0.24, -0.17, 6.31, 1.13, 0.31, 4.4, 1.46, 1.44, 0.37, -0.04, 0.75, 0.2, 1.37, 0.22, 1.23, 2.08, 16.65, 0.32]} \ No newline at end of file diff --git a/annotations_1/CKc8xHhxP0Q_filtered.json b/annotations_1/CKc8xHhxP0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..105246c068acb9d626c872795a90598666c22679 --- /dev/null +++ b/annotations_1/CKc8xHhxP0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 23.9], [31.0, 32.97], [35.0, 43.68], [44.0, 64.1], [78.0, 86.8], [90.0, 91.4], [93.0, 121.78], [122.0, 122.77], [123.0, 124.46], [127.0, 130.6], [131.0, 140.81], [141.0, 152.15]], "keep_status": [true, false, false, true, true, false, true, false, false, true, false, true], "silence_prob": [29.41, 0.0, 29.51, 29.17, 36.11, 0.0, 29.51, 0.0, 0.0, 28.83, 29.6, 33.76], "audiomae_on_audioset": [[["buzz", 31.19], ["electric shaver, electric razor", 17.32], ["speech", 17.16]], null, [["music", 60.81], ["boom", 5.72], ["didgeridoo", 5.03]], [["throbbing", 11.76], ["music", 11.53], ["hum", 11.22]], [["hum", 28.35], ["throbbing", 19.37], ["speech", 15.43]], null, [["music", 49.87], ["grunt", 8.12], ["speech", 7.73]], null, null, [["music", 47.31], ["hum", 6.93], ["speech", 6.54]], [["speech", 71.5], ["music", 13.0], ["hum", 1.97]], [["music", 40.61], ["hum", 16.68], ["mains hum", 8.67]]], "duration": [18.9, 1.97, 8.68, 20.1, 8.8, 1.4, 28.78, 0.77, 1.46, 3.6, 9.81, 11.15]} \ No newline at end of file diff --git a/annotations_1/CL3IXUZKbto_filtered.json b/annotations_1/CL3IXUZKbto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e368ddd228b2b58b9785afd227bf28e27fc4f695 --- /dev/null +++ b/annotations_1/CL3IXUZKbto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 87.25], [88.0, 97.55], [100.0, 103.25], [104.0, 115.64], [119.0, 135.94], [136.0, 136.59], [137.0, 138.11], [139.0, 158.92], [159.0, 170.11], [175.0, 200.43]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 59.59, 83.52, 61.67, 62.37, 0.0, 0.0, 59.15, 33.19, 31.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["theremin", 67.01], ["music", 22.79], ["musical instrument", 2.17]], [["music", 44.86], ["theremin", 15.85], ["cello", 5.51]]], "duration": [85.25, 9.55, 3.25, 11.64, 16.94, 0.59, 1.11, 19.92, 11.11, 25.43]} \ No newline at end of file diff --git a/annotations_1/CLWCgMVf6U0_filtered.json b/annotations_1/CLWCgMVf6U0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c47fa936722a9ffecedfc82c5450ec4aee389af6 --- /dev/null +++ b/annotations_1/CLWCgMVf6U0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.62], [17.0, 35.19], [36.0, 37.66], [38.0, 46.6], [47.0, 49.0], [50.0, 50.84], [52.0, 52.15], [53.0, 59.16], [61.0, 107.1], [107.0, 147.16]], "keep_status": [false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 30.28, 0.0, 30.06, 31.65, 0.0, 0.0, 30.16, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 13.4], ["cattle, bovinae", 11.14], ["livestock, farm animals, working animals", 11.14]], null, [["livestock, farm animals, working animals", 41.01], ["cattle, bovinae", 29.91], ["moo", 16.44]], [["music", 47.49], ["hum", 12.05], ["didgeridoo", 10.49]], null, null, [["speech", 17.26], ["music", 15.27], ["vehicle", 7.72]], null, null], "duration": [0.62, 18.19, 1.66, 8.6, 2.0, 0.84, 0.15, 6.16, 46.1, 40.16]} \ No newline at end of file diff --git a/annotations_1/CLxHRE-Knmc_filtered.json b/annotations_1/CLxHRE-Knmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93fdbd4af0ddb10d6386205950d654f92eaa4ccc --- /dev/null +++ b/annotations_1/CLxHRE-Knmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [5.0, 12.68], [14.0, 14.05], [16.0, 40.05], [41.0, 43.78], [44.0, 45.4], [46.0, 49.87], [51.0, 52.2], [60.0, 59.58], [60.0, 61.42], [64.0, 64.94], [68.0, 68.81], [71.0, 70.6], [74.0, 80.06], [81.0, 82.43], [84.0, 93.41], [97.0, 96.85], [97.0, 96.89], [97.0, 96.96]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 30.29, 0.0, 29.07, 32.27, 0.0, 32.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.96, 0.0, 28.85, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 29.6], ["hum", 28.93], ["mains hum", 24.13]], null, [["music", 50.05], ["vehicle", 9.96], ["throbbing", 9.08]], [["hum", 23.25], ["mains hum", 16.23], ["buzz", 10.36]], null, [["hum", 33.4], ["mains hum", 23.63], ["throbbing", 18.46]], null, null, null, null, null, null, [["breaking", 16.63], ["hum", 11.84], ["mains hum", 11.43]], null, [["hum", 24.19], ["speech", 23.14], ["mains hum", 17.48]], null, null, null], "duration": [0.13, 7.68, 0.05, 24.05, 2.78, 1.4, 3.87, 1.2, -0.42, 1.42, 0.94, 0.81, -0.4, 6.06, 1.43, 9.41, -0.15, -0.11, -0.04]} \ No newline at end of file diff --git a/annotations_1/CMfYaFpa3nY_filtered.json b/annotations_1/CMfYaFpa3nY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d31ad80d0b4c76b1c7076c061152181bd5340416 --- /dev/null +++ b/annotations_1/CMfYaFpa3nY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 42.62], [43.0, 45.59], [47.0, 48.81], [50.0, 53.25], [55.0, 57.72], [59.0, 60.64], [61.0, 70.56], [72.0, 77.06], [78.0, 81.3], [82.0, 86.95], [88.0, 92.13], [94.0, 97.19], [98.0, 102.91], [104.0, 115.92], [120.0, 122.66], [125.0, 127.08], [128.0, 133.29], [134.0, 138.23], [139.0, 143.04], [145.0, 149.13], [151.0, 151.85], [152.0, 153.3], [154.0, 154.04], [154.0, 154.13], [154.0, 154.16], [154.0, 154.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [51.99, 82.97, 0.0, 96.66, 96.66, 0.0, 88.28, 82.25, 98.19, 72.9, 95.91, 89.72, 93.6, 92.8, 89.19, 95.51, 96.04, 72.31, 67.38, 79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.62, 2.59, 1.81, 3.25, 2.72, 1.64, 9.56, 5.06, 3.3, 4.95, 4.13, 3.19, 4.91, 11.92, 2.66, 2.08, 5.29, 4.23, 4.04, 4.13, 0.85, 1.3, 0.04, 0.13, 0.16, 0.2]} \ No newline at end of file diff --git a/annotations_1/CN6dU8mcuMY_filtered.json b/annotations_1/CN6dU8mcuMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9333206ea2a9fb80558f9234394547ece1272b77 --- /dev/null +++ b/annotations_1/CN6dU8mcuMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.04], [12.0, 12.66], [14.0, 13.96], [17.0, 16.93], [24.0, 27.06], [30.0, 30.47], [31.0, 34.42], [36.0, 41.49], [43.0, 43.41], [49.0, 51.7], [54.0, 56.32], [58.0, 58.11], [60.0, 60.59], [64.0, 66.5], [69.0, 69.45], [74.0, 75.3], [78.0, 78.17], [87.0, 89.43], [90.0, 92.4], [94.0, 96.79], [100.0, 101.24], [104.0, 104.84], [109.0, 111.18], [112.0, 115.01], [117.0, 119.37], [123.0, 128.02], [129.0, 130.06], [137.0, 137.88], [140.0, 141.51], [144.0, 143.94], [146.0, 146.74], [149.0, 149.45], [152.0, 152.0], [158.0, 163.53], [165.0, 166.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.98, 98.51, 0.0, 96.29, 95.51, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 99.1, 99.99, 99.59, 0.0, 0.0, 100.0, 98.44, 99.95, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.66, -0.04, -0.07, 3.06, 0.47, 3.42, 5.49, 0.41, 2.7, 2.32, 0.11, 0.59, 2.5, 0.45, 1.3, 0.17, 2.43, 2.4, 2.79, 1.24, 0.84, 2.18, 3.01, 2.37, 5.02, 1.06, 0.88, 1.51, -0.06, 0.74, 0.45, 0.0, 5.53, 1.38]} \ No newline at end of file diff --git a/annotations_1/CNuEnlaPuls_filtered.json b/annotations_1/CNuEnlaPuls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1368d4376579ead917fbdd81615c2ca7c779fff3 --- /dev/null +++ b/annotations_1/CNuEnlaPuls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.85], [18.0, 52.44], [53.0, 73.08], [74.0, 74.49], [76.0, 77.36], [78.0, 95.96], [97.0, 115.67], [117.0, 118.71], [121.0, 122.57], [125.0, 131.13], [132.0, 134.59], [135.0, 144.91]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.33, 0.0, 0.0, 29.44, 29.55, 0.0, 0.0, 65.09, 54.3, 48.14], "audiomae_on_audioset": [null, null, [["throbbing", 49.62], ["music", 23.24], ["hum", 17.85]], null, null, [["throbbing", 18.85], ["hum", 18.73], ["music", 15.7]], [["speech", 46.81], ["music", 14.37], ["hum", 4.11]], null, null, null, null, [["hum", 31.33], ["music", 30.61], ["throbbing", 24.75]]], "duration": [0.85, 34.44, 20.08, 0.49, 1.36, 17.96, 18.67, 1.71, 1.57, 6.13, 2.59, 9.91]} \ No newline at end of file diff --git a/annotations_1/COSkA00zJlo_filtered.json b/annotations_1/COSkA00zJlo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7c8d522963b0dc3ae0d1d91b4c921a8d5b44c06 --- /dev/null +++ b/annotations_1/COSkA00zJlo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 18.1], [20.0, 20.85], [24.0, 24.76], [27.0, 27.51], [33.0, 33.93], [38.0, 39.02], [41.0, 41.42], [44.0, 45.0], [46.0, 46.94], [52.0, 52.64], [54.0, 55.12], [56.0, 57.59], [58.0, 61.26], [62.0, 63.88], [67.0, 67.73], [73.0, 74.56], [76.0, 78.27], [83.0, 84.54], [85.0, 86.02], [86.0, 87.45], [88.0, 89.67], [91.0, 91.59], [95.0, 95.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.1, 0.85, 0.76, 0.51, 0.93, 1.02, 0.42, 1.0, 0.94, 0.64, 1.12, 1.59, 3.26, 1.88, 0.73, 1.56, 2.27, 1.54, 1.02, 1.45, 1.67, 0.59, 0.05]} \ No newline at end of file diff --git a/annotations_1/CRu7V9v8Nnk_filtered.json b/annotations_1/CRu7V9v8Nnk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4769551112cd2c728b1d40dd52c8d22731f68ad --- /dev/null +++ b/annotations_1/CRu7V9v8Nnk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.9], [19.0, 22.4], [26.0, 25.98], [28.0, 28.38], [35.0, 35.8], [43.0, 43.93], [64.0, 65.03], [66.0, 67.53], [68.0, 68.39], [68.0, 72.27], [75.0, 79.34], [81.0, 80.91], [87.0, 93.39], [95.0, 97.26], [100.0, 100.84], [105.0, 105.0], [107.0, 108.94]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false], "silence_prob": [30.77, 32.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.37, 31.99, 0.0, 45.02, 47.05, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 85.39], ["theremin", 7.51], ["musical instrument", 0.98]], [["harp", 37.78], ["music", 32.27], ["musical instrument", 4.71]], null, null, null, null, null, null, null, [["music", 59.41], ["speech", 3.73], ["didgeridoo", 3.53]], [["music", 58.39], ["synthesizer", 5.05], ["theremin", 4.68]], null, [["music", 77.5], ["musical instrument", 2.86], ["harp", 2.31]], [["music", 41.9], ["speech", 15.69], ["ice cream truck, ice cream van", 5.07]], null, null, null], "duration": [4.9, 3.4, -0.02, 0.38, 0.8, 0.93, 1.03, 1.53, 0.39, 4.27, 4.34, -0.09, 6.39, 2.26, 0.84, 0.0, 1.94]} \ No newline at end of file diff --git a/annotations_1/CScFydObPJA_filtered.json b/annotations_1/CScFydObPJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27a0a9ed3f254982f09670c19416c4588176e493 --- /dev/null +++ b/annotations_1/CScFydObPJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.4], [9.0, 12.31], [13.0, 13.26], [19.0, 20.78], [22.0, 22.06], [43.0, 44.1], [45.0, 46.26], [46.0, 46.35], [49.0, 49.67], [50.0, 50.97], [55.0, 59.34], [60.0, 62.5], [65.0, 65.5], [71.0, 77.99], [79.0, 83.05], [86.0, 88.69], [89.0, 91.94], [94.0, 94.24], [104.0, 104.19], [108.0, 107.89], [112.0, 112.24], [117.0, 120.39], [140.0, 140.29], [143.0, 145.59], [156.0, 157.01], [161.0, 160.84], [162.0, 162.04], [163.0, 163.38], [164.0, 164.64], [165.0, 165.67], [167.0, 166.75], [169.0, 170.68], [175.0, 175.76]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.2, 42.44, 0.0, 32.6, 33.56, 39.96, 36.55, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 21.05], ["hum", 15.47], ["mains hum", 13.28]], null, null, null, null, null, null, null, null, [["bee, wasp, etc.", 21.81], ["speech", 7.09], ["fly, housefly", 6.22]], [["music", 50.55], ["throbbing", 10.51], ["hum", 9.15]], null, [["music", 29.21], ["speech", 28.69], ["sidetone", 19.19]], [["music", 55.72], ["throbbing", 16.3], ["hum", 7.41]], [["music", 59.56], ["hum", 12.62], ["throbbing", 7.83]], [["hum", 26.56], ["music", 18.98], ["mains hum", 11.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 3.31, 0.26, 1.78, 0.06, 1.1, 1.26, 0.35, 0.67, 0.97, 4.34, 2.5, 0.5, 6.99, 4.05, 2.69, 2.94, 0.24, 0.19, -0.11, 0.24, 3.39, 0.29, 2.59, 1.01, -0.16, 0.04, 0.38, 0.64, 0.67, -0.25, 1.68, 0.76]} \ No newline at end of file diff --git a/annotations_1/CShHiYrQPGM_filtered.json b/annotations_1/CShHiYrQPGM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c48924aac922ac72ee10f5eb16f97d26d7922485 --- /dev/null +++ b/annotations_1/CShHiYrQPGM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [5.0, 6.96], [8.0, 14.84], [17.0, 24.9], [26.0, 28.71], [30.0, 36.39], [39.0, 68.17], [69.0, 74.44], [75.0, 143.04], [150.0, 158.36], [159.0, 159.63], [161.0, 166.11], [167.0, 167.68]], "keep_status": [false, false, true, true, true, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 41.76, 32.25, 47.23, 34.66, 39.02, 53.91, 0.0, 41.58, 0.0, 33.3, 0.0], "audiomae_on_audioset": [null, null, [["hum", 24.98], ["speech", 22.69], ["music", 14.5]], [["music", 45.34], ["hum", 6.4], ["mains hum", 5.34]], [["music", 22.61], ["hum", 19.77], ["speech", 10.67]], [["music", 46.08], ["speech", 21.61], ["hum", 3.81]], [["music", 27.21], ["hum", 24.04], ["throbbing", 14.13]], null, null, [["music", 45.47], ["hum", 10.3], ["throbbing", 9.28]], null, [["music", 50.35], ["speech", 35.41], ["explosion", 2.22]], null], "duration": [0.89, 1.96, 6.84, 7.9, 2.71, 6.39, 29.17, 5.44, 68.04, 8.36, 0.63, 5.11, 0.68]} \ No newline at end of file diff --git a/annotations_1/CTRZgOL-vA0_filtered.json b/annotations_1/CTRZgOL-vA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2de8d8eddbc7605279a40aa88b1e20b2d377de69 --- /dev/null +++ b/annotations_1/CTRZgOL-vA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.1], [7.0, 7.26], [9.0, 31.21], [32.0, 32.43], [34.0, 35.7], [36.0, 38.64], [40.0, 40.91], [42.0, 43.7], [46.0, 47.31], [52.0, 54.28], [58.0, 59.16], [61.0, 63.37], [65.0, 66.77], [67.0, 69.97], [72.0, 76.62], [80.0, 80.15], [81.0, 83.35], [85.0, 90.46], [91.0, 95.89], [97.0, 101.66], [103.0, 107.84], [108.0, 117.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 48.23, 0.0, 0.0, 55.04, 0.0, 0.0, 0.0, 68.41, 0.0, 79.59, 0.0, 53.16, 54.97, 0.0, 45.82, 53.28, 48.69, 47.31, 57.09, 48.06], "audiomae_on_audioset": [null, null, [["music", 70.39], ["musical instrument", 6.41], ["hum", 2.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 25.69], ["music", 23.79], ["didgeridoo", 8.36]], null, [["hum", 17.85], ["music", 16.19], ["noise", 7.26]], [["music", 62.1], ["musical instrument", 4.42], ["guitar", 3.34]], null, [["music", 68.95], ["speech", 9.11], ["echo", 4.55]]], "duration": [0.1, 0.26, 22.21, 0.43, 1.7, 2.64, 0.91, 1.7, 1.31, 2.28, 1.16, 2.37, 1.77, 2.97, 4.62, 0.15, 2.35, 5.46, 4.89, 4.66, 4.84, 9.63]} \ No newline at end of file diff --git a/annotations_1/CTpAikAZ2aA_filtered.json b/annotations_1/CTpAikAZ2aA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28a701aaa0ea60a357c267a0201d125dbfdce3f3 --- /dev/null +++ b/annotations_1/CTpAikAZ2aA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 123.77], [127.0, 130.49], [131.0, 133.79]], "keep_status": [false, true, false], "silence_prob": [0.0, 42.19, 82.07], "audiomae_on_audioset": [null, [["music", 11.49], ["hum", 11.36], ["noise", 10.66]], null], "duration": [86.77, 3.49, 2.79]} \ No newline at end of file diff --git a/annotations_1/CU7-qLo7GPo_filtered.json b/annotations_1/CU7-qLo7GPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e1392bafaa0a7f700e90e2ba7d629adf1ec7496 --- /dev/null +++ b/annotations_1/CU7-qLo7GPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.79], [19.0, 19.52], [20.0, 21.29], [32.0, 34.67], [39.0, 38.87], [39.0, 39.73], [52.0, 52.88], [55.0, 54.84], [58.0, 64.3], [70.0, 72.64], [76.0, 77.26], [78.0, 79.25], [81.0, 81.6], [88.0, 91.64], [94.0, 101.06]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 38.46, 0.0, 0.0, 0.0, 0.0, 33.09, 34.15, 0.0, 0.0, 0.0, 32.63, 32.11], "audiomae_on_audioset": [null, null, null, [["speech", 76.66], ["effects unit", 3.02], ["music", 2.48]], null, null, null, null, [["speech", 29.95], ["music", 22.76], ["throbbing", 9.11]], [["music", 39.06], ["speech", 11.73], ["electronic music", 4.64]], null, null, null, [["music", 45.18], ["speech", 12.09], ["electronic music", 8.57]], [["music", 56.67], ["sidetone", 5.7], ["throbbing", 5.5]]], "duration": [0.79, 0.52, 1.29, 2.67, -0.13, 0.73, 0.88, -0.16, 6.3, 2.64, 1.26, 1.25, 0.6, 3.64, 7.06]} \ No newline at end of file diff --git a/annotations_1/CUYNZo-8cDM_filtered.json b/annotations_1/CUYNZo-8cDM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a47f550698039b79509369a1e2e6d43923bed0b --- /dev/null +++ b/annotations_1/CUYNZo-8cDM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 38.06], [39.0, 54.41], [55.0, 58.6], [59.0, 60.32], [62.0, 65.94], [68.0, 75.49], [77.0, 79.02], [81.0, 83.03], [85.0, 94.47], [101.0, 105.26], [106.0, 106.69], [108.0, 107.99], [109.0, 109.9], [113.0, 112.89], [117.0, 119.5]], "keep_status": [false, true, false, false, false, true, true, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 29.05, 29.99, 0.0, 29.06, 28.53, 28.89, 30.2, 28.58, 28.4, 0.0, 0.0, 0.0, 0.0, 29.99], "audiomae_on_audioset": [null, [["speech", 29.61], ["music", 23.97], ["mains hum", 6.0]], [["burping, eructation", 91.58], ["hum", 1.94], ["throbbing", 1.48]], null, [["hum", 37.72], ["mains hum", 28.27], ["rumble", 10.26]], [["hum", 23.84], ["mains hum", 11.79], ["music", 11.42]], [["speech", 49.64], ["music", 11.08], ["hum", 9.03]], [["mains hum", 22.28], ["speech", 18.28], ["hum", 17.33]], [["music", 67.88], ["throbbing", 10.61], ["didgeridoo", 4.49]], [["sound effect", 16.06], ["fart", 16.05], ["zipper (clothing)", 9.49]], null, null, null, null, [["music", 50.22], ["speech", 14.87], ["throbbing", 4.48]]], "duration": [1.06, 15.41, 3.6, 1.32, 3.94, 7.49, 2.02, 2.03, 9.47, 4.26, 0.69, -0.01, 0.9, -0.11, 2.5]} \ No newline at end of file diff --git a/annotations_1/CUnezbuG4fo_filtered.json b/annotations_1/CUnezbuG4fo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b4edd8ea3e74973b7ebff8c657ab129a6d93f71 --- /dev/null +++ b/annotations_1/CUnezbuG4fo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.44], [16.0, 18.22], [19.0, 19.6], [21.0, 22.06], [24.0, 26.01], [27.0, 33.84], [35.0, 35.33], [39.0, 41.44], [47.0, 47.55], [49.0, 57.74], [64.0, 63.8], [68.0, 68.52], [74.0, 74.19], [79.0, 79.25], [82.0, 83.05], [94.0, 95.2]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [50.41, 43.82, 0.0, 0.0, 66.88, 61.87, 0.0, 49.5, 0.0, 29.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 32.7], ["insect", 24.14], ["bee, wasp, etc.", 14.12]], null, null, null, null, null, [["crushing", 39.44], ["speech", 27.85], ["fart", 4.48]], null, [["speech", 36.14], ["music", 11.17], ["whack, thwack", 5.17]], null, null, null, null, null, null], "duration": [5.44, 2.22, 0.6, 1.06, 2.01, 6.84, 0.33, 2.44, 0.55, 8.74, -0.2, 0.52, 0.19, 0.25, 1.05, 1.2]} \ No newline at end of file diff --git a/annotations_1/CUzNygPSRZM_filtered.json b/annotations_1/CUzNygPSRZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1459a2a8921f8c36a9000383f1d821101e46b646 --- /dev/null +++ b/annotations_1/CUzNygPSRZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.19], [7.0, 7.86], [12.0, 12.58], [20.0, 20.28], [23.0, 22.92], [30.0, 36.34], [41.0, 46.04], [49.0, 53.3], [56.0, 57.11], [60.0, 61.4], [65.0, 66.19], [69.0, 70.51], [73.0, 73.75], [79.0, 82.02], [85.0, 85.72], [90.0, 90.48], [91.0, 93.04], [95.0, 96.35], [99.0, 99.89], [101.0, 101.24], [101.0, 102.51], [103.0, 103.18], [104.0, 107.52], [108.0, 109.36], [113.0, 115.79], [116.0, 117.83], [119.0, 119.84], [121.0, 121.96], [123.0, 124.24], [126.0, 126.59], [130.0, 132.31], [134.0, 139.45], [144.0, 146.6], [147.0, 149.27], [151.0, 163.0], [166.0, 170.94], [172.0, 179.79]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.95, 29.32, 38.72, 0.0, 0.0, 0.0, 0.0, 0.0, 43.98, 0.0, 0.0, 55.89, 0.0, 0.0, 0.0, 0.0, 0.0, 74.76, 0.0, 69.2, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 70.02, 79.07, 59.59, 36.3, 36.13, 35.26], "audiomae_on_audioset": [null, null, null, null, null, [["music", 38.47], ["speech", 15.15], ["boing", 11.24]], [["speech", 42.25], ["music", 33.1], ["groan", 7.21]], [["speech", 26.22], ["music", 17.22], ["musical instrument", 3.17]], null, null, null, null, null, [["speech", 28.73], ["whack, thwack", 8.64], ["frog", 3.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.4], ["fly, housefly", 7.94], ["hum", 7.46]], [["music", 29.56], ["camera", 26.21], ["single-lens reflex camera", 25.56]], [["music", 42.52], ["speech", 10.16], ["cowbell", 5.31]]], "duration": [1.19, 0.86, 0.58, 0.28, -0.08, 6.34, 5.04, 4.3, 1.11, 1.4, 1.19, 1.51, 0.75, 3.02, 0.72, 0.48, 2.04, 1.35, 0.89, 0.24, 1.51, 0.18, 3.52, 1.36, 2.79, 1.83, 0.84, 0.96, 1.24, 0.59, 2.31, 5.45, 2.6, 2.27, 12.0, 4.94, 7.79]} \ No newline at end of file diff --git a/annotations_1/CVxgFZixwlg_filtered.json b/annotations_1/CVxgFZixwlg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad6942f1a22ef6b7904a85f07934d01d72f0ccb0 --- /dev/null +++ b/annotations_1/CVxgFZixwlg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.67], [12.0, 14.07], [22.0, 51.9], [59.0, 71.04], [74.0, 73.6], [78.0, 79.52], [81.0, 82.75], [108.0, 115.52], [121.0, 121.47], [122.0, 124.12], [129.0, 130.44], [137.0, 136.83], [138.0, 148.8], [154.0, 159.22], [168.0, 168.47]], "keep_status": [false, false, true, false, false, false, false, true, false, true, false, false, true, true, false], "silence_prob": [0.0, 29.36, 31.16, 30.9, 0.0, 0.0, 0.0, 29.22, 0.0, 29.65, 0.0, 0.0, 29.83, 29.73, 0.0], "audiomae_on_audioset": [null, [["moo", 49.84], ["cattle, bovinae", 30.8], ["livestock, farm animals, working animals", 10.09]], [["mosquito", 15.61], ["music", 15.5], ["fly, housefly", 11.63]], [["speech", 43.79], ["music", 29.51], ["groan", 11.65]], null, null, null, [["speech", 49.73], ["vehicle", 6.75], ["buzz", 6.21]], null, [["speech", 51.1], ["music", 5.07], ["eruption", 2.55]], null, null, [["livestock, farm animals, working animals", 22.33], ["cattle, bovinae", 19.66], ["speech", 17.89]], [["mosquito", 22.11], ["fly, housefly", 20.3], ["insect", 18.79]], null], "duration": [-0.33, 2.07, 29.9, 12.04, -0.4, 1.52, 1.75, 7.52, 0.47, 2.12, 1.44, -0.17, 10.8, 5.22, 0.47]} \ No newline at end of file diff --git a/annotations_1/CWS1CWSAmjs_filtered.json b/annotations_1/CWS1CWSAmjs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..477fbde73e320da51fd5f67d7ccc6fadcd3899e2 --- /dev/null +++ b/annotations_1/CWS1CWSAmjs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.14], [24.0, 28.38], [33.0, 33.64], [35.0, 39.09], [41.0, 42.47], [68.0, 68.72], [86.0, 91.1], [110.0, 109.95], [120.0, 120.31], [129.0, 137.12], [140.0, 148.56], [156.0, 157.81], [159.0, 160.89]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 46.5, 0.0, 33.24, 0.0, 0.0, 30.52, 0.0, 0.0, 29.36, 32.31, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 47.5], ["speech", 18.34], ["throbbing", 6.64]], null, [["music", 38.5], ["throbbing", 21.66], ["speech", 15.88]], null, null, [["hum", 34.46], ["mains hum", 14.03], ["music", 10.37]], null, null, [["throbbing", 32.43], ["music", 29.38], ["hum", 12.23]], [["music", 63.9], ["speech", 20.95], ["sidetone", 3.3]], null, null], "duration": [0.14, 4.38, 0.64, 4.09, 1.47, 0.72, 5.1, -0.05, 0.31, 8.12, 8.56, 1.81, 1.89]} \ No newline at end of file diff --git a/annotations_1/CXdc2L3QH9U_filtered.json b/annotations_1/CXdc2L3QH9U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9df6827881d56cadf5c3b06c17293d5228b29336 --- /dev/null +++ b/annotations_1/CXdc2L3QH9U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [5.0, 5.71], [16.0, 16.44], [17.0, 17.98], [21.0, 21.73], [24.0, 25.2], [27.0, 28.29], [30.0, 30.97], [35.0, 35.83], [37.0, 41.34], [48.0, 49.6], [58.0, 59.12], [62.0, 62.75], [69.0, 69.85], [75.0, 75.14], [77.0, 78.33], [86.0, 85.55], [87.0, 86.81], [98.0, 98.34], [100.0, 108.04], [117.0, 117.49], [121.0, 124.34], [126.0, 127.43], [128.0, 134.92]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.41, 0.0, 69.74, 0.0, 33.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 29.74], ["speech", 13.48], ["brass instrument", 6.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 66.51], ["trombone", 5.85], ["musical instrument", 4.26]]], "duration": [0.45, 0.71, 0.44, 0.98, 0.73, 1.2, 1.29, 0.97, 0.83, 4.34, 1.6, 1.12, 0.75, 0.85, 0.14, 1.33, -0.45, -0.19, 0.34, 8.04, 0.49, 3.34, 1.43, 6.92]} \ No newline at end of file diff --git a/annotations_1/CY5X8DD0ams_filtered.json b/annotations_1/CY5X8DD0ams_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0aa09d03a7d38d946a912050c712e45d02022560 --- /dev/null +++ b/annotations_1/CY5X8DD0ams_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.41], [1.0, 7.77], [24.0, 23.8], [33.0, 34.21], [37.0, 46.5], [64.0, 73.7], [77.0, 77.85], [82.0, 96.79], [108.0, 108.11], [109.0, 110.05], [111.0, 111.86]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 33.71, 0.0, 0.0, 36.52, 28.43, 0.0, 33.37, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 23.97], ["music", 20.34], ["theremin", 7.59]], null, null, [["music", 45.16], ["speech", 16.84], ["quack", 15.7]], [["foghorn", 48.98], ["music", 10.67], ["cattle, bovinae", 8.89]], null, [["music", 59.44], ["musical instrument", 7.19], ["brass instrument", 6.61]], null, null, null], "duration": [0.41, 6.77, -0.2, 1.21, 9.5, 9.7, 0.85, 14.79, 0.11, 1.05, 0.86]} \ No newline at end of file diff --git a/annotations_1/CYGCwkmaa1s_filtered.json b/annotations_1/CYGCwkmaa1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aef270748c2b44ce39a000669989ec96bc93d9a5 --- /dev/null +++ b/annotations_1/CYGCwkmaa1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.8], [4.0, 5.66], [7.0, 7.2], [10.0, 11.26], [12.0, 12.7], [13.0, 15.03], [17.0, 19.25], [20.0, 20.41], [23.0, 56.03]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 92.15, 99.82, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.8, 1.66, 0.2, 1.26, 0.7, 2.03, 2.25, 0.41, 33.03]} \ No newline at end of file diff --git a/annotations_1/CYO8cs7VRMc_filtered.json b/annotations_1/CYO8cs7VRMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2f2428463c52cee63456914f1d4833cc1e40679 --- /dev/null +++ b/annotations_1/CYO8cs7VRMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[58.0, 61.05], [61.0, 61.5], [62.0, 63.12], [65.0, 69.21], [70.0, 69.87], [70.0, 70.14], [70.0, 78.9], [86.0, 96.03], [100.0, 122.1], [123.0, 123.36], [124.0, 124.5]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [29.26, 0.0, 0.0, 28.47, 0.0, 0.0, 30.01, 29.65, 29.39, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 43.58], ["mains hum", 24.28], ["throbbing", 8.54]], null, null, [["cattle, bovinae", 43.42], ["livestock, farm animals, working animals", 33.78], ["moo", 21.55]], null, null, [["hum", 21.5], ["mains hum", 18.13], ["whack, thwack", 7.03]], [["speech", 16.01], ["music", 12.99], ["hum", 9.83]], [["music", 36.9], ["animal", 7.59], ["outside, rural or natural", 6.19]], null, null], "duration": [3.05, 0.5, 1.12, 4.21, -0.13, 0.14, 8.9, 10.03, 22.1, 0.36, 0.5]} \ No newline at end of file diff --git a/annotations_1/CYQXYJIN3Jw_filtered.json b/annotations_1/CYQXYJIN3Jw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bab3fa95a04ad9050fca75a5ba12670d0e194902 --- /dev/null +++ b/annotations_1/CYQXYJIN3Jw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.66], [3.0, 3.32], [40.0, 40.78], [53.0, 54.09], [123.0, 125.17], [134.0, 135.53], [159.0, 165.87], [167.0, 168.24], [169.0, 170.73], [171.0, 171.81], [173.0, 174.48], [176.0, 176.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 96.29, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.66, 0.32, 0.78, 1.09, 2.17, 1.53, 6.87, 1.24, 1.73, 0.81, 1.48, 0.71]} \ No newline at end of file diff --git a/annotations_1/CYgNbOsiKtk_filtered.json b/annotations_1/CYgNbOsiKtk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f23cd83e7308607b8c9cbdfd1c22fcf143fa978 --- /dev/null +++ b/annotations_1/CYgNbOsiKtk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.68], [2.0, 8.46], [12.0, 23.46], [23.0, 23.53], [24.0, 32.64], [36.0, 38.15], [42.0, 42.9], [49.0, 48.84], [51.0, 56.05], [58.0, 58.19], [59.0, 58.75], [59.0, 60.42], [62.0, 64.45], [65.0, 66.06], [67.0, 68.03], [70.0, 75.91], [76.0, 104.01], [105.0, 105.34], [106.0, 105.7], [106.0, 105.87], [107.0, 107.99], [111.0, 113.39], [114.0, 115.96], [121.0, 121.85], [123.0, 127.04], [130.0, 131.77], [132.0, 132.88], [135.0, 135.06], [138.0, 143.45], [147.0, 147.09], [151.0, 152.42], [153.0, 164.03], [166.0, 166.31], [168.0, 169.01], [170.0, 174.77]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 39.34, 46.94, 0.0, 90.78, 73.67, 0.0, 0.0, 79.76, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 90.43, 93.13, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 88.64, 0.0, 0.0, 76.37, 0.0, 0.0, 87.37], "audiomae_on_audioset": [null, [["music", 54.88], ["speech", 9.46], ["theremin", 3.23]], [["music", 57.09], ["fart", 8.57], ["speech", 3.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.32, 6.46, 11.46, 0.53, 8.64, 2.15, 0.9, -0.16, 5.05, 0.19, -0.25, 1.42, 2.45, 1.06, 1.03, 5.91, 28.01, 0.34, -0.3, -0.13, 0.99, 2.39, 1.96, 0.85, 4.04, 1.77, 0.88, 0.06, 5.45, 0.09, 1.42, 11.03, 0.31, 1.01, 4.77]} \ No newline at end of file diff --git a/annotations_1/C_06Kac9rpg_filtered.json b/annotations_1/C_06Kac9rpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53d8d9fd4afa2bfa2d604338484d0c27a28219d3 --- /dev/null +++ b/annotations_1/C_06Kac9rpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [5.0, 5.66], [7.0, 8.51], [10.0, 10.23], [10.0, 10.64], [12.0, 13.17], [16.0, 23.99], [29.0, 29.64], [34.0, 35.8], [40.0, 41.71], [47.0, 47.76], [49.0, 49.92], [53.0, 54.04], [55.0, 55.83], [57.0, 58.31], [60.0, 70.5], [74.0, 73.62], [74.0, 73.68], [89.0, 91.34], [102.0, 105.92], [108.0, 110.88], [114.0, 116.41], [118.0, 118.67], [121.0, 174.5], [176.0, 175.83], [177.0, 177.33], [183.0, 184.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.33, 0.0, 0.0, 32.83, 32.23, 63.96, 62.07, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 71.45], ["electronic music", 3.27], ["musical instrument", 2.51]], null, null, [["beatboxing", 55.59], ["vocal music", 11.3], ["music", 9.72]], [["music", 60.97], ["beatboxing", 5.87], ["boing", 4.31]], null, null, null, null, null, null, null], "duration": [1.38, 0.66, 1.51, 0.23, 0.64, 1.17, 7.99, 0.64, 1.8, 1.71, 0.76, 0.92, 1.04, 0.83, 1.31, 10.5, -0.38, -0.32, 2.34, 3.92, 2.88, 2.41, 0.67, 53.5, -0.17, 0.33, 1.08]} \ No newline at end of file diff --git a/annotations_1/C_TfdNAXOwE_filtered.json b/annotations_1/C_TfdNAXOwE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..234fb225576a8471194372be396d107d945767d4 --- /dev/null +++ b/annotations_1/C_TfdNAXOwE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.51], [10.0, 13.98], [14.0, 18.47], [19.0, 22.87], [23.0, 26.87], [27.0, 30.3], [31.0, 34.82], [35.0, 41.71], [42.0, 47.56], [48.0, 52.52], [53.0, 56.39], [57.0, 58.94], [59.0, 62.82], [63.0, 68.49], [69.0, 73.04], [73.0, 76.84], [77.0, 87.4], [88.0, 97.85], [98.0, 99.49], [100.0, 107.84], [108.0, 111.4], [112.0, 122.79], [124.0, 125.76], [126.0, 130.99], [131.0, 147.19], [150.0, 158.33], [162.0, 162.97], [165.0, 166.33], [167.0, 171.29], [172.0, 173.4], [174.0, 174.99], [178.0, 179.05], [179.0, 180.3], [183.0, 183.79], [187.0, 187.52], [191.0, 193.29], [194.0, 195.13], [195.0, 196.69], [199.0, 202.31], [204.0, 205.14], [209.0, 209.68], [213.0, 214.57], [216.0, 215.91], [216.0, 216.97], [217.0, 218.46], [221.0, 222.61], [224.0, 224.21], [227.0, 227.43], [229.0, 241.34], [242.0, 245.13], [246.0, 247.67], [249.0, 251.31], [254.0, 255.58], [256.0, 256.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.17, 84.62, 78.72, 95.37, 73.82, 85.54, 81.17, 55.04, 86.09, 99.05, 99.4, 0.0, 86.82, 80.82, 93.6, 89.01, 98.99, 99.98, 0.0, 99.68, 89.72, 99.21, 0.0, 51.99, 43.38, 99.21, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.18, 52.45, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.48], ["ding", 9.89], ["chink, clink", 6.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.51, 3.98, 4.47, 3.87, 3.87, 3.3, 3.82, 6.71, 5.56, 4.52, 3.39, 1.94, 3.82, 5.49, 4.04, 3.84, 10.4, 9.85, 1.49, 7.84, 3.4, 10.79, 1.76, 4.99, 16.19, 8.33, 0.97, 1.33, 4.29, 1.4, 0.99, 1.05, 1.3, 0.79, 0.52, 2.29, 1.13, 1.69, 3.31, 1.14, 0.68, 1.57, -0.09, 0.97, 1.46, 1.61, 0.21, 0.43, 12.34, 3.13, 1.67, 2.31, 1.58, 0.15]} \ No newline at end of file diff --git a/annotations_1/C_fhEQGp9Hw_filtered.json b/annotations_1/C_fhEQGp9Hw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dad74d58c809418e265c9a8205364bdc196d2497 --- /dev/null +++ b/annotations_1/C_fhEQGp9Hw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.91], [9.0, 9.54], [14.0, 15.11], [16.0, 17.02], [18.0, 18.69], [22.0, 22.47], [23.0, 29.88], [30.0, 31.95], [33.0, 38.94], [47.0, 48.05], [49.0, 52.78], [54.0, 55.43], [64.0, 65.08], [66.0, 72.5], [73.0, 75.05], [76.0, 78.93], [83.0, 84.01], [86.0, 88.48], [90.0, 92.37], [94.0, 94.85], [97.0, 100.18], [101.0, 101.76], [104.0, 104.94], [108.0, 112.48], [114.0, 114.13], [119.0, 120.9], [122.0, 122.37], [123.0, 126.1]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.26, 0.0, 36.93, 0.0, 32.27, 0.0, 0.0, 49.22, 93.29, 87.92, 0.0, 72.16, 77.36, 0.0, 78.38, 0.0, 0.0, 57.17, 0.0, 0.0, 0.0, 62.58], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 39.01], ["whack, thwack", 9.51], ["whip", 7.16]], null, [["music", 44.25], ["didgeridoo", 6.71], ["synthesizer", 5.49]], null, [["hum", 54.99], ["mains hum", 12.88], ["throbbing", 8.37]], null, null, [["speech", 32.96], ["sidetone", 17.6], ["fly, housefly", 8.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.09, 0.54, 1.11, 1.02, 0.69, 0.47, 6.88, 1.95, 5.94, 1.05, 3.78, 1.43, 1.08, 6.5, 2.05, 2.93, 1.01, 2.48, 2.37, 0.85, 3.18, 0.76, 0.94, 4.48, 0.13, 1.9, 0.37, 3.1]} \ No newline at end of file diff --git a/annotations_1/Ca273QV9ik8_filtered.json b/annotations_1/Ca273QV9ik8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cabd13d940edd03827a99ddce932692bda23f4ba --- /dev/null +++ b/annotations_1/Ca273QV9ik8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[127.0, 133.73], [139.0, 141.94], [143.0, 146.03], [148.0, 155.44], [156.0, 156.69], [157.0, 215.82]], "keep_status": [true, false, true, false, false, false], "silence_prob": [29.94, 78.21, 48.48, 88.1, 0.0, 0.0], "audiomae_on_audioset": [[["music", 34.72], ["hum", 18.72], ["mains hum", 12.95]], null, [["hum", 14.02], ["whale vocalization", 11.55], ["eruption", 8.77]], null, null, null], "duration": [6.73, 2.94, 3.03, 7.44, 0.69, 58.82]} \ No newline at end of file diff --git a/annotations_1/CaQWWTLOzhY_filtered.json b/annotations_1/CaQWWTLOzhY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bb7ee24875c22cf71eb106ba298de84d042b122 --- /dev/null +++ b/annotations_1/CaQWWTLOzhY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.43], [13.0, 13.32], [14.0, 14.81], [17.0, 18.59], [25.0, 25.46], [30.0, 30.7], [36.0, 38.87], [51.0, 58.99], [66.0, 69.09], [72.0, 78.36], [80.0, 139.16], [140.0, 140.66], [143.0, 143.61], [148.0, 148.59], [149.0, 154.68], [156.0, 159.41], [163.0, 171.04], [172.0, 172.93], [174.0, 175.85], [177.0, 178.09], [179.0, 180.13]], "keep_status": [false, false, false, false, false, false, true, true, true, true, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.41, 49.45, 31.19, 30.58, 0.0, 0.0, 0.0, 0.0, 31.19, 52.22, 44.37, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 20.57], ["hum", 14.11], ["throbbing", 11.67]], [["hum", 33.94], ["throbbing", 22.72], ["music", 10.89]], [["music", 46.07], ["boing", 13.44], ["hum", 9.25]], [["speech", 24.16], ["hum", 22.93], ["throbbing", 22.11]], null, null, null, null, [["speech", 50.34], ["buzz", 3.01], ["hum", 2.93]], null, [["music", 45.03], ["hum", 13.57], ["throbbing", 4.82]], null, null, null, null], "duration": [0.43, 0.32, 0.81, 1.59, 0.46, 0.7, 2.87, 7.99, 3.09, 6.36, 59.16, 0.66, 0.61, 0.59, 5.68, 3.41, 8.04, 0.93, 1.85, 1.09, 1.13]} \ No newline at end of file diff --git a/annotations_1/Cd1Q6LsOR8o_filtered.json b/annotations_1/Cd1Q6LsOR8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d649d1a18fe407761009eeb2cda2c2563336e62a --- /dev/null +++ b/annotations_1/Cd1Q6LsOR8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.84], [1.0, 0.87], [1.0, 3.3], [5.0, 5.12], [6.0, 7.32], [8.0, 8.19], [9.0, 9.29], [10.0, 20.75], [23.0, 28.68], [31.0, 31.16], [34.0, 35.53], [39.0, 40.05], [42.0, 42.13], [43.0, 44.27], [49.0, 49.92], [50.0, 52.17], [58.0, 58.95], [60.0, 60.59], [62.0, 62.4], [64.0, 64.56], [66.0, 66.83], [68.0, 68.57], [70.0, 70.66], [76.0, 76.42], [79.0, 79.3], [89.0, 89.68], [96.0, 96.84], [99.0, 100.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 81.53, 0.0, 0.0, 0.0, 0.0, 43.15, 55.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 56.59], ["gong", 8.6], ["musical instrument", 6.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.16, -0.13, 2.3, 0.12, 1.32, 0.19, 0.29, 10.75, 5.68, 0.16, 1.53, 1.05, 0.13, 1.27, 0.92, 2.17, 0.95, 0.59, 0.4, 0.56, 0.83, 0.57, 0.66, 0.42, 0.3, 0.68, 0.84, 1.11]} \ No newline at end of file diff --git a/annotations_1/CdVuOYKr2cQ_filtered.json b/annotations_1/CdVuOYKr2cQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24e9e70c3bbff7fad5b7ed861acc66338addd5aa --- /dev/null +++ b/annotations_1/CdVuOYKr2cQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.86], [29.0, 46.5], [53.0, 63.8], [68.0, 84.23], [87.0, 87.51], [88.0, 93.46], [98.0, 101.44], [103.0, 103.65], [105.0, 106.24], [107.0, 108.57], [110.0, 113.16], [115.0, 115.91], [116.0, 117.64], [118.0, 128.46]], "keep_status": [true, true, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [30.34, 30.47, 30.44, 30.48, 0.0, 32.61, 37.18, 0.0, 0.0, 0.0, 32.64, 0.0, 0.0, 32.66], "audiomae_on_audioset": [[["didgeridoo", 33.66], ["music", 24.78], ["speech", 5.27]], [["throbbing", 22.18], ["hum", 21.98], ["music", 20.42]], [["music", 35.06], ["speech", 29.5], ["cacophony", 6.83]], [["music", 38.88], ["hum", 19.78], ["throbbing", 15.99]], null, [["speech", 80.2], ["breaking", 3.5], ["inside, small room", 2.15]], [["music", 50.59], ["hum", 5.65], ["frog", 2.6]], null, null, null, [["music", 31.19], ["didgeridoo", 25.46], ["speech", 16.72]], null, null, [["music", 23.25], ["speech", 23.25], ["throbbing", 13.16]]], "duration": [2.86, 17.5, 10.8, 16.23, 0.51, 5.46, 3.44, 0.65, 1.24, 1.57, 3.16, 0.91, 1.64, 10.46]} \ No newline at end of file diff --git a/annotations_1/CdppQAIYPzY_filtered.json b/annotations_1/CdppQAIYPzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23df3f57bbc39d41747b664c2f262eda1bc24c7c --- /dev/null +++ b/annotations_1/CdppQAIYPzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.28], [5.0, 6.66], [9.0, 10.03], [10.0, 12.8], [17.0, 19.65], [20.0, 21.93], [22.0, 28.98], [29.0, 35.48], [37.0, 37.69], [39.0, 39.95], [42.0, 45.37], [46.0, 46.58], [51.0, 51.92], [52.0, 54.18], [55.0, 56.78], [58.0, 68.86], [72.0, 72.27], [74.0, 73.95], [74.0, 102.81], [106.0, 114.76], [118.0, 127.48], [130.0, 139.73], [143.0, 146.37], [148.0, 149.03], [149.0, 173.43], [174.0, 174.65], [176.0, 176.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 89.72, 67.13, 0.0, 60.6, 52.92, 0.0, 0.0, 63.53, 0.0, 0.0, 57.17, 0.0, 43.9, 0.0, 0.0, 33.63, 30.03, 30.54, 29.9, 33.19, 0.0, 31.42, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.69], ["hum", 19.34], ["speech", 13.87]], null, null, [["music", 67.09], ["hum", 10.27], ["mains hum", 4.34]], [["smash, crash", 17.22], ["throbbing", 9.28], ["breaking", 6.06]], [["music", 55.04], ["speech", 18.04], ["smash, crash", 6.54]], [["music", 57.41], ["smash, crash", 10.72], ["whack, thwack", 5.82]], [["music", 37.77], ["creak", 14.12], ["hum", 9.87]], null, [["music", 68.98], ["hum", 3.94], ["electronic music", 3.91]], null, null], "duration": [1.28, 1.66, 1.03, 2.8, 2.65, 1.93, 6.98, 6.48, 0.69, 0.95, 3.37, 0.58, 0.92, 2.18, 1.78, 10.86, 0.27, -0.05, 28.81, 8.76, 9.48, 9.73, 3.37, 1.03, 24.43, 0.65, 0.88]} \ No newline at end of file diff --git a/annotations_1/CeE4xdFmuVs_filtered.json b/annotations_1/CeE4xdFmuVs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8f392905a32dee4ad310694757e724fadb3225b --- /dev/null +++ b/annotations_1/CeE4xdFmuVs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.04], [8.0, 8.09], [13.0, 13.63], [26.0, 27.03], [27.0, 28.48], [30.0, 30.77], [39.0, 39.36], [43.0, 43.51], [44.0, 44.86], [46.0, 46.36], [58.0, 59.71], [60.0, 60.83], [66.0, 67.07], [67.0, 71.58], [75.0, 74.68], [76.0, 76.64], [78.0, 79.2], [85.0, 85.87], [88.0, 91.13], [95.0, 96.26], [98.0, 105.43], [112.0, 113.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.02, 0.0, 0.0, 0.0, 0.0, 68.67, 0.0, 65.67, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.09, 0.63, 1.03, 1.48, 0.77, 0.36, 0.51, 0.86, 0.36, 1.71, 0.83, 1.07, 4.58, -0.32, 0.64, 1.2, 0.87, 3.13, 1.26, 7.43, 1.21]} \ No newline at end of file diff --git a/annotations_1/CeJQF4L0hx8_filtered.json b/annotations_1/CeJQF4L0hx8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/CeJQF4L0hx8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/CeX8drgioLs_filtered.json b/annotations_1/CeX8drgioLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bb29ebed7fa4d5f6645a6593bcb4c37ce8756f6 --- /dev/null +++ b/annotations_1/CeX8drgioLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.92], [9.0, 10.94], [16.0, 16.98], [18.0, 18.72], [20.0, 20.19], [21.0, 21.73], [22.0, 24.8], [37.0, 37.64], [39.0, 40.12], [44.0, 43.7], [49.0, 50.5], [53.0, 67.91], [68.0, 69.79], [70.0, 70.56], [83.0, 84.69], [86.0, 86.97], [89.0, 89.43], [92.0, 93.34], [95.0, 95.67], [98.0, 98.41], [102.0, 102.39], [106.0, 106.39], [107.0, 108.82], [114.0, 114.2], [118.0, 118.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.13, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 52.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.92, 1.94, 0.98, 0.72, 0.19, 0.73, 2.8, 0.64, 1.12, -0.3, 1.5, 14.91, 1.79, 0.56, 1.69, 0.97, 0.43, 1.34, 0.67, 0.41, 0.39, 0.39, 1.82, 0.2, 0.05]} \ No newline at end of file diff --git a/annotations_1/CfRKGG52TPY_filtered.json b/annotations_1/CfRKGG52TPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e02b0b8f7d5fc6f2073256f1f2beecb2d0b9d545 --- /dev/null +++ b/annotations_1/CfRKGG52TPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.17], [6.0, 15.82], [23.0, 30.94], [41.0, 46.57], [51.0, 52.73], [56.0, 57.13], [61.0, 62.88], [67.0, 89.01], [89.0, 89.87], [91.0, 92.08], [94.0, 94.17], [96.0, 96.65], [99.0, 99.76], [109.0, 109.32]], "keep_status": [false, true, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 32.88, 29.04, 28.87, 0.0, 0.0, 0.0, 29.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 23.86], ["speech", 19.88], ["theremin", 19.42]], [["speech", 49.4], ["music", 14.29], ["foghorn", 10.9]], [["foghorn", 33.59], ["music", 14.99], ["speech", 12.17]], null, null, null, [["speech", 29.56], ["music", 18.78], ["foghorn", 7.16]], null, null, null, null, null, null], "duration": [0.17, 9.82, 7.94, 5.57, 1.73, 1.13, 1.88, 22.01, 0.87, 1.08, 0.17, 0.65, 0.76, 0.32]} \ No newline at end of file diff --git a/annotations_1/CfaPUQMa1gc_filtered.json b/annotations_1/CfaPUQMa1gc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ea7568a7a4af81490ccdb48267ccb24759d4c68 --- /dev/null +++ b/annotations_1/CfaPUQMa1gc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.71], [14.0, 17.56], [19.0, 25.93], [30.0, 54.58], [59.0, 62.63], [65.0, 65.6], [67.0, 67.9], [71.0, 72.93], [73.0, 76.23], [78.0, 84.38], [85.0, 88.69]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 37.5, 30.63, 29.85, 53.34, 0.0, 0.0, 0.0, 44.78, 44.23, 37.73], "audiomae_on_audioset": [null, [["music", 65.16], ["electronic music", 10.78], ["throbbing", 4.25]], [["music", 45.14], ["speech", 20.33], ["didgeridoo", 9.79]], [["whack, thwack", 16.39], ["music", 13.89], ["sound effect", 5.82]], null, null, null, null, [["music", 33.16], ["sidetone", 20.49], ["speech", 13.82]], [["sidetone", 92.73], ["speech", 3.2], ["music", 3.14]], [["music", 80.96], ["sidetone", 4.63], ["speech", 1.81]]], "duration": [0.71, 3.56, 6.93, 24.58, 3.63, 0.6, 0.9, 1.93, 3.23, 6.38, 3.69]} \ No newline at end of file diff --git a/annotations_1/CflcJ-HSA_Y_filtered.json b/annotations_1/CflcJ-HSA_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13ce1e9e7226f2e951e2fc58f3403aa667cfbda4 --- /dev/null +++ b/annotations_1/CflcJ-HSA_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 130.62]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [63.62]} \ No newline at end of file diff --git a/annotations_1/CfsveeSvZNw_filtered.json b/annotations_1/CfsveeSvZNw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1803231d155156975c07e1e976bd3a5cfbf1ce6 --- /dev/null +++ b/annotations_1/CfsveeSvZNw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 29.13], [31.0, 33.12], [34.0, 36.04], [37.0, 42.5], [43.0, 42.75], [45.0, 45.6], [47.0, 48.0], [50.0, 51.27], [51.0, 51.31], [51.0, 52.07], [57.0, 57.37], [58.0, 58.45], [63.0, 63.71], [64.0, 66.68], [67.0, 71.46], [73.0, 73.92], [75.0, 76.15], [80.0, 81.48], [85.0, 85.87], [88.0, 88.13], [94.0, 95.39], [100.0, 102.1], [104.0, 105.26], [106.0, 107.82], [110.0, 110.46], [112.0, 112.82], [113.0, 113.68], [118.0, 120.36], [122.0, 124.55], [126.0, 126.08], [128.0, 129.05], [131.0, 131.21], [132.0, 133.95], [135.0, 135.89], [139.0, 139.68], [141.0, 143.63], [145.0, 145.54], [148.0, 148.8], [151.0, 151.55], [154.0, 154.38], [157.0, 158.67], [159.0, 160.84], [162.0, 167.09], [167.0, 169.06], [170.0, 171.51], [172.0, 173.23], [174.0, 174.56], [176.0, 176.81]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.3, 43.58, 49.09, 41.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67, 77.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 45.69, 49.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 97.64, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 28.23], ["music", 19.06], ["hum", 7.85]], [["music", 49.32], ["noise", 9.71], ["didgeridoo", 8.5]], [["music", 39.08], ["singing bowl", 6.59], ["musical instrument", 4.97]], [["music", 67.26], ["musical instrument", 1.93], ["speech", 1.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["grunt", 13.58], ["cattle, bovinae", 13.1], ["moo", 12.74]], [["animal", 44.8], ["grunt", 13.0], ["livestock, farm animals, working animals", 9.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.13, 2.12, 2.04, 5.5, -0.25, 0.6, 1.0, 1.27, 0.31, 1.07, 0.37, 0.45, 0.71, 2.68, 4.46, 0.92, 1.15, 1.48, 0.87, 0.13, 1.39, 2.1, 1.26, 1.82, 0.46, 0.82, 0.68, 2.36, 2.55, 0.08, 1.05, 0.21, 1.95, 0.89, 0.68, 2.63, 0.54, 0.8, 0.55, 0.38, 1.67, 1.84, 5.09, 2.06, 1.51, 1.23, 0.56, 0.81]} \ No newline at end of file diff --git a/annotations_1/CgmI90T4Efk_filtered.json b/annotations_1/CgmI90T4Efk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d022fe271562e4f2f70cf31825fef25d6f66cc4 --- /dev/null +++ b/annotations_1/CgmI90T4Efk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.06], [8.0, 10.34], [11.0, 12.51], [19.0, 55.44], [58.0, 96.26], [99.0, 111.18], [111.0, 111.84], [114.0, 125.98], [126.0, 126.33], [127.0, 165.7], [169.0, 170.8], [174.0, 174.77]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [44.63, 55.74, 0.0, 0.0, 0.0, 28.64, 0.0, 28.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 30.95], ["mains hum", 17.41], ["music", 11.13]], null, null, null, null, [["livestock, farm animals, working animals", 19.07], ["speech", 12.38], ["vehicle", 9.77]], null, [["music", 67.08], ["hum", 7.17], ["throbbing", 4.47]], null, null, null, null], "duration": [3.06, 2.34, 1.51, 36.44, 38.26, 12.18, 0.84, 11.98, 0.33, 38.7, 1.8, 0.77]} \ No newline at end of file diff --git a/annotations_1/CgwNoOUtr7s_filtered.json b/annotations_1/CgwNoOUtr7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0438405dbf3c7afe6faec9c2c8d4c8709f45f925 --- /dev/null +++ b/annotations_1/CgwNoOUtr7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.21], [6.0, 6.49], [10.0, 11.26], [12.0, 13.14], [14.0, 25.44], [27.0, 28.27], [29.0, 30.3], [32.0, 33.1], [40.0, 42.16], [44.0, 44.78], [46.0, 54.67], [55.0, 55.49], [56.0, 56.13], [59.0, 60.22], [62.0, 64.94], [66.0, 66.82], [71.0, 80.03], [85.0, 87.27], [91.0, 92.7], [94.0, 94.59], [100.0, 101.21], [101.0, 103.89], [106.0, 113.34], [114.0, 115.38], [118.0, 118.13], [120.0, 131.99], [132.0, 133.54], [137.0, 139.13], [141.0, 141.86], [151.0, 153.08], [154.0, 155.31], [156.0, 158.58], [159.0, 159.83], [162.0, 165.52], [167.0, 167.63], [169.0, 170.31], [172.0, 172.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 41.83, 0.0, 0.0, 0.0, 57.81, 0.0, 36.95, 0.0, 0.0, 0.0, 39.72, 0.0, 41.36, 43.66, 0.0, 0.0, 0.0, 38.22, 39.55, 0.0, 0.0, 36.64, 0.0, 39.74, 0.0, 36.39, 0.0, 41.22, 0.0, 43.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 48.47], ["speech", 26.61], ["clarinet", 6.02]], null, null, null, null, null, [["music", 56.43], ["speech", 4.64], ["didgeridoo", 4.06]], null, null, null, [["music", 80.95], ["speech", 3.89], ["musical instrument", 3.27]], null, [["music", 49.58], ["speech", 17.45], ["ice cream truck, ice cream van", 9.94]], [["music", 59.52], ["didgeridoo", 3.38], ["guitar", 2.09]], null, null, null, [["music", 56.79], ["speech", 6.16], ["musical instrument", 3.37]], [["music", 50.42], ["ice cream truck, ice cream van", 13.93], ["speech", 12.63]], null, null, [["music", 61.2], ["ice cream truck, ice cream van", 9.28], ["organ", 3.08]], null, [["music", 59.99], ["musical instrument", 4.54], ["marimba, xylophone", 4.13]], null, [["ice cream truck, ice cream van", 49.48], ["music", 39.08], ["didgeridoo", 1.24]], null, [["music", 66.7], ["musical instrument", 3.22], ["guitar", 2.65]], null, [["music", 70.46], ["synthesizer", 2.98], ["marimba, xylophone", 1.59]], null, null, null], "duration": [0.21, 0.49, 1.26, 1.14, 11.44, 1.27, 1.3, 1.1, 2.16, 0.78, 8.67, 0.49, 0.13, 1.22, 2.94, 0.82, 9.03, 2.27, 1.7, 0.59, 1.21, 2.89, 7.34, 1.38, 0.13, 11.99, 1.54, 2.13, 0.86, 2.08, 1.31, 2.58, 0.83, 3.52, 0.63, 1.31, 0.76]} \ No newline at end of file diff --git a/annotations_1/Ch1DsDy-osI_filtered.json b/annotations_1/Ch1DsDy-osI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbedb7b0b7a7a612ce53f373c6fea31bd1e2c8ee --- /dev/null +++ b/annotations_1/Ch1DsDy-osI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.07], [3.0, 5.21], [12.0, 13.36], [15.0, 16.21], [19.0, 20.06], [22.0, 23.38], [24.0, 26.35], [27.0, 28.19], [35.0, 35.58], [37.0, 37.54], [46.0, 47.24], [54.0, 55.07], [56.0, 56.61], [59.0, 59.46], [63.0, 62.85], [70.0, 71.71], [78.0, 81.9], [88.0, 88.8], [90.0, 90.39], [91.0, 91.71], [95.0, 95.74], [96.0, 96.65], [98.0, 98.85], [106.0, 106.41], [118.0, 119.16], [128.0, 127.85], [129.0, 129.03], [130.0, 130.32], [141.0, 142.55], [146.0, 146.84], [151.0, 151.39], [152.0, 154.04], [156.0, 156.14], [161.0, 162.95], [164.0, 165.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 54.23, 0.0, 0.0, 0.0, 0.0, 63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 84.6], ["sidetone", 2.83], ["boing", 1.65]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.07, 2.21, 1.36, 1.21, 1.06, 1.38, 2.35, 1.19, 0.58, 0.54, 1.24, 1.07, 0.61, 0.46, -0.15, 1.71, 3.9, 0.8, 0.39, 0.71, 0.74, 0.65, 0.85, 0.41, 1.16, -0.15, 0.03, 0.32, 1.55, 0.84, 0.39, 2.04, 0.14, 1.95, 1.77]} \ No newline at end of file diff --git a/annotations_1/ChD8PRF0hBg_filtered.json b/annotations_1/ChD8PRF0hBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79ae9c682a69853332d280aec6ef2f8556a4e9fc --- /dev/null +++ b/annotations_1/ChD8PRF0hBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.16], [6.0, 8.45], [10.0, 23.08], [25.0, 24.68], [25.0, 25.62], [26.0, 26.35], [31.0, 32.04], [32.0, 32.21], [36.0, 49.45], [64.0, 65.06], [72.0, 73.23], [75.0, 77.26], [81.0, 85.58], [87.0, 89.8], [91.0, 92.11], [95.0, 95.62], [97.0, 97.95], [98.0, 99.69], [112.0, 114.18], [115.0, 120.88], [122.0, 123.42], [125.0, 125.1], [125.0, 125.63], [127.0, 130.25], [131.0, 136.27], [141.0, 150.55], [151.0, 164.54]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 99.87, 61.97, 0.0, 0.0, 0.0, 0.0, 0.0, 47.74, 0.0, 0.0, 99.65, 96.77, 97.64, 0.0, 0.0, 0.0, 0.0, 91.3, 94.22, 0.0, 0.0, 0.0, 35.74, 31.81, 30.82, 33.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 44.58], ["music", 14.42], ["electric shaver, electric razor", 6.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.03], ["noise", 8.73], ["music", 7.72]], [["speech", 42.5], ["music", 21.15], ["mains hum", 8.48]], [["speech", 51.5], ["music", 20.08], ["breaking", 9.4]], [["music", 30.66], ["speech", 29.1], ["throbbing", 11.57]]], "duration": [1.16, 2.45, 13.08, -0.32, 0.62, 0.35, 1.04, 0.21, 13.45, 1.06, 1.23, 2.26, 4.58, 2.8, 1.11, 0.62, 0.95, 1.69, 2.18, 5.88, 1.42, 0.1, 0.63, 3.25, 5.27, 9.55, 13.54]} \ No newline at end of file diff --git a/annotations_1/ChIQpmBLPAo_filtered.json b/annotations_1/ChIQpmBLPAo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af6c4e24489b20be76441611341c398e6666abcc --- /dev/null +++ b/annotations_1/ChIQpmBLPAo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.23], [15.0, 16.11], [17.0, 19.11], [19.0, 19.16], [19.0, 19.68], [20.0, 22.1], [26.0, 26.89], [28.0, 66.99], [73.0, 73.58], [76.0, 77.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.9, 0.0, 0.0, 35.91, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 66.38], ["music", 6.03], ["rumble", 4.68]], null, null, [["speech", 60.03], ["hum", 15.32], ["music", 7.58]], null, null, null, null], "duration": [0.23, 1.11, 2.11, 0.16, 0.68, 2.1, 0.89, 38.99, 0.58, 1.14]} \ No newline at end of file diff --git a/annotations_1/CiqtsKGMblU_filtered.json b/annotations_1/CiqtsKGMblU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c1beea76ae4d749643bf69d0d890f0f46742b4d --- /dev/null +++ b/annotations_1/CiqtsKGMblU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.07], [10.0, 11.69], [14.0, 15.74], [16.0, 20.22], [22.0, 25.2], [27.0, 28.43], [31.0, 31.58], [33.0, 39.01], [40.0, 41.52], [42.0, 43.33], [44.0, 50.06], [51.0, 53.28], [56.0, 57.89], [60.0, 60.66], [61.0, 62.28], [63.0, 63.96], [65.0, 66.9], [69.0, 76.37], [77.0, 84.43], [86.0, 90.09], [91.0, 91.22], [95.0, 96.26], [97.0, 98.29], [105.0, 106.68], [110.0, 111.13], [114.0, 115.4], [116.0, 117.85], [119.0, 126.77], [130.0, 150.11], [152.0, 173.35]], "keep_status": [false, false, false, true, false, false, false, true, false, false, true, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [29.16, 0.0, 0.0, 29.51, 27.87, 0.0, 0.0, 29.45, 0.0, 0.0, 29.88, 40.43, 0.0, 0.0, 0.0, 0.0, 0.0, 28.68, 27.87, 28.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.94, 27.91, 28.2], "audiomae_on_audioset": [[["music", 72.52], ["electronic music", 4.27], ["didgeridoo", 3.19]], null, null, [["music", 39.59], ["musical instrument", 13.23], ["noise", 5.9]], [["mains hum", 34.83], ["speech", 18.16], ["hum", 17.23]], null, null, [["speech", 27.86], ["music", 14.18], ["cattle, bovinae", 8.8]], null, null, [["music", 52.48], ["tabla", 6.8], ["percussion", 5.07]], [["music", 52.64], ["ambient music", 8.46], ["electronic music", 4.56]], null, null, null, null, null, [["music", 17.0], ["mains hum", 12.84], ["hum", 10.6]], [["music", 18.1], ["boat, water vehicle", 9.16], ["ship", 8.6]], [["speech", 52.42], ["music", 21.19], ["vehicle", 7.25]], null, null, null, null, null, null, null, [["speech", 14.4], ["whack, thwack", 13.27], ["music", 10.41]], [["music", 80.16], ["electronic music", 2.2], ["speech", 1.46]], [["music", 46.99], ["noise", 10.81], ["speech", 7.88]]], "duration": [6.07, 1.69, 1.74, 4.22, 3.2, 1.43, 0.58, 6.01, 1.52, 1.33, 6.06, 2.28, 1.89, 0.66, 1.28, 0.96, 1.9, 7.37, 7.43, 4.09, 0.22, 1.26, 1.29, 1.68, 1.13, 1.4, 1.85, 7.77, 20.11, 21.35]} \ No newline at end of file diff --git a/annotations_1/Cj80JkVCCpg_filtered.json b/annotations_1/Cj80JkVCCpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1f25c2c38cd0d2fbc3a9033b8b64d6ba4d3d108 --- /dev/null +++ b/annotations_1/Cj80JkVCCpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.31], [7.0, 8.31], [10.0, 25.15], [28.0, 31.65]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 37.07, 29.48], "audiomae_on_audioset": [null, null, [["hum", 57.89], ["throbbing", 22.58], ["mains hum", 7.27]], [["music", 63.1], ["cacophony", 3.86], ["musical instrument", 3.81]]], "duration": [0.31, 1.31, 15.15, 3.65]} \ No newline at end of file diff --git a/annotations_1/CjXwJJQ-8XM_filtered.json b/annotations_1/CjXwJJQ-8XM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf0c6fec050a41c64404ee2b22f65262a73528cd --- /dev/null +++ b/annotations_1/CjXwJJQ-8XM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.61], [4.0, 4.65], [10.0, 20.46], [23.0, 26.27], [33.0, 40.69], [41.0, 41.07], [46.0, 49.64], [50.0, 49.94], [50.0, 59.0], [61.0, 60.71], [61.0, 61.69], [62.0, 62.63], [63.0, 64.62], [66.0, 76.89], [77.0, 76.94]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.3, 32.0, 43.74, 0.0, 60.32, 0.0, 74.13, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0], "audiomae_on_audioset": [null, null, [["music", 42.79], ["laughter", 5.03], ["speech", 4.56]], [["whimper", 31.22], ["crying, sobbing", 28.21], ["baby cry, infant cry", 11.69]], [["whale vocalization", 12.88], ["horse", 5.78], ["crying, sobbing", 4.42]], null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 0.65, 10.46, 3.27, 7.69, 0.07, 3.64, -0.06, 9.0, -0.29, 0.69, 0.63, 1.62, 10.89, -0.06]} \ No newline at end of file diff --git a/annotations_1/CkAf_qzHNwo_filtered.json b/annotations_1/CkAf_qzHNwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a1f1e8230bfbbadef5be3af3cdfb129eddd1bb6 --- /dev/null +++ b/annotations_1/CkAf_qzHNwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.67], [4.0, 5.26], [7.0, 36.9], [40.0, 82.12], [85.0, 166.85], [169.0, 182.92]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.12, 0.0, 0.0, 29.08], "audiomae_on_audioset": [null, null, [["whack, thwack", 17.26], ["speech", 13.89], ["fly, housefly", 9.47]], null, null, [["music", 81.24], ["cacophony", 1.56], ["sound effect", 1.22]]], "duration": [1.67, 1.26, 29.9, 42.12, 81.85, 13.92]} \ No newline at end of file diff --git a/annotations_1/ClOGZ8IiO90_filtered.json b/annotations_1/ClOGZ8IiO90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..697562f6e3d5e0d0bbb8310742c2624c3376b87b --- /dev/null +++ b/annotations_1/ClOGZ8IiO90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.86], [4.0, 5.54], [6.0, 6.49], [8.0, 23.01], [27.0, 31.21], [38.0, 40.44], [45.0, 54.99], [58.0, 57.89], [58.0, 79.56], [82.0, 85.95], [89.0, 97.71], [101.0, 102.56], [104.0, 105.19], [107.0, 109.61], [113.0, 114.69], [117.0, 120.24], [121.0, 121.93], [131.0, 132.6], [136.0, 149.0], [151.0, 153.22], [154.0, 154.25], [155.0, 155.33], [157.0, 158.43], [160.0, 161.18], [163.0, 168.05], [170.0, 171.58]], "keep_status": [false, false, false, true, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.79, 29.92, 30.74, 29.34, 0.0, 29.45, 30.72, 58.38, 0.0, 0.0, 99.98, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 15.88], ["livestock, farm animals, working animals", 13.31], ["cattle, bovinae", 12.25]], [["cattle, bovinae", 41.03], ["livestock, farm animals, working animals", 21.0], ["moo", 14.57]], [["music", 38.24], ["speech", 20.14], ["sidetone", 5.75]], [["music", 37.18], ["groan", 7.36], ["didgeridoo", 6.51]], null, [["music", 65.72], ["groan", 5.44], ["bleat", 5.23]], [["music", 17.64], ["cattle, bovinae", 10.01], ["speech", 8.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 1.54, 0.49, 15.01, 4.21, 2.44, 9.99, -0.11, 21.56, 3.95, 8.71, 1.56, 1.19, 2.61, 1.69, 3.24, 0.93, 1.6, 13.0, 2.22, 0.25, 0.33, 1.43, 1.18, 5.05, 1.58]} \ No newline at end of file diff --git a/annotations_1/Cm5NLiqmVtk_filtered.json b/annotations_1/Cm5NLiqmVtk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8826edec8de02592f076c1397eff904cb72928ef --- /dev/null +++ b/annotations_1/Cm5NLiqmVtk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.26], [8.0, 10.74], [12.0, 32.58], [33.0, 36.68], [38.0, 41.71], [43.0, 45.0], [47.0, 48.93], [50.0, 53.81], [55.0, 56.78], [58.0, 85.19], [86.0, 87.47], [92.0, 102.0], [105.0, 129.12]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 80.82, 72.9, 76.86, 75.23, 89.01, 0.0, 39.09, 0.0, 32.31, 0.0, 31.92, 30.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 28.61], ["theremin", 25.8], ["hum", 9.0]], null, [["music", 48.66], ["speech", 16.05], ["hum", 10.13]], null, [["music", 29.66], ["speech", 16.98], ["foghorn", 7.33]], [["music", 26.68], ["didgeridoo", 21.05], ["musical instrument", 5.11]]], "duration": [1.26, 2.74, 20.58, 3.68, 3.71, 2.0, 1.93, 3.81, 1.78, 27.19, 1.47, 10.0, 24.12]} \ No newline at end of file diff --git a/annotations_1/Cm6FChNhtSc_filtered.json b/annotations_1/Cm6FChNhtSc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea6cb35f4671b3d95add1e984f912271e827f2f1 --- /dev/null +++ b/annotations_1/Cm6FChNhtSc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.15], [8.0, 8.88], [11.0, 12.14], [18.0, 21.29], [21.0, 21.34], [26.0, 27.24], [30.0, 31.18], [36.0, 36.68], [38.0, 38.31], [39.0, 39.88], [42.0, 46.04], [48.0, 47.71], [53.0, 54.55], [56.0, 60.62], [62.0, 62.33], [63.0, 68.23], [71.0, 71.41], [72.0, 73.11], [75.0, 76.62], [78.0, 80.11], [88.0, 89.11], [92.0, 92.64], [96.0, 99.99], [105.0, 105.12], [108.0, 110.66], [114.0, 114.56], [115.0, 116.04], [127.0, 129.98], [132.0, 132.61]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.35, 0.0, 0.0, 38.04, 0.0, 32.68, 0.0, 0.0, 0.0, 36.35, 0.0, 0.0, 35.02, 0.0, 33.72, 0.0, 0.0, 60.98, 0.0], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 35.58], ["insect", 21.53], ["cattle, bovinae", 6.43]], null, null, null, null, null, null, [["fly, housefly", 33.87], ["mosquito", 20.16], ["insect", 3.6]], null, null, [["whale vocalization", 28.84], ["speech", 13.51], ["cattle, bovinae", 9.02]], null, [["whale vocalization", 33.05], ["speech", 20.92], ["mosquito", 5.43]], null, null, null, [["music", 22.54], ["speech", 19.26], ["noise", 5.91]], null, null, [["music", 39.63], ["moo", 5.97], ["cattle, bovinae", 5.84]], null, [["hum", 33.16], ["mains hum", 27.41], ["throbbing", 14.27]], null, null, null, null], "duration": [1.15, 0.88, 1.14, 3.29, 0.34, 1.24, 1.18, 0.68, 0.31, 0.88, 4.04, -0.29, 1.55, 4.62, 0.33, 5.23, 0.41, 1.11, 1.62, 2.11, 1.11, 0.64, 3.99, 0.12, 2.66, 0.56, 1.04, 2.98, 0.61]} \ No newline at end of file diff --git a/annotations_1/CmMeT8MW1LA_filtered.json b/annotations_1/CmMeT8MW1LA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10918b5419e2b14a880b99780961e1a3e9ed5ed3 --- /dev/null +++ b/annotations_1/CmMeT8MW1LA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 15.03], [25.0, 25.17], [27.0, 37.13], [37.0, 39.36], [40.0, 44.63], [45.0, 138.94]], "keep_status": [true, false, true, true, true, false], "silence_prob": [29.35, 0.0, 31.52, 34.25, 35.75, 0.0], "audiomae_on_audioset": [[["music", 35.33], ["noise", 6.96], ["musical instrument", 4.81]], null, [["hum", 41.01], ["music", 13.53], ["mains hum", 13.12]], [["speech", 13.36], ["music", 13.07], ["hum", 11.97]], [["music", 32.87], ["hum", 19.35], ["mains hum", 7.8]], null], "duration": [11.03, 0.17, 10.13, 2.36, 4.63, 93.94]} \ No newline at end of file diff --git a/annotations_1/Cn_70ds_Slw_filtered.json b/annotations_1/Cn_70ds_Slw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f5ac45ee293e15190e8f3efad42064bddc549cd --- /dev/null +++ b/annotations_1/Cn_70ds_Slw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 70.82], [74.0, 96.87], [97.0, 99.3], [101.0, 101.14], [108.0, 126.79]], "keep_status": [false, true, false, false, false], "silence_prob": [80.82, 29.37, 33.0, 0.0, 45.46], "audiomae_on_audioset": [null, [["music", 35.98], ["hum", 20.75], ["throbbing", 11.15]], [["sidetone", 72.36], ["speech", 10.79], ["music", 7.53]], null, [["music", 82.6], ["theremin", 2.65], ["hum", 1.91]]], "duration": [9.82, 22.87, 2.3, 0.14, 18.79]} \ No newline at end of file diff --git a/annotations_1/Cn_nTq97C7Y_filtered.json b/annotations_1/Cn_nTq97C7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efd89fb46c7c24472c9740e2faca261f44287b79 --- /dev/null +++ b/annotations_1/Cn_nTq97C7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[73.0, 74.73], [77.0, 81.03], [83.0, 86.81], [87.0, 100.16], [101.0, 101.01], [101.0, 109.65], [115.0, 125.88]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [0.0, 41.28, 54.56, 54.43, 0.0, 33.36, 66.27], "audiomae_on_audioset": [null, [["speech", 44.53], ["arrow", 10.72], ["music", 8.44]], null, null, null, [["music", 63.09], ["scary music", 10.08], ["speech", 6.77]], null], "duration": [1.73, 4.03, 3.81, 13.16, 0.01, 8.65, 10.88]} \ No newline at end of file diff --git a/annotations_1/CnrR2upI8Jo_filtered.json b/annotations_1/CnrR2upI8Jo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24e27d1fd67fd25e2bdcc33b10fedee668d0f57d --- /dev/null +++ b/annotations_1/CnrR2upI8Jo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.02], [4.0, 6.37], [7.0, 16.02], [17.0, 18.08], [27.0, 27.72], [34.0, 36.78], [54.0, 54.45], [61.0, 60.93], [65.0, 65.37], [74.0, 75.0], [75.0, 75.51], [79.0, 80.03], [85.0, 86.05], [93.0, 93.12], [109.0, 110.17], [138.0, 139.43], [140.0, 140.49], [144.0, 144.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 95.09, 93.29, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 2.37, 9.02, 1.08, 0.72, 2.78, 0.45, -0.07, 0.37, 1.0, 0.51, 1.03, 1.05, 0.12, 1.17, 1.43, 0.49, 0.76]} \ No newline at end of file diff --git a/annotations_1/CoQM9K_r3kY_filtered.json b/annotations_1/CoQM9K_r3kY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e65b3026f22e52b09e09f1cf9bc5ff24f796ae68 --- /dev/null +++ b/annotations_1/CoQM9K_r3kY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 21.54], [26.0, 27.67], [29.0, 30.94], [32.0, 31.95], [32.0, 33.27], [35.0, 37.96], [48.0, 51.8], [53.0, 57.0], [58.0, 59.44], [60.0, 61.4], [63.0, 64.12], [66.0, 68.74], [69.0, 71.52], [72.0, 77.73], [82.0, 85.58], [86.0, 87.02], [88.0, 89.07], [91.0, 91.22], [93.0, 95.96], [97.0, 99.52], [101.0, 109.68], [110.0, 110.81], [111.0, 117.34], [118.0, 136.11], [136.0, 138.55], [140.0, 145.37], [147.0, 147.92], [148.0, 152.56], [154.0, 155.7], [156.0, 157.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false], "silence_prob": [62.07, 0.0, 0.0, 0.0, 0.0, 54.76, 87.55, 54.17, 0.0, 0.0, 0.0, 90.43, 41.95, 63.64, 48.31, 0.0, 0.0, 0.0, 81.17, 74.76, 52.98, 0.0, 42.46, 35.84, 37.75, 34.25, 0.0, 37.63, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.56], ["speech", 22.1], ["hum", 5.14]], null, [["music", 24.43], ["speech", 23.26], ["hum", 8.89]], null, null, null, null, null, null, null, [["music", 45.26], ["speech", 6.67], ["marimba, xylophone", 6.14]], [["music", 52.07], ["musical instrument", 3.82], ["hum", 3.22]], [["music", 65.15], ["didgeridoo", 5.25], ["musical instrument", 2.39]], [["music", 72.36], ["theremin", 3.42], ["didgeridoo", 3.38]], null, [["music", 25.3], ["mains hum", 19.64], ["speech", 13.73]], null, null], "duration": [10.54, 1.67, 1.94, -0.05, 1.27, 2.96, 3.8, 4.0, 1.44, 1.4, 1.12, 2.74, 2.52, 5.73, 3.58, 1.02, 1.07, 0.22, 2.96, 2.52, 8.68, 0.81, 6.34, 18.11, 2.55, 5.37, 0.92, 4.56, 1.7, 1.37]} \ No newline at end of file diff --git a/annotations_1/Cony281khiE_filtered.json b/annotations_1/Cony281khiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..457bd15e95f94003d514cb483fcea4e72e259667 --- /dev/null +++ b/annotations_1/Cony281khiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.46], [38.0, 84.81], [85.0, 88.16], [90.0, 90.56], [91.0, 110.3]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 33.77, 0.0, 63.64], "audiomae_on_audioset": [null, null, [["music", 18.81], ["speech", 16.68], ["theremin", 10.63]], null, null], "duration": [0.46, 46.81, 3.16, 0.56, 19.3]} \ No newline at end of file diff --git a/annotations_1/Cp2KrXtWwAA_filtered.json b/annotations_1/Cp2KrXtWwAA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67e3def98962fef9c00377cb993097a254ec3d34 --- /dev/null +++ b/annotations_1/Cp2KrXtWwAA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 34.3], [38.0, 106.56], [111.0, 111.79], [112.0, 112.24], [114.0, 115.06], [116.0, 117.39], [124.0, 131.89]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [29.42, 0.0, 0.0, 0.0, 0.0, 0.0, 40.59], "audiomae_on_audioset": [[["music", 62.51], ["didgeridoo", 3.95], ["singing", 2.08]], null, null, null, null, null, [["music", 54.05], ["speech", 14.34], ["ambient music", 4.77]]], "duration": [4.3, 68.56, 0.79, 0.24, 1.06, 1.39, 7.89]} \ No newline at end of file diff --git a/annotations_1/Cp3FHbNWi64_filtered.json b/annotations_1/Cp3FHbNWi64_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e7a62fb14d12dcaba181df86e3fef441172fd --- /dev/null +++ b/annotations_1/Cp3FHbNWi64_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.67], [14.0, 17.12], [19.0, 19.95], [23.0, 23.5], [30.0, 34.69], [50.0, 50.04], [51.0, 51.63], [54.0, 54.7], [57.0, 66.09], [68.0, 67.73], [75.0, 78.26]], "keep_status": [false, false, false, false, true, false, false, false, true, false, true], "silence_prob": [0.0, 78.38, 0.0, 0.0, 45.69, 0.0, 0.0, 0.0, 28.56, 0.0, 34.66], "audiomae_on_audioset": [null, null, null, null, [["bee, wasp, etc.", 19.41], ["fly, housefly", 19.28], ["insect", 16.55]], null, null, null, [["speech", 33.04], ["music", 29.8], ["hum", 6.38]], null, [["music", 49.09], ["mains hum", 9.05], ["hum", 4.95]]], "duration": [-0.33, 3.12, 0.95, 0.5, 4.69, 0.04, 0.63, 0.7, 9.09, -0.27, 3.26]} \ No newline at end of file diff --git a/annotations_1/CpAVT7Y3vpM_filtered.json b/annotations_1/CpAVT7Y3vpM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..727a5e4d0bde50fe6c69e02d380b7ecca451ca52 --- /dev/null +++ b/annotations_1/CpAVT7Y3vpM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.85], [10.0, 15.99], [17.0, 18.69], [20.0, 20.66], [27.0, 28.92], [32.0, 39.92], [41.0, 45.98], [47.0, 49.37], [50.0, 50.48], [51.0, 53.25], [54.0, 54.7], [56.0, 57.03], [63.0, 63.12], [65.0, 66.09], [68.0, 68.17], [72.0, 74.56], [78.0, 80.97], [82.0, 84.28], [86.0, 90.53], [93.0, 95.08], [96.0, 99.91], [102.0, 103.35], [105.0, 106.66], [110.0, 111.65], [112.0, 113.22], [115.0, 116.55], [118.0, 121.36], [124.0, 126.4], [129.0, 129.19], [130.0, 132.09], [133.0, 136.07], [137.0, 137.76], [151.0, 158.45], [160.0, 164.86], [167.0, 170.53], [171.0, 171.53], [172.0, 174.39], [176.0, 176.64], [177.0, 178.93], [180.0, 180.59], [181.0, 180.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.8, 100.0, 0.0, 0.0, 0.0, 99.98, 100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 99.99, 96.89, 87.92, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 100.0, 0.0, 93.29, 99.97, 99.98, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.85, 5.99, 1.69, 0.66, 1.92, 7.92, 4.98, 2.37, 0.48, 2.25, 0.7, 1.03, 0.12, 1.09, 0.17, 2.56, 2.97, 2.28, 4.53, 2.08, 3.91, 1.35, 1.66, 1.65, 1.22, 1.55, 3.36, 2.4, 0.19, 2.09, 3.07, 0.76, 7.45, 4.86, 3.53, 0.53, 2.39, 0.64, 1.93, 0.59, -0.06]} \ No newline at end of file diff --git a/annotations_1/CpIgfRGUpU0_filtered.json b/annotations_1/CpIgfRGUpU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..129889c416dcd2896f70bc2e93944400ba44ff4c --- /dev/null +++ b/annotations_1/CpIgfRGUpU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.61], [20.0, 22.28], [23.0, 31.26], [36.0, 35.87], [47.0, 47.73], [62.0, 62.16], [63.0, 63.59], [67.0, 70.14], [74.0, 75.46], [87.0, 88.53], [100.0, 101.65], [103.0, 103.18], [106.0, 107.97], [109.0, 109.09], [110.0, 110.49], [116.0, 116.78], [124.0, 123.74], [126.0, 126.39], [127.0, 127.43], [131.0, 130.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.99, 51.88, 0.0, 0.0, 0.0, 0.0, 65.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 2.28, 8.26, -0.13, 0.73, 0.16, 0.59, 3.14, 1.46, 1.53, 1.65, 0.18, 1.97, 0.09, 0.49, 0.78, -0.26, 0.39, 0.43, -0.33]} \ No newline at end of file diff --git a/annotations_1/CpcopOQAWWA_filtered.json b/annotations_1/CpcopOQAWWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4948daf980a98d3a4da8fe9ffe3a274c4204f593 --- /dev/null +++ b/annotations_1/CpcopOQAWWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.68], [14.0, 16.31], [22.0, 27.63], [29.0, 28.63], [29.0, 29.62], [34.0, 34.62], [35.0, 35.63], [36.0, 36.14], [38.0, 38.55], [42.0, 43.46], [45.0, 47.55], [51.0, 54.11], [56.0, 58.24], [59.0, 60.12], [63.0, 63.29], [65.0, 65.91], [71.0, 71.68], [74.0, 74.02], [74.0, 75.25], [79.0, 82.41], [83.0, 84.81], [86.0, 86.43], [87.0, 88.94], [89.0, 91.83], [97.0, 99.49], [101.0, 106.1], [108.0, 109.48], [114.0, 117.58], [120.0, 120.26], [127.0, 134.06], [134.0, 134.87], [136.0, 135.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false], "silence_prob": [0.0, 71.0, 83.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.39, 34.94, 41.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.57, 0.0, 0.0, 0.0, 32.55, 35.37, 43.35, 0.0, 33.61, 0.0, 41.66, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 49.0], ["effects unit", 9.78], ["synthesizer", 9.49]], [["music", 67.72], ["speech", 9.51], ["guitar", 8.97]], [["didgeridoo", 73.89], ["music", 5.42], ["effects unit", 4.3]], null, null, null, null, null, null, [["didgeridoo", 71.2], ["music", 18.26], ["musical instrument", 2.91]], null, null, null, [["cattle, bovinae", 41.8], ["moo", 37.63], ["livestock, farm animals, working animals", 12.83]], [["speech", 26.24], ["music", 23.62], ["musical instrument", 11.3]], [["effects unit", 22.35], ["livestock, farm animals, working animals", 19.22], ["cattle, bovinae", 16.63]], null, [["sidetone", 32.03], ["doorbell", 26.6], ["music", 4.71]], null, [["speech", 65.55], ["male speech, man speaking", 7.99], ["whack, thwack", 3.78]], null, null], "duration": [1.68, 2.31, 5.63, -0.37, 0.62, 0.62, 0.63, 0.14, 0.55, 1.46, 2.55, 3.11, 2.24, 1.12, 0.29, 0.91, 0.68, 0.02, 1.25, 3.41, 1.81, 0.43, 1.94, 2.83, 2.49, 5.1, 1.48, 3.58, 0.26, 7.06, 0.87, -0.22]} \ No newline at end of file diff --git a/annotations_1/Cq2Wzdd_PYs_filtered.json b/annotations_1/Cq2Wzdd_PYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a6b80d9159600457ef41d18b649b4f6353e5980 --- /dev/null +++ b/annotations_1/Cq2Wzdd_PYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.86], [18.0, 18.71], [20.0, 20.34], [21.0, 22.87], [29.0, 29.69], [33.0, 34.7], [36.0, 42.63], [49.0, 49.38], [53.0, 53.54], [64.0, 71.34], [76.0, 77.08], [79.0, 80.0], [88.0, 88.65], [90.0, 90.78], [92.0, 92.92], [94.0, 93.83], [95.0, 107.33], [108.0, 109.0], [110.0, 110.07], [113.0, 113.91], [118.0, 118.45], [120.0, 119.92], [121.0, 121.46], [122.0, 123.38], [125.0, 131.62], [132.0, 136.14], [137.0, 137.71], [139.0, 140.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.91, 0.0, 0.0, 50.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.19, 38.74, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 41.41], ["noise", 27.01], ["mains hum", 11.44]], null, null, null, null, null, null, null, [["speech", 31.31], ["sidetone", 26.94], ["hum", 14.37]], [["hum", 41.27], ["mains hum", 29.79], ["noise", 11.96]], null, null], "duration": [0.86, 0.71, 0.34, 1.87, 0.69, 1.7, 6.63, 0.38, 0.54, 7.34, 1.08, 1.0, 0.65, 0.78, 0.92, -0.17, 12.33, 1.0, 0.07, 0.91, 0.45, -0.08, 0.46, 1.38, 6.62, 4.14, 0.71, 1.32]} \ No newline at end of file diff --git a/annotations_1/CsOM7mptOLM_filtered.json b/annotations_1/CsOM7mptOLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1be1a6d92415c2f0c55108678dd4965f6464eeb2 --- /dev/null +++ b/annotations_1/CsOM7mptOLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.41], [13.0, 19.18], [22.0, 43.98], [45.0, 56.93], [58.0, 67.2]], "keep_status": [true, false, false, false, true], "silence_prob": [40.06, 35.04, 32.82, 30.29, 29.7], "audiomae_on_audioset": [[["music", 46.19], ["effects unit", 11.62], ["distortion", 6.7]], [["music", 53.29], ["synthesizer", 13.07], ["musical instrument", 11.26]], [["music", 53.82], ["musical instrument", 10.45], ["theremin", 9.84]], [["music", 58.7], ["effects unit", 9.32], ["musical instrument", 4.43]], [["music", 36.15], ["musical instrument", 15.05], ["effects unit", 8.51]]], "duration": [7.41, 6.18, 21.98, 11.93, 9.2]} \ No newline at end of file diff --git a/annotations_1/Csn39S3c0kI_filtered.json b/annotations_1/Csn39S3c0kI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4dba1d5cb737e2ee860ac77f1cb461f1c6547fce --- /dev/null +++ b/annotations_1/Csn39S3c0kI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.26], [23.0, 25.19], [26.0, 28.19], [32.0, 34.16], [37.0, 39.28], [41.0, 42.82], [48.0, 49.74], [60.0, 61.77], [63.0, 89.65]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [98.51, 99.92, 99.98, 99.4, 99.98, 0.0, 0.0, 0.0, 37.83], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 31.36], ["speech", 23.36], ["hum", 11.5]]], "duration": [2.26, 2.19, 2.19, 2.16, 2.28, 1.82, 1.74, 1.77, 26.65]} \ No newline at end of file diff --git a/annotations_1/CsukLjjPv-U_filtered.json b/annotations_1/CsukLjjPv-U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b4caa733e16179ed12b1fdd14920b6d0a03024e --- /dev/null +++ b/annotations_1/CsukLjjPv-U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.29], [3.0, 3.21], [4.0, 5.64], [7.0, 13.73], [16.0, 30.86], [34.0, 39.68], [43.0, 68.12], [80.0, 80.5], [81.0, 85.06], [85.0, 85.14], [86.0, 85.8], [86.0, 85.83], [86.0, 93.01], [94.0, 100.3], [105.0, 108.63], [111.0, 112.35], [113.0, 115.23], [116.0, 121.54], [128.0, 131.55]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.11, 29.08, 29.56, 29.39, 0.0, 30.29, 0.0, 0.0, 0.0, 29.4, 28.39, 30.19, 0.0, 32.68, 28.72, 28.89], "audiomae_on_audioset": [null, null, null, [["music", 41.53], ["hum", 16.12], ["throbbing", 12.94]], [["music", 60.03], ["throbbing", 8.1], ["hum", 3.43]], [["speech", 51.95], ["explosion", 18.91], ["eruption", 13.14]], [["music", 44.6], ["throbbing", 16.82], ["hum", 12.41]], null, [["speech", 35.62], ["groan", 8.77], ["fart", 7.13]], null, null, null, [["speech", 52.4], ["music", 25.3], ["explosion", 3.09]], [["hum", 23.55], ["explosion", 12.35], ["mains hum", 10.33]], [["music", 39.51], ["speech", 25.8], ["throbbing", 3.91]], null, [["throbbing", 29.48], ["music", 23.81], ["hum", 12.09]], [["speech", 52.26], ["explosion", 12.03], ["eruption", 9.15]], [["music", 35.66], ["speech", 33.22], ["sound effect", 5.16]]], "duration": [1.29, 0.21, 1.64, 6.73, 14.86, 5.68, 25.12, 0.5, 4.06, 0.14, -0.2, -0.17, 7.01, 6.3, 3.63, 1.35, 2.23, 5.54, 3.55]} \ No newline at end of file diff --git a/annotations_1/Ct-zGV4TgKY_filtered.json b/annotations_1/Ct-zGV4TgKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2f47d32147a2011c306278f14748cf9da9ea96c --- /dev/null +++ b/annotations_1/Ct-zGV4TgKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 41.23], [45.0, 46.75], [48.0, 50.92], [52.0, 54.19], [57.0, 58.16], [60.0, 61.59], [63.0, 78.6], [79.0, 79.73], [80.0, 87.18], [88.0, 143.7], [146.0, 168.94]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 67.25, 48.61, 0.0, 0.0, 32.21, 0.0, 47.35, 0.0, 29.12], "audiomae_on_audioset": [null, null, null, [["didgeridoo", 27.35], ["music", 25.66], ["speech", 8.82]], null, null, [["telephone bell ringing", 71.2], ["music", 16.86], ["speech", 3.12]], null, [["speech", 35.37], ["music", 22.07], ["gong", 14.52]], null, [["throbbing", 43.36], ["hum", 26.46], ["music", 12.69]]], "duration": [36.23, 1.75, 2.92, 2.19, 1.16, 1.59, 15.6, 0.73, 7.18, 55.7, 22.94]} \ No newline at end of file diff --git a/annotations_1/Ct21N7taYlc_filtered.json b/annotations_1/Ct21N7taYlc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..659bdedc2c88d52555625d9a16be59d6d427bc91 --- /dev/null +++ b/annotations_1/Ct21N7taYlc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[125.0, 130.84], [132.0, 133.86]], "keep_status": [false, false], "silence_prob": [31.04, 0.0], "audiomae_on_audioset": [[["speech", 43.8], ["music", 40.34], ["explosion", 1.74]], null], "duration": [5.84, 1.86]} \ No newline at end of file diff --git a/annotations_1/CtDBcCXiE3M_filtered.json b/annotations_1/CtDBcCXiE3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30246c6d4a1d0c1392a03927db28c177777854f5 --- /dev/null +++ b/annotations_1/CtDBcCXiE3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.34], [15.0, 16.95], [17.0, 17.9], [26.0, 27.68], [30.0, 63.24], [66.0, 68.71], [71.0, 71.46], [73.0, 73.79], [75.0, 79.93], [81.0, 82.0], [85.0, 85.9], [89.0, 91.18], [92.0, 168.42]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.85, 0.0, 0.0, 0.0, 0.0, 43.79, 0.0, 0.0, 68.67, 0.0, 0.0, 92.48, 0.0], "audiomae_on_audioset": [[["music", 33.38], ["gong", 24.68], ["singing bowl", 9.33]], null, null, null, null, [["echo", 39.18], ["speech", 36.84], ["radio", 5.12]], null, null, null, null, null, null, null], "duration": [6.34, 1.95, 0.9, 1.68, 33.24, 2.71, 0.46, 0.79, 4.93, 1.0, 0.9, 2.18, 76.42]} \ No newline at end of file diff --git a/annotations_1/CtYTXG1RFQ0_filtered.json b/annotations_1/CtYTXG1RFQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f22e25eca49dd53752b3ba1e0b70eee1d5a207f3 --- /dev/null +++ b/annotations_1/CtYTXG1RFQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.95], [20.0, 22.3], [25.0, 27.9], [28.0, 28.54], [29.0, 43.48], [46.0, 52.24], [53.0, 54.58], [55.0, 131.41], [132.0, 132.88], [134.0, 134.37], [137.0, 137.39], [138.0, 142.97], [143.0, 143.88]], "keep_status": [false, true, true, false, true, false, false, false, false, false, false, true, false], "silence_prob": [33.45, 35.8, 31.99, 0.0, 30.26, 38.86, 0.0, 0.0, 0.0, 0.0, 0.0, 38.64, 0.0], "audiomae_on_audioset": [[["music", 65.77], ["theremin", 18.49], ["musical instrument", 2.77]], [["music", 41.32], ["mains hum", 8.71], ["hum", 6.15]], [["hum", 38.63], ["mains hum", 12.41], ["buzz", 10.15]], null, [["speech", 26.92], ["buzz", 11.98], ["livestock, farm animals, working animals", 9.63]], [["throbbing", 53.11], ["hum", 26.7], ["music", 7.64]], null, null, null, null, null, [["throbbing", 41.62], ["didgeridoo", 14.92], ["hum", 12.88]], null], "duration": [2.95, 2.3, 2.9, 0.54, 14.48, 6.24, 1.58, 76.41, 0.88, 0.37, 0.39, 4.97, 0.88]} \ No newline at end of file diff --git a/annotations_1/CtcQNdbPsSQ_filtered.json b/annotations_1/CtcQNdbPsSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c990bc688b9e87ed7c28e2ae27ad57122329aa4 --- /dev/null +++ b/annotations_1/CtcQNdbPsSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [5.0, 5.48], [9.0, 12.8], [13.0, 23.36], [27.0, 28.02], [30.0, 29.78], [30.0, 31.08], [37.0, 37.32], [38.0, 39.26], [42.0, 42.82], [52.0, 58.13], [58.0, 60.84], [65.0, 65.79], [67.0, 73.06], [73.0, 79.68], [81.0, 81.67], [88.0, 88.91], [94.0, 94.12], [96.0, 97.04], [103.0, 103.79], [106.0, 107.55], [109.0, 108.85], [111.0, 111.08], [113.0, 114.35], [123.0, 124.26], [125.0, 127.21], [128.0, 128.78], [134.0, 134.82], [138.0, 142.3]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 47.54, 40.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.73, 54.1, 0.0, 56.03, 42.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.26, 0.0, 0.0, 31.86], "audiomae_on_audioset": [null, null, [["hum", 36.52], ["throbbing", 21.21], ["arrow", 3.96]], [["music", 68.57], ["throbbing", 5.18], ["musical instrument", 4.24]], null, null, null, null, null, null, [["hum", 38.45], ["throbbing", 14.84], ["speech", 9.7]], null, null, null, [["music", 34.04], ["hum", 12.47], ["mains hum", 9.81]], null, null, null, null, null, null, null, null, null, null, [["speech", 51.53], ["music", 18.08], ["hum", 5.32]], null, null, [["music", 54.88], ["throbbing", 5.49], ["quack", 4.05]]], "duration": [0.13, 0.48, 3.8, 10.36, 1.02, -0.22, 1.08, 0.32, 1.26, 0.82, 6.13, 2.84, 0.79, 6.06, 6.68, 0.67, 0.91, 0.12, 1.04, 0.79, 1.55, -0.15, 0.08, 1.35, 1.26, 2.21, 0.78, 0.82, 4.3]} \ No newline at end of file diff --git a/annotations_1/Cu5F2Z9mKmo_filtered.json b/annotations_1/Cu5F2Z9mKmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43548030255e46321f879a1a5c6a785311cc3b2c --- /dev/null +++ b/annotations_1/Cu5F2Z9mKmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.85], [7.0, 9.0], [9.0, 10.62], [14.0, 14.34], [15.0, 15.42], [16.0, 18.05], [19.0, 20.68], [23.0, 23.58], [25.0, 25.03], [32.0, 33.02], [34.0, 35.28], [41.0, 41.71], [43.0, 43.24], [58.0, 59.1], [62.0, 64.05], [66.0, 67.31], [70.0, 70.51], [75.0, 76.08], [78.0, 78.76], [81.0, 80.82], [82.0, 82.17], [83.0, 83.12], [91.0, 92.2], [92.0, 92.23], [92.0, 92.26], [93.0, 92.58], [94.0, 103.52], [110.0, 109.88], [110.0, 113.95], [118.0, 118.22], [119.0, 118.91], [125.0, 125.24], [127.0, 130.08], [135.0, 135.67], [138.0, 138.6], [139.0, 140.64], [155.0, 155.55], [156.0, 156.69], [159.0, 161.97], [168.0, 168.3], [176.0, 176.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.95, 0.0, 0.0, 0.0, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.37, 0.0, 60.89, 0.0, 0.0, 0.0, 65.44, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.85, 2.0, 1.62, 0.34, 0.42, 2.05, 1.68, 0.58, 0.03, 1.02, 1.28, 0.71, 0.24, 1.1, 2.05, 1.31, 0.51, 1.08, 0.76, -0.18, 0.17, 0.12, 1.2, 0.23, 0.26, -0.42, 9.52, -0.12, 3.95, 0.22, -0.09, 0.24, 3.08, 0.67, 0.6, 1.64, 0.55, 0.69, 2.97, 0.3, 0.69]} \ No newline at end of file diff --git a/annotations_1/CujcdaQpYWE_filtered.json b/annotations_1/CujcdaQpYWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..096f550d8357d027d2529c2242c57b73e801c129 --- /dev/null +++ b/annotations_1/CujcdaQpYWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[153.0, 158.04]], "keep_status": [true], "silence_prob": [46.26], "audiomae_on_audioset": [[["music", 23.31], ["hum", 23.26], ["speech", 13.8]]], "duration": [5.04]} \ No newline at end of file diff --git a/annotations_1/CvLrYbRzjAE_filtered.json b/annotations_1/CvLrYbRzjAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c47852289afc5e8518c2fab6ccbe84c8ed13307a --- /dev/null +++ b/annotations_1/CvLrYbRzjAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 35.56], [40.0, 48.2], [49.0, 48.74], [49.0, 48.78], [49.0, 76.57], [80.0, 80.47], [85.0, 97.75], [98.0, 98.78], [110.0, 110.57], [118.0, 118.99], [122.0, 132.31], [133.0, 134.81], [137.0, 141.42], [151.0, 151.9], [153.0, 166.89], [167.0, 171.04], [171.0, 171.12], [171.0, 171.31], [171.0, 171.51], [172.0, 181.82], [194.0, 197.72], [202.0, 222.78], [224.0, 225.0], [226.0, 227.77], [228.0, 228.78], [229.0, 229.24]], "keep_status": [false, false, false, false, true, false, true, false, false, false, true, false, true, false, true, true, false, false, false, true, true, true, false, false, false, false], "silence_prob": [31.77, 32.04, 0.0, 0.0, 32.12, 0.0, 31.77, 0.0, 0.0, 0.0, 31.29, 0.0, 32.49, 0.0, 31.17, 32.45, 0.0, 0.0, 0.0, 32.07, 34.89, 31.82, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 45.78], ["music", 41.9], ["fart", 1.67]], [["music", 48.11], ["theremin", 23.61], ["musical instrument", 4.6]], null, null, [["whack, thwack", 24.17], ["didgeridoo", 22.19], ["music", 21.52]], null, [["music", 47.5], ["whale vocalization", 6.07], ["noise", 5.94]], null, null, null, [["music", 31.23], ["speech", 27.02], ["electric shaver, electric razor", 6.02]], null, [["music", 28.0], ["cattle, bovinae", 18.35], ["livestock, farm animals, working animals", 17.62]], null, [["music", 29.03], ["fly, housefly", 26.34], ["mosquito", 12.91]], [["mosquito", 27.2], ["didgeridoo", 15.24], ["fly, housefly", 8.27]], null, null, null, [["music", 23.6], ["speech", 15.59], ["fly, housefly", 11.72]], [["music", 23.16], ["groan", 7.77], ["mosquito", 5.18]], [["speech", 20.22], ["music", 19.28], ["theremin", 11.68]], null, null, null, null], "duration": [23.56, 8.2, -0.26, -0.22, 27.57, 0.47, 12.75, 0.78, 0.57, 0.99, 10.31, 1.81, 4.42, 0.9, 13.89, 4.04, 0.12, 0.31, 0.51, 9.82, 3.72, 20.78, 1.0, 1.77, 0.78, 0.24]} \ No newline at end of file diff --git a/annotations_1/CvoAG6pgdC4_filtered.json b/annotations_1/CvoAG6pgdC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eba351e1f6f2f3dbec62063b82d048b324a1cda7 --- /dev/null +++ b/annotations_1/CvoAG6pgdC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [5.0, 5.37], [6.0, 7.16], [8.0, 10.02], [11.0, 13.1], [15.0, 17.29], [18.0, 22.74], [26.0, 26.38], [33.0, 40.98], [45.0, 46.09], [52.0, 52.27], [54.0, 54.46], [55.0, 55.9], [57.0, 58.09], [60.0, 60.24], [86.0, 91.18], [93.0, 93.23]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.8, 100.0, 56.33, 97.64, 0.0, 46.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.42, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["animal", 36.77], ["sidetone", 9.41], ["domestic animals, pets", 4.61]], null, null, null, null, null, null, null, null], "duration": [0.81, 0.37, 1.16, 2.02, 2.1, 2.29, 4.74, 0.38, 7.98, 1.09, 0.27, 0.46, 0.9, 1.09, 0.24, 5.18, 0.23]} \ No newline at end of file diff --git a/annotations_1/Cw9FQ_X-gP0_filtered.json b/annotations_1/Cw9FQ_X-gP0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca85b4ed9398dd2f8b9d33193ebe6d280ea341de --- /dev/null +++ b/annotations_1/Cw9FQ_X-gP0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.29], [8.0, 76.67], [80.0, 87.71], [88.0, 90.41], [91.0, 132.68]], "keep_status": [true, false, false, true, false], "silence_prob": [35.94, 0.0, 39.31, 32.73, 0.0], "audiomae_on_audioset": [[["music", 34.74], ["ambient music", 21.6], ["electronic music", 11.43]], null, [["music", 57.5], ["synthesizer", 9.35], ["ambient music", 8.19]], [["music", 44.57], ["ambient music", 16.86], ["hum", 7.58]], null], "duration": [2.29, 68.67, 7.71, 2.41, 41.68]} \ No newline at end of file diff --git a/annotations_1/CxQ4aL5IXZw_filtered.json b/annotations_1/CxQ4aL5IXZw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c419bbc5cc020ae2acf26ce8404ff3d6bd626a27 --- /dev/null +++ b/annotations_1/CxQ4aL5IXZw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.99], [14.0, 18.39], [22.0, 40.29], [43.0, 56.19], [57.0, 63.51], [67.0, 84.57], [85.0, 94.47]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [59.24, 52.86, 67.51, 95.37, 69.88, 35.82, 82.25], "audiomae_on_audioset": [null, null, null, null, null, [["music", 35.63], ["wild animals", 4.9], ["hum", 4.03]], null], "duration": [3.99, 4.39, 18.29, 13.19, 6.51, 17.57, 9.47]} \ No newline at end of file diff --git a/annotations_1/CxrQd6Sn5PA_filtered.json b/annotations_1/CxrQd6Sn5PA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc20975600fedeebbcb2ce8e098f24f57856372d --- /dev/null +++ b/annotations_1/CxrQd6Sn5PA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.97], [5.0, 7.18], [8.0, 8.28], [9.0, 13.44], [14.0, 14.2], [15.0, 17.07], [18.0, 18.69], [20.0, 33.61], [34.0, 34.72], [37.0, 37.64], [38.0, 42.75], [44.0, 48.73], [49.0, 51.71], [52.0, 52.89], [54.0, 66.82], [67.0, 128.21], [131.0, 133.88]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 97.33, 0.0, 97.22, 0.0, 90.6, 0.0, 35.09, 0.0, 0.0, 75.39, 68.93, 59.15, 0.0, 41.38, 0.0, 30.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 30.25], ["mains hum", 18.94], ["music", 16.1]], null, null, null, null, null, null, [["music", 37.3], ["synthesizer", 12.67], ["hum", 8.65]], null, [["whale vocalization", 90.83], ["fly, housefly", 2.28], ["insect", 1.72]]], "duration": [0.97, 2.18, 0.28, 4.44, 0.2, 2.07, 0.69, 13.61, 0.72, 0.64, 4.75, 4.73, 2.71, 0.89, 12.82, 61.21, 2.88]} \ No newline at end of file diff --git a/annotations_1/CyAW5eAhhPo_filtered.json b/annotations_1/CyAW5eAhhPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e460bbc9ad04b7b92ad8940b9792e844b34e0d6 --- /dev/null +++ b/annotations_1/CyAW5eAhhPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.01], [11.0, 12.16], [13.0, 14.05], [17.0, 21.39], [24.0, 29.27], [31.0, 32.19], [33.0, 38.6], [40.0, 41.32], [42.0, 46.9], [48.0, 49.42], [50.0, 51.02], [54.0, 55.65], [59.0, 59.27], [62.0, 64.03], [64.0, 65.33], [67.0, 70.02], [81.0, 84.3], [85.0, 86.31], [89.0, 89.94], [91.0, 94.19], [95.0, 96.01], [99.0, 101.29], [105.0, 109.26], [111.0, 148.81], [155.0, 155.02]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.4, 0.0, 0.0, 52.86, 99.78, 0.0, 91.81, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 98.99, 0.0, 68.67, 81.89, 0.0, 0.0, 78.72, 0.0, 65.55, 42.04, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 58.48], ["music", 5.24], ["inside, small room", 4.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 38.45], ["hum", 18.94], ["mains hum", 12.92]], null, null], "duration": [4.01, 1.16, 1.05, 4.39, 5.27, 1.19, 5.6, 1.32, 4.9, 1.42, 1.02, 1.65, 0.27, 2.03, 1.33, 3.02, 3.3, 1.31, 0.94, 3.19, 1.01, 2.29, 4.26, 37.81, 0.02]} \ No newline at end of file diff --git a/annotations_1/CyJglP6k8lE_filtered.json b/annotations_1/CyJglP6k8lE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b2c04cff889b7567cb31e31f6515f5463b71f5c --- /dev/null +++ b/annotations_1/CyJglP6k8lE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 20.87], [23.0, 30.13], [32.0, 34.2], [36.0, 51.68], [55.0, 61.99], [69.0, 69.38], [75.0, 82.66], [86.0, 112.89], [114.0, 116.45], [118.0, 119.47], [126.0, 126.23], [131.0, 131.87], [138.0, 143.28], [152.0, 153.3], [157.0, 165.74], [170.0, 175.37], [179.0, 180.17], [184.0, 191.74]], "keep_status": [true, false, true, false, true, false, true, true, false, false, false, false, false, false, false, true, false, true], "silence_prob": [30.52, 33.51, 32.53, 32.48, 31.52, 0.0, 32.09, 36.43, 100.0, 0.0, 0.0, 0.0, 32.11, 0.0, 31.22, 32.01, 0.0, 32.04], "audiomae_on_audioset": [[["moo", 14.65], ["cattle, bovinae", 14.0], ["livestock, farm animals, working animals", 10.98]], [["speech", 41.47], ["music", 24.53], ["boing", 5.77]], [["speech", 49.4], ["music", 11.98], ["throbbing", 5.29]], [["music", 80.38], ["synthesizer", 2.12], ["electronic music", 1.11]], [["music", 40.52], ["speech", 11.67], ["fart", 6.47]], null, [["music", 57.75], ["speech", 8.2], ["noise", 2.57]], [["buzz", 25.0], ["speech", 15.51], ["music", 9.05]], null, null, null, null, [["music", 63.97], ["speech", 21.65], ["groan", 3.13]], null, [["speech", 53.23], ["music", 12.51], ["fart", 4.49]], [["music", 29.41], ["speech", 16.07], ["fart", 8.71]], null, [["speech", 39.19], ["music", 21.76], ["sound effect", 4.44]]], "duration": [12.87, 7.13, 2.2, 15.68, 6.99, 0.38, 7.66, 26.89, 2.45, 1.47, 0.23, 0.87, 5.28, 1.3, 8.74, 5.37, 1.17, 7.74]} \ No newline at end of file diff --git a/annotations_1/CyUZe8xRNnQ_filtered.json b/annotations_1/CyUZe8xRNnQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14e6651a761d1f702910abc316d5a1c31d3fdb22 --- /dev/null +++ b/annotations_1/CyUZe8xRNnQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.17], [12.0, 12.63], [20.0, 22.71], [27.0, 33.78], [34.0, 36.68], [40.0, 40.1], [42.0, 44.34], [49.0, 51.75], [53.0, 54.19], [58.0, 59.53], [63.0, 64.2], [69.0, 70.16], [77.0, 85.5], [94.0, 100.33], [102.0, 102.61], [105.0, 115.97], [117.0, 118.13], [122.0, 124.39], [126.0, 140.44], [144.0, 143.9], [145.0, 145.44], [146.0, 152.78], [160.0, 160.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [38.66, 0.0, 30.09, 30.38, 30.85, 0.0, 30.39, 30.01, 0.0, 0.0, 0.0, 0.0, 29.46, 29.36, 0.0, 30.08, 0.0, 34.43, 30.22, 0.0, 0.0, 31.45, 0.0], "audiomae_on_audioset": [[["music", 61.0], ["guitar", 10.8], ["musical instrument", 9.17]], null, [["music", 59.92], ["boing", 11.06], ["sidetone", 2.65]], [["music", 82.47], ["speech", 1.59], ["sampler", 1.13]], [["music", 72.05], ["musical instrument", 2.75], ["sampler", 1.98]], null, [["music", 35.69], ["trombone", 25.27], ["brass instrument", 18.18]], [["music", 78.04], ["singing", 2.08], ["song", 1.48]], null, null, null, null, [["music", 84.51], ["funk", 1.16], ["musical instrument", 0.79]], [["music", 57.77], ["didgeridoo", 17.54], ["theremin", 2.41]], null, [["music", 73.89], ["didgeridoo", 8.84], ["synthesizer", 3.45]], null, [["music", 46.3], ["musical instrument", 6.98], ["piano", 3.57]], [["music", 86.14], ["musical instrument", 1.61], ["didgeridoo", 0.95]], null, null, [["music", 62.84], ["theremin", 7.51], ["throbbing", 2.22]], null], "duration": [3.17, 0.63, 2.71, 6.78, 2.68, 0.1, 2.34, 2.75, 1.19, 1.53, 1.2, 1.16, 8.5, 6.33, 0.61, 10.97, 1.13, 2.39, 14.44, -0.1, 0.44, 6.78, 0.71]} \ No newline at end of file diff --git a/annotations_1/CyhOZgd8ahs_filtered.json b/annotations_1/CyhOZgd8ahs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/CyhOZgd8ahs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/CzbL7AJIhJI_filtered.json b/annotations_1/CzbL7AJIhJI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0973b5573d3645094a2d2726e5119f8c0e6d4b8 --- /dev/null +++ b/annotations_1/CzbL7AJIhJI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 20.88], [22.0, 21.73], [22.0, 29.67], [31.0, 89.21], [90.0, 103.54]], "keep_status": [true, false, false, false, false], "silence_prob": [33.27, 0.0, 31.52, 0.0, 32.85], "audiomae_on_audioset": [[["music", 27.44], ["brass instrument", 7.31], ["theremin", 7.24]], null, [["music", 63.08], ["musical instrument", 9.35], ["wind instrument, woodwind instrument", 2.92]], null, [["music", 41.65], ["hum", 21.54], ["mains hum", 15.06]]], "duration": [18.88, -0.27, 7.67, 58.21, 13.54]} \ No newline at end of file diff --git a/annotations_1/D-gTnaF9LVA_filtered.json b/annotations_1/D-gTnaF9LVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfdfa8501594c4d8bf6a95b0cf48c6bcebb41e8a --- /dev/null +++ b/annotations_1/D-gTnaF9LVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.45], [10.0, 12.31], [16.0, 15.72], [19.0, 19.85], [33.0, 35.21], [36.0, 37.91], [43.0, 44.42], [50.0, 53.81], [56.0, 57.37], [59.0, 61.11], [63.0, 64.35], [65.0, 66.53], [67.0, 68.01], [70.0, 72.25], [75.0, 75.15], [77.0, 77.6], [81.0, 81.57], [89.0, 88.65], [97.0, 97.85], [103.0, 103.38], [107.0, 107.69], [118.0, 118.1], [120.0, 121.98], [123.0, 123.8], [131.0, 132.16], [139.0, 139.58], [140.0, 143.55], [147.0, 146.85], [149.0, 150.33], [155.0, 162.36], [167.0, 167.54], [169.0, 169.05], [173.0, 173.25], [174.0, 183.95]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 56.93, 0.0, 0.0, 61.67, 0.0, 0.0, 59.77, 0.0, 36.93, 0.0, 0.0, 0.0, 38.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.2, 0.0, 0.0, 29.7, 0.0, 0.0, 0.0, 31.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 37.99], ["hum", 6.72], ["mains hum", 6.27]], null, null, null, [["hum", 30.42], ["mains hum", 28.17], ["music", 12.59]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.07], ["throbbing", 12.28], ["boing", 10.5]], null, null, [["music", 18.58], ["speech", 13.25], ["buzz", 10.9]], null, null, null, [["music", 36.26], ["hum", 24.07], ["throbbing", 14.5]]], "duration": [1.45, 2.31, -0.28, 0.85, 2.21, 1.91, 1.42, 3.81, 1.37, 2.11, 1.35, 1.53, 1.01, 2.25, 0.15, 0.6, 0.57, -0.35, 0.85, 0.38, 0.69, 0.1, 1.98, 0.8, 1.16, 0.58, 3.55, -0.15, 1.33, 7.36, 0.54, 0.05, 0.25, 9.95]} \ No newline at end of file diff --git a/annotations_1/D01cKQMu5Ew_filtered.json b/annotations_1/D01cKQMu5Ew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8ac58faaddd08cf73564f6073f205b65c938ecb --- /dev/null +++ b/annotations_1/D01cKQMu5Ew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.18], [4.0, 5.73], [7.0, 12.09], [17.0, 23.09], [23.0, 23.84], [26.0, 27.11], [30.0, 29.98], [31.0, 42.55], [44.0, 45.01], [45.0, 49.03], [50.0, 51.12], [52.0, 58.85], [60.0, 60.94], [65.0, 66.23], [73.0, 73.45], [79.0, 88.18], [91.0, 95.69], [97.0, 97.44]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.11, 36.84, 0.0, 0.0, 0.0, 40.66, 0.0, 97.83, 0.0, 67.76, 0.0, 0.0, 0.0, 58.98, 45.78, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 41.1], ["music", 9.73], ["sidetone", 4.7]], null, null, null, [["speech", 66.93], ["sidetone", 14.26], ["computer keyboard", 3.07]], null, null, null, null, null, null, null, null, [["music", 68.99], ["speech", 4.18], ["guitar", 3.35]], null], "duration": [0.18, 1.73, 5.09, 6.09, 0.84, 1.11, -0.02, 11.55, 1.01, 4.03, 1.12, 6.85, 0.94, 1.23, 0.45, 9.18, 4.69, 0.44]} \ No newline at end of file diff --git a/annotations_1/D0bIbyAa_XE_filtered.json b/annotations_1/D0bIbyAa_XE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab27c8c4dc5c688fb3c3298a872c02fa93886bb4 --- /dev/null +++ b/annotations_1/D0bIbyAa_XE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.32], [12.0, 16.73], [24.0, 24.21], [31.0, 31.8], [35.0, 34.92], [39.0, 40.56], [45.0, 63.56], [70.0, 81.36], [85.0, 88.01], [91.0, 94.1], [95.0, 95.74], [98.0, 98.69], [101.0, 101.19], [102.0, 123.06]], "keep_status": [false, true, false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [0.0, 29.5, 0.0, 0.0, 0.0, 0.0, 28.61, 28.63, 29.08, 39.94, 0.0, 0.0, 0.0, 33.52], "audiomae_on_audioset": [null, [["speech", 46.32], ["aircraft", 6.9], ["buzzer", 6.11]], null, null, null, null, [["speech", 40.37], ["buzz", 8.14], ["music", 6.97]], [["music", 21.41], ["rumble", 16.45], ["hum", 12.57]], [["music", 28.91], ["theremin", 9.01], ["wind instrument, woodwind instrument", 5.83]], [["speech", 34.73], ["hum", 27.73], ["mains hum", 10.15]], null, null, null, [["mains hum", 40.13], ["hum", 26.27], ["speech", 6.66]]], "duration": [1.32, 4.73, 0.21, 0.8, -0.08, 1.56, 18.56, 11.36, 3.01, 3.1, 0.74, 0.69, 0.19, 21.06]} \ No newline at end of file diff --git a/annotations_1/D143VuAxr-k_filtered.json b/annotations_1/D143VuAxr-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63c3af1f0d08a71927c5b4708c97634997062cf8 --- /dev/null +++ b/annotations_1/D143VuAxr-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 20.78], [23.0, 28.0], [35.0, 35.67], [37.0, 37.99], [41.0, 40.93], [45.0, 51.19], [52.0, 60.08], [62.0, 62.7], [64.0, 65.33], [66.0, 66.16], [70.0, 70.01], [72.0, 81.18], [82.0, 85.67], [87.0, 102.98], [107.0, 125.83], [130.0, 130.03], [134.0, 134.33], [137.0, 137.91], [139.0, 140.68], [143.0, 143.55], [146.0, 149.18], [150.0, 151.63]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false], "silence_prob": [57.81, 54.7, 0.0, 0.0, 0.0, 48.35, 54.97, 0.0, 0.0, 0.0, 0.0, 38.27, 34.67, 37.45, 34.37, 0.0, 0.0, 0.0, 0.0, 0.0, 38.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["thunk", 11.78], ["creak", 9.81], ["microwave oven", 8.44]], null, null, null, null, null, [["didgeridoo", 53.33], ["music", 24.98], ["hum", 5.23]], [["music", 34.93], ["synthesizer", 9.75], ["theremin", 6.37]], [["music", 69.12], ["ambient music", 6.05], ["theremin", 3.52]], [["music", 49.06], ["ambient music", 6.22], ["hum", 5.43]], null, null, null, null, null, [["music", 53.73], ["didgeridoo", 8.4], ["musical instrument", 6.67]], null], "duration": [16.78, 5.0, 0.67, 0.99, -0.07, 6.19, 8.08, 0.7, 1.33, 0.16, 0.01, 9.18, 3.67, 15.98, 18.83, 0.03, 0.33, 0.91, 1.68, 0.55, 3.18, 1.63]} \ No newline at end of file diff --git a/annotations_1/D1IshjFWDJk_filtered.json b/annotations_1/D1IshjFWDJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a0abf9eca4c76ce3cc772620be419f8069525fd --- /dev/null +++ b/annotations_1/D1IshjFWDJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.19], [8.0, 7.86], [9.0, 9.09], [11.0, 10.99], [22.0, 22.54], [28.0, 28.07], [32.0, 39.34], [45.0, 45.57], [47.0, 47.36], [51.0, 51.49], [55.0, 55.07], [58.0, 58.41], [73.0, 78.24], [79.0, 87.1], [88.0, 88.67], [89.0, 102.91], [104.0, 105.11], [106.0, 106.71], [109.0, 117.56], [119.0, 119.45]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.92, 0.0, 0.0, 0.0, 0.0, 0.0, 33.54, 98.8, 0.0, 95.78, 0.0, 0.0, 75.23, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 32.21], ["speech", 12.62], ["moo", 5.48]], null, null, null, null, null, [["animal", 23.96], ["music", 13.85], ["whale vocalization", 7.16]], null, null, null, null, null, null, null], "duration": [0.19, -0.14, 0.09, -0.01, 0.54, 0.07, 7.34, 0.57, 0.36, 0.49, 0.07, 0.41, 5.24, 8.1, 0.67, 13.91, 1.11, 0.71, 8.56, 0.45]} \ No newline at end of file diff --git a/annotations_1/D1YHdHw-doQ_filtered.json b/annotations_1/D1YHdHw-doQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46aee378fc7581acaf3eb9e27a0ba0352eecc383 --- /dev/null +++ b/annotations_1/D1YHdHw-doQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.21], [21.0, 21.32], [21.0, 21.56], [25.0, 33.39], [39.0, 39.8], [44.0, 45.28], [47.0, 47.88], [49.0, 55.65], [61.0, 62.63], [69.0, 70.41], [73.0, 75.69], [76.0, 76.47], [79.0, 84.1], [88.0, 93.61], [96.0, 97.19], [103.0, 104.77], [112.0, 111.86], [114.0, 116.26], [118.0, 119.64], [121.0, 122.3], [124.0, 126.27], [129.0, 130.84], [133.0, 138.05], [139.0, 141.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 57.81, 0.0, 0.0, 0.0, 51.5, 0.0, 0.0, 61.77, 0.0, 43.51, 68.15, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 57.97, 0.0, 42.84, 81.53], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 61.78], ["hum", 5.65], ["synthesizer", 4.43]], null, null, null, null, null, null, null, null, null, [["music", 37.05], ["didgeridoo", 20.34], ["speech", 9.17]], null], "duration": [0.21, 0.32, 0.56, 8.39, 0.8, 1.28, 0.88, 6.65, 1.63, 1.41, 2.69, 0.47, 5.1, 5.61, 1.19, 1.77, -0.14, 2.26, 1.64, 1.3, 2.27, 1.84, 5.05, 2.76]} \ No newline at end of file diff --git a/annotations_1/D3fVS2I9ZVM_filtered.json b/annotations_1/D3fVS2I9ZVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2007f03bfe77395a2a225aa08f279a65dea23b85 --- /dev/null +++ b/annotations_1/D3fVS2I9ZVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[142.0, 163.9]], "keep_status": [false], "silence_prob": [38.37], "audiomae_on_audioset": [[["hum", 51.73], ["mains hum", 42.07], ["throbbing", 3.84]]], "duration": [21.9]} \ No newline at end of file diff --git a/annotations_1/D4HGK-_5TkY_filtered.json b/annotations_1/D4HGK-_5TkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5de3d483dcbd32af54e1509f3e7438f14c676ff1 --- /dev/null +++ b/annotations_1/D4HGK-_5TkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.02], [10.0, 10.45], [11.0, 11.01], [12.0, 15.25], [16.0, 17.61], [22.0, 27.03], [30.0, 37.42], [38.0, 39.66], [42.0, 45.39], [48.0, 50.62], [51.0, 51.7], [53.0, 57.01], [59.0, 65.15], [66.0, 66.18], [68.0, 68.39], [69.0, 71.31], [72.0, 73.21], [77.0, 77.28], [78.0, 108.89], [112.0, 112.31], [112.0, 112.85], [121.0, 121.64], [127.0, 127.45], [132.0, 132.73], [135.0, 139.19], [141.0, 141.37], [143.0, 144.21], [146.0, 147.8], [149.0, 150.09], [151.0, 152.71]], "keep_status": [true, false, false, false, false, true, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [37.34, 0.0, 0.0, 51.12, 0.0, 43.74, 44.4, 0.0, 42.62, 45.49, 0.0, 36.61, 30.22, 0.0, 0.0, 86.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.58, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 28.8], ["whale vocalization", 25.75], ["sound effect", 2.81]], null, null, null, null, [["music", 54.86], ["hum", 9.07], ["mains hum", 5.44]], [["music", 78.22], ["electronic music", 3.17], ["hum", 2.87]], null, [["music", 39.39], ["whale vocalization", 11.67], ["animal", 9.76]], [["music", 18.28], ["livestock, farm animals, working animals", 9.14], ["moo", 7.36]], null, [["whale vocalization", 99.5], ["animal", 0.09], ["livestock, farm animals, working animals", 0.07]], [["groan", 42.16], ["music", 14.76], ["fly, housefly", 9.6]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 29.53], ["mains hum", 18.05], ["music", 17.94]], null, null, null, null, null], "duration": [3.02, 0.45, 0.01, 3.25, 1.61, 5.03, 7.42, 1.66, 3.39, 2.62, 0.7, 4.01, 6.15, 0.18, 0.39, 2.31, 1.21, 0.28, 30.89, 0.31, 0.85, 0.64, 0.45, 0.73, 4.19, 0.37, 1.21, 1.8, 1.09, 1.71]} \ No newline at end of file diff --git a/annotations_1/D4gPEFccxPk_filtered.json b/annotations_1/D4gPEFccxPk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db643fbdd82e7f213b64e191dcdb7e11a25aec3e --- /dev/null +++ b/annotations_1/D4gPEFccxPk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 35.78], [37.0, 57.4], [58.0, 59.27], [60.0, 69.43], [73.0, 73.87], [78.0, 78.73], [80.0, 84.81], [92.0, 92.5], [93.0, 93.01], [93.0, 93.28], [93.0, 93.58], [99.0, 99.4]], "keep_status": [false, true, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 39.09, 0.0, 39.34, 0.0, 0.0, 36.07, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["busy signal", 27.01], ["hum", 19.45], ["throbbing", 12.94]], null, [["chirp tone", 37.26], ["sine wave", 10.02], ["music", 7.09]], null, null, [["music", 23.16], ["synthesizer", 15.71], ["dial tone", 10.56]], null, null, null, null, null], "duration": [1.78, 20.4, 1.27, 9.43, 0.87, 0.73, 4.81, 0.5, 0.01, 0.28, 0.58, 0.4]} \ No newline at end of file diff --git a/annotations_1/D4sj2Yq5bnU_filtered.json b/annotations_1/D4sj2Yq5bnU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdf9d8a551d9019600269c1f8dcae852256e7eb7 --- /dev/null +++ b/annotations_1/D4sj2Yq5bnU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 67.58], [72.0, 105.75], [106.0, 114.86]], "keep_status": [false, false, false], "silence_prob": [33.6, 0.0, 52.39], "audiomae_on_audioset": [[["throbbing", 27.88], ["music", 26.91], ["hum", 15.95]], null, null], "duration": [21.58, 33.75, 8.86]} \ No newline at end of file diff --git a/annotations_1/D56dpMQVGTo_filtered.json b/annotations_1/D56dpMQVGTo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbe66ff52a391300195e9977e42c904d8cafcc29 --- /dev/null +++ b/annotations_1/D56dpMQVGTo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.57], [19.0, 27.57], [28.0, 29.4], [31.0, 32.61], [35.0, 37.17], [41.0, 41.59], [52.0, 53.0], [58.0, 59.95], [61.0, 61.37], [64.0, 64.98], [71.0, 75.12], [79.0, 81.62], [82.0, 82.85], [84.0, 84.37], [85.0, 85.08], [86.0, 86.83], [88.0, 89.04], [91.0, 91.71], [92.0, 92.45], [98.0, 98.51], [99.0, 98.69], [109.0, 109.68], [110.0, 111.79], [112.0, 112.06], [112.0, 115.6], [119.0, 119.87], [121.0, 122.08], [126.0, 130.55], [131.0, 130.59], [131.0, 130.71], [132.0, 133.35], [136.0, 137.42], [139.0, 139.92], [143.0, 146.8], [159.0, 160.51], [164.0, 164.59], [165.0, 171.29], [175.0, 180.84], [187.0, 191.54], [192.0, 192.99]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.2, 62.78, 0.0, 0.0, 53.91, 0.0, 0.0, 0.0, 0.0, 0.0, 37.38, 31.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.56, 0.0, 0.0, 40.33, 0.0, 0.0, 0.0, 0.0, 0.0, 73.06, 0.0, 0.0, 33.17, 56.78, 37.01, 0.0], "audiomae_on_audioset": [[["hum", 16.51], ["speech", 13.92], ["heart sounds, heartbeat", 9.44]], null, null, null, null, null, null, null, null, null, [["music", 72.3], ["musical instrument", 6.47], ["didgeridoo", 3.47]], [["music", 30.35], ["speech", 19.16], ["boing", 7.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.49], ["speech", 15.95], ["sidetone", 6.5]], null, null, null, null, null, null, null, null, [["music", 48.08], ["sidetone", 24.68], ["boing", 6.33]], null, [["mosquito", 50.6], ["fly, housefly", 33.49], ["insect", 8.46]], null], "duration": [3.57, 8.57, 1.4, 1.61, 2.17, 0.59, 1.0, 1.95, 0.37, 0.98, 4.12, 2.62, 0.85, 0.37, 0.08, 0.83, 1.04, 0.71, 0.45, 0.51, -0.31, 0.68, 1.79, 0.06, 3.6, 0.87, 1.08, 4.55, -0.41, -0.29, 1.35, 1.42, 0.92, 3.8, 1.51, 0.59, 6.29, 5.84, 4.54, 0.99]} \ No newline at end of file diff --git a/annotations_1/D6MN7T-tnDw_filtered.json b/annotations_1/D6MN7T-tnDw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97f881e614c6a6f53e351605370c36a8b048b0ff --- /dev/null +++ b/annotations_1/D6MN7T-tnDw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[79.0, 82.51]], "keep_status": [false], "silence_prob": [29.49], "audiomae_on_audioset": [[["music", 27.33], ["boom", 26.81], ["fireworks", 16.52]]], "duration": [3.51]} \ No newline at end of file diff --git a/annotations_1/D7gk8nagjHU_filtered.json b/annotations_1/D7gk8nagjHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15afe64abdbfa9e32fec24f6ca226356d8779533 --- /dev/null +++ b/annotations_1/D7gk8nagjHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.59], [11.0, 12.26], [13.0, 15.11], [16.0, 17.17], [18.0, 18.0], [22.0, 21.9], [23.0, 60.72], [62.0, 75.14], [76.0, 100.92]], "keep_status": [false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 29.64, 30.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 47.76], ["buzz", 12.09], ["speech", 7.18]], [["music", 35.05], ["speech", 27.85], ["didgeridoo", 7.08]]], "duration": [1.59, 1.26, 2.11, 1.17, 0.0, -0.1, 37.72, 13.14, 24.92]} \ No newline at end of file diff --git a/annotations_1/D7tCnGstwcs_filtered.json b/annotations_1/D7tCnGstwcs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15b45aac668632a11b143791f6c66e461478e4af --- /dev/null +++ b/annotations_1/D7tCnGstwcs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.38], [9.0, 9.56], [11.0, 12.01], [14.0, 14.94], [17.0, 18.25], [19.0, 19.53], [20.0, 21.0], [22.0, 23.18], [25.0, 25.47], [27.0, 27.26], [30.0, 30.91], [32.0, 32.93], [35.0, 34.72], [36.0, 38.42], [40.0, 40.54], [42.0, 43.02], [43.0, 43.66], [45.0, 45.72], [46.0, 46.2], [48.0, 48.95], [51.0, 50.77], [52.0, 52.78], [53.0, 53.23], [54.0, 54.85], [57.0, 56.57], [58.0, 58.56], [59.0, 59.32], [60.0, 60.32], [69.0, 69.18], [70.0, 71.74], [76.0, 76.22], [79.0, 79.89], [81.0, 82.17], [87.0, 87.1], [91.0, 91.83], [94.0, 94.46], [97.0, 98.42], [99.0, 102.24], [104.0, 104.99], [106.0, 107.32], [109.0, 110.03], [111.0, 112.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 0.56, 1.01, 0.94, 1.25, 0.53, 1.0, 1.18, 0.47, 0.26, 0.91, 0.93, -0.28, 2.42, 0.54, 1.02, 0.66, 0.72, 0.2, 0.95, -0.23, 0.78, 0.23, 0.85, -0.43, 0.56, 0.32, 0.32, 0.18, 1.74, 0.22, 0.89, 1.17, 0.1, 0.83, 0.46, 1.42, 3.24, 0.99, 1.32, 1.03, 1.58]} \ No newline at end of file diff --git a/annotations_1/D8Cra7i2kGc_filtered.json b/annotations_1/D8Cra7i2kGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c049abfaf6ceeddd032d85b47cdb377c87769ecd --- /dev/null +++ b/annotations_1/D8Cra7i2kGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.47], [11.0, 14.13], [16.0, 22.38], [24.0, 24.02], [25.0, 30.54], [32.0, 32.88], [35.0, 40.66], [41.0, 98.64], [101.0, 170.94], [178.0, 178.68]], "keep_status": [true, true, true, false, true, false, true, false, false, false], "silence_prob": [40.73, 45.59, 37.49, 0.0, 43.66, 0.0, 43.05, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 24.47], ["music", 15.7], ["hum", 7.89]], [["music", 40.73], ["hum", 9.13], ["whale vocalization", 6.96]], [["music", 38.38], ["didgeridoo", 23.73], ["boat, water vehicle", 3.41]], null, [["music", 44.64], ["hum", 6.63], ["throbbing", 5.13]], null, [["music", 45.46], ["speech", 7.28], ["hum", 4.3]], null, null, null], "duration": [7.47, 3.13, 6.38, 0.02, 5.54, 0.88, 5.66, 57.64, 69.94, 0.68]} \ No newline at end of file diff --git a/annotations_1/D8NMSoCRPV8_filtered.json b/annotations_1/D8NMSoCRPV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55b20fc5d8632215e8988052198dafb5914c4483 --- /dev/null +++ b/annotations_1/D8NMSoCRPV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.75], [7.0, 9.1], [11.0, 12.39], [12.0, 12.43], [13.0, 31.58], [32.0, 63.71], [65.0, 86.81], [87.0, 126.94], [129.0, 130.71], [131.0, 131.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 0.0, 0.0, 100.0, 0.0, 69.2, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [-0.25, 2.1, 1.39, 0.43, 18.58, 31.71, 21.81, 39.94, 1.71, 0.45]} \ No newline at end of file diff --git a/annotations_1/D93GR0PGUD0_filtered.json b/annotations_1/D93GR0PGUD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da35bfcca38e89bec099ca4085c87c028a9461be --- /dev/null +++ b/annotations_1/D93GR0PGUD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.02], [18.0, 18.03], [21.0, 21.24], [27.0, 27.31], [31.0, 31.67], [33.0, 33.83], [37.0, 37.44], [40.0, 40.2], [49.0, 50.06], [51.0, 51.41], [52.0, 53.76], [56.0, 56.61], [58.0, 58.28], [60.0, 60.29], [62.0, 62.33], [63.0, 63.54], [64.0, 64.67], [65.0, 66.06], [67.0, 67.19], [67.0, 72.77], [74.0, 74.02], [75.0, 77.43], [80.0, 82.41], [84.0, 85.02], [94.0, 101.53], [102.0, 102.47], [113.0, 112.94], [114.0, 114.51], [119.0, 130.08]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, true, false, false, false, true], "silence_prob": [37.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.95, 0.0, 41.7, 39.57, 0.0, 38.67, 0.0, 0.0, 0.0, 31.39], "audiomae_on_audioset": [[["music", 34.46], ["foghorn", 13.23], ["musical instrument", 8.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.66], ["theremin", 11.7], ["didgeridoo", 8.68]], null, [["music", 49.31], ["synthesizer", 8.53], ["musical instrument", 6.04]], [["music", 32.55], ["singing bowl", 10.29], ["didgeridoo", 8.65]], null, [["music", 25.17], ["gong", 22.4], ["musical instrument", 9.78]], null, null, null, [["speech", 18.79], ["cattle, bovinae", 17.93], ["moo", 15.33]]], "duration": [5.02, 0.03, 0.24, 0.31, 0.67, 0.83, 0.44, 0.2, 1.06, 0.41, 1.76, 0.61, 0.28, 0.29, 0.33, 0.54, 0.67, 1.06, 0.19, 5.77, 0.02, 2.43, 2.41, 1.02, 7.53, 0.47, -0.06, 0.51, 11.08]} \ No newline at end of file diff --git a/annotations_1/DAPrbiJaej4_filtered.json b/annotations_1/DAPrbiJaej4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5daabbc580fe846d1caf8bb00c433c3391592d1b --- /dev/null +++ b/annotations_1/DAPrbiJaej4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.44], [17.0, 17.36], [28.0, 31.28], [32.0, 40.61], [46.0, 45.96], [50.0, 50.57], [51.0, 54.13], [56.0, 57.33], [61.0, 62.82], [63.0, 63.51], [64.0, 65.08], [69.0, 71.37], [72.0, 72.87], [74.0, 75.59], [78.0, 78.66], [142.0, 143.11], [144.0, 145.2], [145.0, 147.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.09, 32.24, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 0.0, 0.0, 0.0, 0.0, 56.48], "audiomae_on_audioset": [null, null, null, [["music", 67.59], ["synthesizer", 6.67], ["drum machine", 4.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.44, 0.36, 3.28, 8.61, -0.04, 0.57, 3.13, 1.33, 1.82, 0.51, 1.08, 2.37, 0.87, 1.59, 0.66, 1.11, 1.2, 2.21]} \ No newline at end of file diff --git a/annotations_1/DBUXGB_L5q8_filtered.json b/annotations_1/DBUXGB_L5q8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62ca087f7ff56701249671194c27c084031c6099 --- /dev/null +++ b/annotations_1/DBUXGB_L5q8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.54], [23.0, 23.82], [28.0, 27.84], [29.0, 28.97], [31.0, 31.26], [31.0, 31.4], [33.0, 55.39], [62.0, 72.35], [74.0, 90.44], [92.0, 92.52], [105.0, 105.41], [108.0, 119.8], [122.0, 122.82], [126.0, 157.05], [160.0, 168.0], [169.0, 170.5], [177.0, 177.16], [178.0, 190.43], [195.0, 217.21], [220.0, 224.13], [227.0, 239.89]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, true, false, false, true, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.8, 30.8, 30.06, 0.0, 0.0, 29.52, 0.0, 0.0, 30.41, 0.0, 0.0, 29.07, 28.94, 29.25, 30.43], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 41.76], ["hum", 15.99], ["throbbing", 8.83]], [["livestock, farm animals, working animals", 19.39], ["motorcycle", 11.42], ["cattle, bovinae", 10.53]], [["buzz", 30.37], ["music", 17.71], ["hum", 17.21]], null, null, [["music", 15.78], ["vehicle", 14.98], ["speech", 11.92]], null, null, [["music", 38.85], ["hum", 18.2], ["throbbing", 8.73]], null, null, [["speech", 28.77], ["vehicle", 21.9], ["car", 7.32]], [["speech", 41.68], ["music", 40.29], ["hum", 4.85]], [["music", 40.36], ["hum", 9.36], ["mains hum", 8.92]], [["music", 38.93], ["speech", 13.85], ["fart", 9.07]]], "duration": [0.54, 0.82, -0.16, -0.03, 0.26, 0.4, 22.39, 10.35, 16.44, 0.52, 0.41, 11.8, 0.82, 31.05, 8.0, 1.5, 0.16, 12.43, 22.21, 4.13, 12.89]} \ No newline at end of file diff --git a/annotations_1/DC2QaWmat7A_filtered.json b/annotations_1/DC2QaWmat7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6ccd106acacfc23e5472f55cd5256075ec9282f --- /dev/null +++ b/annotations_1/DC2QaWmat7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.32], [26.0, 27.87], [29.0, 36.71], [38.0, 41.4], [43.0, 44.25], [47.0, 48.15], [54.0, 58.94]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 40.11, 48.56, 0.0, 0.0, 73.21], "audiomae_on_audioset": [null, null, [["mains hum", 37.0], ["hum", 31.42], ["crushing", 5.71]], [["hum", 10.76], ["mains hum", 5.54], ["music", 5.07]], null, null, null], "duration": [0.32, 1.87, 7.71, 3.4, 1.25, 1.15, 4.94]} \ No newline at end of file diff --git a/annotations_1/DC3rYQXOTjA_filtered.json b/annotations_1/DC3rYQXOTjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fd9b94cbd1786138081c5ad4c1807138f5f58d0 --- /dev/null +++ b/annotations_1/DC3rYQXOTjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 21.03], [25.0, 30.11], [35.0, 36.14], [39.0, 41.44]], "keep_status": [false, true, false, true], "silence_prob": [52.16, 39.34, 0.0, 29.63], "audiomae_on_audioset": [null, [["music", 33.38], ["speech", 20.77], ["musical instrument", 3.8]], null, [["speech", 41.59], ["splash, splatter", 15.42], ["cattle, bovinae", 8.79]]], "duration": [6.03, 5.11, 1.14, 2.44]} \ No newline at end of file diff --git a/annotations_1/DCF_BXNE3oM_filtered.json b/annotations_1/DCF_BXNE3oM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fd58960bf38d76a9df7f7fbbc794478ab386699 --- /dev/null +++ b/annotations_1/DCF_BXNE3oM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [4.0, 4.99], [9.0, 10.3], [11.0, 11.15], [16.0, 16.93], [19.0, 20.14], [28.0, 29.19], [33.0, 33.78], [40.0, 41.05], [52.0, 52.24], [64.0, 63.91], [67.0, 67.61], [83.0, 83.44], [84.0, 84.91], [90.0, 90.54], [99.0, 102.27], [104.0, 105.36], [107.0, 108.5], [110.0, 112.19], [119.0, 122.0], [123.0, 125.81], [131.0, 131.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 76.37, 100.0, 91.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.04, 0.99, 1.3, 0.15, 0.93, 1.14, 1.19, 0.78, 1.05, 0.24, -0.09, 0.61, 0.44, 0.91, 0.54, 3.27, 1.36, 1.5, 2.19, 3.0, 2.81, 0.94]} \ No newline at end of file diff --git a/annotations_1/DCThJoIT-bY_filtered.json b/annotations_1/DCThJoIT-bY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c83e1d84d962a3f04c5fa3c602a8850501b19e3 --- /dev/null +++ b/annotations_1/DCThJoIT-bY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.59], [13.0, 16.23], [18.0, 23.79], [26.0, 29.66], [31.0, 36.91], [40.0, 41.42], [44.0, 45.12], [46.0, 46.82], [48.0, 62.16], [63.0, 65.87], [67.0, 71.22], [72.0, 72.69], [74.0, 76.59], [78.0, 77.99], [78.0, 79.24], [81.0, 81.68], [84.0, 91.05], [92.0, 93.29], [98.0, 99.15], [102.0, 103.33], [104.0, 104.31], [107.0, 107.81], [113.0, 115.05], [118.0, 121.86], [128.0, 127.94], [131.0, 135.73], [138.0, 138.99], [142.0, 145.44], [146.0, 149.5], [150.0, 154.5], [155.0, 156.96], [158.0, 161.01]], "keep_status": [false, false, false, true, true, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, true, false, true], "silence_prob": [54.43, 62.27, 47.31, 47.35, 41.78, 0.0, 0.0, 0.0, 37.82, 38.7, 39.38, 0.0, 46.57, 0.0, 0.0, 0.0, 46.43, 0.0, 0.0, 0.0, 0.0, 0.0, 57.89, 45.78, 0.0, 51.44, 0.0, 45.46, 39.28, 39.69, 0.0, 36.15], "audiomae_on_audioset": [null, null, [["hum", 37.91], ["throbbing", 31.19], ["mains hum", 12.53]], [["music", 55.32], ["hum", 7.76], ["rumble", 4.18]], [["hum", 31.04], ["mains hum", 15.94], ["coin (dropping)", 11.49]], null, null, null, [["hum", 65.55], ["mains hum", 24.4], ["throbbing", 5.62]], [["rumble", 12.83], ["music", 11.03], ["heart sounds, heartbeat", 9.46]], [["music", 29.26], ["animal", 10.07], ["dog", 7.34]], null, [["music", 48.1], ["hum", 13.06], ["throbbing", 8.78]], null, null, null, [["throbbing", 44.09], ["hum", 32.97], ["music", 4.14]], null, null, null, null, null, null, [["throbbing", 27.32], ["hum", 19.19], ["heart sounds, heartbeat", 17.2]], null, null, null, [["speech", 52.35], ["whale vocalization", 8.66], ["sidetone", 8.52]], [["speech", 11.99], ["music", 10.06], ["singing bowl", 9.73]], [["grunt", 15.4], ["speech", 12.65], ["cattle, bovinae", 7.2]], null, [["music", 24.3], ["whale vocalization", 22.88], ["sine wave", 5.1]]], "duration": [5.59, 3.23, 5.79, 3.66, 5.91, 1.42, 1.12, 0.82, 14.16, 2.87, 4.22, 0.69, 2.59, -0.01, 1.24, 0.68, 7.05, 1.29, 1.15, 1.33, 0.31, 0.81, 2.05, 3.86, -0.06, 4.73, 0.99, 3.44, 3.5, 4.5, 1.96, 3.01]} \ No newline at end of file diff --git a/annotations_1/DC_6r5VR5_U_filtered.json b/annotations_1/DC_6r5VR5_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18c922a4136988209983cf442dafff471dfa8b55 --- /dev/null +++ b/annotations_1/DC_6r5VR5_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.02], [17.0, 17.73], [19.0, 28.36], [30.0, 31.72], [33.0, 35.16], [39.0, 38.94], [39.0, 42.89], [46.0, 51.54], [53.0, 53.45], [54.0, 73.23], [75.0, 78.16], [83.0, 84.42], [86.0, 88.33], [91.0, 92.67], [93.0, 95.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.92, 0.0, 90.78, 0.0, 54.76, 98.59, 0.0, 80.82, 95.91, 0.0, 95.91, 0.0, 94.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 0.73, 9.36, 1.72, 2.16, -0.06, 3.89, 5.54, 0.45, 19.23, 3.16, 1.42, 2.33, 1.67, 2.1]} \ No newline at end of file diff --git a/annotations_1/DECG3af2qh8_filtered.json b/annotations_1/DECG3af2qh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..289fbb34899344fb3ba3e1f6b19caf471ab04b7b --- /dev/null +++ b/annotations_1/DECG3af2qh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.02], [15.0, 15.87], [20.0, 20.46], [27.0, 28.26], [58.0, 58.48], [60.0, 61.18]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.02, 0.87, 0.46, 1.26, 0.48, 1.18]} \ No newline at end of file diff --git a/annotations_1/DECt9uTxaLE_filtered.json b/annotations_1/DECt9uTxaLE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4bfc41bcef1722f60097e75d0247e777dd7fd51 --- /dev/null +++ b/annotations_1/DECt9uTxaLE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.82], [6.0, 6.99], [22.0, 23.89], [31.0, 33.1], [35.0, 36.02], [37.0, 37.77], [41.0, 41.66], [42.0, 43.51], [45.0, 47.7], [57.0, 59.66], [62.0, 64.57], [66.0, 66.48], [69.0, 72.96], [74.0, 74.49], [76.0, 78.54], [83.0, 82.78], [84.0, 85.41], [86.0, 87.03], [89.0, 89.73], [94.0, 94.19], [95.0, 95.18], [97.0, 98.71], [101.0, 101.76], [103.0, 104.5], [105.0, 106.41], [108.0, 110.08], [115.0, 117.69], [122.0, 124.7], [130.0, 130.64], [131.0, 131.77], [132.0, 132.16], [132.0, 132.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 50.91, 0.0, 0.0, 0.0, 0.0, 50.56, 52.68, 51.94, 0.0, 54.76, 0.0, 53.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.37, 79.59, 69.47, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.18, 0.99, 1.89, 2.1, 1.02, 0.77, 0.66, 1.51, 2.7, 2.66, 2.57, 0.48, 3.96, 0.49, 2.54, -0.22, 1.41, 1.03, 0.73, 0.19, 0.18, 1.71, 0.76, 1.5, 1.41, 2.08, 2.69, 2.7, 0.64, 0.77, 0.16, 0.76]} \ No newline at end of file diff --git a/annotations_1/DEKdqE9W_i8_filtered.json b/annotations_1/DEKdqE9W_i8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b19e93283bc6629a7a46f696fd74532904d1c930 --- /dev/null +++ b/annotations_1/DEKdqE9W_i8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.18], [5.0, 5.43], [6.0, 8.01], [10.0, 11.47], [12.0, 12.73], [14.0, 14.28], [15.0, 16.24], [17.0, 24.8], [27.0, 27.77], [31.0, 31.87], [35.0, 86.07], [89.0, 95.62], [96.0, 97.19], [104.0, 105.0], [106.0, 106.56], [108.0, 108.19], [110.0, 110.52], [112.0, 114.84], [117.0, 117.19], [118.0, 121.73], [123.0, 127.85], [129.0, 161.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 65.2, 0.0, 0.0, 0.0, 0.0, 54.97, 0.0, 0.0, 0.0, 44.66, 0.0, 0.0, 0.0, 0.0, 0.0, 52.62, 0.0, 76.86, 88.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 38.7], ["vehicle", 16.97], ["hum", 8.42]], null, null, null, null, null, null, null, null, null, null], "duration": [0.18, 0.43, 2.01, 1.47, 0.73, 0.28, 1.24, 7.8, 0.77, 0.87, 51.07, 6.62, 1.19, 1.0, 0.56, 0.19, 0.52, 2.84, 0.19, 3.73, 4.85, 32.99]} \ No newline at end of file diff --git a/annotations_1/DEcY6WXL6_Y_filtered.json b/annotations_1/DEcY6WXL6_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e5ff6ca1c4ab723ca8fbbb8304405db67adfdc6 --- /dev/null +++ b/annotations_1/DEcY6WXL6_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.96], [12.0, 12.38], [13.0, 20.11], [21.0, 21.42], [22.0, 24.36], [25.0, 27.06], [29.0, 30.57], [35.0, 45.71], [47.0, 52.02], [53.0, 56.0], [57.0, 58.83], [59.0, 63.91], [66.0, 67.49], [69.0, 72.05], [74.0, 77.92], [78.0, 81.57], [82.0, 84.06], [87.0, 101.7], [104.0, 105.14], [106.0, 107.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 90.95, 0.0, 95.91, 96.54, 0.0, 97.33, 97.22, 96.77, 0.0, 93.91, 0.0, 91.81, 73.36, 68.15, 65.09, 53.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 0.38, 7.11, 0.42, 2.36, 2.06, 1.57, 10.71, 5.02, 3.0, 1.83, 4.91, 1.49, 3.05, 3.92, 3.57, 2.06, 14.7, 1.14, 1.49]} \ No newline at end of file diff --git a/annotations_1/DEmZWy1aDuo_filtered.json b/annotations_1/DEmZWy1aDuo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40007d525451254926753bdb583181cf33c1c831 --- /dev/null +++ b/annotations_1/DEmZWy1aDuo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.31], [5.0, 5.02], [6.0, 8.55], [15.0, 15.7], [20.0, 20.82], [23.0, 25.05], [25.0, 49.82], [51.0, 52.19], [53.0, 55.22], [57.0, 59.36], [60.0, 60.91], [64.0, 66.5], [68.0, 69.57], [71.0, 73.23], [76.0, 76.23], [79.0, 82.93], [84.0, 83.84], [86.0, 86.63], [88.0, 92.28], [94.0, 94.04], [102.0, 102.27], [107.0, 107.7], [109.0, 112.83], [113.0, 113.81], [114.0, 126.86], [128.0, 128.8], [134.0, 134.69], [137.0, 137.4], [139.0, 141.07], [147.0, 147.99], [150.0, 151.46], [158.0, 159.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.16, 0.0, 0.0, 75.07, 93.29, 0.0, 94.22, 99.1, 0.0, 98.93, 0.0, 87.19, 0.0, 99.26, 0.0, 0.0, 99.68, 0.0, 0.0, 0.0, 94.66, 0.0, 74.29, 0.0, 0.0, 0.0, 71.87, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.31, 0.02, 2.55, 0.7, 0.82, 2.05, 24.82, 1.19, 2.22, 2.36, 0.91, 2.5, 1.57, 2.23, 0.23, 3.93, -0.16, 0.63, 4.28, 0.04, 0.27, 0.7, 3.83, 0.81, 12.86, 0.8, 0.69, 0.4, 2.07, 0.99, 1.46, 1.06]} \ No newline at end of file diff --git a/annotations_1/DGOews8SVLw_filtered.json b/annotations_1/DGOews8SVLw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a05caf1cac292e971f8aa206943a1474c9634e0b --- /dev/null +++ b/annotations_1/DGOews8SVLw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.66], [9.0, 19.52], [23.0, 24.71], [27.0, 28.39], [31.0, 34.97], [38.0, 40.44], [43.0, 44.86], [48.0, 67.0], [72.0, 74.22], [76.0, 96.13], [96.0, 97.19], [100.0, 100.18], [101.0, 107.94], [111.0, 124.61], [126.0, 129.98], [130.0, 130.08], [130.0, 131.46]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [0.0, 29.94, 0.0, 0.0, 29.64, 29.26, 0.0, 29.76, 29.91, 30.0, 0.0, 0.0, 29.66, 29.64, 29.89, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 42.44], ["car", 13.84], ["skidding", 11.07]], null, null, [["vehicle", 35.27], ["car", 17.11], ["race car, auto racing", 12.48]], [["vehicle", 34.24], ["car", 26.37], ["race car, auto racing", 11.36]], null, [["music", 61.94], ["throbbing", 17.51], ["hum", 5.5]], [["music", 64.41], ["throbbing", 19.41], ["hum", 3.62]], [["music", 72.76], ["throbbing", 3.14], ["animal", 1.69]], null, null, [["music", 25.58], ["vehicle", 23.14], ["car", 19.14]], [["whack, thwack", 40.42], ["thump, thud", 8.53], ["music", 7.71]], [["music", 31.22], ["speech", 19.2], ["sound effect", 5.2]], null, null], "duration": [0.66, 10.52, 1.71, 1.39, 3.97, 2.44, 1.86, 19.0, 2.22, 20.13, 1.19, 0.18, 6.94, 13.61, 3.98, 0.08, 1.46]} \ No newline at end of file diff --git a/annotations_1/DGQkgqsHQns_filtered.json b/annotations_1/DGQkgqsHQns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a64327986de4df54919c6da9ec4071181210aaa --- /dev/null +++ b/annotations_1/DGQkgqsHQns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.05], [7.0, 7.13], [12.0, 18.01], [22.0, 22.99], [30.0, 30.55], [32.0, 32.86], [36.0, 38.74]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 35.65, 0.0, 0.0, 0.0, 33.39], "audiomae_on_audioset": [null, null, [["music", 32.82], ["throbbing", 15.91], ["electronic music", 4.96]], null, null, null, [["music", 72.41], ["musical instrument", 2.56], ["theremin", 2.09]]], "duration": [0.05, 0.13, 6.01, 0.99, 0.55, 0.86, 2.74]} \ No newline at end of file diff --git a/annotations_1/DGW436DH8Yw_filtered.json b/annotations_1/DGW436DH8Yw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4c09d57726c3995b5217110ffb7e950030a0d8f --- /dev/null +++ b/annotations_1/DGW436DH8Yw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.72], [6.0, 6.49], [7.0, 8.36], [11.0, 11.21], [18.0, 18.67], [19.0, 20.46], [22.0, 27.53], [28.0, 28.58], [30.0, 34.52], [35.0, 35.9], [37.0, 38.55], [45.0, 45.5], [47.0, 48.14], [48.0, 49.92], [52.0, 66.8], [69.0, 69.85], [70.0, 75.17], [78.0, 87.18], [88.0, 88.82], [90.0, 93.24], [95.0, 96.82], [100.0, 106.24], [111.0, 114.74], [116.0, 123.97], [125.0, 125.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.12, 0.0, 31.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.26, 0.0, 32.74, 30.22, 0.0, 32.57, 0.0, 31.83, 29.77, 29.73, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["throbbing", 52.81], ["hum", 37.99], ["music", 4.31]], null, [["throbbing", 46.65], ["music", 23.99], ["hum", 18.23]], null, null, null, null, null, [["music", 40.26], ["throbbing", 29.42], ["hum", 18.5]], null, [["speech", 27.09], ["hum", 20.11], ["music", 14.87]], [["hum", 33.26], ["music", 31.42], ["throbbing", 19.82]], null, [["music", 36.08], ["throbbing", 17.94], ["speech", 16.56]], null, [["music", 47.43], ["speech", 11.36], ["sonar", 11.23]], [["throbbing", 29.08], ["hum", 23.98], ["music", 19.46]], [["speech", 52.28], ["music", 18.04], ["hum", 9.25]], null], "duration": [-0.28, 0.49, 1.36, 0.21, 0.67, 1.46, 5.53, 0.58, 4.52, 0.9, 1.55, 0.5, 1.14, 1.92, 14.8, 0.85, 5.17, 9.18, 0.82, 3.24, 1.82, 6.24, 3.74, 7.97, 0.25]} \ No newline at end of file diff --git a/annotations_1/DGpJ1ndBxOA_filtered.json b/annotations_1/DGpJ1ndBxOA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3256043b7985d610f33f21d272eaed54ad4ce1d9 --- /dev/null +++ b/annotations_1/DGpJ1ndBxOA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.0], [13.0, 14.94], [21.0, 27.5], [61.0, 61.06], [62.0, 82.38], [83.0, 84.5], [86.0, 87.57], [88.0, 87.94]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [34.92, 0.0, 37.8, 0.0, 39.44, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 52.92], ["explosion", 13.06], ["burst, pop", 12.8]], null, [["music", 41.98], ["hum", 20.33], ["throbbing", 14.54]], null, [["hum", 59.44], ["mains hum", 21.12], ["music", 8.02]], null, null, null], "duration": [6.0, 1.94, 6.5, 0.06, 20.38, 1.5, 1.57, -0.06]} \ No newline at end of file diff --git a/annotations_1/DHWbxxpKb04_filtered.json b/annotations_1/DHWbxxpKb04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee57e95f356febc0f1996e774053a343a4e7a214 --- /dev/null +++ b/annotations_1/DHWbxxpKb04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [28.0, 30.57], [37.0, 49.44], [53.0, 71.86], [74.0, 78.63], [82.0, 82.04], [86.0, 94.22], [104.0, 104.58], [107.0, 115.21], [125.0, 125.15], [132.0, 131.94], [136.0, 137.22], [141.0, 144.12], [149.0, 149.42], [150.0, 149.94], [150.0, 151.16], [160.0, 161.25], [162.0, 168.99]], "keep_status": [false, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.51, 31.43, 31.25, 36.91, 0.0, 34.55, 0.0, 29.69, 0.0, 0.0, 0.0, 35.42, 0.0, 0.0, 0.0, 0.0, 32.73], "audiomae_on_audioset": [null, [["music", 44.63], ["smash, crash", 8.32], ["breaking", 7.45]], [["music", 23.79], ["speech", 22.88], ["buzz", 7.38]], [["boing", 46.13], ["music", 44.46], ["sound effect", 1.43]], [["music", 66.86], ["hum", 4.95], ["cacophony", 3.75]], null, [["music", 48.89], ["speech", 19.99], ["breaking", 15.5]], null, [["vehicle", 26.7], ["music", 21.48], ["car", 8.25]], null, null, null, [["music", 51.03], ["speech", 18.2], ["synthesizer", 6.1]], null, null, null, null, [["music", 64.02], ["theremin", 8.59], ["hum", 2.3]]], "duration": [0.5, 2.57, 12.44, 18.86, 4.63, 0.04, 8.22, 0.58, 8.21, 0.15, -0.06, 1.22, 3.12, 0.42, -0.06, 1.16, 1.25, 6.99]} \ No newline at end of file diff --git a/annotations_1/DHXHxop1gPw_filtered.json b/annotations_1/DHXHxop1gPw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc454071c01ff9cbdd0a303d42f06622b132891d --- /dev/null +++ b/annotations_1/DHXHxop1gPw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.55], [7.0, 9.1], [10.0, 14.4], [15.0, 24.61], [26.0, 33.1], [36.0, 48.22], [52.0, 53.32], [55.0, 55.66], [56.0, 58.53], [63.0, 63.07], [64.0, 66.09], [69.0, 72.06], [75.0, 76.37], [80.0, 87.27], [91.0, 95.2], [102.0, 103.33], [104.0, 132.49]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.68, 36.07, 32.36, 29.89, 30.54, 0.0, 0.0, 36.27, 0.0, 38.7, 65.09, 0.0, 71.87, 97.54, 0.0, 50.41], "audiomae_on_audioset": [null, [["music", 70.42], ["musical instrument", 5.87], ["drum machine", 2.9]], [["music", 47.27], ["boing", 37.18], ["speech", 3.77]], [["music", 75.12], ["sampler", 2.41], ["musical instrument", 2.04]], [["music", 53.46], ["speech", 18.93], ["throbbing", 10.13]], [["music", 73.97], ["speech", 12.48], ["throbbing", 2.13]], null, null, [["speech", 23.56], ["fire", 20.55], ["field recording", 4.99]], null, [["cattle, bovinae", 40.11], ["moo", 28.99], ["livestock, farm animals, working animals", 26.98]], null, null, null, null, null, null], "duration": [0.55, 2.1, 4.4, 9.61, 7.1, 12.22, 1.32, 0.66, 2.53, 0.07, 2.09, 3.06, 1.37, 7.27, 4.2, 1.33, 28.49]} \ No newline at end of file diff --git a/annotations_1/DHYCHYsyqTc_filtered.json b/annotations_1/DHYCHYsyqTc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fced1372d7fa107b11681c9e48533ebc041e727 --- /dev/null +++ b/annotations_1/DHYCHYsyqTc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.72], [13.0, 13.49], [14.0, 15.2], [16.0, 16.41], [18.0, 18.77], [22.0, 22.5], [30.0, 36.71], [48.0, 57.79], [60.0, 60.49], [64.0, 67.76], [69.0, 69.94], [70.0, 71.19], [72.0, 78.26], [83.0, 83.07], [84.0, 84.79], [86.0, 86.86], [91.0, 91.18], [92.0, 93.19], [94.0, 95.01], [106.0, 110.78], [112.0, 115.96], [119.0, 121.31], [123.0, 123.6], [125.0, 127.68], [130.0, 130.54], [132.0, 135.24], [137.0, 136.71], [138.0, 138.28], [145.0, 145.76], [149.0, 153.13], [155.0, 155.51], [157.0, 157.47], [163.0, 174.26]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.31, 30.79, 0.0, 32.85, 0.0, 0.0, 30.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.39, 35.42, 32.49, 0.0, 34.2, 0.0, 33.41, 0.0, 0.0, 0.0, 32.46, 0.0, 0.0, 30.14], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 25.01], ["moo", 13.83], ["throbbing", 10.35]], [["music", 47.66], ["boing", 23.28], ["throbbing", 6.76]], null, [["music", 33.29], ["hum", 22.29], ["throbbing", 17.63]], null, null, [["cattle, bovinae", 34.74], ["moo", 31.05], ["livestock, farm animals, working animals", 28.49]], null, null, null, null, null, null, [["music", 46.37], ["speech", 11.36], ["throbbing", 9.93]], [["music", 66.61], ["speech", 9.08], ["electronic music", 3.7]], [["throbbing", 33.27], ["music", 29.39], ["hum", 7.12]], null, [["music", 61.97], ["hum", 4.57], ["throbbing", 4.24]], null, [["cattle, bovinae", 41.71], ["moo", 36.79], ["livestock, farm animals, working animals", 20.62]], null, null, null, [["hum", 32.13], ["mains hum", 17.89], ["music", 14.38]], null, null, [["music", 36.61], ["mains hum", 10.63], ["hum", 7.77]]], "duration": [0.72, 0.49, 1.2, 0.41, 0.77, 0.5, 6.71, 9.79, 0.49, 3.76, 0.94, 1.19, 6.26, 0.07, 0.79, 0.86, 0.18, 1.19, 1.01, 4.78, 3.96, 2.31, 0.6, 2.68, 0.54, 3.24, -0.29, 0.28, 0.76, 4.13, 0.51, 0.47, 11.26]} \ No newline at end of file diff --git a/annotations_1/DHk_bI_wMcY_filtered.json b/annotations_1/DHk_bI_wMcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc69b00156b4879698bd14380c00136fc3d17d2c --- /dev/null +++ b/annotations_1/DHk_bI_wMcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 37.83], [41.0, 41.54], [42.0, 70.24]], "keep_status": [false, false, false], "silence_prob": [31.06, 0.0, 31.93], "audiomae_on_audioset": [[["music", 56.38], ["throbbing", 10.95], ["hum", 10.93]], null, [["music", 67.47], ["didgeridoo", 5.41], ["buzz", 4.37]]], "duration": [6.83, 0.54, 28.24]} \ No newline at end of file diff --git a/annotations_1/DHnwNo7Z6Ts_filtered.json b/annotations_1/DHnwNo7Z6Ts_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b203f6ae912ff7dcfd64ef1b86c0fb39fb902c6 --- /dev/null +++ b/annotations_1/DHnwNo7Z6Ts_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.33], [4.0, 4.87], [6.0, 8.45], [9.0, 10.98], [13.0, 13.29], [16.0, 17.56], [22.0, 22.23], [24.0, 25.12], [28.0, 29.2], [30.0, 33.03], [34.0, 34.8], [36.0, 38.87], [42.0, 42.36], [46.0, 48.81], [51.0, 55.71], [57.0, 58.7], [60.0, 74.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 97.83, 0.0, 95.51, 99.99, 0.0, 90.08], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.33, 0.87, 2.45, 1.98, 0.29, 1.56, 0.23, 1.12, 1.2, 3.03, 0.8, 2.87, 0.36, 2.81, 4.71, 1.7, 14.7]} \ No newline at end of file diff --git a/annotations_1/DHzeRLN8UVc_filtered.json b/annotations_1/DHzeRLN8UVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25189cc3add45c405c0823fa66771eefa6d1e7c1 --- /dev/null +++ b/annotations_1/DHzeRLN8UVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.89], [4.0, 5.93], [6.0, 5.97], [6.0, 6.4], [7.0, 7.42], [24.0, 26.06], [32.0, 34.64], [40.0, 47.36], [53.0, 53.38], [53.0, 64.67], [69.0, 69.43], [70.0, 70.02], [71.0, 78.7], [83.0, 83.79], [86.0, 93.28], [95.0, 95.89], [97.0, 96.96], [99.0, 100.87], [104.0, 104.77], [105.0, 106.39], [107.0, 109.95]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.57, 45.56, 35.51, 0.0, 33.54, 0.0, 0.0, 38.98, 0.0, 57.81, 0.0, 0.0, 0.0, 0.0, 0.0, 39.83], "audiomae_on_audioset": [null, null, null, null, null, [["music", 30.66], ["speech", 19.63], ["sidetone", 9.4]], [["music", 59.1], ["throbbing", 6.78], ["boing", 4.49]], [["speech", 23.93], ["music", 17.56], ["electric shaver, electric razor", 10.63]], null, [["speech", 52.89], ["music", 24.46], ["sidetone", 2.62]], null, null, [["speech", 35.69], ["whack, thwack", 13.62], ["music", 10.14]], null, null, null, null, null, null, null, [["music", 39.66], ["thunk", 13.92], ["didgeridoo", 6.97]]], "duration": [-0.11, 1.93, -0.03, 0.4, 0.42, 2.06, 2.64, 7.36, 0.38, 11.67, 0.43, 0.02, 7.7, 0.79, 7.28, 0.89, -0.04, 1.87, 0.77, 1.39, 2.95]} \ No newline at end of file diff --git a/annotations_1/DI5t1Bxfy90_filtered.json b/annotations_1/DI5t1Bxfy90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f24631d0a75281ce6551891bf2229a1cc75d61c6 --- /dev/null +++ b/annotations_1/DI5t1Bxfy90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.97], [15.0, 19.09], [22.0, 28.92], [30.0, 31.26], [38.0, 41.77], [54.0, 68.4], [70.0, 70.88]], "keep_status": [false, true, false, false, false, true, false], "silence_prob": [0.0, 29.97, 28.93, 0.0, 30.01, 28.79, 0.0], "audiomae_on_audioset": [null, [["music", 34.03], ["speech", 14.88], ["throbbing", 9.44]], [["whale vocalization", 83.4], ["music", 6.37], ["speech", 2.15]], null, [["music", 48.03], ["speech", 25.48], ["electronic music", 1.99]], [["vehicle", 35.81], ["car", 18.67], ["speech", 9.49]], null], "duration": [1.97, 4.09, 6.92, 1.26, 3.77, 14.4, 0.88]} \ No newline at end of file diff --git a/annotations_1/DII9AQZoUTo_filtered.json b/annotations_1/DII9AQZoUTo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f085019f8a9b6d012bfdaa81835d6e788022ee5 --- /dev/null +++ b/annotations_1/DII9AQZoUTo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.37], [5.0, 5.21], [7.0, 16.23], [18.0, 20.36], [23.0, 52.54], [53.0, 54.3], [56.0, 56.73], [58.0, 59.53], [60.0, 60.71], [64.0, 64.15]], "keep_status": [false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.21, 38.31, 31.28, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 60.36], ["sidetone", 11.79], ["music", 11.51]], [["speech", 31.03], ["music", 28.41], ["animal", 3.51]], [["synthesizer", 30.23], ["music", 17.61], ["noise", 9.04]], null, null, null, null, null], "duration": [1.37, 0.21, 9.23, 2.36, 29.54, 1.3, 0.73, 1.53, 0.71, 0.15]} \ No newline at end of file diff --git a/annotations_1/DIkKczv9Eo4_filtered.json b/annotations_1/DIkKczv9Eo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..188e7b1ff36fd7b8aa0ecd6a5cbff62ad7c248da --- /dev/null +++ b/annotations_1/DIkKczv9Eo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.17], [6.0, 7.13], [9.0, 9.75], [17.0, 23.23], [24.0, 24.71], [26.0, 31.94], [34.0, 35.87], [37.0, 38.85], [40.0, 75.95], [77.0, 102.57], [103.0, 108.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 55.31, 0.0, 99.93, 0.0, 0.0, 0.0, 100.0, 99.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.17, 1.13, 0.75, 6.23, 0.71, 5.94, 1.87, 1.85, 35.95, 25.57, 5.85]} \ No newline at end of file diff --git a/annotations_1/DIlHR2SWW9E_filtered.json b/annotations_1/DIlHR2SWW9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9805352a50403971de41ec1b76a815b04f8cbdc3 --- /dev/null +++ b/annotations_1/DIlHR2SWW9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.26], [4.0, 12.8], [13.0, 13.24], [17.0, 18.5], [24.0, 28.85], [29.0, 34.64], [38.0, 38.28], [40.0, 46.94], [49.0, 49.99], [51.0, 51.49], [52.0, 52.14], [56.0, 58.28], [62.0, 62.58], [65.0, 65.91], [66.0, 74.43], [76.0, 78.12], [79.0, 79.68], [81.0, 82.19], [82.0, 82.95], [83.0, 86.0], [87.0, 88.21], [89.0, 90.12], [90.0, 93.77], [99.0, 101.38], [102.0, 103.55], [104.0, 106.27], [107.0, 114.45], [115.0, 119.06], [122.0, 122.39], [127.0, 127.95], [128.0, 128.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.96, 0.0, 0.0, 99.94, 55.39, 0.0, 90.78, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 83.7, 94.81, 0.0, 0.0, 0.0, 78.21, 0.0, 0.0, 64.86, 68.28, 0.0, 97.33, 77.7, 95.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 8.8, 0.24, 1.5, 4.85, 5.64, 0.28, 6.94, 0.99, 0.49, 0.14, 2.28, 0.58, 0.91, 8.43, 2.12, 0.68, 1.19, 0.95, 3.0, 1.21, 1.12, 3.77, 2.38, 1.55, 2.27, 7.45, 4.06, 0.39, 0.95, 0.88]} \ No newline at end of file diff --git a/annotations_1/DJTF3NmqF7U_filtered.json b/annotations_1/DJTF3NmqF7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a350c66deef55c571471e3a87560ae49c1bafb9 --- /dev/null +++ b/annotations_1/DJTF3NmqF7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.38], [13.0, 13.19], [14.0, 18.82], [20.0, 20.31], [22.0, 26.49], [28.0, 28.9], [30.0, 30.57], [36.0, 47.6], [54.0, 56.84], [57.0, 58.19], [60.0, 60.79], [67.0, 70.71], [72.0, 72.47], [76.0, 77.03], [78.0, 80.49], [82.0, 82.56], [85.0, 85.8], [88.0, 96.16], [99.0, 102.83], [104.0, 106.39], [107.0, 112.24], [114.0, 117.83]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.46, 0.0, 51.77, 0.0, 0.0, 51.77, 47.2, 0.0, 0.0, 67.89, 0.0, 0.0, 80.64, 0.0, 0.0, 88.64, 93.13, 77.03, 94.95, 58.05], "audiomae_on_audioset": [null, null, [["speech", 43.76], ["sidetone", 14.72], ["hum", 11.24]], null, null, null, null, null, [["mains hum", 45.56], ["hum", 31.44], ["fly, housefly", 3.37]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 0.19, 4.82, 0.31, 4.49, 0.9, 0.57, 11.6, 2.84, 1.19, 0.79, 3.71, 0.47, 1.03, 2.49, 0.56, 0.8, 8.16, 3.83, 2.39, 5.24, 3.83]} \ No newline at end of file diff --git a/annotations_1/DJWKWwfURtI_filtered.json b/annotations_1/DJWKWwfURtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..058a5b624c15c55a67c61b4a94eb7713a35855d8 --- /dev/null +++ b/annotations_1/DJWKWwfURtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 37.67], [46.0, 45.67], [46.0, 63.24], [66.0, 67.56], [79.0, 79.69], [85.0, 85.14], [92.0, 92.33], [95.0, 96.06], [98.0, 100.26], [102.0, 108.87], [111.0, 111.23], [112.0, 114.93]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [30.67, 0.0, 30.57, 0.0, 0.0, 0.0, 0.0, 0.0, 31.97, 38.17, 0.0, 56.7], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 40.05], ["cattle, bovinae", 32.84], ["moo", 21.77]], null, [["music", 67.94], ["whack, thwack", 4.66], ["boing", 3.89]], null, null, null, null, null, [["music", 24.99], ["mains hum", 19.52], ["hum", 13.06]], [["theremin", 32.95], ["music", 30.09], ["didgeridoo", 11.91]], null, null], "duration": [7.67, -0.33, 17.24, 1.56, 0.69, 0.14, 0.33, 1.06, 2.26, 6.87, 0.23, 2.93]} \ No newline at end of file diff --git a/annotations_1/DJZqFXSHyvc_filtered.json b/annotations_1/DJZqFXSHyvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..459384f325fe7c7be3cc36916f456c3f52914e9c --- /dev/null +++ b/annotations_1/DJZqFXSHyvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 31.7], [32.0, 36.73], [38.0, 39.8], [40.0, 42.79], [44.0, 55.27], [57.0, 58.72], [60.0, 62.77], [64.0, 65.99], [67.0, 70.8], [72.0, 74.12], [79.0, 79.2], [85.0, 85.58], [87.0, 93.34], [95.0, 96.42], [102.0, 104.48], [107.0, 109.27], [110.0, 110.88], [113.0, 113.98], [115.0, 116.48], [131.0, 131.4], [135.0, 135.04], [144.0, 148.02], [150.0, 150.7], [158.0, 158.73], [160.0, 160.56], [168.0, 170.51], [173.0, 174.99]], "keep_status": [true, false, false, true, true, false, true, false, true, true, false, false, true, false, true, true, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [45.14, 59.42, 0.0, 34.57, 34.26, 0.0, 35.5, 0.0, 33.01, 30.02, 0.0, 0.0, 33.08, 0.0, 33.67, 35.46, 0.0, 0.0, 0.0, 0.0, 0.0, 33.77, 0.0, 0.0, 0.0, 35.59, 0.0], "audiomae_on_audioset": [[["whale vocalization", 16.79], ["animal", 15.13], ["speech", 7.21]], null, null, [["speech", 24.02], ["noise", 17.05], ["music", 11.02]], [["speech", 52.35], ["hum", 6.6], ["music", 5.0]], null, [["speech", 27.66], ["throbbing", 24.24], ["music", 15.66]], null, [["music", 39.15], ["hum", 16.56], ["mains hum", 6.5]], [["music", 16.16], ["hum", 15.17], ["vehicle", 11.09]], null, null, [["music", 27.5], ["fly, housefly", 10.17], ["didgeridoo", 8.62]], null, [["music", 38.46], ["livestock, farm animals, working animals", 12.84], ["cattle, bovinae", 12.77]], [["music", 45.47], ["hum", 12.81], ["throbbing", 7.25]], null, null, null, null, null, [["speech", 31.46], ["mains hum", 18.31], ["hum", 15.38]], null, null, null, [["music", 34.06], ["sonar", 19.37], ["hum", 12.99]], null], "duration": [5.7, 4.73, 1.8, 2.79, 11.27, 1.72, 2.77, 1.99, 3.8, 2.12, 0.2, 0.58, 6.34, 1.42, 2.48, 2.27, 0.88, 0.98, 1.48, 0.4, 0.04, 4.02, 0.7, 0.73, 0.56, 2.51, 1.99]} \ No newline at end of file diff --git a/annotations_1/DKqFCG3UTEs_filtered.json b/annotations_1/DKqFCG3UTEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68d6d3016a0ff23124ffde81af29f41794bdf7e8 --- /dev/null +++ b/annotations_1/DKqFCG3UTEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.87], [20.0, 31.26], [32.0, 32.34], [33.0, 34.2], [34.0, 35.45], [39.0, 39.9], [41.0, 41.52], [50.0, 51.14], [56.0, 64.93], [68.0, 68.03], [75.0, 76.03], [78.0, 78.22], [79.0, 79.91], [81.0, 81.72], [84.0, 84.69], [87.0, 88.1], [89.0, 89.61], [99.0, 100.38], [102.0, 101.73], [106.0, 106.83], [113.0, 114.62], [115.0, 117.93], [120.0, 120.16], [121.0, 124.12], [127.0, 128.11], [131.0, 135.99], [137.0, 139.78], [141.0, 142.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.86, 50.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.36, 0.0, 89.9, 0.0, 97.83, 94.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.87, 11.26, 0.34, 1.2, 1.45, 0.9, 0.52, 1.14, 8.93, 0.03, 1.03, 0.22, 0.91, 0.72, 0.69, 1.1, 0.61, 1.38, -0.27, 0.83, 1.62, 2.93, 0.16, 3.12, 1.11, 4.99, 2.78, 1.26]} \ No newline at end of file diff --git a/annotations_1/DKtupzAQYv4_filtered.json b/annotations_1/DKtupzAQYv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60a8ec4fcdec0ea300f68e7f5e2f77e420082420 --- /dev/null +++ b/annotations_1/DKtupzAQYv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.59], [7.0, 7.33], [22.0, 23.08], [44.0, 44.59], [56.0, 56.93], [74.0, 76.45], [84.0, 84.94], [107.0, 107.84], [121.0, 121.88]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.59, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 29.73], ["hum", 6.52], ["rumble", 6.2]], null, null, null], "duration": [0.59, 0.33, 1.08, 0.59, 0.93, 2.45, 0.94, 0.84, 0.88]} \ No newline at end of file diff --git a/annotations_1/DL-fT3OymQI_filtered.json b/annotations_1/DL-fT3OymQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8da3dd3d8b15d54134023126f5fef388628af50 --- /dev/null +++ b/annotations_1/DL-fT3OymQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 12.04], [13.0, 14.25], [15.0, 15.42], [18.0, 18.44], [19.0, 19.43], [20.0, 20.49], [22.0, 25.3], [31.0, 33.2], [34.0, 38.1], [38.0, 38.26], [45.0, 46.06], [47.0, 47.39], [48.0, 48.71], [49.0, 50.97], [60.0, 60.64], [61.0, 62.11], [64.0, 73.28], [78.0, 78.68], [81.0, 82.58], [84.0, 85.77], [87.0, 100.01], [104.0, 104.19], [104.0, 151.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.56, 0.0, 0.0, 0.0, 0.0, 0.0, 37.44, 36.73, 39.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.85, 0.0, 0.0, 0.0, 28.41, 0.0, 0.0], "audiomae_on_audioset": [[["music", 72.53], ["musical instrument", 4.96], ["guitar", 4.18]], null, null, null, null, null, [["didgeridoo", 49.86], ["music", 40.09], ["musical instrument", 2.48]], [["didgeridoo", 53.54], ["music", 25.96], ["theremin", 7.71]], [["music", 59.58], ["didgeridoo", 19.89], ["musical instrument", 8.64]], null, null, null, null, null, null, null, [["music", 81.84], ["musical instrument", 1.33], ["didgeridoo", 1.32]], null, null, null, [["music", 73.8], ["psychedelic rock", 3.17], ["speech", 2.4]], null, null], "duration": [10.04, 1.25, 0.42, 0.44, 0.43, 0.49, 3.3, 2.2, 4.1, 0.26, 1.06, 0.39, 0.71, 1.97, 0.64, 1.11, 9.28, 0.68, 1.58, 1.77, 13.01, 0.19, 47.36]} \ No newline at end of file diff --git a/annotations_1/DLb9vR3Zu3g_filtered.json b/annotations_1/DLb9vR3Zu3g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96a94e7716001a80e28c085b51968f963bf52445 --- /dev/null +++ b/annotations_1/DLb9vR3Zu3g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.17], [5.0, 7.8], [9.0, 9.24], [10.0, 28.29], [31.0, 36.19], [41.0, 45.72], [47.0, 47.61], [49.0, 48.63], [54.0, 54.75], [56.0, 56.52], [57.0, 59.24], [60.0, 61.2], [63.0, 66.39], [69.0, 71.96], [75.0, 78.14], [81.0, 82.46], [84.0, 83.96], [86.0, 87.24], [93.0, 94.91], [101.0, 102.88], [111.0, 111.47], [115.0, 115.86], [117.0, 118.52], [137.0, 139.45], [144.0, 148.54], [151.0, 157.77], [159.0, 161.65], [162.0, 163.73], [164.0, 165.74], [167.0, 167.91], [171.0, 171.39], [173.0, 174.48], [175.0, 175.29]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 82.07, 0.0, 69.47, 82.25, 48.14, 0.0, 0.0, 0.0, 0.0, 81.71, 0.0, 96.17, 97.43, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61, 95.64, 92.8, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["animal", 25.69], ["music", 9.42], ["dog", 9.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.17, 2.8, 0.24, 18.29, 5.19, 4.72, 0.61, -0.37, 0.75, 0.52, 2.24, 1.2, 3.39, 2.96, 3.14, 1.46, -0.04, 1.24, 1.91, 1.88, 0.47, 0.86, 1.52, 2.45, 4.54, 6.77, 2.65, 1.73, 1.74, 0.91, 0.39, 1.48, 0.29]} \ No newline at end of file diff --git a/annotations_1/DLzp0YkZnRc_filtered.json b/annotations_1/DLzp0YkZnRc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d29f6b896498c8cb9fdd7a90bc1052c1b6e0a1b7 --- /dev/null +++ b/annotations_1/DLzp0YkZnRc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.04], [19.0, 21.02], [37.0, 46.6], [48.0, 51.88], [53.0, 58.06], [59.0, 60.45], [66.0, 68.13], [71.0, 71.98], [75.0, 77.18], [80.0, 80.65], [85.0, 86.81], [91.0, 91.59], [97.0, 98.12], [101.0, 102.34], [115.0, 115.94], [118.0, 118.44], [126.0, 126.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.93, 99.96, 51.94, 99.44, 99.93, 0.0, 99.78, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.04, 2.02, 9.6, 3.88, 5.06, 1.45, 2.13, 0.98, 2.18, 0.65, 1.81, 0.59, 1.12, 1.34, 0.94, 0.44, 0.15]} \ No newline at end of file diff --git a/annotations_1/DNHmujbuC74_filtered.json b/annotations_1/DNHmujbuC74_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba2d6026051ac2426cdca481b84ef87872cbf2f2 --- /dev/null +++ b/annotations_1/DNHmujbuC74_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.05], [3.0, 3.64], [19.0, 20.34], [27.0, 27.51], [29.0, 30.59], [33.0, 34.67], [41.0, 41.18], [44.0, 45.03], [47.0, 48.78], [49.0, 50.06], [50.0, 54.53], [65.0, 66.93], [67.0, 68.23], [73.0, 76.96], [79.0, 79.2], [80.0, 82.22], [86.0, 86.63], [88.0, 93.51], [96.0, 96.92], [101.0, 101.17], [108.0, 108.09], [109.0, 110.02], [124.0, 124.04], [127.0, 172.66], [173.0, 179.27], [184.0, 184.91], [188.0, 188.38], [190.0, 190.78], [192.0, 194.81], [198.0, 200.37], [204.0, 204.89], [207.0, 207.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44, 0.0, 0.0, 82.43, 0.0, 34.58, 0.0, 41.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.69, 0.0, 0.0, 0.0, 99.76, 77.2, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.67], ["music", 11.65], ["grunt", 8.44]], null, [["speech", 83.35], ["busy signal", 4.25], ["moo", 1.87]], null, null, null, null, null, null, [["music", 63.56], ["musical instrument", 3.65], ["singing", 3.18]], null, null, null, null, null, null, null], "duration": [0.05, 0.64, 1.34, 0.51, 1.59, 1.67, 0.18, 1.03, 1.78, 1.06, 4.53, 1.93, 1.23, 3.96, 0.2, 2.22, 0.63, 5.51, 0.92, 0.17, 0.09, 1.02, 0.04, 45.66, 6.27, 0.91, 0.38, 0.78, 2.81, 2.37, 0.89, 0.3]} \ No newline at end of file diff --git a/annotations_1/DOmIpiTMs2w_filtered.json b/annotations_1/DOmIpiTMs2w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce31693d5cc745ed4634b126dc8695999076ca33 --- /dev/null +++ b/annotations_1/DOmIpiTMs2w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 34.26], [36.0, 35.9], [40.0, 40.54], [43.0, 43.77], [45.0, 56.96], [57.0, 58.5], [61.0, 62.48], [62.0, 62.55], [63.0, 71.49], [74.0, 75.3], [81.0, 84.45], [88.0, 105.04], [106.0, 116.6], [132.0, 132.65], [133.0, 133.51], [138.0, 138.57], [142.0, 142.96], [143.0, 142.99], [153.0, 155.12], [156.0, 157.2], [159.0, 158.75], [161.0, 162.33], [163.0, 163.61], [164.0, 166.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.77, 0.0, 0.0, 0.0, 32.95, 0.0, 0.0, 0.0, 33.1, 0.0, 33.3, 33.98, 49.27, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 0.0, 98.8], "audiomae_on_audioset": [null, null, null, null, [["music", 80.14], ["speech", 2.6], ["drum machine", 2.23]], null, null, null, [["music", 88.7], ["funny music", 1.09], ["sampler", 0.75]], null, [["music", 78.42], ["musical instrument", 1.76], ["didgeridoo", 1.49]], [["music", 88.56], ["sampler", 1.85], ["synthesizer", 1.42]], [["music", 51.35], ["throbbing", 6.12], ["hum", 5.71]], null, null, null, null, null, null, null, null, null, null, null], "duration": [3.26, -0.1, 0.54, 0.77, 11.96, 1.5, 1.48, 0.55, 8.49, 1.3, 3.45, 17.04, 10.6, 0.65, 0.51, 0.57, 0.96, -0.01, 2.12, 1.2, -0.25, 1.33, 0.61, 2.35]} \ No newline at end of file diff --git a/annotations_1/DPmHrgbe3xo_filtered.json b/annotations_1/DPmHrgbe3xo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e150168903dd5ebf2e5f6fd95ae7bcb36b135154 --- /dev/null +++ b/annotations_1/DPmHrgbe3xo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.3], [13.0, 14.98], [16.0, 22.38], [30.0, 30.38], [32.0, 32.75], [38.0, 39.77], [42.0, 43.8], [47.0, 47.43], [51.0, 79.24], [80.0, 86.16], [86.0, 86.31], [92.0, 93.14], [95.0, 95.79], [99.0, 100.36], [106.0, 118.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 28.57, 0.0, 0.0, 0.0, 0.0, 0.0, 28.98, 28.99, 0.0, 0.0, 0.0, 0.0, 28.41], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 39.4], ["cattle, bovinae", 39.35], ["moo", 20.83]], null, null, null, null, null, [["music", 85.73], ["carnatic music", 2.48], ["musical instrument", 1.4]], [["music", 59.67], ["cattle, bovinae", 9.94], ["moo", 6.94]], null, null, null, null, [["cattle, bovinae", 30.06], ["music", 24.01], ["moo", 16.55]]], "duration": [0.3, 1.98, 6.38, 0.38, 0.75, 1.77, 1.8, 0.43, 28.24, 6.16, 0.31, 1.14, 0.79, 1.36, 12.44]} \ No newline at end of file diff --git a/annotations_1/DQU7X4QDX80_filtered.json b/annotations_1/DQU7X4QDX80_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b454ac8eff7f0b3c85b3fe6f039837c7008981b5 --- /dev/null +++ b/annotations_1/DQU7X4QDX80_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.88], [12.0, 11.84], [13.0, 12.82], [14.0, 14.18], [28.0, 42.72], [45.0, 45.69], [46.0, 55.02], [59.0, 67.66], [68.0, 68.79], [70.0, 71.64], [73.0, 75.32], [86.0, 87.57], [89.0, 92.33], [97.0, 97.8], [108.0, 121.02], [124.0, 127.14], [130.0, 130.69], [134.0, 134.65], [151.0, 151.61], [155.0, 157.86]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.38, 0.0, 29.3, 34.9, 0.0, 0.0, 34.34, 0.0, 31.99, 0.0, 29.41, 30.82, 0.0, 0.0, 0.0, 34.07], "audiomae_on_audioset": [null, null, null, null, [["music", 73.95], ["throbbing", 8.9], ["electronic music", 4.56]], null, [["music", 50.69], ["throbbing", 19.66], ["speech", 10.27]], [["music", 29.31], ["cattle, bovinae", 17.25], ["moo", 12.48]], null, null, [["music", 64.01], ["cattle, bovinae", 6.34], ["moo", 5.06]], null, [["music", 21.7], ["cattle, bovinae", 19.26], ["moo", 15.95]], null, [["music", 36.26], ["fly, housefly", 27.95], ["buzz", 10.17]], [["throbbing", 46.88], ["music", 34.85], ["hum", 9.0]], null, null, null, [["music", 56.14], ["speech", 11.58], ["electronic music", 5.71]]], "duration": [0.88, -0.16, -0.18, 0.18, 14.72, 0.69, 9.02, 8.66, 0.79, 1.64, 2.32, 1.57, 3.33, 0.8, 13.02, 3.14, 0.69, 0.65, 0.61, 2.86]} \ No newline at end of file diff --git a/annotations_1/DQjDI3NorAY_filtered.json b/annotations_1/DQjDI3NorAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9de2bc9cff517be80c02604b1d62a2c2d2b8647 --- /dev/null +++ b/annotations_1/DQjDI3NorAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.39], [12.0, 12.14], [17.0, 17.15], [23.0, 24.36], [26.0, 26.3], [28.0, 28.14], [33.0, 34.35], [57.0, 60.39], [63.0, 63.88], [66.0, 67.69], [69.0, 69.65], [74.0, 74.88], [75.0, 77.36], [78.0, 80.1], [93.0, 95.23], [97.0, 97.24], [117.0, 117.53], [119.0, 119.18], [120.0, 121.85], [125.0, 127.89], [129.0, 133.47], [145.0, 145.61], [151.0, 152.83], [154.0, 155.24], [182.0, 183.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 70.02, 46.94, 99.59, 0.0, 0.0, 0.0, 0.0, 88.1, 45.14, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 12.66], ["burping, eructation", 11.46], ["stomach rumble", 6.72]], null, null, null, null, null, null, [["music", 80.95], ["effects unit", 4.7], ["guitar", 4.29]], null, null, null, null], "duration": [0.39, 0.14, 0.15, 1.36, 0.3, 0.14, 1.35, 3.39, 0.88, 1.69, 0.65, 0.88, 2.36, 2.1, 2.23, 0.24, 0.53, 0.18, 1.85, 2.89, 4.47, 0.61, 1.83, 1.24, 1.25]} \ No newline at end of file diff --git a/annotations_1/DRGjkQ_iBL8_filtered.json b/annotations_1/DRGjkQ_iBL8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2c6a01ee4c7d1d741b4bbde8a511b5f0c8e4e6f --- /dev/null +++ b/annotations_1/DRGjkQ_iBL8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.01], [5.0, 8.75], [10.0, 20.34], [22.0, 23.19], [24.0, 49.05], [52.0, 53.94], [56.0, 62.11], [63.0, 68.05], [69.0, 72.44], [73.0, 96.45], [98.0, 98.42], [99.0, 127.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 100.0, 99.98, 0.0, 99.36, 0.0, 99.62, 99.59, 99.95, 74.13, 0.0, 32.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 35.98], ["speech", 34.45], ["whale vocalization", 12.02]]], "duration": [2.01, 3.75, 10.34, 1.19, 25.05, 1.94, 6.11, 5.05, 3.44, 23.45, 0.42, 28.45]} \ No newline at end of file diff --git a/annotations_1/DRtbf7iG8Nw_filtered.json b/annotations_1/DRtbf7iG8Nw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5eea10cdf34762c5ff82793c843bb24eccf646d --- /dev/null +++ b/annotations_1/DRtbf7iG8Nw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.59], [11.0, 11.84], [16.0, 16.63], [20.0, 24.43], [31.0, 32.04], [33.0, 34.21], [36.0, 36.27], [39.0, 45.35], [46.0, 47.28], [51.0, 51.81], [58.0, 59.9], [67.0, 67.51], [72.0, 72.03], [74.0, 78.34], [89.0, 89.55], [99.0, 100.9], [104.0, 103.72], [109.0, 108.82], [110.0, 110.25]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.66, 0.0, 0.0, 0.0, 41.6, 0.0, 0.0, 0.0, 0.0, 0.0, 32.11, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 58.09], ["mantra", 5.74], ["chant", 4.61]], null, null, null, [["music", 46.97], ["lullaby", 14.87], ["mantra", 6.31]], null, null, null, null, null, [["music", 52.13], ["theremin", 12.33], ["wind instrument, woodwind instrument", 8.43]], null, null, null, null, null], "duration": [1.59, 0.84, 0.63, 4.43, 1.04, 1.21, 0.27, 6.35, 1.28, 0.81, 1.9, 0.51, 0.03, 4.34, 0.55, 1.9, -0.28, -0.18, 0.25]} \ No newline at end of file diff --git a/annotations_1/DSO1F6sM63s_filtered.json b/annotations_1/DSO1F6sM63s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85deb60d677975705a7177539fc1b75fa292349f --- /dev/null +++ b/annotations_1/DSO1F6sM63s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.51], [8.0, 12.51], [13.0, 14.4], [15.0, 17.15], [18.0, 18.81], [21.0, 21.2], [26.0, 27.36], [30.0, 30.94], [35.0, 44.73], [47.0, 112.19], [114.0, 115.03], [116.0, 119.57], [120.0, 120.61], [123.0, 124.01], [125.0, 126.25], [127.0, 126.96], [127.0, 129.02], [130.0, 130.98], [135.0, 135.62], [145.0, 145.74], [151.0, 150.99], [153.0, 158.21], [160.0, 160.52], [162.0, 162.63], [168.0, 168.17]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [32.08, 29.45, 0.0, 29.09, 0.0, 0.0, 0.0, 0.0, 29.36, 0.0, 0.0, 46.64, 0.0, 0.0, 0.0, 0.0, 47.66, 0.0, 0.0, 0.0, 0.0, 30.23, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["car", 29.98], ["vehicle", 20.16], ["race car, auto racing", 11.71]], [["mains hum", 23.59], ["hum", 22.34], ["music", 18.54]], null, [["music", 17.42], ["noise", 7.74], ["theremin", 7.29]], null, null, null, null, [["hum", 51.46], ["throbbing", 29.83], ["mains hum", 15.1]], null, null, [["frog", 20.37], ["speech", 15.78], ["whack, thwack", 7.69]], null, null, null, null, [["speech", 63.61], ["sidetone", 12.36], ["radio", 3.88]], null, null, null, null, [["whack, thwack", 34.81], ["hum", 21.66], ["throbbing", 6.63]], null, null, null], "duration": [2.51, 4.51, 1.4, 2.15, 0.81, 0.2, 1.36, 0.94, 9.73, 65.19, 1.03, 3.57, 0.61, 1.01, 1.25, -0.04, 2.02, 0.98, 0.62, 0.74, -0.01, 5.21, 0.52, 0.63, 0.17]} \ No newline at end of file diff --git a/annotations_1/DSaBwTpdfkQ_filtered.json b/annotations_1/DSaBwTpdfkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11e3eaf19e9893d3162a141780ba7c06a16e8966 --- /dev/null +++ b/annotations_1/DSaBwTpdfkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.7], [13.0, 13.71], [15.0, 19.5], [20.0, 73.52], [75.0, 77.13], [77.0, 79.42]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 79.07, 0.0, 41.93, 44.75], "audiomae_on_audioset": [null, null, null, null, [["music", 61.65], ["didgeridoo", 9.77], ["musical instrument", 3.6]], [["music", 64.11], ["gong", 8.6], ["ambient music", 5.97]]], "duration": [1.7, 0.71, 4.5, 53.52, 2.13, 2.42]} \ No newline at end of file diff --git a/annotations_1/DSyCwx2AlQc_filtered.json b/annotations_1/DSyCwx2AlQc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e4f19f2e179bf1b2bec7dfa1a77847f01bee349 --- /dev/null +++ b/annotations_1/DSyCwx2AlQc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.82], [5.0, 10.5], [15.0, 24.31], [25.0, 80.28], [82.0, 86.68], [90.0, 122.01]], "keep_status": [true, false, true, false, false, false], "silence_prob": [32.23, 31.03, 32.08, 0.0, 30.65, 0.0], "audiomae_on_audioset": [[["speech", 10.31], ["electric shaver, electric razor", 8.22], ["mains hum", 6.28]], [["mains hum", 37.42], ["hum", 24.9], ["speech", 14.03]], [["vehicle", 23.59], ["music", 19.6], ["aircraft", 8.03]], null, [["music", 51.6], ["throbbing", 12.82], ["hum", 6.87]], null], "duration": [2.82, 5.5, 9.31, 55.28, 4.68, 32.01]} \ No newline at end of file diff --git a/annotations_1/DTWggpNq1a0_filtered.json b/annotations_1/DTWggpNq1a0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9be388107b2c861d7bfe06544fec25d148434f34 --- /dev/null +++ b/annotations_1/DTWggpNq1a0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 30.27], [31.0, 35.99], [37.0, 41.61], [42.0, 44.15], [46.0, 46.52], [48.0, 48.59], [51.0, 52.71], [54.0, 65.99], [67.0, 69.5], [70.0, 97.16]], "keep_status": [true, true, true, true, false, false, false, false, true, false], "silence_prob": [30.93, 29.59, 29.71, 38.0, 0.0, 0.0, 0.0, 30.91, 30.74, 29.46], "audiomae_on_audioset": [[["music", 59.62], ["guitar", 2.7], ["synthesizer", 2.53]], [["music", 37.63], ["speech", 22.37], ["theremin", 6.54]], [["music", 44.13], ["guitar", 14.52], ["musical instrument", 7.49]], [["music", 41.84], ["effects unit", 5.04], ["guitar", 4.95]], null, null, null, [["music", 85.13], ["guitar", 1.89], ["musical instrument", 1.48]], [["music", 53.59], ["musical instrument", 6.21], ["guitar", 5.28]], [["music", 49.15], ["theremin", 26.9], ["harmonic", 2.72]]], "duration": [5.27, 4.99, 4.61, 2.15, 0.52, 0.59, 1.71, 11.99, 2.5, 27.16]} \ No newline at end of file diff --git a/annotations_1/DTdDzcr-7UM_filtered.json b/annotations_1/DTdDzcr-7UM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f2601132e0cefb9991e6a9ad9e29df93b5d76c9 --- /dev/null +++ b/annotations_1/DTdDzcr-7UM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.86], [10.0, 12.23], [13.0, 13.56], [17.0, 22.52], [29.0, 29.52], [32.0, 35.14], [36.0, 36.59], [37.0, 37.86], [39.0, 39.87], [43.0, 62.87], [63.0, 64.54], [67.0, 67.68], [69.0, 71.15], [73.0, 73.5], [75.0, 78.81], [83.0, 85.67], [89.0, 91.94]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.62, 66.03, 0.0, 74.6, 0.0, 66.63, 0.0, 0.0, 0.0, 57.72, 0.0, 0.0, 95.91, 0.0, 92.97, 97.92, 100.0], "audiomae_on_audioset": [[["speech", 39.18], ["whimper", 15.14], ["crying, sobbing", 11.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.86, 2.23, 0.56, 5.52, 0.52, 3.14, 0.59, 0.86, 0.87, 19.87, 1.54, 0.68, 2.15, 0.5, 3.81, 2.67, 2.94]} \ No newline at end of file diff --git a/annotations_1/DTexn9N2HMI_filtered.json b/annotations_1/DTexn9N2HMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e9eef282ad7f01ab131d7df4270b92097ef11db --- /dev/null +++ b/annotations_1/DTexn9N2HMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.62], [9.0, 9.37], [31.0, 31.63], [34.0, 41.2], [43.0, 45.03], [47.0, 48.42], [51.0, 54.53], [56.0, 58.58], [60.0, 61.45], [64.0, 79.89], [81.0, 92.74], [93.0, 108.19], [110.0, 116.67], [119.0, 123.13], [124.0, 124.14], [125.0, 125.81], [129.0, 132.87], [134.0, 137.29], [140.0, 141.27], [143.0, 158.45]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 74.92, 91.81, 0.0, 66.76, 77.87, 0.0, 32.76, 39.47, 31.12, 85.17, 75.39, 0.0, 0.0, 87.0, 81.0, 0.0, 85.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 26.28], ["music", 9.14], ["hum", 5.39]], [["didgeridoo", 21.58], ["music", 14.88], ["animal", 8.94]], [["animal", 37.23], ["dog", 31.56], ["domestic animals, pets", 13.56]], null, null, null, null, null, null, null, null], "duration": [0.62, 0.37, 0.63, 7.2, 2.03, 1.42, 3.53, 2.58, 1.45, 15.89, 11.74, 15.19, 6.67, 4.13, 0.14, 0.81, 3.87, 3.29, 1.27, 15.45]} \ No newline at end of file diff --git a/annotations_1/DUjB9LTtzGg_filtered.json b/annotations_1/DUjB9LTtzGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0016831a60abf7cbf916619083d3775448f88dd --- /dev/null +++ b/annotations_1/DUjB9LTtzGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 30.33], [34.0, 43.04], [51.0, 58.5], [60.0, 60.47], [65.0, 65.58], [67.0, 67.34], [72.0, 76.72], [84.0, 84.69], [90.0, 93.23], [95.0, 100.03], [102.0, 111.92], [120.0, 119.96], [123.0, 128.9], [129.0, 129.44], [129.0, 129.9], [136.0, 137.02], [144.0, 150.74], [154.0, 154.31], [158.0, 163.02]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, false, false, true], "silence_prob": [30.42, 29.99, 29.51, 0.0, 0.0, 0.0, 29.28, 0.0, 31.17, 30.36, 29.86, 0.0, 29.48, 0.0, 0.0, 0.0, 29.45, 0.0, 30.28], "audiomae_on_audioset": [[["music", 74.44], ["electronic music", 4.05], ["dubstep", 3.44]], [["music", 83.84], ["funny music", 2.21], ["boing", 0.84]], [["music", 78.71], ["throbbing", 2.6], ["funny music", 1.66]], null, null, null, [["music", 65.15], ["rock and roll", 2.71], ["electronic music", 1.66]], null, [["music", 60.74], ["reggae", 3.47], ["electronic music", 2.61]], [["music", 79.21], ["throbbing", 2.39], ["sampler", 2.16]], [["music", 82.94], ["funny music", 3.74], ["male singing", 0.96]], null, [["music", 57.38], ["throbbing", 6.15], ["synthetic singing", 4.18]], null, null, null, [["music", 80.01], ["rock and roll", 1.87], ["reggae", 1.28]], null, [["sidetone", 27.89], ["music", 26.85], ["frog", 12.62]]], "duration": [3.33, 9.04, 7.5, 0.47, 0.58, 0.34, 4.72, 0.69, 3.23, 5.03, 9.92, -0.04, 5.9, 0.44, 0.9, 1.02, 6.74, 0.31, 5.02]} \ No newline at end of file diff --git a/annotations_1/DV5EHuaa23c_filtered.json b/annotations_1/DV5EHuaa23c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9410484b675efd33d3b289e7d55a1a75cf054d4c --- /dev/null +++ b/annotations_1/DV5EHuaa23c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.5], [24.0, 25.91], [28.0, 28.07], [31.0, 31.31], [35.0, 35.97], [37.0, 40.59], [42.0, 45.76], [48.0, 48.51], [49.0, 50.48], [51.0, 53.1], [55.0, 55.14], [56.0, 57.01], [60.0, 60.54], [62.0, 61.7], [66.0, 66.48], [69.0, 73.14], [77.0, 85.95], [86.0, 86.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 89.19, 91.47, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 84.98, 54.3, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.91, 0.07, 0.31, 0.97, 3.59, 3.76, 0.51, 1.48, 2.1, 0.14, 1.01, 0.54, -0.3, 0.48, 4.14, 8.95, 0.44]} \ No newline at end of file diff --git a/annotations_1/DVA8vzEbm9Y_filtered.json b/annotations_1/DVA8vzEbm9Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a84306d9f1e3bdf9bcfa729f22d9ef74ddb398b --- /dev/null +++ b/annotations_1/DVA8vzEbm9Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.22], [15.0, 15.96], [17.0, 16.9], [18.0, 18.3], [20.0, 21.96], [25.0, 45.35], [51.0, 52.42], [57.0, 85.53], [91.0, 92.01], [93.0, 95.08], [97.0, 96.97], [97.0, 98.49], [99.0, 102.73], [104.0, 104.75], [116.0, 118.15], [118.0, 119.75], [121.0, 122.22], [123.0, 124.58], [126.0, 127.85], [129.0, 129.76], [130.0, 132.49], [133.0, 137.64], [140.0, 140.73], [144.0, 145.15], [147.0, 147.11], [150.0, 150.63], [151.0, 152.22], [153.0, 162.23], [163.0, 164.02]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [41.03, 0.0, 0.0, 0.0, 0.0, 32.42, 0.0, 34.49, 0.0, 91.64, 0.0, 0.0, 66.03, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 0.0, 70.3, 37.13, 0.0, 0.0, 0.0, 0.0, 0.0, 47.58, 0.0], "audiomae_on_audioset": [[["music", 43.87], ["throbbing", 14.35], ["speech", 10.64]], null, null, null, null, [["music", 77.63], ["livestock, farm animals, working animals", 5.89], ["bleat", 3.08]], null, [["music", 56.93], ["speech", 11.27], ["synthesizer", 4.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.54], ["crushing", 8.31], ["fart", 6.6]], null, null, null, null, null, [["hum", 38.6], ["mains hum", 20.92], ["speech", 18.24]], null], "duration": [3.22, 0.96, -0.1, 0.3, 1.96, 20.35, 1.42, 28.53, 1.01, 2.08, -0.03, 1.49, 3.73, 0.75, 2.15, 1.75, 1.22, 1.58, 1.85, 0.76, 2.49, 4.64, 0.73, 1.15, 0.11, 0.63, 1.22, 9.23, 1.02]} \ No newline at end of file diff --git a/annotations_1/DVQQY4-us8k_filtered.json b/annotations_1/DVQQY4-us8k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2f49182365df850cc04fca54e1e172be9c326d7 --- /dev/null +++ b/annotations_1/DVQQY4-us8k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.03], [4.0, 3.91], [4.0, 4.48], [18.0, 18.22], [18.0, 20.85], [21.0, 24.07], [33.0, 32.98], [36.0, 36.29], [40.0, 40.53], [46.0, 46.7], [47.0, 50.31], [53.0, 53.96], [55.0, 55.51], [56.0, 58.01], [62.0, 62.38], [65.0, 68.45], [71.0, 71.46], [72.0, 72.86], [83.0, 85.24], [87.0, 88.06], [89.0, 89.36], [90.0, 93.01], [106.0, 111.87], [117.0, 117.64], [119.0, 120.07], [123.0, 122.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 79.76, 34.33, 0.0, 0.0, 0.0, 0.0, 34.71, 0.0, 0.0, 64.07, 0.0, 84.07, 0.0, 0.0, 30.52, 0.0, 0.0, 30.66, 33.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 42.01], ["throbbing", 27.43], ["music", 3.94]], null, null, null, null, [["speech", 29.29], ["music", 26.44], ["knock", 13.3]], null, null, null, null, null, null, null, [["music", 54.01], ["speech", 23.71], ["drum machine", 3.57]], null, null, [["speech", 63.28], ["boing", 10.2], ["music", 6.89]], [["music", 15.38], ["fart", 15.31], ["whack, thwack", 9.82]], null, null, null], "duration": [0.03, -0.09, 0.48, 0.22, 2.85, 3.07, -0.02, 0.29, 0.53, 0.7, 3.31, 0.96, 0.51, 2.01, 0.38, 3.45, 0.46, 0.86, 2.24, 1.06, 0.36, 3.01, 5.87, 0.64, 1.07, -0.02]} \ No newline at end of file diff --git a/annotations_1/DVR6p7Iopec_filtered.json b/annotations_1/DVR6p7Iopec_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1197b0ec30cb01ec5cca3f2f1b22ae448e0dc67 --- /dev/null +++ b/annotations_1/DVR6p7Iopec_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 58.63], [59.0, 81.06], [82.0, 113.26]], "keep_status": [false, false, false], "silence_prob": [34.61, 32.66, 0.0], "audiomae_on_audioset": [[["music", 41.45], ["speech", 19.47], ["theremin", 16.91]], [["music", 54.57], ["speech", 17.85], ["bow-wow", 3.11]], null], "duration": [21.63, 22.06, 31.26]} \ No newline at end of file diff --git a/annotations_1/DV_eqkGxAa4_filtered.json b/annotations_1/DV_eqkGxAa4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84bde80220cbd73edaf7990a55b5bd5da3905989 --- /dev/null +++ b/annotations_1/DV_eqkGxAa4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.22], [15.0, 25.1], [29.0, 31.58], [35.0, 35.41], [36.0, 46.06], [49.0, 51.31], [56.0, 67.86], [71.0, 71.31], [73.0, 75.51], [82.0, 85.46], [86.0, 87.15], [88.0, 90.63], [93.0, 93.41], [95.0, 96.57], [98.0, 99.12], [100.0, 134.5]], "keep_status": [false, true, false, false, true, true, true, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 30.69, 56.93, 0.0, 33.76, 29.91, 35.2, 0.0, 48.19, 56.1, 0.0, 32.83, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["eruption", 28.42], ["speech", 24.14], ["explosion", 16.04]], null, null, [["speech", 50.02], ["explosion", 11.98], ["gunshot, gunfire", 5.43]], [["noise", 16.0], ["radio", 15.25], ["cacophony", 7.48]], [["speech", 20.98], ["hum", 11.01], ["vehicle", 10.13]], null, [["speech", 52.58], ["fly, housefly", 7.74], ["bee, wasp, etc.", 6.84]], null, null, [["speech", 42.74], ["static", 12.49], ["hum", 7.79]], null, null, null, null], "duration": [0.22, 10.1, 2.58, 0.41, 10.06, 2.31, 11.86, 0.31, 2.51, 3.46, 1.15, 2.63, 0.41, 1.57, 1.12, 34.5]} \ No newline at end of file diff --git a/annotations_1/DX1p8C_FuxU_filtered.json b/annotations_1/DX1p8C_FuxU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a43dc70f3125480dbc1dfb7b835aa6855a888c9 --- /dev/null +++ b/annotations_1/DX1p8C_FuxU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.42], [12.0, 15.85], [16.0, 17.04], [22.0, 22.28], [24.0, 27.48], [28.0, 29.54], [30.0, 31.67], [32.0, 48.96], [50.0, 50.8], [51.0, 53.2], [54.0, 55.0], [56.0, 60.37], [61.0, 64.42], [66.0, 72.0], [74.0, 77.13], [78.0, 82.48], [83.0, 89.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [78.89, 87.37, 0.0, 0.0, 64.41, 0.0, 0.0, 93.76, 0.0, 69.74, 0.0, 60.23, 56.86, 52.05, 56.7, 51.88, 61.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.42, 3.85, 1.04, 0.28, 3.48, 1.54, 1.67, 16.96, 0.8, 2.2, 1.0, 4.37, 3.42, 6.0, 3.13, 4.48, 6.29]} \ No newline at end of file diff --git a/annotations_1/DXFN60x3vP4_filtered.json b/annotations_1/DXFN60x3vP4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86a6842936a29bcafa95e481f9994b943937c95c --- /dev/null +++ b/annotations_1/DXFN60x3vP4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.61], [20.0, 23.08], [24.0, 25.02], [49.0, 49.42], [50.0, 50.72], [52.0, 54.6], [60.0, 61.03], [65.0, 65.99], [71.0, 72.74], [80.0, 80.27], [91.0, 92.85], [95.0, 95.71], [100.0, 100.68], [102.0, 109.29], [116.0, 120.38], [129.0, 129.42], [130.0, 136.73], [137.0, 136.95], [138.0, 138.08], [143.0, 152.17], [152.0, 152.2], [154.0, 154.89], [156.0, 159.39], [160.0, 162.16], [163.0, 172.29], [173.0, 174.26]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 32.73, 0.0, 0.0, 0.0, 31.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.32, 29.84, 0.0, 29.95, 0.0, 0.0, 30.25, 0.0, 0.0, 30.68, 29.58, 30.34, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 27.73], ["cattle, bovinae", 24.49], ["moo", 15.17]], null, null, null, [["hum", 24.5], ["mains hum", 24.08], ["throbbing", 11.25]], null, null, null, null, null, null, null, [["music", 43.66], ["throbbing", 35.74], ["hum", 5.64]], [["music", 59.48], ["speech", 22.34], ["throbbing", 1.75]], null, [["music", 42.62], ["throbbing", 16.28], ["boing", 6.61]], null, null, [["animal", 28.37], ["music", 26.19], ["howl", 11.63]], null, null, [["music", 38.52], ["theremin", 37.61], ["whale vocalization", 3.05]], [["music", 32.33], ["animal", 18.33], ["domestic animals, pets", 10.24]], [["music", 65.02], ["speech", 22.12], ["breaking", 2.23]], null], "duration": [0.61, 3.08, 1.02, 0.42, 0.72, 2.6, 1.03, 0.99, 1.74, 0.27, 1.85, 0.71, 0.68, 7.29, 4.38, 0.42, 6.73, -0.05, 0.08, 9.17, 0.2, 0.89, 3.39, 2.16, 9.29, 1.26]} \ No newline at end of file diff --git a/annotations_1/DYAdSce8Rd0_filtered.json b/annotations_1/DYAdSce8Rd0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edd3c83c88f29713088ec88dad8d912c0be8d3fd --- /dev/null +++ b/annotations_1/DYAdSce8Rd0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.23], [5.0, 6.0], [14.0, 15.58], [29.0, 29.25], [33.0, 35.63], [38.0, 38.89], [39.0, 40.02], [40.0, 41.34], [44.0, 45.0], [51.0, 51.98], [53.0, 53.6], [56.0, 62.9], [65.0, 65.8], [76.0, 76.2], [78.0, 78.85], [89.0, 89.28], [91.0, 92.5], [95.0, 102.07], [106.0, 106.34], [107.0, 108.82], [112.0, 112.95], [114.0, 114.51], [116.0, 116.13], [117.0, 117.49], [118.0, 119.87]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.77, 0.0, 0.0, 0.0, 0.0, 0.0, 31.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 40.78], ["speech", 16.13], ["synthesizer", 4.82]], null, null, null, null, null, null, [["music", 65.84], ["drum machine", 18.73], ["electronic music", 5.09]], null, null, null, null, null, [["music", 79.23], ["musical instrument", 2.07], ["scrape", 1.91]], null, null, null, null, null, null, null], "duration": [0.23, 1.0, 1.58, 0.25, 2.63, 0.89, 1.02, 1.34, 1.0, 0.98, 0.6, 6.9, 0.8, 0.2, 0.85, 0.28, 1.5, 7.07, 0.34, 1.82, 0.95, 0.51, 0.13, 0.49, 1.87]} \ No newline at end of file diff --git a/annotations_1/DYPR82c0v00_filtered.json b/annotations_1/DYPR82c0v00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f1603598808e53eebee5ef1c5ebd5a2ebf0c1fe --- /dev/null +++ b/annotations_1/DYPR82c0v00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.91], [13.0, 13.73], [14.0, 14.61], [16.0, 17.74], [20.0, 20.22], [23.0, 23.16], [27.0, 27.55], [31.0, 32.73], [34.0, 33.99], [35.0, 35.36], [38.0, 40.05], [41.0, 41.77], [43.0, 43.58], [48.0, 55.16], [66.0, 66.51], [88.0, 88.84], [89.0, 89.88], [91.0, 91.34], [93.0, 93.21], [94.0, 95.5], [96.0, 96.75], [98.0, 98.88], [100.0, 99.74], [106.0, 109.16], [110.0, 112.85], [113.0, 113.56], [115.0, 118.02], [119.0, 127.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 90.6, 0.0, 63.1, 72.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.91, 0.73, 0.61, 1.74, 0.22, 0.16, 0.55, 1.73, -0.01, 0.36, 2.05, 0.77, 0.58, 7.16, 0.51, 0.84, 0.88, 0.34, 0.21, 1.5, 0.75, 0.88, -0.26, 3.16, 2.85, 0.56, 3.02, 8.16]} \ No newline at end of file diff --git a/annotations_1/DZlM8Wm7OKY_filtered.json b/annotations_1/DZlM8Wm7OKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..886a6233d01cb8351b22d0a698df21f39a57180a --- /dev/null +++ b/annotations_1/DZlM8Wm7OKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 21.22], [22.0, 28.26], [31.0, 34.38], [36.0, 37.35], [42.0, 42.52], [47.0, 49.65], [56.0, 55.9], [68.0, 68.61], [70.0, 69.82], [84.0, 86.85], [89.0, 89.83], [91.0, 91.81], [93.0, 94.98], [103.0, 103.65], [159.0, 165.55], [180.0, 180.47], [184.0, 184.45]], "keep_status": [false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.53, 31.98, 40.93, 0.0, 0.0, 32.45, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 0.0, 0.0, 46.57, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 59.77], ["music", 9.45], ["vehicle", 2.82]], [["speech", 36.1], ["music", 9.51], ["buzz", 4.96]], [["animal", 20.51], ["livestock, farm animals, working animals", 17.95], ["cattle, bovinae", 17.59]], null, null, [["speech", 27.24], ["radio", 13.82], ["music", 9.28]], null, null, null, null, null, null, null, null, [["telephone bell ringing", 37.51], ["speech", 35.87], ["telephone", 15.66]], null, null], "duration": [4.22, 6.26, 3.38, 1.35, 0.52, 2.65, -0.1, 0.61, -0.18, 2.85, 0.83, 0.81, 1.98, 0.65, 6.55, 0.47, 0.45]} \ No newline at end of file diff --git a/annotations_1/D_FRoxgOUNA_filtered.json b/annotations_1/D_FRoxgOUNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45514e9a200cc0f8057783f975fdd84961845c4b --- /dev/null +++ b/annotations_1/D_FRoxgOUNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [5.0, 7.79], [9.0, 9.42], [11.0, 12.48], [15.0, 16.68], [20.0, 21.2], [28.0, 28.61], [29.0, 28.7], [40.0, 40.64], [54.0, 54.01], [58.0, 59.58], [60.0, 60.99], [66.0, 67.42], [68.0, 84.96], [90.0, 93.23], [95.0, 97.21], [99.0, 100.58], [112.0, 112.58], [122.0, 121.68], [131.0, 131.38], [135.0, 144.68], [155.0, 155.46], [156.0, 160.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 61.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.49, 75.55, 99.65, 0.0, 0.0, 0.0, 0.0, 81.71, 0.0, 60.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 86.59], ["musical instrument", 2.09], ["guitar", 1.08]], null, null, null, null, null, null, null, null, null], "duration": [1.17, 2.79, 0.42, 1.48, 1.68, 1.2, 0.61, -0.3, 0.64, 0.01, 1.58, 0.99, 1.42, 16.96, 3.23, 2.21, 1.58, 0.58, -0.32, 0.38, 9.68, 0.46, 4.74]} \ No newline at end of file diff --git a/annotations_1/D_N9S0bAiWI_filtered.json b/annotations_1/D_N9S0bAiWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a8c4bde6f914110c52ac1671a0ff85f99a95f66 --- /dev/null +++ b/annotations_1/D_N9S0bAiWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.49], [12.0, 30.52], [31.0, 31.46], [32.0, 31.85], [36.0, 46.09], [49.0, 77.3], [80.0, 80.79], [81.0, 82.61], [84.0, 104.4], [106.0, 112.83], [115.0, 122.07], [124.0, 125.36]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [29.84, 31.02, 0.0, 0.0, 30.42, 30.09, 0.0, 0.0, 30.13, 31.28, 29.9, 0.0], "audiomae_on_audioset": [[["speech", 25.58], ["music", 13.99], ["noise", 8.75]], [["mains hum", 42.59], ["hum", 25.84], ["music", 11.93]], null, null, [["cattle, bovinae", 31.09], ["moo", 26.52], ["livestock, farm animals, working animals", 25.68]], [["music", 24.74], ["mains hum", 22.89], ["hum", 19.16]], null, null, [["music", 33.78], ["hum", 23.26], ["mains hum", 18.95]], [["hum", 33.8], ["music", 23.22], ["throbbing", 20.41]], [["hum", 48.11], ["mains hum", 32.91], ["throbbing", 12.3]], null], "duration": [8.49, 18.52, 0.46, -0.15, 10.09, 28.3, 0.79, 1.61, 20.4, 6.83, 7.07, 1.36]} \ No newline at end of file diff --git a/annotations_1/Da02cZG3NDI_filtered.json b/annotations_1/Da02cZG3NDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3199d3c8cf2e2065813d8307a56f06b41808b041 --- /dev/null +++ b/annotations_1/Da02cZG3NDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.15], [15.0, 15.11], [17.0, 18.64], [20.0, 21.24], [23.0, 24.07], [26.0, 26.59], [31.0, 33.96], [36.0, 36.93], [39.0, 40.39], [42.0, 43.34], [45.0, 46.5], [48.0, 49.1], [51.0, 52.42], [57.0, 58.01], [60.0, 61.16], [63.0, 63.81], [66.0, 66.9], [69.0, 70.17], [72.0, 73.11], [75.0, 75.76], [79.0, 80.54], [83.0, 84.43], [86.0, 88.33], [91.0, 92.2], [94.0, 95.2], [97.0, 97.98], [99.0, 100.87], [103.0, 103.59], [105.0, 107.2], [108.0, 110.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.97, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.15, 0.11, 1.64, 1.24, 1.07, 0.59, 2.96, 0.93, 1.39, 1.34, 1.5, 1.1, 1.42, 1.01, 1.16, 0.81, 0.9, 1.17, 1.11, 0.76, 1.54, 1.43, 2.33, 1.2, 1.2, 0.98, 1.87, 0.59, 2.2, 2.39]} \ No newline at end of file diff --git a/annotations_1/DaDZptGm6nI_filtered.json b/annotations_1/DaDZptGm6nI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25363ed64774d5dd25686686b1d0ef9aefc52c49 --- /dev/null +++ b/annotations_1/DaDZptGm6nI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.34], [14.0, 14.72], [15.0, 17.05], [22.0, 22.52], [30.0, 29.81], [38.0, 37.88], [40.0, 40.31], [45.0, 46.16], [47.0, 47.61], [53.0, 52.71], [64.0, 66.16], [93.0, 93.18], [95.0, 96.33], [98.0, 98.96], [103.0, 103.2], [106.0, 105.8], [129.0, 133.25], [134.0, 135.11], [150.0, 154.2], [159.0, 163.07], [164.0, 166.04], [166.0, 168.52], [170.0, 170.53], [172.0, 173.2], [175.0, 176.76], [177.0, 185.57], [187.0, 188.01], [188.0, 189.92], [192.0, 194.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.1, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 91.98, 99.68, 99.96, 97.22, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 78.21], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.34, 0.72, 2.05, 0.52, -0.19, -0.12, 0.31, 1.16, 0.61, -0.29, 2.16, 0.18, 1.33, 0.96, 0.2, -0.2, 4.25, 1.11, 4.2, 4.07, 2.04, 2.52, 0.53, 1.2, 1.76, 8.57, 1.01, 1.92, 2.19]} \ No newline at end of file diff --git a/annotations_1/DaWi5EoJVGA_filtered.json b/annotations_1/DaWi5EoJVGA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5e02df625fb4ea425d3ff128167174c2ca1f3ba --- /dev/null +++ b/annotations_1/DaWi5EoJVGA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.02], [6.0, 6.03], [11.0, 11.47], [15.0, 15.6], [17.0, 17.69], [18.0, 21.17], [23.0, 23.7], [24.0, 25.0], [28.0, 29.3], [30.0, 30.08], [33.0, 33.51], [35.0, 37.27], [38.0, 38.65], [41.0, 42.18], [44.0, 44.54], [54.0, 59.64], [61.0, 62.34], [65.0, 66.45], [70.0, 70.46], [74.0, 74.98], [80.0, 80.35], [84.0, 84.64], [90.0, 90.83], [93.0, 93.53], [98.0, 98.34], [99.0, 100.08], [102.0, 102.61], [104.0, 105.04], [112.0, 113.12], [115.0, 115.1], [118.0, 118.15], [121.0, 121.47], [125.0, 125.32], [129.0, 130.4], [135.0, 135.43], [138.0, 139.26], [149.0, 149.3], [154.0, 155.58], [157.0, 157.18], [162.0, 162.26], [164.0, 165.03], [167.0, 167.81]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.45, 0.0, 0.0, 0.0, 0.0, 55.04, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7, 0.0, 0.0, 0.0, 47.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.93], ["theremin", 7.85], ["sitar", 5.72]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.89], ["hum", 5.73], ["theremin", 4.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.02, 0.03, 0.47, 0.6, 0.69, 3.17, 0.7, 1.0, 1.3, 0.08, 0.51, 2.27, 0.65, 1.18, 0.54, 5.64, 1.34, 1.45, 0.46, 0.98, 0.35, 0.64, 0.83, 0.53, 0.34, 1.08, 0.61, 1.04, 1.12, 0.1, 0.15, 0.47, 0.32, 1.4, 0.43, 1.26, 0.3, 1.58, 0.18, 0.26, 1.03, 0.81]} \ No newline at end of file diff --git a/annotations_1/DbORPqtzyx4_filtered.json b/annotations_1/DbORPqtzyx4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca239d8ff29a19a92ae8fa06ffa8b2accd08d2a3 --- /dev/null +++ b/annotations_1/DbORPqtzyx4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 42.99], [44.0, 50.06], [51.0, 52.14], [53.0, 60.59], [62.0, 115.89], [117.0, 147.51]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 32.58, 0.0, 30.6, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 66.94], ["synthesizer", 5.96], ["throbbing", 3.96]], null, [["music", 53.61], ["fart", 17.87], ["quack", 4.57]], null, null], "duration": [39.99, 6.06, 1.14, 7.59, 53.89, 30.51]} \ No newline at end of file diff --git a/annotations_1/Dc-fBk3yoqs_filtered.json b/annotations_1/Dc-fBk3yoqs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e99cf21eb478759bae37c52d91a8cc2fa4b57b4 --- /dev/null +++ b/annotations_1/Dc-fBk3yoqs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.71], [21.0, 21.95], [24.0, 48.39], [53.0, 53.52], [55.0, 56.07], [57.0, 69.96], [72.0, 77.57], [81.0, 85.23], [87.0, 90.07], [92.0, 92.53], [96.0, 97.44], [99.0, 99.2], [105.0, 105.17], [106.0, 106.62], [113.0, 113.98], [114.0, 114.03], [115.0, 130.44], [131.0, 140.41], [141.0, 141.72], [151.0, 155.44], [156.0, 156.78], [163.0, 163.46], [165.0, 183.42], [191.0, 192.16], [192.0, 193.89], [195.0, 195.57], [197.0, 198.21]], "keep_status": [false, false, true, false, false, false, true, true, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.52, 0.0, 0.0, 33.78, 32.18, 30.35, 30.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.3, 30.55, 0.0, 30.06, 0.0, 0.0, 30.26, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 51.76], ["speech", 8.58], ["boing", 6.69]], null, null, [["speech", 75.71], ["fireworks", 4.68], ["electric shaver, electric razor", 2.03]], [["speech", 43.56], ["explosion", 17.57], ["gunshot, gunfire", 8.68]], [["speech", 36.69], ["sound effect", 17.95], ["whoosh, swoosh, swish", 6.96]], [["gunshot, gunfire", 32.82], ["speech", 24.26], ["explosion", 7.46]], null, null, null, null, null, null, null, [["music", 53.82], ["hum", 10.54], ["angry music", 8.9]], [["music", 41.05], ["speech", 11.96], ["throbbing", 8.76]], null, [["music", 55.2], ["speech", 16.28], ["sidetone", 6.89]], null, null, [["music", 69.06], ["cacophony", 6.9], ["throbbing", 4.81]], null, null, null, null], "duration": [0.71, 0.95, 24.39, 0.52, 1.07, 12.96, 5.57, 4.23, 3.07, 0.53, 1.44, 0.2, 0.17, 0.62, 0.98, 0.03, 15.44, 9.41, 0.72, 4.44, 0.78, 0.46, 18.42, 1.16, 1.89, 0.57, 1.21]} \ No newline at end of file diff --git a/annotations_1/DcpIpj7RbxQ_filtered.json b/annotations_1/DcpIpj7RbxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba42bec16b66ef6e241a953a837c046554a42594 --- /dev/null +++ b/annotations_1/DcpIpj7RbxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [34.0, 34.5], [46.0, 46.87], [48.0, 48.0], [53.0, 53.84], [71.0, 71.27], [93.0, 94.39], [119.0, 123.57]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.24], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["cattle, bovinae", 31.88], ["moo", 28.64], ["music", 12.62]]], "duration": [0.93, 0.5, 0.87, 0.0, 0.84, 0.27, 1.39, 4.57]} \ No newline at end of file diff --git a/annotations_1/Dd0f82f8ymk_filtered.json b/annotations_1/Dd0f82f8ymk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..750866d47bef20a73ca65881eb862b0b93c1066f --- /dev/null +++ b/annotations_1/Dd0f82f8ymk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 46.94], [48.0, 60.96], [62.0, 62.5], [64.0, 64.91], [67.0, 67.39], [68.0, 68.42], [70.0, 82.56], [86.0, 106.61], [110.0, 112.09], [112.0, 114.12], [115.0, 125.27], [128.0, 131.36], [132.0, 133.27], [135.0, 135.99], [137.0, 137.2], [138.0, 139.16]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.02, 0.0, 0.0, 0.0, 0.0, 36.1, 41.85, 93.45, 80.46, 38.87, 44.07, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 34.04], ["mains hum", 13.23], ["hum", 11.02]], null, null, null, null, [["hum", 28.45], ["mains hum", 20.51], ["electric shaver, electric razor", 7.41]], [["fly, housefly", 64.22], ["mosquito", 11.88], ["insect", 11.51]], null, null, [["hum", 49.78], ["mains hum", 35.05], ["music", 5.0]], [["speech", 66.93], ["music", 4.91], ["hum", 2.96]], null, null, null, null], "duration": [0.94, 12.96, 0.5, 0.91, 0.39, 0.42, 12.56, 20.61, 2.09, 2.12, 10.27, 3.36, 1.27, 0.99, 0.2, 1.16]} \ No newline at end of file diff --git a/annotations_1/DdNfSuTpDbA_filtered.json b/annotations_1/DdNfSuTpDbA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af4fb43c34841413ed34eb09ea9143e5de28bcf2 --- /dev/null +++ b/annotations_1/DdNfSuTpDbA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.78], [9.0, 10.0], [11.0, 11.31], [15.0, 15.94], [21.0, 24.46], [29.0, 29.94], [31.0, 31.16], [34.0, 33.99], [36.0, 37.76], [38.0, 40.42], [42.0, 56.3], [60.0, 60.88], [66.0, 73.2], [74.0, 75.25], [76.0, 78.17], [79.0, 82.95], [84.0, 85.36], [93.0, 93.78], [97.0, 97.21], [100.0, 101.53], [102.0, 102.47], [103.0, 103.33]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 41.89, 0.0, 0.0, 0.0, 0.0, 47.16, 83.52, 0.0, 31.06, 0.0, 99.99, 79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 86.03], ["musical instrument", 2.24], ["synthesizer", 2.21]], null, null, null, null, [["keyboard (musical)", 26.04], ["music", 22.14], ["synthesizer", 12.93]], null, null, [["whack, thwack", 22.3], ["sound effect", 18.09], ["fart", 13.29]], null, null, null, null, null, null, null, null, null], "duration": [0.78, 1.0, 0.31, 0.94, 3.46, 0.94, 0.16, -0.01, 1.76, 2.42, 14.3, 0.88, 7.2, 1.25, 2.17, 3.95, 1.36, 0.78, 0.21, 1.53, 0.47, 0.33]} \ No newline at end of file diff --git a/annotations_1/DdpMl3_vPmQ_filtered.json b/annotations_1/DdpMl3_vPmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de8d68ac8d101a9252b941cdb537570248492581 --- /dev/null +++ b/annotations_1/DdpMl3_vPmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 54.18], [56.0, 56.44], [57.0, 77.25], [79.0, 82.78], [83.0, 83.94], [84.0, 89.53], [90.0, 89.7]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [30.66, 0.0, 31.1, 31.36, 0.0, 31.07, 0.0], "audiomae_on_audioset": [[["music", 83.12], ["didgeridoo", 3.61], ["echo", 1.13]], null, [["music", 82.85], ["brass instrument", 3.5], ["trombone", 3.18]], [["music", 43.72], ["cello", 8.4], ["musical instrument", 5.82]], null, [["music", 71.68], ["musical instrument", 3.77], ["music of latin america", 2.5]], null], "duration": [24.18, 0.44, 20.25, 3.78, 0.94, 5.53, -0.3]} \ No newline at end of file diff --git a/annotations_1/Ded2FG1gA0c_filtered.json b/annotations_1/Ded2FG1gA0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7184a405f8b2c272e2760280ef3447750a476a03 --- /dev/null +++ b/annotations_1/Ded2FG1gA0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 26.55], [27.0, 27.16], [28.0, 27.94], [28.0, 28.68], [31.0, 34.62], [37.0, 37.71], [41.0, 44.95], [49.0, 55.46], [60.0, 99.62], [100.0, 101.39], [108.0, 109.44], [111.0, 111.47], [114.0, 116.83], [119.0, 121.41], [123.0, 123.9], [125.0, 126.5], [128.0, 129.37], [131.0, 132.76]], "keep_status": [false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.08, 0.0, 0.0, 0.0, 28.16, 0.0, 28.29, 29.34, 0.0, 0.0, 0.0, 0.0, 54.9, 83.16, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 41.11], ["speech", 19.83], ["vehicle", 10.1]], null, null, null, [["speech", 28.31], ["vehicle", 9.59], ["whale vocalization", 8.32]], null, [["hum", 22.93], ["mains hum", 17.03], ["music", 5.83]], [["mains hum", 23.96], ["speech", 21.72], ["hum", 17.99]], null, null, null, null, null, null, null, null, null, null], "duration": [18.55, 0.16, -0.06, 0.68, 3.62, 0.71, 3.95, 6.46, 39.62, 1.39, 1.44, 0.47, 2.83, 2.41, 0.9, 1.5, 1.37, 1.76]} \ No newline at end of file diff --git a/annotations_1/DefILRrX77k_filtered.json b/annotations_1/DefILRrX77k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b8ba2f9cd863ea3bfee3198fc9ff6e54d441886 --- /dev/null +++ b/annotations_1/DefILRrX77k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.1], [9.0, 27.75], [28.0, 62.45], [64.0, 94.34], [96.0, 96.52], [97.0, 118.25]], "keep_status": [false, true, false, false, false, true], "silence_prob": [61.77, 36.05, 0.0, 0.0, 0.0, 29.68], "audiomae_on_audioset": [null, [["music", 34.67], ["hum", 16.96], ["ambient music", 7.96]], null, null, null, [["music", 19.06], ["mosquito", 10.36], ["fly, housefly", 7.55]]], "duration": [2.1, 18.75, 34.45, 30.34, 0.52, 21.25]} \ No newline at end of file diff --git a/annotations_1/Dh3WAI9JeJw_filtered.json b/annotations_1/Dh3WAI9JeJw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..532a12641b5c57f27944634500a74da8b8421b83 --- /dev/null +++ b/annotations_1/Dh3WAI9JeJw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.94], [21.0, 21.14], [28.0, 28.49], [67.0, 67.56], [72.0, 72.5], [100.0, 100.94], [117.0, 117.69], [125.0, 126.22], [133.0, 134.76], [147.0, 147.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 0.14, 0.49, 0.56, 0.5, 0.94, 0.69, 1.22, 1.76, 0.41]} \ No newline at end of file diff --git a/annotations_1/DhUcvFP_Tas_filtered.json b/annotations_1/DhUcvFP_Tas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0067439f2853741593bf01e67c471397e73ba05f --- /dev/null +++ b/annotations_1/DhUcvFP_Tas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.85], [39.0, 39.39], [41.0, 41.61], [44.0, 44.69], [45.0, 47.33], [48.0, 48.88], [53.0, 74.82], [80.0, 80.92], [81.0, 84.69], [93.0, 96.45], [100.0, 101.12], [101.0, 105.63], [113.0, 116.99], [130.0, 142.55], [148.0, 149.76], [153.0, 167.19], [171.0, 174.99], [176.0, 177.42], [179.0, 179.76], [180.0, 196.52], [197.0, 196.94]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.09, 0.0, 30.23, 0.0, 30.68, 29.77, 0.0, 31.6, 29.76, 30.09, 0.0, 29.26, 29.08, 0.0, 0.0, 29.05, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 47.78], ["didgeridoo", 9.08], ["carnatic music", 4.3]], null, [["music", 87.96], ["christian music", 1.57], ["christmas music", 1.16]], null, [["music", 53.76], ["accordion", 14.58], ["musical instrument", 5.38]], [["music", 69.82], ["foghorn", 4.42], ["musical instrument", 2.87]], null, [["music", 44.1], ["trombone", 21.38], ["brass instrument", 14.37]], [["music", 78.76], ["synthetic singing", 2.6], ["music of latin america", 1.66]], [["music", 82.32], ["yodeling", 5.36], ["brass instrument", 1.15]], null, [["music", 75.08], ["funny music", 1.96], ["synthetic singing", 1.75]], [["music", 68.6], ["middle eastern music", 5.58], ["crowd", 2.7]], null, null, [["music", 71.81], ["musical instrument", 3.5], ["brass instrument", 3.13]], null], "duration": [1.85, 0.39, 0.61, 0.69, 2.33, 0.88, 21.82, 0.92, 3.69, 3.45, 1.12, 4.63, 3.99, 12.55, 1.76, 14.19, 3.99, 1.42, 0.76, 16.52, -0.06]} \ No newline at end of file diff --git a/annotations_1/Dj9G_kEq5W8_filtered.json b/annotations_1/Dj9G_kEq5W8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3f5f1189b9a17770bce0f28809955499cce7a37 --- /dev/null +++ b/annotations_1/Dj9G_kEq5W8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.7], [34.0, 35.24], [64.0, 65.82], [84.0, 86.31], [96.0, 95.79], [98.0, 97.9], [98.0, 97.97], [98.0, 98.51], [102.0, 103.08], [104.0, 104.52], [106.0, 118.44], [119.0, 119.15], [119.0, 119.94], [120.0, 120.28], [121.0, 124.19], [125.0, 133.27], [134.0, 138.72], [141.0, 152.05], [158.0, 164.44], [165.0, 164.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 37.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.09, 0.0, 0.0, 0.0, 35.25, 35.64, 34.91, 35.54, 37.91, 0.0], "audiomae_on_audioset": [null, null, null, [["foghorn", 61.34], ["music", 12.47], ["brass instrument", 10.99]], null, null, null, null, null, null, [["music", 38.14], ["brass instrument", 27.5], ["trumpet", 11.73]], null, null, null, [["music", 19.99], ["foghorn", 16.4], ["theremin", 14.98]], [["music", 32.04], ["brass instrument", 21.32], ["trombone", 13.55]], [["music", 32.08], ["brass instrument", 30.23], ["trombone", 11.44]], [["music", 25.66], ["brass instrument", 21.91], ["trumpet", 16.65]], [["music", 35.46], ["brass instrument", 18.36], ["musical instrument", 5.8]], null], "duration": [1.7, 1.24, 1.82, 2.31, -0.21, -0.1, -0.03, 0.51, 1.08, 0.52, 12.44, 0.15, 0.94, 0.28, 3.19, 8.27, 4.72, 11.05, 6.44, -0.06]} \ No newline at end of file diff --git a/annotations_1/DjNVqYjp3E4_filtered.json b/annotations_1/DjNVqYjp3E4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd491f0f76b5c59423614f55967d4151992ba7ec --- /dev/null +++ b/annotations_1/DjNVqYjp3E4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.01], [16.0, 16.92], [29.0, 29.49], [33.0, 40.9], [43.0, 44.32], [50.0, 52.03], [57.0, 57.64], [58.0, 59.68], [63.0, 63.71], [64.0, 67.46], [69.0, 69.7], [75.0, 79.19]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.35, 0.0, 96.54, 0.0, 0.0, 0.0, 81.0, 0.0, 87.55], "audiomae_on_audioset": [null, null, null, [["music", 36.11], ["hum", 18.66], ["throbbing", 10.35]], null, null, null, null, null, null, null, null], "duration": [0.01, 0.92, 0.49, 7.9, 1.32, 2.03, 0.64, 1.68, 0.71, 3.46, 0.7, 4.19]} \ No newline at end of file diff --git a/annotations_1/Dk2BtXCzdzc_filtered.json b/annotations_1/Dk2BtXCzdzc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..131229c0b42705c504aaefd0e19181b69b29028d --- /dev/null +++ b/annotations_1/Dk2BtXCzdzc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.16], [16.0, 16.56], [17.0, 20.12], [24.0, 24.43], [24.0, 24.53], [27.0, 29.02], [31.0, 30.79], [40.0, 40.32], [42.0, 43.07], [44.0, 53.99], [59.0, 60.47], [61.0, 61.62], [63.0, 65.94], [66.0, 91.1], [101.0, 105.75], [107.0, 109.93], [111.0, 113.51], [116.0, 129.37], [136.0, 136.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 53.84, 0.0, 0.0, 36.55, 0.0, 0.0, 0.0, 50.97, 0.0, 0.0, 71.0, 38.68, 51.66, 82.25, 75.72, 32.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 58.5], ["music", 18.57], ["doorbell", 7.07]], null, null, null, null, null, null, null, [["music", 40.51], ["synthesizer", 25.6], ["musical instrument", 5.88]], null, null, null, [["music", 47.97], ["theremin", 10.09], ["musical instrument", 5.16]], null], "duration": [0.16, 0.56, 3.12, 0.43, 0.53, 2.02, -0.21, 0.32, 1.07, 9.99, 1.47, 0.62, 2.94, 25.1, 4.75, 2.93, 2.51, 13.37, 0.93]} \ No newline at end of file diff --git a/annotations_1/DkGLIu6lnT4_filtered.json b/annotations_1/DkGLIu6lnT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1fdd8fc20fd7dcd175fc382e7d73ebd4f1827a9 --- /dev/null +++ b/annotations_1/DkGLIu6lnT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.79], [4.0, 93.12], [93.0, 94.37], [96.0, 114.3], [118.0, 118.67]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.63, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 70.93], ["speech", 13.05], ["synthesizer", 3.66]], null], "duration": [0.79, 89.12, 1.37, 18.3, 0.67]} \ No newline at end of file diff --git a/annotations_1/DmXp6Pm-uLI_filtered.json b/annotations_1/DmXp6Pm-uLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af25a11a9b391864467349aa0dcef01f8cd6995c --- /dev/null +++ b/annotations_1/DmXp6Pm-uLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.76], [11.0, 12.77], [13.0, 15.94], [19.0, 21.81], [23.0, 27.13], [29.0, 28.85], [31.0, 33.39], [35.0, 37.61], [42.0, 52.07], [54.0, 54.41], [58.0, 58.95], [60.0, 71.36], [74.0, 77.3], [82.0, 82.44], [85.0, 84.99], [87.0, 100.43], [102.0, 117.31], [122.0, 160.62], [161.0, 166.51], [169.0, 173.69]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 52.51, 66.76, 62.47, 0.0, 50.06, 42.11, 32.39, 0.0, 0.0, 30.15, 29.76, 0.0, 0.0, 29.1, 29.28, 0.0, 33.09, 43.45], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 54.43], ["mantra", 5.14], ["choir", 4.94]], [["music", 48.58], ["theremin", 40.62], ["musical instrument", 1.93]], null, null, [["music", 45.59], ["theremin", 24.13], ["speech", 20.43]], [["foghorn", 56.74], ["music", 15.17], ["theremin", 5.76]], null, null, [["music", 33.44], ["didgeridoo", 21.14], ["theremin", 19.08]], [["music", 19.84], ["fly, housefly", 6.38], ["vehicle", 5.65]], null, [["music", 33.62], ["speech", 23.83], ["moo", 5.89]], [["music", 66.9], ["grunt", 5.61], ["theremin", 4.38]]], "duration": [1.76, 1.77, 2.94, 2.81, 4.13, -0.15, 2.39, 2.61, 10.07, 0.41, 0.95, 11.36, 3.3, 0.44, -0.01, 13.43, 15.31, 38.62, 5.51, 4.69]} \ No newline at end of file diff --git a/annotations_1/DnGpfWa6FAQ_filtered.json b/annotations_1/DnGpfWa6FAQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7be8e492089fb25feb559268dbd1adfd90ad057 --- /dev/null +++ b/annotations_1/DnGpfWa6FAQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.54], [14.0, 39.5], [42.0, 69.11], [73.0, 105.36], [107.0, 136.44], [138.0, 150.01], [151.0, 151.34]], "keep_status": [false, true, false, false, true, false, false], "silence_prob": [0.0, 29.74, 29.35, 0.0, 29.78, 29.75, 0.0], "audiomae_on_audioset": [null, [["music", 47.83], ["livestock, farm animals, working animals", 8.7], ["cattle, bovinae", 4.81]], [["cattle, bovinae", 43.41], ["moo", 33.75], ["livestock, farm animals, working animals", 21.81]], null, [["music", 55.6], ["speech", 8.15], ["cattle, bovinae", 3.5]], [["music", 67.36], ["didgeridoo", 11.84], ["musical instrument", 2.73]], null], "duration": [1.54, 25.5, 27.11, 32.36, 29.44, 12.01, 0.34]} \ No newline at end of file diff --git a/annotations_1/DoVnHRhvtKI_filtered.json b/annotations_1/DoVnHRhvtKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1627e5df4e0a9b9aae238c4993778256215ae78c --- /dev/null +++ b/annotations_1/DoVnHRhvtKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [6.0, 8.58], [17.0, 22.38], [30.0, 31.36], [35.0, 65.3], [67.0, 97.66]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 44.75, 30.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 37.53], ["throbbing", 16.31], ["music", 14.73]], [["speech", 68.31], ["music", 8.33], ["hum", 5.54]], null, null, null], "duration": [0.88, 2.58, 5.38, 1.36, 30.3, 30.66]} \ No newline at end of file diff --git a/annotations_1/DooTtUcpKM4_filtered.json b/annotations_1/DooTtUcpKM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a7c1c298587b34eb86f6cab4676725faf4c9268 --- /dev/null +++ b/annotations_1/DooTtUcpKM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.38], [14.0, 20.21], [21.0, 21.9], [22.0, 22.71], [23.0, 34.67], [42.0, 43.71], [45.0, 50.26]], "keep_status": [false, false, false, false, true, false, true], "silence_prob": [64.41, 46.75, 0.0, 0.0, 29.82, 0.0, 31.97], "audiomae_on_audioset": [null, [["hum", 49.45], ["mains hum", 30.29], ["throbbing", 11.6]], null, null, [["livestock, farm animals, working animals", 30.88], ["animal", 20.67], ["cattle, bovinae", 8.55]], null, [["music", 43.36], ["electronic music", 12.56], ["throbbing", 6.99]]], "duration": [6.38, 6.21, 0.9, 0.71, 11.67, 1.71, 5.26]} \ No newline at end of file diff --git a/annotations_1/DpA2bMJlDpI_filtered.json b/annotations_1/DpA2bMJlDpI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a9ff0498555ca77c1c9ec5f15d769a69ef98d93 --- /dev/null +++ b/annotations_1/DpA2bMJlDpI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 30.94], [32.0, 32.32], [33.0, 33.69], [35.0, 38.2], [39.0, 40.51], [42.0, 42.53], [44.0, 44.17], [53.0, 53.43], [63.0, 64.99], [73.0, 75.9], [77.0, 77.48], [87.0, 87.1], [97.0, 99.39], [104.0, 105.46], [113.0, 119.75], [127.0, 126.77], [128.0, 130.05], [131.0, 131.53], [137.0, 137.05], [139.0, 139.73], [144.0, 149.0], [152.0, 183.19], [188.0, 188.13], [190.0, 189.68]], "keep_status": [true, false, false, true, false, false, false, false, false, true, false, false, true, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [31.76, 0.0, 0.0, 32.15, 0.0, 0.0, 0.0, 0.0, 0.0, 32.07, 0.0, 0.0, 32.0, 0.0, 31.54, 0.0, 30.46, 0.0, 0.0, 0.0, 31.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 54.97], ["speech", 9.03], ["sidetone", 5.8]], null, null, [["cattle, bovinae", 24.57], ["music", 21.66], ["moo", 19.19]], null, null, null, null, null, [["music", 31.78], ["boing", 12.14], ["speech", 5.45]], null, null, [["cattle, bovinae", 25.02], ["moo", 22.91], ["livestock, farm animals, working animals", 17.1]], null, [["music", 38.1], ["speech", 9.93], ["electronic music", 8.06]], null, [["music", 33.29], ["speech", 24.88], ["sidetone", 3.6]], null, null, null, [["music", 58.84], ["speech", 17.77], ["synthesizer", 2.81]], null, null, null], "duration": [9.94, 0.32, 0.69, 3.2, 1.51, 0.53, 0.17, 0.43, 1.99, 2.9, 0.48, 0.1, 2.39, 1.46, 6.75, -0.23, 2.05, 0.53, 0.05, 0.73, 5.0, 31.19, 0.13, -0.32]} \ No newline at end of file diff --git a/annotations_1/DpQHj1R8kXk_filtered.json b/annotations_1/DpQHj1R8kXk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d17c3e49cacc7968767479e670f62fadd3a03d31 --- /dev/null +++ b/annotations_1/DpQHj1R8kXk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.57], [12.0, 12.38], [15.0, 16.9], [20.0, 20.09], [22.0, 22.62], [24.0, 24.85], [26.0, 26.84], [29.0, 31.7], [38.0, 39.14], [39.0, 41.55], [43.0, 43.11], [45.0, 45.87], [52.0, 53.22], [57.0, 59.61], [60.0, 63.54], [65.0, 67.07], [77.0, 77.58], [79.0, 80.37], [86.0, 89.77], [91.0, 114.39], [116.0, 147.19], [148.0, 149.49], [152.0, 156.71]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.1, 0.0, 31.58, 0.0, 0.0, 0.0, 64.41, 48.31, 39.58, 0.0, 0.0, 97.33, 38.41, 0.0, 0.0, 29.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["breaking", 20.97], ["explosion", 18.37], ["whack, thwack", 9.23]], null, [["hum", 24.24], ["mains hum", 8.39], ["music", 5.28]], null, null, null, null, [["speech", 64.37], ["sine wave", 15.53], ["dial tone", 5.61]], [["speech", 67.09], ["music", 4.68], ["rumble", 3.52]], null, null, null, [["throbbing", 45.53], ["hum", 33.82], ["mains hum", 5.07]], null, null, [["speech", 45.99], ["hum", 8.32], ["music", 7.08]]], "duration": [0.57, 0.38, 1.9, 0.09, 0.62, 0.85, 0.84, 2.7, 1.14, 2.55, 0.11, 0.87, 1.22, 2.61, 3.54, 2.07, 0.58, 1.37, 3.77, 23.39, 31.19, 1.49, 4.71]} \ No newline at end of file diff --git a/annotations_1/DqSBqfDgOsQ_filtered.json b/annotations_1/DqSBqfDgOsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3f7fb5b7ac239fe47b24df741a4e379cc36128c --- /dev/null +++ b/annotations_1/DqSBqfDgOsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.7], [22.0, 23.04], [24.0, 25.34], [27.0, 26.69], [27.0, 27.94], [33.0, 34.2], [37.0, 38.97], [41.0, 41.89], [50.0, 50.87], [53.0, 53.94], [58.0, 59.37], [60.0, 60.91], [63.0, 66.18], [68.0, 68.22], [70.0, 69.87], [71.0, 71.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.49, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.2], ["singing bowl", 20.81], ["gong", 5.06]], null, null, null], "duration": [0.7, 1.04, 1.34, -0.31, 0.94, 1.2, 1.97, 0.89, 0.87, 0.94, 1.37, 0.91, 3.18, 0.22, -0.13, 0.59]} \ No newline at end of file diff --git a/annotations_1/Dr6eV4y0atg_filtered.json b/annotations_1/Dr6eV4y0atg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0aaf858c01cb7e421f4d5c0e4910c2552c6b1b1e --- /dev/null +++ b/annotations_1/Dr6eV4y0atg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 37.59], [38.0, 39.87], [43.0, 44.24], [49.0, 52.59]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.41], "audiomae_on_audioset": [null, null, null, [["music", 68.66], ["synthesizer", 5.98], ["didgeridoo", 3.49]]], "duration": [0.59, 1.87, 1.24, 3.59]} \ No newline at end of file diff --git a/annotations_1/DrrwX4AnbMk_filtered.json b/annotations_1/DrrwX4AnbMk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67c8c7381ced912c4aab4dd5156c764c0e90ed76 --- /dev/null +++ b/annotations_1/DrrwX4AnbMk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 40.53], [43.0, 43.06], [44.0, 59.29], [60.0, 72.6], [76.0, 77.5], [79.0, 89.02], [96.0, 103.74], [105.0, 109.95]], "keep_status": [true, false, true, true, false, false, false, false], "silence_prob": [32.17, 0.0, 28.53, 29.16, 0.0, 36.39, 51.39, 36.98], "audiomae_on_audioset": [[["music", 48.42], ["animal", 11.4], ["roar", 6.75]], null, [["music", 28.63], ["theremin", 9.22], ["gong", 8.7]], [["gong", 43.75], ["hum", 16.45], ["music", 6.58]], null, [["music", 44.29], ["theremin", 31.43], ["musical instrument", 5.9]], null, [["theremin", 79.14], ["music", 15.71], ["musical instrument", 1.07]]], "duration": [5.53, 0.06, 15.29, 12.6, 1.5, 10.02, 7.74, 4.95]} \ No newline at end of file diff --git a/annotations_1/Drt2w_iit1M_filtered.json b/annotations_1/Drt2w_iit1M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd7c885a151841130b4492c34e3b9ace1d81695b --- /dev/null +++ b/annotations_1/Drt2w_iit1M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.65], [3.0, 5.21], [7.0, 11.91], [15.0, 15.6], [18.0, 18.3], [20.0, 20.29], [23.0, 25.86], [27.0, 28.16], [30.0, 31.73], [33.0, 44.79], [50.0, 51.22], [52.0, 94.09], [96.0, 109.51], [111.0, 121.15], [124.0, 124.77]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 63.96, 79.59, 0.0, 0.0, 0.0, 47.46, 0.0, 0.0, 29.06, 0.0, 0.0, 29.64, 50.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 32.27], ["hum", 14.4], ["music", 13.9]], null, null, [["music", 26.61], ["hum", 26.12], ["throbbing", 11.67]], null, null, [["didgeridoo", 33.1], ["music", 14.8], ["hum", 10.02]], null, null], "duration": [0.65, 2.21, 4.91, 0.6, 0.3, 0.29, 2.86, 1.16, 1.73, 11.79, 1.22, 42.09, 13.51, 10.15, 0.77]} \ No newline at end of file diff --git a/annotations_1/DsMU1n2HUDo_filtered.json b/annotations_1/DsMU1n2HUDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8cb75ca0f77797c24e10bf4cf188604b4a8bcd46 --- /dev/null +++ b/annotations_1/DsMU1n2HUDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 42.16], [46.0, 126.57], [128.0, 144.36], [145.0, 146.47], [147.0, 162.84], [163.0, 163.48], [166.0, 167.12], [169.0, 173.84]], "keep_status": [true, false, true, false, false, false, false, false], "silence_prob": [35.35, 0.0, 29.06, 0.0, 31.87, 0.0, 0.0, 63.42], "audiomae_on_audioset": [[["speech", 37.06], ["throbbing", 16.22], ["hum", 11.57]], null, [["music", 45.04], ["smash, crash", 15.2], ["breaking", 8.17]], null, [["music", 38.57], ["speech", 29.61], ["didgeridoo", 14.84]], null, null, null], "duration": [8.16, 80.57, 16.36, 1.47, 15.84, 0.48, 1.12, 4.84]} \ No newline at end of file diff --git a/annotations_1/DtH30Cz2Zec_filtered.json b/annotations_1/DtH30Cz2Zec_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5192a2f295758e0003cb4dc28ef3c701e002744 --- /dev/null +++ b/annotations_1/DtH30Cz2Zec_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[65.0, 66.7], [69.0, 69.23]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.7, 0.23]} \ No newline at end of file diff --git a/annotations_1/DtV4RnADOeA_filtered.json b/annotations_1/DtV4RnADOeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0ce6afcf4fd4da88da88af3e4dd159aaa7db0fb --- /dev/null +++ b/annotations_1/DtV4RnADOeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.03], [11.0, 51.65], [53.0, 92.45], [93.0, 161.99], [163.0, 163.51], [168.0, 168.81]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.03, 40.65, 39.45, 68.99, 0.51, 0.81]} \ No newline at end of file diff --git a/annotations_1/DtuXEqWdWCI_filtered.json b/annotations_1/DtuXEqWdWCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f87b649a5f78e906c874c97e8bc9b118edd5034 --- /dev/null +++ b/annotations_1/DtuXEqWdWCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 35.83], [36.0, 36.71], [37.0, 37.76], [39.0, 43.04], [44.0, 72.05], [73.0, 73.45], [76.0, 77.11], [78.0, 80.23], [86.0, 87.0], [92.0, 95.37], [98.0, 103.0], [107.0, 107.15], [111.0, 113.07], [116.0, 117.21], [120.0, 121.04], [123.0, 123.79], [124.0, 125.25]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.71, 0.0, 0.0, 29.15, 30.13, 0.0, 0.0, 35.87, 0.0, 43.71, 30.1, 0.0, 29.57, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 68.36], ["speech", 4.87], ["throbbing", 3.33]], null, null, [["speech", 40.75], ["explosion", 11.35], ["eruption", 11.04]], [["music", 57.26], ["throbbing", 11.43], ["hum", 5.16]], null, null, [["throbbing", 57.45], ["hum", 15.74], ["music", 9.59]], null, [["speech", 36.58], ["sidetone", 28.12], ["didgeridoo", 10.23]], [["speech", 61.09], ["music", 8.3], ["explosion", 5.68]], null, [["speech", 47.42], ["explosion", 12.72], ["artillery fire", 10.18]], null, null, null, null], "duration": [12.83, 0.71, 0.76, 4.04, 28.05, 0.45, 1.11, 2.23, 1.0, 3.37, 5.0, 0.15, 2.07, 1.21, 1.04, 0.79, 1.25]} \ No newline at end of file diff --git a/annotations_1/DubYVqV92OQ_filtered.json b/annotations_1/DubYVqV92OQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8beef7a3032cfb6959c2ffb9fe5d36a5a5d7aeb --- /dev/null +++ b/annotations_1/DubYVqV92OQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [18.0, 20.82], [33.0, 39.78], [40.0, 40.14], [42.0, 42.69], [46.0, 49.94], [50.0, 55.53], [56.0, 59.58], [75.0, 84.11]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 99.96, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.35, 2.82, 6.78, 0.14, 0.69, 3.94, 5.53, 3.58, 9.11]} \ No newline at end of file diff --git a/annotations_1/DujyJ1EDft8_filtered.json b/annotations_1/DujyJ1EDft8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6a0639377e62fe0d5c16bf40bbcee564c4514e2 --- /dev/null +++ b/annotations_1/DujyJ1EDft8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 35.19], [36.0, 43.17], [44.0, 47.78], [49.0, 49.18], [50.0, 50.19], [51.0, 52.62], [53.0, 53.57], [55.0, 55.9], [57.0, 57.28], [58.0, 59.02], [60.0, 61.5], [63.0, 63.9], [67.0, 68.59], [69.0, 96.11]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 32.14, 64.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.86], "audiomae_on_audioset": [null, [["effects unit", 25.39], ["civil defense siren", 21.1], ["distortion", 18.59]], null, null, null, null, null, null, null, null, null, null, null, [["music", 30.39], ["hum", 11.66], ["synthesizer", 10.48]]], "duration": [35.19, 7.17, 3.78, 0.18, 0.19, 1.62, 0.57, 0.9, 0.28, 1.02, 1.5, 0.9, 1.59, 27.11]} \ No newline at end of file diff --git a/annotations_1/Dwiczhta4e0_filtered.json b/annotations_1/Dwiczhta4e0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..932bbcbb442039040a9ae8eabdaa02a14a10821f --- /dev/null +++ b/annotations_1/Dwiczhta4e0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [4.0, 4.48], [12.0, 12.31], [13.0, 13.78], [14.0, 15.23], [17.0, 17.27], [41.0, 43.09], [48.0, 49.13], [52.0, 54.94], [76.0, 76.49], [87.0, 93.31], [95.0, 95.82], [100.0, 99.74], [100.0, 99.82], [100.0, 99.86], [100.0, 99.93], [100.0, 99.96], [100.0, 102.25], [107.0, 107.11], [108.0, 108.63], [110.0, 111.2], [123.0, 123.69], [125.0, 125.83], [130.0, 130.49], [134.0, 134.91], [136.0, 136.58], [137.0, 137.89], [143.0, 148.78], [151.0, 151.43], [152.0, 155.95], [159.0, 159.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.27, 0.0, 65.79, 0.0, 36.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.69, 0.0, 49.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["throbbing", 30.66], ["sidetone", 18.7], ["hum", 14.78]], null, null, null, null, null, null, [["music", 40.07], ["speech", 14.15], ["hum", 12.36]], null, null, null, null, null, null, null, null, null, [["music", 41.37], ["sheep", 11.88], ["bleat", 7.99]], null, [["music", 53.92], ["hum", 8.17], ["throbbing", 4.27]], null], "duration": [0.43, 0.48, 0.31, 0.78, 1.23, 0.27, 2.09, 1.13, 2.94, 0.49, 6.31, 0.82, -0.26, -0.18, -0.14, -0.07, -0.04, 2.25, 0.11, 0.63, 1.2, 0.69, 0.83, 0.49, 0.91, 0.58, 0.89, 5.78, 0.43, 3.95, 0.81]} \ No newline at end of file diff --git a/annotations_1/DxCjqhDD7X4_filtered.json b/annotations_1/DxCjqhDD7X4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa9ef36854e30b6625dde100d810300c713ad957 --- /dev/null +++ b/annotations_1/DxCjqhDD7X4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.75], [9.0, 10.0], [11.0, 12.16], [20.0, 27.87], [29.0, 31.45], [33.0, 90.75], [97.0, 101.6], [103.0, 106.07], [108.0, 112.23], [116.0, 159.48], [161.0, 161.74]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.27, 38.56, 0.0, 29.75, 29.67, 30.5, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 60.21], ["musical instrument", 8.99], ["synthesizer", 5.28]], [["music", 74.14], ["musical instrument", 5.0], ["didgeridoo", 3.94]], null, [["music", 39.31], ["didgeridoo", 22.61], ["musical instrument", 4.06]], [["mosquito", 18.2], ["music", 13.87], ["fly, housefly", 9.47]], [["music", 48.14], ["vocal music", 4.33], ["beatboxing", 3.43]], null, null], "duration": [0.75, 1.0, 1.16, 7.87, 2.45, 57.75, 4.6, 3.07, 4.23, 43.48, 0.74]} \ No newline at end of file diff --git a/annotations_1/DyCfCl46JSE_filtered.json b/annotations_1/DyCfCl46JSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4de32e6cf7d7ccba58b4d44693a9f1f5d414347 --- /dev/null +++ b/annotations_1/DyCfCl46JSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.07], [60.0, 67.07], [73.0, 72.86], [74.0, 75.32]], "keep_status": [true, false, false, false], "silence_prob": [32.59, 31.45, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.3], ["synthesizer", 6.93], ["musical instrument", 6.76]], [["music", 81.98], ["singing", 3.99], ["beatboxing", 2.07]], null, null], "duration": [2.07, 7.07, -0.14, 1.32]} \ No newline at end of file diff --git a/annotations_1/DyUus5cUe08_filtered.json b/annotations_1/DyUus5cUe08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9508af9a7f8d985dc306cc6164be49e62d2e9530 --- /dev/null +++ b/annotations_1/DyUus5cUe08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 105.12], [105.0, 105.98], [106.0, 130.17]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 32.3], "audiomae_on_audioset": [null, null, [["gong", 19.58], ["sonar", 15.17], ["hum", 12.78]]], "duration": [65.12, 0.98, 24.17]} \ No newline at end of file diff --git a/annotations_1/Dys_AAhlGqU_filtered.json b/annotations_1/Dys_AAhlGqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..755a1453b9883474eceff91caa823792929078d0 --- /dev/null +++ b/annotations_1/Dys_AAhlGqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.53], [21.0, 22.72], [48.0, 53.72], [55.0, 55.0], [57.0, 57.55], [59.0, 60.32], [62.0, 63.48], [64.0, 84.96], [85.0, 86.75], [88.0, 88.69], [100.0, 99.71], [102.0, 102.59], [105.0, 106.44], [108.0, 109.04], [110.0, 110.73], [116.0, 116.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.81, 0.0, 0.0, 0.0, 0.0, 32.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 74.21], ["throbbing", 8.3], ["electronic music", 4.49]], null, null, null, null, [["music", 80.16], ["scratching (performance technique)", 7.2], ["electronic music", 3.38]], null, null, null, null, null, null, null, null], "duration": [0.53, 1.72, 5.72, 0.0, 0.55, 1.32, 1.48, 20.96, 1.75, 0.69, -0.29, 0.59, 1.44, 1.04, 0.73, 0.16]} \ No newline at end of file diff --git a/annotations_1/DyxkjYmlzhg_filtered.json b/annotations_1/DyxkjYmlzhg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5143ded56403008020fbbbc280f5dae98ac70b95 --- /dev/null +++ b/annotations_1/DyxkjYmlzhg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.69], [14.0, 13.96], [19.0, 19.74], [20.0, 21.57], [26.0, 26.32], [31.0, 31.36], [34.0, 39.43], [40.0, 42.15], [43.0, 48.84], [53.0, 55.83], [60.0, 63.73], [71.0, 71.29], [86.0, 87.69], [92.0, 92.74], [94.0, 94.47], [96.0, 99.74], [103.0, 103.44], [119.0, 119.97], [127.0, 127.3], [128.0, 128.76], [130.0, 130.65], [137.0, 138.15], [141.0, 140.7], [143.0, 142.87], [144.0, 144.54], [151.0, 151.97], [156.0, 156.24], [160.0, 161.06], [162.0, 162.46], [165.0, 166.87], [168.0, 171.39], [179.0, 179.09], [185.0, 185.26], [186.0, 187.76], [189.0, 190.34], [192.0, 192.11], [193.0, 194.26], [196.0, 199.07], [200.0, 205.85], [207.0, 207.5], [208.0, 209.43], [214.0, 214.52], [223.0, 226.64], [228.0, 229.41], [231.0, 231.97], [233.0, 241.24], [242.0, 250.64], [252.0, 254.92], [256.0, 259.41], [264.0, 267.49], [268.0, 270.33], [271.0, 276.34], [278.0, 283.98]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, true, false, true, false, true, false], "silence_prob": [40.12, 0.0, 0.0, 0.0, 0.0, 0.0, 42.44, 47.7, 48.82, 51.5, 47.9, 0.0, 0.0, 0.0, 0.0, 43.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.43, 41.14, 0.0, 0.0, 0.0, 40.92, 0.0, 0.0, 44.2, 43.38, 46.4, 48.31, 46.68, 50.71, 42.28, 42.13], "audiomae_on_audioset": [[["hum", 37.12], ["mains hum", 32.81], ["throbbing", 16.39]], null, null, null, null, null, [["music", 41.63], ["hum", 7.87], ["electronic music", 5.82]], [["music", 46.03], ["hum", 7.69], ["speech", 7.29]], [["hum", 46.03], ["music", 15.96], ["throbbing", 11.46]], null, [["hum", 47.81], ["mains hum", 14.28], ["music", 12.61]], null, null, null, null, [["hum", 31.77], ["mains hum", 19.31], ["speech", 15.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 17.04], ["hum", 16.81], ["chirp tone", 12.54]], [["music", 39.37], ["hum", 14.26], ["didgeridoo", 11.13]], null, null, null, [["hum", 31.21], ["speech", 10.72], ["mains hum", 9.92]], null, null, [["speech", 30.35], ["hum", 22.06], ["mains hum", 17.7]], [["hum", 43.71], ["mains hum", 36.33], ["music", 5.3]], [["music", 32.58], ["speech", 20.63], ["hum", 13.37]], [["music", 30.66], ["hum", 23.37], ["throbbing", 17.08]], [["music", 39.37], ["throbbing", 13.56], ["hum", 8.46]], null, [["throbbing", 32.84], ["music", 23.41], ["croak", 10.92]], [["throbbing", 33.04], ["hum", 24.83], ["music", 21.81]]], "duration": [7.69, -0.04, 0.74, 1.57, 0.32, 0.36, 5.43, 2.15, 5.84, 2.83, 3.73, 0.29, 1.69, 0.74, 0.47, 3.74, 0.44, 0.97, 0.3, 0.76, 0.65, 1.15, -0.3, -0.13, 0.54, 0.97, 0.24, 1.06, 0.46, 1.87, 3.39, 0.09, 0.26, 1.76, 1.34, 0.11, 1.26, 3.07, 5.85, 0.5, 1.43, 0.52, 3.64, 1.41, 0.97, 8.24, 8.64, 2.92, 3.41, 3.49, 2.33, 5.34, 5.98]} \ No newline at end of file diff --git a/annotations_1/DzQjdpw73ZY_filtered.json b/annotations_1/DzQjdpw73ZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d08ff70f9b2f37186fbd030131c46e79250388b --- /dev/null +++ b/annotations_1/DzQjdpw73ZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.62], [14.0, 14.08], [18.0, 17.73], [19.0, 19.74], [25.0, 25.27], [26.0, 26.18], [41.0, 42.13], [51.0, 53.22], [54.0, 54.84], [56.0, 58.8], [64.0, 64.27], [66.0, 66.11], [67.0, 70.78], [73.0, 74.07], [76.0, 77.52], [79.0, 79.52], [87.0, 88.48], [99.0, 99.98], [105.0, 105.26], [110.0, 110.4], [113.0, 114.84]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.64, 0.0, 36.11, 0.0, 0.0, 70.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 63.54], ["animal", 1.7], ["snicker", 1.63]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.08, -0.27, 0.74, 0.27, 0.18, 1.13, 2.22, 0.84, 2.8, 0.27, 0.11, 3.78, 1.07, 1.52, 0.52, 1.48, 0.98, 0.26, 0.4, 1.84]} \ No newline at end of file diff --git a/annotations_1/DzqzlpAo9s4_filtered.json b/annotations_1/DzqzlpAo9s4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d71dcf50e3ee78fd4b881f0449a059db59c6115 --- /dev/null +++ b/annotations_1/DzqzlpAo9s4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.97], [12.0, 12.92], [17.0, 27.53], [30.0, 31.06], [40.0, 40.98], [42.0, 43.21], [46.0, 50.94], [51.0, 63.09]], "keep_status": [false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 43.66, 0.0, 0.0, 0.0, 31.03, 29.31], "audiomae_on_audioset": [null, null, [["speech", 26.6], ["fly, housefly", 10.39], ["hum", 7.39]], null, null, null, [["music", 25.61], ["hum", 18.3], ["mains hum", 8.55]], [["speech", 75.77], ["explosion", 4.61], ["eruption", 4.33]]], "duration": [0.97, 0.92, 10.53, 1.06, 0.98, 1.21, 4.94, 12.09]} \ No newline at end of file diff --git a/annotations_1/E-EDJ6Z8mS8_filtered.json b/annotations_1/E-EDJ6Z8mS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd4ae16ad8aaf224c74b381d8d4e44fa0951dec1 --- /dev/null +++ b/annotations_1/E-EDJ6Z8mS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 31.7], [33.0, 32.85], [34.0, 49.87], [52.0, 53.35], [54.0, 54.24], [55.0, 59.29], [60.0, 60.71], [62.0, 62.13], [64.0, 63.8], [66.0, 88.23], [91.0, 95.08], [101.0, 115.1]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 30.02, 0.0, 0.0, 38.56, 0.0, 0.0, 0.0, 28.83, 28.4, 28.54], "audiomae_on_audioset": [null, null, [["speech", 32.92], ["sidetone", 31.53], ["hum", 8.95]], null, null, [["mains hum", 72.39], ["hum", 23.31], ["sidetone", 1.0]], null, null, null, [["music", 43.32], ["throbbing", 19.94], ["hum", 4.99]], [["music", 20.96], ["speech", 11.76], ["throbbing", 9.9]], [["speech", 27.42], ["music", 16.44], ["boom", 7.05]]], "duration": [0.7, -0.15, 15.87, 1.35, 0.24, 4.29, 0.71, 0.13, -0.2, 22.23, 4.08, 14.1]} \ No newline at end of file diff --git a/annotations_1/E-F92GOLVcU_filtered.json b/annotations_1/E-F92GOLVcU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7667772784561bb95c5fef138b37a9ecf6e6e2f3 --- /dev/null +++ b/annotations_1/E-F92GOLVcU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.5], [18.0, 18.76], [25.0, 26.35], [32.0, 32.86], [34.0, 36.17], [38.0, 38.52], [42.0, 42.53], [44.0, 47.04], [54.0, 54.97], [56.0, 61.69], [77.0, 77.55], [80.0, 80.91], [87.0, 87.35], [92.0, 106.44], [113.0, 113.66], [120.0, 119.89], [133.0, 134.64], [137.0, 137.32], [139.0, 141.83], [146.0, 149.05], [150.0, 150.65], [153.0, 154.68], [155.0, 158.94], [161.0, 161.52]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.15, 0.0, 0.0, 71.14, 0.0, 43.18, 0.0, 0.0, 0.0, 57.01, 0.0, 0.0, 0.0, 0.0, 34.51, 32.81, 0.0, 0.0, 33.24, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 57.24], ["drip", 4.44], ["gurgling", 3.56]], null, null, null, null, [["speech", 69.92], ["hum", 3.95], ["throbbing", 3.82]], null, null, null, null, null, null, null, null, [["speech", 55.99], ["music", 8.51], ["boing", 4.83]], [["whale vocalization", 25.12], ["cattle, bovinae", 19.44], ["moo", 13.55]], null, null, [["whale vocalization", 26.74], ["speech", 12.29], ["music", 10.49]], null], "duration": [0.5, 0.76, 1.35, 0.86, 2.17, 0.52, 0.53, 3.04, 0.97, 5.69, 0.55, 0.91, 0.35, 14.44, 0.66, -0.11, 1.64, 0.32, 2.83, 3.05, 0.65, 1.68, 3.94, 0.52]} \ No newline at end of file diff --git a/annotations_1/E-MOzwWySaQ_filtered.json b/annotations_1/E-MOzwWySaQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dda73614f486a39542a489a685eb6e820e0ea3aa --- /dev/null +++ b/annotations_1/E-MOzwWySaQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.2], [11.0, 11.97], [14.0, 100.45], [104.0, 112.68], [125.0, 124.98], [140.0, 149.81], [150.0, 150.84], [151.0, 180.05], [187.0, 200.79]], "keep_status": [true, false, false, true, false, false, false, false, false], "silence_prob": [36.9, 0.0, 0.0, 31.79, 0.0, 29.46, 0.0, 29.76, 29.21], "audiomae_on_audioset": [[["hum", 27.06], ["speech", 26.28], ["music", 14.91]], null, null, [["music", 30.41], ["speech", 29.15], ["sidetone", 7.01]], null, [["speech", 39.88], ["music", 33.65], ["cacophony", 4.49]], null, [["speech", 39.92], ["music", 23.66], ["hum", 6.59]], [["music", 46.34], ["hum", 21.41], ["throbbing", 13.15]]], "duration": [2.2, 0.97, 86.45, 8.68, -0.02, 9.81, 0.84, 29.05, 13.79]} \ No newline at end of file diff --git a/annotations_1/E-NXKcnsDJ8_filtered.json b/annotations_1/E-NXKcnsDJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5f925685a175a1ccfbc4ea442fc3a0e17d1d420 --- /dev/null +++ b/annotations_1/E-NXKcnsDJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.06], [10.0, 17.59], [19.0, 51.34], [53.0, 52.95], [54.0, 64.69], [66.0, 67.56], [69.0, 69.48], [73.0, 73.62], [87.0, 92.04], [93.0, 145.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.68, 0.0, 0.0, 30.61, 0.0, 0.0, 0.0, 32.02, 0.0], "audiomae_on_audioset": [null, [["music", 77.66], ["electronic music", 3.55], ["soundtrack music", 3.05]], null, null, [["mains hum", 68.22], ["hum", 16.19], ["speech", 8.63]], null, null, null, [["music", 35.91], ["hum", 18.69], ["throbbing", 16.43]], null], "duration": [0.06, 7.59, 32.34, -0.05, 10.69, 1.56, 0.48, 0.62, 5.04, 52.37]} \ No newline at end of file diff --git a/annotations_1/E-Ts3DuFLDg_filtered.json b/annotations_1/E-Ts3DuFLDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a99345371ba8d5e32824a997b033ed077cc53ceb --- /dev/null +++ b/annotations_1/E-Ts3DuFLDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 26.2], [38.0, 45.47], [46.0, 49.5], [54.0, 60.02], [60.0, 60.99], [84.0, 86.49], [90.0, 100.09], [106.0, 110.25], [125.0, 125.56], [127.0, 128.97], [133.0, 134.4], [160.0, 160.0], [162.0, 174.6]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [31.6, 30.24, 37.3, 33.03, 0.0, 30.64, 30.27, 32.29, 0.0, 0.0, 0.0, 0.0, 34.71], "audiomae_on_audioset": [[["music", 68.59], ["throbbing", 12.5], ["synthesizer", 4.06]], [["music", 76.68], ["didgeridoo", 9.19], ["throbbing", 2.57]], [["didgeridoo", 37.87], ["music", 27.25], ["speech", 17.65]], [["hum", 34.45], ["music", 18.83], ["mains hum", 18.69]], null, [["music", 76.25], ["didgeridoo", 5.7], ["singing", 2.58]], [["music", 76.4], ["theremin", 2.87], ["throbbing", 2.35]], [["music", 49.93], ["musical instrument", 7.38], ["double bass", 3.74]], null, null, null, null, [["music", 69.45], ["hum", 4.4], ["throbbing", 3.52]]], "duration": [20.2, 7.47, 3.5, 6.02, 0.99, 2.49, 10.09, 4.25, 0.56, 1.97, 1.4, 0.0, 12.6]} \ No newline at end of file diff --git a/annotations_1/E-fSwxZNG-0_filtered.json b/annotations_1/E-fSwxZNG-0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e7c64da6a6346b5c148028ea032fc38708855f5 --- /dev/null +++ b/annotations_1/E-fSwxZNG-0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 81.18], [82.0, 83.07], [87.0, 91.03], [92.0, 96.72], [98.0, 105.06], [106.0, 110.12], [111.0, 126.81]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [31.31, 0.0, 98.19, 96.89, 80.29, 82.07, 93.76], "audiomae_on_audioset": [[["sidetone", 76.57], ["speech", 16.47], ["radio", 0.65]], null, null, null, null, null, null], "duration": [10.18, 1.07, 4.03, 4.72, 7.06, 4.12, 15.81]} \ No newline at end of file diff --git a/annotations_1/E-gwIn1O1pE_filtered.json b/annotations_1/E-gwIn1O1pE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdd545c868d1077ae11f67f9fbae0573c708a013 --- /dev/null +++ b/annotations_1/E-gwIn1O1pE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.28], [5.0, 5.64], [9.0, 9.58], [12.0, 12.7], [15.0, 15.92], [21.0, 23.01], [27.0, 27.36], [27.0, 29.59], [31.0, 31.92], [33.0, 35.41], [48.0, 49.22], [53.0, 55.17], [60.0, 70.6], [72.0, 73.43], [76.0, 76.65], [79.0, 79.3], [82.0, 83.27], [89.0, 89.53], [100.0, 102.14], [107.0, 108.41], [111.0, 112.19], [115.0, 115.75], [121.0, 122.07], [125.0, 127.68], [129.0, 134.06], [136.0, 138.11], [139.0, 142.53], [145.0, 145.74], [147.0, 149.22], [151.0, 153.42], [156.0, 163.95], [165.0, 167.97], [169.0, 170.8], [174.0, 178.23], [181.0, 182.02], [185.0, 201.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.81, 0.0, 30.58, 0.0, 28.89, 0.0, 53.22, 71.14, 0.0, 0.0, 0.0, 0.0, 0.0, 67.25, 0.0, 0.0, 0.0, 0.0, 57.17, 34.82, 34.07, 31.0, 0.0, 95.51, 94.81, 92.8, 61.57, 0.0, 99.87, 0.0, 44.9], "audiomae_on_audioset": [null, null, null, null, null, [["music", 77.21], ["speech", 9.02], ["didgeridoo", 2.78]], null, [["livestock, farm animals, working animals", 51.35], ["cattle, bovinae", 25.38], ["moo", 15.34]], null, [["cattle, bovinae", 46.13], ["moo", 29.4], ["livestock, farm animals, working animals", 15.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.66], ["musical instrument", 3.93], ["clapping", 3.25]], [["music", 42.35], ["speech", 20.21], ["didgeridoo", 14.49]], [["music", 25.47], ["thunk", 15.35], ["speech", 5.35]], null, null, null, null, null, null, null, null, [["throbbing", 15.5], ["speech", 15.49], ["hum", 13.71]]], "duration": [1.28, 0.64, 0.58, 0.7, 0.92, 2.01, 0.36, 2.59, 0.92, 2.41, 1.22, 2.17, 10.6, 1.43, 0.65, 0.3, 1.27, 0.53, 2.14, 1.41, 1.19, 0.75, 1.07, 2.68, 5.06, 2.11, 3.53, 0.74, 2.22, 2.42, 7.95, 2.97, 1.8, 4.23, 1.02, 16.77]} \ No newline at end of file diff --git a/annotations_1/E-mnMI7Klyw_filtered.json b/annotations_1/E-mnMI7Klyw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..025c2743d211d4e8179589b797b8f4e5fbdc4f59 --- /dev/null +++ b/annotations_1/E-mnMI7Klyw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 43.58], [47.0, 50.03], [51.0, 51.85], [53.0, 54.72], [57.0, 57.6], [61.0, 61.32], [66.0, 65.94], [118.0, 117.98], [119.0, 121.07], [126.0, 127.85], [131.0, 131.26], [131.0, 132.87]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 39.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 72.59], ["snoring", 3.83], ["wild animals", 2.71]], null, null, null, null, null, null, [["music", 24.89], ["fly, housefly", 15.97], ["insect", 8.93]], null, null, null], "duration": [1.58, 3.03, 0.85, 1.72, 0.6, 0.32, -0.06, -0.02, 2.07, 1.85, 0.26, 1.87]} \ No newline at end of file diff --git a/annotations_1/E-wr7dD1n5w_filtered.json b/annotations_1/E-wr7dD1n5w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3fcfbd5a7ac23471e5df6ed4ea97105a78ea6686 --- /dev/null +++ b/annotations_1/E-wr7dD1n5w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.51], [26.0, 27.31], [29.0, 30.06], [33.0, 35.61], [40.0, 51.26], [52.0, 59.95], [60.0, 100.67], [103.0, 133.07], [134.0, 134.47], [136.0, 147.48], [150.0, 151.68], [152.0, 151.83], [156.0, 167.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 61.57, 36.58, 60.05, 0.0, 0.0, 0.0, 32.62, 0.0, 0.0, 32.89], "audiomae_on_audioset": [null, null, null, null, [["music", 49.02], ["speech", 27.66], ["scary music", 3.75]], null, null, null, null, [["music", 54.24], ["speech", 27.84], ["electronic music", 3.93]], null, null, [["music", 49.7], ["speech", 21.33], ["hum", 3.36]]], "duration": [1.51, 1.31, 1.06, 2.61, 11.26, 7.95, 40.67, 30.07, 0.47, 11.48, 1.68, -0.17, 11.53]} \ No newline at end of file diff --git a/annotations_1/E0BY209ZNEY_filtered.json b/annotations_1/E0BY209ZNEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64328d8d014bfe6e9321ec9bceb545e5584f24ad --- /dev/null +++ b/annotations_1/E0BY209ZNEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.33], [19.0, 19.5], [20.0, 20.26], [23.0, 23.65], [26.0, 26.49], [28.0, 33.54], [36.0, 37.81], [38.0, 43.34], [46.0, 47.39], [51.0, 52.1], [55.0, 57.79], [60.0, 60.74], [73.0, 78.93], [90.0, 91.74], [94.0, 97.24], [100.0, 100.23], [105.0, 106.24], [125.0, 125.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [40.86, 0.0, 0.0, 0.0, 0.0, 54.5, 0.0, 44.55, 0.0, 0.0, 62.68, 0.0, 34.64, 0.0, 33.11, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 43.79], ["hum", 15.39], ["mains hum", 10.84]], null, null, null, null, null, null, [["fly, housefly", 59.44], ["insect", 15.15], ["bee, wasp, etc.", 11.67]], null, null, null, null, [["music", 61.56], ["speech", 16.32], ["musical instrument", 3.03]], null, [["music", 49.41], ["throbbing", 7.89], ["musical instrument", 6.71]], null, null, null], "duration": [4.33, 0.5, 0.26, 0.65, 0.49, 5.54, 1.81, 5.34, 1.39, 1.1, 2.79, 0.74, 5.93, 1.74, 3.24, 0.23, 1.24, 0.39]} \ No newline at end of file diff --git a/annotations_1/E0i4dabbAcI_filtered.json b/annotations_1/E0i4dabbAcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcd1986e555d2ac410856e98a2f22ad6adf914c0 --- /dev/null +++ b/annotations_1/E0i4dabbAcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.48], [6.0, 8.9], [9.0, 9.12], [10.0, 20.21], [20.0, 23.18], [24.0, 37.94], [39.0, 51.98], [53.0, 61.45], [62.0, 66.8], [69.0, 70.26], [70.0, 71.22], [72.0, 80.64], [83.0, 84.08], [85.0, 90.83], [93.0, 93.77], [97.0, 98.22], [100.0, 111.13], [112.0, 114.15], [122.0, 122.49]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 39.77, 0.0, 62.89, 72.46, 93.91, 82.61, 99.84, 65.32, 0.0, 0.0, 74.76, 0.0, 49.04, 0.0, 0.0, 64.29, 37.59, 0.0], "audiomae_on_audioset": [null, [["speech", 35.02], ["sidetone", 16.58], ["radio", 12.68]], null, null, null, null, null, null, null, null, null, null, null, [["effects unit", 29.28], ["noise", 17.2], ["music", 12.18]], null, null, null, [["mechanisms", 32.89], ["gears", 27.72], ["speech", 13.22]], null], "duration": [0.48, 2.9, 0.12, 10.21, 3.18, 13.94, 12.98, 8.45, 4.8, 1.26, 1.22, 8.64, 1.08, 5.83, 0.77, 1.22, 11.13, 2.15, 0.49]} \ No newline at end of file diff --git a/annotations_1/E1u3lo2EsMg_filtered.json b/annotations_1/E1u3lo2EsMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a9e8a6cf4ce00cddac04992c1c80282cb06318f --- /dev/null +++ b/annotations_1/E1u3lo2EsMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 20.44], [21.0, 23.72], [24.0, 26.96], [29.0, 30.23], [36.0, 37.45], [39.0, 39.34], [43.0, 44.27], [45.0, 48.19], [51.0, 51.51], [55.0, 56.67], [57.0, 60.71], [62.0, 63.09], [69.0, 71.32], [73.0, 73.79], [76.0, 76.57], [77.0, 77.04], [88.0, 89.29], [91.0, 92.69], [97.0, 97.28], [118.0, 119.38], [121.0, 121.61], [127.0, 127.25], [139.0, 142.43], [143.0, 144.61], [145.0, 147.39], [148.0, 148.78], [153.0, 159.88]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [76.37, 49.82, 46.68, 0.0, 0.0, 0.0, 0.0, 53.72, 0.0, 0.0, 81.35, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 0.0, 37.81, 0.0, 37.55], "audiomae_on_audioset": [null, [["sidetone", 85.87], ["speech", 6.81], ["hum", 1.21]], [["speech", 35.51], ["fly, housefly", 11.88], ["bee, wasp, etc.", 6.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.92], ["crack", 10.6], ["arrow", 4.41]], null, [["speech", 20.7], ["thunk", 20.05], ["thump, thud", 15.48]]], "duration": [8.44, 2.72, 2.96, 1.23, 1.45, 0.34, 1.27, 3.19, 0.51, 1.67, 3.71, 1.09, 2.32, 0.79, 0.57, 0.04, 1.29, 1.69, 0.28, 1.38, 0.61, 0.25, 3.43, 1.61, 2.39, 0.78, 6.88]} \ No newline at end of file diff --git a/annotations_1/E2WZXK79_d0_filtered.json b/annotations_1/E2WZXK79_d0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8bda2f24e043dc16bfccf5412ff473204798515 --- /dev/null +++ b/annotations_1/E2WZXK79_d0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.12], [10.0, 13.05], [18.0, 21.71], [24.0, 24.76], [26.0, 27.75], [29.0, 28.97], [31.0, 32.31], [34.0, 34.69], [37.0, 44.27], [49.0, 55.21], [57.0, 67.54], [70.0, 77.97], [80.0, 80.38], [81.0, 82.21], [85.0, 87.24], [90.0, 143.14], [144.0, 144.46], [147.0, 177.65]], "keep_status": [false, false, true, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false], "silence_prob": [84.07, 58.72, 30.2, 0.0, 0.0, 0.0, 0.0, 0.0, 36.62, 34.58, 31.07, 34.11, 0.0, 0.0, 31.99, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["explosion", 50.43], ["burst, pop", 11.78], ["eruption", 6.96]], null, null, null, null, null, [["music", 61.52], ["musical instrument", 5.13], ["synthesizer", 4.27]], [["music", 56.19], ["musical instrument", 8.55], ["drum", 3.34]], [["music", 40.36], ["tabla", 15.57], ["musical instrument", 7.75]], [["music", 41.29], ["speech", 38.46], ["tabla", 3.44]], null, null, [["music", 22.97], ["boing", 9.12], ["explosion", 8.55]], null, null, null], "duration": [2.12, 3.05, 3.71, 0.76, 1.75, -0.03, 1.31, 0.69, 7.27, 6.21, 10.54, 7.97, 0.38, 1.21, 2.24, 53.14, 0.46, 30.65]} \ No newline at end of file diff --git a/annotations_1/E2wr_tRqNZQ_filtered.json b/annotations_1/E2wr_tRqNZQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60bc5690a397b280ed5cb5658fcd95edf5af3d9d --- /dev/null +++ b/annotations_1/E2wr_tRqNZQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.4], [33.0, 34.3], [73.0, 74.24], [75.0, 78.0], [81.0, 80.82], [84.0, 84.65], [113.0, 113.37], [125.0, 125.66]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.73, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 44.72], ["speech", 6.32], ["hum", 5.84]], null, null, null, null], "duration": [0.4, 1.3, 1.24, 3.0, -0.18, 0.65, 0.37, 0.66]} \ No newline at end of file diff --git a/annotations_1/E3yX8lT2UAI_filtered.json b/annotations_1/E3yX8lT2UAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25e7c633992e5affebb59f59beddc10c328fa390 --- /dev/null +++ b/annotations_1/E3yX8lT2UAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.33], [18.0, 19.5], [21.0, 21.22], [27.0, 38.18]], "keep_status": [true, false, false, true], "silence_prob": [29.71, 0.0, 0.0, 31.52], "audiomae_on_audioset": [[["mains hum", 13.88], ["vehicle", 12.48], ["radio", 12.09]], null, null, [["music", 22.58], ["toot", 11.64], ["synthesizer", 6.26]]], "duration": [4.33, 1.5, 0.22, 11.18]} \ No newline at end of file diff --git a/annotations_1/E4rFRdmeWqU_filtered.json b/annotations_1/E4rFRdmeWqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19d85ec5ded6bd8ce0f16b75696375d086dcb419 --- /dev/null +++ b/annotations_1/E4rFRdmeWqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.14], [9.0, 10.07], [11.0, 10.88], [26.0, 26.59], [27.0, 28.04], [29.0, 30.96], [32.0, 31.7], [36.0, 36.63], [38.0, 38.53], [40.0, 41.08], [43.0, 43.83], [45.0, 47.33], [49.0, 49.11], [50.0, 52.24], [53.0, 54.82], [56.0, 56.59], [59.0, 60.22], [61.0, 61.06], [62.0, 65.6], [67.0, 68.05], [70.0, 71.32], [79.0, 79.44], [80.0, 80.77], [83.0, 83.78], [85.0, 86.24], [87.0, 88.01], [90.0, 93.87], [96.0, 102.64], [111.0, 112.31], [113.0, 114.71], [116.0, 122.67], [124.0, 125.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.79, 0.0, 38.25, 0.0, 0.0, 0.0, 0.0, 29.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.08, 29.42, 0.0, 0.0, 29.26, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["rumble", 11.01], ["vehicle", 9.37], ["hum", 6.08]], null, [["speech", 46.04], ["mains hum", 9.17], ["bee, wasp, etc.", 7.92]], null, null, null, null, [["music", 73.49], ["synthesizer", 4.38], ["electronic music", 4.21]], null, null, null, null, null, null, null, [["music", 54.12], ["throbbing", 17.86], ["hum", 4.96]], [["music", 73.29], ["speech", 6.38], ["cacophony", 6.05]], null, null, [["music", 67.69], ["throbbing", 9.42], ["hum", 5.05]], null], "duration": [1.14, 1.07, -0.12, 0.59, 1.04, 1.96, -0.3, 0.63, 0.53, 1.08, 0.83, 2.33, 0.11, 2.24, 1.82, 0.59, 1.22, 0.06, 3.6, 1.05, 1.32, 0.44, 0.77, 0.78, 1.24, 1.01, 3.87, 6.64, 1.31, 1.71, 6.67, 1.0]} \ No newline at end of file diff --git a/annotations_1/E67jk75CRWM_filtered.json b/annotations_1/E67jk75CRWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3511cc6675f0f66f5804078a1913e93e6cc9d01 --- /dev/null +++ b/annotations_1/E67jk75CRWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.55], [6.0, 6.18], [7.0, 7.2], [10.0, 76.76], [79.0, 80.08], [81.0, 83.51], [85.0, 96.87], [99.0, 99.82], [104.0, 105.0], [105.0, 108.33], [110.0, 111.77], [113.0, 120.77], [124.0, 125.69], [129.0, 150.7], [151.0, 151.14], [151.0, 155.34], [157.0, 157.81], [162.0, 166.78], [167.0, 168.42], [170.0, 174.88], [176.0, 175.86]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, true, false, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 48.87, 29.99, 0.0, 0.0, 29.58, 0.0, 28.95, 0.0, 29.22, 0.0, 28.85, 0.0, 28.84, 0.0, 42.67, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["creak", 28.99], ["crushing", 26.26], ["heart sounds, heartbeat", 6.59]], [["music", 44.19], ["mains hum", 10.89], ["hum", 10.84]], null, null, [["speech", 35.03], ["music", 20.78], ["sonar", 9.57]], null, [["music", 25.75], ["speech", 22.52], ["throbbing", 17.17]], null, [["speech", 35.28], ["music", 13.84], ["hum", 13.56]], null, [["music", 29.74], ["speech", 18.2], ["hum", 11.84]], null, [["music", 47.04], ["reverberation", 7.34], ["breaking", 4.93]], null, [["mains hum", 31.54], ["music", 20.79], ["hum", 20.18]], null], "duration": [0.55, 0.18, 0.2, 66.76, 1.08, 2.51, 11.87, 0.82, 1.0, 3.33, 1.77, 7.77, 1.69, 21.7, 0.14, 4.34, 0.81, 4.78, 1.42, 4.88, -0.14]} \ No newline at end of file diff --git a/annotations_1/E6AQQLVI68g_filtered.json b/annotations_1/E6AQQLVI68g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa521501adfad9f51e7ceae418d43fe3f3110f93 --- /dev/null +++ b/annotations_1/E6AQQLVI68g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.64], [38.0, 96.11], [96.0, 143.51], [146.0, 151.51], [152.0, 152.58], [153.0, 154.03], [155.0, 155.58], [156.0, 156.69], [160.0, 176.55]], "keep_status": [false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 34.73, 0.0, 0.0, 0.0, 0.0, 37.66], "audiomae_on_audioset": [null, null, null, [["music", 27.21], ["whack, thwack", 24.9], ["speech", 4.39]], null, null, null, null, [["music", 28.77], ["theremin", 11.67], ["whale vocalization", 11.56]]], "duration": [0.64, 58.11, 47.51, 5.51, 0.58, 1.03, 0.58, 0.69, 16.55]} \ No newline at end of file diff --git a/annotations_1/E6AYVGKx6Es_filtered.json b/annotations_1/E6AYVGKx6Es_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49cc346203068f3a3534d878e9e713ebffb7bbcd --- /dev/null +++ b/annotations_1/E6AYVGKx6Es_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [4.0, 4.67], [8.0, 12.78], [14.0, 14.81], [16.0, 20.9], [21.0, 46.45], [49.0, 52.52], [53.0, 55.44], [57.0, 57.38], [59.0, 60.37], [61.0, 62.78], [64.0, 64.25], [66.0, 66.99], [68.0, 70.66], [73.0, 78.68], [82.0, 96.43], [97.0, 98.63], [100.0, 107.97], [121.0, 124.58], [127.0, 130.76], [131.0, 132.51]], "keep_status": [false, false, true, false, false, false, true, true, false, false, false, false, false, true, true, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 29.69, 0.0, 33.82, 33.58, 29.72, 41.5, 0.0, 0.0, 0.0, 0.0, 0.0, 38.08, 34.46, 28.92, 0.0, 30.0, 40.77, 48.74, 0.0], "audiomae_on_audioset": [null, null, [["music", 21.68], ["speech", 14.32], ["hum", 12.19]], null, [["music", 57.04], ["theremin", 16.07], ["synthesizer", 7.08]], [["music", 65.6], ["theremin", 13.79], ["synthesizer", 3.16]], [["music", 36.66], ["mains hum", 18.09], ["hum", 13.03]], [["theremin", 22.65], ["music", 21.42], ["whale vocalization", 8.98]], null, null, null, null, null, [["music", 47.24], ["speech", 14.42], ["theremin", 7.14]], [["hum", 26.21], ["music", 19.01], ["mains hum", 7.87]], [["music", 27.31], ["throbbing", 11.48], ["livestock, farm animals, working animals", 11.09]], null, [["speech", 27.1], ["animal", 20.81], ["hum", 20.07]], [["mains hum", 45.46], ["hum", 43.21], ["creak", 3.01]], [["telephone", 61.02], ["telephone bell ringing", 12.55], ["telephone dialing, dtmf", 7.94]], null], "duration": [0.64, 0.67, 4.78, 0.81, 4.9, 25.45, 3.52, 2.44, 0.38, 1.37, 1.78, 0.25, 0.99, 2.66, 5.68, 14.43, 1.63, 7.97, 3.58, 3.76, 1.51]} \ No newline at end of file diff --git a/annotations_1/E7fMOxGw-dw_filtered.json b/annotations_1/E7fMOxGw-dw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd356946fdc6528ce955681d647207fa49f04b88 --- /dev/null +++ b/annotations_1/E7fMOxGw-dw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.17], [3.0, 3.37], [6.0, 6.56], [12.0, 16.31], [19.0, 19.43], [20.0, 20.19], [22.0, 28.95], [44.0, 44.39], [46.0, 46.3], [49.0, 49.33], [49.0, 49.74], [60.0, 60.83], [82.0, 85.06], [85.0, 86.26], [104.0, 122.64], [128.0, 131.06], [131.0, 132.51], [142.0, 151.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [55.11, 0.0, 0.0, 40.68, 0.0, 0.0, 42.72, 0.0, 0.0, 0.0, 0.0, 0.0, 39.72, 0.0, 52.1, 85.17, 0.0, 37.23], "audiomae_on_audioset": [null, null, null, [["music", 52.65], ["speech", 17.14], ["brass instrument", 8.04]], null, null, [["fart", 35.1], ["speech", 27.2], ["music", 17.79]], null, null, null, null, null, [["speech", 25.35], ["insect", 12.6], ["fly, housefly", 11.01]], null, null, null, null, [["hum", 19.86], ["speech", 16.55], ["throbbing", 16.45]]], "duration": [2.17, 0.37, 0.56, 4.31, 0.43, 0.19, 6.95, 0.39, 0.3, 0.33, 0.74, 0.83, 3.06, 1.26, 18.64, 3.06, 1.51, 9.04]} \ No newline at end of file diff --git a/annotations_1/E7i4pNsqnls_filtered.json b/annotations_1/E7i4pNsqnls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d727422205827da495b6a6f29fe12a853f8eaf3e --- /dev/null +++ b/annotations_1/E7i4pNsqnls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.37], [12.0, 12.43], [13.0, 13.54], [16.0, 16.48], [19.0, 19.79], [26.0, 27.18], [28.0, 28.07], [29.0, 29.44], [30.0, 31.92], [33.0, 35.41], [36.0, 36.39], [39.0, 39.07], [50.0, 61.57], [63.0, 66.26], [67.0, 68.1], [76.0, 77.87], [79.0, 99.91], [100.0, 114.37], [118.0, 132.65], [137.0, 157.38], [158.0, 160.39], [163.0, 163.63], [165.0, 165.59], [167.0, 168.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.1, 0.0, 0.0, 44.49, 59.15, 0.0, 0.0, 33.36, 31.38, 30.1, 28.81, 35.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.08], ["hum", 9.27], ["mains hum", 8.34]], null, null, null, [["music", 79.56], ["throbbing", 4.42], ["electronic music", 4.33]], [["music", 48.73], ["speech", 20.55], ["didgeridoo", 13.09]], [["music", 45.24], ["didgeridoo", 31.45], ["percussion", 6.6]], [["music", 50.31], ["didgeridoo", 16.85], ["electronic music", 7.01]], [["music", 26.72], ["hum", 20.01], ["mains hum", 16.91]], null, null, null], "duration": [1.37, 0.43, 0.54, 0.48, 0.79, 1.18, 0.07, 0.44, 1.92, 2.41, 0.39, 0.07, 11.57, 3.26, 1.1, 1.87, 20.91, 14.37, 14.65, 20.38, 2.39, 0.63, 0.59, 1.45]} \ No newline at end of file diff --git a/annotations_1/E8x4G2WceJA_filtered.json b/annotations_1/E8x4G2WceJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73542e1065fce319fc61aa9bc8b08beebd5b4805 --- /dev/null +++ b/annotations_1/E8x4G2WceJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.79], [17.0, 16.6], [20.0, 19.92], [30.0, 30.18], [31.0, 31.41], [35.0, 36.51], [38.0, 39.39], [41.0, 41.44], [48.0, 47.98], [53.0, 54.03], [56.0, 56.57], [60.0, 60.78], [66.0, 66.51], [69.0, 69.18], [72.0, 72.86], [77.0, 76.74], [79.0, 83.0], [83.0, 83.74], [84.0, 85.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.81, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.54], ["didgeridoo", 33.68], ["theremin", 2.73]], null, null], "duration": [1.79, -0.4, -0.08, 0.18, 0.41, 1.51, 1.39, 0.44, -0.02, 1.03, 0.57, 0.78, 0.51, 0.18, 0.86, -0.26, 4.0, 0.74, 1.58]} \ No newline at end of file diff --git a/annotations_1/E9B65UGKQ5o_filtered.json b/annotations_1/E9B65UGKQ5o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8121fbca80e7725f6f0f5d3a04d758f91fd3e15d --- /dev/null +++ b/annotations_1/E9B65UGKQ5o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 37.44], [39.0, 40.29], [42.0, 45.39], [51.0, 56.27], [69.0, 68.88], [70.0, 74.65], [77.0, 94.07], [102.0, 104.36], [109.0, 109.51], [111.0, 124.17]], "keep_status": [true, false, false, true, false, false, true, true, false, false], "silence_prob": [43.79, 0.0, 87.74, 44.78, 0.0, 47.16, 48.39, 47.12, 0.0, 43.56], "audiomae_on_audioset": [[["music", 29.2], ["hum", 14.42], ["throbbing", 6.16]], null, null, [["livestock, farm animals, working animals", 30.31], ["music", 14.22], ["hum", 8.85]], null, [["music", 32.63], ["hum", 19.11], ["throbbing", 18.35]], [["music", 22.83], ["hum", 18.05], ["speech", 15.98]], [["music", 45.37], ["buzz", 8.27], ["didgeridoo", 2.95]], null, [["music", 30.87], ["throbbing", 30.24], ["hum", 13.1]]], "duration": [2.44, 1.29, 3.39, 5.27, -0.12, 4.65, 17.07, 2.36, 0.51, 13.17]} \ No newline at end of file diff --git a/annotations_1/E9pB6_WUR-U_filtered.json b/annotations_1/E9pB6_WUR-U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bd923c75a147a89dee898b9097a90366a31d45f --- /dev/null +++ b/annotations_1/E9pB6_WUR-U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 63.44], [65.0, 102.84], [104.0, 104.33], [105.0, 112.18], [113.0, 113.32], [114.0, 127.25], [130.0, 179.34], [181.0, 181.43], [183.0, 194.81]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.25, 0.0, 30.57, 0.0, 0.0, 30.04], "audiomae_on_audioset": [null, null, null, [["music", 67.5], ["throbbing", 9.41], ["hum", 4.44]], null, [["music", 44.27], ["throbbing", 24.97], ["hum", 13.17]], null, null, [["hum", 34.05], ["music", 31.98], ["mains hum", 12.13]]], "duration": [61.44, 37.84, 0.33, 7.18, 0.32, 13.25, 49.34, 0.43, 11.81]} \ No newline at end of file diff --git a/annotations_1/EAd7cMSm4Ng_filtered.json b/annotations_1/EAd7cMSm4Ng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36cbdb3609bf43ea37ca0fff890201cbd8e43872 --- /dev/null +++ b/annotations_1/EAd7cMSm4Ng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.21], [4.0, 5.09], [11.0, 12.99], [14.0, 14.99], [16.0, 18.03], [18.0, 20.07], [21.0, 22.05], [28.0, 29.4], [31.0, 31.7], [34.0, 36.19], [38.0, 43.11], [49.0, 50.7], [53.0, 55.81], [57.0, 58.58], [59.0, 74.02], [77.0, 80.27], [84.0, 87.37], [95.0, 96.08], [98.0, 98.83], [108.0, 109.24], [111.0, 112.73]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.73, 31.1, 0.0, 0.0, 0.0, 53.97, 49.13, 0.0, 39.94, 0.0, 43.56, 43.58, 51.88, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 55.87], ["music", 15.73], ["crow", 4.0]], [["theremin", 27.95], ["music", 23.64], ["whale vocalization", 17.96]], null, null, null, null, [["speech", 38.35], ["music", 27.99], ["singing bowl", 4.99]], null, [["music", 23.47], ["speech", 9.5], ["gong", 5.6]], null, [["music", 51.23], ["speech", 9.79], ["ambient music", 5.32]], [["music", 63.09], ["synthesizer", 8.78], ["musical instrument", 2.53]], null, null, null, null, null], "duration": [1.21, 1.09, 1.99, 0.99, 2.03, 2.07, 1.05, 1.4, 0.7, 2.19, 5.11, 1.7, 2.81, 1.58, 15.02, 3.27, 3.37, 1.08, 0.83, 1.24, 1.73]} \ No newline at end of file diff --git a/annotations_1/EBLS3sCB4rk_filtered.json b/annotations_1/EBLS3sCB4rk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95219f8729c1b3b356f6c9a47b049b5125b64edb --- /dev/null +++ b/annotations_1/EBLS3sCB4rk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.29], [2.0, 3.28], [4.0, 8.53], [11.0, 11.25], [11.0, 37.32], [41.0, 42.06], [43.0, 81.31], [83.0, 83.37], [87.0, 87.44], [89.0, 88.94], [94.0, 95.03], [96.0, 99.13], [105.0, 111.5], [116.0, 117.83], [119.0, 119.31], [120.0, 121.74], [123.0, 127.33], [129.0, 129.46], [130.0, 130.84], [132.0, 132.11], [132.0, 133.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.94, 0.0, 32.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.26, 68.67, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 60.25], ["speech", 10.47], ["sidetone", 4.02]], null, [["music", 51.79], ["speech", 17.23], ["cattle, bovinae", 3.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 1.28, 4.53, 0.25, 26.32, 1.06, 38.31, 0.37, 0.44, -0.06, 1.03, 3.13, 6.5, 1.83, 0.31, 1.74, 4.33, 0.46, 0.84, 0.11, 1.03]} \ No newline at end of file diff --git a/annotations_1/ECDKjStq8Eg_filtered.json b/annotations_1/ECDKjStq8Eg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22169c3e7383118e99511a79aec853decc778092 --- /dev/null +++ b/annotations_1/ECDKjStq8Eg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 48.61], [51.0, 57.32], [60.0, 68.94], [75.0, 92.99], [95.0, 132.73]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 30.31, 29.41, 30.58, 0.0], "audiomae_on_audioset": [null, [["speech", 44.57], ["music", 34.68], ["hum", 4.24]], [["music", 40.28], ["animal", 4.72], ["hum", 4.58]], [["music", 53.08], ["speech", 18.91], ["hum", 4.67]], null], "duration": [46.61, 6.32, 8.94, 17.99, 37.73]} \ No newline at end of file diff --git a/annotations_1/ECirl_sSf-M_filtered.json b/annotations_1/ECirl_sSf-M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..216c762b546441803826d741d79bf8bc460b983d --- /dev/null +++ b/annotations_1/ECirl_sSf-M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [8.0, 8.6], [10.0, 10.27], [16.0, 18.23], [21.0, 21.0], [22.0, 23.38], [29.0, 32.73], [34.0, 41.1], [42.0, 43.46], [45.0, 48.24], [51.0, 56.52], [57.0, 59.39], [61.0, 72.03], [76.0, 76.76], [87.0, 89.02], [92.0, 93.07], [94.0, 96.84], [100.0, 100.16], [101.0, 104.6], [106.0, 111.03], [111.0, 112.13], [114.0, 115.43], [116.0, 117.44], [118.0, 119.31], [124.0, 126.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.98, 100.0, 0.0, 99.98, 100.0, 100.0, 99.99, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 0.6, 0.27, 2.23, 0.0, 1.38, 3.73, 7.1, 1.46, 3.24, 5.52, 2.39, 11.03, 0.76, 2.02, 1.07, 2.84, 0.16, 3.6, 5.03, 1.13, 1.43, 1.44, 1.31, 2.44]} \ No newline at end of file diff --git a/annotations_1/EDq1QNZ_JJo_filtered.json b/annotations_1/EDq1QNZ_JJo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..084b367dc39a32d55aa41cf8d4afc5a6d3bcd840 --- /dev/null +++ b/annotations_1/EDq1QNZ_JJo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.67], [5.0, 4.9], [15.0, 44.42], [47.0, 49.01], [49.0, 50.08], [54.0, 65.03], [67.0, 68.1], [72.0, 77.26], [78.0, 80.33], [82.0, 82.81], [84.0, 85.92], [87.0, 87.47], [89.0, 99.93], [106.0, 106.83], [109.0, 111.03], [112.0, 113.78], [114.0, 117.8], [118.0, 119.77], [121.0, 121.09], [122.0, 130.15], [132.0, 135.11], [136.0, 136.98], [138.0, 145.17], [147.0, 148.24], [149.0, 153.28], [157.0, 157.01], [159.0, 161.0], [164.0, 165.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.32, 67.13, 0.0, 46.64, 0.0, 37.08, 51.07, 0.0, 0.0, 0.0, 60.6, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 76.53, 98.01, 0.0, 47.5, 0.0, 78.55, 0.0, 99.73, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 37.88], ["speech", 19.46], ["theremin", 15.39]], null, [["whale vocalization", 50.65], ["speech", 16.47], ["music", 9.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.95], ["fly, housefly", 9.17], ["moo", 6.7]], null, null, null, null, null], "duration": [0.67, -0.1, 29.42, 2.01, 1.08, 11.03, 1.1, 5.26, 2.33, 0.81, 1.92, 0.47, 10.93, 0.83, 2.03, 1.78, 3.8, 1.77, 0.09, 8.15, 3.11, 0.98, 7.17, 1.24, 4.28, 0.01, 2.0, 1.42]} \ No newline at end of file diff --git a/annotations_1/EDywdraYOBA_filtered.json b/annotations_1/EDywdraYOBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36c63eceabaea6f5024a61b352c7a9f5a57fb1bc --- /dev/null +++ b/annotations_1/EDywdraYOBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[55.0, 55.54], [62.0, 62.6], [63.0, 64.86], [69.0, 69.55], [72.0, 71.79], [102.0, 103.15], [103.0, 103.3], [106.0, 106.27], [107.0, 107.27], [121.0, 121.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 0.6, 1.86, 0.55, -0.21, 1.15, 0.3, 0.27, 0.27, 0.56]} \ No newline at end of file diff --git a/annotations_1/EEaUjfxQQFI_filtered.json b/annotations_1/EEaUjfxQQFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd5da069069d2b73544feb810043c7815a1ed539 --- /dev/null +++ b/annotations_1/EEaUjfxQQFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 47.06], [48.0, 49.4], [51.0, 51.14], [52.0, 55.34], [56.0, 63.91], [65.0, 65.6], [66.0, 72.35], [73.0, 74.82], [79.0, 80.18], [82.0, 83.15], [84.0, 86.98], [89.0, 107.16], [112.0, 143.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [60.05, 0.0, 0.0, 60.79, 63.1, 0.0, 60.14, 0.0, 0.0, 0.0, 45.43, 46.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 28.97], ["hum", 8.87], ["mains hum", 7.21]], [["music", 39.39], ["mains hum", 18.45], ["hum", 17.67]], null], "duration": [4.06, 1.4, 0.14, 3.34, 7.91, 0.6, 6.35, 1.82, 1.18, 1.15, 2.98, 18.16, 31.94]} \ No newline at end of file diff --git a/annotations_1/EFtdTsawXK0_filtered.json b/annotations_1/EFtdTsawXK0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55f8ce531541a606d35a1179ef7d33b41c99aedf --- /dev/null +++ b/annotations_1/EFtdTsawXK0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.73], [7.0, 6.76], [7.0, 6.81], [12.0, 17.59], [32.0, 35.24], [36.0, 40.29], [41.0, 43.87], [53.0, 53.54], [55.0, 54.9], [57.0, 56.81], [60.0, 60.56], [61.0, 62.07], [63.0, 63.44], [69.0, 68.76], [80.0, 81.23], [93.0, 93.45], [94.0, 99.1], [108.0, 108.13], [109.0, 115.69], [117.0, 118.57], [120.0, 120.6], [121.0, 121.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.97, 77.7, 100.0, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.45, 0.0, 39.8, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["wail, moan", 48.79], ["insect", 12.19], ["speech", 11.24]], null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 35.62], ["cattle, bovinae", 24.49], ["moo", 19.05]], null, [["noise", 42.91], ["fart", 5.59], ["frog", 4.99]], null, null, null], "duration": [1.73, -0.24, -0.19, 5.59, 3.24, 4.29, 2.87, 0.54, -0.1, -0.19, 0.56, 1.07, 0.44, -0.24, 1.23, 0.45, 5.1, 0.13, 6.69, 1.57, 0.6, 0.51]} \ No newline at end of file diff --git a/annotations_1/EGbVLHy9Lvw_filtered.json b/annotations_1/EGbVLHy9Lvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81f5311bdd025e8d31a2f009a343b0f79bdac0af --- /dev/null +++ b/annotations_1/EGbVLHy9Lvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 19.55], [21.0, 22.33], [23.0, 24.92], [28.0, 28.51], [29.0, 29.69], [32.0, 32.44], [33.0, 34.35], [36.0, 36.24], [39.0, 39.87], [42.0, 44.68], [47.0, 47.34], [50.0, 51.46], [52.0, 52.98], [54.0, 54.62], [65.0, 65.79], [67.0, 69.9], [71.0, 71.37], [74.0, 73.74], [75.0, 76.76], [78.0, 79.42], [83.0, 84.03], [87.0, 87.66], [91.0, 92.08], [94.0, 94.98], [95.0, 96.47], [100.0, 114.47], [115.0, 119.13], [120.0, 121.19], [122.0, 122.25], [124.0, 125.27], [126.0, 126.49], [130.0, 130.4], [132.0, 139.89], [141.0, 142.59], [144.0, 144.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [75.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 40.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.29, 37.38, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.24], ["effects unit", 13.23], ["distortion", 10.93]], null, null, null, null, null, null, null, null, null, [["theremin", 69.07], ["music", 24.37], ["cello", 1.36]], [["theremin", 34.93], ["music", 33.97], ["shofar", 3.88]], null, null, null, null, null, null, null, null], "duration": [6.55, 1.33, 1.92, 0.51, 0.69, 0.44, 1.35, 0.24, 0.87, 2.68, 0.34, 1.46, 0.98, 0.62, 0.79, 2.9, 0.37, -0.26, 1.76, 1.42, 1.03, 0.66, 1.08, 0.98, 1.47, 14.47, 4.13, 1.19, 0.25, 1.27, 0.49, 0.4, 7.89, 1.59, 0.09]} \ No newline at end of file diff --git a/annotations_1/EGt-Nk6a1UQ_filtered.json b/annotations_1/EGt-Nk6a1UQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b1035a4bd571257be09d31e1a173e7097eabfee --- /dev/null +++ b/annotations_1/EGt-Nk6a1UQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.33], [35.0, 51.83], [56.0, 61.92], [62.0, 63.15], [66.0, 67.56], [70.0, 71.02], [73.0, 73.7], [77.0, 78.65], [85.0, 86.14], [88.0, 88.5], [90.0, 100.01]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [31.16, 30.11, 34.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.4], "audiomae_on_audioset": [[["music", 29.96], ["speech", 21.91], ["foghorn", 14.92]], [["whack, thwack", 31.43], ["music", 30.12], ["thunk", 12.3]], [["thunk", 50.86], ["busy signal", 8.29], ["speech", 7.18]], null, null, null, null, null, null, null, [["music", 71.53], ["animal", 1.39], ["musical instrument", 1.19]]], "duration": [9.33, 16.83, 5.92, 1.15, 1.56, 1.02, 0.7, 1.65, 1.14, 0.5, 10.01]} \ No newline at end of file diff --git a/annotations_1/EL-Zzx9ZrOw_filtered.json b/annotations_1/EL-Zzx9ZrOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a889f52353b8ae14c3549795a0fe099cc86d77b --- /dev/null +++ b/annotations_1/EL-Zzx9ZrOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.74], [18.0, 21.15], [27.0, 27.62], [29.0, 30.28], [31.0, 34.69], [39.0, 39.12], [41.0, 42.79], [84.0, 85.16], [91.0, 92.97], [94.0, 95.62], [114.0, 115.67], [117.0, 117.73], [131.0, 131.11], [142.0, 142.69], [144.0, 160.73], [164.0, 165.45], [170.0, 173.91], [174.0, 174.58], [177.0, 176.98]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [29.45, 28.96, 0.0, 0.0, 28.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.33, 0.0, 29.95, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.51], ["speech", 30.31], ["buzzer", 3.81]], [["music", 53.66], ["cacophony", 10.36], ["frog", 4.4]], null, null, [["gong", 34.15], ["sound effect", 22.13], ["music", 5.42]], null, null, null, null, null, null, null, null, null, [["music", 53.46], ["speech", 27.04], ["didgeridoo", 5.44]], null, [["fly, housefly", 30.42], ["whack, thwack", 22.55], ["mosquito", 10.01]], null, null], "duration": [7.74, 3.15, 0.62, 1.28, 3.69, 0.12, 1.79, 1.16, 1.97, 1.62, 1.67, 0.73, 0.11, 0.69, 16.73, 1.45, 3.91, 0.58, -0.02]} \ No newline at end of file diff --git a/annotations_1/EL3Ma917bug_filtered.json b/annotations_1/EL3Ma917bug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1caffbbeecf42fdcf6ffc1011ce77e6899e8658d --- /dev/null +++ b/annotations_1/EL3Ma917bug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.91], [11.0, 11.37], [17.0, 18.82], [21.0, 21.61], [24.0, 35.9], [41.0, 41.91], [46.0, 47.11], [49.0, 53.64], [55.0, 55.63], [58.0, 62.5], [63.0, 64.29], [67.0, 69.06], [71.0, 71.73], [72.0, 77.13], [79.0, 83.47], [85.0, 118.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.84, 0.0, 0.0, 34.86, 0.0, 31.0, 0.0, 34.29, 0.0, 31.5, 33.3, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 68.45], ["throbbing", 5.46], ["explosion", 3.78]], null, null, [["music", 28.78], ["hum", 22.27], ["throbbing", 20.06]], null, [["music", 37.93], ["throbbing", 30.29], ["speech", 12.67]], null, [["throbbing", 35.77], ["hum", 30.83], ["music", 13.05]], null, [["speech", 60.96], ["sidetone", 21.88], ["music", 2.72]], [["noise", 24.11], ["throbbing", 18.44], ["music", 16.44]], null], "duration": [0.91, 0.37, 1.82, 0.61, 11.9, 0.91, 1.11, 4.64, 0.63, 4.5, 1.29, 2.06, 0.73, 5.13, 4.47, 33.3]} \ No newline at end of file diff --git a/annotations_1/EMKD4L6Peto_filtered.json b/annotations_1/EMKD4L6Peto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..898ae5aaa1a3c5d2d5c2df41cf7f0d39d4321491 --- /dev/null +++ b/annotations_1/EMKD4L6Peto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.67], [6.0, 6.27], [7.0, 6.69], [7.0, 18.62], [21.0, 107.54]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.95, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 40.96], ["theremin", 33.3], ["didgeridoo", 2.38]], null], "duration": [1.67, 0.27, -0.31, 11.62, 86.54]} \ No newline at end of file diff --git a/annotations_1/ENC7ueK93Ow_filtered.json b/annotations_1/ENC7ueK93Ow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..088a3f0458bfa884cf4fdbd7899db983280967b4 --- /dev/null +++ b/annotations_1/ENC7ueK93Ow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.33], [8.0, 7.7], [11.0, 15.84], [22.0, 23.55], [26.0, 30.7], [32.0, 54.97], [58.0, 60.02], [64.0, 64.52], [68.0, 80.55], [84.0, 87.59], [88.0, 88.42], [89.0, 88.94], [91.0, 96.35], [100.0, 105.75], [108.0, 113.63], [114.0, 114.99], [116.0, 118.12], [119.0, 130.92], [133.0, 135.67], [137.0, 144.9]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, true, false, false, true], "silence_prob": [42.11, 0.0, 40.97, 0.0, 42.33, 33.78, 41.09, 0.0, 30.11, 28.99, 0.0, 0.0, 28.8, 29.63, 29.56, 0.0, 28.79, 29.2, 29.59, 29.14], "audiomae_on_audioset": [[["music", 26.86], ["speech", 22.46], ["hum", 12.02]], null, [["music", 75.29], ["didgeridoo", 11.46], ["carnatic music", 4.61]], null, [["music", 65.32], ["hum", 3.08], ["boing", 2.83]], [["music", 75.28], ["didgeridoo", 2.43], ["speech", 1.85]], [["music", 49.69], ["throbbing", 9.1], ["hum", 5.55]], null, [["music", 41.58], ["speech", 14.56], ["drum", 7.55]], [["music", 52.05], ["sidetone", 13.53], ["speech", 6.39]], null, null, [["music", 36.84], ["boing", 13.58], ["didgeridoo", 7.66]], [["music", 91.2], ["didgeridoo", 0.85], ["musical instrument", 0.61]], [["music", 76.29], ["didgeridoo", 5.67], ["singing", 2.03]], null, [["music", 54.62], ["didgeridoo", 7.34], ["sound effect", 4.44]], [["music", 82.43], ["singing", 2.02], ["musical instrument", 1.39]], [["music", 82.23], ["middle eastern music", 1.48], ["musical instrument", 1.45]], [["music", 43.11], ["speech", 13.85], ["sidetone", 11.43]]], "duration": [3.33, -0.3, 4.84, 1.55, 4.7, 22.97, 2.02, 0.52, 12.55, 3.59, 0.42, -0.06, 5.35, 5.75, 5.63, 0.99, 2.12, 11.92, 2.67, 7.9]} \ No newline at end of file diff --git a/annotations_1/EOQeU_6vbeg_filtered.json b/annotations_1/EOQeU_6vbeg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a65421ec4fd335e9291caf5135ebc66c3ef1e943 --- /dev/null +++ b/annotations_1/EOQeU_6vbeg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.27], [6.0, 6.44], [7.0, 10.91], [12.0, 14.45], [15.0, 20.85], [25.0, 25.14], [25.0, 25.83], [28.0, 55.48], [58.0, 59.09], [60.0, 60.89], [62.0, 64.05], [72.0, 73.72], [78.0, 81.16], [93.0, 93.99], [96.0, 96.36], [102.0, 114.03], [115.0, 116.46], [118.0, 139.73], [140.0, 151.33], [153.0, 154.52], [155.0, 155.87], [157.0, 157.32], [159.0, 167.0], [170.0, 175.56], [177.0, 178.23], [182.0, 185.57], [187.0, 191.96], [206.0, 232.46], [233.0, 234.89]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 40.17, 53.16, 94.66, 0.0, 0.0, 66.03, 0.0, 0.0, 74.92, 0.0, 81.71, 0.0, 0.0, 57.4, 0.0, 50.41, 46.5, 0.0, 0.0, 0.0, 57.64, 58.64, 0.0, 34.39, 30.63, 31.57, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.96], ["tick-tock", 6.24], ["clang", 5.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 52.47], ["trombone", 17.6], ["brass instrument", 9.45]], null, null, null, null, null, null, [["speech", 29.04], ["hum", 18.22], ["mains hum", 12.63]], [["crowd", 28.57], ["battle cry", 22.87], ["chant", 18.04]], [["buzz", 45.49], ["speech", 22.98], ["vehicle", 13.45]], null], "duration": [1.27, 0.44, 3.91, 2.45, 5.85, 0.14, 0.83, 27.48, 1.09, 0.89, 2.05, 1.72, 3.16, 0.99, 0.36, 12.03, 1.46, 21.73, 11.33, 1.52, 0.87, 0.32, 8.0, 5.56, 1.23, 3.57, 4.96, 26.46, 1.89]} \ No newline at end of file diff --git a/annotations_1/EOavA469Z24_filtered.json b/annotations_1/EOavA469Z24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a35c29f7012e65a5664ee6d286fc377b463f20f1 --- /dev/null +++ b/annotations_1/EOavA469Z24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.24], [13.0, 14.99], [17.0, 17.74], [21.0, 21.83], [23.0, 24.31], [26.0, 27.04], [28.0, 31.29], [35.0, 43.01], [45.0, 45.45], [49.0, 49.77], [53.0, 53.57], [60.0, 61.01], [64.0, 72.17], [76.0, 78.21], [80.0, 81.63], [83.0, 83.24], [84.0, 84.28], [86.0, 86.61], [87.0, 88.21], [109.0, 109.09], [116.0, 116.53], [117.0, 124.07], [131.0, 130.77], [132.0, 133.37], [135.0, 137.1], [138.0, 139.08], [142.0, 149.32], [153.0, 153.87], [155.0, 155.92], [158.0, 159.26], [161.0, 162.11], [163.0, 163.53], [170.0, 171.36], [173.0, 173.67], [178.0, 181.31], [182.0, 183.34], [191.0, 191.24], [193.0, 194.58], [198.0, 199.17], [200.0, 205.51], [214.0, 216.72]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true], "silence_prob": [38.25, 0.0, 0.0, 0.0, 0.0, 0.0, 35.8, 29.84, 0.0, 0.0, 0.0, 0.0, 31.9, 48.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.58, 0.0, 0.0, 28.56, 0.0, 29.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.39, 0.0, 0.0, 0.0, 0.0, 43.66, 40.68], "audiomae_on_audioset": [[["throbbing", 25.93], ["hum", 23.9], ["rumble", 12.53]], null, null, null, null, null, [["hum", 63.34], ["mains hum", 7.99], ["buzz", 4.82]], [["music", 22.42], ["hum", 15.27], ["throbbing", 6.94]], null, null, null, null, [["music", 52.69], ["hum", 15.28], ["throbbing", 9.3]], [["music", 12.68], ["speech", 10.9], ["hum", 10.49]], null, null, null, null, null, null, null, [["music", 15.53], ["rumble", 12.03], ["hum", 10.69]], null, null, [["speech", 23.86], ["vehicle", 9.06], ["rumble", 4.24]], null, [["hum", 36.92], ["mains hum", 30.13], ["speech", 12.73]], null, null, null, null, null, null, null, [["music", 29.33], ["gong", 10.76], ["rumble", 6.99]], null, null, null, null, [["speech", 25.64], ["hum", 15.92], ["rumble", 10.92]], [["speech", 38.69], ["rumble", 7.82], ["music", 5.89]]], "duration": [2.24, 1.99, 0.74, 0.83, 1.31, 1.04, 3.29, 8.01, 0.45, 0.77, 0.57, 1.01, 8.17, 2.21, 1.63, 0.24, 0.28, 0.61, 1.21, 0.09, 0.53, 7.07, -0.23, 1.37, 2.1, 1.08, 7.32, 0.87, 0.92, 1.26, 1.11, 0.53, 1.36, 0.67, 3.31, 1.34, 0.24, 1.58, 1.17, 5.51, 2.72]} \ No newline at end of file diff --git a/annotations_1/EOyAHaO7lwA_filtered.json b/annotations_1/EOyAHaO7lwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97837b21b2abc2add56daa6379d59b3357d588c1 --- /dev/null +++ b/annotations_1/EOyAHaO7lwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.68], [3.0, 3.69], [9.0, 13.41], [14.0, 18.59], [20.0, 21.12], [22.0, 22.64], [24.0, 23.84], [31.0, 33.24], [35.0, 36.56], [37.0, 39.78], [46.0, 46.85], [49.0, 49.35], [50.0, 51.78], [53.0, 53.37], [56.0, 56.4], [57.0, 57.74], [67.0, 68.15], [70.0, 70.9], [73.0, 72.98], [79.0, 82.19], [85.0, 86.71], [88.0, 89.43], [92.0, 93.78], [95.0, 105.41], [106.0, 112.31], [117.0, 120.68], [129.0, 130.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 79.76, 63.21, 0.0, 0.0, 0.0, 53.34, 0.0, 86.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 96.42, 42.37, 63.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.12], ["sidetone", 26.71], ["hum", 7.02]], null, null], "duration": [0.68, 0.69, 4.41, 4.59, 1.12, 0.64, -0.16, 2.24, 1.56, 2.78, 0.85, 0.35, 1.78, 0.37, 0.4, 0.74, 1.15, 0.9, -0.02, 3.19, 1.71, 1.43, 1.78, 10.41, 6.31, 3.68, 1.06]} \ No newline at end of file diff --git a/annotations_1/EPa8iQyK5mQ_filtered.json b/annotations_1/EPa8iQyK5mQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ed29a0b61583a4def103db7ace98619c02b9542 --- /dev/null +++ b/annotations_1/EPa8iQyK5mQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.44], [4.0, 27.95], [30.0, 31.04], [40.0, 40.68], [45.0, 45.79], [49.0, 49.59], [54.0, 54.09], [58.0, 58.73], [63.0, 64.03], [67.0, 68.25], [75.0, 75.79], [91.0, 92.5], [97.0, 100.13]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [30.6, 29.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.26], "audiomae_on_audioset": [[["speech", 52.7], ["vehicle", 19.08], ["aircraft", 3.92]], [["eruption", 21.35], ["explosion", 13.84], ["vehicle", 7.48]], null, null, null, null, null, null, null, null, null, null, [["sidetone", 46.07], ["speech", 8.28], ["radio", 7.37]]], "duration": [2.44, 23.95, 1.04, 0.68, 0.79, 0.59, 0.09, 0.73, 1.03, 1.25, 0.79, 1.5, 3.13]} \ No newline at end of file diff --git a/annotations_1/EPj1eq1csm4_filtered.json b/annotations_1/EPj1eq1csm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d74dfdda2e1b96809491c7b1b78135f3d7d127bd --- /dev/null +++ b/annotations_1/EPj1eq1csm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 56.76], [58.0, 95.81], [102.0, 102.73], [107.0, 126.79], [130.0, 166.28]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.32, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 53.0], ["quack", 4.75], ["rumble", 3.15]], null], "duration": [42.76, 37.81, 0.73, 19.79, 36.28]} \ No newline at end of file diff --git a/annotations_1/EQWtaLTOwCw_filtered.json b/annotations_1/EQWtaLTOwCw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d91522d698ddabf78b73c67165740c3126c7f726 --- /dev/null +++ b/annotations_1/EQWtaLTOwCw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[100.0, 109.44], [112.0, 123.87], [124.0, 197.33], [199.0, 249.99], [253.0, 269.54], [270.0, 269.94], [270.0, 270.19]], "keep_status": [true, true, false, false, false, false, false], "silence_prob": [32.88, 29.59, 0.0, 0.0, 30.48, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 34.04], ["music", 12.03], ["livestock, farm animals, working animals", 9.14]], [["livestock, farm animals, working animals", 40.56], ["cattle, bovinae", 7.39], ["smash, crash", 7.34]], null, null, [["music", 53.2], ["hum", 14.04], ["mains hum", 10.47]], null, null], "duration": [9.44, 11.87, 73.33, 50.99, 16.54, -0.06, 0.19]} \ No newline at end of file diff --git a/annotations_1/EQqdhMcUSAw_filtered.json b/annotations_1/EQqdhMcUSAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01d011c5c4ba9c8be199c39b3fef420471e11183 --- /dev/null +++ b/annotations_1/EQqdhMcUSAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [8.0, 8.51], [12.0, 12.7], [14.0, 14.62], [21.0, 21.37], [23.0, 23.94], [30.0, 31.99], [33.0, 33.86], [35.0, 36.78], [38.0, 65.6], [67.0, 103.65], [108.0, 135.78], [139.0, 152.44], [153.0, 153.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.35, 0.0, 28.82, 28.79, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 26.86], ["music", 25.16], ["throbbing", 24.55]], null, [["music", 29.32], ["speech", 20.4], ["whack, thwack", 5.86]], [["music", 34.95], ["whack, thwack", 8.37], ["smash, crash", 8.19]], null], "duration": [0.5, 0.51, 0.7, 0.62, 0.37, 0.94, 1.99, 0.86, 1.78, 27.6, 36.65, 27.78, 13.44, 0.71]} \ No newline at end of file diff --git a/annotations_1/ERlyrvQbqP8_filtered.json b/annotations_1/ERlyrvQbqP8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89919e918479641b2d6e95507c26ed15f975d1a2 --- /dev/null +++ b/annotations_1/ERlyrvQbqP8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.09], [16.0, 19.08], [21.0, 21.73], [26.0, 30.7], [32.0, 33.44], [35.0, 35.18], [38.0, 38.13], [39.0, 40.27], [41.0, 42.72], [44.0, 54.95], [55.0, 57.32], [58.0, 58.77], [59.0, 59.63], [61.0, 60.98], [62.0, 61.99], [64.0, 82.71], [84.0, 85.38], [88.0, 90.42], [91.0, 103.47], [104.0, 104.52], [107.0, 107.43], [111.0, 111.65], [113.0, 114.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.28, 99.59, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 76.7, 0.0, 0.0, 0.0, 0.0, 78.21, 0.0, 55.67, 41.32, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.06], ["glass", 8.87], ["breaking", 8.42]], null, null, null, null], "duration": [7.09, 3.08, 0.73, 4.7, 1.44, 0.18, 0.13, 1.27, 1.72, 10.95, 2.32, 0.77, 0.63, -0.02, -0.01, 18.71, 1.38, 2.42, 12.47, 0.52, 0.43, 0.65, 1.02]} \ No newline at end of file diff --git a/annotations_1/ES496lmmGcM_filtered.json b/annotations_1/ES496lmmGcM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b295c15e24749761b43b0c5a2cd37aefce77227c --- /dev/null +++ b/annotations_1/ES496lmmGcM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.47], [24.0, 25.05], [29.0, 29.54], [32.0, 32.07], [37.0, 42.28], [45.0, 45.81], [47.0, 58.08], [63.0, 65.11], [69.0, 72.47], [76.0, 86.05], [88.0, 91.1]], "keep_status": [false, false, false, false, true, false, false, true, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 44.29, 0.0, 32.78, 48.69, 41.66, 34.11, 40.21], "audiomae_on_audioset": [null, null, null, null, [["music", 46.72], ["hum", 6.24], ["thunk", 5.43]], null, [["music", 50.92], ["speech", 30.41], ["throbbing", 3.33]], [["music", 48.44], ["didgeridoo", 13.62], ["musical instrument", 5.45]], [["hum", 22.57], ["music", 14.66], ["speech", 13.87]], [["hum", 33.98], ["music", 29.17], ["mains hum", 6.5]], [["speech", 48.93], ["boing", 9.25], ["fart", 3.7]]], "duration": [0.47, 1.05, 0.54, 0.07, 5.28, 0.81, 11.08, 2.11, 3.47, 10.05, 3.1]} \ No newline at end of file diff --git a/annotations_1/ESUdqZoRu3A_filtered.json b/annotations_1/ESUdqZoRu3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c0d06a99a32ffdf7021d7b16209b689f1aab836 --- /dev/null +++ b/annotations_1/ESUdqZoRu3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.26], [6.0, 19.89], [21.0, 22.59], [23.0, 24.11], [29.0, 30.42], [32.0, 35.55], [36.0, 38.67], [39.0, 40.12], [43.0, 43.88], [45.0, 51.76], [54.0, 54.8], [58.0, 59.09], [61.0, 62.38], [71.0, 72.28], [73.0, 76.69], [79.0, 80.87], [87.0, 90.9], [94.0, 95.17], [95.0, 96.84], [97.0, 98.96], [99.0, 99.55], [101.0, 102.66], [105.0, 105.68], [112.0, 112.75], [114.0, 114.86], [116.0, 115.67], [116.0, 116.16], [127.0, 127.9], [139.0, 140.83], [149.0, 149.27], [150.0, 151.95], [153.0, 154.36], [155.0, 156.22], [165.0, 166.21], [175.0, 188.32], [189.0, 190.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.68, 89.19, 0.0, 0.0, 0.0, 37.2, 59.15, 0.0, 0.0, 90.95, 0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 82.49], ["hiccup", 3.82], ["radio", 1.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.26, 13.89, 1.59, 1.11, 1.42, 3.55, 2.67, 1.12, 0.88, 6.76, 0.8, 1.09, 1.38, 1.28, 3.69, 1.87, 3.9, 1.17, 1.84, 1.96, 0.55, 1.66, 0.68, 0.75, 0.86, -0.33, 0.16, 0.9, 1.83, 0.27, 1.95, 1.36, 1.22, 1.21, 13.32, 1.29]} \ No newline at end of file diff --git a/annotations_1/ETC85CgzTHM_filtered.json b/annotations_1/ETC85CgzTHM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5023131888ae822cbc13a6bcf6fd0310fed067d1 --- /dev/null +++ b/annotations_1/ETC85CgzTHM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 23.5], [24.0, 28.31], [31.0, 32.91], [37.0, 38.08], [40.0, 46.9], [54.0, 80.5], [81.0, 80.7], [81.0, 80.77], [81.0, 80.81], [81.0, 80.84], [83.0, 99.99], [102.0, 118.03], [118.0, 129.57], [131.0, 143.88], [148.0, 149.22]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.04, 42.74, 0.0, 0.0, 30.99, 30.18, 0.0, 0.0, 0.0, 0.0, 29.95, 29.74, 29.93, 33.78, 0.0], "audiomae_on_audioset": [[["music", 84.96], ["country", 1.01], ["musical instrument", 0.92]], [["music", 57.12], ["guitar", 5.33], ["musical instrument", 5.04]], null, null, [["music", 77.97], ["funny music", 3.04], ["swing music", 1.73]], [["music", 78.08], ["singing", 1.67], ["reggae", 1.18]], null, null, null, null, [["music", 88.55], ["country", 0.75], ["musical instrument", 0.65]], [["music", 82.69], ["reggae", 3.06], ["swing music", 1.8]], [["music", 67.14], ["reggae", 3.76], ["boing", 2.13]], [["speech", 44.33], ["cheering", 17.13], ["crowd", 14.77]], null], "duration": [4.5, 4.31, 1.91, 1.08, 6.9, 26.5, -0.3, -0.23, -0.19, -0.16, 16.99, 16.03, 11.57, 12.88, 1.22]} \ No newline at end of file diff --git a/annotations_1/ETu553EnTJM_filtered.json b/annotations_1/ETu553EnTJM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31c7048c24d375180de6de0f3560f150e4ccb7dc --- /dev/null +++ b/annotations_1/ETu553EnTJM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.69], [16.0, 17.14], [26.0, 26.52], [28.0, 28.7], [33.0, 33.99], [43.0, 43.29], [44.0, 45.47], [57.0, 58.41], [65.0, 67.44], [71.0, 70.83], [73.0, 75.47], [82.0, 83.25], [87.0, 89.5], [92.0, 94.22], [98.0, 98.96], [103.0, 103.98], [106.0, 128.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.72, 0.0, 39.41, 0.0, 39.6, 74.92, 0.0, 0.0, 33.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 42.48], ["noise", 7.7], ["electronic music", 7.36]], null, [["music", 40.41], ["musical instrument", 7.42], ["noise", 5.14]], null, null, null, [["music", 66.14], ["noise", 11.61], ["synthesizer", 4.38]]], "duration": [0.69, 1.14, 0.52, 0.7, 0.99, 0.29, 1.47, 1.41, 2.44, -0.17, 2.47, 1.25, 2.5, 2.22, 0.96, 0.98, 22.58]} \ No newline at end of file diff --git a/annotations_1/ETxIJN_avuM_filtered.json b/annotations_1/ETxIJN_avuM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9a664f8d304bb2111be33955a6b5108dec72dd2 --- /dev/null +++ b/annotations_1/ETxIJN_avuM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 62.72], [66.0, 68.98], [70.0, 106.34], [107.0, 110.94], [112.0, 137.78], [145.0, 151.26], [152.0, 151.7], [152.0, 151.88], [157.0, 159.95], [164.0, 166.06], [168.0, 184.4], [184.0, 184.45]], "keep_status": [true, true, false, false, true, false, false, false, true, false, true, false], "silence_prob": [29.87, 30.92, 0.0, 33.84, 29.97, 32.26, 0.0, 0.0, 31.52, 35.91, 28.68, 0.0], "audiomae_on_audioset": [[["whack, thwack", 32.56], ["throbbing", 12.76], ["music", 12.15]], [["speech", 41.45], ["music", 14.92], ["door", 6.8]], null, [["throbbing", 46.66], ["music", 25.34], ["hum", 18.19]], [["speech", 44.28], ["music", 19.13], ["hum", 4.92]], [["music", 66.18], ["throbbing", 5.04], ["electronic music", 3.67]], null, null, [["music", 58.54], ["throbbing", 5.07], ["electronic music", 4.21]], [["music", 67.75], ["musical instrument", 8.26], ["synthesizer", 3.73]], [["speech", 22.81], ["hum", 13.88], ["music", 11.5]], null], "duration": [18.72, 2.98, 36.34, 3.94, 25.78, 6.26, -0.3, -0.12, 2.95, 2.06, 16.4, 0.45]} \ No newline at end of file diff --git a/annotations_1/EVvEtTyJYCo_filtered.json b/annotations_1/EVvEtTyJYCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26ec56da3a596d5310b71789c4e078bb036902be --- /dev/null +++ b/annotations_1/EVvEtTyJYCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 41.27], [47.0, 50.11], [53.0, 53.23], [53.0, 53.74], [58.0, 156.91], [158.0, 163.71], [169.0, 168.69], [169.0, 168.74], [169.0, 168.91]], "keep_status": [false, true, false, false, false, false, false, false, false], "silence_prob": [31.59, 30.43, 0.0, 0.0, 0.0, 40.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 34.36], ["music", 33.34], ["outside, rural or natural", 3.89]], [["music", 35.95], ["throbbing", 10.57], ["hum", 6.89]], null, null, null, [["music", 42.03], ["speech", 21.31], ["sidetone", 6.85]], null, null, null], "duration": [11.27, 3.11, 0.23, 0.74, 98.91, 5.71, -0.31, -0.26, -0.09]} \ No newline at end of file diff --git a/annotations_1/EWSHsRBP88Y_filtered.json b/annotations_1/EWSHsRBP88Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1510b8d13be92f0044e9e874f909964ec4c030b --- /dev/null +++ b/annotations_1/EWSHsRBP88Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 38.8], [43.0, 43.6], [45.0, 44.71], [47.0, 48.0], [61.0, 61.64], [69.0, 69.15], [69.0, 70.29], [78.0, 81.09], [83.0, 83.88], [85.0, 85.29], [90.0, 93.56], [95.0, 96.16], [100.0, 100.7], [101.0, 100.75], [101.0, 102.54], [103.0, 104.65], [106.0, 106.98], [108.0, 108.92], [109.0, 109.92], [111.0, 111.52], [113.0, 115.03], [119.0, 119.28], [124.0, 157.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.36, 0.0, 0.0, 49.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.83, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 19.26], ["music", 14.03], ["rumble", 11.69]], null, null, null, null, null, null, null, null, null, [["music", 40.74], ["speech", 11.09], ["whale vocalization", 9.23]], null, null], "duration": [0.8, 0.6, -0.29, 1.0, 0.64, 0.15, 1.29, 3.09, 0.88, 0.29, 3.56, 1.16, 0.7, -0.25, 1.54, 1.65, 0.98, 0.92, 0.92, 0.52, 2.03, 0.28, 33.45]} \ No newline at end of file diff --git a/annotations_1/EXUzqVIocHI_filtered.json b/annotations_1/EXUzqVIocHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85d40c586702c9dbcb1d8443ab07e7900756d285 --- /dev/null +++ b/annotations_1/EXUzqVIocHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 22.65], [27.0, 35.87], [37.0, 39.51], [43.0, 64.44], [65.0, 101.31], [103.0, 144.24], [145.0, 145.79], [146.0, 173.62], [177.0, 179.47]], "keep_status": [false, false, true, false, false, false, false, false, false], "silence_prob": [28.83, 29.11, 29.96, 29.29, 0.0, 0.0, 0.0, 29.32, 29.15], "audiomae_on_audioset": [[["speech", 51.71], ["music", 30.39], ["breaking", 1.99]], [["music", 46.98], ["hum", 17.73], ["mains hum", 14.95]], [["cacophony", 22.21], ["hum", 18.1], ["throbbing", 7.71]], [["music", 64.08], ["cacophony", 7.7], ["throbbing", 3.57]], null, null, null, [["buzz", 75.42], ["hum", 6.91], ["music", 3.73]], [["music", 47.15], ["breaking", 29.47], ["speech", 2.64]]], "duration": [17.65, 8.87, 2.51, 21.44, 36.31, 41.24, 0.79, 27.62, 2.47]} \ No newline at end of file diff --git a/annotations_1/EXwr6U_YypE_filtered.json b/annotations_1/EXwr6U_YypE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93be90f6ddeff9710f23f1c7277febe570cafff5 --- /dev/null +++ b/annotations_1/EXwr6U_YypE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.08], [7.0, 6.99], [9.0, 9.73], [11.0, 10.61], [11.0, 11.16], [16.0, 16.98], [19.0, 20.09], [21.0, 21.66], [24.0, 27.89], [28.0, 29.42], [32.0, 32.98], [33.0, 35.18], [36.0, 36.27], [38.0, 37.88], [41.0, 41.77], [44.0, 44.85], [48.0, 48.78], [51.0, 51.98], [57.0, 58.9], [60.0, 59.59], [61.0, 64.49], [77.0, 78.87], [80.0, 81.03], [82.0, 92.57], [94.0, 95.32], [97.0, 104.99], [116.0, 117.1], [127.0, 128.19], [132.0, 131.85], [140.0, 140.37], [142.0, 141.83], [142.0, 143.04], [143.0, 144.85], [145.0, 146.62], [148.0, 148.37], [149.0, 150.57], [152.0, 153.01], [154.0, 154.31], [155.0, 155.29], [156.0, 156.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 94.81, 0.0, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.08, -0.01, 0.73, -0.39, 0.16, 0.98, 1.09, 0.66, 3.89, 1.42, 0.98, 2.18, 0.27, -0.12, 0.77, 0.85, 0.78, 0.98, 1.9, -0.41, 3.49, 1.87, 1.03, 10.57, 1.32, 7.99, 1.1, 1.19, -0.15, 0.37, -0.17, 1.04, 1.85, 1.62, 0.37, 1.57, 1.01, 0.31, 0.29, 0.05]} \ No newline at end of file diff --git a/annotations_1/EYHLDJuEUoc_filtered.json b/annotations_1/EYHLDJuEUoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a684e6867f7de327276134fef2995beeead67012 --- /dev/null +++ b/annotations_1/EYHLDJuEUoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.65], [19.0, 19.16], [20.0, 22.06], [25.0, 25.64], [28.0, 36.76], [39.0, 40.86], [42.0, 41.89], [44.0, 44.52], [45.0, 46.26], [47.0, 47.75], [49.0, 53.94], [55.0, 58.6], [61.0, 61.84], [62.0, 65.65], [69.0, 70.28], [75.0, 74.71], [83.0, 83.89], [84.0, 83.93], [90.0, 90.68], [92.0, 92.99], [101.0, 102.66], [106.0, 107.06], [118.0, 120.19], [125.0, 124.88], [127.0, 129.44], [132.0, 132.48], [136.0, 137.39], [139.0, 144.17], [148.0, 164.56]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 32.88, 0.0, 32.35, 0.0, 0.0, 0.0, 0.0, 0.0, 30.76, 33.54, 0.0, 32.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.98, 0.0, 36.36, 0.0, 0.0, 30.96, 30.31], "audiomae_on_audioset": [null, null, [["music", 50.09], ["hum", 10.16], ["throbbing", 9.26]], null, [["music", 32.18], ["speech", 20.3], ["cacophony", 5.63]], null, null, null, null, null, [["music", 67.21], ["theremin", 5.92], ["throbbing", 4.93]], [["music", 39.06], ["hum", 20.21], ["theremin", 11.55]], null, [["music", 25.98], ["speech", 17.0], ["buzz", 12.66]], null, null, null, null, null, null, null, null, [["music", 61.78], ["singing", 2.52], ["chant", 1.95]], null, [["music", 22.41], ["speech", 16.34], ["sidetone", 5.05]], null, null, [["music", 43.99], ["electric shaver, electric razor", 5.79], ["speech", 4.99]], [["music", 86.11], ["mantra", 1.8], ["singing", 1.5]]], "duration": [1.65, 0.16, 2.06, 0.64, 8.76, 1.86, -0.11, 0.52, 1.26, 0.75, 4.94, 3.6, 0.84, 3.65, 1.28, -0.29, 0.89, -0.07, 0.68, 0.99, 1.66, 1.06, 2.19, -0.12, 2.44, 0.48, 1.39, 5.17, 16.56]} \ No newline at end of file diff --git a/annotations_1/EYKOpaD_s1U_filtered.json b/annotations_1/EYKOpaD_s1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c141c3233f1882b0c4028880cd076d94f11693a8 --- /dev/null +++ b/annotations_1/EYKOpaD_s1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.32], [3.0, 3.11], [4.0, 4.92], [6.0, 6.29], [8.0, 8.16], [11.0, 11.79], [18.0, 18.74], [21.0, 21.66], [23.0, 23.72], [25.0, 25.84], [29.0, 31.29], [32.0, 33.27], [76.0, 75.98], [90.0, 90.34], [98.0, 99.13], [100.0, 100.68], [125.0, 126.93], [129.0, 130.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 69.9], ["musical instrument", 4.24], ["effects unit", 3.07]], null, null, null, null, null, null, null], "duration": [0.32, 0.11, 0.92, 0.29, 0.16, 0.79, 0.74, 0.66, 0.72, 0.84, 2.29, 1.27, -0.02, 0.34, 1.13, 0.68, 1.93, 1.15]} \ No newline at end of file diff --git a/annotations_1/EYdIrPSIgio_filtered.json b/annotations_1/EYdIrPSIgio_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b880cc8d6097a844103384b1deefeca2ffc300a0 --- /dev/null +++ b/annotations_1/EYdIrPSIgio_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.48], [13.0, 13.56], [14.0, 13.63], [14.0, 43.5], [53.0, 55.75], [57.0, 59.73], [61.0, 61.25], [63.0, 70.97], [72.0, 80.7], [81.0, 87.4], [101.0, 103.37], [110.0, 114.76], [119.0, 118.52], [121.0, 123.8]], "keep_status": [false, false, false, true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.55, 87.92, 49.64, 0.0, 99.99, 34.39, 31.29, 32.05, 31.27, 0.0, 59.77], "audiomae_on_audioset": [null, null, null, [["speech", 31.77], ["whack, thwack", 15.76], ["electric shaver, electric razor", 13.7]], null, [["speech", 65.4], ["frog", 4.17], ["croak", 3.32]], null, null, [["music", 54.57], ["sidetone", 14.94], ["speech", 9.08]], [["speech", 37.67], ["hum", 13.53], ["mains hum", 12.34]], [["livestock, farm animals, working animals", 11.36], ["roaring cats (lions, tigers)", 11.12], ["moo", 9.99]], [["speech", 45.45], ["livestock, farm animals, working animals", 13.46], ["cattle, bovinae", 11.76]], null, null], "duration": [0.48, 0.56, -0.37, 29.5, 2.75, 2.73, 0.25, 7.97, 8.7, 6.4, 2.37, 4.76, -0.48, 2.8]} \ No newline at end of file diff --git a/annotations_1/E_PIi8tRcCo_filtered.json b/annotations_1/E_PIi8tRcCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0685df2989906cab6b0da957390403d23d950ee --- /dev/null +++ b/annotations_1/E_PIi8tRcCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [3.0, 3.91], [8.0, 8.6], [10.0, 11.85], [13.0, 21.78], [26.0, 30.27], [33.0, 35.34], [39.0, 44.69], [46.0, 47.76], [49.0, 50.92], [53.0, 53.33], [54.0, 54.89], [56.0, 58.24], [59.0, 61.57], [62.0, 81.24], [82.0, 82.86], [85.0, 86.61], [89.0, 90.14], [91.0, 123.55], [134.0, 133.91], [134.0, 141.79], [143.0, 145.79], [147.0, 157.4], [160.0, 168.76], [169.0, 177.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 94.37, 99.71, 87.55, 53.72, 0.0, 0.0, 0.0, 0.0, 99.99, 97.33, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 90.78, 46.09, 38.27, 37.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.4], ["ambient music", 26.61], ["electronic music", 4.48]], [["speech", 24.06], ["music", 21.79], ["ambient music", 14.09]], [["music", 37.33], ["ambient music", 18.74], ["hum", 6.41]]], "duration": [0.35, 0.91, 0.6, 1.85, 8.78, 4.27, 2.34, 5.69, 1.76, 1.92, 0.33, 0.89, 2.24, 2.57, 19.24, 0.86, 1.61, 1.14, 32.55, -0.09, 7.79, 2.79, 10.4, 8.76, 8.26]} \ No newline at end of file diff --git a/annotations_1/E_TbL7vdWGo_filtered.json b/annotations_1/E_TbL7vdWGo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e716a9288253da6763415eaaa13373ea74bc283 --- /dev/null +++ b/annotations_1/E_TbL7vdWGo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.18], [6.0, 7.92], [8.0, 7.96], [9.0, 19.63], [21.0, 24.92], [26.0, 29.44], [30.0, 31.53], [33.0, 33.13], [34.0, 34.86], [36.0, 38.18], [46.0, 49.01], [67.0, 78.98], [94.0, 102.91], [104.0, 103.99], [104.0, 106.34], [111.0, 112.53], [116.0, 116.73], [117.0, 120.06], [121.0, 128.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 57.4, 87.74, 50.81, 0.0, 0.0, 0.0, 45.18, 31.14, 33.37, 31.38, 0.0, 31.88, 0.0, 0.0, 32.2, 33.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 56.02], ["speech", 9.41], ["guitar", 6.69]], [["music", 23.06], ["speech", 13.19], ["didgeridoo", 8.57]], [["livestock, farm animals, working animals", 37.15], ["cattle, bovinae", 10.87], ["fly, housefly", 9.03]], [["music", 34.77], ["speech", 27.54], ["boing", 16.38]], null, [["speech", 51.43], ["music", 18.3], ["hum", 2.21]], null, null, [["music", 43.97], ["speech", 10.78], ["throbbing", 10.77]], [["music", 73.01], ["theremin", 4.81], ["hum", 3.22]]], "duration": [0.18, 1.92, -0.04, 10.63, 3.92, 3.44, 1.53, 0.13, 0.86, 2.18, 3.01, 11.98, 8.91, -0.01, 2.34, 1.53, 0.73, 3.06, 7.06]} \ No newline at end of file diff --git a/annotations_1/Eb9WH9OiKn8_filtered.json b/annotations_1/Eb9WH9OiKn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1c635ca95d215970aaa03da5c4689cebdfa586f --- /dev/null +++ b/annotations_1/Eb9WH9OiKn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 38.57], [46.0, 47.11], [49.0, 49.89], [50.0, 55.71], [57.0, 58.08], [67.0, 67.56], [78.0, 78.14], [92.0, 93.55], [94.0, 95.91], [97.0, 97.36], [105.0, 106.07], [117.0, 117.8], [118.0, 118.98], [120.0, 120.99], [122.0, 123.94], [128.0, 128.48], [132.0, 132.58], [146.0, 147.72], [151.0, 152.74], [154.0, 156.3], [157.0, 160.71], [162.0, 162.73], [174.0, 173.91], [176.0, 176.12], [177.0, 178.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 70.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 95.64, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 1.11, 0.89, 5.71, 1.08, 0.56, 0.14, 1.55, 1.91, 0.36, 1.07, 0.8, 0.98, 0.99, 1.94, 0.48, 0.58, 1.72, 1.74, 2.3, 3.71, 0.73, -0.09, 0.12, 1.41]} \ No newline at end of file diff --git a/annotations_1/Ec2ek8MmHRA_filtered.json b/annotations_1/Ec2ek8MmHRA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af3e7ec371194efba25b3344180807e8c41ff37f --- /dev/null +++ b/annotations_1/Ec2ek8MmHRA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[55.0, 86.88], [90.0, 100.43], [102.0, 101.87], [103.0, 117.73], [121.0, 128.76], [133.0, 144.53], [147.0, 148.19], [148.0, 148.41], [148.0, 149.49], [150.0, 150.5]], "keep_status": [false, false, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 37.67, 0.0, 29.45, 29.04, 29.03, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["sidetone", 48.55], ["throbbing", 13.47], ["synthesizer", 9.11]], null, [["speech", 36.75], ["music", 8.9], ["whack, thwack", 7.82]], [["mains hum", 32.49], ["speech", 20.85], ["hum", 15.02]], [["speech", 44.15], ["music", 12.74], ["ship", 5.33]], null, null, null, null], "duration": [31.88, 10.43, -0.13, 14.73, 7.76, 11.53, 1.19, 0.41, 1.49, 0.5]} \ No newline at end of file diff --git a/annotations_1/Ece-FTMuKFU_filtered.json b/annotations_1/Ece-FTMuKFU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..602edfdb94ae060b19756c38b3a9c02346b4082e --- /dev/null +++ b/annotations_1/Ece-FTMuKFU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.2], [6.0, 8.01], [19.0, 19.41], [25.0, 25.79], [28.0, 28.46], [31.0, 32.07], [32.0, 35.46], [44.0, 47.41], [49.0, 50.77], [57.0, 61.32], [66.0, 66.6], [68.0, 68.52], [82.0, 84.55], [87.0, 87.91], [90.0, 90.0], [93.0, 93.55], [96.0, 97.68], [99.0, 100.4], [102.0, 103.05], [105.0, 105.63], [107.0, 110.2], [111.0, 111.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 95.78, 100.0, 0.0, 100.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.2, 2.01, 0.41, 0.79, 0.46, 1.07, 3.46, 3.41, 1.77, 4.32, 0.6, 0.52, 2.55, 0.91, 0.0, 0.55, 1.68, 1.4, 1.05, 0.63, 3.2, 0.6]} \ No newline at end of file diff --git a/annotations_1/Ed8T-GzBcIY_filtered.json b/annotations_1/Ed8T-GzBcIY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..120d4fc7a2816b4f59a66c7019b0cc0ba5bbafd0 --- /dev/null +++ b/annotations_1/Ed8T-GzBcIY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 62.29], [63.0, 72.37], [74.0, 90.31]], "keep_status": [false, false, true], "silence_prob": [0.0, 59.33, 32.11], "audiomae_on_audioset": [null, null, [["music", 44.03], ["electric shaver, electric razor", 14.56], ["didgeridoo", 6.21]]], "duration": [1.29, 9.37, 16.31]} \ No newline at end of file diff --git a/annotations_1/Ed__PtLnaeo_filtered.json b/annotations_1/Ed__PtLnaeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5a069d368448347c9165329ce711bab9ec12b6c --- /dev/null +++ b/annotations_1/Ed__PtLnaeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.09], [6.0, 6.78], [9.0, 9.14], [16.0, 22.96], [25.0, 26.72], [28.0, 31.28], [32.0, 41.17], [43.0, 44.51], [45.0, 47.07], [55.0, 55.81], [60.0, 60.93], [67.0, 69.03], [70.0, 74.61], [78.0, 78.49], [83.0, 84.4], [86.0, 95.1], [96.0, 96.75], [98.0, 106.71], [108.0, 108.33], [119.0, 118.96], [120.0, 121.61], [131.0, 142.99], [146.0, 146.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 80.64, 0.0, 56.4, 87.74, 0.0, 79.59, 0.0, 0.0, 87.37, 78.04, 0.0, 0.0, 80.82, 0.0, 93.91, 0.0, 0.0, 0.0, 30.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.15], ["whack, thwack", 12.92], ["sidetone", 4.95]], null], "duration": [0.09, 0.78, 0.14, 6.96, 1.72, 3.28, 9.17, 1.51, 2.07, 0.81, 0.93, 2.03, 4.61, 0.49, 1.4, 9.1, 0.75, 8.71, 0.33, -0.04, 1.61, 11.99, 0.03]} \ No newline at end of file diff --git a/annotations_1/EdiZzm9bA2I_filtered.json b/annotations_1/EdiZzm9bA2I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e5579bb4edbe282d4be1ac0fd7bb6b91af2c4a1 --- /dev/null +++ b/annotations_1/EdiZzm9bA2I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.33], [8.0, 8.26], [9.0, 10.42], [11.0, 12.29], [14.0, 15.75], [18.0, 19.45], [20.0, 20.92], [24.0, 28.71], [29.0, 30.06], [31.0, 33.22], [35.0, 35.97], [41.0, 41.67], [42.0, 62.48], [63.0, 64.3], [65.0, 67.36], [69.0, 70.11], [71.0, 71.22], [71.0, 71.56], [74.0, 74.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 93.6, 0.0, 0.0, 45.05, 0.0, 56.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 46.34], ["speech", 15.07], ["cattle, bovinae", 8.39]], null, null, null, null, null, null], "duration": [1.33, 0.26, 1.42, 1.29, 1.75, 1.45, 0.92, 4.71, 1.06, 2.22, 0.97, 0.67, 20.48, 1.3, 2.36, 1.11, 0.22, 0.56, 0.48]} \ No newline at end of file diff --git a/annotations_1/EelncXXu150_filtered.json b/annotations_1/EelncXXu150_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa5e53082726da6da25fbd0a700ef76a84ace02f --- /dev/null +++ b/annotations_1/EelncXXu150_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.4], [4.0, 5.1], [8.0, 16.77]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 30.4], "audiomae_on_audioset": [null, null, [["music", 38.58], ["theremin", 16.91], ["meow", 11.3]]], "duration": [1.4, 1.1, 8.77]} \ No newline at end of file diff --git a/annotations_1/EfHvcHYz-tY_filtered.json b/annotations_1/EfHvcHYz-tY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8d80af369e62a03e1847d864c70cc8ff34967d2 --- /dev/null +++ b/annotations_1/EfHvcHYz-tY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.65], [17.0, 21.42], [24.0, 33.45], [37.0, 39.01], [45.0, 46.09], [51.0, 51.92], [53.0, 61.08], [65.0, 82.92], [85.0, 107.6], [108.0, 110.64], [112.0, 114.86], [117.0, 128.58], [130.0, 130.6], [131.0, 132.83], [136.0, 140.9], [141.0, 142.62], [147.0, 146.72], [149.0, 150.31], [151.0, 152.02], [152.0, 152.52], [155.0, 156.61], [160.0, 161.64], [162.0, 164.79], [167.0, 170.09]], "keep_status": [false, true, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.72, 32.15, 32.75, 0.0, 0.0, 32.93, 32.64, 33.49, 64.41, 40.11, 86.27, 0.0, 0.0, 39.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.48, 91.98], "audiomae_on_audioset": [null, [["music", 53.88], ["speech", 6.41], ["guitar", 5.94]], [["music", 59.47], ["fly, housefly", 4.77], ["insect", 3.24]], [["music", 33.55], ["speech", 6.31], ["ding", 2.78]], null, null, [["music", 64.06], ["synthesizer", 6.2], ["musical instrument", 4.17]], [["music", 63.43], ["musical instrument", 6.97], ["synthesizer", 4.27]], [["music", 53.43], ["synthesizer", 6.04], ["didgeridoo", 5.19]], null, [["speech", 56.94], ["dial tone", 16.51], ["telephone", 9.71]], null, null, null, [["speech", 77.52], ["hum", 3.06], ["dial tone", 3.05]], null, null, null, null, null, null, null, null, null], "duration": [0.65, 4.42, 9.45, 2.01, 1.09, 0.92, 8.08, 17.92, 22.6, 2.64, 2.86, 11.58, 0.6, 1.83, 4.9, 1.62, -0.28, 1.31, 1.02, 0.52, 1.61, 1.64, 2.79, 3.09]} \ No newline at end of file diff --git a/annotations_1/Eh_0E0UdJcc_filtered.json b/annotations_1/Eh_0E0UdJcc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/Eh_0E0UdJcc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/EiYxgC78ScI_filtered.json b/annotations_1/EiYxgC78ScI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2a2df1a4a34ce25e32945be24600ddbfddea0e1 --- /dev/null +++ b/annotations_1/EiYxgC78ScI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 34.45], [38.0, 41.1], [42.0, 45.1], [46.0, 54.38], [55.0, 55.59], [57.0, 85.36], [90.0, 143.4]], "keep_status": [true, false, true, false, false, true, false], "silence_prob": [34.16, 28.83, 29.07, 36.57, 0.0, 28.44, 0.0], "audiomae_on_audioset": [[["hum", 19.05], ["speech", 16.64], ["mains hum", 14.9]], [["speech", 65.58], ["speech synthesizer", 20.47], ["reverberation", 3.63]], [["thunk", 48.8], ["music", 10.53], ["breaking", 8.42]], [["music", 47.65], ["hum", 17.3], ["throbbing", 8.65]], null, [["breaking", 15.72], ["music", 13.26], ["livestock, farm animals, working animals", 12.73]], null], "duration": [6.45, 3.1, 3.1, 8.38, 0.59, 28.36, 53.4]} \ No newline at end of file diff --git a/annotations_1/Ej1lqvtmcMg_filtered.json b/annotations_1/Ej1lqvtmcMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee05280b8c7cee50aab48a2e7765d1001f534bbc --- /dev/null +++ b/annotations_1/Ej1lqvtmcMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 16.78], [18.0, 17.93], [19.0, 46.53], [50.0, 53.27], [57.0, 64.71], [65.0, 69.85]], "keep_status": [false, false, true, false, false, true], "silence_prob": [82.25, 0.0, 35.59, 67.51, 30.22, 29.94], "audiomae_on_audioset": [null, null, [["burping, eructation", 47.31], ["sine wave", 10.45], ["animal", 6.7]], null, [["music", 64.33], ["theremin", 11.03], ["domestic animals, pets", 3.13]], [["music", 10.37], ["speech", 10.09], ["crowd", 9.97]]], "duration": [13.78, -0.07, 27.53, 3.27, 7.71, 4.85]} \ No newline at end of file diff --git a/annotations_1/EjAwbjng__4_filtered.json b/annotations_1/EjAwbjng__4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfac7130ec931af5f2e18cd8e094849efd4a8a6d --- /dev/null +++ b/annotations_1/EjAwbjng__4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.37], [58.0, 70.44], [73.0, 78.12], [84.0, 86.54], [87.0, 89.01], [91.0, 94.34], [95.0, 96.53], [97.0, 108.51], [111.0, 126.87]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.31, 99.98, 99.78, 84.8, 90.95, 0.0, 74.76, 67.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.37, 12.44, 5.12, 2.54, 2.01, 3.34, 1.53, 11.51, 15.87]} \ No newline at end of file diff --git a/annotations_1/ElBy0fKa9Ic_filtered.json b/annotations_1/ElBy0fKa9Ic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e845e06ec26889aacc83fe09b2ab4dd29bd0bbb7 --- /dev/null +++ b/annotations_1/ElBy0fKa9Ic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.97], [12.0, 12.72], [28.0, 28.36], [28.0, 28.54], [30.0, 30.99], [35.0, 35.29], [37.0, 37.12], [41.0, 40.85], [52.0, 52.86], [55.0, 55.81], [65.0, 65.69], [83.0, 84.0], [85.0, 86.44], [105.0, 108.62], [110.0, 111.28], [112.0, 116.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 0.0, 80.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 0.72, 0.36, 0.54, 0.99, 0.29, 0.12, -0.15, 0.86, 0.81, 0.69, 1.0, 1.44, 3.62, 1.28, 4.13]} \ No newline at end of file diff --git a/annotations_1/ElidXD2F2eo_filtered.json b/annotations_1/ElidXD2F2eo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bca562b21bde8b5affd62b61f80a6ed4b696030 --- /dev/null +++ b/annotations_1/ElidXD2F2eo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.78], [7.0, 8.16], [13.0, 14.37], [15.0, 23.53], [29.0, 34.16], [37.0, 88.25], [88.0, 90.12], [91.0, 101.85], [104.0, 117.78]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.79, 29.76, 0.0, 29.87, 29.98, 29.81], "audiomae_on_audioset": [null, null, null, [["music", 78.41], ["sampler", 3.14], ["synthesizer", 2.68]], [["music", 68.27], ["moo", 7.5], ["cattle, bovinae", 7.17]], null, [["music", 64.02], ["drum and bass", 3.4], ["speech", 2.94]], [["music", 74.37], ["motorcycle", 3.02], ["electronic music", 2.85]], [["music", 71.96], ["didgeridoo", 6.04], ["electronic music", 3.01]]], "duration": [0.78, 1.16, 1.37, 8.53, 5.16, 51.25, 2.12, 10.85, 13.78]} \ No newline at end of file diff --git a/annotations_1/En7TapBA84M_filtered.json b/annotations_1/En7TapBA84M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7798f494b3f6006d6da935c4cf895bf0c6dd35a --- /dev/null +++ b/annotations_1/En7TapBA84M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.52], [14.0, 14.84], [16.0, 16.23], [18.0, 19.36], [31.0, 30.91], [31.0, 31.41], [32.0, 32.68], [35.0, 34.99], [38.0, 38.11], [44.0, 46.04], [48.0, 48.84], [50.0, 51.21], [59.0, 59.91], [74.0, 74.21], [76.0, 75.88], [86.0, 89.73], [94.0, 94.12], [99.0, 98.91], [99.0, 100.79], [101.0, 102.1], [105.0, 105.98], [117.0, 122.25], [125.0, 128.8], [137.0, 144.63], [145.0, 146.01], [153.0, 154.11], [155.0, 157.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.21, 34.15, 33.24, 0.0, 0.0, 39.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["grunt", 87.56], ["sound effect", 1.99], ["groan", 1.38]], [["boing", 15.88], ["music", 9.09], ["fly, housefly", 8.71]], [["music", 71.55], ["boing", 13.97], ["speech", 4.33]], null, null, [["music", 44.61], ["musical instrument", 10.19], ["synthesizer", 6.0]]], "duration": [0.52, 0.84, 0.23, 1.36, -0.09, 0.41, 0.68, -0.01, 0.11, 2.04, 0.84, 1.21, 0.91, 0.21, -0.12, 3.73, 0.12, -0.09, 1.79, 1.1, 0.98, 5.25, 3.8, 7.63, 1.01, 1.11, 2.64]} \ No newline at end of file diff --git a/annotations_1/EnfAVLatlmY_filtered.json b/annotations_1/EnfAVLatlmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85ddc27e7f68279653780b15e028a243b16fef5f --- /dev/null +++ b/annotations_1/EnfAVLatlmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.96], [4.0, 5.76], [6.0, 7.37], [9.0, 9.66], [11.0, 19.01], [21.0, 22.45], [24.0, 25.88], [27.0, 30.03], [32.0, 33.64], [35.0, 36.26], [37.0, 44.52], [47.0, 48.46], [49.0, 51.43], [52.0, 53.3], [54.0, 55.59], [58.0, 62.41], [64.0, 66.75], [68.0, 71.44], [73.0, 73.85], [77.0, 77.94], [79.0, 78.87], [81.0, 82.58], [87.0, 87.51], [94.0, 94.0], [96.0, 96.53], [105.0, 105.51], [107.0, 107.67], [109.0, 109.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 98.59, 0.0, 0.0, 93.91, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.96, 1.76, 1.37, 0.66, 8.01, 1.45, 1.88, 3.03, 1.64, 1.26, 7.52, 1.46, 2.43, 1.3, 1.59, 4.41, 2.75, 3.44, 0.85, 0.94, -0.13, 1.58, 0.51, 0.0, 0.53, 0.51, 0.67, 0.22]} \ No newline at end of file diff --git a/annotations_1/Ent1UQJ4mdU_filtered.json b/annotations_1/Ent1UQJ4mdU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b50a42050d8403edd2c82acc9b5eb248ff01e62 --- /dev/null +++ b/annotations_1/Ent1UQJ4mdU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 17.66], [18.0, 26.89], [27.0, 27.57], [28.0, 29.54], [31.0, 31.01], [34.0, 34.4], [38.0, 38.99], [43.0, 43.68], [54.0, 57.08], [57.0, 58.82], [61.0, 62.88], [63.0, 66.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0, 0.0, 54.04], "audiomae_on_audioset": [null, [["speech", 97.73], ["horse", 0.48], ["clip-clop", 0.32]], null, null, null, null, null, null, null, null, null, null], "duration": [-0.34, 8.89, 0.57, 1.54, 0.01, 0.4, 0.99, 0.68, 3.08, 1.82, 1.88, 3.78]} \ No newline at end of file diff --git a/annotations_1/EodzQpkDFYo_filtered.json b/annotations_1/EodzQpkDFYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b0b9d044652d8bf316a20c8f44dbb1fb7c1af90 --- /dev/null +++ b/annotations_1/EodzQpkDFYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[63.0, 63.21]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.21]} \ No newline at end of file diff --git a/annotations_1/EoikWLSsmRk_filtered.json b/annotations_1/EoikWLSsmRk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d1bdfd5d54839652ea643fe2cc19593469de96d --- /dev/null +++ b/annotations_1/EoikWLSsmRk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.86], [3.0, 4.29], [8.0, 8.95], [13.0, 15.33], [17.0, 17.44], [18.0, 19.25], [20.0, 21.0], [22.0, 22.01], [24.0, 24.98], [25.0, 27.95], [29.0, 29.91], [31.0, 31.68], [34.0, 34.82], [39.0, 40.02], [41.0, 41.94], [45.0, 46.04], [48.0, 49.44], [53.0, 53.22], [55.0, 55.0], [56.0, 56.32], [58.0, 58.46], [62.0, 62.45], [73.0, 75.46], [77.0, 78.24], [81.0, 84.92], [88.0, 87.71], [89.0, 91.4], [92.0, 94.49], [99.0, 99.32], [100.0, 101.58], [102.0, 102.71], [109.0, 109.44], [113.0, 113.22], [114.0, 114.32], [114.0, 114.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 0.0, 0.0, 40.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 74.92, 0.0, 52.68, 80.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["insect", 33.02], ["fly, housefly", 31.35], ["bee, wasp, etc.", 22.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.14, 1.29, 0.95, 2.33, 0.44, 1.25, 1.0, 0.01, 0.98, 2.95, 0.91, 0.68, 0.82, 1.02, 0.94, 1.04, 1.44, 0.22, 0.0, 0.32, 0.46, 0.45, 2.46, 1.24, 3.92, -0.29, 2.4, 2.49, 0.32, 1.58, 0.71, 0.44, 0.22, 0.32, 0.37]} \ No newline at end of file diff --git a/annotations_1/Eom_iOkd0-I_filtered.json b/annotations_1/Eom_iOkd0-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71b858366aa61b568380997ba331a62eb666b077 --- /dev/null +++ b/annotations_1/Eom_iOkd0-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.2], [9.0, 9.73], [13.0, 13.0], [14.0, 14.69], [15.0, 15.57], [17.0, 17.37], [19.0, 20.14], [22.0, 22.54], [25.0, 25.05], [31.0, 31.41], [36.0, 36.19], [38.0, 38.23], [42.0, 42.33], [46.0, 46.41], [47.0, 47.02], [52.0, 51.98], [53.0, 53.49], [55.0, 55.92], [62.0, 62.01], [62.0, 62.06], [66.0, 66.21], [72.0, 72.93], [73.0, 73.53], [78.0, 78.31], [79.0, 79.91], [80.0, 80.89], [83.0, 83.42], [89.0, 89.28], [90.0, 89.87], [93.0, 93.9], [97.0, 97.66], [99.0, 99.08], [100.0, 100.75], [102.0, 102.63], [103.0, 103.89], [104.0, 105.11], [108.0, 108.68], [111.0, 111.3], [112.0, 112.56], [114.0, 114.78], [118.0, 117.93], [119.0, 119.25], [120.0, 124.77], [128.0, 128.16], [129.0, 129.46], [132.0, 132.16], [132.0, 134.76], [136.0, 136.97], [138.0, 138.48], [145.0, 144.93], [146.0, 147.11], [152.0, 152.69], [155.0, 155.63], [157.0, 157.65], [158.0, 158.38], [159.0, 160.12], [168.0, 168.29], [171.0, 171.02], [173.0, 174.85], [175.0, 177.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 0.0, 0.0, 0.0, 51.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["chirp tone", 46.36], ["sine wave", 30.54], ["whale vocalization", 5.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.75], ["dial tone", 13.32], ["sidetone", 4.87]]], "duration": [0.2, 0.73, 0.0, 0.69, 0.57, 0.37, 1.14, 0.54, 0.05, 0.41, 0.19, 0.23, 0.33, 0.41, 0.02, -0.02, 0.49, 0.92, 0.01, 0.06, 0.21, 0.93, 0.53, 0.31, 0.91, 0.89, 0.42, 0.28, -0.13, 0.9, 0.66, 0.08, 0.75, 0.63, 0.89, 1.11, 0.68, 0.3, 0.56, 0.78, -0.07, 0.25, 4.77, 0.16, 0.46, 0.16, 2.76, 0.97, 0.48, -0.07, 1.11, 0.69, 0.63, 0.65, 0.38, 1.12, 0.29, 0.02, 1.85, 2.48]} \ No newline at end of file diff --git a/annotations_1/Ep30EE2v0mU_filtered.json b/annotations_1/Ep30EE2v0mU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f012cacf02e6d2f5a345adaa64e91c95d80abc49 --- /dev/null +++ b/annotations_1/Ep30EE2v0mU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.52], [12.0, 12.41], [13.0, 13.88], [41.0, 41.77], [48.0, 48.91], [54.0, 56.56], [64.0, 64.57], [76.0, 76.76], [91.0, 107.32], [111.0, 117.32], [121.0, 121.76], [125.0, 127.03]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.48, 0.0, 0.0, 38.97, 48.69, 0.0, 69.61], "audiomae_on_audioset": [null, null, null, null, null, [["music", 43.72], ["musical instrument", 4.55], ["quack", 3.8]], null, null, [["music", 27.15], ["speech", 25.49], ["thunk", 5.66]], [["sidetone", 35.8], ["music", 34.94], ["speech", 14.2]], null, null], "duration": [0.52, 0.41, 0.88, 0.77, 0.91, 2.56, 0.57, 0.76, 16.32, 6.32, 0.76, 2.03]} \ No newline at end of file diff --git a/annotations_1/EpCLoqVPwqw_filtered.json b/annotations_1/EpCLoqVPwqw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7596d0925029455843700afdf875f5250615f091 --- /dev/null +++ b/annotations_1/EpCLoqVPwqw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 50.57], [51.0, 52.39], [55.0, 62.21], [62.0, 67.29], [69.0, 110.46], [111.0, 110.96], [111.0, 111.01]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [57.64, 0.0, 72.31, 41.2, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 21.57], ["hum", 20.68], ["music", 12.82]], null, null, null], "duration": [19.57, 1.39, 7.21, 5.29, 41.46, -0.04, 0.01]} \ No newline at end of file diff --git a/annotations_1/EpCp0rAGDNo_filtered.json b/annotations_1/EpCp0rAGDNo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e29bb1f71f0aa9e603f697011e3643dea2156203 --- /dev/null +++ b/annotations_1/EpCp0rAGDNo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.24], [6.0, 8.97], [10.0, 14.1], [16.0, 20.9], [33.0, 33.72], [44.0, 45.28], [47.0, 46.6], [47.0, 47.09], [50.0, 50.25], [53.0, 54.43], [55.0, 56.84], [58.0, 58.63], [60.0, 68.3]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.59, 45.21, 30.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.13], "audiomae_on_audioset": [null, [["creak", 48.22], ["speech", 17.23], ["fly, housefly", 4.96]], [["speech", 30.75], ["music", 11.66], ["throbbing", 8.17]], [["speech", 56.5], ["music", 24.44], ["hum", 4.82]], null, null, null, null, null, null, null, null, null], "duration": [0.24, 2.97, 4.1, 4.9, 0.72, 1.28, -0.4, 0.09, 0.25, 1.43, 1.84, 0.63, 8.3]} \ No newline at end of file diff --git a/annotations_1/EpcWBu5f2uY_filtered.json b/annotations_1/EpcWBu5f2uY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be1b22b61afdbdf0cf1c89035e100416f3bd9163 --- /dev/null +++ b/annotations_1/EpcWBu5f2uY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.09], [8.0, 8.07], [10.0, 40.0], [47.0, 47.55], [49.0, 48.64], [60.0, 62.58], [65.0, 67.85], [71.0, 74.65], [77.0, 78.22], [81.0, 81.67], [85.0, 92.84], [110.0, 110.54], [112.0, 121.09], [124.0, 125.59], [129.0, 130.62], [135.0, 135.51], [137.0, 141.13], [142.0, 146.31], [147.0, 165.72], [166.0, 166.09], [166.0, 166.23], [166.0, 166.9], [168.0, 168.47], [169.0, 177.45]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [41.6, 0.0, 30.74, 0.0, 0.0, 83.16, 53.22, 77.36, 0.0, 0.0, 48.23, 0.0, 94.07, 0.0, 0.0, 0.0, 84.62, 49.59, 32.39, 0.0, 0.0, 0.0, 0.0, 35.82], "audiomae_on_audioset": [[["speech", 36.52], ["roaring cats (lions, tigers)", 5.5], ["frog", 5.0]], null, [["whack, thwack", 20.92], ["speech", 20.87], ["explosion", 8.35]], null, null, null, null, null, null, null, [["speech", 64.44], ["fart", 5.89], ["sine wave", 3.92]], null, null, null, null, null, null, [["speech", 31.91], ["foghorn", 15.47], ["music", 12.76]], [["music", 66.63], ["throbbing", 12.34], ["hum", 5.3]], null, null, null, null, [["music", 66.35], ["didgeridoo", 6.39], ["musical instrument", 3.72]]], "duration": [3.09, 0.07, 30.0, 0.55, -0.36, 2.58, 2.85, 3.65, 1.22, 0.67, 7.84, 0.54, 9.09, 1.59, 1.62, 0.51, 4.13, 4.31, 18.72, 0.09, 0.23, 0.9, 0.47, 8.45]} \ No newline at end of file diff --git a/annotations_1/EqFFgltjVbg_filtered.json b/annotations_1/EqFFgltjVbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f35eace8990365bc42f1892904d1ac8dbd6e5e7 --- /dev/null +++ b/annotations_1/EqFFgltjVbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.51], [11.0, 28.26], [30.0, 37.66], [38.0, 38.87], [42.0, 45.2], [46.0, 47.98], [49.0, 58.83], [61.0, 75.03], [75.0, 84.42]], "keep_status": [false, true, true, false, true, false, false, true, false], "silence_prob": [0.0, 29.43, 33.15, 0.0, 30.33, 0.0, 30.32, 30.72, 37.27], "audiomae_on_audioset": [null, [["mains hum", 19.61], ["hum", 14.2], ["speech", 14.07]], [["buzz", 13.89], ["fly, housefly", 11.9], ["bee, wasp, etc.", 11.62]], null, [["hum", 16.16], ["mains hum", 10.9], ["rumble", 10.51]], null, [["music", 46.1], ["machine gun", 25.12], ["noise", 5.18]], [["music", 52.97], ["coin (dropping)", 8.62], ["hum", 5.69]], [["speech", 56.05], ["mains hum", 10.77], ["hum", 9.9]]], "duration": [1.51, 17.26, 7.66, 0.87, 3.2, 1.98, 9.83, 14.03, 9.42]} \ No newline at end of file diff --git a/annotations_1/EqNTVkdsTL0_filtered.json b/annotations_1/EqNTVkdsTL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0ec1241f66969a70d06f7642b8fd08c85d195a3 --- /dev/null +++ b/annotations_1/EqNTVkdsTL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 6.93], [8.0, 8.55], [12.0, 11.97], [14.0, 14.91], [16.0, 18.91], [20.0, 22.99], [24.0, 25.02], [26.0, 28.68], [29.0, 31.35], [32.0, 34.03], [36.0, 38.89], [42.0, 44.34], [45.0, 46.23], [47.0, 48.0], [50.0, 53.11], [54.0, 54.82], [56.0, 56.56], [57.0, 58.36], [59.0, 60.24], [61.0, 63.27], [64.0, 66.82], [67.0, 69.08], [70.0, 70.23], [71.0, 72.67], [74.0, 78.33], [81.0, 83.49], [84.0, 87.24], [88.0, 92.03], [95.0, 95.66], [97.0, 97.14], [97.0, 98.12], [104.0, 108.11], [108.0, 108.28], [110.0, 109.81], [113.0, 113.27]], "keep_status": [false, true, false, false, false, true, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 31.57, 0.0, 0.0, 0.0, 39.67, 45.85, 0.0, 41.66, 43.64, 61.27, 58.13, 52.62, 0.0, 0.0, 51.28, 0.0, 0.0, 0.0, 0.0, 51.34, 59.42, 60.42, 0.0, 0.0, 66.27, 41.66, 73.67, 36.69, 0.0, 0.0, 0.0, 29.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 19.52], ["music", 18.46], ["speech", 16.45]], null, null, null, [["hum", 21.42], ["mains hum", 20.25], ["fly, housefly", 5.42]], [["hum", 25.06], ["mains hum", 10.59], ["music", 8.37]], null, [["hum", 32.32], ["mains hum", 20.13], ["music", 13.95]], [["mains hum", 27.07], ["hum", 13.61], ["speech", 6.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.92], ["music", 23.53], ["busy signal", 4.7]], null, [["mains hum", 36.99], ["music", 28.59], ["hum", 16.87]], null, null, null, [["music", 45.92], ["brass instrument", 12.5], ["saxophone", 6.54]], null, null, null], "duration": [0.5, 5.93, 0.55, -0.03, 0.91, 2.91, 2.99, 1.02, 2.68, 2.35, 2.03, 2.89, 2.34, 1.23, 1.0, 3.11, 0.82, 0.56, 1.36, 1.24, 2.27, 2.82, 2.08, 0.23, 1.67, 4.33, 2.49, 3.24, 4.03, 0.66, 0.14, 1.12, 4.11, 0.28, -0.19, 0.27]} \ No newline at end of file diff --git a/annotations_1/EsTniU7j_yw_filtered.json b/annotations_1/EsTniU7j_yw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1778236e9d259fa463626608189cb4881e467aa8 --- /dev/null +++ b/annotations_1/EsTniU7j_yw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.92], [4.0, 4.95], [12.0, 12.16], [13.0, 13.71], [19.0, 21.81], [23.0, 23.72], [34.0, 34.45], [38.0, 38.03], [42.0, 42.57], [44.0, 45.25], [48.0, 48.71], [51.0, 51.38], [54.0, 55.14], [58.0, 58.78], [64.0, 65.21], [72.0, 72.72], [85.0, 85.43], [101.0, 105.07], [107.0, 108.7], [110.0, 110.91], [113.0, 113.66], [115.0, 116.16], [120.0, 121.34], [122.0, 123.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 86.24], ["radio", 6.13], ["telephone", 2.36]], null, null, null, null, null, null], "duration": [0.92, 0.95, 0.16, 0.71, 2.81, 0.72, 0.45, 0.03, 0.57, 1.25, 0.71, 0.38, 1.14, 0.78, 1.21, 0.72, 0.43, 4.07, 1.7, 0.91, 0.66, 1.16, 1.34, 1.48]} \ No newline at end of file diff --git a/annotations_1/Eu1EfSDUKFg_filtered.json b/annotations_1/Eu1EfSDUKFg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89e33f98d9af585b33c4839210eb4424269503a7 --- /dev/null +++ b/annotations_1/Eu1EfSDUKFg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.42], [24.0, 24.93], [25.0, 25.84], [39.0, 39.33], [44.0, 46.55], [54.0, 53.79], [91.0, 90.85], [92.0, 92.55], [100.0, 100.48], [109.0, 109.81], [136.0, 136.07], [149.0, 152.88], [154.0, 154.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 0.93, 0.84, 0.33, 2.55, -0.21, -0.15, 0.55, 0.48, 0.81, 0.07, 3.88, 0.62]} \ No newline at end of file diff --git a/annotations_1/EuZM3sfjqno_filtered.json b/annotations_1/EuZM3sfjqno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d738b0b4dc5c04e61b28e0a2b855fced41a2a99 --- /dev/null +++ b/annotations_1/EuZM3sfjqno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 21.54], [22.0, 23.99], [25.0, 25.39], [26.0, 29.62], [32.0, 41.81], [46.0, 54.85], [55.0, 65.16], [66.0, 69.53], [71.0, 70.93], [74.0, 74.78], [77.0, 77.18], [79.0, 83.89], [86.0, 87.45], [97.0, 103.65], [108.0, 108.51], [114.0, 120.04], [122.0, 123.03], [125.0, 131.99], [134.0, 134.0], [134.0, 134.1], [139.0, 140.93], [142.0, 143.16], [152.0, 151.63], [153.0, 153.55], [156.0, 156.0], [160.0, 161.15], [162.0, 162.23], [163.0, 165.01], [165.0, 166.51], [171.0, 177.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [60.05, 0.0, 0.0, 98.01, 57.97, 65.79, 58.89, 52.51, 0.0, 0.0, 0.0, 50.61, 0.0, 33.25, 0.0, 33.0, 0.0, 32.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.4, 0.0, 64.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 52.95], ["boing", 15.74], ["whack, thwack", 8.89]], null, [["music", 28.56], ["throbbing", 28.36], ["hum", 17.18]], null, [["speech", 19.74], ["whack, thwack", 16.72], ["music", 15.81]], null, null, null, null, null, null, null, null, null, [["tabla", 24.78], ["music", 16.81], ["percussion", 14.67]], null, null], "duration": [9.54, 1.99, 0.39, 3.62, 9.81, 8.85, 10.16, 3.53, -0.07, 0.78, 0.18, 4.89, 1.45, 6.65, 0.51, 6.04, 1.03, 6.99, 0.0, 0.1, 1.93, 1.16, -0.37, 0.55, 0.0, 1.15, 0.23, 2.01, 1.51, 6.94]} \ No newline at end of file diff --git a/annotations_1/EvUbi66AGKI_filtered.json b/annotations_1/EvUbi66AGKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c54d8fd60fe6c0ae9207b628e57e5b934204f5c --- /dev/null +++ b/annotations_1/EvUbi66AGKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [12.0, 13.07], [16.0, 19.53], [23.0, 24.24], [25.0, 27.46], [33.0, 34.45], [35.0, 35.24], [40.0, 40.37], [46.0, 47.98], [60.0, 60.08], [63.0, 63.68], [70.0, 71.51], [78.0, 87.02], [89.0, 89.67], [91.0, 95.66], [103.0, 103.01], [105.0, 109.73], [120.0, 125.83], [134.0, 135.73], [143.0, 143.56], [145.0, 156.3], [159.0, 164.49], [168.0, 172.12], [174.0, 176.79]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, true, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 29.42, 0.0, 37.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.98, 0.0, 31.36, 0.0, 29.3, 31.66, 0.0, 0.0, 29.91, 30.85, 30.79, 31.77], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 34.35], ["livestock, farm animals, working animals", 29.38], ["moo", 23.82]], null, [["moo", 28.26], ["cattle, bovinae", 20.78], ["livestock, farm animals, working animals", 13.82]], null, null, null, null, null, null, null, [["music", 33.35], ["speech", 28.79], ["basketball bounce", 6.43]], null, [["hum", 27.03], ["mains hum", 18.68], ["music", 16.29]], null, [["music", 62.46], ["speech", 7.48], ["electronic music", 4.17]], [["fly, housefly", 18.35], ["bee, wasp, etc.", 8.31], ["hum", 7.32]], null, null, [["hum", 26.04], ["music", 21.9], ["throbbing", 18.92]], [["speech", 56.96], ["vehicle", 8.84], ["car", 8.43]], [["speech", 27.01], ["fly, housefly", 13.9], ["music", 9.88]], [["moo", 28.88], ["cattle, bovinae", 26.89], ["livestock, farm animals, working animals", 8.94]]], "duration": [0.89, 1.07, 3.53, 1.24, 2.46, 1.45, 0.24, 0.37, 1.98, 0.08, 0.68, 1.51, 9.02, 0.67, 4.66, 0.01, 4.73, 5.83, 1.73, 0.56, 11.3, 5.49, 4.12, 2.79]} \ No newline at end of file diff --git a/annotations_1/Ew8AJsPAyLg_filtered.json b/annotations_1/Ew8AJsPAyLg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21182c3b3ed78a35272937f179ab43cff83fb887 --- /dev/null +++ b/annotations_1/Ew8AJsPAyLg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.74], [5.0, 5.95], [6.0, 9.04], [11.0, 13.34], [26.0, 26.5], [30.0, 30.69], [31.0, 31.19], [56.0, 61.82], [67.0, 67.39], [75.0, 75.49], [78.0, 94.93], [96.0, 96.35], [98.0, 98.63], [99.0, 110.69], [113.0, 113.53], [115.0, 115.79], [116.0, 136.78], [138.0, 138.37], [140.0, 158.57], [160.0, 160.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 71.0, 91.81, 0.0, 0.0, 0.0, 29.22, 0.0, 0.0, 31.54, 0.0, 0.0, 30.83, 0.0, 0.0, 31.2, 0.0, 30.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 38.99], ["cattle, bovinae", 30.74], ["moo", 29.7]], null, null, [["music", 72.66], ["boing", 13.11], ["whack, thwack", 2.21]], null, null, [["music", 76.2], ["speech", 4.25], ["cacophony", 2.24]], null, null, [["music", 81.34], ["musical instrument", 4.25], ["beatboxing", 0.87]], null, [["music", 19.86], ["cattle, bovinae", 19.05], ["moo", 13.48]], null], "duration": [0.74, 0.95, 3.04, 2.34, 0.5, 0.69, 0.19, 5.82, 0.39, 0.49, 16.93, 0.35, 0.63, 11.69, 0.53, 0.79, 20.78, 0.37, 18.57, 0.74]} \ No newline at end of file diff --git a/annotations_1/Ewpzngfnvcc_filtered.json b/annotations_1/Ewpzngfnvcc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a275af459c7ccfd3d76ee18821eb938e7fd84068 --- /dev/null +++ b/annotations_1/Ewpzngfnvcc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.58], [3.0, 3.13], [4.0, 5.51], [6.0, 14.47], [15.0, 15.48], [16.0, 73.36], [77.0, 91.81], [96.0, 98.47], [104.0, 104.46], [112.0, 120.58], [121.0, 122.5], [123.0, 126.01], [127.0, 127.82], [128.0, 128.61], [130.0, 132.24], [140.0, 140.32], [147.0, 147.88], [150.0, 150.53], [152.0, 154.28], [155.0, 160.71], [162.0, 169.47], [170.0, 172.42]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 45.02, 0.0, 0.0, 28.58, 60.14, 0.0, 99.97, 0.0, 99.76, 0.0, 0.0, 91.3, 0.0, 0.0, 0.0, 99.96, 34.18, 29.92, 28.27], "audiomae_on_audioset": [null, null, null, [["music", 49.37], ["thunk", 16.61], ["speech", 3.79]], null, null, [["speech", 71.69], ["vehicle", 4.39], ["music", 4.25]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 13.8], ["chirp tone", 11.53], ["sine wave", 10.98]], [["whale vocalization", 33.9], ["music", 15.24], ["hum", 8.49]], [["whale vocalization", 27.49], ["speech", 11.24], ["music", 7.68]]], "duration": [0.58, 0.13, 1.51, 8.47, 0.48, 57.36, 14.81, 2.47, 0.46, 8.58, 1.5, 3.01, 0.82, 0.61, 2.24, 0.32, 0.88, 0.53, 2.28, 5.71, 7.47, 2.42]} \ No newline at end of file diff --git a/annotations_1/ExsSDD8Lpsc_filtered.json b/annotations_1/ExsSDD8Lpsc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99b8aed15332dfebe20b1ac9af32a8a3fb30b472 --- /dev/null +++ b/annotations_1/ExsSDD8Lpsc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.15], [5.0, 5.78], [7.0, 7.62], [9.0, 9.42], [13.0, 13.61], [14.0, 14.94], [16.0, 23.36], [27.0, 43.01], [46.0, 46.62], [48.0, 50.11], [50.0, 53.5], [54.0, 53.92], [57.0, 56.98], [58.0, 58.87], [60.0, 60.18], [61.0, 62.5], [64.0, 65.01], [66.0, 66.06], [68.0, 68.2], [70.0, 70.21], [72.0, 72.35], [73.0, 72.84], [73.0, 74.58], [76.0, 79.17], [81.0, 81.21], [84.0, 84.15], [88.0, 88.75], [90.0, 92.38], [93.0, 93.85], [96.0, 96.31], [98.0, 99.28], [100.0, 100.01], [102.0, 103.28], [107.0, 107.43], [111.0, 111.67], [113.0, 115.45], [117.0, 116.95], [118.0, 118.32], [119.0, 120.26], [121.0, 122.54], [124.0, 124.07], [125.0, 125.74]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.76, 83.16, 0.0, 84.07, 51.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.64, 0.0, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["crowd", 29.49], ["battle cry", 20.04], ["speech", 11.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.15, 0.78, 0.62, 0.42, 0.61, 0.94, 7.36, 16.01, 0.62, 2.11, 3.5, -0.08, -0.02, 0.87, 0.18, 1.5, 1.01, 0.06, 0.2, 0.21, 0.35, -0.16, 1.58, 3.17, 0.21, 0.15, 0.75, 2.38, 0.85, 0.31, 1.28, 0.01, 1.28, 0.43, 0.67, 2.45, -0.05, 0.32, 1.26, 1.54, 0.07, 0.74]} \ No newline at end of file diff --git a/annotations_1/Exw1_k7Hj6o_filtered.json b/annotations_1/Exw1_k7Hj6o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe73cb913558d8ef77cd29d31782d7b006974d0d --- /dev/null +++ b/annotations_1/Exw1_k7Hj6o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 64.59], [66.0, 78.95], [81.0, 81.18], [81.0, 109.31], [110.0, 119.96]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 29.92, 0.0, 30.84, 43.53], "audiomae_on_audioset": [null, [["music", 68.43], ["didgeridoo", 5.48], ["musical instrument", 4.26]], null, [["music", 85.69], ["didgeridoo", 2.4], ["throbbing", 2.15]], [["hum", 31.5], ["noise", 15.76], ["mains hum", 12.24]]], "duration": [33.59, 12.95, 0.18, 28.31, 9.96]} \ No newline at end of file diff --git a/annotations_1/Ey-zuaZV8pM_filtered.json b/annotations_1/Ey-zuaZV8pM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28a280d623f7588a19963f6899ebd3e2585d46d0 --- /dev/null +++ b/annotations_1/Ey-zuaZV8pM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.66], [2.0, 4.78], [10.0, 14.98], [16.0, 16.93], [19.0, 20.16], [27.0, 30.92], [35.0, 36.14], [49.0, 50.09], [51.0, 53.54], [55.0, 69.67], [72.0, 72.89], [77.0, 79.96], [81.0, 84.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.79, 66.88, 0.0, 0.0, 64.52, 0.0, 0.0, 55.31, 38.9, 0.0, 39.33, 39.91], "audiomae_on_audioset": [null, [["speech", 65.19], ["music", 7.28], ["sidetone", 7.03]], null, null, null, null, null, null, null, [["music", 77.8], ["guitar", 2.73], ["musical instrument", 1.97]], null, [["music", 81.15], ["sampler", 2.23], ["musical instrument", 1.97]], [["music", 66.79], ["musical instrument", 4.14], ["guitar", 2.91]]], "duration": [0.66, 2.78, 4.98, 0.93, 1.16, 3.92, 1.14, 1.09, 2.54, 14.67, 0.89, 2.96, 3.54]} \ No newline at end of file diff --git a/annotations_1/EzRtOVxgKCI_filtered.json b/annotations_1/EzRtOVxgKCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/EzRtOVxgKCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/EzjFE2CnTBQ_filtered.json b/annotations_1/EzjFE2CnTBQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef4844012a2dc000c6f67734e3eba8b679ab7698 --- /dev/null +++ b/annotations_1/EzjFE2CnTBQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.46], [12.0, 15.48], [17.0, 27.13], [28.0, 28.0], [35.0, 35.97], [38.0, 38.38], [63.0, 69.42], [71.0, 82.21], [84.0, 84.27], [85.0, 87.37], [101.0, 101.46], [109.0, 111.35], [116.0, 116.58], [131.0, 131.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 29.84, 30.89, 0.0, 0.0, 0.0, 31.08, 30.59, 0.0, 31.05, 0.0, 30.03, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 74.0], ["trance music", 5.58], ["electronic music", 4.08]], [["music", 79.54], ["speech", 4.02], ["didgeridoo", 1.9]], null, null, null, [["music", 52.77], ["speech", 20.57], ["quack", 6.9]], [["music", 78.03], ["sidetone", 2.69], ["sampler", 1.82]], null, [["music", 57.84], ["funny music", 12.24], ["swing music", 2.47]], null, [["cattle, bovinae", 22.75], ["moo", 22.2], ["livestock, farm animals, working animals", 13.45]], null, null], "duration": [0.46, 3.48, 10.13, 0.0, 0.97, 0.38, 6.42, 11.21, 0.27, 2.37, 0.46, 2.35, 0.58, 0.94]} \ No newline at end of file diff --git a/annotations_1/F-HZzW_NS88_filtered.json b/annotations_1/F-HZzW_NS88_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7034bc17a946709247524aefe7cebe5792661459 --- /dev/null +++ b/annotations_1/F-HZzW_NS88_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 40.66], [44.0, 51.0], [57.0, 71.93], [74.0, 75.12], [75.0, 82.07], [85.0, 85.11], [85.0, 85.23], [85.0, 85.26], [85.0, 85.31], [85.0, 88.21], [91.0, 102.96], [104.0, 113.16], [116.0, 119.25]], "keep_status": [true, true, true, false, false, false, false, false, false, true, false, true, false], "silence_prob": [35.55, 35.24, 36.45, 0.0, 37.5, 0.0, 0.0, 0.0, 0.0, 45.43, 59.15, 44.29, 35.21], "audiomae_on_audioset": [[["buzz", 23.97], ["hum", 12.17], ["mains hum", 11.42]], [["music", 52.77], ["hum", 8.7], ["speech", 5.37]], [["music", 34.99], ["hum", 19.62], ["mains hum", 12.04]], null, [["music", 41.94], ["hum", 24.36], ["mains hum", 7.72]], null, null, null, null, [["hum", 14.84], ["fly, housefly", 12.37], ["music", 9.76]], null, [["music", 53.31], ["vehicle", 7.02], ["hum", 4.91]], [["hum", 37.11], ["music", 21.54], ["mains hum", 15.83]]], "duration": [25.66, 7.0, 14.93, 1.12, 7.07, 0.11, 0.23, 0.26, 0.31, 3.21, 11.96, 9.16, 3.25]} \ No newline at end of file diff --git a/annotations_1/F0VmzZy-AF4_filtered.json b/annotations_1/F0VmzZy-AF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea5ff2a81a910265a3dd2cece949e9ce9552db49 --- /dev/null +++ b/annotations_1/F0VmzZy-AF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.62], [8.0, 13.31], [16.0, 16.56], [25.0, 25.66], [28.0, 44.47], [46.0, 46.35], [47.0, 82.61], [84.0, 89.58], [93.0, 99.33], [101.0, 101.33], [103.0, 104.14], [108.0, 108.94], [113.0, 119.77], [120.0, 119.87], [120.0, 119.94], [121.0, 122.07], [123.0, 123.6], [127.0, 127.89], [128.0, 129.17], [133.0, 133.44], [134.0, 168.89], [174.0, 174.72], [180.0, 180.35], [181.0, 181.4], [192.0, 192.77], [193.0, 194.56], [199.0, 199.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 95.09, 0.0, 0.0, 33.08, 0.0, 0.0, 31.15, 31.28, 0.0, 0.0, 0.0, 31.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 78.06], ["synthesizer", 1.71], ["singing", 1.41]], null, null, [["music", 45.75], ["boing", 26.34], ["moo", 5.37]], [["music", 79.91], ["singing", 3.49], ["musical instrument", 1.23]], null, null, null, [["music", 79.38], ["singing", 1.26], ["soundtrack music", 1.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 5.31, 0.56, 0.66, 16.47, 0.35, 35.61, 5.58, 6.33, 0.33, 1.14, 0.94, 6.77, -0.13, -0.06, 1.07, 0.6, 0.89, 1.17, 0.44, 34.89, 0.72, 0.35, 0.4, 0.77, 1.56, 0.34]} \ No newline at end of file diff --git a/annotations_1/F0ga5pmQjnc_filtered.json b/annotations_1/F0ga5pmQjnc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c029369182893f718f62cd86f416e45ca0b768b --- /dev/null +++ b/annotations_1/F0ga5pmQjnc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.37], [3.0, 3.77], [5.0, 5.71], [7.0, 8.29], [10.0, 11.38], [12.0, 15.06], [16.0, 18.03], [19.0, 21.24], [26.0, 34.94], [35.0, 39.83], [44.0, 69.57], [76.0, 76.01], [79.0, 79.08], [81.0, 82.12], [86.0, 87.0], [93.0, 107.87], [108.0, 110.76], [112.0, 112.16], [113.0, 125.88], [129.0, 129.44], [131.0, 132.53]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 54.36, 54.1, 60.05, 48.87, 47.82, 33.93, 0.0, 0.0, 0.0, 0.0, 33.52, 35.18, 0.0, 32.94, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 47.61], ["throbbing", 14.44], ["mains hum", 11.89]], [["speech", 37.76], ["hum", 16.03], ["rumble", 8.21]], [["music", 77.8], ["electronic music", 5.66], ["hum", 2.46]], null, null, null, null, [["music", 25.4], ["buzz", 7.55], ["fly, housefly", 7.52]], [["music", 62.2], ["throbbing", 9.61], ["hum", 5.82]], null, [["throbbing", 40.91], ["music", 32.65], ["hum", 18.17]], null, null], "duration": [1.37, 0.77, 0.71, 1.29, 1.38, 3.06, 2.03, 2.24, 8.94, 4.83, 25.57, 0.01, 0.08, 1.12, 1.0, 14.87, 2.76, 0.16, 12.88, 0.44, 1.53]} \ No newline at end of file diff --git a/annotations_1/F1nejgJdusQ_filtered.json b/annotations_1/F1nejgJdusQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ddc0a77639d9fbb02cb68a4ada3d2611f4e238e --- /dev/null +++ b/annotations_1/F1nejgJdusQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.63], [12.0, 12.38], [14.0, 15.38], [17.0, 18.72], [19.0, 20.56], [22.0, 22.81], [24.0, 24.9], [26.0, 25.69], [31.0, 57.74], [58.0, 60.64], [62.0, 68.71], [69.0, 69.97], [73.0, 78.98], [86.0, 87.76], [88.0, 88.94], [90.0, 90.26], [91.0, 94.0], [98.0, 114.71], [116.0, 132.34], [133.0, 134.0], [136.0, 138.91], [139.0, 151.53], [153.0, 154.55], [156.0, 165.67], [168.0, 172.72], [175.0, 175.83]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, true, true, false, false, true, false, false, true, false], "silence_prob": [33.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.6, 32.12, 28.28, 0.0, 28.79, 0.0, 0.0, 0.0, 28.45, 29.22, 31.97, 0.0, 42.74, 34.13, 0.0, 32.88, 44.23, 0.0], "audiomae_on_audioset": [[["music", 39.91], ["foghorn", 28.79], ["musical instrument", 6.8]], null, null, null, null, null, null, null, [["foghorn", 33.13], ["music", 24.1], ["theremin", 13.97]], [["speech", 18.58], ["music", 8.82], ["civil defense siren", 8.34]], [["music", 34.49], ["screaming", 6.79], ["outside, urban or manmade", 5.69]], null, [["music", 44.07], ["musical instrument", 10.65], ["trombone", 5.69]], null, null, null, [["music", 65.68], ["trombone", 4.69], ["orchestra", 2.46]], [["music", 19.98], ["theremin", 5.96], ["hum", 5.46]], [["music", 32.5], ["theremin", 24.0], ["musical instrument", 7.58]], null, [["fly, housefly", 45.62], ["mosquito", 25.71], ["insect", 16.99]], [["music", 29.41], ["cowbell", 7.99], ["livestock, farm animals, working animals", 7.41]], null, [["music", 51.16], ["musical instrument", 15.72], ["didgeridoo", 7.23]], [["music", 40.38], ["theremin", 18.32], ["wind instrument, woodwind instrument", 6.36]], null], "duration": [2.63, 0.38, 1.38, 1.72, 1.56, 0.81, 0.9, -0.31, 26.74, 2.64, 6.71, 0.97, 5.98, 1.76, 0.94, 0.26, 3.0, 16.71, 16.34, 1.0, 2.91, 12.53, 1.55, 9.67, 4.72, 0.83]} \ No newline at end of file diff --git a/annotations_1/F2AbEJnPRYM_filtered.json b/annotations_1/F2AbEJnPRYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c0c947c0f40a6778a2ba3539d52ad2d362b2203 --- /dev/null +++ b/annotations_1/F2AbEJnPRYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.65], [3.0, 3.75], [7.0, 11.53], [16.0, 16.87], [18.0, 18.87], [20.0, 21.64], [22.0, 22.64], [26.0, 26.87], [28.0, 30.91], [34.0, 35.01], [36.0, 36.76], [38.0, 40.49], [41.0, 42.72], [43.0, 44.05], [44.0, 46.58], [48.0, 48.46], [65.0, 65.74], [69.0, 69.35], [71.0, 72.6], [74.0, 74.66], [82.0, 82.24], [84.0, 84.57], [88.0, 88.96], [95.0, 95.44], [107.0, 107.2], [110.0, 110.34], [111.0, 121.83], [123.0, 124.11], [130.0, 130.38]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.82, 0.0, 0.0, 0.0, 0.0, 0.0, 38.5, 0.0, 0.0, 53.22, 0.0, 0.0, 35.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.87, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 37.28], ["didgeridoo", 25.91], ["speech", 5.23]], null, null, null, null, null, [["music", 41.82], ["speech", 22.33], ["electronic music", 6.24]], null, null, null, null, null, null, null, null, null, null, null, [["music", 64.84], ["grunt", 8.51], ["musical instrument", 2.09]], null, null], "duration": [0.65, 0.75, 4.53, 0.87, 0.87, 1.64, 0.64, 0.87, 2.91, 1.01, 0.76, 2.49, 1.72, 1.05, 2.58, 0.46, 0.74, 0.35, 1.6, 0.66, 0.24, 0.57, 0.96, 0.44, 0.2, 0.34, 10.83, 1.11, 0.38]} \ No newline at end of file diff --git a/annotations_1/F2V5i3EyRd4_filtered.json b/annotations_1/F2V5i3EyRd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81a80756882027fd49a22cd56527cb3554bbcc69 --- /dev/null +++ b/annotations_1/F2V5i3EyRd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.39], [27.0, 27.6], [30.0, 31.11], [32.0, 33.62], [39.0, 44.04], [45.0, 46.14], [48.0, 54.97], [55.0, 62.68], [66.0, 77.3], [84.0, 109.19], [113.0, 120.34], [124.0, 139.26]], "keep_status": [false, false, false, false, true, false, true, true, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.64, 0.0, 32.57, 29.01, 28.9, 32.85, 30.66, 29.83], "audiomae_on_audioset": [null, null, null, null, [["hum", 24.79], ["mains hum", 20.94], ["music", 20.24]], null, [["music", 33.98], ["didgeridoo", 19.92], ["hum", 7.19]], [["speech", 29.66], ["music", 17.8], ["hum", 11.58]], [["explosion", 16.87], ["gunshot, gunfire", 13.88], ["burst, pop", 9.16]], [["hum", 31.17], ["throbbing", 29.72], ["music", 27.52]], [["music", 46.5], ["throbbing", 10.13], ["speech", 8.05]], [["music", 34.98], ["speech", 28.03], ["hum", 5.52]]], "duration": [1.39, 0.6, 1.11, 1.62, 5.04, 1.14, 6.97, 7.68, 11.3, 25.19, 7.34, 15.26]} \ No newline at end of file diff --git a/annotations_1/F4QzrKakPmU_filtered.json b/annotations_1/F4QzrKakPmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3034ec315063b547f26cdeaf9cd4635a9660eb59 --- /dev/null +++ b/annotations_1/F4QzrKakPmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.73], [14.0, 16.55], [18.0, 20.98], [26.0, 33.22], [38.0, 38.25], [41.0, 45.17], [47.0, 72.93], [74.0, 96.69], [97.0, 111.65], [116.0, 115.91], [117.0, 119.67]], "keep_status": [false, false, false, true, false, false, true, false, true, false, false], "silence_prob": [0.0, 71.57, 52.74, 40.17, 0.0, 32.2, 31.0, 31.63, 40.21, 0.0, 57.72], "audiomae_on_audioset": [null, null, null, [["hum", 38.15], ["throbbing", 16.22], ["mains hum", 15.43]], null, [["throbbing", 32.31], ["hum", 19.33], ["mains hum", 19.27]], [["music", 45.25], ["cacophony", 7.86], ["buzz", 5.11]], [["music", 33.72], ["mains hum", 24.73], ["hum", 21.01]], [["music", 34.08], ["singing bowl", 21.88], ["hum", 7.27]], null, null], "duration": [0.73, 2.55, 2.98, 7.22, 0.25, 4.17, 25.93, 22.69, 14.65, -0.09, 2.67]} \ No newline at end of file diff --git a/annotations_1/F55uFHs0d-o_filtered.json b/annotations_1/F55uFHs0d-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca2c05d8f6d56ed96ab010505d1d736cf3e46525 --- /dev/null +++ b/annotations_1/F55uFHs0d-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 27.35], [70.0, 72.42], [73.0, 74.21], [79.0, 79.84], [105.0, 106.52], [109.0, 110.56], [111.0, 111.87], [116.0, 116.4], [118.0, 118.54], [123.0, 123.4], [135.0, 136.11], [136.0, 136.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.88, 50.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 37.9], ["music", 26.01], ["throbbing", 16.97]], null, null, null, null, null, null, null, null, null, null, null], "duration": [24.35, 2.42, 1.21, 0.84, 1.52, 1.56, 0.87, 0.4, 0.54, 0.4, 1.11, 0.66]} \ No newline at end of file diff --git a/annotations_1/F58XJgGx3DY_filtered.json b/annotations_1/F58XJgGx3DY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebae1e8af359fa469224740274e6ef287010e20d --- /dev/null +++ b/annotations_1/F58XJgGx3DY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.41], [11.0, 11.74], [14.0, 24.58], [25.0, 43.65], [46.0, 54.38], [61.0, 68.64], [70.0, 71.93], [72.0, 72.66], [86.0, 87.2], [116.0, 116.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [54.97, 0.0, 65.32, 43.08, 67.25, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 55.61], ["musical instrument", 10.87], ["speech", 6.99]], null, null, null, null, null, null], "duration": [2.41, 0.74, 10.58, 18.65, 8.38, 7.64, 1.93, 0.66, 1.2, 0.7]} \ No newline at end of file diff --git a/annotations_1/F5NFCYDB5hI_filtered.json b/annotations_1/F5NFCYDB5hI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a22140539a68db25c57200307007ffadd276a94 --- /dev/null +++ b/annotations_1/F5NFCYDB5hI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.17], [17.0, 16.93], [18.0, 18.69], [20.0, 20.28], [21.0, 21.3], [27.0, 31.28], [32.0, 34.03], [35.0, 36.02], [38.0, 38.42], [40.0, 40.66], [42.0, 54.19], [55.0, 55.16], [56.0, 74.9], [77.0, 78.6], [79.0, 112.89], [116.0, 116.28], [116.0, 116.5], [117.0, 118.59], [119.0, 118.64], [119.0, 119.37], [125.0, 133.0], [141.0, 145.88], [157.0, 164.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 99.84, 0.0, 0.0, 0.0, 99.8, 0.0, 57.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 88.83, 65.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.17, -0.07, 0.69, 0.28, 0.3, 4.28, 2.03, 1.02, 0.42, 0.66, 12.19, 0.16, 18.9, 1.6, 33.89, 0.28, 0.5, 1.59, -0.36, 0.37, 8.0, 4.88, 7.62]} \ No newline at end of file diff --git a/annotations_1/F6E2ojebPlA_filtered.json b/annotations_1/F6E2ojebPlA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..084b9e56a2af1f951e7347402b1da08c04f9046f --- /dev/null +++ b/annotations_1/F6E2ojebPlA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.78], [10.0, 11.4], [12.0, 13.09], [15.0, 16.53], [19.0, 19.95], [24.0, 24.27], [26.0, 25.78], [35.0, 35.63], [37.0, 38.1], [40.0, 39.92], [42.0, 42.6], [60.0, 64.54], [66.0, 67.29], [70.0, 71.83], [74.0, 75.49], [77.0, 77.08], [78.0, 81.78], [83.0, 83.71], [86.0, 88.32], [109.0, 109.59], [113.0, 114.22], [136.0, 145.44], [152.0, 154.97], [157.0, 165.97], [166.0, 170.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.83, 0.0, 0.0, 0.0, 0.0, 56.03, 0.0, 53.59, 0.0, 0.0, 90.6, 74.13, 82.61, 58.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 1.4, 1.09, 1.53, 0.95, 0.27, -0.22, 0.63, 1.1, -0.08, 0.6, 4.54, 1.29, 1.83, 1.49, 0.08, 3.78, 0.71, 2.32, 0.59, 1.22, 9.44, 2.97, 8.97, 4.82]} \ No newline at end of file diff --git a/annotations_1/F70k-PX3p0o_filtered.json b/annotations_1/F70k-PX3p0o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d496ba36a67b21c8ba7f1600a234c676427204cb --- /dev/null +++ b/annotations_1/F70k-PX3p0o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.09], [22.0, 21.98], [25.0, 27.58], [31.0, 40.04], [42.0, 43.73], [46.0, 55.16], [57.0, 78.75], [80.0, 81.33], [84.0, 86.1], [89.0, 89.72], [92.0, 94.15], [96.0, 102.22], [106.0, 126.25], [127.0, 131.45], [132.0, 139.73], [141.0, 150.3], [153.0, 156.46], [157.0, 160.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 91.3, 85.9, 0.0, 75.55, 60.42, 0.0, 98.1, 0.0, 99.82, 78.55, 61.97, 95.78, 81.17, 65.44, 99.52, 99.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.09, -0.02, 2.58, 9.04, 1.73, 9.16, 21.75, 1.33, 2.1, 0.72, 2.15, 6.22, 20.25, 4.45, 7.73, 9.3, 3.46, 3.62]} \ No newline at end of file diff --git a/annotations_1/F8UwjJzF4LY_filtered.json b/annotations_1/F8UwjJzF4LY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26bcc97f88c5e49e6960b52b2248b920af1d9788 --- /dev/null +++ b/annotations_1/F8UwjJzF4LY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.08], [17.0, 17.37], [25.0, 30.4], [31.0, 35.55], [36.0, 71.64], [75.0, 75.66], [88.0, 108.7], [110.0, 110.61], [113.0, 142.67], [144.0, 145.02], [145.0, 145.15]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.34, 33.69, 0.0, 0.0, 33.16, 0.0, 32.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["fly, housefly", 63.32], ["insect", 20.96], ["mosquito", 15.05]], [["speech", 42.01], ["music", 20.19], ["hum", 5.13]], null, null, [["music", 67.47], ["speech", 2.77], ["theremin", 2.13]], null, [["music", 43.33], ["speech", 31.98], ["boing", 13.06]], null, null], "duration": [1.08, 0.37, 5.4, 4.55, 35.64, 0.66, 20.7, 0.61, 29.67, 1.02, 0.15]} \ No newline at end of file diff --git a/annotations_1/F8Y0hCMWyFg_filtered.json b/annotations_1/F8Y0hCMWyFg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02c4c178da27d62fc01e8e72b150e3975b4667d5 --- /dev/null +++ b/annotations_1/F8Y0hCMWyFg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.28], [15.0, 14.98], [27.0, 27.01], [31.0, 72.44], [74.0, 90.85], [92.0, 93.93], [96.0, 97.16], [99.0, 99.44], [102.0, 103.96], [105.0, 107.74], [109.0, 109.59], [113.0, 114.94], [116.0, 117.36], [118.0, 119.64], [120.0, 122.42], [126.0, 127.18], [129.0, 128.8], [130.0, 132.0], [135.0, 135.24], [139.0, 139.5], [145.0, 145.45], [147.0, 150.53], [152.0, 155.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.8, 0.0, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 60.51, 0.0, 0.0, 90.08, 0.0, 0.0, 0.0, 64.97, 92.15], "audiomae_on_audioset": [null, null, null, null, [["music", 76.63], ["speech", 3.93], ["hum", 3.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.28, -0.02, 0.01, 41.44, 16.85, 1.93, 1.16, 0.44, 1.96, 2.74, 0.59, 1.94, 1.36, 1.64, 2.42, 1.18, -0.2, 2.0, 0.24, 0.5, 0.45, 3.53, 3.24]} \ No newline at end of file diff --git a/annotations_1/F8q-K4BTbEk_filtered.json b/annotations_1/F8q-K4BTbEk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b18b979b6833b66fad9efcb36b035f87caf527c --- /dev/null +++ b/annotations_1/F8q-K4BTbEk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.16], [5.0, 5.97], [9.0, 10.4], [16.0, 18.0], [18.0, 20.16], [20.0, 21.88], [23.0, 23.75], [25.0, 25.0], [27.0, 27.36], [30.0, 30.42], [32.0, 33.99], [39.0, 39.39], [42.0, 42.67], [51.0, 52.2], [53.0, 53.4], [54.0, 54.57], [55.0, 56.49], [57.0, 60.2], [63.0, 65.37], [67.0, 72.17], [74.0, 74.09], [75.0, 74.92], [76.0, 76.67], [78.0, 79.24], [80.0, 83.1], [85.0, 85.45], [87.0, 87.15], [89.0, 89.36], [90.0, 92.33], [92.0, 93.53]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 87.19, 44.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.97, 69.47, 54.5, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 35.87, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 20.25], ["speech", 19.29], ["hum", 4.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 34.09], ["sidetone", 18.9], ["speech", 10.9]], null], "duration": [1.16, 0.97, 1.4, 2.0, 2.16, 1.88, 0.75, 0.0, 0.36, 0.42, 1.99, 0.39, 0.67, 1.2, 0.4, 0.57, 1.49, 3.2, 2.37, 5.17, 0.09, -0.08, 0.67, 1.24, 3.1, 0.45, 0.15, 0.36, 2.33, 1.53]} \ No newline at end of file diff --git a/annotations_1/F8vcszMAya4_filtered.json b/annotations_1/F8vcszMAya4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..755a1bec042391c0211db214d1c9b90433b9d15f --- /dev/null +++ b/annotations_1/F8vcszMAya4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [6.0, 6.91], [8.0, 9.22], [11.0, 13.66], [16.0, 18.12], [22.0, 24.11], [26.0, 27.45], [28.0, 36.71], [41.0, 40.96], [47.0, 46.95], [50.0, 50.38], [58.0, 59.17], [60.0, 60.62], [64.0, 65.5], [67.0, 72.52], [76.0, 76.79], [81.0, 82.63], [83.0, 86.07], [88.0, 88.01], [98.0, 99.12], [100.0, 101.26], [102.0, 103.54], [111.0, 112.06], [113.0, 114.35], [115.0, 115.26], [116.0, 117.31], [118.0, 118.27], [123.0, 124.7], [132.0, 132.93], [147.0, 147.99], [153.0, 153.87], [155.0, 156.12], [158.0, 159.14], [161.0, 162.04], [163.0, 164.17], [165.0, 165.18], [167.0, 167.58], [170.0, 170.13], [172.0, 173.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.8, 90.25, 90.25, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 0.0, 0.0, 91.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.42, 0.91, 1.22, 2.66, 2.12, 2.11, 1.45, 8.71, -0.04, -0.05, 0.38, 1.17, 0.62, 1.5, 5.52, 0.79, 1.63, 3.07, 0.01, 1.12, 1.26, 1.54, 1.06, 1.35, 0.26, 1.31, 0.27, 1.7, 0.93, 0.99, 0.87, 1.12, 1.14, 1.04, 1.17, 0.18, 0.58, 0.13, 1.57]} \ No newline at end of file diff --git a/annotations_1/F9ScROJxATc_filtered.json b/annotations_1/F9ScROJxATc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e197a378a5346c11f6e753bb9032c606b89b31eb --- /dev/null +++ b/annotations_1/F9ScROJxATc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.94], [7.0, 6.84], [8.0, 8.41], [13.0, 13.51], [16.0, 16.85], [20.0, 20.66], [22.0, 23.28], [30.0, 30.69], [36.0, 37.67], [45.0, 45.81], [46.0, 48.07], [52.0, 52.88], [56.0, 56.67], [65.0, 65.77], [103.0, 103.35], [120.0, 120.07], [129.0, 130.32], [131.0, 131.9], [133.0, 133.71], [140.0, 141.24], [142.0, 142.84], [149.0, 148.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.94, -0.16, 0.41, 0.51, 0.85, 0.66, 1.28, 0.69, 1.67, 0.81, 2.07, 0.88, 0.67, 0.77, 0.35, 0.07, 1.32, 0.9, 0.71, 1.24, 0.84, -0.14]} \ No newline at end of file diff --git a/annotations_1/F9vKkW_NNjE_filtered.json b/annotations_1/F9vKkW_NNjE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01e9a452453229efe8336e6688470ce0c856371e --- /dev/null +++ b/annotations_1/F9vKkW_NNjE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 16.34], [20.0, 21.41], [26.0, 28.02], [37.0, 37.22], [38.0, 41.25], [49.0, 50.82], [53.0, 57.43], [62.0, 65.03], [65.0, 71.93], [75.0, 80.97], [82.0, 104.53], [107.0, 113.63], [114.0, 117.9], [122.0, 122.82]], "keep_status": [false, false, true, false, true, false, false, false, true, true, false, false, true, false], "silence_prob": [30.04, 0.0, 31.96, 0.0, 42.81, 0.0, 58.64, 71.87, 30.83, 36.52, 32.56, 32.85, 42.62, 0.0], "audiomae_on_audioset": [[["music", 67.39], ["speech", 13.57], ["salsa music", 1.92]], null, [["music", 53.85], ["speech", 10.59], ["musical instrument", 4.48]], null, [["music", 35.73], ["speech", 23.83], ["synthesizer", 2.34]], null, null, null, [["speech", 32.0], ["music", 17.03], ["sidetone", 9.92]], [["music", 20.36], ["boing", 11.77], ["whale vocalization", 8.54]], [["music", 33.76], ["didgeridoo", 30.03], ["speech", 13.67]], [["music", 37.4], ["foghorn", 24.05], ["speech", 9.44]], [["music", 51.84], ["speech", 12.75], ["didgeridoo", 2.83]], null], "duration": [10.34, 1.41, 2.02, 0.22, 3.25, 1.82, 4.43, 3.03, 6.93, 5.97, 22.53, 6.63, 3.9, 0.82]} \ No newline at end of file diff --git a/annotations_1/FAAKfmF5Jl4_filtered.json b/annotations_1/FAAKfmF5Jl4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ed7b3bca9c9a2dd5d41b5485c83f1fce949b264 --- /dev/null +++ b/annotations_1/FAAKfmF5Jl4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.97], [12.0, 13.02], [16.0, 18.18], [20.0, 22.15], [23.0, 24.85], [25.0, 26.18], [30.0, 30.2], [34.0, 34.26], [39.0, 39.46], [40.0, 40.0], [42.0, 41.66], [59.0, 59.21], [66.0, 66.73], [70.0, 70.07], [74.0, 74.36], [81.0, 81.92], [88.0, 87.84], [96.0, 96.65], [100.0, 100.36], [106.0, 107.27], [123.0, 124.93], [125.0, 126.05], [130.0, 135.9], [139.0, 141.52], [142.0, 146.43], [147.0, 149.59], [151.0, 150.87], [153.0, 156.27], [157.0, 157.38], [160.0, 160.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.85, 80.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.85, 79.41, 62.58, 53.84, 0.0, 37.02, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 25.18], ["laughter", 18.45], ["music", 16.15]], null, null, null, null, [["speech", 57.5], ["thunk", 13.51], ["music", 13.19]], null, null], "duration": [-0.03, 1.02, 2.18, 2.15, 1.85, 1.18, 0.2, 0.26, 0.46, 0.0, -0.34, 0.21, 0.73, 0.07, 0.36, 0.92, -0.16, 0.65, 0.36, 1.27, 1.93, 1.05, 5.9, 2.52, 4.43, 2.59, -0.13, 3.27, 0.38, 0.81]} \ No newline at end of file diff --git a/annotations_1/FAK7ssvx3oE_filtered.json b/annotations_1/FAK7ssvx3oE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ead67366462a70269781f0bf0d66ef27c092b6d --- /dev/null +++ b/annotations_1/FAK7ssvx3oE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.94], [5.0, 4.97], [13.0, 56.22], [60.0, 83.74], [88.0, 88.59], [90.0, 89.99], [94.0, 94.15], [97.0, 100.47], [102.0, 102.93], [103.0, 120.45], [123.0, 126.98], [135.0, 135.8], [138.0, 140.07], [142.0, 142.97], [152.0, 152.73], [155.0, 156.34]], "keep_status": [false, false, false, false, false, false, false, true, false, true, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.97, 0.0, 0.0, 0.0, 32.5, 0.0, 32.58, 33.38, 0.0, 35.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 73.53], ["musical instrument", 4.37], ["guitar", 3.06]], null, null, null, [["music", 49.31], ["musical instrument", 12.39], ["guitar", 6.76]], null, [["music", 52.44], ["guitar", 6.96], ["musical instrument", 6.58]], [["music", 35.94], ["synthesizer", 18.61], ["theremin", 15.32]], null, [["music", 51.31], ["guitar", 9.18], ["musical instrument", 8.37]], null, null, null], "duration": [0.94, -0.03, 43.22, 23.74, 0.59, -0.01, 0.15, 3.47, 0.93, 17.45, 3.98, 0.8, 2.07, 0.97, 0.73, 1.34]} \ No newline at end of file diff --git a/annotations_1/FAmaskY8eXE_filtered.json b/annotations_1/FAmaskY8eXE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b8d3ca34dbdd4cad12c7855c8fb9ec291423f72 --- /dev/null +++ b/annotations_1/FAmaskY8eXE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.82], [10.0, 11.06], [14.0, 16.77], [22.0, 27.67], [28.0, 30.6], [34.0, 37.76], [39.0, 43.31], [44.0, 47.83], [51.0, 51.95], [55.0, 56.37], [58.0, 63.05], [63.0, 64.18], [68.0, 71.9], [73.0, 73.03], [76.0, 79.51], [81.0, 80.76], [82.0, 82.53], [84.0, 87.05], [89.0, 94.63], [96.0, 97.31], [100.0, 100.6], [105.0, 106.93], [110.0, 110.37], [113.0, 113.58], [118.0, 120.12], [122.0, 122.59], [124.0, 126.32], [130.0, 132.27], [136.0, 138.43], [141.0, 140.81], [153.0, 155.17], [158.0, 167.17], [173.0, 177.2], [180.0, 181.41], [182.0, 183.83], [184.0, 186.61], [188.0, 190.88], [194.0, 194.75], [195.0, 201.12], [202.0, 202.61], [205.0, 209.21], [212.0, 213.24], [216.0, 217.56], [221.0, 222.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 99.98, 100.0, 100.0, 100.0, 78.21, 100.0, 0.0, 0.0, 85.54, 0.0, 94.22, 0.0, 88.64, 0.0, 0.0, 96.17, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 65.2, 0.0, 50.66, 52.05, 41.38, 0.0, 49.54, 32.43, 33.62, 0.0, 0.0, 36.84, 33.45, 0.0, 59.33, 0.0, 98.36, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 57.76], ["theremin", 4.19], ["synthesizer", 2.61]], null, [["music", 49.38], ["musical instrument", 6.78], ["plucked string instrument", 5.29]], [["music", 70.69], ["mantra", 8.35], ["cello", 3.57]], [["music", 69.07], ["mantra", 6.86], ["cello", 2.47]], null, null, [["music", 55.26], ["mantra", 6.23], ["accordion", 5.23]], [["music", 64.89], ["mantra", 4.79], ["singing", 1.98]], null, null, null, null, null, null, null], "duration": [5.82, 1.06, 2.77, 5.67, 2.6, 3.76, 4.31, 3.83, 0.95, 1.37, 5.05, 1.18, 3.9, 0.03, 3.51, -0.24, 0.53, 3.05, 5.63, 1.31, 0.6, 1.93, 0.37, 0.58, 2.12, 0.59, 2.32, 2.27, 2.43, -0.19, 2.17, 9.17, 4.2, 1.41, 1.83, 2.61, 2.88, 0.75, 6.12, 0.61, 4.21, 1.24, 1.56, 1.71]} \ No newline at end of file diff --git a/annotations_1/FAnP3FAu5sU_filtered.json b/annotations_1/FAnP3FAu5sU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4791d92f79d8969ec49f57932e6373a12193ae84 --- /dev/null +++ b/annotations_1/FAnP3FAu5sU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.64], [3.0, 30.87], [32.0, 32.56], [33.0, 34.13], [37.0, 37.56], [38.0, 38.97], [40.0, 44.0], [46.0, 47.28], [48.0, 81.19], [82.0, 82.48], [82.0, 85.33], [91.0, 91.93], [95.0, 95.99], [104.0, 106.08], [107.0, 107.81], [111.0, 111.74], [113.0, 113.39], [118.0, 118.49], [120.0, 122.13], [124.0, 125.52]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 71.29, 0.0, 0.0, 0.0, 0.0, 49.59, 0.0, 0.0, 0.0, 30.96, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 37.52], ["glass", 11.42], ["hum", 8.03]], null, null, null, [["speech", 41.74], ["music", 13.17], ["cattle, bovinae", 8.84]], null, null, null, null, null, null, null, null, null], "duration": [-0.36, 27.87, 0.56, 1.13, 0.56, 0.97, 4.0, 1.28, 33.19, 0.48, 3.33, 0.93, 0.99, 2.08, 0.81, 0.74, 0.39, 0.49, 2.13, 1.52]} \ No newline at end of file diff --git a/annotations_1/FBpdDE96XhE_filtered.json b/annotations_1/FBpdDE96XhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47eae897494abd6abe1fea8b3f1561a3786d3749 --- /dev/null +++ b/annotations_1/FBpdDE96XhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.13], [6.0, 6.07], [10.0, 10.15], [14.0, 56.4], [58.0, 60.49], [61.0, 60.62]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 46.9, 0.0], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 37.96], ["music", 23.72], ["didgeridoo", 7.74]], null], "duration": [1.13, 0.07, 0.15, 42.4, 2.49, -0.38]} \ No newline at end of file diff --git a/annotations_1/FBpzRIzISeY_filtered.json b/annotations_1/FBpzRIzISeY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17d8a66ee0f40c379dbc72963f704f81f104e0de --- /dev/null +++ b/annotations_1/FBpzRIzISeY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.67], [6.0, 7.99], [10.0, 12.7], [32.0, 31.85], [42.0, 44.04], [46.0, 48.15], [49.0, 51.31], [54.0, 56.27], [57.0, 58.78], [61.0, 61.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 99.99, 100.0, 100.0, 99.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [-0.33, 1.99, 2.7, -0.15, 2.04, 2.15, 2.31, 2.27, 1.78, 0.42]} \ No newline at end of file diff --git a/annotations_1/FC9AZFwoLVg_filtered.json b/annotations_1/FC9AZFwoLVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f98a594b207960fd02b465e432df0f22442afb2f --- /dev/null +++ b/annotations_1/FC9AZFwoLVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.13], [4.0, 6.1], [7.0, 20.87], [22.0, 27.62], [30.0, 37.71], [40.0, 42.82], [44.0, 44.61], [62.0, 62.38], [81.0, 81.85], [90.0, 91.71], [133.0, 133.56], [134.0, 135.46]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.48, 88.64, 37.34, 53.72, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 40.65], ["music", 17.83], ["didgeridoo", 11.39]], null, null, null, null, null, null, null, null], "duration": [0.13, 2.1, 13.87, 5.62, 7.71, 2.82, 0.61, 0.38, 0.85, 1.71, 0.56, 1.46]} \ No newline at end of file diff --git a/annotations_1/FCJSJ2xtky8_filtered.json b/annotations_1/FCJSJ2xtky8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a41c4ed8d3950d4175fd36e60d43b77f43c14c00 --- /dev/null +++ b/annotations_1/FCJSJ2xtky8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.43], [11.0, 12.01], [12.0, 14.0], [15.0, 16.36], [17.0, 19.38], [21.0, 22.45], [25.0, 28.85], [30.0, 33.2], [35.0, 37.61], [39.0, 39.97], [42.0, 41.94], [46.0, 46.63], [48.0, 50.09], [51.0, 52.02], [55.0, 56.27], [59.0, 61.92], [63.0, 65.53], [66.0, 71.37], [77.0, 77.85], [80.0, 103.62]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 42.69, 0.0, 61.27, 0.0, 64.52, 51.44, 43.1, 0.0, 0.0, 0.0, 47.01, 0.0, 0.0, 67.38, 68.28, 30.31, 0.0, 31.62], "audiomae_on_audioset": [null, null, [["speech", 48.61], ["music", 6.84], ["sidetone", 4.66]], null, null, null, null, null, [["hum", 31.76], ["throbbing", 27.36], ["mains hum", 12.18]], null, null, null, [["music", 37.38], ["didgeridoo", 11.4], ["percussion", 10.28]], null, null, null, null, [["speech", 40.83], ["music", 26.98], ["groan", 4.78]], null, [["music", 51.07], ["whale vocalization", 8.7], ["synthesizer", 6.54]]], "duration": [1.43, 1.01, 2.0, 1.36, 2.38, 1.45, 3.85, 3.2, 2.61, 0.97, -0.06, 0.63, 2.09, 1.02, 1.27, 2.92, 2.53, 5.37, 0.85, 23.62]} \ No newline at end of file diff --git a/annotations_1/FE42Xc_laYU_filtered.json b/annotations_1/FE42Xc_laYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32acbe4d228190e788cad0d91301c46888acb038 --- /dev/null +++ b/annotations_1/FE42Xc_laYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.44], [24.0, 25.35], [33.0, 35.24], [36.0, 41.99], [43.0, 44.31], [44.0, 44.42], [45.0, 45.25], [48.0, 48.88], [50.0, 51.93], [54.0, 56.74], [58.0, 60.35], [61.0, 62.07], [64.0, 66.82], [68.0, 69.3], [70.0, 76.2], [76.0, 77.52], [80.0, 82.05], [88.0, 88.57], [93.0, 92.82], [95.0, 99.54], [101.0, 103.87], [107.0, 111.74], [114.0, 115.23], [116.0, 118.32], [119.0, 120.65], [125.0, 125.1], [127.0, 129.84], [132.0, 133.34], [135.0, 135.24], [135.0, 143.38]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, true, false, true, false, true, false, false, false, true, true, false, true, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 44.37, 50.46, 0.0, 0.0, 0.0, 0.0, 0.0, 46.83, 51.12, 0.0, 46.26, 0.0, 37.07, 0.0, 47.9, 0.0, 0.0, 53.84, 47.86, 44.66, 0.0, 44.93, 0.0, 0.0, 46.02, 0.0, 0.0, 32.5], "audiomae_on_audioset": [null, null, [["speech", 42.49], ["music", 12.35], ["dial tone", 9.92]], null, null, null, null, null, null, [["music", 45.49], ["electronic music", 9.86], ["gong", 9.58]], null, null, [["music", 33.66], ["hum", 22.27], ["mains hum", 12.75]], null, [["speech", 38.59], ["hum", 14.35], ["music", 12.85]], null, [["music", 45.19], ["ambient music", 11.33], ["hum", 6.09]], null, null, null, [["speech", 36.84], ["music", 25.42], ["hum", 4.23]], [["sonar", 23.87], ["music", 21.73], ["hum", 14.17]], null, [["music", 38.11], ["pulse", 6.23], ["electronic music", 6.06]], null, null, [["music", 29.3], ["theremin", 14.67], ["whale vocalization", 12.48]], null, null, [["speech", 29.65], ["quack", 8.82], ["music", 8.25]]], "duration": [1.44, 1.35, 2.24, 5.99, 1.31, 0.42, 0.25, 0.88, 1.93, 2.74, 2.35, 1.07, 2.82, 1.3, 6.2, 1.52, 2.05, 0.57, -0.18, 4.54, 2.87, 4.74, 1.23, 2.32, 1.65, 0.1, 2.84, 1.34, 0.24, 8.38]} \ No newline at end of file diff --git a/annotations_1/FETaRGJH_JE_filtered.json b/annotations_1/FETaRGJH_JE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83dc23dd19bd9bd9a59383193c83a219b73ef036 --- /dev/null +++ b/annotations_1/FETaRGJH_JE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 30.55], [31.0, 54.13], [55.0, 108.68], [109.0, 112.19], [113.0, 115.92], [118.0, 120.51], [121.0, 122.77], [125.0, 125.96], [127.0, 129.66], [132.0, 132.8], [135.0, 136.34], [139.0, 141.25], [142.0, 159.65]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [38.33, 34.52, 0.0, 41.52, 48.56, 53.1, 0.0, 0.0, 38.15, 0.0, 0.0, 42.53, 30.92], "audiomae_on_audioset": [[["hum", 25.17], ["throbbing", 21.56], ["music", 13.26]], [["music", 74.51], ["theremin", 7.57], ["musical instrument", 2.69]], null, [["music", 35.37], ["speech", 30.31], ["singing bowl", 5.08]], [["music", 61.16], ["musical instrument", 11.23], ["percussion", 4.13]], null, null, null, [["music", 35.57], ["speech", 23.95], ["whale vocalization", 5.14]], null, null, [["music", 45.09], ["hum", 16.44], ["throbbing", 8.49]], [["music", 67.11], ["throbbing", 13.5], ["hum", 5.8]]], "duration": [3.55, 23.13, 53.68, 3.19, 2.92, 2.51, 1.77, 0.96, 2.66, 0.8, 1.34, 2.25, 17.65]} \ No newline at end of file diff --git a/annotations_1/FEiK98h1IDc_filtered.json b/annotations_1/FEiK98h1IDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70d23497c23b229910474a0a0f8e00db8daa5baa --- /dev/null +++ b/annotations_1/FEiK98h1IDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [8.0, 8.24], [11.0, 12.53], [15.0, 16.11], [17.0, 21.81], [24.0, 26.25], [27.0, 71.73], [74.0, 81.06], [82.0, 83.32], [85.0, 89.94], [94.0, 98.47], [100.0, 102.59], [103.0, 109.63], [112.0, 134.62], [137.0, 159.68], [161.0, 168.44], [173.0, 180.12], [182.0, 188.54], [190.0, 190.63]], "keep_status": [false, false, false, false, true, false, false, true, false, true, true, false, false, true, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 48.65, 85.17, 0.0, 38.78, 0.0, 31.11, 33.77, 34.79, 32.41, 30.5, 31.91, 34.21, 33.63, 33.1, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 49.15], ["ambient music", 6.12], ["hum", 5.81]], null, null, [["fly, housefly", 18.58], ["speech", 15.71], ["whack, thwack", 12.28]], null, [["speech", 28.92], ["hum", 25.23], ["mains hum", 13.68]], [["didgeridoo", 30.84], ["music", 27.8], ["fly, housefly", 6.6]], [["music", 37.42], ["throbbing", 27.29], ["hum", 20.29]], [["music", 49.94], ["throbbing", 10.15], ["hum", 10.04]], [["music", 47.66], ["hum", 13.35], ["throbbing", 7.24]], [["music", 46.49], ["hum", 11.68], ["throbbing", 5.29]], [["music", 20.9], ["whack, thwack", 20.72], ["throbbing", 11.3]], [["meow", 37.96], ["cat", 27.58], ["domestic animals, pets", 12.8]], [["music", 32.21], ["groan", 12.94], ["livestock, farm animals, working animals", 9.02]], null], "duration": [0.88, 0.24, 1.53, 1.11, 4.81, 2.25, 44.73, 7.06, 1.32, 4.94, 4.47, 2.59, 6.63, 22.62, 22.68, 7.44, 7.12, 6.54, 0.63]} \ No newline at end of file diff --git a/annotations_1/FFnlaQlI1So_filtered.json b/annotations_1/FFnlaQlI1So_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97ed346fee1833fc0a417579e6c451213a9ceb4d --- /dev/null +++ b/annotations_1/FFnlaQlI1So_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.36], [13.0, 17.04], [18.0, 19.5], [52.0, 53.0], [54.0, 55.56], [57.0, 57.43], [66.0, 67.29], [68.0, 69.8], [72.0, 73.84], [77.0, 78.87], [85.0, 85.87], [102.0, 106.19], [110.0, 110.86], [121.0, 120.87], [133.0, 134.6], [140.0, 141.47]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.56, 46.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.11, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 25.87], ["singing bowl", 18.45], ["music", 13.04]], [["hum", 51.17], ["rumble", 11.87], ["throbbing", 11.43]], null, null, null, null, null, null, null, null, null, [["sidetone", 46.81], ["speech", 15.15], ["didgeridoo", 10.35]], null, null, null, null], "duration": [2.36, 4.04, 1.5, 1.0, 1.56, 0.43, 1.29, 1.8, 1.84, 1.87, 0.87, 4.19, 0.86, -0.13, 1.6, 1.47]} \ No newline at end of file diff --git a/annotations_1/FFnyDGETjzA_filtered.json b/annotations_1/FFnyDGETjzA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65db317cfe5a249091da4aeb8415b8f8bdfc9e0e --- /dev/null +++ b/annotations_1/FFnyDGETjzA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.18], [17.0, 26.96], [31.0, 31.8], [35.0, 36.66], [38.0, 37.98], [44.0, 45.3], [50.0, 50.35], [52.0, 52.44], [59.0, 58.78], [87.0, 86.75], [90.0, 91.49], [93.0, 94.22], [99.0, 100.01], [108.0, 108.9], [110.0, 111.81], [114.0, 135.95], [136.0, 137.86], [140.0, 151.12], [152.0, 178.02], [181.0, 189.62], [192.0, 201.41]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [37.72, 38.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.02, 0.0, 31.64, 31.09, 30.8, 31.26], "audiomae_on_audioset": [[["hum", 30.44], ["mains hum", 12.69], ["throbbing", 8.79]], [["hum", 39.81], ["mains hum", 32.3], ["music", 10.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.21], ["speech", 19.71], ["hum", 4.24]], null, [["music", 59.76], ["smash, crash", 11.87], ["speech", 2.69]], [["music", 54.9], ["buzz", 14.68], ["livestock, farm animals, working animals", 4.58]], [["music", 33.78], ["hum", 13.51], ["throbbing", 12.39]], [["music", 38.8], ["electric shaver, electric razor", 13.26], ["livestock, farm animals, working animals", 6.08]]], "duration": [2.18, 9.96, 0.8, 1.66, -0.02, 1.3, 0.35, 0.44, -0.22, -0.25, 1.49, 1.22, 1.01, 0.9, 1.81, 21.95, 1.86, 11.12, 26.02, 8.62, 9.41]} \ No newline at end of file diff --git a/annotations_1/FFvaLp9s1p0_filtered.json b/annotations_1/FFvaLp9s1p0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6edcdecee0073ed2c579294e720772b8a593dd4b --- /dev/null +++ b/annotations_1/FFvaLp9s1p0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.96], [3.0, 3.08], [3.0, 7.74], [11.0, 28.8], [29.0, 30.0], [31.0, 54.46], [54.0, 54.51], [55.0, 79.69], [85.0, 112.33], [116.0, 118.76]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 58.38, 37.95, 0.0, 38.76, 0.0, 47.74, 32.34, 45.18], "audiomae_on_audioset": [null, null, null, [["music", 64.66], ["throbbing", 10.02], ["hum", 6.95]], null, [["speech", 63.07], ["sidetone", 14.87], ["music", 13.51]], null, [["music", 32.84], ["hum", 23.91], ["throbbing", 23.47]], [["music", 56.41], ["speech", 18.87], ["noise", 2.71]], [["music", 26.86], ["speech", 26.13], ["synthesizer", 6.86]]], "duration": [-0.04, 0.08, 4.74, 17.8, 1.0, 23.46, 0.51, 24.69, 27.33, 2.76]} \ No newline at end of file diff --git a/annotations_1/FGL4-sXko9w_filtered.json b/annotations_1/FGL4-sXko9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddb68513ae2d49578a086168b936267750094ea8 --- /dev/null +++ b/annotations_1/FGL4-sXko9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 51.36], [53.0, 69.74], [76.0, 90.58], [96.0, 122.74], [123.0, 126.79], [129.0, 130.44], [134.0, 134.7], [136.0, 136.49]], "keep_status": [false, true, true, false, true, false, false, false], "silence_prob": [0.0, 28.19, 28.39, 28.23, 30.96, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.48], ["explosion", 5.53], ["cacophony", 3.9]], [["whip", 12.91], ["music", 12.69], ["rumble", 10.77]], [["smash, crash", 29.64], ["music", 27.48], ["breaking", 15.44]], [["music", 19.33], ["thunk", 13.4], ["didgeridoo", 5.47]], null, null, null], "duration": [46.36, 16.74, 14.58, 26.74, 3.79, 1.44, 0.7, 0.49]} \ No newline at end of file diff --git a/annotations_1/FGLxQHJ5NEs_filtered.json b/annotations_1/FGLxQHJ5NEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d706de673f7c5e2fe9f3f1ad6f4047512547dd6 --- /dev/null +++ b/annotations_1/FGLxQHJ5NEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.11], [9.0, 9.53], [11.0, 12.09], [14.0, 15.63], [17.0, 17.73], [19.0, 19.72], [20.0, 21.24], [22.0, 22.81], [23.0, 25.19], [26.0, 27.48], [29.0, 29.62], [33.0, 33.42], [35.0, 35.34], [36.0, 36.93], [45.0, 46.01], [53.0, 60.0], [62.0, 62.07], [64.0, 64.35], [82.0, 83.46], [85.0, 87.83], [89.0, 89.95], [93.0, 93.63], [95.0, 96.48], [98.0, 98.27], [101.0, 104.04]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.18, 0.0, 0.0, 0.0, 39.82, 0.0, 0.0, 0.0, 0.0, 40.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 24.24], ["hum", 18.6], ["speech", 8.72]], null, null, null, null, null, null, [["throbbing", 41.59], ["hum", 21.29], ["music", 20.63]], null, null, null, [["hum", 31.38], ["music", 30.76], ["mains hum", 8.77]], null, null, null, null, [["music", 36.34], ["hum", 25.4], ["throbbing", 16.26]]], "duration": [1.11, 0.53, 1.09, 1.63, 0.73, 0.72, 1.24, 0.81, 2.19, 1.48, 0.62, 0.42, 0.34, 0.93, 1.01, 7.0, 0.07, 0.35, 1.46, 2.83, 0.95, 0.63, 1.48, 0.27, 3.04]} \ No newline at end of file diff --git a/annotations_1/FGWPKiI0YJQ_filtered.json b/annotations_1/FGWPKiI0YJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa5aca9d8c40c67c6e5993f5e032a310c52daab8 --- /dev/null +++ b/annotations_1/FGWPKiI0YJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 22.79], [30.0, 30.59], [35.0, 37.49], [43.0, 43.14], [52.0, 52.17], [56.0, 56.34], [73.0, 73.77]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [33.7, 0.0, 55.89, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 79.26], ["sampler", 3.58], ["synthesizer", 2.56]], null, null, null, null, null, null], "duration": [9.79, 0.59, 2.49, 0.14, 0.17, 0.34, 0.77]} \ No newline at end of file diff --git a/annotations_1/FGwgHAqBLDY_filtered.json b/annotations_1/FGwgHAqBLDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab5ed88539218ae377b1f14d9d159054c4b5cf23 --- /dev/null +++ b/annotations_1/FGwgHAqBLDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.49], [10.0, 18.76], [21.0, 21.27], [26.0, 27.77], [31.0, 33.45], [39.0, 39.88], [45.0, 48.51], [52.0, 52.95], [54.0, 62.18], [63.0, 63.59], [67.0, 68.54], [73.0, 73.85], [88.0, 97.97], [101.0, 109.51], [111.0, 116.72], [118.0, 118.96], [122.0, 121.68], [133.0, 133.37], [136.0, 136.7], [139.0, 145.94], [151.0, 153.18]], "keep_status": [false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.71, 0.0, 0.0, 31.8, 0.0, 32.31, 0.0, 33.84, 0.0, 0.0, 0.0, 31.84, 31.56, 32.63, 0.0, 0.0, 0.0, 0.0, 30.97, 51.12], "audiomae_on_audioset": [null, [["music", 54.4], ["speech", 7.55], ["whack, thwack", 5.94]], null, null, [["music", 27.28], ["smash, crash", 16.0], ["boing", 9.67]], null, [["music", 20.35], ["boing", 12.41], ["clang", 5.12]], null, [["music", 68.9], ["boing", 8.34], ["theremin", 2.32]], null, null, null, [["music", 55.5], ["boing", 19.65], ["speech", 7.74]], [["music", 74.84], ["synthesizer", 6.03], ["cacophony", 4.95]], [["music", 72.18], ["sonar", 9.0], ["musical instrument", 2.87]], null, null, null, null, [["music", 79.07], ["musical instrument", 3.49], ["mains hum", 2.61]], null], "duration": [0.49, 8.76, 0.27, 1.77, 2.45, 0.88, 3.51, 0.95, 8.18, 0.59, 1.54, 0.85, 9.97, 8.51, 5.72, 0.96, -0.32, 0.37, 0.7, 6.94, 2.18]} \ No newline at end of file diff --git a/annotations_1/FHeC_tenzrw_filtered.json b/annotations_1/FHeC_tenzrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af9fa5cb145e15b68053e1b71c06ea1d19bbb96f --- /dev/null +++ b/annotations_1/FHeC_tenzrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.08], [14.0, 17.64], [26.0, 26.84], [28.0, 28.61], [29.0, 35.56], [39.0, 42.67], [46.0, 53.57], [55.0, 56.08], [58.0, 81.48], [84.0, 84.1], [87.0, 93.8], [94.0, 109.58], [110.0, 115.42]], "keep_status": [false, false, false, false, false, true, true, false, true, false, true, true, false], "silence_prob": [0.0, 31.2, 0.0, 0.0, 27.97, 27.88, 28.15, 0.0, 28.24, 0.0, 30.84, 28.52, 28.16], "audiomae_on_audioset": [null, [["hum", 36.94], ["music", 17.56], ["throbbing", 16.93]], null, null, [["speech", 62.57], ["mains hum", 7.97], ["hum", 6.39]], [["music", 30.14], ["speech", 11.24], ["hum", 10.83]], [["music", 43.6], ["speech", 17.86], ["animal", 2.83]], null, [["mains hum", 20.45], ["hum", 17.78], ["music", 12.55]], null, [["music", 43.67], ["whale vocalization", 16.07], ["rumble", 8.04]], [["music", 43.7], ["hum", 9.42], ["throbbing", 8.61]], [["speech", 63.12], ["mains hum", 5.74], ["hum", 4.23]]], "duration": [1.08, 3.64, 0.84, 0.61, 6.56, 3.67, 7.57, 1.08, 23.48, 0.1, 6.8, 15.58, 5.42]} \ No newline at end of file diff --git a/annotations_1/FHiB0ZTO8fU_filtered.json b/annotations_1/FHiB0ZTO8fU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d34fad7121d62dcce6176c402ed78a5b12a039a --- /dev/null +++ b/annotations_1/FHiB0ZTO8fU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.83], [6.0, 29.37], [33.0, 34.79], [35.0, 45.0], [50.0, 57.21], [63.0, 64.23], [71.0, 71.68], [73.0, 77.67], [80.0, 81.3], [82.0, 81.77], [82.0, 82.04], [82.0, 82.07], [82.0, 82.38], [82.0, 82.41], [82.0, 82.48], [82.0, 83.2], [89.0, 90.07], [94.0, 94.31], [103.0, 103.64], [116.0, 120.95], [122.0, 128.17], [132.0, 133.57]], "keep_status": [false, true, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 41.1, 0.0, 38.06, 36.16, 0.0, 0.0, 38.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.89, 31.8, 0.0], "audiomae_on_audioset": [null, [["music", 23.24], ["glockenspiel", 16.43], ["marimba, xylophone", 14.19]], null, [["music", 77.59], ["musical instrument", 2.55], ["vibraphone", 2.25]], [["music", 55.66], ["musical instrument", 7.13], ["effects unit", 4.0]], null, null, [["speech", 54.39], ["fart", 5.29], ["fly, housefly", 4.02]], null, null, null, null, null, null, null, null, null, null, null, [["animal", 40.49], ["speech", 16.56], ["sheep", 10.59]], [["speech", 47.43], ["music", 12.59], ["livestock, farm animals, working animals", 6.1]], null], "duration": [1.83, 23.37, 1.79, 10.0, 7.21, 1.23, 0.68, 4.67, 1.3, -0.23, 0.04, 0.07, 0.38, 0.41, 0.48, 1.2, 1.07, 0.31, 0.64, 4.95, 6.17, 1.57]} \ No newline at end of file diff --git a/annotations_1/FJWgF5XnVLY_filtered.json b/annotations_1/FJWgF5XnVLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..826f9bb7c1e96348d11dd6c1a332b3756785b87f --- /dev/null +++ b/annotations_1/FJWgF5XnVLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.36], [13.0, 12.77], [19.0, 18.84], [21.0, 26.52], [29.0, 29.66], [32.0, 36.76], [38.0, 39.28], [41.0, 54.09]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.23, 0.0, 99.88, 0.0, 94.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.36, -0.23, -0.16, 5.52, 0.66, 4.76, 1.28, 13.09]} \ No newline at end of file diff --git a/annotations_1/FKW1h53hSxs_filtered.json b/annotations_1/FKW1h53hSxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d279bd1a9b462a13c39c1b70273d265dc4cd5c5 --- /dev/null +++ b/annotations_1/FKW1h53hSxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.5], [19.0, 25.3], [30.0, 31.63], [35.0, 36.05], [37.0, 36.9], [38.0, 46.7], [49.0, 70.51], [71.0, 71.49], [72.0, 77.9]], "keep_status": [false, false, false, false, false, true, false, false, true], "silence_prob": [30.77, 29.38, 0.0, 0.0, 0.0, 30.85, 29.3, 0.0, 28.8], "audiomae_on_audioset": [[["music", 42.6], ["throbbing", 20.82], ["hum", 16.97]], [["music", 63.11], ["speech", 5.12], ["whack, thwack", 3.47]], null, null, null, [["music", 54.29], ["speech", 11.91], ["smash, crash", 2.71]], [["music", 86.97], ["electronic music", 2.9], ["theremin", 0.95]], null, [["speech", 46.85], ["music", 17.69], ["trombone", 4.7]]], "duration": [3.5, 6.3, 1.63, 1.05, -0.1, 8.7, 21.51, 0.49, 5.9]} \ No newline at end of file diff --git a/annotations_1/FLPGiFhKS28_filtered.json b/annotations_1/FLPGiFhKS28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3c4b449d92cea6aa393d6aebf7e6d7759c9e9ac --- /dev/null +++ b/annotations_1/FLPGiFhKS28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.36], [18.0, 18.54], [33.0, 34.67], [99.0, 100.68], [113.0, 115.62], [121.0, 123.48], [146.0, 146.94], [148.0, 149.47]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.7, 43.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 83.28], ["speech", 2.11], ["synthesizer", 1.81]], [["music", 46.74], ["speech", 31.79], ["musical instrument", 1.36]], null, null], "duration": [1.36, 0.54, 1.67, 1.68, 2.62, 2.48, 0.94, 1.47]} \ No newline at end of file diff --git a/annotations_1/FLjWVccRPOA_filtered.json b/annotations_1/FLjWVccRPOA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4363cfacd1723b326b56a72ae76372fae8032d4c --- /dev/null +++ b/annotations_1/FLjWVccRPOA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.42], [28.0, 36.05], [37.0, 37.4], [42.0, 41.99], [43.0, 44.61], [47.0, 49.08], [51.0, 52.2], [59.0, 65.67], [75.0, 78.6], [79.0, 79.54], [80.0, 80.81], [81.0, 81.87], [83.0, 83.22], [87.0, 94.9], [96.0, 97.68], [99.0, 101.19], [103.0, 106.93], [108.0, 109.41], [111.0, 113.85], [116.0, 126.69], [127.0, 128.33], [129.0, 134.67], [139.0, 141.79], [143.0, 144.07], [145.0, 147.06], [153.0, 153.35], [155.0, 155.83], [156.0, 156.88], [160.0, 160.69], [164.0, 165.92], [167.0, 168.08], [171.0, 171.66], [173.0, 176.91]], "keep_status": [false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.4, 0.0, 0.0, 0.0, 38.31, 0.0, 34.12, 36.05, 0.0, 0.0, 0.0, 0.0, 31.34, 0.0, 32.08, 33.09, 0.0, 32.46, 32.57, 0.0, 32.91, 35.26, 0.0, 31.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.17], "audiomae_on_audioset": [null, [["music", 24.16], ["hum", 21.98], ["thunk", 16.5]], null, null, null, [["music", 47.34], ["speech", 10.62], ["hum", 8.01]], null, [["speech", 26.62], ["rumble", 23.31], ["music", 10.49]], [["music", 75.45], ["hum", 5.49], ["mains hum", 1.97]], null, null, null, null, [["music", 80.3], ["hum", 3.46], ["soundtrack music", 3.34]], null, [["mains hum", 45.2], ["hum", 16.32], ["music", 12.77]], [["music", 32.39], ["speech", 30.48], ["hum", 12.2]], null, [["speech", 43.89], ["music", 21.72], ["hum", 9.61]], [["hum", 30.54], ["music", 28.84], ["mains hum", 18.12]], null, [["hum", 25.35], ["speech", 16.09], ["mains hum", 15.15]], [["music", 17.57], ["hum", 16.91], ["mains hum", 9.08]], null, [["speech", 57.36], ["fly, housefly", 5.99], ["insect", 5.44]], null, null, null, null, null, null, null, [["hum", 41.34], ["mains hum", 31.12], ["noise", 7.08]]], "duration": [0.42, 8.05, 0.4, -0.01, 1.61, 2.08, 1.2, 6.67, 3.6, 0.54, 0.81, 0.87, 0.22, 7.9, 1.68, 2.19, 3.93, 1.41, 2.85, 10.69, 1.33, 5.67, 2.79, 1.07, 2.06, 0.35, 0.83, 0.88, 0.69, 1.92, 1.08, 0.66, 3.91]} \ No newline at end of file diff --git a/annotations_1/FMDgoOi_HLk_filtered.json b/annotations_1/FMDgoOi_HLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65d46af2f397853ae5574de599bf549cf40539d7 --- /dev/null +++ b/annotations_1/FMDgoOi_HLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.63], [29.0, 44.0], [47.0, 47.83], [54.0, 54.58], [58.0, 59.95], [62.0, 62.41], [63.0, 63.73], [76.0, 76.33], [78.0, 78.06], [82.0, 82.9], [87.0, 87.64], [95.0, 96.25], [99.0, 99.33], [101.0, 101.56], [110.0, 110.83], [115.0, 115.99], [118.0, 119.08], [121.0, 122.55], [123.0, 124.12], [126.0, 127.2], [144.0, 144.37], [153.0, 153.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 39.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 65.22], ["hum", 7.46], ["ambient music", 3.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.63, 15.0, 0.83, 0.58, 1.95, 0.41, 0.73, 0.33, 0.06, 0.9, 0.64, 1.25, 0.33, 0.56, 0.83, 0.99, 1.08, 1.55, 1.12, 1.2, 0.37, 0.69]} \ No newline at end of file diff --git a/annotations_1/FMbSH8g9vsU_filtered.json b/annotations_1/FMbSH8g9vsU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a41b26c94bddfe970964e3bbc8ad23fce897134b --- /dev/null +++ b/annotations_1/FMbSH8g9vsU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 22.27], [23.0, 26.47], [34.0, 97.33], [98.0, 110.59]], "keep_status": [true, true, false, true], "silence_prob": [29.06, 44.2, 0.0, 43.13], "audiomae_on_audioset": [[["music", 44.68], ["didgeridoo", 6.87], ["hum", 5.99]], [["effects unit", 28.68], ["music", 17.55], ["speech", 12.81]], null, [["whale vocalization", 27.49], ["music", 27.03], ["speech", 9.24]]], "duration": [3.27, 3.47, 63.33, 12.59]} \ No newline at end of file diff --git a/annotations_1/FN3SPnr9EZg_filtered.json b/annotations_1/FN3SPnr9EZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e2bed609f815f429221548dcd49bfeaa630df7a --- /dev/null +++ b/annotations_1/FN3SPnr9EZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.92], [3.0, 3.08], [11.0, 11.87], [15.0, 18.05], [19.0, 19.97], [21.0, 22.17], [28.0, 27.92], [29.0, 29.51], [30.0, 32.86], [50.0, 51.02], [53.0, 53.62], [61.0, 61.26], [67.0, 67.58], [69.0, 69.45], [77.0, 77.57], [87.0, 87.42], [88.0, 88.18], [93.0, 94.53], [101.0, 100.94], [107.0, 107.94], [109.0, 109.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 67.0, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.08, 0.08, 0.87, 3.05, 0.97, 1.17, -0.08, 0.51, 2.86, 1.02, 0.62, 0.26, 0.58, 0.45, 0.57, 0.42, 0.18, 1.53, -0.06, 0.94, 0.17]} \ No newline at end of file diff --git a/annotations_1/FNA0Ejpu22Y_filtered.json b/annotations_1/FNA0Ejpu22Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..227f25b14de795f5dbfcc39855a5889a6580c552 --- /dev/null +++ b/annotations_1/FNA0Ejpu22Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.25], [7.0, 9.81], [25.0, 25.52], [27.0, 29.13], [31.0, 34.45], [41.0, 41.35], [44.0, 44.41], [46.0, 49.17], [52.0, 56.76], [62.0, 62.73], [63.0, 63.73], [65.0, 69.74], [71.0, 74.44], [77.0, 76.84], [78.0, 80.18], [80.0, 80.28], [81.0, 88.65], [92.0, 92.94], [93.0, 95.1], [99.0, 109.34], [116.0, 118.03], [119.0, 120.16], [122.0, 122.91], [123.0, 127.84]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 76.2, 0.0, 77.36, 86.27, 0.0, 0.0, 58.64, 41.46, 0.0, 0.0, 61.27, 50.31, 0.0, 71.43, 0.0, 83.7, 0.0, 55.53, 62.68, 63.42, 0.0, 0.0, 88.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 53.03], ["musical instrument", 10.09], ["guitar", 5.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 2.81, 0.52, 2.13, 3.45, 0.35, 0.41, 3.17, 4.76, 0.73, 0.73, 4.74, 3.44, -0.16, 2.18, 0.28, 7.65, 0.94, 2.1, 10.34, 2.03, 1.16, 0.91, 4.84]} \ No newline at end of file diff --git a/annotations_1/FPYjy-ZWB-c_filtered.json b/annotations_1/FPYjy-ZWB-c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4136cfe7cb3df63c26745a80be7b3cc9e1e032bc --- /dev/null +++ b/annotations_1/FPYjy-ZWB-c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.97], [15.0, 16.56], [24.0, 25.66], [28.0, 28.26], [30.0, 31.18], [34.0, 35.67], [41.0, 42.97], [47.0, 47.66], [51.0, 51.54], [60.0, 67.58], [68.0, 72.57], [74.0, 85.14], [86.0, 86.85], [89.0, 90.19], [91.0, 102.96], [107.0, 115.72], [117.0, 117.32]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.07, 38.41, 39.14, 0.0, 0.0, 30.99, 33.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 34.8], ["fly, housefly", 13.81], ["boing", 10.95]], [["mosquito", 43.67], ["fly, housefly", 19.54], ["insect", 12.85]], [["music", 69.45], ["musical instrument", 7.57], ["guitar", 5.0]], null, null, [["speech", 46.87], ["music", 17.99], ["didgeridoo", 7.92]], [["music", 42.23], ["speech", 26.57], ["throbbing", 3.97]], null], "duration": [-0.03, 1.56, 1.66, 0.26, 1.18, 1.67, 1.97, 0.66, 0.54, 7.58, 4.57, 11.14, 0.85, 1.19, 11.96, 8.72, 0.32]} \ No newline at end of file diff --git a/annotations_1/FPpYxPOjtsw_filtered.json b/annotations_1/FPpYxPOjtsw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cf07d16ff48d33ab4e1e3e7cb45616075911311 --- /dev/null +++ b/annotations_1/FPpYxPOjtsw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 39.92], [43.0, 43.38], [44.0, 45.05], [52.0, 55.05], [56.0, 57.99], [60.0, 60.44], [63.0, 87.94], [92.0, 118.88]], "keep_status": [false, false, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 41.91, 0.0, 0.0, 33.36, 31.98], "audiomae_on_audioset": [null, null, null, [["sidetone", 30.91], ["speech", 29.19], ["throbbing", 4.14]], null, null, [["music", 40.27], ["speech", 17.27], ["synthesizer", 12.2]], [["speech", 10.45], ["thump, thud", 8.86], ["rumble", 6.37]]], "duration": [35.92, 0.38, 1.05, 3.05, 1.99, 0.44, 24.94, 26.88]} \ No newline at end of file diff --git a/annotations_1/FPtvpjBEEqo_filtered.json b/annotations_1/FPtvpjBEEqo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..badbbe3376bbb8e26e0d7dde5060f4b8f1386ef4 --- /dev/null +++ b/annotations_1/FPtvpjBEEqo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.57], [12.0, 19.04], [22.0, 26.1], [26.0, 26.32], [26.0, 26.45], [27.0, 26.97], [29.0, 33.81], [38.0, 58.82], [62.0, 67.47], [70.0, 83.32], [86.0, 94.26], [96.0, 134.79], [140.0, 151.55], [157.0, 156.84], [157.0, 159.73], [162.0, 168.42], [172.0, 194.12], [196.0, 223.05], [228.0, 235.45]], "keep_status": [false, true, true, false, false, false, true, false, true, true, true, false, false, false, false, true, true, true, true], "silence_prob": [30.69, 31.33, 30.92, 0.0, 0.0, 0.0, 30.93, 30.57, 30.18, 29.96, 30.02, 0.0, 31.29, 0.0, 30.91, 30.26, 29.42, 29.41, 29.27], "audiomae_on_audioset": [[["music", 80.51], ["country", 2.08], ["singing", 1.91]], [["music", 56.06], ["didgeridoo", 4.98], ["synthesizer", 2.0]], [["music", 55.53], ["singing", 4.15], ["musical instrument", 2.14]], null, null, null, [["music", 57.12], ["theremin", 5.79], ["musical instrument", 5.48]], [["music", 70.94], ["didgeridoo", 2.87], ["folk music", 2.12]], [["music", 42.35], ["didgeridoo", 14.27], ["musical instrument", 3.76]], [["music", 62.47], ["carnatic music", 3.72], ["singing", 2.24]], [["music", 43.88], ["country", 8.38], ["swing music", 5.86]], null, [["music", 72.11], ["guitar", 5.61], ["musical instrument", 5.32]], null, [["music", 80.19], ["musical instrument", 6.27], ["guitar", 3.37]], [["music", 62.04], ["middle eastern music", 2.15], ["swing music", 2.1]], [["music", 51.17], ["saxophone", 4.82], ["trombone", 4.81]], [["music", 63.09], ["musical instrument", 3.97], ["didgeridoo", 2.14]], [["music", 54.9], ["musical instrument", 4.44], ["guitar", 4.4]]], "duration": [8.57, 7.04, 4.1, 0.32, 0.45, -0.03, 4.81, 20.82, 5.47, 13.32, 8.26, 38.79, 11.55, -0.16, 2.73, 6.42, 22.12, 27.05, 7.45]} \ No newline at end of file diff --git a/annotations_1/FQH9s2dJe50_filtered.json b/annotations_1/FQH9s2dJe50_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7384b8bc27f92aa487ca3921b0829c7a176dec7a --- /dev/null +++ b/annotations_1/FQH9s2dJe50_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.8], [3.0, 4.06], [13.0, 14.3], [17.0, 18.5], [20.0, 22.81], [24.0, 24.58], [25.0, 26.69], [27.0, 35.31], [36.0, 37.18], [38.0, 41.1], [42.0, 43.65], [44.0, 54.78], [55.0, 56.37], [61.0, 62.06], [68.0, 67.85], [68.0, 69.35], [70.0, 74.29], [75.0, 78.46], [81.0, 83.02], [84.0, 86.22], [87.0, 89.19], [90.0, 91.23], [99.0, 99.98], [103.0, 104.46], [106.0, 108.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.73, 0.0, 0.0, 72.6, 0.0, 95.91, 0.0, 47.46, 0.0, 0.0, 0.0, 0.0, 92.31, 99.1, 99.76, 85.35, 99.59, 0.0, 0.0, 0.0, 99.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.78], ["fly, housefly", 22.03], ["bee, wasp, etc.", 16.93]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.2, 1.06, 1.3, 1.5, 2.81, 0.58, 1.69, 8.31, 1.18, 3.1, 1.65, 10.78, 1.37, 1.06, -0.15, 1.35, 4.29, 3.46, 2.02, 2.22, 2.19, 1.23, 0.98, 1.46, 2.99]} \ No newline at end of file diff --git a/annotations_1/FQLXXM-nktc_filtered.json b/annotations_1/FQLXXM-nktc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5907b1e4115031781480745284b3babeb8d6095 --- /dev/null +++ b/annotations_1/FQLXXM-nktc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.27], [7.0, 7.43], [9.0, 11.94], [13.0, 13.32], [15.0, 17.31], [19.0, 19.57], [28.0, 30.01], [34.0, 34.43], [37.0, 38.48], [42.0, 42.99], [45.0, 45.54], [48.0, 49.1], [51.0, 51.7], [55.0, 57.38], [58.0, 59.8], [63.0, 63.19], [67.0, 67.49], [69.0, 71.15], [77.0, 79.1], [83.0, 83.74], [86.0, 86.71], [88.0, 88.15], [95.0, 97.38], [105.0, 105.56], [107.0, 107.87], [116.0, 116.31]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.2, 0.0, 65.44, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 84.62, 74.29, 0.0, 0.0, 0.0, 88.83, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 26.62], ["fart", 12.34], ["sidetone", 10.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 0.43, 2.94, 0.32, 2.31, 0.57, 2.01, 0.43, 1.48, 0.99, 0.54, 1.1, 0.7, 2.38, 1.8, 0.19, 0.49, 2.15, 2.1, 0.74, 0.71, 0.15, 2.38, 0.56, 0.87, 0.31]} \ No newline at end of file diff --git a/annotations_1/FQoR9fu-CIE_filtered.json b/annotations_1/FQoR9fu-CIE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ce7c25cad04d52dcba7b97f6d43322769cefe7e --- /dev/null +++ b/annotations_1/FQoR9fu-CIE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.72], [11.0, 12.46], [14.0, 61.1], [64.0, 64.47], [65.0, 65.69], [67.0, 68.47], [71.0, 71.54], [72.0, 73.3], [74.0, 81.16], [86.0, 86.02], [87.0, 87.17], [89.0, 89.73], [91.0, 91.71], [93.0, 93.66], [95.0, 96.35], [100.0, 101.48], [104.0, 105.31], [106.0, 106.91], [108.0, 108.72], [111.0, 112.68], [116.0, 118.71], [120.0, 122.99], [124.0, 124.95], [126.0, 126.54], [127.0, 127.92], [129.0, 130.5], [132.0, 152.61], [155.0, 157.69], [159.0, 162.99], [164.0, 167.14], [168.0, 173.47], [174.0, 175.93], [176.0, 178.7], [180.0, 180.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.46, 96.89, 0.0, 0.0, 0.0, 0.0, 94.95, 81.0, 91.81, 97.22, 72.9, 0.0, 61.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 57.76], ["sidetone", 15.91], ["chirp tone", 12.8]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 1.46, 47.1, 0.47, 0.69, 1.47, 0.54, 1.3, 7.16, 0.02, 0.17, 0.73, 0.71, 0.66, 1.35, 1.48, 1.31, 0.91, 0.72, 1.68, 2.71, 2.99, 0.95, 0.54, 0.92, 1.5, 20.61, 2.69, 3.99, 3.14, 5.47, 1.93, 2.7, 0.93]} \ No newline at end of file diff --git a/annotations_1/FQwv6AGpdus_filtered.json b/annotations_1/FQwv6AGpdus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3f73156491d82dbbf2fbe1bf4a1c07670fa139e --- /dev/null +++ b/annotations_1/FQwv6AGpdus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.38], [28.0, 28.05], [28.0, 69.45], [73.0, 86.73], [89.0, 89.5], [92.0, 139.23], [140.0, 151.07]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [33.71, 0.0, 0.0, 32.11, 0.0, 0.0, 31.88], "audiomae_on_audioset": [[["music", 67.61], ["didgeridoo", 8.41], ["sidetone", 3.12]], null, null, [["music", 57.1], ["didgeridoo", 10.22], ["mains hum", 5.13]], null, null, [["music", 63.95], ["effects unit", 5.94], ["synthesizer", 3.37]]], "duration": [3.38, 0.05, 41.45, 13.73, 0.5, 47.23, 11.07]} \ No newline at end of file diff --git a/annotations_1/FRSfDQyoav8_filtered.json b/annotations_1/FRSfDQyoav8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c084ddf43f9ca4613266231be7367e7006559443 --- /dev/null +++ b/annotations_1/FRSfDQyoav8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.93], [17.0, 60.03], [61.0, 74.16], [75.0, 75.88]], "keep_status": [true, false, false, false], "silence_prob": [28.73, 0.0, 30.0, 0.0], "audiomae_on_audioset": [[["sound effect", 18.02], ["reverberation", 11.54], ["music", 7.54]], null, [["hum", 34.23], ["mains hum", 30.3], ["throbbing", 6.72]], null], "duration": [6.93, 43.03, 13.16, 0.88]} \ No newline at end of file diff --git a/annotations_1/FRhbIIkLlFI_filtered.json b/annotations_1/FRhbIIkLlFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d0ff3924e19bd57ebd0a1e26a73c778b5e051c6 --- /dev/null +++ b/annotations_1/FRhbIIkLlFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.66], [10.0, 20.41], [80.0, 82.29], [83.0, 89.67], [91.0, 91.66], [99.0, 99.62]], "keep_status": [false, true, false, true, false, false], "silence_prob": [0.0, 34.09, 99.98, 40.31, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 44.26], ["cacophony", 6.08], ["noise", 5.0]], null, [["animal", 22.23], ["dog", 15.79], ["speech", 7.63]], null, null], "duration": [1.66, 10.41, 2.29, 6.67, 0.66, 0.62]} \ No newline at end of file diff --git a/annotations_1/FSXijk37oNs_filtered.json b/annotations_1/FSXijk37oNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0e13d812bd4cb13340f4188a3e6fc2f400b8431 --- /dev/null +++ b/annotations_1/FSXijk37oNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.36], [33.0, 41.91], [45.0, 47.29], [72.0, 77.26], [95.0, 95.35], [96.0, 96.09], [96.0, 96.8], [97.0, 96.89], [109.0, 109.97], [116.0, 116.16], [135.0, 149.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 31.54, 33.43, 35.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.03], "audiomae_on_audioset": [null, [["music", 46.09], ["throbbing", 24.43], ["mosquito", 4.1]], [["music", 43.63], ["throbbing", 23.55], ["hum", 12.57]], [["music", 37.79], ["speech", 29.18], ["boing", 5.54]], null, null, null, null, null, null, [["cattle, bovinae", 24.7], ["moo", 23.66], ["livestock, farm animals, working animals", 17.98]]], "duration": [0.36, 8.91, 2.29, 5.26, 0.35, 0.09, 0.8, -0.11, 0.97, 0.16, 14.44]} \ No newline at end of file diff --git a/annotations_1/FSj-BCOlGPY_filtered.json b/annotations_1/FSj-BCOlGPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce6654531427a608dfeaab6a1e1ec9a1adce9b99 --- /dev/null +++ b/annotations_1/FSj-BCOlGPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[136.0, 143.07], [143.0, 146.7], [150.0, 159.27], [160.0, 160.37], [162.0, 165.25], [166.0, 166.63]], "keep_status": [false, false, false, false, false, false], "silence_prob": [91.81, 83.7, 93.29, 0.0, 91.3, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [7.07, 3.7, 9.27, 0.37, 3.25, 0.63]} \ No newline at end of file diff --git a/annotations_1/FSlLXYohrJg_filtered.json b/annotations_1/FSlLXYohrJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4af0fa5291a975b6c9a9d2be89987b47157eda29 --- /dev/null +++ b/annotations_1/FSlLXYohrJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.88], [18.0, 18.35], [21.0, 22.25], [27.0, 27.67], [31.0, 53.62], [55.0, 59.14], [59.0, 61.18], [63.0, 73.79], [75.0, 78.98], [80.0, 81.92], [83.0, 83.13], [83.0, 100.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [98.73, 0.0, 0.0, 0.0, 88.46, 67.51, 86.09, 58.55, 71.87, 0.0, 0.0, 42.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 12.53], ["fart", 9.56], ["whale vocalization", 5.4]]], "duration": [2.88, 0.35, 1.25, 0.67, 22.62, 4.14, 2.18, 10.79, 3.98, 1.92, 0.13, 17.35]} \ No newline at end of file diff --git a/annotations_1/FT1C1QdiMhw_filtered.json b/annotations_1/FT1C1QdiMhw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95419b5f942bb2bb3878ef7df1ba09e63dd90086 --- /dev/null +++ b/annotations_1/FT1C1QdiMhw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 40.71], [42.0, 42.5], [44.0, 50.19], [51.0, 51.93], [55.0, 56.05], [59.0, 59.93], [63.0, 64.2], [65.0, 66.06], [67.0, 67.41], [70.0, 70.71], [77.0, 77.38], [80.0, 81.11], [83.0, 83.39], [85.0, 109.14], [110.0, 116.83], [117.0, 118.17], [119.0, 119.75], [121.0, 122.37], [123.0, 124.82], [126.0, 129.22], [130.0, 130.52], [132.0, 137.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.42, 0.0, 52.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 94.37, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 38.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whistling", 65.26], ["speech", 12.41], ["chirp tone", 5.57]]], "duration": [4.71, 0.5, 6.19, 0.93, 1.05, 0.93, 1.2, 1.06, 0.41, 0.71, 0.38, 1.11, 0.39, 24.14, 6.83, 1.17, 0.75, 1.37, 1.82, 3.22, 0.52, 5.59]} \ No newline at end of file diff --git a/annotations_1/FTGtcjSMjy0_filtered.json b/annotations_1/FTGtcjSMjy0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01bd83de935c2af41bddeee0befaecad5c4f82e0 --- /dev/null +++ b/annotations_1/FTGtcjSMjy0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[80.0, 80.82], [82.0, 83.29], [84.0, 85.16], [85.0, 88.42], [89.0, 90.46], [92.0, 92.8], [95.0, 98.07], [101.0, 102.22], [105.0, 106.05], [108.0, 110.56], [111.0, 113.91], [117.0, 117.05], [121.0, 121.8]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 44.99, 0.0, 0.0, 54.43, 0.0, 0.0, 41.68, 56.93, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["singing bowl", 38.87], ["music", 14.3], ["chirp tone", 4.95]], null, null, null, null, null, [["music", 34.56], ["speech", 20.6], ["hum", 5.47]], null, null, null], "duration": [0.82, 1.29, 1.16, 3.42, 1.46, 0.8, 3.07, 1.22, 1.05, 2.56, 2.91, 0.05, 0.8]} \ No newline at end of file diff --git a/annotations_1/FTO-jtC7Hf4_filtered.json b/annotations_1/FTO-jtC7Hf4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5df3a380c08ec28cf433966ae46489d0ae26218e --- /dev/null +++ b/annotations_1/FTO-jtC7Hf4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.16], [6.0, 6.62], [8.0, 9.07], [14.0, 13.86], [15.0, 14.99], [19.0, 19.52], [22.0, 22.44], [28.0, 28.51], [30.0, 30.97], [43.0, 43.04], [54.0, 55.16], [61.0, 60.94], [63.0, 63.41], [68.0, 67.71], [72.0, 73.31], [77.0, 77.7], [84.0, 85.31], [90.0, 91.1], [93.0, 94.12], [96.0, 97.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 0.62, 1.07, -0.14, -0.01, 0.52, 0.44, 0.51, 0.97, 0.04, 1.16, -0.06, 0.41, -0.29, 1.31, 0.7, 1.31, 1.1, 1.12, 1.65]} \ No newline at end of file diff --git a/annotations_1/FTzUto6toxY_filtered.json b/annotations_1/FTzUto6toxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd4a46ac4526b0a99b10c730a027953bbed02f14 --- /dev/null +++ b/annotations_1/FTzUto6toxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 13.44], [14.0, 14.49], [18.0, 17.91], [21.0, 23.25], [24.0, 35.75], [45.0, 45.89], [50.0, 50.55], [52.0, 55.41], [56.0, 56.39], [57.0, 60.67], [64.0, 63.9], [67.0, 66.85], [68.0, 67.86], [68.0, 69.38], [70.0, 71.12], [72.0, 91.91], [96.0, 96.52], [102.0, 103.08], [109.0, 111.32], [112.0, 113.16], [115.0, 115.89], [119.0, 119.45], [121.0, 122.42], [128.0, 128.49], [133.0, 145.99], [161.0, 174.82]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [30.86, 0.0, 0.0, 82.43, 32.64, 0.0, 0.0, 70.44, 0.0, 38.62, 0.0, 0.0, 0.0, 0.0, 0.0, 31.51, 0.0, 0.0, 29.59, 0.0, 0.0, 0.0, 0.0, 0.0, 30.94, 73.82], "audiomae_on_audioset": [[["music", 65.72], ["hum", 9.32], ["throbbing", 6.38]], null, null, null, [["music", 80.65], ["didgeridoo", 5.17], ["theremin", 4.68]], null, null, null, null, [["fly, housefly", 20.41], ["thunk", 20.12], ["insect", 10.94]], null, null, null, null, null, [["insect", 33.37], ["fly, housefly", 30.01], ["music", 14.12]], null, null, [["gong", 21.31], ["speech", 15.15], ["music", 10.72]], null, null, null, null, null, [["music", 75.78], ["throbbing", 7.89], ["hum", 2.07]], null], "duration": [11.44, 0.49, -0.09, 2.25, 11.75, 0.89, 0.55, 3.41, 0.39, 3.67, -0.1, -0.15, -0.14, 1.38, 1.12, 19.91, 0.52, 1.08, 2.32, 1.16, 0.89, 0.45, 1.42, 0.49, 12.99, 13.82]} \ No newline at end of file diff --git a/annotations_1/FUWdPWW4csI_filtered.json b/annotations_1/FUWdPWW4csI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5dc3b8971f40e97c7b2529e6c66ba077c7a6a80 --- /dev/null +++ b/annotations_1/FUWdPWW4csI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.26], [6.0, 6.64], [15.0, 15.13], [18.0, 19.13], [23.0, 23.6], [30.0, 31.63], [33.0, 42.4], [47.0, 47.83], [51.0, 51.26], [54.0, 57.77], [64.0, 64.61], [66.0, 66.7], [70.0, 70.8], [72.0, 72.01], [75.0, 74.92], [90.0, 90.54], [110.0, 110.89], [113.0, 113.29], [113.0, 113.34], [113.0, 113.51], [114.0, 115.08], [116.0, 118.4], [120.0, 119.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.54, 0.0, 0.0, 34.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.67, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 66.13], ["speech", 10.51], ["boing", 5.78]], null, null, [["music", 66.2], ["throbbing", 4.49], ["musical instrument", 3.1]], null, null, null, null, null, null, null, null, null, null, null, [["music", 73.59], ["musical instrument", 6.8], ["guitar", 4.73]], null], "duration": [1.26, 0.64, 0.13, 1.13, 0.6, 1.63, 9.4, 0.83, 0.26, 3.77, 0.61, 0.7, 0.8, 0.01, -0.08, 0.54, 0.89, 0.29, 0.34, 0.51, 1.08, 2.4, -0.42]} \ No newline at end of file diff --git a/annotations_1/FVGKgrxQP9M_filtered.json b/annotations_1/FVGKgrxQP9M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac8a008f108f7908b2438c73dbaa9838a0e960c8 --- /dev/null +++ b/annotations_1/FVGKgrxQP9M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 21.37], [23.0, 24.24], [27.0, 33.15], [34.0, 36.41], [47.0, 47.26], [57.0, 58.06], [60.0, 63.44], [64.0, 79.14], [84.0, 84.43], [91.0, 94.29], [96.0, 96.67], [99.0, 99.71]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [30.21, 0.0, 29.1, 29.68, 0.0, 0.0, 37.51, 31.39, 0.0, 93.13, 0.0, 0.0], "audiomae_on_audioset": [[["music", 74.66], ["musical instrument", 7.01], ["guitar", 2.3]], null, [["music", 33.17], ["speech", 32.09], ["clarinet", 8.66]], [["music", 54.36], ["speech", 11.38], ["musical instrument", 5.16]], null, null, [["speech", 16.38], ["fly, housefly", 13.39], ["insect", 6.74]], [["music", 45.1], ["mains hum", 9.1], ["speech", 8.3]], null, null, null, null], "duration": [4.37, 1.24, 6.15, 2.41, 0.26, 1.06, 3.44, 15.14, 0.43, 3.29, 0.67, 0.71]} \ No newline at end of file diff --git a/annotations_1/FVRaOepQ02I_filtered.json b/annotations_1/FVRaOepQ02I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be6d60c1215117e10a95d20ba66f52151bbe4f6c --- /dev/null +++ b/annotations_1/FVRaOepQ02I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 16.93], [18.0, 21.9], [23.0, 27.18], [31.0, 31.21], [32.0, 35.97], [38.0, 51.88], [53.0, 70.83], [72.0, 73.43], [74.0, 75.07], [77.0, 95.42], [98.0, 98.9], [101.0, 128.31]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [42.46, 98.1, 34.64, 0.0, 38.58, 44.18, 33.39, 0.0, 0.0, 32.62, 0.0, 30.95], "audiomae_on_audioset": [[["music", 51.35], ["theremin", 10.14], ["speech", 9.75]], null, [["didgeridoo", 51.24], ["music", 33.51], ["musical instrument", 3.36]], null, [["didgeridoo", 36.53], ["music", 14.19], ["electric shaver, electric razor", 11.0]], [["music", 63.86], ["hum", 5.66], ["radio", 4.29]], [["music", 37.34], ["speech", 22.48], ["quack", 14.21]], null, null, [["music", 53.89], ["theremin", 13.34], ["didgeridoo", 5.5]], null, [["music", 83.0], ["musical instrument", 3.8], ["trombone", 1.51]]], "duration": [11.93, 3.9, 4.18, 0.21, 3.97, 13.88, 17.83, 1.43, 1.07, 18.42, 0.9, 27.31]} \ No newline at end of file diff --git a/annotations_1/FWznyZ9Znuw_filtered.json b/annotations_1/FWznyZ9Znuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..398b966017784f087400453e59e9548fe84775c2 --- /dev/null +++ b/annotations_1/FWznyZ9Znuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.77], [5.0, 6.17], [7.0, 9.15], [10.0, 11.57], [13.0, 21.29], [25.0, 33.78], [36.0, 36.36], [39.0, 39.18], [40.0, 41.39], [42.0, 45.32], [49.0, 51.38], [59.0, 59.36], [60.0, 70.75], [78.0, 90.56], [92.0, 96.47], [98.0, 106.57], [108.0, 115.55], [117.0, 134.11]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 51.12, 0.0, 55.96, 36.79, 0.0, 0.0, 0.0, 55.46, 76.37, 0.0, 33.07, 52.39, 63.42, 38.71, 38.66, 69.2], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 20.94], ["music", 12.43], ["mains hum", 11.42]], null, null, null, null, null, null, [["hum", 50.34], ["mains hum", 12.66], ["music", 11.99]], null, null, [["music", 31.16], ["hum", 16.99], ["rumble", 9.96]], [["speech", 33.27], ["music", 15.89], ["hum", 9.49]], null], "duration": [1.77, 1.17, 2.15, 1.57, 8.29, 8.78, 0.36, 0.18, 1.39, 3.32, 2.38, 0.36, 10.75, 12.56, 4.47, 8.57, 7.55, 17.11]} \ No newline at end of file diff --git a/annotations_1/FXeNdV-FTjI_filtered.json b/annotations_1/FXeNdV-FTjI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55a3ef8d2e0a667b2438eea7aa72775fd141f0db --- /dev/null +++ b/annotations_1/FXeNdV-FTjI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [7.0, 7.53], [8.0, 11.31], [19.0, 23.19], [24.0, 25.62], [26.0, 27.55], [31.0, 31.99], [34.0, 34.65], [36.0, 38.97], [41.0, 51.65], [53.0, 55.92], [58.0, 62.26], [63.0, 64.1], [65.0, 71.07], [72.0, 72.69], [74.0, 74.19], [77.0, 76.91], [83.0, 85.75], [87.0, 87.37], [89.0, 90.9], [92.0, 104.63], [106.0, 109.73], [110.0, 111.52], [113.0, 113.81], [116.0, 119.5], [121.0, 121.61], [124.0, 124.29], [127.0, 127.97], [129.0, 131.3], [136.0, 136.54], [138.0, 139.01], [140.0, 142.03], [142.0, 143.04], [146.0, 147.23], [149.0, 150.52], [151.0, 152.95], [155.0, 155.55], [157.0, 158.52], [160.0, 172.81], [173.0, 174.12], [175.0, 175.86], [180.0, 181.99], [184.0, 185.35], [189.0, 190.05]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 54.7, 95.78, 0.0, 0.0, 0.0, 0.0, 61.37, 46.94, 70.72, 44.29, 0.0, 72.9, 0.0, 0.0, 0.0, 77.7, 0.0, 0.0, 41.18, 79.24, 0.0, 0.0, 71.87, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 65.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.59, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["mains hum", 18.17], ["whale vocalization", 13.65], ["hum", 10.29]], null, [["music", 51.83], ["didgeridoo", 4.91], ["musical instrument", 4.82]], null, null, null, null, null, null, null, null, [["music", 25.95], ["chime", 12.1], ["speech", 7.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.66, 0.53, 3.31, 4.19, 1.62, 1.55, 0.99, 0.65, 2.97, 10.65, 2.92, 4.26, 1.1, 6.07, 0.69, 0.19, -0.09, 2.75, 0.37, 1.9, 12.63, 3.73, 1.52, 0.81, 3.5, 0.61, 0.29, 0.97, 2.3, 0.54, 1.01, 2.03, 1.04, 1.23, 1.52, 1.95, 0.55, 1.52, 12.81, 1.12, 0.86, 1.99, 1.35, 1.05]} \ No newline at end of file diff --git a/annotations_1/FY00zwMZsqM_filtered.json b/annotations_1/FY00zwMZsqM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db0989ab014e1f40e40e1d4970970162ccf202ff --- /dev/null +++ b/annotations_1/FY00zwMZsqM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 25.27], [27.0, 92.5], [95.0, 110.61], [112.0, 134.03]], "keep_status": [true, false, false, false], "silence_prob": [48.06, 0.0, 31.75, 32.44], "audiomae_on_audioset": [[["music", 44.33], ["hum", 11.03], ["speech", 7.03]], null, [["music", 50.26], ["speech", 22.4], ["buzz", 1.8]], [["music", 58.5], ["electric shaver, electric razor", 9.27], ["buzz", 5.08]]], "duration": [3.27, 65.5, 15.61, 22.03]} \ No newline at end of file diff --git a/annotations_1/FYDEheLGrKw_filtered.json b/annotations_1/FYDEheLGrKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09221d25af067037017c4abba2d5e5e461d7605d --- /dev/null +++ b/annotations_1/FYDEheLGrKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.48], [10.0, 10.52], [12.0, 12.9], [15.0, 18.5], [20.0, 20.36], [21.0, 21.9], [22.0, 24.21], [29.0, 29.94], [44.0, 44.24], [48.0, 48.64], [51.0, 51.48], [53.0, 53.45], [56.0, 56.37], [60.0, 60.94], [62.0, 65.33], [66.0, 66.85], [67.0, 67.49], [70.0, 70.75], [72.0, 72.6], [79.0, 79.59], [85.0, 86.04], [92.0, 92.18], [96.0, 96.53], [98.0, 98.1], [101.0, 101.98], [104.0, 105.38], [106.0, 106.66], [109.0, 109.32], [110.0, 110.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 91.81, 0.0, 0.0, 94.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.52, 0.9, 3.5, 0.36, 0.9, 2.21, 0.94, 0.24, 0.64, 0.48, 0.45, 0.37, 0.94, 3.33, 0.85, 0.49, 0.75, 0.6, 0.59, 1.04, 0.18, 0.53, 0.1, 0.98, 1.38, 0.66, 0.32, 0.46]} \ No newline at end of file diff --git a/annotations_1/FYnYxm5Awfg_filtered.json b/annotations_1/FYnYxm5Awfg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e4ff9823f9d55639dc0447f62a8d763fd23c287 --- /dev/null +++ b/annotations_1/FYnYxm5Awfg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 18.74], [20.0, 34.23], [36.0, 45.94], [47.0, 48.0], [49.0, 56.17], [62.0, 71.79], [72.0, 78.98], [81.0, 82.44], [84.0, 85.51], [87.0, 88.21], [90.0, 99.01], [101.0, 101.68], [103.0, 107.62], [109.0, 113.86], [117.0, 119.65], [121.0, 129.9], [130.0, 141.29], [142.0, 147.23], [155.0, 157.77], [159.0, 159.58], [160.0, 162.78], [170.0, 173.33], [175.0, 177.16], [178.0, 179.49], [180.0, 187.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.83, 99.93, 85.72, 0.0, 100.0, 85.35, 91.13, 0.0, 0.0, 0.0, 72.31, 0.0, 99.97, 81.35, 91.13, 56.93, 80.82, 67.51, 80.64, 0.0, 100.0, 99.87, 100.0, 0.0, 78.04], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [17.74, 14.23, 9.94, 1.0, 7.17, 9.79, 6.98, 1.44, 1.51, 1.21, 9.01, 0.68, 4.62, 4.86, 2.65, 8.9, 11.29, 5.23, 2.77, 0.58, 2.78, 3.33, 2.16, 1.49, 7.49]} \ No newline at end of file diff --git a/annotations_1/FZOF6ePjVcM_filtered.json b/annotations_1/FZOF6ePjVcM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cbdb6c0634ed72b85adb87ccb8fb5d58b847550 --- /dev/null +++ b/annotations_1/FZOF6ePjVcM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[86.0, 109.83]], "keep_status": [false], "silence_prob": [29.54], "audiomae_on_audioset": [[["throbbing", 52.31], ["hum", 20.04], ["music", 9.87]]], "duration": [23.83]} \ No newline at end of file diff --git a/annotations_1/FZlm1ledK-I_filtered.json b/annotations_1/FZlm1ledK-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efb54c8b99e6bcd3c581e9cc5e61bce7e22868d0 --- /dev/null +++ b/annotations_1/FZlm1ledK-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 24.56], [27.0, 32.21], [33.0, 34.92], [37.0, 40.8], [42.0, 44.17], [47.0, 47.58], [51.0, 52.15], [53.0, 54.8], [57.0, 58.78], [60.0, 61.15], [63.0, 63.91], [65.0, 66.26], [68.0, 68.76], [71.0, 71.09], [71.0, 79.39], [80.0, 83.3], [84.0, 85.92], [88.0, 88.35], [89.0, 89.8], [96.0, 96.18], [97.0, 98.32], [101.0, 102.09], [105.0, 105.49], [106.0, 106.74], [108.0, 110.76], [111.0, 114.78], [117.0, 119.84], [121.0, 124.04], [125.0, 126.28], [128.0, 141.47], [143.0, 148.05], [149.0, 157.4], [158.0, 159.43], [161.0, 162.78], [165.0, 166.97], [169.0, 169.06], [171.0, 180.37], [181.0, 185.36], [186.0, 186.61], [189.0, 188.79], [189.0, 191.57], [194.0, 200.3], [201.0, 202.9], [204.0, 204.9], [206.0, 213.58], [214.0, 218.42], [219.0, 227.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.86, 99.59, 0.0, 99.71, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 0.0, 63.21, 99.97, 98.44, 0.0, 0.0, 0.0, 0.0, 90.08, 99.93, 0.0, 0.0, 98.86, 93.91, 0.0, 0.0, 99.59, 94.52, 80.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.56, 5.21, 1.92, 3.8, 2.17, 0.58, 1.15, 1.8, 1.78, 1.15, 0.91, 1.26, 0.76, 0.09, 8.39, 3.3, 1.92, 0.35, 0.8, 0.18, 1.32, 1.09, 0.49, 0.74, 2.76, 3.78, 2.84, 3.04, 1.28, 13.47, 5.05, 8.4, 1.43, 1.78, 1.97, 0.06, 9.37, 4.36, 0.61, -0.21, 2.57, 6.3, 1.9, 0.9, 7.58, 4.42, 8.97]} \ No newline at end of file diff --git a/annotations_1/FaX0hq8BZc8_filtered.json b/annotations_1/FaX0hq8BZc8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be93f7fec8f962e570f90269f0e4dcad76612596 --- /dev/null +++ b/annotations_1/FaX0hq8BZc8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.92], [19.0, 19.85], [22.0, 28.26], [31.0, 47.02], [51.0, 79.14], [81.0, 83.84], [85.0, 86.68], [90.0, 92.58], [94.0, 115.35], [116.0, 117.66], [120.0, 125.19]], "keep_status": [false, false, true, false, false, true, false, true, false, false, false], "silence_prob": [55.81, 0.0, 42.65, 30.06, 29.73, 30.1, 0.0, 30.45, 29.98, 0.0, 31.39], "audiomae_on_audioset": [null, null, [["bee, wasp, etc.", 40.03], ["fly, housefly", 16.59], ["hum", 8.62]], [["music", 90.67], ["electronic music", 1.31], ["musical instrument", 0.92]], [["music", 80.41], ["vehicle", 3.33], ["electronic music", 2.92]], [["music", 25.44], ["hum", 22.64], ["throbbing", 14.06]], null, [["music", 18.43], ["speech", 14.72], ["vehicle", 11.23]], [["music", 66.0], ["throbbing", 7.6], ["hum", 5.82]], null, [["music", 62.93], ["throbbing", 14.95], ["hum", 8.05]]], "duration": [2.92, 0.85, 6.26, 16.02, 28.14, 2.84, 1.68, 2.58, 21.35, 1.66, 5.19]} \ No newline at end of file diff --git a/annotations_1/FbDFmWdG3NU_filtered.json b/annotations_1/FbDFmWdG3NU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74a7c04327ddb50e3c8e99acf7272ad9d38820f5 --- /dev/null +++ b/annotations_1/FbDFmWdG3NU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.63], [17.0, 18.62], [22.0, 23.3], [26.0, 28.66], [30.0, 34.08], [36.0, 36.86], [40.0, 41.77], [43.0, 44.79], [45.0, 47.33], [48.0, 51.34], [52.0, 53.72], [56.0, 79.93], [83.0, 87.86], [88.0, 89.16], [105.0, 155.06], [155.0, 156.61], [157.0, 170.72]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [54.1, 0.0, 0.0, 58.81, 60.89, 0.0, 0.0, 0.0, 50.21, 35.25, 0.0, 31.46, 32.02, 0.0, 0.0, 0.0, 33.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["knock", 16.7], ["thunk", 11.75], ["hum", 7.77]], null, [["hum", 44.9], ["music", 16.03], ["mains hum", 12.08]], [["music", 51.63], ["synthesizer", 7.99], ["throbbing", 6.83]], null, null, null, [["music", 59.23], ["hum", 5.74], ["mains hum", 5.1]]], "duration": [3.63, 1.62, 1.3, 2.66, 4.08, 0.86, 1.77, 1.79, 2.33, 3.34, 1.72, 23.93, 4.86, 1.16, 50.06, 1.61, 13.72]} \ No newline at end of file diff --git a/annotations_1/FbV4VCCk3Sc_filtered.json b/annotations_1/FbV4VCCk3Sc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f15dba9ab94d8995dcdc7a4d4de63a8f14fac67 --- /dev/null +++ b/annotations_1/FbV4VCCk3Sc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.69], [11.0, 11.1], [11.0, 11.53], [12.0, 20.92], [23.0, 44.64], [47.0, 61.97], [63.0, 86.58], [88.0, 91.1], [97.0, 108.77], [109.0, 108.8], [109.0, 142.55], [149.0, 151.78], [156.0, 162.04], [164.0, 164.93]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 29.75, 29.88, 30.09, 29.88, 29.78, 29.96, 0.0, 0.0, 35.02, 33.91, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 85.87], ["speech", 4.79], ["electronic music", 2.35]], [["music", 65.07], ["speech", 5.09], ["drum machine", 3.24]], [["music", 59.24], ["electronic music", 7.67], ["sampler", 4.52]], [["music", 45.88], ["electronic music", 7.67], ["throbbing", 6.31]], [["music", 34.92], ["speech", 9.5], ["crowd", 7.33]], [["music", 65.54], ["electronic music", 11.6], ["dubstep", 2.32]], null, null, [["music", 30.95], ["moo", 17.29], ["cattle, bovinae", 15.71]], [["music", 18.69], ["cattle, bovinae", 11.72], ["speech", 11.25]], null], "duration": [1.69, 0.1, 0.53, 8.92, 21.64, 14.97, 23.58, 3.1, 11.77, -0.2, 33.55, 2.78, 6.04, 0.93]} \ No newline at end of file diff --git a/annotations_1/FbY1BfonRu4_filtered.json b/annotations_1/FbY1BfonRu4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbc9d5985d3a6b24e86b6f5bac5f70713209b36e --- /dev/null +++ b/annotations_1/FbY1BfonRu4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.73], [6.0, 6.08], [8.0, 8.61], [23.0, 23.79], [29.0, 29.86], [39.0, 41.61], [43.0, 49.98], [51.0, 56.44], [63.0, 63.14], [64.0, 64.91], [68.0, 69.87], [74.0, 81.14], [83.0, 90.17]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 40.21, 47.05, 34.97, 0.0, 0.0, 0.0, 38.63, 30.15], "audiomae_on_audioset": [null, null, null, null, null, [["emergency vehicle", 11.19], ["ambulance (siren)", 9.88], ["siren", 8.12]], [["speech", 35.0], ["hum", 13.67], ["music", 8.55]], [["speech", 66.7], ["livestock, farm animals, working animals", 6.09], ["cattle, bovinae", 5.08]], null, null, null, [["hum", 51.65], ["mains hum", 37.05], ["throbbing", 7.9]], [["speech", 58.2], ["siren", 10.08], ["noise", 6.53]]], "duration": [0.73, 0.08, 0.61, 0.79, 0.86, 2.61, 6.98, 5.44, 0.14, 0.91, 1.87, 7.14, 7.17]} \ No newline at end of file diff --git a/annotations_1/FcSSNKWcReg_filtered.json b/annotations_1/FcSSNKWcReg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5573fd27e5b9873d02d664b03002ff3f8a6452cb --- /dev/null +++ b/annotations_1/FcSSNKWcReg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 12.72], [13.0, 13.37], [14.0, 15.18], [18.0, 19.84], [20.0, 20.85], [34.0, 35.58], [38.0, 38.28], [46.0, 47.01], [48.0, 48.05], [49.0, 49.82], [51.0, 52.39], [53.0, 54.97], [56.0, 57.16], [58.0, 58.87], [59.0, 81.18], [85.0, 85.19], [99.0, 100.4], [105.0, 105.26], [110.0, 110.35], [110.0, 110.61], [111.0, 115.03], [117.0, 117.22], [119.0, 119.84], [120.0, 120.63], [126.0, 127.13], [131.0, 134.37], [135.0, 137.13], [138.0, 141.84], [143.0, 145.0], [146.0, 149.12], [150.0, 157.3], [164.0, 166.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [33.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.74, 0.0, 0.0, 0.0, 0.0, 0.0, 37.02, 0.0, 0.0, 0.0, 0.0, 99.4, 91.81, 63.85, 60.23, 59.51, 49.0, 36.43], "audiomae_on_audioset": [[["speech", 47.64], ["music", 32.53], ["buzz", 3.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.28], ["theremin", 9.69], ["synthesizer", 4.13]], null, null, null, null, null, [["boing", 44.37], ["music", 17.56], ["speech", 11.77]], null, null, null, null, null, null, null, null, null, [["music", 24.93], ["hum", 22.84], ["thunk", 7.93]], [["music", 59.44], ["hum", 2.76], ["mains hum", 2.05]]], "duration": [7.72, 0.37, 1.18, 1.84, 0.85, 1.58, 0.28, 1.01, 0.05, 0.82, 1.39, 1.97, 1.16, 0.87, 22.18, 0.19, 1.4, 0.26, 0.35, 0.61, 4.03, 0.22, 0.84, 0.63, 1.13, 3.37, 2.13, 3.84, 2.0, 3.12, 7.3, 2.95]} \ No newline at end of file diff --git a/annotations_1/FcqJ2a3Dazs_filtered.json b/annotations_1/FcqJ2a3Dazs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9b79206563ecb34bc41fa850ee149482252ae39 --- /dev/null +++ b/annotations_1/FcqJ2a3Dazs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.93], [3.0, 4.26], [5.0, 5.8], [10.0, 11.38], [17.0, 17.61], [19.0, 26.45], [27.0, 30.18], [31.0, 33.79], [36.0, 38.11], [40.0, 40.44], [42.0, 43.58], [47.0, 47.82], [50.0, 50.75], [56.0, 58.97], [62.0, 64.13], [66.0, 66.56], [69.0, 75.46], [77.0, 78.17], [80.0, 81.75], [82.0, 82.68], [85.0, 85.45], [90.0, 91.61], [94.0, 94.17]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 64.86, 64.97, 48.95, 0.0, 0.0, 0.0, 0.0, 91.3, 88.64, 0.0, 77.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 33.5], ["speech", 20.78], ["hum", 9.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.07, 1.26, 0.8, 1.38, 0.61, 7.45, 3.18, 2.79, 2.11, 0.44, 1.58, 0.82, 0.75, 2.97, 2.13, 0.56, 6.46, 1.17, 1.75, 0.68, 0.45, 1.61, 0.17]} \ No newline at end of file diff --git a/annotations_1/Fdq_l2-C1wg_filtered.json b/annotations_1/Fdq_l2-C1wg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6187898984cd062fe145bf29d6390a8ccffade39 --- /dev/null +++ b/annotations_1/Fdq_l2-C1wg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 55.83], [58.0, 59.0], [60.0, 60.99], [64.0, 71.59], [76.0, 95.86], [97.0, 97.87], [99.0, 118.62], [119.0, 122.98], [123.0, 124.02], [125.0, 139.83], [143.0, 153.6], [155.0, 160.0]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [57.17, 0.0, 0.0, 60.32, 36.66, 0.0, 30.9, 71.29, 0.0, 31.46, 29.44, 42.79], "audiomae_on_audioset": [null, null, null, null, [["music", 61.16], ["theremin", 12.8], ["sonar", 2.63]], null, [["speech", 43.6], ["music", 27.24], ["crack", 5.43]], null, null, [["gunshot, gunfire", 29.71], ["explosion", 12.4], ["music", 12.06]], [["music", 52.02], ["bleat", 6.1], ["animal", 5.2]], [["music", 21.82], ["fly, housefly", 18.73], ["quack", 13.26]]], "duration": [11.83, 1.0, 0.99, 7.59, 19.86, 0.87, 19.62, 3.98, 1.02, 14.83, 10.6, 5.0]} \ No newline at end of file diff --git a/annotations_1/Fecoe2kJdD0_filtered.json b/annotations_1/Fecoe2kJdD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5af05f75e8e86fbe1c46d932f768ba45b365125c --- /dev/null +++ b/annotations_1/Fecoe2kJdD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[69.0, 78.36], [80.0, 132.75], [134.0, 139.6]], "keep_status": [true, false, true], "silence_prob": [32.95, 0.0, 39.24], "audiomae_on_audioset": [[["music", 25.45], ["throbbing", 22.21], ["hum", 16.95]], null, [["hum", 30.32], ["speech", 22.39], ["mains hum", 11.85]]], "duration": [9.36, 52.75, 5.6]} \ No newline at end of file diff --git a/annotations_1/Ff20ZDSj7d8_filtered.json b/annotations_1/Ff20ZDSj7d8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cff31ec5f30a631866fe1fba8261fd0e84aad5b7 --- /dev/null +++ b/annotations_1/Ff20ZDSj7d8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.37], [7.0, 9.09], [11.0, 12.88], [17.0, 17.98], [25.0, 24.97], [29.0, 29.27], [35.0, 35.8], [45.0, 46.21], [49.0, 73.53], [75.0, 86.16], [86.0, 87.64], [89.0, 92.23], [94.0, 95.1], [96.0, 98.95], [105.0, 106.89], [108.0, 109.0], [112.0, 111.82], [115.0, 116.38], [119.0, 122.27]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false, true], "silence_prob": [80.11, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.87, 30.78, 0.0, 32.7, 0.0, 38.12, 0.0, 0.0, 0.0, 0.0, 30.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["didgeridoo", 49.37], ["music", 20.82], ["buzz", 8.45]], [["hum", 18.02], ["music", 10.19], ["livestock, farm animals, working animals", 7.36]], null, [["speech", 28.6], ["music", 25.37], ["rumble", 7.1]], null, [["speech", 28.72], ["music", 22.26], ["didgeridoo", 8.16]], null, null, null, null, [["music", 33.14], ["smash, crash", 7.79], ["noise", 6.01]]], "duration": [3.37, 2.09, 1.88, 0.98, -0.03, 0.27, 0.8, 1.21, 24.53, 11.16, 1.64, 3.23, 1.1, 2.95, 1.89, 1.0, -0.18, 1.38, 3.27]} \ No newline at end of file diff --git a/annotations_1/FgUKDQA1qFg_filtered.json b/annotations_1/FgUKDQA1qFg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ada030835ab3f9a70c5255880b047a3dcf7c9d04 --- /dev/null +++ b/annotations_1/FgUKDQA1qFg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [4.0, 4.5], [7.0, 9.66], [11.0, 18.59], [20.0, 21.09], [24.0, 23.84], [31.0, 31.24], [32.0, 33.25], [34.0, 34.3], [35.0, 37.34], [41.0, 41.99], [48.0, 49.28], [50.0, 51.66], [52.0, 53.64], [54.0, 55.54], [60.0, 60.42], [62.0, 63.49], [64.0, 67.53], [68.0, 70.98], [72.0, 75.84], [77.0, 77.53], [86.0, 87.24], [93.0, 98.27], [102.0, 102.71], [106.0, 109.98], [115.0, 119.6], [121.0, 121.47], [123.0, 123.94], [126.0, 127.43], [129.0, 131.72]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 95.91, 46.61, 0.0, 0.0, 0.0, 0.0, 0.0, 30.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 46.83, 31.78, 0.0, 0.0, 30.94, 0.0, 30.33, 52.33, 0.0, 0.0, 0.0, 49.92], "audiomae_on_audioset": [null, null, null, [["music", 29.18], ["sonar", 11.5], ["theremin", 6.18]], null, null, null, null, null, [["music", 23.82], ["mains hum", 18.32], ["hum", 16.38]], null, null, null, null, null, null, null, null, [["music", 57.77], ["hum", 6.78], ["synthesizer", 4.86]], [["music", 70.66], ["explosion", 4.97], ["rumble", 3.67]], null, null, [["music", 47.05], ["throbbing", 16.96], ["hum", 5.9]], null, [["music", 37.13], ["throbbing", 34.63], ["hum", 9.0]], null, null, null, null, [["hum", 19.73], ["throbbing", 18.18], ["heart sounds, heartbeat", 9.85]]], "duration": [0.44, 0.5, 2.66, 7.59, 1.09, -0.16, 0.24, 1.25, 0.3, 2.34, 0.99, 1.28, 1.66, 1.64, 1.54, 0.42, 1.49, 3.53, 2.98, 3.84, 0.53, 1.24, 5.27, 0.71, 3.98, 4.6, 0.47, 0.94, 1.43, 2.72]} \ No newline at end of file diff --git a/annotations_1/FhXn_kxlWno_filtered.json b/annotations_1/FhXn_kxlWno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e3a2696bf426bb58b13378bffc6ae56858287f8 --- /dev/null +++ b/annotations_1/FhXn_kxlWno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.58], [15.0, 15.53], [17.0, 17.61], [19.0, 22.0], [28.0, 28.58], [29.0, 30.52], [35.0, 46.11], [56.0, 60.74], [63.0, 67.22], [69.0, 69.33], [70.0, 70.75], [72.0, 72.79], [73.0, 74.85], [77.0, 77.14], [78.0, 79.0], [80.0, 80.77], [83.0, 83.79], [87.0, 87.99], [89.0, 89.53], [100.0, 100.77], [102.0, 102.69], [104.0, 104.63], [107.0, 107.47], [108.0, 109.43], [113.0, 113.19]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.67, 0.0, 0.0, 30.43, 0.0, 0.0, 32.08, 29.62, 34.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["explosion", 44.86], ["speech", 20.02], ["burst, pop", 7.58]], null, null, [["explosion", 62.49], ["burst, pop", 18.15], ["eruption", 6.5]], null, null, [["explosion", 43.27], ["speech", 24.21], ["eruption", 5.16]], [["speech", 40.12], ["explosion", 16.27], ["eruption", 7.79]], [["speech", 40.62], ["sidetone", 40.51], ["radio", 2.99]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.58, 0.53, 0.61, 3.0, 0.58, 1.52, 11.11, 4.74, 4.22, 0.33, 0.75, 0.79, 1.85, 0.14, 1.0, 0.77, 0.79, 0.99, 0.53, 0.77, 0.69, 0.63, 0.47, 1.43, 0.19]} \ No newline at end of file diff --git a/annotations_1/FhsFZDrRvoM_filtered.json b/annotations_1/FhsFZDrRvoM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa91263634f1cbabdc393d38310dbdfa1b53fb53 --- /dev/null +++ b/annotations_1/FhsFZDrRvoM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.98], [9.0, 9.73], [14.0, 14.45], [18.0, 18.55], [24.0, 25.35], [28.0, 28.34], [30.0, 30.86], [33.0, 34.45], [39.0, 40.09], [44.0, 45.17], [60.0, 60.83], [62.0, 63.64], [65.0, 66.33], [79.0, 79.88], [81.0, 82.61], [88.0, 88.01], [91.0, 91.42], [93.0, 94.73], [97.0, 97.28], [102.0, 102.79], [106.0, 106.37], [108.0, 108.9], [114.0, 115.1], [116.0, 117.1], [117.0, 118.84], [119.0, 120.34], [156.0, 157.38], [166.0, 167.1], [217.0, 221.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.53], ["drum machine", 8.68], ["synthesizer", 7.03]]], "duration": [0.98, 0.73, 0.45, 0.55, 1.35, 0.34, 0.86, 1.45, 1.09, 1.17, 0.83, 1.64, 1.33, 0.88, 1.61, 0.01, 0.42, 1.73, 0.28, 0.79, 0.37, 0.9, 1.1, 1.1, 1.84, 1.34, 1.38, 1.1, 4.7]} \ No newline at end of file diff --git a/annotations_1/FiVYtNf5Hos_filtered.json b/annotations_1/FiVYtNf5Hos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84151c10a7c86b882704c63caeda1a42397c28c2 --- /dev/null +++ b/annotations_1/FiVYtNf5Hos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.17], [11.0, 10.69], [11.0, 35.82], [37.0, 47.61], [49.0, 51.95], [54.0, 55.38], [56.0, 68.62], [70.0, 70.17], [73.0, 84.45], [86.0, 87.0]], "keep_status": [false, false, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 45.05, 76.86, 48.39, 0.0, 31.62, 0.0, 66.76, 0.0], "audiomae_on_audioset": [null, null, [["music", 24.47], ["speech", 19.32], ["hum", 11.48]], null, [["dog", 20.9], ["howl", 19.8], ["canidae, dogs, wolves", 11.61]], null, [["sidetone", 16.99], ["mains hum", 14.95], ["hum", 14.12]], null, null, null], "duration": [1.17, -0.31, 24.82, 10.61, 2.95, 1.38, 12.62, 0.17, 11.45, 1.0]} \ No newline at end of file diff --git a/annotations_1/FjT4_Bi-F0I_filtered.json b/annotations_1/FjT4_Bi-F0I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8d432f8dde560fb52d8081c6d16e12d9b35956f --- /dev/null +++ b/annotations_1/FjT4_Bi-F0I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.08], [5.0, 5.63], [12.0, 13.49], [16.0, 16.61], [17.0, 18.1], [20.0, 21.24], [28.0, 30.35], [33.0, 36.15], [38.0, 42.13], [47.0, 47.44], [50.0, 49.81], [57.0, 57.64], [59.0, 59.58], [63.0, 63.22], [65.0, 65.2], [74.0, 75.88], [80.0, 80.47], [82.0, 82.54], [88.0, 88.3], [90.0, 90.73], [92.0, 92.57], [93.0, 95.17], [100.0, 102.69], [104.0, 105.19], [110.0, 109.75], [114.0, 126.2], [128.0, 128.53], [131.0, 131.57], [132.0, 133.22], [141.0, 142.92], [145.0, 145.81], [152.0, 154.21], [154.0, 154.35], [156.0, 156.73], [165.0, 165.01], [171.0, 171.8], [174.0, 173.7], [174.0, 174.99], [179.0, 179.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.47, 69.07, 38.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.81, 40.55, 0.0, 0.0, 45.56, 0.0, 0.0, 0.0, 0.0, 0.0, 44.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["mains hum", 29.26], ["speech", 24.45], ["music", 16.33]], null, [["music", 55.69], ["throbbing", 18.32], ["hum", 7.21]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.78], ["musical instrument", 7.75], ["guitar", 6.97]], [["music", 28.7], ["theremin", 9.16], ["speech", 6.61]], null, null, [["music", 23.12], ["saxophone", 15.48], ["speech", 8.61]], null, null, null, null, null, [["music", 54.74], ["didgeridoo", 6.69], ["synthesizer", 4.36]], null, null, null, null, null, null, null], "duration": [1.08, 0.63, 1.49, 0.61, 1.1, 1.24, 2.35, 3.15, 4.13, 0.44, -0.19, 0.64, 0.58, 0.22, 0.2, 1.88, 0.47, 0.54, 0.3, 0.73, 0.57, 2.17, 2.69, 1.19, -0.25, 12.2, 0.53, 0.57, 1.22, 1.92, 0.81, 2.21, 0.35, 0.73, 0.01, 0.8, -0.3, 0.99, 0.74]} \ No newline at end of file diff --git a/annotations_1/Fjr_CQHJiCo_filtered.json b/annotations_1/Fjr_CQHJiCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7897ecd429ae84d2fd8de25458f409b9107c2ffb --- /dev/null +++ b/annotations_1/Fjr_CQHJiCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.39], [12.0, 13.02], [14.0, 15.87], [22.0, 22.5], [30.0, 30.86], [35.0, 36.04], [37.0, 42.8], [44.0, 45.87], [46.0, 51.54], [53.0, 54.33], [55.0, 56.93], [57.0, 58.35], [63.0, 64.94], [66.0, 66.77], [70.0, 88.11], [89.0, 90.49], [95.0, 98.22], [100.0, 104.14], [107.0, 108.9], [112.0, 112.5], [115.0, 115.87], [117.0, 118.56], [129.0, 130.45], [132.0, 147.93], [149.0, 155.51], [158.0, 161.18], [166.0, 169.65], [171.0, 172.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 54.63, 0.0, 0.0, 0.0, 0.0, 0.0, 61.47, 0.0, 56.4, 36.11, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 97.0, 34.38, 78.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.61], ["music", 19.27], ["noise", 11.66]], null, null, null, null, null, null, null, [["speech", 45.17], ["music", 12.3], ["sidetone", 7.2]], null, null], "duration": [0.39, 1.02, 1.87, 0.5, 0.86, 1.04, 5.8, 1.87, 5.54, 1.33, 1.93, 1.35, 1.94, 0.77, 18.11, 1.49, 3.22, 4.14, 1.9, 0.5, 0.87, 1.56, 1.45, 15.93, 6.51, 3.18, 3.65, 1.99]} \ No newline at end of file diff --git a/annotations_1/Fk69RQS7D8Y_filtered.json b/annotations_1/Fk69RQS7D8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/Fk69RQS7D8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/FkEU_g5u_1c_filtered.json b/annotations_1/FkEU_g5u_1c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae2bfb22106aa4a2e62670c5ac6a573ea48180ce --- /dev/null +++ b/annotations_1/FkEU_g5u_1c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.58], [17.0, 17.32], [19.0, 19.06], [20.0, 20.63], [25.0, 26.05], [30.0, 30.32], [35.0, 34.91], [36.0, 36.07], [40.0, 39.95], [40.0, 42.38], [44.0, 44.54], [45.0, 45.6], [47.0, 52.29], [53.0, 55.56], [57.0, 57.32], [58.0, 60.81], [62.0, 65.84], [69.0, 69.92], [71.0, 71.68], [73.0, 73.36], [78.0, 78.06], [80.0, 82.59], [87.0, 86.68], [88.0, 89.4], [91.0, 91.62], [93.0, 93.56], [95.0, 95.82], [98.0, 99.17], [101.0, 101.12], [108.0, 108.03], [121.0, 121.32], [123.0, 140.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.3, 0.0, 0.0, 46.29, 50.41, 0.0, 56.25, 45.49, 0.0, 0.0, 0.0, 0.0, 66.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 36.31], ["theremin", 19.21], ["speech", 15.7]], null, null, [["music", 64.12], ["musical instrument", 4.84], ["synthesizer", 2.37]], null, null, null, [["music", 45.14], ["speech", 4.01], ["musical instrument", 3.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 16.38], ["buzz", 10.43], ["crowd", 7.6]]], "duration": [0.58, 0.32, 0.06, 0.63, 1.05, 0.32, -0.09, 0.07, -0.05, 2.38, 0.54, 0.6, 5.29, 2.56, 0.32, 2.81, 3.84, 0.92, 0.68, 0.36, 0.06, 2.59, -0.32, 1.4, 0.62, 0.56, 0.82, 1.17, 0.12, 0.03, 0.32, 17.22]} \ No newline at end of file diff --git a/annotations_1/FlCzygStNzM_filtered.json b/annotations_1/FlCzygStNzM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d7a572aba033617d6d36ef02fa40310d733b094 --- /dev/null +++ b/annotations_1/FlCzygStNzM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.67], [7.0, 7.7], [10.0, 11.2], [12.0, 12.61], [15.0, 16.53], [18.0, 19.99], [24.0, 25.47], [29.0, 31.41], [32.0, 35.87], [36.0, 40.41], [43.0, 43.8], [46.0, 47.29], [47.0, 61.64], [63.0, 63.46], [65.0, 65.62], [66.0, 66.99], [69.0, 71.85], [75.0, 75.71], [77.0, 77.5], [79.0, 78.93], [80.0, 80.65], [82.0, 82.24], [83.0, 84.92], [85.0, 98.42], [99.0, 99.99]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.13, 36.17, 36.67, 0.0, 0.0, 39.31, 0.0, 0.0, 0.0, 38.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 39.65], ["theremin", 3.66], ["hum", 3.05]], [["music", 34.27], ["speech", 16.49], ["throbbing", 9.07]], [["livestock, farm animals, working animals", 37.42], ["cattle, bovinae", 16.65], ["music", 16.49]], null, null, [["music", 45.71], ["hum", 16.73], ["mains hum", 13.55]], null, null, null, [["music", 40.67], ["throbbing", 12.97], ["hum", 9.49]], null, null, null, null, null, null, [["music", 53.04], ["speech", 24.96], ["fly, housefly", 4.73]], null], "duration": [0.67, 0.7, 1.2, 0.61, 1.53, 1.99, 1.47, 2.41, 3.87, 4.41, 0.8, 1.29, 14.64, 0.46, 0.62, 0.99, 2.85, 0.71, 0.5, -0.07, 0.65, 0.24, 1.92, 13.42, 0.99]} \ No newline at end of file diff --git a/annotations_1/FlQd5p9_XvY_filtered.json b/annotations_1/FlQd5p9_XvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ccee6d8fce478e7ee7718bb2bf57fcb874523c0 --- /dev/null +++ b/annotations_1/FlQd5p9_XvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.26], [28.0, 29.81], [30.0, 49.86], [52.0, 53.37], [55.0, 94.83], [97.0, 158.53], [159.0, 166.85], [167.0, 168.44], [170.0, 171.86], [173.0, 173.64]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 29.15, 0.0, 0.0, 0.0, 31.65, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 74.69], ["throbbing", 9.13], ["electronic music", 5.51]], null, null, null, [["music", 30.95], ["hum", 10.94], ["speech", 7.89]], null, null, null], "duration": [1.26, 1.81, 19.86, 1.37, 39.83, 61.53, 7.85, 1.44, 1.86, 0.64]} \ No newline at end of file diff --git a/annotations_1/FloKMOp4wN8_filtered.json b/annotations_1/FloKMOp4wN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12ff90b4dade6f15bed4e6d8cb6a8cb09924808e --- /dev/null +++ b/annotations_1/FloKMOp4wN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.41], [10.0, 9.9], [11.0, 23.94], [26.0, 26.35], [28.0, 29.22], [30.0, 31.87], [32.0, 33.1], [35.0, 35.41], [37.0, 41.01], [42.0, 45.22], [46.0, 47.76], [51.0, 64.94], [66.0, 81.36], [84.0, 105.88], [110.0, 112.51], [113.0, 114.15], [119.0, 119.31], [120.0, 128.43], [129.0, 161.99], [164.0, 185.09], [186.0, 188.25]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 31.67, 0.0, 0.0, 0.0, 0.0, 0.0, 84.43, 59.33, 0.0, 31.78, 32.12, 31.62, 36.94, 0.0, 0.0, 33.38, 0.0, 33.73, 31.53], "audiomae_on_audioset": [null, null, [["music", 55.12], ["throbbing", 8.0], ["theremin", 6.83]], null, null, null, null, null, null, null, null, [["music", 66.12], ["speech", 15.23], ["sidetone", 8.84]], [["music", 59.02], ["boing", 15.26], ["speech", 5.79]], [["music", 50.29], ["boing", 9.61], ["speech", 6.24]], [["music", 34.86], ["whack, thwack", 11.58], ["groan", 7.52]], null, null, [["music", 49.64], ["speech", 12.97], ["fart", 10.27]], null, [["music", 69.4], ["funk", 5.04], ["speech", 3.63]], [["music", 48.46], ["boing", 12.15], ["sound effect", 4.38]]], "duration": [1.41, -0.1, 12.94, 0.35, 1.22, 1.87, 1.1, 0.41, 4.01, 3.22, 1.76, 13.94, 15.36, 21.88, 2.51, 1.15, 0.31, 8.43, 32.99, 21.09, 2.25]} \ No newline at end of file diff --git a/annotations_1/FmEHRr23Hro_filtered.json b/annotations_1/FmEHRr23Hro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46a659ecce7b0f2428e3f43cd8b3419723869672 --- /dev/null +++ b/annotations_1/FmEHRr23Hro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.21], [5.0, 5.91], [8.0, 12.11], [15.0, 15.5], [16.0, 16.34], [20.0, 20.49], [28.0, 33.84], [35.0, 35.46], [37.0, 37.39], [41.0, 41.91], [44.0, 45.17], [56.0, 56.86], [60.0, 60.13], [60.0, 60.17], [60.0, 66.19], [66.0, 66.75], [74.0, 80.84], [84.0, 112.31], [113.0, 122.22], [123.0, 128.14], [130.0, 131.92], [134.0, 133.86], [134.0, 135.09], [135.0, 135.31], [135.0, 135.38], [135.0, 135.41], [135.0, 137.57], [138.0, 146.55], [149.0, 148.8], [151.0, 152.71], [159.0, 159.14], [160.0, 160.32], [162.0, 172.74], [174.0, 176.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [63.64, 0.0, 55.89, 0.0, 0.0, 0.0, 54.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.77, 0.0, 44.43, 29.62, 38.59, 81.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.17, 43.98, 0.0, 0.0, 0.0, 0.0, 45.08, 51.12], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.86], ["beatboxing", 14.88], ["mains hum", 5.14]], null, [["music", 19.16], ["whale vocalization", 18.98], ["hum", 9.38]], [["speech", 21.47], ["gong", 15.77], ["music", 10.85]], [["hum", 35.45], ["mains hum", 27.39], ["speech", 8.3]], null, null, null, null, null, null, null, [["speech", 47.65], ["music", 26.08], ["percussion", 3.94]], [["music", 35.25], ["speech", 33.25], ["guitar", 5.8]], null, null, null, null, [["hum", 35.72], ["mains hum", 14.91], ["music", 11.54]], null], "duration": [4.21, 0.91, 4.11, 0.5, 0.34, 0.49, 5.84, 0.46, 0.39, 0.91, 1.17, 0.86, 0.13, 0.17, 6.19, 0.75, 6.84, 28.31, 9.22, 5.14, 1.92, -0.14, 1.09, 0.31, 0.38, 0.41, 2.57, 8.55, -0.2, 1.71, 0.14, 0.32, 10.74, 2.08]} \ No newline at end of file diff --git a/annotations_1/FmYGC2QdXd4_filtered.json b/annotations_1/FmYGC2QdXd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..280ba27a12df1d3bc9988ff1b6d770ff78245439 --- /dev/null +++ b/annotations_1/FmYGC2QdXd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.5], [18.0, 18.13], [21.0, 22.74], [24.0, 24.48], [26.0, 29.15], [30.0, 31.41], [35.0, 35.65], [40.0, 43.14], [46.0, 45.96], [48.0, 48.71], [51.0, 51.19], [57.0, 57.21], [62.0, 63.36], [68.0, 69.55], [70.0, 72.35], [75.0, 75.34], [79.0, 80.25], [82.0, 83.84], [86.0, 87.81], [89.0, 90.17], [94.0, 94.51], [96.0, 97.63], [99.0, 102.17], [103.0, 104.8], [107.0, 108.8], [110.0, 113.53], [114.0, 113.61]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 53.28, 0.0, 0.0, 47.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 0.0, 37.58, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 24.59], ["music", 18.88], ["singing bowl", 10.22]], null, null, null, null, null, null, [["hum", 19.29], ["music", 15.74], ["mains hum", 12.06]], null, null, null, null, null, null, null, null, null, null, [["speech", 76.72], ["music", 9.05], ["speech synthesizer", 1.78]], null], "duration": [0.5, 0.13, 1.74, 0.48, 3.15, 1.41, 0.65, 3.14, -0.04, 0.71, 0.19, 0.21, 1.36, 1.55, 2.35, 0.34, 1.25, 1.84, 1.81, 1.17, 0.51, 1.63, 3.17, 1.8, 1.8, 3.53, -0.39]} \ No newline at end of file diff --git a/annotations_1/FnFMS11g4fM_filtered.json b/annotations_1/FnFMS11g4fM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87a6092b00b228d0393a784388d12d36457e4ff4 --- /dev/null +++ b/annotations_1/FnFMS11g4fM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[77.0, 82.43], [83.0, 84.33], [89.0, 91.25], [93.0, 93.45], [96.0, 98.44], [99.0, 99.74], [101.0, 102.3], [103.0, 105.21], [106.0, 107.77], [109.0, 118.1], [120.0, 123.77], [126.0, 130.94], [133.0, 133.37], [137.0, 138.57], [144.0, 144.02], [165.0, 165.52], [169.0, 179.39]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [49.64, 0.0, 99.16, 0.0, 36.73, 0.0, 0.0, 63.64, 0.0, 44.96, 38.1, 33.75, 0.0, 0.0, 0.0, 0.0, 32.44], "audiomae_on_audioset": [[["speech", 36.05], ["burping, eructation", 8.8], ["inside, small room", 6.47]], null, null, null, [["noise", 52.01], ["boing", 8.74], ["effects unit", 5.11]], null, null, null, null, [["music", 61.8], ["throbbing", 6.2], ["synthesizer", 4.97]], [["music", 64.88], ["musical instrument", 8.79], ["gong", 4.15]], [["speech", 49.35], ["didgeridoo", 12.36], ["mains hum", 9.29]], null, null, null, null, [["music", 32.05], ["hum", 18.58], ["speech", 17.24]]], "duration": [5.43, 1.33, 2.25, 0.45, 2.44, 0.74, 1.3, 2.21, 1.77, 9.1, 3.77, 4.94, 0.37, 1.57, 0.02, 0.52, 10.39]} \ No newline at end of file diff --git a/annotations_1/FnPOuK9RHH0_filtered.json b/annotations_1/FnPOuK9RHH0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8423f5957b5391c9d394f7fd682ff6075d87d9a --- /dev/null +++ b/annotations_1/FnPOuK9RHH0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [7.0, 6.91], [9.0, 14.91], [16.0, 17.59], [19.0, 20.68], [22.0, 35.63], [38.0, 41.99], [43.0, 44.2], [46.0, 53.22], [54.0, 83.4], [84.0, 103.52], [108.0, 120.07]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 35.71, 0.0, 0.0, 40.88, 83.34, 0.0, 58.22, 33.14, 35.07, 34.75], "audiomae_on_audioset": [null, null, [["speech", 43.26], ["music", 14.0], ["fart", 6.79]], null, null, [["whale vocalization", 82.36], ["music", 2.45], ["hum", 1.13]], null, null, null, [["whale vocalization", 24.75], ["noise", 14.65], ["music", 13.0]], [["speech", 29.71], ["fart", 23.87], ["music", 18.61]], [["speech", 64.07], ["music", 9.3], ["sidetone", 2.94]]], "duration": [0.48, -0.09, 5.91, 1.59, 1.68, 13.63, 3.99, 1.2, 7.22, 29.4, 19.52, 12.07]} \ No newline at end of file diff --git a/annotations_1/FovnKIV3VD0_filtered.json b/annotations_1/FovnKIV3VD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59aa9f7c1a63a5f729e27e3cc6cc8059ead3f2b2 --- /dev/null +++ b/annotations_1/FovnKIV3VD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 102.15], [105.0, 105.21], [106.0, 138.86], [142.0, 162.99], [164.0, 164.24], [166.0, 170.11], [172.0, 172.22], [175.0, 196.21], [197.0, 207.44], [209.0, 211.38], [212.0, 238.94]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 29.76, 0.0, 31.74, 0.0, 30.14, 29.56, 33.08, 29.56], "audiomae_on_audioset": [null, null, null, [["music", 46.31], ["speech", 33.88], ["throbbing", 5.68]], null, [["music", 73.59], ["throbbing", 7.08], ["hum", 5.29]], null, [["music", 54.22], ["throbbing", 16.96], ["hum", 12.02]], [["music", 71.5], ["throbbing", 6.25], ["speech", 5.08]], [["music", 47.19], ["sonar", 8.54], ["ambient music", 6.86]], [["music", 42.38], ["hum", 11.46], ["mains hum", 10.42]]], "duration": [57.15, 0.21, 32.86, 20.99, 0.24, 4.11, 0.22, 21.21, 10.44, 2.38, 26.94]} \ No newline at end of file diff --git a/annotations_1/Fp5iPmpZiNE_filtered.json b/annotations_1/Fp5iPmpZiNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78423783124dbe12ebf656be0b168157f2b8d569 --- /dev/null +++ b/annotations_1/Fp5iPmpZiNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.78], [7.0, 8.31], [11.0, 11.8], [15.0, 15.96], [17.0, 28.98], [31.0, 31.09], [32.0, 32.0], [33.0, 35.85], [37.0, 38.43], [44.0, 44.27], [47.0, 47.6], [52.0, 55.27], [58.0, 59.34], [62.0, 69.94], [70.0, 71.2], [73.0, 73.4], [76.0, 76.0], [77.0, 77.67], [80.0, 81.23], [85.0, 88.48], [97.0, 98.91], [100.0, 100.28], [102.0, 102.42], [104.0, 103.89], [107.0, 107.32], [112.0, 112.06], [113.0, 114.86], [119.0, 119.43], [121.0, 122.12], [126.0, 127.79], [129.0, 131.5]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.86, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 86.09, 0.0, 55.11, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, [["fly, housefly", 28.33], ["insect", 14.12], ["creak", 9.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 1.31, 0.8, 0.96, 11.98, 0.09, 0.0, 2.85, 1.43, 0.27, 0.6, 3.27, 1.34, 7.94, 1.2, 0.4, 0.0, 0.67, 1.23, 3.48, 1.91, 0.28, 0.42, -0.11, 0.32, 0.06, 1.86, 0.43, 1.12, 1.79, 2.5]} \ No newline at end of file diff --git a/annotations_1/FpekkNyDPcc_filtered.json b/annotations_1/FpekkNyDPcc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3f02b6aa0699bcc2815b52b1d63ec8c202c1838 --- /dev/null +++ b/annotations_1/FpekkNyDPcc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.96], [12.0, 21.74], [24.0, 24.46], [33.0, 39.78], [42.0, 41.94], [43.0, 43.28], [43.0, 48.27], [53.0, 54.19], [55.0, 82.71], [84.0, 84.64], [87.0, 89.19], [91.0, 93.38], [97.0, 97.46], [102.0, 102.69], [103.0, 103.65], [114.0, 114.4], [115.0, 115.32], [128.0, 129.05], [130.0, 130.52], [132.0, 131.85], [136.0, 136.86], [144.0, 145.03], [147.0, 149.17], [170.0, 169.87], [170.0, 173.6], [177.0, 198.59]], "keep_status": [false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 33.23, 0.0, 35.1, 0.0, 0.0, 31.54, 0.0, 34.78, 0.0, 99.99, 55.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.27, 0.0, 33.07, 32.13], "audiomae_on_audioset": [null, [["music", 66.36], ["didgeridoo", 5.85], ["crowd", 2.55]], null, [["throbbing", 25.58], ["music", 19.5], ["hum", 16.53]], null, null, [["roar", 17.74], ["boing", 8.73], ["sound effect", 7.13]], null, [["music", 41.95], ["throbbing", 9.3], ["speech", 8.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 29.22], ["breaking", 13.56], ["sound effect", 6.52]], [["speech", 31.57], ["music", 19.97], ["throbbing", 10.11]]], "duration": [0.96, 9.74, 0.46, 6.78, -0.06, 0.28, 5.27, 1.19, 27.71, 0.64, 2.19, 2.38, 0.46, 0.69, 0.65, 0.4, 0.32, 1.05, 0.52, -0.15, 0.86, 1.03, 2.17, -0.13, 3.6, 21.59]} \ No newline at end of file diff --git a/annotations_1/Fr1A3ok_kfw_filtered.json b/annotations_1/Fr1A3ok_kfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9152a1d6e49dec83dddafc653d9612e70230df5e --- /dev/null +++ b/annotations_1/Fr1A3ok_kfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.8], [13.0, 14.54], [20.0, 20.78], [26.0, 49.82], [50.0, 52.22], [53.0, 57.57], [59.0, 79.35], [81.0, 81.41], [83.0, 84.62], [86.0, 89.26], [91.0, 95.79], [97.0, 99.03], [99.0, 121.12], [127.0, 133.17], [133.0, 133.95], [136.0, 136.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 72.31, 74.29, 92.97, 61.87, 0.0, 0.0, 63.74, 86.27, 89.9, 45.21, 38.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.98], ["music", 18.95], ["cello", 10.92]], [["music", 50.63], ["cello", 6.08], ["double bass", 4.02]], null, null], "duration": [0.8, 1.54, 0.78, 23.82, 2.22, 4.57, 20.35, 0.41, 1.62, 3.26, 4.79, 2.03, 22.12, 6.17, 0.95, 0.44]} \ No newline at end of file diff --git a/annotations_1/Fr6fIMIc_Jo_filtered.json b/annotations_1/Fr6fIMIc_Jo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2a06eaf5d100b17563ff01006d3e440294c9e5b --- /dev/null +++ b/annotations_1/Fr6fIMIc_Jo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.92], [16.0, 19.87], [24.0, 23.85], [24.0, 25.1], [27.0, 26.92], [36.0, 37.94], [40.0, 39.92], [41.0, 42.3], [43.0, 45.4], [54.0, 54.35], [59.0, 61.96], [62.0, 63.54], [67.0, 68.4], [70.0, 70.26], [75.0, 78.56], [79.0, 80.65], [82.0, 83.15], [84.0, 86.75], [88.0, 91.0], [91.0, 91.79], [92.0, 91.94], [92.0, 93.19], [95.0, 99.99], [104.0, 106.0], [107.0, 109.34], [111.0, 115.96]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, true, true], "silence_prob": [0.0, 70.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.74, 0.0, 34.3, 0.0, 0.0, 0.0, 31.9, 0.0, 0.0, 35.48, 32.62, 0.0, 0.0, 0.0, 31.02, 39.25, 34.97, 36.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 49.37], ["musical instrument", 4.72], ["theremin", 4.5]], null, [["music", 46.39], ["lullaby", 4.07], ["humming", 3.48]], null, null, null, [["music", 65.31], ["musical instrument", 5.62], ["lullaby", 4.1]], null, null, [["music", 55.25], ["musical instrument", 3.25], ["keyboard (musical)", 2.75]], [["music", 42.12], ["electronic tuner", 5.04], ["lullaby", 4.79]], null, null, null, [["music", 58.84], ["yodeling", 13.57], ["singing", 4.37]], [["music", 60.6], ["musical instrument", 6.41], ["plucked string instrument", 4.82]], [["music", 14.72], ["cello", 11.56], ["cattle, bovinae", 10.2]], [["music", 37.24], ["musical instrument", 9.98], ["guitar", 6.67]]], "duration": [1.92, 3.87, -0.15, 1.1, -0.08, 1.94, -0.08, 1.3, 2.4, 0.35, 2.96, 1.54, 1.4, 0.26, 3.56, 1.65, 1.15, 2.75, 3.0, 0.79, -0.06, 1.19, 4.99, 2.0, 2.34, 4.96]} \ No newline at end of file diff --git a/annotations_1/FtPj029E3Qk_filtered.json b/annotations_1/FtPj029E3Qk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d34f92e4e0516469fda3dc1d6335479ad084ff9 --- /dev/null +++ b/annotations_1/FtPj029E3Qk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.08], [10.0, 10.34], [16.0, 16.9], [19.0, 24.97], [31.0, 32.54], [33.0, 35.45], [40.0, 40.95], [49.0, 51.22], [54.0, 56.81], [57.0, 59.27], [61.0, 62.23], [64.0, 67.66], [69.0, 71.83], [73.0, 75.44], [78.0, 78.44], [81.0, 81.18], [82.0, 84.65], [87.0, 87.69], [89.0, 90.37], [101.0, 106.32], [108.0, 108.5], [115.0, 115.8], [117.0, 117.22], [118.0, 120.8], [125.0, 126.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.05, 0.0, 57.25, 0.0, 91.13, 98.01, 56.7, 0.0, 80.11, 92.31, 36.44, 0.0, 0.0, 68.93, 0.0, 0.0, 72.9, 0.0, 0.0, 0.0, 68.54, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 69.19], ["musical instrument", 5.53], ["speech", 5.34]], null, null, null, null, null, null, null, null, null, [["sonar", 23.01], ["sidetone", 22.3], ["music", 13.9]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.08, 0.34, 0.9, 5.97, 1.54, 2.45, 0.95, 2.22, 2.81, 2.27, 1.23, 3.66, 2.83, 2.44, 0.44, 0.18, 2.65, 0.69, 1.37, 5.32, 0.5, 0.8, 0.22, 2.8, 1.08]} \ No newline at end of file diff --git a/annotations_1/FuYjhxmpoOQ_filtered.json b/annotations_1/FuYjhxmpoOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52e232a1aee7fad6d421743f821e9c97d8cb225b --- /dev/null +++ b/annotations_1/FuYjhxmpoOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.82], [9.0, 9.59], [14.0, 17.52], [20.0, 40.8], [45.0, 50.75], [58.0, 69.92], [73.0, 74.82], [76.0, 80.18], [81.0, 85.21], [92.0, 103.59], [106.0, 107.33], [109.0, 113.24], [114.0, 115.37], [118.0, 119.89], [121.0, 124.19], [126.0, 126.47], [127.0, 128.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 65.79, 47.86, 32.9, 40.34, 0.0, 57.01, 40.12, 35.65, 0.0, 71.72, 0.0, 0.0, 98.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 66.09], ["synthesizer", 6.47], ["ambient music", 4.39]], [["didgeridoo", 66.28], ["music", 18.18], ["hum", 2.96]], [["music", 40.41], ["didgeridoo", 21.7], ["speech", 9.26]], null, null, [["music", 70.54], ["theremin", 12.82], ["musical instrument", 1.65]], [["music", 73.39], ["theremin", 7.53], ["didgeridoo", 3.26]], null, null, null, null, null, null, null], "duration": [0.82, 0.59, 3.52, 20.8, 5.75, 11.92, 1.82, 4.18, 4.21, 11.59, 1.33, 4.24, 1.37, 1.89, 3.19, 0.47, 1.93]} \ No newline at end of file diff --git a/annotations_1/FubpK1Tho6M_filtered.json b/annotations_1/FubpK1Tho6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc4d8600a5c37dd5be0b426d6c67ae5267f3b014 --- /dev/null +++ b/annotations_1/FubpK1Tho6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 41.94], [42.0, 42.52], [43.0, 45.45], [48.0, 54.09], [54.0, 54.33], [54.0, 54.45], [54.0, 111.6], [114.0, 130.89], [132.0, 134.77]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [29.82, 0.0, 29.72, 29.4, 0.0, 0.0, 0.0, 30.43, 32.77], "audiomae_on_audioset": [[["music", 40.73], ["gong", 27.24], ["ambient music", 7.18]], null, [["music", 35.95], ["ambient music", 29.68], ["synthesizer", 8.39]], [["gong", 44.15], ["music", 20.07], ["hum", 13.66]], null, null, null, [["music", 54.82], ["hum", 12.22], ["throbbing", 7.17]], [["music", 48.62], ["mains hum", 15.27], ["hum", 14.66]]], "duration": [11.94, 0.52, 2.45, 6.09, 0.33, 0.45, 57.6, 16.89, 2.77]} \ No newline at end of file diff --git a/annotations_1/Fw19beLDqn8_filtered.json b/annotations_1/Fw19beLDqn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a02077e329e41073d8e88d2fd2b12782ceb7be1d --- /dev/null +++ b/annotations_1/Fw19beLDqn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 53.99], [57.0, 61.94], [67.0, 68.17], [69.0, 69.18], [70.0, 70.34], [77.0, 77.4], [80.0, 81.65], [84.0, 84.43], [85.0, 85.89], [87.0, 98.51], [99.0, 103.22], [104.0, 112.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.99, 41.6, 83.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["echo", 11.82], ["effects unit", 11.61], ["quack", 10.65]], null], "duration": [0.99, 4.94, 1.17, 0.18, 0.34, 0.4, 1.65, 0.43, 0.89, 11.51, 4.22, 8.8]} \ No newline at end of file diff --git a/annotations_1/FxcIBbXalVg_filtered.json b/annotations_1/FxcIBbXalVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1243bdf4fc1d7510ebc604b546a6f0e0cf87cc29 --- /dev/null +++ b/annotations_1/FxcIBbXalVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.08], [17.0, 18.84], [27.0, 29.4], [30.0, 36.41], [40.0, 41.84], [44.0, 44.83], [46.0, 49.28], [52.0, 53.25], [55.0, 60.67], [64.0, 64.49], [67.0, 67.1], [68.0, 71.34], [73.0, 73.31], [75.0, 75.46], [76.0, 78.33], [79.0, 80.52], [82.0, 84.35], [85.0, 87.78], [91.0, 91.42], [92.0, 93.24], [94.0, 106.46], [111.0, 112.16], [112.0, 115.11], [116.0, 117.51], [120.0, 120.73], [121.0, 122.2], [125.0, 128.04], [130.0, 142.55], [148.0, 149.54], [165.0, 165.99], [169.0, 171.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [95.91, 0.0, 97.92, 53.28, 0.0, 0.0, 60.42, 0.0, 99.65, 0.0, 0.0, 97.83, 0.0, 0.0, 69.07, 0.0, 81.89, 47.12, 0.0, 0.0, 92.31, 0.0, 80.64, 0.0, 0.0, 0.0, 38.71, 31.4, 0.0, 0.0, 83.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.14], ["music", 30.36], ["guitar", 4.19]], null, null, null, null, null, null, null, null, [["speech", 51.28], ["sidetone", 12.54], ["radio", 10.31]], [["speech", 31.81], ["whack, thwack", 19.13], ["fart", 18.53]], null, null, null], "duration": [2.08, 1.84, 2.4, 6.41, 1.84, 0.83, 3.28, 1.25, 5.67, 0.49, 0.1, 3.34, 0.31, 0.46, 2.33, 1.52, 2.35, 2.78, 0.42, 1.24, 12.46, 1.16, 3.11, 1.51, 0.73, 1.2, 3.04, 12.55, 1.54, 0.99, 2.78]} \ No newline at end of file diff --git a/annotations_1/FxvvnlcqLz0_filtered.json b/annotations_1/FxvvnlcqLz0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d9e5bdcfdb058c9f957881ea2bf7b5dd7956fe5 --- /dev/null +++ b/annotations_1/FxvvnlcqLz0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 89.45], [96.0, 122.74], [124.0, 129.49]], "keep_status": [false, false, false], "silence_prob": [0.0, 30.95, 43.74], "audiomae_on_audioset": [null, [["music", 70.39], ["musical instrument", 2.65], ["theremin", 2.09]], [["music", 63.51], ["brass instrument", 3.47], ["musical instrument", 3.41]]], "duration": [73.45, 26.74, 5.49]} \ No newline at end of file diff --git a/annotations_1/Fz2HMTuqy98_filtered.json b/annotations_1/Fz2HMTuqy98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45ad7956b8d15a631f5196b394b654c20b83f8e1 --- /dev/null +++ b/annotations_1/Fz2HMTuqy98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.9], [7.0, 8.4], [11.0, 11.67], [31.0, 34.43], [40.0, 40.96], [41.0, 42.36], [44.0, 48.57], [63.0, 64.67], [66.0, 66.82], [68.0, 68.54], [71.0, 76.98], [83.0, 82.66], [83.0, 92.28], [94.0, 96.33], [99.0, 101.04], [102.0, 104.53], [105.0, 106.46], [108.0, 110.34], [111.0, 112.41], [113.0, 114.49], [115.0, 125.0], [128.0, 157.59], [159.0, 161.11]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [75.23, 0.0, 0.0, 35.65, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 29.88, 0.0, 42.3, 68.15, 50.51, 55.96, 0.0, 53.97, 0.0, 0.0, 30.9, 32.25, 40.21], "audiomae_on_audioset": [null, null, null, [["thunk", 16.51], ["didgeridoo", 15.86], ["speech", 7.72]], null, null, null, null, null, null, [["throbbing", 48.51], ["music", 33.01], ["hum", 7.91]], null, [["music", 61.84], ["didgeridoo", 7.33], ["speech", 5.86]], null, null, null, null, null, null, null, [["music", 56.73], ["didgeridoo", 21.63], ["hum", 5.65]], [["music", 37.91], ["throbbing", 35.92], ["hum", 12.19]], [["music", 48.16], ["didgeridoo", 7.03], ["electronic music", 5.93]]], "duration": [3.9, 1.4, 0.67, 3.43, 0.96, 1.36, 4.57, 1.67, 0.82, 0.54, 5.98, -0.34, 9.28, 2.33, 2.04, 2.53, 1.46, 2.34, 1.41, 1.49, 10.0, 29.59, 2.11]} \ No newline at end of file diff --git a/annotations_1/Fz43jl18aiY_filtered.json b/annotations_1/Fz43jl18aiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fccd8d0bde964053bb1d07e9554f2eaba4d7b815 --- /dev/null +++ b/annotations_1/Fz43jl18aiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 18.76], [20.0, 20.22], [24.0, 23.7], [26.0, 26.79], [28.0, 29.12], [30.0, 32.21], [33.0, 33.64], [36.0, 49.32], [57.0, 61.75], [63.0, 66.72]], "keep_status": [true, false, false, false, false, false, false, true, true, true], "silence_prob": [31.97, 0.0, 0.0, 0.0, 0.0, 53.22, 0.0, 33.31, 30.09, 30.83], "audiomae_on_audioset": [[["noise", 31.36], ["hum", 19.21], ["mains hum", 13.66]], null, null, null, null, null, null, [["animal", 39.57], ["roaring cats (lions, tigers)", 13.41], ["music", 10.66]], [["speech", 44.43], ["music", 16.53], ["animal", 5.57]], [["speech", 29.73], ["music", 19.68], ["laughter", 6.72]]], "duration": [7.76, 0.22, -0.3, 0.79, 1.12, 2.21, 0.64, 13.32, 4.75, 3.72]} \ No newline at end of file diff --git a/annotations_1/Fz7dtq-saJo_filtered.json b/annotations_1/Fz7dtq-saJo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4625ac53c510f2111dfdccdd0e2fb6bac6b6f27 --- /dev/null +++ b/annotations_1/Fz7dtq-saJo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.96], [8.0, 8.87], [13.0, 14.88], [17.0, 18.33], [22.0, 23.79], [25.0, 27.28], [29.0, 30.84], [37.0, 44.24], [54.0, 54.62], [56.0, 73.26], [75.0, 74.75], [86.0, 88.38], [92.0, 91.93], [97.0, 102.76], [105.0, 105.56], [106.0, 107.65], [109.0, 109.76], [111.0, 111.32], [112.0, 113.36], [116.0, 116.65], [121.0, 121.26], [126.0, 130.69], [131.0, 131.84], [133.0, 133.88], [135.0, 134.89], [138.0, 138.1], [147.0, 148.54], [153.0, 156.84], [158.0, 159.73], [162.0, 162.72], [164.0, 164.39], [165.0, 170.13], [171.0, 171.53], [176.0, 175.96], [178.0, 178.97], [184.0, 184.27], [185.0, 185.57], [186.0, 187.66], [191.0, 211.1], [214.0, 218.62], [220.0, 221.53], [223.0, 228.45], [229.0, 231.2], [233.0, 233.41], [243.0, 249.62], [252.0, 252.71], [257.0, 258.43], [259.0, 260.29], [263.0, 264.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 69.07, 0.0, 78.89, 0.0, 35.01, 0.0, 48.02, 0.0, 41.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.53, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 51.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.41, 64.97, 0.0, 76.37, 46.64, 0.0, 44.32, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 55.11], ["noise", 13.39], ["sidetone", 12.77]], null, [["speech", 82.87], ["speech synthesizer", 8.53], ["radio", 2.76]], null, [["speech", 90.41], ["frog", 2.41], ["animal", 0.98]], null, null, null, null, null, null, null, [["speech", 70.63], ["boing", 8.8], ["music", 7.04]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.7], ["speech", 30.36], ["fart", 5.27]], null, [["music", 45.04], ["didgeridoo", 23.19], ["thunk", 3.34]], null, null, null, null], "duration": [0.96, 0.87, 1.88, 1.33, 1.79, 2.28, 1.84, 7.24, 0.62, 17.26, -0.25, 2.38, -0.07, 5.76, 0.56, 1.65, 0.76, 0.32, 1.36, 0.65, 0.26, 4.69, 0.84, 0.88, -0.11, 0.1, 1.54, 3.84, 1.73, 0.72, 0.39, 5.13, 0.53, -0.04, 0.97, 0.27, 0.57, 1.66, 20.1, 4.62, 1.53, 5.45, 2.2, 0.41, 6.62, 0.71, 1.43, 1.29, 1.22]} \ No newline at end of file diff --git a/annotations_1/G1uBkHVIGfc_filtered.json b/annotations_1/G1uBkHVIGfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f055f10503206ad4e46e0fed1701512ccf335408 --- /dev/null +++ b/annotations_1/G1uBkHVIGfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [5.0, 6.0], [7.0, 7.47], [8.0, 8.36], [9.0, 10.3], [11.0, 11.72], [14.0, 15.72], [16.0, 17.44], [23.0, 24.46], [28.0, 28.78], [33.0, 33.12], [36.0, 36.32], [40.0, 42.08], [46.0, 47.26], [50.0, 50.5], [60.0, 61.57], [63.0, 63.32], [64.0, 64.32], [66.0, 65.85], [68.0, 69.31], [72.0, 72.23], [79.0, 79.07], [80.0, 79.89], [86.0, 85.95], [87.0, 87.69], [91.0, 91.57], [92.0, 92.77], [93.0, 95.86], [96.0, 96.96], [99.0, 100.01], [107.0, 107.18], [111.0, 111.5], [114.0, 114.66], [120.0, 119.99], [120.0, 120.65], [122.0, 121.91], [122.0, 123.08], [124.0, 127.8], [129.0, 129.61], [130.0, 130.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 1.0, 0.47, 0.36, 1.3, 0.72, 1.72, 1.44, 1.46, 0.78, 0.12, 0.32, 2.08, 1.26, 0.5, 1.57, 0.32, 0.32, -0.15, 1.31, 0.23, 0.07, -0.11, -0.05, 0.69, 0.57, 0.77, 2.86, 0.96, 1.01, 0.18, 0.5, 0.66, -0.01, 0.65, -0.09, 1.08, 3.8, 0.61, 0.91]} \ No newline at end of file diff --git a/annotations_1/G2EcYJ6Zjrk_filtered.json b/annotations_1/G2EcYJ6Zjrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0d20d1c6e3513d4b4c6e25b94a5a939801c4b9b --- /dev/null +++ b/annotations_1/G2EcYJ6Zjrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 25.73], [27.0, 48.84], [50.0, 50.68], [55.0, 56.13], [57.0, 57.82], [61.0, 62.01], [64.0, 65.03], [67.0, 68.39], [68.0, 162.45], [164.0, 177.8]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [39.33, 31.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.98], "audiomae_on_audioset": [[["fart", 23.51], ["mosquito", 8.81], ["fly, housefly", 6.73]], [["cattle, bovinae", 46.42], ["livestock, farm animals, working animals", 29.46], ["moo", 20.35]], null, null, null, null, null, null, null, null], "duration": [2.73, 21.84, 0.68, 1.13, 0.82, 1.01, 1.03, 1.39, 94.45, 13.8]} \ No newline at end of file diff --git a/annotations_1/G2ngOQwMMek_filtered.json b/annotations_1/G2ngOQwMMek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01f181f5778d14a2477d3c24a9a22717f52aa0b2 --- /dev/null +++ b/annotations_1/G2ngOQwMMek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.57], [15.0, 21.88], [45.0, 45.57], [48.0, 48.93], [58.0, 58.62], [59.0, 62.75], [70.0, 70.29], [72.0, 72.15], [84.0, 84.69], [86.0, 86.41], [90.0, 90.88], [101.0, 102.59], [103.0, 103.65], [108.0, 108.16], [112.0, 116.26], [124.0, 124.06], [127.0, 127.63], [128.0, 128.83], [136.0, 136.22], [139.0, 139.6], [140.0, 144.17], [146.0, 146.45], [152.0, 157.81]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 38.8, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.94, 0.0, 0.0, 0.0, 0.0, 0.0, 33.14, 0.0, 41.3], "audiomae_on_audioset": [null, [["hum", 27.15], ["speech", 21.32], ["mains hum", 12.03]], null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 35.16], ["speech", 19.61], ["throbbing", 15.08]], null, null, null, null, null, [["fart", 34.86], ["grunt", 13.43], ["fly, housefly", 5.78]], null, [["fart", 23.21], ["whale vocalization", 22.98], ["animal", 6.95]]], "duration": [0.57, 6.88, 0.57, 0.93, 0.62, 3.75, 0.29, 0.15, 0.69, 0.41, 0.88, 1.59, 0.65, 0.16, 4.26, 0.06, 0.63, 0.83, 0.22, 0.6, 4.17, 0.45, 5.81]} \ No newline at end of file diff --git a/annotations_1/G3TWgClyD9E_filtered.json b/annotations_1/G3TWgClyD9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f24f76cc1fab7796f8550798b598a02cbd088cdd --- /dev/null +++ b/annotations_1/G3TWgClyD9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.29], [6.0, 6.44], [19.0, 20.58], [25.0, 26.86], [28.0, 31.14], [36.0, 39.61], [41.0, 51.24], [56.0, 55.9], [61.0, 61.82], [71.0, 71.19], [78.0, 100.38], [101.0, 102.29], [103.0, 106.07], [111.0, 111.15], [117.0, 117.58], [124.0, 125.27], [127.0, 127.36], [130.0, 131.7], [137.0, 138.69], [146.0, 149.55], [155.0, 156.14]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [28.22, 0.0, 0.0, 0.0, 28.97, 29.18, 28.85, 0.0, 0.0, 0.0, 33.3, 0.0, 41.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.52, 0.0], "audiomae_on_audioset": [[["vehicle", 23.86], ["car", 12.4], ["speech", 10.21]], null, null, null, [["whale vocalization", 50.49], ["music", 15.41], ["sound effect", 2.94]], [["music", 51.25], ["throbbing", 18.62], ["hum", 11.41]], [["speech", 16.49], ["music", 9.17], ["livestock, farm animals, working animals", 6.14]], null, null, null, [["music", 49.72], ["speech", 20.97], ["whack, thwack", 5.82]], null, [["music", 63.15], ["singing", 3.22], ["musical instrument", 2.74]], null, null, null, null, null, null, [["music", 74.71], ["guitar", 3.0], ["musical instrument", 2.69]], null], "duration": [2.29, 0.44, 1.58, 1.86, 3.14, 3.61, 10.24, -0.1, 0.82, 0.19, 22.38, 1.29, 3.07, 0.15, 0.58, 1.27, 0.36, 1.7, 1.69, 3.55, 1.14]} \ No newline at end of file diff --git a/annotations_1/G3qOB7PGBXE_filtered.json b/annotations_1/G3qOB7PGBXE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bdc343654263978d16ba34d692f123baf56c8b5 --- /dev/null +++ b/annotations_1/G3qOB7PGBXE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.98], [16.0, 21.22], [24.0, 24.44], [25.0, 43.41], [44.0, 45.67], [48.0, 51.95], [57.0, 58.26], [59.0, 63.39], [65.0, 66.55], [71.0, 71.15], [75.0, 75.76], [76.0, 77.36], [82.0, 87.25], [88.0, 89.45], [92.0, 99.77], [104.0, 107.67], [109.0, 110.54], [112.0, 112.08], [113.0, 119.04], [126.0, 131.25]], "keep_status": [false, true, false, true, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.86, 0.0, 37.44, 0.0, 57.48, 0.0, 43.03, 0.0, 0.0, 0.0, 0.0, 30.56, 0.0, 38.11, 61.67, 0.0, 0.0, 29.12, 29.52], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 30.71], ["moo", 20.72], ["cattle, bovinae", 17.76]], null, [["owl", 20.79], ["fly, housefly", 18.09], ["hoot", 14.61]], null, null, null, [["cattle, bovinae", 23.32], ["moo", 20.02], ["livestock, farm animals, working animals", 16.35]], null, null, null, null, [["music", 39.1], ["speech", 25.84], ["burst, pop", 3.11]], null, [["speech", 37.54], ["music", 34.07], ["hum", 4.22]], null, null, null, [["music", 61.27], ["speech", 22.74], ["rattle (instrument)", 3.2]], [["throbbing", 60.96], ["music", 23.03], ["hum", 6.34]]], "duration": [0.98, 5.22, 0.44, 18.41, 1.67, 3.95, 1.26, 4.39, 1.55, 0.15, 0.76, 1.36, 5.25, 1.45, 7.77, 3.67, 1.54, 0.08, 6.04, 5.25]} \ No newline at end of file diff --git a/annotations_1/G4ENL-T7Dyk_filtered.json b/annotations_1/G4ENL-T7Dyk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d036d505ba98efecac44ca55e9993e5fe9d1ee3 --- /dev/null +++ b/annotations_1/G4ENL-T7Dyk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.49], [7.0, 6.99], [16.0, 20.07], [21.0, 22.92], [26.0, 30.67], [33.0, 37.45], [48.0, 48.52], [49.0, 49.0], [53.0, 60.67], [62.0, 70.43], [92.0, 91.86], [95.0, 95.25], [96.0, 95.94], [96.0, 96.62], [97.0, 106.22], [115.0, 115.86], [125.0, 127.41], [130.0, 133.08], [133.0, 133.47], [135.0, 134.92], [138.0, 144.58], [146.0, 158.36], [162.0, 163.61]], "keep_status": [false, false, false, false, true, true, false, false, true, true, false, false, false, false, true, false, true, true, false, false, true, true, false], "silence_prob": [0.0, 0.0, 60.14, 0.0, 33.42, 33.29, 0.0, 0.0, 32.52, 39.24, 0.0, 0.0, 0.0, 0.0, 34.81, 0.0, 42.53, 38.28, 0.0, 0.0, 34.78, 32.01, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 36.63], ["explosion", 7.57], ["whack, thwack", 5.96]], [["fly, housefly", 16.13], ["insect", 16.12], ["speech", 14.21]], null, null, [["speech", 21.7], ["livestock, farm animals, working animals", 17.19], ["cattle, bovinae", 11.85]], [["speech", 24.31], ["sidetone", 12.45], ["fly, housefly", 12.35]], null, null, null, null, [["speech", 56.77], ["rumble", 6.73], ["creak", 5.15]], null, [["speech", 14.85], ["music", 14.24], ["vehicle", 6.67]], [["speech", 51.32], ["music", 14.49], ["vehicle", 2.54]], null, null, [["speech", 52.91], ["eruption", 5.92], ["rumble", 5.73]], [["speech", 13.19], ["cattle, bovinae", 7.81], ["fly, housefly", 7.69]], null], "duration": [0.49, -0.01, 4.07, 1.92, 4.67, 4.45, 0.52, 0.0, 7.67, 8.43, -0.14, 0.25, -0.06, 0.62, 9.22, 0.86, 2.41, 3.08, 0.47, -0.08, 6.58, 12.36, 1.61]} \ No newline at end of file diff --git a/annotations_1/G5_nIhUCuhk_filtered.json b/annotations_1/G5_nIhUCuhk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db3731915cc17fad6d8c659d1860054af27d5d0f --- /dev/null +++ b/annotations_1/G5_nIhUCuhk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 15.69], [16.0, 18.1], [21.0, 24.39], [25.0, 27.01], [29.0, 29.83], [30.0, 31.5], [32.0, 33.15], [35.0, 41.13], [59.0, 59.48], [68.0, 68.37], [73.0, 73.7], [74.0, 74.83], [76.0, 76.37], [79.0, 78.9], [81.0, 80.91], [83.0, 82.8], [83.0, 94.2], [96.0, 96.08], [96.0, 96.85], [97.0, 98.32], [114.0, 114.71], [115.0, 115.57], [117.0, 117.64], [118.0, 117.98], [120.0, 120.18], [122.0, 122.28], [125.0, 124.83], [125.0, 127.45], [128.0, 129.81], [131.0, 130.92], [132.0, 133.3], [135.0, 134.87], [137.0, 136.8], [137.0, 138.16], [141.0, 140.88], [142.0, 142.26], [145.0, 144.88], [148.0, 148.73], [155.0, 155.58], [157.0, 157.27], [160.0, 160.0], [167.0, 167.41]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.1, 91.13, 39.74, 100.0, 0.0, 0.0, 0.0, 32.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 41.22], ["stomach rumble", 5.9], ["fart", 4.67]], null, [["speech", 51.26], ["telephone", 19.87], ["dial tone", 5.34]], null, null, null, null, [["speech", 51.32], ["music", 9.82], ["radio", 8.82]], null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 26.21], ["moo", 12.39], ["cattle, bovinae", 9.0]], null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 27.53], ["boing", 7.5], ["echo", 6.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.69, 2.1, 3.39, 2.01, 0.83, 1.5, 1.15, 6.13, 0.48, 0.37, 0.7, 0.83, 0.37, -0.1, -0.09, -0.2, 11.2, 0.08, 0.85, 1.32, 0.71, 0.57, 0.64, -0.02, 0.18, 0.28, -0.17, 2.45, 1.81, -0.08, 1.3, -0.13, -0.2, 1.16, -0.12, 0.26, -0.12, 0.73, 0.58, 0.27, 0.0, 0.41]} \ No newline at end of file diff --git a/annotations_1/G5aoRyZ-QtM_filtered.json b/annotations_1/G5aoRyZ-QtM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef81e879e05539de998d4f9a168ca14900070de3 --- /dev/null +++ b/annotations_1/G5aoRyZ-QtM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 30.16], [30.0, 51.39], [61.0, 67.44], [70.0, 80.84], [86.0, 87.12], [97.0, 97.68], [101.0, 101.68], [103.0, 104.6], [107.0, 108.4], [110.0, 110.61], [117.0, 119.97], [122.0, 122.71], [124.0, 128.82], [135.0, 135.43], [139.0, 139.38], [140.0, 143.95], [145.0, 149.32], [151.0, 155.65], [159.0, 160.02], [164.0, 164.62], [170.0, 172.02], [173.0, 174.06]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [34.63, 33.66, 32.17, 41.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.51, 0.0, 34.54, 0.0, 0.0, 39.74, 67.0, 56.93, 0.0, 0.0, 89.54, 0.0], "audiomae_on_audioset": [[["music", 35.82], ["throbbing", 33.6], ["hum", 17.25]], [["music", 66.06], ["speech", 7.2], ["didgeridoo", 6.69]], [["music", 51.95], ["throbbing", 12.0], ["speech", 11.85]], [["creak", 17.55], ["coin (dropping)", 11.58], ["mechanisms", 8.42]], null, null, null, null, null, null, null, null, [["music", 39.18], ["didgeridoo", 5.69], ["throbbing", 4.96]], null, null, [["hum", 60.83], ["mains hum", 10.88], ["throbbing", 10.83]], null, null, null, null, null, null], "duration": [10.16, 21.39, 6.44, 10.84, 1.12, 0.68, 0.68, 1.6, 1.4, 0.61, 2.97, 0.71, 4.82, 0.43, 0.38, 3.95, 4.32, 4.65, 1.02, 0.62, 2.02, 1.06]} \ No newline at end of file diff --git a/annotations_1/G61d-lcbLT4_filtered.json b/annotations_1/G61d-lcbLT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63332d6a02101c4d1ff00c3d6edf6d24b75c22ae --- /dev/null +++ b/annotations_1/G61d-lcbLT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.53], [12.0, 14.18], [18.0, 18.79], [26.0, 29.91], [38.0, 43.33], [44.0, 49.74], [51.0, 71.47], [73.0, 75.71], [78.0, 80.7], [81.0, 80.86], [85.0, 94.66], [99.0, 114.3], [122.0, 128.58], [133.0, 134.22], [137.0, 137.03], [138.0, 138.38]], "keep_status": [true, false, false, false, false, true, true, true, true, false, false, true, true, false, false, false], "silence_prob": [38.02, 48.61, 0.0, 29.9, 30.02, 32.56, 29.82, 28.86, 30.96, 0.0, 29.01, 29.27, 31.88, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 39.76], ["throbbing", 21.55], ["mains hum", 7.92]], [["hum", 61.77], ["mains hum", 21.7], ["throbbing", 8.29]], null, [["music", 65.01], ["electronic music", 5.49], ["synthesizer", 3.09]], [["music", 73.48], ["speech", 15.8], ["synthesizer", 3.06]], [["music", 25.0], ["hum", 24.24], ["speech", 16.63]], [["music", 35.41], ["throbbing", 19.93], ["synthesizer", 11.5]], [["aircraft", 20.71], ["propeller, airscrew", 14.47], ["vehicle", 13.69]], [["music", 50.19], ["throbbing", 8.58], ["single-lens reflex camera", 5.07]], null, [["music", 54.68], ["speech", 15.96], ["cacophony", 4.41]], [["music", 63.39], ["speech", 2.79], ["electronic music", 2.75]], [["speech", 21.37], ["hum", 12.67], ["music", 10.65]], null, null, null], "duration": [3.53, 2.18, 0.79, 3.91, 5.33, 5.74, 20.47, 2.71, 2.7, -0.14, 9.66, 15.3, 6.58, 1.22, 0.03, 0.38]} \ No newline at end of file diff --git a/annotations_1/G629a_3MkkI_filtered.json b/annotations_1/G629a_3MkkI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2649ef6511072f7c017706da9082f07a3f8074d2 --- /dev/null +++ b/annotations_1/G629a_3MkkI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.42], [10.0, 14.44], [15.0, 15.84], [17.0, 26.92], [30.0, 30.06], [31.0, 32.09], [33.0, 36.04], [37.0, 37.66], [40.0, 44.37], [45.0, 49.65], [51.0, 52.07], [53.0, 64.05], [73.0, 76.03], [107.0, 109.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [61.18, 74.44, 0.0, 98.66, 0.0, 0.0, 100.0, 0.0, 100.0, 83.34, 0.0, 99.48, 98.99, 88.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.42, 4.44, 0.84, 9.92, 0.06, 1.09, 3.04, 0.66, 4.37, 4.65, 1.07, 11.05, 3.03, 2.04]} \ No newline at end of file diff --git a/annotations_1/G64ubBUMVek_filtered.json b/annotations_1/G64ubBUMVek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bfeb40ebd0ffee3d30eeca94b9b5013030c1240 --- /dev/null +++ b/annotations_1/G64ubBUMVek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.39], [19.0, 18.59], [28.0, 27.87], [32.0, 33.86], [37.0, 38.33], [39.0, 39.41], [46.0, 48.14], [50.0, 52.0], [61.0, 61.25], [73.0, 73.21], [79.0, 82.78], [83.0, 84.11], [87.0, 87.66], [90.0, 90.78], [92.0, 92.96], [94.0, 93.78], [94.0, 94.93], [102.0, 102.52], [108.0, 109.32], [112.0, 112.43], [115.0, 114.71], [116.0, 116.55], [117.0, 118.03], [119.0, 119.57], [126.0, 127.52], [130.0, 130.01], [132.0, 134.49], [140.0, 141.74], [142.0, 143.06], [144.0, 144.26], [147.0, 147.45], [148.0, 148.44], [149.0, 149.15], [151.0, 152.2], [154.0, 154.2]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.07, 88.83, 0.0, 0.0, 42.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 24.07], ["livestock, farm animals, working animals", 7.27], ["sheep", 5.15]], null, null, null, [["speech", 84.52], ["telephone", 2.63], ["conversation", 1.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.06], ["radio", 9.09], ["sidetone", 4.83]], null, null, null, null, null, null, null, null], "duration": [0.39, -0.41, -0.13, 1.86, 1.33, 0.41, 2.14, 2.0, 0.25, 0.21, 3.78, 1.11, 0.66, 0.78, 0.96, -0.22, 0.93, 0.52, 1.32, 0.43, -0.29, 0.55, 1.03, 0.57, 1.52, 0.01, 2.49, 1.74, 1.06, 0.26, 0.45, 0.44, 0.15, 1.2, 0.2]} \ No newline at end of file diff --git a/annotations_1/G6PcFmNCQpA_filtered.json b/annotations_1/G6PcFmNCQpA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5d8cae634806d73e7f91ec82929ecd9710b9f0a --- /dev/null +++ b/annotations_1/G6PcFmNCQpA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [5.0, 6.15], [8.0, 8.88], [10.0, 11.23], [12.0, 13.46], [14.0, 29.07], [32.0, 34.38], [35.0, 37.64], [39.0, 43.73], [45.0, 45.91], [50.0, 83.94], [85.0, 85.55], [86.0, 86.9], [88.0, 88.48], [91.0, 96.5], [98.0, 98.73], [100.0, 104.84], [105.0, 105.68], [107.0, 106.96], [108.0, 108.82], [110.0, 110.93], [111.0, 111.52], [112.0, 127.7], [131.0, 139.67], [140.0, 141.89], [148.0, 148.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 45.21, 69.07, 69.74, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 48.35, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 44.99], ["throbbing", 20.28], ["hum", 7.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 21.2], ["hum", 21.0], ["insect", 13.16]], null, null], "duration": [1.0, 1.15, 0.88, 1.23, 1.46, 15.07, 2.38, 2.64, 4.73, 0.91, 33.94, 0.55, 0.9, 0.48, 5.5, 0.73, 4.84, 0.68, -0.04, 0.82, 0.93, 0.52, 15.7, 8.67, 1.89, 0.98]} \ No newline at end of file diff --git a/annotations_1/G6f0w5BRasw_filtered.json b/annotations_1/G6f0w5BRasw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82cbf54f645ab00019020912369b2549d82a77a4 --- /dev/null +++ b/annotations_1/G6f0w5BRasw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.94], [9.0, 11.74], [15.0, 16.29], [17.0, 25.35], [26.0, 35.07], [36.0, 35.94], [38.0, 48.41], [49.0, 50.04], [52.0, 59.66], [60.0, 62.38], [63.0, 65.3], [66.0, 68.13], [69.0, 72.01], [73.0, 73.72], [75.0, 76.96], [78.0, 82.75], [83.0, 86.8], [88.0, 88.35], [89.0, 89.51], [90.0, 92.16], [93.0, 94.12], [96.0, 95.86], [101.0, 104.18], [105.0, 110.66], [111.0, 112.16], [113.0, 114.18], [115.0, 116.14], [118.0, 120.06], [120.0, 122.35], [123.0, 132.12], [133.0, 134.87], [135.0, 158.38], [161.0, 162.75], [166.0, 168.44], [170.0, 173.79], [175.0, 175.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.19, 0.0, 64.07, 99.97, 0.0, 78.21, 0.0, 82.43, 62.78, 96.04, 62.27, 92.31, 0.0, 0.0, 75.39, 46.9, 0.0, 0.0, 40.66, 0.0, 0.0, 61.08, 37.75, 0.0, 0.0, 0.0, 47.82, 40.21, 34.85, 0.0, 33.11, 0.0, 77.36, 70.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["singing bowl", 40.14], ["speech", 25.51], ["music", 14.81]], null, null, [["music", 66.04], ["didgeridoo", 3.61], ["synthesizer", 2.72]], null, null, null, [["music", 53.92], ["speech", 10.53], ["quack", 7.94]], null, null, null, [["music", 40.64], ["musical instrument", 8.99], ["guitar", 5.97]], [["music", 35.13], ["speech", 31.62], ["boing", 4.04]], [["music", 49.47], ["speech", 39.34], ["tap", 1.81]], null, [["music", 47.73], ["whack, thwack", 17.86], ["speech", 10.29]], null, null, null, null], "duration": [0.94, 2.74, 1.29, 8.35, 9.07, -0.06, 10.41, 1.04, 7.66, 2.38, 2.3, 2.13, 3.01, 0.72, 1.96, 4.75, 3.8, 0.35, 0.51, 2.16, 1.12, -0.14, 3.18, 5.66, 1.16, 1.18, 1.14, 2.06, 2.35, 9.12, 1.87, 23.38, 1.75, 2.44, 3.79, 0.61]} \ No newline at end of file diff --git a/annotations_1/G76ThtqLvWk_filtered.json b/annotations_1/G76ThtqLvWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3382c2d9da148c3302bf7743cfe6bc7a9cc93367 --- /dev/null +++ b/annotations_1/G76ThtqLvWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.23], [13.0, 44.52], [47.0, 66.88], [67.0, 72.81], [74.0, 102.93], [107.0, 110.78], [112.0, 120.38], [121.0, 121.8], [122.0, 122.98], [124.0, 175.44], [177.0, 178.7], [180.0, 193.09], [193.0, 200.35], [202.0, 202.61]], "keep_status": [false, false, false, true, false, true, true, false, false, false, false, false, false, false], "silence_prob": [31.01, 0.0, 30.14, 30.28, 30.05, 30.06, 30.97, 0.0, 0.0, 0.0, 0.0, 35.03, 33.36, 0.0], "audiomae_on_audioset": [[["music", 53.87], ["throbbing", 8.92], ["hum", 8.26]], null, [["music", 49.37], ["throbbing", 16.04], ["hum", 12.11]], [["mains hum", 24.47], ["music", 21.06], ["hum", 18.91]], [["speech", 43.23], ["music", 18.11], ["hum", 10.41]], [["music", 28.03], ["vehicle", 16.76], ["buzz", 8.1]], [["music", 22.24], ["insect", 15.12], ["fly, housefly", 14.49]], null, null, null, null, [["hum", 40.34], ["throbbing", 38.15], ["mains hum", 8.12]], [["throbbing", 39.5], ["music", 26.02], ["speech", 8.8]], null], "duration": [11.23, 31.52, 19.88, 5.81, 28.93, 3.78, 8.38, 0.8, 0.98, 51.44, 1.7, 13.09, 7.35, 0.61]} \ No newline at end of file diff --git a/annotations_1/G77UaCXuoOs_filtered.json b/annotations_1/G77UaCXuoOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb02a4eb792acb4f0bf10e95c5ba77a086949531 --- /dev/null +++ b/annotations_1/G77UaCXuoOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[85.0, 116.26], [117.0, 137.08]], "keep_status": [false, true], "silence_prob": [0.0, 34.15], "audiomae_on_audioset": [null, [["speech", 37.95], ["hum", 14.63], ["music", 13.4]]], "duration": [31.26, 20.08]} \ No newline at end of file diff --git a/annotations_1/G7gklW3Xbn8_filtered.json b/annotations_1/G7gklW3Xbn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4347b0e7f3c186b87897503dc0c1318131ba5be --- /dev/null +++ b/annotations_1/G7gklW3Xbn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.39], [10.0, 15.7], [16.0, 16.87], [18.0, 28.17], [29.0, 35.28], [40.0, 48.02], [49.0, 49.59], [50.0, 53.27], [58.0, 58.28], [62.0, 63.59], [66.0, 67.04], [71.0, 72.3], [82.0, 83.83], [85.0, 84.54], [85.0, 97.41], [98.0, 101.14], [115.0, 115.99], [117.0, 119.77], [123.0, 129.98], [131.0, 138.64], [139.0, 140.97], [143.0, 168.24]], "keep_status": [false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [98.1, 42.79, 0.0, 38.86, 33.63, 35.52, 0.0, 39.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 48.91, 0.0, 69.88, 33.8, 32.03, 0.0, 30.72], "audiomae_on_audioset": [null, [["music", 27.05], ["speech", 7.73], ["throbbing", 5.89]], null, [["music", 39.52], ["speech", 19.39], ["buzz", 4.94]], [["throbbing", 20.99], ["cattle, bovinae", 20.83], ["music", 17.58]], [["music", 61.23], ["throbbing", 17.54], ["hum", 8.6]], null, [["music", 57.04], ["didgeridoo", 11.63], ["speech", 5.02]], null, null, null, null, null, null, null, [["music", 42.38], ["synthesizer", 7.69], ["throbbing", 7.0]], null, null, [["music", 52.99], ["throbbing", 13.37], ["didgeridoo", 5.64]], [["music", 43.34], ["throbbing", 23.99], ["hum", 8.18]], null, [["music", 66.28], ["speech", 6.24], ["electronic music", 3.8]]], "duration": [4.39, 5.7, 0.87, 10.17, 6.28, 8.02, 0.59, 3.27, 0.28, 1.59, 1.04, 1.3, 1.83, -0.46, 12.41, 3.14, 0.99, 2.77, 6.98, 7.64, 1.97, 25.24]} \ No newline at end of file diff --git a/annotations_1/G8FhdcsVB_o_filtered.json b/annotations_1/G8FhdcsVB_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/G8FhdcsVB_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/G8_ch6wsWjs_filtered.json b/annotations_1/G8_ch6wsWjs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd60f226b315bdd9d418ce6df54c0e8639e082a5 --- /dev/null +++ b/annotations_1/G8_ch6wsWjs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.61], [16.0, 63.76]], "keep_status": [false, false], "silence_prob": [71.72, 0.0], "audiomae_on_audioset": [null, null], "duration": [9.61, 47.76]} \ No newline at end of file diff --git a/annotations_1/G8_iVf44j-s_filtered.json b/annotations_1/G8_iVf44j-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b6a6debc5e3ef6b21faa7c03660f5afb2b0c83c --- /dev/null +++ b/annotations_1/G8_iVf44j-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 48.71], [50.0, 51.71], [52.0, 52.17], [52.0, 52.41], [53.0, 56.78], [60.0, 71.63], [72.0, 72.17], [75.0, 87.64], [91.0, 92.03], [93.0, 94.04], [97.0, 97.98], [99.0, 124.16], [130.0, 130.33]], "keep_status": [true, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [32.51, 0.0, 0.0, 0.0, 90.43, 31.61, 0.0, 30.23, 0.0, 0.0, 0.0, 29.92, 0.0], "audiomae_on_audioset": [[["music", 37.01], ["noise", 13.8], ["buzz", 11.46]], null, null, null, null, [["music", 61.81], ["animal", 3.87], ["speech", 2.63]], null, [["fly, housefly", 30.08], ["insect", 10.63], ["hum", 7.42]], null, null, null, [["hum", 33.9], ["music", 24.16], ["mains hum", 13.15]], null], "duration": [19.71, 1.71, 0.17, 0.41, 3.78, 11.63, 0.17, 12.64, 1.03, 1.04, 0.98, 25.16, 0.33]} \ No newline at end of file diff --git a/annotations_1/G8r48HzrYHE_filtered.json b/annotations_1/G8r48HzrYHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecd950ae8a0b0471ade395588e5e2da6c8d8d058 --- /dev/null +++ b/annotations_1/G8r48HzrYHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [5.0, 5.36], [8.0, 8.68], [12.0, 14.13], [15.0, 15.74], [16.0, 16.9], [19.0, 19.87], [20.0, 22.59], [23.0, 24.04], [30.0, 31.23], [32.0, 32.8], [35.0, 35.63], [37.0, 36.93], [38.0, 38.82], [41.0, 40.98], [53.0, 54.68], [56.0, 56.98], [61.0, 64.66], [70.0, 70.5], [72.0, 73.3], [74.0, 73.72], [76.0, 76.65], [78.0, 80.82], [81.0, 82.0], [85.0, 85.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 78.89, 0.0, 0.0, 0.0, 51.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.84, 0.0, 0.0, 0.0, 0.0, 37.31, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 93.33], ["electronic music", 0.75], ["musical instrument", 0.65]], null, null, null, null, [["music", 35.92], ["didgeridoo", 15.51], ["musical instrument", 5.34]], null, null], "duration": [0.52, 0.36, 0.68, 2.13, 0.74, 0.9, 0.87, 2.59, 1.04, 1.23, 0.8, 0.63, -0.07, 0.82, -0.02, 1.68, 0.98, 3.66, 0.5, 1.3, -0.28, 0.65, 2.82, 1.0, 0.73]} \ No newline at end of file diff --git a/annotations_1/G9D_0pXaM68_filtered.json b/annotations_1/G9D_0pXaM68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49a9966bf267cb4ff5d4ff2e04662fe609727f21 --- /dev/null +++ b/annotations_1/G9D_0pXaM68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 21.52], [31.0, 36.29], [39.0, 39.51], [42.0, 43.04], [44.0, 49.03], [54.0, 54.3], [57.0, 61.5], [64.0, 64.81], [68.0, 68.93], [76.0, 77.16], [78.0, 78.98], [80.0, 80.74], [101.0, 100.85], [101.0, 101.46], [102.0, 107.89], [109.0, 119.11]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [36.9, 39.21, 0.0, 0.0, 39.02, 0.0, 41.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.8, 36.76], "audiomae_on_audioset": [[["music", 60.87], ["psychedelic rock", 2.64], ["skidding", 2.4]], [["music", 23.8], ["speech", 22.64], ["cacophony", 5.76]], null, null, [["music", 81.26], ["rock and roll", 2.13], ["trombone", 1.36]], null, [["music", 78.0], ["speech", 5.86], ["brass instrument", 0.94]], null, null, null, null, null, null, null, [["music", 50.15], ["speech", 14.47], ["cattle, bovinae", 2.01]], [["music", 22.78], ["moo", 18.54], ["cattle, bovinae", 15.51]]], "duration": [12.52, 5.29, 0.51, 1.04, 5.03, 0.3, 4.5, 0.81, 0.93, 1.16, 0.98, 0.74, -0.15, 0.46, 5.89, 10.11]} \ No newline at end of file diff --git a/annotations_1/GAozArqKtGQ_filtered.json b/annotations_1/GAozArqKtGQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75fac7465151461fd651a54f0ab67e225d58c586 --- /dev/null +++ b/annotations_1/GAozArqKtGQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.86], [22.0, 23.23], [27.0, 26.84], [29.0, 31.92], [33.0, 38.26], [39.0, 51.6], [53.0, 113.34]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 57.17, 34.66, 30.41, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 47.06], ["boing", 16.93], ["speech", 11.42]], [["boing", 70.84], ["music", 14.96], ["whack, thwack", 2.81]], null], "duration": [-0.14, 1.23, -0.16, 2.92, 5.26, 12.6, 60.34]} \ No newline at end of file diff --git a/annotations_1/GBu5QE-EsSg_filtered.json b/annotations_1/GBu5QE-EsSg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..694f34bc6c18bbc89938de36851e0597056924dc --- /dev/null +++ b/annotations_1/GBu5QE-EsSg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 27.31], [28.0, 29.73], [30.0, 32.37], [33.0, 33.2], [34.0, 35.46], [39.0, 41.3], [42.0, 45.82], [47.0, 48.32], [50.0, 51.36], [53.0, 54.14], [56.0, 57.2], [58.0, 65.26], [66.0, 68.64], [70.0, 70.29], [73.0, 73.45], [76.0, 82.9], [83.0, 85.16], [86.0, 88.21], [89.0, 89.33], [92.0, 98.76], [100.0, 100.25], [102.0, 106.88], [107.0, 133.1], [133.0, 143.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.11, 0.0, 85.72, 0.0, 0.0, 99.8, 61.57, 0.0, 0.0, 0.0, 0.0, 67.89, 90.43, 0.0, 0.0, 57.01, 84.62, 73.36, 0.0, 91.64, 0.0, 79.07, 68.15, 91.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.31, 1.73, 2.37, 0.2, 1.46, 2.3, 3.82, 1.32, 1.36, 1.14, 1.2, 7.26, 2.64, 0.29, 0.45, 6.9, 2.16, 2.21, 0.33, 6.76, 0.25, 4.88, 26.1, 10.58]} \ No newline at end of file diff --git a/annotations_1/GC6ksHacdXI_filtered.json b/annotations_1/GC6ksHacdXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52703017e5f5278697a40a8020b966a0bd962cd9 --- /dev/null +++ b/annotations_1/GC6ksHacdXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.66], [14.0, 19.23], [24.0, 49.08], [50.0, 51.61], [53.0, 54.28], [57.0, 64.74], [65.0, 65.67]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [0.0, 47.7, 30.58, 0.0, 0.0, 36.86, 0.0], "audiomae_on_audioset": [null, [["music", 26.59], ["whale vocalization", 17.63], ["effects unit", 9.0]], [["music", 42.32], ["didgeridoo", 37.69], ["theremin", 3.37]], null, null, [["music", 38.81], ["speech", 32.38], ["speech synthesizer", 3.33]], null], "duration": [0.66, 5.23, 25.08, 1.61, 1.28, 7.74, 0.67]} \ No newline at end of file diff --git a/annotations_1/GC8KstVPxPM_filtered.json b/annotations_1/GC8KstVPxPM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b64e0fbb5d9ffa053bb088b10e03eac34a721bb8 --- /dev/null +++ b/annotations_1/GC8KstVPxPM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.51], [6.0, 9.29], [15.0, 15.15], [18.0, 21.57], [23.0, 28.24], [32.0, 32.43], [35.0, 34.94], [44.0, 44.78], [57.0, 58.38], [59.0, 61.97], [64.0, 64.49], [66.0, 73.53], [92.0, 95.3], [104.0, 105.07], [106.0, 107.23], [108.0, 111.42], [114.0, 115.48], [116.0, 115.59], [116.0, 118.57], [123.0, 124.16], [125.0, 127.25], [128.0, 128.29], [132.0, 132.54]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.36, 49.82, 0.0, 42.39, 51.34, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 33.28, 33.46, 0.0, 0.0, 69.34, 0.0, 0.0, 32.72, 0.0, 97.83, 0.0, 0.0], "audiomae_on_audioset": [[["sheep", 20.76], ["speech", 15.18], ["frog", 11.6]], [["speech", 24.19], ["electric shaver, electric razor", 10.1], ["hum", 9.92]], null, [["speech", 15.16], ["cattle, bovinae", 7.93], ["boing", 5.96]], null, null, null, null, null, null, null, [["music", 53.58], ["speech", 7.96], ["violin, fiddle", 3.4]], [["speech", 51.02], ["cattle, bovinae", 14.82], ["moo", 11.23]], null, null, null, null, null, [["speech", 75.21], ["wail, moan", 8.69], ["inside, small room", 1.46]], null, null, null, null], "duration": [3.51, 3.29, 0.15, 3.57, 5.24, 0.43, -0.06, 0.78, 1.38, 2.97, 0.49, 7.53, 3.3, 1.07, 1.23, 3.42, 1.48, -0.41, 2.57, 1.16, 2.25, 0.29, 0.54]} \ No newline at end of file diff --git a/annotations_1/GC9MkHzTnRg_filtered.json b/annotations_1/GC9MkHzTnRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38a9e2d667b7fe257b34290185a53f1d2bb441e2 --- /dev/null +++ b/annotations_1/GC9MkHzTnRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.37], [8.0, 12.48], [14.0, 16.07], [18.0, 19.3], [20.0, 21.05], [23.0, 25.84], [26.0, 31.29], [32.0, 34.21], [35.0, 38.04], [40.0, 46.65], [48.0, 48.91], [49.0, 50.31], [51.0, 52.86], [53.0, 55.8], [57.0, 59.41], [61.0, 89.24], [90.0, 98.05], [99.0, 143.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.59, 99.93, 98.27, 0.0, 0.0, 99.98, 98.73, 99.96, 100.0, 98.93, 0.0, 0.0, 0.0, 78.38, 88.46, 92.48, 89.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.37, 4.48, 2.07, 1.3, 1.05, 2.84, 5.29, 2.21, 3.04, 6.65, 0.91, 1.31, 1.86, 2.8, 2.41, 28.24, 8.05, 44.75]} \ No newline at end of file diff --git a/annotations_1/GCSbGFMWzC4_filtered.json b/annotations_1/GCSbGFMWzC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2084056f277a5c400fc14410b19c220a2e324f71 --- /dev/null +++ b/annotations_1/GCSbGFMWzC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[113.0, 117.95], [118.0, 133.39], [136.0, 154.99], [159.0, 169.26]], "keep_status": [false, true, true, true], "silence_prob": [29.3, 31.96, 35.63, 37.16], "audiomae_on_audioset": [[["music", 62.25], ["theremin", 11.61], ["cacophony", 2.29]], [["hum", 30.6], ["music", 19.75], ["mains hum", 16.26]], [["music", 47.6], ["brass instrument", 10.71], ["speech", 8.37]], [["mains hum", 20.74], ["hum", 16.28], ["speech", 14.11]]], "duration": [4.95, 15.39, 18.99, 10.26]} \ No newline at end of file diff --git a/annotations_1/GCc99Gh-IEM_filtered.json b/annotations_1/GCc99Gh-IEM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82695f9b625b2f7c2bcdf0b61ae47d5795ba0fc1 --- /dev/null +++ b/annotations_1/GCc99Gh-IEM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.71], [6.0, 20.48], [24.0, 25.08], [26.0, 27.26], [29.0, 30.08], [31.0, 32.81], [33.0, 33.89], [38.0, 39.16], [40.0, 40.63], [42.0, 45.98], [47.0, 48.66], [49.0, 50.16], [52.0, 53.15], [54.0, 99.72], [101.0, 103.49], [107.0, 109.24], [110.0, 111.32], [113.0, 113.04], [117.0, 117.93], [120.0, 120.99], [123.0, 124.46]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 48.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 0.0, 0.0, 0.0, 0.0, 44.4, 46.79, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["bouncing", 20.87], ["radio", 9.07], ["animal", 4.71]], null, null, null, null, null, null, null, null, null, null, null, null, [["wheeze", 39.99], ["throat clearing", 19.15], ["cough", 11.65]], [["sine wave", 22.61], ["chirp tone", 12.35], ["domestic animals, pets", 8.39]], null, null, null, null, null], "duration": [0.71, 14.48, 1.08, 1.26, 1.08, 1.81, 0.89, 1.16, 0.63, 3.98, 1.66, 1.16, 1.15, 45.72, 2.49, 2.24, 1.32, 0.04, 0.93, 0.99, 1.46]} \ No newline at end of file diff --git a/annotations_1/GEAh4nF90iw_filtered.json b/annotations_1/GEAh4nF90iw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ddfcc2d87eb303044d9c6ceecd6a0ee4463b72b --- /dev/null +++ b/annotations_1/GEAh4nF90iw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [5.0, 6.39], [9.0, 11.53], [13.0, 16.24], [26.0, 27.03], [29.0, 30.03], [38.0, 39.77], [57.0, 57.35], [58.0, 58.4], [64.0, 64.5], [72.0, 74.8], [78.0, 78.41], [91.0, 91.59], [96.0, 99.4], [103.0, 104.23], [105.0, 106.95], [107.0, 108.48], [110.0, 109.59], [111.0, 111.82], [114.0, 118.98], [119.0, 122.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 98.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.2, 0.0, 0.0, 65.09, 0.0, 0.0, 0.0, 0.0, 0.0, 48.69, 69.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 59.9], ["whale vocalization", 16.74], ["mains hum", 6.28]], null], "duration": [1.38, 1.39, 2.53, 3.24, 1.03, 1.03, 1.77, 0.35, 0.4, 0.5, 2.8, 0.41, 0.59, 3.4, 1.23, 1.95, 1.48, -0.41, 0.82, 4.98, 3.22]} \ No newline at end of file diff --git a/annotations_1/GEB8rnOevpY_filtered.json b/annotations_1/GEB8rnOevpY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aed3e7f0c8990fa90501d1fc3ec351831c35ae8f --- /dev/null +++ b/annotations_1/GEB8rnOevpY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.18], [6.0, 6.29], [8.0, 9.37], [15.0, 15.53], [18.0, 20.19], [21.0, 21.44], [22.0, 26.86], [30.0, 33.32], [35.0, 35.77], [37.0, 40.04], [48.0, 48.49], [51.0, 52.54], [54.0, 54.26], [56.0, 56.67], [58.0, 57.91], [63.0, 65.23], [71.0, 71.79], [73.0, 73.79], [74.0, 77.65], [78.0, 77.94], [85.0, 87.51], [100.0, 101.11], [109.0, 109.09], [116.0, 117.24], [120.0, 121.71], [124.0, 140.68], [141.0, 148.73], [150.0, 150.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.16, 0.0, 37.57, 37.36, 0.0, 47.78, 0.0, 0.0, 0.0, 0.0, 0.0, 32.66, 0.0, 0.0, 32.42, 0.0, 35.16, 0.0, 0.0, 0.0, 0.0, 46.36, 40.47, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 46.69], ["radio", 30.04], ["frog", 6.12]], null, [["noise", 49.46], ["sidetone", 16.38], ["radio", 11.12]], [["sidetone", 54.8], ["noise", 10.64], ["radio", 8.84]], null, [["noise", 71.15], ["hum", 7.16], ["sidetone", 3.57]], null, null, null, null, null, [["speech", 70.0], ["radio", 11.76], ["telephone dialing, dtmf", 2.59]], null, null, [["radio", 50.9], ["speech", 23.07], ["sidetone", 21.39]], null, [["clang", 18.92], ["speech", 7.91], ["crackle", 6.47]], null, null, null, null, [["hum", 24.6], ["mains hum", 21.56], ["noise", 15.9]], [["music", 49.73], ["theremin", 10.25], ["speech", 5.92]], null], "duration": [1.18, 0.29, 1.37, 0.53, 2.19, 0.44, 4.86, 3.32, 0.77, 3.04, 0.49, 1.54, 0.26, 0.67, -0.09, 2.23, 0.79, 0.79, 3.65, -0.06, 2.51, 1.11, 0.09, 1.24, 1.71, 16.68, 7.73, 0.79]} \ No newline at end of file diff --git a/annotations_1/GH-oJGZKmq8_filtered.json b/annotations_1/GH-oJGZKmq8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01eb14aa0596ecd68ec4872f104b8c36bcfb7008 --- /dev/null +++ b/annotations_1/GH-oJGZKmq8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.03], [15.0, 15.7], [16.0, 18.01], [36.0, 39.12], [39.0, 40.59], [41.0, 41.76], [45.0, 45.4], [48.0, 48.61], [64.0, 63.9], [68.0, 69.38], [71.0, 70.93], [72.0, 72.12], [78.0, 78.8], [82.0, 84.81], [85.0, 87.02], [94.0, 94.14], [103.0, 104.3], [111.0, 113.44], [122.0, 122.32], [126.0, 126.66], [128.0, 127.97], [134.0, 134.11], [135.0, 135.57], [139.0, 139.8], [143.0, 143.23], [145.0, 145.07], [147.0, 148.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 88.64, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 95.23, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 0.7, 2.01, 3.12, 1.59, 0.76, 0.4, 0.61, -0.1, 1.38, -0.07, 0.12, 0.8, 2.81, 2.02, 0.14, 1.3, 2.44, 0.32, 0.66, -0.03, 0.11, 0.57, 0.8, 0.23, 0.07, 1.22]} \ No newline at end of file diff --git a/annotations_1/GHZSYBkKec4_filtered.json b/annotations_1/GHZSYBkKec4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f4bbd6c9b6cc70e7bca8731cdea68108e514e09 --- /dev/null +++ b/annotations_1/GHZSYBkKec4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.0], [13.0, 20.04], [22.0, 22.15], [24.0, 24.88], [28.0, 30.06], [33.0, 33.59], [35.0, 38.99], [44.0, 43.88], [44.0, 86.41], [93.0, 93.41], [108.0, 136.21], [142.0, 142.87], [144.0, 144.83], [146.0, 147.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.78, 35.2, 0.0, 0.0, 44.23, 0.0, 34.0, 0.0, 0.0, 0.0, 29.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 82.81], ["electronic music", 2.77], ["drum machine", 1.74]], [["music", 62.74], ["synthesizer", 6.48], ["electronic music", 4.65]], null, null, [["speech", 45.25], ["sidetone", 29.9], ["sine wave", 3.26]], null, [["moo", 44.24], ["cattle, bovinae", 33.28], ["livestock, farm animals, working animals", 12.19]], null, null, null, [["music", 62.27], ["didgeridoo", 8.56], ["buzz", 8.49]], null, null, null], "duration": [4.0, 7.04, 0.15, 0.88, 2.06, 0.59, 3.99, -0.12, 42.41, 0.41, 28.21, 0.87, 0.83, 1.95]} \ No newline at end of file diff --git a/annotations_1/GHpQUOP8vcE_filtered.json b/annotations_1/GHpQUOP8vcE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b61a32bcb5373d11a83b25d13002e43f8ca50b0 --- /dev/null +++ b/annotations_1/GHpQUOP8vcE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.88], [10.0, 11.1], [12.0, 13.88], [16.0, 16.28], [19.0, 19.63], [27.0, 37.67], [39.0, 40.39], [41.0, 42.11], [44.0, 45.45], [48.0, 50.84], [53.0, 53.81], [58.0, 58.62], [61.0, 62.18], [69.0, 71.49], [72.0, 71.98], [74.0, 75.41], [76.0, 76.18], [78.0, 78.17], [79.0, 80.69], [82.0, 82.48], [86.0, 88.6], [90.0, 92.72], [96.0, 96.69], [104.0, 104.97], [110.0, 110.88], [113.0, 113.71], [118.0, 118.1], [120.0, 122.74], [125.0, 125.22], [127.0, 127.94], [130.0, 130.25], [133.0, 137.05], [140.0, 140.58]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.34, 0.0, 0.0, 0.0, 54.23, 0.0, 0.0, 0.0, 34.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.68, 35.08, 0.0, 0.0, 0.0, 0.0, 0.0, 33.13, 0.0, 0.0, 0.0, 34.11, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["clang", 21.93], ["music", 11.23], ["hum", 9.76]], null, null, null, null, null, null, null, [["music", 43.81], ["theremin", 33.71], ["speech", 7.88]], null, null, null, null, null, null, [["music", 45.33], ["musical instrument", 9.43], ["theremin", 2.39]], [["theremin", 25.62], ["music", 23.08], ["synthesizer", 5.67]], null, null, null, null, null, [["theremin", 57.58], ["music", 30.8], ["musical instrument", 2.12]], null, null, null, [["music", 55.85], ["musical instrument", 9.91], ["guitar", 2.93]], null], "duration": [0.88, 1.1, 1.88, 0.28, 0.63, 10.67, 1.39, 1.11, 1.45, 2.84, 0.81, 0.62, 1.18, 2.49, -0.02, 1.41, 0.18, 0.17, 1.69, 0.48, 2.6, 2.72, 0.69, 0.97, 0.88, 0.71, 0.1, 2.74, 0.22, 0.94, 0.25, 4.05, 0.58]} \ No newline at end of file diff --git a/annotations_1/GI67NK5cmxk_filtered.json b/annotations_1/GI67NK5cmxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..083b00b952bc0f02d85922027ebc11f0542b4ff5 --- /dev/null +++ b/annotations_1/GI67NK5cmxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.05], [7.0, 7.3], [8.0, 10.76], [13.0, 13.12], [15.0, 15.21], [16.0, 16.97], [18.0, 18.45], [21.0, 22.08], [24.0, 24.78], [26.0, 26.86], [27.0, 27.85], [28.0, 28.88], [30.0, 30.74], [35.0, 35.24], [38.0, 39.02], [43.0, 44.09], [47.0, 48.29], [52.0, 53.89], [55.0, 58.09], [59.0, 60.32], [61.0, 62.61], [64.0, 64.88], [65.0, 66.51], [68.0, 70.41], [72.0, 81.28], [82.0, 84.15], [86.0, 96.11], [104.0, 107.18], [108.0, 108.45], [110.0, 118.76], [120.0, 120.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [100.0, 0.0, 34.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 99.71, 82.97, 35.77, 37.89, 64.97, 0.0, 47.58, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 70.94], ["dial tone", 9.44], ["speech", 8.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 53.6], ["chirp tone", 10.17], ["tuning fork", 8.58]], [["music", 27.81], ["hum", 9.76], ["synthesizer", 9.09]], null, null, [["music", 49.84], ["wind instrument, woodwind instrument", 23.68], ["theremin", 7.71]], null], "duration": [3.05, 0.3, 2.76, 0.12, 0.21, 0.97, 0.45, 1.08, 0.78, 0.86, 0.85, 0.88, 0.74, 0.24, 1.02, 1.09, 1.29, 1.89, 3.09, 1.32, 1.61, 0.88, 1.51, 2.41, 9.28, 2.15, 10.11, 3.18, 0.45, 8.76, 0.58]} \ No newline at end of file diff --git a/annotations_1/GIASYqV_Xds_filtered.json b/annotations_1/GIASYqV_Xds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43100bc5fa664064f0a75769bf5c4c2fa1b109a1 --- /dev/null +++ b/annotations_1/GIASYqV_Xds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.26], [5.0, 5.29], [5.0, 9.71], [13.0, 19.04], [20.0, 20.7], [25.0, 32.76], [34.0, 38.35], [41.0, 47.53], [55.0, 77.5], [80.0, 85.26], [87.0, 101.46], [103.0, 103.54]], "keep_status": [false, false, false, false, false, true, true, true, true, false, false, false], "silence_prob": [94.52, 0.0, 44.29, 33.3, 0.0, 32.63, 31.3, 39.44, 31.68, 99.82, 99.97, 0.0], "audiomae_on_audioset": [null, null, [["speech", 66.64], ["explosion", 7.64], ["burst, pop", 4.54]], [["didgeridoo", 54.92], ["music", 35.34], ["musical instrument", 4.45]], null, [["speech", 46.74], ["fly, housefly", 6.52], ["music", 5.24]], [["noise", 15.01], ["whale vocalization", 8.76], ["synthesizer", 8.57]], [["music", 43.93], ["didgeridoo", 10.28], ["speech", 9.67]], [["music", 45.82], ["vehicle", 10.87], ["musical instrument", 6.61]], null, null, null], "duration": [2.26, 0.29, 4.71, 6.04, 0.7, 7.76, 4.35, 6.53, 22.5, 5.26, 14.46, 0.54]} \ No newline at end of file diff --git a/annotations_1/GJ0-xGnrjBU_filtered.json b/annotations_1/GJ0-xGnrjBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f286db2557f737a2775ec7b853fa480d3ca7da51 --- /dev/null +++ b/annotations_1/GJ0-xGnrjBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.87], [34.0, 35.6], [36.0, 35.82], [36.0, 36.09], [45.0, 48.57], [56.0, 59.95], [62.0, 62.78], [64.0, 63.85], [68.0, 68.22], [72.0, 76.17], [80.0, 94.93], [97.0, 96.94], [97.0, 97.06], [97.0, 97.31], [97.0, 98.37]], "keep_status": [false, false, false, false, true, true, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.8, 38.1, 0.0, 0.0, 0.0, 30.23, 31.16, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 22.65], ["cattle, bovinae", 19.79], ["moo", 11.61]], [["music", 43.58], ["throbbing", 11.53], ["electronic music", 5.52]], null, null, null, [["speech", 43.59], ["motorcycle", 6.67], ["buzz", 5.31]], [["speech", 44.96], ["vehicle", 12.72], ["fart", 6.33]], null, null, null, null], "duration": [0.87, 1.6, -0.18, 0.09, 3.57, 3.95, 0.78, -0.15, 0.22, 4.17, 14.93, -0.06, 0.06, 0.31, 1.37]} \ No newline at end of file diff --git a/annotations_1/GJleW4TCQM0_filtered.json b/annotations_1/GJleW4TCQM0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65e7b7472bfd42da1c520a64355bb4b012c093dd --- /dev/null +++ b/annotations_1/GJleW4TCQM0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 22.11], [23.0, 30.13], [31.0, 41.81], [47.0, 46.68], [49.0, 49.79], [51.0, 52.76], [61.0, 65.45], [80.0, 90.49], [91.0, 91.45], [97.0, 104.36], [107.0, 114.05], [135.0, 175.22]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [42.08, 34.18, 32.07, 0.0, 0.0, 0.0, 31.67, 32.0, 0.0, 32.04, 32.84, 0.0], "audiomae_on_audioset": [[["hum", 44.68], ["throbbing", 22.38], ["music", 16.23]], [["music", 55.55], ["didgeridoo", 25.03], ["hum", 7.17]], [["music", 45.46], ["hum", 13.63], ["throbbing", 8.86]], null, null, null, [["throbbing", 39.96], ["hum", 37.37], ["music", 10.94]], [["music", 39.44], ["throbbing", 26.28], ["hum", 14.57]], null, [["music", 77.99], ["synthetic singing", 2.69], ["male singing", 1.22]], [["music", 54.52], ["theremin", 7.54], ["didgeridoo", 5.26]], null], "duration": [17.11, 7.13, 10.81, -0.32, 0.79, 1.76, 4.45, 10.49, 0.45, 7.36, 7.05, 40.22]} \ No newline at end of file diff --git a/annotations_1/GJwsVhQHggU_filtered.json b/annotations_1/GJwsVhQHggU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4532438e1b2c47b0fb76ba0bd08e35be3528b226 --- /dev/null +++ b/annotations_1/GJwsVhQHggU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.18], [6.0, 6.89], [9.0, 11.15], [12.0, 14.07], [16.0, 16.33], [18.0, 19.68], [21.0, 21.37], [25.0, 26.01], [27.0, 27.92], [29.0, 30.0], [34.0, 42.8], [46.0, 47.14], [48.0, 57.45], [59.0, 67.12], [68.0, 81.48], [83.0, 83.88], [86.0, 139.7], [142.0, 143.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [59.24, 0.0, 80.46, 82.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.29, 0.0, 40.17, 39.93, 29.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 31.62], ["mains hum", 23.29], ["music", 20.48]], [["hum", 47.7], ["mains hum", 21.41], ["throbbing", 11.58]], [["speech", 48.11], ["music", 15.06], ["whack, thwack", 5.51]], null, null, null], "duration": [2.18, 0.89, 2.15, 2.07, 0.33, 1.68, 0.37, 1.01, 0.92, 1.0, 8.8, 1.14, 9.45, 8.12, 13.48, 0.88, 53.7, 1.41]} \ No newline at end of file diff --git a/annotations_1/GKuPSf9P3tw_filtered.json b/annotations_1/GKuPSf9P3tw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f519cafbe11162c07fb1eeca1cc27293a9687a1 --- /dev/null +++ b/annotations_1/GKuPSf9P3tw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.83], [7.0, 19.4], [22.0, 42.13], [44.0, 56.35], [59.0, 62.85], [64.0, 65.03], [66.0, 78.17], [83.0, 83.13], [85.0, 85.95], [89.0, 99.35], [101.0, 129.95], [133.0, 135.36], [136.0, 153.91], [155.0, 157.52]], "keep_status": [false, true, true, false, true, false, true, false, false, false, false, true, true, true], "silence_prob": [0.0, 29.19, 29.88, 33.3, 35.37, 0.0, 30.33, 0.0, 0.0, 29.89, 29.87, 29.04, 28.85, 34.15], "audiomae_on_audioset": [null, [["music", 38.84], ["livestock, farm animals, working animals", 13.97], ["motorcycle", 7.05]], [["music", 30.97], ["throbbing", 16.99], ["speech", 11.3]], [["music", 61.54], ["hum", 10.0], ["mains hum", 4.18]], [["didgeridoo", 29.77], ["foghorn", 10.32], ["music", 10.21]], null, [["animal", 39.91], ["roaring cats (lions, tigers)", 12.35], ["wild animals", 8.99]], null, null, [["buzz", 64.64], ["music", 22.57], ["fly, housefly", 1.95]], [["music", 58.93], ["smash, crash", 14.87], ["buzz", 6.94]], [["music", 13.67], ["buzz", 9.08], ["noise", 5.61]], [["vehicle", 37.04], ["car", 15.96], ["speech", 8.29]], [["music", 23.07], ["speech", 6.67], ["vehicle", 5.99]]], "duration": [0.83, 12.4, 20.13, 12.35, 3.85, 1.03, 12.17, 0.13, 0.95, 10.35, 28.95, 2.36, 17.91, 2.52]} \ No newline at end of file diff --git a/annotations_1/GLeGjBbLSJI_filtered.json b/annotations_1/GLeGjBbLSJI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6031015791914d25c71bbc53b478e357c18c3a27 --- /dev/null +++ b/annotations_1/GLeGjBbLSJI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.97], [3.0, 3.23], [7.0, 8.63], [10.0, 10.29], [12.0, 13.1], [14.0, 14.32], [20.0, 21.12], [31.0, 31.51], [32.0, 41.25], [43.0, 44.78], [45.0, 53.1], [56.0, 81.75], [84.0, 85.23], [86.0, 88.32], [92.0, 92.64], [94.0, 96.42], [97.0, 104.4], [108.0, 108.43], [111.0, 113.75], [115.0, 115.52], [119.0, 119.55], [128.0, 128.83]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.57, 0.0, 44.09, 31.43, 0.0, 34.34, 0.0, 33.47, 34.24, 0.0, 35.28, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 40.24], ["sidetone", 12.25], ["music", 7.71]], null, [["hum", 50.36], ["mains hum", 14.06], ["music", 12.36]], [["whack, thwack", 36.47], ["groan", 22.84], ["music", 14.04]], null, [["fly, housefly", 22.64], ["insect", 16.97], ["music", 7.9]], null, [["music", 26.19], ["fly, housefly", 11.32], ["speech", 8.08]], [["hum", 49.77], ["mains hum", 23.25], ["throbbing", 11.91]], null, [["hum", 17.88], ["rumble", 13.46], ["speech", 10.6]], null, null, null], "duration": [-0.03, 0.23, 1.63, 0.29, 1.1, 0.32, 1.12, 0.51, 9.25, 1.78, 8.1, 25.75, 1.23, 2.32, 0.64, 2.42, 7.4, 0.43, 2.75, 0.52, 0.55, 0.83]} \ No newline at end of file diff --git a/annotations_1/GNAJWwqr8cM_filtered.json b/annotations_1/GNAJWwqr8cM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfe7ea7d513902a0ff7f9ba9b96e43d03bcbf223 --- /dev/null +++ b/annotations_1/GNAJWwqr8cM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.28], [14.0, 24.44], [28.0, 29.05], [31.0, 32.1], [35.0, 35.95], [38.0, 38.43], [40.0, 40.63], [41.0, 42.9], [46.0, 48.34], [54.0, 54.72], [57.0, 57.64], [59.0, 60.66], [64.0, 64.71], [69.0, 70.56], [74.0, 75.54], [77.0, 78.63], [80.0, 81.36], [83.0, 84.5], [86.0, 86.97], [89.0, 90.26], [92.0, 92.75], [95.0, 97.68], [103.0, 103.42], [105.0, 105.9], [111.0, 111.64], [114.0, 114.86], [123.0, 124.19], [127.0, 127.38], [134.0, 134.59], [143.0, 147.95], [167.0, 168.0], [170.0, 171.68], [174.0, 176.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.87, 0.0, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.13], ["boing", 23.53], ["fart", 5.48]], null, null, null], "duration": [0.28, 10.44, 1.05, 1.1, 0.95, 0.43, 0.63, 1.9, 2.34, 0.72, 0.64, 1.66, 0.71, 1.56, 1.54, 1.63, 1.36, 1.5, 0.97, 1.26, 0.75, 2.68, 0.42, 0.9, 0.64, 0.86, 1.19, 0.38, 0.59, 4.95, 1.0, 1.68, 2.66]} \ No newline at end of file diff --git a/annotations_1/GNSkaIuTNao_filtered.json b/annotations_1/GNSkaIuTNao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86a8474ad8a9c3cf90ebb0467e1492b294c62bb7 --- /dev/null +++ b/annotations_1/GNSkaIuTNao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.4], [7.0, 7.55], [24.0, 24.87], [37.0, 37.49], [41.0, 42.92], [50.0, 51.71], [53.0, 53.74], [54.0, 56.07], [59.0, 59.12], [95.0, 96.18]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.94, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 39.09], ["music", 14.21], ["hum", 3.22]], null, null], "duration": [1.4, 0.55, 0.87, 0.49, 1.92, 1.71, 0.74, 2.07, 0.12, 1.18]} \ No newline at end of file diff --git a/annotations_1/GOwehDo9xYQ_filtered.json b/annotations_1/GOwehDo9xYQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc97329d5014435dbe1d5ca1b9e361dd86e6290a --- /dev/null +++ b/annotations_1/GOwehDo9xYQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.1], [10.0, 11.94], [26.0, 26.32], [27.0, 27.01], [27.0, 27.33], [27.0, 27.5], [38.0, 39.18], [47.0, 50.13], [51.0, 56.51], [64.0, 64.05], [66.0, 65.7], [66.0, 69.33], [73.0, 74.33], [75.0, 79.93], [81.0, 81.46], [84.0, 87.45], [89.0, 94.37], [94.0, 94.44], [97.0, 98.37], [100.0, 101.82], [103.0, 103.76]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.1, 30.26, 0.0, 0.0, 28.99, 0.0, 37.9, 0.0, 40.82, 33.33, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 54.41], ["music", 13.13], ["didgeridoo", 6.26]], [["whale vocalization", 24.97], ["speech", 23.51], ["music", 8.1]], null, null, [["speech", 39.88], ["vehicle", 28.54], ["car", 6.71]], null, [["speech", 36.31], ["music", 19.99], ["hum", 14.03]], null, [["speech", 25.14], ["cattle, bovinae", 15.15], ["moo", 12.03]], [["cattle, bovinae", 36.74], ["moo", 33.1], ["livestock, farm animals, working animals", 16.05]], null, null, null, null], "duration": [1.1, 1.94, 0.32, 0.01, 0.33, 0.5, 1.18, 3.13, 5.51, 0.05, -0.3, 3.33, 1.33, 4.93, 0.46, 3.45, 5.37, 0.44, 1.37, 1.82, 0.76]} \ No newline at end of file diff --git a/annotations_1/GP8HnRCjLGg_filtered.json b/annotations_1/GP8HnRCjLGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee0a4793ea92d819a7e3fe8067f872377cc045c3 --- /dev/null +++ b/annotations_1/GP8HnRCjLGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.73], [10.0, 10.4], [12.0, 13.8], [16.0, 16.63], [18.0, 19.3], [21.0, 24.75], [26.0, 26.22], [27.0, 33.02], [38.0, 57.84], [61.0, 80.55], [85.0, 86.17], [87.0, 88.53], [89.0, 99.84], [101.0, 102.78], [113.0, 116.21], [117.0, 117.68]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [54.97, 0.0, 0.0, 0.0, 0.0, 50.26, 0.0, 52.33, 52.68, 35.13, 0.0, 0.0, 35.13, 0.0, 31.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 38.92], ["ambient music", 20.12], ["mains hum", 9.09]], null, null, [["music", 67.54], ["speech", 8.58], ["hum", 2.86]], null, [["music", 39.41], ["didgeridoo", 10.61], ["throbbing", 7.4]], null], "duration": [6.73, 0.4, 1.8, 0.63, 1.3, 3.75, 0.22, 6.02, 19.84, 19.55, 1.17, 1.53, 10.84, 1.78, 3.21, 0.68]} \ No newline at end of file diff --git a/annotations_1/GQM4dSjjQuE_filtered.json b/annotations_1/GQM4dSjjQuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f0c9b0fb8ab5d819bad980e1bf4f758e124aabb --- /dev/null +++ b/annotations_1/GQM4dSjjQuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.03], [30.0, 31.99], [34.0, 37.07], [51.0, 54.11], [55.0, 59.44], [62.0, 67.51], [69.0, 77.85], [79.0, 131.4], [134.0, 149.94], [152.0, 154.45], [157.0, 163.0], [168.0, 169.35], [170.0, 171.64], [173.0, 174.46], [175.0, 176.49], [177.0, 189.11], [189.0, 189.14]], "keep_status": [false, false, true, false, true, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.81, 33.01, 34.93, 36.97, 31.81, 0.0, 33.08, 95.51, 81.71, 0.0, 0.0, 0.0, 0.0, 38.3, 0.0], "audiomae_on_audioset": [null, null, [["music", 42.6], ["speech", 8.35], ["didgeridoo", 4.44]], [["boing", 91.1], ["music", 2.23], ["speech", 1.74]], [["music", 36.45], ["throbbing", 22.94], ["breaking", 6.47]], [["music", 43.61], ["didgeridoo", 6.31], ["throbbing", 5.48]], [["fly, housefly", 64.33], ["insect", 9.61], ["speech", 6.94]], null, [["speech", 32.35], ["music", 24.62], ["hum", 12.02]], null, null, null, null, null, null, [["speech", 36.97], ["music", 31.24], ["theremin", 8.17]], null], "duration": [0.03, 1.99, 3.07, 3.11, 4.44, 5.51, 8.85, 52.4, 15.94, 2.45, 6.0, 1.35, 1.64, 1.46, 1.49, 12.11, 0.14]} \ No newline at end of file diff --git a/annotations_1/GQYCNF_zoDM_filtered.json b/annotations_1/GQYCNF_zoDM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef9e5164594bc92201a1edf966e5c2e6a743d6f --- /dev/null +++ b/annotations_1/GQYCNF_zoDM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.12], [12.0, 18.06], [21.0, 20.71], [24.0, 24.07], [28.0, 40.61], [50.0, 50.58], [54.0, 56.13], [76.0, 90.44]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [40.5, 33.5, 0.0, 0.0, 30.54, 0.0, 36.58, 30.77], "audiomae_on_audioset": [[["music", 33.04], ["hum", 31.68], ["mains hum", 13.25]], [["music", 34.06], ["mains hum", 19.73], ["hum", 18.49]], null, null, [["music", 30.13], ["hum", 19.64], ["mains hum", 8.96]], null, [["music", 47.0], ["throbbing", 29.76], ["hum", 7.94]], [["music", 58.88], ["speech", 9.75], ["boing", 4.73]]], "duration": [3.12, 6.06, -0.29, 0.07, 12.61, 0.58, 2.13, 14.44]} \ No newline at end of file diff --git a/annotations_1/GRADFiFVLJQ_filtered.json b/annotations_1/GRADFiFVLJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef6b271232c13bdd8d8a7538085759cf13af2b2f --- /dev/null +++ b/annotations_1/GRADFiFVLJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.63], [3.0, 11.72], [18.0, 34.52], [36.0, 47.63], [49.0, 49.28], [52.0, 56.17], [57.0, 57.05], [63.0, 63.17], [65.0, 65.69], [66.0, 68.1], [73.0, 89.83], [91.0, 93.77]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 39.64, 98.19, 64.07, 0.0, 35.95, 0.0, 0.0, 0.0, 33.28, 61.37, 38.94], "audiomae_on_audioset": [null, [["music", 46.82], ["musical instrument", 7.0], ["tap", 5.98]], null, null, null, [["wind instrument, woodwind instrument", 60.42], ["shofar", 6.87], ["music", 5.38]], null, null, null, [["music", 42.52], ["clarinet", 13.82], ["wind instrument, woodwind instrument", 13.21]], null, [["music", 36.26], ["brass instrument", 13.52], ["musical instrument", 11.04]]], "duration": [0.63, 8.72, 16.52, 11.63, 0.28, 4.17, 0.05, 0.17, 0.69, 2.1, 16.83, 2.77]} \ No newline at end of file diff --git a/annotations_1/GRrLWGMz5XY_filtered.json b/annotations_1/GRrLWGMz5XY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ed439f708c694e945141105c1e2ce68cd426148 --- /dev/null +++ b/annotations_1/GRrLWGMz5XY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.39], [8.0, 9.05], [12.0, 13.27], [15.0, 17.64], [20.0, 20.66], [26.0, 27.35], [30.0, 34.01], [37.0, 41.55], [44.0, 44.58], [45.0, 45.86], [47.0, 48.1], [49.0, 49.94], [52.0, 52.83], [53.0, 54.58], [58.0, 59.12], [60.0, 61.52], [62.0, 71.2], [73.0, 72.99], [73.0, 73.13], [76.0, 76.0], [79.0, 83.62], [85.0, 89.65], [90.0, 92.1], [93.0, 94.27], [96.0, 98.86], [101.0, 101.76], [102.0, 104.75], [105.0, 105.46], [107.0, 107.67], [108.0, 113.16], [116.0, 119.16], [120.0, 120.8], [122.0, 130.72], [132.0, 132.95], [135.0, 136.7], [139.0, 139.33], [142.0, 144.85], [147.0, 148.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.92, 0.0, 0.0, 63.1, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 0.0, 76.37, 81.53, 43.08, 0.0, 92.48, 0.0, 52.98, 0.0, 0.0, 56.33, 93.76, 0.0, 79.41, 0.0, 0.0, 0.0, 97.73, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 39.44], ["hum", 20.77], ["noise", 13.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 1.05, 1.27, 2.64, 0.66, 1.35, 4.01, 4.55, 0.58, 0.86, 1.1, 0.94, 0.83, 1.58, 1.12, 1.52, 9.2, -0.01, 0.13, 0.0, 4.62, 4.65, 2.1, 1.27, 2.86, 0.76, 2.75, 0.46, 0.67, 5.16, 3.16, 0.8, 8.72, 0.95, 1.7, 0.33, 2.85, 1.58]} \ No newline at end of file diff --git a/annotations_1/GSkbcI9F5ec_filtered.json b/annotations_1/GSkbcI9F5ec_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aef47dd343dc6c38a0cf0e3f438b29d28812325f --- /dev/null +++ b/annotations_1/GSkbcI9F5ec_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 41.12], [53.0, 54.18], [61.0, 61.87], [63.0, 64.61], [66.0, 66.14], [67.0, 66.9], [80.0, 80.3], [88.0, 88.1], [101.0, 103.64], [106.0, 106.46], [122.0, 122.08], [138.0, 138.62], [140.0, 158.45], [162.0, 162.16], [168.0, 181.14], [182.0, 214.81]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.78, 0.0, 0.0, 0.0, 35.47, 0.0, 30.75, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 27.1], ["music", 25.8], ["fly, housefly", 4.01]], null, null, null, [["music", 54.32], ["speech", 17.58], ["throbbing", 3.78]], null, [["music", 75.17], ["hum", 6.13], ["electronic music", 3.78]], null], "duration": [1.12, 1.18, 0.87, 1.61, 0.14, -0.1, 0.3, 0.1, 2.64, 0.46, 0.08, 0.62, 18.45, 0.16, 13.14, 32.81]} \ No newline at end of file diff --git a/annotations_1/GSrtUVzdt6M_filtered.json b/annotations_1/GSrtUVzdt6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6f50d6f0e2100dda5396b1d66c06fcc251705e2 --- /dev/null +++ b/annotations_1/GSrtUVzdt6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.33], [0.0, 0.36], [0.0, 8.5], [9.0, 10.56], [12.0, 12.87], [13.0, 17.78], [29.0, 34.21], [35.0, 89.33], [91.0, 91.22], [92.0, 110.24], [112.0, 111.64]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 30.51, 0.0, 0.0, 29.74, 29.43, 0.0, 0.0, 29.82, 0.0], "audiomae_on_audioset": [null, null, [["music", 31.42], ["rumble", 21.36], ["boom", 7.6]], null, null, [["vehicle", 40.93], ["car", 19.77], ["race car, auto racing", 16.86]], [["race car, auto racing", 25.0], ["vehicle", 20.35], ["car", 20.18]], null, null, [["skidding", 27.81], ["vehicle", 26.5], ["car", 23.6]], null], "duration": [0.33, 0.36, 8.5, 1.56, 0.87, 4.78, 5.21, 54.33, 0.22, 18.24, -0.36]} \ No newline at end of file diff --git a/annotations_1/GU1zIn2BRN0_filtered.json b/annotations_1/GU1zIn2BRN0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f260c3c69eb337a5f264ad210580e17894f83a8b --- /dev/null +++ b/annotations_1/GU1zIn2BRN0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.3], [10.0, 30.5], [33.0, 48.83], [53.0, 55.27], [57.0, 69.11], [70.0, 75.51], [76.0, 79.51], [80.0, 81.13], [82.0, 86.0], [88.0, 88.65], [92.0, 93.85], [105.0, 107.11], [108.0, 109.66], [113.0, 120.56], [123.0, 128.02], [129.0, 132.29], [133.0, 178.34], [181.0, 183.69]], "keep_status": [true, false, false, false, true, false, true, false, true, false, false, true, false, false, false, false, false, true], "silence_prob": [31.36, 29.01, 28.66, 29.57, 29.11, 29.08, 29.84, 0.0, 29.56, 0.0, 0.0, 31.78, 0.0, 29.87, 29.7, 29.04, 0.0, 30.85], "audiomae_on_audioset": [[["music", 23.3], ["theremin", 16.37], ["trombone", 9.35]], [["speech", 55.73], ["music", 21.34], ["theremin", 2.54]], [["music", 61.15], ["throbbing", 4.65], ["speech", 4.52]], [["music", 52.88], ["hum", 10.66], ["mains hum", 8.79]], [["music", 44.96], ["electric shaver, electric razor", 7.02], ["didgeridoo", 6.22]], [["music", 53.61], ["didgeridoo", 14.47], ["theremin", 10.42]], [["music", 32.71], ["whale vocalization", 7.7], ["sound effect", 5.32]], null, [["hum", 39.28], ["mains hum", 15.35], ["music", 13.1]], null, null, [["music", 42.49], ["didgeridoo", 6.76], ["theremin", 4.51]], null, [["foghorn", 85.67], ["speech", 6.6], ["music", 3.72]], [["music", 46.51], ["hum", 16.59], ["mains hum", 16.0]], [["mains hum", 35.27], ["hum", 28.45], ["music", 9.88]], null, [["music", 44.51], ["throbbing", 11.52], ["speech", 10.72]]], "duration": [2.3, 20.5, 15.83, 2.27, 12.11, 5.51, 3.51, 1.13, 4.0, 0.65, 1.85, 2.11, 1.66, 7.56, 5.02, 3.29, 45.34, 2.69]} \ No newline at end of file diff --git a/annotations_1/GUDrinKzSus_filtered.json b/annotations_1/GUDrinKzSus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..355050cdffae981ecfca87430a488370b729367f --- /dev/null +++ b/annotations_1/GUDrinKzSus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.06], [11.0, 14.59], [21.0, 21.69], [23.0, 27.8], [35.0, 36.64], [39.0, 38.92], [41.0, 43.92], [45.0, 45.82], [47.0, 50.13], [51.0, 52.41], [57.0, 60.69], [62.0, 62.16], [63.0, 63.86], [64.0, 68.25], [69.0, 70.14], [71.0, 75.27], [76.0, 76.92], [78.0, 84.35], [85.0, 87.49], [88.0, 93.21], [96.0, 98.54], [99.0, 99.55], [101.0, 102.66], [108.0, 109.49], [112.0, 116.99], [118.0, 119.65], [122.0, 123.94], [126.0, 127.23], [129.0, 130.28], [131.0, 131.94], [134.0, 134.97], [136.0, 136.05], [137.0, 137.17], [138.0, 142.91]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 53.72, 0.0, 49.4, 0.0, 0.0, 99.76, 0.0, 87.37, 0.0, 80.11, 0.0, 0.0, 91.64, 0.0, 89.72, 0.0, 94.81, 99.1, 95.78, 94.81, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47], "audiomae_on_audioset": [null, null, null, [["speech", 46.31], ["hum", 10.27], ["throbbing", 8.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.06, 3.59, 0.69, 4.8, 1.64, -0.08, 2.92, 0.82, 3.13, 1.41, 3.69, 0.16, 0.86, 4.25, 1.14, 4.27, 0.92, 6.35, 2.49, 5.21, 2.54, 0.55, 1.66, 1.49, 4.99, 1.65, 1.94, 1.23, 1.28, 0.94, 0.97, 0.05, 0.17, 4.91]} \ No newline at end of file diff --git a/annotations_1/GUw4G1lDGYE_filtered.json b/annotations_1/GUw4G1lDGYE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d269793f6dd50372c83e6c5f8748144fb81dce71 --- /dev/null +++ b/annotations_1/GUw4G1lDGYE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.05], [7.0, 8.63], [11.0, 11.5], [16.0, 15.74], [17.0, 17.46], [18.0, 19.04], [20.0, 20.26], [22.0, 25.42], [28.0, 28.59], [29.0, 32.32], [33.0, 34.64], [35.0, 37.93], [40.0, 42.6], [46.0, 59.02], [60.0, 61.37], [68.0, 74.46], [75.0, 75.69], [81.0, 84.84], [87.0, 87.35], [89.0, 89.95], [98.0, 98.78], [100.0, 100.67], [102.0, 103.44], [104.0, 106.32], [109.0, 114.79], [120.0, 124.51], [132.0, 132.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 97.92, 0.0, 100.0, 100.0, 93.6, 0.0, 92.8, 0.0, 33.4, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 88.28, 81.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 29.56], ["hum", 17.08], ["speech", 8.92]], null, null, null, null, null, null, null, null, null], "duration": [0.05, 1.63, 0.5, -0.26, 0.46, 1.04, 0.26, 3.42, 0.59, 3.32, 1.64, 2.93, 2.6, 13.02, 1.37, 6.46, 0.69, 3.84, 0.35, 0.95, 0.78, 0.67, 1.44, 2.32, 5.79, 4.51, 0.63]} \ No newline at end of file diff --git a/annotations_1/GVqoyzJUzJk_filtered.json b/annotations_1/GVqoyzJUzJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e894e1f54982173c8894b092987e6ba68685c82 --- /dev/null +++ b/annotations_1/GVqoyzJUzJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.45], [27.0, 37.84], [40.0, 40.32], [43.0, 115.05]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 33.92, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 18.91], ["livestock, farm animals, working animals", 14.64], ["music", 13.65]], null, null], "duration": [0.45, 10.84, 0.32, 72.05]} \ No newline at end of file diff --git a/annotations_1/GW475l4IoyU_filtered.json b/annotations_1/GW475l4IoyU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4272908e3edb9d20502ed2279a58a8e194dcb83 --- /dev/null +++ b/annotations_1/GW475l4IoyU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 29.3], [34.0, 38.82], [52.0, 52.51], [53.0, 53.65], [54.0, 54.18], [55.0, 55.86], [62.0, 62.95], [64.0, 65.85], [66.0, 69.53], [74.0, 75.3], [77.0, 82.0], [83.0, 86.39], [89.0, 91.12], [92.0, 104.87], [107.0, 107.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [74.13, 62.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 60.23, 37.73, 99.1, 38.32, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.3], ["breaking", 4.89], ["water", 2.35]], null, [["speech", 57.17], ["clip-clop", 6.58], ["fart", 3.76]], null], "duration": [2.3, 4.82, 0.51, 0.65, 0.18, 0.86, 0.95, 1.85, 3.53, 1.3, 5.0, 3.39, 2.12, 12.87, 0.77]} \ No newline at end of file diff --git a/annotations_1/GWxf8Hb-Xis_filtered.json b/annotations_1/GWxf8Hb-Xis_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..565bf7fb779024e4b933db140ac1ff94381a25c3 --- /dev/null +++ b/annotations_1/GWxf8Hb-Xis_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 54.46], [58.0, 58.63], [65.0, 65.97], [67.0, 68.1], [69.0, 74.88], [75.0, 83.98], [87.0, 93.45], [95.0, 96.52], [99.0, 104.23], [106.0, 116.45], [119.0, 125.25], [126.0, 126.96], [129.0, 131.36], [134.0, 134.81], [139.0, 142.25], [144.0, 144.05], [150.0, 150.36], [153.0, 153.69], [160.0, 162.99], [171.0, 171.73], [173.0, 173.62]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [31.57, 0.0, 0.0, 0.0, 42.76, 59.51, 98.19, 0.0, 92.8, 67.89, 35.22, 0.0, 74.76, 0.0, 68.54, 0.0, 0.0, 0.0, 35.52, 0.0, 0.0], "audiomae_on_audioset": [[["music", 61.59], ["cacophony", 4.39], ["reverberation", 3.35]], null, null, null, [["music", 28.47], ["fly, housefly", 15.88], ["hum", 9.44]], null, null, null, null, null, [["speech", 58.16], ["music", 14.27], ["hum", 3.42]], null, null, null, null, null, null, null, [["hum", 26.68], ["mains hum", 25.29], ["throbbing", 11.71]], null, null], "duration": [19.46, 0.63, 0.97, 1.1, 5.88, 8.98, 6.45, 1.52, 5.23, 10.45, 6.25, 0.96, 2.36, 0.81, 3.25, 0.05, 0.36, 0.69, 2.99, 0.73, 0.62]} \ No newline at end of file diff --git a/annotations_1/GXZSat3AqwE_filtered.json b/annotations_1/GXZSat3AqwE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c44e6630465e03eca59b5b90f8e647b4bdb0aba --- /dev/null +++ b/annotations_1/GXZSat3AqwE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 30.75], [32.0, 32.63], [37.0, 37.37], [59.0, 58.67], [61.0, 61.3], [63.0, 63.54], [64.0, 65.8], [70.0, 70.17], [74.0, 76.38], [77.0, 78.34], [80.0, 81.94], [82.0, 83.03], [85.0, 86.09], [86.0, 88.45], [93.0, 93.93], [94.0, 96.52], [97.0, 100.48], [102.0, 103.76], [104.0, 105.17], [108.0, 108.55], [122.0, 122.05], [123.0, 124.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 36.15, 0.0, 40.47, 81.17, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 31.02], ["chirp tone", 29.53], ["tuning fork", 16.42]], null, [["speech", 46.0], ["sidetone", 11.97], ["ping", 6.66]], null, null, null, null, null, null], "duration": [4.75, 0.63, 0.37, -0.33, 0.3, 0.54, 1.8, 0.17, 2.38, 1.34, 1.94, 1.03, 1.09, 2.45, 0.93, 2.52, 3.48, 1.76, 1.17, 0.55, 0.05, 1.92]} \ No newline at end of file diff --git a/annotations_1/GYexCnV6cLY_filtered.json b/annotations_1/GYexCnV6cLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..211892dd1dec8a1c82d86f4c14093aa1c2aea273 --- /dev/null +++ b/annotations_1/GYexCnV6cLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.88], [3.0, 4.29], [6.0, 6.88], [8.0, 9.24], [10.0, 11.04], [11.0, 13.15], [14.0, 15.18], [18.0, 18.17], [20.0, 20.68], [26.0, 26.97], [28.0, 29.08], [32.0, 33.0], [38.0, 39.5], [42.0, 44.58], [51.0, 57.4], [58.0, 60.29], [61.0, 63.07], [64.0, 65.87], [67.0, 68.44], [69.0, 70.28], [72.0, 72.1], [84.0, 85.23], [86.0, 87.08], [89.0, 89.23], [90.0, 91.05], [93.0, 93.18], [96.0, 96.77], [102.0, 103.11], [103.0, 105.06], [106.0, 107.52], [109.0, 109.78], [112.0, 113.61], [114.0, 119.26], [121.0, 121.76], [123.0, 126.01], [127.0, 128.19], [129.0, 131.26], [132.0, 133.86], [135.0, 135.94], [138.0, 138.21], [143.0, 143.23], [147.0, 147.77], [155.0, 155.22], [157.0, 157.54], [158.0, 158.72], [159.0, 161.1], [162.0, 162.16], [163.0, 163.78], [165.0, 165.59], [166.0, 167.29], [168.0, 169.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.31, 36.64, 49.22, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 90.95, 0.0, 73.21, 0.0, 48.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.85, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 39.23], ["dial tone", 23.87], ["telephone", 12.11]], null, null, null, null, null, null, null, [["speech", 30.36], ["sidetone", 10.73], ["domestic animals, pets", 8.0]], [["speech", 37.57], ["throbbing", 14.91], ["heart sounds, heartbeat", 8.68]], [["speech synthesizer", 21.98], ["speech", 19.01], ["mains hum", 10.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 57.55], ["hum", 35.62], ["sidetone", 2.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 1.29, 0.88, 1.24, 1.04, 2.15, 1.18, 0.17, 0.68, 0.97, 1.08, 1.0, 1.5, 2.58, 6.4, 2.29, 2.07, 1.87, 1.44, 1.28, 0.1, 1.23, 1.08, 0.23, 1.05, 0.18, 0.77, 1.11, 2.06, 1.52, 0.78, 1.61, 5.26, 0.76, 3.01, 1.19, 2.26, 1.86, 0.94, 0.21, 0.23, 0.77, 0.22, 0.54, 0.72, 2.1, 0.16, 0.78, 0.59, 1.29, 1.11]} \ No newline at end of file diff --git a/annotations_1/GYh7IHTeLus_filtered.json b/annotations_1/GYh7IHTeLus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a033ad030b3624d1644b63f104024db04a1d597 --- /dev/null +++ b/annotations_1/GYh7IHTeLus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.18], [4.0, 7.38], [20.0, 20.97], [30.0, 31.38], [35.0, 37.47], [41.0, 41.79], [51.0, 52.88], [57.0, 59.12], [66.0, 69.33], [70.0, 72.99], [75.0, 77.31], [79.0, 80.23], [82.0, 89.82], [91.0, 92.04], [93.0, 94.56], [96.0, 96.63], [99.0, 99.82], [102.0, 106.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.43, 0.0, 0.0, 65.44, 0.0, 0.0, 81.71, 79.07, 70.16, 56.25, 0.0, 56.78, 0.0, 0.0, 0.0, 0.0, 91.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 3.38, 0.97, 1.38, 2.47, 0.79, 1.88, 2.12, 3.33, 2.99, 2.31, 1.23, 7.82, 1.04, 1.56, 0.63, 0.82, 4.71]} \ No newline at end of file diff --git a/annotations_1/GZ3fgYIUrJU_filtered.json b/annotations_1/GZ3fgYIUrJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff000d5e3a7e8ee9936b5a95cd8533468644d98a --- /dev/null +++ b/annotations_1/GZ3fgYIUrJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 26.45], [27.0, 27.72], [29.0, 29.25], [30.0, 78.48], [83.0, 89.07], [92.0, 95.22], [99.0, 99.72], [102.0, 102.81], [104.0, 104.3], [106.0, 106.81], [109.0, 111.33], [115.0, 115.15], [119.0, 119.87], [121.0, 122.01], [123.0, 125.73], [141.0, 140.73], [157.0, 157.57], [160.0, 161.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.81, 0.0, 0.0, 0.0, 81.89, 60.7, 0.0, 0.0, 0.0, 0.0, 69.61, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["insect", 56.41], ["fly, housefly", 25.18], ["mosquito", 9.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.45, 0.72, 0.25, 48.48, 6.07, 3.22, 0.72, 0.81, 0.3, 0.81, 2.33, 0.15, 0.87, 1.01, 2.73, -0.27, 0.57, 1.4]} \ No newline at end of file diff --git a/annotations_1/GZauEya_plU_filtered.json b/annotations_1/GZauEya_plU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2840d261d16d743cbcd6bd78b0c9cd91369d1e78 --- /dev/null +++ b/annotations_1/GZauEya_plU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.56], [15.0, 15.35], [36.0, 36.05], [38.0, 38.6], [39.0, 38.8], [57.0, 57.59], [88.0, 88.52], [89.0, 90.19], [91.0, 90.71], [92.0, 92.3], [96.0, 97.65], [101.0, 101.21], [115.0, 115.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 0.35, 0.05, 0.6, -0.2, 0.59, 0.52, 1.19, -0.29, 0.3, 1.65, 0.21, 0.52]} \ No newline at end of file diff --git a/annotations_1/GZiLvbk8fL8_filtered.json b/annotations_1/GZiLvbk8fL8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33e64f8637f171ae83545525338f764ab39c61de --- /dev/null +++ b/annotations_1/GZiLvbk8fL8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [9.0, 20.68], [24.0, 25.25], [26.0, 28.07], [30.0, 35.43], [42.0, 53.69], [57.0, 57.0], [59.0, 61.28], [66.0, 72.72], [73.0, 100.47]], "keep_status": [false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 31.61, 0.0, 28.84, 29.41, 31.19, 0.0, 32.71, 30.88, 28.8], "audiomae_on_audioset": [null, [["music", 48.41], ["echo", 8.16], ["musical instrument", 4.77]], null, [["music", 64.99], ["musical instrument", 11.54], ["guitar", 6.74]], [["music", 64.58], ["speech", 4.83], ["foghorn", 4.6]], [["music", 77.91], ["boing", 8.9], ["speech", 2.38]], null, [["music", 65.71], ["laughter", 6.38], ["speech", 2.28]], [["speech", 38.71], ["music", 25.27], ["throbbing", 8.54]], [["music", 36.26], ["speech", 21.25], ["throbbing", 6.51]]], "duration": [0.04, 11.68, 1.25, 2.07, 5.43, 11.69, 0.0, 2.28, 6.72, 27.47]} \ No newline at end of file diff --git a/annotations_1/GZxal1kvCfY_filtered.json b/annotations_1/GZxal1kvCfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a5377005faf2e76492f87a547f930c219cd7f75 --- /dev/null +++ b/annotations_1/GZxal1kvCfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.11], [26.0, 25.78], [29.0, 29.0], [44.0, 43.82], [44.0, 51.78], [58.0, 58.13], [65.0, 66.65], [85.0, 86.56], [88.0, 89.04], [90.0, 91.15], [91.0, 95.96], [99.0, 100.75], [103.0, 103.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.99, 0.0, 0.0, 0.0, 0.0, 0.0, 68.15, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.11, -0.22, 0.0, -0.18, 7.78, 0.13, 1.65, 1.56, 1.04, 1.15, 4.96, 1.75, 0.22]} \ No newline at end of file diff --git a/annotations_1/G_Rd3TcODj4_filtered.json b/annotations_1/G_Rd3TcODj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfb95d1d3141b9cff5b6a9f0d0f2b11db8335ec8 --- /dev/null +++ b/annotations_1/G_Rd3TcODj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.35], [19.0, 19.74], [21.0, 21.59], [23.0, 22.67], [25.0, 26.28], [27.0, 28.09], [29.0, 32.04], [33.0, 72.35], [73.0, 83.12], [86.0, 86.49], [94.0, 95.1], [97.0, 99.45], [100.0, 104.45], [108.0, 126.87], [128.0, 133.17], [134.0, 135.26]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, true, true, true, false], "silence_prob": [52.8, 0.0, 0.0, 0.0, 0.0, 0.0, 30.67, 0.0, 29.35, 0.0, 0.0, 29.3, 29.89, 30.05, 37.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 13.22], ["groan", 9.77], ["livestock, farm animals, working animals", 8.43]], null, [["hum", 32.53], ["speech", 24.96], ["mains hum", 22.21]], null, null, [["music", 39.89], ["hum", 16.53], ["mains hum", 8.77]], [["music", 50.48], ["speech", 13.89], ["mains hum", 4.47]], [["music", 47.36], ["cattle, bovinae", 11.05], ["livestock, farm animals, working animals", 9.13]], [["music", 12.03], ["speech", 9.68], ["rumble", 7.35]], null], "duration": [2.35, 0.74, 0.59, -0.33, 1.28, 1.09, 3.04, 39.35, 10.12, 0.49, 1.1, 2.45, 4.45, 18.87, 5.17, 1.26]} \ No newline at end of file diff --git a/annotations_1/GaIcAaHFc0U_filtered.json b/annotations_1/GaIcAaHFc0U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd9e9d0201f8b91ef24bbaf42faad46e585b8830 --- /dev/null +++ b/annotations_1/GaIcAaHFc0U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 27.35], [30.0, 30.18], [31.0, 31.41], [33.0, 32.71], [34.0, 34.16], [37.0, 37.02], [38.0, 49.82], [51.0, 55.81], [62.0, 64.5], [65.0, 65.87], [67.0, 69.21], [70.0, 76.5], [77.0, 82.59], [84.0, 86.32], [87.0, 89.13], [93.0, 98.02], [101.0, 103.87], [109.0, 110.79], [115.0, 116.11], [120.0, 121.26], [127.0, 128.51], [129.0, 130.71], [135.0, 135.77], [139.0, 139.13], [144.0, 144.42], [146.0, 147.6], [150.0, 151.38], [153.0, 153.96], [157.0, 160.12], [165.0, 177.06], [181.0, 181.14], [187.0, 188.38], [194.0, 195.27], [203.0, 203.49], [205.0, 205.98], [208.0, 208.35], [209.0, 209.66], [213.0, 213.66], [215.0, 217.36], [220.0, 223.18], [224.0, 229.36], [231.0, 232.44], [233.0, 235.09]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [29.82, 0.0, 0.0, 0.0, 0.0, 0.0, 28.94, 37.68, 29.61, 0.0, 57.89, 30.58, 47.35, 34.64, 31.56, 31.52, 31.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.58, 36.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.4, 34.14, 42.69, 0.0, 31.65], "audiomae_on_audioset": [[["music", 55.18], ["speech", 29.63], ["electronic music", 1.55]], null, null, null, null, null, [["music", 50.71], ["hum", 13.8], ["throbbing", 11.5]], [["speech", 50.26], ["music", 18.47], ["sidetone", 3.77]], [["music", 13.47], ["electronic music", 11.74], ["sine wave", 8.86]], null, null, [["music", 38.22], ["hum", 14.53], ["throbbing", 5.63]], [["hum", 33.44], ["mains hum", 14.61], ["music", 9.86]], [["whale vocalization", 55.11], ["music", 3.1], ["quack", 3.04]], [["singing bowl", 31.58], ["music", 17.53], ["gong", 14.22]], [["hum", 26.57], ["music", 16.68], ["mains hum", 11.34]], [["gong", 77.64], ["music", 4.52], ["hum", 1.95]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 45.55], ["mains hum", 18.69], ["throbbing", 17.24]], [["throbbing", 29.37], ["hum", 25.59], ["music", 19.8]], null, null, null, null, null, null, null, null, [["hum", 30.44], ["mains hum", 19.8], ["speech", 14.3]], [["music", 49.27], ["theremin", 26.45], ["didgeridoo", 12.9]], [["music", 49.53], ["hum", 7.38], ["glass", 7.29]], null, [["music", 45.57], ["didgeridoo", 34.7], ["musical instrument", 3.15]]], "duration": [12.35, 0.18, 0.41, -0.29, 0.16, 0.02, 11.82, 4.81, 2.5, 0.87, 2.21, 6.5, 5.59, 2.32, 2.13, 5.02, 2.87, 1.79, 1.11, 1.26, 1.51, 1.71, 0.77, 0.13, 0.42, 1.6, 1.38, 0.96, 3.12, 12.06, 0.14, 1.38, 1.27, 0.49, 0.98, 0.35, 0.66, 0.66, 2.36, 3.18, 5.36, 1.44, 2.09]} \ No newline at end of file diff --git a/annotations_1/GaUGoueAS4Y_filtered.json b/annotations_1/GaUGoueAS4Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c015ef7af69fe53317135e2ed967905a1c6ab460 --- /dev/null +++ b/annotations_1/GaUGoueAS4Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 139.29], [143.0, 186.83]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [126.29, 43.83]} \ No newline at end of file diff --git a/annotations_1/Gae_um_eNZU_filtered.json b/annotations_1/Gae_um_eNZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b79cc841c3c4bcacabaca63ee49dc0b4ad88dd2a --- /dev/null +++ b/annotations_1/Gae_um_eNZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.35], [19.0, 20.14], [30.0, 31.45], [33.0, 33.17], [35.0, 35.11], [36.0, 36.49], [37.0, 39.73], [54.0, 55.29], [59.0, 60.08], [60.0, 60.17], [65.0, 82.0], [86.0, 86.43], [87.0, 87.08], [91.0, 91.18], [94.0, 99.23], [100.0, 100.23], [103.0, 103.0], [107.0, 110.08], [111.0, 113.09], [115.0, 115.92], [118.0, 118.3], [122.0, 128.51], [129.0, 128.56], [129.0, 129.57], [130.0, 132.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 91.98, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 87.19, 51.6, 0.0, 0.0, 70.72, 0.0, 0.0, 55.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.35, 1.14, 1.45, 0.17, 0.11, 0.49, 2.73, 1.29, 1.08, 0.17, 17.0, 0.43, 0.08, 0.18, 5.23, 0.23, 0.0, 3.08, 2.09, 0.92, 0.3, 6.51, -0.44, 0.57, 2.12]} \ No newline at end of file diff --git a/annotations_1/GbCytLu1-3k_filtered.json b/annotations_1/GbCytLu1-3k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35c00306a7b0c8a351a2cd4e3f4afad19f5c9f76 --- /dev/null +++ b/annotations_1/GbCytLu1-3k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.0], [13.0, 14.2], [17.0, 16.77], [17.0, 19.84], [32.0, 32.83], [37.0, 37.59], [38.0, 38.23], [44.0, 44.59], [45.0, 45.59], [54.0, 55.34], [56.0, 57.11], [69.0, 69.25], [70.0, 71.32], [72.0, 72.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 57.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 1.2, -0.23, 2.84, 0.83, 0.59, 0.23, 0.59, 0.59, 1.34, 1.11, 0.25, 1.32, 0.91]} \ No newline at end of file diff --git a/annotations_1/GbOXTIymvqc_filtered.json b/annotations_1/GbOXTIymvqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62257b89f2830ec98c7f90173c1a5c680b6554ee --- /dev/null +++ b/annotations_1/GbOXTIymvqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [6.0, 6.59], [7.0, 10.44], [11.0, 11.38], [12.0, 21.54], [25.0, 25.2], [29.0, 30.33], [33.0, 33.13], [43.0, 43.34], [44.0, 45.72], [46.0, 48.19], [50.0, 66.9], [67.0, 67.41], [67.0, 84.84], [86.0, 87.44], [89.0, 90.05], [96.0, 97.21], [103.0, 105.76], [108.0, 110.76], [117.0, 118.47], [122.0, 122.79], [123.0, 127.03], [128.0, 127.97], [129.0, 129.95], [137.0, 138.72], [144.0, 144.58], [160.0, 161.72]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.63, 0.0, 31.91, 0.0, 0.0, 0.0, 0.0, 0.0, 79.41, 49.54, 0.0, 37.08, 0.0, 0.0, 0.0, 53.72, 37.59, 0.0, 0.0, 76.53, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 65.16], ["music", 4.41], ["didgeridoo", 2.7]], null, [["whale vocalization", 16.0], ["fly, housefly", 14.42], ["mosquito", 13.48]], null, null, null, null, null, null, [["music", 31.91], ["speech", 24.74], ["glass", 8.53]], null, [["hum", 24.88], ["speech", 18.96], ["music", 16.07]], null, null, null, null, [["hum", 31.33], ["fly, housefly", 16.08], ["mains hum", 14.34]], null, null, null, null, null, null, null, null], "duration": [0.45, 0.59, 3.44, 0.38, 9.54, 0.2, 1.33, 0.13, 0.34, 1.72, 2.19, 16.9, 0.41, 17.84, 1.44, 1.05, 1.21, 2.76, 2.76, 1.47, 0.79, 4.03, -0.03, 0.95, 1.72, 0.58, 1.72]} \ No newline at end of file diff --git a/annotations_1/GbQy-0SzshA_filtered.json b/annotations_1/GbQy-0SzshA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ca303d151e1c371b964029c7a4f929e3a5a5052 --- /dev/null +++ b/annotations_1/GbQy-0SzshA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 69.43], [70.0, 197.36]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [39.43, 127.36]} \ No newline at end of file diff --git a/annotations_1/GbZZ2TDY5dA_filtered.json b/annotations_1/GbZZ2TDY5dA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..791b913dbd22647c50165ec5140dc8336795708f --- /dev/null +++ b/annotations_1/GbZZ2TDY5dA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.47], [13.0, 16.51], [18.0, 32.61], [38.0, 40.24], [48.0, 49.5], [61.0, 61.5], [69.0, 69.06], [75.0, 76.55], [79.0, 81.09], [82.0, 84.48], [85.0, 88.92], [93.0, 92.82], [93.0, 93.38], [94.0, 97.17], [98.0, 149.12], [151.0, 152.93], [154.0, 159.04], [162.0, 166.13], [166.0, 167.73], [171.0, 174.36]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [43.15, 54.1, 59.86, 76.2, 0.0, 0.0, 0.0, 0.0, 43.51, 46.57, 55.53, 0.0, 0.0, 53.59, 0.0, 0.0, 49.36, 48.65, 0.0, 49.09], "audiomae_on_audioset": [[["music", 13.16], ["synthesizer", 10.75], ["sonar", 9.25]], null, null, null, null, null, null, null, [["hum", 19.79], ["throbbing", 16.55], ["whale vocalization", 10.16]], [["speech", 52.5], ["rumble", 11.67], ["hum", 5.91]], null, null, null, null, null, null, [["music", 23.4], ["speech", 17.24], ["didgeridoo", 10.45]], [["music", 63.09], ["speech", 14.7], ["synthesizer", 4.01]], null, [["music", 32.04], ["quack", 13.75], ["duck", 13.6]]], "duration": [2.47, 3.51, 14.61, 2.24, 1.5, 0.5, 0.06, 1.55, 2.09, 2.48, 3.92, -0.18, 0.38, 3.17, 51.12, 1.93, 5.04, 4.13, 1.73, 3.36]} \ No newline at end of file diff --git a/annotations_1/Gbvml-bH5Uc_filtered.json b/annotations_1/Gbvml-bH5Uc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d40c04d996009a358722b758de92706b1cef0f2 --- /dev/null +++ b/annotations_1/Gbvml-bH5Uc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.94], [6.0, 7.43], [8.0, 10.35], [12.0, 15.35], [24.0, 25.12], [26.0, 26.65], [36.0, 38.52], [41.0, 40.86], [43.0, 46.09], [49.0, 49.55], [51.0, 52.08], [56.0, 83.89], [85.0, 86.83], [88.0, 89.01], [91.0, 91.57], [95.0, 95.45], [96.0, 97.34], [101.0, 102.29], [104.0, 105.04], [106.0, 114.66], [116.0, 125.32]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 100.0, 99.95, 0.0, 0.0, 99.82, 0.0, 41.32, 0.0, 0.0, 72.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.02, 55.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 50.92], ["mosquito", 12.15], ["neigh, whinny", 5.01]], null, null, null, null, null, null, null, null, null, null, [["speech", 31.72], ["music", 26.86], ["hum", 3.67]], null], "duration": [1.94, 1.43, 2.35, 3.35, 1.12, 0.65, 2.52, -0.14, 3.09, 0.55, 1.08, 27.89, 1.83, 1.01, 0.57, 0.45, 1.34, 1.29, 1.04, 8.66, 9.32]} \ No newline at end of file diff --git a/annotations_1/Gdp4SEfQzy8_filtered.json b/annotations_1/Gdp4SEfQzy8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e5ad08ab8c4537ace06a1122a6bef33ce839811 --- /dev/null +++ b/annotations_1/Gdp4SEfQzy8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.19], [2.0, 7.21], [14.0, 35.43]], "keep_status": [false, false, false], "silence_prob": [0.0, 31.53, 30.91], "audiomae_on_audioset": [null, [["music", 66.2], ["musical instrument", 4.76], ["guitar", 2.0]], [["music", 75.48], ["breaking", 6.56], ["hum", 2.9]]], "duration": [0.19, 5.21, 21.43]} \ No newline at end of file diff --git a/annotations_1/Gdpx9aiEtmg_filtered.json b/annotations_1/Gdpx9aiEtmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9e1237c9179d13961fa63cdc7afacb701f92402 --- /dev/null +++ b/annotations_1/Gdpx9aiEtmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 45.89], [47.0, 73.03], [74.0, 86.24], [87.0, 87.67], [89.0, 89.67], [90.0, 100.36], [102.0, 103.59], [104.0, 111.3], [116.0, 123.35], [127.0, 129.64], [131.0, 130.87], [132.0, 132.48], [135.0, 137.94], [144.0, 176.5]], "keep_status": [false, false, true, false, false, true, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 33.23, 34.44, 0.0, 0.0, 29.08, 0.0, 28.4, 30.18, 31.2, 0.0, 0.0, 41.66, 0.0], "audiomae_on_audioset": [null, [["throbbing", 65.62], ["hum", 22.18], ["mains hum", 2.64]], [["hum", 14.84], ["fly, housefly", 12.4], ["insect", 7.86]], null, null, [["speech", 38.36], ["explosion", 25.01], ["burst, pop", 5.36]], null, [["speech", 45.56], ["music", 9.64], ["crying, sobbing", 5.64]], [["hum", 51.72], ["mains hum", 29.37], ["throbbing", 6.76]], [["speech", 39.28], ["music", 6.78], ["effects unit", 3.68]], null, null, [["music", 26.4], ["speech", 18.0], ["synthesizer", 7.28]], null], "duration": [-0.11, 26.03, 12.24, 0.67, 0.67, 10.36, 1.59, 7.3, 7.35, 2.64, -0.13, 0.48, 2.94, 32.5]} \ No newline at end of file diff --git a/annotations_1/GdrUYcOTUvY_filtered.json b/annotations_1/GdrUYcOTUvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..092c2f21bf41619a851a5873f5f377719e831721 --- /dev/null +++ b/annotations_1/GdrUYcOTUvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.06], [5.0, 6.05], [8.0, 8.56], [12.0, 12.36], [14.0, 15.01], [16.0, 17.56], [19.0, 19.45], [21.0, 22.11], [23.0, 26.49], [28.0, 31.28], [32.0, 32.83], [35.0, 36.09], [36.0, 42.13], [43.0, 53.54], [55.0, 58.53], [60.0, 61.86], [63.0, 64.77], [66.0, 67.74], [69.0, 71.73], [72.0, 75.39], [77.0, 78.38], [79.0, 81.26], [82.0, 83.51], [87.0, 88.16], [91.0, 93.06], [97.0, 97.98], [99.0, 100.6], [103.0, 105.04], [106.0, 107.96], [109.0, 111.52], [112.0, 112.56], [123.0, 123.62], [128.0, 130.5], [132.0, 134.18], [135.0, 139.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 74.13, 88.64, 99.73, 0.0, 0.0, 0.0, 100.0, 98.99, 0.0, 97.43, 0.0, 0.0, 55.39, 0.0, 0.0, 79.07, 0.0, 36.16, 0.0, 0.0, 98.44, 96.77, 96.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 84.87], ["music", 4.75], ["theremin", 3.09]], null, null, null, null, null], "duration": [1.06, 1.05, 0.56, 0.36, 1.01, 1.56, 0.45, 1.11, 3.49, 3.28, 0.83, 1.09, 6.13, 10.54, 3.53, 1.86, 1.77, 1.74, 2.73, 3.39, 1.38, 2.26, 1.51, 1.16, 2.06, 0.98, 1.6, 2.04, 1.96, 2.52, 0.56, 0.62, 2.5, 2.18, 4.73]} \ No newline at end of file diff --git a/annotations_1/GeLDjQIIkdI_filtered.json b/annotations_1/GeLDjQIIkdI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbe22b6e8989ae0d01c6b085adb7865e5c35e622 --- /dev/null +++ b/annotations_1/GeLDjQIIkdI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.11], [9.0, 9.32], [12.0, 14.32], [16.0, 20.93], [22.0, 22.2], [23.0, 23.57], [39.0, 39.58], [45.0, 45.6], [46.0, 48.34], [57.0, 77.94], [79.0, 103.18], [105.0, 107.45], [115.0, 116.41], [119.0, 135.21], [138.0, 139.56], [145.0, 150.11], [155.0, 171.59]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 36.99, 30.9, 0.0, 0.0, 0.0, 0.0, 30.05, 29.11, 29.1, 32.91, 0.0, 31.28, 0.0, 29.36, 29.7], "audiomae_on_audioset": [null, null, [["music", 30.58], ["whale vocalization", 25.3], ["electronic music", 12.12]], [["music", 57.31], ["hum", 7.82], ["rumble", 7.2]], null, null, null, null, [["music", 71.75], ["noise", 6.06], ["hum", 4.78]], [["music", 42.25], ["hum", 8.17], ["mains hum", 6.37]], [["music", 32.84], ["hum", 24.13], ["mains hum", 20.58]], [["music", 39.43], ["hum", 15.09], ["speech", 7.65]], null, [["music", 68.39], ["electronic music", 5.7], ["hum", 4.59]], null, [["music", 33.26], ["mains hum", 25.49], ["hum", 5.5]], [["music", 72.94], ["hum", 6.05], ["throbbing", 2.98]]], "duration": [0.11, 0.32, 2.32, 4.93, 0.2, 0.57, 0.58, 0.6, 2.34, 20.94, 24.18, 2.45, 1.41, 16.21, 1.56, 5.11, 16.59]} \ No newline at end of file diff --git a/annotations_1/Gfc_7pOTR28_filtered.json b/annotations_1/Gfc_7pOTR28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24edba6b6bdd5be78935df4a8a2d89bbbaadbcef --- /dev/null +++ b/annotations_1/Gfc_7pOTR28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.38], [10.0, 10.67], [13.0, 18.32], [19.0, 21.68], [23.0, 27.97], [30.0, 30.45], [34.0, 35.72], [40.0, 40.27], [42.0, 42.09], [51.0, 50.87], [53.0, 52.88], [58.0, 58.63], [60.0, 60.93], [69.0, 80.18], [80.0, 80.42], [82.0, 82.51], [85.0, 86.51], [87.0, 88.53], [111.0, 111.08], [127.0, 127.48], [131.0, 132.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 99.84, 100.0, 78.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.46], ["wail, moan", 28.42], ["crying, sobbing", 9.12]], null, null, null, null, null, null, null], "duration": [4.38, 0.67, 5.32, 2.68, 4.97, 0.45, 1.72, 0.27, 0.09, -0.13, -0.12, 0.63, 0.93, 11.18, 0.42, 0.51, 1.51, 1.53, 0.08, 0.48, 1.54]} \ No newline at end of file diff --git a/annotations_1/Gfje9_QRQbk_filtered.json b/annotations_1/Gfje9_QRQbk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1194fe5041817e89bddb4fa504702c48424e4f09 --- /dev/null +++ b/annotations_1/Gfje9_QRQbk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.19], [23.0, 39.85], [41.0, 41.5], [42.0, 46.6], [47.0, 47.66], [48.0, 50.19], [51.0, 73.23], [74.0, 108.45], [115.0, 117.53], [120.0, 120.01], [123.0, 123.18], [124.0, 124.36], [126.0, 126.01], [128.0, 128.92], [129.0, 131.75], [132.0, 132.95], [134.0, 137.27], [139.0, 142.74], [143.0, 145.86], [148.0, 153.03], [154.0, 166.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.01, 0.0, 96.04, 0.0, 90.43, 74.76, 0.0, 70.3, 0.0, 0.0, 0.0, 0.0, 0.0, 65.32, 0.0, 77.2, 75.39, 89.54, 67.13, 66.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 16.85, 0.5, 4.6, 0.66, 2.19, 22.23, 34.45, 2.53, 0.01, 0.18, 0.36, 0.01, 0.92, 2.75, 0.95, 3.27, 3.74, 2.86, 5.03, 12.73]} \ No newline at end of file diff --git a/annotations_1/GgBt0TlbwUY_filtered.json b/annotations_1/GgBt0TlbwUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c63da5c7111b787eb34d6530c52aad23b1fb94de --- /dev/null +++ b/annotations_1/GgBt0TlbwUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [21.0, 21.17], [23.0, 22.92], [32.0, 37.93], [48.0, 56.34], [102.0, 105.87], [115.0, 117.1], [122.0, 131.45], [133.0, 134.79], [137.0, 137.51], [154.0, 154.04], [167.0, 167.32], [177.0, 177.11], [182.0, 181.57], [188.0, 188.38], [192.0, 192.01], [209.0, 210.69], [211.0, 211.45], [217.0, 218.51], [220.0, 219.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.42, 31.46, 30.89, 31.09, 30.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 81.63], ["scratching (performance technique)", 2.75], ["speech", 1.81]], [["music", 71.69], ["speech", 7.35], ["boing", 5.66]], [["music", 85.75], ["electronic music", 2.41], ["scratching (performance technique)", 2.14]], [["speech", 58.35], ["music", 10.3], ["electronic music", 3.91]], [["music", 57.02], ["boing", 17.36], ["groan", 3.51]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 0.17, -0.08, 5.93, 8.34, 3.87, 2.1, 9.45, 1.79, 0.51, 0.04, 0.32, 0.11, -0.43, 0.38, 0.01, 1.69, 0.45, 1.51, -0.09]} \ No newline at end of file diff --git a/annotations_1/Gh9kc9DiDnE_filtered.json b/annotations_1/Gh9kc9DiDnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48beea801c84fb351b507d68dceedfcc3028313b --- /dev/null +++ b/annotations_1/Gh9kc9DiDnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 13.31], [14.0, 40.12], [42.0, 44.41], [45.0, 45.27], [48.0, 57.55], [58.0, 61.05], [70.0, 70.77], [73.0, 73.75], [77.0, 77.52], [79.0, 79.93], [86.0, 86.81], [90.0, 90.81], [94.0, 96.25], [97.0, 98.83], [100.0, 101.8], [105.0, 105.65], [106.0, 114.08], [114.0, 114.54], [116.0, 116.77], [118.0, 118.66], [122.0, 123.65], [124.0, 131.77], [133.0, 133.39], [135.0, 140.27], [141.0, 141.34], [142.0, 142.1], [142.0, 142.13], [142.0, 142.16], [142.0, 142.45], [142.0, 142.5], [147.0, 146.92], [147.0, 146.96], [152.0, 152.58]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.67, 29.35, 52.51, 0.0, 68.41, 74.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 56.55, 0.0, 0.0, 0.0, 0.0, 31.63, 0.0, 64.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 52.61], ["throbbing", 15.82], ["hum", 8.38]], [["speech", 22.22], ["vehicle", 20.42], ["car", 6.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 25.2], ["speech", 19.43], ["smash, crash", 12.7]], null, null, null, null, null, null, null, null, null, null, null], "duration": [10.31, 26.12, 2.41, 0.27, 9.55, 3.05, 0.77, 0.75, 0.52, 0.93, 0.81, 0.81, 2.25, 1.83, 1.8, 0.65, 8.08, 0.54, 0.77, 0.66, 1.65, 7.77, 0.39, 5.27, 0.34, 0.1, 0.13, 0.16, 0.45, 0.5, -0.08, -0.04, 0.58]} \ No newline at end of file diff --git a/annotations_1/Ghexrw8bpc8_filtered.json b/annotations_1/Ghexrw8bpc8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6f86fd12933e3ace53c72e1d61edd0de39f1522 --- /dev/null +++ b/annotations_1/Ghexrw8bpc8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.87], [7.0, 8.46], [10.0, 10.62], [12.0, 12.01], [13.0, 13.36], [14.0, 14.88], [16.0, 19.77], [22.0, 23.77], [25.0, 25.27], [29.0, 32.71], [34.0, 35.21], [43.0, 47.41], [50.0, 50.45], [52.0, 53.6], [61.0, 60.94], [64.0, 66.28], [68.0, 68.01], [70.0, 70.82], [73.0, 75.12], [75.0, 77.01], [78.0, 78.92], [79.0, 80.47], [83.0, 83.22], [85.0, 87.83], [105.0, 106.12], [113.0, 113.29], [115.0, 121.02], [122.0, 123.89], [125.0, 131.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 100.0, 99.9, 0.0, 0.0, 0.0, 90.6, 0.0, 0.0, 58.38, 0.0, 99.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.13, 1.46, 0.62, 0.01, 0.36, 0.88, 3.77, 1.77, 0.27, 3.71, 1.21, 4.41, 0.45, 1.6, -0.06, 2.28, 0.01, 0.82, 2.12, 2.01, 0.92, 1.47, 0.22, 2.83, 1.12, 0.29, 6.02, 1.89, 6.65]} \ No newline at end of file diff --git a/annotations_1/Gi3K-CApAS4_filtered.json b/annotations_1/Gi3K-CApAS4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc40cb5cea7f91d4d7844bc175523e5a25a76c3b --- /dev/null +++ b/annotations_1/Gi3K-CApAS4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.45], [13.0, 27.19], [30.0, 35.26]], "keep_status": [true, false, true], "silence_prob": [47.78, 42.26, 38.16], "audiomae_on_audioset": [[["music", 54.3], ["sonar", 5.49], ["singing bowl", 5.17]], [["music", 57.39], ["ambient music", 12.28], ["electronic music", 4.91]], [["music", 47.43], ["harmonic", 10.51], ["synthesizer", 5.06]]], "duration": [7.45, 14.19, 5.26]} \ No newline at end of file diff --git a/annotations_1/Gif5ZnaOOQ8_filtered.json b/annotations_1/Gif5ZnaOOQ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/Gif5ZnaOOQ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/Gk_2euKF9MY_filtered.json b/annotations_1/Gk_2euKF9MY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58a2530d579bc137beee98ebb60526fba3357a0e --- /dev/null +++ b/annotations_1/Gk_2euKF9MY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [14.0, 15.26], [16.0, 32.48], [33.0, 34.84], [37.0, 39.45], [41.0, 42.08], [43.0, 43.98], [45.0, 47.06], [50.0, 51.48], [54.0, 67.56], [70.0, 72.08], [73.0, 73.65], [76.0, 77.06], [80.0, 80.54], [82.0, 82.83], [86.0, 92.84], [94.0, 93.82], [106.0, 106.19], [110.0, 110.2], [114.0, 114.08], [117.0, 118.22], [121.0, 130.11], [137.0, 137.46], [144.0, 144.26], [157.0, 156.74]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.79, 0.0, 44.04, 0.0, 0.0, 45.4, 0.0, 46.09, 35.12, 0.0, 0.0, 0.0, 0.0, 36.15, 0.0, 0.0, 0.0, 0.0, 0.0, 29.73, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 41.82], ["heart sounds, heartbeat", 29.0], ["throbbing", 15.01]], null, [["speech", 33.04], ["music", 31.67], ["heart murmur", 7.32]], null, null, [["heart murmur", 24.06], ["music", 17.78], ["speech", 8.6]], null, [["music", 24.26], ["speech", 7.67], ["heart murmur", 7.6]], [["music", 69.84], ["speech", 5.38], ["drum machine", 4.38]], null, null, null, null, [["music", 82.99], ["drum machine", 2.64], ["musical instrument", 1.78]], null, null, null, null, null, [["music", 89.93], ["singing", 1.52], ["song", 0.98]], null, null, null], "duration": [0.89, 1.26, 16.48, 1.84, 2.45, 1.08, 0.98, 2.06, 1.48, 13.56, 2.08, 0.65, 1.06, 0.54, 0.83, 6.84, -0.18, 0.19, 0.2, 0.08, 1.22, 9.11, 0.46, 0.26, -0.26]} \ No newline at end of file diff --git a/annotations_1/Gklme1-eQGE_filtered.json b/annotations_1/Gklme1-eQGE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd7315aa0bc1cd35f423c0359933da0172ed2fd2 --- /dev/null +++ b/annotations_1/Gklme1-eQGE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.69], [21.0, 21.76], [26.0, 27.11], [29.0, 50.87], [52.0, 70.12], [70.0, 96.52], [98.0, 98.42], [98.0, 104.53], [106.0, 110.47], [112.0, 112.87]], "keep_status": [false, false, false, true, true, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 29.31, 34.08, 33.57, 0.0, 37.73, 37.9, 0.0], "audiomae_on_audioset": [null, null, null, [["tools", 16.76], ["vehicle", 16.56], ["speech", 14.5]], [["music", 58.53], ["hum", 5.77], ["theremin", 5.55]], [["music", 61.68], ["hum", 4.8], ["electronic music", 4.23]], null, [["fly, housefly", 27.64], ["speech", 9.63], ["music", 9.08]], [["insect", 13.26], ["music", 9.47], ["fly, housefly", 9.23]], null], "duration": [0.69, 0.76, 1.11, 21.87, 18.12, 26.52, 0.42, 6.53, 4.47, 0.87]} \ No newline at end of file diff --git a/annotations_1/Gl5GVViqvjo_filtered.json b/annotations_1/Gl5GVViqvjo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b4a6aed806793dd05f2dab64f437b63da03905f --- /dev/null +++ b/annotations_1/Gl5GVViqvjo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.2], [11.0, 20.51], [23.0, 35.58], [37.0, 60.18], [61.0, 65.85], [67.0, 67.2], [68.0, 78.48], [82.0, 88.4], [93.0, 97.31], [97.0, 97.44]], "keep_status": [true, false, false, false, false, false, false, false, true, false], "silence_prob": [32.06, 32.72, 30.94, 31.52, 32.16, 0.0, 32.51, 32.21, 30.79, 0.0], "audiomae_on_audioset": [[["music", 45.74], ["theremin", 8.19], ["musical instrument", 6.93]], [["music", 76.6], ["theremin", 3.61], ["throbbing", 1.77]], [["music", 87.65], ["boing", 0.88], ["musical instrument", 0.85]], [["music", 49.01], ["speech", 15.09], ["buzz", 6.85]], [["music", 72.9], ["theremin", 5.44], ["throbbing", 2.19]], null, [["bleat", 29.3], ["music", 27.75], ["sheep", 18.53]], [["music", 70.74], ["swing music", 1.39], ["musical instrument", 1.07]], [["music", 58.73], ["boing", 5.16], ["electronic music", 3.02]], null], "duration": [5.2, 9.51, 12.58, 23.18, 4.85, 0.2, 10.48, 6.4, 4.31, 0.44]} \ No newline at end of file diff --git a/annotations_1/GlCN1EPAoHI_filtered.json b/annotations_1/GlCN1EPAoHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cde3f678c2ee0348b15a7c41a1e89749b2bbaf58 --- /dev/null +++ b/annotations_1/GlCN1EPAoHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 28.44], [29.0, 32.9], [58.0, 63.95], [65.0, 80.92], [81.0, 81.45], [84.0, 83.76], [84.0, 84.1], [85.0, 123.85], [124.0, 126.06], [128.0, 128.17], [129.0, 129.84], [130.0, 130.45], [131.0, 130.96]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [31.28, 52.33, 28.76, 28.42, 0.0, 0.0, 0.0, 0.0, 28.96, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 13.54], ["thunk", 11.37], ["whack, thwack", 10.9]], null, [["speech", 42.61], ["music", 30.12], ["electric shaver, electric razor", 8.2]], [["music", 33.32], ["throbbing", 25.3], ["hum", 9.3]], null, null, null, null, [["music", 43.62], ["throbbing", 23.19], ["hum", 6.17]], null, null, null, null], "duration": [25.44, 3.9, 5.95, 15.92, 0.45, -0.24, 0.1, 38.85, 2.06, 0.17, 0.84, 0.45, -0.04]} \ No newline at end of file diff --git a/annotations_1/GlP6emuR3z8_filtered.json b/annotations_1/GlP6emuR3z8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5039749310699659f50dfed48384e4f97eb0e19c --- /dev/null +++ b/annotations_1/GlP6emuR3z8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 25.79], [28.0, 28.81], [29.0, 29.1], [29.0, 48.02], [50.0, 50.62], [53.0, 53.97], [56.0, 73.21], [75.0, 75.49], [76.0, 95.94], [100.0, 100.03], [101.0, 123.25], [125.0, 139.45], [139.0, 140.53]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, true, false], "silence_prob": [32.73, 0.0, 0.0, 29.56, 0.0, 0.0, 30.9, 0.0, 29.72, 0.0, 30.3, 32.01, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 41.42], ["livestock, farm animals, working animals", 28.29], ["moo", 18.8]], null, null, [["music", 45.93], ["speech", 40.83], ["throbbing", 2.18]], null, null, [["hum", 32.58], ["mains hum", 18.78], ["music", 13.51]], null, [["music", 67.97], ["didgeridoo", 4.44], ["throbbing", 3.0]], null, [["music", 45.77], ["groan", 5.84], ["electric shaver, electric razor", 4.32]], [["animal", 18.13], ["music", 10.35], ["speech", 10.02]], null], "duration": [7.79, 0.81, 0.1, 19.02, 0.62, 0.97, 17.21, 0.49, 19.94, 0.03, 22.25, 14.45, 1.53]} \ No newline at end of file diff --git a/annotations_1/Gnpxe9kO_V8_filtered.json b/annotations_1/Gnpxe9kO_V8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5533755db4a586027631184e1020b24149eea718 --- /dev/null +++ b/annotations_1/Gnpxe9kO_V8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 30.45], [31.0, 31.83], [33.0, 34.74], [35.0, 37.1], [38.0, 42.08], [45.0, 45.89], [47.0, 47.93], [48.0, 48.56], [51.0, 52.22], [59.0, 65.75], [71.0, 71.29], [73.0, 74.82], [77.0, 81.38], [83.0, 84.97], [86.0, 86.37], [93.0, 94.12], [95.0, 96.28], [97.0, 100.65], [108.0, 112.23], [120.0, 128.51], [130.0, 138.15], [140.0, 140.88], [142.0, 142.59], [143.0, 143.94], [146.0, 146.35], [148.0, 148.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 96.29, 99.05, 0.0, 0.0, 0.0, 0.0, 36.28, 0.0, 0.0, 28.78, 0.0, 0.0, 0.0, 0.0, 33.59, 29.75, 32.24, 55.04, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 80.27], ["thunk", 2.27], ["fart", 1.42]], null, null, [["speech", 58.08], ["whack, thwack", 9.82], ["thump, thud", 8.49]], null, null, null, null, [["speech", 61.72], ["inside, small room", 4.68], ["fart", 3.29]], [["speech", 41.1], ["clip-clop", 11.28], ["horse", 6.41]], [["speech", 13.67], ["fart", 11.98], ["frog", 9.49]], null, null, null, null, null, null], "duration": [3.45, 0.83, 1.74, 2.1, 4.08, 0.89, 0.93, 0.56, 1.22, 6.75, 0.29, 1.82, 4.38, 1.97, 0.37, 1.12, 1.28, 3.65, 4.23, 8.51, 8.15, 0.88, 0.59, 0.94, 0.35, 0.91]} \ No newline at end of file diff --git a/annotations_1/Go55LztXeQA_filtered.json b/annotations_1/Go55LztXeQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fafa7a7e28a9bd9f86eeee0dccd89045b279a507 --- /dev/null +++ b/annotations_1/Go55LztXeQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.34], [11.0, 18.39], [24.0, 24.78], [27.0, 29.15], [35.0, 43.12], [50.0, 51.04], [52.0, 53.77], [57.0, 59.31], [60.0, 87.79], [93.0, 96.97], [98.0, 111.5]], "keep_status": [false, true, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 33.55, 0.0, 31.13, 33.4, 0.0, 0.0, 28.55, 29.99, 31.06, 29.99], "audiomae_on_audioset": [null, [["music", 13.75], ["noise", 9.04], ["hum", 6.99]], null, [["whale vocalization", 59.13], ["speech", 25.78], ["vehicle", 2.1]], [["speech", 48.51], ["music", 21.81], ["vehicle", 5.71]], null, null, [["music", 14.04], ["noise", 8.32], ["vehicle", 4.49]], [["speech", 59.87], ["animal", 6.63], ["music", 5.44]], [["livestock, farm animals, working animals", 41.62], ["cattle, bovinae", 21.24], ["moo", 20.02]], [["music", 32.59], ["buzz", 24.54], ["vehicle", 8.86]]], "duration": [0.34, 7.39, 0.78, 2.15, 8.12, 1.04, 1.77, 2.31, 27.79, 3.97, 13.5]} \ No newline at end of file diff --git a/annotations_1/GpLeHrROqRE_filtered.json b/annotations_1/GpLeHrROqRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11b5c512e1a080c6e72e982d4d3bce12477438e4 --- /dev/null +++ b/annotations_1/GpLeHrROqRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.28], [21.0, 21.56], [23.0, 25.78], [27.0, 28.46], [43.0, 46.58], [47.0, 61.32], [66.0, 67.0], [71.0, 71.29], [71.0, 71.83], [73.0, 80.5], [83.0, 91.66], [94.0, 96.82], [103.0, 103.55], [106.0, 108.63]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 76.7, 0.0, 96.42, 45.27, 0.0, 0.0, 0.0, 34.45, 30.95, 33.08, 0.0, 39.66], "audiomae_on_audioset": [null, null, null, null, null, [["music", 36.64], ["livestock, farm animals, working animals", 7.57], ["animal", 5.65]], null, null, null, [["moo", 33.97], ["livestock, farm animals, working animals", 31.93], ["cattle, bovinae", 27.78]], [["cattle, bovinae", 38.83], ["livestock, farm animals, working animals", 33.53], ["moo", 26.17]], [["cattle, bovinae", 37.85], ["moo", 35.67], ["livestock, farm animals, working animals", 16.06]], null, [["music", 65.34], ["thunk", 8.21], ["synthesizer", 2.97]]], "duration": [0.28, 0.56, 2.78, 1.46, 3.58, 14.32, 1.0, 0.29, 0.83, 7.5, 8.66, 2.82, 0.55, 2.63]} \ No newline at end of file diff --git a/annotations_1/Gq43zgK0T94_filtered.json b/annotations_1/Gq43zgK0T94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f261ec863853603b4714e998318993ab12a0a44 --- /dev/null +++ b/annotations_1/Gq43zgK0T94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.67], [16.0, 35.06], [40.0, 40.58], [45.0, 45.93], [55.0, 63.68], [66.0, 67.39], [68.0, 70.56], [78.0, 81.85]], "keep_status": [false, false, false, false, true, false, true, false], "silence_prob": [0.0, 43.3, 0.0, 0.0, 32.64, 0.0, 34.24, 80.64], "audiomae_on_audioset": [null, [["music", 63.2], ["electronic music", 3.65], ["electric shaver, electric razor", 3.6]], null, null, [["music", 35.49], ["buzz", 12.75], ["fart", 5.78]], null, [["music", 34.87], ["speech", 14.61], ["singing", 5.75]], null], "duration": [0.67, 19.06, 0.58, 0.93, 8.68, 1.39, 2.56, 3.85]} \ No newline at end of file diff --git a/annotations_1/GqGPu-X3cv8_filtered.json b/annotations_1/GqGPu-X3cv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c56e22bb231f6d30bb6991c8f4ba99d27452e9f --- /dev/null +++ b/annotations_1/GqGPu-X3cv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.44], [16.0, 16.19], [33.0, 33.22], [46.0, 46.47], [52.0, 52.41], [55.0, 56.05], [69.0, 69.92], [92.0, 97.41], [99.0, 102.02], [113.0, 113.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.06, 30.23, 0.0], "audiomae_on_audioset": [[["music", 37.69], ["speech", 33.68], ["hum", 10.65]], null, null, null, null, null, null, [["music", 68.48], ["boing", 4.67], ["musical instrument", 2.43]], [["music", 70.91], ["electronic music", 6.11], ["hum", 4.3]], null], "duration": [6.44, 0.19, 0.22, 0.47, 0.41, 1.05, 0.92, 5.41, 3.02, 0.54]} \ No newline at end of file diff --git a/annotations_1/Gqa-biM6qKM_filtered.json b/annotations_1/Gqa-biM6qKM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c327bc3e4573701291b86496e90e695f434a9dc --- /dev/null +++ b/annotations_1/Gqa-biM6qKM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.17], [23.0, 26.65], [28.0, 36.39], [37.0, 38.5], [40.0, 40.15], [42.0, 70.53], [72.0, 79.61], [81.0, 175.42], [177.0, 192.74], [194.0, 196.94]], "keep_status": [false, true, false, false, false, true, true, false, true, true], "silence_prob": [0.0, 28.82, 28.41, 0.0, 0.0, 28.53, 29.64, 0.0, 28.21, 28.32], "audiomae_on_audioset": [null, [["throbbing", 14.04], ["music", 12.9], ["hum", 10.53]], [["speech", 62.66], ["fart", 5.05], ["rumble", 4.26]], null, null, [["noise", 60.42], ["whale vocalization", 5.1], ["livestock, farm animals, working animals", 3.23]], [["noise", 22.3], ["rumble", 13.69], ["hum", 13.29]], null, [["buzz", 23.82], ["noise", 15.09], ["white noise", 13.85]], [["rumble", 23.33], ["speech", 18.06], ["hum", 7.2]]], "duration": [1.17, 3.65, 8.39, 1.5, 0.15, 28.53, 7.61, 94.42, 15.74, 2.94]} \ No newline at end of file diff --git a/annotations_1/Gr-s1mxnwM0_filtered.json b/annotations_1/Gr-s1mxnwM0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fa3a54825219d94e3cd36982f1de75c19934f15 --- /dev/null +++ b/annotations_1/Gr-s1mxnwM0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.37], [13.0, 13.69], [15.0, 19.48], [32.0, 35.97], [37.0, 38.06], [40.0, 43.61], [46.0, 60.72], [63.0, 63.34], [70.0, 72.45], [73.0, 74.65], [86.0, 87.18], [90.0, 90.51], [92.0, 96.33], [97.0, 101.28], [102.0, 103.06], [104.0, 104.87], [105.0, 116.83], [117.0, 118.88], [122.0, 122.34], [123.0, 126.62], [127.0, 128.02], [134.0, 139.68], [140.0, 141.39], [142.0, 146.33], [147.0, 163.46], [166.0, 170.46], [172.0, 173.08], [178.0, 181.43], [190.0, 192.18]], "keep_status": [true, false, true, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, true, false, false, true], "silence_prob": [34.44, 0.0, 37.43, 40.75, 0.0, 80.82, 38.59, 0.0, 42.04, 0.0, 0.0, 0.0, 43.2, 90.08, 0.0, 0.0, 42.67, 0.0, 0.0, 40.57, 0.0, 40.36, 0.0, 39.34, 76.04, 41.83, 0.0, 77.2, 30.35], "audiomae_on_audioset": [[["boing", 23.18], ["speech", 10.58], ["echo", 9.15]], null, [["music", 21.53], ["crack", 12.16], ["crushing", 10.97]], [["music", 25.74], ["thunk", 10.37], ["effects unit", 9.58]], null, null, [["hum", 31.94], ["mains hum", 15.59], ["thunk", 9.25]], null, [["throbbing", 30.81], ["hum", 26.71], ["mains hum", 20.4]], null, null, null, [["music", 39.84], ["hum", 9.83], ["musical instrument", 7.25]], null, null, null, [["speech", 59.34], ["music", 17.64], ["crack", 6.66]], null, null, [["speech", 43.72], ["thunk", 25.94], ["music", 5.7]], null, [["music", 20.09], ["hum", 16.47], ["throbbing", 13.79]], null, [["speech", 33.96], ["throbbing", 12.11], ["didgeridoo", 9.55]], null, [["music", 22.49], ["hum", 19.02], ["synthesizer", 12.75]], null, null, [["livestock, farm animals, working animals", 22.84], ["moo", 19.5], ["cattle, bovinae", 15.7]]], "duration": [9.37, 0.69, 4.48, 3.97, 1.06, 3.61, 14.72, 0.34, 2.45, 1.65, 1.18, 0.51, 4.33, 4.28, 1.06, 0.87, 11.83, 1.88, 0.34, 3.62, 1.02, 5.68, 1.39, 4.33, 16.46, 4.46, 1.08, 3.43, 2.18]} \ No newline at end of file diff --git a/annotations_1/GrCmVFX9tyQ_filtered.json b/annotations_1/GrCmVFX9tyQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..396ed46414b269a71fd38f7e510ad1dacad0c981 --- /dev/null +++ b/annotations_1/GrCmVFX9tyQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.55], [4.0, 5.24], [6.0, 7.52], [9.0, 13.49], [15.0, 17.71], [20.0, 20.51], [23.0, 23.52], [24.0, 24.46], [25.0, 26.33], [28.0, 28.17], [30.0, 30.01], [31.0, 31.51], [34.0, 34.74], [36.0, 36.07], [40.0, 40.59], [44.0, 46.16], [47.0, 47.76], [49.0, 49.76], [50.0, 50.99], [52.0, 52.68], [53.0, 53.37], [54.0, 54.63], [55.0, 56.27], [59.0, 59.49], [61.0, 60.81], [62.0, 61.96], [68.0, 69.7], [73.0, 74.19], [78.0, 79.17], [80.0, 80.84], [88.0, 88.18], [89.0, 88.89], [96.0, 97.29], [98.0, 99.05], [100.0, 100.18], [101.0, 104.46], [111.0, 111.16], [117.0, 118.02], [119.0, 120.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.76, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.2, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 88.76], ["thunk", 2.07], ["telephone", 0.99]], null, null, null], "duration": [0.55, 1.24, 1.52, 4.49, 2.71, 0.51, 0.52, 0.46, 1.33, 0.17, 0.01, 0.51, 0.74, 0.07, 0.59, 2.16, 0.76, 0.76, 0.99, 0.68, 0.37, 0.63, 1.27, 0.49, -0.19, -0.04, 1.7, 1.19, 1.17, 0.84, 0.18, -0.11, 1.29, 1.05, 0.18, 3.46, 0.16, 1.02, 1.14]} \ No newline at end of file diff --git a/annotations_1/GrIJLWISdlQ_filtered.json b/annotations_1/GrIJLWISdlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/GrIJLWISdlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/GtSNSaW9IRI_filtered.json b/annotations_1/GtSNSaW9IRI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..911f2d2a3040d74383d1a2fbc06d541d5e4aacb9 --- /dev/null +++ b/annotations_1/GtSNSaW9IRI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 50.73], [52.0, 54.58], [55.0, 136.97], [137.0, 138.86], [139.0, 141.13], [142.0, 143.01]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 28.48, 0.0, 0.0, 28.65, 0.0], "audiomae_on_audioset": [null, [["music", 77.8], ["speech", 5.54], ["throbbing", 2.18]], null, null, [["speech", 56.5], ["music", 15.12], ["burst, pop", 2.63]], null], "duration": [47.73, 2.58, 81.97, 1.86, 2.13, 1.01]} \ No newline at end of file diff --git a/annotations_1/GtqIqWKdlD4_filtered.json b/annotations_1/GtqIqWKdlD4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ae450f0fa4a546dc44344504f19f1dd59662eb3 --- /dev/null +++ b/annotations_1/GtqIqWKdlD4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 10.77], [13.0, 21.96], [25.0, 25.51], [26.0, 29.29], [33.0, 33.45], [36.0, 38.47], [40.0, 40.05], [42.0, 43.46], [47.0, 47.17], [49.0, 49.72], [52.0, 55.21], [57.0, 59.9], [62.0, 63.19], [64.0, 64.3], [66.0, 79.74], [81.0, 81.68], [82.0, 82.51], [83.0, 83.57], [84.0, 84.75], [86.0, 86.88], [88.0, 88.75], [92.0, 92.23], [95.0, 96.4], [97.0, 99.64], [100.0, 101.06], [105.0, 105.49], [106.0, 106.24], [109.0, 109.21], [112.0, 111.82], [122.0, 122.88], [124.0, 131.87], [134.0, 137.05], [139.0, 139.94], [141.0, 141.76], [142.0, 154.45], [158.0, 158.72], [163.0, 163.95], [165.0, 165.13]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, false, true, false, false, false], "silence_prob": [34.02, 70.3, 0.0, 44.96, 0.0, 94.95, 0.0, 0.0, 0.0, 0.0, 32.61, 35.41, 0.0, 0.0, 29.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.52, 39.89, 0.0, 0.0, 35.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 48.55], ["insect", 19.82], ["speech", 13.6]], null, null, [["music", 50.36], ["musical instrument", 6.75], ["drum", 6.5]], null, null, null, null, null, null, [["speech", 29.92], ["throbbing", 9.04], ["hum", 7.67]], [["music", 48.87], ["speech", 19.0], ["hum", 8.2]], null, null, [["hum", 30.64], ["vehicle", 15.93], ["speech", 15.66]], null, null, null, null, null, null, null, null, [["hum", 28.95], ["music", 21.35], ["throbbing", 18.43]], null, null, null, null, null, null, [["whack, thwack", 19.55], ["fly, housefly", 11.64], ["music", 9.13]], [["hum", 28.83], ["speech", 19.04], ["music", 12.25]], null, null, [["music", 58.53], ["electronic music", 6.39], ["hum", 5.06]], null, null, null], "duration": [10.77, 8.96, 0.51, 3.29, 0.45, 2.47, 0.05, 1.46, 0.17, 0.72, 3.21, 2.9, 1.19, 0.3, 13.74, 0.68, 0.51, 0.57, 0.75, 0.88, 0.75, 0.23, 1.4, 2.64, 1.06, 0.49, 0.24, 0.21, -0.18, 0.88, 7.87, 3.05, 0.94, 0.76, 12.45, 0.72, 0.95, 0.13]} \ No newline at end of file diff --git a/annotations_1/GuAHdW8FdLs_filtered.json b/annotations_1/GuAHdW8FdLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2578b820f1525300396baf10629956079d7a69a4 --- /dev/null +++ b/annotations_1/GuAHdW8FdLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.84], [12.0, 12.34], [17.0, 18.57], [22.0, 23.38], [29.0, 30.03], [31.0, 32.98], [34.0, 35.11], [36.0, 36.32], [37.0, 38.43], [41.0, 41.47], [44.0, 44.25], [48.0, 48.96], [50.0, 50.89], [52.0, 52.25], [53.0, 53.6], [55.0, 55.38], [63.0, 64.67], [73.0, 74.34], [82.0, 83.64], [85.0, 85.33], [86.0, 86.27], [88.0, 90.14], [91.0, 93.16], [96.0, 96.3], [97.0, 97.92], [99.0, 99.54], [101.0, 103.69], [105.0, 105.8], [107.0, 107.52], [108.0, 110.57], [113.0, 136.97], [138.0, 139.73], [140.0, 143.77], [144.0, 144.49], [152.0, 152.05], [154.0, 157.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15, 99.9, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 42.88, 52.33, 0.0, 43.79, 0.0, 0.0, 66.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.62], ["didgeridoo", 5.73], ["speech", 3.66]], null, null, [["music", 32.82], ["didgeridoo", 26.7], ["speech", 8.79]], null, null, null], "duration": [1.84, 0.34, 1.57, 1.38, 1.03, 1.98, 1.11, 0.32, 1.43, 0.47, 0.25, 0.96, 0.89, 0.25, 0.6, 0.38, 1.67, 1.34, 1.64, 0.33, 0.27, 2.14, 2.16, 0.3, 0.92, 0.54, 2.69, 0.8, 0.52, 2.57, 23.97, 1.73, 3.77, 0.49, 0.05, 3.25]} \ No newline at end of file diff --git a/annotations_1/GuqCibVW5wo_filtered.json b/annotations_1/GuqCibVW5wo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..387b5721ca41bb2c4ad5ea64d659f870236b9a1f --- /dev/null +++ b/annotations_1/GuqCibVW5wo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.58], [6.0, 6.29], [9.0, 9.81], [15.0, 18.72], [19.0, 21.79], [22.0, 23.13], [23.0, 24.41], [25.0, 34.8], [38.0, 39.39], [41.0, 41.2], [42.0, 42.72], [45.0, 48.56], [55.0, 58.5], [66.0, 68.62], [70.0, 70.83], [73.0, 76.82], [78.0, 80.81], [84.0, 87.54], [93.0, 98.49], [100.0, 105.44], [106.0, 105.85], [106.0, 105.95]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 56.4, 41.5, 0.0, 0.0, 32.87, 0.0, 0.0, 0.0, 29.21, 28.54, 32.36, 0.0, 30.01, 32.29, 35.15, 67.0, 40.34, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 34.14], ["speech", 15.0], ["scary music", 11.03]], null, null, [["music", 34.32], ["speech", 20.01], ["theremin", 15.01]], null, null, null, [["music", 53.4], ["speech", 26.93], ["hum", 5.19]], [["music", 34.74], ["speech", 22.37], ["static", 11.5]], [["music", 66.58], ["hum", 5.07], ["mains hum", 3.2]], null, [["music", 38.92], ["didgeridoo", 9.39], ["mains hum", 6.22]], [["music", 66.53], ["throbbing", 6.32], ["electronic music", 3.12]], [["music", 46.11], ["didgeridoo", 4.83], ["electronic music", 3.16]], null, [["music", 31.35], ["singing bowl", 25.74], ["theremin", 17.91]], null, null], "duration": [1.58, 0.29, 0.81, 3.72, 2.79, 1.13, 1.41, 9.8, 1.39, 0.2, 0.72, 3.56, 3.5, 2.62, 0.83, 3.82, 2.81, 3.54, 5.49, 5.44, -0.15, -0.05]} \ No newline at end of file diff --git a/annotations_1/GuqaloLJNJk_filtered.json b/annotations_1/GuqaloLJNJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d6f7b9e9ba1c4914da188968d496a2c42226264 --- /dev/null +++ b/annotations_1/GuqaloLJNJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.19], [6.0, 8.58], [13.0, 26.81], [28.0, 30.4], [31.0, 34.23], [37.0, 44.86], [45.0, 48.47], [51.0, 57.2], [60.0, 72.74], [73.0, 74.31], [76.0, 79.54], [82.0, 115.16], [116.0, 117.32], [119.0, 119.52], [124.0, 125.27], [127.0, 127.26], [130.0, 130.1]], "keep_status": [false, true, true, true, false, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.59, 28.5, 29.25, 28.49, 28.38, 28.38, 28.18, 28.26, 0.0, 28.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 30.97], ["throbbing", 17.24], ["hum", 13.07]], [["breaking", 39.79], ["music", 11.63], ["speech", 8.58]], [["speech", 24.56], ["throbbing", 16.93], ["music", 15.51]], [["breaking", 57.1], ["smash, crash", 9.91], ["music", 6.56]], [["hum", 31.58], ["mains hum", 18.42], ["throbbing", 15.18]], [["speech", 67.73], ["music", 8.59], ["explosion", 4.07]], [["throbbing", 46.2], ["hum", 24.94], ["music", 9.73]], [["speech", 33.73], ["breaking", 8.19], ["music", 7.88]], null, [["hum", 43.69], ["mains hum", 22.42], ["throbbing", 14.12]], null, null, null, null, null, null], "duration": [0.19, 2.58, 13.81, 2.4, 3.23, 7.86, 3.47, 6.2, 12.74, 1.31, 3.54, 33.16, 1.32, 0.52, 1.27, 0.26, 0.1]} \ No newline at end of file diff --git a/annotations_1/GusR6qF81kc_filtered.json b/annotations_1/GusR6qF81kc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e368cd44b6dcdbfdbcf2e97a36f7eed9f3f07adc --- /dev/null +++ b/annotations_1/GusR6qF81kc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.89], [19.0, 21.22], [24.0, 34.01], [37.0, 42.72], [46.0, 53.77], [58.0, 62.13], [63.0, 73.28], [75.0, 75.37], [78.0, 78.56], [80.0, 88.79], [90.0, 93.75], [96.0, 96.96], [98.0, 99.13], [106.0, 109.0], [120.0, 120.63]], "keep_status": [true, true, false, false, true, true, true, false, false, true, false, false, false, true, false], "silence_prob": [33.82, 35.18, 32.14, 33.12, 33.15, 31.43, 31.76, 0.0, 0.0, 30.56, 30.48, 0.0, 0.0, 29.97, 0.0], "audiomae_on_audioset": [[["music", 25.62], ["speech", 20.39], ["musical instrument", 3.7]], [["music", 34.55], ["wind instrument, woodwind instrument", 11.68], ["speech", 10.44]], [["mains hum", 39.3], ["hum", 23.17], ["music", 16.45]], [["mains hum", 43.08], ["hum", 40.08], ["electric shaver, electric razor", 4.43]], [["music", 20.34], ["theremin", 14.93], ["hum", 7.22]], [["music", 46.71], ["theremin", 10.78], ["electronic music", 3.8]], [["music", 54.79], ["musical instrument", 9.49], ["speech", 1.81]], null, null, [["music", 23.33], ["organ", 16.72], ["keyboard (musical)", 11.08]], [["theremin", 38.76], ["music", 36.59], ["synthesizer", 4.1]], null, null, [["speech", 29.14], ["buzzer", 21.94], ["electric shaver, electric razor", 6.24]], null], "duration": [4.89, 2.22, 10.01, 5.72, 7.77, 4.13, 10.28, 0.37, 0.56, 8.79, 3.75, 0.96, 1.13, 3.0, 0.63]} \ No newline at end of file diff --git a/annotations_1/GvDcscZXfl8_filtered.json b/annotations_1/GvDcscZXfl8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9bfc7d1e2295abd0cbd8a384e68d9c42d1d9b68 --- /dev/null +++ b/annotations_1/GvDcscZXfl8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 41.12], [53.0, 53.7], [55.0, 55.56], [57.0, 57.62], [67.0, 66.9], [75.0, 76.4], [77.0, 79.27], [89.0, 90.9], [97.0, 99.59], [100.0, 102.14], [106.0, 107.92], [109.0, 109.68], [111.0, 113.34], [115.0, 126.55], [127.0, 127.94]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.62, 0.0, 71.87, 73.82, 0.0, 0.0, 69.34, 39.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 14.59], ["wind instrument, woodwind instrument", 10.6], ["music", 8.79]], null, null, null, null, null, null, [["music", 35.24], ["speech", 23.04], ["musical instrument", 8.28]], null], "duration": [0.12, 0.7, 0.56, 0.62, -0.1, 1.4, 2.27, 1.9, 2.59, 2.14, 1.92, 0.68, 2.34, 11.55, 0.94]} \ No newline at end of file diff --git a/annotations_1/GvHBefStM7o_filtered.json b/annotations_1/GvHBefStM7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a6ebf4fb0410bc6bcc983e64dd67b655c3515ba --- /dev/null +++ b/annotations_1/GvHBefStM7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 29.61], [30.0, 31.38], [33.0, 33.47], [36.0, 36.19], [37.0, 38.3], [40.0, 46.28], [52.0, 52.12], [54.0, 54.09], [57.0, 58.02], [60.0, 97.78], [101.0, 102.95], [104.0, 112.92], [115.0, 115.4], [117.0, 117.8], [121.0, 121.1], [124.0, 124.9], [126.0, 129.57], [130.0, 131.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.46, 0.0, 0.0, 0.0, 0.0, 0.0, 53.04, 0.0, 0.0, 0.0, 0.0, 65.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 87.02], ["throbbing", 2.31], ["hum", 2.18]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 1.38, 0.47, 0.19, 1.3, 6.28, 0.12, 0.09, 1.02, 37.78, 1.95, 8.92, 0.4, 0.8, 0.1, 0.9, 3.57, 1.41]} \ No newline at end of file diff --git a/annotations_1/GwdgbTQ5cgU_filtered.json b/annotations_1/GwdgbTQ5cgU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf1394c9f3bf17e17535dbb7ed06e15225c52e35 --- /dev/null +++ b/annotations_1/GwdgbTQ5cgU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 68.27], [69.0, 69.9], [76.0, 78.85], [86.0, 118.64], [124.0, 142.38], [147.0, 158.11], [163.0, 163.34]], "keep_status": [false, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 33.66, 0.0, 31.11, 32.31, 0.0], "audiomae_on_audioset": [null, null, [["music", 23.97], ["whale vocalization", 5.85], ["hum", 5.56]], null, [["music", 62.95], ["musical instrument", 3.73], ["brass instrument", 3.09]], [["speech", 33.26], ["vehicle", 10.98], ["car", 10.89]], null], "duration": [54.27, 0.9, 2.85, 32.64, 18.38, 11.11, 0.34]} \ No newline at end of file diff --git a/annotations_1/GwtcfnmV68I_filtered.json b/annotations_1/GwtcfnmV68I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a24b2027765f43fe1ad8c19801495d8f639c1536 --- /dev/null +++ b/annotations_1/GwtcfnmV68I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.67], [18.0, 18.25], [19.0, 20.29], [22.0, 25.12], [28.0, 29.49], [36.0, 40.85], [41.0, 40.88], [41.0, 40.96], [41.0, 42.62], [44.0, 48.02], [49.0, 49.74], [54.0, 54.82], [55.0, 56.12], [57.0, 58.01], [58.0, 65.15], [66.0, 67.8], [69.0, 70.53], [73.0, 73.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 58.13, 0.0, 57.17, 0.0, 0.0, 0.0, 61.18, 0.0, 0.0, 0.0, 0.0, 81.71, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.67, 0.25, 1.29, 3.12, 1.49, 4.85, -0.12, -0.04, 1.62, 4.02, 0.74, 0.82, 1.12, 1.01, 7.15, 1.8, 1.53, 0.04]} \ No newline at end of file diff --git a/annotations_1/GwvrEz7vTZY_filtered.json b/annotations_1/GwvrEz7vTZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c58972daebbfda26eb96dbdfff65b1cb73040f3 --- /dev/null +++ b/annotations_1/GwvrEz7vTZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.38], [7.0, 11.08], [14.0, 17.36], [21.0, 22.33], [23.0, 25.71], [35.0, 36.41], [37.0, 37.89], [38.0, 39.01], [43.0, 44.78], [45.0, 45.66], [48.0, 53.18], [58.0, 58.01], [64.0, 66.39], [76.0, 78.11], [81.0, 84.32], [85.0, 85.46], [87.0, 89.94], [94.0, 97.23], [99.0, 99.39], [111.0, 111.64], [117.0, 119.47], [121.0, 126.42], [129.0, 133.27], [136.0, 137.2], [143.0, 144.54], [145.0, 150.15], [151.0, 151.43], [155.0, 156.81], [158.0, 164.44], [168.0, 172.22], [174.0, 175.17]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 35.05, 36.5, 0.0, 41.85, 0.0, 0.0, 0.0, 0.0, 0.0, 34.73, 0.0, 37.53, 38.83, 35.99, 0.0, 30.92, 30.73, 0.0, 0.0, 38.31, 37.77, 31.87, 0.0, 0.0, 30.98, 0.0, 0.0, 32.44, 38.22, 0.0], "audiomae_on_audioset": [null, [["music", 64.77], ["didgeridoo", 13.38], ["effects unit", 2.55]], [["music", 43.34], ["singing", 5.08], ["frog", 4.07]], null, [["music", 57.3], ["french horn", 10.68], ["musical instrument", 9.64]], null, null, null, null, null, [["music", 78.95], ["theremin", 2.21], ["musical instrument", 1.79]], null, [["music", 41.84], ["musical instrument", 15.51], ["theremin", 14.1]], [["music", 55.74], ["musical instrument", 13.56], ["brass instrument", 8.25]], [["music", 79.22], ["singing", 3.13], ["musical instrument", 2.95]], null, [["music", 46.04], ["theremin", 25.43], ["cello", 3.22]], [["music", 77.6], ["singing", 2.41], ["classical music", 1.88]], null, null, [["music", 66.44], ["musical instrument", 3.27], ["theremin", 3.25]], [["music", 69.17], ["didgeridoo", 4.07], ["musical instrument", 3.65]], [["music", 43.94], ["theremin", 5.05], ["piano", 3.8]], null, null, [["music", 71.8], ["chant", 3.51], ["singing", 3.25]], null, null, [["music", 48.72], ["wind instrument, woodwind instrument", 11.02], ["musical instrument", 9.13]], [["music", 49.3], ["singing bowl", 13.25], ["ambient music", 6.5]], null], "duration": [0.38, 4.08, 3.36, 1.33, 2.71, 1.41, 0.89, 1.01, 1.78, 0.66, 5.18, 0.01, 2.39, 2.11, 3.32, 0.46, 2.94, 3.23, 0.39, 0.64, 2.47, 5.42, 4.27, 1.2, 1.54, 5.15, 0.43, 1.81, 6.44, 4.22, 1.17]} \ No newline at end of file diff --git a/annotations_1/Gx1K7ynF1JM_filtered.json b/annotations_1/Gx1K7ynF1JM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7094027523dc6749fd7630cc0d1b1acfd33c22ab --- /dev/null +++ b/annotations_1/Gx1K7ynF1JM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.98], [14.0, 17.46], [30.0, 33.83], [49.0, 49.87], [51.0, 53.59], [54.0, 54.03], [55.0, 57.7], [59.0, 59.37], [62.0, 62.48], [63.0, 63.24], [64.0, 65.92], [67.0, 67.76], [70.0, 70.43], [72.0, 71.91], [73.0, 72.87], [74.0, 74.12], [74.0, 75.0], [75.0, 75.61], [76.0, 77.79], [80.0, 81.33], [90.0, 93.61], [98.0, 99.42], [107.0, 107.1], [107.0, 118.57], [119.0, 135.46], [136.0, 141.4], [142.0, 172.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.95, 52.62, 0.0, 95.64, 0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.44, 0.0, 0.0, 31.71, 31.29, 31.41, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 69.49], ["middle eastern music", 3.31], ["singing", 2.06]], null, null, [["music", 77.6], ["swing music", 8.29], ["funny music", 1.04]], [["music", 63.13], ["boing", 5.02], ["didgeridoo", 4.08]], [["music", 70.33], ["yodeling", 5.04], ["swing music", 2.99]], null], "duration": [-0.02, 3.46, 3.83, 0.87, 2.59, 0.03, 2.7, 0.37, 0.48, 0.24, 1.92, 0.76, 0.43, -0.09, -0.13, 0.12, 1.0, 0.61, 1.79, 1.33, 3.61, 1.42, 0.1, 11.57, 16.46, 5.4, 30.91]} \ No newline at end of file diff --git a/annotations_1/GylxYHpdxVQ_filtered.json b/annotations_1/GylxYHpdxVQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bbe08db33402c4a79d601639427d4987feeb883 --- /dev/null +++ b/annotations_1/GylxYHpdxVQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.76], [7.0, 15.48], [17.0, 17.78], [20.0, 26.5], [28.0, 29.29], [31.0, 31.18], [33.0, 33.69], [36.0, 51.75], [53.0, 74.61], [75.0, 77.31], [78.0, 82.88], [86.0, 116.63], [117.0, 124.01], [128.0, 129.3], [132.0, 133.24], [135.0, 139.04], [141.0, 142.01], [144.0, 151.41]], "keep_status": [false, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true], "silence_prob": [55.04, 48.74, 0.0, 66.63, 0.0, 0.0, 0.0, 35.32, 46.68, 65.32, 72.31, 0.0, 48.27, 0.0, 0.0, 51.02, 0.0, 42.88], "audiomae_on_audioset": [null, [["fly, housefly", 22.51], ["bee, wasp, etc.", 21.27], ["hum", 14.16]], null, null, null, null, null, [["speech", 31.73], ["whack, thwack", 9.39], ["hum", 5.77]], [["music", 60.87], ["gong", 3.91], ["electronic music", 1.59]], null, null, null, [["hum", 32.47], ["throbbing", 26.24], ["speech", 22.85]], null, null, null, null, [["music", 39.31], ["throbbing", 8.35], ["electronic music", 7.71]]], "duration": [4.76, 8.48, 0.78, 6.5, 1.29, 0.18, 0.69, 15.75, 21.61, 2.31, 4.88, 30.63, 7.01, 1.3, 1.24, 4.04, 1.01, 7.41]} \ No newline at end of file diff --git a/annotations_1/GzL4f-4uQVM_filtered.json b/annotations_1/GzL4f-4uQVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac5fe55d2fbde07ff90cae2ca1e9d4e4da3aaf93 --- /dev/null +++ b/annotations_1/GzL4f-4uQVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.23], [16.0, 16.36], [18.0, 18.13], [18.0, 19.26], [20.0, 20.92], [24.0, 24.09], [32.0, 32.26], [38.0, 38.72], [41.0, 41.57], [42.0, 42.7], [51.0, 51.14], [55.0, 63.91], [65.0, 67.78], [71.0, 71.58], [72.0, 73.63], [79.0, 80.96], [84.0, 86.21], [89.0, 89.45], [90.0, 90.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 78.04, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.23, 0.36, 0.13, 1.26, 0.92, 0.09, 0.26, 0.72, 0.57, 0.7, 0.14, 8.91, 2.78, 0.58, 1.63, 1.96, 2.21, 0.45, 0.02]} \ No newline at end of file diff --git a/annotations_1/GzMBisWrn_M_filtered.json b/annotations_1/GzMBisWrn_M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..903d52aec9cfe70a310fd31efd6089673bf35119 --- /dev/null +++ b/annotations_1/GzMBisWrn_M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 18.55], [23.0, 25.29], [26.0, 30.1], [31.0, 33.3], [37.0, 41.2], [47.0, 46.99], [48.0, 51.85], [52.0, 53.54], [56.0, 56.76], [59.0, 60.76], [65.0, 68.94], [73.0, 73.03], [87.0, 89.01], [94.0, 96.35], [99.0, 98.85], [100.0, 100.62], [102.0, 101.88], [107.0, 106.74], [108.0, 108.97], [116.0, 117.61], [120.0, 121.12], [122.0, 123.62], [134.0, 142.1], [144.0, 145.96], [149.0, 151.8], [153.0, 154.53], [156.0, 160.05], [164.0, 165.37]], "keep_status": [false, true, true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [89.19, 46.54, 40.57, 82.43, 36.5, 0.0, 75.55, 0.0, 0.0, 0.0, 71.43, 0.0, 90.78, 32.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.62, 0.0, 97.64, 0.0, 91.64, 0.0], "audiomae_on_audioset": [null, [["music", 18.79], ["hum", 13.76], ["throbbing", 12.86]], [["fly, housefly", 11.3], ["crushing", 9.06], ["noise", 4.29]], null, [["speech", 43.91], ["throbbing", 9.02], ["hum", 8.62]], null, null, null, null, null, null, null, null, [["rumble", 30.69], ["skateboard", 25.68], ["thunk", 5.11]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.55, 2.29, 4.1, 2.3, 4.2, -0.01, 3.85, 1.54, 0.76, 1.76, 3.94, 0.03, 2.01, 2.35, -0.15, 0.62, -0.12, -0.26, 0.97, 1.61, 1.12, 1.62, 8.1, 1.96, 2.8, 1.53, 4.05, 1.37]} \ No newline at end of file diff --git a/annotations_1/H-Mr-QmgheY_filtered.json b/annotations_1/H-Mr-QmgheY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a6e8cfc80f093ab6dba37c15d5ff301a0f9a4d7 --- /dev/null +++ b/annotations_1/H-Mr-QmgheY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.17], [21.0, 21.66], [26.0, 32.46], [38.0, 43.39], [48.0, 49.42], [52.0, 63.41], [64.0, 69.55], [71.0, 71.04], [71.0, 72.52], [73.0, 83.93], [85.0, 94.36], [97.0, 104.87], [106.0, 106.49], [109.0, 110.05], [112.0, 113.31], [114.0, 117.95], [119.0, 121.61], [131.0, 132.04], [133.0, 134.49]], "keep_status": [false, false, true, true, false, false, true, false, false, true, true, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 29.62, 28.94, 0.0, 28.93, 29.59, 0.0, 0.0, 38.42, 42.96, 42.48, 0.0, 0.0, 0.0, 48.06, 48.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["fly, housefly", 19.0], ["speech", 14.72], ["buzz", 13.26]], [["fly, housefly", 34.77], ["mosquito", 20.25], ["insect", 7.5]], null, [["speech", 36.88], ["music", 27.94], ["hum", 6.96]], [["music", 25.15], ["throbbing", 22.65], ["speech", 17.36]], null, null, [["animal", 19.59], ["horse", 6.64], ["oink", 5.59]], [["rain on surface", 22.13], ["fly, housefly", 13.38], ["rain", 9.9]], [["fly, housefly", 33.42], ["insect", 11.66], ["hum", 7.2]], null, null, null, [["hum", 18.44], ["throbbing", 17.98], ["music", 6.37]], [["frog", 17.84], ["rain on surface", 12.78], ["rain", 9.83]], null, null], "duration": [1.17, 0.66, 6.46, 5.39, 1.42, 11.41, 5.55, 0.04, 1.52, 10.93, 9.36, 7.87, 0.49, 1.05, 1.31, 3.95, 2.61, 1.04, 1.49]} \ No newline at end of file diff --git a/annotations_1/H1IhRMtTUno_filtered.json b/annotations_1/H1IhRMtTUno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1fa939bc5bec3d1627fefffa83d59820b743cffa --- /dev/null +++ b/annotations_1/H1IhRMtTUno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.03], [18.0, 18.81], [21.0, 21.39], [22.0, 22.5], [27.0, 27.3], [38.0, 38.1], [42.0, 43.6], [62.0, 67.8], [69.0, 69.25], [71.0, 70.88], [72.0, 74.14], [103.0, 103.82], [118.0, 119.69], [120.0, 122.34], [123.0, 123.62], [134.0, 135.67], [141.0, 142.16], [144.0, 144.22], [149.0, 149.0], [152.0, 153.3], [154.0, 155.12], [157.0, 157.01], [159.0, 160.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 0.0, 0.0, 91.81, 0.0, 0.0, 45.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 78.03], ["male speech, man speaking", 3.92], ["narration, monologue", 2.49]], null, null, null, null, null, null, null, null, null], "duration": [1.03, 0.81, 0.39, 0.5, 0.3, 0.1, 1.6, 5.8, 0.25, -0.12, 2.14, 0.82, 1.69, 2.34, 0.62, 1.67, 1.16, 0.22, 0.0, 1.3, 1.12, 0.01, 1.78]} \ No newline at end of file diff --git a/annotations_1/H1TQv3qA7PI_filtered.json b/annotations_1/H1TQv3qA7PI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c27558cc016d6261f730b0a936367135505e5c5c --- /dev/null +++ b/annotations_1/H1TQv3qA7PI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.22], [14.0, 16.51], [17.0, 17.66], [22.0, 35.28], [35.0, 45.13], [51.0, 92.87], [93.0, 93.23], [94.0, 94.24]], "keep_status": [true, true, false, false, false, false, false, false], "silence_prob": [40.79, 31.31, 0.0, 31.07, 32.34, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 18.64], ["musical instrument", 8.58], ["electric shaver, electric razor", 7.48]], [["music", 35.01], ["speech", 4.88], ["sheep", 4.73]], null, [["music", 31.78], ["hum", 23.07], ["mains hum", 19.54]], [["music", 59.09], ["scary music", 9.06], ["theremin", 7.28]], null, null, null], "duration": [2.22, 2.51, 0.66, 13.28, 10.13, 41.87, 0.23, 0.24]} \ No newline at end of file diff --git a/annotations_1/H1_mdoiwhBY_filtered.json b/annotations_1/H1_mdoiwhBY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..524751273c3de57166689022002dbbb9432db2ec --- /dev/null +++ b/annotations_1/H1_mdoiwhBY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 25.15], [28.0, 30.0], [33.0, 32.93], [43.0, 47.28], [48.0, 48.84], [55.0, 55.24], [56.0, 56.66], [63.0, 63.71], [73.0, 73.62]], "keep_status": [true, true, false, false, false, false, false, false, false], "silence_prob": [38.03, 32.79, 0.0, 48.87, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 35.2], ["boing", 10.43], ["moo", 8.05]], [["speech", 50.97], ["fireworks", 7.25], ["music", 6.43]], null, [["radio", 38.4], ["speech", 26.48], ["sidetone", 22.75]], null, null, null, null, null], "duration": [5.15, 2.0, -0.07, 4.28, 0.84, 0.24, 0.66, 0.71, 0.62]} \ No newline at end of file diff --git a/annotations_1/H2hbov4Rb6g_filtered.json b/annotations_1/H2hbov4Rb6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aaa9590c6bf3863e1279d91db8b30f0d2d109b27 --- /dev/null +++ b/annotations_1/H2hbov4Rb6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.14], [12.0, 12.11], [12.0, 12.68], [13.0, 13.46], [14.0, 16.56], [17.0, 19.03], [19.0, 28.24], [29.0, 30.69], [32.0, 33.07], [34.0, 34.86], [37.0, 37.98], [39.0, 40.0], [42.0, 42.65], [44.0, 45.08], [46.0, 46.99], [48.0, 51.07], [53.0, 53.3], [54.0, 55.32], [57.0, 58.35], [61.0, 61.94], [65.0, 70.95], [74.0, 78.65], [79.0, 80.18], [82.0, 84.42], [85.0, 86.04], [88.0, 88.7], [91.0, 91.29], [95.0, 97.02], [101.0, 101.61], [107.0, 107.65], [110.0, 112.4], [116.0, 120.12], [121.0, 121.68]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [47.58, 0.0, 0.0, 0.0, 39.41, 69.47, 84.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.8, 0.0, 99.68, 0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 36.07, 33.41, 0.0], "audiomae_on_audioset": [[["speech", 41.47], ["livestock, farm animals, working animals", 6.77], ["cattle, bovinae", 6.61]], null, null, null, [["cattle, bovinae", 52.28], ["moo", 38.27], ["livestock, farm animals, working animals", 6.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 25.28], ["sheep", 18.39], ["moo", 12.01]], [["music", 46.51], ["didgeridoo", 7.18], ["grunt", 3.97]], null], "duration": [2.14, 0.11, 0.68, 0.46, 2.56, 2.03, 9.24, 1.69, 1.07, 0.86, 0.98, 1.0, 0.65, 1.08, 0.99, 3.07, 0.3, 1.32, 1.35, 0.94, 5.95, 4.65, 1.18, 2.42, 1.04, 0.7, 0.29, 2.02, 0.61, 0.65, 2.4, 4.12, 0.68]} \ No newline at end of file diff --git a/annotations_1/H4YWQ0uEY2U_filtered.json b/annotations_1/H4YWQ0uEY2U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4ba6aa54a1e2441cfe3a64ed170a0dc4adf0431 --- /dev/null +++ b/annotations_1/H4YWQ0uEY2U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.52], [32.0, 33.51], [40.0, 39.72], [60.0, 62.9], [71.0, 71.52], [72.0, 73.47], [79.0, 80.94], [86.0, 85.92], [87.0, 87.07], [88.0, 88.06], [90.0, 91.1], [97.0, 100.45], [105.0, 106.57], [108.0, 110.94], [115.0, 115.35]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.92, 0.0, 36.94, 0.0], "audiomae_on_audioset": [null, null, null, [["noise", 26.88], ["music", 14.57], ["whale vocalization", 7.73]], null, null, null, null, null, null, null, [["music", 70.18], ["carnatic music", 5.74], ["sitar", 4.77]], null, [["music", 64.33], ["theremin", 9.33], ["carnatic music", 6.33]], null], "duration": [0.52, 1.51, -0.28, 2.9, 0.52, 1.47, 1.94, -0.08, 0.07, 0.06, 1.1, 3.45, 1.57, 2.94, 0.35]} \ No newline at end of file diff --git a/annotations_1/H4d8EcquSUM_filtered.json b/annotations_1/H4d8EcquSUM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f27a70993640b8f25af58fc7bff9b65a37873849 --- /dev/null +++ b/annotations_1/H4d8EcquSUM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.22], [10.0, 10.91], [13.0, 13.63], [14.0, 22.08], [23.0, 24.49], [26.0, 27.13], [35.0, 37.88], [43.0, 48.29], [49.0, 52.22], [53.0, 55.12], [65.0, 67.74], [70.0, 70.44], [70.0, 71.44], [72.0, 74.43], [77.0, 79.0], [85.0, 85.73], [90.0, 93.06], [96.0, 96.58], [100.0, 100.41]], "keep_status": [false, false, false, true, false, false, true, false, false, true, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.26, 0.0, 0.0, 32.85, 31.45, 33.75, 31.19, 65.79, 0.0, 0.0, 44.15, 61.67, 0.0, 41.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 35.74], ["hum", 14.9], ["mains hum", 10.98]], null, null, [["moo", 13.68], ["music", 12.82], ["livestock, farm animals, working animals", 12.61]], [["mains hum", 45.0], ["hum", 31.65], ["music", 7.33]], [["music", 59.85], ["throbbing", 10.72], ["hum", 6.35]], [["noise", 16.89], ["hum", 13.33], ["cacophony", 9.16]], null, null, null, [["hum", 11.54], ["music", 8.44], ["mains hum", 7.32]], null, null, [["music", 18.0], ["hum", 17.97], ["mains hum", 16.99]], null, null], "duration": [0.22, 0.91, 0.63, 8.08, 1.49, 1.13, 2.88, 5.29, 3.22, 2.12, 2.74, 0.44, 1.44, 2.43, 2.0, 0.73, 3.06, 0.58, 0.41]} \ No newline at end of file diff --git a/annotations_1/H4hjg6jAhOY_filtered.json b/annotations_1/H4hjg6jAhOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4c49370e7f0abcfbae7659421e44487cf935869 --- /dev/null +++ b/annotations_1/H4hjg6jAhOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.55], [13.0, 13.53], [15.0, 18.91], [19.0, 19.77], [20.0, 22.5], [26.0, 27.41], [35.0, 34.94], [36.0, 37.35], [44.0, 48.07], [51.0, 55.31], [57.0, 57.55], [66.0, 73.68], [74.0, 74.78], [80.0, 81.5], [112.0, 112.58], [117.0, 117.34], [131.0, 132.8], [136.0, 137.56], [139.0, 141.13], [142.0, 142.06]], "keep_status": [false, false, false, false, true, false, false, false, true, true, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 38.14, 0.0, 34.01, 0.0, 0.0, 0.0, 49.92, 37.33, 0.0, 41.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.67, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 34.78], ["moo", 28.3], ["livestock, farm animals, working animals", 13.76]], null, [["music", 25.23], ["musical instrument", 9.73], ["moo", 8.09]], null, null, null, [["music", 45.73], ["boing", 9.58], ["musical instrument", 3.94]], [["music", 41.31], ["boing", 14.75], ["musical instrument", 5.55]], null, [["music", 37.23], ["effects unit", 18.3], ["guitar", 7.18]], null, null, null, null, null, null, [["music", 25.73], ["hum", 16.22], ["sonar", 5.07]], null], "duration": [1.55, 0.53, 3.91, 0.77, 2.5, 1.41, -0.06, 1.35, 4.07, 4.31, 0.55, 7.68, 0.78, 1.5, 0.58, 0.34, 1.8, 1.56, 2.13, 0.06]} \ No newline at end of file diff --git a/annotations_1/H5I1DyJ3w1g_filtered.json b/annotations_1/H5I1DyJ3w1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..189c1487714bbde6f7323484568379ecfcf72c86 --- /dev/null +++ b/annotations_1/H5I1DyJ3w1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 54.31], [59.0, 60.17], [61.0, 62.6], [64.0, 79.59], [84.0, 84.69], [88.0, 88.05], [88.0, 89.8], [91.0, 90.86], [92.0, 92.62], [96.0, 96.21], [96.0, 105.19], [106.0, 107.64], [109.0, 110.86], [111.0, 112.45], [113.0, 114.88], [116.0, 117.36], [119.0, 119.75], [122.0, 123.43], [127.0, 127.9], [132.0, 133.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 1.17, 1.6, 15.59, 0.69, 0.05, 1.8, -0.14, 0.62, 0.21, 9.19, 1.64, 1.86, 1.45, 1.88, 1.36, 0.75, 1.43, 0.9, 1.47]} \ No newline at end of file diff --git a/annotations_1/H5pj6ZuBgeE_filtered.json b/annotations_1/H5pj6ZuBgeE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4db7a3658aabf8cbd6be2e5d2c943740e651aad4 --- /dev/null +++ b/annotations_1/H5pj6ZuBgeE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.17], [6.0, 8.95], [10.0, 11.33], [12.0, 22.69], [23.0, 31.77], [33.0, 33.66], [34.0, 34.87], [35.0, 48.46], [50.0, 51.09], [55.0, 56.69], [58.0, 58.38], [59.0, 63.64], [65.0, 74.98], [76.0, 80.15], [81.0, 82.93], [85.0, 86.31], [93.0, 93.39], [97.0, 106.56], [109.0, 109.8], [123.0, 123.4], [124.0, 135.51], [141.0, 140.97], [142.0, 146.33], [146.0, 146.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 71.0, 0.0, 67.76, 70.02, 0.0, 0.0, 56.33, 0.0, 0.0, 0.0, 61.87, 78.04, 59.96, 0.0, 0.0, 0.0, 28.98, 0.0, 0.0, 29.4, 0.0, 30.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.92], ["music", 21.26], ["vehicle", 5.22]], null, null, [["music", 72.91], ["throbbing", 2.11], ["electronic music", 1.63]], null, [["music", 51.32], ["speech", 16.97], ["electronic music", 3.59]], null], "duration": [0.17, 2.95, 1.33, 10.69, 8.77, 0.66, 0.87, 13.46, 1.09, 1.69, 0.38, 4.64, 9.98, 4.15, 1.93, 1.31, 0.39, 9.56, 0.8, 0.4, 11.51, -0.03, 4.33, 0.45]} \ No newline at end of file diff --git a/annotations_1/H6ImGh1Xolc_filtered.json b/annotations_1/H6ImGh1Xolc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9c0ee1ce0f8b267ea48879f4d77f1d09d22d76c --- /dev/null +++ b/annotations_1/H6ImGh1Xolc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.95], [3.0, 6.94], [7.0, 8.87], [11.0, 12.9], [16.0, 20.68], [24.0, 28.31], [29.0, 30.32], [31.0, 32.02], [33.0, 36.27], [38.0, 39.45], [40.0, 55.9], [57.0, 60.02], [61.0, 64.27], [66.0, 67.0], [73.0, 73.92], [80.0, 82.12], [89.0, 89.07], [89.0, 92.2], [95.0, 95.44], [99.0, 99.64], [101.0, 102.14], [103.0, 103.01], [103.0, 108.33], [109.0, 111.52], [113.0, 114.2], [115.0, 116.65], [117.0, 118.61], [121.0, 122.15], [126.0, 131.94], [133.0, 134.67], [136.0, 140.98], [143.0, 148.19], [149.0, 149.89], [151.0, 158.19], [159.0, 171.83], [174.0, 177.3], [180.0, 181.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 63.53, 0.0, 0.0, 90.6, 60.32, 0.0, 0.0, 63.42, 0.0, 93.91, 99.62, 99.73, 0.0, 0.0, 49.78, 0.0, 41.6, 0.0, 0.0, 0.0, 0.0, 58.55, 94.81, 0.0, 0.0, 0.0, 0.0, 60.79, 0.0, 92.31, 72.9, 0.0, 67.76, 78.04, 99.1, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.16], ["music", 13.78], ["thunk", 5.36]], null, [["speech", 56.86], ["electric shaver, electric razor", 3.86], ["fart", 3.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.95, 3.94, 1.87, 1.9, 4.68, 4.31, 1.32, 1.02, 3.27, 1.45, 15.9, 3.02, 3.27, 1.0, 0.92, 2.12, 0.07, 3.2, 0.44, 0.64, 1.14, 0.01, 5.33, 2.52, 1.2, 1.65, 1.61, 1.15, 5.94, 1.67, 4.98, 5.19, 0.89, 7.19, 12.83, 3.3, 1.09]} \ No newline at end of file diff --git a/annotations_1/H6XWqMB-Ow8_filtered.json b/annotations_1/H6XWqMB-Ow8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dd8ea3c2bd9777542144bb0716571295fb66895 --- /dev/null +++ b/annotations_1/H6XWqMB-Ow8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.32], [10.0, 10.81], [15.0, 18.52], [22.0, 23.13], [25.0, 27.7], [29.0, 29.2], [31.0, 31.4], [36.0, 36.27], [43.0, 43.87], [104.0, 103.82], [105.0, 104.67], [105.0, 104.87], [105.0, 105.06], [105.0, 105.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 68.15, 0.0, 76.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 0.81, 3.52, 1.13, 2.7, 0.2, 0.4, 0.27, 0.87, -0.18, -0.33, -0.13, 0.06, 0.17]} \ No newline at end of file diff --git a/annotations_1/H6Y2GNQfNo4_filtered.json b/annotations_1/H6Y2GNQfNo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f807e01d0adb12add77d9668d8fbe91a909d36b --- /dev/null +++ b/annotations_1/H6Y2GNQfNo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.39], [29.0, 29.42], [35.0, 36.96], [46.0, 46.84], [50.0, 50.48], [55.0, 55.61], [62.0, 62.41], [65.0, 67.66], [73.0, 73.53], [81.0, 81.94], [83.0, 83.49], [94.0, 93.9], [95.0, 95.77], [108.0, 109.31], [113.0, 118.37], [120.0, 120.56], [123.0, 123.06], [124.0, 124.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.33, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 66.53], ["inside, small room", 3.6], ["fart", 3.53]], null, null, null], "duration": [0.39, 0.42, 1.96, 0.84, 0.48, 0.61, 0.41, 2.66, 0.53, 0.94, 0.49, -0.1, 0.77, 1.31, 5.37, 0.56, 0.06, 0.34]} \ No newline at end of file diff --git a/annotations_1/H6jj52hYXeQ_filtered.json b/annotations_1/H6jj52hYXeQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e76940adb91ee87c0f3434e2327f9251d4b99407 --- /dev/null +++ b/annotations_1/H6jj52hYXeQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 73.18], [76.0, 77.4], [81.0, 80.86], [81.0, 88.8], [93.0, 133.39]], "keep_status": [true, false, false, false, false], "silence_prob": [31.15, 0.0, 0.0, 30.73, 0.0], "audiomae_on_audioset": [[["music", 39.52], ["thunk", 4.75], ["rumble", 4.59]], null, null, [["speech", 66.6], ["pant", 5.97], ["noise", 4.46]], null], "duration": [28.18, 1.4, -0.14, 7.8, 40.39]} \ No newline at end of file diff --git a/annotations_1/H7tyPUAH1lo_filtered.json b/annotations_1/H7tyPUAH1lo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..674ffd2889235cd1df1d56c16d339d4814248f67 --- /dev/null +++ b/annotations_1/H7tyPUAH1lo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [2.0, 4.95], [5.0, 6.66], [8.0, 8.87], [9.0, 10.17], [12.0, 16.34], [17.0, 25.1], [26.0, 30.23], [32.0, 32.17], [33.0, 40.27], [40.0, 40.44], [40.0, 47.38], [48.0, 52.15], [54.0, 61.53], [62.0, 64.18], [65.0, 70.71], [72.0, 76.65], [79.0, 80.96], [82.0, 82.97], [84.0, 105.46], [107.0, 114.17], [116.0, 132.51], [133.0, 137.02], [139.0, 141.4], [143.0, 148.71], [150.0, 167.59], [169.0, 172.34], [174.0, 177.53], [179.0, 179.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.98, 0.0, 0.0, 0.0, 49.27, 59.68, 63.85, 0.0, 46.4, 0.0, 47.08, 68.67, 63.96, 57.89, 44.12, 99.99, 0.0, 0.0, 73.97, 99.71, 73.21, 98.51, 100.0, 97.22, 74.92, 100.0, 94.66, 0.0], "audiomae_on_audioset": [null, [["speech", 63.55], ["dial tone", 10.67], ["sidetone", 7.56]], null, null, null, [["grunt", 48.59], ["burping, eructation", 19.31], ["throat clearing", 10.75]], null, null, null, [["speech", 54.52], ["frog", 21.22], ["croak", 14.62]], null, [["speech", 71.02], ["sidetone", 14.68], ["chirp tone", 1.88]], null, null, null, [["speech", 59.36], ["grunt", 10.52], ["burping, eructation", 4.68]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 2.95, 1.66, 0.87, 1.17, 4.34, 8.1, 4.23, 0.17, 7.27, 0.44, 7.38, 4.15, 7.53, 2.18, 5.71, 4.65, 1.96, 0.97, 21.46, 7.17, 16.51, 4.02, 2.4, 5.71, 17.59, 3.34, 3.53, 0.73]} \ No newline at end of file diff --git a/annotations_1/H7zXX6EqGbI_filtered.json b/annotations_1/H7zXX6EqGbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0140c463c4f202c07dbe073b677d9f8272d17ed0 --- /dev/null +++ b/annotations_1/H7zXX6EqGbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.39], [11.0, 16.21], [20.0, 21.54], [27.0, 30.25], [31.0, 32.02], [34.0, 40.98], [43.0, 64.29], [73.0, 73.52], [77.0, 78.27], [79.0, 79.95], [81.0, 83.69], [85.0, 88.23], [89.0, 92.92], [95.0, 96.6], [100.0, 101.33], [105.0, 121.31], [126.0, 127.18], [131.0, 132.0], [135.0, 140.1], [141.0, 143.06], [144.0, 146.97], [148.0, 152.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [84.62, 75.88, 0.0, 92.15, 0.0, 89.72, 47.7, 0.0, 0.0, 0.0, 81.17, 88.1, 44.81, 0.0, 0.0, 48.23, 0.0, 0.0, 61.47, 90.95, 85.17, 82.07], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 39.59], ["mains hum", 22.11], ["music", 9.24]], null, null, null, null, null, [["music", 27.57], ["gong", 13.27], ["speech", 12.51]], null, null, [["music", 71.55], ["singing bowl", 4.74], ["ambient music", 4.28]], null, null, null, null, null, null], "duration": [3.39, 5.21, 1.54, 3.25, 1.02, 6.98, 21.29, 0.52, 1.27, 0.95, 2.69, 3.23, 3.92, 1.6, 1.33, 16.31, 1.18, 1.0, 5.1, 2.06, 2.97, 4.1]} \ No newline at end of file diff --git a/annotations_1/H92n6qsNHbY_filtered.json b/annotations_1/H92n6qsNHbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c76034f87eb618db548e905dabf19ea2543058f4 --- /dev/null +++ b/annotations_1/H92n6qsNHbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.88], [12.0, 15.62], [17.0, 24.78], [26.0, 26.43], [29.0, 29.89], [33.0, 33.98], [36.0, 60.08], [62.0, 64.5], [66.0, 79.27], [80.0, 83.76], [86.0, 108.03], [110.0, 111.23], [112.0, 114.39]], "keep_status": [false, true, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [32.75, 39.31, 30.31, 0.0, 0.0, 0.0, 30.26, 31.42, 30.64, 30.31, 29.51, 0.0, 32.98], "audiomae_on_audioset": [[["music", 72.5], ["quack", 9.83], ["speech", 7.33]], [["speech", 29.02], ["music", 28.41], ["hum", 10.12]], [["music", 79.49], ["throbbing", 5.12], ["grunt", 2.04]], null, null, null, [["music", 72.77], ["groan", 5.01], ["speech", 3.97]], [["music", 53.89], ["didgeridoo", 20.49], ["boing", 5.48]], [["music", 73.66], ["didgeridoo", 4.15], ["musical instrument", 4.06]], [["music", 36.82], ["hum", 15.96], ["throbbing", 12.41]], [["music", 42.18], ["fly, housefly", 17.3], ["insect", 4.03]], null, [["music", 41.87], ["speech", 32.72], ["synthesizer", 2.82]]], "duration": [5.88, 3.62, 7.78, 0.43, 0.89, 0.98, 24.08, 2.5, 13.27, 3.76, 22.03, 1.23, 2.39]} \ No newline at end of file diff --git a/annotations_1/H9PmpwhBg8w_filtered.json b/annotations_1/H9PmpwhBg8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..624ded54b8bc033f4f38fc7cbc9ef9c85d1ecbbc --- /dev/null +++ b/annotations_1/H9PmpwhBg8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.99], [19.0, 26.74], [29.0, 29.08], [30.0, 30.7], [37.0, 41.72], [49.0, 49.11], [50.0, 53.33], [61.0, 64.45], [65.0, 64.89], [65.0, 64.94], [65.0, 64.99], [65.0, 66.58], [84.0, 85.82], [87.0, 89.18], [100.0, 100.65], [102.0, 102.9], [106.0, 107.3], [112.0, 111.84]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.42, 0.0, 0.0, 99.31, 0.0, 46.33, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 77.15], ["musical instrument", 4.34], ["tabla", 1.98]], null, null, null, null, [["music", 57.76], ["guitar", 4.23], ["speech", 3.83]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 7.74, 0.08, 0.7, 4.72, 0.11, 3.33, 3.45, -0.11, -0.06, -0.01, 1.58, 1.82, 2.18, 0.65, 0.9, 1.3, -0.16]} \ No newline at end of file diff --git a/annotations_1/HAal8jdk5gk_filtered.json b/annotations_1/HAal8jdk5gk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5385699a704bf89d58b39dee91cbd4b0f9173d3 --- /dev/null +++ b/annotations_1/HAal8jdk5gk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.73], [5.0, 5.41], [7.0, 7.25], [11.0, 11.47], [12.0, 13.14], [14.0, 15.7], [18.0, 18.15], [21.0, 22.77], [24.0, 25.29], [29.0, 29.67], [36.0, 36.98], [42.0, 42.87], [45.0, 45.66], [50.0, 51.29], [55.0, 55.9], [58.0, 58.9], [60.0, 67.63], [69.0, 89.31], [100.0, 99.99], [103.0, 103.3], [106.0, 106.44], [115.0, 118.0], [119.0, 132.14], [136.0, 136.32], [148.0, 148.69], [161.0, 161.18], [161.0, 163.32], [165.0, 166.29], [168.0, 168.78], [170.0, 172.03], [173.0, 173.25], [174.0, 176.13], [177.0, 178.14], [179.0, 179.93], [181.0, 183.83], [185.0, 185.8], [187.0, 187.61], [190.0, 190.93], [193.0, 193.21], [198.0, 198.8], [202.0, 202.86], [206.0, 206.19], [207.0, 207.64], [209.0, 209.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 47.82, 0.0, 0.0, 0.0, 99.96, 87.37, 0.0, 0.0, 0.0, 91.3, 0.0, 0.0, 92.15, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 65.54], ["musical instrument", 5.15], ["harmonic", 2.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.27, 0.41, 0.25, 0.47, 1.14, 1.7, 0.15, 1.77, 1.29, 0.67, 0.98, 0.87, 0.66, 1.29, 0.9, 0.9, 7.63, 20.31, -0.01, 0.3, 0.44, 3.0, 13.14, 0.32, 0.69, 0.18, 2.32, 1.29, 0.78, 2.03, 0.25, 2.13, 1.14, 0.93, 2.83, 0.8, 0.61, 0.93, 0.21, 0.8, 0.86, 0.19, 0.64, 0.44]} \ No newline at end of file diff --git a/annotations_1/HBPQtYCDKrk_filtered.json b/annotations_1/HBPQtYCDKrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c96ee145fcf7e4683e5e7ea6eb7b226aa3b7acf --- /dev/null +++ b/annotations_1/HBPQtYCDKrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 38.57], [40.0, 43.95], [46.0, 60.88], [64.0, 67.83], [70.0, 71.52], [76.0, 79.1], [83.0, 83.47], [86.0, 104.25], [105.0, 109.8]], "keep_status": [false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 92.97, 37.93, 37.61, 0.0, 41.78, 0.0, 38.87, 90.95], "audiomae_on_audioset": [null, null, [["rumble", 56.04], ["hum", 13.07], ["mains hum", 9.68]], [["hum", 20.28], ["music", 11.31], ["sonar", 11.05]], null, [["hum", 38.08], ["mains hum", 19.91], ["pulse", 13.53]], null, [["hum", 18.79], ["mains hum", 14.03], ["whale vocalization", 13.75]], null], "duration": [1.57, 3.95, 14.88, 3.83, 1.52, 3.1, 0.47, 18.25, 4.8]} \ No newline at end of file diff --git a/annotations_1/HBj5pxrFyE4_filtered.json b/annotations_1/HBj5pxrFyE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df1176ce2e1d7aa9bb2b39949d57938c29e125b3 --- /dev/null +++ b/annotations_1/HBj5pxrFyE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.81], [3.0, 6.44], [8.0, 10.37], [12.0, 12.73], [16.0, 17.59], [20.0, 21.1], [21.0, 22.23], [23.0, 24.07], [28.0, 27.75], [28.0, 27.8], [30.0, 39.65], [41.0, 43.93], [46.0, 46.21], [47.0, 47.51], [48.0, 48.44], [58.0, 58.14], [58.0, 58.89], [66.0, 66.9], [67.0, 68.81], [77.0, 82.81], [86.0, 87.35], [88.0, 88.62], [94.0, 94.1], [95.0, 100.3], [103.0, 103.1], [104.0, 104.67], [105.0, 107.43], [108.0, 112.19], [113.0, 116.58], [117.0, 120.23], [121.0, 123.03], [124.0, 127.82], [129.0, 134.89], [138.0, 140.76], [142.0, 142.3], [145.0, 145.54], [148.0, 149.05], [154.0, 159.38], [165.0, 174.63]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 64.29, 36.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.58, 36.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.4, 0.0, 0.0, 0.0, 88.83, 0.0, 0.0, 89.72, 86.64, 76.53, 71.43, 58.64, 29.45, 29.34, 69.07, 0.0, 0.0, 0.0, 29.54, 29.72], "audiomae_on_audioset": [null, null, [["mains hum", 16.6], ["speech", 12.02], ["hum", 9.14]], null, null, null, null, null, null, null, [["cattle, bovinae", 49.54], ["livestock, farm animals, working animals", 27.43], ["moo", 22.53]], [["cattle, bovinae", 50.11], ["moo", 25.04], ["livestock, farm animals, working animals", 16.89]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["vehicle", 22.09], ["accelerating, revving, vroom", 10.36], ["clatter", 8.4]], [["speech", 26.19], ["vehicle", 10.98], ["music", 8.56]], null, null, null, null, [["music", 82.78], ["speech", 3.97], ["boing", 3.58]], [["music", 72.63], ["musical instrument", 6.84], ["guitar", 3.4]]], "duration": [0.81, 3.44, 2.37, 0.73, 1.59, 1.1, 1.23, 1.07, -0.25, -0.2, 9.65, 2.93, 0.21, 0.51, 0.44, 0.14, 0.89, 0.9, 1.81, 5.81, 1.35, 0.62, 0.1, 5.3, 0.1, 0.67, 2.43, 4.19, 3.58, 3.23, 2.03, 3.82, 5.89, 2.76, 0.3, 0.54, 1.05, 5.38, 9.63]} \ No newline at end of file diff --git a/annotations_1/HC1LN5AgjRU_filtered.json b/annotations_1/HC1LN5AgjRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..565d7decd2cc675d06a237b0628aba541f129980 --- /dev/null +++ b/annotations_1/HC1LN5AgjRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.39], [7.0, 8.34], [14.0, 13.69], [17.0, 17.68], [21.0, 21.03], [23.0, 22.98], [36.0, 37.07], [38.0, 38.82], [42.0, 41.96], [43.0, 44.32], [50.0, 50.87], [52.0, 52.62], [57.0, 56.89], [65.0, 66.04], [78.0, 84.03], [88.0, 89.16], [94.0, 94.22], [102.0, 110.08], [123.0, 122.99], [126.0, 134.77], [139.0, 139.87], [142.0, 150.28], [152.0, 153.44], [157.0, 159.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.25, 0.0, 0.0, 30.53, 0.0, 30.68, 0.0, 30.52, 0.0, 29.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 77.11], ["synthesizer", 2.93], ["funk", 2.07]], null, null, [["music", 75.64], ["guitar", 6.21], ["bass guitar", 4.45]], null, [["music", 58.91], ["synthesizer", 4.47], ["musical instrument", 3.28]], null, [["music", 77.22], ["guitar", 2.71], ["musical instrument", 2.65]], null, [["music", 83.66], ["musical instrument", 1.89], ["piano", 1.19]]], "duration": [0.39, 1.34, -0.31, 0.68, 0.03, -0.02, 1.07, 0.82, -0.04, 1.32, 0.87, 0.62, -0.11, 1.04, 6.03, 1.16, 0.22, 8.08, -0.01, 8.77, 0.87, 8.28, 1.44, 2.39]} \ No newline at end of file diff --git a/annotations_1/HCGVmIe_V1c_filtered.json b/annotations_1/HCGVmIe_V1c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06efdc44a36dfe043d07cb45f9a7495776ca6068 --- /dev/null +++ b/annotations_1/HCGVmIe_V1c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.26], [25.0, 26.32], [30.0, 33.91], [35.0, 36.21], [37.0, 37.67], [40.0, 40.61], [41.0, 41.59], [42.0, 42.82], [43.0, 43.51], [46.0, 45.96], [47.0, 49.77], [51.0, 51.04], [52.0, 53.18], [53.0, 54.33], [55.0, 60.44], [62.0, 63.1], [63.0, 64.72], [65.0, 67.27], [72.0, 73.16], [74.0, 74.22], [80.0, 82.21], [87.0, 88.3], [89.0, 90.31], [96.0, 95.72], [96.0, 96.55], [101.0, 101.31], [103.0, 105.8], [108.0, 108.14], [110.0, 113.93], [116.0, 116.97], [117.0, 121.26], [122.0, 125.37], [131.0, 132.88]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 40.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.56, 0.0, 0.0, 0.0, 45.59, 0.0, 0.0, 43.05, 0.0, 0.0, 49.13, 0.0, 0.0, 0.0, 0.0, 0.0, 39.47, 0.0, 37.95, 0.0, 40.79, 32.47, 0.0], "audiomae_on_audioset": [null, null, [["music", 47.3], ["hum", 11.54], ["mains hum", 7.42]], null, null, null, null, null, null, null, [["throbbing", 14.03], ["hum", 13.89], ["tick", 5.72]], null, null, null, [["throbbing", 26.7], ["hum", 17.63], ["heart sounds, heartbeat", 5.22]], null, null, [["sidetone", 82.09], ["music", 4.72], ["sonar", 2.13]], null, null, [["speech", 44.78], ["sidetone", 30.04], ["busy signal", 4.53]], null, null, null, null, null, [["whale vocalization", 21.9], ["rumble", 19.3], ["hum", 11.78]], null, [["throbbing", 21.76], ["sine wave", 16.79], ["chirp tone", 15.83]], null, [["speech", 45.83], ["hum", 31.75], ["mains hum", 6.09]], [["speech", 55.57], ["music", 13.14], ["beatboxing", 2.72]], null], "duration": [0.26, 1.32, 3.91, 1.21, 0.67, 0.61, 0.59, 0.82, 0.51, -0.04, 2.77, 0.04, 1.18, 1.33, 5.44, 1.1, 1.72, 2.27, 1.16, 0.22, 2.21, 1.3, 1.31, -0.28, 0.55, 0.31, 2.8, 0.14, 3.93, 0.97, 4.26, 3.37, 1.88]} \ No newline at end of file diff --git a/annotations_1/HCRagorblVI_filtered.json b/annotations_1/HCRagorblVI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ed14f086818d159785f4a43e2562cdf28bb3eca --- /dev/null +++ b/annotations_1/HCRagorblVI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.73], [14.0, 14.99], [16.0, 16.56], [18.0, 18.87], [24.0, 24.65], [27.0, 36.44], [39.0, 39.68], [43.0, 73.97], [79.0, 80.94], [91.0, 94.49], [97.0, 102.14], [106.0, 124.95], [126.0, 131.5], [133.0, 136.44], [140.0, 143.48], [151.0, 154.92], [162.0, 162.77], [167.0, 171.8], [176.0, 176.82]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.75, 0.0, 0.0, 0.0, 28.67, 28.29, 28.38, 29.36, 29.28, 28.94, 28.95, 0.0, 29.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 64.61], ["ambient music", 7.18], ["synthesizer", 5.25]], null, null, null, [["music", 29.93], ["noise", 23.54], ["vehicle", 5.73]], [["music", 64.9], ["musical instrument", 5.32], ["echo", 3.59]], [["music", 65.54], ["musical instrument", 6.78], ["guitar", 3.65]], [["livestock, farm animals, working animals", 27.89], ["civil defense siren", 15.99], ["cattle, bovinae", 15.8]], [["livestock, farm animals, working animals", 26.54], ["cattle, bovinae", 24.57], ["moo", 17.98]], [["theremin", 21.0], ["music", 12.48], ["reverberation", 6.38]], [["crowd", 43.5], ["cheering", 25.86], ["applause", 3.83]], null, [["crowd", 43.12], ["cheering", 26.03], ["clapping", 9.79]], null], "duration": [0.73, 0.99, 0.56, 0.87, 0.65, 9.44, 0.68, 30.97, 1.94, 3.49, 5.14, 18.95, 5.5, 3.44, 3.48, 3.92, 0.77, 4.8, 0.82]} \ No newline at end of file diff --git a/annotations_1/HFAGAjkDaOU_filtered.json b/annotations_1/HFAGAjkDaOU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a826b522e43791c4c6ce3f46fd57ca296ca56755 --- /dev/null +++ b/annotations_1/HFAGAjkDaOU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.99], [9.0, 10.64], [20.0, 20.21], [21.0, 21.51], [22.0, 21.9], [24.0, 24.43], [25.0, 24.92], [29.0, 33.29], [34.0, 42.26], [44.0, 48.17], [49.0, 49.0], [53.0, 52.88], [54.0, 58.02], [59.0, 59.59], [61.0, 62.33], [64.0, 65.65], [73.0, 100.67], [101.0, 113.63]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.46, 70.58, 72.75, 0.0, 0.0, 32.26, 0.0, 0.0, 0.0, 32.45, 32.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 36.6], ["speech", 23.36], ["musical instrument", 7.35]], null, null, null, null, [["music", 18.77], ["wail, moan", 16.94], ["whack, thwack", 10.77]], null, null, null, [["music", 70.07], ["mallet percussion", 3.61], ["glockenspiel", 3.61]], [["music", 58.19], ["speech", 17.87], ["buzz", 2.46]]], "duration": [0.99, 1.64, 0.21, 0.51, -0.1, 0.43, -0.08, 4.29, 8.26, 4.17, 0.0, -0.12, 4.02, 0.59, 1.33, 1.65, 27.67, 12.63]} \ No newline at end of file diff --git a/annotations_1/HGL0CEjSHog_filtered.json b/annotations_1/HGL0CEjSHog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb23d3aaf532c421988de83bcef3e425b1b52895 --- /dev/null +++ b/annotations_1/HGL0CEjSHog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.1], [6.0, 6.94], [10.0, 10.44], [12.0, 11.85], [15.0, 15.85], [19.0, 19.3], [21.0, 21.37], [22.0, 22.59], [23.0, 24.0], [25.0, 41.01], [44.0, 48.78], [53.0, 53.92], [56.0, 60.0], [63.0, 63.59], [66.0, 65.72], [68.0, 68.69], [70.0, 70.71]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.98, 35.47, 0.0, 32.24, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["fly, housefly", 23.13], ["explosion", 20.27], ["buzz", 13.93]], [["music", 48.97], ["throbbing", 13.83], ["hum", 7.5]], null, [["music", 24.4], ["throbbing", 21.26], ["hum", 6.68]], null, null, null, null], "duration": [0.1, 0.94, 0.44, -0.15, 0.85, 0.3, 0.37, 0.59, 1.0, 16.01, 4.78, 0.92, 4.0, 0.59, -0.28, 0.69, 0.71]} \ No newline at end of file diff --git a/annotations_1/HGZotWs54rU_filtered.json b/annotations_1/HGZotWs54rU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83d9268ef95df7adc51dc4a9b1ca365a0d00982b --- /dev/null +++ b/annotations_1/HGZotWs54rU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 21.09], [25.0, 27.55], [30.0, 30.38], [31.0, 34.11], [48.0, 50.7], [54.0, 54.48], [64.0, 64.29], [65.0, 65.7], [68.0, 68.44], [73.0, 73.63], [74.0, 77.11], [78.0, 78.81], [81.0, 82.43], [86.0, 94.64], [95.0, 99.87], [100.0, 105.39], [109.0, 110.74], [113.0, 138.55], [140.0, 140.46], [140.0, 159.49], [162.0, 164.32], [166.0, 166.94]], "keep_status": [true, true, false, true, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [32.67, 30.21, 0.0, 40.22, 45.21, 0.0, 0.0, 0.0, 0.0, 0.0, 29.95, 0.0, 0.0, 30.3, 91.3, 67.89, 0.0, 31.66, 0.0, 30.46, 35.53, 0.0], "audiomae_on_audioset": [[["music", 44.96], ["speech", 14.88], ["quack", 9.47]], [["groan", 20.58], ["sound effect", 13.18], ["speech", 12.64]], null, [["music", 47.47], ["speech", 7.32], ["synthesizer", 4.05]], [["music", 65.34], ["didgeridoo", 6.33], ["speech", 4.28]], null, null, null, null, null, [["music", 30.34], ["theremin", 26.13], ["bell", 4.49]], null, null, [["music", 37.53], ["hum", 7.73], ["rumble", 5.24]], null, null, null, [["music", 68.03], ["speech", 3.33], ["musical instrument", 2.96]], null, [["music", 64.18], ["whack, thwack", 5.06], ["speech", 4.33]], [["music", 15.68], ["theremin", 12.98], ["didgeridoo", 11.64]], null], "duration": [10.09, 2.55, 0.38, 3.11, 2.7, 0.48, 0.29, 0.7, 0.44, 0.63, 3.11, 0.81, 1.43, 8.64, 4.87, 5.39, 1.74, 25.55, 0.46, 19.49, 2.32, 0.94]} \ No newline at end of file diff --git a/annotations_1/HGgfJkZAx8Y_filtered.json b/annotations_1/HGgfJkZAx8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdbe27cb6d59dcb6126c2b66f989c1f7e6c2d595 --- /dev/null +++ b/annotations_1/HGgfJkZAx8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.32], [20.0, 21.49], [25.0, 26.97], [27.0, 28.71], [30.0, 37.42], [38.0, 46.23], [55.0, 55.11], [56.0, 56.67], [65.0, 73.82], [78.0, 103.52], [104.0, 104.65], [114.0, 115.03], [117.0, 117.61]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 87.19, 59.15, 0.0, 0.0, 84.25, 32.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 28.27], ["horse", 10.07], ["clip-clop", 9.68]], null, null, null], "duration": [0.32, 1.49, 1.97, 1.71, 7.42, 8.23, 0.11, 0.67, 8.82, 25.52, 0.65, 1.03, 0.61]} \ No newline at end of file diff --git a/annotations_1/HGrPKwsAvqE_filtered.json b/annotations_1/HGrPKwsAvqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..328b3e8c0c6b0171ce6679bc71602bebdcaff8e9 --- /dev/null +++ b/annotations_1/HGrPKwsAvqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.91], [16.0, 16.53], [23.0, 35.34], [37.0, 37.54], [40.0, 42.16], [45.0, 46.58], [55.0, 59.63], [63.0, 65.58], [67.0, 67.04]], "keep_status": [false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 31.93, 0.0, 82.61, 0.0, 33.67, 41.7, 0.0], "audiomae_on_audioset": [null, null, [["music", 37.44], ["boing", 9.84], ["electronic music", 9.44]], null, null, null, [["music", 45.56], ["howl", 3.78], ["animal", 3.7]], [["fly, housefly", 54.27], ["insect", 15.06], ["mosquito", 13.15]], null], "duration": [0.91, 0.53, 12.34, 0.54, 2.16, 1.58, 4.63, 2.58, 0.04]} \ No newline at end of file diff --git a/annotations_1/HH37JTBpi2A_filtered.json b/annotations_1/HH37JTBpi2A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..073004286697ca018f1d7abc1b99d9b2ecf94d2e --- /dev/null +++ b/annotations_1/HH37JTBpi2A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.59], [9.0, 16.95], [17.0, 22.64], [23.0, 23.85], [24.0, 29.4], [30.0, 35.28], [37.0, 43.43], [44.0, 50.85], [52.0, 57.55], [59.0, 65.52], [66.0, 69.58], [71.0, 76.38], [77.0, 89.34], [91.0, 96.8], [99.0, 108.23], [109.0, 114.52], [115.0, 139.62], [141.0, 142.7], [143.0, 153.59], [156.0, 157.08], [157.0, 186.66], [188.0, 188.84], [189.0, 192.01], [192.0, 193.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [65.79, 62.27, 61.67, 0.0, 57.64, 57.48, 66.63, 64.63, 69.47, 64.75, 69.2, 66.27, 60.14, 68.15, 65.79, 68.28, 54.9, 0.0, 42.48, 0.0, 42.46, 0.0, 45.18, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.92], ["noise", 11.87], ["white noise", 5.61]], null, [["speech", 44.43], ["white noise", 10.41], ["buzzer", 8.31]], null, [["speech", 58.13], ["dial tone", 10.07], ["buzzer", 8.82]], null], "duration": [2.59, 7.95, 5.64, 0.85, 5.4, 5.28, 6.43, 6.85, 5.55, 6.52, 3.58, 5.38, 12.34, 5.8, 9.23, 5.52, 24.62, 1.7, 10.59, 1.08, 29.66, 0.84, 3.01, 1.51]} \ No newline at end of file diff --git a/annotations_1/HHRCWQEM7UQ_filtered.json b/annotations_1/HHRCWQEM7UQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35a37cc03b13b48d4ef031f5b4ea6432afbb7c63 --- /dev/null +++ b/annotations_1/HHRCWQEM7UQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.65], [4.0, 4.83], [7.0, 7.13], [9.0, 9.29], [14.0, 14.35], [17.0, 18.98], [20.0, 22.81], [25.0, 25.29], [26.0, 38.57], [40.0, 41.71], [42.0, 43.77], [44.0, 45.81], [49.0, 49.28], [51.0, 54.28], [55.0, 57.03], [58.0, 66.61], [69.0, 71.32], [72.0, 88.43], [89.0, 89.07], [91.0, 91.64], [92.0, 92.58], [95.0, 95.74], [116.0, 117.71], [118.0, 119.26], [121.0, 122.84], [123.0, 124.58], [127.0, 128.9], [129.0, 129.07], [131.0, 131.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 0.0, 51.88, 0.0, 0.0, 0.0, 0.0, 99.44, 99.98, 50.51, 99.99, 39.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.78], ["applause", 5.01], ["animal", 4.56]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 0.83, 0.13, 0.29, 0.35, 1.98, 2.81, 0.29, 12.57, 1.71, 1.77, 1.81, 0.28, 3.28, 2.03, 8.61, 2.32, 16.43, 0.07, 0.64, 0.58, 0.74, 1.71, 1.26, 1.84, 1.58, 1.9, 0.07, 0.01]} \ No newline at end of file diff --git a/annotations_1/HIBYaeYQF0k_filtered.json b/annotations_1/HIBYaeYQF0k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d3589b35554e081e26b3e3bfe429b64448b37e1 --- /dev/null +++ b/annotations_1/HIBYaeYQF0k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.85], [26.0, 25.69], [34.0, 34.16], [50.0, 51.16], [55.0, 55.65], [73.0, 73.08], [99.0, 99.33], [100.0, 100.6], [104.0, 104.92], [114.0, 113.98], [115.0, 115.89], [117.0, 117.58], [120.0, 120.28], [122.0, 122.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.85, -0.31, 0.16, 1.16, 0.65, 0.08, 0.33, 0.6, 0.92, -0.02, 0.89, 0.58, 0.28, 0.94]} \ No newline at end of file diff --git a/annotations_1/HJKL8Ta-kt8_filtered.json b/annotations_1/HJKL8Ta-kt8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02cc7b3252c9dcbd87fae7a3dda5bf1336f04460 --- /dev/null +++ b/annotations_1/HJKL8Ta-kt8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.43], [12.0, 25.46], [71.0, 71.69], [73.0, 75.51], [80.0, 81.14], [84.0, 85.06], [86.0, 99.72], [103.0, 104.52], [108.0, 126.5], [142.0, 158.8]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [31.26, 29.35, 0.0, 29.36, 0.0, 0.0, 29.34, 0.0, 29.14, 28.87], "audiomae_on_audioset": [[["hum", 56.81], ["throbbing", 29.17], ["mains hum", 11.82]], [["music", 35.81], ["hum", 22.32], ["throbbing", 13.37]], null, [["music", 58.84], ["didgeridoo", 11.75], ["musical instrument", 3.7]], null, null, [["music", 68.31], ["electronic music", 9.05], ["dubstep", 6.3]], null, [["music", 45.51], ["motorcycle", 12.65], ["vehicle", 9.84]], [["vehicle", 33.16], ["music", 27.87], ["car", 9.37]]], "duration": [5.43, 13.46, 0.69, 2.51, 1.14, 1.06, 13.72, 1.52, 18.5, 16.8]} \ No newline at end of file diff --git a/annotations_1/HKJOcRnkRQ4_filtered.json b/annotations_1/HKJOcRnkRQ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dde6be93320767d3aafb02d4111eb6bcb4d46fc9 --- /dev/null +++ b/annotations_1/HKJOcRnkRQ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 39.19], [54.0, 60.18], [65.0, 68.32], [89.0, 90.42], [91.0, 91.29], [93.0, 93.23], [113.0, 113.41], [114.0, 114.35], [117.0, 117.46], [127.0, 127.3], [128.0, 128.48], [130.0, 130.94], [132.0, 132.61], [144.0, 144.59], [146.0, 146.25], [147.0, 148.36], [150.0, 151.26], [157.0, 158.01], [161.0, 161.45], [165.0, 166.72], [169.0, 169.77], [174.0, 173.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.57, 33.06, 34.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 66.3], ["speech", 15.46], ["boing", 2.9]], [["music", 62.2], ["thunk", 5.74], ["throbbing", 3.86]], [["music", 62.37], ["throbbing", 5.85], ["techno", 3.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.19, 6.18, 3.32, 1.42, 0.29, 0.23, 0.41, 0.35, 0.46, 0.3, 0.48, 0.94, 0.61, 0.59, 0.25, 1.36, 1.26, 1.01, 0.45, 1.72, 0.77, -0.15]} \ No newline at end of file diff --git a/annotations_1/HKRXTzENFa4_filtered.json b/annotations_1/HKRXTzENFa4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd05e9343aaaad8f72df585ce0bb4292ce10b4fb --- /dev/null +++ b/annotations_1/HKRXTzENFa4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.52], [10.0, 11.11], [12.0, 12.07], [14.0, 14.05], [14.0, 15.43], [16.0, 16.66], [18.0, 18.01], [20.0, 20.46], [25.0, 25.74], [31.0, 30.99], [33.0, 34.28], [35.0, 36.1], [38.0, 38.2], [39.0, 39.5], [40.0, 41.27], [46.0, 47.73], [48.0, 50.84], [53.0, 53.27], [54.0, 55.11], [59.0, 59.81], [61.0, 62.26], [63.0, 64.29], [66.0, 68.05], [69.0, 71.15], [75.0, 76.15], [77.0, 76.74], [78.0, 78.71], [79.0, 79.42], [80.0, 80.74], [83.0, 83.32], [84.0, 85.02], [88.0, 89.99], [98.0, 100.9], [102.0, 102.69], [105.0, 105.33], [107.0, 107.69], [109.0, 111.06], [113.0, 119.3], [121.0, 122.81], [124.0, 128.19], [129.0, 133.62], [136.0, 140.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 98.8, 91.3, 0.0, 68.67, 85.17, 89.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.52, 1.11, 0.07, 0.05, 1.43, 0.66, 0.01, 0.46, 0.74, -0.01, 1.28, 1.1, 0.2, 0.5, 1.27, 1.73, 2.84, 0.27, 1.11, 0.81, 1.26, 1.29, 2.05, 2.15, 1.15, -0.26, 0.71, 0.42, 0.74, 0.32, 1.02, 1.99, 2.9, 0.69, 0.33, 0.69, 2.06, 6.3, 1.81, 4.19, 4.62, 4.26]} \ No newline at end of file diff --git a/annotations_1/HKcDfO71N1E_filtered.json b/annotations_1/HKcDfO71N1E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..774edeea29187f38ca30e1c97be640139c3a0441 --- /dev/null +++ b/annotations_1/HKcDfO71N1E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 27.03], [28.0, 43.07], [45.0, 45.08], [45.0, 46.63], [50.0, 70.16], [71.0, 72.05], [74.0, 74.28], [77.0, 76.71], [77.0, 78.97], [81.0, 81.94], [84.0, 86.34], [90.0, 90.27], [94.0, 94.59], [101.0, 102.02], [103.0, 105.98], [110.0, 115.03], [116.0, 116.36], [123.0, 126.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.3, 30.85, 0.0, 0.0, 36.11, 0.0, 0.0, 0.0, 0.0, 0.0, 43.69, 0.0, 0.0, 0.0, 49.54, 40.71, 0.0, 42.13], "audiomae_on_audioset": [[["music", 51.57], ["musical instrument", 14.61], ["guitar", 5.36]], [["music", 90.51], ["throbbing", 2.55], ["electronic music", 2.51]], null, null, [["music", 74.96], ["didgeridoo", 7.68], ["throbbing", 2.71]], null, null, null, null, null, [["hum", 28.96], ["music", 21.61], ["throbbing", 20.15]], null, null, null, [["music", 71.49], ["hum", 7.03], ["throbbing", 6.35]], [["music", 60.52], ["musical instrument", 8.72], ["didgeridoo", 7.25]], null, [["music", 72.36], ["didgeridoo", 9.66], ["musical instrument", 3.16]]], "duration": [14.03, 15.07, 0.08, 1.63, 20.16, 1.05, 0.28, -0.29, 1.97, 0.94, 2.34, 0.27, 0.59, 1.02, 2.98, 5.03, 0.36, 3.6]} \ No newline at end of file diff --git a/annotations_1/HLTpxttylTM_filtered.json b/annotations_1/HLTpxttylTM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ad0fb2de56d5896697456fcbd0c91f560b19fd1 --- /dev/null +++ b/annotations_1/HLTpxttylTM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.4], [15.0, 19.25], [22.0, 25.68], [26.0, 26.54], [27.0, 28.61], [29.0, 31.75], [35.0, 35.97], [37.0, 38.18], [39.0, 40.05], [42.0, 44.63], [48.0, 50.8], [52.0, 52.05], [53.0, 53.67], [65.0, 65.37], [69.0, 69.35], [70.0, 73.7], [75.0, 80.57], [84.0, 86.78], [88.0, 88.84], [90.0, 92.38], [95.0, 95.82], [99.0, 102.22], [117.0, 132.14], [133.0, 136.81], [151.0, 152.37], [161.0, 163.0], [168.0, 168.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [95.09, 83.7, 67.13, 0.0, 0.0, 65.44, 0.0, 0.0, 0.0, 76.2, 100.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 97.0, 0.0, 99.99, 0.0, 99.95, 99.93, 99.73, 0.0, 46.02, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.4], ["noise", 9.97], ["synthesizer", 8.32]], null], "duration": [2.4, 4.25, 3.68, 0.54, 1.61, 2.75, 0.97, 1.18, 1.05, 2.63, 2.8, 0.05, 0.67, 0.37, 0.35, 3.7, 5.57, 2.78, 0.84, 2.38, 0.82, 3.22, 15.14, 3.81, 1.37, 2.0, 0.24]} \ No newline at end of file diff --git a/annotations_1/HLlaSoozZbM_filtered.json b/annotations_1/HLlaSoozZbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f3a348ed61ebe2a591ea86e534a1fcd6ac61cb4 --- /dev/null +++ b/annotations_1/HLlaSoozZbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 12.93], [15.0, 15.96], [18.0, 20.02], [27.0, 26.97], [30.0, 32.7], [40.0, 40.68], [42.0, 43.61], [44.0, 44.61], [49.0, 57.91], [63.0, 63.46], [81.0, 84.79], [89.0, 110.0], [110.0, 110.59], [119.0, 119.3], [125.0, 126.03], [127.0, 127.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.1, 0.0, 99.76, 0.0, 62.17, 0.0, 0.0, 0.0, 60.32, 0.0, 97.64, 38.51, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 63.59], ["thunk", 10.81], ["marimba, xylophone", 4.48]], null, null, null, null], "duration": [7.93, 0.96, 2.02, -0.03, 2.7, 0.68, 1.61, 0.61, 8.91, 0.46, 3.79, 21.0, 0.59, 0.3, 1.03, 0.75]} \ No newline at end of file diff --git a/annotations_1/HLw1Og_JXK8_filtered.json b/annotations_1/HLw1Og_JXK8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2422549e065893d1ec99dae268f2e45a0edc205e --- /dev/null +++ b/annotations_1/HLw1Og_JXK8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [5.0, 5.54], [8.0, 10.07], [12.0, 12.36], [13.0, 14.2], [18.0, 19.16], [20.0, 21.2], [22.0, 25.74], [28.0, 28.51], [30.0, 34.53], [36.0, 39.8], [42.0, 42.16], [43.0, 43.48], [45.0, 44.93], [46.0, 46.65], [49.0, 49.67], [51.0, 52.15], [53.0, 53.15], [54.0, 54.97], [57.0, 57.91], [59.0, 59.7], [60.0, 61.79], [65.0, 65.25], [66.0, 67.32], [68.0, 68.88], [70.0, 72.71], [74.0, 75.63], [76.0, 76.96], [78.0, 80.2], [81.0, 81.7], [83.0, 88.6], [91.0, 92.47], [93.0, 96.8], [98.0, 113.7], [116.0, 117.49], [120.0, 139.5], [140.0, 141.22], [142.0, 149.25]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 55.53, 0.0, 48.39, 48.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.52, 0.0, 0.0, 53.84, 0.0, 49.87, 0.0, 75.55, 50.02, 0.0, 33.27, 0.0, 30.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 53.94], ["ambient music", 4.65], ["new-age music", 1.79]], [["tuning fork", 14.48], ["civil defense siren", 13.24], ["chirp tone", 12.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.03], ["mains hum", 12.93], ["musical instrument", 8.25]], null, null, null, null, [["music", 52.61], ["ambient music", 5.51], ["theremin", 4.77]], null, null, null, null, [["music", 72.05], ["guitar", 6.71], ["plucked string instrument", 4.45]], null, [["music", 76.08], ["foghorn", 4.9], ["theremin", 4.09]]], "duration": [0.62, 0.54, 2.07, 0.36, 1.2, 1.16, 1.2, 3.74, 0.51, 4.53, 3.8, 0.16, 0.48, -0.07, 0.65, 0.67, 1.15, 0.15, 0.97, 0.91, 0.7, 1.79, 0.25, 1.32, 0.88, 2.71, 1.63, 0.96, 2.2, 0.7, 5.6, 1.47, 3.8, 15.7, 1.49, 19.5, 1.22, 7.25]} \ No newline at end of file diff --git a/annotations_1/HMUbL4Vgb2E_filtered.json b/annotations_1/HMUbL4Vgb2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bfdc91e6faba0f262c1ef0a592e78f55cd99a67 --- /dev/null +++ b/annotations_1/HMUbL4Vgb2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.04], [19.0, 22.22], [25.0, 28.95], [34.0, 38.2], [49.0, 51.71], [54.0, 58.6], [62.0, 61.7], [63.0, 81.01], [81.0, 81.41], [87.0, 88.03], [90.0, 90.21], [94.0, 100.18], [114.0, 113.73], [116.0, 125.25], [126.0, 126.64], [129.0, 129.74]], "keep_status": [true, true, false, false, false, true, false, true, false, false, false, false, false, true, false, false], "silence_prob": [36.65, 33.59, 31.6, 55.39, 82.43, 35.88, 0.0, 36.08, 0.0, 0.0, 0.0, 31.17, 0.0, 32.77, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.01], ["speech", 14.21], ["didgeridoo", 4.32]], [["music", 26.82], ["boing", 20.62], ["guitar", 6.04]], [["moo", 40.39], ["cattle, bovinae", 29.49], ["livestock, farm animals, working animals", 14.3]], null, null, [["explosion", 27.15], ["music", 17.44], ["burst, pop", 10.0]], null, [["music", 51.01], ["didgeridoo", 8.83], ["theremin", 5.12]], null, null, null, [["speech", 49.63], ["music", 25.69], ["breaking", 7.17]], null, [["fly, housefly", 27.64], ["music", 17.28], ["mosquito", 8.55]], null, null], "duration": [6.04, 3.22, 3.95, 4.2, 2.71, 4.6, -0.3, 18.01, 0.41, 1.03, 0.21, 6.18, -0.27, 9.25, 0.64, 0.74]} \ No newline at end of file diff --git a/annotations_1/HNPRZ2M3h-M_filtered.json b/annotations_1/HNPRZ2M3h-M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..069825cd5b2481817e36cd0655057b4a206ae69a --- /dev/null +++ b/annotations_1/HNPRZ2M3h-M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.56], [24.0, 24.56], [25.0, 25.49], [52.0, 68.12], [70.0, 70.63], [74.0, 74.82], [76.0, 79.57], [80.0, 82.44], [84.0, 91.83], [96.0, 99.99], [104.0, 121.61], [124.0, 124.39], [127.0, 127.16], [128.0, 128.04], [129.0, 129.44], [133.0, 137.19], [141.0, 141.27], [142.0, 142.89], [144.0, 149.27], [158.0, 158.06], [160.0, 159.81], [163.0, 163.02]], "keep_status": [false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.65, 0.0, 0.0, 44.6, 46.61, 30.63, 34.86, 32.01, 0.0, 0.0, 0.0, 0.0, 36.93, 0.0, 0.0, 32.38, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 47.01], ["speech", 10.22], ["musical instrument", 3.92]], null, null, [["music", 65.35], ["didgeridoo", 11.48], ["musical instrument", 3.57]], [["livestock, farm animals, working animals", 12.65], ["cattle, bovinae", 10.96], ["moo", 9.9]], [["speech", 70.77], ["boing", 5.36], ["fart", 3.78]], [["speech", 37.84], ["boing", 16.66], ["music", 8.24]], [["speech", 70.89], ["hum", 4.06], ["sidetone", 3.58]], null, null, null, null, [["speech", 83.42], ["sidetone", 2.75], ["music", 2.44]], null, null, [["speech", 87.37], ["speech synthesizer", 3.51], ["echo", 1.19]], null, null, null], "duration": [0.56, 0.56, 0.49, 16.12, 0.63, 0.82, 3.57, 2.44, 7.83, 3.99, 17.61, 0.39, 0.16, 0.04, 0.44, 4.19, 0.27, 0.89, 5.27, 0.06, -0.19, 0.02]} \ No newline at end of file diff --git a/annotations_1/HNV5ksTBzLk_filtered.json b/annotations_1/HNV5ksTBzLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcbcc8f7f216198b835b85ebe33ef8bbd65f4328 --- /dev/null +++ b/annotations_1/HNV5ksTBzLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.4], [7.0, 7.33], [8.0, 8.83], [10.0, 10.71], [12.0, 11.92], [12.0, 17.52], [20.0, 19.87], [21.0, 22.0], [24.0, 24.16], [25.0, 25.39], [30.0, 30.72], [37.0, 38.52], [42.0, 51.43], [56.0, 56.32], [71.0, 71.64], [72.0, 72.87], [73.0, 74.56], [82.0, 82.8], [85.0, 88.67], [89.0, 90.31], [91.0, 117.49], [123.0, 126.3], [127.0, 129.95]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.48, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 36.84, 49.4, 98.01], "audiomae_on_audioset": [null, null, null, null, null, [["snicker", 19.06], ["music", 10.47], ["chuckle, chortle", 10.02]], null, null, null, null, null, null, [["effects unit", 29.24], ["music", 20.81], ["distortion", 8.71]], null, null, null, null, null, null, null, [["music", 49.33], ["synthesizer", 11.29], ["musical instrument", 5.79]], [["crushing", 21.15], ["thunk", 16.61], ["sidetone", 4.72]], null], "duration": [0.4, 0.33, 0.83, 0.71, -0.08, 5.52, -0.13, 1.0, 0.16, 0.39, 0.72, 1.52, 9.43, 0.32, 0.64, 0.87, 1.56, 0.8, 3.67, 1.31, 26.49, 3.3, 2.95]} \ No newline at end of file diff --git a/annotations_1/HOY92xiGY2M_filtered.json b/annotations_1/HOY92xiGY2M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cea7351977f404206cd337d36214b3547dd4759f --- /dev/null +++ b/annotations_1/HOY92xiGY2M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [4.0, 5.05], [8.0, 10.72], [12.0, 13.46], [14.0, 15.47], [17.0, 17.51], [18.0, 18.89], [20.0, 20.98], [21.0, 22.08], [26.0, 27.09], [32.0, 31.87], [36.0, 36.58], [40.0, 40.41], [41.0, 43.11], [54.0, 54.58], [69.0, 68.74], [71.0, 71.64], [74.0, 74.22], [86.0, 87.05], [89.0, 89.92], [94.0, 94.05], [94.0, 95.15], [100.0, 104.18], [106.0, 106.52], [108.0, 109.83], [111.0, 111.03], [130.0, 131.43], [133.0, 132.73], [135.0, 134.84], [139.0, 139.41], [142.0, 143.53], [148.0, 148.39], [158.0, 158.41], [159.0, 160.37], [169.0, 170.53], [175.0, 176.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 1.05, 2.72, 1.46, 1.47, 0.51, 0.89, 0.98, 1.08, 1.09, -0.13, 0.58, 0.41, 2.11, 0.58, -0.26, 0.64, 0.22, 1.05, 0.92, 0.05, 1.15, 4.18, 0.52, 1.83, 0.03, 1.43, -0.27, -0.16, 0.41, 1.53, 0.39, 0.41, 1.37, 1.53, 1.99]} \ No newline at end of file diff --git a/annotations_1/HOjApJYsWC0_filtered.json b/annotations_1/HOjApJYsWC0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a15b6639993d010e2a6c5e3987598dfe9470a76e --- /dev/null +++ b/annotations_1/HOjApJYsWC0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.78], [15.0, 15.01], [15.0, 15.53], [16.0, 16.95], [20.0, 20.95], [22.0, 22.0], [22.0, 23.84], [34.0, 34.94], [53.0, 54.97], [58.0, 60.07], [68.0, 68.42], [82.0, 83.05], [83.0, 84.38], [88.0, 88.8], [93.0, 94.47], [98.0, 99.33], [101.0, 100.97], [105.0, 105.02], [109.0, 110.46], [114.0, 114.37], [124.0, 124.51], [125.0, 126.22], [133.0, 134.33], [136.0, 138.37], [140.0, 140.48], [157.0, 159.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 31.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 52.73], ["didgeridoo", 6.3], ["speech", 5.01]]], "duration": [1.78, 0.01, 0.53, 0.95, 0.95, 0.0, 1.84, 0.94, 1.97, 2.07, 0.42, 1.05, 1.38, 0.8, 1.47, 1.33, -0.03, 0.02, 1.46, 0.37, 0.51, 1.22, 1.33, 2.37, 0.48, 2.43]} \ No newline at end of file diff --git a/annotations_1/HPGSDBjsSWI_filtered.json b/annotations_1/HPGSDBjsSWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/HPGSDBjsSWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/HPcr2gT_cnA_filtered.json b/annotations_1/HPcr2gT_cnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..432bb1dabc8a82fd558276f75da0dd0c6b738a6d --- /dev/null +++ b/annotations_1/HPcr2gT_cnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.74], [17.0, 19.58], [25.0, 25.41], [27.0, 28.27], [32.0, 35.02], [37.0, 39.16], [40.0, 43.38], [45.0, 48.19], [50.0, 52.22], [54.0, 55.78], [67.0, 68.57], [71.0, 72.25], [74.0, 77.08], [81.0, 82.48], [85.0, 87.07], [91.0, 92.08], [95.0, 95.2], [100.0, 100.47], [104.0, 104.82], [107.0, 107.97], [110.0, 111.06], [114.0, 114.1], [115.0, 115.57], [122.0, 124.19], [130.0, 133.81], [134.0, 135.3], [137.0, 138.81], [140.0, 142.11], [144.0, 145.81], [147.0, 148.2], [153.0, 154.08], [163.0, 176.99], [178.0, 178.6], [179.0, 180.5], [185.0, 185.04], [187.0, 188.08], [191.0, 192.43], [193.0, 195.52], [196.0, 196.53], [197.0, 214.95]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.48, 0.0, 0.0, 43.71, 47.86, 57.56, 55.18, 50.16, 0.0, 0.0, 0.0, 45.98, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.05, 56.03, 0.0, 0.0, 39.07, 0.0, 0.0, 0.0, 54.04, 0.0, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 69.47], "audiomae_on_audioset": [null, [["sidetone", 22.22], ["hum", 20.77], ["speech", 13.73]], null, null, [["music", 50.32], ["speech", 18.32], ["theremin", 3.89]], [["music", 32.16], ["speech", 12.14], ["cello", 6.78]], null, null, null, null, null, null, [["speech", 21.35], ["music", 19.6], ["sidetone", 16.52]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.69], ["speech", 16.16], ["singing bowl", 10.11]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 2.58, 0.41, 1.27, 3.02, 2.16, 3.38, 3.19, 2.22, 1.78, 1.57, 1.25, 3.08, 1.48, 2.07, 1.08, 0.2, 0.47, 0.82, 0.97, 1.06, 0.1, 0.57, 2.19, 3.81, 1.3, 1.81, 2.11, 1.81, 1.2, 1.08, 13.99, 0.6, 1.5, 0.04, 1.08, 1.43, 2.52, 0.53, 17.95]} \ No newline at end of file diff --git a/annotations_1/HPir9pU9shw_filtered.json b/annotations_1/HPir9pU9shw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcfaac65679ec3edd27486dc22852ee33cf9bf7d --- /dev/null +++ b/annotations_1/HPir9pU9shw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 54.31]], "keep_status": [false], "silence_prob": [55.11], "audiomae_on_audioset": [null], "duration": [17.31]} \ No newline at end of file diff --git a/annotations_1/HQCava8QqK8_filtered.json b/annotations_1/HQCava8QqK8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eda76bcf5f0d3c1cca80cae50eed46bb98734fb4 --- /dev/null +++ b/annotations_1/HQCava8QqK8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.06], [11.0, 11.13], [17.0, 19.26], [26.0, 26.55], [28.0, 28.05], [29.0, 29.76], [33.0, 35.07], [36.0, 37.54], [39.0, 39.58], [41.0, 42.38], [53.0, 53.69], [56.0, 56.44], [62.0, 62.7], [63.0, 64.44], [71.0, 70.85], [76.0, 76.05], [80.0, 81.51], [88.0, 88.77], [91.0, 91.62], [97.0, 100.28], [101.0, 107.69]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.12, 0.0, 0.0, 0.0, 33.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 62.68], "audiomae_on_audioset": [null, null, [["music", 22.06], ["throbbing", 20.28], ["hum", 16.33]], null, null, null, [["music", 9.55], ["vehicle", 8.78], ["civil defense siren", 5.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.06, 0.13, 2.26, 0.55, 0.05, 0.76, 2.07, 1.54, 0.58, 1.38, 0.69, 0.44, 0.7, 1.44, -0.15, 0.05, 1.51, 0.77, 0.62, 3.28, 6.69]} \ No newline at end of file diff --git a/annotations_1/HQrM6Rk7WWE_filtered.json b/annotations_1/HQrM6Rk7WWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a4d13cb07e8af8b83c5d224c8b4bd9b77f09ff7 --- /dev/null +++ b/annotations_1/HQrM6Rk7WWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.29], [9.0, 21.37], [22.0, 26.38], [33.0, 41.2], [48.0, 76.28], [92.0, 92.8], [96.0, 96.16], [99.0, 99.0], [100.0, 100.67], [109.0, 130.4], [136.0, 135.92], [137.0, 137.78], [146.0, 147.51], [152.0, 152.42], [154.0, 155.07], [161.0, 161.7], [171.0, 177.7], [180.0, 195.81], [200.0, 202.51], [217.0, 218.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [97.64, 48.74, 31.47, 31.14, 30.68, 0.0, 0.0, 0.0, 0.0, 28.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.65, 29.24, 28.51, 0.0], "audiomae_on_audioset": [null, [["music", 70.25], ["scary music", 8.79], ["thunk", 2.83]], [["music", 55.37], ["brass instrument", 13.1], ["trombone", 10.5]], [["theremin", 68.58], ["music", 22.91], ["musical instrument", 1.07]], [["music", 65.05], ["theremin", 7.73], ["hum", 7.02]], null, null, null, null, [["buzz", 39.23], ["speech", 30.02], ["boat, water vehicle", 3.36]], null, null, null, null, null, null, [["cattle, bovinae", 28.61], ["moo", 22.29], ["livestock, farm animals, working animals", 12.28]], [["music", 57.69], ["speech", 9.28], ["hum", 3.59]], [["cattle, bovinae", 21.28], ["livestock, farm animals, working animals", 19.09], ["moo", 13.68]], null], "duration": [3.29, 12.37, 4.38, 8.2, 28.28, 0.8, 0.16, 0.0, 0.67, 21.4, -0.08, 0.78, 1.51, 0.42, 1.07, 0.7, 6.7, 15.81, 2.51, 1.94]} \ No newline at end of file diff --git a/annotations_1/HR2-PHuh3W8_filtered.json b/annotations_1/HR2-PHuh3W8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b4f5a41a3c607e78be623f57376f889968f76b9 --- /dev/null +++ b/annotations_1/HR2-PHuh3W8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.79], [6.0, 7.2], [9.0, 8.92], [19.0, 19.82], [24.0, 31.97], [37.0, 48.88], [50.0, 51.8], [74.0, 74.58], [82.0, 82.85], [84.0, 84.01], [89.0, 97.09], [99.0, 108.89], [118.0, 118.57], [119.0, 121.12]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.01, 45.02, 0.0, 0.0, 0.0, 0.0, 49.0, 31.63, 0.0, 41.44], "audiomae_on_audioset": [null, null, null, null, [["music", 57.66], ["whack, thwack", 12.76], ["thunk", 10.91]], [["music", 58.0], ["effects unit", 3.38], ["musical instrument", 3.19]], null, null, null, null, [["music", 57.3], ["cacophony", 2.95], ["theremin", 2.22]], [["speech", 31.61], ["whack, thwack", 17.59], ["music", 9.56]], null, [["music", 29.82], ["speech", 21.95], ["throbbing", 11.96]]], "duration": [0.79, 1.2, -0.08, 0.82, 7.97, 11.88, 1.8, 0.58, 0.85, 0.01, 8.09, 9.89, 0.57, 2.12]} \ No newline at end of file diff --git a/annotations_1/HR2kbOK8i6I_filtered.json b/annotations_1/HR2kbOK8i6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30e6a918e81b410ea9795bf0cd7b99f4ef4e66a9 --- /dev/null +++ b/annotations_1/HR2kbOK8i6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.6], [4.0, 6.61], [7.0, 9.86], [11.0, 13.02], [14.0, 14.52], [16.0, 19.3], [21.0, 22.42], [25.0, 25.34], [27.0, 38.55], [40.0, 40.31], [41.0, 42.21], [45.0, 50.3], [51.0, 51.83], [54.0, 76.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 66.03, 47.86, 94.66, 0.0, 54.7, 0.0, 0.0, 30.64, 0.0, 0.0, 31.6, 0.0, 30.13], "audiomae_on_audioset": [null, null, [["sidetone", 53.26], ["speech", 17.01], ["busy signal", 6.46]], null, null, null, null, null, [["speech", 78.76], ["livestock, farm animals, working animals", 5.16], ["cattle, bovinae", 2.93]], null, null, [["throbbing", 36.45], ["hum", 35.92], ["mains hum", 16.48]], null, [["sidetone", 30.45], ["throbbing", 21.68], ["hum", 14.57]]], "duration": [0.6, 2.61, 2.86, 2.02, 0.52, 3.3, 1.42, 0.34, 11.55, 0.31, 1.21, 5.3, 0.83, 22.98]} \ No newline at end of file diff --git a/annotations_1/HRJ1g7i0Ob8_filtered.json b/annotations_1/HRJ1g7i0Ob8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e7ea711bd15c348504841f7757f4964b3c678e7 --- /dev/null +++ b/annotations_1/HRJ1g7i0Ob8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.07], [8.0, 8.48], [12.0, 12.51], [14.0, 17.2], [20.0, 22.86], [24.0, 24.97], [26.0, 27.35], [28.0, 28.14], [28.0, 37.52], [40.0, 48.44], [53.0, 53.79], [55.0, 64.34], [67.0, 67.91], [70.0, 72.37], [73.0, 73.84], [75.0, 76.44], [78.0, 79.64], [85.0, 85.08], [89.0, 89.61], [92.0, 94.04], [98.0, 100.75], [107.0, 107.72], [113.0, 113.21], [114.0, 114.47], [116.0, 118.64], [125.0, 124.85], [128.0, 129.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 64.41, 57.09, 0.0, 0.0, 0.0, 40.47, 37.82, 0.0, 55.67, 0.0, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 38.0, 51.55, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 80.11], ["musical instrument", 2.37], ["didgeridoo", 2.33]], [["music", 80.02], ["sampler", 2.26], ["musical instrument", 1.47]], null, null, null, null, null, null, null, null, null, [["speech", 51.33], ["cattle, bovinae", 7.41], ["moo", 6.4]], null, null, null, null, null, null, null], "duration": [1.07, 0.48, 0.51, 3.2, 2.86, 0.97, 1.35, 0.14, 9.52, 8.44, 0.79, 9.34, 0.91, 2.37, 0.84, 1.44, 1.64, 0.08, 0.61, 2.04, 2.75, 0.72, 0.21, 0.47, 2.64, -0.15, 1.74]} \ No newline at end of file diff --git a/annotations_1/HRmLJScvW8M_filtered.json b/annotations_1/HRmLJScvW8M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a0148df50ae03e434478d90edbe4c4f3503adc8 --- /dev/null +++ b/annotations_1/HRmLJScvW8M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 35.87], [38.0, 39.56], [43.0, 44.0], [47.0, 48.83], [50.0, 52.27], [53.0, 62.78], [64.0, 66.12], [68.0, 76.86], [78.0, 80.25], [82.0, 82.63], [86.0, 87.1], [91.0, 91.77], [102.0, 103.17], [118.0, 119.65], [120.0, 122.08], [124.0, 125.98]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [39.54, 0.0, 0.0, 0.0, 83.7, 48.06, 65.32, 39.46, 52.16, 0.0, 0.0, 0.0, 0.0, 0.0, 73.51, 0.0], "audiomae_on_audioset": [[["fly, housefly", 31.34], ["insect", 26.0], ["bee, wasp, etc.", 13.96]], null, null, null, null, [["music", 43.97], ["hum", 9.69], ["mains hum", 5.34]], null, [["speech", 30.64], ["mains hum", 18.98], ["music", 15.61]], null, null, null, null, null, null, null, null], "duration": [3.87, 1.56, 1.0, 1.83, 2.27, 9.78, 2.12, 8.86, 2.25, 0.63, 1.1, 0.77, 1.17, 1.65, 2.08, 1.98]} \ No newline at end of file diff --git a/annotations_1/HSjPTdKWcLA_filtered.json b/annotations_1/HSjPTdKWcLA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1604eabd95ec3a0b9373c203b8d02610e5590177 --- /dev/null +++ b/annotations_1/HSjPTdKWcLA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.13], [9.0, 24.36], [29.0, 60.15], [64.0, 91.89], [94.0, 104.46], [104.0, 104.53], [106.0, 128.28], [130.0, 130.23], [131.0, 133.96], [138.0, 139.23], [144.0, 144.19]], "keep_status": [true, true, false, true, false, false, true, false, true, false, false], "silence_prob": [34.59, 29.75, 0.0, 29.66, 29.38, 0.0, 29.46, 0.0, 46.4, 0.0, 0.0], "audiomae_on_audioset": [[["music", 26.17], ["hum", 20.68], ["mains hum", 16.41]], [["music", 38.51], ["speech", 12.37], ["buzz", 7.77]], null, [["music", 39.52], ["speech", 7.72], ["mains hum", 5.3]], [["hum", 41.35], ["mains hum", 21.75], ["throbbing", 18.0]], null, [["music", 32.19], ["whack, thwack", 5.57], ["electric shaver, electric razor", 4.82]], null, [["speech", 33.77], ["music", 22.99], ["didgeridoo", 7.05]], null, null], "duration": [5.13, 15.36, 31.15, 27.89, 10.46, 0.53, 22.28, 0.23, 2.96, 1.23, 0.19]} \ No newline at end of file diff --git a/annotations_1/HTFjrXA8bFI_filtered.json b/annotations_1/HTFjrXA8bFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dffbcd88cb98e458b6365c4012f96e103adf3e5d --- /dev/null +++ b/annotations_1/HTFjrXA8bFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.07], [25.0, 25.32], [30.0, 30.7], [34.0, 36.95], [37.0, 38.04]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 29.33, 0.0], "audiomae_on_audioset": [null, null, null, [["yodeling", 21.42], ["music", 21.4], ["humming", 15.9]], null], "duration": [0.07, 0.32, 0.7, 2.95, 1.04]} \ No newline at end of file diff --git a/annotations_1/HUKu_iqYDOA_filtered.json b/annotations_1/HUKu_iqYDOA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1930747f08208636f5c3bdfa631a75ffb3108e8 --- /dev/null +++ b/annotations_1/HUKu_iqYDOA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.96], [6.0, 6.83], [12.0, 12.48], [18.0, 18.89], [23.0, 23.9], [30.0, 30.47], [32.0, 33.62], [34.0, 34.37], [35.0, 36.91], [37.0, 40.83], [48.0, 49.22], [49.0, 49.94], [50.0, 50.99], [52.0, 52.42], [54.0, 54.94], [58.0, 58.63], [59.0, 59.95], [61.0, 62.55], [66.0, 66.51], [67.0, 67.86], [70.0, 70.68], [74.0, 75.51], [81.0, 81.94], [87.0, 87.76], [90.0, 90.59], [93.0, 92.91], [98.0, 101.9], [103.0, 103.59], [104.0, 103.69], [105.0, 106.12], [112.0, 112.5], [116.0, 116.65], [118.0, 118.54], [119.0, 119.15], [121.0, 121.34], [124.0, 123.94], [127.0, 127.52], [128.0, 127.63], [128.0, 127.99], [133.0, 133.57], [136.0, 136.7], [137.0, 141.76], [144.0, 145.35], [146.0, 148.37], [149.0, 149.32], [150.0, 151.55], [153.0, 153.67], [157.0, 157.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.73, 0.0, 45.85, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.34], ["sidetone", 4.9], ["radio", 3.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.17], ["speech", 27.0], ["sitar", 3.43]], null, [["speech", 37.65], ["music", 27.18], ["theremin", 6.54]], null, null, null, null], "duration": [0.96, 0.83, 0.48, 0.89, 0.9, 0.47, 1.62, 0.37, 1.91, 3.83, 1.22, 0.94, 0.99, 0.42, 0.94, 0.63, 0.95, 1.55, 0.51, 0.86, 0.68, 1.51, 0.94, 0.76, 0.59, -0.09, 3.9, 0.59, -0.31, 1.12, 0.5, 0.65, 0.54, 0.15, 0.34, -0.06, 0.52, -0.37, -0.01, 0.57, 0.7, 4.76, 1.35, 2.37, 0.32, 1.55, 0.67, 0.76]} \ No newline at end of file diff --git a/annotations_1/HUPoWdZ1ZdQ_filtered.json b/annotations_1/HUPoWdZ1ZdQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..400538a85177c6cdc7b9c5d938747f40e7a41b65 --- /dev/null +++ b/annotations_1/HUPoWdZ1ZdQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 30.94], [38.0, 38.99], [39.0, 46.48], [53.0, 59.53], [64.0, 64.3], [66.0, 76.74], [78.0, 79.1], [81.0, 85.95], [89.0, 89.5], [91.0, 92.52], [94.0, 94.98], [97.0, 105.41], [107.0, 110.52], [111.0, 113.31]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 32.34, 55.11, 0.0, 68.93, 0.0, 81.0, 0.0, 0.0, 0.0, 88.83, 47.58, 43.96], "audiomae_on_audioset": [null, null, [["speech", 28.66], ["music", 9.97], ["mosquito", 6.93]], null, null, null, null, null, null, null, null, null, [["music", 55.58], ["hum", 4.16], ["electronic music", 3.49]], [["throbbing", 16.34], ["music", 12.83], ["hum", 9.6]]], "duration": [-0.06, 0.99, 7.48, 6.53, 0.3, 10.74, 1.1, 4.95, 0.5, 1.52, 0.98, 8.41, 3.52, 2.31]} \ No newline at end of file diff --git a/annotations_1/HVgu-41adSY_filtered.json b/annotations_1/HVgu-41adSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae32eab2cb8f6fb18a23d38359fa4d34d4408d4a --- /dev/null +++ b/annotations_1/HVgu-41adSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.47], [21.0, 22.89], [24.0, 33.66], [34.0, 35.4], [37.0, 99.47], [100.0, 102.98], [105.0, 108.06], [112.0, 111.72], [113.0, 116.51], [117.0, 119.47], [120.0, 121.71], [124.0, 126.64], [127.0, 139.21], [139.0, 139.46], [139.0, 147.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 95.91, 0.0, 0.0, 95.51, 89.19, 0.0, 52.62, 91.47, 0.0, 96.54, 75.72, 0.0, 58.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.47, 1.89, 9.66, 1.4, 62.47, 2.98, 3.06, -0.28, 3.51, 2.47, 1.71, 2.64, 12.21, 0.46, 8.83]} \ No newline at end of file diff --git a/annotations_1/HVlrXQ3qWqo_filtered.json b/annotations_1/HVlrXQ3qWqo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc64c309165a54062a104bd234fcc7f47cd4fd25 --- /dev/null +++ b/annotations_1/HVlrXQ3qWqo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.41], [5.0, 5.68], [12.0, 12.55], [16.0, 16.06], [26.0, 26.47], [38.0, 38.69], [45.0, 45.67], [67.0, 66.77], [78.0, 77.7], [81.0, 82.81], [85.0, 85.85], [89.0, 91.35], [93.0, 96.4], [97.0, 99.0], [100.0, 100.4], [108.0, 107.86], [109.0, 108.89], [112.0, 113.49], [114.0, 114.62], [115.0, 115.05], [116.0, 116.55], [118.0, 118.86], [123.0, 124.26], [127.0, 127.87], [132.0, 132.68], [136.0, 135.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.33, 73.36, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 76.94], ["throbbing", 3.69], ["synthesizer", 2.7]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, 0.68, 0.55, 0.06, 0.47, 0.69, 0.67, -0.23, -0.3, 1.81, 0.85, 2.35, 3.4, 2.0, 0.4, -0.14, -0.11, 1.49, 0.62, 0.05, 0.55, 0.86, 1.26, 0.87, 0.68, -0.01]} \ No newline at end of file diff --git a/annotations_1/HXmru6NrSAY_filtered.json b/annotations_1/HXmru6NrSAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76a7e41bc72fd96732509d8400179655cd064416 --- /dev/null +++ b/annotations_1/HXmru6NrSAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.99], [11.0, 15.5], [17.0, 16.95], [17.0, 17.0], [20.0, 22.0], [24.0, 26.91], [29.0, 31.38], [34.0, 36.44], [38.0, 40.91], [43.0, 170.19], [170.0, 171.36], [172.0, 171.64], [172.0, 201.12], [204.0, 204.94], [208.0, 221.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 77.2, 0.0, 0.0, 99.59, 88.28, 98.73, 99.59, 79.24, 0.0, 0.0, 0.0, 100.0, 0.0, 57.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.99, 4.5, -0.05, 0.0, 2.0, 2.91, 2.38, 2.44, 2.91, 127.19, 1.36, -0.36, 29.12, 0.94, 13.37]} \ No newline at end of file diff --git a/annotations_1/HXubLg3o3qY_filtered.json b/annotations_1/HXubLg3o3qY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23845bf06fc5edff7e29b8952ac2816e6daec047 --- /dev/null +++ b/annotations_1/HXubLg3o3qY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.25], [7.0, 10.5], [11.0, 13.63], [14.0, 17.58], [18.0, 22.69], [26.0, 35.06], [35.0, 105.07], [106.0, 123.47], [124.0, 129.3], [133.0, 133.25]], "keep_status": [false, false, false, true, false, false, false, false, false, false], "silence_prob": [99.48, 99.97, 95.37, 49.87, 59.33, 46.97, 0.0, 32.97, 29.29, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 40.18], ["music", 21.19], ["electronic music", 6.65]], null, [["hum", 27.99], ["mains hum", 27.88], ["speech", 17.43]], null, [["music", 51.48], ["ambient music", 10.43], ["theremin", 8.83]], [["machine gun", 71.15], ["gunshot, gunfire", 22.5], ["speech", 3.41]], null], "duration": [4.25, 3.5, 2.63, 3.58, 4.69, 9.06, 70.07, 17.47, 5.3, 0.25]} \ No newline at end of file diff --git a/annotations_1/HYWSAtLFgXg_filtered.json b/annotations_1/HYWSAtLFgXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ebda0e4d0d95cc3d7b93a08c59423068ba92b61 --- /dev/null +++ b/annotations_1/HYWSAtLFgXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.48], [8.0, 8.34], [12.0, 13.05], [17.0, 18.05], [23.0, 23.9], [25.0, 30.57], [32.0, 55.27], [59.0, 100.63], [102.0, 102.96], [103.0, 104.36], [105.0, 117.56], [122.0, 122.71], [124.0, 125.9]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.26, 29.52, 0.0, 0.0, 0.0, 33.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 56.17], ["musical instrument", 7.12], ["effects unit", 4.22]], [["music", 90.45], ["guitar", 1.54], ["musical instrument", 1.37]], null, null, null, [["hum", 18.95], ["mains hum", 17.25], ["speech", 16.84]], null, null], "duration": [0.48, 0.34, 1.05, 1.05, 0.9, 5.57, 23.27, 41.63, 0.96, 1.36, 12.56, 0.71, 1.9]} \ No newline at end of file diff --git a/annotations_1/HYctFVhe2Rc_filtered.json b/annotations_1/HYctFVhe2Rc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ede510b8d8456563dcab9f1e5d762048424af68c --- /dev/null +++ b/annotations_1/HYctFVhe2Rc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 48.51], [52.0, 56.24], [58.0, 59.31], [65.0, 65.26], [73.0, 88.5]], "keep_status": [false, false, false, false, false], "silence_prob": [30.61, 30.39, 0.0, 0.0, 30.42], "audiomae_on_audioset": [[["music", 64.61], ["theremin", 6.07], ["didgeridoo", 5.18]], [["music", 60.69], ["throbbing", 9.75], ["theremin", 7.64]], null, null, [["music", 65.63], ["didgeridoo", 6.12], ["musical instrument", 3.7]]], "duration": [21.51, 4.24, 1.31, 0.26, 15.5]} \ No newline at end of file diff --git a/annotations_1/HYog4UvM1zI_filtered.json b/annotations_1/HYog4UvM1zI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd945907eda8d45126a4fc5e2000f567830785a2 --- /dev/null +++ b/annotations_1/HYog4UvM1zI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.77], [11.0, 12.65], [16.0, 16.58], [20.0, 41.89], [43.0, 84.79], [86.0, 112.5], [115.0, 117.48], [118.0, 120.01], [121.0, 126.57], [127.0, 164.44], [164.0, 173.7], [175.0, 175.53]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.95, 0.0, 30.01, 31.54, 35.78, 31.29, 0.0, 29.48, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 43.14], ["throbbing", 26.95], ["hum", 11.41]], null, [["throbbing", 36.73], ["music", 20.68], ["hum", 16.5]], [["music", 62.41], ["throbbing", 12.48], ["hum", 6.0]], [["hum", 27.95], ["music", 24.25], ["throbbing", 16.24]], [["music", 20.41], ["hum", 17.73], ["whack, thwack", 14.37]], null, [["hum", 63.66], ["mains hum", 13.17], ["music", 7.33]], null], "duration": [0.77, 1.65, 0.58, 21.89, 41.79, 26.5, 2.48, 2.01, 5.57, 37.44, 9.7, 0.53]} \ No newline at end of file diff --git a/annotations_1/HYqSugRiG5Y_filtered.json b/annotations_1/HYqSugRiG5Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78064fc1b0d7469719adc4994fb7cb724faad176 --- /dev/null +++ b/annotations_1/HYqSugRiG5Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.44], [8.0, 8.29], [14.0, 20.71], [24.0, 25.12], [29.0, 31.06], [33.0, 35.33], [38.0, 37.81], [40.0, 41.54], [43.0, 44.54], [46.0, 48.22], [49.0, 51.44], [52.0, 58.75], [60.0, 62.7], [64.0, 67.81], [68.0, 72.54], [77.0, 78.17], [80.0, 81.24], [83.0, 84.08], [85.0, 85.92], [87.0, 87.25], [88.0, 89.02], [91.0, 91.44], [97.0, 98.69], [108.0, 111.86], [114.0, 117.59], [123.0, 124.73], [126.0, 138.89], [141.0, 144.36], [148.0, 149.67]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [51.66, 0.0, 33.71, 0.0, 46.54, 46.19, 0.0, 0.0, 0.0, 54.97, 54.1, 54.23, 44.07, 40.92, 45.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.03, 37.04, 0.0, 30.74, 35.33, 0.0], "audiomae_on_audioset": [null, null, [["music", 58.4], ["synthesizer", 7.81], ["musical instrument", 4.69]], null, [["music", 37.24], ["hum", 8.2], ["throbbing", 5.14]], [["music", 62.76], ["hum", 6.71], ["ambient music", 3.7]], null, null, null, null, null, null, [["speech", 19.63], ["music", 16.03], ["sidetone", 10.92]], [["hum", 25.59], ["music", 11.79], ["mains hum", 8.88]], [["speech", 52.12], ["hum", 7.37], ["caw", 4.3]], null, null, null, null, null, null, null, null, null, [["whimper", 21.6], ["music", 10.44], ["speech", 8.6]], null, [["music", 52.96], ["synthesizer", 20.33], ["musical instrument", 4.59]], [["music", 24.63], ["hum", 18.35], ["throbbing", 7.06]], null], "duration": [2.44, 0.29, 6.71, 1.12, 2.06, 2.33, -0.19, 1.54, 1.54, 2.22, 2.44, 6.75, 2.7, 3.81, 4.54, 1.17, 1.24, 1.08, 0.92, 0.25, 1.02, 0.44, 1.69, 3.86, 3.59, 1.73, 12.89, 3.36, 1.67]} \ No newline at end of file diff --git a/annotations_1/HYzSQZdBWVQ_filtered.json b/annotations_1/HYzSQZdBWVQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e07ba3053b12f36e4d83a6b1475246359b539dfd --- /dev/null +++ b/annotations_1/HYzSQZdBWVQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.84], [9.0, 13.09], [18.0, 19.84], [24.0, 28.43], [30.0, 30.99], [35.0, 36.75], [38.0, 38.58], [39.0, 41.08], [42.0, 43.44], [69.0, 72.96], [74.0, 75.78], [80.0, 80.16], [82.0, 81.97], [88.0, 88.99]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [56.55, 61.57, 0.0, 64.97, 0.0, 0.0, 0.0, 35.06, 0.0, 70.86, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 45.46], ["sine wave", 12.91], ["chirp tone", 7.26]], null, null, null, null, null, null], "duration": [5.84, 4.09, 1.84, 4.43, 0.99, 1.75, 0.58, 2.08, 1.44, 3.96, 1.78, 0.16, -0.03, 0.99]} \ No newline at end of file diff --git a/annotations_1/HZQlFhnFVjg_filtered.json b/annotations_1/HZQlFhnFVjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fe33d57bb2ebc90d93451a9b116964856d518ee --- /dev/null +++ b/annotations_1/HZQlFhnFVjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.14], [12.0, 13.22], [17.0, 17.09], [18.0, 18.45], [20.0, 21.74], [25.0, 25.66], [28.0, 28.78], [32.0, 32.71], [35.0, 36.21], [37.0, 37.94], [39.0, 39.97], [42.0, 42.15], [48.0, 48.32], [50.0, 51.61], [53.0, 54.31], [56.0, 56.12], [58.0, 58.75], [62.0, 63.48], [64.0, 86.7], [88.0, 87.99], [91.0, 147.41], [150.0, 156.14], [160.0, 161.82], [173.0, 173.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.43, 0.0, 0.0, 31.33, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 61.14], ["throbbing", 11.1], ["hum", 10.29]], null, null, [["music", 34.37], ["hum", 13.13], ["mains hum", 12.55]], null, null], "duration": [1.14, 1.22, 0.09, 0.45, 1.74, 0.66, 0.78, 0.71, 1.21, 0.94, 0.97, 0.15, 0.32, 1.61, 1.31, 0.12, 0.75, 1.48, 22.7, -0.01, 56.41, 6.14, 1.82, 0.26]} \ No newline at end of file diff --git a/annotations_1/H_pmwvIvi9Q_filtered.json b/annotations_1/H_pmwvIvi9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7aa395f970253c2bfd2d33e7c679332ba5a3b23 --- /dev/null +++ b/annotations_1/H_pmwvIvi9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.56], [27.0, 27.78], [31.0, 31.01], [31.0, 34.45], [38.0, 38.58], [41.0, 40.73], [41.0, 42.94], [44.0, 44.63], [48.0, 49.92], [50.0, 51.09], [56.0, 56.51], [57.0, 65.79], [67.0, 71.02], [84.0, 84.74], [89.0, 90.69], [91.0, 91.77], [93.0, 93.26], [94.0, 93.93], [95.0, 94.73], [103.0, 105.51], [121.0, 121.96], [127.0, 127.18], [128.0, 128.43], [131.0, 131.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 52.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.74, 37.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 60.54], ["foghorn", 11.33], ["sine wave", 4.13]], [["music", 65.6], ["throbbing", 7.3], ["hum", 2.82]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 0.78, 0.01, 3.45, 0.58, -0.27, 1.94, 0.63, 1.92, 1.09, 0.51, 8.79, 4.02, 0.74, 1.69, 0.77, 0.26, -0.07, -0.27, 2.51, 0.96, 0.18, 0.43, 0.38]} \ No newline at end of file diff --git a/annotations_1/H_sYBmKxmvs_filtered.json b/annotations_1/H_sYBmKxmvs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eef0a9097197c16aecc1d62af814b73e302db8f8 --- /dev/null +++ b/annotations_1/H_sYBmKxmvs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.48], [7.0, 9.66]], "keep_status": [false, true], "silence_prob": [0.0, 38.59], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 26.8], ["cattle, bovinae", 21.96], ["moo", 15.45]]], "duration": [0.48, 2.66]} \ No newline at end of file diff --git a/annotations_1/HavLrFJcqMs_filtered.json b/annotations_1/HavLrFJcqMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4349396d17a17056ed2aa116f89b9ea31e4df08b --- /dev/null +++ b/annotations_1/HavLrFJcqMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.47], [19.0, 38.55], [40.0, 42.82], [44.0, 44.61], [46.0, 46.63], [47.0, 47.97], [49.0, 49.67], [51.0, 52.15], [56.0, 56.79], [58.0, 59.24], [61.0, 61.48], [63.0, 64.35], [66.0, 66.88], [68.0, 68.37], [70.0, 81.85]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [31.24, 36.68, 55.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.93], "audiomae_on_audioset": [[["thump, thud", 27.45], ["speech", 20.11], ["crowd", 5.12]], [["crowd", 17.72], ["fly, housefly", 13.1], ["speech", 9.37]], null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 21.39], ["hum", 18.99], ["mains hum", 15.66]]], "duration": [8.47, 19.55, 2.82, 0.61, 0.63, 0.97, 0.67, 1.15, 0.79, 1.24, 0.48, 1.35, 0.88, 0.37, 11.85]} \ No newline at end of file diff --git a/annotations_1/Hb8I1My6zOM_filtered.json b/annotations_1/Hb8I1My6zOM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef3c75e4306db9ba2a8d4755ff4f1b4f7a766fe2 --- /dev/null +++ b/annotations_1/Hb8I1My6zOM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.43], [3.0, 3.97], [13.0, 13.68], [14.0, 16.66], [18.0, 18.45], [22.0, 21.96], [24.0, 24.6], [25.0, 25.52], [29.0, 74.07], [76.0, 84.21], [88.0, 89.06], [92.0, 92.38], [95.0, 97.48], [97.0, 97.51], [99.0, 106.25], [109.0, 109.54], [111.0, 111.23], [112.0, 112.48], [113.0, 119.48], [126.0, 134.16], [135.0, 135.95], [141.0, 141.39], [142.0, 142.59], [149.0, 149.76], [153.0, 153.44], [154.0, 155.09]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.08, 0.0, 0.0, 0.0, 0.0, 0.0, 36.96, 0.0, 0.0, 41.76, 0.0, 30.12, 0.0, 0.0, 0.0, 28.69, 30.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["livestock, farm animals, working animals", 19.38], ["speech", 17.11], ["cattle, bovinae", 16.76]], null, null, null, null, null, [["music", 80.14], ["throbbing", 2.37], ["synthesizer", 1.28]], null, null, [["speech", 38.3], ["music", 6.59], ["hum", 4.74]], null, [["music", 51.77], ["synthesizer", 8.18], ["livestock, farm animals, working animals", 3.93]], null, null, null, [["music", 33.97], ["speech", 10.28], ["didgeridoo", 5.41]], [["music", 56.87], ["hum", 7.25], ["throbbing", 5.42]], null, null, null, null, null, null], "duration": [1.43, 0.97, 0.68, 2.66, 0.45, -0.04, 0.6, 0.52, 45.07, 8.21, 1.06, 0.38, 2.48, 0.51, 7.25, 0.54, 0.23, 0.48, 6.48, 8.16, 0.95, 0.39, 0.59, 0.76, 0.44, 1.09]} \ No newline at end of file diff --git a/annotations_1/HbWD-eclNf4_filtered.json b/annotations_1/HbWD-eclNf4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9b442495b887f893a51e8d7d1c8395f935c664a --- /dev/null +++ b/annotations_1/HbWD-eclNf4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.63], [28.0, 28.26], [29.0, 34.45], [41.0, 48.64], [56.0, 67.12], [79.0, 84.69], [87.0, 88.7], [90.0, 93.93], [95.0, 101.09], [105.0, 105.41], [105.0, 105.46], [105.0, 109.32], [123.0, 125.22], [126.0, 126.45], [127.0, 131.19], [133.0, 133.74], [137.0, 138.55], [141.0, 142.64], [145.0, 145.45]], "keep_status": [false, false, false, true, false, false, false, true, true, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 29.69, 36.19, 37.96, 43.64, 0.0, 44.66, 34.28, 0.0, 0.0, 31.26, 31.83, 0.0, 30.18, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 69.38], ["throbbing", 4.37], ["didgeridoo", 4.21]], [["speech", 32.47], ["whack, thwack", 9.46], ["hum", 8.1]], [["speech", 45.64], ["hum", 21.16], ["music", 10.07]], [["music", 71.93], ["synthesizer", 11.32], ["musical instrument", 4.24]], null, [["music", 39.68], ["mains hum", 9.91], ["musical instrument", 5.14]], [["hum", 17.92], ["theremin", 15.29], ["fly, housefly", 14.5]], null, null, [["sidetone", 45.03], ["didgeridoo", 26.79], ["music", 10.86]], [["cattle, bovinae", 12.26], ["moo", 12.18], ["animal", 11.91]], null, [["speech", 51.9], ["groan", 10.76], ["whack, thwack", 6.92]], null, null, null, null], "duration": [0.63, 0.26, 5.45, 7.64, 11.12, 5.69, 1.7, 3.93, 6.09, 0.41, 0.46, 4.32, 2.22, 0.45, 4.19, 0.74, 1.55, 1.64, 0.45]} \ No newline at end of file diff --git a/annotations_1/HbgLp9_yU_c_filtered.json b/annotations_1/HbgLp9_yU_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05168e9598ef71f4e36e04cef6094e3e207984ec --- /dev/null +++ b/annotations_1/HbgLp9_yU_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.49], [10.0, 15.53], [19.0, 52.3], [53.0, 53.69], [61.0, 65.75], [67.0, 88.5]], "keep_status": [false, true, false, false, true, true], "silence_prob": [0.0, 29.45, 0.0, 0.0, 28.47, 28.27], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 22.65], ["insect", 14.93], ["fly, housefly", 13.52]], null, null, [["speech", 28.46], ["music", 13.99], ["fly, housefly", 5.32]], [["music", 50.79], ["livestock, farm animals, working animals", 9.62], ["cattle, bovinae", 8.29]]], "duration": [0.49, 5.53, 33.3, 0.69, 4.75, 21.5]} \ No newline at end of file diff --git a/annotations_1/HcGpEScyT5o_filtered.json b/annotations_1/HcGpEScyT5o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67595d62e63f4f7f5389b1102258d2cc7e756c1b --- /dev/null +++ b/annotations_1/HcGpEScyT5o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.15], [5.0, 6.94], [7.0, 7.5], [8.0, 10.3], [11.0, 12.01], [22.0, 23.35], [31.0, 32.63], [39.0, 39.99], [41.0, 47.58], [48.0, 50.38], [51.0, 51.65], [53.0, 52.89], [55.0, 64.29], [66.0, 79.49], [82.0, 113.44], [114.0, 114.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [63.96, 0.0, 0.0, 61.77, 0.0, 0.0, 0.0, 0.0, 42.86, 41.01, 0.0, 0.0, 35.11, 41.12, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 58.54], ["musical instrument", 7.48], ["guitar", 4.27]], [["music", 69.26], ["musical instrument", 7.65], ["didgeridoo", 4.7]], null, null, [["music", 74.66], ["musical instrument", 7.0], ["electronic music", 3.28]], [["music", 58.4], ["musical instrument", 6.33], ["electronic music", 5.8]], null, null], "duration": [2.15, 1.94, 0.5, 2.3, 1.01, 1.35, 1.63, 0.99, 6.58, 2.38, 0.65, -0.11, 9.29, 13.49, 31.44, 0.52]} \ No newline at end of file diff --git a/annotations_1/HceqAAw60vQ_filtered.json b/annotations_1/HceqAAw60vQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4ccefe13b7b5dec761a411a9b71065d8900d5a8 --- /dev/null +++ b/annotations_1/HceqAAw60vQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [3.0, 3.1], [6.0, 6.25], [13.0, 19.06], [21.0, 24.88], [31.0, 32.14], [36.0, 37.93], [40.0, 40.14], [41.0, 41.71], [42.0, 44.05], [45.0, 46.48], [49.0, 49.99], [65.0, 65.57], [80.0, 80.27], [84.0, 84.42], [94.0, 95.07], [97.0, 102.41], [104.0, 109.27], [120.0, 121.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 62.27, 69.34, 0.0, 0.0, 0.0, 0.0, 46.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.5, 48.91, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 30.69], ["throbbing", 27.89], ["music", 12.07]], null, null, null, null, null, null, null, [["music", 50.21], ["hum", 14.45], ["throbbing", 12.06]], null], "duration": [0.48, 0.1, 0.25, 6.06, 3.88, 1.14, 1.93, 0.14, 0.71, 2.05, 1.48, 0.99, 0.57, 0.27, 0.42, 1.07, 5.41, 5.27, 1.68]} \ No newline at end of file diff --git a/annotations_1/HcpDdWIaAuE_filtered.json b/annotations_1/HcpDdWIaAuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24714829ba5de78ed6df07b37f81bd7a9c920d3b --- /dev/null +++ b/annotations_1/HcpDdWIaAuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.8], [40.0, 41.64], [45.0, 45.47], [47.0, 48.47], [57.0, 59.14], [65.0, 65.89], [70.0, 71.47], [72.0, 73.85], [75.0, 76.64], [96.0, 107.74], [111.0, 112.82], [119.0, 119.58], [122.0, 123.55], [131.0, 133.35], [135.0, 136.54]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.69, 0.0, 0.0, 0.0, 0.0, 31.57, 0.0, 0.0, 0.0, 39.18, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 41.25], ["musical instrument", 7.81], ["brass instrument", 4.73]], null, null, null, null, [["music", 77.14], ["musical instrument", 3.03], ["effects unit", 2.68]], null, null, null, [["music", 51.76], ["theremin", 10.45], ["musical instrument", 3.9]], null], "duration": [0.8, 1.64, 0.47, 1.47, 2.14, 0.89, 1.47, 1.85, 1.64, 11.74, 1.82, 0.58, 1.55, 2.35, 1.54]} \ No newline at end of file diff --git a/annotations_1/HeRIwSpHZCk_filtered.json b/annotations_1/HeRIwSpHZCk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bf421bade6bd7989b6921cc200d302396942ea6 --- /dev/null +++ b/annotations_1/HeRIwSpHZCk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.78], [16.0, 16.8], [19.0, 19.23], [32.0, 32.04], [36.0, 37.02], [45.0, 45.49], [46.0, 46.67], [52.0, 52.17], [76.0, 76.59], [106.0, 107.15], [115.0, 116.46], [117.0, 118.29], [119.0, 119.55], [120.0, 120.34], [122.0, 122.07], [123.0, 122.81], [132.0, 132.43], [141.0, 148.59], [149.0, 150.2], [164.0, 164.94], [165.0, 168.42], [169.0, 172.2], [173.0, 174.36]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [36.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.36, 0.0, 0.0, 29.66, 29.21, 0.0], "audiomae_on_audioset": [[["hum", 27.54], ["throbbing", 16.3], ["mains hum", 11.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 40.13], ["noise", 24.11], ["mains hum", 18.3]], null, null, [["speech", 29.32], ["sidetone", 15.76], ["rumble", 15.24]], [["hum", 16.83], ["rumble", 14.75], ["noise", 12.32]], null], "duration": [2.78, 0.8, 0.23, 0.04, 1.02, 0.49, 0.67, 0.17, 0.59, 1.15, 1.46, 1.29, 0.55, 0.34, 0.07, -0.19, 0.43, 7.59, 1.2, 0.94, 3.42, 3.2, 1.36]} \ No newline at end of file diff --git a/annotations_1/HfEjIU7Qbj8_filtered.json b/annotations_1/HfEjIU7Qbj8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b7fba34854bc9dc4108e48d9586887c55d63bc0 --- /dev/null +++ b/annotations_1/HfEjIU7Qbj8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.21], [2.0, 2.56], [4.0, 4.97], [11.0, 13.81], [16.0, 16.16], [25.0, 26.65], [27.0, 29.03], [37.0, 38.57], [40.0, 42.3], [43.0, 43.11], [45.0, 46.62], [49.0, 50.03], [55.0, 56.27], [62.0, 62.02], [74.0, 73.74], [76.0, 76.08], [87.0, 88.1], [90.0, 91.56], [93.0, 93.7], [95.0, 95.28], [95.0, 96.5], [99.0, 101.17], [102.0, 102.76], [104.0, 109.39], [112.0, 115.53], [116.0, 117.69], [119.0, 123.77], [125.0, 130.72], [132.0, 133.88], [134.0, 146.11], [148.0, 148.96], [150.0, 150.74], [152.0, 152.83], [155.0, 155.68], [157.0, 157.87], [162.0, 161.7], [167.0, 169.38], [170.0, 186.7], [188.0, 189.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 92.31, 0.0, 0.0, 99.8, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 88.46, 99.26, 0.0, 85.54, 31.17, 0.0, 57.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 36.02, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.49], ["hum", 26.99], ["mains hum", 11.19]], null, null, null, null, null, null, null, null, null, [["speech", 32.92], ["music", 17.91], ["hum", 11.33]], null], "duration": [0.21, 0.56, 0.97, 2.81, 0.16, 1.65, 2.03, 1.57, 2.3, 0.11, 1.62, 1.03, 1.27, 0.02, -0.26, 0.08, 1.1, 1.56, 0.7, 0.28, 1.5, 2.17, 0.76, 5.39, 3.53, 1.69, 4.77, 5.72, 1.88, 12.11, 0.96, 0.74, 0.83, 0.68, 0.87, -0.3, 2.38, 16.7, 1.16]} \ No newline at end of file diff --git a/annotations_1/HfFM7RZ5GxI_filtered.json b/annotations_1/HfFM7RZ5GxI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc7598ce2f076444f284a0f9ccbf338ad66fb346 --- /dev/null +++ b/annotations_1/HfFM7RZ5GxI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.48], [7.0, 7.59], [10.0, 13.59], [18.0, 26.28], [28.0, 59.22], [64.0, 89.72], [92.0, 168.0], [169.0, 170.02], [171.0, 170.7]], "keep_status": [true, false, false, false, false, false, false, false, false], "silence_prob": [38.26, 0.0, 31.63, 31.69, 0.0, 36.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 47.5], ["music", 9.15], ["whale vocalization", 7.45]], null, [["music", 81.69], ["throbbing", 10.74], ["hum", 1.22]], [["music", 79.16], ["throbbing", 7.08], ["synthesizer", 3.72]], null, [["music", 57.26], ["synthesizer", 12.54], ["electronic music", 5.89]], null, null, null], "duration": [4.48, 0.59, 3.59, 8.28, 31.22, 25.72, 76.0, 1.02, -0.3]} \ No newline at end of file diff --git a/annotations_1/HfgFZz6gCOM_filtered.json b/annotations_1/HfgFZz6gCOM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b68b184cf57d2ee56a74ef54a0caee40cce0b178 --- /dev/null +++ b/annotations_1/HfgFZz6gCOM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.98], [10.0, 12.14], [13.0, 14.57], [15.0, 16.04], [18.0, 18.32], [20.0, 28.04], [32.0, 37.76], [39.0, 39.73], [47.0, 52.49], [54.0, 54.78], [56.0, 57.0], [58.0, 58.56], [59.0, 71.52], [75.0, 74.73], [75.0, 77.13], [78.0, 83.88], [87.0, 94.02], [107.0, 111.37], [121.0, 125.12]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, true, false, false], "silence_prob": [51.94, 48.02, 0.0, 0.0, 0.0, 47.35, 49.59, 0.0, 42.3, 0.0, 0.0, 0.0, 47.5, 0.0, 45.65, 67.0, 37.34, 32.69, 30.21], "audiomae_on_audioset": [null, [["speech", 60.66], ["radio", 13.32], ["hum", 2.65]], null, null, null, [["music", 63.27], ["speech", 10.48], ["electronic music", 3.17]], [["music", 40.74], ["throbbing", 14.27], ["speech", 14.06]], null, [["speech", 31.75], ["music", 30.9], ["hum", 4.7]], null, null, null, [["speech", 37.2], ["music", 13.86], ["hum", 12.69]], null, [["throbbing", 39.68], ["hum", 22.54], ["music", 16.73]], null, [["music", 27.49], ["speech", 15.76], ["didgeridoo", 5.4]], [["speech", 59.65], ["music", 23.48], ["synthesizer", 5.46]], [["music", 88.29], ["carnatic music", 3.36], ["didgeridoo", 1.8]]], "duration": [3.98, 2.14, 1.57, 1.04, 0.32, 8.04, 5.76, 0.73, 5.49, 0.78, 1.0, 0.56, 12.52, -0.27, 2.13, 5.88, 7.02, 4.37, 4.12]} \ No newline at end of file diff --git a/annotations_1/HgQDAW28DsA_filtered.json b/annotations_1/HgQDAW28DsA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c17f4c4acfb6227aac8e907e894b5b43004353b --- /dev/null +++ b/annotations_1/HgQDAW28DsA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.19], [5.0, 5.78], [6.0, 9.85], [11.0, 13.81], [15.0, 15.79], [18.0, 19.03], [22.0, 23.36], [24.0, 26.27], [30.0, 31.45], [32.0, 32.8], [34.0, 35.24], [40.0, 42.21], [43.0, 44.42], [45.0, 48.34], [49.0, 59.53], [60.0, 63.44], [64.0, 66.56], [68.0, 69.25], [73.0, 74.09], [75.0, 79.42], [80.0, 81.73], [83.0, 83.51], [84.0, 86.34], [87.0, 91.29], [92.0, 97.63], [102.0, 102.81], [103.0, 103.0], [103.0, 105.17], [106.0, 107.62], [109.0, 117.98], [120.0, 122.71], [124.0, 127.08], [128.0, 148.47]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 40.88, 78.38, 0.0, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.56, 99.71, 100.0, 99.73, 0.0, 0.0, 99.99, 0.0, 0.0, 95.23, 98.73, 91.81, 0.0, 0.0, 61.97, 0.0, 99.97, 89.54, 100.0, 98.73], "audiomae_on_audioset": [null, null, [["speech", 36.0], ["hum", 16.24], ["mains hum", 8.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.19, 0.78, 3.85, 2.81, 0.79, 1.03, 1.36, 2.27, 1.45, 0.8, 1.24, 2.21, 1.42, 3.34, 10.53, 3.44, 2.56, 1.25, 1.09, 4.42, 1.73, 0.51, 2.34, 4.29, 5.63, 0.81, 0.0, 2.17, 1.62, 8.98, 2.71, 3.08, 20.47]} \ No newline at end of file diff --git a/annotations_1/Hgee-O7ZAnY_filtered.json b/annotations_1/Hgee-O7ZAnY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6c22c90c1636c25918b98988c15f54310e4082a --- /dev/null +++ b/annotations_1/Hgee-O7ZAnY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.01], [5.0, 5.27], [6.0, 7.43], [16.0, 16.6], [33.0, 33.1], [37.0, 44.83], [48.0, 48.79], [51.0, 55.59], [61.0, 61.37], [67.0, 75.29], [75.0, 76.42], [81.0, 81.3], [83.0, 83.78], [88.0, 87.99], [102.0, 102.46], [104.0, 104.58], [105.0, 111.57], [112.0, 113.46], [119.0, 119.15], [120.0, 126.77], [133.0, 133.96], [135.0, 135.51], [136.0, 137.86], [141.0, 141.84], [150.0, 149.81], [153.0, 152.83], [154.0, 154.8]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.49, 0.0, 88.46, 0.0, 30.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 35.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 19.79], ["speech", 18.8], ["electric shaver, electric razor", 14.61]], null, null, null, [["moo", 30.23], ["cattle, bovinae", 19.78], ["speech", 13.05]], null, null, null, null, null, null, null, null, null, [["speech", 71.82], ["horse", 2.65], ["crowd", 1.87]], null, null, null, null, null, null, null], "duration": [0.01, 0.27, 1.43, 0.6, 0.1, 7.83, 0.79, 4.59, 0.37, 8.29, 1.42, 0.3, 0.78, -0.01, 0.46, 0.58, 6.57, 1.46, 0.15, 6.77, 0.96, 0.51, 1.86, 0.84, -0.19, -0.17, 0.8]} \ No newline at end of file diff --git a/annotations_1/HhmpYA22oio_filtered.json b/annotations_1/HhmpYA22oio_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..352809d0c1db4d74c4b4246bf24ccc9f33ee6aa0 --- /dev/null +++ b/annotations_1/HhmpYA22oio_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 17.83], [21.0, 21.54], [24.0, 30.1], [34.0, 37.54], [41.0, 49.13], [50.0, 55.85], [62.0, 66.6], [71.0, 72.1], [75.0, 75.09], [78.0, 78.11], [83.0, 83.57], [84.0, 91.35], [94.0, 108.67], [111.0, 113.43], [114.0, 115.92], [126.0, 128.66], [130.0, 150.11], [151.0, 150.94], [151.0, 152.27], [153.0, 156.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [29.81, 0.0, 30.37, 32.61, 29.74, 31.36, 30.82, 0.0, 0.0, 0.0, 0.0, 30.33, 32.12, 35.54, 0.0, 45.27, 41.18, 0.0, 0.0, 50.11], "audiomae_on_audioset": [[["music", 47.09], ["speech", 31.32], ["sampler", 2.73]], null, [["music", 69.97], ["speech", 7.42], ["throbbing", 4.65]], [["music", 64.19], ["cacophony", 5.21], ["throbbing", 3.9]], [["music", 49.73], ["speech", 36.29], ["applause", 7.61]], [["music", 73.55], ["speech", 9.92], ["applause", 4.34]], [["music", 64.18], ["electronic music", 3.47], ["echo", 2.93]], null, null, null, null, [["music", 66.11], ["hum", 5.85], ["mains hum", 5.56]], [["music", 67.6], ["hum", 7.13], ["mains hum", 3.0]], [["speech", 76.11], ["music", 5.06], ["hum", 2.39]], null, [["hum", 30.76], ["throbbing", 20.23], ["music", 16.72]], [["music", 55.37], ["throbbing", 9.41], ["synthesizer", 8.43]], null, null, null], "duration": [13.83, 0.54, 6.1, 3.54, 8.13, 5.85, 4.6, 1.1, 0.09, 0.11, 0.57, 7.35, 14.67, 2.43, 1.92, 2.66, 20.11, -0.06, 1.27, 3.2]} \ No newline at end of file diff --git a/annotations_1/Hi93mYJyO8I_filtered.json b/annotations_1/Hi93mYJyO8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a1c4b2a61d9cfd5195495cf6a7f634b4d2ebb3c --- /dev/null +++ b/annotations_1/Hi93mYJyO8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.33], [8.0, 10.47], [13.0, 13.49], [33.0, 35.58], [39.0, 40.44], [43.0, 44.12], [46.0, 46.35], [47.0, 47.85], [49.0, 49.23], [51.0, 52.15], [57.0, 57.77], [60.0, 61.25], [63.0, 65.8], [71.0, 75.29]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 37.19, 0.0, 35.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.6, 42.91], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 30.2], ["cattle, bovinae", 13.46], ["moo", 13.27]], null, [["radio", 22.31], ["fly, housefly", 8.99], ["speech", 8.13]], null, null, null, null, null, null, null, null, [["speech", 20.92], ["livestock, farm animals, working animals", 12.9], ["sheep", 11.67]], [["applause", 25.27], ["speech", 10.31], ["crowd", 4.26]]], "duration": [0.33, 2.47, 0.49, 2.58, 1.44, 1.12, 0.35, 0.85, 0.23, 1.15, 0.77, 1.25, 2.8, 4.29]} \ No newline at end of file diff --git a/annotations_1/HiPRBsFF-zU_filtered.json b/annotations_1/HiPRBsFF-zU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6e0476728cee79268a71a18388ff390cb4712bc --- /dev/null +++ b/annotations_1/HiPRBsFF-zU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.25], [17.0, 17.15], [22.0, 23.43], [26.0, 27.31], [31.0, 31.4], [37.0, 38.37], [41.0, 41.42], [45.0, 45.57], [47.0, 47.66], [55.0, 56.19], [60.0, 63.8], [65.0, 65.58], [66.0, 70.01], [72.0, 73.99], [76.0, 76.98], [79.0, 79.24], [80.0, 81.11], [84.0, 85.04], [88.0, 91.79], [97.0, 97.75], [101.0, 102.27], [114.0, 114.61], [116.0, 117.0], [128.0, 129.93], [136.0, 135.95], [145.0, 145.59], [147.0, 147.85], [150.0, 150.01], [158.0, 157.98], [159.0, 160.05], [161.0, 162.62], [164.0, 166.51]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.36, 0.0, 36.9, 0.0, 0.0, 0.0, 0.0, 0.0, 37.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.97], "audiomae_on_audioset": [[["music", 50.84], ["throbbing", 13.2], ["electronic music", 4.03]], null, null, null, null, null, null, null, null, null, [["hum", 36.38], ["mains hum", 11.58], ["throbbing", 9.59]], null, [["whale vocalization", 45.7], ["speech", 17.11], ["rumble", 4.92]], null, null, null, null, null, [["music", 60.81], ["musical instrument", 7.56], ["bass guitar", 5.2]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.25, 0.15, 1.43, 1.31, 0.4, 1.37, 0.42, 0.57, 0.66, 1.19, 3.8, 0.58, 4.01, 1.99, 0.98, 0.24, 1.11, 1.04, 3.79, 0.75, 1.27, 0.61, 1.0, 1.93, -0.05, 0.59, 0.85, 0.01, -0.02, 1.05, 1.62, 2.51]} \ No newline at end of file diff --git a/annotations_1/HiavOVW1Iv8_filtered.json b/annotations_1/HiavOVW1Iv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..962b06a987637ac132863da75ee7bea002c5d302 --- /dev/null +++ b/annotations_1/HiavOVW1Iv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.37], [4.0, 9.78], [12.0, 12.63], [13.0, 14.69], [15.0, 16.04], [17.0, 20.97], [24.0, 23.77], [26.0, 26.45], [27.0, 41.2], [42.0, 53.3], [56.0, 57.3], [58.0, 77.01], [77.0, 81.06], [82.0, 84.28], [85.0, 92.74], [94.0, 101.31], [102.0, 102.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 60.51, 0.0, 0.0, 0.0, 35.8, 0.0, 0.0, 44.18, 41.1, 0.0, 38.21, 65.2, 50.21, 93.6, 31.91, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 64.91], ["music", 3.85], ["noise", 3.26]], null, null, [["speech", 51.51], ["hum", 17.34], ["mains hum", 13.16]], [["speech", 60.97], ["music", 28.43], ["theremin", 1.33]], null, [["music", 51.96], ["throbbing", 15.96], ["hum", 6.33]], null, null, null, [["music", 57.1], ["theremin", 9.49], ["synthesizer", 6.95]], null], "duration": [1.37, 5.78, 0.63, 1.69, 1.04, 3.97, -0.23, 0.45, 14.2, 11.3, 1.3, 19.01, 4.06, 2.28, 7.74, 7.31, 0.93]} \ No newline at end of file diff --git a/annotations_1/Hiwu7Hu2hAs_filtered.json b/annotations_1/Hiwu7Hu2hAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc91b850230edce26d28b1bceb2dbc51a60a6858 --- /dev/null +++ b/annotations_1/Hiwu7Hu2hAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.58], [14.0, 14.64], [16.0, 18.22], [22.0, 22.32], [28.0, 36.81], [41.0, 40.91], [42.0, 42.63], [44.0, 45.27], [48.0, 49.23], [50.0, 52.02], [56.0, 59.59], [62.0, 69.89], [73.0, 73.77], [75.0, 75.22], [76.0, 77.68], [78.0, 78.12], [79.0, 86.76], [89.0, 91.98], [93.0, 94.98], [101.0, 103.62], [106.0, 107.87], [112.0, 113.09], [145.0, 145.57], [148.0, 148.0], [152.0, 152.56], [155.0, 165.03], [166.0, 172.02], [173.0, 181.92]], "keep_status": [false, false, true, false, true, false, false, false, false, true, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 46.94, 0.0, 35.75, 0.0, 0.0, 0.0, 0.0, 34.74, 39.22, 33.7, 0.0, 0.0, 0.0, 0.0, 34.69, 48.44, 0.0, 62.89, 0.0, 0.0, 0.0, 0.0, 0.0, 34.11, 33.98, 33.68], "audiomae_on_audioset": [null, null, [["music", 22.83], ["hum", 17.23], ["speech", 15.02]], null, [["music", 47.85], ["chant", 7.42], ["buzz", 4.89]], null, null, null, null, [["music", 32.55], ["didgeridoo", 5.57], ["musical instrument", 4.58]], [["music", 49.04], ["whale vocalization", 8.83], ["carnatic music", 6.1]], [["music", 30.33], ["electric shaver, electric razor", 19.83], ["speech", 18.12]], null, null, null, null, [["music", 40.74], ["throbbing", 22.51], ["hum", 13.01]], [["music", 52.41], ["throbbing", 6.14], ["didgeridoo", 3.59]], null, null, null, null, null, null, null, [["music", 65.19], ["synthetic singing", 6.96], ["didgeridoo", 4.43]], [["music", 47.31], ["didgeridoo", 8.72], ["throbbing", 5.13]], [["music", 55.95], ["electric shaver, electric razor", 3.53], ["singing", 3.08]]], "duration": [0.58, 0.64, 2.22, 0.32, 8.81, -0.09, 0.63, 1.27, 1.23, 2.02, 3.59, 7.89, 0.77, 0.22, 1.68, 0.12, 7.76, 2.98, 1.98, 2.62, 1.87, 1.09, 0.57, 0.0, 0.56, 10.03, 6.02, 8.92]} \ No newline at end of file diff --git a/annotations_1/Hj12WETYG0U_filtered.json b/annotations_1/Hj12WETYG0U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9834a02188903923d4abcf5e0e0561a5a343361c --- /dev/null +++ b/annotations_1/Hj12WETYG0U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.09], [13.0, 17.39], [23.0, 24.71], [28.0, 44.05], [48.0, 48.51], [50.0, 100.25]], "keep_status": [false, true, false, true, false, false], "silence_prob": [0.0, 38.82, 0.0, 39.61, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 27.06], ["hum", 16.08], ["mains hum", 9.45]], null, [["music", 42.74], ["electronic music", 13.49], ["throbbing", 12.97]], null, null], "duration": [0.09, 4.39, 1.71, 16.05, 0.51, 50.25]} \ No newline at end of file diff --git a/annotations_1/Hj52vD7KGxs_filtered.json b/annotations_1/Hj52vD7KGxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d75d1657473e75ee84c129fca93081decf57cf38 --- /dev/null +++ b/annotations_1/Hj52vD7KGxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.19], [30.0, 29.94], [31.0, 34.1], [35.0, 36.88], [40.0, 39.65], [43.0, 43.65], [45.0, 45.96], [51.0, 51.7], [54.0, 60.56], [66.0, 67.42], [73.0, 75.27], [76.0, 78.88], [79.0, 81.75], [83.0, 112.67], [116.0, 118.99], [129.0, 131.8], [132.0, 133.95]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 0.0, 0.0, 49.22, 0.0, 81.53, 89.19, 48.87, 42.06, 34.53, 54.23, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 21.55], ["noise", 15.67], ["bouncing", 7.47]], null, null, null, [["music", 28.29], ["speech", 19.21], ["thunk", 16.31]], [["speech", 71.12], ["door", 7.89], ["mains hum", 3.84]], [["creak", 37.3], ["mains hum", 13.77], ["hum", 10.06]], null, null], "duration": [0.19, -0.06, 3.1, 1.88, -0.35, 0.65, 0.96, 0.7, 6.56, 1.42, 2.27, 2.88, 2.75, 29.67, 2.99, 2.8, 1.95]} \ No newline at end of file diff --git a/annotations_1/Hj7OFElSIlM_filtered.json b/annotations_1/Hj7OFElSIlM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2d45d57f9a5fd06374120dc1cacfe1259e04afe --- /dev/null +++ b/annotations_1/Hj7OFElSIlM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.0], [17.0, 18.44], [19.0, 19.9], [23.0, 25.27], [27.0, 27.63], [29.0, 29.96], [37.0, 37.13], [40.0, 42.33], [47.0, 46.67], [48.0, 48.2], [57.0, 58.8], [66.0, 67.0], [68.0, 68.88], [70.0, 80.37], [83.0, 83.34], [85.0, 85.7], [87.0, 87.07], [89.0, 89.95], [91.0, 92.04], [94.0, 95.66], [97.0, 99.69], [102.0, 107.54], [108.0, 109.54]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 43.23, 0.0, 0.0, 0.0, 0.0, 0.0, 57.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.6, 76.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["fly, housefly", 26.56], ["bee, wasp, etc.", 15.68], ["hum", 14.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 1.44, 0.9, 2.27, 0.63, 0.96, 0.13, 2.33, -0.33, 0.2, 1.8, 1.0, 0.88, 10.37, 0.34, 0.7, 0.07, 0.95, 1.04, 1.66, 2.69, 5.54, 1.54]} \ No newline at end of file diff --git a/annotations_1/Hj9q4NlwcXo_filtered.json b/annotations_1/Hj9q4NlwcXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a3b5a97db7d92fd9e8232e1583c61556bce7db1 --- /dev/null +++ b/annotations_1/Hj9q4NlwcXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[74.0, 78.46], [82.0, 175.31], [178.0, 182.9]], "keep_status": [false, false, false], "silence_prob": [30.93, 0.0, 30.22], "audiomae_on_audioset": [[["music", 37.7], ["speech", 37.67], ["sidetone", 2.58]], null, [["music", 74.55], ["scary music", 3.14], ["theremin", 2.61]]], "duration": [4.46, 93.31, 4.9]} \ No newline at end of file diff --git a/annotations_1/HkXGq2kJAlM_filtered.json b/annotations_1/HkXGq2kJAlM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62b2d02d9c24a0336f3b3b21e348b864d1ed0fe6 --- /dev/null +++ b/annotations_1/HkXGq2kJAlM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.68], [18.0, 19.31], [28.0, 30.08], [32.0, 33.71], [35.0, 35.56], [36.0, 37.45], [40.0, 43.58], [46.0, 50.01], [52.0, 71.9], [72.0, 72.82], [74.0, 77.31], [88.0, 102.68], [108.0, 112.01], [116.0, 116.51], [118.0, 121.15], [126.0, 126.86], [127.0, 130.03]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false], "silence_prob": [30.74, 0.0, 30.3, 0.0, 0.0, 0.0, 29.82, 29.85, 30.6, 0.0, 29.71, 30.09, 30.01, 0.0, 31.88, 0.0, 31.87], "audiomae_on_audioset": [[["music", 37.26], ["boing", 12.86], ["speech", 10.87]], null, [["music", 47.42], ["speech", 38.6], ["breaking", 3.35]], null, null, null, [["music", 60.21], ["throbbing", 7.71], ["noise", 5.22]], [["music", 68.78], ["didgeridoo", 4.07], ["throbbing", 2.71]], [["music", 47.07], ["speech", 5.18], ["electronic music", 4.02]], null, [["cattle, bovinae", 44.99], ["moo", 39.59], ["livestock, farm animals, working animals", 6.48]], [["music", 64.55], ["cattle, bovinae", 6.0], ["livestock, farm animals, working animals", 4.46]], [["speech", 22.34], ["throbbing", 17.81], ["hum", 15.65]], null, [["speech", 28.75], ["hum", 17.65], ["music", 14.99]], null, [["sidetone", 34.38], ["speech", 19.62], ["music", 16.52]]], "duration": [2.68, 1.31, 2.08, 1.71, 0.56, 1.45, 3.58, 4.01, 19.9, 0.82, 3.31, 14.68, 4.01, 0.51, 3.15, 0.86, 3.03]} \ No newline at end of file diff --git a/annotations_1/Hl9OzCY9fVE_filtered.json b/annotations_1/Hl9OzCY9fVE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcbfdf77276a89932458a28162888bac3afd6bb7 --- /dev/null +++ b/annotations_1/Hl9OzCY9fVE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.19], [5.0, 12.61], [14.0, 14.42], [15.0, 15.55], [16.0, 18.59], [19.0, 20.41], [21.0, 22.49], [24.0, 25.1], [25.0, 26.08], [28.0, 29.19], [31.0, 32.61], [37.0, 37.77], [40.0, 40.69], [41.0, 41.47], [42.0, 43.04], [44.0, 44.31], [47.0, 48.24], [49.0, 50.84], [52.0, 52.2], [53.0, 53.74], [54.0, 68.72], [69.0, 71.15], [73.0, 87.66], [88.0, 89.46], [92.0, 98.25], [102.0, 103.08], [104.0, 104.63], [110.0, 112.21], [113.0, 113.41], [114.0, 114.15], [124.0, 129.86], [130.0, 130.89], [131.0, 130.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.91, 77.87, 0.0, 99.94, 0.0, 0.0, 97.73, 0.0, 0.0, 34.15, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.61], ["theremin", 18.88], ["speech", 17.8]], null, null], "duration": [0.19, 7.61, 0.42, 0.55, 2.59, 1.41, 1.49, 1.1, 1.08, 1.19, 1.61, 0.77, 0.69, 0.47, 1.04, 0.31, 1.24, 1.84, 0.2, 0.74, 14.72, 2.15, 14.66, 1.46, 6.25, 1.08, 0.63, 2.21, 0.41, 0.15, 5.86, 0.89, -0.06]} \ No newline at end of file diff --git a/annotations_1/Hln19l9RtWg_filtered.json b/annotations_1/Hln19l9RtWg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f126f76df68d98e2aa33d6e533877b55d37a7bb --- /dev/null +++ b/annotations_1/Hln19l9RtWg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.29], [37.0, 37.89], [40.0, 40.49], [51.0, 50.82], [53.0, 53.33], [108.0, 109.05], [119.0, 120.21], [121.0, 121.8], [130.0, 130.74], [148.0, 156.98], [159.0, 159.53], [166.0, 166.01], [166.0, 170.68]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 0.0, 0.0, 78.89], "audiomae_on_audioset": [[["noise", 31.58], ["music", 19.71], ["effects unit", 14.35]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.29, 0.89, 0.49, -0.18, 0.33, 1.05, 1.21, 0.8, 0.74, 8.98, 0.53, 0.01, 4.68]} \ No newline at end of file diff --git a/annotations_1/HlsvFTNrKK8_filtered.json b/annotations_1/HlsvFTNrKK8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f44665dd47183e91b7c3e4dfd48602fc3ec06a10 --- /dev/null +++ b/annotations_1/HlsvFTNrKK8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 14.13], [16.0, 19.82], [22.0, 22.5], [24.0, 25.83], [28.0, 41.99], [47.0, 47.87], [49.0, 50.53], [52.0, 81.6], [82.0, 122.54], [124.0, 125.02], [127.0, 129.22], [130.0, 138.23], [141.0, 145.35], [146.0, 162.6]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, true, false, false], "silence_prob": [29.6, 36.35, 0.0, 0.0, 28.67, 0.0, 0.0, 28.3, 0.0, 0.0, 62.99, 30.39, 33.05, 28.84], "audiomae_on_audioset": [[["mains hum", 39.27], ["hum", 27.13], ["music", 13.57]], [["music", 70.24], ["theremin", 5.3], ["musical instrument", 3.87]], null, null, [["music", 36.86], ["speech", 21.08], ["buzz", 3.22]], null, null, [["music", 31.05], ["speech", 16.91], ["hum", 8.28]], null, null, null, [["music", 27.21], ["hum", 18.17], ["speech", 17.59]], [["hum", 68.68], ["mains hum", 15.5], ["throbbing", 5.81]], [["hum", 56.78], ["speech", 12.43], ["music", 10.31]]], "duration": [13.13, 3.82, 0.5, 1.83, 13.99, 0.87, 1.53, 29.6, 40.54, 1.02, 2.22, 8.23, 4.35, 16.6]} \ No newline at end of file diff --git a/annotations_1/HlyzLOPYuKc_filtered.json b/annotations_1/HlyzLOPYuKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd856a3c6b70e9ebf2db4eb8515b774565875dd4 --- /dev/null +++ b/annotations_1/HlyzLOPYuKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.04], [10.0, 18.94], [25.0, 27.31], [29.0, 30.59], [31.0, 32.37], [35.0, 35.56], [37.0, 38.33], [40.0, 41.18], [43.0, 67.93], [70.0, 88.86], [100.0, 100.47], [103.0, 107.1], [108.0, 108.45], [114.0, 114.74]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [38.03, 30.01, 31.06, 0.0, 0.0, 0.0, 0.0, 0.0, 30.86, 30.61, 0.0, 29.92, 0.0, 0.0], "audiomae_on_audioset": [[["music", 34.56], ["hum", 18.22], ["mains hum", 14.65]], [["cattle, bovinae", 13.24], ["moo", 11.58], ["speech", 8.79]], [["whack, thwack", 16.26], ["music", 14.98], ["speech", 11.82]], null, null, null, null, null, [["music", 51.19], ["speech", 19.01], ["fly, housefly", 3.16]], [["music", 62.68], ["hum", 10.3], ["throbbing", 8.61]], null, [["music", 25.19], ["grunt", 14.79], ["whack, thwack", 7.34]], null, null], "duration": [5.04, 8.94, 2.31, 1.59, 1.37, 0.56, 1.33, 1.18, 24.93, 18.86, 0.47, 4.1, 0.45, 0.74]} \ No newline at end of file diff --git a/annotations_1/Hm8hcRPGyME_filtered.json b/annotations_1/Hm8hcRPGyME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a05df0d63e00279adfe6a6bd72fea30f136dbf38 --- /dev/null +++ b/annotations_1/Hm8hcRPGyME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.93], [14.0, 14.34], [15.0, 16.88], [18.0, 21.46], [23.0, 24.33], [25.0, 40.44], [42.0, 42.21], [47.0, 47.63], [55.0, 57.99], [59.0, 60.71], [69.0, 70.71], [75.0, 74.8], [76.0, 89.75], [91.0, 128.02], [133.0, 132.97], [136.0, 140.54], [143.0, 147.48], [149.0, 182.75], [188.0, 202.27]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 47.23, 0.0, 30.75, 0.0, 0.0, 69.61, 0.0, 0.0, 0.0, 32.27, 0.0, 0.0, 43.51, 31.1, 0.0, 33.0], "audiomae_on_audioset": [null, null, null, [["throbbing", 39.34], ["hum", 22.75], ["music", 14.34]], null, [["speech", 35.05], ["throbbing", 10.06], ["hum", 9.16]], null, null, null, null, null, null, [["music", 25.55], ["speech", 16.63], ["whack, thwack", 11.84]], null, null, [["music", 77.47], ["boing", 3.81], ["musical instrument", 3.2]], [["music", 56.57], ["throbbing", 5.76], ["cacophony", 4.37]], null, [["music", 41.59], ["moo", 12.34], ["cattle, bovinae", 12.07]]], "duration": [0.93, 0.34, 1.88, 3.46, 1.33, 15.44, 0.21, 0.63, 2.99, 1.71, 1.71, -0.2, 13.75, 37.02, -0.03, 4.54, 4.48, 33.75, 14.27]} \ No newline at end of file diff --git a/annotations_1/HnhM0M5UzX0_filtered.json b/annotations_1/HnhM0M5UzX0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f111b9d400bc8fc03557a50a13bc9f6cda3d5c82 --- /dev/null +++ b/annotations_1/HnhM0M5UzX0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.73], [3.0, 3.05], [3.0, 4.31], [5.0, 5.66], [8.0, 8.23], [9.0, 9.51], [10.0, 31.33], [33.0, 33.12], [38.0, 40.76], [42.0, 42.55], [43.0, 43.73], [48.0, 53.4], [56.0, 62.73], [65.0, 67.34], [71.0, 73.7], [75.0, 79.49], [81.0, 94.02], [94.0, 95.91], [99.0, 103.03], [104.0, 106.88], [108.0, 110.61], [112.0, 118.84], [120.0, 121.69], [123.0, 127.87], [129.0, 131.65], [133.0, 139.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.87, 0.0, 0.0, 99.4, 96.66, 99.92, 100.0, 99.94, 99.88, 0.0, 100.0, 99.59, 99.99, 98.51, 0.0, 100.0, 99.99, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.05, 1.31, 0.66, 0.23, 0.51, 21.33, 0.12, 2.76, 0.55, 0.73, 5.4, 6.73, 2.34, 2.7, 4.49, 13.02, 1.91, 4.03, 2.88, 2.61, 6.84, 1.69, 4.87, 2.65, 6.33]} \ No newline at end of file diff --git a/annotations_1/Ho0k513yN6E_filtered.json b/annotations_1/Ho0k513yN6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a67008f9c4df18ed7493399be4a5f67b5a7f8f9e --- /dev/null +++ b/annotations_1/Ho0k513yN6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 78.11], [83.0, 101.06], [106.0, 143.55], [146.0, 148.39]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 30.3, 0.0, 30.43], "audiomae_on_audioset": [null, [["music", 86.3], ["didgeridoo", 4.49], ["throbbing", 2.73]], null, [["sidetone", 66.35], ["speech", 11.97], ["radio", 11.19]]], "duration": [56.11, 18.06, 37.55, 2.39]} \ No newline at end of file diff --git a/annotations_1/Hp93d2bsfQc_filtered.json b/annotations_1/Hp93d2bsfQc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9677561bdb4a498f38902e477122bef3ce8b32b --- /dev/null +++ b/annotations_1/Hp93d2bsfQc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.06], [13.0, 13.93], [21.0, 23.63], [24.0, 24.29], [30.0, 30.33], [32.0, 32.07], [33.0, 34.01], [36.0, 36.61], [41.0, 41.47], [43.0, 43.58], [44.0, 44.93], [52.0, 52.52], [53.0, 53.35], [55.0, 56.81], [58.0, 58.73], [61.0, 61.2], [65.0, 99.15], [101.0, 101.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.06, 0.93, 2.63, 0.29, 0.33, 0.07, 1.01, 0.61, 0.47, 0.58, 0.93, 0.52, 0.35, 1.81, 0.73, 0.2, 34.15, 0.53]} \ No newline at end of file diff --git a/annotations_1/HpGmAvMtScw_filtered.json b/annotations_1/HpGmAvMtScw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c0c62cb04e9745268ee2a660b4dafb3b286e70c --- /dev/null +++ b/annotations_1/HpGmAvMtScw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 38.58]], "keep_status": [true], "silence_prob": [33.12], "audiomae_on_audioset": [[["hum", 19.85], ["rumble", 15.71], ["mains hum", 14.24]]], "duration": [4.58]} \ No newline at end of file diff --git a/annotations_1/HrFlTjySp8E_filtered.json b/annotations_1/HrFlTjySp8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c26e9444051f2349f303bb2f8413998dbefafdf8 --- /dev/null +++ b/annotations_1/HrFlTjySp8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 42.08], [57.0, 111.4], [113.0, 112.77], [113.0, 132.06]], "keep_status": [false, false, false, false], "silence_prob": [32.14, 0.0, 0.0, 33.42], "audiomae_on_audioset": [[["music", 31.06], ["double bass", 29.9], ["cello", 13.47]], null, null, [["music", 72.73], ["musical instrument", 10.05], ["guitar", 3.68]]], "duration": [3.08, 54.4, -0.23, 19.06]} \ No newline at end of file diff --git a/annotations_1/Hs8mVGI7uVc_filtered.json b/annotations_1/Hs8mVGI7uVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7adfdb90544f9c5e15f1748cfb90b9a5b71c06b5 --- /dev/null +++ b/annotations_1/Hs8mVGI7uVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.46], [10.0, 11.82], [12.0, 13.37], [14.0, 15.04], [16.0, 17.79], [19.0, 20.44], [21.0, 24.31], [25.0, 32.51], [35.0, 35.28], [40.0, 40.41], [44.0, 44.71], [49.0, 49.13], [54.0, 56.91], [65.0, 65.72], [67.0, 67.69], [68.0, 69.06], [70.0, 70.02], [70.0, 71.42], [74.0, 75.39], [78.0, 78.87], [81.0, 82.29], [87.0, 89.6], [90.0, 90.95], [92.0, 92.67], [95.0, 94.95], [98.0, 99.22], [105.0, 105.11], [116.0, 122.23], [123.0, 123.55], [125.0, 125.15], [138.0, 158.09], [159.0, 159.31]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.73, 0.0, 0.0, 0.0, 0.0, 0.0, 34.08, 31.08, 0.0, 0.0, 0.0, 0.0, 38.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.72, 0.0, 0.0, 0.0, 0.0, 0.0, 31.51, 0.0, 0.0, 36.92, 0.0], "audiomae_on_audioset": [[["speech", 27.11], ["music", 17.24], ["hum", 13.39]], null, null, null, null, null, [["speech", 36.18], ["hum", 12.19], ["mains hum", 10.98]], [["hum", 35.61], ["mains hum", 30.49], ["music", 9.83]], null, null, null, null, [["hum", 46.78], ["throbbing", 12.52], ["music", 9.11]], null, null, null, null, null, null, null, null, [["music", 33.0], ["sound effect", 7.68], ["reverberation", 5.35]], null, null, null, null, null, [["hum", 41.94], ["mains hum", 18.88], ["throbbing", 11.31]], null, null, [["hum", 50.92], ["throbbing", 17.7], ["mains hum", 10.74]], null], "duration": [2.46, 1.82, 1.37, 1.04, 1.79, 1.44, 3.31, 7.51, 0.28, 0.41, 0.71, 0.13, 2.91, 0.72, 0.69, 1.06, 0.02, 1.42, 1.39, 0.87, 1.29, 2.6, 0.95, 0.67, -0.05, 1.22, 0.11, 6.23, 0.55, 0.15, 20.09, 0.31]} \ No newline at end of file diff --git a/annotations_1/HsMVFxZ43iU_filtered.json b/annotations_1/HsMVFxZ43iU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b6ccfd36f5acd836ca8b32adc87ba9cdf302c16 --- /dev/null +++ b/annotations_1/HsMVFxZ43iU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 17.63], [19.0, 27.03], [29.0, 61.13], [63.0, 65.42], [73.0, 74.63], [78.0, 79.52], [82.0, 90.63], [93.0, 99.18], [103.0, 105.85], [108.0, 108.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.17, 30.51, 0.0, 30.56, 0.0, 0.0, 42.58, 30.63, 34.95, 0.0], "audiomae_on_audioset": [[["throbbing", 60.53], ["music", 21.15], ["hum", 11.01]], [["music", 73.85], ["throbbing", 15.37], ["hum", 3.3]], null, [["music", 39.97], ["throbbing", 32.96], ["hum", 11.96]], null, null, [["music", 56.34], ["didgeridoo", 10.6], ["throbbing", 4.91]], [["music", 81.44], ["throbbing", 2.38], ["electronic music", 1.61]], [["music", 49.14], ["speech", 31.83], ["electronic music", 5.71]], null], "duration": [11.63, 8.03, 32.13, 2.42, 1.63, 1.52, 8.63, 6.18, 2.85, 0.21]} \ No newline at end of file diff --git a/annotations_1/HsRwyJw5o7k_filtered.json b/annotations_1/HsRwyJw5o7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3adc76b48d43fb17419193cc1f1f42686267a397 --- /dev/null +++ b/annotations_1/HsRwyJw5o7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.24], [19.0, 32.02], [34.0, 58.04], [59.0, 103.44], [108.0, 108.5], [110.0, 110.67], [111.0, 110.86], [111.0, 111.32], [111.0, 135.3], [136.0, 135.65], [136.0, 166.77]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [29.87, 29.25, 28.83, 0.0, 0.0, 0.0, 0.0, 0.0, 29.01, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 45.8], ["hum", 24.74], ["music", 8.29]], [["hum", 23.33], ["mains hum", 22.13], ["music", 18.46]], [["eruption", 14.76], ["music", 12.76], ["hum", 7.68]], null, null, null, null, null, [["buzz", 62.99], ["music", 12.16], ["hum", 7.43]], null, null], "duration": [3.24, 13.02, 24.04, 44.44, 0.5, 0.67, -0.14, 0.32, 24.3, -0.35, 30.77]} \ No newline at end of file diff --git a/annotations_1/Hsg_ZUoSlCs_filtered.json b/annotations_1/Hsg_ZUoSlCs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..236ea0aa042c3f4a9f97b071b00c5ae90d5a9514 --- /dev/null +++ b/annotations_1/Hsg_ZUoSlCs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.46], [11.0, 11.04], [24.0, 25.79], [31.0, 31.01], [33.0, 33.91], [37.0, 46.28], [47.0, 48.96], [49.0, 50.79], [52.0, 52.07], [53.0, 54.14], [58.0, 69.15], [71.0, 71.78], [73.0, 77.31], [80.0, 80.82], [86.0, 86.16], [91.0, 91.45], [94.0, 96.13], [101.0, 102.76], [104.0, 104.36], [105.0, 107.03], [108.0, 113.54], [115.0, 115.2], [117.0, 118.23], [119.0, 119.67]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.13, 0.0, 0.0, 0.0, 0.0, 33.73, 0.0, 39.7, 0.0, 0.0, 0.0, 32.58, 0.0, 0.0, 58.55, 38.78, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["animal", 21.08], ["music", 19.17], ["dog", 9.8]], null, null, null, null, [["music", 32.35], ["hum", 27.76], ["mains hum", 27.57]], null, [["music", 40.45], ["speech", 22.28], ["didgeridoo", 20.14]], null, null, null, [["music", 48.65], ["throbbing", 5.54], ["speech", 5.12]], null, null, null, [["hum", 39.64], ["throbbing", 17.34], ["speech", 14.9]], null, null, null], "duration": [1.46, 0.04, 1.79, 0.01, 0.91, 9.28, 1.96, 1.79, 0.07, 1.14, 11.15, 0.78, 4.31, 0.82, 0.16, 0.45, 2.13, 1.76, 0.36, 2.03, 5.54, 0.2, 1.23, 0.67]} \ No newline at end of file diff --git a/annotations_1/Hsh6n5RfCoc_filtered.json b/annotations_1/Hsh6n5RfCoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f6b1e1489f1855aca33a3e0f18e6972e30f961c --- /dev/null +++ b/annotations_1/Hsh6n5RfCoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.18], [8.0, 8.88], [11.0, 23.23], [24.0, 24.85]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 30.33, 0.0], "audiomae_on_audioset": [null, null, [["music", 39.75], ["buzz", 25.83], ["electric shaver, electric razor", 7.66]], null], "duration": [1.18, 0.88, 12.23, 0.85]} \ No newline at end of file diff --git a/annotations_1/Htp6crkePuw_filtered.json b/annotations_1/Htp6crkePuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..680bf7213ac53d8e28adeab1535695db2349991c --- /dev/null +++ b/annotations_1/Htp6crkePuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 35.41], [39.0, 61.7], [67.0, 68.47], [69.0, 69.79], [70.0, 72.0], [75.0, 81.99], [84.0, 84.62], [89.0, 93.39], [96.0, 99.33], [103.0, 105.02], [109.0, 114.34], [117.0, 126.27], [129.0, 141.99], [143.0, 143.58], [147.0, 147.61], [149.0, 149.81]], "keep_status": [true, true, false, false, true, false, false, true, true, true, false, false, false, false, false, false], "silence_prob": [28.86, 29.88, 0.0, 0.0, 30.95, 30.65, 0.0, 31.29, 29.47, 31.7, 30.5, 30.13, 31.26, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["gunshot, gunfire", 35.12], ["machine gun", 18.47], ["smash, crash", 7.93]], [["whip", 24.15], ["music", 17.85], ["speech", 13.17]], null, null, [["music", 38.66], ["hum", 8.15], ["throbbing", 7.42]], [["hum", 30.52], ["mains hum", 25.61], ["music", 21.11]], null, [["music", 38.76], ["hum", 9.35], ["mains hum", 6.38]], [["explosion", 17.72], ["burst, pop", 16.62], ["speech", 13.14]], [["music", 39.7], ["gunshot, gunfire", 14.63], ["hum", 7.96]], [["music", 46.57], ["hum", 18.49], ["mains hum", 12.39]], [["machine gun", 36.86], ["gunshot, gunfire", 23.77], ["ding", 16.94]], [["mains hum", 46.63], ["hum", 33.93], ["music", 9.81]], null, null, null], "duration": [7.41, 22.7, 1.47, 0.79, 2.0, 6.99, 0.62, 4.39, 3.33, 2.02, 5.34, 9.27, 12.99, 0.58, 0.61, 0.81]} \ No newline at end of file diff --git a/annotations_1/HummNgSGn8k_filtered.json b/annotations_1/HummNgSGn8k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f77b21358f8d45742dad60f064d47e6c44b67d6f --- /dev/null +++ b/annotations_1/HummNgSGn8k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 20.31], [21.0, 50.62], [51.0, 52.47], [55.0, 56.37], [59.0, 59.56], [63.0, 64.45], [66.0, 67.34], [69.0, 70.65], [77.0, 78.63], [83.0, 84.25], [88.0, 88.5], [92.0, 93.11], [98.0, 98.46], [99.0, 99.59], [101.0, 101.22], [104.0, 104.55], [105.0, 111.75], [114.0, 114.74]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [30.91, 30.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.99, 0.0], "audiomae_on_audioset": [[["music", 55.27], ["theremin", 8.61], ["musical instrument", 4.95]], [["music", 73.64], ["mains hum", 6.09], ["hum", 4.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.71], ["hum", 5.87], ["theremin", 5.49]], null], "duration": [4.31, 29.62, 1.47, 1.37, 0.56, 1.45, 1.34, 1.65, 1.63, 1.25, 0.5, 1.11, 0.46, 0.59, 0.22, 0.55, 6.75, 0.74]} \ No newline at end of file diff --git a/annotations_1/HwaqZA54GTk_filtered.json b/annotations_1/HwaqZA54GTk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3f364781222c22d3c912dcdb9c59e42a95778b6 --- /dev/null +++ b/annotations_1/HwaqZA54GTk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.18], [5.0, 5.76], [8.0, 9.24], [14.0, 17.59], [19.0, 19.26], [21.0, 20.93], [22.0, 22.98], [26.0, 28.46], [31.0, 32.68], [33.0, 34.92], [42.0, 42.18], [47.0, 47.78], [57.0, 57.11], [60.0, 60.42], [62.0, 64.39], [65.0, 65.23], [66.0, 68.15], [84.0, 84.55], [88.0, 88.18], [92.0, 93.46], [100.0, 101.66], [106.0, 107.49], [126.0, 126.81], [132.0, 132.93], [135.0, 135.26], [138.0, 139.01], [140.0, 141.57], [142.0, 143.67], [148.0, 148.96], [151.0, 151.73], [153.0, 153.62], [155.0, 158.38], [167.0, 167.98], [169.0, 169.42], [170.0, 170.6], [175.0, 176.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 82.61, 0.0, 0.0, 0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.28, 0.0, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.87, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 0.76, 1.24, 3.59, 0.26, -0.07, 0.98, 2.46, 1.68, 1.92, 0.18, 0.78, 0.11, 0.42, 2.39, 0.23, 2.15, 0.55, 0.18, 1.46, 1.66, 1.49, 0.81, 0.93, 0.26, 1.01, 1.57, 1.67, 0.96, 0.73, 0.62, 3.38, 0.98, 0.42, 0.6, 1.67]} \ No newline at end of file diff --git a/annotations_1/Hwczxp7h7Gg_filtered.json b/annotations_1/Hwczxp7h7Gg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..350fb308f0bcd12db1b64b3f10f05fbeb0f7f492 --- /dev/null +++ b/annotations_1/Hwczxp7h7Gg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.36], [6.0, 7.92], [16.0, 19.68], [26.0, 34.8], [35.0, 35.99], [41.0, 42.63], [44.0, 46.35], [51.0, 51.39], [52.0, 52.71], [53.0, 53.08], [59.0, 61.47], [64.0, 66.29], [67.0, 68.25], [71.0, 71.49], [74.0, 76.79], [78.0, 81.35], [86.0, 86.21], [110.0, 109.98], [110.0, 110.79], [119.0, 119.94], [121.0, 121.64], [123.0, 124.16], [127.0, 128.26], [128.0, 130.67], [131.0, 133.19], [135.0, 134.82], [138.0, 139.45], [147.0, 147.56], [151.0, 152.29], [154.0, 155.17], [156.0, 156.78], [157.0, 158.08], [160.0, 159.71], [160.0, 160.07]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 76.2, 100.0, 0.0, 0.0, 41.5, 0.0, 0.0, 0.0, 61.77, 100.0, 0.0, 0.0, 97.73, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 16.89], ["livestock, farm animals, working animals", 15.79], ["moo", 13.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.36, 1.92, 3.68, 8.8, 0.99, 1.63, 2.35, 0.39, 0.71, 0.08, 2.47, 2.29, 1.25, 0.49, 2.79, 3.35, 0.21, -0.02, 0.79, 0.94, 0.64, 1.16, 1.26, 2.67, 2.19, -0.18, 1.45, 0.56, 1.29, 1.17, 0.78, 1.08, -0.29, 0.07]} \ No newline at end of file diff --git a/annotations_1/Hxc048RM18U_filtered.json b/annotations_1/Hxc048RM18U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b66a7600c18c829af50302c04443ab5b8c3ae005 --- /dev/null +++ b/annotations_1/Hxc048RM18U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 87.54], [89.0, 119.18], [120.0, 130.65]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 30.24], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 33.99], ["animal", 11.17], ["cattle, bovinae", 8.23]]], "duration": [36.54, 30.18, 10.65]} \ No newline at end of file diff --git a/annotations_1/HxfzrUYFsLk_filtered.json b/annotations_1/HxfzrUYFsLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b057cf34cc5e7d79be4cc46813d4b2e05a4fe3d --- /dev/null +++ b/annotations_1/HxfzrUYFsLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.37], [8.0, 8.95], [18.0, 24.21], [26.0, 32.8], [36.0, 47.78], [49.0, 50.23], [51.0, 53.64], [58.0, 60.62], [64.0, 64.76], [66.0, 70.6], [73.0, 75.51], [80.0, 91.94], [95.0, 113.9]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 32.11, 32.93, 32.17, 0.0, 33.01, 31.77, 0.0, 32.49, 32.32, 30.63, 37.11], "audiomae_on_audioset": [null, null, [["music", 62.44], ["throbbing", 11.76], ["hum", 7.88]], [["music", 45.07], ["speech", 11.37], ["throbbing", 9.72]], [["music", 48.53], ["hum", 23.15], ["throbbing", 8.59]], null, [["music", 20.28], ["hum", 12.44], ["mains hum", 6.81]], [["music", 66.34], ["hum", 8.7], ["throbbing", 5.53]], null, [["speech", 36.01], ["music", 26.51], ["hum", 7.82]], [["speech", 39.05], ["music", 29.26], ["throbbing", 3.91]], [["music", 55.62], ["electronic music", 5.39], ["vehicle", 3.42]], [["music", 50.18], ["synthesizer", 18.12], ["electronic music", 4.11]]], "duration": [0.37, 0.95, 6.21, 6.8, 11.78, 1.23, 2.64, 2.62, 0.76, 4.6, 2.51, 11.94, 18.9]} \ No newline at end of file diff --git a/annotations_1/Hxtm9DG4k4o_filtered.json b/annotations_1/Hxtm9DG4k4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02639e16c9deec561c31dc248e0edcad9f2cb9cb --- /dev/null +++ b/annotations_1/Hxtm9DG4k4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [4.0, 4.24], [5.0, 5.66], [6.0, 7.05], [9.0, 10.34], [11.0, 14.35], [15.0, 21.76], [22.0, 29.81], [30.0, 31.72], [32.0, 31.95], [33.0, 32.95], [36.0, 36.69], [40.0, 40.37], [42.0, 41.82], [42.0, 42.42], [43.0, 42.84], [44.0, 44.15], [46.0, 46.38], [61.0, 61.92], [62.0, 63.36], [64.0, 64.59], [65.0, 65.92], [68.0, 68.15], [69.0, 69.96], [71.0, 71.68], [72.0, 73.5], [74.0, 74.9], [75.0, 80.03], [87.0, 88.53], [107.0, 107.79], [109.0, 109.65], [112.0, 112.33], [124.0, 125.14]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 51.94, 44.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.46, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 37.33], ["musical instrument", 18.34], ["guitar", 11.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.14], ["piano", 13.38], ["keyboard (musical)", 13.17]], null, null, null, null, null], "duration": [0.13, 0.24, 0.66, 1.05, 1.34, 3.35, 6.76, 7.81, 1.72, -0.05, -0.05, 0.69, 0.37, -0.18, 0.42, -0.16, 0.15, 0.38, 0.92, 1.36, 0.59, 0.92, 0.15, 0.96, 0.68, 1.5, 0.9, 5.03, 1.53, 0.79, 0.65, 0.33, 1.14]} \ No newline at end of file diff --git a/annotations_1/HzvL4MonF-I_filtered.json b/annotations_1/HzvL4MonF-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56e05ba2ec35214afcdc06adf9708d1fbb707ea1 --- /dev/null +++ b/annotations_1/HzvL4MonF-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.58], [6.0, 7.62], [8.0, 9.54], [12.0, 13.9], [15.0, 15.74], [17.0, 19.38], [23.0, 23.68], [28.0, 36.93], [38.0, 41.07], [42.0, 43.44], [46.0, 55.85], [60.0, 60.34], [61.0, 62.28], [66.0, 67.68], [74.0, 74.56], [75.0, 76.87], [78.0, 81.09], [83.0, 83.4], [84.0, 86.91], [89.0, 89.13], [91.0, 94.29], [95.0, 96.65], [98.0, 98.66], [99.0, 99.77], [100.0, 100.85], [102.0, 103.76], [105.0, 107.01], [110.0, 111.75], [118.0, 119.42], [122.0, 122.71], [127.0, 128.75], [134.0, 137.2], [139.0, 145.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, true, true], "silence_prob": [47.9, 0.0, 0.0, 0.0, 0.0, 68.41, 0.0, 63.31, 71.0, 0.0, 64.18, 0.0, 0.0, 0.0, 0.0, 0.0, 55.6, 0.0, 42.28, 0.0, 38.64, 0.0, 0.0, 0.0, 0.0, 0.0, 38.6, 0.0, 0.0, 0.0, 0.0, 38.14, 38.52], "audiomae_on_audioset": [[["hum", 31.32], ["mains hum", 26.71], ["music", 12.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.45], ["whale vocalization", 9.81], ["theremin", 7.51]], null, [["music", 54.12], ["effects unit", 11.07], ["synthesizer", 9.41]], null, null, null, null, null, [["cowbell", 11.62], ["music", 10.33], ["speech", 7.78]], null, null, null, null, [["music", 37.87], ["guitar", 8.36], ["musical instrument", 8.06]], [["music", 39.9], ["guitar", 10.51], ["musical instrument", 9.21]]], "duration": [4.58, 1.62, 1.54, 1.9, 0.74, 2.38, 0.68, 8.93, 3.07, 1.44, 9.85, 0.34, 1.28, 1.68, 0.56, 1.87, 3.09, 0.4, 2.91, 0.13, 3.29, 1.65, 0.66, 0.77, 0.85, 1.76, 2.01, 1.75, 1.42, 0.71, 1.75, 3.2, 6.54]} \ No newline at end of file diff --git a/annotations_1/I-6XHJFUBDI_filtered.json b/annotations_1/I-6XHJFUBDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5dd646e3d3aa9821ce79ef30899ec934b83af87 --- /dev/null +++ b/annotations_1/I-6XHJFUBDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.48], [8.0, 11.18], [12.0, 16.68], [18.0, 19.58], [22.0, 23.58], [26.0, 36.41], [37.0, 37.66], [39.0, 39.38], [40.0, 41.0], [46.0, 49.87], [50.0, 54.87], [55.0, 62.24], [66.0, 67.12], [96.0, 96.65], [99.0, 99.54], [109.0, 119.25], [121.0, 125.51], [126.0, 128.98], [130.0, 131.04], [141.0, 141.3], [143.0, 144.26], [148.0, 160.47], [161.0, 167.04], [168.0, 172.83], [176.0, 177.09], [181.0, 182.55], [189.0, 190.22], [194.0, 195.89]], "keep_status": [false, true, true, false, false, true, false, false, false, true, true, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 38.94, 34.99, 0.0, 0.0, 42.96, 0.0, 0.0, 0.0, 40.66, 40.07, 39.02, 0.0, 0.0, 0.0, 41.22, 99.1, 82.25, 0.0, 0.0, 0.0, 51.66, 76.2, 35.91, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 44.11], ["throbbing", 12.63], ["mains hum", 11.24]], [["music", 15.62], ["speech", 14.46], ["throbbing", 13.66]], null, null, [["music", 29.94], ["hum", 21.63], ["mains hum", 13.08]], null, null, null, [["hum", 24.82], ["music", 21.36], ["gong", 13.61]], [["hum", 24.77], ["music", 22.36], ["mains hum", 15.12]], [["music", 43.51], ["ambient music", 8.23], ["electronic music", 5.93]], null, null, null, [["music", 15.87], ["hum", 14.65], ["singing bowl", 13.05]], null, null, null, null, null, null, null, [["speech", 34.83], ["sine wave", 10.18], ["busy signal", 9.33]], null, null, null, null], "duration": [1.48, 3.18, 4.68, 1.58, 1.58, 10.41, 0.66, 0.38, 1.0, 3.87, 4.87, 7.24, 1.12, 0.65, 0.54, 10.25, 4.51, 2.98, 1.04, 0.3, 1.26, 12.47, 6.04, 4.83, 1.09, 1.55, 1.22, 1.89]} \ No newline at end of file diff --git a/annotations_1/I-6xj25pOP4_filtered.json b/annotations_1/I-6xj25pOP4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82038bb6c85e5c5b1c605aeb60303b128acba1f7 --- /dev/null +++ b/annotations_1/I-6xj25pOP4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.09], [38.0, 38.99], [57.0, 59.75], [62.0, 70.65], [83.0, 83.27], [86.0, 86.34], [88.0, 88.05], [89.0, 90.39]], "keep_status": [true, false, false, true, false, false, false, false], "silence_prob": [32.74, 0.0, 31.0, 28.58, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.2], ["musical instrument", 7.99], ["guitar", 6.8]], null, [["music", 66.25], ["synthesizer", 4.82], ["hum", 2.47]], [["music", 37.71], ["groan", 20.63], ["speech", 5.37]], null, null, null, null], "duration": [2.09, 0.99, 2.75, 8.65, 0.27, 0.34, 0.05, 1.39]} \ No newline at end of file diff --git a/annotations_1/I-93Ijkhy4I_filtered.json b/annotations_1/I-93Ijkhy4I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8377b09c0473f9fc80f520e3c58ed0fd30cd9178 --- /dev/null +++ b/annotations_1/I-93Ijkhy4I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.32], [19.0, 18.98], [36.0, 46.11], [49.0, 56.57], [59.0, 59.17], [65.0, 70.98]], "keep_status": [false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 29.61, 29.58, 0.0, 28.15], "audiomae_on_audioset": [null, null, [["music", 43.35], ["trombone", 14.72], ["brass instrument", 11.04]], [["music", 46.24], ["brass instrument", 15.43], ["trombone", 12.09]], null, [["music", 51.75], ["musical instrument", 3.8], ["quack", 3.53]]], "duration": [1.32, -0.02, 10.11, 7.57, 0.17, 5.98]} \ No newline at end of file diff --git a/annotations_1/I-Iankzmv3I_filtered.json b/annotations_1/I-Iankzmv3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..034b172ae5fb3b9c6b9e5c9d098d2c4b41a01bf4 --- /dev/null +++ b/annotations_1/I-Iankzmv3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 25.79], [27.0, 27.82], [38.0, 42.15], [45.0, 48.2], [51.0, 56.62], [59.0, 58.7], [59.0, 58.87], [59.0, 69.62], [73.0, 73.8], [76.0, 77.18], [79.0, 79.39], [80.0, 80.92], [83.0, 85.31], [93.0, 94.93], [97.0, 100.57], [101.0, 107.52], [110.0, 122.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [62.17, 0.0, 46.09, 48.48, 40.62, 0.0, 0.0, 40.61, 0.0, 0.0, 0.0, 0.0, 36.35, 0.0, 37.91, 43.87, 38.51], "audiomae_on_audioset": [null, null, [["music", 65.76], ["theremin", 5.28], ["synthesizer", 3.17]], [["music", 78.17], ["synthesizer", 2.93], ["didgeridoo", 2.51]], [["music", 74.41], ["synthesizer", 3.74], ["theremin", 2.53]], null, null, [["music", 82.66], ["hum", 1.49], ["theremin", 0.97]], null, null, null, null, [["livestock, farm animals, working animals", 30.19], ["moo", 29.19], ["cattle, bovinae", 26.91]], null, [["music", 69.63], ["singing", 4.4], ["song", 1.71]], [["music", 63.42], ["theremin", 2.99], ["humming", 2.66]], [["music", 73.18], ["singing", 2.49], ["soul music", 1.81]]], "duration": [4.79, 0.82, 4.15, 3.2, 5.62, -0.3, -0.13, 10.62, 0.8, 1.18, 0.39, 0.92, 2.31, 1.93, 3.57, 6.52, 12.13]} \ No newline at end of file diff --git a/annotations_1/I0jOVXcnjdg_filtered.json b/annotations_1/I0jOVXcnjdg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cab93f58a0edc0751c052211ff74b968e41b7ef --- /dev/null +++ b/annotations_1/I0jOVXcnjdg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.66], [31.0, 31.73], [32.0, 32.37], [33.0, 34.37], [38.0, 41.05], [42.0, 44.25], [49.0, 50.19], [56.0, 56.88], [67.0, 67.19], [71.0, 72.3], [80.0, 79.74], [94.0, 96.33], [115.0, 115.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.8, 0.0, 0.0, 0.0, 99.8, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.66, 0.73, 0.37, 1.37, 3.05, 2.25, 1.19, 0.88, 0.19, 1.3, -0.26, 2.33, 0.25]} \ No newline at end of file diff --git a/annotations_1/I2v7jlIBL1A_filtered.json b/annotations_1/I2v7jlIBL1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f19e2cff4f00d7735024634b98689682d4d790fe --- /dev/null +++ b/annotations_1/I2v7jlIBL1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.16], [2.0, 9.34], [11.0, 12.28], [13.0, 14.57], [15.0, 16.44], [20.0, 20.58], [24.0, 26.43], [28.0, 32.41], [33.0, 34.11], [35.0, 40.95], [44.0, 47.16], [49.0, 73.21], [74.0, 75.17], [77.0, 80.67], [83.0, 82.81], [87.0, 88.32], [95.0, 95.96], [107.0, 121.95], [126.0, 128.6], [136.0, 136.53]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, true, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 62.68, 0.0, 0.0, 0.0, 0.0, 64.52, 33.49, 0.0, 35.45, 33.65, 32.19, 0.0, 32.31, 0.0, 0.0, 0.0, 32.06, 49.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 34.69], ["music", 18.25], ["sidetone", 7.81]], null, [["speech", 50.94], ["animal", 10.84], ["dog", 9.19]], [["dog", 32.89], ["bow-wow", 18.17], ["animal", 17.95]], [["dog", 20.92], ["bow-wow", 20.04], ["animal", 16.62]], null, [["speech", 40.17], ["quack", 5.03], ["music", 4.9]], null, null, null, [["speech", 62.89], ["animal", 4.04], ["whack, thwack", 3.52]], [["fly, housefly", 33.49], ["insect", 26.12], ["mosquito", 6.0]], null], "duration": [0.16, 7.34, 1.28, 1.57, 1.44, 0.58, 2.43, 4.41, 1.11, 5.95, 3.16, 24.21, 1.17, 3.67, -0.19, 1.32, 0.96, 14.95, 2.6, 0.53]} \ No newline at end of file diff --git a/annotations_1/I30x5dMvcA8_filtered.json b/annotations_1/I30x5dMvcA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf603fe760d333295ae85f89e9ede09374065cc3 --- /dev/null +++ b/annotations_1/I30x5dMvcA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.92], [9.0, 9.56], [10.0, 10.32], [12.0, 14.69], [15.0, 15.47], [16.0, 17.64], [18.0, 20.58], [22.0, 22.62], [24.0, 25.07], [26.0, 33.59], [34.0, 62.83], [64.0, 126.2], [127.0, 147.5], [148.0, 151.09]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.31, 0.0, 0.0, 41.36, 0.0, 0.0, 32.28, 32.49, 0.0, 35.32, 32.53], "audiomae_on_audioset": [null, null, null, [["speech", 38.87], ["animal", 15.56], ["wild animals", 5.97]], null, null, [["whale vocalization", 93.02], ["music", 0.65], ["pulse", 0.54]], null, null, [["speech", 41.13], ["music", 25.91], ["sidetone", 11.37]], [["music", 57.12], ["didgeridoo", 16.95], ["buzz", 6.66]], null, [["music", 84.15], ["fart", 2.42], ["buzz", 2.28]], [["whale vocalization", 55.77], ["speech", 18.38], ["roaring cats (lions, tigers)", 8.92]]], "duration": [-0.08, 0.56, 0.32, 2.69, 0.47, 1.64, 2.58, 0.62, 1.07, 7.59, 28.83, 62.2, 20.5, 3.09]} \ No newline at end of file diff --git a/annotations_1/I3akC_INsFc_filtered.json b/annotations_1/I3akC_INsFc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a97fad137d974f71443ffdfb562c3eccabeb2190 --- /dev/null +++ b/annotations_1/I3akC_INsFc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.59], [2.0, 2.22], [3.0, 3.38], [4.0, 4.26], [5.0, 5.21], [6.0, 7.13], [10.0, 10.37], [11.0, 11.5], [14.0, 15.15], [17.0, 19.67], [21.0, 21.24], [22.0, 22.49], [24.0, 24.51], [29.0, 28.93], [30.0, 31.21], [32.0, 32.93], [33.0, 33.62], [34.0, 34.18], [35.0, 35.16], [36.0, 38.28], [42.0, 42.6], [44.0, 45.59], [48.0, 47.9], [48.0, 48.93], [50.0, 50.38], [64.0, 64.56], [68.0, 68.35], [69.0, 71.59], [72.0, 77.26], [78.0, 78.58], [79.0, 80.08], [80.0, 81.72], [83.0, 83.39], [85.0, 85.24], [85.0, 85.82], [87.0, 88.3], [90.0, 89.78], [91.0, 92.85], [94.0, 95.18], [96.0, 97.41], [98.0, 98.14], [98.0, 102.17], [102.0, 103.37], [104.0, 104.48], [107.0, 109.78], [111.0, 112.13], [113.0, 113.91], [114.0, 121.07], [123.0, 123.25], [124.0, 124.48], [125.0, 125.68], [126.0, 128.51], [129.0, 129.12], [129.0, 130.01], [131.0, 135.85], [137.0, 138.43], [139.0, 139.45], [140.0, 141.51], [142.0, 142.45], [143.0, 146.11], [148.0, 148.93], [150.0, 151.88], [155.0, 155.38], [156.0, 156.59], [158.0, 159.31], [160.0, 169.7], [170.0, 171.53], [172.0, 174.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.97, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.56, 0.0, 0.0, 95.64, 0.0, 0.0, 55.74, 0.0, 0.0, 0.0, 52.51, 0.0, 0.0, 50.26, 0.0, 0.0, 0.0, 0.0, 73.51, 0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 0.0, 52.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.56], ["radio", 10.83], ["noise", 6.29]], null, null, null, null, null, null, null, [["speech", 17.9], ["animal", 7.33], ["whale vocalization", 6.85]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 18.97], ["speech", 13.33], ["radio", 9.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 0.22, 0.38, 0.26, 0.21, 1.13, 0.37, 0.5, 1.15, 2.67, 0.24, 0.49, 0.51, -0.07, 1.21, 0.93, 0.62, 0.18, 0.16, 2.28, 0.6, 1.59, -0.1, 0.93, 0.38, 0.56, 0.35, 2.59, 5.26, 0.58, 1.08, 1.72, 0.39, 0.24, 0.82, 1.3, -0.22, 1.85, 1.18, 1.41, 0.14, 4.17, 1.37, 0.48, 2.78, 1.13, 0.91, 7.07, 0.25, 0.48, 0.68, 2.51, 0.12, 1.01, 4.85, 1.43, 0.45, 1.51, 0.45, 3.11, 0.93, 1.88, 0.38, 0.59, 1.31, 9.7, 1.53, 2.06]} \ No newline at end of file diff --git a/annotations_1/I4_AaEazcbk_filtered.json b/annotations_1/I4_AaEazcbk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83097d0aa92631f09666fe55c824c98ecca55a41 --- /dev/null +++ b/annotations_1/I4_AaEazcbk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.39], [7.0, 134.22], [135.0, 170.36]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [1.39, 127.22, 35.36]} \ No newline at end of file diff --git a/annotations_1/I4mtL3Zs0Zs_filtered.json b/annotations_1/I4mtL3Zs0Zs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16bce01302ee81e1931578a2bf71b6db3ead581e --- /dev/null +++ b/annotations_1/I4mtL3Zs0Zs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.21], [6.0, 12.48], [14.0, 15.5], [18.0, 25.54], [27.0, 28.65], [39.0, 39.26], [42.0, 42.99], [45.0, 48.76], [50.0, 50.26], [51.0, 50.89], [52.0, 69.53], [70.0, 71.56], [76.0, 76.2], [85.0, 85.85], [86.0, 86.21], [87.0, 91.86], [101.0, 108.68], [109.0, 109.63], [111.0, 117.24], [140.0, 140.1], [146.0, 146.62]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [37.97, 43.43, 0.0, 39.49, 0.0, 0.0, 0.0, 54.36, 0.0, 0.0, 31.91, 0.0, 0.0, 0.0, 0.0, 34.78, 28.97, 0.0, 34.32, 0.0, 0.0], "audiomae_on_audioset": [[["music", 39.55], ["singing bowl", 18.12], ["effects unit", 4.7]], [["music", 42.69], ["hum", 14.64], ["speech", 11.48]], null, [["music", 28.97], ["hum", 17.25], ["mains hum", 14.05]], null, null, null, null, null, null, [["music", 58.51], ["hum", 15.46], ["throbbing", 9.52]], null, null, null, null, [["music", 68.02], ["speech", 6.51], ["throbbing", 5.9]], [["hum", 51.09], ["throbbing", 19.94], ["mains hum", 11.07]], null, [["music", 53.24], ["speech", 8.22], ["didgeridoo", 5.39]], null, null], "duration": [2.21, 6.48, 1.5, 7.54, 1.65, 0.26, 0.99, 3.76, 0.26, -0.11, 17.53, 1.56, 0.2, 0.85, 0.21, 4.86, 7.68, 0.63, 6.24, 0.1, 0.62]} \ No newline at end of file diff --git a/annotations_1/I5RKRQcsDKU_filtered.json b/annotations_1/I5RKRQcsDKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6c89a3e0fedc3eebdc87cf0b2ae8fdd9850c4aa --- /dev/null +++ b/annotations_1/I5RKRQcsDKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.92], [9.0, 10.88], [12.0, 19.16], [22.0, 24.63], [25.0, 29.03], [31.0, 32.64], [34.0, 41.17], [44.0, 45.06], [46.0, 48.19], [54.0, 60.96], [62.0, 63.17], [65.0, 65.58], [66.0, 66.92], [68.0, 93.6], [94.0, 95.4], [98.0, 98.86], [101.0, 102.66], [109.0, 109.17], [110.0, 111.01], [113.0, 114.59], [116.0, 127.6], [135.0, 137.1], [141.0, 168.08], [171.0, 171.42], [172.0, 175.2]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [46.47, 0.0, 35.87, 37.26, 33.96, 0.0, 33.73, 0.0, 48.74, 31.18, 0.0, 0.0, 0.0, 32.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.24, 46.02, 31.54, 0.0, 84.8], "audiomae_on_audioset": [[["speech", 37.91], ["hum", 23.31], ["mains hum", 10.02]], null, [["rumble", 26.57], ["hum", 20.42], ["music", 19.39]], [["throbbing", 34.36], ["hum", 20.04], ["music", 16.54]], [["hum", 37.46], ["throbbing", 32.11], ["speech", 12.47]], null, [["hum", 22.76], ["music", 21.2], ["throbbing", 13.63]], null, [["music", 59.2], ["hum", 7.16], ["throbbing", 5.03]], [["music", 62.64], ["throbbing", 10.09], ["didgeridoo", 10.07]], null, null, null, [["music", 57.47], ["speech", 11.06], ["throbbing", 7.37]], null, null, null, null, null, null, [["music", 40.06], ["speech", 13.51], ["hum", 11.0]], [["music", 24.42], ["rumble", 9.97], ["throbbing", 9.47]], [["music", 58.96], ["didgeridoo", 21.95], ["hum", 1.95]], null, null], "duration": [4.92, 1.88, 7.16, 2.63, 4.03, 1.64, 7.17, 1.06, 2.19, 6.96, 1.17, 0.58, 0.92, 25.6, 1.4, 0.86, 1.66, 0.17, 1.01, 1.59, 11.6, 2.1, 27.08, 0.42, 3.2]} \ No newline at end of file diff --git a/annotations_1/I5ohJ4BBHzo_filtered.json b/annotations_1/I5ohJ4BBHzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f710323c714cda2e7598f60e97dcbde3b768c3a1 --- /dev/null +++ b/annotations_1/I5ohJ4BBHzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.06], [5.0, 5.68], [6.0, 5.73], [7.0, 8.26], [8.0, 18.28], [19.0, 20.29], [21.0, 23.4], [24.0, 24.39], [36.0, 40.37], [42.0, 43.77], [48.0, 48.61], [53.0, 54.63], [55.0, 55.88], [57.0, 61.87], [64.0, 71.93], [74.0, 81.89], [87.0, 86.71], [90.0, 90.69], [93.0, 95.77], [96.0, 98.91], [100.0, 105.92], [106.0, 108.63], [109.0, 110.39], [111.0, 121.54], [122.0, 124.87], [129.0, 130.27], [131.0, 134.32]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, true, true, false, false, false, true, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 28.75, 0.0, 43.69, 0.0, 28.83, 0.0, 0.0, 0.0, 0.0, 32.29, 29.35, 29.79, 0.0, 0.0, 30.19, 40.14, 49.59, 44.12, 0.0, 42.91, 41.46, 0.0, 45.72], "audiomae_on_audioset": [null, null, null, null, [["explosion", 35.79], ["speech", 24.48], ["burst, pop", 14.44]], null, [["music", 30.31], ["electronic music", 10.19], ["ambient music", 9.98]], null, [["speech", 41.1], ["mains hum", 9.3], ["music", 8.75]], null, null, null, null, [["music", 31.29], ["speech", 20.02], ["hum", 10.79]], [["music", 27.48], ["hum", 18.87], ["mains hum", 16.02]], [["music", 90.33], ["throbbing", 1.46], ["speech", 1.36]], null, null, [["hum", 23.56], ["mains hum", 18.02], ["speech", 10.45]], [["speech", 57.82], ["rumble", 13.78], ["inside, small room", 2.18]], [["music", 56.5], ["hum", 9.96], ["rumble", 4.06]], [["hum", 50.51], ["throbbing", 31.71], ["music", 4.3]], null, [["music", 27.47], ["mains hum", 20.36], ["hum", 16.95]], [["music", 31.73], ["speech", 13.63], ["hum", 8.24]], null, [["music", 24.1], ["rumble", 12.52], ["hum", 6.84]]], "duration": [0.06, 0.68, -0.27, 1.26, 10.28, 1.29, 2.4, 0.39, 4.37, 1.77, 0.61, 1.63, 0.88, 4.87, 7.93, 7.89, -0.29, 0.69, 2.77, 2.91, 5.92, 2.63, 1.39, 10.54, 2.87, 1.27, 3.32]} \ No newline at end of file diff --git a/annotations_1/I7-GvXsr40k_filtered.json b/annotations_1/I7-GvXsr40k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19521095817440a30e9d791693e4e1c3fa66e98f --- /dev/null +++ b/annotations_1/I7-GvXsr40k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 44.79], [60.0, 60.78], [61.0, 61.06], [61.0, 65.57], [67.0, 67.44], [69.0, 69.52], [83.0, 83.74], [84.0, 87.37], [104.0, 105.98]], "keep_status": [true, false, false, true, false, false, false, false, false], "silence_prob": [29.85, 0.0, 0.0, 30.26, 0.0, 0.0, 0.0, 31.11, 0.0], "audiomae_on_audioset": [[["music", 25.03], ["boing", 23.45], ["speech", 10.47]], null, null, [["speech", 19.08], ["boing", 18.39], ["grunt", 13.6]], null, null, null, [["boing", 38.8], ["fart", 15.93], ["speech", 15.34]], null], "duration": [6.79, 0.78, 0.06, 4.57, 0.44, 0.52, 0.74, 3.37, 1.98]} \ No newline at end of file diff --git a/annotations_1/I7pEk2hB5OQ_filtered.json b/annotations_1/I7pEk2hB5OQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e2d40365cca878e723544c5c52cc67e3a0df64e --- /dev/null +++ b/annotations_1/I7pEk2hB5OQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.73], [16.0, 16.06], [19.0, 18.66], [21.0, 23.36], [24.0, 23.8], [26.0, 31.18], [34.0, 34.37], [35.0, 35.36], [44.0, 45.25], [47.0, 47.73], [52.0, 52.71], [69.0, 77.77], [82.0, 96.5], [97.0, 96.94], [98.0, 97.93], [99.0, 102.14], [111.0, 111.35]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [41.85, 0.0, 0.0, 41.16, 0.0, 41.83, 0.0, 0.0, 0.0, 0.0, 0.0, 47.82, 37.2, 0.0, 0.0, 76.37, 0.0], "audiomae_on_audioset": [[["speech", 29.2], ["didgeridoo", 23.07], ["boing", 17.59]], null, null, [["frog", 50.07], ["sidetone", 7.78], ["speech", 6.96]], null, [["music", 75.02], ["fly, housefly", 2.49], ["boing", 1.95]], null, null, null, null, null, [["music", 50.25], ["musical instrument", 6.43], ["effects unit", 3.84]], [["music", 68.26], ["speech", 9.64], ["musical instrument", 3.87]], null, null, null, null], "duration": [2.73, 0.06, -0.34, 2.36, -0.2, 5.18, 0.37, 0.36, 1.25, 0.73, 0.71, 8.77, 14.5, -0.06, -0.07, 3.14, 0.35]} \ No newline at end of file diff --git a/annotations_1/I8-3VpZrBww_filtered.json b/annotations_1/I8-3VpZrBww_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a5b70fb43f11de8d5e24cfc14d24e5b04ffd710 --- /dev/null +++ b/annotations_1/I8-3VpZrBww_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.28], [16.0, 24.85], [27.0, 29.88], [31.0, 31.35], [38.0, 39.48], [40.0, 40.22], [41.0, 43.38], [45.0, 57.25], [62.0, 69.45], [70.0, 69.65], [70.0, 72.32], [74.0, 74.31], [77.0, 77.5], [90.0, 89.94], [94.0, 94.76], [98.0, 98.24], [99.0, 99.62], [103.0, 104.08], [105.0, 110.91]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.4, 31.24, 0.0, 0.0, 0.0, 38.86, 30.96, 30.77, 0.0, 31.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.42], "audiomae_on_audioset": [null, [["hum", 54.34], ["throbbing", 19.02], ["mains hum", 13.66]], [["music", 31.0], ["hum", 19.78], ["mains hum", 13.04]], null, null, null, [["music", 59.58], ["musical instrument", 7.1], ["synthesizer", 5.16]], [["music", 61.78], ["throbbing", 12.53], ["hum", 11.22]], [["music", 49.07], ["throbbing", 29.35], ["hum", 8.12]], null, [["music", 35.58], ["hum", 22.55], ["throbbing", 11.24]], null, null, null, null, null, null, null, [["music", 29.31], ["hum", 23.58], ["throbbing", 18.5]]], "duration": [1.28, 8.85, 2.88, 0.35, 1.48, 0.22, 2.38, 12.25, 7.45, -0.35, 2.32, 0.31, 0.5, -0.06, 0.76, 0.24, 0.62, 1.08, 5.91]} \ No newline at end of file diff --git a/annotations_1/I8-FxxgRACE_filtered.json b/annotations_1/I8-FxxgRACE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02087679e4a29580a3db7d5cef847344c8693089 --- /dev/null +++ b/annotations_1/I8-FxxgRACE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.67], [19.0, 30.97], [31.0, 84.5], [88.0, 93.34], [94.0, 96.92], [100.0, 100.85], [101.0, 112.95], [120.0, 125.07], [129.0, 130.49], [131.0, 138.5], [142.0, 148.42]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 28.35, 0.0, 28.4, 28.72, 0.0, 29.03, 34.15, 0.0, 29.7, 46.29], "audiomae_on_audioset": [null, [["music", 37.67], ["didgeridoo", 7.15], ["electronic music", 5.84]], null, [["didgeridoo", 69.71], ["music", 10.01], ["throbbing", 4.56]], [["music", 83.93], ["didgeridoo", 5.37], ["musical instrument", 2.22]], null, [["music", 68.71], ["didgeridoo", 5.99], ["synthesizer", 3.89]], [["music", 53.46], ["didgeridoo", 11.92], ["gong", 6.35]], null, [["music", 43.97], ["didgeridoo", 25.5], ["musical instrument", 6.9]], [["music", 43.14], ["guitar", 7.75], ["didgeridoo", 5.82]]], "duration": [1.67, 11.97, 53.5, 5.34, 2.92, 0.85, 11.95, 5.07, 1.49, 7.5, 6.42]} \ No newline at end of file diff --git a/annotations_1/I8yvHZ7de2k_filtered.json b/annotations_1/I8yvHZ7de2k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62207cfa6e2b54f69a6fd378b6b22f40ed7851e2 --- /dev/null +++ b/annotations_1/I8yvHZ7de2k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.25], [17.0, 17.05], [20.0, 21.09], [22.0, 34.59], [37.0, 37.2], [39.0, 41.18], [44.0, 44.47], [46.0, 47.14], [48.0, 48.68], [50.0, 50.7], [52.0, 69.3], [73.0, 74.38], [75.0, 81.63], [102.0, 106.22], [110.0, 113.24], [116.0, 117.44], [121.0, 121.9]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.03, 0.0, 0.0, 35.98, 0.0, 50.41, 0.0, 0.0, 0.0, 0.0, 33.4, 0.0, 30.65, 31.96, 31.3, 0.0, 0.0], "audiomae_on_audioset": [[["music", 34.47], ["speech", 21.89], ["hum", 5.37]], null, null, [["music", 56.16], ["speech", 21.36], ["hum", 3.0]], null, null, null, null, null, null, [["music", 61.93], ["speech", 10.56], ["fart", 3.42]], null, [["music", 61.51], ["throbbing", 8.9], ["pulse", 4.31]], [["cattle, bovinae", 33.44], ["moo", 25.35], ["livestock, farm animals, working animals", 24.67]], [["cattle, bovinae", 55.18], ["moo", 30.31], ["livestock, farm animals, working animals", 12.79]], null, null], "duration": [2.25, 0.05, 1.09, 12.59, 0.2, 2.18, 0.47, 1.14, 0.68, 0.7, 17.3, 1.38, 6.63, 4.22, 3.24, 1.44, 0.9]} \ No newline at end of file diff --git a/annotations_1/I9NGZteE31I_filtered.json b/annotations_1/I9NGZteE31I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1209afee504d73f2242978c2878e2475306663aa --- /dev/null +++ b/annotations_1/I9NGZteE31I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.31], [10.0, 13.63], [18.0, 18.66], [23.0, 23.77], [25.0, 26.35], [42.0, 42.77], [44.0, 49.57], [53.0, 54.63], [56.0, 56.17], [57.0, 60.71], [65.0, 68.62], [71.0, 71.25], [75.0, 75.1], [79.0, 82.24], [85.0, 85.56], [96.0, 109.41], [127.0, 127.9], [129.0, 129.44], [133.0, 133.71], [135.0, 135.41], [136.0, 139.29], [142.0, 152.51], [154.0, 157.03], [158.0, 158.63], [161.0, 162.78]], "keep_status": [true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [35.08, 45.33, 0.0, 0.0, 0.0, 0.0, 34.06, 0.0, 0.0, 37.36, 32.02, 0.0, 0.0, 31.9, 0.0, 32.26, 0.0, 0.0, 0.0, 0.0, 31.33, 30.56, 29.76, 0.0, 0.0], "audiomae_on_audioset": [[["music", 28.9], ["sidetone", 14.64], ["speech", 6.59]], [["music", 72.07], ["musical instrument", 4.46], ["synthesizer", 2.6]], null, null, null, null, [["music", 61.23], ["speech", 28.33], ["synthesizer", 1.91]], null, null, [["music", 39.35], ["speech", 20.98], ["ding-dong", 3.45]], [["music", 24.1], ["sidetone", 20.32], ["speech", 19.28]], null, null, [["music", 33.09], ["speech", 27.88], ["sidetone", 10.74]], null, [["music", 54.38], ["speech", 10.93], ["throbbing", 9.66]], null, null, null, null, [["speech", 51.47], ["music", 23.95], ["crack", 6.35]], [["music", 37.8], ["hum", 14.76], ["speech", 13.45]], [["mosquito", 62.08], ["fly, housefly", 30.15], ["insect", 4.3]], null, null], "duration": [5.31, 3.63, 0.66, 0.77, 1.35, 0.77, 5.57, 1.63, 0.17, 3.71, 3.62, 0.25, 0.1, 3.24, 0.56, 13.41, 0.9, 0.44, 0.71, 0.41, 3.29, 10.51, 3.03, 0.63, 1.78]} \ No newline at end of file diff --git a/annotations_1/I9r1j1ZKBYk_filtered.json b/annotations_1/I9r1j1ZKBYk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67cd233f905558ac9c3e35f2c12309adacf4951c --- /dev/null +++ b/annotations_1/I9r1j1ZKBYk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.4], [5.0, 6.81], [13.0, 13.63], [16.0, 16.88], [22.0, 24.6], [25.0, 26.2], [27.0, 28.66], [31.0, 32.31], [38.0, 38.6], [46.0, 48.71], [52.0, 57.47], [71.0, 71.96], [73.0, 83.02], [85.0, 85.43], [86.0, 86.78], [88.0, 92.31], [93.0, 93.85], [96.0, 101.06], [102.0, 103.45], [105.0, 106.76], [111.0, 111.72], [113.0, 129.59], [133.0, 140.27], [145.0, 146.64], [149.0, 149.86], [151.0, 151.9]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 48.82, 0.0, 0.0, 0.0, 0.0, 41.52, 30.01, 0.0, 28.96, 0.0, 0.0, 34.12, 0.0, 34.31, 0.0, 0.0, 0.0, 28.85, 31.44, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 37.95], ["hum", 13.21], ["throbbing", 11.62]], null, null, null, null, [["vehicle", 13.83], ["motorcycle", 6.63], ["accelerating, revving, vroom", 6.09]], [["music", 64.16], ["hum", 9.8], ["mains hum", 7.37]], null, [["music", 48.6], ["throbbing", 14.05], ["didgeridoo", 9.33]], null, null, [["music", 63.05], ["scary music", 3.88], ["ambient music", 2.66]], null, [["music", 42.18], ["speech", 13.85], ["hum", 10.5]], null, null, null, [["music", 72.37], ["electronic music", 7.96], ["throbbing", 3.02]], [["music", 26.57], ["didgeridoo", 24.58], ["hum", 14.1]], null, null, null], "duration": [0.4, 1.81, 0.63, 0.88, 2.6, 1.2, 1.66, 1.31, 0.6, 2.71, 5.47, 0.96, 10.02, 0.43, 0.78, 4.31, 0.85, 5.06, 1.45, 1.76, 0.72, 16.59, 7.27, 1.64, 0.86, 0.9]} \ No newline at end of file diff --git a/annotations_1/IAaXyDc1gjk_filtered.json b/annotations_1/IAaXyDc1gjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e3cb7423db2201c44f0139b94dcd5244130eb1c --- /dev/null +++ b/annotations_1/IAaXyDc1gjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.92], [21.0, 21.47], [23.0, 23.7], [39.0, 47.49], [55.0, 64.69], [73.0, 83.08], [104.0, 104.11], [120.0, 122.13], [136.0, 136.19], [137.0, 146.5], [149.0, 152.93], [154.0, 156.29], [161.0, 162.33], [173.0, 172.94], [195.0, 195.88], [201.0, 202.05]], "keep_status": [false, false, false, false, false, true, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.19, 34.16, 32.24, 0.0, 31.31, 0.0, 31.94, 32.57, 51.94, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 46.34], ["music", 28.14], ["throbbing", 4.65]], [["music", 55.01], ["speech", 29.32], ["synthesizer", 2.41]], [["music", 42.07], ["speech", 19.08], ["scary music", 6.2]], null, [["music", 30.34], ["civil defense siren", 17.4], ["speech", 5.76]], null, [["music", 63.16], ["speech", 17.0], ["theremin", 1.82]], [["music", 42.31], ["boing", 21.38], ["fly, housefly", 5.1]], null, null, null, null, null], "duration": [0.92, 0.47, 0.7, 8.49, 9.69, 10.08, 0.11, 2.13, 0.19, 9.5, 3.93, 2.29, 1.33, -0.06, 0.88, 1.05]} \ No newline at end of file diff --git a/annotations_1/IAb5uq3GzZI_filtered.json b/annotations_1/IAb5uq3GzZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd2b2819e3e7fc032375b979f095379935d8c082 --- /dev/null +++ b/annotations_1/IAb5uq3GzZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 26.01], [27.0, 27.48], [27.0, 27.65], [28.0, 42.69], [44.0, 47.24], [48.0, 51.31], [57.0, 59.31], [60.0, 60.98], [65.0, 65.55], [70.0, 70.12], [72.0, 73.82], [79.0, 84.48], [85.0, 87.59], [90.0, 90.69], [92.0, 92.89], [101.0, 104.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [30.17, 0.0, 0.0, 30.18, 96.66, 75.55, 95.37, 0.0, 0.0, 0.0, 0.0, 43.71, 55.11, 0.0, 0.0, 52.1], "audiomae_on_audioset": [[["music", 74.86], ["scary music", 8.72], ["ambient music", 4.06]], null, null, [["music", 80.83], ["theremin", 6.46], ["ambient music", 3.12]], null, null, null, null, null, null, null, [["music", 33.48], ["singing bowl", 18.71], ["ambient music", 14.65]], null, null, null, null], "duration": [17.01, 0.48, 0.65, 14.69, 3.24, 3.31, 2.31, 0.98, 0.55, 0.12, 1.82, 5.48, 2.59, 0.69, 0.89, 3.21]} \ No newline at end of file diff --git a/annotations_1/IB7BvgXIKOs_filtered.json b/annotations_1/IB7BvgXIKOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11a1397918297fc9487b194932ad0a77162ac348 --- /dev/null +++ b/annotations_1/IB7BvgXIKOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 18.94], [25.0, 24.97], [26.0, 26.33], [30.0, 30.86], [35.0, 36.42], [40.0, 47.21], [48.0, 55.27], [60.0, 60.61], [62.0, 62.73], [66.0, 67.88], [74.0, 74.04], [89.0, 89.88], [93.0, 94.31], [96.0, 97.36], [105.0, 105.06], [106.0, 107.18], [116.0, 116.68], [117.0, 117.95], [118.0, 118.54], [120.0, 121.95], [123.0, 123.8], [125.0, 125.83], [127.0, 128.61], [129.0, 129.12], [132.0, 132.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 34.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 64.52], ["electronic music", 8.31], ["synthesizer", 7.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.06, -0.03, 0.33, 0.86, 1.42, 7.21, 7.27, 0.61, 0.73, 1.88, 0.04, 0.88, 1.31, 1.36, 0.06, 1.18, 0.68, 0.95, 0.54, 1.95, 0.8, 0.83, 1.61, 0.12, 0.16]} \ No newline at end of file diff --git a/annotations_1/IBRkROD4KAU_filtered.json b/annotations_1/IBRkROD4KAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b662c7e64409a3e9e9a0356fde18a60f42853b6b --- /dev/null +++ b/annotations_1/IBRkROD4KAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.4], [5.0, 6.1], [8.0, 9.59], [13.0, 13.32], [15.0, 15.04], [18.0, 21.44], [24.0, 24.7], [30.0, 32.1], [36.0, 37.52], [38.0, 38.52], [39.0, 40.15], [41.0, 44.37], [47.0, 48.0], [49.0, 50.31], [52.0, 53.22], [54.0, 54.41], [55.0, 56.49], [59.0, 59.63], [61.0, 61.6], [62.0, 63.64], [65.0, 67.04], [69.0, 69.11], [70.0, 70.34], [71.0, 72.25], [73.0, 79.34], [80.0, 84.28], [85.0, 85.01], [86.0, 86.7], [88.0, 88.55], [90.0, 89.75], [91.0, 91.03], [92.0, 92.28], [94.0, 94.93], [96.0, 97.61], [99.0, 100.8], [102.0, 103.69], [104.0, 105.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 100.0, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 78.38, 53.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 1.1, 1.59, 0.32, 0.04, 3.44, 0.7, 2.1, 1.52, 0.52, 1.15, 3.37, 1.0, 1.31, 1.22, 0.41, 1.49, 0.63, 0.6, 1.64, 2.04, 0.11, 0.34, 1.25, 6.34, 4.28, 0.01, 0.7, 0.55, -0.25, 0.03, 0.28, 0.93, 1.61, 1.8, 1.69, 1.92]} \ No newline at end of file diff --git a/annotations_1/IBTpVVTZJ5c_filtered.json b/annotations_1/IBTpVVTZJ5c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2cd01944c9e9828c207b5a141f6bd39ec9b3565 --- /dev/null +++ b/annotations_1/IBTpVVTZJ5c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.67], [13.0, 13.66], [15.0, 16.33], [18.0, 19.09], [22.0, 24.07], [28.0, 29.19], [30.0, 30.06], [31.0, 38.82], [40.0, 108.5], [109.0, 111.52], [112.0, 111.6], [112.0, 111.87], [112.0, 111.92], [112.0, 111.96], [112.0, 112.62], [115.0, 116.46], [120.0, 121.56]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 63.42, 0.0, 0.0, 33.35, 0.0, 40.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 44.1], ["synthesizer", 13.45], ["hum", 9.33]], null, [["didgeridoo", 39.43], ["music", 11.68], ["speech", 8.23]], null, null, null, null, null, null, null], "duration": [0.67, 0.66, 1.33, 1.09, 2.07, 1.19, 0.06, 7.82, 68.5, 2.52, -0.4, -0.13, -0.08, -0.04, 0.62, 1.46, 1.56]} \ No newline at end of file diff --git a/annotations_1/IBdgRBvFwlM_filtered.json b/annotations_1/IBdgRBvFwlM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..784490b83d874a8120357e5dce60b09a559e8dc8 --- /dev/null +++ b/annotations_1/IBdgRBvFwlM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.5], [12.0, 12.87], [16.0, 15.97], [22.0, 24.0], [25.0, 25.42], [30.0, 30.28], [31.0, 31.41], [33.0, 33.47], [35.0, 37.54], [43.0, 44.12], [46.0, 46.16], [47.0, 51.54], [56.0, 56.64], [58.0, 64.47], [67.0, 68.55], [69.0, 69.69], [70.0, 71.36], [73.0, 73.28], [75.0, 75.44], [78.0, 87.47], [102.0, 102.44], [105.0, 105.29], [106.0, 105.87], [106.0, 109.09], [109.0, 111.1], [112.0, 113.36], [114.0, 114.34], [115.0, 115.08], [117.0, 117.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 95.37, 0.0, 96.29, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 66.88, 78.55, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.5, 0.87, -0.03, 2.0, 0.42, 0.28, 0.41, 0.47, 2.54, 1.12, 0.16, 4.54, 0.64, 6.47, 1.55, 0.69, 1.36, 0.28, 0.44, 9.47, 0.44, 0.29, -0.13, 3.09, 2.1, 1.36, 0.34, 0.08, 0.19]} \ No newline at end of file diff --git a/annotations_1/IC-u2-aQXS4_filtered.json b/annotations_1/IC-u2-aQXS4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3403905933b7dff542c878f5351a9d6da0f1cc90 --- /dev/null +++ b/annotations_1/IC-u2-aQXS4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.87], [5.0, 8.23], [12.0, 12.55], [15.0, 15.67], [16.0, 17.31], [18.0, 27.23], [28.0, 27.67], [28.0, 27.7], [28.0, 27.73], [28.0, 27.77], [28.0, 28.21], [32.0, 51.17], [54.0, 61.18], [62.0, 69.4], [72.0, 72.5], [76.0, 110.44], [112.0, 113.37], [115.0, 117.8], [118.0, 119.1], [120.0, 128.93], [131.0, 137.3], [138.0, 138.64], [139.0, 146.2], [148.0, 151.65]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 46.75, 0.0, 0.0, 0.0, 32.4, 0.0, 0.0, 0.0, 0.0, 0.0, 30.49, 32.73, 31.48, 0.0, 0.0, 0.0, 33.06, 0.0, 33.99, 38.35, 0.0, 47.74, 57.81], "audiomae_on_audioset": [null, [["speech", 48.81], ["music", 27.28], ["inside, small room", 1.72]], null, null, null, [["music", 34.96], ["speech", 10.81], ["hum", 10.21]], null, null, null, null, null, [["music", 37.7], ["cacophony", 8.7], ["explosion", 4.86]], [["music", 69.49], ["hum", 3.33], ["brass instrument", 2.63]], [["fly, housefly", 13.61], ["music", 12.88], ["buzz", 11.43]], null, null, null, [["music", 30.29], ["didgeridoo", 25.42], ["speech", 9.4]], null, [["music", 60.66], ["buzz", 15.03], ["musical instrument", 1.35]], [["music", 54.49], ["theremin", 6.13], ["effects unit", 5.09]], null, [["fly, housefly", 67.2], ["insect", 14.39], ["bee, wasp, etc.", 6.98]], null], "duration": [1.87, 3.23, 0.55, 0.67, 1.31, 9.23, -0.33, -0.3, -0.27, -0.23, 0.21, 19.17, 7.18, 7.4, 0.5, 34.44, 1.37, 2.8, 1.1, 8.93, 6.3, 0.64, 7.2, 3.65]} \ No newline at end of file diff --git a/annotations_1/IC21keB1yaM_filtered.json b/annotations_1/IC21keB1yaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21bbaf5179d1b3f71caca48bda43f626baf67ca9 --- /dev/null +++ b/annotations_1/IC21keB1yaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.74], [6.0, 6.02], [9.0, 10.17], [11.0, 12.66], [18.0, 18.3], [21.0, 21.73], [22.0, 23.13], [24.0, 23.97], [25.0, 25.88], [27.0, 28.0], [29.0, 29.25], [30.0, 30.18], [31.0, 31.78], [34.0, 35.85], [36.0, 37.37], [38.0, 38.18], [41.0, 41.18], [43.0, 49.74], [50.0, 53.28], [55.0, 56.2], [66.0, 68.76], [70.0, 72.99], [75.0, 76.1], [77.0, 77.95], [80.0, 80.11], [81.0, 81.89], [91.0, 91.67], [93.0, 93.6], [95.0, 94.9], [97.0, 101.56], [102.0, 103.22], [104.0, 105.11], [106.0, 107.1], [108.0, 109.56], [110.0, 129.88], [137.0, 137.56], [145.0, 150.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 100.0, 0.0, 61.77, 97.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.47, 0.0, 0.0, 0.0, 0.0, 31.89, 0.0, 35.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.36], ["thunk", 10.0], ["music", 3.67]], null, null, null, null, [["music", 77.81], ["didgeridoo", 3.49], ["speech", 2.52]], null, [["music", 69.08], ["musical instrument", 2.92], ["hum", 2.15]]], "duration": [-0.26, 0.02, 1.17, 1.66, 0.3, 0.73, 1.13, -0.03, 0.88, 1.0, 0.25, 0.18, 0.78, 1.85, 1.37, 0.18, 0.18, 6.74, 3.28, 1.2, 2.76, 2.99, 1.1, 0.95, 0.11, 0.89, 0.67, 0.6, -0.1, 4.56, 1.22, 1.11, 1.1, 1.56, 19.88, 0.56, 5.87]} \ No newline at end of file diff --git a/annotations_1/ICJi_nMcUQc_filtered.json b/annotations_1/ICJi_nMcUQc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a39b735e12a06a9ae462f28117e2938e600ff86b --- /dev/null +++ b/annotations_1/ICJi_nMcUQc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 54.4], [56.0, 56.52], [57.0, 57.57], [59.0, 59.16]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [44.4, 0.52, 0.57, 0.16]} \ No newline at end of file diff --git a/annotations_1/ICRVd--TY-U_filtered.json b/annotations_1/ICRVd--TY-U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd59396e9818146d512c19376ead91ee7767a871 --- /dev/null +++ b/annotations_1/ICRVd--TY-U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.9], [15.0, 15.28], [17.0, 16.93], [21.0, 21.22], [26.0, 28.78], [52.0, 52.47], [57.0, 57.82], [61.0, 63.85], [64.0, 65.82], [67.0, 67.12], [68.0, 68.82], [77.0, 77.6], [81.0, 81.04], [82.0, 82.29], [87.0, 88.47], [90.0, 90.9], [92.0, 96.85], [100.0, 100.53], [102.0, 104.18], [116.0, 116.19], [117.0, 117.91], [126.0, 127.25], [128.0, 128.44], [135.0, 136.22], [137.0, 139.13], [141.0, 141.83], [144.0, 144.86], [151.0, 151.75], [153.0, 153.76], [156.0, 156.63], [160.0, 160.68], [170.0, 170.99], [173.0, 174.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 51.66, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.7, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.26], ["theremin", 19.08], ["musical instrument", 5.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.1, 0.28, -0.07, 0.22, 2.78, 0.47, 0.82, 2.85, 1.82, 0.12, 0.82, 0.6, 0.04, 0.29, 1.47, 0.9, 4.85, 0.53, 2.18, 0.19, 0.91, 1.25, 0.44, 1.22, 2.13, 0.83, 0.86, 0.75, 0.76, 0.63, 0.68, 0.99, 1.9]} \ No newline at end of file diff --git a/annotations_1/IE9S8CehYco_filtered.json b/annotations_1/IE9S8CehYco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c165b947fcd95ba2d2d91c307b2ab6abb7085a2a --- /dev/null +++ b/annotations_1/IE9S8CehYco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.34], [11.0, 11.23], [13.0, 13.41], [14.0, 15.84], [17.0, 18.3], [20.0, 20.6], [21.0, 21.86], [22.0, 23.87], [24.0, 36.24], [38.0, 40.0], [41.0, 45.2], [45.0, 54.82], [55.0, 56.64], [58.0, 59.36], [61.0, 62.01], [64.0, 64.91], [66.0, 65.92], [69.0, 69.43], [71.0, 71.88], [73.0, 75.34], [77.0, 77.79], [78.0, 79.51], [80.0, 79.96], [80.0, 83.15], [84.0, 85.02], [85.0, 86.39], [88.0, 88.96], [91.0, 92.79], [94.0, 95.08], [95.0, 96.7], [100.0, 102.1], [103.0, 108.28], [110.0, 115.08], [119.0, 133.74], [141.0, 141.98], [143.0, 144.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.55, 98.27, 83.88, 52.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 35.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 77.87, 92.48, 41.85, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.13], ["speech", 27.35], ["musical instrument", 3.63]], null, null, null, null, null, null, null, null, null, [["music", 51.86], ["clarinet", 11.11], ["theremin", 9.4]], null, null], "duration": [0.34, 0.23, 0.41, 1.84, 1.3, 0.6, 0.86, 1.87, 12.24, 2.0, 4.2, 9.82, 1.64, 1.36, 1.01, 0.91, -0.08, 0.43, 0.88, 2.34, 0.79, 1.51, -0.04, 3.15, 1.02, 1.39, 0.96, 1.79, 1.08, 1.7, 2.1, 5.28, 5.08, 14.74, 0.98, 1.12]} \ No newline at end of file diff --git a/annotations_1/IEaqLI9HAmA_filtered.json b/annotations_1/IEaqLI9HAmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32072c8ac11f35f0c8ba089faa382f6f58dbea2e --- /dev/null +++ b/annotations_1/IEaqLI9HAmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.56], [15.0, 15.75], [17.0, 18.71], [29.0, 31.55], [38.0, 40.61], [42.0, 45.67], [51.0, 51.19], [54.0, 61.91], [64.0, 66.56], [72.0, 74.22], [80.0, 80.47], [84.0, 88.33], [97.0, 98.24], [99.0, 100.63], [102.0, 104.85], [106.0, 106.61], [108.0, 109.59], [114.0, 114.93], [116.0, 117.31], [120.0, 119.75], [121.0, 120.82], [123.0, 123.26], [127.0, 127.43], [134.0, 135.46], [136.0, 137.46], [138.0, 139.46], [141.0, 141.35], [152.0, 152.63], [154.0, 154.33]], "keep_status": [false, false, false, true, false, true, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.3, 64.52, 35.95, 0.0, 41.28, 41.01, 44.6, 0.0, 47.58, 0.0, 0.0, 76.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 34.52], ["speech", 15.55], ["crowd", 6.25]], null, [["fart", 33.05], ["speech", 25.62], ["hubbub, speech noise, speech babble", 5.0]], null, [["speech", 53.4], ["fart", 28.52], ["music", 4.33]], [["speech", 16.01], ["animal", 14.97], ["livestock, farm animals, working animals", 13.69]], [["speech", 27.02], ["moo", 20.83], ["cattle, bovinae", 17.96]], null, [["speech", 33.33], ["hum", 12.49], ["throbbing", 11.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 0.75, 1.71, 2.55, 2.61, 3.67, 0.19, 7.91, 2.56, 2.22, 0.47, 4.33, 1.24, 1.63, 2.85, 0.61, 1.59, 0.93, 1.31, -0.25, -0.18, 0.26, 0.43, 1.46, 1.46, 1.46, 0.35, 0.63, 0.33]} \ No newline at end of file diff --git a/annotations_1/IFBAXbrw31g_filtered.json b/annotations_1/IFBAXbrw31g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17e7c3a5fb91dfd91d73af69fd74f9320b7ee040 --- /dev/null +++ b/annotations_1/IFBAXbrw31g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 24.41], [33.0, 33.08], [37.0, 37.5], [39.0, 41.1], [42.0, 42.4], [45.0, 50.48], [54.0, 53.7], [54.0, 58.21], [62.0, 69.92], [70.0, 73.84], [78.0, 83.39], [88.0, 90.56], [91.0, 90.83], [91.0, 90.9], [91.0, 91.07], [91.0, 107.49], [108.0, 128.01], [128.0, 129.07], [130.0, 138.74], [147.0, 153.81], [157.0, 165.82], [169.0, 169.15], [170.0, 171.27], [172.0, 172.4], [178.0, 182.75], [184.0, 187.14], [190.0, 190.36], [191.0, 200.8]], "keep_status": [true, false, false, true, false, true, false, false, true, true, true, true, false, false, false, true, true, false, true, true, true, false, false, false, true, false, false, true], "silence_prob": [37.28, 0.0, 0.0, 44.57, 0.0, 29.35, 0.0, 31.38, 31.0, 31.67, 33.18, 32.11, 0.0, 0.0, 0.0, 30.92, 32.53, 0.0, 34.0, 31.36, 31.96, 0.0, 0.0, 0.0, 47.39, 35.9, 0.0, 34.25], "audiomae_on_audioset": [[["hum", 24.27], ["music", 23.94], ["mains hum", 16.2]], null, null, [["music", 41.87], ["fly, housefly", 5.65], ["mosquito", 4.26]], null, [["speech", 33.82], ["cattle, bovinae", 19.64], ["moo", 12.97]], null, [["speech", 36.86], ["music", 31.23], ["fart", 8.48]], [["whack, thwack", 37.59], ["music", 17.25], ["speech", 4.21]], [["moo", 21.34], ["music", 19.4], ["cattle, bovinae", 17.26]], [["sheep", 26.71], ["bleat", 24.37], ["music", 13.12]], [["speech", 36.71], ["grunt", 14.95], ["animal", 14.29]], null, null, null, [["speech", 48.33], ["grunt", 11.32], ["music", 7.91]], [["livestock, farm animals, working animals", 24.14], ["cattle, bovinae", 18.31], ["music", 15.52]], null, [["speech", 22.79], ["music", 16.48], ["livestock, farm animals, working animals", 8.56]], [["music", 22.33], ["speech", 21.04], ["livestock, farm animals, working animals", 6.33]], [["speech", 40.37], ["buzz", 11.86], ["hum", 7.76]], null, null, null, [["music", 45.83], ["hum", 12.24], ["mains hum", 8.3]], [["music", 44.02], ["throbbing", 22.63], ["hum", 12.45]], null, [["music", 22.78], ["speech", 20.76], ["throbbing", 14.28]]], "duration": [12.41, 0.08, 0.5, 2.1, 0.4, 5.48, -0.3, 4.21, 7.92, 3.84, 5.39, 2.56, -0.17, -0.1, 0.07, 16.49, 20.01, 1.07, 8.74, 6.81, 8.82, 0.15, 1.27, 0.4, 4.75, 3.14, 0.36, 9.8]} \ No newline at end of file diff --git a/annotations_1/IGFdF06VVF8_filtered.json b/annotations_1/IGFdF06VVF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c18145bec1b1ea444e5d5cf4bdbea66082d48b1 --- /dev/null +++ b/annotations_1/IGFdF06VVF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.97], [3.0, 3.52], [4.0, 8.24], [9.0, 11.16], [12.0, 17.44], [19.0, 20.26], [22.0, 35.31], [37.0, 38.16], [41.0, 41.99], [44.0, 44.19], [45.0, 45.96], [48.0, 48.98], [52.0, 53.69], [55.0, 56.93], [58.0, 57.94], [63.0, 64.13], [65.0, 68.18], [69.0, 70.51], [72.0, 73.8], [75.0, 78.98], [79.0, 89.45], [90.0, 91.79], [93.0, 94.61], [96.0, 97.61], [101.0, 101.82], [106.0, 106.07], [108.0, 109.68], [111.0, 111.92], [114.0, 115.52], [116.0, 118.1], [119.0, 125.1], [126.0, 127.21], [129.0, 135.5], [136.0, 137.69], [140.0, 140.17], [142.0, 144.37], [147.0, 148.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.97, 45.62, 47.39, 0.0, 69.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.38, 0.0, 0.0, 53.59, 41.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.48, 58.22, 0.0, 57.97, 0.0, 0.0, 59.59, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 42.6], ["hum", 28.69], ["throbbing", 6.35]], [["thunk", 52.59], ["music", 37.33], ["thump, thud", 2.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.84], ["music", 22.74], ["gong", 9.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 0.52, 4.24, 2.16, 5.44, 1.26, 13.31, 1.16, 0.99, 0.19, 0.96, 0.98, 1.69, 1.93, -0.06, 1.13, 3.18, 1.51, 1.8, 3.98, 10.45, 1.79, 1.61, 1.61, 0.82, 0.07, 1.68, 0.92, 1.52, 2.1, 6.1, 1.21, 6.5, 1.69, 0.17, 2.37, 1.85]} \ No newline at end of file diff --git a/annotations_1/IGaJfcOD6gs_filtered.json b/annotations_1/IGaJfcOD6gs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a6d893b7448a8bbc89380f62a65d3f09499fa35 --- /dev/null +++ b/annotations_1/IGaJfcOD6gs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [5.0, 17.59], [26.0, 28.29], [32.0, 32.46], [37.0, 39.72]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 30.07, 30.31, 0.0, 52.51], "audiomae_on_audioset": [null, [["vehicle", 31.78], ["speech", 28.76], ["skidding", 14.11]], [["speech", 30.48], ["sidetone", 22.37], ["music", 12.08]], null, null], "duration": [0.5, 12.59, 2.29, 0.46, 2.72]} \ No newline at end of file diff --git a/annotations_1/IH8u5eKHNhs_filtered.json b/annotations_1/IH8u5eKHNhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e73e206fd36c8b2bc4e68136e31848d4fd7d3065 --- /dev/null +++ b/annotations_1/IH8u5eKHNhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.0], [26.0, 26.7], [28.0, 28.07], [32.0, 32.56], [35.0, 37.59], [42.0, 42.63], [44.0, 44.64], [46.0, 46.79], [50.0, 50.95], [52.0, 52.19], [57.0, 56.89], [60.0, 60.88], [65.0, 67.41], [68.0, 70.9], [73.0, 77.99], [79.0, 79.07], [79.0, 81.67], [82.0, 83.17], [83.0, 83.84], [84.0, 85.24], [86.0, 86.17], [88.0, 87.78], [93.0, 94.14], [95.0, 95.57], [97.0, 98.34], [100.0, 100.31], [104.0, 104.6], [116.0, 116.11], [128.0, 128.16], [129.0, 132.16], [139.0, 138.89], [140.0, 139.95], [141.0, 141.78], [143.0, 144.1], [145.0, 146.82], [151.0, 152.66], [156.0, 157.47], [170.0, 172.17], [176.0, 175.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.62, 100.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 63.53], ["grunt", 5.49], ["sidetone", 3.42]], null, null, null, null, null, null, null, [["music", 72.15], ["speech", 7.91], ["drum machine", 2.01]], null], "duration": [0.0, 0.7, 0.07, 0.56, 2.59, 0.63, 0.64, 0.79, 0.95, 0.19, -0.11, 0.88, 2.41, 2.9, 4.99, 0.07, 2.67, 1.17, 0.84, 1.24, 0.17, -0.22, 1.14, 0.57, 1.34, 0.31, 0.6, 0.11, 0.16, 3.16, -0.11, -0.05, 0.78, 1.1, 1.82, 1.66, 1.47, 2.17, -0.24]} \ No newline at end of file diff --git a/annotations_1/IJnig4nc0xg_filtered.json b/annotations_1/IJnig4nc0xg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63b68c55442eea862f07effd20721c74ea5b9f4c --- /dev/null +++ b/annotations_1/IJnig4nc0xg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.59], [12.0, 37.25], [39.0, 41.28], [43.0, 49.82], [51.0, 55.16], [56.0, 68.66], [73.0, 80.99], [83.0, 93.7], [94.0, 104.14], [108.0, 117.58], [122.0, 124.24], [124.0, 124.56], [126.0, 126.72], [134.0, 138.74], [147.0, 157.38], [161.0, 161.76], [171.0, 171.0], [184.0, 184.37], [191.0, 194.61], [195.0, 196.45], [207.0, 206.66], [207.0, 208.55]], "keep_status": [false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.96, 30.62, 30.0, 30.26, 30.08, 30.43, 31.36, 29.7, 31.09, 30.35, 0.0, 0.0, 30.93, 32.04, 0.0, 0.0, 0.0, 36.48, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 47.68], ["music", 26.19], ["buzz", 5.52]], [["music", 39.29], ["speech", 19.89], ["trombone", 4.79]], [["music", 82.31], ["speech", 7.6], ["boing", 2.06]], [["music", 59.1], ["cacophony", 6.25], ["throbbing", 5.8]], [["music", 55.63], ["didgeridoo", 7.48], ["speech", 5.15]], [["music", 46.65], ["speech", 25.19], ["synthesizer", 3.95]], [["buzz", 25.91], ["music", 22.24], ["livestock, farm animals, working animals", 15.98]], [["music", 50.26], ["speech", 27.52], ["synthesizer", 5.46]], [["music", 48.19], ["speech", 34.92], ["boing", 11.29]], [["music", 50.9], ["breaking", 12.58], ["speech", 8.37]], null, null, [["music", 42.47], ["speech", 34.16], ["whack, thwack", 4.18]], [["music", 49.87], ["speech", 18.93], ["boing", 8.39]], null, null, null, [["music", 62.73], ["sound effect", 6.57], ["reverberation", 5.07]], null, null, null], "duration": [0.59, 25.25, 2.28, 6.82, 4.16, 12.66, 7.99, 10.7, 10.14, 9.58, 2.24, 0.56, 0.72, 4.74, 10.38, 0.76, 0.0, 0.37, 3.61, 1.45, -0.34, 1.55]} \ No newline at end of file diff --git a/annotations_1/IKa2Mr-yHnE_filtered.json b/annotations_1/IKa2Mr-yHnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2db13f4e2115bf2643f21a131636399eae0d02af --- /dev/null +++ b/annotations_1/IKa2Mr-yHnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.99], [8.0, 110.17]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.99, 102.17]} \ No newline at end of file diff --git a/annotations_1/IKnygn5ysHU_filtered.json b/annotations_1/IKnygn5ysHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d77ac7905a26cd3276667bda14a1c7c53df63c46 --- /dev/null +++ b/annotations_1/IKnygn5ysHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.48], [11.0, 15.97], [16.0, 93.28]], "keep_status": [false, true, false], "silence_prob": [0.0, 36.58, 0.0], "audiomae_on_audioset": [null, [["speech", 37.75], ["music", 21.0], ["radio", 8.17]], null], "duration": [0.48, 4.97, 77.28]} \ No newline at end of file diff --git a/annotations_1/IL-_pNnEuk8_filtered.json b/annotations_1/IL-_pNnEuk8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76115b8bd5c8d0abd9d04b9035d23537628bff23 --- /dev/null +++ b/annotations_1/IL-_pNnEuk8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.7], [11.0, 10.83], [14.0, 13.95], [15.0, 15.55], [17.0, 17.24], [19.0, 19.79], [21.0, 21.98], [24.0, 23.9], [27.0, 30.35], [32.0, 32.48], [39.0, 41.86], [46.0, 46.13], [56.0, 57.38], [58.0, 58.94], [60.0, 61.87], [70.0, 75.59], [77.0, 78.41], [89.0, 89.88], [91.0, 108.28], [115.0, 114.72], [115.0, 116.5], [119.0, 119.08], [124.0, 124.66], [127.0, 130.76], [132.0, 136.58], [138.0, 139.02], [141.0, 141.02], [151.0, 151.21], [165.0, 166.97], [168.0, 169.99], [170.0, 173.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.53, 0.0, 42.13, 0.0, 0.0, 0.0, 0.0, 64.86, 0.0, 0.0, 77.87, 0.0, 0.0, 0.0, 0.0, 96.17, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["vehicle", 16.01], ["buzz", 11.65], ["hum", 8.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.7, -0.17, -0.05, 0.55, 0.24, 0.79, 0.98, -0.1, 3.35, 0.48, 2.86, 0.13, 1.38, 0.94, 1.87, 5.59, 1.41, 0.88, 17.28, -0.28, 1.5, 0.08, 0.66, 3.76, 4.58, 1.02, 0.02, 0.21, 1.97, 1.99, 3.45]} \ No newline at end of file diff --git a/annotations_1/ILbn3iOiOiU_filtered.json b/annotations_1/ILbn3iOiOiU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ecaa3743419cf0772b28398a3dfb65e9d1ab3be --- /dev/null +++ b/annotations_1/ILbn3iOiOiU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [0.0, 71.71]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.38, 71.71]} \ No newline at end of file diff --git a/annotations_1/ILkyIHOOoq4_filtered.json b/annotations_1/ILkyIHOOoq4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0548b3d1c4fdf7da32d49e41fe9f1ca215cd7f74 --- /dev/null +++ b/annotations_1/ILkyIHOOoq4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.8], [3.0, 3.87], [9.0, 9.54], [10.0, 10.45], [15.0, 16.21], [17.0, 19.53], [22.0, 21.81], [22.0, 38.65], [39.0, 59.49], [60.0, 59.66], [60.0, 59.81], [60.0, 61.15], [62.0, 62.21], [63.0, 62.72], [63.0, 68.05], [68.0, 69.01], [70.0, 83.54], [85.0, 85.63], [86.0, 87.32], [88.0, 88.6], [103.0, 104.36], [106.0, 107.4], [109.0, 108.99], [109.0, 109.83], [114.0, 114.34], [116.0, 119.23], [124.0, 124.65], [125.0, 126.18], [128.0, 127.94], [133.0, 133.39], [134.0, 135.06], [136.0, 135.97], [142.0, 142.86], [144.0, 145.39], [148.0, 148.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 82.25, 66.63, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.2, 0.87, 0.54, 0.45, 1.21, 2.53, -0.19, 16.65, 20.49, -0.34, -0.19, 1.15, 0.21, -0.28, 5.05, 1.01, 13.54, 0.63, 1.32, 0.6, 1.36, 1.4, -0.01, 0.83, 0.34, 3.23, 0.65, 1.18, -0.06, 0.39, 1.06, -0.03, 0.86, 1.39, 0.83]} \ No newline at end of file diff --git a/annotations_1/ILwJA2feDRs_filtered.json b/annotations_1/ILwJA2feDRs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fad4f5ad3655ea93cabc4803b4fcab74739cf81b --- /dev/null +++ b/annotations_1/ILwJA2feDRs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 120.34]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [74.34]} \ No newline at end of file diff --git a/annotations_1/IMPHXKW9ntw_filtered.json b/annotations_1/IMPHXKW9ntw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3409988b4c87aa176aa182d15de709f69b7105fb --- /dev/null +++ b/annotations_1/IMPHXKW9ntw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.09], [10.0, 11.26], [11.0, 14.44], [16.0, 17.37], [19.0, 66.23], [68.0, 68.69], [69.0, 71.85], [74.0, 76.05], [76.0, 102.91], [105.0, 105.43], [108.0, 113.54], [114.0, 115.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [78.55, 0.0, 89.19, 0.0, 0.0, 0.0, 97.92, 96.89, 36.06, 0.0, 33.49, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 58.43], ["ambient music", 13.53], ["singing bowl", 6.4]], null, [["hum", 36.56], ["music", 18.4], ["throbbing", 12.63]], null], "duration": [3.09, 1.26, 3.44, 1.37, 47.23, 0.69, 2.85, 2.05, 26.91, 0.43, 5.54, 1.86]} \ No newline at end of file diff --git a/annotations_1/IMQADg1Dp9g_filtered.json b/annotations_1/IMQADg1Dp9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..977b856e6e7b6202715426cbbe8a6dec185b0f19 --- /dev/null +++ b/annotations_1/IMQADg1Dp9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.76], [2.0, 3.77], [5.0, 5.0], [5.0, 9.04], [13.0, 13.96], [19.0, 22.44], [24.0, 24.6], [26.0, 29.76], [30.0, 30.27], [31.0, 53.2], [55.0, 55.43], [59.0, 73.01], [75.0, 75.19], [76.0, 82.48], [85.0, 89.56], [90.0, 121.07], [124.0, 124.5], [126.0, 126.57], [128.0, 129.09], [130.0, 132.48], [133.0, 135.21], [141.0, 140.93], [142.0, 142.25], [145.0, 145.02], [147.0, 148.46], [152.0, 154.55]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 58.55, 0.0, 35.99, 0.0, 32.48, 0.0, 33.28, 0.0, 31.73, 0.0, 98.93, 67.13, 0.0, 0.0, 0.0, 0.0, 49.82, 46.26, 0.0, 0.0, 0.0, 0.0, 54.7], "audiomae_on_audioset": [null, null, null, null, null, [["mosquito", 25.99], ["music", 16.9], ["fly, housefly", 10.74]], null, [["music", 74.1], ["theremin", 8.82], ["musical instrument", 2.15]], null, [["music", 59.35], ["didgeridoo", 10.85], ["speech", 3.33]], null, [["music", 46.99], ["speech", 12.31], ["didgeridoo", 3.07]], null, null, null, null, null, null, null, [["speech", 67.42], ["throbbing", 4.15], ["sidetone", 2.38]], [["speech", 21.76], ["music", 11.74], ["moo", 6.98]], null, null, null, null, null], "duration": [-0.24, 1.77, 0.0, 4.04, 0.96, 3.44, 0.6, 3.76, 0.27, 22.2, 0.43, 14.01, 0.19, 6.48, 4.56, 31.07, 0.5, 0.57, 1.09, 2.48, 2.21, -0.07, 0.25, 0.02, 1.46, 2.55]} \ No newline at end of file diff --git a/annotations_1/IMT0EqTWI6I_filtered.json b/annotations_1/IMT0EqTWI6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd3e56a248b46144a1146df846f2755b7daff820 --- /dev/null +++ b/annotations_1/IMT0EqTWI6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.61], [10.0, 36.64], [39.0, 70.9], [72.0, 73.99], [76.0, 126.22], [127.0, 130.22], [131.0, 131.6], [135.0, 141.86], [145.0, 152.32], [153.0, 154.9], [157.0, 157.28], [159.0, 159.04], [161.0, 160.93], [162.0, 162.36], [164.0, 164.76], [166.0, 167.91], [169.0, 170.7], [174.0, 174.73], [178.0, 180.17], [181.0, 191.49], [192.0, 192.7], [196.0, 197.92], [199.0, 202.85]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [30.45, 29.48, 0.0, 0.0, 0.0, 48.23, 0.0, 57.48, 69.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.11, 42.98, 0.0, 0.0, 55.89], "audiomae_on_audioset": [[["music", 35.98], ["didgeridoo", 12.27], ["brass instrument", 7.85]], [["music", 45.89], ["speech", 28.95], ["foghorn", 3.21]], null, null, null, [["music", 29.97], ["cattle, bovinae", 10.71], ["moo", 9.92]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.31], ["music", 11.42], ["theremin", 6.82]], [["theremin", 51.64], ["music", 32.84], ["didgeridoo", 3.84]], null, null, null], "duration": [5.61, 26.64, 31.9, 1.99, 50.22, 3.22, 0.6, 6.86, 7.32, 1.9, 0.28, 0.04, -0.07, 0.36, 0.76, 1.91, 1.7, 0.73, 2.17, 10.49, 0.7, 1.92, 3.85]} \ No newline at end of file diff --git a/annotations_1/IMr_irerhRE_filtered.json b/annotations_1/IMr_irerhRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56612dba84b18af0a53d9d072d648eaef1221b52 --- /dev/null +++ b/annotations_1/IMr_irerhRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.24], [13.0, 37.77], [40.0, 58.53], [60.0, 72.91], [74.0, 75.98], [76.0, 76.01], [78.0, 82.81], [86.0, 91.69], [95.0, 99.33], [103.0, 105.38], [109.0, 109.59], [110.0, 119.69], [122.0, 123.38]], "keep_status": [false, false, false, true, false, false, true, true, true, true, false, false, false], "silence_prob": [49.78, 43.23, 33.81, 31.18, 0.0, 0.0, 35.56, 33.3, 29.59, 29.82, 0.0, 55.46, 0.0], "audiomae_on_audioset": [[["music", 58.85], ["ambient music", 10.85], ["musical instrument", 3.34]], [["music", 79.02], ["ambient music", 4.08], ["electronic music", 1.73]], [["music", 42.29], ["hum", 18.23], ["mains hum", 14.57]], [["music", 42.68], ["speech", 12.95], ["hum", 12.29]], null, null, [["music", 30.27], ["hum", 15.11], ["mains hum", 10.79]], [["music", 23.95], ["speech", 17.85], ["hum", 10.13]], [["music", 22.82], ["mains hum", 21.84], ["hum", 16.36]], [["vehicle", 15.64], ["rumble", 10.71], ["livestock, farm animals, working animals", 8.6]], null, null, null], "duration": [4.24, 24.77, 18.53, 12.91, 1.98, 0.01, 4.81, 5.69, 4.33, 2.38, 0.59, 9.69, 1.38]} \ No newline at end of file diff --git a/annotations_1/INrZ0l5JbrA_filtered.json b/annotations_1/INrZ0l5JbrA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e1258fe2e2d113c0699966d771cd5f3360a2166 --- /dev/null +++ b/annotations_1/INrZ0l5JbrA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [5.0, 6.24], [18.0, 39.04], [40.0, 80.27], [86.0, 101.49], [103.0, 106.27]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.16, 0.0, 30.15, 29.48], "audiomae_on_audioset": [null, null, [["music", 79.51], ["didgeridoo", 7.51], ["percussion", 2.27]], null, [["music", 55.75], ["musical instrument", 8.53], ["synthesizer", 6.71]], [["music", 88.5], ["musical instrument", 0.91], ["techno", 0.77]]], "duration": [0.51, 1.24, 21.04, 40.27, 15.49, 3.27]} \ No newline at end of file diff --git a/annotations_1/IORWBsyIivo_filtered.json b/annotations_1/IORWBsyIivo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de82af84198e47bf4f8ddac53c7cc7b60d2686ee --- /dev/null +++ b/annotations_1/IORWBsyIivo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 8.43], [10.0, 11.62], [12.0, 12.88], [14.0, 29.56], [30.0, 37.18], [40.0, 47.78], [49.0, 48.83], [49.0, 49.94], [51.0, 75.0], [79.0, 81.77], [83.0, 84.54], [86.0, 86.48], [88.0, 91.69], [93.0, 93.28], [94.0, 96.52], [98.0, 98.32], [106.0, 105.8], [107.0, 109.36], [112.0, 113.98], [115.0, 117.31], [119.0, 120.36], [121.0, 122.08], [124.0, 126.2], [128.0, 128.09], [129.0, 138.15], [140.0, 147.55], [149.0, 149.88], [151.0, 155.48], [157.0, 160.69], [162.0, 172.54]], "keep_status": [false, false, false, true, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.04, 0.0, 0.0, 36.63, 32.09, 31.86, 0.0, 0.0, 34.66, 54.97, 0.0, 0.0, 35.83, 0.0, 59.42, 0.0, 0.0, 61.18, 0.0, 84.25, 0.0, 0.0, 76.7, 0.0, 60.32, 56.78, 0.0, 77.87, 79.41, 87.55], "audiomae_on_audioset": [[["music", 56.63], ["fart", 9.2], ["buzz", 8.76]], null, null, [["music", 20.02], ["buzz", 17.84], ["rumble", 14.82]], [["music", 48.67], ["throbbing", 16.37], ["didgeridoo", 3.85]], [["music", 47.35], ["noise", 11.36], ["grunt", 7.26]], null, null, [["music", 59.64], ["speech", 26.11], ["breaking", 1.19]], null, null, null, [["music", 37.5], ["roaring cats (lions, tigers)", 6.29], ["groan", 5.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.43, 1.62, 0.88, 15.56, 7.18, 7.78, -0.17, 0.94, 24.0, 2.77, 1.54, 0.48, 3.69, 0.28, 2.52, 0.32, -0.2, 2.36, 1.98, 2.31, 1.36, 1.08, 2.2, 0.09, 9.15, 7.55, 0.88, 4.48, 3.69, 10.54]} \ No newline at end of file diff --git a/annotations_1/IPPeDiU4Vdo_filtered.json b/annotations_1/IPPeDiU4Vdo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd3509aac343605a31bf70b1a7bdd10d6ec36cd8 --- /dev/null +++ b/annotations_1/IPPeDiU4Vdo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.74], [9.0, 9.41], [13.0, 14.5], [17.0, 17.69], [19.0, 21.49], [22.0, 22.35], [23.0, 22.77], [23.0, 22.94], [26.0, 26.28], [27.0, 27.04], [32.0, 34.01], [34.0, 34.08], [34.0, 36.91], [37.0, 37.27], [47.0, 51.7], [58.0, 58.21], [69.0, 69.62], [85.0, 85.65], [92.0, 92.99], [100.0, 100.95], [105.0, 105.44], [106.0, 108.55], [110.0, 110.81], [116.0, 116.77], [119.0, 120.04], [126.0, 128.49], [129.0, 129.54], [132.0, 133.91], [137.0, 138.45], [139.0, 140.24], [141.0, 141.61], [144.0, 143.92], [146.0, 146.45], [158.0, 158.84], [164.0, 166.36], [168.0, 171.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 74.29, 0.0, 37.37, 0.0, 56.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 0.0, 0.0, 0.0, 96.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.54, 50.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 83.11], ["boing", 9.47], ["inside, small room", 2.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.32], ["music", 12.4], ["vehicle", 3.29]], null], "duration": [0.74, 0.41, 1.5, 0.69, 2.49, 0.35, -0.23, -0.06, 0.28, 0.04, 2.01, 0.08, 2.91, 0.27, 4.7, 0.21, 0.62, 0.65, 0.99, 0.95, 0.44, 2.55, 0.81, 0.77, 1.04, 2.49, 0.54, 1.91, 1.45, 1.24, 0.61, -0.08, 0.45, 0.84, 2.36, 3.78]} \ No newline at end of file diff --git a/annotations_1/IQWtTLEslg8_filtered.json b/annotations_1/IQWtTLEslg8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b65e17453e7355303a660f0bce669b356e7a15b --- /dev/null +++ b/annotations_1/IQWtTLEslg8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.51], [10.0, 9.95], [10.0, 23.75], [24.0, 33.0], [34.0, 38.23], [39.0, 46.87], [47.0, 49.92], [55.0, 147.34]], "keep_status": [true, false, true, false, false, true, true, false], "silence_prob": [34.21, 0.0, 28.98, 30.29, 30.05, 28.68, 28.26, 0.0], "audiomae_on_audioset": [[["music", 39.95], ["noise", 10.74], ["hum", 7.59]], null, [["music", 33.64], ["fart", 10.18], ["speech", 9.45]], [["music", 56.02], ["didgeridoo", 19.5], ["musical instrument", 2.99]], [["music", 79.19], ["hum", 2.74], ["electronic music", 2.51]], [["music", 24.25], ["vehicle", 16.72], ["motorcycle", 14.09]], [["music", 27.16], ["wild animals", 22.58], ["animal", 17.33]], null], "duration": [2.51, -0.05, 13.75, 9.0, 4.23, 7.87, 2.92, 92.34]} \ No newline at end of file diff --git a/annotations_1/IQuxKuLkByg_filtered.json b/annotations_1/IQuxKuLkByg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da5a16b681bf2862431c21033fc62352707afd6f --- /dev/null +++ b/annotations_1/IQuxKuLkByg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.75], [9.0, 9.61], [11.0, 13.66], [15.0, 16.17], [17.0, 18.05], [19.0, 19.2], [22.0, 22.4], [27.0, 34.3], [36.0, 37.17], [39.0, 38.94], [39.0, 39.12], [40.0, 42.21], [42.0, 44.29], [45.0, 54.4], [56.0, 69.79], [71.0, 76.84], [78.0, 83.32], [87.0, 87.39], [91.0, 93.99], [96.0, 111.35], [115.0, 115.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 51.18, 0.0, 0.0, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 46.72, 44.72, 36.54, 46.36, 39.35, 34.67, 0.0, 31.06, 29.62, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 19.27], ["music", 16.61], ["mains hum", 12.05]], [["throbbing", 30.41], ["hum", 26.81], ["mains hum", 9.32]], [["hum", 35.26], ["music", 20.13], ["mains hum", 17.27]], [["music", 21.96], ["hum", 13.67], ["insect", 9.46]], [["music", 46.39], ["hum", 5.69], ["didgeridoo", 4.17]], [["music", 73.88], ["ambient music", 4.9], ["scary music", 3.92]], null, [["hum", 41.06], ["music", 24.25], ["mains hum", 18.67]], [["music", 67.74], ["musical instrument", 3.08], ["buzz", 2.92]], null], "duration": [-0.25, 0.61, 2.66, 1.17, 1.05, 0.2, 0.4, 7.3, 1.17, -0.06, 0.12, 2.21, 2.29, 9.4, 13.79, 5.84, 5.32, 0.39, 2.99, 15.35, 0.5]} \ No newline at end of file diff --git a/annotations_1/IRycPfFjVBI_filtered.json b/annotations_1/IRycPfFjVBI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e48e5bf7785f1a043421df2939940ceb4ac3075 --- /dev/null +++ b/annotations_1/IRycPfFjVBI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 27.89], [28.0, 33.99], [36.0, 40.12], [41.0, 41.37], [42.0, 57.38], [62.0, 80.42], [81.0, 119.43], [120.0, 121.63], [126.0, 126.72], [128.0, 129.91], [133.0, 133.96], [136.0, 137.13], [140.0, 140.56], [142.0, 157.72], [160.0, 177.45]], "keep_status": [false, true, true, false, true, true, false, false, false, false, false, false, false, true, true], "silence_prob": [30.0, 34.76, 28.57, 0.0, 28.45, 29.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.47, 28.56], "audiomae_on_audioset": [[["music", 63.64], ["throbbing", 10.06], ["hum", 9.3]], [["music", 31.1], ["speech", 16.87], ["hum", 16.8]], [["speech", 20.78], ["groan", 10.79], ["whack, thwack", 6.44]], null, [["music", 39.79], ["speech", 7.42], ["groan", 7.11]], [["speech", 34.05], ["music", 18.95], ["hum", 8.41]], null, null, null, null, null, null, null, [["music", 36.1], ["hum", 17.19], ["speech", 8.4]], [["music", 23.35], ["mains hum", 12.58], ["hum", 11.6]]], "duration": [24.89, 5.99, 4.12, 0.37, 15.38, 18.42, 38.43, 1.63, 0.72, 1.91, 0.96, 1.13, 0.56, 15.72, 17.45]} \ No newline at end of file diff --git a/annotations_1/IS-TH-YQbL8_filtered.json b/annotations_1/IS-TH-YQbL8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3794084282ad5a84666a0a72dae0c64784232f8c --- /dev/null +++ b/annotations_1/IS-TH-YQbL8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 40.09], [41.0, 42.42], [44.0, 51.68], [53.0, 53.32], [55.0, 55.68], [57.0, 61.23], [62.0, 62.41], [63.0, 63.96], [65.0, 67.49], [68.0, 69.03], [69.0, 69.25], [69.0, 69.31], [69.0, 77.31], [79.0, 79.88], [82.0, 82.29], [84.0, 84.77], [86.0, 86.54], [87.0, 87.89], [90.0, 91.25], [92.0, 92.18], [93.0, 93.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 99.96, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 95.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [24.09, 1.42, 7.68, 0.32, 0.68, 4.23, 0.41, 0.96, 2.49, 1.03, 0.25, 0.31, 8.31, 0.88, 0.29, 0.77, 0.54, 0.89, 1.25, 0.18, 0.31]} \ No newline at end of file diff --git a/annotations_1/ISKL5Sy_Mt8_filtered.json b/annotations_1/ISKL5Sy_Mt8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c767a68541af8e7061c4081074371093037a0ca0 --- /dev/null +++ b/annotations_1/ISKL5Sy_Mt8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.73], [10.0, 15.79], [18.0, 18.28], [19.0, 31.16], [34.0, 62.38], [65.0, 65.33], [66.0, 71.61], [72.0, 74.48], [76.0, 76.72], [77.0, 77.63], [83.0, 84.77], [85.0, 86.34], [89.0, 132.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.96, 0.0, 60.51, 83.7, 0.0, 51.28, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.73, 5.79, 0.28, 12.16, 28.38, 0.33, 5.61, 2.48, 0.72, 0.63, 1.77, 1.34, 43.19]} \ No newline at end of file diff --git a/annotations_1/ISQMNhOd96w_filtered.json b/annotations_1/ISQMNhOd96w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2f4ab5d6dd2d11e2ec9d63d52166d82c7a959d4 --- /dev/null +++ b/annotations_1/ISQMNhOd96w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.04], [18.0, 19.82], [28.0, 28.68], [29.0, 32.49], [33.0, 34.77], [38.0, 38.16], [45.0, 46.55], [53.0, 53.77], [58.0, 59.31], [61.0, 61.87], [64.0, 65.31], [67.0, 66.87], [76.0, 78.19], [79.0, 80.97], [83.0, 83.86], [84.0, 84.89], [86.0, 86.75], [88.0, 87.94], [93.0, 94.83], [99.0, 100.31], [103.0, 108.55], [116.0, 117.14], [124.0, 123.82], [138.0, 139.26], [143.0, 143.36], [143.0, 154.14], [173.0, 173.13], [175.0, 176.57]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.38, 0.0, 0.0, 0.0, 0.0, 41.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 42.25], ["gunshot, gunfire", 10.0], ["music", 7.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 43.6], ["chirp tone", 12.83], ["speech", 8.76]], null, null, null, null, [["music", 72.3], ["theremin", 8.64], ["didgeridoo", 2.8]], null, null], "duration": [0.04, 1.82, 0.68, 3.49, 1.77, 0.16, 1.55, 0.77, 1.31, 0.87, 1.31, -0.13, 2.19, 1.97, 0.86, 0.89, 0.75, -0.06, 1.83, 1.31, 5.55, 1.14, -0.18, 1.26, 0.36, 11.14, 0.13, 1.57]} \ No newline at end of file diff --git a/annotations_1/IT236O8f-J8_filtered.json b/annotations_1/IT236O8f-J8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8aab1569c7d374efc792449ac502684098aceed2 --- /dev/null +++ b/annotations_1/IT236O8f-J8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.86], [11.0, 22.52], [23.0, 23.21], [23.0, 30.28], [31.0, 42.52], [45.0, 46.08], [52.0, 52.42], [54.0, 54.57], [60.0, 67.95], [69.0, 72.37], [74.0, 77.43], [78.0, 79.29], [82.0, 83.0], [84.0, 90.14], [91.0, 95.59], [98.0, 98.1], [101.0, 101.34], [108.0, 111.74], [115.0, 116.6], [118.0, 140.26], [141.0, 146.7], [147.0, 151.68], [152.0, 153.25], [154.0, 155.53], [159.0, 162.78], [166.0, 166.85], [168.0, 168.71]], "keep_status": [false, false, false, true, true, false, false, false, false, true, false, false, false, true, false, false, false, true, false, true, true, true, false, false, true, false, false], "silence_prob": [28.69, 28.72, 0.0, 29.01, 28.99, 0.0, 0.0, 0.0, 34.8, 35.93, 38.36, 0.0, 0.0, 28.87, 30.8, 0.0, 0.0, 29.34, 0.0, 29.09, 35.4, 38.02, 0.0, 0.0, 33.11, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 27.46], ["speech", 26.63], ["music", 16.99]], [["speech", 38.3], ["vehicle", 36.5], ["helicopter", 11.77]], null, [["speech", 36.23], ["music", 16.31], ["hum", 5.25]], [["music", 28.7], ["speech", 13.39], ["buzz", 7.22]], null, null, null, [["music", 70.7], ["scary music", 5.18], ["hum", 3.78]], [["music", 23.86], ["throbbing", 12.05], ["electronic music", 11.04]], [["music", 54.39], ["throbbing", 21.48], ["hum", 8.28]], null, null, [["music", 24.32], ["throbbing", 23.37], ["hum", 19.94]], [["throbbing", 28.01], ["hum", 22.81], ["mains hum", 19.81]], null, null, [["mains hum", 14.48], ["hum", 10.55], ["vehicle", 10.06]], null, [["speech", 23.92], ["music", 20.41], ["vehicle", 17.38]], [["speech", 26.25], ["hum", 16.49], ["music", 16.2]], [["speech", 40.44], ["hum", 13.27], ["mains hum", 9.01]], null, null, [["music", 45.49], ["hum", 6.87], ["speech", 6.19]], null, null], "duration": [6.86, 11.52, 0.21, 7.28, 11.52, 1.08, 0.42, 0.57, 7.95, 3.37, 3.43, 1.29, 1.0, 6.14, 4.59, 0.1, 0.34, 3.74, 1.6, 22.26, 5.7, 4.68, 1.25, 1.53, 3.78, 0.85, 0.71]} \ No newline at end of file diff --git a/annotations_1/IT4vcwIvSCI_filtered.json b/annotations_1/IT4vcwIvSCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f9026f980d555d8a226b80497886a3fbb6f3da8 --- /dev/null +++ b/annotations_1/IT4vcwIvSCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.71], [4.0, 4.82], [5.0, 8.09], [9.0, 9.71], [11.0, 11.6], [16.0, 16.7], [17.0, 17.44], [17.0, 17.58], [19.0, 19.57], [23.0, 26.27], [27.0, 27.62], [30.0, 30.3], [31.0, 31.33], [32.0, 36.95], [37.0, 65.75], [68.0, 90.85], [93.0, 93.73], [94.0, 105.54]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 84.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.97, 0.0, 0.0, 0.0, 35.8, 32.52, 34.36, 0.0, 31.69], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 54.61], ["musical instrument", 4.82], ["thunk", 2.81]], null, null, null, [["music", 48.61], ["water", 12.0], ["liquid", 3.09]], [["music", 56.09], ["electronic music", 4.55], ["synthesizer", 4.0]], [["music", 70.5], ["electronic music", 3.97], ["crushing", 3.45]], null, [["music", 74.26], ["didgeridoo", 9.84], ["synthesizer", 2.3]]], "duration": [0.71, 0.82, 3.09, 0.71, 0.6, 0.7, 0.44, 0.58, 0.57, 3.27, 0.62, 0.3, 0.33, 4.95, 28.75, 22.85, 0.73, 11.54]} \ No newline at end of file diff --git a/annotations_1/IVRy-Jac660_filtered.json b/annotations_1/IVRy-Jac660_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29d72ff66912821327125aa1ea2db2c5aaf8abec --- /dev/null +++ b/annotations_1/IVRy-Jac660_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [9.0, 9.39], [12.0, 12.31], [19.0, 20.19], [22.0, 23.31], [24.0, 24.7], [28.0, 28.7], [30.0, 30.08], [35.0, 35.75], [40.0, 40.47], [41.0, 45.39], [47.0, 46.92], [48.0, 48.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 53.33], ["explosion", 17.63], ["music", 6.0]], null, null], "duration": [1.56, 0.39, 0.31, 1.19, 1.31, 0.7, 0.7, 0.08, 0.75, 0.47, 4.39, -0.08, 0.93]} \ No newline at end of file diff --git a/annotations_1/IWmzBLX4j8s_filtered.json b/annotations_1/IWmzBLX4j8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/IWmzBLX4j8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/IXep9SfBhrg_filtered.json b/annotations_1/IXep9SfBhrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76c94c207a0f2406c301e150c1a752189410a068 --- /dev/null +++ b/annotations_1/IXep9SfBhrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [11.0, 98.98], [101.0, 117.78], [121.0, 124.93], [126.0, 145.57], [147.0, 148.53]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 44.18, 32.62, 33.78, 0.0], "audiomae_on_audioset": [null, null, [["music", 30.26], ["theremin", 13.36], ["didgeridoo", 7.46]], [["music", 38.41], ["theremin", 32.47], ["foghorn", 4.12]], [["music", 72.18], ["electronic music", 7.4], ["trance music", 3.01]], null], "duration": [0.38, 87.98, 16.78, 3.93, 19.57, 1.53]} \ No newline at end of file diff --git a/annotations_1/IXl4S2_5sX4_filtered.json b/annotations_1/IXl4S2_5sX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3604d089141a7ba01f9f538f379c696102003c5 --- /dev/null +++ b/annotations_1/IXl4S2_5sX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 24.26], [25.0, 70.95], [73.0, 73.7]], "keep_status": [false, false, false], "silence_prob": [29.72, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 42.82], ["explosion", 35.84], ["burst, pop", 6.5]], null, null], "duration": [9.26, 45.95, 0.7]} \ No newline at end of file diff --git a/annotations_1/IXmWL4J2wwI_filtered.json b/annotations_1/IXmWL4J2wwI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20900b4581f29858de009923f76c15f779738c36 --- /dev/null +++ b/annotations_1/IXmWL4J2wwI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 79.62], [84.0, 95.27], [96.0, 96.63], [100.0, 99.96], [102.0, 124.6], [125.0, 126.08], [130.0, 140.14], [143.0, 146.96], [148.0, 148.41], [152.0, 151.92], [155.0, 158.94]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [31.0, 29.3, 0.0, 0.0, 28.95, 0.0, 29.05, 31.18, 0.0, 0.0, 33.71], "audiomae_on_audioset": [[["music", 34.45], ["hum", 9.07], ["electric shaver, electric razor", 7.9]], [["music", 50.63], ["race car, auto racing", 3.11], ["cowbell", 2.51]], null, null, [["music", 69.8], ["speech", 6.36], ["cacophony", 3.3]], null, [["music", 75.16], ["electronic music", 3.2], ["throbbing", 2.49]], [["fly, housefly", 43.4], ["mosquito", 15.11], ["insect", 12.7]], null, null, [["hum", 35.18], ["throbbing", 19.61], ["music", 16.78]]], "duration": [26.62, 11.27, 0.63, -0.04, 22.6, 1.08, 10.14, 3.96, 0.41, -0.08, 3.94]} \ No newline at end of file diff --git a/annotations_1/IXwwGEJkx8Y_filtered.json b/annotations_1/IXwwGEJkx8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1da3d3ad226d2b68972f605b141ff75b7ad6f30 --- /dev/null +++ b/annotations_1/IXwwGEJkx8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.58], [7.0, 9.56], [11.0, 11.35], [12.0, 12.68], [14.0, 14.05], [16.0, 16.28], [18.0, 18.89], [20.0, 20.76], [22.0, 23.18], [24.0, 25.44], [26.0, 27.38], [29.0, 30.08], [33.0, 34.99], [37.0, 37.74], [39.0, 41.03], [42.0, 42.63], [43.0, 43.36], [44.0, 46.55], [48.0, 49.03], [50.0, 52.3], [55.0, 55.58], [58.0, 59.16], [61.0, 62.24], [63.0, 66.12], [67.0, 68.0], [69.0, 72.0], [74.0, 74.46], [77.0, 77.72], [78.0, 79.2], [80.0, 80.5], [83.0, 85.67], [87.0, 87.52], [90.0, 90.83], [94.0, 94.07], [95.0, 96.4], [97.0, 98.61], [102.0, 105.0], [108.0, 112.7], [114.0, 116.46], [118.0, 119.28], [121.0, 121.95], [124.0, 125.58], [127.0, 128.71], [129.0, 133.05], [133.0, 138.08], [140.0, 141.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 48.14, 0.0, 60.14, 0.0, 0.0, 0.0, 93.6, 0.0, 56.03, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 63.85, 93.91, 0.0, 0.0, 0.0, 0.0, 85.54, 51.5, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.85], ["radio", 8.76], ["fly, housefly", 6.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.58, 2.56, 0.35, 0.68, 0.05, 0.28, 0.89, 0.76, 1.18, 1.44, 1.38, 1.08, 1.99, 0.74, 2.03, 0.63, 0.36, 2.55, 1.03, 2.3, 0.58, 1.16, 1.24, 3.12, 1.0, 3.0, 0.46, 0.72, 1.2, 0.5, 2.67, 0.52, 0.83, 0.07, 1.4, 1.61, 3.0, 4.7, 2.46, 1.28, 0.95, 1.58, 1.71, 4.05, 5.08, 1.49]} \ No newline at end of file diff --git a/annotations_1/IYfuTlTiixA_filtered.json b/annotations_1/IYfuTlTiixA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d11a9dd893dd9e21a6a4f15a14090d73ac2b9b4 --- /dev/null +++ b/annotations_1/IYfuTlTiixA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.32], [7.0, 8.88], [10.0, 10.71], [12.0, 12.29], [14.0, 14.52], [17.0, 17.81], [20.0, 20.14], [41.0, 41.77], [48.0, 48.09], [51.0, 50.8], [93.0, 93.39], [96.0, 96.7], [100.0, 100.97], [103.0, 103.08], [130.0, 130.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 1.88, 0.71, 0.29, 0.52, 0.81, 0.14, 0.77, 0.09, -0.2, 0.39, 0.7, 0.97, 0.08, 0.71]} \ No newline at end of file diff --git a/annotations_1/IZxYRZdq2P0_filtered.json b/annotations_1/IZxYRZdq2P0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fcbc789ae3068f258abdd42a4d653ecb313ff18 --- /dev/null +++ b/annotations_1/IZxYRZdq2P0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 17.54]], "keep_status": [true], "silence_prob": [31.39], "audiomae_on_audioset": [[["speech", 17.04], ["music", 13.94], ["groan", 6.5]]], "duration": [9.54]} \ No newline at end of file diff --git a/annotations_1/I_TkNxwnJiY_filtered.json b/annotations_1/I_TkNxwnJiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..580d5b65823a8146f57d90b8293fcc67fdc8cb12 --- /dev/null +++ b/annotations_1/I_TkNxwnJiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 31.63], [33.0, 33.08], [34.0, 35.36], [37.0, 37.84], [40.0, 40.29], [43.0, 43.29], [51.0, 58.95], [61.0, 61.33], [62.0, 64.56], [79.0, 78.97], [85.0, 85.18], [87.0, 89.36], [93.0, 97.14], [97.0, 98.86], [101.0, 101.78], [102.0, 103.03], [104.0, 104.82], [105.0, 107.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 50.02, 0.0, 0.0, 83.34, 38.43, 0.0, 0.0, 0.0, 0.0, 92.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.65], ["thunk", 10.45], ["noise", 3.64]], null, null, null, null, null], "duration": [10.63, 0.08, 1.36, 0.84, 0.29, 0.29, 7.95, 0.33, 2.56, -0.03, 0.18, 2.36, 4.14, 1.86, 0.78, 1.03, 0.82, 2.06]} \ No newline at end of file diff --git a/annotations_1/I_X6zWElJdw_filtered.json b/annotations_1/I_X6zWElJdw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..394e0471001f7f5a661acf2e1df2dbb6e3ca1e4d --- /dev/null +++ b/annotations_1/I_X6zWElJdw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.97], [16.0, 17.91], [20.0, 22.54], [24.0, 24.38], [33.0, 34.3], [35.0, 35.77], [37.0, 44.44], [55.0, 57.7], [64.0, 65.01], [81.0, 81.26], [83.0, 82.92], [94.0, 95.69], [97.0, 99.79]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.03, 0.0, 32.62, 0.0, 0.0, 0.0, 30.26, 28.98, 0.0, 0.0, 0.0, 0.0, 98.1], "audiomae_on_audioset": [[["music", 47.69], ["speech", 14.93], ["synthesizer", 4.05]], null, [["music", 61.81], ["drum machine", 5.95], ["musical instrument", 5.14]], null, null, null, [["music", 62.68], ["didgeridoo", 16.69], ["musical instrument", 2.79]], [["moo", 29.39], ["cattle, bovinae", 23.28], ["music", 18.68]], null, null, null, null, null], "duration": [6.97, 1.91, 2.54, 0.38, 1.3, 0.77, 7.44, 2.7, 1.01, 0.26, -0.08, 1.69, 2.79]} \ No newline at end of file diff --git a/annotations_1/IaeWrM5PlmU_filtered.json b/annotations_1/IaeWrM5PlmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd599215a8b98fa8749809936ae37df555abc34f --- /dev/null +++ b/annotations_1/IaeWrM5PlmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [3.0, 3.69], [4.0, 4.68], [5.0, 11.8], [13.0, 16.19], [17.0, 18.35], [19.0, 20.22], [22.0, 83.34], [85.0, 86.27], [90.0, 101.85], [104.0, 126.0], [127.0, 157.81]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 49.59, 53.72, 0.0, 0.0, 0.0, 0.0, 28.97, 29.86, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 47.53], ["musical instrument", 7.81], ["effects unit", 6.32]], null, null, null, null, null, [["vehicle", 58.43], ["car", 8.43], ["motorcycle", 5.04]], [["speech", 31.12], ["fly, housefly", 20.41], ["bee, wasp, etc.", 13.49]], null], "duration": [0.66, 0.69, 0.68, 6.8, 3.19, 1.35, 1.22, 61.34, 1.27, 11.85, 22.0, 30.81]} \ No newline at end of file diff --git a/annotations_1/IeCZqVq7_pY_filtered.json b/annotations_1/IeCZqVq7_pY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..520e345323072b78f817374a63d4c6961fed7975 --- /dev/null +++ b/annotations_1/IeCZqVq7_pY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.12], [6.0, 6.18], [15.0, 15.47], [22.0, 23.7], [31.0, 36.15], [40.0, 40.83], [43.0, 46.53], [49.0, 60.1], [61.0, 61.33], [62.0, 62.45], [64.0, 64.05], [65.0, 65.42], [68.0, 73.7], [79.0, 79.49], [80.0, 82.83], [84.0, 83.98], [84.0, 88.92], [90.0, 90.27], [95.0, 95.84], [107.0, 108.7], [118.0, 118.57], [134.0, 134.5], [144.0, 146.58], [152.0, 159.98], [163.0, 164.88], [165.0, 166.06], [167.0, 171.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 71.72, 64.07, 0.0, 0.0, 0.0, 0.0, 60.51, 0.0, 71.14, 0.0, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0, 78.72, 36.9, 0.0, 0.0, 35.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.43], ["music", 12.53], ["mains hum", 9.41]], null, null, [["speech", 33.32], ["music", 24.24], ["sheep", 7.35]]], "duration": [0.12, 0.18, 0.47, 1.7, 5.15, 0.83, 3.53, 11.1, 0.33, 0.45, 0.05, 0.42, 5.7, 0.49, 2.83, -0.02, 4.92, 0.27, 0.84, 1.7, 0.57, 0.5, 2.58, 7.98, 1.88, 1.06, 4.96]} \ No newline at end of file diff --git a/annotations_1/IegMpeJM1QU_filtered.json b/annotations_1/IegMpeJM1QU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e18b97404702538d9bb91a2c778fb94810122ad --- /dev/null +++ b/annotations_1/IegMpeJM1QU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [4.0, 8.68], [9.0, 11.1], [12.0, 13.53], [15.0, 21.17], [23.0, 25.46], [28.0, 29.47], [31.0, 33.52], [36.0, 40.05], [41.0, 45.42], [46.0, 51.14], [54.0, 54.19], [56.0, 58.56], [59.0, 64.18], [65.0, 65.85], [68.0, 72.0], [74.0, 76.64], [78.0, 79.56], [80.0, 81.48], [83.0, 84.27], [89.0, 90.39], [92.0, 92.99], [96.0, 96.85], [97.0, 98.0], [100.0, 101.83], [105.0, 107.28], [109.0, 109.19], [115.0, 115.57], [121.0, 127.68], [129.0, 130.6], [132.0, 141.89], [149.0, 150.62], [151.0, 152.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 99.91, 64.63, 0.0, 93.29, 92.97, 0.0, 75.88, 99.91, 99.84, 54.3, 0.0, 99.1, 46.47, 0.0, 96.66, 51.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.29, 0.0, 0.0, 34.06, 0.0, 36.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 19.22], ["speech", 13.05], ["heart sounds, heartbeat", 10.86]], null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 37.05], ["music", 21.72], ["hum", 19.64]], null, null, [["hum", 43.64], ["throbbing", 14.3], ["speech", 12.38]], null, [["speech", 31.15], ["hum", 21.9], ["mains hum", 10.83]], null, null], "duration": [0.84, 4.68, 2.1, 1.53, 6.17, 2.46, 1.47, 2.52, 4.05, 4.42, 5.14, 0.19, 2.56, 5.18, 0.85, 4.0, 2.64, 1.56, 1.48, 1.27, 1.39, 0.99, 0.85, 1.0, 1.83, 2.28, 0.19, 0.57, 6.68, 1.6, 9.89, 1.62, 1.31]} \ No newline at end of file diff --git a/annotations_1/IfNo8NJyy8U_filtered.json b/annotations_1/IfNo8NJyy8U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8065497eede42e23a9f9648c1a630d542d0b1236 --- /dev/null +++ b/annotations_1/IfNo8NJyy8U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 50.9], [52.0, 55.53], [56.0, 58.38], [59.0, 77.01], [78.0, 79.35], [80.0, 87.86], [89.0, 90.14], [91.0, 97.48], [98.0, 100.08], [100.0, 103.87], [105.0, 108.62], [110.0, 112.24], [113.0, 117.17], [119.0, 119.42], [120.0, 122.54], [124.0, 126.39], [128.0, 129.51], [132.0, 133.64], [135.0, 135.6], [136.0, 150.31], [151.0, 159.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 85.54, 87.37, 58.55, 0.0, 69.88, 0.0, 60.14, 60.23, 56.93, 68.54, 71.57, 75.39, 0.0, 73.36, 74.29, 0.0, 0.0, 0.0, 46.9, 35.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.83], ["mains hum", 12.53], ["hum", 11.86]], [["hum", 9.44], ["rumble", 8.22], ["singing bowl", 7.43]]], "duration": [46.9, 3.53, 2.38, 18.01, 1.35, 7.86, 1.14, 6.48, 2.08, 3.87, 3.62, 2.24, 4.17, 0.42, 2.54, 2.39, 1.51, 1.64, 0.6, 14.31, 8.54]} \ No newline at end of file diff --git a/annotations_1/IfO6AIsvlKw_filtered.json b/annotations_1/IfO6AIsvlKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f3e30c7f1241aac4ae751c4b62b80c16d443e32 --- /dev/null +++ b/annotations_1/IfO6AIsvlKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.58], [15.0, 23.46], [29.0, 36.44], [39.0, 43.19], [43.0, 44.95], [46.0, 45.98], [50.0, 51.29], [70.0, 70.65], [73.0, 72.64], [75.0, 75.17], [78.0, 78.0], [80.0, 81.36], [93.0, 93.12], [98.0, 99.6], [102.0, 103.06], [106.0, 106.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.11, 30.31, 29.67, 29.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 83.17], ["drum machine", 4.08], ["speech", 2.68]], [["music", 74.79], ["sidetone", 11.05], ["speech", 2.34]], [["music", 81.3], ["sampler", 2.41], ["electronic music", 2.17]], [["music", 38.52], ["boing", 22.37], ["speech", 9.4]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.58, 8.46, 7.44, 4.19, 1.95, -0.02, 1.29, 0.65, -0.36, 0.17, 0.0, 1.36, 0.12, 1.6, 1.06, 0.24]} \ No newline at end of file diff --git a/annotations_1/IfZmBGcWkLI_filtered.json b/annotations_1/IfZmBGcWkLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcda9416fa8952c83eba78840238f05b62e2eb55 --- /dev/null +++ b/annotations_1/IfZmBGcWkLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.53], [10.0, 9.75], [10.0, 10.17], [13.0, 17.61], [19.0, 20.68], [24.0, 25.98], [29.0, 29.76], [30.0, 35.88], [39.0, 39.41], [47.0, 54.72], [55.0, 56.84], [63.0, 66.38], [67.0, 74.29], [80.0, 80.42], [82.0, 83.02], [85.0, 88.13], [93.0, 94.05], [94.0, 98.64], [100.0, 100.63], [101.0, 106.1], [113.0, 119.45], [123.0, 123.11], [123.0, 126.62], [128.0, 130.52], [132.0, 133.91], [135.0, 135.06], [137.0, 137.57], [141.0, 141.03], [145.0, 146.65], [148.0, 148.22], [151.0, 155.07], [156.0, 156.32], [158.0, 158.13], [159.0, 159.97], [161.0, 162.99], [170.0, 172.05], [173.0, 174.19], [177.0, 183.46], [183.0, 187.74]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 57.81, 0.0, 48.95, 0.0, 75.23, 72.01, 0.0, 0.0, 72.46, 0.0, 55.11, 0.0, 51.02, 92.15, 0.0, 33.72, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 29.96, 0.0, 51.55, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 34.53], ["effects unit", 19.84], ["music", 9.55]], null, null, null, null, null, null, null, null, null, null, null, null, [["singing bowl", 14.49], ["music", 11.06], ["reverberation", 10.52]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.2], ["radio", 6.89], ["sidetone", 6.73]], null, null, null], "duration": [1.53, -0.25, 0.17, 4.61, 1.68, 1.98, 0.76, 5.88, 0.41, 7.72, 1.84, 3.38, 7.29, 0.42, 1.02, 3.13, 1.05, 4.64, 0.63, 5.1, 6.45, 0.11, 3.62, 2.52, 1.91, 0.06, 0.57, 0.03, 1.65, 0.22, 4.07, 0.32, 0.13, 0.97, 1.99, 2.05, 1.19, 6.46, 4.74]} \ No newline at end of file diff --git a/annotations_1/IfecgEak80I_filtered.json b/annotations_1/IfecgEak80I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8452a3f90683f2aaa17662506f919a020fbaf210 --- /dev/null +++ b/annotations_1/IfecgEak80I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.41], [7.0, 7.96], [10.0, 23.4], [26.0, 31.94], [33.0, 34.26], [36.0, 38.5], [39.0, 41.76], [43.0, 44.64], [48.0, 50.82], [52.0, 52.59], [54.0, 54.84], [60.0, 61.38], [64.0, 64.96], [66.0, 67.1], [68.0, 70.24], [72.0, 74.66], [76.0, 77.8], [79.0, 82.22], [83.0, 84.81], [86.0, 91.84], [93.0, 93.93], [95.0, 97.34], [99.0, 99.77], [100.0, 103.59], [105.0, 105.68], [108.0, 109.97], [112.0, 111.65], [115.0, 115.67], [117.0, 117.44], [118.0, 119.53], [120.0, 121.66], [122.0, 123.69], [124.0, 128.19], [129.0, 134.69], [135.0, 137.22], [138.0, 139.92], [140.0, 142.08], [143.0, 144.93], [150.0, 150.35], [151.0, 152.51], [154.0, 153.93], [156.0, 157.82], [165.0, 165.21], [168.0, 168.08], [172.0, 173.77], [176.0, 178.14], [180.0, 180.2], [183.0, 183.02], [190.0, 191.81], [194.0, 194.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.92, 81.53, 0.0, 99.91, 66.76, 0.0, 92.31, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 96.77, 0.0, 63.42, 0.0, 55.18, 0.0, 99.9, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.81, 97.73, 70.58, 0.0, 57.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.75, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 29.23], ["boing", 28.25], ["music", 15.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 76.07], ["theremin", 6.8], ["humming", 2.42]], null, null, null, null], "duration": [1.41, 0.96, 13.4, 5.94, 1.26, 2.5, 2.76, 1.64, 2.82, 0.59, 0.84, 1.38, 0.96, 1.1, 2.24, 2.66, 1.8, 3.22, 1.81, 5.84, 0.93, 2.34, 0.77, 3.59, 0.68, 1.97, -0.35, 0.67, 0.44, 1.53, 1.66, 1.69, 4.19, 5.69, 2.22, 1.92, 2.08, 1.93, 0.35, 1.51, -0.07, 1.82, 0.21, 0.08, 1.77, 2.14, 0.2, 0.02, 1.81, 0.7]} \ No newline at end of file diff --git a/annotations_1/Ig6hIs0jsjg_filtered.json b/annotations_1/Ig6hIs0jsjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20232ef195ca848a09589dfb4349fd2043bd8069 --- /dev/null +++ b/annotations_1/Ig6hIs0jsjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.07], [6.0, 7.75], [9.0, 20.44], [24.0, 24.11], [25.0, 25.56], [30.0, 30.33], [31.0, 33.1], [40.0, 41.07], [46.0, 54.01], [55.0, 55.05], [55.0, 55.38], [60.0, 63.05], [63.0, 63.8], [67.0, 68.13], [68.0, 68.49], [69.0, 69.33], [71.0, 72.15], [75.0, 75.41], [76.0, 76.94], [81.0, 81.45], [82.0, 83.57], [88.0, 95.54], [96.0, 100.55], [104.0, 127.26], [128.0, 128.53]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 29.36, 0.0, 0.0, 0.0, 29.79, 0.0, 30.02, 0.0, 0.0, 30.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.36, 30.46, 30.55, 0.0], "audiomae_on_audioset": [null, null, [["hum", 25.47], ["music", 21.69], ["mains hum", 7.25]], null, null, null, [["speech", 53.02], ["skateboard", 11.26], ["vehicle", 2.73]], null, [["music", 56.66], ["speech", 8.66], ["didgeridoo", 6.3]], null, null, [["music", 35.0], ["musical instrument", 7.84], ["speech", 7.1]], null, null, null, null, null, null, null, null, null, [["didgeridoo", 19.47], ["music", 15.61], ["speech", 14.57]], [["music", 47.57], ["animal", 11.19], ["synthesizer", 9.47]], [["cattle, bovinae", 33.73], ["moo", 28.62], ["livestock, farm animals, working animals", 24.35]], null], "duration": [0.07, 1.75, 11.44, 0.11, 0.56, 0.33, 2.1, 1.07, 8.01, 0.05, 0.38, 3.05, 0.8, 1.13, 0.49, 0.33, 1.15, 0.41, 0.94, 0.45, 1.57, 7.54, 4.55, 23.26, 0.53]} \ No newline at end of file diff --git a/annotations_1/IgKQ8z_xNhk_filtered.json b/annotations_1/IgKQ8z_xNhk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f081fb6b73c2d0e0c27da26271671b221ea066a --- /dev/null +++ b/annotations_1/IgKQ8z_xNhk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.54], [11.0, 17.95], [19.0, 20.14], [23.0, 25.22], [29.0, 33.02], [34.0, 36.81], [39.0, 41.01], [42.0, 43.66], [47.0, 49.57], [51.0, 52.27], [53.0, 57.27], [59.0, 61.79], [64.0, 65.3], [66.0, 67.85], [69.0, 74.31], [75.0, 77.14], [78.0, 79.46], [80.0, 85.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.82, 99.78, 0.0, 99.48, 86.27, 99.44, 99.78, 0.0, 97.11, 0.0, 99.8, 78.04, 0.0, 0.0, 65.2, 84.62, 0.0, 81.53], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.54, 6.95, 1.14, 2.22, 4.02, 2.81, 2.01, 1.66, 2.57, 1.27, 4.27, 2.79, 1.3, 1.85, 5.31, 2.14, 1.46, 5.68]} \ No newline at end of file diff --git a/annotations_1/IgTIy5MUBxM_filtered.json b/annotations_1/IgTIy5MUBxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a393454a9b46421a7bb303713c5a0c46d595ae9 --- /dev/null +++ b/annotations_1/IgTIy5MUBxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.61], [21.0, 56.54], [59.0, 69.9], [70.0, 90.56], [92.0, 97.53], [100.0, 100.33], [102.0, 102.25], [104.0, 104.23], [107.0, 106.91], [108.0, 108.41], [109.0, 109.56], [110.0, 110.89], [112.0, 120.78], [122.0, 122.07], [122.0, 122.5], [124.0, 124.11], [125.0, 125.54], [127.0, 127.97], [130.0, 130.65], [132.0, 132.54], [134.0, 135.21], [136.0, 138.99], [141.0, 141.51], [142.0, 143.18], [145.0, 146.52], [147.0, 148.15]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.5, 29.92, 31.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 25.9], ["drum machine", 8.36], ["musical instrument", 6.79]], [["music", 60.78], ["didgeridoo", 3.79], ["throbbing", 3.59]], [["speech", 63.91], ["echo", 3.76], ["music", 2.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 35.54, 10.9, 20.56, 5.53, 0.33, 0.25, 0.23, -0.09, 0.41, 0.56, 0.89, 8.78, 0.07, 0.5, 0.11, 0.54, 0.97, 0.65, 0.54, 1.21, 2.99, 0.51, 1.18, 1.52, 1.15]} \ No newline at end of file diff --git a/annotations_1/IgeW0MPX60Q_filtered.json b/annotations_1/IgeW0MPX60Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a234b475a6eaebafe18dcda69947a2d90b5c2d9a --- /dev/null +++ b/annotations_1/IgeW0MPX60Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.43], [22.0, 22.27], [24.0, 53.05], [57.0, 57.91], [70.0, 70.51], [73.0, 74.85], [76.0, 76.22], [79.0, 80.01], [91.0, 100.68], [114.0, 117.21], [120.0, 120.31], [123.0, 146.5], [147.0, 146.94], [147.0, 147.61]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 28.68, 0.0, 0.0, 0.0, 0.0, 0.0, 31.46, 29.68, 0.0, 29.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.31], ["synthesizer", 8.5], ["sine wave", 4.11]], null, null, null, null, null, [["music", 71.8], ["synthesizer", 7.35], ["throbbing", 4.59]], [["music", 31.04], ["hum", 11.6], ["throbbing", 7.86]], null, [["music", 65.18], ["breaking", 12.21], ["hum", 8.87]], null, null], "duration": [0.43, 0.27, 29.05, 0.91, 0.51, 1.85, 0.22, 1.01, 9.68, 3.21, 0.31, 23.5, -0.06, 0.61]} \ No newline at end of file diff --git a/annotations_1/Igs1WM2pA54_filtered.json b/annotations_1/Igs1WM2pA54_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b750211aa36921feed1fbdd08327e96bad5c3b3b --- /dev/null +++ b/annotations_1/Igs1WM2pA54_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.22], [8.0, 8.67], [10.0, 10.71], [13.0, 14.05], [18.0, 19.65], [21.0, 22.15], [26.0, 26.08], [28.0, 28.43], [30.0, 30.2], [31.0, 31.29], [37.0, 37.39], [44.0, 44.64], [47.0, 47.49], [49.0, 49.32], [51.0, 52.15], [54.0, 55.05], [56.0, 56.91], [58.0, 58.68], [65.0, 65.38], [72.0, 72.18], [75.0, 75.66], [78.0, 81.97], [87.0, 87.81], [90.0, 90.1], [92.0, 92.77], [94.0, 94.76], [97.0, 97.55], [103.0, 104.13], [107.0, 108.65], [111.0, 112.24], [115.0, 114.69], [116.0, 117.15], [119.0, 120.09], [122.0, 122.1], [124.0, 123.94], [126.0, 126.39], [132.0, 132.29], [135.0, 134.89], [140.0, 140.95], [143.0, 144.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.22, 0.67, 0.71, 1.05, 1.65, 1.15, 0.08, 0.43, 0.2, 0.29, 0.39, 0.64, 0.49, 0.32, 1.15, 1.05, 0.91, 0.68, 0.38, 0.18, 0.66, 3.97, 0.81, 0.1, 0.77, 0.76, 0.55, 1.13, 1.65, 1.24, -0.31, 1.15, 1.09, 0.1, -0.06, 0.39, 0.29, -0.11, 0.95, 1.42]} \ No newline at end of file diff --git a/annotations_1/Ih-zPWi9INA_filtered.json b/annotations_1/Ih-zPWi9INA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f5a2f5dcb8067645245723943b0d6bdc892571e --- /dev/null +++ b/annotations_1/Ih-zPWi9INA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.13], [16.0, 24.31], [36.0, 38.4], [43.0, 44.96], [47.0, 48.76], [49.0, 50.62], [52.0, 53.28], [54.0, 58.4], [64.0, 67.64], [71.0, 70.95], [76.0, 77.65], [80.0, 80.42], [83.0, 88.94], [91.0, 100.06], [100.0, 103.47], [110.0, 111.23], [113.0, 113.19]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, true, true, true, false, false], "silence_prob": [64.29, 32.83, 50.81, 0.0, 0.0, 0.0, 0.0, 31.3, 49.97, 0.0, 0.0, 0.0, 36.31, 39.54, 47.78, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 76.42], ["sonar", 5.82], ["electronic music", 5.56]], null, null, null, null, null, [["whale vocalization", 30.06], ["mains hum", 9.16], ["speech", 8.31]], [["music", 12.19], ["throbbing", 11.96], ["hum", 6.99]], null, null, null, [["music", 44.64], ["hum", 8.4], ["throbbing", 6.81]], [["hum", 24.58], ["throbbing", 15.53], ["speech", 5.74]], [["music", 16.84], ["hum", 6.8], ["creak", 5.21]], null, null], "duration": [3.13, 8.31, 2.4, 1.96, 1.76, 1.62, 1.28, 4.4, 3.64, -0.05, 1.65, 0.42, 5.94, 9.06, 3.47, 1.23, 0.19]} \ No newline at end of file diff --git a/annotations_1/Ihkrc6Srv0Y_filtered.json b/annotations_1/Ihkrc6Srv0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..966d6ace08e3c4798c99edea77d62a826dfe946d --- /dev/null +++ b/annotations_1/Ihkrc6Srv0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.18], [9.0, 9.41], [23.0, 23.28], [25.0, 27.21], [33.0, 32.53], [33.0, 37.71], [39.0, 43.66], [47.0, 49.3], [51.0, 55.21], [56.0, 57.55], [64.0, 72.44], [73.0, 73.45], [87.0, 89.95], [93.0, 98.73], [100.0, 101.34], [106.0, 106.59], [110.0, 111.5], [115.0, 116.21], [120.0, 125.39], [138.0, 137.73], [139.0, 146.31], [148.0, 148.46], [149.0, 149.57], [154.0, 158.57], [160.0, 161.91], [163.0, 170.73], [174.0, 175.44], [177.0, 177.67], [179.0, 180.52], [182.0, 183.27], [184.0, 184.6], [189.0, 190.75]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 54.56, 0.0, 30.0, 40.45, 44.46, 43.03, 0.0, 49.64, 0.0, 46.75, 33.45, 0.0, 0.0, 0.0, 0.0, 31.73, 0.0, 30.87, 0.0, 0.0, 34.58, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 55.65], ["whack, thwack", 16.42], ["zipper (clothing)", 6.8]], [["music", 18.13], ["speech", 13.71], ["animal", 5.67]], [["music", 27.31], ["speech", 14.49], ["cello", 5.12]], [["speech", 53.22], ["music", 20.35], ["hum", 4.9]], null, [["music", 62.85], ["speech", 17.32], ["boing", 6.02]], null, [["speech", 29.35], ["music", 19.59], ["mosquito", 11.89]], [["speech", 38.39], ["music", 23.2], ["beatboxing", 6.54]], null, null, null, null, [["speech", 41.23], ["music", 25.67], ["whack, thwack", 4.42]], null, [["music", 31.51], ["speech", 19.36], ["didgeridoo", 14.79]], null, null, [["music", 50.2], ["speech", 34.06], ["synthesizer", 2.14]], null, null, null, null, null, null, null, null], "duration": [0.18, 0.41, 0.28, 2.21, -0.47, 4.71, 4.66, 2.3, 4.21, 1.55, 8.44, 0.45, 2.95, 5.73, 1.34, 0.59, 1.5, 1.21, 5.39, -0.27, 7.31, 0.46, 0.57, 4.57, 1.91, 7.73, 1.44, 0.67, 1.52, 1.27, 0.6, 1.75]} \ No newline at end of file diff --git a/annotations_1/IiQlYWhL_UI_filtered.json b/annotations_1/IiQlYWhL_UI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85ce54a22e7d42999363844436e0d14ec89ccc1e --- /dev/null +++ b/annotations_1/IiQlYWhL_UI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.06], [12.0, 12.87], [13.0, 16.19], [17.0, 26.03], [28.0, 28.46], [30.0, 32.66], [34.0, 40.66], [41.0, 42.43], [60.0, 60.93], [70.0, 71.61], [82.0, 85.04], [86.0, 86.39], [95.0, 96.35], [103.0, 104.73], [110.0, 121.98], [129.0, 132.49], [135.0, 135.92], [137.0, 136.81], [138.0, 138.5], [149.0, 150.45], [151.0, 152.19], [153.0, 153.82], [156.0, 157.33]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.08, 29.74, 0.0, 45.3, 31.38, 0.0, 0.0, 0.0, 30.44, 0.0, 0.0, 0.0, 33.77, 30.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 61.2], ["electronic music", 10.43], ["speech", 4.97]], [["music", 45.34], ["sidetone", 17.51], ["speech", 11.91]], null, [["music", 30.7], ["hum", 16.6], ["mains hum", 9.9]], [["mains hum", 34.64], ["hum", 27.0], ["throbbing", 19.84]], null, null, null, [["speech", 45.27], ["music", 20.72], ["didgeridoo", 7.4]], null, null, null, [["speech", 37.85], ["sine wave", 7.7], ["ding", 7.69]], [["speech", 27.63], ["cattle, bovinae", 14.95], ["music", 14.94]], null, null, null, null, null, null, null], "duration": [1.06, 0.87, 3.19, 9.03, 0.46, 2.66, 6.66, 1.43, 0.93, 1.61, 3.04, 0.39, 1.35, 1.73, 11.98, 3.49, 0.92, -0.19, 0.5, 1.45, 1.19, 0.82, 1.33]} \ No newline at end of file diff --git a/annotations_1/Iii55E60gfg_filtered.json b/annotations_1/Iii55E60gfg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59797d43dd1f8ceeef38ab9b217dee1c4a503535 --- /dev/null +++ b/annotations_1/Iii55E60gfg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.53], [7.0, 7.37], [8.0, 8.85], [12.0, 13.68], [21.0, 21.61], [23.0, 23.35], [33.0, 32.88], [40.0, 40.68], [43.0, 43.6], [44.0, 47.24], [48.0, 49.03], [50.0, 52.51], [60.0, 61.15], [67.0, 67.74], [74.0, 73.95], [76.0, 77.45], [80.0, 82.63], [86.0, 86.0], [86.0, 86.04], [102.0, 105.26], [107.0, 107.52], [116.0, 117.19], [119.0, 119.96], [120.0, 121.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.79, 0.0, 38.54, 0.0, 0.0, 0.0, 0.0, 37.99, 0.0, 0.0, 35.06, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["whistling", 54.75], ["music", 18.7], ["whistle", 3.93]], null, [["music", 55.86], ["synthesizer", 5.86], ["musical instrument", 3.57]], null, null, null, null, [["speech", 38.22], ["music", 30.75], ["boing", 3.93]], null, null, [["speech", 59.65], ["frog", 7.54], ["croak", 3.39]], null, null, null, null], "duration": [0.53, 0.37, 0.85, 1.68, 0.61, 0.35, -0.12, 0.68, 0.6, 3.24, 1.03, 2.51, 1.15, 0.74, -0.05, 1.45, 2.63, 0.0, 0.04, 3.26, 0.52, 1.19, 0.96, 1.98]} \ No newline at end of file diff --git a/annotations_1/IjGKv209gAE_filtered.json b/annotations_1/IjGKv209gAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3491e5e479fba2ce45441f00d226584dd40cb9d --- /dev/null +++ b/annotations_1/IjGKv209gAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 41.1], [42.0, 44.09], [47.0, 110.3], [113.0, 116.45], [119.0, 126.15], [129.0, 129.59], [131.0, 131.67], [134.0, 135.21], [135.0, 135.87], [137.0, 137.49], [139.0, 139.6], [141.0, 145.5]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.52, 37.16, 0.0, 54.04, 66.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76], "audiomae_on_audioset": [[["music", 82.95], ["electronic music", 1.77], ["musical instrument", 1.45]], [["music", 47.76], ["speech", 3.87], ["throbbing", 2.75]], null, null, null, null, null, null, null, null, null, null], "duration": [5.1, 2.09, 63.3, 3.45, 7.15, 0.59, 0.67, 1.21, 0.87, 0.49, 0.6, 4.5]} \ No newline at end of file diff --git a/annotations_1/IkVavN1lo9E_filtered.json b/annotations_1/IkVavN1lo9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6ff0f78182c54d0dfd3ac0b0204c12a67b2eaaf --- /dev/null +++ b/annotations_1/IkVavN1lo9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 24.0], [24.0, 29.66], [30.0, 31.38], [32.0, 50.48], [52.0, 54.13], [57.0, 72.08], [73.0, 74.38], [78.0, 79.74], [82.0, 83.0], [86.0, 88.47], [95.0, 95.88], [100.0, 101.07], [102.0, 104.55], [105.0, 105.92], [106.0, 107.35], [108.0, 109.22], [122.0, 123.15]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [86.45, 59.51, 0.0, 33.04, 64.07, 35.3, 0.0, 0.0, 0.0, 35.74, 0.0, 0.0, 51.07, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 35.16], ["insect", 34.54], ["cattle, bovinae", 7.35]], null, [["theremin", 37.72], ["music", 18.8], ["whale vocalization", 8.08]], null, null, null, [["fly, housefly", 41.6], ["mosquito", 14.08], ["insect", 12.84]], null, null, null, null, null, null, null], "duration": [6.0, 5.66, 1.38, 18.48, 2.13, 15.08, 1.38, 1.74, 1.0, 2.47, 0.88, 1.07, 2.55, 0.92, 1.35, 1.22, 1.15]} \ No newline at end of file diff --git a/annotations_1/IlH-egwG2pQ_filtered.json b/annotations_1/IlH-egwG2pQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..034998c3105437906131ca4841b24a478d143370 --- /dev/null +++ b/annotations_1/IlH-egwG2pQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.09], [1.0, 3.54], [6.0, 41.84], [42.0, 50.84], [52.0, 56.81], [59.0, 94.02], [99.0, 105.06], [107.0, 113.44], [117.0, 123.6], [126.0, 157.44], [159.0, 170.4]], "keep_status": [false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 66.63, 0.0, 30.89, 30.96, 0.0, 32.65, 29.81, 30.54, 0.0, 30.52], "audiomae_on_audioset": [null, null, null, [["music", 45.38], ["theremin", 5.09], ["thump, thud", 3.51]], [["speech", 47.69], ["music", 19.65], ["hum", 4.69]], null, [["music", 62.89], ["hum", 5.64], ["ambient music", 4.08]], [["music", 17.05], ["whack, thwack", 10.97], ["electric shaver, electric razor", 5.77]], [["music", 45.82], ["hum", 9.49], ["didgeridoo", 8.96]], null, [["music", 63.63], ["throbbing", 10.76], ["hum", 6.48]]], "duration": [0.09, 2.54, 35.84, 8.84, 4.81, 35.02, 6.06, 6.44, 6.6, 31.44, 11.4]} \ No newline at end of file diff --git a/annotations_1/Im39PGAb82I_filtered.json b/annotations_1/Im39PGAb82I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fc9e14c3d9b3b3fd3170c5e5bb66674a2258e7d --- /dev/null +++ b/annotations_1/Im39PGAb82I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.57], [8.0, 14.61], [16.0, 24.48], [25.0, 28.44], [29.0, 29.52], [30.0, 42.69], [53.0, 67.95], [69.0, 72.74], [73.0, 73.95], [77.0, 77.13], [78.0, 79.1], [83.0, 90.24], [93.0, 94.74]], "keep_status": [false, true, false, true, false, true, true, false, false, false, false, true, false], "silence_prob": [0.0, 28.98, 28.72, 28.82, 0.0, 29.27, 28.84, 28.56, 0.0, 0.0, 0.0, 29.25, 0.0], "audiomae_on_audioset": [null, [["music", 25.61], ["effects unit", 22.87], ["distortion", 13.61]], [["speech", 75.74], ["music", 6.62], ["effects unit", 4.09]], [["music", 40.48], ["musical instrument", 11.8], ["effects unit", 10.97]], null, [["synthesizer", 17.89], ["cacophony", 9.09], ["buzz", 7.92]], [["noise", 38.26], ["cacophony", 9.62], ["effects unit", 7.3]], [["noise", 54.77], ["whale vocalization", 15.79], ["echo", 2.43]], null, null, null, [["music", 35.91], ["effects unit", 14.04], ["noise", 11.89]], null], "duration": [0.57, 6.61, 8.48, 3.44, 0.52, 12.69, 14.95, 3.74, 0.95, 0.13, 1.1, 7.24, 1.74]} \ No newline at end of file diff --git a/annotations_1/ImO-q-hTdAc_filtered.json b/annotations_1/ImO-q-hTdAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a35c69259bc49d74b4104fb99ac0416db0586e12 --- /dev/null +++ b/annotations_1/ImO-q-hTdAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.78], [8.0, 9.19], [10.0, 11.64], [13.0, 14.01], [18.0, 18.74], [19.0, 22.72], [28.0, 32.19], [35.0, 35.82], [38.0, 38.48], [41.0, 42.18], [49.0, 49.3], [50.0, 54.85], [57.0, 57.4], [59.0, 60.1], [66.0, 67.86], [71.0, 71.39], [74.0, 74.75], [78.0, 80.23], [83.0, 82.88], [84.0, 92.53], [96.0, 97.51], [99.0, 99.98], [102.0, 102.83], [106.0, 108.85], [110.0, 111.1], [113.0, 114.93], [120.0, 121.71], [123.0, 124.51], [126.0, 126.44], [129.0, 129.0], [132.0, 133.66], [134.0, 134.52], [145.0, 145.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.61, 0.0, 0.0, 0.0, 0.0, 80.82, 39.55, 0.0, 0.0, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 55.96, 0.0, 0.0, 0.0, 68.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 79.48], ["scary music", 3.32], ["soundtrack music", 2.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.78, 1.19, 1.64, 1.01, 0.74, 3.72, 4.19, 0.82, 0.48, 1.18, 0.3, 4.85, 0.4, 1.1, 1.86, 0.39, 0.75, 2.23, -0.12, 8.53, 1.51, 0.98, 0.83, 2.85, 1.1, 1.93, 1.71, 1.51, 0.44, 0.0, 1.66, 0.52, 0.35]} \ No newline at end of file diff --git a/annotations_1/InkyowbQcIs_filtered.json b/annotations_1/InkyowbQcIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/InkyowbQcIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/IoQ4G5p-Z-g_filtered.json b/annotations_1/IoQ4G5p-Z-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c8ac8e42ca40818a4a7c6b406d7d9da4a4e185d --- /dev/null +++ b/annotations_1/IoQ4G5p-Z-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.54], [6.0, 7.05], [10.0, 10.74], [11.0, 15.26], [19.0, 18.76], [19.0, 19.74], [20.0, 36.36], [37.0, 38.15], [40.0, 40.34], [43.0, 48.34], [50.0, 51.07], [51.0, 52.44], [53.0, 57.59], [58.0, 60.32], [61.0, 69.53], [79.0, 79.59], [80.0, 80.54], [81.0, 84.42], [86.0, 86.22], [92.0, 92.69], [95.0, 95.17], [101.0, 102.1], [104.0, 104.31], [108.0, 109.39], [112.0, 112.46], [119.0, 119.43], [121.0, 121.41], [122.0, 126.32], [128.0, 128.11], [132.0, 132.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.49, 0.0, 0.0, 36.27, 0.0, 0.0, 29.28, 0.0, 0.0, 29.56, 30.97, 31.37, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.07, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 61.0], ["music", 16.9], ["synthesizer", 3.21]], null, null, [["speech", 50.32], ["music", 27.95], ["synthesizer", 5.54]], null, null, [["speech", 50.89], ["whack, thwack", 13.52], ["music", 8.35]], null, null, [["music", 63.25], ["speech", 12.31], ["animal", 6.92]], [["cattle, bovinae", 47.61], ["livestock, farm animals, working animals", 27.83], ["moo", 21.9]], [["music", 35.08], ["whack, thwack", 11.06], ["speech", 7.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.46, 1.05, 0.74, 4.26, -0.24, 0.74, 16.36, 1.15, 0.34, 5.34, 1.07, 1.44, 4.59, 2.32, 8.53, 0.59, 0.54, 3.42, 0.22, 0.69, 0.17, 1.1, 0.31, 1.39, 0.46, 0.43, 0.41, 4.32, 0.11, 0.26]} \ No newline at end of file diff --git a/annotations_1/IpoReT0HjsQ_filtered.json b/annotations_1/IpoReT0HjsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2df4f53c6808ab3445b5a0763cf5199cdb802548 --- /dev/null +++ b/annotations_1/IpoReT0HjsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.88], [9.0, 10.05], [15.0, 16.61], [18.0, 19.9], [22.0, 23.04], [25.0, 27.67], [28.0, 32.21], [34.0, 35.55], [38.0, 46.04], [48.0, 52.91], [57.0, 58.38], [60.0, 61.75], [63.0, 64.91], [66.0, 66.61], [68.0, 72.2], [73.0, 74.39], [75.0, 76.94], [78.0, 79.37], [80.0, 81.21], [85.0, 85.35], [86.0, 88.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.99, 0.0, 93.91, 86.82, 0.0, 0.0, 0.0, 0.0, 42.81, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.39], ["thunk", 6.81], ["wood", 4.69]], null, null, null, null, null, null], "duration": [1.88, 1.05, 1.61, 1.9, 1.04, 2.67, 4.21, 1.55, 8.04, 4.91, 1.38, 1.75, 1.91, 0.61, 4.2, 1.39, 1.94, 1.37, 1.21, 0.35, 2.15]} \ No newline at end of file diff --git a/annotations_1/IqJWWBRnrH4_filtered.json b/annotations_1/IqJWWBRnrH4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8eb09622afa45ba7b4f5cba8324e28e5d44f0585 --- /dev/null +++ b/annotations_1/IqJWWBRnrH4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.4], [9.0, 11.26], [21.0, 26.77], [28.0, 29.25], [31.0, 33.61], [35.0, 36.51], [39.0, 38.92], [44.0, 45.1], [49.0, 52.12], [54.0, 54.67], [55.0, 63.27], [67.0, 70.07], [72.0, 73.65], [91.0, 92.3], [99.0, 101.01]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [0.0, 34.49, 34.8, 0.0, 56.93, 0.0, 0.0, 0.0, 32.56, 0.0, 38.95, 31.18, 0.0, 0.0, 30.83], "audiomae_on_audioset": [null, [["music", 53.69], ["speech", 21.0], ["electronic music", 3.81]], [["speech", 74.53], ["horse", 4.2], ["applause", 4.01]], null, null, null, null, null, [["speech", 32.81], ["crowd", 11.92], ["applause", 11.77]], null, [["speech", 58.88], ["animal", 7.98], ["horse", 5.3]], [["speech", 16.03], ["crowd", 11.24], ["fart", 6.83]], null, null, [["speech", 52.12], ["fart", 3.8], ["boing", 2.94]]], "duration": [0.4, 2.26, 5.77, 1.25, 2.61, 1.51, -0.08, 1.1, 3.12, 0.67, 8.27, 3.07, 1.65, 1.3, 2.01]} \ No newline at end of file diff --git a/annotations_1/Iqiyy26sW-Q_filtered.json b/annotations_1/Iqiyy26sW-Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fdc6b9e2d3ce2ff9d7985e1244ba309d9cfb3d6 --- /dev/null +++ b/annotations_1/Iqiyy26sW-Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 64.52], [69.0, 78.24], [80.0, 80.32], [87.0, 89.99], [91.0, 91.64], [92.0, 97.93], [99.0, 99.82], [101.0, 101.04], [102.0, 102.39], [103.0, 103.47], [106.0, 107.03], [110.0, 110.19], [115.0, 114.94]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [36.35, 34.01, 0.0, 99.96, 0.0, 32.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 40.08], ["mains hum", 30.5], ["music", 9.84]], [["music", 37.63], ["synthesizer", 10.5], ["musical instrument", 3.96]], null, null, null, [["machine gun", 29.7], ["music", 14.9], ["gunshot, gunfire", 9.56]], null, null, null, null, null, null, null], "duration": [17.52, 9.24, 0.32, 2.99, 0.64, 5.93, 0.82, 0.04, 0.39, 0.47, 1.03, 0.19, -0.06]} \ No newline at end of file diff --git a/annotations_1/IqsvjhHv5wo_filtered.json b/annotations_1/IqsvjhHv5wo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/IqsvjhHv5wo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/IrTJjUQ_xGQ_filtered.json b/annotations_1/IrTJjUQ_xGQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df39dd1ee9e611eb558d65d3e711bcc7206ff922 --- /dev/null +++ b/annotations_1/IrTJjUQ_xGQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.68], [5.0, 5.32], [7.0, 7.33], [8.0, 11.23], [13.0, 17.32], [19.0, 27.53], [35.0, 40.58], [41.0, 47.82], [48.0, 48.66], [49.0, 50.67], [51.0, 52.81], [54.0, 55.04], [61.0, 61.25], [65.0, 66.51], [72.0, 73.53], [75.0, 75.52], [83.0, 87.35], [90.0, 90.69], [94.0, 95.23], [98.0, 98.39], [99.0, 100.4], [110.0, 113.19], [115.0, 115.5], [126.0, 126.35], [127.0, 126.93]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 64.63, 30.37, 32.05, 32.39, 35.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.35, 0.0, 0.0, 0.0, 0.0, 49.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["animal", 26.39], ["livestock, farm animals, working animals", 15.84], ["speech", 7.11]], [["fart", 42.41], ["speech", 29.61], ["whack, thwack", 7.28]], [["speech", 22.98], ["whack, thwack", 18.96], ["echo", 10.95]], [["speech", 78.44], ["fart", 9.25], ["radio", 1.43]], null, null, null, null, null, null, null, null, [["music", 8.29], ["radio", 8.22], ["theremin", 7.43]], null, null, null, null, [["speech", 60.46], ["radio", 19.45], ["sidetone", 4.34]], null, null, null], "duration": [0.68, 0.32, 0.33, 3.23, 4.32, 8.53, 5.58, 6.82, 0.66, 1.67, 1.81, 1.04, 0.25, 1.51, 1.53, 0.52, 4.35, 0.69, 1.23, 0.39, 1.4, 3.19, 0.5, 0.35, -0.07]} \ No newline at end of file diff --git a/annotations_1/Irf50_-vVtI_filtered.json b/annotations_1/Irf50_-vVtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8efcd94f8e0c7769320141142cca0265304a07a --- /dev/null +++ b/annotations_1/Irf50_-vVtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 50.68], [55.0, 56.3], [57.0, 58.14], [68.0, 124.12], [125.0, 135.48]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.69], "audiomae_on_audioset": [null, null, null, null, [["music", 63.63], ["speech", 25.79], ["explosion", 0.84]]], "duration": [1.68, 1.3, 1.14, 56.12, 10.48]} \ No newline at end of file diff --git a/annotations_1/Irq818Ek0Ro_filtered.json b/annotations_1/Irq818Ek0Ro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9775939e1bf622fe47aac9ced4f57ba88749169e --- /dev/null +++ b/annotations_1/Irq818Ek0Ro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 29.29], [30.0, 32.21], [33.0, 35.36], [37.0, 39.77], [44.0, 44.22], [45.0, 53.23], [55.0, 57.38], [58.0, 118.07]], "keep_status": [true, false, true, false, false, true, false, false], "silence_prob": [44.99, 50.86, 47.94, 54.04, 0.0, 49.36, 57.81, 0.0], "audiomae_on_audioset": [[["hum", 30.78], ["throbbing", 27.15], ["music", 11.75]], null, [["hum", 20.81], ["throbbing", 6.27], ["mains hum", 5.06]], null, null, [["fly, housefly", 18.62], ["bee, wasp, etc.", 12.04], ["music", 11.49]], null, null], "duration": [2.29, 2.21, 2.36, 2.77, 0.22, 8.23, 2.38, 60.07]} \ No newline at end of file diff --git a/annotations_1/IsG-jJcrlr0_filtered.json b/annotations_1/IsG-jJcrlr0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7cc61327ccb27a2fec7079c2ff5885dd6da55b80 --- /dev/null +++ b/annotations_1/IsG-jJcrlr0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.5], [10.0, 10.93], [32.0, 34.23], [39.0, 39.43], [52.0, 57.57], [63.0, 63.17], [83.0, 83.15], [92.0, 91.93], [96.0, 96.23], [98.0, 98.85], [105.0, 105.48], [126.0, 126.23], [129.0, 131.8], [137.0, 137.44], [138.0, 138.23], [148.0, 148.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.6, 0.0, 42.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 78.38], ["male speech, man speaking", 2.41], ["hum", 2.31]], null, [["speech", 55.78], ["growling", 23.73], ["whale vocalization", 8.84]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.93, 2.23, 0.43, 5.57, 0.17, 0.15, -0.07, 0.23, 0.85, 0.48, 0.23, 2.8, 0.44, 0.23, 0.68]} \ No newline at end of file diff --git a/annotations_1/IsZdfna1LKA_filtered.json b/annotations_1/IsZdfna1LKA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07b4bafb83df8c6f25768cd2306baa4446254354 --- /dev/null +++ b/annotations_1/IsZdfna1LKA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 22.23], [26.0, 32.29], [35.0, 36.54], [39.0, 40.66], [43.0, 44.91], [48.0, 54.14], [58.0, 59.8], [62.0, 62.77], [65.0, 67.85], [69.0, 71.71], [74.0, 74.01], [75.0, 81.24], [83.0, 85.6], [87.0, 92.96], [94.0, 95.2], [103.0, 103.0]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [35.22, 32.41, 0.0, 0.0, 0.0, 30.6, 0.0, 0.0, 30.57, 31.09, 0.0, 68.41, 84.98, 58.47, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.5], ["didgeridoo", 13.14], ["musical instrument", 11.7]], [["music", 79.81], ["synthesizer", 3.09], ["electronic music", 1.92]], null, null, null, [["music", 33.79], ["theremin", 8.53], ["foghorn", 6.71]], null, null, [["foghorn", 60.02], ["music", 25.17], ["brass instrument", 2.21]], [["music", 57.86], ["musical instrument", 5.13], ["foghorn", 5.07]], null, null, null, null, null, null], "duration": [2.23, 6.29, 1.54, 1.66, 1.91, 6.14, 1.8, 0.77, 2.85, 2.71, 0.01, 6.24, 2.6, 5.96, 1.2, 0.0]} \ No newline at end of file diff --git a/annotations_1/IspZWYlmYZY_filtered.json b/annotations_1/IspZWYlmYZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84f930d09039cb7c33bc6994f049855b2d04d284 --- /dev/null +++ b/annotations_1/IspZWYlmYZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.62], [33.0, 33.57], [36.0, 36.21], [48.0, 49.17], [56.0, 57.6], [71.0, 71.61], [83.0, 89.46], [90.0, 91.12], [95.0, 95.98], [97.0, 98.56], [110.0, 109.92], [110.0, 110.79], [120.0, 121.09], [125.0, 126.3], [127.0, 127.45], [129.0, 129.25], [140.0, 141.86], [142.0, 144.14], [155.0, 158.57], [160.0, 163.09], [164.0, 165.23], [171.0, 173.52], [174.0, 175.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.94, 95.09, 61.97, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.62, 0.57, 0.21, 1.17, 1.6, 0.61, 6.46, 1.12, 0.98, 1.56, -0.08, 0.79, 1.09, 1.3, 0.45, 0.25, 1.86, 2.14, 3.57, 3.09, 1.23, 2.52, 1.04]} \ No newline at end of file diff --git a/annotations_1/ItDFQOAqEuA_filtered.json b/annotations_1/ItDFQOAqEuA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1ac9fa46319445efc95791aa88223100ca56517 --- /dev/null +++ b/annotations_1/ItDFQOAqEuA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.44], [12.0, 12.09], [13.0, 15.45], [18.0, 18.17], [19.0, 19.26], [20.0, 22.22], [27.0, 27.31], [30.0, 30.67], [45.0, 121.81], [124.0, 124.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 84.62, 0.0, 0.0, 54.83, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.44, 0.09, 2.45, 0.17, 0.26, 2.22, 0.31, 0.67, 76.81, 0.77]} \ No newline at end of file diff --git a/annotations_1/ItHtrNSJwDo_filtered.json b/annotations_1/ItHtrNSJwDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1592a9eb26f4e0442abc03d08bf0d67b997d2ab --- /dev/null +++ b/annotations_1/ItHtrNSJwDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.14], [13.0, 24.53], [29.0, 29.07], [30.0, 30.67], [32.0, 32.83], [74.0, 74.65], [86.0, 86.41], [89.0, 89.41], [100.0, 101.06], [107.0, 107.35], [118.0, 117.88], [122.0, 126.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [61.47, 56.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.34], ["fart", 13.04], ["explosion", 10.38]]], "duration": [6.14, 11.53, 0.07, 0.67, 0.83, 0.65, 0.41, 0.41, 1.06, 0.35, -0.12, 4.47]} \ No newline at end of file diff --git a/annotations_1/ItMY_4RobkM_filtered.json b/annotations_1/ItMY_4RobkM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b7b476e372e37813d6b178a37f149280c4a9604 --- /dev/null +++ b/annotations_1/ItMY_4RobkM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.19], [25.0, 25.44], [39.0, 39.6], [50.0, 55.32], [65.0, 65.21], [69.0, 71.0], [73.0, 74.36], [76.0, 77.79], [88.0, 88.48], [90.0, 91.94], [93.0, 95.76], [104.0, 105.63], [107.0, 108.31], [110.0, 110.66], [112.0, 115.84], [122.0, 123.2], [126.0, 126.6]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.08, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 64.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["boing", 20.39], ["speech", 19.6], ["music", 13.62]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 0.44, 0.6, 5.32, 0.21, 2.0, 1.36, 1.79, 0.48, 1.94, 2.76, 1.63, 1.31, 0.66, 3.84, 1.2, 0.6]} \ No newline at end of file diff --git a/annotations_1/IuiKCwrTYO0_filtered.json b/annotations_1/IuiKCwrTYO0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3600352f729f3c226aeaab13885cc9ecf55fc26c --- /dev/null +++ b/annotations_1/IuiKCwrTYO0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.75], [14.0, 18.03], [20.0, 33.88], [35.0, 42.3], [44.0, 52.91], [54.0, 56.07], [57.0, 60.15], [62.0, 65.08]], "keep_status": [false, false, true, false, false, false, true, true], "silence_prob": [0.0, 32.95, 33.87, 34.88, 40.19, 41.56, 47.98, 40.04], "audiomae_on_audioset": [null, [["music", 28.52], ["mains hum", 24.26], ["hum", 22.43]], [["music", 42.18], ["whale vocalization", 13.53], ["hum", 8.72]], [["mains hum", 53.19], ["hum", 44.56], ["throbbing", 0.67]], [["hum", 37.67], ["mains hum", 21.1], ["speech", 12.15]], [["hum", 48.83], ["music", 16.25], ["throbbing", 13.87]], [["hum", 33.46], ["rumble", 13.28], ["mains hum", 12.26]], [["hum", 28.29], ["music", 22.08], ["whale vocalization", 16.55]]], "duration": [0.75, 4.03, 13.88, 7.3, 8.91, 2.07, 3.15, 3.08]} \ No newline at end of file diff --git a/annotations_1/IurXrQqZufM_filtered.json b/annotations_1/IurXrQqZufM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9c01b9fea4610170a79e50e76155cc5a76eab7b --- /dev/null +++ b/annotations_1/IurXrQqZufM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 24.06], [30.0, 35.28], [37.0, 49.4], [51.0, 78.73], [80.0, 84.21], [87.0, 89.56], [92.0, 119.74], [122.0, 149.37], [155.0, 158.99], [161.0, 216.95]], "keep_status": [true, true, false, false, true, false, false, false, false, false], "silence_prob": [29.51, 35.22, 41.68, 35.77, 38.28, 55.53, 32.25, 30.85, 33.7, 0.0], "audiomae_on_audioset": [[["music", 22.47], ["mains hum", 20.08], ["speech", 16.37]], [["music", 30.23], ["tabla", 10.1], ["explosion", 5.84]], [["music", 69.77], ["synthesizer", 5.6], ["musical instrument", 2.77]], [["music", 64.52], ["musical instrument", 4.13], ["synthesizer", 3.34]], [["hum", 18.99], ["vehicle", 12.99], ["mains hum", 8.39]], null, [["creak", 49.96], ["coin (dropping)", 12.03], ["microwave oven", 8.77]], [["music", 59.72], ["didgeridoo", 9.72], ["hum", 4.45]], [["livestock, farm animals, working animals", 37.44], ["moo", 20.12], ["cattle, bovinae", 16.21]], null], "duration": [6.06, 5.28, 12.4, 27.73, 4.21, 2.56, 27.74, 27.37, 3.99, 55.95]} \ No newline at end of file diff --git a/annotations_1/IvAjNuhubIM_filtered.json b/annotations_1/IvAjNuhubIM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56dad27e5d614e8c85fc45c705922abb3ae07891 --- /dev/null +++ b/annotations_1/IvAjNuhubIM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 59.97], [62.0, 81.21], [83.0, 117.59], [118.0, 118.86]], "keep_status": [true, true, false, false], "silence_prob": [37.84, 34.92, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 47.31], ["music", 7.7], ["buzz", 1.98]], [["speech", 34.57], ["hum", 10.27], ["buzz", 5.9]], null, null], "duration": [5.97, 19.21, 34.59, 0.86]} \ No newline at end of file diff --git a/annotations_1/IvFBobchMoc_filtered.json b/annotations_1/IvFBobchMoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f80eb8a2725a54e32cab7ac4bfc4cde0ea2fac5 --- /dev/null +++ b/annotations_1/IvFBobchMoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 24.68], [26.0, 27.85], [28.0, 27.89], [29.0, 43.92], [44.0, 44.63], [46.0, 56.44], [60.0, 73.33], [75.0, 85.9], [92.0, 94.78], [96.0, 107.11], [111.0, 113.97], [116.0, 116.19], [117.0, 173.38]], "keep_status": [false, false, false, true, false, true, false, false, true, false, false, false, false], "silence_prob": [46.64, 0.0, 0.0, 29.03, 0.0, 29.24, 29.27, 29.32, 30.53, 31.58, 34.83, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 50.92], ["groan", 16.0], ["music", 11.16]], null, null, [["music", 19.31], ["speech", 14.99], ["explosion", 10.68]], null, [["music", 40.24], ["animal", 11.73], ["wild animals", 6.37]], [["music", 70.54], ["cacophony", 3.65], ["electronic music", 2.63]], [["music", 59.29], ["throbbing", 14.43], ["hum", 8.99]], [["music", 52.43], ["hum", 5.23], ["musical instrument", 4.43]], [["foghorn", 45.22], ["music", 28.23], ["speech", 8.49]], [["cattle, bovinae", 48.77], ["moo", 26.82], ["livestock, farm animals, working animals", 21.48]], null, null], "duration": [13.68, 1.85, -0.11, 14.92, 0.63, 10.44, 13.33, 10.9, 2.78, 11.11, 2.97, 0.19, 56.38]} \ No newline at end of file diff --git a/annotations_1/IvGwIRIYlBo_filtered.json b/annotations_1/IvGwIRIYlBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88823b4d808d9f8846baec121a611149e51cf180 --- /dev/null +++ b/annotations_1/IvGwIRIYlBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.95], [10.0, 23.85], [39.0, 42.55], [49.0, 51.81], [54.0, 56.66], [61.0, 63.12], [68.0, 93.26], [96.0, 98.15], [99.0, 99.28], [101.0, 118.52], [122.0, 123.16], [130.0, 131.01], [134.0, 134.01], [139.0, 150.67], [152.0, 153.49], [157.0, 160.49], [167.0, 166.8]], "keep_status": [true, false, true, true, true, false, false, true, false, true, false, false, false, true, false, false, false], "silence_prob": [46.57, 36.33, 28.91, 34.5, 36.23, 36.61, 33.28, 32.86, 0.0, 33.38, 0.0, 0.0, 0.0, 30.69, 0.0, 46.09, 0.0], "audiomae_on_audioset": [[["music", 44.56], ["synthesizer", 8.32], ["electronic music", 3.62]], [["music", 38.92], ["speech", 24.07], ["electric shaver, electric razor", 11.37]], [["music", 48.41], ["whack, thwack", 6.23], ["boing", 6.09]], [["music", 38.57], ["hum", 10.74], ["speech", 6.79]], [["speech", 53.31], ["vehicle", 4.35], ["music", 3.46]], [["burping, eructation", 74.23], ["grunt", 11.75], ["speech", 4.83]], [["music", 77.24], ["guitar", 6.77], ["musical instrument", 5.18]], [["music", 19.11], ["speech", 18.09], ["vehicle", 8.79]], null, [["music", 42.04], ["speech", 21.99], ["musical instrument", 4.19]], null, null, null, [["music", 29.54], ["mains hum", 21.53], ["electric shaver, electric razor", 13.67]], null, [["music", 38.52], ["didgeridoo", 27.23], ["mains hum", 6.99]], null], "duration": [2.95, 13.85, 3.55, 2.81, 2.66, 2.12, 25.26, 2.15, 0.28, 17.52, 1.16, 1.01, 0.01, 11.67, 1.49, 3.49, -0.2]} \ No newline at end of file diff --git a/annotations_1/IvgFrEk1JqA_filtered.json b/annotations_1/IvgFrEk1JqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b33defe28dafb0987f254892ef0e91120e83783d --- /dev/null +++ b/annotations_1/IvgFrEk1JqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.37], [4.0, 4.56], [10.0, 10.86], [12.0, 15.08], [15.0, 17.07], [18.0, 36.83], [45.0, 44.68], [48.0, 48.96], [53.0, 53.25], [57.0, 65.16], [69.0, 83.03], [84.0, 101.93], [109.0, 109.92], [111.0, 111.21], [112.0, 113.22], [114.0, 114.54], [115.0, 116.6], [118.0, 119.21], [120.0, 120.56], [124.0, 125.51], [130.0, 131.13], [135.0, 135.77], [149.0, 149.72], [151.0, 151.14], [153.0, 153.72], [156.0, 158.08], [158.0, 159.17], [159.0, 160.24], [161.0, 163.36], [166.0, 167.75], [169.0, 169.25]], "keep_status": [false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.05, 39.04, 30.08, 0.0, 0.0, 0.0, 29.81, 34.74, 33.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.33, 0.0, 0.0, 79.07, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 37.15], ["music", 25.49], ["didgeridoo", 8.58]], [["music", 38.52], ["speech", 21.24], ["boing", 5.21]], [["music", 60.93], ["throbbing", 4.54], ["animal", 4.36]], null, null, null, [["speech", 43.93], ["music", 42.33], ["electronic music", 2.39]], [["music", 35.53], ["hum", 5.48], ["thunk", 5.4]], [["music", 34.83], ["speech", 30.01], ["hum", 9.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.37, 0.56, 0.86, 3.08, 2.07, 18.83, -0.32, 0.96, 0.25, 8.16, 14.03, 17.93, 0.92, 0.21, 1.22, 0.54, 1.6, 1.21, 0.56, 1.51, 1.13, 0.77, 0.72, 0.14, 0.72, 2.08, 1.17, 1.24, 2.36, 1.75, 0.25]} \ No newline at end of file diff --git a/annotations_1/IxRCDx-YV4I_filtered.json b/annotations_1/IxRCDx-YV4I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed9a8f39e86af08404fe67485bf92cc141947b17 --- /dev/null +++ b/annotations_1/IxRCDx-YV4I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 35.87], [42.0, 45.35], [48.0, 48.44], [51.0, 54.99], [58.0, 58.09], [58.0, 62.14], [64.0, 73.52], [78.0, 96.47], [108.0, 110.12], [113.0, 113.02], [117.0, 147.78], [151.0, 155.28]], "keep_status": [false, false, false, true, false, false, true, true, true, false, false, false], "silence_prob": [0.0, 33.75, 0.0, 35.67, 0.0, 28.6, 28.82, 30.02, 29.26, 0.0, 0.0, 37.77], "audiomae_on_audioset": [null, [["music", 33.96], ["synthesizer", 25.1], ["musical instrument", 11.46]], null, [["music", 60.15], ["synthesizer", 4.45], ["effects unit", 3.29]], null, [["speech", 66.29], ["music", 22.82], ["explosion", 1.76]], [["music", 42.85], ["whale vocalization", 10.38], ["hum", 7.73]], [["music", 49.33], ["hum", 8.68], ["electronic music", 6.41]], [["music", 34.2], ["hum", 14.69], ["throbbing", 9.3]], null, null, [["music", 56.18], ["speech", 17.6], ["hum", 4.75]]], "duration": [0.87, 3.35, 0.44, 3.99, 0.09, 4.14, 9.52, 18.47, 2.12, 0.02, 30.78, 4.28]} \ No newline at end of file diff --git a/annotations_1/IxoCv_JpQVs_filtered.json b/annotations_1/IxoCv_JpQVs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42a2ad73833dbc30bde8c962500eadf936a79c8b --- /dev/null +++ b/annotations_1/IxoCv_JpQVs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.5], [13.0, 13.36], [14.0, 17.1], [18.0, 20.9], [22.0, 22.15], [26.0, 26.03], [28.0, 28.44], [31.0, 31.83], [36.0, 43.23], [45.0, 46.14], [49.0, 49.49], [50.0, 50.68], [52.0, 52.08], [53.0, 52.93], [53.0, 53.59], [57.0, 59.51], [67.0, 67.58], [70.0, 71.91], [75.0, 78.48], [82.0, 82.44], [83.0, 82.95], [83.0, 85.6], [90.0, 95.71], [98.0, 98.19], [99.0, 99.86], [100.0, 101.26], [104.0, 105.17], [109.0, 113.36], [115.0, 116.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.16, 97.73, 0.0, 0.0, 0.0, 0.0, 58.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 39.63, 0.0, 0.0, 61.57, 64.52, 0.0, 0.0, 0.0, 0.0, 72.31, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.84], ["fireworks", 3.66], ["outside, rural or natural", 2.08]], null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.36, 3.1, 2.9, 0.15, 0.03, 0.44, 0.83, 7.23, 1.14, 0.49, 0.68, 0.08, -0.07, 0.59, 2.51, 0.58, 1.91, 3.48, 0.44, -0.05, 2.6, 5.71, 0.19, 0.86, 1.26, 1.17, 4.36, 1.16]} \ No newline at end of file diff --git a/annotations_1/Iy2kMtJa2q8_filtered.json b/annotations_1/Iy2kMtJa2q8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbc07f2bf908bdf2a24fc0f625c3ee1c3030863e --- /dev/null +++ b/annotations_1/Iy2kMtJa2q8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.34], [16.0, 20.71], [23.0, 23.8], [26.0, 56.07], [57.0, 56.83], [62.0, 100.28], [105.0, 131.4], [135.0, 145.79], [150.0, 174.12], [176.0, 178.46], [179.0, 182.83], [184.0, 184.52], [185.0, 187.71], [190.0, 198.32]], "keep_status": [false, true, false, false, false, false, true, true, true, false, true, false, false, false], "silence_prob": [0.0, 37.43, 0.0, 0.0, 0.0, 0.0, 44.6, 43.05, 46.15, 59.33, 46.68, 0.0, 70.3, 71.0], "audiomae_on_audioset": [null, [["speech", 40.27], ["mosquito", 13.36], ["fly, housefly", 13.11]], null, null, null, null, [["music", 36.8], ["hum", 11.19], ["throbbing", 10.17]], [["music", 30.65], ["speech", 22.38], ["throbbing", 8.1]], [["hum", 29.24], ["throbbing", 19.11], ["music", 17.64]], null, [["hum", 29.24], ["music", 14.44], ["mains hum", 13.33]], null, null, null], "duration": [0.34, 4.71, 0.8, 30.07, -0.17, 38.28, 26.4, 10.79, 24.12, 2.46, 3.83, 0.52, 2.71, 8.32]} \ No newline at end of file diff --git a/annotations_1/IywRc7bHziQ_filtered.json b/annotations_1/IywRc7bHziQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de19098da0fabd893a979c7590a6328e851816df --- /dev/null +++ b/annotations_1/IywRc7bHziQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.03], [6.0, 6.44], [15.0, 26.13], [27.0, 35.29], [38.0, 39.99], [45.0, 47.48], [48.0, 48.19], [49.0, 56.0], [59.0, 59.59], [61.0, 73.95], [77.0, 80.74]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 62.78, 31.4, 0.0, 71.14, 0.0, 100.0, 0.0, 48.35, 57.32], "audiomae_on_audioset": [null, null, null, [["speech", 40.09], ["wail, moan", 6.64], ["livestock, farm animals, working animals", 6.12]], null, null, null, null, null, [["speech", 40.14], ["telephone", 12.91], ["dial tone", 7.69]], null], "duration": [1.03, 0.44, 11.13, 8.29, 1.99, 2.48, 0.19, 7.0, 0.59, 12.95, 3.74]} \ No newline at end of file diff --git a/annotations_1/Izp0m24gYRU_filtered.json b/annotations_1/Izp0m24gYRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc7d6ad0002d7eb88634b9125c652d3aeaaa2204 --- /dev/null +++ b/annotations_1/Izp0m24gYRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[64.0, 64.5], [65.0, 66.36], [68.0, 68.61], [69.0, 69.77], [72.0, 72.35], [74.0, 74.49], [75.0, 75.91], [79.0, 84.74], [86.0, 132.66], [134.0, 135.24], [137.0, 136.59], [138.0, 138.25], [141.0, 141.62], [145.0, 145.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.36, 0.61, 0.77, 0.35, 0.49, 0.91, 5.74, 46.66, 1.24, -0.41, 0.25, 0.62, 0.76]} \ No newline at end of file diff --git a/annotations_1/J-OLwCyAtBc_filtered.json b/annotations_1/J-OLwCyAtBc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a96dea399183f99686c6745fe6fc84572bdb047 --- /dev/null +++ b/annotations_1/J-OLwCyAtBc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.64], [9.0, 17.0], [19.0, 33.2], [34.0, 35.73], [40.0, 41.67], [44.0, 45.59], [46.0, 47.83], [48.0, 59.04], [60.0, 61.28], [62.0, 62.87], [64.0, 64.45], [66.0, 66.41], [68.0, 71.74], [75.0, 75.52], [91.0, 93.6], [95.0, 97.33], [101.0, 105.38], [106.0, 117.29], [118.0, 120.36], [122.0, 124.24], [126.0, 126.71], [129.0, 131.01], [131.0, 133.95], [135.0, 137.32], [138.0, 141.74], [145.0, 145.54], [147.0, 146.97], [147.0, 148.91], [150.0, 151.55], [152.0, 154.28], [156.0, 156.96], [160.0, 161.74], [167.0, 170.19]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 39.67, 34.43, 0.0, 0.0, 0.0, 0.0, 50.66, 0.0, 0.0, 0.0, 0.0, 38.93, 0.0, 52.16, 45.02, 40.95, 42.26, 48.19, 47.23, 0.0, 50.66, 40.57, 49.59, 40.22, 0.0, 0.0, 0.0, 0.0, 45.24, 0.0, 0.0, 42.69], "audiomae_on_audioset": [null, [["music", 50.56], ["carnatic music", 7.36], ["musical instrument", 5.06]], [["theremin", 69.37], ["music", 27.77], ["musical instrument", 0.46]], null, null, null, null, null, null, null, null, null, [["breaking", 57.83], ["whack, thwack", 19.34], ["smash, crash", 8.17]], null, null, [["music", 30.74], ["hum", 28.55], ["mains hum", 11.72]], [["hum", 39.36], ["mains hum", 39.34], ["music", 7.42]], [["music", 62.94], ["scary music", 8.56], ["wild animals", 4.71]], [["carnatic music", 34.65], ["music", 28.55], ["musical instrument", 10.15]], [["music", 27.6], ["hum", 25.71], ["mains hum", 18.4]], null, null, [["music", 58.49], ["didgeridoo", 13.11], ["theremin", 3.99]], [["music", 26.55], ["hum", 9.48], ["mains hum", 8.62]], [["music", 16.42], ["mains hum", 14.83], ["hum", 13.56]], null, null, null, null, [["pulse", 25.46], ["music", 24.29], ["hum", 10.08]], null, null, [["music", 28.11], ["livestock, farm animals, working animals", 12.44], ["moo", 8.73]]], "duration": [1.64, 8.0, 14.2, 1.73, 1.67, 1.59, 1.83, 11.04, 1.28, 0.87, 0.45, 0.41, 3.74, 0.52, 2.6, 2.33, 4.38, 11.29, 2.36, 2.24, 0.71, 2.01, 2.95, 2.32, 3.74, 0.54, -0.03, 1.91, 1.55, 2.28, 0.96, 1.74, 3.19]} \ No newline at end of file diff --git a/annotations_1/J-fa9awvFBY_filtered.json b/annotations_1/J-fa9awvFBY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5aa461e05ad5cbfff9033125438e43929470155 --- /dev/null +++ b/annotations_1/J-fa9awvFBY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.34], [9.0, 14.37], [16.0, 18.0], [21.0, 23.25], [24.0, 24.65], [31.0, 31.08], [32.0, 33.12], [37.0, 37.84], [39.0, 40.04], [42.0, 43.5], [45.0, 45.57], [46.0, 47.48], [51.0, 51.81], [54.0, 54.55], [59.0, 62.01], [64.0, 66.23], [67.0, 70.04], [72.0, 73.52], [74.0, 78.66], [80.0, 80.55], [81.0, 85.92], [87.0, 89.26], [92.0, 92.28], [93.0, 96.8], [98.0, 98.25], [99.0, 100.77], [102.0, 102.79], [106.0, 107.01], [109.0, 111.6], [114.0, 115.2], [115.0, 115.67], [120.0, 126.76], [128.0, 128.83], [130.0, 135.77], [139.0, 184.25], [186.0, 187.86], [188.0, 190.14], [195.0, 197.7], [200.0, 200.58], [203.0, 203.81], [205.0, 206.04], [208.0, 208.21], [209.0, 209.98], [212.0, 212.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.77, 92.97, 53.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.78, 99.99, 98.27, 0.0, 77.7, 0.0, 80.46, 99.99, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 47.2, 0.0, 0.0, 99.85, 0.0, 94.07, 0.0, 0.0, 40.64, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.4], ["tuning fork", 24.37], ["sine wave", 11.2]], null, null, null, null, null, null, null, [["fart", 29.87], ["fly, housefly", 18.93], ["speech", 9.94]], null, null, null, null, null, null, null], "duration": [1.34, 5.37, 2.0, 2.25, 0.65, 0.08, 1.12, 0.84, 1.04, 1.5, 0.57, 1.48, 0.81, 0.55, 3.01, 2.23, 3.04, 1.52, 4.66, 0.55, 4.92, 2.26, 0.28, 3.8, 0.25, 1.77, 0.79, 1.01, 2.6, 1.2, 0.67, 6.76, 0.83, 5.77, 45.25, 1.86, 2.14, 2.7, 0.58, 0.81, 1.04, 0.21, 0.98, 0.95]} \ No newline at end of file diff --git a/annotations_1/J03m0CzUvJU_filtered.json b/annotations_1/J03m0CzUvJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..799ae7f43c442f9c79cc2936a4ac0a9d05f068e5 --- /dev/null +++ b/annotations_1/J03m0CzUvJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 20.9], [34.0, 34.72], [47.0, 48.96], [52.0, 58.06], [61.0, 61.06], [63.0, 65.1], [69.0, 77.46], [82.0, 87.32], [91.0, 90.96], [104.0, 104.48], [106.0, 106.68], [111.0, 112.58], [131.0, 132.27], [140.0, 143.82], [165.0, 175.0]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.31, 0.0, 34.64, 37.67, 37.58, 0.0, 0.0, 0.0, 0.0, 0.0, 51.02, 29.27], "audiomae_on_audioset": [null, null, null, [["music", 34.53], ["hum", 16.36], ["synthesizer", 6.1]], null, [["sidetone", 29.62], ["speech", 25.5], ["music", 21.14]], [["music", 67.58], ["synthesizer", 8.59], ["throbbing", 3.75]], [["music", 42.36], ["synthesizer", 7.0], ["theremin", 6.97]], null, null, null, null, null, null, [["music", 62.71], ["electronic music", 11.14], ["trance music", 6.21]]], "duration": [-0.1, 0.72, 1.96, 6.06, 0.06, 2.1, 8.46, 5.32, -0.04, 0.48, 0.68, 1.58, 1.27, 3.82, 10.0]} \ No newline at end of file diff --git a/annotations_1/J329mOtIQ_Q_filtered.json b/annotations_1/J329mOtIQ_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77c36bc70da2cd3f3d21916a38cf6173a6982aae --- /dev/null +++ b/annotations_1/J329mOtIQ_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.41], [10.0, 11.4], [12.0, 20.02], [22.0, 23.43], [25.0, 25.91], [29.0, 45.01], [46.0, 50.5], [52.0, 52.86], [54.0, 63.69], [64.0, 68.59], [70.0, 71.93], [73.0, 76.18], [77.0, 88.82], [90.0, 90.54], [91.0, 91.59], [92.0, 93.38], [94.0, 95.99], [100.0, 101.93], [105.0, 106.12], [109.0, 113.98], [116.0, 118.08], [121.0, 121.74], [131.0, 131.18], [136.0, 137.79], [138.0, 138.84], [143.0, 144.14], [144.0, 146.96], [149.0, 150.06], [152.0, 153.66], [158.0, 159.04], [163.0, 163.76], [164.0, 165.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.8, 0.0, 0.0, 91.47, 91.13, 0.0, 90.6, 95.78, 0.0, 98.99, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.07, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.41, 1.4, 8.02, 1.43, 0.91, 16.01, 4.5, 0.86, 9.69, 4.59, 1.93, 3.18, 11.82, 0.54, 0.59, 1.38, 1.99, 1.93, 1.12, 4.98, 2.08, 0.74, 0.18, 1.79, 0.84, 1.14, 2.96, 1.06, 1.66, 1.04, 0.76, 1.92]} \ No newline at end of file diff --git a/annotations_1/J38c6k11K3U_filtered.json b/annotations_1/J38c6k11K3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2dc23aa41507df8906ce66d9a9dc0d5a63afe789 --- /dev/null +++ b/annotations_1/J38c6k11K3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[52.0, 91.44]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [39.44]} \ No newline at end of file diff --git a/annotations_1/J3Sl8B7RzUg_filtered.json b/annotations_1/J3Sl8B7RzUg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2676fc786a67c32cafd6ce9811ff1a78454d572 --- /dev/null +++ b/annotations_1/J3Sl8B7RzUg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [6.0, 49.44], [51.0, 73.68], [77.0, 76.89], [78.0, 83.79], [85.0, 87.51], [89.0, 89.48], [90.0, 96.2], [97.0, 119.82]], "keep_status": [false, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 30.13, 0.0, 30.46, 32.31, 0.0, 31.87, 30.71], "audiomae_on_audioset": [null, null, [["music", 47.45], ["speech", 8.08], ["livestock, farm animals, working animals", 5.69]], null, [["music", 55.89], ["speech", 6.77], ["sound effect", 3.68]], [["music", 64.61], ["musical instrument", 8.25], ["didgeridoo", 2.85]], null, [["music", 49.81], ["livestock, farm animals, working animals", 13.65], ["cattle, bovinae", 6.19]], [["music", 63.52], ["musical instrument", 4.56], ["synthesizer", 4.39]]], "duration": [0.6, 43.44, 22.68, -0.11, 5.79, 2.51, 0.48, 6.2, 22.82]} \ No newline at end of file diff --git a/annotations_1/J440ql0zXuE_filtered.json b/annotations_1/J440ql0zXuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e69c01510d552a766b0ea02c5c9485ce67662cd3 --- /dev/null +++ b/annotations_1/J440ql0zXuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.75], [3.0, 3.25], [4.0, 4.78], [8.0, 9.07], [14.0, 14.93], [18.0, 21.22], [23.0, 23.13], [24.0, 26.47], [28.0, 28.73], [31.0, 32.56], [34.0, 38.3], [39.0, 39.66], [41.0, 42.84], [44.0, 45.01], [45.0, 46.92], [48.0, 50.84], [52.0, 52.15], [52.0, 54.95], [56.0, 57.27], [62.0, 65.01], [68.0, 70.36], [74.0, 80.18], [81.0, 84.3], [88.0, 90.0], [91.0, 92.92], [95.0, 98.76], [101.0, 103.15], [104.0, 105.29], [106.0, 107.94], [108.0, 111.62], [112.0, 118.76], [120.0, 121.24], [124.0, 125.81], [131.0, 139.45], [142.0, 145.25], [148.0, 149.98], [150.0, 150.69], [151.0, 150.74], [151.0, 151.51], [152.0, 153.71], [156.0, 156.29], [163.0, 164.17], [165.0, 167.27], [169.0, 176.07], [177.0, 177.31], [185.0, 185.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.82, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 95.51, 0.0, 100.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 98.59, 99.96, 0.0, 0.0, 99.59, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 35.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 36.48], ["throbbing", 19.54], ["mains hum", 12.62]], null, null], "duration": [0.75, 0.25, 0.78, 1.07, 0.93, 3.22, 0.13, 2.47, 0.73, 1.56, 4.3, 0.66, 1.84, 1.01, 1.92, 2.84, 0.15, 2.95, 1.27, 3.01, 2.36, 6.18, 3.3, 2.0, 1.92, 3.76, 2.15, 1.29, 1.94, 3.62, 6.76, 1.24, 1.81, 8.45, 3.25, 1.98, 0.69, -0.26, 0.51, 1.71, 0.29, 1.17, 2.27, 7.07, 0.31, 0.11]} \ No newline at end of file diff --git a/annotations_1/J4ZnYc3tNyw_filtered.json b/annotations_1/J4ZnYc3tNyw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0c7ee297ace0be75451abafd5225d0cb4e0ffb0 --- /dev/null +++ b/annotations_1/J4ZnYc3tNyw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 16.6], [19.0, 32.09], [39.0, 40.86], [59.0, 69.04], [73.0, 74.26], [79.0, 108.75]], "keep_status": [true, true, false, true, false, true], "silence_prob": [32.23, 30.56, 0.0, 30.44, 0.0, 30.38], "audiomae_on_audioset": [[["cattle, bovinae", 29.58], ["music", 17.3], ["moo", 15.36]], [["music", 61.29], ["electronic music", 4.32], ["synthesizer", 4.18]], null, [["speech", 30.43], ["music", 21.12], ["buzz", 10.22]], null, [["speech", 35.0], ["music", 24.94], ["electronic music", 6.67]]], "duration": [6.6, 13.09, 1.86, 10.04, 1.26, 29.75]} \ No newline at end of file diff --git a/annotations_1/J5K0XKyL3i8_filtered.json b/annotations_1/J5K0XKyL3i8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63be4c6afc599429a68066b28b464b372b6426c6 --- /dev/null +++ b/annotations_1/J5K0XKyL3i8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.07], [16.0, 17.12], [18.0, 18.44], [20.0, 20.93], [24.0, 24.17], [27.0, 27.57], [28.0, 30.45], [32.0, 32.68], [36.0, 37.18], [38.0, 38.82], [39.0, 40.69], [43.0, 44.41], [45.0, 49.49], [52.0, 52.47], [54.0, 54.63], [57.0, 57.94], [58.0, 59.48], [61.0, 61.43], [61.0, 68.66], [69.0, 70.07], [72.0, 72.27], [75.0, 78.19], [79.0, 79.66], [82.0, 84.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.83, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 0.0, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 0.0, 85.54, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.07, 1.12, 0.44, 0.93, 0.17, 0.57, 2.45, 0.68, 1.18, 0.82, 1.69, 1.41, 4.49, 0.47, 0.63, 0.94, 1.48, 0.43, 7.66, 1.07, 0.27, 3.19, 0.66, 2.05]} \ No newline at end of file diff --git a/annotations_1/J5KvaQzBDoc_filtered.json b/annotations_1/J5KvaQzBDoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..856ad61756944ecd25210f7da55b3f1e3662f5ce --- /dev/null +++ b/annotations_1/J5KvaQzBDoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.25], [8.0, 8.68], [9.0, 11.04], [12.0, 15.96], [17.0, 24.6], [26.0, 27.85], [30.0, 30.84], [32.0, 31.92], [34.0, 35.07], [37.0, 37.18], [38.0, 39.18], [43.0, 43.75], [45.0, 46.23], [49.0, 52.39], [53.0, 54.18], [56.0, 57.15], [58.0, 58.87], [60.0, 60.03], [63.0, 64.59], [73.0, 73.55], [81.0, 82.56], [89.0, 89.68], [90.0, 94.07], [96.0, 97.53], [99.0, 99.03], [105.0, 105.98], [109.0, 111.18], [115.0, 119.01], [120.0, 121.37], [122.0, 122.64], [128.0, 129.34], [132.0, 133.56], [135.0, 135.48], [137.0, 137.69], [138.0, 139.83], [141.0, 142.72], [144.0, 145.5], [146.0, 146.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 100.0, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.25, 0.68, 2.04, 3.96, 7.6, 1.85, 0.84, -0.08, 1.07, 0.18, 1.18, 0.75, 1.23, 3.39, 1.18, 1.15, 0.87, 0.03, 1.59, 0.55, 1.56, 0.68, 4.07, 1.53, 0.03, 0.98, 2.18, 4.01, 1.37, 0.64, 1.34, 1.56, 0.48, 0.69, 1.83, 1.72, 1.5, 0.48]} \ No newline at end of file diff --git a/annotations_1/J6osFXTp7WQ_filtered.json b/annotations_1/J6osFXTp7WQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f33b4d7c2969f6bfec4143a87c433d6904352c3b --- /dev/null +++ b/annotations_1/J6osFXTp7WQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 107.81], [109.0, 146.72]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [87.81, 37.72]} \ No newline at end of file diff --git a/annotations_1/J90JKBCDzSs_filtered.json b/annotations_1/J90JKBCDzSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6156da73333c6bfbf2e58441fa3f1411bf859df2 --- /dev/null +++ b/annotations_1/J90JKBCDzSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 46.97], [49.0, 87.18], [92.0, 131.85], [132.0, 141.56]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.84], "audiomae_on_audioset": [null, null, null, null], "duration": [-0.03, 38.18, 39.85, 9.56]} \ No newline at end of file diff --git a/annotations_1/J96X6ei7LRE_filtered.json b/annotations_1/J96X6ei7LRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5ff7115837ccf0522c0be1dd852c86862517a50 --- /dev/null +++ b/annotations_1/J96X6ei7LRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[55.0, 56.39], [57.0, 67.34], [68.0, 71.79], [75.0, 77.46], [78.0, 79.34], [80.0, 83.08], [87.0, 87.78], [89.0, 107.59], [110.0, 130.69], [136.0, 140.04], [144.0, 145.99], [148.0, 148.34], [153.0, 174.61], [177.0, 181.55]], "keep_status": [false, false, true, false, false, true, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 33.46, 38.15, 53.04, 0.0, 31.56, 0.0, 31.39, 31.59, 33.79, 0.0, 0.0, 32.54, 30.65], "audiomae_on_audioset": [null, [["speech", 44.52], ["music", 19.41], ["thunk", 11.08]], [["music", 30.83], ["thunk", 11.95], ["machine gun", 8.98]], null, null, [["explosion", 28.09], ["burst, pop", 9.39], ["speech", 6.29]], null, [["music", 31.32], ["throbbing", 17.42], ["hum", 15.41]], [["speech", 43.48], ["music", 33.38], ["boing", 4.67]], [["music", 81.5], ["cacophony", 4.28], ["musical instrument", 1.71]], null, null, [["music", 39.94], ["speech", 21.61], ["throbbing", 9.42]], [["music", 25.79], ["speech", 19.64], ["whack, thwack", 7.48]]], "duration": [1.39, 10.34, 3.79, 2.46, 1.34, 3.08, 0.78, 18.59, 20.69, 4.04, 1.99, 0.34, 21.61, 4.55]} \ No newline at end of file diff --git a/annotations_1/J9Sz39odDjw_filtered.json b/annotations_1/J9Sz39odDjw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c0a77428e5645764962962958572d20eaece914 --- /dev/null +++ b/annotations_1/J9Sz39odDjw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.33], [12.0, 12.18], [14.0, 15.53], [18.0, 27.3], [29.0, 32.36], [49.0, 55.27], [60.0, 60.37], [67.0, 68.74], [76.0, 76.33], [92.0, 92.77]], "keep_status": [false, false, false, true, true, false, false, false, false, false], "silence_prob": [95.64, 0.0, 0.0, 32.55, 33.35, 55.39, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 46.97], ["groan", 5.65], ["speech", 4.64]], [["music", 26.99], ["moo", 10.04], ["sheep", 8.19]], null, null, null, null, null], "duration": [2.33, 0.18, 1.53, 9.3, 3.36, 6.27, 0.37, 1.74, 0.33, 0.77]} \ No newline at end of file diff --git a/annotations_1/J9qv_a_s7Gs_filtered.json b/annotations_1/J9qv_a_s7Gs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3f956c0211b3a6a90f764d295f61c90915b8179 --- /dev/null +++ b/annotations_1/J9qv_a_s7Gs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 17.07], [19.0, 24.81], [27.0, 27.6], [29.0, 28.95], [31.0, 30.99], [32.0, 32.31], [33.0, 47.06], [48.0, 48.84], [54.0, 58.4], [59.0, 87.15], [88.0, 95.93]], "keep_status": [false, false, false, false, false, false, true, false, true, true, true], "silence_prob": [95.09, 35.61, 0.0, 0.0, 0.0, 0.0, 29.0, 0.0, 29.75, 28.82, 29.48], "audiomae_on_audioset": [null, [["sidetone", 57.94], ["noise", 11.37], ["radio", 8.76]], null, null, null, null, [["speech", 12.65], ["livestock, farm animals, working animals", 9.67], ["buzz", 8.34]], null, [["vehicle", 22.65], ["speech", 15.54], ["cattle, bovinae", 8.44]], [["speech", 45.34], ["vehicle", 5.19], ["explosion", 5.17]], [["buzz", 12.66], ["cattle, bovinae", 8.17], ["livestock, farm animals, working animals", 7.47]]], "duration": [7.07, 5.81, 0.6, -0.05, -0.01, 0.31, 14.06, 0.84, 4.4, 28.15, 7.93]} \ No newline at end of file diff --git a/annotations_1/JAXij_5Rr0U_filtered.json b/annotations_1/JAXij_5Rr0U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9aaaad5fd127c11e175f8093f6f0a76ff600c76e --- /dev/null +++ b/annotations_1/JAXij_5Rr0U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.2], [6.0, 6.76], [17.0, 18.44], [19.0, 19.63], [21.0, 20.88], [21.0, 28.61], [36.0, 37.86], [44.0, 44.02], [51.0, 51.58], [56.0, 59.75], [66.0, 66.51], [75.0, 76.77], [79.0, 90.95], [97.0, 97.98], [99.0, 100.57], [114.0, 114.22], [115.0, 126.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.55, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 31.01, 0.0, 0.0, 0.0, 31.67], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 67.67], ["male speech, man speaking", 5.2], ["music", 5.16]], null, null, null, null, null, null, [["music", 78.31], ["didgeridoo", 5.6], ["electronic music", 2.01]], null, null, null, [["music", 73.78], ["didgeridoo", 9.35], ["electronic music", 1.8]]], "duration": [0.2, 0.76, 1.44, 0.63, -0.12, 7.61, 1.86, 0.02, 0.58, 3.75, 0.51, 1.77, 11.95, 0.98, 1.57, 0.22, 11.98]} \ No newline at end of file diff --git a/annotations_1/JAd3SSNqZlI_filtered.json b/annotations_1/JAd3SSNqZlI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37297f79a9501f67d7e11e7563903e40cb2740c9 --- /dev/null +++ b/annotations_1/JAd3SSNqZlI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.67], [5.0, 7.53], [9.0, 10.42], [13.0, 13.74], [20.0, 21.29], [23.0, 23.94], [33.0, 37.52], [39.0, 43.07], [46.0, 45.84], [49.0, 49.18], [56.0, 56.25], [57.0, 57.0], [57.0, 57.13], [59.0, 59.16], [66.0, 74.29], [75.0, 76.03], [82.0, 82.88], [93.0, 92.87], [96.0, 101.36], [103.0, 103.33], [106.0, 117.48], [121.0, 121.41], [122.0, 125.31], [127.0, 127.55], [129.0, 133.73], [134.0, 134.1]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 31.95, 0.0, 0.0, 0.0, 0.0, 29.85, 32.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.19, 0.0, 0.0, 0.0, 31.29, 0.0, 31.07, 0.0, 29.98, 0.0, 37.23, 0.0], "audiomae_on_audioset": [null, [["music", 51.75], ["musical instrument", 10.71], ["guitar", 5.18]], null, null, null, null, [["music", 70.41], ["harmonica", 4.61], ["clarinet", 4.48]], [["harmonica", 70.52], ["music", 12.36], ["wind instrument, woodwind instrument", 5.38]], null, null, null, null, null, null, [["music", 71.83], ["harmonica", 10.83], ["clarinet", 2.24]], null, null, null, [["music", 68.96], ["musical instrument", 3.41], ["speech", 3.07]], null, [["music", 74.47], ["musical instrument", 8.13], ["guitar", 1.89]], null, [["music", 26.54], ["boing", 7.54], ["cattle, bovinae", 7.22]], null, [["music", 50.38], ["wind instrument, woodwind instrument", 14.98], ["theremin", 8.27]], null], "duration": [1.67, 2.53, 1.42, 0.74, 1.29, 0.94, 4.52, 4.07, -0.16, 0.18, 0.25, 0.0, 0.13, 0.16, 8.29, 1.03, 0.88, -0.13, 5.36, 0.33, 11.48, 0.41, 3.31, 0.55, 4.73, 0.1]} \ No newline at end of file diff --git a/annotations_1/JCGqUJddlS4_filtered.json b/annotations_1/JCGqUJddlS4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d27ce2e27fde3969589a0abeeb1586fee94232a2 --- /dev/null +++ b/annotations_1/JCGqUJddlS4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.93], [3.0, 4.45], [7.0, 7.99], [10.0, 10.44], [11.0, 13.19], [13.0, 13.22], [15.0, 16.39], [18.0, 19.03], [25.0, 34.72], [35.0, 36.66], [39.0, 40.85], [44.0, 45.13], [51.0, 52.59], [56.0, 62.75], [65.0, 66.77], [67.0, 68.3]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.4, 0.0, 0.0, 0.0, 39.7, 0.0, 0.0, 0.0, 57.01, 0.0, 0.0, 0.0, 0.0, 37.93, 0.0, 0.0], "audiomae_on_audioset": [[["hammond organ", 19.39], ["music", 17.69], ["organ", 14.61]], null, null, null, [["speech", 59.39], ["music", 8.9], ["sidetone", 4.65]], null, null, null, null, null, null, null, null, [["music", 60.33], ["synthesizer", 9.23], ["musical instrument", 6.18]], null, null], "duration": [2.93, 1.45, 0.99, 0.44, 2.19, 0.22, 1.39, 1.03, 9.72, 1.66, 1.85, 1.13, 1.59, 6.75, 1.77, 1.3]} \ No newline at end of file diff --git a/annotations_1/JCo3QW-S310_filtered.json b/annotations_1/JCo3QW-S310_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57544096cca2163a8cbce33a466ab646ef68d48e --- /dev/null +++ b/annotations_1/JCo3QW-S310_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.21], [6.0, 6.24], [10.0, 11.26], [17.0, 20.24], [23.0, 27.43], [31.0, 38.21], [42.0, 43.14], [44.0, 48.3], [50.0, 50.31], [51.0, 52.02], [53.0, 53.91], [56.0, 61.62], [62.0, 61.84], [62.0, 67.44], [68.0, 70.24], [71.0, 73.06], [74.0, 77.25], [79.0, 96.38], [97.0, 103.79], [104.0, 105.44], [106.0, 107.76], [108.0, 111.1], [112.0, 117.66], [119.0, 120.24], [126.0, 126.44], [131.0, 138.89], [141.0, 144.81], [145.0, 145.74], [146.0, 159.44]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.49, 29.19, 50.56, 0.0, 35.01, 0.0, 0.0, 0.0, 46.43, 0.0, 43.77, 41.22, 41.28, 45.43, 29.87, 33.58, 0.0, 0.0, 38.46, 29.65, 0.0, 0.0, 30.68, 32.3, 0.0, 31.24], "audiomae_on_audioset": [null, null, null, [["music", 49.78], ["ambient music", 8.74], ["electronic music", 5.85]], [["whip", 33.53], ["whack, thwack", 8.65], ["music", 6.57]], null, null, [["music", 33.74], ["speech", 30.19], ["whale vocalization", 10.35]], null, null, null, [["speech", 52.73], ["music", 28.7], ["electronic music", 4.14]], null, [["music", 62.93], ["synthesizer", 12.46], ["electronic music", 8.26]], [["music", 68.12], ["theremin", 8.82], ["musical instrument", 5.61]], [["music", 75.46], ["musical instrument", 5.51], ["didgeridoo", 3.51]], [["music", 70.13], ["synthesizer", 6.14], ["musical instrument", 6.06]], [["music", 50.05], ["throbbing", 14.98], ["hum", 9.98]], [["music", 70.55], ["synthesizer", 11.23], ["throbbing", 5.02]], null, null, [["hum", 46.18], ["mains hum", 12.56], ["speech", 9.16]], [["breaking", 44.13], ["speech", 28.13], ["music", 12.37]], null, null, [["speech", 32.89], ["music", 28.59], ["hum", 11.03]], [["sidetone", 26.24], ["speech", 21.83], ["throbbing", 16.0]], null, [["music", 46.3], ["speech", 34.06], ["hum", 2.23]]], "duration": [1.21, 0.24, 1.26, 3.24, 4.43, 7.21, 1.14, 4.3, 0.31, 1.02, 0.91, 5.62, -0.16, 5.44, 2.24, 2.06, 3.25, 17.38, 6.79, 1.44, 1.76, 3.1, 5.66, 1.24, 0.44, 7.89, 3.81, 0.74, 13.44]} \ No newline at end of file diff --git a/annotations_1/JFAAK6FfOSA_filtered.json b/annotations_1/JFAAK6FfOSA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1468943fe7505d524e5d9a81fd3d955d8ca79919 --- /dev/null +++ b/annotations_1/JFAAK6FfOSA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 27.23], [29.0, 30.62], [31.0, 34.53], [35.0, 36.42], [47.0, 50.3], [51.0, 55.78], [60.0, 100.31], [106.0, 106.98], [111.0, 114.32], [117.0, 119.25]], "keep_status": [false, false, false, false, true, false, false, false, false, true], "silence_prob": [53.34, 0.0, 58.98, 0.0, 34.54, 34.86, 0.0, 0.0, 40.33, 48.48], "audiomae_on_audioset": [null, null, null, null, [["gong", 21.23], ["music", 14.03], ["hum", 10.04]], [["shofar", 48.98], ["music", 24.11], ["quack", 7.84]], null, null, [["music", 63.84], ["synthesizer", 4.38], ["musical instrument", 3.53]], [["music", 34.61], ["hum", 9.99], ["throbbing", 7.5]]], "duration": [3.23, 1.62, 3.53, 1.42, 3.3, 4.78, 40.31, 0.98, 3.32, 2.25]} \ No newline at end of file diff --git a/annotations_1/JFeaWHDQzQA_filtered.json b/annotations_1/JFeaWHDQzQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..389d1d3ca5c2a4329a0fa31d2ac9032345703135 --- /dev/null +++ b/annotations_1/JFeaWHDQzQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.62], [3.0, 4.23], [5.0, 8.95], [10.0, 11.23], [13.0, 17.73], [21.0, 22.11], [23.0, 31.13], [32.0, 32.78], [33.0, 34.33], [40.0, 41.03], [42.0, 46.25], [47.0, 48.74], [53.0, 53.49], [58.0, 58.43], [59.0, 59.41], [60.0, 60.93], [63.0, 62.82], [63.0, 63.61], [73.0, 72.86], [90.0, 90.68], [93.0, 93.48], [100.0, 101.82], [103.0, 103.0], [103.0, 105.07], [109.0, 111.15], [112.0, 112.6], [114.0, 114.03], [115.0, 117.71], [119.0, 120.14], [125.0, 126.91], [129.0, 133.02], [134.0, 136.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 56.1, 0.0, 67.51, 0.0, 97.54, 0.0, 0.0, 0.0, 93.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 98.8, 0.0, 0.0, 98.36, 0.0, 0.0, 95.09, 75.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 1.23, 3.95, 1.23, 4.73, 1.11, 8.13, 0.78, 1.33, 1.03, 4.25, 1.74, 0.49, 0.43, 0.41, 0.93, -0.18, 0.61, -0.14, 0.68, 0.48, 1.82, 0.0, 2.07, 2.15, 0.6, 0.03, 2.71, 1.14, 1.91, 4.02, 2.53]} \ No newline at end of file diff --git a/annotations_1/JHAtw0HRhho_filtered.json b/annotations_1/JHAtw0HRhho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9255069f48059fdc3319fb8e4d0577cec9b82f7 --- /dev/null +++ b/annotations_1/JHAtw0HRhho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.21], [29.0, 29.86], [43.0, 43.78], [57.0, 58.16], [79.0, 78.88], [89.0, 90.53], [100.0, 100.04], [100.0, 100.41], [101.0, 101.12], [109.0, 109.49], [112.0, 112.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 0.86, 0.78, 1.16, -0.12, 1.53, 0.04, 0.41, 0.12, 0.49, 0.21]} \ No newline at end of file diff --git a/annotations_1/JIMykDzqRbY_filtered.json b/annotations_1/JIMykDzqRbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff8474c24d96c07c7a17e3b6f588ca4efe5bbb01 --- /dev/null +++ b/annotations_1/JIMykDzqRbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.25], [11.0, 13.44], [24.0, 26.97], [43.0, 43.6], [54.0, 60.3], [73.0, 74.55], [86.0, 92.5], [95.0, 97.33], [99.0, 107.11], [116.0, 119.47], [121.0, 147.6]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [31.97, 32.23, 73.36, 0.0, 29.56, 0.0, 29.6, 30.22, 29.25, 30.68, 29.91], "audiomae_on_audioset": [[["music", 66.08], ["musical instrument", 7.31], ["guitar", 7.31]], [["music", 54.99], ["guitar", 10.38], ["musical instrument", 8.8]], null, null, [["music", 80.25], ["musical instrument", 5.07], ["male singing", 1.71]], null, [["music", 71.22], ["guitar", 5.46], ["musical instrument", 5.21]], [["music", 63.56], ["musical instrument", 11.67], ["guitar", 5.83]], [["music", 38.54], ["livestock, farm animals, working animals", 17.31], ["cattle, bovinae", 16.07]], [["music", 29.48], ["brass instrument", 17.64], ["didgeridoo", 16.02]], [["music", 57.34], ["didgeridoo", 13.66], ["synthesizer", 2.94]]], "duration": [2.25, 2.44, 2.97, 0.6, 6.3, 1.55, 6.5, 2.33, 8.11, 3.47, 26.6]} \ No newline at end of file diff --git a/annotations_1/JIsrqAWzVoA_filtered.json b/annotations_1/JIsrqAWzVoA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e022bb80a2fad7fdfa66f7b3beda61b2ec38dd00 --- /dev/null +++ b/annotations_1/JIsrqAWzVoA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 34.74]], "keep_status": [false], "silence_prob": [39.27], "audiomae_on_audioset": [[["music", 64.36], ["ambient music", 6.48], ["synthesizer", 4.37]]], "duration": [24.74]} \ No newline at end of file diff --git a/annotations_1/JJ0IOFvfu3Q_filtered.json b/annotations_1/JJ0IOFvfu3Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4de559889142fd4441c90dc8f9b38a5446cbfffc --- /dev/null +++ b/annotations_1/JJ0IOFvfu3Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 56.64], [59.0, 59.17], [60.0, 63.0], [65.0, 66.33], [70.0, 70.19], [71.0, 72.67], [73.0, 73.92], [77.0, 77.79], [81.0, 82.68], [86.0, 87.37], [89.0, 89.82], [98.0, 98.78], [99.0, 101.16], [107.0, 108.06], [110.0, 110.78], [112.0, 114.62], [116.0, 117.22], [123.0, 124.78], [126.0, 126.18], [128.0, 128.6], [131.0, 131.16], [132.0, 139.77]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [46.64, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 54.83], "audiomae_on_audioset": [[["speech", 19.21], ["frog", 11.05], ["electric shaver, electric razor", 5.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [14.64, 0.17, 3.0, 1.33, 0.19, 1.67, 0.92, 0.79, 1.68, 1.37, 0.82, 0.78, 2.16, 1.06, 0.78, 2.62, 1.22, 1.78, 0.18, 0.6, 0.16, 7.77]} \ No newline at end of file diff --git a/annotations_1/JJrTnnaEZ_w_filtered.json b/annotations_1/JJrTnnaEZ_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a32c2643eb3e3de485d2ece9572f2f9601b27a09 --- /dev/null +++ b/annotations_1/JJrTnnaEZ_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.45], [9.0, 10.72], [11.0, 12.97], [18.0, 20.26], [21.0, 22.17], [24.0, 24.14], [25.0, 26.55], [27.0, 30.18], [35.0, 36.64], [42.0, 43.06], [45.0, 48.0], [52.0, 56.61], [57.0, 62.67], [63.0, 66.88], [67.0, 69.74], [71.0, 73.43], [76.0, 83.42], [84.0, 103.32], [104.0, 118.81], [121.0, 121.78], [124.0, 127.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 63.53, 0.0, 0.0, 72.9, 58.55, 45.98, 90.6, 48.91, 92.48, 78.04, 97.22, 89.36, 0.0, 99.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["burping, eructation", 62.22], ["speech", 30.14], ["hiccup", 1.27]], null, [["speech", 59.24], ["sidetone", 15.27], ["hum", 6.69]], null, null, null, null, null, null], "duration": [1.45, 1.72, 1.97, 2.26, 1.17, 0.14, 1.55, 3.18, 1.64, 1.06, 3.0, 4.61, 5.67, 3.88, 2.74, 2.43, 7.42, 19.32, 14.81, 0.78, 3.11]} \ No newline at end of file diff --git a/annotations_1/JJwp_lEoOuI_filtered.json b/annotations_1/JJwp_lEoOuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11d9e50afee36db82b5d0c9fb5d33d7afe47fa81 --- /dev/null +++ b/annotations_1/JJwp_lEoOuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.55], [11.0, 12.12], [18.0, 20.85], [24.0, 24.95], [33.0, 33.03], [35.0, 37.3], [39.0, 41.72], [45.0, 45.89], [47.0, 48.12], [49.0, 51.14], [56.0, 56.35], [58.0, 58.85], [62.0, 63.12], [75.0, 80.42], [83.0, 84.48], [100.0, 101.51], [109.0, 109.66], [113.0, 113.43]], "keep_status": [false, false, true, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.75, 0.0, 0.0, 32.71, 37.76, 0.0, 0.0, 32.13, 0.0, 0.0, 0.0, 39.85, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 35.5], ["musical instrument", 6.14], ["guitar", 5.89]], null, null, [["music", 58.08], ["musical instrument", 4.51], ["singing", 3.94]], [["music", 58.51], ["musical instrument", 4.9], ["effects unit", 3.6]], null, null, [["music", 31.86], ["thunk", 26.94], ["whack, thwack", 6.17]], null, null, null, [["music", 61.29], ["didgeridoo", 8.03], ["speech", 6.71]], null, null, null, null], "duration": [0.55, 1.12, 2.85, 0.95, 0.03, 2.3, 2.72, 0.89, 1.12, 2.14, 0.35, 0.85, 1.12, 5.42, 1.48, 1.51, 0.66, 0.43]} \ No newline at end of file diff --git a/annotations_1/JJyK0EX6s_Q_filtered.json b/annotations_1/JJyK0EX6s_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92c93074b52451a61084394515fcd2a86d626eee --- /dev/null +++ b/annotations_1/JJyK0EX6s_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 73.9], [75.0, 75.17], [77.0, 78.66], [81.0, 81.63], [82.0, 82.95]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [46.9, 0.17, 1.66, 0.63, 0.95]} \ No newline at end of file diff --git a/annotations_1/JLH_smT7Qog_filtered.json b/annotations_1/JLH_smT7Qog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d0af2449729e4d2c675702b58a5aeaea5eb23ff --- /dev/null +++ b/annotations_1/JLH_smT7Qog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.04], [14.0, 14.25], [26.0, 29.59], [32.0, 32.73], [34.0, 36.44], [41.0, 41.66], [48.0, 51.43], [52.0, 52.74], [58.0, 58.16], [60.0, 61.69], [64.0, 65.37], [67.0, 67.07], [74.0, 74.97], [76.0, 77.53]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [76.7, 0.0, 63.53, 0.0, 42.91, 0.0, 64.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 15.6], ["thunk", 13.87], ["wind instrument, woodwind instrument", 6.81]], null, null, null, null, null, null, null, null, null], "duration": [8.04, 0.25, 3.59, 0.73, 2.44, 0.66, 3.43, 0.74, 0.16, 1.69, 1.37, 0.07, 0.97, 1.53]} \ No newline at end of file diff --git a/annotations_1/JLvkvjU_iyY_filtered.json b/annotations_1/JLvkvjU_iyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac7d2e4eb0dbb3a69bf800c72209c8bbcb692644 --- /dev/null +++ b/annotations_1/JLvkvjU_iyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 12.29], [21.0, 21.44], [23.0, 22.69], [30.0, 30.91], [32.0, 32.85], [35.0, 41.18], [45.0, 48.49], [51.0, 64.23], [71.0, 73.01], [74.0, 74.28], [77.0, 78.98], [80.0, 81.48], [88.0, 88.77], [89.0, 93.51], [95.0, 95.45], [100.0, 101.95], [105.0, 106.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [63.64, 0.0, 0.0, 0.0, 0.0, 45.65, 77.53, 36.18, 67.51, 0.0, 0.0, 0.0, 0.0, 49.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["gong", 38.79], ["music", 34.17], ["musical instrument", 5.17]], null, [["cattle, bovinae", 33.22], ["moo", 26.09], ["livestock, farm animals, working animals", 21.7]], null, null, null, null, null, [["music", 44.63], ["livestock, farm animals, working animals", 6.27], ["speech", 4.77]], null, null, null], "duration": [7.29, 0.44, -0.31, 0.91, 0.85, 6.18, 3.49, 13.23, 2.01, 0.28, 1.98, 1.48, 0.77, 4.51, 0.45, 1.95, 1.52]} \ No newline at end of file diff --git a/annotations_1/JNcNy7bJxDg_filtered.json b/annotations_1/JNcNy7bJxDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fce6a4e4023df3870ddabbcc4b74cec3caefb403 --- /dev/null +++ b/annotations_1/JNcNy7bJxDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [4.0, 6.89], [12.0, 12.93], [17.0, 17.49], [19.0, 20.92], [22.0, 22.99], [25.0, 25.56], [32.0, 35.23], [38.0, 43.83], [44.0, 45.3], [46.0, 46.72], [49.0, 51.36], [51.0, 53.25], [54.0, 55.12], [56.0, 56.93], [64.0, 64.64], [73.0, 72.99], [74.0, 74.04], [77.0, 77.14], [82.0, 82.56], [89.0, 90.46], [104.0, 109.16], [118.0, 121.73], [127.0, 126.99], [137.0, 136.76], [137.0, 141.54], [142.0, 142.57], [146.0, 145.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false], "silence_prob": [0.0, 36.36, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 91.98, 0.0, 0.0, 73.51, 46.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.25, 29.27, 0.0, 0.0, 31.06, 0.0, 0.0], "audiomae_on_audioset": [null, [["sidetone", 52.17], ["speech", 32.79], ["radio", 2.84]], null, null, null, null, null, null, null, null, null, null, [["creak", 40.66], ["speech", 17.52], ["cattle, bovinae", 3.2]], null, null, null, null, null, null, null, null, [["speech", 14.75], ["music", 14.08], ["boing", 10.96]], [["speech", 24.53], ["animal", 15.31], ["bow-wow", 10.3]], null, null, [["boing", 25.91], ["speech", 23.21], ["noise", 9.48]], null, null], "duration": [0.84, 2.89, 0.93, 0.49, 1.92, 0.99, 0.56, 3.23, 5.83, 1.3, 0.72, 2.36, 2.25, 1.12, 0.93, 0.64, -0.01, 0.04, 0.14, 0.56, 1.46, 5.16, 3.73, -0.01, -0.24, 4.54, 0.57, -0.39]} \ No newline at end of file diff --git a/annotations_1/JOw4LqyJKyg_filtered.json b/annotations_1/JOw4LqyJKyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46efce0f32345902a40ed836f65f511158d25878 --- /dev/null +++ b/annotations_1/JOw4LqyJKyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 26.0], [27.0, 37.61], [42.0, 78.21], [80.0, 91.64], [96.0, 99.47], [100.0, 107.99], [109.0, 131.45]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [29.43, 28.47, 0.0, 28.65, 29.09, 28.29, 28.4], "audiomae_on_audioset": [[["hum", 36.36], ["mains hum", 21.5], ["music", 14.43]], [["music", 65.72], ["hum", 4.74], ["smash, crash", 3.86]], null, [["music", 50.53], ["hum", 12.88], ["buzz", 11.74]], [["music", 32.46], ["hum", 11.68], ["electronic music", 8.79]], [["music", 45.01], ["mains hum", 15.41], ["hum", 13.91]], [["music", 73.48], ["speech", 4.51], ["hum", 4.4]]], "duration": [11.0, 10.61, 36.21, 11.64, 3.47, 7.99, 22.45]} \ No newline at end of file diff --git a/annotations_1/JOzVMqp3vMc_filtered.json b/annotations_1/JOzVMqp3vMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..739d8e25fc450ace8eac4b320a75a9e72e76d76a --- /dev/null +++ b/annotations_1/JOzVMqp3vMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.98], [14.0, 23.67], [27.0, 27.53], [33.0, 40.29], [41.0, 42.47], [44.0, 44.0], [47.0, 52.46], [53.0, 53.57], [56.0, 67.22], [69.0, 78.66], [81.0, 96.7], [98.0, 108.16], [109.0, 112.8], [117.0, 144.46], [147.0, 150.31], [151.0, 158.85], [166.0, 165.91], [166.0, 170.45]], "keep_status": [false, true, false, true, false, false, false, false, false, true, true, true, false, true, false, false, false, true], "silence_prob": [0.0, 39.37, 0.0, 35.36, 0.0, 0.0, 38.97, 0.0, 44.12, 33.41, 32.91, 35.94, 32.71, 36.07, 66.39, 55.67, 0.0, 45.46], "audiomae_on_audioset": [null, [["speech", 14.7], ["explosion", 10.59], ["whack, thwack", 9.42]], null, [["music", 32.71], ["didgeridoo", 6.57], ["speech", 6.0]], null, null, [["speech", 50.11], ["music", 22.9], ["radio", 4.39]], null, [["speech", 84.39], ["hum", 3.16], ["music", 2.02]], [["speech", 47.28], ["buzz", 7.04], ["music", 6.28]], [["whale vocalization", 22.45], ["music", 16.79], ["speech", 14.12]], [["speech", 22.79], ["music", 18.5], ["sidetone", 7.06]], [["fart", 35.0], ["speech", 29.43], ["explosion", 9.82]], [["music", 29.11], ["speech", 14.35], ["synthesizer", 9.11]], null, null, null, [["music", 13.36], ["synthesizer", 13.1], ["speech", 10.42]]], "duration": [1.98, 9.67, 0.53, 7.29, 1.47, 0.0, 5.46, 0.57, 11.22, 9.66, 15.7, 10.16, 3.8, 27.46, 3.31, 7.85, -0.09, 4.45]} \ No newline at end of file diff --git a/annotations_1/JPjeOAVkSe4_filtered.json b/annotations_1/JPjeOAVkSe4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae5eff0fef1644d9b781f5f7b53c00686a22e48f --- /dev/null +++ b/annotations_1/JPjeOAVkSe4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.51], [17.0, 19.58], [25.0, 26.35], [27.0, 27.67], [30.0, 33.03], [62.0, 65.6], [69.0, 69.7], [70.0, 71.05], [72.0, 72.4], [76.0, 77.03], [77.0, 80.32], [81.0, 87.99], [89.0, 89.24], [91.0, 90.83], [92.0, 92.67], [98.0, 98.96], [101.0, 101.71], [105.0, 108.28], [109.0, 109.85], [111.0, 112.41], [113.0, 114.47], [120.0, 120.55], [122.0, 122.91], [124.0, 125.39]], "keep_status": [true, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.71, 32.3, 0.0, 0.0, 40.24, 55.11, 0.0, 0.0, 0.0, 0.0, 39.77, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 17.14], ["moo", 14.64], ["cattle, bovinae", 13.57]], [["music", 59.31], ["musical instrument", 6.19], ["synthesizer", 5.33]], null, null, [["mosquito", 28.35], ["frog", 19.5], ["fly, housefly", 13.57]], null, null, null, null, null, [["speech", 27.32], ["radio", 16.18], ["sidetone", 8.67]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.51, 2.58, 1.35, 0.67, 3.03, 3.6, 0.7, 1.05, 0.4, 1.03, 3.32, 6.99, 0.24, -0.17, 0.67, 0.96, 0.71, 3.28, 0.85, 1.41, 1.47, 0.55, 0.91, 1.39]} \ No newline at end of file diff --git a/annotations_1/JQOay4rjHas_filtered.json b/annotations_1/JQOay4rjHas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cda00da59a59625abd95bce643e89800cbd06c2 --- /dev/null +++ b/annotations_1/JQOay4rjHas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.45], [13.0, 17.02], [18.0, 18.55], [23.0, 23.5], [28.0, 29.39], [31.0, 32.07], [33.0, 48.47], [51.0, 63.8], [65.0, 65.96], [71.0, 71.31], [73.0, 74.48], [81.0, 84.52], [88.0, 98.95], [100.0, 101.36], [109.0, 114.83], [119.0, 131.16], [134.0, 134.64], [136.0, 142.92], [145.0, 149.22], [149.0, 149.25], [149.0, 149.28], [149.0, 149.89], [151.0, 194.09]], "keep_status": [true, true, false, false, false, false, true, true, false, false, false, true, true, false, false, true, false, true, true, false, false, false, false], "silence_prob": [28.57, 28.96, 0.0, 0.0, 0.0, 0.0, 28.82, 45.52, 0.0, 0.0, 0.0, 30.04, 29.73, 0.0, 29.78, 28.92, 0.0, 30.19, 29.25, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 31.88], ["mains hum", 10.29], ["throbbing", 10.23]], [["music", 29.94], ["mains hum", 17.71], ["hum", 11.88]], null, null, null, null, [["hum", 23.26], ["music", 21.09], ["buzz", 12.08]], [["throbbing", 26.89], ["hum", 25.74], ["mains hum", 8.41]], null, null, null, [["music", 34.65], ["speech", 27.59], ["whip", 5.95]], [["music", 54.78], ["speech", 10.1], ["grunt", 4.28]], null, [["speech", 60.64], ["music", 17.49], ["reverberation", 4.12]], [["music", 28.59], ["breaking", 17.74], ["buzz", 7.53]], null, [["whale vocalization", 38.98], ["music", 10.68], ["wild animals", 8.26]], [["speech", 18.04], ["music", 17.65], ["whale vocalization", 9.72]], null, null, null, null], "duration": [7.45, 4.02, 0.55, 0.5, 1.39, 1.07, 15.47, 12.8, 0.96, 0.31, 1.48, 3.52, 10.95, 1.36, 5.83, 12.16, 0.64, 6.92, 4.22, 0.25, 0.28, 0.89, 43.09]} \ No newline at end of file diff --git a/annotations_1/JSX5qtBpL2g_filtered.json b/annotations_1/JSX5qtBpL2g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..123f357996dc7bd1ee56eb5e58f53af09f941400 --- /dev/null +++ b/annotations_1/JSX5qtBpL2g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.07], [4.0, 4.36], [6.0, 6.03], [7.0, 8.88], [9.0, 10.5], [14.0, 14.47], [19.0, 20.19], [21.0, 22.52], [23.0, 34.99], [36.0, 36.36], [37.0, 37.61], [39.0, 39.7], [41.0, 41.49], [42.0, 43.09], [45.0, 45.59], [46.0, 47.09], [48.0, 48.81], [52.0, 52.91], [55.0, 55.51], [58.0, 59.21], [60.0, 61.01], [62.0, 62.77], [67.0, 67.53], [69.0, 69.31], [74.0, 75.51], [77.0, 77.63], [92.0, 93.66], [95.0, 96.7], [98.0, 100.67], [102.0, 107.25], [108.0, 110.19], [113.0, 116.38], [117.0, 117.75], [121.0, 127.58], [129.0, 133.79], [135.0, 137.96], [139.0, 141.42], [142.0, 144.83], [146.0, 147.68], [149.0, 149.82], [151.0, 150.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 98.8, 100.0, 94.66, 0.0, 99.99, 99.85, 97.22, 100.0, 66.39, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.07, 0.36, 0.03, 1.88, 1.5, 0.47, 1.19, 1.52, 11.99, 0.36, 0.61, 0.7, 0.49, 1.09, 0.59, 1.09, 0.81, 0.91, 0.51, 1.21, 1.01, 0.77, 0.53, 0.31, 1.51, 0.63, 1.66, 1.7, 2.67, 5.25, 2.19, 3.38, 0.75, 6.58, 4.79, 2.96, 2.42, 2.83, 1.68, 0.82, -0.03]} \ No newline at end of file diff --git a/annotations_1/JSqbIAemGcs_filtered.json b/annotations_1/JSqbIAemGcs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f3ea6958b0d5ddf600539b9eef6413a353d69c6 --- /dev/null +++ b/annotations_1/JSqbIAemGcs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.31], [1.0, 2.24], [10.0, 10.57], [12.0, 18.12], [20.0, 21.22], [23.0, 25.05], [27.0, 28.66], [30.0, 30.28], [30.0, 32.49], [35.0, 36.48], [38.0, 38.2], [38.0, 39.02], [40.0, 40.76], [42.0, 43.78], [48.0, 49.2], [57.0, 58.38], [59.0, 59.83], [62.0, 62.77], [64.0, 64.71], [66.0, 66.5], [69.0, 69.26], [76.0, 76.18], [78.0, 78.14], [80.0, 80.27], [83.0, 84.4], [86.0, 86.73], [93.0, 93.75], [96.0, 96.23], [102.0, 102.57], [111.0, 134.42], [136.0, 144.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 45.05, 0.0, 69.88, 0.0, 0.0, 54.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.06, 28.72], "audiomae_on_audioset": [null, null, null, [["speech", 81.26], ["busy signal", 5.98], ["dial tone", 2.84]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.16], ["didgeridoo", 8.9], ["throbbing", 4.7]], [["music", 55.76], ["speech", 21.93], ["breaking", 3.38]]], "duration": [0.31, 1.24, 0.57, 6.12, 1.22, 2.05, 1.66, 0.28, 2.49, 1.48, 0.2, 1.02, 0.76, 1.78, 1.2, 1.38, 0.83, 0.77, 0.71, 0.5, 0.26, 0.18, 0.14, 0.27, 1.4, 0.73, 0.75, 0.23, 0.57, 23.42, 8.95]} \ No newline at end of file diff --git a/annotations_1/JT_59yK4Gm4_filtered.json b/annotations_1/JT_59yK4Gm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c8c6cfba9134b8bb32061338a23dc0003756dc8 --- /dev/null +++ b/annotations_1/JT_59yK4Gm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.18], [15.0, 16.24], [20.0, 21.15], [28.0, 80.62], [88.0, 100.68], [102.0, 103.4], [107.0, 108.7], [112.0, 113.12], [115.0, 116.13], [122.0, 131.03], [133.0, 132.95], [133.0, 133.59]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [46.05, 0.0, 0.0, 0.0, 28.91, 0.0, 0.0, 0.0, 0.0, 28.35, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 40.86], ["mains hum", 27.02], ["throbbing", 10.63]], null, null, null, [["music", 64.56], ["speech", 12.48], ["theremin", 4.02]], null, null, null, null, [["music", 44.76], ["speech", 19.05], ["vehicle", 5.56]], null, null], "duration": [4.18, 1.24, 1.15, 52.62, 12.68, 1.4, 1.7, 1.12, 1.13, 9.03, -0.05, 0.59]} \ No newline at end of file diff --git a/annotations_1/JU_Vqys3Kp4_filtered.json b/annotations_1/JU_Vqys3Kp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbb35bbd35cd4925f601b65806d9c40321311e6b --- /dev/null +++ b/annotations_1/JU_Vqys3Kp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.7], [14.0, 18.55], [24.0, 31.95], [33.0, 34.48], [36.0, 36.24], [37.0, 40.37], [48.0, 49.47], [51.0, 75.76], [85.0, 96.87], [99.0, 100.38], [102.0, 110.69]], "keep_status": [false, true, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 32.81, 99.95, 0.0, 0.0, 32.55, 0.0, 37.62, 44.34, 0.0, 47.31], "audiomae_on_audioset": [null, [["eruption", 11.17], ["throbbing", 10.18], ["applause", 8.19]], null, null, null, [["applause", 20.58], ["speech", 12.79], ["music", 10.3]], null, [["music", 54.57], ["theremin", 16.77], ["musical instrument", 2.93]], [["music", 43.79], ["cello", 11.19], ["double bass", 9.51]], null, [["music", 65.43], ["keyboard (musical)", 3.72], ["musical instrument", 3.58]]], "duration": [-0.3, 4.55, 7.95, 1.48, 0.24, 3.37, 1.47, 24.76, 11.87, 1.38, 8.69]} \ No newline at end of file diff --git a/annotations_1/JV05-E5FF2g_filtered.json b/annotations_1/JV05-E5FF2g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5317be51f9022e832993f1b9326f3effc494ac8d --- /dev/null +++ b/annotations_1/JV05-E5FF2g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 46.7], [48.0, 60.83], [63.0, 68.49], [71.0, 99.94], [103.0, 117.78], [119.0, 128.22], [129.0, 140.73], [141.0, 141.98], [143.0, 148.86], [151.0, 151.7]], "keep_status": [false, false, true, true, true, false, false, false, true, false], "silence_prob": [0.0, 31.7, 30.4, 30.11, 33.53, 65.44, 86.64, 0.0, 38.83, 0.0], "audiomae_on_audioset": [null, [["music", 62.92], ["hum", 5.18], ["cacophony", 3.72]], [["noise", 27.32], ["throbbing", 18.88], ["hum", 14.74]], [["music", 33.15], ["smash, crash", 17.38], ["whack, thwack", 7.27]], [["explosion", 39.7], ["burst, pop", 9.27], ["eruption", 7.76]], null, null, null, [["speech", 17.5], ["music", 11.49], ["drip", 9.82]], null], "duration": [40.7, 12.83, 5.49, 28.94, 14.78, 9.22, 11.73, 0.98, 5.86, 0.7]} \ No newline at end of file diff --git a/annotations_1/JV2dQauaWCU_filtered.json b/annotations_1/JV2dQauaWCU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ab80bad903ce3b0c3a6e86c88e125458521fb01 --- /dev/null +++ b/annotations_1/JV2dQauaWCU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.07], [13.0, 13.32], [15.0, 43.33], [44.0, 49.25], [51.0, 63.86], [64.0, 64.98], [68.0, 78.46], [85.0, 88.97], [89.0, 108.7], [113.0, 117.19], [120.0, 121.39], [122.0, 123.85], [124.0, 127.04], [128.0, 129.34], [130.0, 132.04], [134.0, 134.62]], "keep_status": [true, false, false, true, true, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [37.06, 0.0, 29.27, 28.89, 29.21, 0.0, 28.83, 28.61, 31.25, 68.67, 0.0, 0.0, 46.86, 0.0, 44.4, 0.0], "audiomae_on_audioset": [[["music", 26.36], ["hum", 21.06], ["mains hum", 19.41]], null, [["music", 67.64], ["mains hum", 8.93], ["hum", 7.29]], [["music", 34.74], ["speech", 18.13], ["breaking", 7.68]], [["music", 53.13], ["buzz", 4.98], ["cacophony", 4.25]], null, [["music", 38.9], ["breaking", 9.69], ["speech", 5.36]], [["music", 77.33], ["cacophony", 3.67], ["didgeridoo", 1.68]], [["machine gun", 22.08], ["smash, crash", 9.92], ["gunshot, gunfire", 9.0]], null, null, null, [["music", 44.99], ["speech", 24.47], ["synthesizer", 4.32]], null, [["music", 44.05], ["speech", 18.16], ["hum", 9.41]], null], "duration": [9.07, 0.32, 28.33, 5.25, 12.86, 0.98, 10.46, 3.97, 19.7, 4.19, 1.39, 1.85, 3.04, 1.34, 2.04, 0.62]} \ No newline at end of file diff --git a/annotations_1/JVRdRQaccL0_filtered.json b/annotations_1/JVRdRQaccL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9134e1aaefc34c0e1bf362c434f262311cebb63 --- /dev/null +++ b/annotations_1/JVRdRQaccL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[79.0, 86.83]], "keep_status": [false], "silence_prob": [54.3], "audiomae_on_audioset": [null], "duration": [7.83]} \ No newline at end of file diff --git a/annotations_1/JWXgBi3HDac_filtered.json b/annotations_1/JWXgBi3HDac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf7968e0cbbb888d2a27447df4176ee2cccc2b8a --- /dev/null +++ b/annotations_1/JWXgBi3HDac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.17], [14.0, 15.31], [30.0, 30.21]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.17, 1.31, 0.21]} \ No newline at end of file diff --git a/annotations_1/JWbqI-m3A3w_filtered.json b/annotations_1/JWbqI-m3A3w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dde894b005bebcec35dca979078ec618367d8e46 --- /dev/null +++ b/annotations_1/JWbqI-m3A3w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 72.57], [75.0, 76.32], [77.0, 81.73], [83.0, 130.89]], "keep_status": [true, false, false, false], "silence_prob": [31.55, 0.0, 35.37, 0.0], "audiomae_on_audioset": [[["creak", 11.12], ["smash, crash", 11.04], ["music", 10.43]], null, [["fly, housefly", 59.69], ["insect", 16.77], ["mosquito", 9.22]], null], "duration": [2.57, 1.32, 4.73, 47.89]} \ No newline at end of file diff --git a/annotations_1/JWrDT-JGDug_filtered.json b/annotations_1/JWrDT-JGDug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd9e129c1bdbe497dfccaabda4ddbe6445e784f9 --- /dev/null +++ b/annotations_1/JWrDT-JGDug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.15], [12.0, 12.12], [13.0, 19.38], [22.0, 22.17], [22.0, 22.42], [22.0, 22.45], [22.0, 32.76], [35.0, 44.44], [49.0, 48.98], [51.0, 52.24], [62.0, 62.77], [65.0, 67.86], [70.0, 71.15], [72.0, 82.12], [84.0, 87.94], [89.0, 89.33], [90.0, 102.59], [103.0, 116.02], [117.0, 133.54], [136.0, 136.36]], "keep_status": [true, false, true, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [45.88, 0.0, 37.93, 0.0, 0.0, 0.0, 32.1, 38.33, 0.0, 0.0, 0.0, 35.46, 0.0, 33.58, 33.13, 0.0, 31.17, 31.35, 30.73, 0.0], "audiomae_on_audioset": [[["music", 38.36], ["bleat", 8.57], ["sheep", 8.08]], null, [["fly, housefly", 35.19], ["insect", 17.7], ["bee, wasp, etc.", 9.05]], null, null, null, [["mosquito", 34.73], ["fly, housefly", 31.0], ["insect", 17.41]], [["music", 25.21], ["fly, housefly", 11.99], ["throbbing", 9.99]], null, null, null, [["music", 64.8], ["didgeridoo", 13.28], ["electronic music", 3.84]], null, [["music", 62.35], ["didgeridoo", 8.91], ["theremin", 7.98]], [["music", 33.02], ["speech", 22.6], ["vehicle", 7.59]], null, [["speech", 40.95], ["didgeridoo", 30.39], ["music", 18.28]], [["music", 66.17], ["speech", 14.13], ["didgeridoo", 4.35]], [["music", 27.51], ["speech", 24.29], ["musical instrument", 4.56]], null], "duration": [5.15, 0.12, 6.38, 0.17, 0.42, 0.45, 10.76, 9.44, -0.02, 1.24, 0.77, 2.86, 1.15, 10.12, 3.94, 0.33, 12.59, 13.02, 16.54, 0.36]} \ No newline at end of file diff --git a/annotations_1/JX2gQZj3-NI_filtered.json b/annotations_1/JX2gQZj3-NI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eac46546fd5a732e72e7bc1308d543a72ea81b8c --- /dev/null +++ b/annotations_1/JX2gQZj3-NI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 26.69], [30.0, 52.3], [56.0, 111.7], [115.0, 131.01], [133.0, 133.1], [135.0, 153.84], [154.0, 163.02], [165.0, 164.79]], "keep_status": [false, false, false, false, false, true, true, false], "silence_prob": [61.37, 33.45, 0.0, 47.82, 0.0, 34.88, 36.98, 0.0], "audiomae_on_audioset": [null, [["music", 51.03], ["throbbing", 14.57], ["hum", 10.13]], null, [["music", 76.2], ["synthesizer", 3.73], ["electronic music", 2.34]], null, [["music", 30.83], ["didgeridoo", 15.91], ["livestock, farm animals, working animals", 5.69]], [["music", 26.73], ["speech", 13.15], ["hum", 7.01]], null], "duration": [5.69, 22.3, 55.7, 16.01, 0.1, 18.84, 9.02, -0.21]} \ No newline at end of file diff --git a/annotations_1/JXyisZLObHc_filtered.json b/annotations_1/JXyisZLObHc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..137443a57d5677788028a5b3d85318db50251a27 --- /dev/null +++ b/annotations_1/JXyisZLObHc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.1], [5.0, 6.17], [7.0, 7.75], [8.0, 8.77], [9.0, 11.23], [12.0, 12.48], [14.0, 14.03], [19.0, 19.47], [39.0, 40.91], [48.0, 48.88], [52.0, 53.16], [54.0, 54.35], [57.0, 57.35], [62.0, 63.95], [71.0, 71.47], [79.0, 79.17], [90.0, 90.19], [93.0, 94.98], [95.0, 108.19], [112.0, 112.8], [115.0, 117.0], [119.0, 123.04], [128.0, 128.93], [136.0, 139.38], [140.0, 142.38], [143.0, 143.6], [145.0, 147.01], [152.0, 152.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.85, 0.0, 40.22, 43.93, 0.0, 100.0, 100.0, 0.0, 94.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 48.3], ["speech", 29.09], ["hum", 8.73]], null, [["speech", 69.32], ["telephone", 12.96], ["telephone bell ringing", 3.64]], [["speech", 46.85], ["telephone", 33.09], ["telephone bell ringing", 14.54]], null, null, null, null, null, null], "duration": [1.1, 1.17, 0.75, 0.77, 2.23, 0.48, 0.03, 0.47, 1.91, 0.88, 1.16, 0.35, 0.35, 1.95, 0.47, 0.17, 0.19, 1.98, 13.19, 0.8, 2.0, 4.04, 0.93, 3.38, 2.38, 0.6, 2.01, 0.83]} \ No newline at end of file diff --git a/annotations_1/JY4UoItJ_lA_filtered.json b/annotations_1/JY4UoItJ_lA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..112405d962b15ee01b3b60446e8dacadb77c0a3b --- /dev/null +++ b/annotations_1/JY4UoItJ_lA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.25], [18.0, 18.0], [20.0, 20.58], [24.0, 27.55], [28.0, 29.19], [32.0, 32.83], [33.0, 34.05], [35.0, 35.83], [37.0, 38.48], [40.0, 44.0], [45.0, 45.86], [47.0, 47.55], [49.0, 51.12], [52.0, 106.91], [111.0, 111.42], [113.0, 113.71], [115.0, 120.83], [125.0, 126.89], [128.0, 129.07], [130.0, 130.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 46.86, 0.0, 0.0, 98.99, 0.0, 0.0, 0.0, 67.38, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["sidetone", 91.45], ["speech", 7.09], ["radio", 0.58]], null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 0.0, 0.58, 3.55, 1.19, 0.83, 1.05, 0.83, 1.48, 4.0, 0.86, 0.55, 2.12, 54.91, 0.42, 0.71, 5.83, 1.89, 1.07, 0.32]} \ No newline at end of file diff --git a/annotations_1/JYLVFSmlNFs_filtered.json b/annotations_1/JYLVFSmlNFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1970d5d26a96f66a1152b0137e4d6e00a2298a59 --- /dev/null +++ b/annotations_1/JYLVFSmlNFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.17], [14.0, 19.2], [20.0, 25.41], [26.0, 26.49], [32.0, 32.31], [37.0, 41.25], [43.0, 43.34], [43.0, 45.1], [48.0, 49.2], [63.0, 64.03], [68.0, 68.52], [69.0, 69.65], [77.0, 78.24], [78.0, 79.22], [80.0, 107.35], [110.0, 129.07], [131.0, 131.8], [133.0, 166.11], [168.0, 170.21], [171.0, 171.93]], "keep_status": [false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 31.79, 31.12, 0.0, 0.0, 34.6, 0.0, 40.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0, 30.27, 0.0, 0.0, 34.46, 0.0], "audiomae_on_audioset": [null, [["speech", 54.53], ["music", 14.59], ["electric shaver, electric razor", 4.58]], [["music", 27.4], ["thunk", 13.15], ["speech", 10.95]], null, null, [["thunk", 19.26], ["buzzer", 10.81], ["music", 9.06]], null, [["music", 52.49], ["didgeridoo", 9.11], ["speech", 3.6]], null, null, null, null, null, null, [["speech", 39.19], ["music", 34.06], ["throbbing", 4.6]], [["music", 34.54], ["throbbing", 17.22], ["smash, crash", 9.91]], null, null, [["mains hum", 34.4], ["music", 23.72], ["hum", 16.52]], null], "duration": [1.17, 5.2, 5.41, 0.49, 0.31, 4.25, 0.34, 2.1, 1.2, 1.03, 0.52, 0.65, 1.24, 1.22, 27.35, 19.07, 0.8, 33.11, 2.21, 0.93]} \ No newline at end of file diff --git a/annotations_1/JYVhLnjKKC8_filtered.json b/annotations_1/JYVhLnjKKC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cebe84e2fe6eca228294b9f3c6f61c3ddf43c26 --- /dev/null +++ b/annotations_1/JYVhLnjKKC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 35.56], [36.0, 35.68], [36.0, 37.17], [38.0, 43.6], [48.0, 74.87], [76.0, 84.5], [85.0, 84.94], [85.0, 85.29], [90.0, 90.61], [92.0, 94.0], [102.0, 105.39], [107.0, 108.95], [110.0, 111.2], [113.0, 117.75], [119.0, 161.37], [168.0, 171.95], [172.0, 172.39], [172.0, 172.44]], "keep_status": [true, false, false, true, true, true, false, false, false, true, true, false, false, false, false, true, false, false], "silence_prob": [29.7, 0.0, 0.0, 30.57, 29.33, 28.66, 0.0, 0.0, 0.0, 29.1, 44.07, 0.0, 0.0, 41.87, 0.0, 28.12, 0.0, 0.0], "audiomae_on_audioset": [[["music", 30.62], ["speech", 20.67], ["buzz", 9.37]], null, null, [["speech", 46.0], ["music", 13.52], ["vehicle", 2.75]], [["speech", 41.42], ["vehicle", 13.09], ["music", 10.19]], [["speech", 32.38], ["hum", 8.45], ["explosion", 6.02]], null, null, null, [["explosion", 20.44], ["music", 20.25], ["speech", 5.93]], [["fly, housefly", 9.51], ["throbbing", 5.86], ["music", 5.82]], null, null, [["music", 62.02], ["hum", 8.21], ["throbbing", 4.75]], null, [["explosion", 22.48], ["burst, pop", 18.46], ["sound effect", 9.17]], null, null], "duration": [12.56, -0.32, 1.17, 5.6, 26.87, 8.5, -0.06, 0.29, 0.61, 2.0, 3.39, 1.95, 1.2, 4.75, 42.37, 3.95, 0.39, 0.44]} \ No newline at end of file diff --git a/annotations_1/JYwvFPjJ7dM_filtered.json b/annotations_1/JYwvFPjJ7dM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f5acb95d83276ff976a61d3392b564903f63e82 --- /dev/null +++ b/annotations_1/JYwvFPjJ7dM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.02], [2.0, 2.08], [3.0, 3.54], [7.0, 7.48], [8.0, 9.02], [11.0, 11.23], [13.0, 13.61], [16.0, 16.55], [19.0, 20.34], [21.0, 21.44], [23.0, 26.16], [30.0, 30.82], [36.0, 36.42], [40.0, 40.27], [41.0, 42.35], [43.0, 43.85], [44.0, 46.33], [47.0, 47.48], [48.0, 47.55], [48.0, 47.61], [48.0, 47.92], [48.0, 49.59], [51.0, 52.19], [54.0, 54.82], [56.0, 56.83], [58.0, 58.75], [59.0, 61.74], [63.0, 63.64], [64.0, 95.39], [99.0, 101.33], [102.0, 111.37], [112.0, 113.91], [114.0, 116.65], [118.0, 122.13], [124.0, 124.92], [126.0, 126.5], [128.0, 136.75], [137.0, 138.33], [138.0, 139.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 52.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.01, 0.0, 0.0, 58.3, 71.29, 0.0, 84.98, 72.9, 0.0, 0.0, 79.94, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.92], ["telephone", 4.99], ["animal", 3.58]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.02, 0.08, 0.54, 0.48, 1.02, 0.23, 0.61, 0.55, 1.34, 0.44, 3.16, 0.82, 0.42, 0.27, 1.35, 0.85, 2.33, 0.48, -0.45, -0.39, -0.08, 1.59, 1.19, 0.82, 0.83, 0.75, 2.74, 0.64, 31.39, 2.33, 9.37, 1.91, 2.65, 4.13, 0.92, 0.5, 8.75, 1.33, 1.7]} \ No newline at end of file diff --git a/annotations_1/JZCM0ZW-GMw_filtered.json b/annotations_1/JZCM0ZW-GMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02f82a2b676e210d6963b48fd07a66d7ca611f5c --- /dev/null +++ b/annotations_1/JZCM0ZW-GMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.17], [13.0, 13.53], [15.0, 17.9], [19.0, 18.81], [27.0, 26.94], [29.0, 29.83], [33.0, 34.3], [35.0, 35.75], [37.0, 37.4], [39.0, 40.09], [43.0, 43.48], [49.0, 49.76], [51.0, 51.58], [59.0, 61.6], [62.0, 62.55], [65.0, 66.34], [70.0, 72.44], [74.0, 91.1], [93.0, 93.18], [94.0, 98.24], [107.0, 107.79], [109.0, 112.45], [113.0, 112.67], [117.0, 117.42], [121.0, 121.86], [124.0, 124.36], [127.0, 127.06], [127.0, 128.16], [129.0, 131.33], [134.0, 134.54]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 32.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.2, 0.0, 0.0, 96.17, 35.91, 0.0, 43.98, 0.0, 30.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.57, 0.0], "audiomae_on_audioset": [null, null, [["fly, housefly", 20.6], ["mosquito", 11.29], ["fart", 11.01]], null, null, null, null, null, null, null, null, null, null, [["speech", 54.69], ["horse", 5.76], ["outside, urban or manmade", 4.18]], null, null, null, [["music", 31.72], ["throbbing", 28.18], ["hum", 20.47]], null, [["music", 58.45], ["hum", 13.83], ["throbbing", 5.09]], null, [["speech", 42.04], ["music", 21.58], ["explosion", 7.46]], null, null, null, null, null, null, [["speech", 28.66], ["animal", 8.2], ["livestock, farm animals, working animals", 7.94]], null], "duration": [1.17, 0.53, 2.9, -0.19, -0.06, 0.83, 1.3, 0.75, 0.4, 1.09, 0.48, 0.76, 0.58, 2.6, 0.55, 1.34, 2.44, 17.1, 0.18, 4.24, 0.79, 3.45, -0.33, 0.42, 0.86, 0.36, 0.06, 1.16, 2.33, 0.54]} \ No newline at end of file diff --git a/annotations_1/JZzbTqTLiqU_filtered.json b/annotations_1/JZzbTqTLiqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d5763b07c42c362544c85bf2af5df81e6d74dfb --- /dev/null +++ b/annotations_1/JZzbTqTLiqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.11], [10.0, 10.96], [14.0, 16.61], [19.0, 19.41], [21.0, 23.5], [25.0, 26.91], [29.0, 31.94], [33.0, 43.34], [44.0, 46.55], [47.0, 53.96], [55.0, 57.23], [58.0, 61.59], [62.0, 64.12], [65.0, 72.28], [73.0, 74.56], [75.0, 75.81], [77.0, 92.58], [93.0, 92.62], [94.0, 115.62], [119.0, 120.14], [123.0, 123.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 87.37, 0.0, 70.44, 0.0, 72.6, 47.35, 53.59, 98.44, 100.0, 61.67, 37.28, 54.83, 0.0, 0.0, 45.98, 0.0, 34.49, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 51.85], ["hum", 11.18], ["throbbing", 7.54]], null, null, null, null, [["speech", 66.44], ["guitar", 5.05], ["music", 4.73]], null, null, null, [["tuning fork", 54.48], ["music", 10.61], ["ding", 3.93]], null, [["music", 72.32], ["ping", 6.73], ["musical instrument", 2.57]], null, null], "duration": [1.11, 0.96, 2.61, 0.41, 2.5, 1.91, 2.94, 10.34, 2.55, 6.96, 2.23, 3.59, 2.12, 7.28, 1.56, 0.81, 15.58, -0.38, 21.62, 1.14, 0.67]} \ No newline at end of file diff --git a/annotations_1/J_wbvP9hEFQ_filtered.json b/annotations_1/J_wbvP9hEFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61333348d62def5156bd5db36debd9d066fee880 --- /dev/null +++ b/annotations_1/J_wbvP9hEFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.2], [13.0, 25.64], [27.0, 26.76], [29.0, 29.4], [31.0, 31.35], [34.0, 34.1], [41.0, 42.21], [43.0, 60.44], [60.0, 61.21], [62.0, 61.64], [62.0, 62.94], [65.0, 65.64], [78.0, 78.97], [80.0, 80.57], [91.0, 90.78], [96.0, 98.2], [102.0, 102.56], [113.0, 113.98], [120.0, 121.1], [122.0, 123.04], [125.0, 124.9], [139.0, 138.87], [142.0, 142.65], [149.0, 151.44], [152.0, 154.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.28, 0.0, 0.0, 0.0, 0.0, 0.0, 37.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.46, 35.93], "audiomae_on_audioset": [null, [["music", 67.22], ["didgeridoo", 15.41], ["musical instrument", 5.63]], null, null, null, null, null, [["music", 46.32], ["speech", 35.01], ["electric shaver, electric razor", 2.46]], null, null, null, null, null, null, null, [["effects unit", 11.11], ["speech", 9.6], ["noise", 7.04]], null, null, null, null, null, null, null, [["music", 55.8], ["theremin", 14.21], ["bell", 4.45]], [["foghorn", 38.12], ["music", 24.39], ["trombone", 8.46]]], "duration": [0.2, 12.64, -0.24, 0.4, 0.35, 0.1, 1.21, 17.44, 1.21, -0.36, 0.94, 0.64, 0.97, 0.57, -0.22, 2.2, 0.56, 0.98, 1.1, 1.04, -0.1, -0.13, 0.65, 2.44, 2.26]} \ No newline at end of file diff --git a/annotations_1/JaMejPOFVCc_filtered.json b/annotations_1/JaMejPOFVCc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a92a0a48ba90a6ed01fa3dd3a99e28608e1dea3c --- /dev/null +++ b/annotations_1/JaMejPOFVCc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 29.86], [35.0, 35.43], [36.0, 36.1], [41.0, 41.08], [44.0, 44.47], [55.0, 55.07], [60.0, 64.02], [65.0, 65.25], [66.0, 67.04], [69.0, 69.04], [73.0, 73.36], [75.0, 75.98], [80.0, 81.03], [82.0, 83.15], [84.0, 87.96], [89.0, 89.45], [91.0, 94.71], [96.0, 98.86], [103.0, 103.25], [120.0, 120.43], [130.0, 130.47], [132.0, 138.47], [145.0, 145.15], [166.0, 166.21], [168.0, 170.92], [200.0, 202.64], [205.0, 207.71], [209.0, 209.76]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.74, 0.0, 34.7, 51.94, 0.0, 0.0, 0.0, 32.29, 0.0, 0.0, 30.5, 99.68, 99.48, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["fart", 18.34], ["burping, eructation", 14.54], ["whale vocalization", 13.17]], null, null, null, null, null, null, null, [["speech", 33.66], ["music", 22.45], ["fart", 7.93]], null, [["grunt", 17.18], ["music", 16.33], ["speech", 9.58]], null, null, null, null, [["groan", 58.93], ["music", 14.55], ["speech", 9.04]], null, null, [["groan", 12.05], ["whack, thwack", 11.87], ["boing", 10.25]], null, null, null], "duration": [-0.14, 0.43, 0.1, 0.08, 0.47, 0.07, 4.02, 0.25, 1.04, 0.04, 0.36, 0.98, 1.03, 1.15, 3.96, 0.45, 3.71, 2.86, 0.25, 0.43, 0.47, 6.47, 0.15, 0.21, 2.92, 2.64, 2.71, 0.76]} \ No newline at end of file diff --git a/annotations_1/JaTAjmSppvA_filtered.json b/annotations_1/JaTAjmSppvA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef820e4577160afc65c0772d3a640e6d00662efd --- /dev/null +++ b/annotations_1/JaTAjmSppvA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.96], [14.0, 17.32], [28.0, 71.83], [92.0, 98.07], [106.0, 106.95], [108.0, 111.03], [113.0, 113.59], [115.0, 119.57], [121.0, 148.22], [149.0, 152.81], [155.0, 159.02], [160.0, 162.73], [164.0, 164.0], [167.0, 167.64], [168.0, 173.74]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 41.01, 0.0, 31.54, 0.0, 51.71, 0.0, 35.87, 32.1, 42.22, 41.42, 67.25, 0.0, 0.0, 55.89], "audiomae_on_audioset": [null, [["speech", 56.86], ["explosion", 10.15], ["burst, pop", 4.17]], null, [["speech", 47.8], ["music", 17.88], ["fart", 2.99]], null, null, null, [["cattle, bovinae", 44.84], ["moo", 38.66], ["livestock, farm animals, working animals", 9.06]], [["music", 44.54], ["hum", 6.76], ["livestock, farm animals, working animals", 6.65]], [["speech", 38.89], ["music", 25.68], ["sidetone", 12.28]], [["cattle, bovinae", 49.13], ["moo", 33.74], ["livestock, farm animals, working animals", 5.59]], null, null, null, null], "duration": [-0.04, 3.32, 43.83, 6.07, 0.95, 3.03, 0.59, 4.57, 27.22, 3.81, 4.02, 2.73, 0.0, 0.64, 5.74]} \ No newline at end of file diff --git a/annotations_1/JanwLiyFPAU_filtered.json b/annotations_1/JanwLiyFPAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d30ef30a7ab50d11c870883ba776c141d06ad581 --- /dev/null +++ b/annotations_1/JanwLiyFPAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 21.32], [23.0, 24.68], [26.0, 31.38], [37.0, 38.06], [55.0, 55.22], [56.0, 56.64], [59.0, 58.8], [60.0, 62.34], [74.0, 74.33], [78.0, 78.56], [80.0, 80.05], [83.0, 83.69], [86.0, 88.03], [92.0, 92.6], [93.0, 94.74], [100.0, 101.17], [106.0, 105.98]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [99.62, 0.0, 95.37, 0.0, 0.0, 0.0, 0.0, 37.45, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["moo", 31.09], ["cattle, bovinae", 28.36], ["livestock, farm animals, working animals", 5.98]], null, null, null, null, null, null, null, null, null], "duration": [4.32, 1.68, 5.38, 1.06, 0.22, 0.64, -0.2, 2.34, 0.33, 0.56, 0.05, 0.69, 2.03, 0.6, 1.74, 1.17, -0.02]} \ No newline at end of file diff --git a/annotations_1/Jb2egULZePg_filtered.json b/annotations_1/Jb2egULZePg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dcb6e85662b3269782f10cc381e9c8d4b613548 --- /dev/null +++ b/annotations_1/Jb2egULZePg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [6.0, 6.27], [7.0, 8.46], [9.0, 9.81], [29.0, 29.64], [31.0, 31.29], [34.0, 35.14], [38.0, 37.66], [43.0, 42.75], [48.0, 48.54], [53.0, 59.1], [61.0, 62.11], [63.0, 64.08], [66.0, 67.22], [71.0, 71.0], [72.0, 72.27], [74.0, 74.44], [83.0, 83.34], [88.0, 119.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.27, 1.46, 0.81, 0.64, 0.29, 1.14, -0.34, -0.25, 0.54, 6.1, 1.11, 1.08, 1.22, 0.0, 0.27, 0.44, 0.34, 31.77]} \ No newline at end of file diff --git a/annotations_1/JbuGOroCWaI_filtered.json b/annotations_1/JbuGOroCWaI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13531642aeb3f7bcf2d3de881a67dac9ccc2f339 --- /dev/null +++ b/annotations_1/JbuGOroCWaI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.47], [9.0, 10.37], [11.0, 19.8], [21.0, 24.11], [25.0, 34.38], [35.0, 36.0], [38.0, 38.8], [46.0, 46.41], [51.0, 53.97], [56.0, 57.2], [59.0, 59.95], [63.0, 62.8], [66.0, 66.55], [79.0, 79.74], [84.0, 84.79], [101.0, 101.09], [114.0, 114.39], [123.0, 124.38], [148.0, 148.83], [152.0, 154.28], [160.0, 160.61], [164.0, 165.08]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 65.67, 48.48, 70.44, 0.0, 0.0, 0.0, 69.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 25.41], ["sidetone", 23.84], ["hum", 14.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 1.37, 8.8, 3.11, 9.38, 1.0, 0.8, 0.41, 2.97, 1.2, 0.95, -0.2, 0.55, 0.74, 0.79, 0.09, 0.39, 1.38, 0.83, 2.28, 0.61, 1.08]} \ No newline at end of file diff --git a/annotations_1/JcAdeY9KlpE_filtered.json b/annotations_1/JcAdeY9KlpE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9401fb0ff47e819cce67cf7be550d9965a957ed2 --- /dev/null +++ b/annotations_1/JcAdeY9KlpE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 0.97], [2.0, 2.25], [8.0, 8.28], [10.0, 9.76], [24.0, 24.58], [33.0, 35.36], [35.0, 35.45], [44.0, 45.03], [53.0, 54.03], [56.0, 56.71], [61.0, 60.99], [61.0, 61.7], [65.0, 65.65], [70.0, 70.38], [70.0, 70.41], [74.0, 73.99], [75.0, 75.86], [79.0, 79.46], [79.0, 82.83], [92.0, 92.23], [96.0, 95.89], [101.0, 101.21], [103.0, 104.82], [107.0, 106.84], [110.0, 110.22], [116.0, 116.97], [120.0, 120.04], [120.0, 120.5], [124.0, 125.54], [127.0, 126.87], [128.0, 147.65], [151.0, 152.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["frog", 41.4], ["croak", 25.8], ["speech", 11.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 66.61], ["speech", 4.08], ["boing", 3.74]], null], "duration": [0.5, -0.03, 0.25, 0.28, -0.24, 0.58, 2.36, 0.45, 1.03, 1.03, 0.71, -0.01, 0.7, 0.65, 0.38, 0.41, -0.01, 0.86, 0.46, 3.83, 0.23, -0.11, 0.21, 1.82, -0.16, 0.22, 0.97, 0.04, 0.5, 1.54, -0.13, 19.65, 1.0]} \ No newline at end of file diff --git a/annotations_1/JcC5XdvOWWM_filtered.json b/annotations_1/JcC5XdvOWWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72fc993a8e10f6f40d50d491c2423cef59914a7e --- /dev/null +++ b/annotations_1/JcC5XdvOWWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.72], [17.0, 16.92], [20.0, 20.29], [21.0, 21.02], [23.0, 25.1], [27.0, 32.14], [34.0, 35.61], [40.0, 39.95], [45.0, 45.96], [46.0, 46.87], [48.0, 49.49], [51.0, 54.21], [55.0, 55.0], [56.0, 57.35], [67.0, 70.8], [76.0, 107.72]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.13, 32.59, 0.0, 0.0, 0.0, 0.0, 0.0, 32.33, 0.0, 0.0, 30.75, 0.0], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 27.69], ["hum", 20.28], ["music", 14.8]], [["music", 64.73], ["synthesizer", 7.64], ["musical instrument", 5.49]], null, null, null, null, null, [["whale vocalization", 39.4], ["speech", 17.33], ["fart", 14.38]], null, null, [["music", 49.97], ["speech", 12.9], ["boing", 9.94]], null], "duration": [0.72, -0.08, 0.29, 0.02, 2.1, 5.14, 1.61, -0.05, 0.96, 0.87, 1.49, 3.21, 0.0, 1.35, 3.8, 31.72]} \ No newline at end of file diff --git a/annotations_1/JcRuXU7cvmo_filtered.json b/annotations_1/JcRuXU7cvmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8ccb638206486fd7ea0556546a9f0ea8a0d2c03 --- /dev/null +++ b/annotations_1/JcRuXU7cvmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 70.06], [72.0, 72.72], [74.0, 78.09], [85.0, 103.49], [104.0, 105.78], [107.0, 110.07]], "keep_status": [false, false, false, false, false, false], "silence_prob": [58.89, 0.0, 73.06, 69.61, 0.0, 81.89], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [14.06, 0.72, 4.09, 18.49, 1.78, 3.07]} \ No newline at end of file diff --git a/annotations_1/Jd0XiJie7Lo_filtered.json b/annotations_1/Jd0XiJie7Lo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a12029ba108bc4c4033b367b4869ef5d3b65b9e1 --- /dev/null +++ b/annotations_1/Jd0XiJie7Lo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.24], [9.0, 23.46], [28.0, 32.41], [33.0, 49.3], [50.0, 55.0], [55.0, 55.41], [70.0, 71.34], [72.0, 73.6]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [0.0, 89.36, 33.77, 55.67, 32.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 34.69], ["whale vocalization", 18.04], ["hum", 5.33]], null, [["music", 30.52], ["speech", 26.81], ["boing", 12.84]], null, null, null], "duration": [0.24, 14.46, 4.41, 16.3, 5.0, 0.41, 1.34, 1.6]} \ No newline at end of file diff --git a/annotations_1/Jd3GwwxFDPY_filtered.json b/annotations_1/Jd3GwwxFDPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9ba114f42a030f0f582862b7647d804c2c3d92a --- /dev/null +++ b/annotations_1/Jd3GwwxFDPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.13], [3.0, 3.86], [5.0, 5.21], [7.0, 8.43], [10.0, 10.91], [12.0, 12.78], [15.0, 23.99], [27.0, 31.94], [32.0, 33.64], [34.0, 37.37], [43.0, 43.44], [44.0, 48.32], [49.0, 49.2], [51.0, 70.51], [79.0, 79.91], [81.0, 81.41], [83.0, 104.45], [107.0, 113.0], [116.0, 117.71], [119.0, 120.12], [122.0, 122.15], [128.0, 128.38], [129.0, 129.73], [132.0, 132.76], [133.0, 133.84], [135.0, 137.79], [140.0, 141.24], [144.0, 155.33]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.9, 42.44, 0.0, 48.91, 0.0, 34.44, 0.0, 32.82, 0.0, 0.0, 44.93, 34.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.78, 0.0, 38.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["cattle, bovinae", 22.46], ["speech", 19.75], ["livestock, farm animals, working animals", 13.75]], null, [["fly, housefly", 40.69], ["insect", 19.11], ["bee, wasp, etc.", 6.01]], null, [["mosquito", 49.36], ["fly, housefly", 32.96], ["insect", 10.94]], null, [["gong", 17.28], ["hum", 10.36], ["speech", 9.55]], null, null, [["livestock, farm animals, working animals", 39.23], ["cattle, bovinae", 10.43], ["clip-clop", 9.15]], [["fly, housefly", 47.68], ["insect", 23.58], ["speech", 13.94]], null, null, null, null, null, null, null, [["speech", 22.75], ["moo", 11.16], ["horse", 10.86]], null, [["speech", 39.6], ["horse", 5.17], ["knock", 4.19]]], "duration": [1.13, 0.86, 0.21, 1.43, 0.91, 0.78, 8.99, 4.94, 1.64, 3.37, 0.44, 4.32, 0.2, 19.51, 0.91, 0.41, 21.45, 6.0, 1.71, 1.12, 0.15, 0.38, 0.73, 0.76, 0.84, 2.79, 1.24, 11.33]} \ No newline at end of file diff --git a/annotations_1/JdZHXwqDXB4_filtered.json b/annotations_1/JdZHXwqDXB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..076cb36a9ae72f5677d135dcd2eba8bcd2b3c1e5 --- /dev/null +++ b/annotations_1/JdZHXwqDXB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.73], [26.0, 26.6], [34.0, 34.13], [40.0, 40.47], [43.0, 43.68], [48.0, 49.35], [50.0, 52.83], [54.0, 55.16], [58.0, 57.74], [60.0, 61.89], [65.0, 65.31], [66.0, 69.3], [70.0, 70.88], [72.0, 72.4], [73.0, 73.48], [79.0, 83.29], [83.0, 83.32], [86.0, 91.17], [93.0, 94.09], [96.0, 97.28], [99.0, 99.44], [104.0, 104.31], [106.0, 106.76], [108.0, 108.24], [109.0, 110.12], [113.0, 115.32], [140.0, 140.97], [151.0, 151.93], [153.0, 153.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 51.66, 0.0, 0.0, 0.0, 40.22, 0.0, 32.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 76.44], ["musical instrument", 2.78], ["speech", 2.16]], null, [["music", 72.76], ["siren", 5.74], ["police car (siren)", 4.19]], null, null, null, null, null, null, null, [["ice cream truck, ice cream van", 80.22], ["music", 6.05], ["speech", 5.53]], null, null, null], "duration": [1.73, 0.6, 0.13, 0.47, 0.68, 1.35, 2.83, 1.16, -0.26, 1.89, 0.31, 3.3, 0.88, 0.4, 0.48, 4.29, 0.32, 5.17, 1.09, 1.28, 0.44, 0.31, 0.76, 0.24, 1.12, 2.32, 0.97, 0.93, 0.13]} \ No newline at end of file diff --git a/annotations_1/Je3Vjos0TlQ_filtered.json b/annotations_1/Je3Vjos0TlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff140743b3f1684721ecc9dd1c88c3746b36463e --- /dev/null +++ b/annotations_1/Je3Vjos0TlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 66.85], [69.0, 71.02], [74.0, 78.17], [79.0, 157.87], [159.0, 162.11], [163.0, 175.58], [176.0, 175.81]], "keep_status": [false, true, false, false, true, false, false], "silence_prob": [0.0, 38.15, 28.91, 0.0, 48.48, 35.5, 0.0], "audiomae_on_audioset": [null, [["music", 25.05], ["speech", 12.84], ["hum", 9.81]], [["music", 63.85], ["hum", 6.3], ["electronic music", 6.13]], null, [["animal", 8.55], ["cattle, bovinae", 8.39], ["speech", 7.63]], [["electric shaver, electric razor", 35.87], ["hum", 17.36], ["mains hum", 16.8]], null], "duration": [0.85, 2.02, 4.17, 78.87, 3.11, 12.58, -0.19]} \ No newline at end of file diff --git a/annotations_1/Jf7jVM7NoVE_filtered.json b/annotations_1/Jf7jVM7NoVE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc1b7cb3e939397d1944df53718288e5bc5acd4d --- /dev/null +++ b/annotations_1/Jf7jVM7NoVE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.94], [9.0, 9.69], [10.0, 11.1], [15.0, 15.58], [18.0, 18.87], [20.0, 22.77], [27.0, 27.35], [30.0, 30.08], [30.0, 32.41], [33.0, 34.1], [37.0, 40.22], [41.0, 40.86], [45.0, 45.42], [46.0, 46.21], [53.0, 54.36], [55.0, 56.73], [59.0, 59.37], [61.0, 61.67], [63.0, 63.78], [67.0, 68.52], [70.0, 72.3], [75.0, 76.13], [79.0, 81.62], [85.0, 84.92], [88.0, 89.09], [91.0, 92.4], [97.0, 99.08], [99.0, 99.45], [102.0, 102.19], [103.0, 103.49], [107.0, 108.43], [110.0, 110.57], [112.0, 111.64], [112.0, 112.83], [116.0, 116.01], [119.0, 119.03], [130.0, 130.59], [134.0, 134.5], [135.0, 135.58], [137.0, 136.93], [137.0, 138.82], [140.0, 140.39], [143.0, 143.92], [146.0, 146.37], [148.0, 148.63], [150.0, 150.21], [152.0, 159.98], [162.0, 162.46], [164.0, 164.81], [166.0, 166.24], [171.0, 171.12], [173.0, 174.33], [175.0, 175.9], [176.0, 180.62], [182.0, 183.07], [185.0, 188.74], [194.0, 196.05], [197.0, 199.72], [201.0, 204.69], [205.0, 207.4], [209.0, 209.56], [210.0, 210.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 52.33, 0.0, 0.0, 94.66, 0.0, 32.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 59.86, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 90.25, 68.28, 80.82, 57.17, 56.55, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 31.25], ["noise", 7.02], ["animal", 5.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.94, 0.69, 1.1, 0.58, 0.87, 2.77, 0.35, 0.08, 2.41, 1.1, 3.22, -0.14, 0.42, 0.21, 1.36, 1.73, 0.37, 0.67, 0.78, 1.52, 2.3, 1.13, 2.62, -0.08, 1.09, 1.4, 2.08, 0.45, 0.19, 0.49, 1.43, 0.57, -0.36, 0.83, 0.01, 0.03, 0.59, 0.5, 0.58, -0.07, 1.82, 0.39, 0.92, 0.37, 0.63, 0.21, 7.98, 0.46, 0.81, 0.24, 0.12, 1.33, 0.9, 4.62, 1.07, 3.74, 2.05, 2.72, 3.69, 2.4, 0.56, 0.59]} \ No newline at end of file diff --git a/annotations_1/Jf8Sheh4MD4_filtered.json b/annotations_1/Jf8Sheh4MD4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ac6a637fc2fc09f5e03a6191e6b98aa58e765da --- /dev/null +++ b/annotations_1/Jf8Sheh4MD4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 46.7], [49.0, 68.69], [69.0, 71.93], [75.0, 110.79]], "keep_status": [true, false, true, false], "silence_prob": [33.74, 31.31, 30.19, 0.0], "audiomae_on_audioset": [[["music", 44.63], ["electronic music", 8.83], ["musical instrument", 8.1]], [["hum", 35.52], ["music", 22.52], ["throbbing", 16.25]], [["music", 37.24], ["synthesizer", 4.5], ["heart murmur", 4.27]], null], "duration": [29.7, 19.69, 2.93, 35.79]} \ No newline at end of file diff --git a/annotations_1/JfEde8D6XE8_filtered.json b/annotations_1/JfEde8D6XE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72e80cf6584bc42680aad559835553404a12a23a --- /dev/null +++ b/annotations_1/JfEde8D6XE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.44], [7.0, 8.87], [10.0, 10.37], [11.0, 11.3], [14.0, 15.35], [17.0, 17.81], [18.0, 19.55], [20.0, 20.95], [22.0, 22.32], [24.0, 24.02], [28.0, 29.89], [32.0, 33.57], [35.0, 36.29], [40.0, 41.3], [44.0, 44.95], [53.0, 54.75], [57.0, 57.59], [60.0, 61.28], [66.0, 66.07], [72.0, 72.15], [73.0, 74.11], [76.0, 77.21], [81.0, 81.46], [91.0, 91.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 1.87, 0.37, 0.3, 1.35, 0.81, 1.55, 0.95, 0.32, 0.02, 1.89, 1.57, 1.29, 1.3, 0.95, 1.75, 0.59, 1.28, 0.07, 0.15, 1.11, 1.21, 0.46, 0.35]} \ No newline at end of file diff --git a/annotations_1/JfsgeCwAYEM_filtered.json b/annotations_1/JfsgeCwAYEM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d36a66d551f4e5631bdef6573b61281479018917 --- /dev/null +++ b/annotations_1/JfsgeCwAYEM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 16.61], [26.0, 51.36], [54.0, 58.83], [60.0, 60.02], [60.0, 60.15], [75.0, 78.31], [79.0, 82.46], [86.0, 87.18], [90.0, 90.91], [94.0, 94.34], [97.0, 97.09], [100.0, 101.46], [103.0, 102.79], [105.0, 105.56], [107.0, 107.25], [108.0, 108.28], [111.0, 111.77], [113.0, 113.02], [116.0, 116.94], [118.0, 125.61]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.09, 30.11, 34.94, 0.0, 0.0, 36.9, 38.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.29], "audiomae_on_audioset": [[["music", 43.92], ["clarinet", 10.11], ["brass instrument", 9.82]], [["music", 58.33], ["didgeridoo", 7.51], ["musical instrument", 6.79]], [["music", 89.09], ["musical instrument", 1.97], ["synthesizer", 1.06]], null, null, [["music", 56.33], ["radio", 23.71], ["speech", 13.01]], [["music", 41.64], ["quack", 5.37], ["bleat", 4.25]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 73.44], ["didgeridoo", 6.8], ["synthesizer", 3.99]]], "duration": [10.61, 25.36, 4.83, 0.02, 0.15, 3.31, 3.46, 1.18, 0.91, 0.34, 0.09, 1.46, -0.21, 0.56, 0.25, 0.28, 0.77, 0.02, 0.94, 7.61]} \ No newline at end of file diff --git a/annotations_1/JgTgQvvqRqE_filtered.json b/annotations_1/JgTgQvvqRqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49cb0540d7d026a18fb0bf12881f3a33fed4834c --- /dev/null +++ b/annotations_1/JgTgQvvqRqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 31.23], [32.0, 34.42], [36.0, 40.73], [42.0, 141.72], [144.0, 153.2], [156.0, 168.47], [170.0, 184.64], [187.0, 216.16], [220.0, 223.06], [224.0, 262.38], [263.0, 299.29], [300.0, 299.94]], "keep_status": [true, true, true, false, true, true, false, true, true, false, false, false], "silence_prob": [28.65, 28.68, 28.61, 0.0, 31.02, 30.49, 34.29, 29.1, 27.99, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 24.4], ["mains hum", 23.06], ["speech", 17.68]], [["buzz", 39.81], ["mains hum", 13.2], ["hum", 8.88]], [["hum", 34.83], ["mains hum", 19.06], ["music", 10.93]], null, [["hum", 19.92], ["speech", 17.87], ["music", 14.03]], [["speech", 51.65], ["mains hum", 9.77], ["hum", 8.25]], [["speech", 36.33], ["mains hum", 24.52], ["hum", 15.66]], [["hum", 33.35], ["mains hum", 22.83], ["speech", 11.66]], [["music", 14.18], ["sound effect", 9.02], ["hum", 7.42]], null, null, null], "duration": [15.23, 2.42, 4.73, 99.72, 9.2, 12.47, 14.64, 29.16, 3.06, 38.38, 36.29, -0.06]} \ No newline at end of file diff --git a/annotations_1/Jgye_cEhfGQ_filtered.json b/annotations_1/Jgye_cEhfGQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/Jgye_cEhfGQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/JhMWopjJiI8_filtered.json b/annotations_1/JhMWopjJiI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..acf51c2fad6d341e74f9eb5724b4a25c20f9f028 --- /dev/null +++ b/annotations_1/JhMWopjJiI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 37.56], [39.0, 70.19], [72.0, 90.44], [92.0, 129.96], [130.0, 155.85]], "keep_status": [false, false, true, false, true], "silence_prob": [0.0, 0.0, 28.84, 0.0, 42.91], "audiomae_on_audioset": [null, null, [["speech", 40.73], ["music", 10.85], ["whack, thwack", 10.04]], null, [["hum", 26.32], ["insect", 12.3], ["fly, housefly", 9.36]]], "duration": [30.56, 31.19, 18.44, 37.96, 25.85]} \ No newline at end of file diff --git a/annotations_1/Jhzm2AvUGHA_filtered.json b/annotations_1/Jhzm2AvUGHA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85bf40d62c826a904cb7b04f4590cda78d46d151 --- /dev/null +++ b/annotations_1/Jhzm2AvUGHA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.67], [5.0, 6.34], [7.0, 7.86], [9.0, 9.39], [10.0, 14.1], [17.0, 19.77], [20.0, 26.87], [28.0, 28.49], [29.0, 29.73], [31.0, 32.32], [36.0, 39.19], [41.0, 46.47], [47.0, 51.17], [51.0, 51.39], [52.0, 52.76], [54.0, 54.65], [55.0, 56.89], [57.0, 59.1], [59.0, 59.64], [61.0, 67.68], [69.0, 72.52], [74.0, 76.65], [77.0, 78.22], [81.0, 82.36], [84.0, 85.36], [86.0, 98.19], [98.0, 100.95], [102.0, 102.73], [105.0, 105.48], [107.0, 106.61], [107.0, 108.14], [109.0, 117.88], [119.0, 119.31], [135.0, 136.05], [148.0, 149.69], [155.0, 155.53], [158.0, 158.92], [160.0, 160.74], [165.0, 165.94], [169.0, 169.25], [171.0, 171.63], [174.0, 174.24], [175.0, 175.27], [178.0, 178.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.83, 80.46, 42.42, 0.0, 0.0, 0.0, 72.01, 88.64, 73.51, 0.0, 0.0, 0.0, 0.0, 51.88, 0.0, 65.67, 79.59, 90.95, 0.0, 0.0, 0.0, 51.5, 87.37, 0.0, 0.0, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 44.87], ["speech", 38.71], ["boing", 3.11]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.33, 1.34, 0.86, 0.39, 4.1, 2.77, 6.87, 0.49, 0.73, 1.32, 3.19, 5.47, 4.17, 0.39, 0.76, 0.65, 1.89, 2.1, 0.64, 6.68, 3.52, 2.65, 1.22, 1.36, 1.36, 12.19, 2.95, 0.73, 0.48, -0.39, 1.14, 8.88, 0.31, 1.05, 1.69, 0.53, 0.92, 0.74, 0.94, 0.25, 0.63, 0.24, 0.27, 0.66]} \ No newline at end of file diff --git a/annotations_1/JivWELi2rFw_filtered.json b/annotations_1/JivWELi2rFw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9276de6c1f4432e4b5500a8be15d151676ff7c1 --- /dev/null +++ b/annotations_1/JivWELi2rFw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.96], [12.0, 14.17], [18.0, 22.25], [27.0, 29.86], [31.0, 58.36], [60.0, 71.81], [73.0, 87.25]], "keep_status": [false, false, false, false, true, true, false], "silence_prob": [64.41, 53.4, 51.94, 44.72, 36.06, 39.91, 46.09], "audiomae_on_audioset": [null, null, null, [["music", 52.18], ["hum", 12.64], ["throbbing", 11.86]], [["music", 22.89], ["grunt", 10.19], ["fly, housefly", 7.3]], [["animal", 12.93], ["hum", 8.93], ["livestock, farm animals, working animals", 6.75]], [["music", 35.91], ["hum", 20.72], ["mains hum", 15.32]]], "duration": [6.96, 2.17, 4.25, 2.86, 27.36, 11.81, 14.25]} \ No newline at end of file diff --git a/annotations_1/Jj-mAiTMvX8_filtered.json b/annotations_1/Jj-mAiTMvX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd11ede110ca389b92d931131ac2423610caefc7 --- /dev/null +++ b/annotations_1/Jj-mAiTMvX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.62], [20.0, 21.09], [24.0, 24.9], [28.0, 28.41], [29.0, 31.45], [33.0, 33.62], [59.0, 59.37], [85.0, 91.44]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.05, 0.0, 0.0, 37.64], "audiomae_on_audioset": [null, null, null, null, [["music", 74.43], ["musical instrument", 3.87], ["guitar", 3.27]], null, null, [["music", 47.29], ["boing", 11.18], ["wail, moan", 7.36]]], "duration": [0.62, 1.09, 0.9, 0.41, 2.45, 0.62, 0.37, 6.44]} \ No newline at end of file diff --git a/annotations_1/Jj6H6tJvRjU_filtered.json b/annotations_1/Jj6H6tJvRjU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4dbb8c2ac2f55d0fe0b0987cfb90525b63a9ccd0 --- /dev/null +++ b/annotations_1/Jj6H6tJvRjU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.29], [32.0, 32.34], [32.0, 35.36], [36.0, 35.95], [40.0, 64.12], [65.0, 87.89], [88.0, 103.06], [106.0, 110.4]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.0, 0.0, 34.89, 30.78, 29.99, 29.73], "audiomae_on_audioset": [null, null, [["speech", 62.44], ["music", 11.77], ["boing", 2.09]], null, [["didgeridoo", 56.31], ["music", 26.87], ["speech", 3.39]], [["music", 78.69], ["didgeridoo", 8.13], ["musical instrument", 4.25]], [["speech", 62.98], ["music", 22.46], ["synthesizer", 1.92]], [["music", 73.92], ["speech", 5.25], ["didgeridoo", 2.85]]], "duration": [0.29, 0.34, 3.36, -0.05, 24.12, 22.89, 15.06, 4.4]} \ No newline at end of file diff --git a/annotations_1/JjbIo_301ZA_filtered.json b/annotations_1/JjbIo_301ZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3556e2aa81ddc82607c9d40fad6efb2b71bdb5a --- /dev/null +++ b/annotations_1/JjbIo_301ZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 77.52], [80.0, 80.2], [83.0, 102.52], [112.0, 113.71], [115.0, 115.99], [119.0, 144.8]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.73, 0.0, 0.0, 29.51], "audiomae_on_audioset": [null, null, [["music", 54.43], ["hum", 12.38], ["throbbing", 10.55]], null, null, [["music", 40.96], ["smash, crash", 33.02], ["explosion", 3.2]]], "duration": [69.52, 0.2, 19.52, 1.71, 0.99, 25.8]} \ No newline at end of file diff --git a/annotations_1/JjfbxBMmXTI_filtered.json b/annotations_1/JjfbxBMmXTI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/JjfbxBMmXTI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/JkQzE831VM8_filtered.json b/annotations_1/JkQzE831VM8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b45452ea46241afda48226582a1d6c14318128b2 --- /dev/null +++ b/annotations_1/JkQzE831VM8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.2], [13.0, 19.82], [20.0, 21.61], [22.0, 56.3], [57.0, 94.71], [96.0, 96.85], [98.0, 100.11], [103.0, 104.23], [106.0, 107.82], [117.0, 119.13], [122.0, 139.26], [141.0, 156.47], [157.0, 162.51], [164.0, 164.91], [167.0, 167.73], [181.0, 182.19], [186.0, 187.52], [190.0, 194.04]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.97, 0.0, 0.0, 0.0, 0.0, 74.13, 0.0, 0.0, 86.45, 52.05, 58.72, 79.41, 0.0, 0.0, 0.0, 0.0, 61.47], "audiomae_on_audioset": [null, [["explosion", 13.4], ["sidetone", 10.55], ["fart", 8.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.2, 6.82, 1.61, 34.3, 37.71, 0.85, 2.11, 1.23, 1.82, 2.13, 17.26, 15.47, 5.51, 0.91, 0.73, 1.19, 1.52, 4.04]} \ No newline at end of file diff --git a/annotations_1/JkrovwTh2rw_filtered.json b/annotations_1/JkrovwTh2rw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8560a0366831183e0a6a5e1376da7e16177fa849 --- /dev/null +++ b/annotations_1/JkrovwTh2rw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 36.19], [38.0, 70.26], [71.0, 71.47]], "keep_status": [true, false, false], "silence_prob": [30.25, 0.0, 0.0], "audiomae_on_audioset": [[["music", 39.13], ["boing", 14.36], ["speech", 12.53]], null, null], "duration": [28.19, 32.26, 0.47]} \ No newline at end of file diff --git a/annotations_1/JmSmZRCl6A4_filtered.json b/annotations_1/JmSmZRCl6A4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58350d6c077dabdeeffb27dd375abfb916ac7a18 --- /dev/null +++ b/annotations_1/JmSmZRCl6A4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.93], [20.0, 21.02], [22.0, 35.73], [38.0, 61.79], [62.0, 63.88], [65.0, 68.93], [69.0, 71.14], [73.0, 77.45], [78.0, 79.2], [80.0, 88.28], [89.0, 90.26], [92.0, 93.18], [94.0, 95.66], [97.0, 96.74], [104.0, 104.87], [121.0, 121.41], [122.0, 123.52], [125.0, 125.63]], "keep_status": [false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.07, 0.0, 72.46, 36.78, 0.0, 33.79, 36.15, 36.98, 0.0, 31.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 67.92], ["musical instrument", 2.58], ["theremin", 1.98]], null, [["music", 36.8], ["musical instrument", 9.17], ["theremin", 6.11]], [["music", 25.4], ["speech", 5.88], ["brass instrument", 5.53]], [["music", 57.4], ["theremin", 5.0], ["synthesizer", 4.89]], null, [["music", 55.61], ["speech", 21.17], ["synthesizer", 5.33]], null, null, null, null, null, null, null, null], "duration": [6.93, 1.02, 13.73, 23.79, 1.88, 3.93, 2.14, 4.45, 1.2, 8.28, 1.26, 1.18, 1.66, -0.26, 0.87, 0.41, 1.52, 0.63]} \ No newline at end of file diff --git a/annotations_1/Jmf4o8UalVM_filtered.json b/annotations_1/Jmf4o8UalVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f1e6e8d9f92d643afca53742bd6ab03963e04df --- /dev/null +++ b/annotations_1/Jmf4o8UalVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.42], [41.0, 43.11], [45.0, 45.33], [51.0, 61.06], [64.0, 64.15], [65.0, 71.41], [73.0, 73.13], [74.0, 75.32], [77.0, 77.53], [78.0, 81.23], [83.0, 88.77], [93.0, 93.39], [118.0, 121.98], [123.0, 123.48], [125.0, 133.69], [137.0, 138.08], [141.0, 170.43], [175.0, 179.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 87.19, 0.0, 97.54, 0.0, 53.04, 0.0, 0.0, 0.0, 81.71, 80.11, 0.0, 47.7, 0.0, 35.62, 0.0, 36.36, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.27], ["thunk", 7.49], ["glass", 5.42]], null, [["music", 37.13], ["didgeridoo", 15.68], ["speech", 10.72]], null, [["music", 54.23], ["theremin", 8.86], ["synthesizer", 7.57]], null], "duration": [0.42, 2.11, 0.33, 10.06, 0.15, 6.41, 0.13, 1.32, 0.53, 3.23, 5.77, 0.39, 3.98, 0.48, 8.69, 1.08, 29.43, 4.78]} \ No newline at end of file diff --git a/annotations_1/Jmls6360U9Q_filtered.json b/annotations_1/Jmls6360U9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f191c2a52ae018fe24afc0c15e0d501c6bae662 --- /dev/null +++ b/annotations_1/Jmls6360U9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.72], [20.0, 21.05], [25.0, 26.47], [27.0, 29.15], [30.0, 31.24], [33.0, 34.5], [37.0, 37.49], [43.0, 44.49], [45.0, 45.12]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [47.82, 0.0, 0.0, 60.98, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 56.96], ["eruption", 10.18], ["explosion", 2.91]], null, null, null, null, null, null, null, null], "duration": [2.72, 1.05, 1.47, 2.15, 1.24, 1.5, 0.49, 1.49, 0.12]} \ No newline at end of file diff --git a/annotations_1/JnjO0v-AYFo_filtered.json b/annotations_1/JnjO0v-AYFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ba48593b2c72e4d61dd53ec587eac8864197d8f --- /dev/null +++ b/annotations_1/JnjO0v-AYFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.12], [26.0, 27.14], [30.0, 51.53], [53.0, 63.76], [65.0, 66.16], [68.0, 73.04], [94.0, 95.08], [102.0, 102.22], [103.0, 103.05]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.55, 31.94, 0.0, 49.31, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 61.19], ["hum", 7.53], ["throbbing", 5.5]], [["hum", 38.04], ["throbbing", 21.78], ["mains hum", 16.94]], null, [["music", 43.96], ["throbbing", 25.24], ["hum", 5.41]], null, null, null], "duration": [0.12, 1.14, 21.53, 10.76, 1.16, 5.04, 1.08, 0.22, 0.05]} \ No newline at end of file diff --git a/annotations_1/JnuYlFhXWsU_filtered.json b/annotations_1/JnuYlFhXWsU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0447e473cdb550ecab4a87bcc76f8291c5bc5e8a --- /dev/null +++ b/annotations_1/JnuYlFhXWsU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.42], [10.0, 16.61], [17.0, 18.84], [21.0, 21.93], [24.0, 37.66], [38.0, 42.84], [44.0, 58.5], [65.0, 66.09], [67.0, 68.47], [69.0, 81.21], [81.0, 84.18], [87.0, 100.8], [104.0, 113.22], [117.0, 129.36], [132.0, 136.39], [137.0, 142.26], [147.0, 149.71], [151.0, 151.71]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, true, false, true, true, true, false, false], "silence_prob": [41.64, 35.35, 0.0, 0.0, 34.58, 35.45, 31.86, 0.0, 0.0, 34.88, 29.84, 30.05, 30.86, 30.2, 29.71, 30.43, 30.69, 0.0], "audiomae_on_audioset": [[["music", 65.0], ["synthesizer", 8.87], ["musical instrument", 4.51]], [["music", 70.34], ["thunk", 9.31], ["theremin", 3.05]], null, null, [["music", 62.26], ["musical instrument", 5.28], ["synthesizer", 5.02]], [["music", 15.98], ["speech", 15.64], ["synthesizer", 8.5]], [["music", 64.62], ["speech", 10.09], ["boing", 4.11]], null, null, [["speech", 55.09], ["music", 19.19], ["grunt", 8.25]], [["throbbing", 17.16], ["music", 11.53], ["boing", 10.93]], [["music", 40.7], ["boing", 19.56], ["whack, thwack", 5.11]], [["music", 65.81], ["quack", 4.96], ["animal", 4.26]], [["cattle, bovinae", 21.83], ["music", 21.78], ["moo", 17.52]], [["music", 23.04], ["trombone", 20.72], ["speech", 13.47]], [["music", 52.84], ["synthesizer", 6.22], ["brass instrument", 4.05]], [["music", 65.22], ["didgeridoo", 7.87], ["musical instrument", 7.17]], null], "duration": [4.42, 6.61, 1.84, 0.93, 13.66, 4.84, 14.5, 1.09, 1.47, 12.21, 3.18, 13.8, 9.22, 12.36, 4.39, 5.26, 2.71, 0.71]} \ No newline at end of file diff --git a/annotations_1/Jo1OjI4Yfv8_filtered.json b/annotations_1/Jo1OjI4Yfv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06ad30617e705fc1866efa2f10b0d2da51aa93a0 --- /dev/null +++ b/annotations_1/Jo1OjI4Yfv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.06], [8.0, 8.18], [16.0, 16.9], [18.0, 19.01], [21.0, 22.69], [24.0, 24.51], [35.0, 36.64], [39.0, 42.18], [55.0, 57.11], [59.0, 61.13], [62.0, 64.42], [66.0, 66.53], [68.0, 68.28], [71.0, 71.59], [72.0, 81.38], [85.0, 87.89], [89.0, 92.8], [96.0, 104.63], [110.0, 109.97], [111.0, 111.5], [112.0, 116.16], [118.0, 122.71], [125.0, 126.94], [128.0, 128.61], [131.0, 132.41], [135.0, 136.22], [137.0, 137.47], [141.0, 141.2], [144.0, 145.08], [147.0, 149.0], [150.0, 153.03], [155.0, 155.46], [160.0, 173.4], [175.0, 177.94], [179.0, 179.54]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.2, 89.54, 81.0, 72.31, 0.0, 0.0, 0.0, 28.84, 32.43, 44.75, 31.61, 0.0, 0.0, 40.06, 30.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.16, 51.71, 0.0, 30.05, 95.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 24.26], ["gurgling", 6.12], ["explosion", 5.88]], null, null, null, null, null, null, [["noise", 21.35], ["mains hum", 15.52], ["music", 13.38]], [["hum", 36.46], ["music", 24.49], ["throbbing", 23.59]], [["hum", 47.86], ["throbbing", 25.33], ["music", 10.74]], [["music", 31.56], ["thump, thud", 16.86], ["thunk", 14.12]], null, null, [["music", 30.39], ["electronic music", 19.75], ["speech", 17.94]], [["music", 27.46], ["mains hum", 10.9], ["hum", 8.64]], null, null, null, null, null, null, null, null, null, null, [["music", 61.1], ["mains hum", 11.87], ["hum", 9.29]], null, null], "duration": [0.06, 0.18, 0.9, 1.01, 1.69, 0.51, 1.64, 3.18, 2.11, 2.13, 2.42, 0.53, 0.28, 0.59, 9.38, 2.89, 3.8, 8.63, -0.03, 0.5, 4.16, 4.71, 1.94, 0.61, 1.41, 1.22, 0.47, 0.2, 1.08, 2.0, 3.03, 0.46, 13.4, 2.94, 0.54]} \ No newline at end of file diff --git a/annotations_1/Joh9cLv0bp4_filtered.json b/annotations_1/Joh9cLv0bp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b46a38c4bf5b46f6773ea4dd1c907ba8374799b --- /dev/null +++ b/annotations_1/Joh9cLv0bp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.32], [16.0, 20.38], [22.0, 38.28], [40.0, 50.68], [52.0, 52.84], [54.0, 56.19], [58.0, 59.24], [61.0, 65.06], [67.0, 72.18], [75.0, 77.75], [79.0, 100.58], [101.0, 112.9], [114.0, 116.01], [118.0, 123.9], [125.0, 125.69], [127.0, 133.03], [134.0, 137.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.36, 74.92, 72.16, 0.0, 98.19, 0.0, 61.37, 58.05, 78.89, 79.94, 55.04, 80.64, 88.1, 0.0, 97.11, 97.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 4.38, 16.28, 10.68, 0.84, 2.19, 1.24, 4.06, 5.18, 2.75, 21.58, 11.9, 2.01, 5.9, 0.69, 6.03, 3.46]} \ No newline at end of file diff --git a/annotations_1/Jou60MhXBcw_filtered.json b/annotations_1/Jou60MhXBcw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..608a5d162c2cb7935297b59dd9fa2d6f539bc968 --- /dev/null +++ b/annotations_1/Jou60MhXBcw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.39], [6.0, 6.86], [7.0, 7.94], [9.0, 8.82], [10.0, 10.99], [12.0, 12.33], [15.0, 15.67], [17.0, 17.64], [18.0, 18.39], [22.0, 22.32], [23.0, 23.84], [25.0, 24.71], [27.0, 27.55], [33.0, 34.33], [35.0, 36.21], [38.0, 39.23], [43.0, 43.85], [45.0, 45.45], [47.0, 46.6], [47.0, 46.72], [50.0, 50.94], [52.0, 52.05], [53.0, 53.06], [59.0, 60.22], [61.0, 62.61], [64.0, 64.23], [69.0, 71.42], [73.0, 73.87], [78.0, 78.54], [79.0, 80.27], [81.0, 81.72], [83.0, 83.62], [86.0, 93.5], [95.0, 95.23], [99.0, 99.03], [100.0, 101.16], [102.0, 105.44], [113.0, 114.08], [119.0, 119.37], [121.0, 121.93], [122.0, 122.67], [127.0, 126.82], [129.0, 129.73], [132.0, 131.94], [133.0, 133.2], [137.0, 138.82], [144.0, 145.67], [146.0, 147.26], [147.0, 169.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.33, 0.0, 0.0, 0.0, 0.0, 0.0, 72.75, 0.0, 0.0, 0.0, 30.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 44.7], ["moo", 31.91], ["livestock, farm animals, working animals", 15.28]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.33], ["hum", 10.07], ["animal", 5.47]]], "duration": [0.39, 0.86, 0.94, -0.18, 0.99, 0.33, 0.67, 0.64, 0.39, 0.32, 0.84, -0.29, 0.55, 1.33, 1.21, 1.23, 0.85, 0.45, -0.4, -0.28, 0.94, 0.05, 0.06, 1.22, 1.61, 0.23, 2.42, 0.87, 0.54, 1.27, 0.72, 0.62, 7.5, 0.23, 0.03, 1.16, 3.44, 1.08, 0.37, 0.93, 0.67, -0.18, 0.73, -0.06, 0.2, 1.82, 1.67, 1.26, 22.62]} \ No newline at end of file diff --git a/annotations_1/JqYtHZw-M8c_filtered.json b/annotations_1/JqYtHZw-M8c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9984f042079b45e5b7e95010a73593dbb88a24a5 --- /dev/null +++ b/annotations_1/JqYtHZw-M8c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.91], [9.0, 9.81], [16.0, 15.74], [20.0, 22.57], [23.0, 27.14], [39.0, 40.24], [42.0, 42.38], [47.0, 47.58], [50.0, 54.87], [56.0, 57.6], [60.0, 64.96], [66.0, 66.65], [68.0, 68.23], [69.0, 71.71], [76.0, 86.63], [93.0, 93.68]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.4, 35.3, 0.0, 0.0, 0.0, 55.74, 0.0, 49.22, 0.0, 0.0, 39.41, 30.1, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 47.96], ["animal", 7.49], ["fart", 5.04]], null, null, null, null, null, [["speech", 45.12], ["sidetone", 24.95], ["dial tone", 3.71]], null, null, [["music", 66.09], ["synthesizer", 8.02], ["speech", 7.13]], [["music", 65.8], ["animal", 4.31], ["synthesizer", 2.98]], null], "duration": [0.91, 0.81, -0.26, 2.57, 4.14, 1.24, 0.38, 0.58, 4.87, 1.6, 4.96, 0.65, 0.23, 2.71, 10.63, 0.68]} \ No newline at end of file diff --git a/annotations_1/Jrn-OprEMLI_filtered.json b/annotations_1/Jrn-OprEMLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb8b664b6acc9ba494b935ad990c92f00431299b --- /dev/null +++ b/annotations_1/Jrn-OprEMLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.96], [9.0, 9.96], [14.0, 15.31], [20.0, 21.36], [27.0, 29.02], [34.0, 34.91], [36.0, 38.33], [39.0, 41.61], [44.0, 45.22], [46.0, 46.95], [51.0, 52.74], [56.0, 57.38], [61.0, 61.33], [65.0, 65.04], [66.0, 66.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 95.37, 0.0, 87.92, 60.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 0.96, 1.31, 1.36, 2.02, 0.91, 2.33, 2.61, 1.22, 0.95, 1.74, 1.38, 0.33, 0.04, 0.34]} \ No newline at end of file diff --git a/annotations_1/JsdUzN20Sow_filtered.json b/annotations_1/JsdUzN20Sow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f184aaea59e8d78bd2aa4059d6d01224aaf26f62 --- /dev/null +++ b/annotations_1/JsdUzN20Sow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.69], [14.0, 15.77], [21.0, 26.11], [29.0, 30.54], [36.0, 37.83], [52.0, 55.44], [61.0, 63.0], [68.0, 71.66], [76.0, 77.41], [98.0, 103.44], [108.0, 109.75], [115.0, 115.96], [121.0, 124.11], [126.0, 125.73], [129.0, 130.67], [146.0, 165.28], [169.0, 174.38], [178.0, 192.47]], "keep_status": [false, false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 30.39, 0.0, 0.0, 30.87, 30.92, 30.05, 0.0, 30.44, 0.0, 0.0, 30.39, 0.0, 0.0, 30.01, 29.71, 29.62], "audiomae_on_audioset": [null, null, [["music", 66.39], ["swing music", 3.54], ["psychedelic rock", 1.94]], null, null, [["music", 60.91], ["didgeridoo", 4.24], ["musical instrument", 3.3]], [["music", 70.76], ["musical instrument", 1.63], ["sampler", 1.21]], [["music", 56.48], ["didgeridoo", 5.3], ["musical instrument", 5.27]], null, [["music", 52.13], ["didgeridoo", 4.35], ["psychedelic rock", 2.76]], null, null, [["music", 66.21], ["throbbing", 4.59], ["sidetone", 3.3]], null, null, [["music", 88.16], ["electronic music", 1.44], ["musical instrument", 1.22]], [["music", 47.45], ["rock and roll", 3.43], ["musical instrument", 3.0]], [["music", 61.42], ["motorcycle", 3.23], ["electronic music", 2.61]]], "duration": [0.69, 1.77, 5.11, 1.54, 1.83, 3.44, 2.0, 3.66, 1.41, 5.44, 1.75, 0.96, 3.11, -0.27, 1.67, 19.28, 5.38, 14.47]} \ No newline at end of file diff --git a/annotations_1/JuxyMqr7FNA_filtered.json b/annotations_1/JuxyMqr7FNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54cbec57533858330974130933436ed15fac8918 --- /dev/null +++ b/annotations_1/JuxyMqr7FNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.67], [9.0, 9.86], [10.0, 31.92], [33.0, 46.09], [51.0, 68.94], [69.0, 70.44]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 51.6, 56.93, 42.88, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 57.15], ["fart", 14.55], ["crushing", 9.78]], null], "duration": [1.67, 0.86, 21.92, 13.09, 17.94, 1.44]} \ No newline at end of file diff --git a/annotations_1/Jv7PzcVfULc_filtered.json b/annotations_1/Jv7PzcVfULc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..587e4593d0e1fd03c3351a4a0490d6ffcdff67cf --- /dev/null +++ b/annotations_1/Jv7PzcVfULc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.64], [10.0, 11.1], [12.0, 12.75], [14.0, 15.69], [17.0, 17.78], [22.0, 23.79], [26.0, 29.02], [29.0, 30.94], [31.0, 33.29], [34.0, 35.78], [37.0, 38.13], [39.0, 40.37], [44.0, 44.34], [51.0, 54.14], [55.0, 67.88], [69.0, 70.53], [71.0, 72.01], [73.0, 73.33], [74.0, 75.68], [83.0, 84.79], [86.0, 89.9], [91.0, 92.28], [96.0, 96.48], [97.0, 99.03], [100.0, 100.99], [102.0, 103.91], [105.0, 106.19], [108.0, 109.27], [111.0, 114.0], [114.0, 115.57], [116.0, 116.43], [118.0, 118.5], [120.0, 125.74], [126.0, 127.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 78.38, 0.0, 0.0, 0.0, 0.0, 68.41, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 68.93, 0.0, 0.0, 80.82, 0.0, 0.0, 0.0, 0.0, 88.28, 0.0, 0.0, 0.0, 51.39, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.64, 1.1, 0.75, 1.69, 0.78, 1.79, 3.02, 1.94, 2.29, 1.78, 1.13, 1.37, 0.34, 3.14, 12.88, 1.53, 1.01, 0.33, 1.68, 1.79, 3.9, 1.28, 0.48, 2.03, 0.99, 1.91, 1.19, 1.27, 3.0, 1.57, 0.43, 0.5, 5.74, 1.16]} \ No newline at end of file diff --git a/annotations_1/JvG1hHsOFUA_filtered.json b/annotations_1/JvG1hHsOFUA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01650364cc3c92eefea413e1fb339e486f197da1 --- /dev/null +++ b/annotations_1/JvG1hHsOFUA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.56], [16.0, 16.14], [24.0, 24.98], [28.0, 28.29], [29.0, 32.07], [34.0, 35.33], [36.0, 36.0], [37.0, 37.99], [40.0, 40.69], [50.0, 49.81], [51.0, 51.31], [52.0, 53.33], [56.0, 57.21], [58.0, 58.6], [61.0, 62.48], [69.0, 68.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 0.14, 0.98, 0.29, 3.07, 1.33, 0.0, 0.99, 0.69, -0.19, 0.31, 1.33, 1.21, 0.6, 1.48, -0.11]} \ No newline at end of file diff --git a/annotations_1/JvTQZxz-KBk_filtered.json b/annotations_1/JvTQZxz-KBk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76fc14ead146994bf86e7bae303dd154fc132272 --- /dev/null +++ b/annotations_1/JvTQZxz-KBk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 18.06], [21.0, 24.31], [26.0, 28.04], [28.0, 28.19], [28.0, 28.22], [36.0, 44.17], [51.0, 56.32], [61.0, 61.52], [64.0, 65.87], [71.0, 71.78], [76.0, 76.42], [77.0, 78.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.61, 31.15, 29.77, 0.0, 0.0, 29.06, 29.3, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 64.2], ["speech", 20.66], ["electronic music", 2.34]], [["music", 39.31], ["speech", 25.19], ["throbbing", 6.37]], [["music", 52.9], ["speech", 23.44], ["hum", 4.06]], null, null, [["music", 48.17], ["speech", 15.15], ["throbbing", 13.99]], [["hum", 46.44], ["throbbing", 26.22], ["music", 14.77]], null, null, null, null, null], "duration": [6.06, 3.31, 2.04, 0.19, 0.22, 8.17, 5.32, 0.52, 1.87, 0.78, 0.42, 1.06]} \ No newline at end of file diff --git a/annotations_1/JvclIUy-JlA_filtered.json b/annotations_1/JvclIUy-JlA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64433edfbcc18ffeee42edf6b099d94cc698675a --- /dev/null +++ b/annotations_1/JvclIUy-JlA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.03], [11.0, 14.35], [15.0, 16.78], [18.0, 35.41], [38.0, 38.48], [43.0, 43.9], [48.0, 48.41], [49.0, 50.26], [52.0, 53.23], [56.0, 56.79], [60.0, 61.37], [65.0, 65.21], [65.0, 65.3], [79.0, 79.86], [93.0, 92.87], [93.0, 93.46], [96.0, 97.28], [100.0, 101.17], [102.0, 108.24], [114.0, 114.93], [117.0, 117.07], [120.0, 120.8], [122.0, 122.66]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.56, 0.0, 30.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.95, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 46.74], ["throbbing", 30.26], ["hum", 6.06]], null, [["music", 47.52], ["hum", 9.13], ["throbbing", 6.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.73], ["speech", 21.43], ["boing", 3.22]], null, null, null, null], "duration": [1.03, 3.35, 1.78, 17.41, 0.48, 0.9, 0.41, 1.26, 1.23, 0.79, 1.37, 0.21, 0.3, 0.86, -0.13, 0.46, 1.28, 1.17, 6.24, 0.93, 0.07, 0.8, 0.66]} \ No newline at end of file diff --git a/annotations_1/JwAVnG8iemw_filtered.json b/annotations_1/JwAVnG8iemw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..946092e44b9092b816e04621fc0011836936a3c6 --- /dev/null +++ b/annotations_1/JwAVnG8iemw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 31.43], [35.0, 36.73], [37.0, 37.64], [38.0, 39.39], [42.0, 45.33], [46.0, 47.63], [49.0, 62.51], [68.0, 72.44], [81.0, 82.48], [87.0, 91.5], [92.0, 95.99], [101.0, 101.92], [103.0, 103.91], [104.0, 108.99], [111.0, 110.67], [111.0, 115.08], [116.0, 124.82], [129.0, 137.27], [141.0, 186.51], [190.0, 193.65]], "keep_status": [false, false, false, false, false, false, true, false, false, true, true, false, false, true, false, true, false, true, false, true], "silence_prob": [46.02, 0.0, 0.0, 0.0, 48.39, 0.0, 40.33, 31.37, 0.0, 30.07, 31.03, 0.0, 0.0, 32.38, 0.0, 31.16, 31.03, 39.11, 0.0, 40.61], "audiomae_on_audioset": [[["music", 60.92], ["theremin", 5.52], ["synthesizer", 3.97]], null, null, null, [["music", 59.77], ["theremin", 10.38], ["scary music", 2.39]], null, [["music", 59.94], ["stomach rumble", 4.13], ["throbbing", 3.4]], [["music", 66.47], ["musical instrument", 6.11], ["cacophony", 4.23]], null, [["music", 24.23], ["grunt", 18.68], ["roar", 5.38]], [["music", 46.09], ["fart", 8.35], ["cattle, bovinae", 4.93]], null, null, [["mains hum", 23.97], ["music", 13.14], ["hum", 13.13]], null, [["music", 29.06], ["whack, thwack", 24.89], ["speech", 12.12]], [["speech", 45.72], ["music", 31.18], ["whack, thwack", 4.51]], [["speech", 44.93], ["music", 15.01], ["hum", 4.57]], null, [["music", 46.28], ["speech", 16.29], ["theremin", 4.96]]], "duration": [15.43, 1.73, 0.64, 1.39, 3.33, 1.63, 13.51, 4.44, 1.48, 4.5, 3.99, 0.92, 0.91, 4.99, -0.33, 4.08, 8.82, 8.27, 45.51, 3.65]} \ No newline at end of file diff --git a/annotations_1/JwlhFfOC5Zo_filtered.json b/annotations_1/JwlhFfOC5Zo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3cbb612b791299ee8e1d1e86e979c84ec68cbe1 --- /dev/null +++ b/annotations_1/JwlhFfOC5Zo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.47], [15.0, 15.31], [18.0, 20.02], [20.0, 21.57], [24.0, 25.86], [28.0, 28.86], [29.0, 29.73], [34.0, 34.33], [35.0, 35.48], [42.0, 42.55], [43.0, 45.2], [46.0, 46.92], [47.0, 47.71], [48.0, 53.11], [66.0, 66.26], [67.0, 68.88], [69.0, 68.94], [70.0, 71.86], [73.0, 73.89], [75.0, 76.32], [78.0, 79.59], [81.0, 82.16], [85.0, 85.11], [89.0, 92.55], [94.0, 94.2], [96.0, 96.89], [99.0, 99.44], [100.0, 99.57], [100.0, 104.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.41, 0.0, 0.0, 33.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 53.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.12], ["music", 15.38], ["boing", 7.6]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.47, 0.31, 2.02, 1.57, 1.86, 0.86, 0.73, 0.33, 0.48, 0.55, 2.2, 0.92, 0.71, 5.11, 0.26, 1.88, -0.06, 1.86, 0.89, 1.32, 1.59, 1.16, 0.11, 3.55, 0.2, 0.89, 0.44, -0.43, 4.09]} \ No newline at end of file diff --git a/annotations_1/Jx-I8OfW0GI_filtered.json b/annotations_1/Jx-I8OfW0GI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17d513ffd047937ba4d87a83a8664e93b8e9ed2b --- /dev/null +++ b/annotations_1/Jx-I8OfW0GI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.59], [9.0, 9.26], [18.0, 18.94], [34.0, 34.57], [36.0, 36.09], [44.0, 44.0], [45.0, 46.18], [62.0, 62.53], [64.0, 65.47], [76.0, 76.37], [85.0, 86.0], [89.0, 90.04], [95.0, 95.76], [96.0, 99.82], [102.0, 102.54], [104.0, 104.41], [106.0, 106.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 20.55], ["moo", 15.11], ["sidetone", 11.45]], null, null, null], "duration": [0.59, 0.26, 0.94, 0.57, 0.09, 0.0, 1.18, 0.53, 1.47, 0.37, 1.0, 1.04, 0.76, 3.82, 0.54, 0.41, 0.3]} \ No newline at end of file diff --git a/annotations_1/JxbvOwAB-xI_filtered.json b/annotations_1/JxbvOwAB-xI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ec6e9d785a8e8637fe2fa7b93b65bcac54e77a7 --- /dev/null +++ b/annotations_1/JxbvOwAB-xI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.92], [5.0, 5.0], [7.0, 7.94], [9.0, 10.47], [12.0, 12.78], [13.0, 14.72], [15.0, 18.03], [20.0, 20.34], [21.0, 22.0], [23.0, 23.65], [25.0, 25.37], [28.0, 29.57], [30.0, 30.86], [31.0, 31.99], [33.0, 33.32], [34.0, 34.86], [37.0, 37.29], [40.0, 40.58], [41.0, 41.4], [42.0, 43.82], [49.0, 51.24], [52.0, 52.51], [54.0, 55.04], [57.0, 57.35], [59.0, 59.81], [62.0, 63.27], [65.0, 64.72], [65.0, 67.58], [70.0, 70.51], [74.0, 76.81], [82.0, 82.11], [92.0, 92.03], [93.0, 93.87], [108.0, 108.92], [110.0, 110.66], [114.0, 115.21], [142.0, 142.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 0.0, 74.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 0.0, 0.94, 1.47, 0.78, 1.72, 3.03, 0.34, 1.0, 0.65, 0.37, 1.57, 0.86, 0.99, 0.32, 0.86, 0.29, 0.58, 0.4, 1.82, 2.24, 0.51, 1.04, 0.35, 0.81, 1.27, -0.28, 2.58, 0.51, 2.81, 0.11, 0.03, 0.87, 0.92, 0.66, 1.21, 0.43]} \ No newline at end of file diff --git a/annotations_1/Jy2_J5WCzDY_filtered.json b/annotations_1/Jy2_J5WCzDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6325a6a799dfc0ceb65250a55f8f1636611d331 --- /dev/null +++ b/annotations_1/Jy2_J5WCzDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.16], [46.0, 46.06], [49.0, 49.82], [50.0, 51.65], [52.0, 53.06], [57.0, 77.4], [79.0, 92.28], [95.0, 103.99], [107.0, 151.55], [152.0, 171.78], [174.0, 177.62]], "keep_status": [false, false, false, false, false, true, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.43, 31.22, 31.33, 0.0, 33.87, 31.18], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 30.98], ["music", 21.99], ["whack, thwack", 13.79]], [["music", 41.97], ["speech", 23.25], ["fart", 4.88]], [["music", 51.39], ["throbbing", 12.68], ["sound effect", 3.69]], null, [["music", 25.62], ["didgeridoo", 21.45], ["cattle, bovinae", 9.25]], [["music", 14.78], ["speech", 8.55], ["whack, thwack", 7.95]]], "duration": [1.16, 0.06, 0.82, 1.65, 1.06, 20.4, 13.28, 8.99, 44.55, 19.78, 3.62]} \ No newline at end of file diff --git a/annotations_1/Jy8mz4gu2oQ_filtered.json b/annotations_1/Jy8mz4gu2oQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..823851d383e44893b1072b7e87b2e9eabf95988f --- /dev/null +++ b/annotations_1/Jy8mz4gu2oQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.16], [35.0, 35.5], [46.0, 47.02], [51.0, 55.8], [57.0, 58.14], [71.0, 72.1], [74.0, 78.44], [81.0, 81.48], [82.0, 82.59], [83.0, 84.94], [89.0, 94.46], [96.0, 98.04], [101.0, 102.83], [103.0, 103.57], [107.0, 106.69], [115.0, 115.99], [118.0, 118.44], [119.0, 119.62], [120.0, 121.39], [122.0, 125.54], [127.0, 127.23]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.19, 0.0, 0.0, 29.04, 0.0, 0.0, 0.0, 31.03, 41.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.17, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 70.94], ["screaming", 13.21], ["inside, small room", 1.03]], null, null, [["fly, housefly", 26.03], ["mosquito", 12.5], ["whack, thwack", 11.59]], null, null, null, [["speech", 37.33], ["mains hum", 13.68], ["electric shaver, electric razor", 11.75]], [["music", 23.72], ["musical instrument", 9.98], ["guitar", 5.46]], null, null, null, null, null, null, null, null, null], "duration": [0.16, 0.5, 1.02, 4.8, 1.14, 1.1, 4.44, 0.48, 0.59, 1.94, 5.46, 2.04, 1.83, 0.57, -0.31, 0.99, 0.44, 0.62, 1.39, 3.54, 0.23]} \ No newline at end of file diff --git a/annotations_1/JyAbZxxgLw8_filtered.json b/annotations_1/JyAbZxxgLw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40388b6b76ee32c5ed101e49365d1822c95fab93 --- /dev/null +++ b/annotations_1/JyAbZxxgLw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.25], [37.0, 37.86], [49.0, 49.1], [54.0, 55.26], [61.0, 62.45], [64.0, 63.69], [66.0, 67.76], [72.0, 72.49], [80.0, 80.3], [81.0, 80.96], [83.0, 85.09], [87.0, 87.44], [89.0, 89.6], [90.0, 90.54], [92.0, 93.87], [94.0, 94.91], [97.0, 97.75], [99.0, 99.23], [100.0, 100.72], [103.0, 104.09], [110.0, 110.51], [117.0, 116.87], [120.0, 124.41], [126.0, 134.05], [134.0, 152.15], [153.0, 155.12], [157.0, 160.96], [161.0, 161.06], [161.0, 164.73], [166.0, 171.63], [176.0, 178.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 99.94, 71.29, 99.82, 46.09, 0.0, 48.78, 33.85, 35.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 58.19], ["music", 6.62], ["hubbub, speech noise, speech babble", 4.04]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 67.87], ["music", 11.77], ["mains hum", 3.62]], null, [["music", 48.17], ["speech", 15.74], ["electronic music", 7.72]], [["music", 67.0], ["hum", 9.38], ["throbbing", 8.68]], [["sine wave", 33.12], ["music", 33.04], ["chirp tone", 10.98]]], "duration": [0.25, 0.86, 0.1, 1.26, 1.45, -0.31, 1.76, 0.49, 0.3, -0.04, 2.09, 0.44, 0.6, 0.54, 1.87, 0.91, 0.75, 0.23, 0.72, 1.09, 0.51, -0.13, 4.41, 8.05, 18.15, 2.12, 3.96, 0.06, 3.73, 5.63, 2.5]} \ No newline at end of file diff --git a/annotations_1/JyEYiaZW3Ok_filtered.json b/annotations_1/JyEYiaZW3Ok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88e80dfbc0a1cc16dd316551bd047967f534460d --- /dev/null +++ b/annotations_1/JyEYiaZW3Ok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.32], [10.0, 10.2], [10.0, 12.43], [13.0, 17.76], [20.0, 20.88], [25.0, 26.42], [30.0, 33.3], [35.0, 36.27], [37.0, 37.94], [39.0, 41.27], [42.0, 43.28], [45.0, 49.2], [51.0, 53.33], [61.0, 64.35], [65.0, 70.17], [73.0, 73.89], [75.0, 75.07], [79.0, 79.19], [82.0, 85.24], [86.0, 86.85], [90.0, 92.94], [96.0, 97.41], [98.0, 99.15], [101.0, 102.88], [104.0, 108.01], [109.0, 113.17], [116.0, 116.75], [117.0, 132.16], [133.0, 151.12], [152.0, 153.93], [154.0, 164.74], [166.0, 168.64], [169.0, 170.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.89, 79.94, 0.0, 0.0, 70.86, 0.0, 0.0, 50.02, 0.0, 96.29, 56.93, 87.37, 85.9, 0.0, 0.0, 0.0, 95.37, 0.0, 99.71, 0.0, 0.0, 0.0, 96.66, 93.29, 0.0, 46.68, 57.48, 0.0, 74.76, 52.68, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 29.93], ["hum", 24.9], ["stomach rumble", 7.35]], null, null, null, null, null], "duration": [0.32, 0.2, 2.43, 4.76, 0.88, 1.42, 3.3, 1.27, 0.94, 2.27, 1.28, 4.2, 2.33, 3.35, 5.17, 0.89, 0.07, 0.19, 3.24, 0.85, 2.94, 1.41, 1.15, 1.88, 4.01, 4.17, 0.75, 15.16, 18.12, 1.93, 10.74, 2.64, 1.53]} \ No newline at end of file diff --git a/annotations_1/JyEvCZ8kwW4_filtered.json b/annotations_1/JyEvCZ8kwW4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..869594d7570e4b7c699d0fc4aef1c3f9f3a9e01d --- /dev/null +++ b/annotations_1/JyEvCZ8kwW4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 31.06], [32.0, 33.83], [36.0, 46.94], [47.0, 59.93], [65.0, 66.09], [68.0, 73.77], [75.0, 88.11], [92.0, 97.61], [100.0, 112.56], [113.0, 113.16], [113.0, 113.27], [113.0, 113.37], [113.0, 122.12]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 37.5, 31.74, 0.0, 67.0, 29.16, 28.72, 30.21, 0.0, 0.0, 0.0, 29.37], "audiomae_on_audioset": [null, null, [["music", 32.56], ["didgeridoo", 28.74], ["whale vocalization", 10.33]], [["music", 37.33], ["throbbing", 21.1], ["hum", 20.72]], null, null, [["music", 24.45], ["hum", 20.51], ["throbbing", 7.58]], [["music", 48.09], ["noise", 9.75], ["didgeridoo", 6.06]], [["throbbing", 66.3], ["music", 25.81], ["hum", 4.74]], null, null, null, [["music", 44.16], ["speech", 7.89], ["whack, thwack", 6.04]]], "duration": [1.06, 1.83, 10.94, 12.93, 1.09, 5.77, 13.11, 5.61, 12.56, 0.16, 0.27, 0.37, 9.12]} \ No newline at end of file diff --git a/annotations_1/JyQczb2eCf8_filtered.json b/annotations_1/JyQczb2eCf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2009060e7b37bf02634a971fc121772ea1883c93 --- /dev/null +++ b/annotations_1/JyQczb2eCf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 47.33], [48.0, 53.99], [58.0, 59.76], [61.0, 71.61], [72.0, 77.18], [78.0, 77.57], [78.0, 77.75], [78.0, 77.79], [78.0, 77.82], [78.0, 103.01], [108.0, 108.03]], "keep_status": [true, true, false, true, true, false, false, false, false, true, false], "silence_prob": [46.61, 49.68, 0.0, 35.13, 33.12, 0.0, 0.0, 0.0, 0.0, 32.87, 0.0], "audiomae_on_audioset": [[["music", 35.45], ["speech", 21.26], ["wind chime", 4.12]], [["music", 33.26], ["cowbell", 9.82], ["noise", 7.8]], null, [["speech", 32.1], ["music", 30.1], ["hum", 4.83]], [["music", 44.59], ["speech", 20.05], ["chime", 2.85]], null, null, null, null, [["speech", 30.85], ["music", 23.45], ["ice cream truck, ice cream van", 6.94]], null], "duration": [6.33, 5.99, 1.76, 10.61, 5.18, -0.43, -0.25, -0.21, -0.18, 25.01, 0.03]} \ No newline at end of file diff --git a/annotations_1/JyTf7wR8vWI_filtered.json b/annotations_1/JyTf7wR8vWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bdbec3110d63472c8f79ce96f7e3e220c9b4c0e --- /dev/null +++ b/annotations_1/JyTf7wR8vWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 81.72], [82.0, 84.84], [86.0, 92.33], [94.0, 94.81], [96.0, 96.99], [101.0, 100.99], [104.0, 106.29], [109.0, 109.71], [113.0, 114.54], [116.0, 117.29], [119.0, 120.41], [123.0, 123.55], [125.0, 126.1], [130.0, 133.25], [134.0, 135.77], [137.0, 138.86], [139.0, 140.78], [141.0, 176.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.76, 99.87, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [63.72, 2.84, 6.33, 0.81, 0.99, -0.01, 2.29, 0.71, 1.54, 1.29, 1.41, 0.55, 1.1, 3.25, 1.77, 1.86, 1.78, 35.67]} \ No newline at end of file diff --git a/annotations_1/Jye1gDePzgY_filtered.json b/annotations_1/Jye1gDePzgY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17346f07818f8cd21f29057138933489190d1226 --- /dev/null +++ b/annotations_1/Jye1gDePzgY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.02], [14.0, 16.65], [18.0, 21.39], [23.0, 24.71], [27.0, 27.94], [29.0, 29.44], [31.0, 32.14], [35.0, 39.9], [51.0, 51.8], [53.0, 54.55], [58.0, 63.24], [69.0, 69.6], [72.0, 72.94], [78.0, 78.61], [80.0, 86.58], [94.0, 94.15], [100.0, 103.38], [106.0, 105.88], [113.0, 113.68], [118.0, 119.85], [142.0, 142.18], [143.0, 142.99]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [34.68, 35.22, 40.38, 0.0, 0.0, 0.0, 0.0, 34.44, 0.0, 0.0, 43.79, 0.0, 0.0, 0.0, 42.88, 0.0, 58.64, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.64], ["synthesizer", 6.43], ["musical instrument", 5.54]], [["music", 29.27], ["synthesizer", 23.86], ["musical instrument", 7.83]], [["music", 17.09], ["synthesizer", 15.35], ["speech", 7.08]], null, null, null, null, [["moo", 45.93], ["cattle, bovinae", 31.3], ["livestock, farm animals, working animals", 15.92]], null, null, [["boing", 48.34], ["music", 28.96], ["speech", 4.35]], null, null, null, [["music", 57.0], ["didgeridoo", 6.79], ["theremin", 3.21]], null, null, null, null, null, null, null], "duration": [4.02, 2.65, 3.39, 1.71, 0.94, 0.44, 1.14, 4.9, 0.8, 1.55, 5.24, 0.6, 0.94, 0.61, 6.58, 0.15, 3.38, -0.12, 0.68, 1.85, 0.18, -0.01]} \ No newline at end of file diff --git a/annotations_1/JzVCSXWeNnA_filtered.json b/annotations_1/JzVCSXWeNnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04848c4dca548c4e50f136eeb5674eed1f54205c --- /dev/null +++ b/annotations_1/JzVCSXWeNnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.9], [11.0, 12.41], [14.0, 35.24], [36.0, 38.43], [39.0, 46.8], [48.0, 56.64], [58.0, 59.17], [60.0, 70.46]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [99.92, 0.0, 96.42, 98.27, 97.43, 97.22, 0.0, 91.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [4.9, 1.41, 21.24, 2.43, 7.8, 8.64, 1.17, 10.46]} \ No newline at end of file diff --git a/annotations_1/JzmD5wQpm5c_filtered.json b/annotations_1/JzmD5wQpm5c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bfb5bd2d14661f83a7575b9ea2c5ad4b59c8e12 --- /dev/null +++ b/annotations_1/JzmD5wQpm5c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 16.04], [18.0, 18.1], [19.0, 52.89], [56.0, 71.29], [76.0, 105.41], [105.0, 125.58], [133.0, 140.22], [143.0, 152.56], [154.0, 154.87], [156.0, 156.27], [157.0, 169.13], [173.0, 175.37], [178.0, 180.12], [182.0, 182.21]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false, false, true, false], "silence_prob": [29.89, 0.0, 0.0, 33.48, 31.17, 33.13, 43.45, 31.8, 0.0, 0.0, 32.82, 53.72, 29.45, 0.0], "audiomae_on_audioset": [[["music", 59.32], ["speech", 5.74], ["throbbing", 5.24]], null, null, [["music", 49.76], ["speech", 13.09], ["cattle, bovinae", 4.67]], [["music", 25.63], ["speech", 20.28], ["whip", 14.39]], [["music", 44.57], ["throbbing", 22.78], ["hum", 4.09]], [["music", 69.0], ["hum", 4.68], ["throbbing", 2.67]], [["music", 22.58], ["fly, housefly", 17.6], ["mosquito", 12.05]], null, null, [["music", 58.27], ["throbbing", 11.64], ["speech", 10.36]], null, [["music", 19.89], ["vehicle", 15.24], ["buzz", 7.75]], null], "duration": [10.04, 0.1, 33.89, 15.29, 29.41, 20.58, 7.22, 9.56, 0.87, 0.27, 12.13, 2.37, 2.12, 0.21]} \ No newline at end of file diff --git a/annotations_1/Jzr8lXSNRA8_filtered.json b/annotations_1/Jzr8lXSNRA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb34e3744cc81001a33876af5d64ea2310d14d11 --- /dev/null +++ b/annotations_1/Jzr8lXSNRA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [5.0, 7.11], [15.0, 14.94], [16.0, 16.44], [18.0, 20.87], [22.0, 34.74], [37.0, 38.75], [41.0, 57.16], [59.0, 62.53], [68.0, 76.84], [80.0, 81.7], [84.0, 85.99], [87.0, 98.85], [101.0, 100.8], [102.0, 103.11], [118.0, 118.42], [120.0, 120.99], [122.0, 123.04], [124.0, 125.1], [128.0, 128.41], [131.0, 130.76], [133.0, 133.1], [134.0, 134.13], [136.0, 139.85]], "keep_status": [false, true, false, false, true, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.88, 0.0, 0.0, 39.67, 31.32, 0.0, 31.83, 31.51, 30.59, 0.0, 0.0, 34.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.46], "audiomae_on_audioset": [null, [["hum", 27.92], ["throbbing", 14.76], ["gong", 10.69]], null, null, [["music", 33.44], ["hum", 6.08], ["electronic music", 5.49]], [["music", 44.34], ["throbbing", 9.19], ["synthesizer", 8.75]], null, [["hum", 28.22], ["music", 20.36], ["throbbing", 15.94]], [["music", 57.63], ["synthesizer", 10.22], ["musical instrument", 4.91]], [["music", 27.61], ["speech", 27.0], ["hum", 6.22]], null, null, [["music", 63.97], ["throbbing", 5.75], ["soundtrack music", 4.69]], null, null, null, null, null, null, null, null, null, null, [["speech", 42.35], ["music", 28.78], ["explosion", 8.02]]], "duration": [0.83, 2.11, -0.06, 0.44, 2.87, 12.74, 1.75, 16.16, 3.53, 8.84, 1.7, 1.99, 11.85, -0.2, 1.11, 0.42, 0.99, 1.04, 1.1, 0.41, -0.24, 0.1, 0.13, 3.85]} \ No newline at end of file diff --git a/annotations_1/K0QjNiVA6NU_filtered.json b/annotations_1/K0QjNiVA6NU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cacde2e031f7c7dce0dfc3482f318baa6033cce3 --- /dev/null +++ b/annotations_1/K0QjNiVA6NU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [4.0, 4.77], [5.0, 8.38], [11.0, 11.18], [12.0, 12.36], [13.0, 13.88], [16.0, 17.54], [18.0, 17.61], [18.0, 18.0], [18.0, 18.98], [22.0, 22.91], [24.0, 26.28], [28.0, 29.05], [30.0, 32.49], [35.0, 35.9], [42.0, 43.11], [44.0, 45.12], [50.0, 51.02], [52.0, 53.25], [56.0, 58.45], [61.0, 61.16], [63.0, 63.9], [70.0, 71.27], [74.0, 77.63], [79.0, 79.98], [81.0, 83.67], [85.0, 88.38], [89.0, 90.37], [93.0, 94.05], [97.0, 99.99], [101.0, 102.39], [106.0, 106.15], [110.0, 110.02], [112.0, 113.71], [114.0, 126.94], [128.0, 130.18], [132.0, 133.79], [134.0, 134.67], [135.0, 135.57], [137.0, 140.46], [141.0, 143.94], [146.0, 150.36], [155.0, 156.83], [158.0, 158.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 60.42, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 73.51, 0.0, 90.95, 99.98, 0.0, 0.0, 41.2, 0.0, 0.0, 0.0, 0.0, 78.72, 55.31, 0.0, 0.0, 0.0, 99.98, 97.33, 99.98, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 32.75], ["speech", 30.73], ["telephone", 5.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 0.77, 3.38, 0.18, 0.36, 0.88, 1.54, -0.39, 0.0, 0.98, 0.91, 2.28, 1.05, 2.49, 0.9, 1.11, 1.12, 1.02, 1.25, 2.45, 0.16, 0.9, 1.27, 3.63, 0.98, 2.67, 3.38, 1.37, 1.05, 2.99, 1.39, 0.15, 0.02, 1.71, 12.94, 2.18, 1.79, 0.67, 0.57, 3.46, 2.94, 4.36, 1.83, 0.7]} \ No newline at end of file diff --git a/annotations_1/K2LCoTSVORY_filtered.json b/annotations_1/K2LCoTSVORY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0817d39306b21365d13d516fac41ab57e62784c6 --- /dev/null +++ b/annotations_1/K2LCoTSVORY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.49], [15.0, 15.52], [17.0, 17.19], [26.0, 28.0], [29.0, 30.2], [32.0, 33.2], [35.0, 36.48], [38.0, 39.99], [42.0, 42.65], [43.0, 44.46], [46.0, 46.62], [48.0, 47.93], [49.0, 51.44], [52.0, 52.89], [56.0, 56.81], [58.0, 60.27], [61.0, 63.34], [65.0, 65.4], [66.0, 66.41], [79.0, 82.65], [86.0, 86.85], [88.0, 88.55], [89.0, 96.58], [98.0, 100.99], [107.0, 107.89], [110.0, 111.64], [112.0, 113.44], [114.0, 115.5], [117.0, 118.86], [119.0, 121.32], [122.0, 124.14], [125.0, 127.18], [129.0, 132.51], [133.0, 145.99], [152.0, 154.45], [157.0, 165.33], [169.0, 174.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 76.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 36.3, 78.89, 0.0, 0.0, 71.14, 0.0, 0.0, 54.5, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 49.68, 61.57, 67.38, 44.72, 39.31, 42.65, 31.51, 33.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 16.93], ["throat clearing", 11.61], ["hum", 6.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.91], ["music", 8.87], ["hum", 7.51]], null, null, [["speech", 61.31], ["whale vocalization", 7.58], ["music", 5.02]], [["speech", 32.7], ["music", 29.08], ["singing bowl", 17.53]], [["music", 35.15], ["rumble", 13.04], ["hum", 11.74]], [["music", 33.6], ["didgeridoo", 9.55], ["speech", 6.25]], [["speech", 21.65], ["hum", 13.41], ["mains hum", 11.8]]], "duration": [1.49, 0.52, 0.19, 2.0, 1.2, 1.2, 1.48, 1.99, 0.65, 1.46, 0.62, -0.07, 2.44, 0.89, 0.81, 2.27, 2.34, 0.4, 0.41, 3.65, 0.85, 0.55, 7.58, 2.99, 0.89, 1.64, 1.44, 1.5, 1.86, 2.32, 2.14, 2.18, 3.51, 12.99, 2.45, 8.33, 5.66]} \ No newline at end of file diff --git a/annotations_1/K2NNznJJadY_filtered.json b/annotations_1/K2NNznJJadY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eab8d5704a2911fa71492219f9288d4594a63d8 --- /dev/null +++ b/annotations_1/K2NNznJJadY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [1.0, 1.04], [1.0, 1.17], [3.0, 3.54], [7.0, 10.86], [12.0, 13.83], [15.0, 16.71], [18.0, 17.85], [19.0, 23.72], [24.0, 28.17], [30.0, 58.11], [59.0, 60.05], [63.0, 73.7], [74.0, 76.15], [77.0, 85.97], [87.0, 105.8]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 53.72, 0.0, 0.0, 0.0, 39.46, 43.56, 31.28, 0.0, 28.88, 31.18, 30.04, 31.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["fart", 25.05], ["speech", 21.87], ["fly, housefly", 19.25]], [["speech", 25.87], ["fly, housefly", 12.11], ["mosquito", 8.76]], [["speech", 44.5], ["eruption", 16.94], ["explosion", 11.07]], null, [["hum", 44.07], ["throbbing", 32.4], ["music", 9.61]], [["speech", 28.83], ["music", 16.44], ["fly, housefly", 14.43]], [["music", 42.77], ["speech", 12.79], ["hum", 12.71]], [["music", 64.3], ["speech", 12.97], ["buzz", 5.26]]], "duration": [0.0, 0.04, 0.17, 0.54, 3.86, 1.83, 1.71, -0.15, 4.72, 4.17, 28.11, 1.05, 10.7, 2.15, 8.97, 18.8]} \ No newline at end of file diff --git a/annotations_1/K2hcF1oOHb8_filtered.json b/annotations_1/K2hcF1oOHb8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32170e95e09f5db717ef778f61af86eb6a945be4 --- /dev/null +++ b/annotations_1/K2hcF1oOHb8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.52], [9.0, 9.86], [11.0, 12.56], [19.0, 18.98], [33.0, 33.03], [36.0, 36.95], [38.0, 38.55], [40.0, 46.6], [52.0, 54.99], [55.0, 56.66], [60.0, 60.54], [63.0, 63.61], [65.0, 69.45], [70.0, 70.95], [72.0, 75.91], [78.0, 90.63], [96.0, 99.93], [119.0, 121.49], [133.0, 133.17], [133.0, 133.22], [141.0, 144.91], [151.0, 151.19]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, true, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.57, 32.61, 0.0, 0.0, 0.0, 34.12, 0.0, 30.22, 52.45, 33.17, 31.74, 0.0, 0.0, 33.15, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 51.25], ["speech", 6.08], ["groan", 5.27]], [["speech", 28.4], ["vehicle", 9.91], ["motorboat, speedboat", 6.01]], null, null, null, [["music", 36.1], ["throbbing", 9.52], ["hum", 5.97]], null, [["music", 42.57], ["speech", 9.08], ["singing", 4.23]], null, [["music", 31.15], ["cattle, bovinae", 20.39], ["moo", 19.19]], [["music", 42.44], ["speech", 33.49], ["synthesizer", 1.83]], null, null, [["music", 30.41], ["whack, thwack", 19.1], ["speech", 6.6]], null], "duration": [1.52, 0.86, 1.56, -0.02, 0.03, 0.95, 0.55, 6.6, 2.99, 1.66, 0.54, 0.61, 4.45, 0.95, 3.91, 12.63, 3.93, 2.49, 0.17, 0.22, 3.91, 0.19]} \ No newline at end of file diff --git a/annotations_1/K3OlytfxzHU_filtered.json b/annotations_1/K3OlytfxzHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3156a7dadafb3c91f3bab8824d6511874815c168 --- /dev/null +++ b/annotations_1/K3OlytfxzHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.2], [7.0, 100.21], [102.0, 102.83], [103.0, 104.8], [106.0, 106.86], [121.0, 121.61], [129.0, 129.14], [134.0, 136.29], [140.0, 141.1], [143.0, 144.22], [146.0, 146.28], [148.0, 148.1], [148.0, 149.23], [152.0, 152.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.2, 93.21, 0.83, 1.8, 0.86, 0.61, 0.14, 2.29, 1.1, 1.22, 0.28, 0.1, 1.23, 0.81]} \ No newline at end of file diff --git a/annotations_1/K3dG3JrXAJc_filtered.json b/annotations_1/K3dG3JrXAJc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37d982eff85db6b528923900beb30e129218064d --- /dev/null +++ b/annotations_1/K3dG3JrXAJc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.41], [36.0, 36.64], [47.0, 46.84], [58.0, 58.53], [64.0, 64.89], [66.0, 70.29], [74.0, 75.1], [116.0, 116.4], [130.0, 133.27], [140.0, 141.78], [151.0, 151.75], [162.0, 163.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.2, 0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 0.0, 66.63, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.41, 0.64, -0.16, 0.53, 0.89, 4.29, 1.1, 0.4, 3.27, 1.78, 0.75, 1.36]} \ No newline at end of file diff --git a/annotations_1/K3jk2RjLJ3c_filtered.json b/annotations_1/K3jk2RjLJ3c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..593f20ee047a38ad628797e2f44a3f4de1ec695e --- /dev/null +++ b/annotations_1/K3jk2RjLJ3c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 23.46], [24.0, 25.27], [27.0, 27.92], [29.0, 29.83], [31.0, 32.27], [34.0, 39.14], [41.0, 41.77], [45.0, 46.45], [49.0, 50.16], [53.0, 53.64], [55.0, 54.82], [56.0, 59.63], [60.0, 61.53], [66.0, 66.16], [69.0, 69.58], [70.0, 70.97], [74.0, 75.57], [80.0, 80.38], [92.0, 92.69], [94.0, 95.55], [96.0, 96.3], [97.0, 99.22], [100.0, 100.38], [103.0, 103.35], [112.0, 117.22], [118.0, 125.58], [133.0, 139.92], [140.0, 141.61], [143.0, 144.91], [150.0, 150.53], [153.0, 153.6], [154.0, 157.84], [161.0, 161.0], [164.0, 165.59], [167.0, 167.8], [169.0, 172.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [56.93, 0.0, 0.0, 0.0, 0.0, 58.3, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.21, 0.0, 0.0, 32.05, 29.5, 30.7, 0.0, 0.0, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 62.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 40.34], ["music", 5.99], ["musical instrument", 5.94]], null, null, [["speech", 72.0], ["music", 4.54], ["echo", 3.67]], [["fart", 29.02], ["speech", 8.26], ["livestock, farm animals, working animals", 5.82]], [["fart", 21.58], ["cattle, bovinae", 9.48], ["livestock, farm animals, working animals", 9.01]], null, null, null, null, null, null, null, null, null], "duration": [8.46, 1.27, 0.92, 0.83, 1.27, 5.14, 0.77, 1.45, 1.16, 0.64, -0.18, 3.63, 1.53, 0.16, 0.58, 0.97, 1.57, 0.38, 0.69, 1.55, 0.3, 2.22, 0.38, 0.35, 5.22, 7.58, 6.92, 1.61, 1.91, 0.53, 0.6, 3.84, 0.0, 1.59, 0.8, 3.72]} \ No newline at end of file diff --git a/annotations_1/K57aIbpF_Co_filtered.json b/annotations_1/K57aIbpF_Co_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c21bed72940eaead9c189f8fe86cb6d1f669660c --- /dev/null +++ b/annotations_1/K57aIbpF_Co_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[118.0, 151.23], [156.0, 172.2]], "keep_status": [false, true], "silence_prob": [0.0, 41.3], "audiomae_on_audioset": [null, [["hum", 33.05], ["throbbing", 12.53], ["mains hum", 4.62]]], "duration": [33.23, 16.2]} \ No newline at end of file diff --git a/annotations_1/K6Kkwi0nfHg_filtered.json b/annotations_1/K6Kkwi0nfHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..077609e6f0f39ad0f870bbd25c5e001e7cdd20e5 --- /dev/null +++ b/annotations_1/K6Kkwi0nfHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.95], [6.0, 7.33], [9.0, 10.59], [13.0, 14.17], [17.0, 17.17], [18.0, 19.99], [21.0, 24.44], [26.0, 42.53], [46.0, 47.33], [52.0, 52.56], [53.0, 53.5], [54.0, 151.53], [152.0, 154.45], [156.0, 156.52], [158.0, 160.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [75.39, 0.0, 0.0, 0.0, 0.0, 0.0, 29.77, 33.27, 0.0, 0.0, 0.0, 0.0, 46.57, 0.0, 36.75], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 47.09], ["hum", 17.11], ["synthesizer", 6.51]], [["music", 62.95], ["hum", 9.61], ["throbbing", 8.88]], null, null, null, null, [["fly, housefly", 20.72], ["music", 13.7], ["mosquito", 7.05]], null, [["music", 30.59], ["speech", 13.51], ["cowbell", 8.92]]], "duration": [2.95, 1.33, 1.59, 1.17, 0.17, 1.99, 3.44, 16.53, 1.33, 0.56, 0.5, 97.53, 2.45, 0.52, 2.3]} \ No newline at end of file diff --git a/annotations_1/K6O_Ep9bY0U_filtered.json b/annotations_1/K6O_Ep9bY0U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a6e696bbd4d2d557c6531a99f6bffbac516ef08c --- /dev/null +++ b/annotations_1/K6O_Ep9bY0U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.36], [26.0, 27.16], [31.0, 32.04], [36.0, 36.85], [40.0, 40.34], [42.0, 42.89], [50.0, 49.86], [52.0, 55.27], [59.0, 61.4], [72.0, 72.79], [85.0, 89.02], [90.0, 94.66], [111.0, 111.48], [113.0, 113.05], [117.0, 118.44], [121.0, 122.89], [129.0, 130.03], [131.0, 131.67], [134.0, 134.05], [137.0, 136.97], [139.0, 140.53], [142.0, 142.57], [144.0, 146.21], [148.0, 150.6]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.28, 41.6, 0.0, 66.63, 39.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.09, 57.64], "audiomae_on_audioset": [[["music", 15.99], ["theremin", 12.6], ["foghorn", 6.63]], null, null, null, null, null, null, [["music", 69.49], ["synthetic singing", 4.85], ["carnatic music", 3.7]], [["music", 59.82], ["carnatic music", 4.19], ["synthetic singing", 2.69]], null, null, [["music", 29.09], ["speech", 9.49], ["mains hum", 8.27]], null, null, null, null, null, null, null, null, null, null, [["sidetone", 50.02], ["sine wave", 13.72], ["speech", 13.45]], null], "duration": [2.36, 1.16, 1.04, 0.85, 0.34, 0.89, -0.14, 3.27, 2.4, 0.79, 4.02, 4.66, 0.48, 0.05, 1.44, 1.89, 1.03, 0.67, 0.05, -0.03, 1.53, 0.57, 2.21, 2.6]} \ No newline at end of file diff --git a/annotations_1/K7I9ERiBZrc_filtered.json b/annotations_1/K7I9ERiBZrc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d63936b52dd6b27f3a3edf79e0f359d9fe1d84b --- /dev/null +++ b/annotations_1/K7I9ERiBZrc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.79], [7.0, 42.09], [45.0, 47.04], [50.0, 52.02], [54.0, 54.55], [60.0, 72.2], [73.0, 89.82], [92.0, 92.13], [95.0, 95.64], [97.0, 97.65], [98.0, 107.11], [108.0, 113.12], [114.0, 116.4], [118.0, 118.3], [122.0, 122.94], [125.0, 126.6]], "keep_status": [true, false, false, false, false, true, true, false, false, false, true, true, true, false, false, false], "silence_prob": [38.35, 0.0, 65.79, 95.78, 0.0, 34.56, 33.5, 0.0, 0.0, 0.0, 31.99, 30.9, 31.94, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 34.46], ["electric shaver, electric razor", 9.1], ["mosquito", 8.54]], null, null, null, null, [["speech", 32.57], ["fart", 19.09], ["electric shaver, electric razor", 10.55]], [["speech", 49.93], ["livestock, farm animals, working animals", 8.08], ["fly, housefly", 7.75]], null, null, null, [["speech", 42.86], ["whack, thwack", 9.96], ["cattle, bovinae", 9.21]], [["music", 27.47], ["moo", 13.42], ["cattle, bovinae", 11.28]], [["music", 50.48], ["carnatic music", 9.94], ["middle eastern music", 5.62]], null, null, null], "duration": [3.79, 35.09, 2.04, 2.02, 0.55, 12.2, 16.82, 0.13, 0.64, 0.65, 9.11, 5.12, 2.4, 0.3, 0.94, 1.6]} \ No newline at end of file diff --git a/annotations_1/K8yA801TQVQ_filtered.json b/annotations_1/K8yA801TQVQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f692e4ba5763fbdc5672d2fac3d0dec88783e866 --- /dev/null +++ b/annotations_1/K8yA801TQVQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 16.28], [18.0, 18.55], [33.0, 34.96], [36.0, 36.95], [38.0, 38.79], [43.0, 44.09], [47.0, 51.54], [54.0, 58.67], [60.0, 60.81], [62.0, 66.07], [68.0, 69.89], [70.0, 73.67], [75.0, 110.19], [111.0, 112.31], [113.0, 132.26], [142.0, 143.92], [155.0, 159.0], [161.0, 173.48], [174.0, 177.77], [179.0, 180.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 59.15, 71.72, 0.0, 98.73, 0.0, 98.66, 0.0, 0.0, 31.49, 0.0, 99.99, 68.8, 54.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 82.95], ["reggae", 4.47], ["rhythm and blues", 1.37]], null, null, null, null, null], "duration": [6.28, 0.55, 1.96, 0.95, 0.79, 1.09, 4.54, 4.67, 0.81, 4.07, 1.89, 3.67, 35.19, 1.31, 19.26, 1.92, 4.0, 12.48, 3.77, 1.45]} \ No newline at end of file diff --git a/annotations_1/K93YrK48ZG0_filtered.json b/annotations_1/K93YrK48ZG0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3cc8a17755eb8ac28f5aff58131752a60b687ae --- /dev/null +++ b/annotations_1/K93YrK48ZG0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 29.27], [32.0, 51.24], [52.0, 76.91], [77.0, 83.17], [85.0, 91.15], [94.0, 104.52], [106.0, 106.24], [107.0, 144.24], [149.0, 149.08], [150.0, 178.38]], "keep_status": [false, true, false, false, true, false, false, false, false, false], "silence_prob": [61.37, 32.69, 31.55, 98.44, 30.6, 31.49, 0.0, 0.0, 0.0, 29.56], "audiomae_on_audioset": [null, [["music", 37.28], ["hum", 18.77], ["throbbing", 12.41]], [["music", 57.48], ["whack, thwack", 16.23], ["mosquito", 4.33]], null, [["music", 37.58], ["sidetone", 23.36], ["speech", 6.57]], [["music", 35.68], ["speech", 19.97], ["buzz", 15.92]], null, null, null, [["music", 72.16], ["synthesizer", 7.1], ["throbbing", 4.85]]], "duration": [13.27, 19.24, 24.91, 6.17, 6.15, 10.52, 0.24, 37.24, 0.08, 28.38]} \ No newline at end of file diff --git a/annotations_1/K9j6xEBFek4_filtered.json b/annotations_1/K9j6xEBFek4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e3f5966e6f0c66cfbef8a32971865c94908d456 --- /dev/null +++ b/annotations_1/K9j6xEBFek4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[59.0, 91.69], [92.0, 92.87], [96.0, 101.68]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 28.49], "audiomae_on_audioset": [null, null, [["music", 34.35], ["speech", 17.31], ["throbbing", 7.84]]], "duration": [32.69, 0.87, 5.68]} \ No newline at end of file diff --git a/annotations_1/K9z6npGGZAM_filtered.json b/annotations_1/K9z6npGGZAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb340a2bc4c75bbc4efcf98aeedde5633f0cf4b3 --- /dev/null +++ b/annotations_1/K9z6npGGZAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.08], [12.0, 12.16], [13.0, 13.59], [14.0, 14.45], [15.0, 15.26], [30.0, 30.64], [35.0, 35.04], [35.0, 36.69], [43.0, 43.21], [46.0, 46.74], [51.0, 55.22], [56.0, 57.16], [58.0, 65.53], [66.0, 66.51], [70.0, 74.12], [79.0, 79.69], [80.0, 80.62], [82.0, 82.86], [84.0, 84.94], [87.0, 87.4], [88.0, 89.07], [91.0, 92.53], [97.0, 97.93], [99.0, 99.94], [107.0, 107.76], [113.0, 112.63], [116.0, 116.33], [120.0, 121.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.43, 0.0, 30.96, 0.0, 59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 23.3], ["gong", 12.55], ["speech", 11.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 0.16, 0.59, 0.45, 0.26, 0.64, 0.04, 1.69, 0.21, 0.74, 4.22, 1.16, 7.53, 0.51, 4.12, 0.69, 0.62, 0.86, 0.94, 0.4, 1.07, 1.53, 0.93, 0.94, 0.76, -0.37, 0.33, 1.17]} \ No newline at end of file diff --git a/annotations_1/KAByPJJecxQ_filtered.json b/annotations_1/KAByPJJecxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..694f1fa74c0c5b99a0b2d7164423fffbd295302f --- /dev/null +++ b/annotations_1/KAByPJJecxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.76], [10.0, 11.21], [12.0, 13.51], [14.0, 15.26], [18.0, 19.11], [20.0, 22.01], [23.0, 25.03], [28.0, 29.61], [31.0, 33.34], [35.0, 35.9], [36.0, 38.37], [39.0, 41.47], [43.0, 43.9], [45.0, 46.04], [49.0, 51.17], [52.0, 53.67], [55.0, 55.98], [57.0, 57.38], [58.0, 58.78], [60.0, 61.55], [63.0, 65.65], [66.0, 65.72], [66.0, 67.37], [69.0, 69.84], [71.0, 73.74], [75.0, 82.14], [85.0, 120.45], [123.0, 127.9], [130.0, 145.27], [146.0, 147.11], [148.0, 152.19], [155.0, 171.95], [172.0, 172.44], [173.0, 173.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, true, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 57.81, 70.58, 0.0, 57.97, 0.0, 48.39, 65.67, 0.0, 0.0, 61.18, 0.0, 0.0, 0.0, 0.0, 0.0, 36.93, 0.0, 0.0, 0.0, 33.77, 32.57, 0.0, 30.72, 32.66, 0.0, 30.29, 29.84, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["mains hum", 22.48], ["music", 21.32], ["speech", 12.92]], null, null, null, null, null, null, null, null, null, [["music", 48.93], ["brass instrument", 9.14], ["musical instrument", 6.84]], null, null, null, [["hum", 16.69], ["gong", 16.01], ["music", 14.35]], [["music", 42.09], ["mains hum", 13.42], ["hum", 12.55]], null, [["music", 33.03], ["didgeridoo", 15.32], ["musical instrument", 7.11]], [["music", 72.31], ["musical instrument", 7.92], ["didgeridoo", 2.63]], null, [["theremin", 15.24], ["music", 11.62], ["whale vocalization", 7.93]], [["artillery fire", 30.49], ["music", 10.36], ["buzz", 7.41]], null, null], "duration": [-0.24, 1.21, 1.51, 1.26, 1.11, 2.01, 2.03, 1.61, 2.34, 0.9, 2.37, 2.47, 0.9, 1.04, 2.17, 1.67, 0.98, 0.38, 0.78, 1.55, 2.65, -0.28, 1.37, 0.84, 2.74, 7.14, 35.45, 4.9, 15.27, 1.11, 4.19, 16.95, 0.44, 0.72]} \ No newline at end of file diff --git a/annotations_1/KAE8h2rqA6g_filtered.json b/annotations_1/KAE8h2rqA6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca77887c2d78bd1a9d46f53fd2fc828b9706c92b --- /dev/null +++ b/annotations_1/KAE8h2rqA6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.88], [7.0, 8.82], [14.0, 15.26], [17.0, 23.72], [25.0, 25.32], [27.0, 26.82], [28.0, 28.16], [33.0, 34.26], [37.0, 55.39], [59.0, 59.78], [63.0, 79.68], [80.0, 81.57], [83.0, 83.79], [85.0, 85.82], [86.0, 91.67], [95.0, 104.38], [105.0, 113.86], [116.0, 126.55]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 37.52, 0.0, 0.0, 0.0, 0.0, 31.58, 0.0, 33.02, 0.0, 0.0, 0.0, 33.91, 31.39, 33.32, 30.69], "audiomae_on_audioset": [null, null, null, [["gong", 46.32], ["music", 36.55], ["ambient music", 5.33]], null, null, null, null, [["music", 53.0], ["scary music", 7.63], ["gong", 6.19]], null, [["rumble", 11.11], ["buzz", 7.96], ["fart", 7.41]], null, null, null, [["music", 55.41], ["didgeridoo", 3.37], ["whale vocalization", 3.28]], [["music", 67.74], ["wind instrument, woodwind instrument", 5.76], ["foghorn", 4.23]], [["music", 69.19], ["keyboard (musical)", 3.71], ["ambient music", 3.22]], [["music", 43.91], ["musical instrument", 6.77], ["brass instrument", 5.94]]], "duration": [0.88, 1.82, 1.26, 6.72, 0.32, -0.18, 0.16, 1.26, 18.39, 0.78, 16.68, 1.57, 0.79, 0.82, 5.67, 9.38, 8.86, 10.55]} \ No newline at end of file diff --git a/annotations_1/KAT5h_fimTM_filtered.json b/annotations_1/KAT5h_fimTM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/KAT5h_fimTM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/KBCL6GBurNw_filtered.json b/annotations_1/KBCL6GBurNw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0cc486fa2684f9c4bd11c9b17ea245e5a1a510d --- /dev/null +++ b/annotations_1/KBCL6GBurNw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.96], [14.0, 17.61], [19.0, 20.34], [22.0, 23.67], [26.0, 26.72], [28.0, 28.73], [31.0, 31.68], [38.0, 40.15], [46.0, 47.63], [48.0, 48.88], [53.0, 56.54], [60.0, 60.71], [62.0, 69.99], [70.0, 71.25], [72.0, 73.43], [74.0, 74.78], [75.0, 77.7], [79.0, 82.31], [83.0, 88.2], [90.0, 89.95], [98.0, 108.9], [111.0, 111.32], [113.0, 114.3], [126.0, 126.12], [128.0, 130.69], [131.0, 130.76], [135.0, 139.18], [146.0, 149.66], [150.0, 154.95], [156.0, 156.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, true, false, true, true, true, false], "silence_prob": [51.44, 60.6, 0.0, 0.0, 0.0, 0.0, 0.0, 60.05, 0.0, 0.0, 84.07, 0.0, 56.78, 0.0, 0.0, 0.0, 46.15, 31.12, 33.39, 0.0, 31.44, 0.0, 0.0, 0.0, 32.29, 0.0, 31.58, 31.01, 36.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["beatboxing", 21.69], ["sidetone", 7.98], ["echo", 7.25]], [["speech", 20.61], ["music", 13.41], ["boing", 9.88]], [["music", 23.62], ["whack, thwack", 8.24], ["speech", 7.49]], null, [["speech", 41.39], ["thump, thud", 26.7], ["whack, thwack", 5.99]], null, null, null, [["speech", 41.1], ["music", 10.04], ["noise", 7.72]], null, [["music", 29.87], ["speech", 14.86], ["beatboxing", 5.32]], [["speech", 47.63], ["thump, thud", 9.66], ["thunk", 9.46]], [["hum", 35.26], ["throbbing", 22.86], ["mains hum", 8.28]], null], "duration": [5.96, 3.61, 1.34, 1.67, 0.72, 0.73, 0.68, 2.15, 1.63, 0.88, 3.54, 0.71, 7.99, 1.25, 1.43, 0.78, 2.7, 3.31, 5.2, -0.05, 10.9, 0.32, 1.3, 0.12, 2.69, -0.24, 4.18, 3.66, 4.95, 0.93]} \ No newline at end of file diff --git a/annotations_1/KBLBKR6bQCI_filtered.json b/annotations_1/KBLBKR6bQCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..203efecabc81540b0f08c32593bd4d9c642fcb0b --- /dev/null +++ b/annotations_1/KBLBKR6bQCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 20.29], [21.0, 22.45], [24.0, 25.49], [26.0, 28.34], [30.0, 30.86], [31.0, 31.92], [34.0, 44.46], [45.0, 47.44], [50.0, 51.87], [57.0, 58.04], [60.0, 60.45], [62.0, 63.15], [64.0, 64.18], [65.0, 66.14], [69.0, 71.91], [74.0, 75.05], [77.0, 77.8], [81.0, 81.8], [83.0, 83.17], [89.0, 89.87], [90.0, 96.94]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [35.65, 0.0, 0.0, 56.25, 0.0, 0.0, 55.53, 35.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.96, 0.0, 0.0, 0.0, 0.0, 0.0, 36.12], "audiomae_on_audioset": [[["music", 45.7], ["speech", 12.5], ["synthesizer", 10.58]], null, null, null, null, null, null, [["music", 58.69], ["speech", 8.37], ["musical instrument", 2.25]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.41], ["speech", 27.56], ["grunt", 4.47]]], "duration": [8.29, 1.45, 1.49, 2.34, 0.86, 0.92, 10.46, 2.44, 1.87, 1.04, 0.45, 1.15, 0.18, 1.14, 2.91, 1.05, 0.8, 0.8, 0.17, 0.87, 6.94]} \ No newline at end of file diff --git a/annotations_1/KD6FsEaD-3U_filtered.json b/annotations_1/KD6FsEaD-3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/KD6FsEaD-3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/KEc0SGkBDJ4_filtered.json b/annotations_1/KEc0SGkBDJ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13da9843bb851746f8bb9bff5e58dd02c1f96d50 --- /dev/null +++ b/annotations_1/KEc0SGkBDJ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.29], [18.0, 19.57], [26.0, 32.97], [33.0, 33.57], [37.0, 37.83], [56.0, 59.14], [80.0, 81.97], [83.0, 82.95], [87.0, 87.39], [89.0, 88.97], [89.0, 89.45], [90.0, 90.83], [92.0, 92.58], [107.0, 106.91], [108.0, 108.9], [125.0, 129.84]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.29, 0.0, 0.0, 69.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.43], "audiomae_on_audioset": [null, null, [["music", 31.9], ["speech", 17.67], ["mains hum", 4.98]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 1.57, 6.97, 0.57, 0.83, 3.14, 1.97, -0.05, 0.39, -0.03, 0.45, 0.83, 0.58, -0.09, 0.9, 4.84]} \ No newline at end of file diff --git a/annotations_1/KEwC94CY-Go_filtered.json b/annotations_1/KEwC94CY-Go_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d47e2b2923231b7fddbf0a0b3ded8b44639f21d --- /dev/null +++ b/annotations_1/KEwC94CY-Go_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.73], [12.0, 13.8], [15.0, 15.43], [20.0, 20.49], [22.0, 23.43], [27.0, 27.19], [31.0, 31.68], [34.0, 34.32], [36.0, 37.94], [40.0, 44.78], [48.0, 50.13], [50.0, 50.16], [50.0, 50.31], [50.0, 56.78], [62.0, 67.15], [76.0, 78.09], [86.0, 86.78], [87.0, 87.0], [87.0, 87.17], [89.0, 89.58], [94.0, 94.96], [101.0, 104.82], [111.0, 120.46]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.01, 32.51, 0.0, 0.0, 31.14, 30.72, 46.97, 0.0, 0.0, 0.0, 0.0, 0.0, 30.52, 30.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 38.14], ["speech", 18.47], ["boing", 11.07]], [["music", 58.95], ["speech", 5.59], ["quack", 2.98]], null, null, [["boing", 44.83], ["music", 27.46], ["mosquito", 5.35]], [["cattle, bovinae", 36.5], ["livestock, farm animals, working animals", 35.92], ["moo", 26.91]], [["music", 34.97], ["speech", 21.33], ["electronic music", 2.06]], null, null, null, null, null, [["music", 34.14], ["fart", 23.15], ["speech", 11.26]], [["cattle, bovinae", 21.12], ["speech", 17.76], ["moo", 15.39]]], "duration": [0.73, 1.8, 0.43, 0.49, 1.43, 0.19, 0.68, 0.32, 1.94, 4.78, 2.13, 0.16, 0.31, 6.78, 5.15, 2.09, 0.78, 0.0, 0.17, 0.58, 0.96, 3.82, 9.46]} \ No newline at end of file diff --git a/annotations_1/KFwzRnTqgDU_filtered.json b/annotations_1/KFwzRnTqgDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e07b43f10e9ec569163388c8f110b5e308392c2f --- /dev/null +++ b/annotations_1/KFwzRnTqgDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.56], [27.0, 27.28], [29.0, 35.6], [36.0, 37.15], [38.0, 38.42], [40.0, 40.51], [42.0, 42.28], [44.0, 44.15], [48.0, 48.25], [49.0, 51.83], [54.0, 54.18], [56.0, 56.88], [58.0, 58.94], [60.0, 60.66], [64.0, 66.07], [67.0, 69.53], [72.0, 73.62], [78.0, 78.41], [79.0, 85.41], [86.0, 88.79], [89.0, 92.47], [94.0, 94.27], [95.0, 96.55], [97.0, 97.92]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 37.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.11, 0.0, 0.0, 0.0, 0.0, 72.31, 62.89, 0.0, 0.0, 55.31, 34.52, 40.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["electric shaver, electric razor", 27.56], ["hum", 11.45], ["mains hum", 10.55]], null, null, null, null, null, null, [["speech", 54.17], ["music", 8.41], ["fart", 7.89]], null, null, null, null, null, null, null, null, null, [["animal", 20.34], ["music", 13.53], ["dog", 7.85]], [["theremin", 14.57], ["music", 12.93], ["mosquito", 7.32]], null, null, null], "duration": [0.56, 0.28, 6.6, 1.15, 0.42, 0.51, 0.28, 0.15, 0.25, 2.83, 0.18, 0.88, 0.94, 0.66, 2.07, 2.53, 1.62, 0.41, 6.41, 2.79, 3.47, 0.27, 1.55, 0.92]} \ No newline at end of file diff --git a/annotations_1/KFzIZnYLKSo_filtered.json b/annotations_1/KFzIZnYLKSo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee57120ecba837c7d18d69dc05474b97a759a2d2 --- /dev/null +++ b/annotations_1/KFzIZnYLKSo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.13], [3.0, 30.7], [31.0, 34.11], [35.0, 39.55], [49.0, 49.35], [52.0, 52.02], [54.0, 59.44], [60.0, 121.64], [122.0, 123.75], [124.0, 127.28]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 30.69, 64.75, 50.02, 0.0, 0.0, 30.83, 0.0, 0.0, 39.78], "audiomae_on_audioset": [null, [["music", 55.03], ["theremin", 31.61], ["ambient music", 1.69]], null, null, null, null, [["music", 45.53], ["theremin", 17.43], ["brass instrument", 4.71]], null, null, [["music", 37.66], ["theremin", 20.72], ["synthesizer", 12.85]]], "duration": [1.13, 27.7, 3.11, 4.55, 0.35, 0.02, 5.44, 61.64, 1.75, 3.28]} \ No newline at end of file diff --git a/annotations_1/KGV-R-dVuGA_filtered.json b/annotations_1/KGV-R-dVuGA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26e7e3c165c7ed9cfdb25463525ec470d8c1a7f5 --- /dev/null +++ b/annotations_1/KGV-R-dVuGA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.17], [18.0, 18.39], [20.0, 20.19], [21.0, 21.73], [24.0, 24.83], [33.0, 46.3], [48.0, 51.54], [53.0, 53.42], [56.0, 56.37], [61.0, 62.11], [66.0, 65.77], [71.0, 71.42], [74.0, 74.76], [76.0, 76.71], [77.0, 78.02], [79.0, 79.93], [83.0, 82.98], [86.0, 86.56], [89.0, 89.55], [91.0, 91.66], [93.0, 92.84], [93.0, 94.0], [95.0, 96.06], [100.0, 100.26], [101.0, 101.83], [105.0, 105.04], [111.0, 111.48], [113.0, 113.7], [114.0, 117.91], [120.0, 120.63], [127.0, 128.17], [129.0, 130.22], [133.0, 134.11], [135.0, 138.77], [144.0, 144.26], [151.0, 151.17], [156.0, 164.0], [166.0, 166.83], [169.0, 170.18], [171.0, 171.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.97, 51.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.56, 0.0, 0.0, 0.0, 0.0, 35.01, 0.0, 0.0, 69.2, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 46.89], ["whack, thwack", 26.87], ["thump, thud", 5.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 19.75], ["cattle, bovinae", 14.23], ["speech", 9.1]], null, null, null, null, [["speech", 46.04], ["radio", 35.22], ["hum", 3.05]], null, null, null, null, null, null], "duration": [0.17, 0.39, 0.19, 0.73, 0.83, 13.3, 3.54, 0.42, 0.37, 1.11, -0.23, 0.42, 0.76, 0.71, 1.02, 0.93, -0.02, 0.56, 0.55, 0.66, -0.16, 1.0, 1.06, 0.26, 0.83, 0.04, 0.48, 0.7, 3.91, 0.63, 1.17, 1.22, 1.11, 3.77, 0.26, 0.17, 8.0, 0.83, 1.18, 0.26]} \ No newline at end of file diff --git a/annotations_1/KHsn2smp4N4_filtered.json b/annotations_1/KHsn2smp4N4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..191cf01fd633682e53cb6dc15a98a97e9f59a4b7 --- /dev/null +++ b/annotations_1/KHsn2smp4N4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [6.0, 8.9], [10.0, 12.33], [13.0, 19.89], [21.0, 21.83], [23.0, 24.68], [25.0, 26.37], [29.0, 33.12], [35.0, 36.58], [37.0, 41.07], [42.0, 42.42], [45.0, 46.41], [47.0, 52.68], [53.0, 53.96], [61.0, 64.1], [68.0, 72.23], [73.0, 74.21], [75.0, 75.51], [78.0, 79.56], [81.0, 83.0], [86.0, 86.71], [88.0, 91.74], [157.0, 161.06], [163.0, 165.64], [166.0, 174.34], [176.0, 178.77], [197.0, 197.38], [200.0, 201.16]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, true, false, false, true, false, false, false, true, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 45.11, 50.81, 68.15, 0.0, 0.0, 0.0, 46.94, 0.0, 47.43, 0.0, 0.0, 47.08, 0.0, 59.86, 41.14, 0.0, 0.0, 0.0, 43.45, 0.0, 39.28, 40.47, 39.72, 82.97, 63.74, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 62.0], ["singing bowl", 13.76], ["ambient music", 6.63]], null, null, null, null, null, [["speech", 46.71], ["singing bowl", 12.23], ["music", 6.81]], null, [["hum", 27.8], ["mains hum", 26.08], ["speech", 13.53]], null, null, [["speech", 29.4], ["music", 26.57], ["hum", 7.66]], null, null, [["speech", 33.6], ["hum", 27.63], ["mains hum", 7.26]], null, null, null, [["singing bowl", 29.2], ["music", 16.17], ["speech", 12.23]], null, [["music", 24.5], ["sonar", 13.88], ["thunk", 6.52]], [["music", 50.75], ["ambient music", 15.2], ["singing bowl", 6.42]], [["music", 38.37], ["hum", 19.42], ["mains hum", 7.5]], null, null, null, null], "duration": [0.74, 2.9, 2.33, 6.89, 0.83, 1.68, 1.37, 4.12, 1.58, 4.07, 0.42, 1.41, 5.68, 0.96, 3.1, 4.23, 1.21, 0.51, 1.56, 2.0, 0.71, 3.74, 4.06, 2.64, 8.34, 2.77, 0.38, 1.16]} \ No newline at end of file diff --git a/annotations_1/KJhlJ8p8v7A_filtered.json b/annotations_1/KJhlJ8p8v7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5fa37af864d4e38851622b86411cc6ef0c569e6 --- /dev/null +++ b/annotations_1/KJhlJ8p8v7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.93], [9.0, 9.44], [10.0, 11.57], [12.0, 12.77], [21.0, 22.96], [27.0, 29.91], [32.0, 32.64], [40.0, 43.28], [46.0, 48.66], [49.0, 52.47], [53.0, 53.47], [58.0, 59.58], [60.0, 60.57], [65.0, 66.46], [68.0, 68.44], [74.0, 74.75], [81.0, 81.16], [82.0, 82.31], [87.0, 87.79], [90.0, 90.69], [93.0, 94.54], [100.0, 101.44], [105.0, 106.62], [107.0, 108.11], [111.0, 111.06], [116.0, 116.83], [117.0, 125.12], [158.0, 158.26], [160.0, 161.08], [166.0, 167.76], [169.0, 174.85], [178.0, 179.91], [183.0, 187.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 47.43, 0.0, 97.73, 63.96, 63.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0, 0.0, 40.41, 0.0, 31.29], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 46.61], ["heart sounds, heartbeat", 24.13], ["throbbing", 20.7]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 13.35], ["speech", 12.1], ["cough", 9.36]], null, [["snicker", 25.42], ["chuckle, chortle", 16.52], ["laughter", 13.78]]], "duration": [-0.07, 0.44, 1.57, 0.77, 1.96, 2.91, 0.64, 3.28, 2.66, 3.47, 0.47, 1.58, 0.57, 1.46, 0.44, 0.75, 0.16, 0.31, 0.79, 0.69, 1.54, 1.44, 1.62, 1.11, 0.06, 0.83, 8.12, 0.26, 1.08, 1.76, 5.85, 1.91, 4.49]} \ No newline at end of file diff --git a/annotations_1/KJtmyW2urUk_filtered.json b/annotations_1/KJtmyW2urUk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..320bc149d484aa276c2705aa5533b9cc12fed2ef --- /dev/null +++ b/annotations_1/KJtmyW2urUk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.58], [7.0, 7.92], [10.0, 10.52], [12.0, 41.86], [42.0, 86.04], [92.0, 92.75], [94.0, 95.61], [96.0, 96.92], [100.0, 100.95], [105.0, 106.42], [110.0, 110.67], [116.0, 117.31], [118.0, 118.71], [130.0, 130.79]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 45.99], ["speech", 13.32], ["cacophony", 9.04]], null, null, null, null, null, null, null, null, null, null], "duration": [0.58, 0.92, 0.52, 29.86, 44.04, 0.75, 1.61, 0.92, 0.95, 1.42, 0.67, 1.31, 0.71, 0.79]} \ No newline at end of file diff --git a/annotations_1/KKD0B8uROMI_filtered.json b/annotations_1/KKD0B8uROMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0b07f69ee5f6d911458641c153d1b217cfb5cfb --- /dev/null +++ b/annotations_1/KKD0B8uROMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.06], [6.0, 6.02], [15.0, 15.06], [16.0, 16.75], [19.0, 19.35], [22.0, 22.2], [23.0, 27.97], [29.0, 33.67], [37.0, 37.13], [44.0, 44.14], [47.0, 47.39], [49.0, 48.73], [50.0, 51.22], [52.0, 53.64], [54.0, 55.11], [56.0, 57.03], [60.0, 60.17], [62.0, 62.13], [62.0, 63.34], [66.0, 67.05], [71.0, 71.54], [72.0, 72.79], [76.0, 76.47], [78.0, 78.58], [81.0, 83.78], [90.0, 96.33], [97.0, 96.53], [97.0, 96.57], [97.0, 96.6], [97.0, 96.63], [97.0, 96.67], [98.0, 101.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 51.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.54, 34.96, 0.0, 0.0, 0.0, 0.0, 0.0, 40.57], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.36], ["throbbing", 11.49], ["hum", 3.4]], [["music", 39.08], ["speech", 15.54], ["fart", 8.04]], null, null, null, null, null, [["music", 70.11], ["speech", 8.07], ["hum", 3.06]]], "duration": [1.06, 0.02, 0.06, 0.75, 0.35, 0.2, 4.97, 4.67, 0.13, 0.14, 0.39, -0.27, 1.22, 1.64, 1.11, 1.03, 0.17, 0.13, 1.34, 1.05, 0.54, 0.79, 0.47, 0.58, 2.78, 6.33, -0.47, -0.43, -0.4, -0.37, -0.33, 3.49]} \ No newline at end of file diff --git a/annotations_1/KKfz8C48EJk_filtered.json b/annotations_1/KKfz8C48EJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9cce67c537c68b312fb250f61bd1dbea6a2adb7a --- /dev/null +++ b/annotations_1/KKfz8C48EJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 25.64], [29.0, 29.89], [36.0, 38.53], [40.0, 43.02], [44.0, 44.88], [46.0, 56.56], [59.0, 63.34], [73.0, 78.71], [84.0, 95.82], [101.0, 101.51], [102.0, 102.93], [104.0, 110.03], [112.0, 122.2], [128.0, 134.47], [136.0, 136.38], [137.0, 138.25], [151.0, 153.89], [154.0, 154.63], [166.0, 167.73]], "keep_status": [true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [29.5, 0.0, 29.59, 29.07, 0.0, 28.97, 29.74, 31.28, 29.77, 0.0, 0.0, 31.0, 32.04, 30.62, 0.0, 0.0, 32.03, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 29.31], ["music", 24.96], ["mosquito", 10.79]], null, [["music", 81.58], ["yodeling", 2.83], ["carnatic music", 1.25]], [["whale vocalization", 63.78], ["music", 8.54], ["groan", 4.89]], null, [["music", 67.75], ["boing", 4.49], ["buzz", 2.65]], [["music", 23.44], ["breaking", 5.87], ["musical instrument", 4.26]], [["boing", 27.98], ["music", 18.89], ["speech", 16.52]], [["music", 55.45], ["speech", 8.82], ["boing", 5.76]], null, null, [["cattle, bovinae", 45.16], ["livestock, farm animals, working animals", 24.38], ["moo", 22.53]], [["music", 47.87], ["speech", 21.36], ["boing", 5.53]], [["fart", 39.43], ["speech", 26.88], ["groan", 8.75]], null, null, [["music", 27.26], ["speech", 14.37], ["whack, thwack", 6.37]], null, null], "duration": [17.64, 0.89, 2.53, 3.02, 0.88, 10.56, 4.34, 5.71, 11.82, 0.51, 0.93, 6.03, 10.2, 6.47, 0.38, 1.25, 2.89, 0.63, 1.73]} \ No newline at end of file diff --git a/annotations_1/KKsVK5R9q80_filtered.json b/annotations_1/KKsVK5R9q80_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ea2c6667a770202a7d1aaa39bba1eb4ab15f2e7 --- /dev/null +++ b/annotations_1/KKsVK5R9q80_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 28.09], [31.0, 31.68], [33.0, 33.86], [38.0, 38.11], [42.0, 42.48], [45.0, 45.82], [47.0, 51.33], [52.0, 53.54], [55.0, 59.02], [59.0, 61.16], [62.0, 63.27], [65.0, 65.69], [66.0, 67.09], [68.0, 69.04], [70.0, 70.56], [71.0, 72.17], [73.0, 76.79], [79.0, 78.85], [87.0, 88.21], [90.0, 91.71], [100.0, 113.66], [114.0, 116.01], [117.0, 118.08], [120.0, 121.8], [124.0, 132.93]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [43.1, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 97.64, 61.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44, 0.0, 0.0, 0.0, 36.54, 51.88, 0.0, 0.0, 47.74], "audiomae_on_audioset": [[["hum", 32.83], ["music", 12.7], ["mains hum", 10.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 52.29], ["hum", 10.13], ["speech", 4.67]], null, null, null, [["music", 48.88], ["speech", 7.53], ["didgeridoo", 5.89]]], "duration": [11.09, 0.68, 0.86, 0.11, 0.48, 0.82, 4.33, 1.54, 4.02, 2.16, 1.27, 0.69, 1.09, 1.04, 0.56, 1.17, 3.79, -0.15, 1.21, 1.71, 13.66, 2.01, 1.08, 1.8, 8.93]} \ No newline at end of file diff --git a/annotations_1/KMHmLy9C2hU_filtered.json b/annotations_1/KMHmLy9C2hU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2180128c6047a953a5f22367bccccadcd8f30470 --- /dev/null +++ b/annotations_1/KMHmLy9C2hU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 18.94], [21.0, 53.72], [56.0, 66.19], [67.0, 67.64], [70.0, 79.19], [86.0, 86.41], [88.0, 88.91], [93.0, 93.04], [94.0, 94.19], [96.0, 96.5], [109.0, 110.34], [111.0, 112.65], [116.0, 118.17], [119.0, 119.23]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 35.04, 0.0, 28.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.17, 0.0], "audiomae_on_audioset": [null, null, [["hum", 39.0], ["mains hum", 20.83], ["speech", 9.76]], null, [["music", 62.62], ["speech", 7.34], ["cacophony", 3.79]], null, null, null, null, null, null, null, [["music", 19.92], ["hum", 9.99], ["mains hum", 8.56]], null], "duration": [-0.06, 32.72, 10.19, 0.64, 9.19, 0.41, 0.91, 0.04, 0.19, 0.5, 1.34, 1.65, 2.17, 0.23]} \ No newline at end of file diff --git a/annotations_1/KMI-Sxq9Npg_filtered.json b/annotations_1/KMI-Sxq9Npg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..428ed2b772b6fbce540e77011fbed5020f940565 --- /dev/null +++ b/annotations_1/KMI-Sxq9Npg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.17], [17.0, 19.23], [20.0, 21.88], [23.0, 25.22], [29.0, 30.03], [31.0, 32.09], [35.0, 35.33], [42.0, 42.43], [44.0, 45.2], [48.0, 50.28], [52.0, 52.05], [54.0, 71.22], [72.0, 76.35], [78.0, 80.1], [101.0, 100.8], [101.0, 103.74], [107.0, 108.16], [111.0, 122.94]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.84, 94.95, 0.0, 89.19, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 53.91, 83.16, 81.53, 0.0, 94.66, 0.0, 71.29], "audiomae_on_audioset": [[["mains hum", 27.1], ["speech", 21.6], ["hum", 15.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.17, 2.23, 1.88, 2.22, 1.03, 1.09, 0.33, 0.43, 1.2, 2.28, 0.05, 17.22, 4.35, 2.1, -0.2, 2.74, 1.16, 11.94]} \ No newline at end of file diff --git a/annotations_1/KMOr9s3kfM0_filtered.json b/annotations_1/KMOr9s3kfM0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/KMOr9s3kfM0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/KMkdp0Uy8t0_filtered.json b/annotations_1/KMkdp0Uy8t0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d13cc2c3913ffaafc1c02d6b1d100d5c77501362 --- /dev/null +++ b/annotations_1/KMkdp0Uy8t0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 49.65], [52.0, 55.0], [59.0, 65.96], [68.0, 77.84], [79.0, 97.11], [99.0, 106.46], [108.0, 108.84], [109.0, 146.75], [148.0, 155.41], [157.0, 157.77], [158.0, 159.19]], "keep_status": [false, true, true, false, true, true, false, false, true, false, false], "silence_prob": [0.0, 34.37, 33.74, 31.93, 30.75, 31.43, 0.0, 0.0, 31.71, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 24.07], ["hum", 22.05], ["speech", 19.97]], [["electric shaver, electric razor", 24.27], ["music", 17.51], ["mains hum", 11.27]], [["music", 37.82], ["throbbing", 20.22], ["hum", 15.22]], [["music", 16.18], ["mains hum", 14.79], ["speech", 12.96]], [["speech", 33.11], ["music", 16.9], ["throbbing", 13.79]], null, null, [["speech", 31.26], ["music", 23.85], ["didgeridoo", 4.94]], null, null], "duration": [40.65, 3.0, 6.96, 9.84, 18.11, 7.46, 0.84, 37.75, 7.41, 0.77, 1.19]} \ No newline at end of file diff --git a/annotations_1/KNQpMgWWB5Y_filtered.json b/annotations_1/KNQpMgWWB5Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c74175cdeb6cec3cb5b5083956eda4cf36fde68 --- /dev/null +++ b/annotations_1/KNQpMgWWB5Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.47], [9.0, 9.19], [16.0, 16.56], [21.0, 20.83], [21.0, 21.63], [23.0, 22.87], [28.0, 28.65], [31.0, 32.39], [36.0, 36.91], [38.0, 38.79], [42.0, 43.39], [47.0, 46.67], [56.0, 56.0], [59.0, 60.07], [62.0, 62.02], [63.0, 63.44], [65.0, 65.5], [70.0, 71.41], [75.0, 75.78], [76.0, 78.29], [79.0, 80.33], [81.0, 82.29], [88.0, 90.27], [93.0, 94.09], [95.0, 95.69], [97.0, 101.04], [101.0, 104.92], [107.0, 107.89], [113.0, 112.73], [113.0, 114.83], [117.0, 119.15], [120.0, 120.34], [121.0, 122.71], [124.0, 125.17], [128.0, 129.68], [132.0, 133.19], [140.0, 140.86], [142.0, 141.81], [143.0, 146.7], [147.0, 148.95], [150.0, 150.89], [156.0, 159.19], [164.0, 165.15], [168.0, 169.42], [170.0, 169.91], [171.0, 172.35], [173.0, 173.4], [175.0, 175.02], [175.0, 177.58], [181.0, 184.23], [187.0, 191.71], [195.0, 196.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [96.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.44, 0.0, 0.0, 68.28, 0.0, 0.0, 71.72, 47.05, 0.0, 0.0, 0.0, 38.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.5, 0.0, 0.0, 30.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.98, 46.09, 41.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.42], ["sidetone", 4.75], ["music", 3.7]], null, null, null, null, null, null, [["mains hum", 30.83], ["hum", 27.32], ["speech", 14.26]], null, null, null, [["speech", 54.16], ["music", 10.64], ["busy signal", 4.28]], null, null, null, null, null, null, null, [["music", 24.8], ["hum", 16.05], ["guitar", 12.93]], null, null, [["music", 47.89], ["boing", 20.1], ["speech", 6.89]], null, null, null, null, null, null, [["music", 34.69], ["fly, housefly", 15.93], ["insect", 5.16]], [["music", 76.74], ["musical instrument", 6.2], ["guitar", 4.03]], [["music", 73.74], ["speech", 4.2], ["musical instrument", 3.88]], null], "duration": [5.47, 0.19, 0.56, -0.17, 0.63, -0.13, 0.65, 1.39, 0.91, 0.79, 1.39, -0.33, 0.0, 1.07, 0.02, 0.44, 0.5, 1.41, 0.78, 2.29, 1.33, 1.29, 2.27, 1.09, 0.69, 4.04, 3.92, 0.89, -0.27, 1.83, 2.15, 0.34, 1.71, 1.17, 1.68, 1.19, 0.86, -0.19, 3.7, 1.95, 0.89, 3.19, 1.15, 1.42, -0.09, 1.35, 0.4, 0.02, 2.58, 3.23, 4.71, 1.03]} \ No newline at end of file diff --git a/annotations_1/KNdmBWoCfAc_filtered.json b/annotations_1/KNdmBWoCfAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..637cd4d4546fd4ed9c69d50ac5d2ff80f4401d9a --- /dev/null +++ b/annotations_1/KNdmBWoCfAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.76], [9.0, 9.32], [14.0, 17.1], [22.0, 23.06], [27.0, 37.44], [39.0, 44.14], [45.0, 55.75], [58.0, 60.72], [63.0, 63.46], [64.0, 66.19], [67.0, 68.54]], "keep_status": [true, false, true, false, true, false, false, true, false, true, false], "silence_prob": [33.47, 0.0, 32.56, 0.0, 29.94, 28.86, 29.89, 30.17, 0.0, 29.89, 0.0], "audiomae_on_audioset": [[["noise", 43.12], ["music", 15.94], ["hum", 6.26]], null, [["music", 28.69], ["throbbing", 15.6], ["hum", 9.56]], null, [["music", 49.16], ["hum", 13.03], ["sidetone", 7.79]], [["music", 43.68], ["hum", 15.76], ["mains hum", 11.99]], [["music", 51.83], ["hum", 20.56], ["mains hum", 8.8]], [["music", 38.03], ["cattle, bovinae", 7.2], ["moo", 5.53]], null, [["music", 28.48], ["speech", 6.25], ["sound effect", 4.46]], null], "duration": [2.76, 0.32, 3.1, 1.06, 10.44, 5.14, 10.75, 2.72, 0.46, 2.19, 1.54]} \ No newline at end of file diff --git a/annotations_1/KNwhBAOLCXQ_filtered.json b/annotations_1/KNwhBAOLCXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bb7b7a81b5822014c98d41a316eeaf2ef1c8467 --- /dev/null +++ b/annotations_1/KNwhBAOLCXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.78], [28.0, 30.2], [31.0, 33.51], [36.0, 37.07], [39.0, 42.13], [43.0, 44.69], [49.0, 50.72], [51.0, 53.74], [60.0, 61.37], [63.0, 64.52], [65.0, 65.7], [67.0, 75.09], [76.0, 87.02], [87.0, 92.84], [99.0, 100.04], [101.0, 106.81], [107.0, 110.15], [111.0, 124.68], [126.0, 125.83], [134.0, 134.49], [135.0, 137.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.0, 99.59, 0.0, 82.43, 0.0, 0.0, 77.36, 0.0, 0.0, 0.0, 93.91, 61.37, 46.9, 0.0, 47.5, 47.82, 39.5, 0.0, 0.0, 42.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.09], ["speech", 14.91], ["bass guitar", 6.51]], null, [["music", 77.53], ["musical instrument", 3.92], ["bass guitar", 3.35]], [["music", 69.22], ["bass guitar", 10.99], ["guitar", 5.59]], [["music", 68.73], ["guitar", 7.39], ["bass guitar", 5.46]], null, null, [["music", 66.56], ["guitar", 7.21], ["bass guitar", 6.28]]], "duration": [0.78, 2.2, 2.51, 1.07, 3.13, 1.69, 1.72, 2.74, 1.37, 1.52, 0.7, 8.09, 11.02, 5.84, 1.04, 5.81, 3.15, 13.68, -0.17, 0.49, 2.24]} \ No newline at end of file diff --git a/annotations_1/KOBGjFHXnqY_filtered.json b/annotations_1/KOBGjFHXnqY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2981863e4ef75248fbf288d1550344b5429ab047 --- /dev/null +++ b/annotations_1/KOBGjFHXnqY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.31], [14.0, 14.03], [15.0, 16.23], [18.0, 18.59], [20.0, 20.17], [24.0, 23.85], [35.0, 35.73], [37.0, 37.35], [39.0, 39.56], [40.0, 40.68], [41.0, 44.17], [45.0, 45.18], [56.0, 55.93], [63.0, 64.07], [66.0, 68.28], [71.0, 71.2], [79.0, 81.04], [82.0, 82.7], [90.0, 90.04], [91.0, 91.23], [106.0, 106.54], [107.0, 108.11], [108.0, 118.77], [121.0, 123.3], [129.0, 129.07], [133.0, 132.76], [137.0, 136.97], [143.0, 142.75], [148.0, 148.63], [150.0, 150.9], [151.0, 153.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.87, 0.0, 0.0, 0.0, 52.22, 0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 41.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 55.08], ["fly, housefly", 6.96], ["creak", 4.91]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.64], ["hum", 16.54], ["throbbing", 13.59]], null, null, null, null, null, null, null], "duration": [0.31, 0.03, 1.23, 0.59, 0.17, -0.15, 0.73, 0.35, 0.56, 0.68, 3.17, 0.18, -0.07, 1.07, 2.28, 0.2, 2.04, 0.7, 0.04, 0.23, 0.54, 1.11, 10.77, 2.3, 0.07, -0.24, -0.03, -0.25, 0.63, 0.9, 2.62]} \ No newline at end of file diff --git a/annotations_1/KOuClUYl0_U_filtered.json b/annotations_1/KOuClUYl0_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09d19722591e4f323f3278ac210838bd27acb6e2 --- /dev/null +++ b/annotations_1/KOuClUYl0_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.72], [22.0, 23.65], [24.0, 28.56], [29.0, 40.71], [41.0, 46.11], [51.0, 51.21], [52.0, 52.41], [59.0, 58.95], [65.0, 67.95], [77.0, 77.28], [91.0, 92.5], [95.0, 109.83], [110.0, 115.05], [118.0, 119.11], [121.0, 121.47], [125.0, 126.4], [130.0, 132.8], [139.0, 140.78], [141.0, 143.18], [146.0, 147.12], [153.0, 154.97], [156.0, 156.49], [164.0, 165.45], [169.0, 169.21], [173.0, 172.71], [174.0, 174.61], [176.0, 175.88], [178.0, 180.77], [186.0, 186.34], [190.0, 189.68], [194.0, 193.77], [199.0, 199.15], [208.0, 209.29], [212.0, 212.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [70.02, 0.0, 45.78, 39.91, 52.39, 0.0, 0.0, 0.0, 44.07, 0.0, 0.0, 38.79, 41.4, 0.0, 0.0, 0.0, 38.67, 0.0, 46.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 68.99], ["lullaby", 8.4], ["electronic tuner", 2.27]], [["music", 57.4], ["lullaby", 9.4], ["electronic tuner", 5.23]], null, null, null, null, [["music", 74.95], ["mantra", 4.3], ["new-age music", 0.91]], null, null, [["music", 62.66], ["humming", 11.05], ["yodeling", 7.85]], [["music", 71.87], ["lullaby", 6.19], ["sad music", 1.45]], null, null, null, [["music", 67.27], ["lullaby", 2.75], ["cello", 2.5]], null, [["music", 50.86], ["double bass", 12.03], ["cello", 10.94]], null, null, null, null, null, null, null, null, [["music", 59.37], ["lullaby", 3.83], ["mantra", 2.84]], null, null, null, null, null, null], "duration": [2.72, 1.65, 4.56, 11.71, 5.11, 0.21, 0.41, -0.05, 2.95, 0.28, 1.5, 14.83, 5.05, 1.11, 0.47, 1.4, 2.8, 1.78, 2.18, 1.12, 1.97, 0.49, 1.45, 0.21, -0.29, 0.61, -0.12, 2.77, 0.34, -0.32, -0.23, 0.15, 1.29, 0.04]} \ No newline at end of file diff --git a/annotations_1/KPOx5tioLeY_filtered.json b/annotations_1/KPOx5tioLeY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a3744bc06d548e28d95a34890463439648f56c4 --- /dev/null +++ b/annotations_1/KPOx5tioLeY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 19.31], [22.0, 53.49], [54.0, 61.79], [64.0, 76.25], [78.0, 77.99], [84.0, 84.27], [86.0, 87.07], [91.0, 100.74], [102.0, 102.27], [104.0, 107.15], [110.0, 110.83], [112.0, 113.7], [115.0, 116.23], [117.0, 118.03], [119.0, 119.8], [120.0, 121.76], [123.0, 126.37], [127.0, 127.53], [128.0, 129.25], [132.0, 132.75], [134.0, 134.43], [135.0, 135.9], [137.0, 137.64], [139.0, 139.77], [140.0, 140.8], [142.0, 142.64], [143.0, 143.51], [145.0, 145.93], [147.0, 163.8]], "keep_status": [true, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.64, 0.0, 29.51, 29.72, 0.0, 0.0, 0.0, 46.43, 0.0, 39.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.34], "audiomae_on_audioset": [[["noise", 36.49], ["speech", 17.1], ["sidetone", 10.09]], null, [["music", 46.85], ["speech", 15.39], ["electronic music", 4.38]], [["music", 35.98], ["speech", 12.78], ["boing", 4.66]], null, null, null, [["animal", 21.61], ["neigh, whinny", 17.18], ["speech", 10.67]], null, [["speech", 42.39], ["sidetone", 29.37], ["music", 4.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.93], ["speech", 24.55], ["animal", 5.93]]], "duration": [5.31, 31.49, 7.79, 12.25, -0.01, 0.27, 1.07, 9.74, 0.27, 3.15, 0.83, 1.7, 1.23, 1.03, 0.8, 1.76, 3.37, 0.53, 1.25, 0.75, 0.43, 0.9, 0.64, 0.77, 0.8, 0.64, 0.51, 0.93, 16.8]} \ No newline at end of file diff --git a/annotations_1/KQDbtR9Z-zo_filtered.json b/annotations_1/KQDbtR9Z-zo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c017b4508034c47bbc37c050586a1b2b24e4b15d --- /dev/null +++ b/annotations_1/KQDbtR9Z-zo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.13], [15.0, 26.45]], "keep_status": [false, false], "silence_prob": [0.0, 54.9], "audiomae_on_audioset": [null, null], "duration": [0.13, 11.45]} \ No newline at end of file diff --git a/annotations_1/KQzNG70KguM_filtered.json b/annotations_1/KQzNG70KguM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d58ad531eed89b6bd9d701687f7cf0036f26a2ee --- /dev/null +++ b/annotations_1/KQzNG70KguM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 36.07], [39.0, 40.71], [46.0, 53.77], [61.0, 63.17], [79.0, 80.32], [85.0, 89.88], [101.0, 102.93], [107.0, 107.0], [111.0, 111.6]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.03, 44.04, 0.0, 43.05, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 66.63], ["mantra", 4.45], ["musical instrument", 3.95]], [["music", 62.67], ["musical instrument", 5.11], ["guitar", 4.73]], null, [["music", 66.72], ["musical instrument", 8.22], ["guitar", 6.18]], null, null, null], "duration": [31.07, 1.71, 7.77, 2.17, 1.32, 4.88, 1.93, 0.0, 0.6]} \ No newline at end of file diff --git a/annotations_1/KSZN8iThGZ8_filtered.json b/annotations_1/KSZN8iThGZ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aabdb15244c22e51a0adc5ee83e970513be02ac5 --- /dev/null +++ b/annotations_1/KSZN8iThGZ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.81], [23.0, 22.87], [41.0, 42.38], [43.0, 45.35], [47.0, 47.14], [57.0, 56.96], [59.0, 58.82], [62.0, 62.56], [63.0, 63.0], [63.0, 63.93], [69.0, 70.61], [73.0, 74.26], [76.0, 75.96], [77.0, 78.6], [79.0, 81.33], [82.0, 83.64], [85.0, 90.34], [95.0, 98.85], [101.0, 103.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.65, 0.0, 58.55, 70.72, 67.51], "audiomae_on_audioset": [null, null, null, [["sidetone", 48.37], ["speech", 37.45], ["hum", 1.76]], null, null, null, null, null, null, null, null, null, null, [["sidetone", 29.55], ["music", 17.93], ["hum", 9.78]], null, null, null, null], "duration": [1.81, -0.13, 1.38, 2.35, 0.14, -0.04, -0.18, 0.56, 0.0, 0.93, 1.61, 1.26, -0.04, 1.6, 2.33, 1.64, 5.34, 3.85, 2.33]} \ No newline at end of file diff --git a/annotations_1/KS_KStIPiwU_filtered.json b/annotations_1/KS_KStIPiwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2e529f604d6ae48396978f45ce5048d3f63c868 --- /dev/null +++ b/annotations_1/KS_KStIPiwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.81], [7.0, 7.01], [10.0, 11.03], [12.0, 13.24], [17.0, 18.54], [20.0, 20.43], [22.0, 25.42], [26.0, 39.21], [40.0, 50.3], [52.0, 67.12], [71.0, 96.08], [97.0, 103.2], [104.0, 116.61], [118.0, 118.3], [119.0, 121.47], [125.0, 128.41], [132.0, 131.58], [132.0, 143.92]], "keep_status": [false, false, false, false, false, false, true, true, false, true, true, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.42, 29.22, 28.33, 28.73, 29.34, 28.94, 31.49, 0.0, 28.67, 27.99, 0.0, 34.02], "audiomae_on_audioset": [null, null, null, null, null, null, [["mains hum", 22.76], ["music", 22.08], ["hum", 10.7]], [["music", 25.91], ["speech", 14.83], ["hum", 13.88]], [["vehicle", 47.95], ["car", 29.92], ["race car, auto racing", 6.22]], [["music", 37.16], ["hum", 7.55], ["electronic music", 4.38]], [["vehicle", 12.5], ["buzz", 11.86], ["hum", 9.15]], [["music", 48.52], ["vehicle", 4.41], ["electronic music", 3.91]], [["music", 45.2], ["hum", 9.84], ["sonar", 4.5]], null, [["fart", 43.11], ["sound effect", 6.63], ["speech", 4.95]], [["explosion", 39.83], ["burst, pop", 9.36], ["music", 6.14]], null, [["speech", 55.71], ["sidetone", 30.05], ["hum", 4.09]]], "duration": [-0.19, 0.01, 1.03, 1.24, 1.54, 0.43, 3.42, 13.21, 10.3, 15.12, 25.08, 6.2, 12.61, 0.3, 2.47, 3.41, -0.42, 11.92]} \ No newline at end of file diff --git a/annotations_1/KTIw9F3TY88_filtered.json b/annotations_1/KTIw9F3TY88_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af5ae59cf19d5213e795ece685b9372e656124ed --- /dev/null +++ b/annotations_1/KTIw9F3TY88_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 104.53], [106.0, 108.48], [110.0, 110.74], [112.0, 112.21], [113.0, 114.1], [115.0, 117.12], [119.0, 122.27], [123.0, 124.75]], "keep_status": [false, true, false, false, false, true, false, false], "silence_prob": [0.0, 39.93, 0.0, 0.0, 0.0, 43.66, 47.12, 0.0], "audiomae_on_audioset": [null, [["speech", 28.19], ["music", 23.79], ["sonar", 17.06]], null, null, null, [["music", 41.58], ["ambient music", 5.04], ["hum", 4.61]], [["music", 75.93], ["musical instrument", 4.02], ["synthesizer", 2.91]], null], "duration": [94.53, 2.48, 0.74, 0.21, 1.1, 2.12, 3.27, 1.75]} \ No newline at end of file diff --git a/annotations_1/KToHdILd_p0_filtered.json b/annotations_1/KToHdILd_p0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56664382f0908783025fc9fabe73a42030c5c691 --- /dev/null +++ b/annotations_1/KToHdILd_p0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.39], [10.0, 10.72], [13.0, 13.14], [13.0, 17.37], [19.0, 19.7], [20.0, 23.25], [25.0, 27.11], [28.0, 29.19], [31.0, 31.46], [32.0, 32.88], [34.0, 62.5], [63.0, 63.22], [67.0, 72.86], [76.0, 76.44], [76.0, 76.55], [77.0, 76.59], [77.0, 77.4], [78.0, 78.48], [79.0, 80.42], [82.0, 85.53], [92.0, 92.3], [93.0, 104.6], [107.0, 107.25], [108.0, 121.66], [124.0, 147.34]], "keep_status": [false, false, false, true, false, true, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 38.27, 0.0, 32.47, 49.45, 0.0, 0.0, 0.0, 34.42, 0.0, 40.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.99, 0.0, 30.94, 0.0, 30.19, 33.62], "audiomae_on_audioset": [null, null, null, [["grunt", 37.14], ["music", 22.45], ["boing", 10.03]], null, [["music", 17.63], ["musical instrument", 6.32], ["synthesizer", 4.69]], [["speech", 46.04], ["groan", 15.22], ["sine wave", 3.87]], null, null, null, [["music", 45.9], ["theremin", 19.53], ["mosquito", 5.79]], null, [["speech", 54.59], ["music", 7.65], ["sidetone", 3.62]], null, null, null, null, null, null, [["whack, thwack", 21.64], ["music", 20.09], ["grunt", 11.85]], null, [["fly, housefly", 49.0], ["mosquito", 23.02], ["insect", 11.14]], null, [["speech", 40.12], ["music", 11.81], ["throbbing", 8.15]], [["music", 35.67], ["didgeridoo", 19.1], ["fly, housefly", 5.97]]], "duration": [1.39, 0.72, 0.14, 4.37, 0.7, 3.25, 2.11, 1.19, 0.46, 0.88, 28.5, 0.22, 5.86, 0.44, 0.55, -0.41, 0.4, 0.48, 1.42, 3.53, 0.3, 11.6, 0.25, 13.66, 23.34]} \ No newline at end of file diff --git a/annotations_1/KTxT13DzNsc_filtered.json b/annotations_1/KTxT13DzNsc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2133635a6afae1400a6f2a1ae8f1c69ee7ec9a6 --- /dev/null +++ b/annotations_1/KTxT13DzNsc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 8.29], [18.0, 21.81], [34.0, 34.45], [44.0, 44.36], [47.0, 50.25], [52.0, 55.51], [59.0, 59.7], [63.0, 63.48], [67.0, 69.85], [73.0, 73.35], [73.0, 73.38], [73.0, 73.45], [73.0, 80.35], [82.0, 82.12], [86.0, 86.81], [88.0, 89.82], [93.0, 93.56], [95.0, 97.51], [98.0, 99.01], [100.0, 100.11], [100.0, 100.36], [100.0, 102.02], [105.0, 111.59], [119.0, 123.7], [124.0, 124.61], [127.0, 130.86], [131.0, 133.34], [134.0, 136.09], [137.0, 144.96], [148.0, 148.39], [151.0, 153.4], [154.0, 155.66], [159.0, 159.9], [167.0, 167.32], [168.0, 173.08], [174.0, 174.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [56.7, 81.35, 0.0, 0.0, 85.17, 96.54, 0.0, 0.0, 57.25, 0.0, 0.0, 0.0, 35.8, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 0.0, 0.0, 69.2, 86.09, 74.92, 0.0, 41.09, 32.48, 50.21, 60.32, 0.0, 51.88, 0.0, 0.0, 0.0, 73.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.19], ["fart", 24.89], ["whack, thwack", 3.92]], null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 32.51], ["mains hum", 15.68], ["speech", 13.01]], [["speech", 31.74], ["music", 11.25], ["hum", 6.7]], null, null, null, null, null, null, null, null, null], "duration": [7.29, 3.81, 0.45, 0.36, 3.25, 3.51, 0.7, 0.48, 2.85, 0.35, 0.38, 0.45, 7.35, 0.12, 0.81, 1.82, 0.56, 2.51, 1.01, 0.11, 0.36, 2.02, 6.59, 4.7, 0.61, 3.86, 2.34, 2.09, 7.96, 0.39, 2.4, 1.66, 0.9, 0.32, 5.08, 0.45]} \ No newline at end of file diff --git a/annotations_1/KU5yx6v_Jr8_filtered.json b/annotations_1/KU5yx6v_Jr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0490646bd1c5c3f1499cfc62df217ab4ac2ce74e --- /dev/null +++ b/annotations_1/KU5yx6v_Jr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.63], [10.0, 10.83], [12.0, 13.04], [14.0, 18.62], [22.0, 22.25], [23.0, 27.53], [35.0, 36.26], [39.0, 40.64], [52.0, 59.05], [80.0, 80.52], [84.0, 84.43], [86.0, 106.56], [109.0, 115.11], [116.0, 124.09], [126.0, 135.43], [140.0, 143.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 99.98, 0.0, 0.0, 99.95, 0.0, 0.0, 46.97, 35.48, 34.09, 39.6, 59.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 33.85], ["wind instrument, woodwind instrument", 16.58], ["clarinet", 13.8]], [["music", 37.78], ["tabla", 20.37], ["percussion", 6.97]], [["music", 70.13], ["didgeridoo", 7.57], ["musical instrument", 5.08]], [["music", 52.54], ["musical instrument", 14.55], ["theremin", 3.79]], null], "duration": [0.63, 0.83, 1.04, 4.62, 0.25, 4.53, 1.26, 1.64, 7.05, 0.52, 0.43, 20.56, 6.11, 8.09, 9.43, 3.8]} \ No newline at end of file diff --git a/annotations_1/KUMoWS98jXM_filtered.json b/annotations_1/KUMoWS98jXM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5aceae3dd528e4585e6711597e370722c3ef6e5 --- /dev/null +++ b/annotations_1/KUMoWS98jXM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.07], [10.0, 10.1], [10.0, 10.13], [10.0, 10.17], [10.0, 10.2], [10.0, 10.23], [29.0, 31.55], [44.0, 49.4], [54.0, 54.89], [60.0, 61.38], [62.0, 61.6], [62.0, 69.9], [74.0, 74.31], [75.0, 75.22], [80.0, 81.16], [87.0, 87.69], [92.0, 92.15], [93.0, 114.74], [118.0, 141.0], [145.0, 147.34], [161.0, 161.43]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.75, 0.0, 0.0, 0.0, 0.0, 0.0, 30.12, 31.47, 0.0, 0.0, 0.0, 36.34, 0.0, 0.0, 0.0, 0.0, 0.0, 32.81, 34.13, 33.88, 0.0], "audiomae_on_audioset": [[["music", 60.82], ["speech", 20.01], ["sidetone", 1.55]], null, null, null, null, null, [["music", 37.6], ["speech", 33.79], ["sound effect", 2.93]], [["vehicle", 28.82], ["skidding", 16.74], ["music", 14.73]], null, null, null, [["music", 42.02], ["speech", 27.66], ["drum machine", 3.81]], null, null, null, null, null, [["music", 45.68], ["speech", 29.75], ["boing", 3.79]], [["music", 37.66], ["fly, housefly", 19.58], ["mosquito", 14.5]], [["music", 55.79], ["speech", 20.39], ["sidetone", 3.98]], null], "duration": [2.07, 0.1, 0.13, 0.17, 0.2, 0.23, 2.55, 5.4, 0.89, 1.38, -0.4, 7.9, 0.31, 0.22, 1.16, 0.69, 0.15, 21.74, 23.0, 2.34, 0.43]} \ No newline at end of file diff --git a/annotations_1/KVbBkEyaoT8_filtered.json b/annotations_1/KVbBkEyaoT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..435bd6218c38016e70c660623e7e10d6f5e0b397 --- /dev/null +++ b/annotations_1/KVbBkEyaoT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.78], [7.0, 6.94], [9.0, 10.39], [13.0, 13.96], [17.0, 17.05], [19.0, 19.03], [21.0, 21.46], [25.0, 35.01], [36.0, 36.64], [37.0, 37.57], [38.0, 43.02], [43.0, 45.84], [46.0, 47.11], [52.0, 56.4], [69.0, 69.77], [71.0, 71.9], [73.0, 73.25], [76.0, 76.55], [82.0, 86.34], [88.0, 88.25], [92.0, 92.5], [98.0, 98.52], [100.0, 101.56], [103.0, 110.71], [112.0, 113.29], [115.0, 115.26], [117.0, 134.4], [140.0, 144.86], [146.0, 145.64], [149.0, 152.61], [156.0, 160.81], [166.0, 167.95], [180.0, 180.81], [181.0, 182.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.11, 0.0, 0.0, 39.18, 39.11, 0.0, 40.55, 0.0, 0.0, 0.0, 0.0, 36.37, 0.0, 0.0, 0.0, 0.0, 41.03, 0.0, 0.0, 35.13, 30.2, 0.0, 70.3, 33.21, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 56.81], ["boing", 10.49], ["glass", 7.12]], null, null, [["music", 41.47], ["boing", 12.48], ["fart", 10.76]], [["music", 28.82], ["hum", 9.18], ["sonar", 7.94]], null, [["music", 62.93], ["electronic music", 5.3], ["throbbing", 2.95]], null, null, null, null, [["music", 37.72], ["speech", 36.4], ["thunk", 5.29]], null, null, null, null, [["music", 74.83], ["sonar", 5.02], ["ping", 3.77]], null, null, [["music", 51.88], ["throbbing", 13.13], ["hum", 7.39]], [["music", 21.91], ["speech", 9.52], ["grunt", 8.99]], null, null, [["music", 40.99], ["speech", 23.71], ["hum", 4.38]], null, null, null], "duration": [1.78, -0.06, 1.39, 0.96, 0.05, 0.03, 0.46, 10.01, 0.64, 0.57, 5.02, 2.84, 1.11, 4.4, 0.77, 0.9, 0.25, 0.55, 4.34, 0.25, 0.5, 0.52, 1.56, 7.71, 1.29, 0.26, 17.4, 4.86, -0.36, 3.61, 4.81, 1.95, 0.81, 1.95]} \ No newline at end of file diff --git a/annotations_1/KVvqRC018VA_filtered.json b/annotations_1/KVvqRC018VA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e50d08d7d7c0a747f303ae6f5b5766b291d40abe --- /dev/null +++ b/annotations_1/KVvqRC018VA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.1], [23.0, 26.13], [33.0, 34.35], [36.0, 54.62], [56.0, 59.29], [60.0, 69.26], [70.0, 73.55], [77.0, 90.31], [91.0, 95.0], [95.0, 98.52], [99.0, 100.8], [105.0, 106.74], [107.0, 108.6], [111.0, 112.4], [115.0, 116.61], [118.0, 120.45], [130.0, 151.01], [163.0, 169.33], [169.0, 169.4], [170.0, 178.19], [179.0, 179.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 53.47, 0.0, 58.98, 72.6, 98.66, 91.81, 98.66, 83.16, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 34.93, 83.34, 0.0, 66.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.89], ["speech", 11.61], ["theremin", 3.72]], null, null, null, null], "duration": [1.1, 3.13, 1.35, 18.62, 3.29, 9.26, 3.55, 13.31, 4.0, 3.52, 1.8, 1.74, 1.6, 1.4, 1.61, 2.45, 21.01, 6.33, 0.4, 8.19, 0.09]} \ No newline at end of file diff --git a/annotations_1/KW1fyTqH0oE_filtered.json b/annotations_1/KW1fyTqH0oE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..218a12669d527c3bbce4844b911a9bd3beb392af --- /dev/null +++ b/annotations_1/KW1fyTqH0oE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 137.86]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [91.86]} \ No newline at end of file diff --git a/annotations_1/KXMOURHEMpY_filtered.json b/annotations_1/KXMOURHEMpY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..caae3419b04d3c5efc2cd4a418992defd4acf9ff --- /dev/null +++ b/annotations_1/KXMOURHEMpY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.45], [23.0, 23.45], [28.0, 28.11], [29.0, 29.88], [38.0, 38.82], [41.0, 41.2], [42.0, 51.27], [53.0, 53.18], [56.0, 56.81], [57.0, 57.84], [59.0, 60.4], [62.0, 63.64], [65.0, 66.02], [70.0, 73.11], [74.0, 73.87], [75.0, 76.3], [80.0, 87.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.04, 0.0, 0.0, 32.6], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 92.94], ["radio", 3.93], ["noise", 0.69]], null, null, null, null, null, null, [["snicker", 30.99], ["baby laughter", 11.82], ["quack", 9.01]], null, null, [["snicker", 28.26], ["bouncing", 14.44], ["laughter", 6.94]]], "duration": [0.45, 0.45, 0.11, 0.88, 0.82, 0.2, 9.27, 0.18, 0.81, 0.84, 1.4, 1.64, 1.02, 3.11, -0.13, 1.3, 7.42]} \ No newline at end of file diff --git a/annotations_1/KXTBm9eUiko_filtered.json b/annotations_1/KXTBm9eUiko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b31a9a5f768a5c7b7b6f00ff46f1910eec32aafe --- /dev/null +++ b/annotations_1/KXTBm9eUiko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.61], [4.0, 4.13], [5.0, 7.16], [8.0, 11.1], [13.0, 12.93], [13.0, 14.62], [16.0, 17.24], [23.0, 24.06], [28.0, 35.34], [39.0, 49.17], [50.0, 50.55], [52.0, 52.47], [53.0, 54.09], [55.0, 56.46], [61.0, 62.58], [68.0, 69.15], [72.0, 72.42], [73.0, 74.6], [75.0, 74.63], [75.0, 74.73], [75.0, 75.25], [75.0, 77.09], [78.0, 78.07], [81.0, 82.22], [83.0, 84.69], [90.0, 90.75], [91.0, 93.04], [97.0, 99.05], [100.0, 100.3], [103.0, 103.22], [106.0, 118.05], [123.0, 123.84], [131.0, 132.36], [135.0, 137.12]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 60.23, 62.99, 0.0, 0.0, 0.0, 0.0, 33.95, 37.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.46, 0.0, 0.0, 0.0, 0.0, 45.46, 59.68, 0.0, 0.0, 35.99, 0.0, 0.0, 46.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 34.91], ["hum", 18.61], ["throbbing", 14.11]], [["hum", 34.75], ["speech", 29.31], ["mains hum", 14.39]], null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 34.19], ["hum", 34.01], ["speech", 7.07]], null, null, null, null, [["sidetone", 27.8], ["hum", 22.21], ["mains hum", 15.0]], null, null, null, [["speech", 52.38], ["hum", 8.76], ["rumble", 7.52]], null, null, [["speech", 53.55], ["music", 7.5], ["vehicle", 2.42]]], "duration": [1.61, 0.13, 2.16, 3.1, -0.07, 1.62, 1.24, 1.06, 7.34, 10.17, 0.55, 0.47, 1.09, 1.46, 1.58, 1.15, 0.42, 1.6, -0.37, -0.27, 0.25, 2.09, 0.07, 1.22, 1.69, 0.75, 2.04, 2.05, 0.3, 0.22, 12.05, 0.84, 1.36, 2.12]} \ No newline at end of file diff --git a/annotations_1/KY-bRBsLLtA_filtered.json b/annotations_1/KY-bRBsLLtA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30b3222af09d9ad0e981d178dcf71096a8cf2ae9 --- /dev/null +++ b/annotations_1/KY-bRBsLLtA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.19], [3.0, 3.59], [6.0, 5.95], [9.0, 9.27], [12.0, 12.9], [14.0, 15.38], [17.0, 47.34], [49.0, 62.5], [66.0, 67.05], [68.0, 69.06], [70.0, 78.97], [79.0, 98.14], [103.0, 116.95], [120.0, 123.15], [125.0, 129.05], [129.0, 133.81], [141.0, 173.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 100.0, 82.07, 53.16, 96.89, 88.28, 64.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.19, 0.59, -0.05, 0.27, 0.9, 1.38, 30.34, 13.5, 1.05, 1.06, 8.97, 19.14, 13.95, 3.15, 4.05, 4.81, 32.97]} \ No newline at end of file diff --git a/annotations_1/K_NTydd3MqM_filtered.json b/annotations_1/K_NTydd3MqM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0451c287b3fc46d3c7e86be462554bbef56d1d7 --- /dev/null +++ b/annotations_1/K_NTydd3MqM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.86], [3.0, 2.89], [3.0, 4.23], [8.0, 9.36], [10.0, 12.43], [35.0, 35.73], [54.0, 56.12], [73.0, 74.88], [77.0, 77.68], [89.0, 89.95], [100.0, 99.93], [103.0, 103.01], [110.0, 112.01], [120.0, 121.51], [122.0, 126.3], [133.0, 138.7], [140.0, 140.58], [144.0, 149.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 65.91, 0.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 36.11, 0.0, 29.45, 33.77, 0.0, 29.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 57.93], ["music", 11.17], ["didgeridoo", 8.2]], null, [["music", 52.06], ["speech", 5.19], ["vehicle", 4.35]], [["music", 32.43], ["throbbing", 15.42], ["hum", 8.62]], null, [["music", 77.54], ["speech", 4.79], ["boing", 2.12]]], "duration": [0.86, -0.11, 1.23, 1.36, 2.43, 0.73, 2.12, 1.88, 0.68, 0.95, -0.07, 0.01, 2.01, 1.51, 4.3, 5.7, 0.58, 5.49]} \ No newline at end of file diff --git a/annotations_1/KaLpXs1SDWo_filtered.json b/annotations_1/KaLpXs1SDWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bc615f6513f5798ebc0d00c4b5bbe6efef8da3d --- /dev/null +++ b/annotations_1/KaLpXs1SDWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 36.78], [37.0, 36.81], [37.0, 36.85], [41.0, 45.22], [47.0, 47.92], [49.0, 49.71], [51.0, 55.58], [57.0, 63.07], [66.0, 70.5], [75.0, 77.19], [78.0, 78.78], [80.0, 81.73], [83.0, 85.48], [86.0, 90.27], [92.0, 98.9]], "keep_status": [true, false, false, true, false, false, false, true, false, true, false, false, true, true, false], "silence_prob": [29.58, 0.0, 0.0, 31.38, 0.0, 0.0, 30.75, 30.53, 30.98, 38.74, 0.0, 0.0, 30.24, 29.35, 31.92], "audiomae_on_audioset": [[["whack, thwack", 31.43], ["cattle, bovinae", 21.57], ["moo", 10.99]], null, null, [["music", 19.08], ["speech", 18.91], ["hum", 10.3]], null, null, [["hum", 53.54], ["mains hum", 24.82], ["throbbing", 6.65]], [["music", 31.94], ["speech", 18.53], ["hum", 6.47]], [["speech", 63.72], ["cattle, bovinae", 3.74], ["outside, urban or manmade", 2.6]], [["music", 49.51], ["hum", 9.74], ["throbbing", 6.87]], null, null, [["music", 17.31], ["boom", 13.65], ["hum", 12.98]], [["cattle, bovinae", 16.13], ["livestock, farm animals, working animals", 14.83], ["moo", 10.33]], [["music", 75.81], ["cacophony", 4.37], ["hum", 0.96]]], "duration": [15.78, -0.19, -0.15, 4.22, 0.92, 0.71, 4.58, 6.07, 4.5, 2.19, 0.78, 1.73, 2.48, 4.27, 6.9]} \ No newline at end of file diff --git a/annotations_1/KaVglFjQynk_filtered.json b/annotations_1/KaVglFjQynk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53a4210c19fbc4c7d0781089c80ba1df7728019c --- /dev/null +++ b/annotations_1/KaVglFjQynk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.27], [17.0, 28.65], [30.0, 38.47], [42.0, 43.07], [45.0, 45.5], [47.0, 47.55], [55.0, 57.43], [60.0, 61.69], [68.0, 68.15], [69.0, 69.38], [70.0, 73.21], [77.0, 77.06], [78.0, 78.22], [82.0, 86.56], [88.0, 88.74], [98.0, 98.34], [102.0, 105.76], [107.0, 115.1], [117.0, 117.76], [122.0, 126.86], [130.0, 130.42]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.99, 35.32, 33.68, 0.0, 0.0, 0.0, 74.13, 0.0, 0.0, 0.0, 54.7, 0.0, 0.0, 38.27, 0.0, 0.0, 42.24, 36.72, 0.0, 55.96, 0.0], "audiomae_on_audioset": [[["music", 48.62], ["speech", 13.29], ["hum", 3.09]], [["music", 52.57], ["boing", 20.51], ["quack", 12.02]], [["music", 50.3], ["speech", 32.12], ["boing", 3.56]], null, null, null, null, null, null, null, null, null, null, [["music", 45.74], ["carnatic music", 37.21], ["musical instrument", 2.08]], null, null, [["music", 45.33], ["speech", 24.21], ["throbbing", 5.54]], [["speech", 67.11], ["music", 12.32], ["fart", 2.83]], null, null, null], "duration": [6.27, 11.65, 8.47, 1.07, 0.5, 0.55, 2.43, 1.69, 0.15, 0.38, 3.21, 0.06, 0.22, 4.56, 0.74, 0.34, 3.76, 8.1, 0.76, 4.86, 0.42]} \ No newline at end of file diff --git a/annotations_1/KaqzKhM9-nU_filtered.json b/annotations_1/KaqzKhM9-nU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42fb7d0d90627d33f7e8e997fbd5417bb0eee9dc --- /dev/null +++ b/annotations_1/KaqzKhM9-nU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.72], [15.0, 15.4], [17.0, 17.78], [25.0, 26.35], [28.0, 29.4], [30.0, 30.59], [31.0, 32.7], [33.0, 34.64], [65.0, 65.37], [75.0, 75.25], [76.0, 76.69], [80.0, 83.25], [100.0, 100.53], [101.0, 102.93], [109.0, 110.1], [112.0, 112.72], [132.0, 132.85], [142.0, 142.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 53.14], ["speech", 26.26], ["boing", 9.36]], null, null, null, null, null, null], "duration": [2.72, 0.4, 0.78, 1.35, 1.4, 0.59, 1.7, 1.64, 0.37, 0.25, 0.69, 3.25, 0.53, 1.93, 1.1, 0.72, 0.85, 0.77]} \ No newline at end of file diff --git a/annotations_1/Kb2WClrbrAc_filtered.json b/annotations_1/Kb2WClrbrAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86f49fb1f26822a7879e96e09865477694136883 --- /dev/null +++ b/annotations_1/Kb2WClrbrAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [5.0, 5.58], [6.0, 8.29], [20.0, 21.0], [23.0, 25.12], [30.0, 30.67], [41.0, 41.89], [43.0, 45.06], [50.0, 51.16], [52.0, 53.43], [57.0, 57.94], [61.0, 61.82], [64.0, 64.77], [70.0, 70.36], [72.0, 73.2], [75.0, 76.99], [79.0, 79.42], [82.0, 83.34], [87.0, 88.45], [95.0, 95.89], [99.0, 100.72], [103.0, 105.19], [105.0, 105.78], [107.0, 107.87], [109.0, 114.25], [115.0, 116.02], [117.0, 118.56], [126.0, 127.5], [129.0, 131.16], [132.0, 174.61], [176.0, 195.88], [197.0, 197.14], [198.0, 201.5], [202.0, 202.24], [205.0, 204.84], [206.0, 211.08], [215.0, 222.71], [226.0, 241.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [0.0, 0.0, 79.41, 0.0, 92.64, 0.0, 0.0, 65.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 98.36, 0.0, 33.22, 0.0, 35.11, 0.0, 0.0, 31.47, 36.11, 33.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 69.74], ["scary music", 18.88], ["soundtrack music", 3.28]], null, [["speech", 27.17], ["music", 17.62], ["hum", 11.61]], null, null, [["music", 36.43], ["speech", 14.83], ["didgeridoo", 11.87]], [["hum", 50.4], ["mains hum", 17.85], ["throbbing", 9.88]], [["music", 21.37], ["speech", 12.92], ["throbbing", 9.77]]], "duration": [0.51, 0.58, 2.29, 1.0, 2.12, 0.67, 0.89, 2.06, 1.16, 1.43, 0.94, 0.82, 0.77, 0.36, 1.2, 1.99, 0.42, 1.34, 1.45, 0.89, 1.72, 2.19, 0.78, 0.87, 5.25, 1.02, 1.56, 1.5, 2.16, 42.61, 19.88, 0.14, 3.5, 0.24, -0.16, 5.08, 7.71, 15.44]} \ No newline at end of file diff --git a/annotations_1/KbRMCmnLU8o_filtered.json b/annotations_1/KbRMCmnLU8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3710112c2af022f404dcd752898396d9bd8b345d --- /dev/null +++ b/annotations_1/KbRMCmnLU8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 25.0], [26.0, 26.89], [29.0, 29.51], [31.0, 31.7], [33.0, 33.08], [34.0, 35.24], [38.0, 39.53], [42.0, 46.4], [48.0, 48.3], [51.0, 51.07], [53.0, 53.92], [57.0, 59.91], [62.0, 62.36], [67.0, 70.87], [71.0, 74.63], [76.0, 77.36], [79.0, 79.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11, 0.0, 0.0, 0.0, 52.92, 0.0, 68.41, 62.99, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 67.9], ["thunk", 4.49], ["sidetone", 3.6]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.0, 0.89, 0.51, 0.7, 0.08, 1.24, 1.53, 4.4, 0.3, 0.07, 0.92, 2.91, 0.36, 3.87, 3.63, 1.36, 0.64]} \ No newline at end of file diff --git a/annotations_1/KblaujDjQ4g_filtered.json b/annotations_1/KblaujDjQ4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e2e6e5ef8795ca1b9939bb3c5e59e5d462ed1b5 --- /dev/null +++ b/annotations_1/KblaujDjQ4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.06], [5.0, 7.18], [10.0, 10.62], [12.0, 28.63], [32.0, 33.37], [34.0, 35.46], [39.0, 39.8], [41.0, 40.86], [42.0, 45.67], [47.0, 48.24], [51.0, 52.32], [54.0, 54.21], [59.0, 59.58], [62.0, 63.0], [66.0, 65.82], [67.0, 68.13], [69.0, 70.29], [76.0, 76.47], [83.0, 84.23], [86.0, 86.58], [92.0, 92.18], [95.0, 95.3], [97.0, 97.97], [99.0, 100.31], [102.0, 105.14], [108.0, 108.06], [108.0, 110.56], [113.0, 114.74], [122.0, 123.08], [124.0, 124.95], [127.0, 127.7], [132.0, 132.87], [135.0, 135.77], [136.0, 137.35], [138.0, 144.58], [145.0, 148.19], [150.0, 151.78], [158.0, 158.7], [163.0, 165.05], [168.0, 169.6], [176.0, 179.34], [182.0, 182.8], [183.0, 183.63], [184.0, 185.7], [186.0, 188.76], [189.0, 191.69], [192.0, 195.84], [201.0, 213.36], [214.0, 215.57]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [99.05, 75.88, 0.0, 33.92, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.46, 0.0, 53.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 64.52, 0.0, 0.0, 98.1, 0.0, 97.43, 0.0, 0.0, 0.0, 58.64, 61.67, 62.07, 36.32, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 39.63], ["musical instrument", 11.07], ["didgeridoo", 7.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 33.2], ["music", 27.29], ["throbbing", 17.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 21.18], ["hum", 19.28], ["music", 17.34]], null], "duration": [2.06, 2.18, 0.62, 16.63, 1.37, 1.46, 0.8, -0.14, 3.67, 1.24, 1.32, 0.21, 0.58, 1.0, -0.18, 1.13, 1.29, 0.47, 1.23, 0.58, 0.18, 0.3, 0.97, 1.31, 3.14, 0.06, 2.56, 1.74, 1.08, 0.95, 0.7, 0.87, 0.77, 1.35, 6.58, 3.19, 1.78, 0.7, 2.05, 1.6, 3.34, 0.8, 0.63, 1.7, 2.76, 2.69, 3.84, 12.36, 1.57]} \ No newline at end of file diff --git a/annotations_1/KccpJ0xD-7E_filtered.json b/annotations_1/KccpJ0xD-7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..411bd860ef740f7d4c572aa8b1315302d96af154 --- /dev/null +++ b/annotations_1/KccpJ0xD-7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.79], [28.0, 28.7], [32.0, 41.74], [46.0, 48.64], [50.0, 51.41], [57.0, 65.79], [67.0, 67.88], [69.0, 88.96], [93.0, 94.49], [96.0, 96.58], [97.0, 100.72], [105.0, 110.46], [112.0, 134.45], [136.0, 150.35], [153.0, 154.52], [168.0, 168.59], [171.0, 171.96], [175.0, 175.83]], "keep_status": [false, false, true, true, false, true, false, true, false, false, true, false, false, true, false, false, false, false], "silence_prob": [78.21, 0.0, 37.72, 33.97, 0.0, 35.05, 0.0, 30.77, 0.0, 0.0, 35.7, 30.08, 30.31, 29.03, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 29.7], ["music", 25.89], ["mains hum", 14.25]], [["music", 26.76], ["buzz", 9.92], ["fly, housefly", 7.0]], null, [["mosquito", 34.24], ["fly, housefly", 16.22], ["music", 14.45]], null, [["music", 32.28], ["smash, crash", 18.38], ["sound effect", 14.35]], null, null, [["speech", 44.53], ["music", 14.36], ["hum", 6.31]], [["music", 77.57], ["electronic music", 3.12], ["speech", 2.12]], [["speech", 44.69], ["machine gun", 16.94], ["music", 16.77]], [["music", 19.19], ["vehicle", 18.08], ["car", 15.31]], null, null, null, null], "duration": [3.79, 0.7, 9.74, 2.64, 1.41, 8.79, 0.88, 19.96, 1.49, 0.58, 3.72, 5.46, 22.45, 14.35, 1.52, 0.59, 0.96, 0.83]} \ No newline at end of file diff --git a/annotations_1/Kcmz-QxexRo_filtered.json b/annotations_1/Kcmz-QxexRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00250a135099b1c52a6aeb634a42759ae3977d09 --- /dev/null +++ b/annotations_1/Kcmz-QxexRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.26], [10.0, 10.76], [12.0, 12.7], [17.0, 19.55], [20.0, 21.0], [22.0, 23.18], [30.0, 30.69], [36.0, 35.94], [38.0, 38.91], [41.0, 42.45], [43.0, 43.97], [45.0, 46.57], [47.0, 47.87], [48.0, 50.45], [57.0, 56.88], [71.0, 71.24], [74.0, 73.89], [81.0, 82.49], [83.0, 84.45], [103.0, 103.84], [105.0, 106.29], [110.0, 112.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.14], ["radio", 26.14], ["inside, small room", 2.56]], null, null, null, null, null, null, null, null], "duration": [1.26, 0.76, 0.7, 2.55, 1.0, 1.18, 0.69, -0.06, 0.91, 1.45, 0.97, 1.57, 0.87, 2.45, -0.12, 0.24, -0.11, 1.49, 1.45, 0.84, 1.29, 2.11]} \ No newline at end of file diff --git a/annotations_1/KdOgihoZjZY_filtered.json b/annotations_1/KdOgihoZjZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e824fa82c41c8069a5d06f44731b245d810b3e42 --- /dev/null +++ b/annotations_1/KdOgihoZjZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.88], [25.0, 26.4], [28.0, 28.36], [39.0, 41.81], [46.0, 46.53], [48.0, 48.56], [50.0, 50.43], [53.0, 53.2], [56.0, 57.1], [58.0, 57.55], [58.0, 64.99], [82.0, 83.61], [89.0, 90.24], [95.0, 95.01], [108.0, 108.9], [111.0, 111.3], [112.0, 116.18], [118.0, 118.76], [119.0, 119.82], [121.0, 122.94], [127.0, 131.68], [132.0, 134.05], [135.0, 135.68], [145.0, 145.52], [147.0, 149.96], [152.0, 152.29], [154.0, 155.33]], "keep_status": [true, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, true, false, false, false, true, false, false], "silence_prob": [30.39, 0.0, 0.0, 32.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.7, 0.0, 0.0, 0.0, 0.0, 0.0, 34.92, 0.0, 0.0, 0.0, 28.94, 34.8, 0.0, 0.0, 36.28, 0.0, 0.0], "audiomae_on_audioset": [[["foghorn", 17.38], ["speech", 14.71], ["whip", 9.49]], null, null, [["speech", 20.9], ["gong", 19.34], ["music", 13.52]], null, null, null, null, null, null, [["speech", 43.5], ["explosion", 20.36], ["burst, pop", 5.33]], null, null, null, null, null, [["music", 26.37], ["speech", 20.82], ["hum", 9.08]], null, null, null, [["music", 20.19], ["buzz", 8.2], ["explosion", 7.42]], [["gong", 63.86], ["music", 22.07], ["musical instrument", 1.18]], null, null, [["animal", 39.88], ["howl", 18.79], ["dog", 10.31]], null, null], "duration": [2.88, 1.4, 0.36, 2.81, 0.53, 0.56, 0.43, 0.2, 1.1, -0.45, 6.99, 1.61, 1.24, 0.01, 0.9, 0.3, 4.18, 0.76, 0.82, 1.94, 4.68, 2.05, 0.68, 0.52, 2.96, 0.29, 1.33]} \ No newline at end of file diff --git a/annotations_1/Kdu22nQNZmQ_filtered.json b/annotations_1/Kdu22nQNZmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87e556013b06990dc8d990f54cff6a2e44ba1080 --- /dev/null +++ b/annotations_1/Kdu22nQNZmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 23.45], [26.0, 61.74], [65.0, 80.72], [87.0, 100.06], [105.0, 106.71], [111.0, 115.7], [119.0, 122.5], [124.0, 124.19], [125.0, 154.06], [155.0, 160.56]], "keep_status": [true, false, true, true, false, true, false, false, true, false], "silence_prob": [30.53, 0.0, 29.66, 30.13, 0.0, 29.97, 30.56, 0.0, 29.93, 30.17], "audiomae_on_audioset": [[["music", 36.34], ["hum", 19.9], ["mains hum", 13.6]], null, [["hum", 26.03], ["music", 19.08], ["speech", 15.74]], [["music", 30.3], ["speech", 20.2], ["didgeridoo", 16.04]], null, [["music", 36.35], ["hum", 15.58], ["speech", 14.86]], [["music", 55.84], ["didgeridoo", 8.19], ["throbbing", 6.12]], null, [["music", 57.82], ["synthesizer", 6.79], ["didgeridoo", 4.97]], [["music", 63.94], ["ambient music", 9.13], ["theremin", 4.29]]], "duration": [16.45, 35.74, 15.72, 13.06, 1.71, 4.7, 3.5, 0.19, 29.06, 5.56]} \ No newline at end of file diff --git a/annotations_1/Ke-MYW3XORg_filtered.json b/annotations_1/Ke-MYW3XORg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b939abdcf67e1cf9fcf58377dcdbf2858cba0832 --- /dev/null +++ b/annotations_1/Ke-MYW3XORg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.48], [14.0, 14.25], [21.0, 23.63], [24.0, 24.83], [26.0, 26.91], [27.0, 28.32], [29.0, 30.28], [31.0, 31.83], [35.0, 35.56], [36.0, 37.39], [38.0, 46.26], [47.0, 47.21], [48.0, 54.46], [57.0, 57.4], [58.0, 58.68], [61.0, 61.82], [65.0, 65.37], [70.0, 70.85], [74.0, 75.9], [77.0, 78.17], [80.0, 80.65], [82.0, 83.12], [97.0, 97.53], [103.0, 108.21], [109.0, 111.67], [113.0, 113.9], [116.0, 122.81], [126.0, 126.06], [126.0, 126.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 30.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.23, 31.76, 0.0, 28.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 25.8], ["speech", 24.54], ["whack, thwack", 6.58]], null, [["music", 32.62], ["hum", 12.41], ["animal", 8.64]], null, null, null, null, null, null, null, null, null, null, [["boing", 53.97], ["speech", 17.16], ["echo", 2.93]], [["grunt", 12.8], ["music", 9.53], ["animal", 8.24]], null, [["music", 85.12], ["musical instrument", 1.61], ["mosquito", 1.01]], null, null], "duration": [0.48, 0.25, 2.63, 0.83, 0.91, 1.32, 1.28, 0.83, 0.56, 1.39, 8.26, 0.21, 6.46, 0.4, 0.68, 0.82, 0.37, 0.85, 1.9, 1.17, 0.65, 1.12, 0.53, 5.21, 2.67, 0.9, 6.81, 0.06, 0.22]} \ No newline at end of file diff --git a/annotations_1/Kei4Jlhhz-Q_filtered.json b/annotations_1/Kei4Jlhhz-Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5354de08a523e4583ae25902b9650175e47bd6b --- /dev/null +++ b/annotations_1/Kei4Jlhhz-Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.95], [4.0, 4.11], [5.0, 5.59], [8.0, 7.94], [12.0, 13.49], [14.0, 14.44], [16.0, 15.92], [19.0, 19.45], [48.0, 48.05], [50.0, 55.26], [64.0, 66.06], [67.0, 71.88], [77.0, 83.94], [86.0, 86.58], [89.0, 89.9], [105.0, 105.49], [112.0, 112.68], [113.0, 113.9], [114.0, 116.9], [117.0, 116.97], [117.0, 118.1]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.56, 32.29, 31.2, 31.3, 0.0, 0.0, 0.0, 0.0, 0.0, 58.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 25.01], ["speech", 21.25], ["hum", 16.11]], [["music", 23.9], ["mains hum", 17.17], ["hum", 11.38]], [["music", 35.5], ["speech", 18.1], ["sidetone", 17.11]], [["music", 78.13], ["carnatic music", 3.31], ["sitar", 3.3]], null, null, null, null, null, null, null, null], "duration": [-0.05, 0.11, 0.59, -0.06, 1.49, 0.44, -0.08, 0.45, 0.05, 5.26, 2.06, 4.88, 6.94, 0.58, 0.9, 0.49, 0.68, 0.9, 2.9, -0.03, 1.1]} \ No newline at end of file diff --git a/annotations_1/KeiJDMd8loM_filtered.json b/annotations_1/KeiJDMd8loM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5be638101d4787ac75e3a25c10e21b2b9a2e23d5 --- /dev/null +++ b/annotations_1/KeiJDMd8loM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 18.84], [22.0, 44.79], [49.0, 56.1], [59.0, 66.04], [66.0, 102.71], [104.0, 123.13], [123.0, 131.14]], "keep_status": [true, true, true, true, false, true, true], "silence_prob": [31.5, 35.7, 29.36, 34.85, 0.0, 30.98, 30.02], "audiomae_on_audioset": [[["speech", 40.19], ["grunt", 12.81], ["echo", 5.3]], [["speech", 56.16], ["explosion", 6.56], ["hum", 5.63]], [["speech", 30.82], ["hum", 17.2], ["throbbing", 12.15]], [["speech", 40.43], ["hum", 7.52], ["throbbing", 7.26]], null, [["hum", 26.52], ["music", 17.7], ["throbbing", 16.95]], [["music", 38.79], ["speech", 27.05], ["electronic music", 4.04]]], "duration": [16.84, 22.79, 7.1, 7.04, 36.71, 19.13, 8.14]} \ No newline at end of file diff --git a/annotations_1/KekChFdIe00_filtered.json b/annotations_1/KekChFdIe00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8bfd4108cca8daa33a33989bba096f94742f9db --- /dev/null +++ b/annotations_1/KekChFdIe00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.53], [18.0, 19.03], [21.0, 21.3], [22.0, 23.14], [24.0, 24.73], [26.0, 25.98], [33.0, 33.59], [46.0, 47.04], [56.0, 57.1], [58.0, 57.89], [61.0, 61.96], [63.0, 64.18], [66.0, 66.29], [68.0, 68.64], [70.0, 71.02], [79.0, 79.69], [82.0, 83.15], [83.0, 87.51], [89.0, 91.91], [93.0, 94.47], [97.0, 97.65], [102.0, 102.9], [106.0, 107.54], [140.0, 140.7], [148.0, 148.2], [149.0, 149.91], [158.0, 171.81], [173.0, 173.8], [174.0, 174.92], [176.0, 177.87], [180.0, 181.03], [183.0, 184.69], [186.0, 187.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 1.03, 0.3, 1.14, 0.73, -0.02, 0.59, 1.04, 1.1, -0.11, 0.96, 1.18, 0.29, 0.64, 1.02, 0.69, 1.15, 4.51, 2.91, 1.47, 0.65, 0.9, 1.54, 0.7, 0.2, 0.91, 13.81, 0.8, 0.92, 1.87, 1.03, 1.69, 1.83]} \ No newline at end of file diff --git a/annotations_1/Kekb8jHfDxI_filtered.json b/annotations_1/Kekb8jHfDxI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80906cb1ef40e8dfa5b3492fdb3b3bd62519892f --- /dev/null +++ b/annotations_1/Kekb8jHfDxI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.92], [5.0, 6.03], [8.0, 8.21], [20.0, 20.04], [22.0, 24.0], [25.0, 110.56], [111.0, 122.25], [123.0, 124.98], [126.0, 130.05], [130.0, 131.6]], "keep_status": [false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 28.5, 0.0, 30.47, 0.0, 32.19, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 28.61], ["boom", 15.8], ["whack, thwack", 9.13]], null, [["speech", 51.0], ["music", 14.43], ["noise", 4.95]], null, [["hum", 28.51], ["throbbing", 26.61], ["music", 17.03]], null], "duration": [0.92, 1.03, 0.21, 0.04, 2.0, 85.56, 11.25, 1.98, 4.05, 1.6]} \ No newline at end of file diff --git a/annotations_1/KfAm5nyHM3U_filtered.json b/annotations_1/KfAm5nyHM3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18956987fbf9a25bb1d03c0f10e4cbe2aa47647e --- /dev/null +++ b/annotations_1/KfAm5nyHM3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[62.0, 63.44], [64.0, 125.81], [127.0, 130.52]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 59.42], "audiomae_on_audioset": [null, null, null], "duration": [1.44, 61.81, 3.52]} \ No newline at end of file diff --git a/annotations_1/KfxQi9_BfHI_filtered.json b/annotations_1/KfxQi9_BfHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5763353b8f8c4a65b98d45783ceb71f253a4c0f --- /dev/null +++ b/annotations_1/KfxQi9_BfHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.39], [19.0, 25.24], [26.0, 27.14], [40.0, 41.0], [42.0, 42.26], [49.0, 49.54], [52.0, 52.17], [52.0, 52.91], [56.0, 55.83], [57.0, 57.59], [59.0, 59.8], [61.0, 65.69], [66.0, 72.0], [73.0, 74.07], [75.0, 77.28], [87.0, 96.18]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 34.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.12, 30.8, 0.0, 31.24, 30.64], "audiomae_on_audioset": [null, [["cattle, bovinae", 18.55], ["music", 17.68], ["speech", 13.07]], null, null, null, null, null, null, null, null, null, [["music", 17.18], ["sidetone", 15.37], ["whale vocalization", 11.57]], [["livestock, farm animals, working animals", 33.72], ["cattle, bovinae", 33.41], ["moo", 27.78]], null, [["music", 48.04], ["speech", 25.04], ["percussion", 2.44]], [["music", 38.75], ["hum", 23.86], ["throbbing", 19.46]]], "duration": [0.39, 6.24, 1.14, 1.0, 0.26, 0.54, 0.17, 0.91, -0.17, 0.59, 0.8, 4.69, 6.0, 1.07, 2.28, 9.18]} \ No newline at end of file diff --git a/annotations_1/Kfzxu_SIzGo_filtered.json b/annotations_1/Kfzxu_SIzGo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..801af18b9297bfca2e3bef8f9cbf3ed56db1401b --- /dev/null +++ b/annotations_1/Kfzxu_SIzGo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 102.36], [110.0, 111.05], [116.0, 118.27], [120.0, 128.49], [130.0, 131.75], [133.0, 133.51], [135.0, 136.54], [143.0, 156.29], [159.0, 167.58]], "keep_status": [false, false, true, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 39.34, 41.81, 0.0, 0.0, 0.0, 38.26, 28.16], "audiomae_on_audioset": [null, null, [["whale vocalization", 9.92], ["music", 8.07], ["noise", 7.25]], [["speech", 60.08], ["gong", 4.93], ["hum", 4.41]], null, null, null, [["buzz", 19.64], ["music", 18.43], ["hum", 7.77]], [["vehicle", 16.36], ["car", 10.42], ["hum", 7.89]]], "duration": [102.36, 1.05, 2.27, 8.49, 1.75, 0.51, 1.54, 13.29, 8.58]} \ No newline at end of file diff --git a/annotations_1/KgmFWHZXmiY_filtered.json b/annotations_1/KgmFWHZXmiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a81e3d94b2d2ba7e4a17337ccb44b48298e789d6 --- /dev/null +++ b/annotations_1/KgmFWHZXmiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.5], [6.0, 6.29], [8.0, 8.95], [11.0, 13.26], [14.0, 15.79], [17.0, 18.67], [22.0, 28.24], [30.0, 33.88], [35.0, 35.51], [37.0, 42.94], [53.0, 54.78], [68.0, 69.09], [70.0, 71.05], [74.0, 74.29], [75.0, 75.52], [82.0, 81.62], [84.0, 85.26], [95.0, 95.66], [98.0, 98.39], [100.0, 100.77], [102.0, 102.9], [114.0, 114.29], [115.0, 115.89], [120.0, 120.14], [127.0, 127.55], [157.0, 162.14], [167.0, 166.87]], "keep_status": [false, false, false, true, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 48.95, 0.0, 0.0, 34.75, 34.63, 0.0, 34.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.03, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 20.26], ["heart sounds, heartbeat", 11.07], ["throbbing", 9.16]], null, null, [["vehicle", 13.99], ["rumble", 13.4], ["music", 10.93]], [["hum", 28.91], ["music", 17.39], ["mains hum", 13.68]], null, [["speech", 19.78], ["vehicle", 12.32], ["rumble", 5.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 19.36], ["gunshot, gunfire", 14.43], ["artillery fire", 14.42]], null], "duration": [0.5, 0.29, 0.95, 2.26, 1.79, 1.67, 6.24, 3.88, 0.51, 5.94, 1.78, 1.09, 1.05, 0.29, 0.52, -0.38, 1.26, 0.66, 0.39, 0.77, 0.9, 0.29, 0.89, 0.14, 0.55, 5.14, -0.13]} \ No newline at end of file diff --git a/annotations_1/KgnrxjgHngA_filtered.json b/annotations_1/KgnrxjgHngA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fafa8f15b10694efdf076a53d6f74c5591555ffd --- /dev/null +++ b/annotations_1/KgnrxjgHngA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.45], [5.0, 14.1], [15.0, 17.59], [18.0, 26.23], [30.0, 42.99], [49.0, 73.6], [74.0, 88.48], [91.0, 97.34], [98.0, 98.61], [100.0, 101.07], [105.0, 114.72], [117.0, 127.97]], "keep_status": [false, false, true, true, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 39.4, 40.66, 39.86, 39.14, 35.42, 31.55, 31.9, 0.0, 0.0, 29.66, 31.73], "audiomae_on_audioset": [null, [["music", 55.11], ["theremin", 8.8], ["didgeridoo", 7.35]], [["music", 43.72], ["bell", 4.23], ["glockenspiel", 3.72]], [["music", 52.94], ["speech", 5.8], ["theremin", 3.0]], [["music", 62.83], ["didgeridoo", 11.66], ["bell", 1.69]], [["music", 55.93], ["didgeridoo", 7.22], ["bell", 5.63]], [["music", 59.57], ["throbbing", 7.63], ["bell", 6.65]], [["throbbing", 35.97], ["music", 20.5], ["hum", 3.31]], null, null, [["music", 56.49], ["speech", 12.89], ["boing", 2.91]], [["speech", 57.69], ["explosion", 6.88], ["whack, thwack", 4.89]]], "duration": [1.45, 9.1, 2.59, 8.23, 12.99, 24.6, 14.48, 6.34, 0.61, 1.07, 9.72, 10.97]} \ No newline at end of file diff --git a/annotations_1/KhS2-vKr1JY_filtered.json b/annotations_1/KhS2-vKr1JY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee08e1c0a926b8c606d21fd32ff59e438c6c20da --- /dev/null +++ b/annotations_1/KhS2-vKr1JY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.53], [19.0, 22.54], [24.0, 38.91], [40.0, 58.9], [61.0, 62.19], [65.0, 66.65], [68.0, 69.55], [72.0, 86.64], [90.0, 90.86], [91.0, 96.06], [101.0, 104.67], [107.0, 108.6], [116.0, 117.1], [118.0, 126.6], [128.0, 127.85], [130.0, 132.41], [139.0, 139.35], [143.0, 142.94], [145.0, 148.17], [150.0, 150.28], [154.0, 154.97], [157.0, 157.25], [161.0, 163.44], [169.0, 174.78], [178.0, 178.78], [180.0, 184.2], [185.0, 191.61], [193.0, 193.46], [194.0, 200.74], [205.0, 207.47]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 89.01, 45.65, 34.97, 0.0, 0.0, 0.0, 39.12, 0.0, 40.48, 41.32, 0.0, 0.0, 35.47, 0.0, 35.79, 0.0, 0.0, 32.82, 0.0, 0.0, 0.0, 34.52, 31.32, 0.0, 31.5, 31.18, 0.0, 32.85, 34.05], "audiomae_on_audioset": [null, null, [["throbbing", 39.52], ["music", 22.91], ["hum", 22.47]], [["music", 79.67], ["ambient music", 2.77], ["synthesizer", 2.02]], null, null, null, [["music", 43.98], ["bleat", 6.37], ["livestock, farm animals, working animals", 5.59]], null, [["music", 41.18], ["throbbing", 25.73], ["hum", 10.65]], [["music", 56.27], ["hum", 18.27], ["throbbing", 4.74]], null, null, [["music", 42.86], ["throbbing", 24.32], ["hum", 21.72]], null, [["music", 67.92], ["throbbing", 8.24], ["hum", 3.29]], null, null, [["music", 83.23], ["singing", 1.37], ["mantra", 1.26]], null, null, null, [["music", 36.65], ["mosquito", 6.74], ["didgeridoo", 6.27]], [["music", 69.29], ["didgeridoo", 3.46], ["singing", 2.77]], null, [["music", 38.29], ["throbbing", 36.98], ["hum", 9.97]], [["music", 66.39], ["throbbing", 3.4], ["hum", 2.41]], null, [["music", 70.53], ["theremin", 10.32], ["didgeridoo", 2.02]], [["music", 68.83], ["mantra", 6.44], ["musical instrument", 3.21]]], "duration": [1.53, 3.54, 14.91, 18.9, 1.19, 1.65, 1.55, 14.64, 0.86, 5.06, 3.67, 1.6, 1.1, 8.6, -0.15, 2.41, 0.35, -0.06, 3.17, 0.28, 0.97, 0.25, 2.44, 5.78, 0.78, 4.2, 6.61, 0.46, 6.74, 2.47]} \ No newline at end of file diff --git a/annotations_1/Kiw89e1mHpM_filtered.json b/annotations_1/Kiw89e1mHpM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83f08c358eb64b318d7598e45b3ad794d6658195 --- /dev/null +++ b/annotations_1/Kiw89e1mHpM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.86], [4.0, 4.72], [6.0, 7.8], [10.0, 11.42], [16.0, 16.82], [18.0, 18.47], [22.0, 22.62], [25.0, 25.32], [36.0, 36.24], [38.0, 42.15], [44.0, 44.09], [48.0, 49.91], [51.0, 52.49], [54.0, 55.54], [57.0, 57.01], [59.0, 64.2], [66.0, 67.83], [69.0, 77.53], [79.0, 79.93], [81.0, 122.94], [123.0, 123.25], [124.0, 139.33], [140.0, 141.49], [142.0, 144.27], [146.0, 146.43], [149.0, 165.5], [167.0, 185.45], [186.0, 192.54], [193.0, 193.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 65.79, 0.0, 41.6, 0.0, 0.0, 0.0, 32.28, 0.0, 28.42, 0.0, 29.66, 32.29, 29.69, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["bow-wow", 14.17], ["boing", 12.7], ["animal", 8.22]], null, null, null, [["music", 31.85], ["throbbing", 29.27], ["hum", 17.48]], null, [["music", 15.99], ["speech", 13.47], ["whoosh, swoosh, swish", 8.11]], null, [["music", 80.95], ["speech", 10.68], ["electronic music", 2.48]], [["music", 34.7], ["speech", 15.98], ["thump, thud", 6.15]], [["speech", 45.03], ["music", 36.54], ["didgeridoo", 3.29]], null], "duration": [0.86, 0.72, 1.8, 1.42, 0.82, 0.47, 0.62, 0.32, 0.24, 4.15, 0.09, 1.91, 1.49, 1.54, 0.01, 5.2, 1.83, 8.53, 0.93, 41.94, 0.25, 15.33, 1.49, 2.27, 0.43, 16.5, 18.45, 6.54, 0.83]} \ No newline at end of file diff --git a/annotations_1/KjWPSq6-Ets_filtered.json b/annotations_1/KjWPSq6-Ets_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48aeb3e42f5bc8e98ae5e30df91c037593978b04 --- /dev/null +++ b/annotations_1/KjWPSq6-Ets_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.17], [30.0, 30.35], [39.0, 44.96], [55.0, 55.59], [58.0, 58.92], [73.0, 76.5], [82.0, 85.51], [86.0, 87.64], [90.0, 92.21], [93.0, 93.36], [112.0, 112.62], [117.0, 117.05], [118.0, 118.49], [123.0, 123.62], [125.0, 125.04], [127.0, 136.56], [137.0, 137.32], [141.0, 142.69], [150.0, 150.43], [151.0, 150.82], [152.0, 152.14], [167.0, 171.05], [172.0, 178.34], [182.0, 183.71], [187.0, 189.11], [191.0, 192.72], [197.0, 199.05], [201.0, 201.46], [203.0, 216.46]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 31.18, 0.0, 0.0, 29.9, 33.9, 0.0, 32.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.68, 0.0, 0.0, 0.0, 0.0, 0.0, 30.51, 35.22, 0.0, 42.13, 0.0, 32.61, 0.0, 28.65], "audiomae_on_audioset": [null, null, [["music", 18.51], ["speech", 11.15], ["throbbing", 8.04]], null, null, [["music", 49.6], ["roar", 4.82], ["didgeridoo", 4.54]], [["music", 80.84], ["didgeridoo", 2.29], ["musical instrument", 2.29]], null, [["music", 70.93], ["cacophony", 3.99], ["smash, crash", 2.89]], null, null, null, null, null, null, [["music", 71.16], ["throbbing", 5.78], ["speech", 5.69]], null, null, null, null, null, [["music", 50.91], ["buzz", 12.37], ["speech", 4.44]], [["music", 67.48], ["bleat", 16.64], ["sheep", 6.1]], null, [["music", 26.51], ["whimper", 22.59], ["speech", 10.03]], null, [["music", 45.18], ["speech", 16.16], ["dog", 4.98]], null, [["music", 69.71], ["synthesizer", 4.29], ["hum", 3.47]]], "duration": [0.17, 0.35, 5.96, 0.59, 0.92, 3.5, 3.51, 1.64, 2.21, 0.36, 0.62, 0.05, 0.49, 0.62, 0.04, 9.56, 0.32, 1.69, 0.43, -0.18, 0.14, 4.05, 6.34, 1.71, 2.11, 1.72, 2.05, 0.46, 13.46]} \ No newline at end of file diff --git a/annotations_1/KjbNSIIOEo4_filtered.json b/annotations_1/KjbNSIIOEo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b9150d509978d531fe3c2243fa0f3784544d0cb --- /dev/null +++ b/annotations_1/KjbNSIIOEo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 59.05], [59.0, 59.56], [60.0, 61.67], [62.0, 64.71], [65.0, 66.63], [75.0, 75.07], [86.0, 87.64], [92.0, 94.73], [97.0, 97.65], [100.0, 100.11], [101.0, 103.82], [104.0, 104.48], [105.0, 105.73], [111.0, 112.63], [113.0, 114.24]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 34.59, 0.0, 0.0, 45.4, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 44.1], ["throbbing", 8.07], ["hum", 4.48]], null, null, null, [["music", 38.56], ["quack", 13.96], ["speech", 7.98]], null, null, [["music", 67.65], ["throbbing", 5.66], ["electronic music", 2.83]], null, null, null, null], "duration": [40.05, 0.56, 1.67, 2.71, 1.63, 0.07, 1.64, 2.73, 0.65, 0.11, 2.82, 0.48, 0.73, 1.63, 1.24]} \ No newline at end of file diff --git a/annotations_1/KkBUMdYMw-8_filtered.json b/annotations_1/KkBUMdYMw-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0405e13c420f5aa3f5f9a6f6c688183875777af --- /dev/null +++ b/annotations_1/KkBUMdYMw-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 45.23], [47.0, 115.32]], "keep_status": [true, false], "silence_prob": [30.04, 0.0], "audiomae_on_audioset": [[["music", 52.62], ["speech", 10.71], ["electronic music", 6.14]], null], "duration": [4.23, 68.32]} \ No newline at end of file diff --git a/annotations_1/Kkl4-30oHVU_filtered.json b/annotations_1/Kkl4-30oHVU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb13014e8db56d0ea2c00e2c3ed657ee9c1a496d --- /dev/null +++ b/annotations_1/Kkl4-30oHVU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.85], [9.0, 13.2], [17.0, 17.52], [18.0, 19.36], [24.0, 31.95], [33.0, 33.05], [37.0, 38.13], [60.0, 60.32], [60.0, 60.79], [62.0, 63.02], [68.0, 68.55], [78.0, 78.06], [78.0, 78.29], [85.0, 86.07], [88.0, 88.42], [90.0, 90.8], [91.0, 92.4], [94.0, 95.45], [97.0, 97.6], [125.0, 127.63], [132.0, 137.51], [143.0, 143.48]], "keep_status": [true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [45.98, 34.93, 0.0, 0.0, 46.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.53, 38.25, 0.0], "audiomae_on_audioset": [[["speech", 21.04], ["livestock, farm animals, working animals", 13.86], ["cattle, bovinae", 11.2]], [["skidding", 26.02], ["vehicle", 25.52], ["car", 16.78]], null, null, [["speech", 54.14], ["vehicle", 7.24], ["car", 5.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 45.99], ["cattle, bovinae", 33.83], ["moo", 19.15]], [["livestock, farm animals, working animals", 20.78], ["speech", 18.04], ["cattle, bovinae", 13.51]], null], "duration": [4.85, 4.2, 0.52, 1.36, 7.95, 0.05, 1.13, 0.32, 0.79, 1.02, 0.55, 0.06, 0.29, 1.07, 0.42, 0.8, 1.4, 1.45, 0.6, 2.63, 5.51, 0.48]} \ No newline at end of file diff --git a/annotations_1/Km2lbJKGAqA_filtered.json b/annotations_1/Km2lbJKGAqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c559623846a7b7137740927d6f97facdfc1b4b5 --- /dev/null +++ b/annotations_1/Km2lbJKGAqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 13.39], [16.0, 16.53], [19.0, 31.11], [33.0, 40.39], [44.0, 45.57], [47.0, 51.02], [52.0, 74.04], [77.0, 77.85], [79.0, 82.88], [86.0, 86.81], [90.0, 95.66], [98.0, 105.39], [107.0, 109.61], [111.0, 111.48], [112.0, 112.6], [119.0, 121.69], [124.0, 130.1], [132.0, 133.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [89.54, 0.0, 77.03, 77.2, 0.0, 88.83, 67.38, 0.0, 98.27, 0.0, 68.15, 50.16, 45.08, 0.0, 0.0, 37.54, 39.49, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 69.82], ["musical instrument", 2.63], ["bleat", 2.37]], null, null, [["music", 35.8], ["bleat", 8.8], ["sheep", 7.24]], [["music", 45.12], ["theremin", 35.95], ["musical instrument", 3.45]], null], "duration": [10.39, 0.53, 12.11, 7.39, 1.57, 4.02, 22.04, 0.85, 3.88, 0.81, 5.66, 7.39, 2.61, 0.48, 0.6, 2.69, 6.1, 1.1]} \ No newline at end of file diff --git a/annotations_1/KnI9MBbPCT8_filtered.json b/annotations_1/KnI9MBbPCT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3feac381f099ef56fff617b3833ffab8c2daf13d --- /dev/null +++ b/annotations_1/KnI9MBbPCT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 52.22]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [46.22]} \ No newline at end of file diff --git a/annotations_1/KnPfaGzmt4M_filtered.json b/annotations_1/KnPfaGzmt4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b062b750f318602978c06798c75bdb8a2fe20bad --- /dev/null +++ b/annotations_1/KnPfaGzmt4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.65], [2.0, 3.21], [4.0, 6.42], [7.0, 6.89], [8.0, 8.31], [12.0, 12.7], [15.0, 15.38], [16.0, 16.78], [17.0, 17.95], [21.0, 21.91], [22.0, 24.43], [28.0, 30.52], [32.0, 32.76], [33.0, 34.11], [39.0, 43.7], [45.0, 46.52], [47.0, 49.44], [51.0, 54.14], [55.0, 54.95], [58.0, 59.93], [61.0, 65.16], [67.0, 67.09], [68.0, 70.77], [72.0, 73.01], [74.0, 75.03], [76.0, 76.71], [78.0, 84.2], [84.0, 84.81], [85.0, 84.86], [86.0, 86.9], [89.0, 90.14], [91.0, 91.81], [92.0, 94.69], [102.0, 105.53], [107.0, 106.95], [107.0, 111.28], [112.0, 119.57], [120.0, 124.24]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 47.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.92, 76.7, 0.0, 0.0, 50.02, 0.0, 100.0, 94.37, 0.0, 0.0, 99.98, 0.0, 46.86, 0.0, 0.0, 0.0, 30.51, 0.0, 0.0, 0.0, 0.0, 0.0, 36.8, 96.89, 0.0, 39.01, 29.18, 51.34], "audiomae_on_audioset": [null, null, [["frog", 28.1], ["speech", 11.21], ["animal", 7.06]], null, null, null, null, null, null, null, [["electric shaver, electric razor", 38.71], ["speech", 24.25], ["inside, small room", 6.36]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 92.44], ["sidetone", 1.66], ["inside, small room", 1.3]], null, null, null, [["speech", 74.16], ["electric shaver, electric razor", 7.37], ["sidetone", 6.17]], null, null, null, null, null, [["speech", 78.3], ["frog", 3.98], ["inside, small room", 3.96]], null, null, [["speech", 74.8], ["frog", 5.76], ["boing", 2.79]], [["explosion", 14.61], ["electric shaver, electric razor", 9.48], ["music", 6.75]], null], "duration": [0.65, 1.21, 2.42, -0.11, 0.31, 0.7, 0.38, 0.78, 0.95, 0.91, 2.43, 2.52, 0.76, 1.11, 4.7, 1.52, 2.44, 3.14, -0.05, 1.93, 4.16, 0.09, 2.77, 1.01, 1.03, 0.71, 6.2, 0.81, -0.14, 0.9, 1.14, 0.81, 2.69, 3.53, -0.05, 4.28, 7.57, 4.24]} \ No newline at end of file diff --git a/annotations_1/Ko8vqBmZRfE_filtered.json b/annotations_1/Ko8vqBmZRfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fb76d5b75a6f1fb3b4ffa272719e983013e6a55 --- /dev/null +++ b/annotations_1/Ko8vqBmZRfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.86], [36.0, 36.22]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.86, 0.22]} \ No newline at end of file diff --git a/annotations_1/KoY720x5fuw_filtered.json b/annotations_1/KoY720x5fuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ea9ae03c24dfdb7a8572fa3147bd19be706c17f --- /dev/null +++ b/annotations_1/KoY720x5fuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.33], [5.0, 5.14], [6.0, 6.72], [8.0, 8.9], [10.0, 13.9], [16.0, 17.54], [19.0, 19.9], [21.0, 30.43], [33.0, 35.16], [36.0, 47.71], [51.0, 58.53], [60.0, 62.87], [64.0, 64.27], [66.0, 71.79], [82.0, 90.14], [97.0, 122.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true], "silence_prob": [68.8, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 53.84, 61.27, 47.9, 40.7, 41.12, 0.0, 34.04, 30.93, 29.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 39.94], ["mains hum", 25.42], ["throbbing", 5.37]], [["speech", 87.35], ["clip-clop", 1.27], ["fart", 1.21]], [["speech", 17.49], ["moo", 12.99], ["cattle, bovinae", 11.62]], null, [["livestock, farm animals, working animals", 21.79], ["speech", 19.75], ["horse", 7.39]], [["speech", 52.85], ["cattle, bovinae", 9.27], ["livestock, farm animals, working animals", 4.45]], [["music", 37.67], ["speech", 8.85], ["groan", 4.26]]], "duration": [2.33, 0.14, 0.72, 0.9, 3.9, 1.54, 0.9, 9.43, 2.16, 11.71, 7.53, 2.87, 0.27, 5.79, 8.14, 25.5]} \ No newline at end of file diff --git a/annotations_1/Kpxk3UkX5s4_filtered.json b/annotations_1/Kpxk3UkX5s4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..150843ee22dae7f6108e9feb46c6531519682b68 --- /dev/null +++ b/annotations_1/Kpxk3UkX5s4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 23.52], [24.0, 42.23], [43.0, 44.04], [45.0, 47.71], [49.0, 50.6], [52.0, 52.34], [55.0, 55.97], [57.0, 60.71], [61.0, 64.32], [66.0, 68.79], [71.0, 71.19], [72.0, 73.28], [78.0, 79.34], [81.0, 82.17], [83.0, 94.02], [99.0, 104.48], [108.0, 114.08]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [54.23, 36.11, 0.0, 51.39, 0.0, 0.0, 0.0, 64.29, 51.02, 63.1, 0.0, 0.0, 0.0, 0.0, 37.36, 29.84, 30.14], "audiomae_on_audioset": [null, [["fly, housefly", 36.48], ["insect", 15.65], ["mosquito", 10.74]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.31], ["sidetone", 16.94], ["sine wave", 5.39]], [["music", 62.38], ["synthesizer", 6.33], ["musical instrument", 4.01]], [["speech", 52.24], ["whack, thwack", 15.16], ["music", 5.95]]], "duration": [19.52, 18.23, 1.04, 2.71, 1.6, 0.34, 0.97, 3.71, 3.32, 2.79, 0.19, 1.28, 1.34, 1.17, 11.02, 5.48, 6.08]} \ No newline at end of file diff --git a/annotations_1/Kq3TiuRC-VQ_filtered.json b/annotations_1/Kq3TiuRC-VQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b006abe8c82bb6dfda7bee9b5701122b97860a05 --- /dev/null +++ b/annotations_1/Kq3TiuRC-VQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 23.99], [25.0, 34.32], [36.0, 37.64], [41.0, 52.56], [56.0, 57.27], [76.0, 77.09], [83.0, 83.37], [84.0, 84.55], [91.0, 94.04], [103.0, 103.71], [106.0, 106.71], [108.0, 108.24], [109.0, 109.65], [110.0, 112.28], [125.0, 125.58], [136.0, 143.01], [144.0, 143.78], [146.0, 159.14], [160.0, 164.15], [168.0, 168.32], [171.0, 172.13], [175.0, 176.17], [183.0, 185.03], [186.0, 193.4], [194.0, 203.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [31.28, 48.74, 0.0, 55.11, 0.0, 0.0, 0.0, 0.0, 53.28, 0.0, 0.0, 0.0, 0.0, 53.97, 0.0, 43.98, 0.0, 40.95, 98.44, 0.0, 0.0, 0.0, 100.0, 100.0, 29.88], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 40.24], ["cattle, bovinae", 22.52], ["moo", 20.4]], [["music", 61.92], ["synthesizer", 12.26], ["musical instrument", 2.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 75.94], ["didgeridoo", 6.09], ["musical instrument", 5.52]], null, [["music", 59.0], ["synthesizer", 5.64], ["hum", 3.01]], null, null, null, null, null, null, [["music", 28.81], ["groan", 11.37], ["electric shaver, electric razor", 8.46]]], "duration": [11.99, 9.32, 1.64, 11.56, 1.27, 1.09, 0.37, 0.55, 3.04, 0.71, 0.71, 0.24, 0.65, 2.28, 0.58, 7.01, -0.22, 13.14, 4.15, 0.32, 1.13, 1.17, 2.03, 7.4, 9.45]} \ No newline at end of file diff --git a/annotations_1/KrBI7YdIPYk_filtered.json b/annotations_1/KrBI7YdIPYk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..921047836d2962fc699f073537fd276c8058277f --- /dev/null +++ b/annotations_1/KrBI7YdIPYk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[79.0, 79.39], [88.0, 88.7], [90.0, 100.38], [103.0, 108.94], [110.0, 158.03], [159.0, 159.44], [160.0, 196.42]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 67.0, 43.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 61.03], ["theremin", 13.26], ["musical instrument", 4.33]], null, null, null], "duration": [0.39, 0.7, 10.38, 5.94, 48.03, 0.44, 36.42]} \ No newline at end of file diff --git a/annotations_1/KsimmeikE7w_filtered.json b/annotations_1/KsimmeikE7w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..718a3e84bb839c65ee4617b6794038e3cb406a81 --- /dev/null +++ b/annotations_1/KsimmeikE7w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.0], [25.0, 28.43], [35.0, 36.68], [38.0, 38.72], [39.0, 39.43], [42.0, 44.95], [54.0, 56.44], [83.0, 83.57], [111.0, 114.32], [115.0, 116.04], [120.0, 121.47], [122.0, 123.03], [124.0, 124.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [78.55, 73.36, 0.0, 0.0, 0.0, 100.0, 94.52, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.0, 3.43, 1.68, 0.72, 0.43, 2.95, 2.44, 0.57, 3.32, 1.04, 1.47, 1.03, 0.61]} \ No newline at end of file diff --git a/annotations_1/KsmXx3hB968_filtered.json b/annotations_1/KsmXx3hB968_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..196f29ff299405b7f91e75a707880361ffb05316 --- /dev/null +++ b/annotations_1/KsmXx3hB968_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.54], [7.0, 10.71], [15.0, 18.3], [25.0, 61.53], [62.0, 68.72], [72.0, 81.95], [82.0, 99.45], [103.0, 115.64], [117.0, 175.1]], "keep_status": [false, true, true, false, true, true, true, false, false], "silence_prob": [0.0, 33.72, 29.8, 0.0, 29.65, 30.32, 28.81, 41.24, 0.0], "audiomae_on_audioset": [null, [["music", 37.56], ["throbbing", 9.74], ["hum", 5.19]], [["music", 38.17], ["throbbing", 5.69], ["hum", 5.32]], null, [["fart", 35.21], ["didgeridoo", 12.28], ["whale vocalization", 8.92]], [["speech", 23.07], ["music", 16.28], ["whack, thwack", 7.37]], [["speech", 31.81], ["music", 19.17], ["vehicle", 11.73]], [["cattle, bovinae", 30.51], ["livestock, farm animals, working animals", 24.81], ["moo", 16.47]], null], "duration": [1.54, 3.71, 3.3, 36.53, 6.72, 9.95, 17.45, 12.64, 58.1]} \ No newline at end of file diff --git a/annotations_1/KtwPWWCJHAE_filtered.json b/annotations_1/KtwPWWCJHAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed18d785bfe8b68289389232eb41d7abb2ae8da0 --- /dev/null +++ b/annotations_1/KtwPWWCJHAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 17.73], [18.0, 18.93], [19.0, 20.73], [21.0, 21.96], [23.0, 24.44], [25.0, 26.94], [30.0, 41.54], [42.0, 41.82], [56.0, 56.56], [58.0, 59.63], [67.0, 67.04], [67.0, 67.69], [68.0, 68.17], [87.0, 89.75], [98.0, 101.04], [103.0, 104.21], [110.0, 110.67], [115.0, 115.86], [117.0, 117.32], [118.0, 119.67], [120.0, 120.18], [123.0, 125.37], [133.0, 135.92], [137.0, 139.14], [151.0, 151.56], [152.0, 153.32], [158.0, 160.51], [162.0, 165.18], [167.0, 167.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 42.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.17, 28.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.64, 72.75, 50.76, 0.0, 0.0, 57.48, 36.61, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["frog", 67.67], ["hum", 5.74], ["caw", 3.11]], null, null, null, null, null, null, [["music", 56.42], ["rattle (instrument)", 12.19], ["beatboxing", 3.39]], [["music", 58.64], ["musical instrument", 3.68], ["singing", 3.1]], null, null, null, null, null, null, [["frog", 38.27], ["croak", 26.8], ["animal", 5.74]], null, null, null, null, null, [["music", 31.58], ["hum", 12.58], ["theremin", 8.71]], null], "duration": [16.73, 0.93, 1.73, 0.96, 1.44, 1.94, 11.54, -0.18, 0.56, 1.63, 0.04, 0.69, 0.17, 2.75, 3.04, 1.21, 0.67, 0.86, 0.32, 1.67, 0.18, 2.37, 2.92, 2.14, 0.56, 1.32, 2.51, 3.18, 0.24]} \ No newline at end of file diff --git a/annotations_1/KuStVllxFuI_filtered.json b/annotations_1/KuStVllxFuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b086adf7d681effe01075df793c79c8e6638905 --- /dev/null +++ b/annotations_1/KuStVllxFuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.8], [8.0, 7.65], [10.0, 11.43], [12.0, 12.99], [15.0, 18.5], [19.0, 19.99], [21.0, 21.14], [26.0, 26.7], [28.0, 27.73], [28.0, 28.22], [37.0, 44.64], [45.0, 47.01], [52.0, 53.59], [55.0, 57.75], [59.0, 65.89], [68.0, 70.39], [71.0, 78.51], [80.0, 81.89], [82.0, 83.74], [85.0, 119.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 66.76, 0.0, 0.0, 0.0, 0.0, 0.0, 31.25, 80.46, 0.0, 49.31, 33.85, 31.65, 28.94, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 30.16], ["mains hum", 13.54], ["rumble", 12.95]], null, null, [["music", 41.24], ["sonar", 26.1], ["singing bowl", 3.75]], [["music", 25.2], ["throbbing", 17.69], ["sonar", 9.67]], [["music", 26.41], ["mains hum", 21.21], ["hum", 19.79]], [["hum", 25.49], ["music", 23.78], ["mains hum", 16.42]], null, null, null], "duration": [0.8, -0.35, 1.43, 0.99, 3.5, 0.99, 0.14, 0.7, -0.27, 0.22, 7.64, 2.01, 1.59, 2.75, 6.89, 2.39, 7.51, 1.89, 1.74, 34.69]} \ No newline at end of file diff --git a/annotations_1/Kuy5Qgp5pvg_filtered.json b/annotations_1/Kuy5Qgp5pvg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3540c354b34f79562b593d8195232a626b36812a --- /dev/null +++ b/annotations_1/Kuy5Qgp5pvg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 34.94], [38.0, 40.07], [42.0, 43.6], [46.0, 47.83], [49.0, 50.72], [53.0, 55.11], [56.0, 57.59], [58.0, 59.9], [61.0, 62.92], [74.0, 74.75], [76.0, 76.13], [82.0, 84.84], [86.0, 86.44], [86.0, 92.06], [93.0, 108.78], [111.0, 112.46], [113.0, 115.1], [115.0, 124.56], [125.0, 131.33], [132.0, 136.07], [137.0, 138.81], [140.0, 140.27], [141.0, 145.12], [148.0, 148.83], [152.0, 154.85], [155.0, 159.98], [162.0, 163.17], [166.0, 168.81], [169.0, 171.64], [175.0, 177.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 88.64, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 66.39, 78.04, 0.0, 97.22, 89.19, 76.2, 71.72, 0.0, 0.0, 99.96, 0.0, 99.98, 91.47, 0.0, 99.78, 97.83, 99.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.94, 2.07, 1.6, 1.83, 1.72, 2.11, 1.59, 1.9, 1.92, 0.75, 0.13, 2.84, 0.44, 6.06, 15.78, 1.46, 2.1, 9.56, 6.33, 4.07, 1.81, 0.27, 4.12, 0.83, 2.85, 4.98, 1.17, 2.81, 2.64, 2.18]} \ No newline at end of file diff --git a/annotations_1/KvfIsbhIQLA_filtered.json b/annotations_1/KvfIsbhIQLA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d39cffc6e41ec40c387eb121cfd2682789d74355 --- /dev/null +++ b/annotations_1/KvfIsbhIQLA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.26], [24.0, 24.75], [25.0, 25.34], [30.0, 47.43], [56.0, 65.89], [70.0, 74.48]], "keep_status": [true, false, false, true, false, false], "silence_prob": [42.67, 0.0, 0.0, 47.5, 43.3, 42.24], "audiomae_on_audioset": [[["music", 45.49], ["bagpipes", 10.03], ["musical instrument", 4.44]], null, null, [["music", 53.85], ["musical instrument", 7.84], ["guitar", 4.91]], [["music", 89.05], ["mantra", 1.87], ["chant", 1.55]], [["carnatic music", 43.75], ["music", 40.44], ["musical instrument", 3.56]]], "duration": [3.26, 0.75, 0.34, 17.43, 9.89, 4.48]} \ No newline at end of file diff --git a/annotations_1/Kw6gubNxWQ4_filtered.json b/annotations_1/Kw6gubNxWQ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3d68e2e46964d573c31b2821b77accdc762ed16 --- /dev/null +++ b/annotations_1/Kw6gubNxWQ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 15.33], [17.0, 23.95], [27.0, 31.18], [33.0, 40.88], [43.0, 96.01], [99.0, 99.13], [101.0, 101.29], [105.0, 105.8]], "keep_status": [true, false, true, true, false, false, false, false], "silence_prob": [31.05, 32.8, 33.71, 31.06, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 30.33], ["music", 27.13], ["throbbing", 6.0]], [["music", 76.81], ["musical instrument", 3.23], ["theremin", 2.9]], [["gong", 23.02], ["music", 22.44], ["hum", 7.13]], [["speech", 24.49], ["rumble", 19.25], ["hum", 19.12]], null, null, null, null], "duration": [10.33, 6.95, 4.18, 7.88, 53.01, 0.13, 0.29, 0.8]} \ No newline at end of file diff --git a/annotations_1/KwWHPqidGuA_filtered.json b/annotations_1/KwWHPqidGuA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44399dc7bf39b5eb622aa80587ef0624ec823ad1 --- /dev/null +++ b/annotations_1/KwWHPqidGuA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [13.0, 12.65], [13.0, 19.13], [19.0, 19.47], [22.0, 22.82], [23.0, 24.31], [27.0, 30.92], [35.0, 35.34], [35.0, 38.94], [46.0, 55.68], [56.0, 57.92], [60.0, 61.62], [64.0, 64.88], [72.0, 75.19], [81.0, 82.14], [89.0, 89.01], [91.0, 90.93], [94.0, 102.57], [106.0, 107.5], [115.0, 127.67], [134.0, 135.78], [140.0, 141.35], [145.0, 148.41], [155.0, 155.95], [157.0, 158.67], [162.0, 162.92], [169.0, 170.11], [173.0, 173.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 61.27, 0.0, 53.47, 34.44, 0.0, 0.0, 0.0, 37.21, 0.0, 0.0, 0.0, 34.26, 0.0, 35.43, 0.0, 0.0, 38.08, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 82.15], ["musical instrument", 1.62], ["speech", 1.23]], null, null, null, [["music", 82.75], ["synthesizer", 2.77], ["musical instrument", 2.43]], null, null, null, [["music", 84.76], ["musical instrument", 2.33], ["guitar", 1.25]], null, [["music", 42.1], ["harmonica", 32.31], ["musical instrument", 4.64]], null, null, [["harmonica", 33.21], ["music", 23.79], ["wind instrument, woodwind instrument", 15.75]], null, null, null, null, null], "duration": [0.38, -0.35, 6.13, 0.47, 0.82, 1.31, 3.92, 0.34, 3.94, 9.68, 1.92, 1.62, 0.88, 3.19, 1.14, 0.01, -0.07, 8.57, 1.5, 12.67, 1.78, 1.35, 3.41, 0.95, 1.67, 0.92, 1.11, 0.77]} \ No newline at end of file diff --git a/annotations_1/KwfnVFtdn_E_filtered.json b/annotations_1/KwfnVFtdn_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39714215e9d3d177d278eb047329809d150a2a4f --- /dev/null +++ b/annotations_1/KwfnVFtdn_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.05], [20.0, 20.14], [41.0, 42.63], [49.0, 49.05], [55.0, 55.26], [57.0, 57.43], [67.0, 70.43], [71.0, 72.12], [74.0, 75.98], [77.0, 79.42], [80.0, 82.12], [83.0, 83.32], [90.0, 93.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 0.0, 0.0, 43.98, 37.36, 0.0, 71.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["mains hum", 45.07], ["hum", 26.91], ["music", 4.15]], [["cattle, bovinae", 30.8], ["moo", 27.36], ["livestock, farm animals, working animals", 13.27]], null, null], "duration": [0.05, 0.14, 1.63, 0.05, 0.26, 0.43, 3.43, 1.12, 1.98, 2.42, 2.12, 0.32, 3.29]} \ No newline at end of file diff --git a/annotations_1/KwpO_4Rq13o_filtered.json b/annotations_1/KwpO_4Rq13o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d32c38f40ec9d58f52fb09ed7f5588c2b36d1b9 --- /dev/null +++ b/annotations_1/KwpO_4Rq13o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.86], [19.0, 28.59], [29.0, 63.36], [64.0, 85.83], [89.0, 90.32], [90.0, 90.36], [90.0, 145.96], [146.0, 164.08], [166.0, 173.03]], "keep_status": [true, false, false, false, false, false, false, true, true], "silence_prob": [36.42, 31.56, 0.0, 30.57, 0.0, 0.0, 0.0, 28.93, 28.46], "audiomae_on_audioset": [[["hum", 25.57], ["mains hum", 14.45], ["throbbing", 10.65]], [["music", 37.4], ["speech", 22.15], ["noise", 10.65]], null, [["hum", 65.61], ["mains hum", 13.02], ["music", 9.31]], null, null, null, [["music", 51.05], ["thump, thud", 9.52], ["whack, thwack", 7.48]], [["explosion", 16.0], ["music", 14.45], ["burst, pop", 9.68]]], "duration": [3.86, 9.59, 34.36, 21.83, 1.32, 0.36, 55.96, 18.08, 7.03]} \ No newline at end of file diff --git a/annotations_1/KxcKAGtHl3A_filtered.json b/annotations_1/KxcKAGtHl3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a744b6ce052d5001cbdbf7543e34cc207a2e90f6 --- /dev/null +++ b/annotations_1/KxcKAGtHl3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.69], [13.0, 17.47], [18.0, 26.4], [27.0, 31.72], [32.0, 32.46], [33.0, 32.95], [35.0, 57.32], [59.0, 60.22]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 41.52, 36.37, 61.87, 0.0, 0.0, 45.46, 0.0], "audiomae_on_audioset": [null, [["music", 51.59], ["hum", 9.85], ["explosion", 3.45]], [["mains hum", 27.75], ["hum", 25.38], ["speech", 21.08]], null, null, null, [["insect", 44.12], ["speech", 16.32], ["fly, housefly", 14.9]], null], "duration": [0.69, 4.47, 8.4, 4.72, 0.46, -0.05, 22.32, 1.22]} \ No newline at end of file diff --git a/annotations_1/KxoJQx_MgAc_filtered.json b/annotations_1/KxoJQx_MgAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a879fb270063cceb5cde29d142953fd22fb3440e --- /dev/null +++ b/annotations_1/KxoJQx_MgAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [3.0, 13.17], [17.0, 33.71], [35.0, 44.73], [46.0, 80.22], [81.0, 81.01], [81.0, 96.21], [102.0, 165.3], [166.0, 166.85], [169.0, 169.75]], "keep_status": [false, true, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 31.91, 30.26, 44.84, 0.0, 0.0, 40.61, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 51.05], ["speech", 13.36], ["cattle, bovinae", 3.5]], [["music", 36.36], ["buzz", 9.88], ["throbbing", 6.93]], [["music", 35.32], ["whale vocalization", 17.56], ["ambient music", 9.59]], null, null, [["music", 80.1], ["theremin", 2.8], ["ambient music", 1.47]], null, null, null], "duration": [0.51, 10.17, 16.71, 9.73, 34.22, 0.01, 15.21, 63.3, 0.85, 0.75]} \ No newline at end of file diff --git a/annotations_1/Kxyzb8LbVKQ_filtered.json b/annotations_1/Kxyzb8LbVKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bae1777614a385f09a91aed1c8be5526e1b75953 --- /dev/null +++ b/annotations_1/Kxyzb8LbVKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.65], [13.0, 14.64], [18.0, 19.68], [26.0, 33.39], [34.0, 34.48], [35.0, 36.32], [40.0, 39.85], [41.0, 42.21], [45.0, 45.69], [46.0, 47.65], [50.0, 51.07], [52.0, 52.64], [54.0, 54.92], [56.0, 57.18], [60.0, 62.7], [68.0, 67.96], [72.0, 72.44], [77.0, 77.45], [84.0, 84.89], [93.0, 93.28], [104.0, 105.43], [107.0, 107.38], [110.0, 110.59], [112.0, 112.13], [119.0, 119.8], [121.0, 122.27], [123.0, 126.23], [127.0, 128.09], [141.0, 142.08], [143.0, 144.0], [145.0, 145.42], [147.0, 147.58], [153.0, 155.21], [156.0, 156.95], [158.0, 158.53], [159.0, 161.22], [166.0, 166.99], [168.0, 169.37], [170.0, 172.98], [174.0, 174.23], [175.0, 177.79], [180.0, 181.7], [185.0, 184.55], [185.0, 186.95], [187.0, 190.56], [192.0, 193.7], [196.0, 196.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.1, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 90.78, 0.0, 0.0, 99.62, 0.0, 100.0, 0.0, 0.0, 0.0, 61.08, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.65, 1.64, 1.68, 7.39, 0.48, 1.32, -0.15, 1.21, 0.69, 1.65, 1.07, 0.64, 0.92, 1.18, 2.7, -0.04, 0.44, 0.45, 0.89, 0.28, 1.43, 0.38, 0.59, 0.13, 0.8, 1.27, 3.23, 1.09, 1.08, 1.0, 0.42, 0.58, 2.21, 0.95, 0.53, 2.22, 0.99, 1.37, 2.98, 0.23, 2.79, 1.7, -0.45, 1.95, 3.56, 1.7, 0.26]} \ No newline at end of file diff --git a/annotations_1/Ky6GupHDuOw_filtered.json b/annotations_1/Ky6GupHDuOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72dcf7800382979808918720e7c4236cc0c07955 --- /dev/null +++ b/annotations_1/Ky6GupHDuOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.91], [7.0, 7.8], [9.0, 9.31], [10.0, 11.18], [12.0, 12.78], [18.0, 19.38], [23.0, 30.6], [35.0, 36.32], [42.0, 60.91], [62.0, 64.66]], "keep_status": [false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 0.0, 40.68, 36.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 43.69], ["fly, housefly", 13.67], ["fart", 8.59]], [["music", 37.67], ["throbbing", 14.42], ["hum", 9.72]]], "duration": [-0.09, 0.8, 0.31, 1.18, 0.78, 1.38, 7.6, 1.32, 18.91, 2.66]} \ No newline at end of file diff --git a/annotations_1/KyfXb39rGT0_filtered.json b/annotations_1/KyfXb39rGT0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fcb5c56e6ad52dcd5288a359386a6807694164ef --- /dev/null +++ b/annotations_1/KyfXb39rGT0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 46.48], [49.0, 64.5], [69.0, 108.53], [110.0, 149.45]], "keep_status": [true, false, false, false], "silence_prob": [28.44, 37.07, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 24.9], ["music", 12.5], ["static", 12.28]], [["music", 57.65], ["hum", 19.59], ["throbbing", 7.6]], null, null], "duration": [2.48, 15.5, 39.53, 39.45]} \ No newline at end of file diff --git a/annotations_1/KzUKcXxbU4U_filtered.json b/annotations_1/KzUKcXxbU4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12764e2332961113367a3440fc1f073fab7722c2 --- /dev/null +++ b/annotations_1/KzUKcXxbU4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 35.24], [36.0, 36.85], [76.0, 75.93], [86.0, 86.83], [89.0, 97.56]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.4], "audiomae_on_audioset": [null, null, null, null, [["music", 43.56], ["throbbing", 13.15], ["hum", 11.9]]], "duration": [1.24, 0.85, -0.07, 0.83, 8.56]} \ No newline at end of file diff --git a/annotations_1/L-zzxADqlu8_filtered.json b/annotations_1/L-zzxADqlu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b42f0f3a6b6878ed0f4b3f3a92e26639ff7cf534 --- /dev/null +++ b/annotations_1/L-zzxADqlu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[95.0, 101.34], [102.0, 104.48], [106.0, 107.72], [112.0, 112.62], [114.0, 114.79], [117.0, 117.69], [120.0, 119.79], [124.0, 124.14], [125.0, 125.86], [131.0, 131.53], [134.0, 137.91], [139.0, 141.2], [142.0, 142.45], [143.0, 142.55], [144.0, 149.0]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.68, 45.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 61.18, 0.0, 0.0, 57.97], "audiomae_on_audioset": [null, [["speech", 32.59], ["hum", 12.68], ["stomach rumble", 5.48]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.34, 2.48, 1.72, 0.62, 0.79, 0.69, -0.21, 0.14, 0.86, 0.53, 3.91, 2.2, 0.45, -0.45, 5.0]} \ No newline at end of file diff --git a/annotations_1/L06qVvXrJus_filtered.json b/annotations_1/L06qVvXrJus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ba3b8a33010063f794954fa82600ae91515bdf1 --- /dev/null +++ b/annotations_1/L06qVvXrJus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.52], [8.0, 8.87], [10.0, 10.57], [12.0, 13.02], [14.0, 14.22], [17.0, 17.14], [19.0, 19.77], [21.0, 21.91], [27.0, 27.77], [37.0, 40.39], [42.0, 42.45], [43.0, 46.79], [47.0, 47.46], [48.0, 48.79], [51.0, 59.54], [67.0, 66.75], [78.0, 78.36], [87.0, 87.74], [89.0, 89.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 87.55, 0.0, 0.0, 76.04, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.52, 0.87, 0.57, 1.02, 0.22, 0.14, 0.77, 0.91, 0.77, 3.39, 0.45, 3.79, 0.46, 0.79, 8.54, -0.25, 0.36, 0.74, 0.41]} \ No newline at end of file diff --git a/annotations_1/L0PPveTZVsw_filtered.json b/annotations_1/L0PPveTZVsw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70155b7e5024d8107d9ee45780c9591d51359c21 --- /dev/null +++ b/annotations_1/L0PPveTZVsw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 22.81], [25.0, 25.84], [29.0, 34.94], [36.0, 47.26], [48.0, 49.3], [51.0, 54.19], [55.0, 55.92], [57.0, 59.64], [60.0, 64.88], [66.0, 68.34], [79.0, 79.74], [88.0, 88.26], [89.0, 89.29], [91.0, 93.39], [94.0, 98.12], [100.0, 101.61], [114.0, 116.67], [117.0, 118.49], [120.0, 120.5], [130.0, 130.18], [131.0, 132.21], [147.0, 147.41], [149.0, 160.59], [162.0, 164.57], [165.0, 165.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 97.43, 100.0, 0.0, 93.45, 0.0, 100.0, 99.97, 100.0, 0.0, 0.0, 0.0, 98.36, 51.18, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 74.76, 98.19, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.81, 0.84, 5.94, 11.26, 1.3, 3.19, 0.92, 2.64, 4.88, 2.34, 0.74, 0.26, 0.29, 2.39, 4.12, 1.61, 2.67, 1.49, 0.5, 0.18, 1.21, 0.41, 11.59, 2.57, 0.82]} \ No newline at end of file diff --git a/annotations_1/L2inhzv1Rs8_filtered.json b/annotations_1/L2inhzv1Rs8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40ae78852b21289b303779273c411ced0168d25d --- /dev/null +++ b/annotations_1/L2inhzv1Rs8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.64], [13.0, 23.23], [37.0, 37.86], [40.0, 40.51], [44.0, 48.81], [58.0, 63.0], [66.0, 66.9], [72.0, 74.04], [79.0, 79.07], [86.0, 92.1], [96.0, 100.14], [104.0, 111.54], [113.0, 112.89], [117.0, 118.39], [119.0, 121.44], [124.0, 124.56], [127.0, 127.68], [128.0, 128.01], [128.0, 128.06], [128.0, 128.44], [132.0, 132.41], [133.0, 136.46], [141.0, 142.55], [148.0, 150.06], [151.0, 151.78], [158.0, 161.37], [165.0, 165.13], [173.0, 173.33], [181.0, 182.29], [183.0, 183.88], [190.0, 190.65], [193.0, 199.05], [200.0, 206.31]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 63.85, 0.0, 0.0, 54.56, 42.0, 0.0, 77.03, 0.0, 36.64, 34.86, 41.93, 0.0, 0.0, 53.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 0.0, 100.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 84.07, 47.9], "audiomae_on_audioset": [null, null, null, null, null, [["music", 32.46], ["fart", 11.74], ["speech", 11.66]], null, null, null, [["music", 32.24], ["moo", 24.92], ["cattle, bovinae", 20.29]], [["speech", 59.95], ["music", 22.28], ["explosion", 2.07]], [["speech", 33.21], ["animal", 6.14], ["music", 5.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.57], ["foghorn", 12.96], ["theremin", 12.59]]], "duration": [-0.36, 10.23, 0.86, 0.51, 4.81, 5.0, 0.9, 2.04, 0.07, 6.1, 4.14, 7.54, -0.11, 1.39, 2.44, 0.56, 0.68, 0.01, 0.06, 0.44, 0.41, 3.46, 1.55, 2.06, 0.78, 3.37, 0.13, 0.33, 1.29, 0.88, 0.65, 6.05, 6.31]} \ No newline at end of file diff --git a/annotations_1/L3aF2hwu8yE_filtered.json b/annotations_1/L3aF2hwu8yE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c8319cb6b578240b212b9e83647d6f5c68c8472 --- /dev/null +++ b/annotations_1/L3aF2hwu8yE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.2], [4.0, 5.86], [7.0, 8.94], [11.0, 11.55], [12.0, 15.67], [17.0, 19.06], [21.0, 21.73], [33.0, 33.89], [37.0, 37.79], [45.0, 47.66], [49.0, 50.9], [56.0, 56.79], [60.0, 63.61], [65.0, 75.71], [76.0, 77.31], [83.0, 84.27], [85.0, 85.14], [85.0, 88.4], [89.0, 89.24], [91.0, 91.2], [92.0, 92.82], [110.0, 111.77], [112.0, 114.69], [119.0, 119.26], [121.0, 121.53], [122.0, 122.49], [123.0, 123.63], [126.0, 127.04], [128.0, 128.26], [129.0, 130.42], [141.0, 145.67], [147.0, 147.5], [150.0, 150.45], [158.0, 158.21], [158.0, 158.25], [161.0, 166.5], [168.0, 170.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 82.43, 98.73, 0.0, 0.0, 0.0, 84.07, 0.0, 0.0, 97.43, 67.63, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.33, 0.0, 0.0, 0.0, 0.0, 37.07, 89.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 64.92], ["beatboxing", 20.16], ["vocal music", 2.34]], null, null, null, null, [["music", 39.7], ["howl", 31.39], ["dog", 7.97]], null], "duration": [0.2, 1.86, 1.94, 0.55, 3.67, 2.06, 0.73, 0.89, 0.79, 2.66, 1.9, 0.79, 3.61, 10.71, 1.31, 1.27, 0.14, 3.4, 0.24, 0.2, 0.82, 1.77, 2.69, 0.26, 0.53, 0.49, 0.63, 1.04, 0.26, 1.42, 4.67, 0.5, 0.45, 0.21, 0.25, 5.5, 2.46]} \ No newline at end of file diff --git a/annotations_1/L3gtPb6y2xg_filtered.json b/annotations_1/L3gtPb6y2xg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbe23d7014316077f49e74868edc39a8bd053f0a --- /dev/null +++ b/annotations_1/L3gtPb6y2xg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 19.89], [23.0, 22.72], [23.0, 22.76], [23.0, 29.49], [33.0, 37.13], [40.0, 40.81], [44.0, 46.52], [50.0, 49.96], [58.0, 61.91], [64.0, 68.13], [70.0, 91.05], [100.0, 100.36], [123.0, 126.17]], "keep_status": [false, false, false, false, false, false, true, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.0, 31.73, 0.0, 29.52, 0.0, 30.49, 32.88, 36.06, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, [["speech", 35.4], ["boing", 27.73], ["electric shaver, electric razor", 7.46]], [["speech", 63.78], ["clip-clop", 6.73], ["horse", 6.7]], null, [["speech", 50.05], ["rumble", 4.3], ["cattle, bovinae", 3.65]], null, [["speech", 52.16], ["explosion", 13.92], ["artillery fire", 9.04]], [["speech", 35.49], ["music", 13.18], ["didgeridoo", 10.18]], [["hum", 18.07], ["speech", 17.38], ["music", 13.51]], null, null], "duration": [-0.11, -0.28, -0.24, 6.49, 4.13, 0.81, 2.52, -0.04, 3.91, 4.13, 21.05, 0.36, 3.17]} \ No newline at end of file diff --git a/annotations_1/L46syxgju18_filtered.json b/annotations_1/L46syxgju18_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f45943cea5229e5d6cbb91a9e97d88ab9deb104 --- /dev/null +++ b/annotations_1/L46syxgju18_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.98], [22.0, 25.05], [30.0, 30.82], [33.0, 38.67], [39.0, 40.22], [41.0, 42.18], [44.0, 44.59], [47.0, 47.21], [48.0, 47.97], [49.0, 49.45], [50.0, 51.81], [81.0, 82.14], [84.0, 84.82], [87.0, 88.16], [90.0, 90.54], [93.0, 93.55], [97.0, 96.6], [103.0, 103.44], [106.0, 106.57], [110.0, 110.66], [112.0, 112.82], [114.0, 114.03], [115.0, 114.64], [116.0, 116.61], [119.0, 118.81], [129.0, 128.87], [130.0, 130.42], [141.0, 142.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.17, 71.57, 0.0, 65.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.98, 3.05, 0.82, 5.67, 1.22, 1.18, 0.59, 0.21, -0.03, 0.45, 1.81, 1.14, 0.82, 1.16, 0.54, 0.55, -0.4, 0.44, 0.57, 0.66, 0.82, 0.03, -0.36, 0.61, -0.19, -0.13, 0.42, 1.69]} \ No newline at end of file diff --git a/annotations_1/L4MyGhbXKZU_filtered.json b/annotations_1/L4MyGhbXKZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25787c2c8e34f19efb063205051d46ce9a5b2f36 --- /dev/null +++ b/annotations_1/L4MyGhbXKZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.26], [1.0, 4.02], [5.0, 5.8], [6.0, 7.08], [8.0, 10.1], [13.0, 14.17], [16.0, 15.9], [18.0, 23.33], [25.0, 26.18], [31.0, 32.32], [39.0, 41.28], [49.0, 50.06], [54.0, 58.8], [64.0, 65.52], [67.0, 68.18], [70.0, 86.93], [91.0, 93.8], [97.0, 97.66], [99.0, 104.52], [105.0, 110.27], [112.0, 113.85], [115.0, 116.73], [118.0, 128.39]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 60.14, 0.0, 0.0, 31.86, 0.0, 0.0, 32.32, 0.0, 0.0, 74.13, 0.0, 48.91, 0.0, 0.0, 34.89, 60.32, 0.0, 46.57, 81.53, 0.0, 0.0, 91.13], "audiomae_on_audioset": [null, null, null, null, [["hum", 40.59], ["mains hum", 21.02], ["throbbing", 10.81]], null, null, [["music", 35.7], ["speech", 14.34], ["hum", 8.93]], null, null, null, null, [["music", 35.73], ["theremin", 14.77], ["speech", 6.24]], null, null, [["music", 58.41], ["hum", 7.91], ["speech", 7.78]], null, null, [["music", 37.89], ["speech", 14.56], ["hum", 7.45]], null, null, null, null], "duration": [0.26, 3.02, 0.8, 1.08, 2.1, 1.17, -0.1, 5.33, 1.18, 1.32, 2.28, 1.06, 4.8, 1.52, 1.18, 16.93, 2.8, 0.66, 5.52, 5.27, 1.85, 1.73, 10.39]} \ No newline at end of file diff --git a/annotations_1/L5Jg3OVjPoo_filtered.json b/annotations_1/L5Jg3OVjPoo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e260fa68acaad95eb84557e50c6b39cd7186d54 --- /dev/null +++ b/annotations_1/L5Jg3OVjPoo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.08], [4.0, 4.16], [7.0, 9.95], [11.0, 13.59], [22.0, 22.72], [25.0, 24.88], [29.0, 30.25], [32.0, 32.09], [33.0, 40.74], [42.0, 44.74], [45.0, 45.79], [47.0, 47.36], [50.0, 52.03], [54.0, 56.27], [57.0, 57.23], [60.0, 76.71], [78.0, 81.78], [85.0, 91.52], [99.0, 103.54], [107.0, 129.32], [130.0, 138.74], [139.0, 148.68], [150.0, 160.84], [163.0, 170.48], [171.0, 179.66], [183.0, 186.92], [188.0, 188.74], [190.0, 190.29]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 41.93, 39.22, 0.0, 0.0, 0.0, 0.0, 90.43, 99.56, 0.0, 0.0, 99.65, 83.52, 0.0, 30.44, 33.45, 39.46, 34.7, 31.34, 69.74, 96.66, 30.6, 47.78, 41.91, 82.79, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["noise", 20.68], ["speech", 19.84], ["music", 10.25]], [["music", 13.63], ["mosquito", 9.63], ["fly, housefly", 9.3]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.25], ["fly, housefly", 8.64], ["buzz", 6.66]], [["music", 16.21], ["moo", 15.24], ["livestock, farm animals, working animals", 14.87]], [["didgeridoo", 55.66], ["music", 15.67], ["musical instrument", 4.6]], [["music", 41.35], ["throbbing", 11.62], ["breaking", 6.07]], [["music", 24.53], ["didgeridoo", 15.47], ["buzz", 14.79]], null, null, [["music", 66.72], ["hum", 8.05], ["mains hum", 6.47]], [["speech", 74.47], ["synthesizer", 7.78], ["hum", 4.1]], [["speech", 50.48], ["sidetone", 13.09], ["whack, thwack", 4.72]], null, null, null], "duration": [0.08, 0.16, 2.95, 2.59, 0.72, -0.12, 1.25, 0.09, 7.74, 2.74, 0.79, 0.36, 2.03, 2.27, 0.23, 16.71, 3.78, 6.52, 4.54, 22.32, 8.74, 9.68, 10.84, 7.48, 8.66, 3.92, 0.74, 0.29]} \ No newline at end of file diff --git a/annotations_1/L6HWF_-Vmbw_filtered.json b/annotations_1/L6HWF_-Vmbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13e3a293d8e45a64b3968448e1d803ce7244a9b8 --- /dev/null +++ b/annotations_1/L6HWF_-Vmbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.23], [17.0, 17.42], [23.0, 24.8], [35.0, 35.9], [38.0, 38.62], [41.0, 47.02], [49.0, 50.3], [54.0, 57.67], [64.0, 64.59], [68.0, 69.47], [72.0, 73.31], [74.0, 75.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [63.1, 0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.23, 0.42, 1.8, 0.9, 0.62, 6.02, 1.3, 3.67, 0.59, 1.47, 1.31, 1.2]} \ No newline at end of file diff --git a/annotations_1/L6f07_-wG9o_filtered.json b/annotations_1/L6f07_-wG9o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88022bcd5f2e6df899f02d2b8f8ebd21b16fc264 --- /dev/null +++ b/annotations_1/L6f07_-wG9o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.4], [10.0, 21.03], [25.0, 26.5], [29.0, 29.15], [32.0, 40.26], [48.0, 49.94], [59.0, 59.43], [65.0, 65.48], [77.0, 83.44], [88.0, 89.65], [106.0, 108.57], [112.0, 123.62], [127.0, 154.67], [157.0, 158.23]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 36.26, 0.0, 0.0, 30.09, 0.0, 0.0, 0.0, 30.39, 0.0, 30.94, 30.04, 30.09, 0.0], "audiomae_on_audioset": [null, [["music", 84.22], ["musical instrument", 1.56], ["singing bowl", 1.19]], null, null, [["music", 48.41], ["speech", 14.72], ["bleat", 9.24]], null, null, null, [["speech", 37.0], ["rumble", 17.08], ["hum", 9.07]], null, [["hum", 20.02], ["throbbing", 9.8], ["music", 9.52]], [["hum", 34.96], ["mains hum", 34.43], ["music", 11.3]], [["music", 44.54], ["groan", 15.86], ["speech", 10.41]], null], "duration": [0.4, 11.03, 1.5, 0.15, 8.26, 1.94, 0.43, 0.48, 6.44, 1.65, 2.57, 11.62, 27.67, 1.23]} \ No newline at end of file diff --git a/annotations_1/L6w-80CFfAs_filtered.json b/annotations_1/L6w-80CFfAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41a8967386e7d0ac5ec1781b414f06f6f734bc69 --- /dev/null +++ b/annotations_1/L6w-80CFfAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 16.23], [18.0, 19.97], [21.0, 21.03], [24.0, 25.81], [31.0, 41.44], [43.0, 48.91], [50.0, 50.85], [53.0, 55.09], [56.0, 56.89], [59.0, 64.02], [66.0, 84.45], [88.0, 105.68], [106.0, 106.98], [109.0, 109.26], [112.0, 121.39], [130.0, 140.44], [145.0, 172.15], [173.0, 172.99], [173.0, 173.28], [173.0, 173.45], [174.0, 177.5], [180.0, 192.38], [194.0, 206.22], [207.0, 223.59], [224.0, 226.67], [228.0, 229.8], [231.0, 231.06], [232.0, 234.0], [236.0, 236.22], [237.0, 274.04], [275.0, 276.64], [277.0, 284.99], [286.0, 290.16], [291.0, 292.5], [293.0, 294.54]], "keep_status": [false, false, false, false, true, true, false, true, false, true, false, false, false, false, true, false, true, false, false, false, true, false, true, true, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [32.01, 0.0, 0.0, 0.0, 35.1, 32.16, 0.0, 46.36, 0.0, 31.59, 31.62, 31.81, 0.0, 0.0, 31.92, 31.34, 31.93, 0.0, 0.0, 0.0, 33.11, 31.47, 31.82, 33.22, 33.86, 0.0, 0.0, 32.06, 0.0, 0.0, 0.0, 32.9, 33.5, 0.0, 0.0], "audiomae_on_audioset": [[["music", 61.6], ["static", 5.7], ["hum", 4.68]], null, null, null, [["music", 58.8], ["synthesizer", 5.75], ["keyboard (musical)", 4.52]], [["music", 30.19], ["theremin", 16.91], ["hum", 4.82]], null, [["music", 41.33], ["theremin", 14.73], ["foghorn", 7.25]], null, [["music", 34.01], ["hum", 11.41], ["cacophony", 8.57]], [["music", 58.19], ["theremin", 12.08], ["throbbing", 5.23]], [["music", 57.7], ["hum", 7.12], ["throbbing", 6.37]], null, null, [["speech", 47.27], ["vehicle", 8.36], ["livestock, farm animals, working animals", 4.19]], [["music", 81.67], ["electronic music", 3.16], ["throbbing", 1.58]], [["music", 33.71], ["throbbing", 15.39], ["speech", 13.52]], null, null, null, [["music", 51.66], ["throbbing", 9.43], ["speech", 6.77]], [["livestock, farm animals, working animals", 30.8], ["cowbell", 20.39], ["cattle, bovinae", 19.94]], [["speech", 22.32], ["music", 13.82], ["livestock, farm animals, working animals", 12.3]], [["speech", 24.88], ["livestock, farm animals, working animals", 11.5], ["music", 11.31]], [["music", 57.95], ["didgeridoo", 7.85], ["speech", 4.5]], null, null, [["music", 65.91], ["theremin", 10.03], ["musical instrument", 4.45]], null, null, null, [["music", 42.43], ["mosquito", 5.97], ["speech", 4.27]], [["music", 28.48], ["throbbing", 15.99], ["foghorn", 8.6]], null, null], "duration": [7.23, 1.97, 0.03, 1.81, 10.44, 5.91, 0.85, 2.09, 0.89, 5.02, 18.45, 17.68, 0.98, 0.26, 9.39, 10.44, 27.15, -0.01, 0.28, 0.45, 3.5, 12.38, 12.22, 16.59, 2.67, 1.8, 0.06, 2.0, 0.22, 37.04, 1.64, 7.99, 4.16, 1.5, 1.54]} \ No newline at end of file diff --git a/annotations_1/L7FVtB7mKEU_filtered.json b/annotations_1/L7FVtB7mKEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb4833861ec36bf9f5b204f1229a1e8950dc216a --- /dev/null +++ b/annotations_1/L7FVtB7mKEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.38], [9.0, 8.85], [9.0, 8.88], [9.0, 13.76], [15.0, 29.96], [31.0, 32.8], [34.0, 36.75], [38.0, 63.19], [64.0, 65.2]], "keep_status": [false, false, false, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 41.01, 37.25, 0.0, 39.88, 33.66, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 44.69], ["noise", 16.75], ["cacophony", 8.14]], [["mains hum", 29.93], ["speech", 19.44], ["music", 16.97]], null, [["foghorn", 25.51], ["music", 15.95], ["bee, wasp, etc.", 9.24]], [["music", 44.98], ["effects unit", 11.87], ["synthesizer", 9.63]], null], "duration": [0.38, -0.15, -0.12, 4.76, 14.96, 1.8, 2.75, 25.19, 1.2]} \ No newline at end of file diff --git a/annotations_1/L7YVcnBbeeI_filtered.json b/annotations_1/L7YVcnBbeeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e49ff319a0bd08e4311f9f5669db6b3f4fbf813 --- /dev/null +++ b/annotations_1/L7YVcnBbeeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.46], [10.0, 10.56], [13.0, 13.44], [16.0, 16.88], [17.0, 17.9], [19.0, 21.66], [23.0, 24.66], [25.0, 28.76], [30.0, 31.77], [37.0, 38.64], [40.0, 42.13], [44.0, 44.49], [51.0, 52.1], [53.0, 53.81], [56.0, 56.57], [64.0, 65.53], [67.0, 70.93], [73.0, 92.7], [95.0, 96.04], [98.0, 109.8], [112.0, 113.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 70.16, 0.0, 84.07, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 44.75, 49.09, 0.0, 31.12, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 14.04], ["fly, housefly", 9.58], ["cattle, bovinae", 8.93]], [["fly, housefly", 37.29], ["insect", 15.19], ["mosquito", 6.26]], null, [["speech", 64.5], ["explosion", 8.86], ["burst, pop", 7.05]], null], "duration": [0.46, 0.56, 0.44, 0.88, 0.9, 2.66, 1.66, 3.76, 1.77, 1.64, 2.13, 0.49, 1.1, 0.81, 0.57, 1.53, 3.93, 19.7, 1.04, 11.8, 1.91]} \ No newline at end of file diff --git a/annotations_1/L90uDzDbdV0_filtered.json b/annotations_1/L90uDzDbdV0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5509e0dbaa010a4550e30162fafb85626e3d65dc --- /dev/null +++ b/annotations_1/L90uDzDbdV0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.78], [16.0, 16.19], [18.0, 18.67], [20.0, 20.48], [38.0, 38.35], [49.0, 53.42], [54.0, 54.63], [77.0, 78.51], [87.0, 88.33], [92.0, 101.63], [104.0, 108.7], [114.0, 116.29], [117.0, 126.37], [129.0, 131.43], [138.0, 139.28], [147.0, 147.31], [151.0, 155.06]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, true, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.89, 0.0, 0.0, 0.0, 31.24, 30.67, 33.19, 30.89, 31.39, 0.0, 0.0, 29.57], "audiomae_on_audioset": [null, null, null, null, null, [["whale vocalization", 27.02], ["livestock, farm animals, working animals", 19.77], ["cattle, bovinae", 18.32]], null, null, null, [["music", 83.97], ["musical instrument", 3.04], ["synthesizer", 2.55]], [["music", 66.79], ["speech", 4.81], ["electronic music", 3.73]], [["music", 58.53], ["electronic music", 4.93], ["sidetone", 3.83]], [["music", 60.01], ["cacophony", 4.34], ["synthesizer", 3.92]], [["music", 36.62], ["brass instrument", 16.81], ["trombone", 14.34]], null, null, [["speech", 33.67], ["music", 13.49], ["vehicle", 8.06]]], "duration": [0.78, 0.19, 0.67, 0.48, 0.35, 4.42, 0.63, 1.51, 1.33, 9.63, 4.7, 2.29, 9.37, 2.43, 1.28, 0.31, 4.06]} \ No newline at end of file diff --git a/annotations_1/L91dx9ovcz8_filtered.json b/annotations_1/L91dx9ovcz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..362f3ac4e70fd4c7a7d4eeaf9aaf5945b78221a2 --- /dev/null +++ b/annotations_1/L91dx9ovcz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.43], [1.0, 2.15], [5.0, 6.03], [10.0, 10.96], [12.0, 22.44], [23.0, 25.52], [28.0, 35.07], [36.0, 36.04], [40.0, 43.33], [43.0, 44.42], [46.0, 46.2], [47.0, 47.01], [51.0, 55.85], [57.0, 57.96], [59.0, 61.08], [62.0, 63.66], [66.0, 69.9], [71.0, 86.75], [88.0, 100.85]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.78, 51.12, 32.44, 0.0, 50.56, 0.0, 0.0, 0.0, 42.24, 0.0, 48.91, 0.0, 67.0, 31.77, 34.33], "audiomae_on_audioset": [null, null, null, null, [["hum", 42.99], ["mains hum", 24.14], ["music", 13.7]], null, [["music", 43.44], ["noise", 17.42], ["mains hum", 8.56]], null, null, null, null, null, [["music", 52.26], ["brass instrument", 8.07], ["trumpet", 3.56]], null, [["music", 36.01], ["single-lens reflex camera", 8.42], ["mosquito", 5.09]], null, null, [["mosquito", 33.24], ["fly, housefly", 29.7], ["music", 12.97]], [["speech", 46.62], ["music", 12.97], ["slosh", 3.12]]], "duration": [0.43, 1.15, 1.03, 0.96, 10.44, 2.52, 7.07, 0.04, 3.33, 1.42, 0.2, 0.01, 4.85, 0.96, 2.08, 1.66, 3.9, 15.75, 12.85]} \ No newline at end of file diff --git a/annotations_1/L9x5p-s4zKs_filtered.json b/annotations_1/L9x5p-s4zKs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed639da36cd640947f3b42af670a6a6deb10c782 --- /dev/null +++ b/annotations_1/L9x5p-s4zKs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 8.28], [14.0, 23.08], [24.0, 25.22], [26.0, 38.15], [40.0, 40.71], [42.0, 43.7], [45.0, 44.61], [46.0, 50.79], [57.0, 57.38], [59.0, 59.9], [63.0, 65.01], [69.0, 72.91], [83.0, 84.43], [87.0, 88.08], [96.0, 98.25], [101.0, 101.12], [102.0, 104.21], [106.0, 112.6], [114.0, 119.53]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [33.63, 29.7, 0.0, 36.15, 0.0, 0.0, 0.0, 35.81, 0.0, 0.0, 49.0, 46.64, 0.0, 0.0, 58.89, 0.0, 51.44, 54.23, 63.85], "audiomae_on_audioset": [[["music", 40.05], ["synthesizer", 21.65], ["electronic music", 9.68]], [["hum", 49.92], ["throbbing", 40.35], ["music", 2.2]], null, [["hum", 35.92], ["music", 22.44], ["throbbing", 8.85]], null, null, null, [["hum", 43.11], ["throbbing", 39.87], ["pulse", 4.52]], null, null, [["hum", 27.92], ["music", 15.2], ["throbbing", 9.18]], [["speech", 47.51], ["whale vocalization", 12.69], ["sidetone", 11.8]], null, null, null, null, null, null, null], "duration": [7.28, 9.08, 1.22, 12.15, 0.71, 1.7, -0.39, 4.79, 0.38, 0.9, 2.01, 3.91, 1.43, 1.08, 2.25, 0.12, 2.21, 6.6, 5.53]} \ No newline at end of file diff --git a/annotations_1/LABMISLl7Y8_filtered.json b/annotations_1/LABMISLl7Y8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1219e11f2d657803a4bed8f6265d77449a35aa9f --- /dev/null +++ b/annotations_1/LABMISLl7Y8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.96], [4.0, 4.75], [6.0, 5.97], [26.0, 25.91], [29.0, 28.85], [32.0, 32.16], [33.0, 34.3], [36.0, 35.73], [39.0, 38.97], [41.0, 41.67], [46.0, 47.26], [59.0, 59.63], [64.0, 83.22], [84.0, 84.94], [87.0, 88.52], [108.0, 112.09], [121.0, 129.78], [133.0, 133.34], [159.0, 163.05], [170.0, 170.21], [172.0, 172.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.07, 0.0, 0.0, 37.35, 31.71, 0.0, 30.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 81.97], ["speech", 4.43], ["boing", 3.41]], null, null, [["music", 44.38], ["speech", 15.65], ["sidetone", 7.55]], [["music", 76.61], ["throbbing", 3.83], ["speech", 3.32]], null, [["speech", 43.99], ["sidetone", 20.5], ["music", 13.44]], null, null], "duration": [-0.04, 0.75, -0.03, -0.09, -0.15, 0.16, 1.3, -0.27, -0.03, 0.67, 1.26, 0.63, 19.22, 0.94, 1.52, 4.09, 8.78, 0.34, 4.05, 0.21, 0.71]} \ No newline at end of file diff --git a/annotations_1/LAajBhbC5Y8_filtered.json b/annotations_1/LAajBhbC5Y8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c75b5a7ce6c02aec0a413613c7ec26fd98d1a8c5 --- /dev/null +++ b/annotations_1/LAajBhbC5Y8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.35], [21.0, 22.82], [38.0, 41.01], [54.0, 54.33], [68.0, 68.2], [81.0, 81.7]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 84.25, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.35, 1.82, 3.01, 0.33, 0.2, 0.7]} \ No newline at end of file diff --git a/annotations_1/LAk5KEGLzmc_filtered.json b/annotations_1/LAk5KEGLzmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29f0ed069b4271989d9cedd5770e635b97c17291 --- /dev/null +++ b/annotations_1/LAk5KEGLzmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.94], [4.0, 5.83], [6.0, 10.44], [13.0, 13.47], [18.0, 19.21], [20.0, 24.19], [25.0, 27.23], [29.0, 29.52], [30.0, 30.15], [34.0, 35.34], [37.0, 38.04], [51.0, 51.83], [54.0, 54.62], [58.0, 58.13], [60.0, 63.34], [65.0, 71.71], [72.0, 76.99], [80.0, 81.26], [87.0, 88.15], [93.0, 94.71], [100.0, 100.8], [103.0, 102.79], [108.0, 108.01], [108.0, 108.89], [115.0, 114.79], [117.0, 116.75]], "keep_status": [false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 47.35, 0.0, 0.0, 48.82, 45.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.98, 42.24, 45.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 31.67], ["speech", 28.24], ["musical instrument", 5.34]], null, null, [["hum", 24.97], ["mains hum", 8.9], ["noise", 7.85]], [["speech", 23.0], ["hum", 11.82], ["rumble", 7.88]], null, null, null, null, null, null, null, [["music", 72.73], ["musical instrument", 5.22], ["guitar", 4.9]], [["music", 61.39], ["speech", 6.02], ["hum", 4.97]], [["music", 31.6], ["hum", 17.53], ["mains hum", 14.91]], null, null, null, null, null, null, null, null, null], "duration": [1.94, 1.83, 4.44, 0.47, 1.21, 4.19, 2.23, 0.52, 0.15, 1.34, 1.04, 0.83, 0.62, 0.13, 3.34, 6.71, 4.99, 1.26, 1.15, 1.71, 0.8, -0.21, 0.01, 0.89, -0.21, -0.25]} \ No newline at end of file diff --git a/annotations_1/LBLIa7bqcfY_filtered.json b/annotations_1/LBLIa7bqcfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe7729d36aab3d4f59a8470d469c170d103c2fe6 --- /dev/null +++ b/annotations_1/LBLIa7bqcfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.22], [15.0, 16.87], [19.0, 20.04], [22.0, 23.67], [36.0, 44.73], [46.0, 49.11], [53.0, 53.74], [55.0, 59.64], [61.0, 65.57], [68.0, 70.6], [77.0, 77.87], [78.0, 79.15], [79.0, 81.57], [85.0, 85.01], [96.0, 97.41], [100.0, 101.34], [102.0, 102.71], [110.0, 111.13], [113.0, 123.74], [124.0, 124.78], [137.0, 142.79]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [79.59, 0.0, 0.0, 0.0, 84.8, 93.13, 0.0, 86.82, 49.64, 40.62, 0.0, 0.0, 40.84, 0.0, 0.0, 0.0, 0.0, 0.0, 48.19, 0.0, 35.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 46.2], ["fly, housefly", 5.48], ["whack, thwack", 4.43]], [["speech", 45.18], ["music", 14.67], ["shuffle", 3.2]], null, null, [["frog", 50.97], ["insect", 19.91], ["fly, housefly", 6.12]], null, null, null, null, null, [["speech", 21.23], ["animal", 19.93], ["frog", 7.75]], null, [["speech", 44.87], ["fart", 32.6], ["explosion", 5.51]]], "duration": [5.22, 1.87, 1.04, 1.67, 8.73, 3.11, 0.74, 4.64, 4.57, 2.6, 0.87, 1.15, 2.57, 0.01, 1.41, 1.34, 0.71, 1.13, 10.74, 0.78, 5.79]} \ No newline at end of file diff --git a/annotations_1/LBm4aJ0ZcqY_filtered.json b/annotations_1/LBm4aJ0ZcqY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..536717e9065183499e02b96bc39beac7aeefb516 --- /dev/null +++ b/annotations_1/LBm4aJ0ZcqY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.13], [3.0, 10.44], [14.0, 152.39], [153.0, 154.4], [157.0, 158.11]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 31.44, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 33.61], ["insect", 22.2], ["mosquito", 9.97]], null, null, null], "duration": [1.13, 7.44, 138.39, 1.4, 1.11]} \ No newline at end of file diff --git a/annotations_1/LCj92toBBBE_filtered.json b/annotations_1/LCj92toBBBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f10c2f89251b5b69b42b8d21ee382fc947954af --- /dev/null +++ b/annotations_1/LCj92toBBBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 18.67], [22.0, 32.58], [38.0, 54.46], [55.0, 55.65], [57.0, 60.35], [63.0, 75.3], [78.0, 78.54], [82.0, 105.04], [105.0, 106.27], [109.0, 114.93], [116.0, 116.55], [118.0, 118.39], [119.0, 119.79], [122.0, 121.9], [122.0, 122.3], [127.0, 127.48], [128.0, 134.2]], "keep_status": [true, true, true, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [28.69, 28.73, 29.55, 0.0, 29.71, 28.91, 0.0, 28.73, 0.0, 50.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.73], "audiomae_on_audioset": [[["music", 35.03], ["hum", 17.71], ["mains hum", 7.78]], [["music", 29.4], ["speech", 28.07], ["mains hum", 11.45]], [["speech", 20.73], ["explosion", 19.63], ["music", 16.43]], null, [["didgeridoo", 16.51], ["music", 13.05], ["hum", 10.35]], [["music", 48.74], ["hum", 15.45], ["speech", 9.61]], null, [["livestock, farm animals, working animals", 19.51], ["speech", 11.78], ["music", 11.54]], null, null, null, null, null, null, null, null, [["speech", 35.33], ["boing", 28.78], ["music", 9.31]]], "duration": [13.67, 10.58, 16.46, 0.65, 3.35, 12.3, 0.54, 23.04, 1.27, 5.93, 0.55, 0.39, 0.79, -0.1, 0.3, 0.48, 6.2]} \ No newline at end of file diff --git a/annotations_1/LCljgWh4L8Y_filtered.json b/annotations_1/LCljgWh4L8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bea68e18c326a0f1858327eda62f68b4ceb7e1c0 --- /dev/null +++ b/annotations_1/LCljgWh4L8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 20.07], [24.0, 38.21], [40.0, 46.58], [62.0, 64.18], [70.0, 70.36], [75.0, 74.83], [88.0, 90.1], [91.0, 90.98], [103.0, 105.07], [112.0, 116.94], [123.0, 127.09], [135.0, 148.51], [155.0, 155.06], [161.0, 163.22], [164.0, 167.61], [170.0, 172.37]], "keep_status": [false, true, true, false, false, false, true, false, true, true, true, false, false, false, false, false], "silence_prob": [29.96, 31.18, 31.42, 39.12, 0.0, 0.0, 35.59, 0.0, 35.94, 33.79, 30.8, 31.75, 0.0, 32.39, 32.9, 50.51], "audiomae_on_audioset": [[["music", 57.23], ["throbbing", 14.64], ["hum", 10.12]], [["music", 55.22], ["cacophony", 5.73], ["noise", 3.41]], [["music", 32.57], ["hum", 18.96], ["throbbing", 12.9]], [["music", 42.76], ["foghorn", 25.77], ["musical instrument", 2.99]], null, null, [["music", 20.51], ["cattle, bovinae", 10.36], ["speech", 8.01]], null, [["groan", 33.89], ["music", 22.84], ["grunt", 8.72]], [["music", 49.27], ["sidetone", 3.42], ["electronic music", 3.04]], [["music", 57.85], ["boing", 5.83], ["animal", 3.54]], [["music", 52.75], ["grunt", 11.87], ["groan", 9.59]], null, [["music", 44.13], ["mains hum", 18.25], ["hum", 12.16]], [["music", 74.6], ["scary music", 5.44], ["theremin", 1.74]], null], "duration": [15.07, 14.21, 6.58, 2.18, 0.36, -0.17, 2.1, -0.02, 2.07, 4.94, 4.09, 13.51, 0.06, 2.22, 3.61, 2.37]} \ No newline at end of file diff --git a/annotations_1/LDmKhGcB0Xs_filtered.json b/annotations_1/LDmKhGcB0Xs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..319fb697fc8be716a9664765e672f3a0617644de --- /dev/null +++ b/annotations_1/LDmKhGcB0Xs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.4], [7.0, 8.45], [9.0, 9.91], [10.0, 53.64], [54.0, 53.81], [54.0, 56.44], [58.0, 88.48], [89.0, 135.99], [139.0, 173.42]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [76.7, 0.0, 0.0, 0.0, 0.0, 28.01, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 66.78], ["didgeridoo", 4.72], ["throbbing", 4.49]], null, null, null], "duration": [2.4, 1.45, 0.91, 43.64, -0.19, 2.44, 30.48, 46.99, 34.42]} \ No newline at end of file diff --git a/annotations_1/LE0TUN0Po7I_filtered.json b/annotations_1/LE0TUN0Po7I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed22c68cf0d51edcbf8046e27a0931cbe8201b1b --- /dev/null +++ b/annotations_1/LE0TUN0Po7I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.2], [29.0, 31.14], [38.0, 37.98], [40.0, 51.49]], "keep_status": [false, false, false, true], "silence_prob": [52.8, 55.6, 0.0, 38.74], "audiomae_on_audioset": [null, null, null, [["music", 58.1], ["didgeridoo", 5.2], ["singing bowl", 5.01]]], "duration": [2.2, 2.14, -0.02, 11.49]} \ No newline at end of file diff --git a/annotations_1/LEq4-b61Hoo_filtered.json b/annotations_1/LEq4-b61Hoo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d19bbfa1348497ac78771ac3a2b568fea52cee0 --- /dev/null +++ b/annotations_1/LEq4-b61Hoo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.34], [15.0, 21.05], [21.0, 24.44], [26.0, 27.92], [30.0, 31.26], [33.0, 33.59], [34.0, 35.11], [43.0, 46.21], [51.0, 51.8], [65.0, 65.13], [82.0, 82.76], [86.0, 87.51], [91.0, 91.64], [93.0, 96.01], [97.0, 98.71], [99.0, 100.72], [103.0, 103.57], [109.0, 109.81], [112.0, 114.49], [115.0, 117.26], [119.0, 122.66], [123.0, 123.6], [124.0, 124.9], [126.0, 128.01], [130.0, 131.03], [131.0, 132.33], [133.0, 134.37]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [46.57, 92.31, 56.63, 0.0, 0.0, 0.0, 0.0, 54.83, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 0.0, 0.0, 0.0, 0.0, 90.78, 91.98, 74.76, 0.0, 0.0, 56.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 19.37], ["bee, wasp, etc.", 15.25], ["hum", 7.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.34, 6.05, 3.44, 1.92, 1.26, 0.59, 1.11, 3.21, 0.8, 0.13, 0.76, 1.51, 0.64, 3.01, 1.71, 1.72, 0.57, 0.81, 2.49, 2.26, 3.66, 0.6, 0.9, 2.01, 1.03, 1.33, 1.37]} \ No newline at end of file diff --git a/annotations_1/LF0dTioXk3A_filtered.json b/annotations_1/LF0dTioXk3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56c6dae2f535e5742aadb742245c1c1737632d29 --- /dev/null +++ b/annotations_1/LF0dTioXk3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.29], [24.0, 25.17], [26.0, 33.05], [34.0, 36.73], [38.0, 40.19], [43.0, 43.44], [54.0, 55.58], [64.0, 90.58], [92.0, 104.6], [106.0, 126.79], [131.0, 130.92]], "keep_status": [false, false, true, true, true, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 29.6, 30.76, 38.15, 0.0, 0.0, 29.83, 29.54, 29.54, 0.0], "audiomae_on_audioset": [null, null, [["fart", 24.26], ["livestock, farm animals, working animals", 13.45], ["speech", 12.53]], [["music", 43.76], ["cattle, bovinae", 7.96], ["moo", 7.01]], [["music", 47.52], ["synthesizer", 3.36], ["musical instrument", 3.06]], null, null, [["speech", 42.56], ["music", 22.61], ["theremin", 4.44]], [["music", 56.25], ["throbbing", 9.4], ["electronic music", 4.2]], [["music", 49.96], ["brass instrument", 14.84], ["trombone", 12.34]], null], "duration": [1.29, 1.17, 7.05, 2.73, 2.19, 0.44, 1.58, 26.58, 12.6, 20.79, -0.08]} \ No newline at end of file diff --git a/annotations_1/LFO-xqbWYpw_filtered.json b/annotations_1/LFO-xqbWYpw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5839e4910701f7fa82a7d8105ff99d5971e3dee4 --- /dev/null +++ b/annotations_1/LFO-xqbWYpw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.16], [23.0, 28.19], [33.0, 34.84], [51.0, 51.7], [56.0, 56.74], [63.0, 63.69], [66.0, 66.65], [69.0, 69.84], [73.0, 74.36], [76.0, 76.82], [86.0, 85.94], [86.0, 87.07], [93.0, 93.77], [103.0, 103.94], [105.0, 106.2], [108.0, 109.27], [118.0, 119.08], [135.0, 139.46], [144.0, 156.51], [160.0, 163.76], [164.0, 164.81], [166.0, 168.54], [169.0, 169.94], [184.0, 185.03], [195.0, 196.43], [200.0, 208.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 59.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.73, 50.46, 49.97, 0.0, 46.68, 0.0, 0.0, 0.0, 58.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 23.51], ["speech", 18.42], ["hum", 17.5]], null, [["music", 10.11], ["didgeridoo", 9.6], ["hum", 9.23]], null, [["didgeridoo", 19.06], ["music", 4.48], ["animal", 3.53]], null, null, null, null], "duration": [1.16, 5.19, 1.84, 0.7, 0.74, 0.69, 0.65, 0.84, 1.36, 0.82, -0.06, 1.07, 0.77, 0.94, 1.2, 1.27, 1.08, 4.46, 12.51, 3.76, 0.81, 2.54, 0.94, 1.03, 1.43, 8.3]} \ No newline at end of file diff --git a/annotations_1/LHcbbXpKIrc_filtered.json b/annotations_1/LHcbbXpKIrc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2e3be048d08eb4536abf7c0805c5492f0bde803 --- /dev/null +++ b/annotations_1/LHcbbXpKIrc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.68], [6.0, 6.0], [6.0, 9.78], [12.0, 11.96], [15.0, 16.78], [17.0, 19.14], [20.0, 20.63], [21.0, 21.49], [28.0, 28.36], [30.0, 30.59], [33.0, 33.45], [48.0, 48.52], [52.0, 53.05], [98.0, 101.29], [103.0, 103.64], [117.0, 117.61], [125.0, 129.83], [132.0, 138.01], [140.0, 140.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.52, 0.0, 83.34, 0.0, 0.0, 71.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 0.0, 0.0, 94.07, 78.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.68, 0.0, 3.78, -0.04, 1.78, 2.14, 0.63, 0.49, 0.36, 0.59, 0.45, 0.52, 1.05, 3.29, 0.64, 0.61, 4.83, 6.01, 0.61]} \ No newline at end of file diff --git a/annotations_1/LIYNk4ARUR8_filtered.json b/annotations_1/LIYNk4ARUR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..245d9a4eae6726af15c7474a423163af2861fb77 --- /dev/null +++ b/annotations_1/LIYNk4ARUR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.46], [23.0, 23.89], [25.0, 25.62], [26.0, 27.63], [31.0, 31.83], [39.0, 44.9], [50.0, 50.43], [53.0, 53.23], [57.0, 58.04], [61.0, 65.35], [66.0, 65.96], [66.0, 67.2], [67.0, 70.61], [78.0, 78.97], [82.0, 82.95], [85.0, 86.68], [89.0, 97.68], [100.0, 107.01], [116.0, 116.6], [118.0, 122.13], [124.0, 138.45], [140.0, 147.43], [152.0, 161.55], [169.0, 169.33], [171.0, 171.73], [172.0, 173.38], [176.0, 176.05]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 0.0, 0.0, 0.0, 39.05, 0.0, 0.0, 40.9, 0.0, 0.0, 0.0, 50.97, 39.88, 0.0, 36.98, 39.22, 38.59, 51.6, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 42.04], ["glockenspiel", 9.26], ["marimba, xylophone", 9.1]], null, null, [["music", 37.91], ["bell", 10.36], ["tubular bells", 9.79]], null, null, null, null, [["music", 57.18], ["theremin", 17.84], ["musical instrument", 3.95]], null, [["music", 49.65], ["theremin", 11.75], ["musical instrument", 6.4]], [["music", 67.99], ["musical instrument", 3.12], ["marimba, xylophone", 2.46]], [["music", 53.47], ["brass instrument", 11.6], ["trombone", 6.38]], null, null, null, null, null], "duration": [0.46, 0.89, 0.62, 1.63, 0.83, 5.9, 0.43, 0.23, 1.04, 4.35, -0.04, 1.2, 3.61, 0.97, 0.95, 1.68, 8.68, 7.01, 0.6, 4.13, 14.45, 7.43, 9.55, 0.33, 0.73, 1.38, 0.05]} \ No newline at end of file diff --git a/annotations_1/LJ8UoUA2_uE_filtered.json b/annotations_1/LJ8UoUA2_uE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1324a874223f2389e7d6bc777271f8715b9b86ca --- /dev/null +++ b/annotations_1/LJ8UoUA2_uE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.14], [14.0, 13.95], [14.0, 14.18], [14.0, 14.22], [14.0, 14.35], [16.0, 16.71], [18.0, 19.06], [21.0, 43.23], [50.0, 56.98], [57.0, 62.43], [63.0, 69.99], [71.0, 107.38], [110.0, 112.02], [113.0, 114.17], [115.0, 125.04], [126.0, 132.92], [135.0, 167.53]], "keep_status": [true, false, false, false, false, false, false, true, true, true, true, false, false, false, true, true, false], "silence_prob": [38.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.69, 29.11, 30.91, 36.04, 0.0, 69.47, 0.0, 28.61, 30.59, 0.0], "audiomae_on_audioset": [[["fly, housefly", 20.12], ["insect", 18.5], ["animal", 17.14]], null, null, null, null, null, null, [["thunder", 24.45], ["thunderstorm", 22.11], ["explosion", 9.55]], [["throbbing", 11.44], ["rain", 11.38], ["thunderstorm", 11.08]], [["hum", 9.12], ["horse", 8.89], ["throbbing", 8.56]], [["speech", 37.15], ["raindrop", 9.35], ["rain", 6.37]], null, null, null, [["animal", 38.91], ["livestock, farm animals, working animals", 12.61], ["roaring cats (lions, tigers)", 6.36]], [["hum", 20.06], ["explosion", 7.27], ["speech", 6.25]], null], "duration": [5.14, -0.05, 0.18, 0.22, 0.35, 0.71, 1.06, 22.23, 6.98, 5.43, 6.99, 36.38, 2.02, 1.17, 10.04, 6.92, 32.53]} \ No newline at end of file diff --git a/annotations_1/LJQAKDbq0hI_filtered.json b/annotations_1/LJQAKDbq0hI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc9396a26bdbd1b7f3dbd2e084d9e10ae4225906 --- /dev/null +++ b/annotations_1/LJQAKDbq0hI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.54], [12.0, 12.8], [16.0, 16.48], [22.0, 24.44], [25.0, 27.7], [28.0, 29.44], [32.0, 36.58], [38.0, 39.97], [41.0, 45.42], [49.0, 49.71], [51.0, 51.98], [54.0, 54.01], [55.0, 55.85], [57.0, 59.24], [60.0, 61.33], [62.0, 85.55], [87.0, 89.56], [92.0, 92.15], [93.0, 95.0], [96.0, 96.3], [97.0, 97.9], [98.0, 99.79], [101.0, 102.02], [104.0, 106.41], [107.0, 109.97], [112.0, 113.26], [114.0, 115.06], [117.0, 118.52], [119.0, 120.88], [122.0, 123.25], [125.0, 125.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [80.29, 0.0, 0.0, 95.37, 67.63, 0.0, 99.62, 0.0, 93.91, 0.0, 0.0, 0.0, 0.0, 97.92, 0.0, 78.55, 45.56, 0.0, 70.72, 0.0, 0.0, 0.0, 0.0, 52.74, 51.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.42], ["fly, housefly", 4.86], ["inside, small room", 4.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.54, 0.8, 0.48, 2.44, 2.7, 1.44, 4.58, 1.97, 4.42, 0.71, 0.98, 0.01, 0.85, 2.24, 1.33, 23.55, 2.56, 0.15, 2.0, 0.3, 0.9, 1.79, 1.02, 2.41, 2.97, 1.26, 1.06, 1.52, 1.88, 1.25, 0.17]} \ No newline at end of file diff --git a/annotations_1/LJgqSSZpdns_filtered.json b/annotations_1/LJgqSSZpdns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59f364103f070bea16b0a7ed433b8f83da31d04e --- /dev/null +++ b/annotations_1/LJgqSSZpdns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.22], [15.0, 41.88], [42.0, 51.95], [52.0, 51.98], [56.0, 105.24], [107.0, 119.67], [120.0, 126.22], [128.0, 136.59]], "keep_status": [false, false, true, false, false, true, false, false], "silence_prob": [57.89, 34.71, 34.01, 0.0, 0.0, 30.56, 35.58, 41.14], "audiomae_on_audioset": [null, [["hum", 34.74], ["speech", 23.46], ["mains hum", 14.89]], [["music", 43.47], ["speech", 9.45], ["didgeridoo", 7.05]], null, null, [["hum", 30.49], ["buzz", 17.51], ["throbbing", 12.04]], [["crushing", 59.37], ["music", 6.46], ["squish", 5.12]], [["speech", 61.03], ["hum", 8.59], ["vehicle", 3.02]]], "duration": [2.22, 26.88, 9.95, -0.02, 49.24, 12.67, 6.22, 8.59]} \ No newline at end of file diff --git a/annotations_1/LJl8SSI8MHA_filtered.json b/annotations_1/LJl8SSI8MHA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ad730bd9e07985c6b29bc7faa1fe31f62eb6029 --- /dev/null +++ b/annotations_1/LJl8SSI8MHA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.99], [19.0, 21.24], [21.0, 22.87], [23.0, 22.91], [23.0, 24.24], [26.0, 26.87], [29.0, 29.83], [30.0, 31.04], [32.0, 32.02], [33.0, 35.11], [36.0, 37.49], [41.0, 40.91], [42.0, 69.63], [72.0, 72.25], [73.0, 74.19], [80.0, 80.11], [83.0, 84.25]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 51.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.43, 0.0, 0.0, 32.27, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 28.12], ["hum", 18.98], ["throbbing", 10.99]], null, null, [["music", 40.21], ["didgeridoo", 28.32], ["speech", 15.58]], null, null, null, null], "duration": [0.99, 2.24, 1.87, -0.09, 1.24, 0.87, 0.83, 1.04, 0.02, 2.11, 1.49, -0.09, 27.63, 0.25, 1.19, 0.11, 1.25]} \ No newline at end of file diff --git a/annotations_1/LJvCFAHRAFI_filtered.json b/annotations_1/LJvCFAHRAFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ce08ab09103704092022b10038cfee9f33bc3b7 --- /dev/null +++ b/annotations_1/LJvCFAHRAFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.32], [15.0, 106.3]], "keep_status": [false, false], "silence_prob": [45.49, 0.0], "audiomae_on_audioset": [[["music", 57.16], ["hum", 19.22], ["mains hum", 4.88]], null], "duration": [5.32, 91.3]} \ No newline at end of file diff --git a/annotations_1/LJye4-HVyCU_filtered.json b/annotations_1/LJye4-HVyCU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19d5933613b1756ea15a848269e6bd785ae43683 --- /dev/null +++ b/annotations_1/LJye4-HVyCU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.1], [12.0, 17.19], [18.0, 20.36], [23.0, 30.6], [32.0, 33.84], [36.0, 36.58], [40.0, 43.24], [46.0, 47.19], [48.0, 47.97], [48.0, 48.9], [49.0, 50.41], [52.0, 52.71], [54.0, 58.6], [61.0, 65.8], [68.0, 70.43], [72.0, 76.47], [78.0, 83.83], [86.0, 90.76], [92.0, 95.23], [97.0, 100.99], [103.0, 104.84], [106.0, 111.81], [113.0, 115.47], [117.0, 159.17], [160.0, 160.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.54, 99.96, 99.94, 95.23, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 100.0, 100.0, 99.99, 99.93, 99.95, 99.56, 83.34, 0.0, 64.63, 99.99, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.1, 5.19, 2.36, 7.6, 1.84, 0.58, 3.24, 1.19, -0.03, 0.9, 1.41, 0.71, 4.6, 4.8, 2.43, 4.47, 5.83, 4.76, 3.23, 3.99, 1.84, 5.81, 2.47, 42.17, 0.34]} \ No newline at end of file diff --git a/annotations_1/LJym4mTtLRY_filtered.json b/annotations_1/LJym4mTtLRY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3829f35dd7358c8b4c5cbe28fa607db1d5fd8c09 --- /dev/null +++ b/annotations_1/LJym4mTtLRY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.25], [4.0, 4.62], [11.0, 11.62], [12.0, 12.95], [16.0, 17.27], [19.0, 19.31], [23.0, 24.63], [33.0, 32.86], [37.0, 50.79], [57.0, 57.23], [62.0, 65.11], [68.0, 68.57], [71.0, 71.32], [71.0, 71.41], [79.0, 78.8], [79.0, 78.97], [83.0, 83.0], [88.0, 88.1], [92.0, 92.3], [99.0, 100.85], [101.0, 101.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.9, 0.0, 36.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 74.95], ["bleat", 3.79], ["sheep", 3.0]], null, [["music", 68.36], ["synthesizer", 5.65], ["musical instrument", 5.09]], null, null, null, null, null, null, null, null, null, null], "duration": [1.25, 0.62, 0.62, 0.95, 1.27, 0.31, 1.63, -0.14, 13.79, 0.23, 3.11, 0.57, 0.32, 0.41, -0.2, -0.03, 0.0, 0.1, 0.3, 1.85, 0.78]} \ No newline at end of file diff --git a/annotations_1/LK-4Dmq6Hs0_filtered.json b/annotations_1/LK-4Dmq6Hs0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..555b4721370a3b4b40720eb6f3ec9e0f3cf89156 --- /dev/null +++ b/annotations_1/LK-4Dmq6Hs0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 19.94], [20.0, 26.0], [29.0, 35.38], [37.0, 37.18], [42.0, 44.93], [45.0, 53.94], [57.0, 66.18], [67.0, 68.4], [96.0, 96.89], [105.0, 111.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.15, 33.74, 33.88, 0.0, 32.73, 32.41, 30.23, 0.0, 0.0, 90.43], "audiomae_on_audioset": [[["music", 64.6], ["synthesizer", 3.76], ["hum", 2.8]], [["music", 57.55], ["synthesizer", 7.25], ["didgeridoo", 5.99]], [["music", 55.22], ["speech", 13.94], ["synthesizer", 9.17]], null, [["music", 50.84], ["synthesizer", 15.01], ["theremin", 7.63]], [["music", 72.28], ["theremin", 7.57], ["synthesizer", 7.14]], [["music", 63.87], ["theremin", 11.5], ["synthesizer", 10.54]], null, null, null], "duration": [7.94, 6.0, 6.38, 0.18, 2.93, 8.94, 9.18, 1.4, 0.89, 6.77]} \ No newline at end of file diff --git a/annotations_1/LK5QIZgbfZQ_filtered.json b/annotations_1/LK5QIZgbfZQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a67c1723c6102d8501513e4ca2feda780ea01b5 --- /dev/null +++ b/annotations_1/LK5QIZgbfZQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.2], [20.0, 20.8], [22.0, 29.71], [32.0, 38.2], [38.0, 38.23], [40.0, 39.95], [40.0, 52.47], [53.0, 55.51], [79.0, 83.44], [85.0, 86.46], [87.0, 94.63], [96.0, 96.67], [104.0, 105.16], [109.0, 111.54], [112.0, 113.32], [114.0, 114.66]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [47.78, 0.0, 64.07, 48.48, 0.0, 0.0, 47.9, 59.15, 31.31, 0.0, 37.16, 0.0, 0.0, 51.18, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 27.98], ["music", 24.42], ["throbbing", 5.23]], null, null, [["fly, housefly", 43.11], ["speech", 18.47], ["insect", 14.24]], null, null, [["hum", 22.45], ["mains hum", 15.72], ["noise", 11.08]], null, [["speech", 61.31], ["explosion", 5.16], ["music", 4.89]], null, [["speech", 37.9], ["music", 29.5], ["fart", 2.75]], null, null, null, null, null], "duration": [2.2, 0.8, 7.71, 6.2, 0.23, -0.05, 12.47, 2.51, 4.44, 1.46, 7.63, 0.67, 1.16, 2.54, 1.32, 0.66]} \ No newline at end of file diff --git a/annotations_1/LKJOXcFUSzc_filtered.json b/annotations_1/LKJOXcFUSzc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..692d29a31f0c3b5d0e1cd0f618ff957cf2cc087c --- /dev/null +++ b/annotations_1/LKJOXcFUSzc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.63], [44.0, 44.93], [45.0, 45.93], [46.0, 46.58], [51.0, 52.29], [54.0, 54.92], [57.0, 64.74], [68.0, 69.4], [77.0, 78.81], [84.0, 86.29], [100.0, 104.08], [105.0, 107.54], [108.0, 109.32], [128.0, 130.06], [130.0, 130.74], [137.0, 137.79], [140.0, 140.51], [142.0, 143.48], [144.0, 146.3], [147.0, 147.02], [148.0, 150.36], [157.0, 157.84]], "keep_status": [false, false, false, false, false, false, true, false, false, true, true, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.78, 0.0, 0.0, 31.09, 41.52, 37.07, 0.0, 44.29, 0.0, 0.0, 0.0, 0.0, 79.07, 0.0, 66.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 44.08], ["keyboard (musical)", 10.46], ["piano", 10.1]], null, null, [["music", 64.8], ["musical instrument", 2.79], ["bell", 1.41]], [["music", 38.29], ["cello", 11.3], ["theremin", 8.38]], [["fly, housefly", 29.43], ["insect", 13.84], ["mosquito", 13.39]], null, [["music", 52.16], ["didgeridoo", 7.09], ["speech", 5.61]], null, null, null, null, null, null, null, null], "duration": [1.63, 0.93, 0.93, 0.58, 1.29, 0.92, 7.74, 1.4, 1.81, 2.29, 4.08, 2.54, 1.32, 2.06, 0.74, 0.79, 0.51, 1.48, 2.3, 0.02, 2.36, 0.84]} \ No newline at end of file diff --git a/annotations_1/LKrcDYvwV1Q_filtered.json b/annotations_1/LKrcDYvwV1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07fe447ba7bc9a5daa2d37692bfd09c0f183cd76 --- /dev/null +++ b/annotations_1/LKrcDYvwV1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.54], [22.0, 39.82], [40.0, 81.28], [83.0, 85.58], [102.0, 113.29], [118.0, 128.93], [130.0, 134.23], [135.0, 135.57], [137.0, 137.79], [138.0, 138.96]], "keep_status": [false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 94.22, 0.0, 29.71, 30.31, 28.87, 29.54, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 56.78], ["speech", 5.42], ["cattle, bovinae", 3.49]], [["music", 56.59], ["didgeridoo", 32.88], ["speech", 1.21]], [["music", 74.8], ["speech", 3.0], ["cacophony", 1.37]], [["speech", 29.98], ["didgeridoo", 29.22], ["music", 6.0]], null, null, null], "duration": [0.54, 17.82, 41.28, 2.58, 11.29, 10.93, 4.23, 0.57, 0.79, 0.96]} \ No newline at end of file diff --git a/annotations_1/LQFc7IKhUuE_filtered.json b/annotations_1/LQFc7IKhUuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c27d21e526e88ed94be0452df0b26bff78eea5df --- /dev/null +++ b/annotations_1/LQFc7IKhUuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 52.95], [57.0, 56.64], [57.0, 82.95]], "keep_status": [true, false, true], "silence_prob": [38.27, 0.0, 33.04], "audiomae_on_audioset": [[["speech", 32.36], ["cattle, bovinae", 18.46], ["livestock, farm animals, working animals", 17.58]], null, [["hum", 25.08], ["ding", 10.88], ["music", 9.45]]], "duration": [12.95, -0.36, 25.95]} \ No newline at end of file diff --git a/annotations_1/LRHNkBU6YWw_filtered.json b/annotations_1/LRHNkBU6YWw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3a096766ee95c4e6f505c78f2336a2289b8295a --- /dev/null +++ b/annotations_1/LRHNkBU6YWw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 55.21], [56.0, 56.15], [57.0, 57.21], [58.0, 60.37], [61.0, 64.86], [65.0, 67.1], [68.0, 68.82], [71.0, 71.59], [73.0, 73.77], [76.0, 76.96], [79.0, 81.06], [82.0, 84.05], [85.0, 85.65], [87.0, 88.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.04, 0.0, 0.0, 92.64, 99.36, 99.16, 0.0, 0.0, 0.0, 0.0, 99.84, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.21, 0.15, 0.21, 2.37, 3.86, 2.1, 0.82, 0.59, 0.77, 0.96, 2.06, 2.05, 0.65, 1.23]} \ No newline at end of file diff --git a/annotations_1/LRc6Awco5aU_filtered.json b/annotations_1/LRc6Awco5aU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5796d5c4464c07a91611c117f2a4144ebf7911f4 --- /dev/null +++ b/annotations_1/LRc6Awco5aU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.29], [12.0, 13.26], [16.0, 24.19], [25.0, 25.89], [29.0, 29.29], [35.0, 35.65], [37.0, 38.69], [40.0, 39.95], [41.0, 45.18], [47.0, 48.36], [50.0, 52.05], [54.0, 54.41], [57.0, 61.32], [64.0, 67.05], [72.0, 72.66], [77.0, 77.73], [79.0, 79.98], [81.0, 83.74], [84.0, 85.73], [88.0, 90.17], [97.0, 105.16], [106.0, 107.69], [109.0, 108.94], [111.0, 111.2], [113.0, 119.04], [121.0, 123.65], [127.0, 133.08], [135.0, 136.17], [138.0, 141.49], [144.0, 143.83], [146.0, 146.13], [147.0, 147.38], [150.0, 163.43], [165.0, 165.47], [167.0, 168.17], [172.0, 172.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.02, 0.0, 0.0, 0.0, 0.0, 0.0, 47.62, 0.0, 40.71, 0.0, 48.14, 74.6, 0.0, 0.0, 0.0, 77.53, 0.0, 43.18, 47.2, 0.0, 0.0, 0.0, 57.32, 61.77, 56.7, 0.0, 44.93, 0.0, 0.0, 0.0, 31.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 39.05], ["throbbing", 22.7], ["hum", 18.97]], null, null, null, null, null, [["music", 76.13], ["trance music", 3.52], ["electronic music", 3.4]], null, [["music", 43.7], ["throbbing", 18.24], ["hum", 4.76]], null, [["music", 16.04], ["animal", 12.62], ["livestock, farm animals, working animals", 7.95]], null, null, null, null, null, null, [["music", 47.81], ["speech", 14.07], ["musical instrument", 2.76]], [["hum", 28.99], ["music", 17.63], ["mains hum", 10.97]], null, null, null, null, null, null, null, [["music", 49.77], ["throbbing", 7.06], ["fart", 4.52]], null, null, null, [["music", 56.41], ["electronic music", 10.35], ["trance music", 6.96]], null, null, null], "duration": [0.29, 1.26, 8.19, 0.89, 0.29, 0.65, 1.69, -0.05, 4.18, 1.36, 2.05, 0.41, 4.32, 3.05, 0.66, 0.73, 0.98, 2.74, 1.73, 2.17, 8.16, 1.69, -0.06, 0.2, 6.04, 2.65, 6.08, 1.17, 3.49, -0.17, 0.13, 0.38, 13.43, 0.47, 1.17, 0.17]} \ No newline at end of file diff --git a/annotations_1/LSD1fq3xDA8_filtered.json b/annotations_1/LSD1fq3xDA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fcbbded0aaba4271e6fdfdc5450ab20beae6eafa --- /dev/null +++ b/annotations_1/LSD1fq3xDA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.17], [16.0, 18.96], [20.0, 44.47], [45.0, 46.99], [48.0, 49.2], [66.0, 66.41], [70.0, 78.33], [91.0, 91.62], [95.0, 101.16], [104.0, 105.04], [107.0, 107.06], [109.0, 110.35], [113.0, 116.6], [117.0, 118.84], [121.0, 122.34], [123.0, 124.5], [125.0, 127.14], [128.0, 129.27], [130.0, 132.24], [133.0, 135.51], [136.0, 145.94], [154.0, 176.59], [182.0, 186.26], [187.0, 190.53], [191.0, 193.21], [194.0, 196.26], [200.0, 201.31], [203.0, 206.02], [207.0, 210.3]], "keep_status": [false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [89.72, 97.33, 37.96, 0.0, 0.0, 0.0, 31.3, 0.0, 30.35, 0.0, 0.0, 0.0, 51.6, 0.0, 0.0, 0.0, 99.56, 0.0, 95.37, 87.19, 50.02, 30.42, 37.42, 74.44, 95.23, 93.91, 0.0, 99.97, 83.52], "audiomae_on_audioset": [null, null, [["wind chime", 19.87], ["chime", 18.47], ["music", 18.32]], null, null, null, [["music", 29.69], ["speech", 25.0], ["sidetone", 14.95]], null, [["speech", 30.65], ["vehicle", 11.38], ["livestock, farm animals, working animals", 8.25]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.66], ["hum", 5.57], ["musical instrument", 3.3]], [["music", 46.4], ["didgeridoo", 13.53], ["breaking", 6.98]], null, null, null, null, null, null], "duration": [6.17, 2.96, 24.47, 1.99, 1.2, 0.41, 8.33, 0.62, 6.16, 1.04, 0.06, 1.35, 3.6, 1.84, 1.34, 1.5, 2.14, 1.27, 2.24, 2.51, 9.94, 22.59, 4.26, 3.53, 2.21, 2.26, 1.31, 3.02, 3.3]} \ No newline at end of file diff --git a/annotations_1/LSTU_JJcJxQ_filtered.json b/annotations_1/LSTU_JJcJxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0869ee113af36586d3945b1d5bbf34d46eb12521 --- /dev/null +++ b/annotations_1/LSTU_JJcJxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 18.15], [24.0, 29.08], [30.0, 31.38], [32.0, 39.39], [41.0, 42.26], [45.0, 46.65], [48.0, 49.11], [50.0, 51.09], [52.0, 53.5], [56.0, 56.79], [61.0, 61.05], [62.0, 64.17], [66.0, 72.17], [74.0, 75.73], [76.0, 78.92], [80.0, 80.97], [82.0, 85.35], [87.0, 89.34], [91.0, 98.0], [98.0, 98.15], [99.0, 107.55], [108.0, 108.99], [114.0, 117.64], [118.0, 121.78], [122.0, 125.02], [126.0, 132.97], [135.0, 142.2], [144.0, 144.53], [145.0, 147.46], [149.0, 150.58], [151.0, 165.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [96.42, 42.39, 0.0, 95.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.9, 35.44, 0.0, 49.68, 0.0, 87.0, 40.31, 88.1, 0.0, 69.2, 0.0, 92.31, 50.86, 46.4, 31.58, 46.54, 0.0, 51.55, 0.0, 56.78], "audiomae_on_audioset": [null, [["hum", 47.21], ["mains hum", 28.37], ["speech", 13.86]], null, null, null, null, null, null, null, null, null, null, [["music", 20.88], ["fart", 9.25], ["arrow", 5.39]], null, [["speech", 40.09], ["music", 16.02], ["didgeridoo", 5.06]], null, null, [["music", 35.11], ["speech", 12.15], ["musical instrument", 5.57]], null, null, null, null, null, null, [["hum", 27.98], ["speech", 26.65], ["mains hum", 19.33]], [["mains hum", 22.24], ["speech", 21.71], ["music", 16.94]], [["music", 34.23], ["theremin", 27.29], ["speech", 11.3]], null, null, null, null], "duration": [15.15, 5.08, 1.38, 7.39, 1.26, 1.65, 1.11, 1.09, 1.5, 0.79, 0.05, 2.17, 6.17, 1.73, 2.92, 0.97, 3.35, 2.34, 7.0, 0.15, 8.55, 0.99, 3.64, 3.78, 3.02, 6.97, 7.2, 0.53, 2.46, 1.58, 14.33]} \ No newline at end of file diff --git a/annotations_1/LTfMvliqiGk_filtered.json b/annotations_1/LTfMvliqiGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..872d56a87b8492f36ea3ef9cfc8496fbb620dd52 --- /dev/null +++ b/annotations_1/LTfMvliqiGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.17], [21.0, 32.61], [36.0, 38.72], [41.0, 42.47], [45.0, 46.08], [49.0, 57.92], [59.0, 60.24], [61.0, 123.92], [126.0, 126.89], [128.0, 128.48], [131.0, 132.38]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [44.2, 37.05, 44.07, 0.0, 0.0, 31.71, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 30.99], ["music", 30.8], ["sidetone", 5.42]], [["speech", 47.91], ["hum", 15.8], ["music", 13.73]], [["music", 37.23], ["throbbing", 11.15], ["hum", 7.76]], null, null, [["whale vocalization", 44.7], ["speech", 21.4], ["music", 10.63]], null, null, null, null, null], "duration": [2.17, 11.61, 2.72, 1.47, 1.08, 8.92, 1.24, 62.92, 0.89, 0.48, 1.38]} \ No newline at end of file diff --git a/annotations_1/LTyelOWIGh0_filtered.json b/annotations_1/LTyelOWIGh0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e9a1091183b599a4be13c2102d18e1350f1d32f --- /dev/null +++ b/annotations_1/LTyelOWIGh0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 8.82], [9.0, 17.91], [20.0, 22.77], [27.0, 28.51], [34.0, 35.18], [37.0, 41.79], [44.0, 45.42], [46.0, 47.65], [49.0, 55.05], [59.0, 61.32], [63.0, 65.3], [66.0, 70.82], [72.0, 88.08], [89.0, 99.77], [101.0, 149.47], [150.0, 155.63], [156.0, 170.4], [173.0, 174.88], [176.0, 177.33], [178.0, 240.0], [241.0, 242.57], [243.0, 244.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [32.99, 28.99, 91.3, 0.0, 0.0, 62.78, 0.0, 0.0, 92.48, 99.4, 61.47, 28.42, 28.59, 30.12, 0.0, 30.05, 31.63, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 38.56], ["throbbing", 19.66], ["speech", 18.84]], [["hum", 27.18], ["music", 26.85], ["mains hum", 17.73]], null, null, null, null, null, null, null, null, null, [["speech", 37.6], ["explosion", 21.14], ["music", 7.27]], [["speech", 34.85], ["explosion", 34.57], ["eruption", 14.17]], [["hum", 54.26], ["throbbing", 16.42], ["mains hum", 9.75]], null, [["speech", 28.3], ["music", 10.21], ["vehicle", 5.87]], [["music", 64.49], ["whale vocalization", 8.92], ["scary music", 2.95]], null, null, null, null, null], "duration": [7.82, 8.91, 2.77, 1.51, 1.18, 4.79, 1.42, 1.65, 6.05, 2.32, 2.3, 4.82, 16.08, 10.77, 48.47, 5.63, 14.4, 1.88, 1.33, 62.0, 1.57, 1.75]} \ No newline at end of file diff --git a/annotations_1/LVGZy2YKAh8_filtered.json b/annotations_1/LVGZy2YKAh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b744a459cd4888ef8d4eafad2b55f5b09313521 --- /dev/null +++ b/annotations_1/LVGZy2YKAh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.59], [6.0, 6.4], [15.0, 16.31], [29.0, 31.18], [33.0, 34.48], [36.0, 38.38], [43.0, 44.98], [46.0, 47.7], [51.0, 58.29], [59.0, 60.59], [62.0, 80.62], [81.0, 82.56], [84.0, 164.27], [169.0, 169.35], [171.0, 172.59], [178.0, 191.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 82.97, 0.0, 81.53, 0.0, 0.0, 86.09, 0.0, 36.44, 0.0, 0.0, 0.0, 0.0, 39.41], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 31.0], ["hum", 21.03], ["throbbing", 20.74]], null, null, null, null, [["music", 34.23], ["synthesizer", 11.01], ["musical instrument", 7.02]]], "duration": [0.59, 0.4, 1.31, 2.18, 1.48, 2.38, 1.98, 1.7, 7.29, 1.59, 18.62, 1.56, 80.27, 0.35, 1.59, 13.71]} \ No newline at end of file diff --git a/annotations_1/LVbkD8ZogwA_filtered.json b/annotations_1/LVbkD8ZogwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1606e9fcfc5becd537fa184573c87d675f0e96de --- /dev/null +++ b/annotations_1/LVbkD8ZogwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 46.7], [48.0, 49.89], [51.0, 54.38], [59.0, 59.76], [61.0, 63.37], [67.0, 71.19], [72.0, 73.4], [79.0, 79.19], [80.0, 80.6], [88.0, 117.02], [121.0, 122.76], [129.0, 129.2]], "keep_status": [false, false, true, false, true, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 35.05, 0.0, 41.81, 37.92, 0.0, 0.0, 0.0, 37.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["fly, housefly", 11.05], ["cattle, bovinae", 8.98], ["hum", 8.13]], null, [["music", 36.53], ["musical instrument", 5.61], ["vehicle", 5.28]], [["music", 48.86], ["throbbing", 5.88], ["hum", 3.81]], null, null, null, [["speech", 37.79], ["hum", 14.47], ["music", 11.05]], null, null], "duration": [0.7, 1.89, 3.38, 0.76, 2.37, 4.19, 1.4, 0.19, 0.6, 29.02, 1.76, 0.2]} \ No newline at end of file diff --git a/annotations_1/LVvJj9sDilQ_filtered.json b/annotations_1/LVvJj9sDilQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d939fe845a39891af732560538aa6639765da7c --- /dev/null +++ b/annotations_1/LVvJj9sDilQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.46], [4.0, 3.87], [6.0, 6.07], [7.0, 7.35], [11.0, 12.01], [14.0, 14.98], [16.0, 16.82], [20.0, 19.97], [21.0, 24.88], [28.0, 34.8], [35.0, 35.45], [37.0, 36.98], [39.0, 43.75], [47.0, 48.63], [49.0, 54.87], [56.0, 56.94], [58.0, 66.21], [67.0, 68.2], [70.0, 72.37], [73.0, 75.66], [76.0, 78.0], [80.0, 80.47], [82.0, 90.69], [93.0, 94.17], [95.0, 96.58], [98.0, 99.39], [102.0, 105.0], [106.0, 108.31], [110.0, 114.49], [117.0, 128.71], [129.0, 131.94], [133.0, 133.0], [134.0, 134.42], [135.0, 135.78], [137.0, 137.73], [138.0, 139.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.21, 74.13, 0.0, 0.0, 100.0, 0.0, 55.53, 0.0, 61.77, 0.0, 94.07, 71.43, 63.31, 0.0, 52.68, 0.0, 0.0, 0.0, 100.0, 99.99, 100.0, 76.04, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, -0.13, 0.07, 0.35, 1.01, 0.98, 0.82, -0.03, 3.88, 6.8, 0.45, -0.02, 4.75, 1.63, 5.87, 0.94, 8.21, 1.2, 2.37, 2.66, 2.0, 0.47, 8.69, 1.17, 1.58, 1.39, 3.0, 2.31, 4.49, 11.71, 2.94, 0.0, 0.42, 0.78, 0.73, 1.26]} \ No newline at end of file diff --git a/annotations_1/LW8M-U3Q8ug_filtered.json b/annotations_1/LW8M-U3Q8ug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9d7d9d845e6d05192a1cfb1910bceb072eedcaa --- /dev/null +++ b/annotations_1/LW8M-U3Q8ug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.15], [11.0, 12.26], [16.0, 17.29], [20.0, 21.09], [22.0, 22.91], [23.0, 25.19], [26.0, 25.96], [28.0, 30.62], [31.0, 36.24], [38.0, 50.45], [55.0, 60.05], [62.0, 63.51], [68.0, 68.76], [71.0, 71.96], [74.0, 75.3], [77.0, 79.29], [84.0, 84.4], [87.0, 87.17], [88.0, 89.77], [91.0, 91.89], [93.0, 93.93], [96.0, 100.31], [102.0, 105.06], [108.0, 110.56], [112.0, 112.87], [115.0, 115.87], [118.0, 118.54], [121.0, 121.31], [123.0, 125.88], [127.0, 128.39], [130.0, 133.52], [136.0, 138.03], [144.0, 144.07], [147.0, 148.85], [150.0, 150.15], [152.0, 154.62]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 46.29, 38.04, 40.93, 69.47, 0.0, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 68.93, 87.55, 67.38, 0.0, 0.0, 0.0, 0.0, 78.38, 0.0, 72.31, 67.76, 0.0, 0.0, 0.0, 59.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 30.69], ["hum", 19.47], ["mains hum", 7.79]], [["rumble", 15.76], ["speech", 11.8], ["vehicle", 7.87]], [["hum", 50.21], ["mains hum", 14.85], ["rumble", 14.02]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.15, 1.26, 1.29, 1.09, 0.91, 2.19, -0.04, 2.62, 5.24, 12.45, 5.05, 1.51, 0.76, 0.96, 1.3, 2.29, 0.4, 0.17, 1.77, 0.89, 0.93, 4.31, 3.06, 2.56, 0.87, 0.87, 0.54, 0.31, 2.88, 1.39, 3.52, 2.03, 0.07, 1.85, 0.15, 2.62]} \ No newline at end of file diff --git a/annotations_1/LWIAWDjHhx4_filtered.json b/annotations_1/LWIAWDjHhx4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb3c258463ceed2d078974ab280898a9e3d4c5e4 --- /dev/null +++ b/annotations_1/LWIAWDjHhx4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.79], [6.0, 7.28], [11.0, 11.38], [13.0, 14.42], [17.0, 17.58], [21.0, 22.22], [24.0, 25.0], [27.0, 27.31], [35.0, 39.66], [41.0, 42.5], [46.0, 46.26], [50.0, 51.61], [52.0, 52.41], [59.0, 59.76], [62.0, 62.04], [69.0, 69.85], [73.0, 74.53], [78.0, 78.7], [80.0, 80.87], [82.0, 83.29], [85.0, 85.62], [88.0, 88.64], [89.0, 90.0], [92.0, 93.33], [94.0, 94.81], [96.0, 99.57], [101.0, 101.71], [104.0, 108.48], [110.0, 110.12], [113.0, 113.24], [115.0, 116.07], [116.0, 116.5], [117.0, 116.53], [117.0, 116.56], [117.0, 116.6], [117.0, 116.63], [122.0, 122.61], [124.0, 124.44], [127.0, 127.8], [129.0, 129.24], [130.0, 131.35], [132.0, 135.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 1.28, 0.38, 1.42, 0.58, 1.22, 1.0, 0.31, 4.66, 1.5, 0.26, 1.61, 0.41, 0.76, 0.04, 0.85, 1.53, 0.7, 0.87, 1.29, 0.62, 0.64, 1.0, 1.33, 0.81, 3.57, 0.71, 4.48, 0.12, 0.24, 1.07, 0.5, -0.47, -0.44, -0.4, -0.37, 0.61, 0.44, 0.8, 0.24, 1.35, 3.8]} \ No newline at end of file diff --git a/annotations_1/LWoKa0wYTJk_filtered.json b/annotations_1/LWoKa0wYTJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ea554694e2553f461da808f92baf80cf1c57d1c --- /dev/null +++ b/annotations_1/LWoKa0wYTJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.9], [11.0, 17.61], [25.0, 27.9], [29.0, 29.71], [33.0, 34.53], [36.0, 37.44], [39.0, 40.32], [41.0, 45.74], [47.0, 47.73], [52.0, 52.49], [56.0, 60.59], [62.0, 62.24], [64.0, 65.47], [66.0, 69.74], [71.0, 71.68]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.13, 33.7, 36.46, 0.0, 0.0, 0.0, 0.0, 35.87, 0.0, 0.0, 45.27, 0.0, 0.0, 41.03, 0.0], "audiomae_on_audioset": [[["siren", 20.94], ["civil defense siren", 19.37], ["theremin", 16.46]], [["cattle, bovinae", 31.32], ["moo", 23.6], ["livestock, farm animals, working animals", 13.02]], [["insect", 33.82], ["fly, housefly", 28.48], ["bee, wasp, etc.", 17.63]], null, null, null, null, [["fly, housefly", 41.97], ["bee, wasp, etc.", 29.18], ["insect", 28.63]], null, null, [["fly, housefly", 43.9], ["insect", 39.06], ["bee, wasp, etc.", 16.3]], null, null, [["fly, housefly", 37.11], ["insect", 28.52], ["bee, wasp, etc.", 6.93]], null], "duration": [2.9, 6.61, 2.9, 0.71, 1.53, 1.44, 1.32, 4.74, 0.73, 0.49, 4.59, 0.24, 1.47, 3.74, 0.68]} \ No newline at end of file diff --git a/annotations_1/LWvcLI0lcFQ_filtered.json b/annotations_1/LWvcLI0lcFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be6463b67d1b8ed7e99e16e1083e478642fcdad3 --- /dev/null +++ b/annotations_1/LWvcLI0lcFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.65], [17.0, 17.41], [18.0, 18.54], [23.0, 24.41], [28.0, 28.24], [33.0, 33.94], [35.0, 35.83], [39.0, 39.85], [41.0, 41.55], [46.0, 47.02], [49.0, 49.57], [52.0, 53.47], [59.0, 59.95], [61.0, 66.97], [68.0, 71.17], [72.0, 74.43], [75.0, 74.58], [75.0, 91.71], [92.0, 99.27], [100.0, 100.92], [101.0, 105.48], [109.0, 116.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.38, 98.36, 99.36, 0.0, 53.53, 42.06, 0.0, 49.27, 40.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["dog", 14.82], ["animal", 12.65], ["domestic animals, pets", 10.31]], null, null, null, null, [["music", 60.21], ["speech", 9.67], ["hum", 8.95]], null, [["music", 27.65], ["speech", 21.11], ["musical instrument", 5.82]], [["speech", 40.48], ["music", 35.26], ["drum machine", 3.34]]], "duration": [0.65, 0.41, 0.54, 1.41, 0.24, 0.94, 0.83, 0.85, 0.55, 1.02, 0.57, 1.47, 0.95, 5.97, 3.17, 2.43, -0.42, 16.71, 7.27, 0.92, 4.48, 7.67]} \ No newline at end of file diff --git a/annotations_1/LZ6HA66dXVw_filtered.json b/annotations_1/LZ6HA66dXVw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fb4dd788dc19c5dd8a631e5d2f9d1301756a6c1 --- /dev/null +++ b/annotations_1/LZ6HA66dXVw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.51], [15.0, 15.4], [19.0, 23.65], [25.0, 41.77], [45.0, 53.47], [64.0, 64.83], [68.0, 68.61], [69.0, 70.26], [71.0, 78.92], [80.0, 80.55], [86.0, 87.34], [88.0, 91.2], [92.0, 94.39], [95.0, 100.99], [102.0, 107.72], [108.0, 114.81], [116.0, 115.79], [119.0, 119.03], [119.0, 120.56], [122.0, 125.54], [127.0, 127.95], [129.0, 161.5]], "keep_status": [true, false, true, true, true, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [33.77, 0.0, 29.36, 30.08, 28.95, 0.0, 0.0, 0.0, 32.32, 0.0, 0.0, 78.04, 35.23, 33.33, 30.45, 31.43, 0.0, 0.0, 0.0, 34.02, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 20.34], ["eruption", 16.74], ["mains hum", 11.48]], null, [["speech", 36.09], ["sidetone", 11.62], ["bee, wasp, etc.", 5.41]], [["hum", 27.41], ["music", 26.14], ["sidetone", 14.87]], [["speech", 45.97], ["helicopter", 13.17], ["hum", 9.6]], null, null, null, [["whale vocalization", 31.81], ["music", 22.22], ["fly, housefly", 6.43]], null, null, null, [["music", 15.91], ["whale vocalization", 12.91], ["synthesizer", 5.45]], [["whale vocalization", 42.55], ["music", 12.21], ["hum", 8.2]], [["whale vocalization", 44.12], ["hum", 21.76], ["music", 13.48]], [["speech", 52.78], ["music", 26.87], ["gong", 4.34]], null, null, null, [["music", 45.3], ["hum", 15.86], ["throbbing", 13.78]], null, null], "duration": [2.51, 0.4, 4.65, 16.77, 8.47, 0.83, 0.61, 1.26, 7.92, 0.55, 1.34, 3.2, 2.39, 5.99, 5.72, 6.81, -0.21, 0.03, 1.56, 3.54, 0.95, 32.5]} \ No newline at end of file diff --git a/annotations_1/LZ7Thv4ztjg_filtered.json b/annotations_1/LZ7Thv4ztjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea8bdfb6b40a48cada300171825f9a3415fa5c1d --- /dev/null +++ b/annotations_1/LZ7Thv4ztjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.98], [16.0, 16.82], [18.0, 25.29], [27.0, 27.7], [49.0, 49.0], [63.0, 62.9], [64.0, 64.52], [81.0, 81.23], [89.0, 92.06], [99.0, 101.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 32.4, 31.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 32.72], ["music", 27.0], ["boing", 11.59]], [["music", 38.03], ["boing", 26.4], ["speech", 20.17]]], "duration": [0.98, 0.82, 7.29, 0.7, 0.0, -0.1, 0.52, 0.23, 3.06, 2.6]} \ No newline at end of file diff --git a/annotations_1/L_0imHGhC3o_filtered.json b/annotations_1/L_0imHGhC3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..556414cd6ff7d25875b0758c9ef3d84439edbb42 --- /dev/null +++ b/annotations_1/L_0imHGhC3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 26.45], [28.0, 45.86], [46.0, 52.19], [55.0, 61.2], [62.0, 71.1], [71.0, 73.25], [74.0, 74.17], [75.0, 77.7], [80.0, 83.0], [84.0, 89.63], [90.0, 90.95], [96.0, 96.21], [100.0, 101.65], [104.0, 104.85], [109.0, 109.36], [114.0, 115.05], [116.0, 119.33]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.42, 36.77, 96.54, 92.97, 67.38, 90.43, 0.0, 99.21, 99.48, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.86], "audiomae_on_audioset": [[["hum", 42.87], ["music", 13.51], ["throbbing", 10.6]], [["hum", 21.09], ["electric shaver, electric razor", 13.83], ["music", 12.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [25.45, 17.86, 6.19, 6.2, 9.1, 2.25, 0.17, 2.7, 3.0, 5.63, 0.95, 0.21, 1.65, 0.85, 0.36, 1.05, 3.33]} \ No newline at end of file diff --git a/annotations_1/L_l2ii_25tc_filtered.json b/annotations_1/L_l2ii_25tc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..016a4658969ffee1d8c9b1aababa6b23c4a00ead --- /dev/null +++ b/annotations_1/L_l2ii_25tc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.29], [27.0, 28.92], [32.0, 33.52], [41.0, 44.63], [50.0, 52.42], [58.0, 60.3], [61.0, 61.86], [64.0, 64.05], [79.0, 79.2], [81.0, 81.53], [82.0, 87.32], [87.0, 94.14], [97.0, 98.14], [101.0, 101.07], [101.0, 101.11], [102.0, 110.96], [111.0, 111.05], [111.0, 119.79], [123.0, 133.03], [136.0, 189.33], [192.0, 213.31], [215.0, 223.11], [237.0, 238.94], [239.0, 238.98], [261.0, 262.21], [268.0, 270.65], [273.0, 274.46], [285.0, 285.35], [286.0, 286.31]], "keep_status": [false, false, false, true, true, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, true, false, false, false, true, false, false, false], "silence_prob": [41.22, 0.0, 0.0, 44.26, 42.42, 41.03, 0.0, 0.0, 0.0, 0.0, 33.63, 100.0, 0.0, 0.0, 0.0, 41.78, 0.0, 31.59, 30.7, 0.0, 43.48, 37.32, 0.0, 0.0, 0.0, 34.71, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 64.32], ["glockenspiel", 5.98], ["tubular bells", 4.61]], null, null, [["speech", 13.49], ["music", 11.82], ["singing bowl", 9.05]], [["music", 28.68], ["glockenspiel", 12.6], ["mallet percussion", 9.01]], [["music", 35.87], ["percussion", 14.75], ["musical instrument", 6.84]], null, null, null, null, [["cattle, bovinae", 21.53], ["moo", 20.1], ["speech", 15.67]], null, null, null, null, [["music", 73.68], ["echo", 3.85], ["speech", 3.62]], null, [["trombone", 37.03], ["music", 32.65], ["brass instrument", 16.25]], [["music", 31.32], ["clarinet", 19.08], ["brass instrument", 10.32]], null, [["music", 28.45], ["livestock, farm animals, working animals", 15.68], ["cattle, bovinae", 8.43]], [["music", 27.36], ["glockenspiel", 19.23], ["marimba, xylophone", 14.22]], null, null, null, [["music", 61.37], ["clock", 3.23], ["tick-tock", 2.87]], null, null, null], "duration": [7.29, 1.92, 1.52, 3.63, 2.42, 2.3, 0.86, 0.05, 0.2, 0.53, 5.32, 7.14, 1.14, 0.07, 0.11, 8.96, 0.05, 8.79, 10.03, 53.33, 21.31, 8.11, 1.94, -0.02, 1.21, 2.65, 1.46, 0.35, 0.31]} \ No newline at end of file diff --git a/annotations_1/LagXmjL6EeM_filtered.json b/annotations_1/LagXmjL6EeM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81ce92765b0ed0c2d1625d99f8a8fc68dc05749f --- /dev/null +++ b/annotations_1/LagXmjL6EeM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.92], [2.0, 127.38], [129.0, 141.61], [143.0, 143.75], [145.0, 145.44]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.07, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 31.1], ["throbbing", 25.77], ["heart sounds, heartbeat", 17.08]], null, null], "duration": [-0.08, 125.38, 12.61, 0.75, 0.44]} \ No newline at end of file diff --git a/annotations_1/LahMUQTEbcY_filtered.json b/annotations_1/LahMUQTEbcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c911893794f77e0d0e106fd79154afa0fd82a866 --- /dev/null +++ b/annotations_1/LahMUQTEbcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 52.95], [53.0, 98.39], [108.0, 112.67], [120.0, 122.42], [123.0, 125.68], [127.0, 128.36], [130.0, 137.08], [142.0, 146.43], [148.0, 170.38]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.82, 55.96, 54.43, 0.0, 37.95, 37.17, 39.31], "audiomae_on_audioset": [null, null, [["didgeridoo", 47.96], ["music", 22.89], ["throbbing", 8.02]], null, null, null, [["music", 65.21], ["throbbing", 10.52], ["hum", 5.53]], [["throbbing", 32.29], ["music", 23.33], ["hum", 15.09]], [["music", 65.84], ["ambient music", 5.72], ["throbbing", 4.94]]], "duration": [50.95, 45.39, 4.67, 2.42, 2.68, 1.36, 7.08, 4.43, 22.38]} \ No newline at end of file diff --git a/annotations_1/LauRAuoFO0U_filtered.json b/annotations_1/LauRAuoFO0U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3047ce6ab05a4453e9ca4187183d532a4e6837c --- /dev/null +++ b/annotations_1/LauRAuoFO0U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.8], [17.0, 21.17], [23.0, 24.04], [28.0, 28.81], [33.0, 32.85], [40.0, 45.4], [52.0, 52.54], [57.0, 58.08], [61.0, 60.84], [62.0, 62.07], [63.0, 63.53], [65.0, 65.85], [67.0, 73.55], [77.0, 77.87], [83.0, 84.05], [86.0, 86.27], [88.0, 89.92], [90.0, 89.99], [91.0, 92.74], [98.0, 98.71], [100.0, 100.99], [103.0, 103.57], [105.0, 107.06], [108.0, 108.95], [110.0, 110.57], [112.0, 112.94], [115.0, 115.92], [116.0, 117.98], [119.0, 120.83], [122.0, 122.64], [123.0, 123.99], [126.0, 126.76], [129.0, 129.52], [132.0, 132.58]], "keep_status": [true, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.93, 49.31, 0.0, 0.0, 0.0, 34.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 15.14], ["speech", 12.49], ["crowd", 11.4]], [["music", 28.33], ["hum", 7.1], ["throbbing", 6.76]], null, null, null, [["boing", 22.07], ["noise", 21.68], ["speech", 13.35]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.8, 4.17, 1.04, 0.81, -0.15, 5.4, 0.54, 1.08, -0.16, 0.07, 0.53, 0.85, 6.55, 0.87, 1.05, 0.27, 1.92, -0.01, 1.74, 0.71, 0.99, 0.57, 2.06, 0.95, 0.57, 0.94, 0.92, 1.98, 1.83, 0.64, 0.99, 0.76, 0.52, 0.58]} \ No newline at end of file diff --git a/annotations_1/LbCGyHkR0ko_filtered.json b/annotations_1/LbCGyHkR0ko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53a2d2b636aad9bacd37965ca6cc72ca0bf4bc33 --- /dev/null +++ b/annotations_1/LbCGyHkR0ko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 77.5], [82.0, 84.82], [88.0, 119.16], [121.0, 124.65], [125.0, 125.95], [129.0, 136.11], [139.0, 141.2], [143.0, 145.76], [147.0, 149.08], [150.0, 156.51], [158.0, 159.93], [160.0, 168.76], [170.0, 171.61]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 39.33, 0.0, 100.0, 0.0, 100.0, 100.0, 100.0, 100.0, 99.85, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, [["music", 36.73], ["gong", 16.89], ["hum", 7.02]], null, null, null, null, null, null, null, null, null, null, null], "duration": [53.5, 2.82, 31.16, 3.65, 0.95, 7.11, 2.2, 2.76, 2.08, 6.51, 1.93, 8.76, 1.61]} \ No newline at end of file diff --git a/annotations_1/Ld8KOUtkHHY_filtered.json b/annotations_1/Ld8KOUtkHHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/Ld8KOUtkHHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/LdRoFo6JuNs_filtered.json b/annotations_1/LdRoFo6JuNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0de1a5ee13d574f30c51a7c2bff754954c46ead --- /dev/null +++ b/annotations_1/LdRoFo6JuNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.77], [13.0, 14.08], [15.0, 26.84], [28.0, 29.64], [34.0, 39.46], [41.0, 44.69], [46.0, 48.51], [50.0, 52.25], [53.0, 53.54], [54.0, 55.09], [58.0, 71.58], [76.0, 79.79], [81.0, 81.87], [83.0, 83.76], [87.0, 99.23], [100.0, 100.95], [102.0, 124.16], [128.0, 128.98], [131.0, 132.56], [134.0, 134.81], [135.0, 135.72], [139.0, 139.8], [142.0, 145.1], [149.0, 150.57], [152.0, 154.13]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 27.98, 0.0, 28.03, 49.22, 49.27, 42.04, 0.0, 0.0, 28.05, 36.0, 0.0, 0.0, 27.88, 0.0, 27.93, 0.0, 0.0, 0.0, 0.0, 0.0, 58.89, 0.0, 86.82], "audiomae_on_audioset": [null, null, [["music", 59.7], ["speech", 15.76], ["musical instrument", 4.16]], null, [["music", 51.21], ["buzz", 9.46], ["electric shaver, electric razor", 3.2]], [["music", 65.71], ["throbbing", 2.82], ["synthesizer", 2.8]], [["music", 48.61], ["didgeridoo", 33.16], ["musical instrument", 2.63]], [["music", 38.28], ["throbbing", 11.02], ["hum", 10.31]], null, null, [["music", 53.99], ["speech", 29.56], ["buzz", 1.2]], [["music", 64.07], ["throbbing", 5.9], ["didgeridoo", 4.74]], null, null, [["music", 53.2], ["hum", 8.33], ["mains hum", 7.73]], null, [["music", 31.73], ["livestock, farm animals, working animals", 7.18], ["electric shaver, electric razor", 7.03]], null, null, null, null, null, null, null, null], "duration": [-0.23, 1.08, 11.84, 1.64, 5.46, 3.69, 2.51, 2.25, 0.54, 1.09, 13.58, 3.79, 0.87, 0.76, 12.23, 0.95, 22.16, 0.98, 1.56, 0.81, 0.72, 0.8, 3.1, 1.57, 2.13]} \ No newline at end of file diff --git a/annotations_1/LehcJeNbFBw_filtered.json b/annotations_1/LehcJeNbFBw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf399f7a59cdf8857ae0334a10baa57ceb635311 --- /dev/null +++ b/annotations_1/LehcJeNbFBw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.24], [2.0, 2.2], [3.0, 3.01], [7.0, 9.1], [11.0, 14.5], [18.0, 19.47], [21.0, 21.96], [22.0, 23.06], [23.0, 23.7], [26.0, 28.46], [32.0, 32.95], [35.0, 34.94], [36.0, 37.05], [38.0, 39.01], [49.0, 49.72], [56.0, 61.1], [61.0, 62.95], [64.0, 68.52], [72.0, 75.22], [80.0, 80.64], [93.0, 115.42], [120.0, 125.46], [128.0, 134.05], [136.0, 150.57], [153.0, 153.93], [158.0, 158.33], [162.0, 163.53], [164.0, 164.15], [165.0, 165.1], [169.0, 169.28], [174.0, 176.82], [192.0, 192.13], [192.0, 192.4], [196.0, 196.52]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.31, 40.86, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 0.0, 0.0, 0.0, 0.0, 36.66, 0.0, 34.07, 33.32, 0.0, 30.55, 35.68, 31.36, 33.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.58, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 40.54], ["bell", 15.79], ["cowbell", 5.63]], [["music", 20.06], ["singing bowl", 13.18], ["effects unit", 11.61]], null, null, null, null, null, null, null, null, null, null, [["music", 49.1], ["speech", 14.71], ["musical instrument", 5.29]], null, [["music", 56.64], ["clip-clop", 19.44], ["horse", 10.62]], [["music", 35.23], ["speech", 22.16], ["theremin", 5.15]], null, [["music", 31.82], ["quack", 26.88], ["speech", 20.2]], [["music", 41.57], ["speech", 28.64], ["musical instrument", 3.25]], [["foghorn", 39.62], ["music", 16.9], ["trombone", 16.13]], [["music", 43.98], ["brass instrument", 12.9], ["speech", 11.96]], null, null, null, null, null, null, [["moo", 31.34], ["cattle, bovinae", 28.15], ["livestock, farm animals, working animals", 11.79]], null, null, null], "duration": [0.24, 0.2, 0.01, 2.1, 3.5, 1.47, 0.96, 1.06, 0.7, 2.46, 0.95, -0.06, 1.05, 1.01, 0.72, 5.1, 1.95, 4.52, 3.22, 0.64, 22.42, 5.46, 6.05, 14.57, 0.93, 0.33, 1.53, 0.15, 0.1, 0.28, 2.82, 0.13, 0.4, 0.52]} \ No newline at end of file diff --git a/annotations_1/LfL2xCfIMIU_filtered.json b/annotations_1/LfL2xCfIMIU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5ee04a82a0e4decc2370c56e36dd8fd3d467b80 --- /dev/null +++ b/annotations_1/LfL2xCfIMIU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.18], [13.0, 16.56], [18.0, 25.25], [33.0, 53.54], [54.0, 54.45], [54.0, 54.82], [55.0, 61.94], [66.0, 111.57], [115.0, 121.83]], "keep_status": [false, true, true, true, false, false, false, false, true], "silence_prob": [0.0, 44.66, 31.86, 32.48, 0.0, 0.0, 33.9, 0.0, 36.62], "audiomae_on_audioset": [null, [["music", 25.85], ["hiccup", 14.46], ["thunk", 9.66]], [["speech", 31.91], ["throbbing", 14.83], ["music", 14.7]], [["whack, thwack", 24.09], ["music", 16.89], ["groan", 9.63]], null, null, [["throbbing", 46.65], ["hum", 28.66], ["music", 6.02]], null, [["music", 43.89], ["hum", 9.69], ["soundtrack music", 4.26]]], "duration": [0.18, 3.56, 7.25, 20.54, 0.45, 0.82, 6.94, 45.57, 6.83]} \ No newline at end of file diff --git a/annotations_1/LgKIQbxZZgY_filtered.json b/annotations_1/LgKIQbxZZgY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8b80654b9fc4e2a4bd531d404b2d1557e00d2e0 --- /dev/null +++ b/annotations_1/LgKIQbxZZgY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.08], [7.0, 9.56], [11.0, 14.2], [15.0, 27.3], [34.0, 36.8], [38.0, 38.55], [41.0, 42.67], [52.0, 55.58], [57.0, 91.81], [93.0, 98.36], [101.0, 108.84], [111.0, 112.21], [116.0, 120.73], [121.0, 122.57], [124.0, 124.75], [125.0, 128.49], [131.0, 147.31]], "keep_status": [false, false, false, true, true, false, false, true, false, true, false, false, true, false, false, true, true], "silence_prob": [0.0, 68.8, 39.57, 34.46, 35.01, 0.0, 0.0, 47.27, 0.0, 35.74, 40.55, 0.0, 37.24, 0.0, 0.0, 39.91, 35.19], "audiomae_on_audioset": [null, null, [["hum", 46.54], ["mains hum", 19.59], ["music", 9.5]], [["speech", 14.83], ["hum", 14.54], ["buzz", 13.05]], [["hum", 22.92], ["mains hum", 19.34], ["music", 14.88]], null, null, [["music", 26.66], ["mains hum", 14.2], ["hum", 9.75]], null, [["speech", 39.24], ["music", 26.08], ["fly, housefly", 4.28]], [["hum", 40.7], ["mains hum", 34.3], ["whale vocalization", 5.61]], null, [["fly, housefly", 31.31], ["insect", 19.26], ["mosquito", 8.1]], null, null, [["music", 20.06], ["speech", 13.43], ["hum", 13.31]], [["whale vocalization", 32.66], ["hum", 12.67], ["noise", 9.37]]], "duration": [1.08, 2.56, 3.2, 12.3, 2.8, 0.55, 1.67, 3.58, 34.81, 5.36, 7.84, 1.21, 4.73, 1.57, 0.75, 3.49, 16.31]} \ No newline at end of file diff --git a/annotations_1/LgNSetWhfhw_filtered.json b/annotations_1/LgNSetWhfhw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b69f6992e6fa795c9ccc4369e2970521dbee2ca9 --- /dev/null +++ b/annotations_1/LgNSetWhfhw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.72], [19.0, 21.54], [22.0, 23.16], [24.0, 24.87], [28.0, 29.05], [32.0, 32.81], [37.0, 37.64], [43.0, 43.5], [44.0, 44.63], [49.0, 49.96], [69.0, 71.66], [75.0, 78.81], [81.0, 86.0], [88.0, 100.53], [102.0, 109.24], [111.0, 125.63], [127.0, 129.51], [131.0, 135.75], [137.0, 137.84], [139.0, 141.78]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.68, 72.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.51, 57.25, 99.1, 99.91, 99.95, 100.0, 99.99, 100.0, 0.0, 100.0], "audiomae_on_audioset": [[["music", 40.23], ["brass instrument", 16.36], ["trumpet", 9.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.72, 2.54, 1.16, 0.87, 1.05, 0.81, 0.64, 0.5, 0.63, 0.96, 2.66, 3.81, 5.0, 12.53, 7.24, 14.63, 2.51, 4.75, 0.84, 2.78]} \ No newline at end of file diff --git a/annotations_1/Lgpg6frCrvw_filtered.json b/annotations_1/Lgpg6frCrvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94b7fd31871f18c66005b3e5bd88b13455770fb3 --- /dev/null +++ b/annotations_1/Lgpg6frCrvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.18], [12.0, 14.28], [16.0, 24.43], [25.0, 26.54], [28.0, 29.08], [30.0, 32.22], [35.0, 40.17], [44.0, 51.06], [52.0, 53.37], [55.0, 66.04], [67.0, 67.96], [68.0, 76.42], [79.0, 83.96], [87.0, 88.79], [91.0, 104.16], [107.0, 119.06], [121.0, 147.46], [148.0, 152.27], [153.0, 170.06], [171.0, 171.9], [173.0, 173.28], [175.0, 175.04], [176.0, 176.82], [180.0, 212.25], [215.0, 218.03], [219.0, 218.93], [219.0, 219.57]], "keep_status": [false, true, false, false, false, false, true, true, false, false, false, true, true, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 41.58, 38.97, 0.0, 0.0, 44.01, 39.98, 29.86, 0.0, 30.25, 0.0, 31.44, 31.66, 0.0, 30.55, 30.33, 30.73, 32.02, 31.08, 0.0, 0.0, 0.0, 0.0, 0.0, 31.71, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 20.25], ["rumble", 12.62], ["throbbing", 10.09]], [["hum", 48.85], ["mains hum", 37.4], ["throbbing", 5.02]], null, null, [["speech", 33.32], ["music", 26.81], ["hum", 9.94]], [["music", 34.2], ["speech", 18.61], ["throbbing", 15.21]], [["music", 39.97], ["hum", 17.72], ["throbbing", 10.39]], null, [["music", 45.43], ["speech", 23.89], ["buzz", 2.78]], null, [["speech", 35.84], ["buzz", 11.02], ["music", 10.25]], [["speech", 39.72], ["music", 21.23], ["electric shaver, electric razor", 6.84]], null, [["music", 61.44], ["boing", 5.9], ["speech", 4.25]], [["music", 58.44], ["speech", 10.05], ["throbbing", 4.85]], [["music", 66.82], ["speech", 7.17], ["buzz", 5.92]], [["music", 60.3], ["boing", 8.06], ["speech", 6.8]], [["music", 31.51], ["speech", 10.14], ["fart", 7.16]], null, null, null, null, null, [["music", 21.01], ["speech", 14.38], ["mosquito", 13.11]], null, null], "duration": [1.18, 2.28, 8.43, 1.54, 1.08, 2.22, 5.17, 7.06, 1.37, 11.04, 0.96, 8.42, 4.96, 1.79, 13.16, 12.06, 26.46, 4.27, 17.06, 0.9, 0.28, 0.04, 0.82, 32.25, 3.03, -0.07, 0.57]} \ No newline at end of file diff --git a/annotations_1/Lh3y_KLTwWc_filtered.json b/annotations_1/Lh3y_KLTwWc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cc003cbe1d3e4b6789f2907ea436fd727a2f4e4 --- /dev/null +++ b/annotations_1/Lh3y_KLTwWc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.61], [17.0, 17.39], [27.0, 26.92], [27.0, 27.95], [30.0, 55.78], [58.0, 70.75], [72.0, 77.79], [79.0, 83.79], [89.0, 90.49], [95.0, 104.09], [110.0, 113.27]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.52, 35.71, 33.66, 34.56, 0.0, 43.15, 38.52], "audiomae_on_audioset": [null, null, null, null, [["music", 71.24], ["didgeridoo", 2.81], ["speech", 1.68]], [["music", 54.38], ["speech", 19.4], ["hum", 4.65]], [["throbbing", 38.6], ["music", 21.21], ["hum", 16.47]], [["music", 72.36], ["speech", 6.71], ["didgeridoo", 5.53]], null, [["music", 57.66], ["livestock, farm animals, working animals", 5.26], ["throbbing", 3.32]], [["music", 44.22], ["hum", 19.7], ["mains hum", 13.43]]], "duration": [-0.39, 0.39, -0.08, 0.95, 25.78, 12.75, 5.79, 4.79, 1.49, 9.09, 3.27]} \ No newline at end of file diff --git a/annotations_1/LiAiWknkwcc_filtered.json b/annotations_1/LiAiWknkwcc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ccd39992de39512de59e634f2ecea7d05f434f3 --- /dev/null +++ b/annotations_1/LiAiWknkwcc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.73], [9.0, 9.61], [11.0, 11.31], [13.0, 14.67], [27.0, 28.49], [29.0, 29.83], [37.0, 37.71], [39.0, 43.01], [48.0, 49.45], [53.0, 54.31], [57.0, 57.92], [60.0, 61.23], [62.0, 62.83], [69.0, 69.11], [75.0, 76.5], [77.0, 77.97], [79.0, 80.06], [81.0, 81.68], [97.0, 97.09], [102.0, 103.3], [105.0, 105.66], [110.0, 111.11], [112.0, 114.1], [116.0, 124.95], [126.0, 127.31], [128.0, 129.22], [130.0, 130.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.02, 31.17, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["sine wave", 11.23], ["inside, small room", 11.03], ["animal", 10.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 61.03], ["fart", 4.0], ["beatboxing", 2.89]], [["speech", 23.15], ["inside, small room", 13.09], ["animal", 10.46]], null, null, null], "duration": [0.73, 0.61, 0.31, 1.67, 1.49, 0.83, 0.71, 4.01, 1.45, 1.31, 0.92, 1.23, 0.83, 0.11, 1.5, 0.97, 1.06, 0.68, 0.09, 1.3, 0.66, 1.11, 2.1, 8.95, 1.31, 1.22, 0.94]} \ No newline at end of file diff --git a/annotations_1/LiODoFVKD40_filtered.json b/annotations_1/LiODoFVKD40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9bb533d098a8f7dce2a5f96c36e73db816f5427 --- /dev/null +++ b/annotations_1/LiODoFVKD40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.19], [24.0, 26.08], [29.0, 38.74], [39.0, 38.89], [41.0, 41.61], [42.0, 42.23], [42.0, 42.67], [45.0, 47.36], [50.0, 51.07], [62.0, 62.85], [64.0, 70.34], [73.0, 72.66], [89.0, 89.9], [106.0, 107.38], [108.0, 108.72], [118.0, 119.85], [128.0, 130.92], [134.0, 137.94], [149.0, 159.7]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 44.2, 85.54, 0.0, 0.0, 0.0, 0.0, 72.75, 0.0, 0.0, 40.4, 0.0, 0.0, 0.0, 0.0, 0.0, 39.07, 37.96, 31.76], "audiomae_on_audioset": [null, [["thunk", 31.85], ["music", 16.22], ["speech", 15.8]], null, null, null, null, null, null, null, null, [["music", 50.5], ["boing", 16.76], ["theremin", 11.79]], null, null, null, null, null, [["speech", 41.74], ["music", 23.03], ["boing", 6.63]], [["music", 32.13], ["fly, housefly", 9.84], ["insect", 6.97]], [["music", 78.06], ["boing", 3.11], ["sampler", 1.33]]], "duration": [0.19, 2.08, 9.74, -0.11, 0.61, 0.23, 0.67, 2.36, 1.07, 0.85, 6.34, -0.34, 0.9, 1.38, 0.72, 1.85, 2.92, 3.94, 10.7]} \ No newline at end of file diff --git a/annotations_1/LiioO2L5ZA4_filtered.json b/annotations_1/LiioO2L5ZA4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e91f85e42e0e96314f74491e8677c98814f49ec --- /dev/null +++ b/annotations_1/LiioO2L5ZA4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.12], [5.0, 6.83], [9.0, 9.68], [12.0, 12.29], [14.0, 14.12], [15.0, 15.52], [23.0, 23.04], [32.0, 32.19], [43.0, 44.63], [47.0, 48.14], [49.0, 49.32], [50.0, 50.72], [55.0, 55.34], [56.0, 56.35], [57.0, 57.48], [65.0, 65.62], [66.0, 67.32], [70.0, 69.85], [70.0, 70.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.12, 1.83, 0.68, 0.29, 0.12, 0.52, 0.04, 0.19, 1.63, 1.14, 0.32, 0.72, 0.34, 0.35, 0.48, 0.62, 1.32, -0.15, 0.58]} \ No newline at end of file diff --git a/annotations_1/Lk2gIdLgwz4_filtered.json b/annotations_1/Lk2gIdLgwz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0a489308718b736b6059e287a535164f101a57d --- /dev/null +++ b/annotations_1/Lk2gIdLgwz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.0], [2.0, 8.04], [8.0, 8.07], [8.0, 8.45], [9.0, 9.64], [10.0, 10.62], [13.0, 15.09], [20.0, 22.3], [30.0, 32.49], [35.0, 36.49], [47.0, 47.65], [49.0, 49.6], [50.0, 51.75], [53.0, 53.91], [58.0, 60.24], [61.0, 62.95], [72.0, 72.4], [84.0, 87.71], [89.0, 88.64], [89.0, 88.72], [98.0, 98.51], [100.0, 100.82], [102.0, 101.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.94, 0.0, 0.0, 0.0, 0.0, 34.78, 65.44, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 61.37, 0.0, 0.0, 60.7, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 46.99], ["mains hum", 21.18], ["speech", 7.15]], null, null, null, null, [["noise", 39.89], ["music", 22.83], ["speech", 10.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 6.04, 0.07, 0.45, 0.64, 0.62, 2.09, 2.3, 2.49, 1.49, 0.65, 0.6, 1.75, 0.91, 2.24, 1.95, 0.4, 3.71, -0.36, -0.28, 0.51, 0.82, -0.13]} \ No newline at end of file diff --git a/annotations_1/LlK6pn4qyrc_filtered.json b/annotations_1/LlK6pn4qyrc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b81148b24dcf188d0d0bef0729832a71b93b2f4e --- /dev/null +++ b/annotations_1/LlK6pn4qyrc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.8], [12.0, 19.38], [21.0, 24.24], [36.0, 36.85], [39.0, 39.61], [42.0, 42.89], [47.0, 49.65], [56.0, 56.79], [60.0, 60.54], [63.0, 63.29], [64.0, 63.95], [65.0, 67.31], [69.0, 69.38], [73.0, 73.08], [78.0, 78.43], [79.0, 79.17], [80.0, 90.69], [92.0, 96.53], [99.0, 100.06], [101.0, 101.58], [108.0, 108.13], [111.0, 123.79], [128.0, 128.8], [144.0, 145.74], [148.0, 153.98], [155.0, 155.38], [158.0, 159.06], [162.0, 164.29], [167.0, 167.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 67.38, 99.8, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 57.32, 97.92, 0.0, 0.0, 0.0, 28.72, 0.0, 0.0, 94.07, 0.0, 0.0, 58.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.18], ["music", 20.31], ["throbbing", 6.91]], null, null, null, null, null, null, null], "duration": [-0.2, 7.38, 3.24, 0.85, 0.61, 0.89, 2.65, 0.79, 0.54, 0.29, -0.05, 2.31, 0.38, 0.08, 0.43, 0.17, 10.69, 4.53, 1.06, 0.58, 0.13, 12.79, 0.8, 1.74, 5.98, 0.38, 1.06, 2.29, 0.31]} \ No newline at end of file diff --git a/annotations_1/LmK0bMGzHpU_filtered.json b/annotations_1/LmK0bMGzHpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7417d58bd3683572b7939ba2747ec203c7df4af --- /dev/null +++ b/annotations_1/LmK0bMGzHpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.3], [7.0, 48.27], [53.0, 57.5], [58.0, 58.8], [62.0, 72.93], [73.0, 74.44], [77.0, 78.11], [82.0, 86.19], [87.0, 88.2], [97.0, 102.24], [103.0, 104.89], [108.0, 111.54]], "keep_status": [true, false, true, false, true, false, false, true, false, true, false, false], "silence_prob": [47.94, 0.0, 32.54, 0.0, 38.0, 0.0, 0.0, 33.0, 0.0, 42.35, 0.0, 60.89], "audiomae_on_audioset": [[["music", 39.12], ["hum", 9.32], ["speech", 7.36]], null, [["mosquito", 26.57], ["music", 25.94], ["fly, housefly", 6.97]], null, [["speech", 22.32], ["hum", 13.33], ["buzz", 10.41]], null, null, [["fly, housefly", 29.54], ["insect", 11.38], ["mosquito", 8.87]], null, [["music", 43.1], ["hum", 12.55], ["mains hum", 7.78]], null, null], "duration": [2.3, 41.27, 4.5, 0.8, 10.93, 1.44, 1.11, 4.19, 1.2, 5.24, 1.89, 3.54]} \ No newline at end of file diff --git a/annotations_1/LmsnknGIx74_filtered.json b/annotations_1/LmsnknGIx74_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..091daf15ab25f016164f52a47d27658fdaf44954 --- /dev/null +++ b/annotations_1/LmsnknGIx74_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.17], [6.0, 6.13], [7.0, 8.13], [9.0, 8.95], [10.0, 10.15], [11.0, 12.16], [13.0, 19.13], [25.0, 28.54], [34.0, 38.96], [42.0, 54.73], [56.0, 62.94], [65.0, 64.72], [68.0, 68.18], [69.0, 69.82], [70.0, 76.59], [85.0, 86.17], [87.0, 89.8], [90.0, 90.75], [91.0, 99.47], [100.0, 102.12], [104.0, 113.9], [115.0, 121.53], [124.0, 124.46]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.98, 28.85, 28.77, 28.83, 28.76, 0.0, 0.0, 0.0, 29.46, 0.0, 28.91, 0.0, 28.83, 28.63, 28.79, 28.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 43.17], ["speech", 13.87], ["vehicle", 10.06]], [["music", 42.07], ["didgeridoo", 12.41], ["synthesizer", 9.14]], [["music", 50.51], ["vehicle", 14.39], ["car", 10.27]], [["music", 87.64], ["didgeridoo", 1.91], ["scratching (performance technique)", 0.82]], [["music", 70.76], ["dubstep", 5.33], ["synthesizer", 2.95]], null, null, null, [["music", 84.58], ["speech", 4.95], ["electronic music", 0.96]], null, [["music", 57.1], ["boing", 5.32], ["didgeridoo", 4.78]], null, [["music", 67.62], ["didgeridoo", 8.84], ["funk", 3.68]], [["music", 72.32], ["throbbing", 8.07], ["hum", 4.0]], [["music", 64.81], ["didgeridoo", 15.61], ["throbbing", 4.67]], [["music", 71.42], ["synthesizer", 2.51], ["electronic music", 2.35]], null], "duration": [1.17, 0.13, 1.13, -0.05, 0.15, 1.16, 6.13, 3.54, 4.96, 12.73, 6.94, -0.28, 0.18, 0.82, 6.59, 1.17, 2.8, 0.75, 8.47, 2.12, 9.9, 6.53, 0.46]} \ No newline at end of file diff --git a/annotations_1/Ln91UqmKxwI_filtered.json b/annotations_1/Ln91UqmKxwI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9d493e2fd38c096c0f55cdf08c15f537c4d5c9f --- /dev/null +++ b/annotations_1/Ln91UqmKxwI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 22.27], [24.0, 27.87], [31.0, 31.62], [33.0, 33.86], [36.0, 36.21], [37.0, 37.71], [40.0, 40.69], [43.0, 42.84], [44.0, 44.64], [53.0, 53.77], [55.0, 55.71], [59.0, 60.05], [62.0, 62.26], [64.0, 64.45], [65.0, 66.18], [67.0, 66.99], [67.0, 67.86], [72.0, 84.62], [88.0, 107.97], [108.0, 109.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [92.97, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.82, 30.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.6], ["whack, thwack", 10.56], ["smash, crash", 10.3]], [["music", 49.47], ["smash, crash", 8.03], ["buzz", 5.53]], null], "duration": [2.27, 3.87, 0.62, 0.86, 0.21, 0.71, 0.69, -0.16, 0.64, 0.77, 0.71, 1.05, 0.26, 0.45, 1.18, -0.01, 0.86, 12.62, 19.97, 1.32]} \ No newline at end of file diff --git a/annotations_1/LoBAmFanDhY_filtered.json b/annotations_1/LoBAmFanDhY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..636a3e4dff4a06191ba0af553bada96482c63e7f --- /dev/null +++ b/annotations_1/LoBAmFanDhY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 35.43], [37.0, 38.64], [41.0, 40.9], [44.0, 61.53], [64.0, 96.67], [99.0, 99.99], [101.0, 103.6], [104.0, 104.77]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 46.9, 0.0, 0.0, 97.64, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 43.51], ["music", 17.47], ["mains hum", 13.24]], null, null, null, null], "duration": [1.43, 1.64, -0.1, 17.53, 32.67, 0.99, 2.6, 0.77]} \ No newline at end of file diff --git a/annotations_1/LoCaeI5RffI_filtered.json b/annotations_1/LoCaeI5RffI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f26c7af79828b8507e7039daa33ae12b3c87d583 --- /dev/null +++ b/annotations_1/LoCaeI5RffI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 21.76], [23.0, 23.89], [32.0, 32.22], [33.0, 33.66], [39.0, 111.32], [112.0, 130.69], [131.0, 133.56], [135.0, 136.98], [138.0, 140.04], [143.0, 143.41], [158.0, 159.39], [161.0, 164.2], [165.0, 176.39], [177.0, 178.48], [180.0, 180.01], [190.0, 190.75], [191.0, 194.7], [196.0, 198.42], [200.0, 200.55]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.03, 0.0, 0.0, 0.0, 0.0, 76.04, 99.99, 0.0, 99.98, 0.0, 0.0, 100.0, 99.95, 0.0, 0.0, 0.0, 44.66, 98.99, 0.0], "audiomae_on_audioset": [[["speech", 20.22], ["music", 18.56], ["fly, housefly", 18.22]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.24], ["sidetone", 11.67], ["speech", 6.35]], null, null], "duration": [12.76, 0.89, 0.22, 0.66, 72.32, 18.69, 2.56, 1.98, 2.04, 0.41, 1.39, 3.2, 11.39, 1.48, 0.01, 0.75, 3.7, 2.42, 0.55]} \ No newline at end of file diff --git a/annotations_1/LoG_2u-0rWo_filtered.json b/annotations_1/LoG_2u-0rWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ff92c190f3a30e88a0262a9f2e9b2b28c8c48ed --- /dev/null +++ b/annotations_1/LoG_2u-0rWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.08], [2.0, 12.23], [18.0, 18.39], [19.0, 31.53], [33.0, 33.47], [37.0, 66.82], [72.0, 101.68], [103.0, 155.56], [160.0, 160.78], [164.0, 166.8], [169.0, 171.05]], "keep_status": [false, true, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 33.13, 0.0, 38.64, 0.0, 30.1, 30.54, 0.0, 0.0, 33.37, 45.3], "audiomae_on_audioset": [null, [["speech", 48.8], ["music", 12.55], ["didgeridoo", 8.0]], null, [["speech", 46.28], ["hum", 15.87], ["mains hum", 9.71]], null, [["music", 43.05], ["speech", 4.97], ["animal", 3.86]], [["music", 56.96], ["speech", 11.45], ["electronic music", 3.66]], null, null, [["thunk", 38.2], ["speech", 17.35], ["music", 13.77]], [["moo", 25.81], ["cattle, bovinae", 25.35], ["livestock, farm animals, working animals", 17.55]]], "duration": [1.08, 10.23, 0.39, 12.53, 0.47, 29.82, 29.68, 52.56, 0.78, 2.8, 2.05]} \ No newline at end of file diff --git a/annotations_1/LoRpJTD3HFY_filtered.json b/annotations_1/LoRpJTD3HFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..781b066a9b77ef05f51ac878955cd33bd595f7e5 --- /dev/null +++ b/annotations_1/LoRpJTD3HFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 36.59], [37.0, 48.95], [51.0, 87.47], [89.0, 135.18], [135.0, 161.52], [162.0, 164.25], [168.0, 169.16]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [29.71, 30.26, 0.0, 0.0, 29.67, 42.58, 0.0], "audiomae_on_audioset": [[["speech", 60.68], ["breaking", 8.3], ["music", 6.91]], [["throbbing", 32.44], ["hum", 19.78], ["music", 19.71]], null, null, [["music", 75.21], ["speech", 4.36], ["throbbing", 2.04]], [["hum", 21.21], ["throbbing", 9.51], ["noise", 8.5]], null], "duration": [19.59, 11.95, 36.47, 46.18, 26.52, 2.25, 1.16]} \ No newline at end of file diff --git a/annotations_1/LpDRf3h6OHw_filtered.json b/annotations_1/LpDRf3h6OHw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c5e1163d19e3e4a477b2dc7757da204f6cacbee --- /dev/null +++ b/annotations_1/LpDRf3h6OHw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.07], [10.0, 10.2], [12.0, 11.94], [12.0, 12.18], [13.0, 13.74], [15.0, 16.02], [17.0, 17.0], [19.0, 19.35], [23.0, 23.53], [26.0, 26.81], [28.0, 27.58], [31.0, 32.39], [36.0, 37.27], [53.0, 52.98], [55.0, 55.17], [58.0, 58.33], [64.0, 66.7], [67.0, 68.57], [71.0, 73.36], [76.0, 76.49], [82.0, 82.53], [144.0, 145.77], [148.0, 150.25], [152.0, 153.06], [153.0, 153.1], [153.0, 153.17], [153.0, 158.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [47.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.86, 0.0, 41.98, 0.0, 0.0, 0.0, 45.36, 0.0, 0.0, 0.0, 54.17], "audiomae_on_audioset": [[["whale vocalization", 42.39], ["speech", 20.02], ["rumble", 8.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 23.25], ["throbbing", 15.72], ["heart sounds, heartbeat", 14.79]], null, null, null, [["hum", 36.05], ["mains hum", 32.55], ["music", 5.17]], null, null, null, null], "duration": [3.07, 0.2, -0.06, 0.18, 0.74, 1.02, 0.0, 0.35, 0.53, 0.81, -0.42, 1.39, 1.27, -0.02, 0.17, 0.33, 2.7, 1.57, 2.36, 0.49, 0.53, 1.77, 2.25, 1.06, 0.1, 0.17, 5.28]} \ No newline at end of file diff --git a/annotations_1/Lr04AEabtnY_filtered.json b/annotations_1/Lr04AEabtnY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..654648fc1733258bab976df114d7775fd42bff15 --- /dev/null +++ b/annotations_1/Lr04AEabtnY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[59.0, 62.01]], "keep_status": [false], "silence_prob": [50.86], "audiomae_on_audioset": [null], "duration": [3.01]} \ No newline at end of file diff --git a/annotations_1/LrQqG7HxUao_filtered.json b/annotations_1/LrQqG7HxUao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a499d7593407d6f7ffa00f002cd3c782200ae968 --- /dev/null +++ b/annotations_1/LrQqG7HxUao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.59], [11.0, 11.01], [12.0, 13.09], [14.0, 14.27], [15.0, 15.43], [17.0, 22.37], [24.0, 24.49], [27.0, 26.81], [30.0, 30.75], [32.0, 33.24], [35.0, 35.65], [39.0, 39.11], [43.0, 43.21], [51.0, 66.12], [68.0, 69.62], [71.0, 72.5], [74.0, 77.11], [78.0, 78.73], [81.0, 82.05], [84.0, 90.22], [91.0, 91.39], [94.0, 94.56], [97.0, 97.66], [100.0, 103.98], [106.0, 107.1], [110.0, 115.57], [122.0, 127.85], [135.0, 140.54], [145.0, 160.32], [162.0, 163.07], [165.0, 166.11], [170.0, 170.82], [178.0, 186.16], [189.0, 190.09], [192.0, 198.95], [202.0, 202.2], [203.0, 207.69], [213.0, 215.6]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.58, 0.0, 0.0, 38.95, 0.0, 0.0, 37.32, 0.0, 0.0, 0.0, 36.38, 0.0, 33.52, 32.55, 34.29, 33.56, 0.0, 0.0, 0.0, 31.33, 0.0, 31.88, 0.0, 33.12, 31.32], "audiomae_on_audioset": [null, null, null, null, null, [["cattle, bovinae", 39.31], ["moo", 15.8], ["livestock, farm animals, working animals", 14.37]], null, null, null, null, null, null, null, [["music", 31.14], ["whale vocalization", 26.54], ["livestock, farm animals, working animals", 3.22]], null, null, [["music", 80.17], ["musical instrument", 2.21], ["singing", 1.75]], null, null, [["music", 75.03], ["lullaby", 1.85], ["singing", 1.56]], null, null, null, [["music", 79.13], ["singing", 2.09], ["guitar", 1.22]], null, [["music", 64.53], ["singing", 4.44], ["saxophone", 3.15]], [["music", 76.0], ["synthesizer", 1.93], ["reggae", 1.35]], [["music", 82.25], ["folk music", 1.5], ["singing", 1.43]], [["music", 83.83], ["soul music", 1.42], ["country", 1.2]], null, null, null, [["music", 81.32], ["yodeling", 2.01], ["musical instrument", 1.91]], null, [["music", 88.04], ["musical instrument", 1.07], ["didgeridoo", 0.93]], null, [["music", 69.46], ["synthesizer", 3.68], ["theremin", 3.48]], [["music", 78.28], ["musical instrument", 2.73], ["steel guitar, slide guitar", 2.71]]], "duration": [0.59, 0.01, 1.09, 0.27, 0.43, 5.37, 0.49, -0.19, 0.75, 1.24, 0.65, 0.11, 0.21, 15.12, 1.62, 1.5, 3.11, 0.73, 1.05, 6.22, 0.39, 0.56, 0.66, 3.98, 1.1, 5.57, 5.85, 5.54, 15.32, 1.07, 1.11, 0.82, 8.16, 1.09, 6.95, 0.2, 4.69, 2.6]} \ No newline at end of file diff --git a/annotations_1/LrsnIyCjvB8_filtered.json b/annotations_1/LrsnIyCjvB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ea52728a1abbeed0f0fbb35836938a59e310e6e --- /dev/null +++ b/annotations_1/LrsnIyCjvB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 17.76], [20.0, 20.17], [21.0, 22.64], [25.0, 25.42], [27.0, 27.43], [31.0, 32.29], [33.0, 33.35], [35.0, 36.1], [39.0, 42.97], [44.0, 53.72], [55.0, 55.56], [58.0, 58.6], [59.0, 64.71], [67.0, 69.57], [71.0, 72.01], [73.0, 73.8], [75.0, 76.17], [77.0, 79.89], [90.0, 90.86], [93.0, 94.49], [95.0, 97.92], [100.0, 104.21], [107.0, 110.47], [113.0, 115.08], [117.0, 117.17], [118.0, 117.85], [119.0, 119.31], [121.0, 124.29], [125.0, 127.75], [135.0, 136.68], [138.0, 142.2], [144.0, 156.95], [160.0, 159.9], [161.0, 163.22], [164.0, 164.46], [167.0, 166.97], [167.0, 168.96], [169.0, 171.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 93.76, 0.0, 0.0, 87.19, 99.95, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 99.99, 89.9, 89.54, 99.65, 0.0, 0.0, 0.0, 75.23, 34.21, 0.0, 37.92, 36.36, 0.0, 74.92, 0.0, 0.0, 0.0, 91.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.87], ["music", 2.5], ["hum", 1.84]], null, [["hum", 46.7], ["throbbing", 18.23], ["speech", 10.88]], [["hum", 40.59], ["throbbing", 26.12], ["speech", 10.43]], null, null, null, null, null, null], "duration": [6.76, 0.17, 1.64, 0.42, 0.43, 1.29, 0.35, 1.1, 3.97, 9.72, 0.56, 0.6, 5.71, 2.57, 1.01, 0.8, 1.17, 2.89, 0.86, 1.49, 2.92, 4.21, 3.47, 2.08, 0.17, -0.15, 0.31, 3.29, 2.75, 1.68, 4.2, 12.95, -0.1, 2.22, 0.46, -0.03, 1.96, 2.26]} \ No newline at end of file diff --git a/annotations_1/LszhBmIWjeE_filtered.json b/annotations_1/LszhBmIWjeE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbac4bf8503a77509dde02ce5c281f85247298b2 --- /dev/null +++ b/annotations_1/LszhBmIWjeE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.74], [8.0, 10.32], [11.0, 12.06], [14.0, 15.28], [20.0, 20.6], [22.0, 22.74], [23.0, 24.44], [25.0, 25.89], [27.0, 27.24], [27.0, 28.29], [30.0, 31.31], [39.0, 39.46], [43.0, 49.25], [50.0, 51.46], [52.0, 56.0], [57.0, 59.14], [64.0, 67.44], [80.0, 81.26], [82.0, 81.73], [82.0, 82.81], [84.0, 85.08], [86.0, 86.43], [91.0, 93.19], [94.0, 96.06], [104.0, 107.7], [108.0, 113.04], [125.0, 125.54], [130.0, 130.96], [137.0, 137.56], [139.0, 140.75], [147.0, 148.14], [158.0, 158.35], [159.0, 160.15], [170.0, 170.51], [172.0, 172.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 75.07, 44.66, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.89, 99.82, 99.97, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["busy signal", 13.18], ["speech", 8.38], ["singing bowl", 6.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 2.32, 1.06, 1.28, 0.6, 0.74, 1.44, 0.89, 0.24, 1.29, 1.31, 0.46, 6.25, 1.46, 4.0, 2.14, 3.44, 1.26, -0.27, 0.81, 1.08, 0.43, 2.19, 2.06, 3.7, 5.04, 0.54, 0.96, 0.56, 1.75, 1.14, 0.35, 1.15, 0.51, 0.34]} \ No newline at end of file diff --git a/annotations_1/LtFw6_YJiFs_filtered.json b/annotations_1/LtFw6_YJiFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a60b4bf81cb281a055204168a3fd34d41ea3638 --- /dev/null +++ b/annotations_1/LtFw6_YJiFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.17], [9.0, 24.71], [30.0, 31.87], [34.0, 39.01], [40.0, 40.73], [42.0, 59.49], [62.0, 65.8], [68.0, 70.53], [73.0, 101.92], [105.0, 108.55], [110.0, 111.74], [116.0, 120.34], [123.0, 124.41], [127.0, 142.72], [145.0, 145.22], [146.0, 145.76], [148.0, 150.5], [153.0, 177.79], [178.0, 178.56], [186.0, 188.25], [191.0, 197.53], [201.0, 203.08], [205.0, 209.43], [211.0, 224.16], [225.0, 229.64]], "keep_status": [false, false, false, true, false, true, true, true, false, true, false, true, false, true, false, false, true, false, false, true, true, false, true, false, true], "silence_prob": [0.0, 34.34, 0.0, 30.93, 0.0, 34.38, 34.48, 29.65, 30.8, 32.29, 0.0, 32.66, 0.0, 32.9, 0.0, 0.0, 34.29, 30.91, 0.0, 30.24, 30.36, 31.33, 30.78, 29.5, 29.95], "audiomae_on_audioset": [null, [["hum", 52.22], ["mains hum", 31.98], ["throbbing", 5.69]], null, [["music", 42.44], ["hum", 8.44], ["throbbing", 7.94]], null, [["hum", 30.35], ["music", 29.01], ["mains hum", 7.52]], [["speech", 37.05], ["hum", 16.4], ["mains hum", 13.23]], [["music", 18.76], ["hum", 15.19], ["mains hum", 7.7]], [["hum", 41.64], ["mains hum", 30.07], ["speech", 7.73]], [["speech", 40.8], ["music", 22.56], ["vehicle", 4.29]], null, [["hum", 22.62], ["music", 20.21], ["speech", 18.54]], null, [["speech", 32.25], ["music", 11.71], ["fly, housefly", 8.72]], null, null, [["whale vocalization", 14.57], ["music", 11.82], ["theremin", 10.17]], [["music", 33.06], ["hum", 29.11], ["throbbing", 11.51]], null, [["music", 44.48], ["speech", 15.49], ["cacophony", 3.48]], [["music", 37.28], ["speech", 27.0], ["electronic music", 3.06]], [["speech", 37.65], ["music", 28.54], ["sidetone", 4.93]], [["buzz", 23.66], ["insect", 12.64], ["fly, housefly", 9.61]], [["buzz", 78.67], ["music", 6.32], ["speech", 3.09]], [["buzz", 27.72], ["music", 9.65], ["hum", 7.54]]], "duration": [1.17, 15.71, 1.87, 5.01, 0.73, 17.49, 3.8, 2.53, 28.92, 3.55, 1.74, 4.34, 1.41, 15.72, 0.22, -0.24, 2.5, 24.79, 0.56, 2.25, 6.53, 2.08, 4.43, 13.16, 4.64]} \ No newline at end of file diff --git a/annotations_1/Lurs1FzrSio_filtered.json b/annotations_1/Lurs1FzrSio_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1329e7be2137fd08de5f01740ed4ed323b2df293 --- /dev/null +++ b/annotations_1/Lurs1FzrSio_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.54], [27.0, 29.37], [32.0, 33.94], [37.0, 49.23], [52.0, 53.01], [56.0, 55.78], [56.0, 60.71], [63.0, 63.0], [65.0, 64.83], [69.0, 68.76], [69.0, 70.88], [72.0, 75.2], [76.0, 78.73], [79.0, 80.72], [81.0, 83.94], [84.0, 87.57], [88.0, 89.56], [91.0, 91.83], [101.0, 104.41], [104.0, 105.34], [107.0, 107.47], [120.0, 120.6], [122.0, 124.02], [127.0, 131.55], [135.0, 135.46], [144.0, 145.57], [151.0, 152.2], [155.0, 155.61], [168.0, 182.33], [184.0, 188.11], [188.0, 189.43], [191.0, 199.54], [201.0, 201.63], [207.0, 208.14], [209.0, 225.53]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [29.79, 33.19, 0.0, 28.74, 0.0, 0.0, 28.86, 0.0, 0.0, 0.0, 0.0, 50.71, 48.61, 0.0, 41.38, 51.82, 0.0, 0.0, 31.85, 0.0, 0.0, 0.0, 28.58, 29.6, 0.0, 0.0, 0.0, 0.0, 44.46, 60.7, 0.0, 56.78, 0.0, 0.0, 31.22], "audiomae_on_audioset": [[["cattle, bovinae", 16.03], ["moo", 13.35], ["fly, housefly", 11.02]], [["music", 26.36], ["hum", 17.58], ["mains hum", 9.27]], null, [["music", 42.67], ["sound effect", 4.22], ["cacophony", 3.68]], null, null, [["speech", 37.96], ["machine gun", 35.34], ["music", 10.95]], null, null, null, null, null, [["music", 35.08], ["grunt", 8.56], ["roar", 7.03]], null, [["music", 25.57], ["hum", 24.33], ["throbbing", 18.3]], null, null, null, [["music", 44.28], ["speech", 31.87], ["thunk", 2.98]], null, null, null, [["sound effect", 17.86], ["static", 14.11], ["burst, pop", 5.25]], [["speech", 32.16], ["music", 28.74], ["machine gun", 21.68]], null, null, null, null, [["hum", 27.21], ["music", 15.98], ["mains hum", 14.04]], null, null, null, null, null, [["music", 36.82], ["throbbing", 25.45], ["hum", 12.01]]], "duration": [3.54, 2.37, 1.94, 12.23, 1.01, -0.22, 4.71, 0.0, -0.17, -0.24, 1.88, 3.2, 2.73, 1.72, 2.94, 3.57, 1.56, 0.83, 3.41, 1.34, 0.47, 0.6, 2.02, 4.55, 0.46, 1.57, 1.2, 0.61, 14.33, 4.11, 1.43, 8.54, 0.63, 1.14, 16.53]} \ No newline at end of file diff --git a/annotations_1/Lv41GcKWfJg_filtered.json b/annotations_1/Lv41GcKWfJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09812325964fae348739183c7b4ee1b4d234b534 --- /dev/null +++ b/annotations_1/Lv41GcKWfJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.93], [4.0, 6.44], [9.0, 10.98], [15.0, 15.11], [15.0, 15.87], [17.0, 18.27], [24.0, 26.33], [27.0, 29.67], [39.0, 39.26], [45.0, 46.23], [49.0, 54.77], [56.0, 64.88], [67.0, 68.34], [72.0, 73.94], [101.0, 103.35], [132.0, 133.49], [135.0, 135.38], [136.0, 141.03], [141.0, 143.45], [145.0, 148.31], [148.0, 151.07], [158.0, 161.67]], "keep_status": [false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 42.46, 0.0, 0.0, 0.0, 0.0, 46.4, 36.88, 0.0, 0.0, 81.17, 72.16, 0.0, 0.0, 74.92, 0.0, 0.0, 98.1, 48.91, 91.81, 35.94, 94.52], "audiomae_on_audioset": [null, [["fly, housefly", 20.05], ["insect", 18.45], ["hum", 16.86]], null, null, null, null, [["music", 22.51], ["hum", 9.4], ["creak", 5.03]], [["music", 33.03], ["hum", 10.63], ["speech", 10.49]], null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 31.53], ["speech", 21.57], ["insect", 18.38]], null, [["chink, clink", 17.99], ["breaking", 13.8], ["glass", 10.6]], null], "duration": [1.93, 2.44, 1.98, 0.11, 0.87, 1.27, 2.33, 2.67, 0.26, 1.23, 5.77, 8.88, 1.34, 1.94, 2.35, 1.49, 0.38, 5.03, 2.45, 3.31, 3.07, 3.67]} \ No newline at end of file diff --git a/annotations_1/Lw5Ss6z8IoM_filtered.json b/annotations_1/Lw5Ss6z8IoM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de5608c9ddeecb196308f4c7fa978383a24b37c2 --- /dev/null +++ b/annotations_1/Lw5Ss6z8IoM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.58], [6.0, 6.39], [7.0, 8.55], [9.0, 9.98], [14.0, 13.54], [15.0, 16.02], [18.0, 17.96], [22.0, 22.57], [24.0, 25.42], [27.0, 27.45], [30.0, 30.72], [32.0, 33.72], [35.0, 37.29], [41.0, 40.69], [43.0, 48.44], [49.0, 54.46], [56.0, 56.78], [58.0, 59.59], [61.0, 61.08], [65.0, 65.72], [68.0, 67.85], [69.0, 69.99], [71.0, 71.0], [72.0, 75.29], [77.0, 76.99], [80.0, 80.45], [83.0, 83.67], [87.0, 88.13], [89.0, 90.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.45, 0.0, 49.97, 43.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.6, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.81], ["musical instrument", 11.45], ["harp", 10.71]], [["music", 37.63], ["speech", 14.99], ["guitar", 11.61]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.58, 0.39, 1.55, 0.98, -0.46, 1.02, -0.04, 0.57, 1.42, 0.45, 0.72, 1.72, 2.29, -0.31, 5.44, 5.46, 0.78, 1.59, 0.08, 0.72, -0.15, 0.99, 0.0, 3.29, -0.01, 0.45, 0.67, 1.13, 1.64]} \ No newline at end of file diff --git a/annotations_1/LwSsrFFa2Wc_filtered.json b/annotations_1/LwSsrFFa2Wc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f658a048614b4661948230d0e233c0c400aa2ed9 --- /dev/null +++ b/annotations_1/LwSsrFFa2Wc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.78], [13.0, 14.08], [19.0, 19.5], [22.0, 22.72], [25.0, 24.93], [26.0, 26.35], [29.0, 29.29], [30.0, 30.5], [33.0, 33.45], [37.0, 48.71], [57.0, 57.52], [58.0, 59.21], [62.0, 62.6], [63.0, 63.41], [64.0, 65.57], [69.0, 70.58], [72.0, 72.98], [75.0, 75.93], [77.0, 77.75], [81.0, 83.91], [85.0, 89.45], [90.0, 90.69], [106.0, 106.32], [107.0, 108.14], [111.0, 118.37], [127.0, 134.57], [139.0, 144.59], [150.0, 169.77], [170.0, 170.23], [170.0, 170.43], [172.0, 175.86]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.93, 40.34, 0.0, 0.0, 0.0, 30.3, 30.27, 29.23, 28.61, 0.0, 0.0, 30.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 33.74], ["mains hum", 16.9], ["hum", 15.89]], null, null, null, null, null, null, null, null, null, [["theremin", 60.16], ["music", 17.88], ["speech", 12.19]], [["speech", 34.85], ["music", 33.22], ["sidetone", 6.79]], null, null, null, [["music", 45.7], ["hum", 14.41], ["throbbing", 13.59]], [["hum", 32.6], ["music", 28.41], ["mains hum", 11.86]], [["music", 39.72], ["electronic music", 10.77], ["vehicle", 7.83]], [["music", 66.77], ["electronic music", 4.17], ["siren", 1.98]], null, null, [["speech", 38.97], ["music", 21.57], ["musical instrument", 6.09]]], "duration": [0.78, 1.08, 0.5, 0.72, -0.07, 0.35, 0.29, 0.5, 0.45, 11.71, 0.52, 1.21, 0.6, 0.41, 1.57, 1.58, 0.98, 0.93, 0.75, 2.91, 4.45, 0.69, 0.32, 1.14, 7.37, 7.57, 5.59, 19.77, 0.23, 0.43, 3.86]} \ No newline at end of file diff --git a/annotations_1/LxAebgxJHyg_filtered.json b/annotations_1/LxAebgxJHyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/LxAebgxJHyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/LyGXFcfRyAQ_filtered.json b/annotations_1/LyGXFcfRyAQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f01fa5374d10b0e088935345fc297e5c82c8aee9 --- /dev/null +++ b/annotations_1/LyGXFcfRyAQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.99], [8.0, 45.49], [47.0, 123.48]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [-0.01, 37.49, 76.48]} \ No newline at end of file diff --git a/annotations_1/LzJ1fo-oUpk_filtered.json b/annotations_1/LzJ1fo-oUpk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab1af75b84ac428afb96085236e97d242e85b136 --- /dev/null +++ b/annotations_1/LzJ1fo-oUpk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.71], [17.0, 18.33], [19.0, 23.26], [24.0, 26.05], [28.0, 28.85], [31.0, 31.63], [34.0, 34.43], [35.0, 35.68], [48.0, 47.88], [53.0, 54.82], [65.0, 65.74], [72.0, 73.06], [84.0, 86.76], [95.0, 95.13], [101.0, 102.12], [103.0, 103.1], [107.0, 107.59], [112.0, 112.45], [124.0, 123.96], [125.0, 127.28], [128.0, 128.95], [132.0, 133.57], [137.0, 141.13], [142.0, 148.69], [160.0, 160.12], [165.0, 169.2], [171.0, 176.57], [182.0, 188.05], [195.0, 196.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 38.88, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 99.52, 36.65, 0.0, 75.88, 36.24, 42.26, 0.0], "audiomae_on_audioset": [null, null, [["music", 38.2], ["speech", 29.34], ["thunk", 10.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cowbell", 40.14], ["animal", 21.68], ["horse", 8.91]], null, null, [["music", 57.51], ["fart", 3.31], ["snicker", 3.1]], [["music", 35.0], ["speech", 17.86], ["groan", 7.29]], null], "duration": [1.71, 1.33, 4.26, 2.05, 0.85, 0.63, 0.43, 0.68, -0.12, 1.82, 0.74, 1.06, 2.76, 0.13, 1.12, 0.1, 0.59, 0.45, -0.04, 2.28, 0.95, 1.57, 4.13, 6.69, 0.12, 4.2, 5.57, 6.05, 1.86]} \ No newline at end of file diff --git a/annotations_1/M06KzvYxlsc_filtered.json b/annotations_1/M06KzvYxlsc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af5d2da0e0d0d1b4d9b1e5175ee7d5b081cbf468 --- /dev/null +++ b/annotations_1/M06KzvYxlsc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.29], [6.0, 10.07], [12.0, 12.11], [18.0, 18.05], [19.0, 28.7], [31.0, 38.84], [40.0, 40.22], [43.0, 44.07], [45.0, 59.07], [62.0, 66.72], [71.0, 77.3], [78.0, 78.14], [79.0, 78.68], [80.0, 93.19], [94.0, 122.74], [126.0, 156.95], [160.0, 165.43], [167.0, 171.58], [173.0, 198.58], [201.0, 201.83], [204.0, 206.91], [209.0, 210.52], [211.0, 210.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.36, 0.0, 0.0, 31.15, 33.05, 0.0, 0.0, 30.71, 35.18, 37.0, 0.0, 0.0, 37.71, 31.97, 0.0, 33.63, 40.29, 36.75, 0.0, 51.23, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 54.64], ["throbbing", 11.62], ["hum", 8.05]], [["music", 57.61], ["hum", 10.32], ["mains hum", 5.45]], null, null, [["music", 32.11], ["hum", 21.94], ["throbbing", 17.43]], [["mains hum", 37.64], ["hum", 33.6], ["speech", 10.43]], [["didgeridoo", 26.06], ["music", 25.66], ["noise", 15.46]], null, null, [["music", 27.73], ["hum", 17.75], ["noise", 14.31]], [["hum", 38.99], ["throbbing", 19.96], ["music", 18.63]], null, [["hum", 37.84], ["mains hum", 24.67], ["music", 18.65]], [["hum", 33.14], ["mains hum", 25.77], ["throbbing", 18.27]], [["music", 39.06], ["hum", 20.97], ["throbbing", 13.05]], null, null, null, null], "duration": [0.29, 4.07, 0.11, 0.05, 9.7, 7.84, 0.22, 1.07, 14.07, 4.72, 6.3, 0.14, -0.32, 13.19, 28.74, 30.95, 5.43, 4.58, 25.58, 0.83, 2.91, 1.52, -0.14]} \ No newline at end of file diff --git a/annotations_1/M0iif-dNJus_filtered.json b/annotations_1/M0iif-dNJus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb5ae32c0c7e36ca51aa8a1ca09a7fdc528c7962 --- /dev/null +++ b/annotations_1/M0iif-dNJus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.81], [9.0, 20.53], [22.0, 22.32], [23.0, 23.89], [26.0, 31.19], [32.0, 32.36], [33.0, 33.91], [35.0, 39.04], [42.0, 60.25], [62.0, 67.44], [69.0, 71.56], [79.0, 79.79], [83.0, 83.64], [86.0, 87.59], [90.0, 90.54], [96.0, 97.06], [99.0, 99.27], [101.0, 103.05], [106.0, 106.69], [107.0, 108.45], [111.0, 111.79], [114.0, 115.18], [118.0, 119.06], [128.0, 128.16], [130.0, 134.4], [137.0, 137.0], [137.0, 140.8], [143.0, 144.76], [147.0, 149.01], [153.0, 159.56], [161.0, 162.92], [164.0, 165.35], [166.0, 170.83]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 31.93, 0.0, 0.0, 30.85, 0.0, 0.0, 29.11, 29.42, 30.32, 34.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.55, 0.0, 64.75, 0.0, 70.3, 47.62, 0.0, 0.0, 68.15], "audiomae_on_audioset": [null, [["music", 67.62], ["synthesizer", 5.19], ["musical instrument", 3.84]], null, null, [["music", 31.46], ["cattle, bovinae", 10.59], ["buzz", 7.78]], null, null, [["music", 63.08], ["brass instrument", 5.53], ["trombone", 3.82]], [["music", 49.32], ["speech", 12.92], ["hum", 10.96]], [["music", 62.28], ["throbbing", 6.32], ["electronic music", 6.11]], [["music", 60.66], ["electronic music", 8.94], ["ambient music", 7.98]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.76], ["speech", 18.88], ["hum", 6.62]], null, null, null], "duration": [-0.19, 11.53, 0.32, 0.89, 5.19, 0.36, 0.91, 4.04, 18.25, 5.44, 2.56, 0.79, 0.64, 1.59, 0.54, 1.06, 0.27, 2.05, 0.69, 1.45, 0.79, 1.18, 1.06, 0.16, 4.4, 0.0, 3.8, 1.76, 2.01, 6.56, 1.92, 1.35, 4.83]} \ No newline at end of file diff --git a/annotations_1/M16l8dqWTuI_filtered.json b/annotations_1/M16l8dqWTuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6297e1c81a4317e71f0dadf5d0f5fd4a595e5330 --- /dev/null +++ b/annotations_1/M16l8dqWTuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 13.71], [15.0, 16.01], [17.0, 17.39], [18.0, 20.48], [22.0, 22.38], [25.0, 24.95], [26.0, 26.06], [26.0, 27.31], [29.0, 31.48], [32.0, 33.39], [34.0, 37.07], [38.0, 42.11], [43.0, 43.6], [45.0, 49.37], [50.0, 52.19], [53.0, 54.45], [55.0, 61.03], [62.0, 66.53], [68.0, 70.87], [72.0, 74.55], [75.0, 75.61], [77.0, 77.87], [80.0, 83.34], [87.0, 88.23], [90.0, 95.44], [98.0, 107.81], [109.0, 111.13], [117.0, 120.53], [122.0, 126.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true], "silence_prob": [58.72, 0.0, 0.0, 88.83, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 80.64, 99.84, 0.0, 100.0, 98.36, 0.0, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 98.73, 0.0, 88.64, 48.23, 43.74, 34.09, 46.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 17.37], ["speech", 13.92], ["thunk", 13.72]], [["music", 32.84], ["hum", 15.75], ["mains hum", 13.14]], [["speech", 13.44], ["music", 11.46], ["throbbing", 9.09]], [["music", 25.44], ["hum", 16.1], ["throbbing", 8.04]]], "duration": [10.71, 1.01, 0.39, 2.48, 0.38, -0.05, 0.06, 1.31, 2.48, 1.39, 3.07, 4.11, 0.6, 4.37, 2.19, 1.45, 6.03, 4.53, 2.87, 2.55, 0.61, 0.87, 3.34, 1.23, 5.44, 9.81, 2.13, 3.53, 4.67]} \ No newline at end of file diff --git a/annotations_1/M1hXX6aq1wA_filtered.json b/annotations_1/M1hXX6aq1wA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..610b772ee90e50280c169ba3dd21bf35126d7eb3 --- /dev/null +++ b/annotations_1/M1hXX6aq1wA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.68], [5.0, 5.63], [9.0, 22.62], [24.0, 27.84], [38.0, 37.84], [66.0, 66.66], [106.0, 105.8], [114.0, 118.69], [123.0, 124.09], [125.0, 126.57], [127.0, 129.66], [130.0, 130.91], [135.0, 135.99], [137.0, 138.52], [140.0, 144.15], [148.0, 156.47], [157.0, 158.75], [159.0, 164.12], [165.0, 166.46], [167.0, 167.39], [170.0, 172.91], [174.0, 176.57]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 66.63, 32.54, 0.0, 0.0, 0.0, 32.09, 0.0, 0.0, 81.89, 0.0, 0.0, 0.0, 100.0, 99.95, 0.0, 99.8, 0.0, 0.0, 99.92, 99.9], "audiomae_on_audioset": [null, null, null, [["music", 52.62], ["speech", 13.58], ["musical instrument", 2.56]], null, null, null, [["music", 32.68], ["whale vocalization", 17.13], ["theremin", 16.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 0.63, 13.62, 3.84, -0.16, 0.66, -0.2, 4.69, 1.09, 1.57, 2.66, 0.91, 0.99, 1.52, 4.15, 8.47, 1.75, 5.12, 1.46, 0.39, 2.91, 2.57]} \ No newline at end of file diff --git a/annotations_1/M2E0xzfvDMw_filtered.json b/annotations_1/M2E0xzfvDMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51a839baa1d24375949818d2e9f1a59c32785d5c --- /dev/null +++ b/annotations_1/M2E0xzfvDMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.97], [9.0, 9.56], [13.0, 18.28], [22.0, 23.25], [31.0, 35.28], [39.0, 53.13], [56.0, 57.01], [60.0, 89.11], [93.0, 94.46], [98.0, 106.07], [109.0, 112.95], [115.0, 116.13], [126.0, 126.3], [127.0, 127.9], [128.0, 131.84]], "keep_status": [true, false, true, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [40.14, 0.0, 33.4, 0.0, 32.72, 29.82, 0.0, 29.73, 0.0, 33.79, 37.15, 0.0, 0.0, 0.0, 29.98], "audiomae_on_audioset": [[["music", 26.94], ["thunk", 17.23], ["livestock, farm animals, working animals", 7.55]], null, [["whale vocalization", 28.31], ["fart", 18.44], ["noise", 14.75]], null, [["speech", 78.93], ["music", 7.0], ["grunt", 2.29]], [["speech", 88.66], ["music", 6.47], ["sound effect", 0.59]], null, [["music", 30.09], ["hum", 14.68], ["throbbing", 14.56]], null, [["hum", 48.05], ["speech", 18.53], ["throbbing", 12.55]], [["hum", 25.13], ["music", 15.77], ["mains hum", 15.31]], null, null, null, [["speech", 48.49], ["music", 18.44], ["boing", 4.19]]], "duration": [3.97, 0.56, 5.28, 1.25, 4.28, 14.13, 1.01, 29.11, 1.46, 8.07, 3.95, 1.13, 0.3, 0.9, 3.84]} \ No newline at end of file diff --git a/annotations_1/M3FtlKHZXhs_filtered.json b/annotations_1/M3FtlKHZXhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe3a585b22970a5be4fa4cf988f858e41001e69e --- /dev/null +++ b/annotations_1/M3FtlKHZXhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.42], [12.0, 13.68], [14.0, 20.43], [21.0, 23.67], [27.0, 27.13], [32.0, 33.0], [36.0, 36.41], [43.0, 43.24], [45.0, 44.64], [45.0, 47.46], [49.0, 49.76], [54.0, 55.97], [60.0, 68.5]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 98.59, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 34.17, 0.0, 0.0, 66.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["sine wave", 27.68], ["animal", 26.78], ["chirp tone", 8.82]], null, null, null], "duration": [1.42, 1.68, 6.43, 2.67, 0.13, 1.0, 0.41, 0.24, -0.36, 2.46, 0.76, 1.97, 8.5]} \ No newline at end of file diff --git a/annotations_1/M3Jts1DPcWk_filtered.json b/annotations_1/M3Jts1DPcWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b3e60fc67c46924515cbf1c468911b76ebd855b --- /dev/null +++ b/annotations_1/M3Jts1DPcWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.35], [6.0, 6.34], [8.0, 8.09], [16.0, 16.93], [18.0, 18.42], [19.0, 19.67], [25.0, 25.02], [33.0, 58.06], [60.0, 71.74], [74.0, 120.68]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.31, 31.84, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 42.51], ["music", 16.32], ["thump, thud", 10.16]], [["music", 70.12], ["musical instrument", 3.9], ["hum", 2.36]], null], "duration": [1.35, 0.34, 0.09, 0.93, 0.42, 0.67, 0.02, 25.06, 11.74, 46.68]} \ No newline at end of file diff --git a/annotations_1/M47Aq3yj_NQ_filtered.json b/annotations_1/M47Aq3yj_NQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6100f79a87fe4f0883ac88436e75c04c7dbb5626 --- /dev/null +++ b/annotations_1/M47Aq3yj_NQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 22.4], [26.0, 29.15], [35.0, 36.22], [39.0, 38.92], [45.0, 45.87], [48.0, 49.06], [50.0, 52.05], [53.0, 56.05], [56.0, 58.29], [62.0, 63.02], [70.0, 70.7], [76.0, 77.62], [83.0, 85.46], [87.0, 90.24], [92.0, 94.44], [95.0, 96.45], [98.0, 106.47], [108.0, 109.88], [111.0, 111.89], [118.0, 119.33]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [47.43, 50.97, 0.0, 0.0, 0.0, 0.0, 40.19, 41.6, 47.12, 0.0, 0.0, 0.0, 44.87, 41.66, 42.72, 0.0, 29.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 23.59], ["hum", 23.51], ["mains hum", 20.25]], null, null, null, null, null, [["music", 46.56], ["carnatic music", 26.82], ["musical instrument", 4.63]], [["music", 38.2], ["speech", 4.55], ["musical instrument", 4.28]], [["music", 71.66], ["musical instrument", 2.47], ["didgeridoo", 2.22]], null, null, null, [["music", 25.39], ["speech", 13.61], ["synthesizer", 6.71]], [["music", 44.12], ["piano", 6.5], ["keyboard (musical)", 6.04]], [["music", 45.3], ["ambient music", 11.91], ["keyboard (musical)", 6.65]], null, [["music", 80.77], ["musical instrument", 1.4], ["singing", 1.38]], null, null, null], "duration": [19.4, 3.15, 1.22, -0.08, 0.87, 1.06, 2.05, 3.05, 2.29, 1.02, 0.7, 1.62, 2.46, 3.24, 2.44, 1.45, 8.47, 1.88, 0.89, 1.33]} \ No newline at end of file diff --git a/annotations_1/M4LidfkbW68_filtered.json b/annotations_1/M4LidfkbW68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54aee3fa484710dd913d35d53c5a8b7a3c9bf393 --- /dev/null +++ b/annotations_1/M4LidfkbW68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 34.35], [36.0, 36.22], [40.0, 69.08], [73.0, 119.53], [121.0, 122.45], [126.0, 133.57], [135.0, 135.62], [136.0, 162.06], [162.0, 169.87], [171.0, 171.66], [178.0, 179.46]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.26, 0.0, 30.04, 0.0, 0.0, 32.52, 0.0, 31.8, 31.62, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.75], ["musical instrument", 7.0], ["effects unit", 6.53]], null, [["music", 52.66], ["brass instrument", 11.31], ["trombone", 7.03]], null, null, [["music", 39.09], ["theremin", 34.78], ["musical instrument", 3.92]], null, [["music", 54.39], ["brass instrument", 10.85], ["musical instrument", 10.03]], [["music", 47.11], ["brass instrument", 20.84], ["french horn", 11.36]], null, null], "duration": [8.35, 0.22, 29.08, 46.53, 1.45, 7.57, 0.62, 26.06, 7.87, 0.66, 1.46]} \ No newline at end of file diff --git a/annotations_1/M4YOZHoDSyg_filtered.json b/annotations_1/M4YOZHoDSyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e786c11029061fe28ec74a0d3c274d61e4ca9c3 --- /dev/null +++ b/annotations_1/M4YOZHoDSyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.01], [15.0, 15.18], [17.0, 17.37], [19.0, 19.21], [23.0, 23.03], [45.0, 46.9], [48.0, 48.52], [52.0, 52.83], [59.0, 59.85], [61.0, 61.7], [62.0, 63.12], [64.0, 64.47], [65.0, 66.53], [67.0, 100.87], [104.0, 111.32]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [35.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.01], "audiomae_on_audioset": [[["music", 56.33], ["speech", 6.7], ["gong", 4.02]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.03], ["speech", 21.41], ["hum", 4.49]]], "duration": [10.01, 0.18, 0.37, 0.21, 0.03, 1.9, 0.52, 0.83, 0.85, 0.7, 1.12, 0.47, 1.53, 33.87, 7.32]} \ No newline at end of file diff --git a/annotations_1/M4fuweiQQCA_filtered.json b/annotations_1/M4fuweiQQCA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0496b6fbf938ac7ef67963ba976d9d6593f075bd --- /dev/null +++ b/annotations_1/M4fuweiQQCA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.81], [10.0, 15.69], [23.0, 26.2], [32.0, 39.58], [42.0, 42.26], [45.0, 54.41], [58.0, 66.02], [70.0, 95.93], [97.0, 106.0], [107.0, 108.33], [110.0, 110.73], [115.0, 118.94], [120.0, 122.32], [125.0, 126.13], [129.0, 130.96]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.79, 31.28, 29.9, 0.0, 30.11, 29.81, 30.04, 37.19, 0.0, 0.0, 53.4, 48.56, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 75.61], ["didgeridoo", 8.75], ["theremin", 2.6]], [["music", 57.36], ["throbbing", 16.74], ["electronic music", 5.57]], [["music", 42.25], ["hum", 14.84], ["mains hum", 10.64]], null, [["music", 50.23], ["didgeridoo", 21.77], ["speech", 4.04]], [["speech", 36.24], ["sidetone", 24.54], ["music", 20.47]], [["groan", 26.06], ["grunt", 10.71], ["animal", 10.65]], [["music", 44.11], ["speech", 25.45], ["hum", 5.63]], null, null, null, [["music", 71.02], ["musical instrument", 5.93], ["didgeridoo", 4.64]], null, null], "duration": [1.81, 5.69, 3.2, 7.58, 0.26, 9.41, 8.02, 25.93, 9.0, 1.33, 0.73, 3.94, 2.32, 1.13, 1.96]} \ No newline at end of file diff --git a/annotations_1/M5DZzTtbV1g_filtered.json b/annotations_1/M5DZzTtbV1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6cd3843c37902c71bc5e153f8952c28ba3a85c5 --- /dev/null +++ b/annotations_1/M5DZzTtbV1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.94], [5.0, 6.0], [8.0, 10.2], [17.0, 17.09], [18.0, 18.3], [34.0, 34.5], [36.0, 38.26], [40.0, 40.59], [41.0, 46.99], [52.0, 52.47], [53.0, 53.35], [58.0, 59.7], [63.0, 64.12], [65.0, 65.94], [68.0, 70.6], [81.0, 80.97], [90.0, 90.17], [110.0, 112.06], [113.0, 113.04], [122.0, 122.81], [126.0, 129.3], [130.0, 130.89], [132.0, 133.07], [141.0, 141.61]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 33.6, 0.0, 0.0, 0.0, 40.36, 0.0, 32.38, 0.0, 0.0, 0.0, 0.0, 0.0, 38.2, 0.0, 0.0, 33.08, 0.0, 0.0, 34.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.0], ["speech", 8.61], ["electronic music", 6.39]], null, null, null, [["music", 55.99], ["musical instrument", 5.19], ["guitar", 5.0]], null, [["music", 36.21], ["speech", 8.43], ["drum machine", 5.97]], null, null, null, null, null, [["music", 71.34], ["musical instrument", 6.61], ["theremin", 3.19]], null, null, [["snicker", 23.14], ["chuckle, chortle", 15.36], ["baby laughter", 12.68]], null, null, [["boing", 38.79], ["music", 13.3], ["animal", 4.57]], null, null, null], "duration": [0.94, 1.0, 2.2, 0.09, 0.3, 0.5, 2.26, 0.59, 5.99, 0.47, 0.35, 1.7, 1.12, 0.94, 2.6, -0.03, 0.17, 2.06, 0.04, 0.81, 3.3, 0.89, 1.07, 0.61]} \ No newline at end of file diff --git a/annotations_1/M5ny5tMsxrs_filtered.json b/annotations_1/M5ny5tMsxrs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2807074ddcbf0b4d662a12bb3ddfe3cb6a850d7 --- /dev/null +++ b/annotations_1/M5ny5tMsxrs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.93], [10.0, 12.38], [17.0, 19.18], [27.0, 28.12], [31.0, 31.9], [35.0, 37.77], [49.0, 50.48], [57.0, 59.31], [62.0, 63.44], [66.0, 68.07], [69.0, 69.62], [75.0, 78.33], [82.0, 82.65], [85.0, 90.24], [93.0, 93.58], [100.0, 106.64], [111.0, 115.6]], "keep_status": [false, false, true, false, false, true, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.93, 42.88, 0.0, 0.0, 42.3, 0.0, 34.6, 0.0, 33.83, 0.0, 37.19, 0.0, 29.68, 0.0, 30.0, 30.12], "audiomae_on_audioset": [null, null, [["music", 46.18], ["theremin", 7.07], ["synthesizer", 5.21]], null, null, [["music", 30.56], ["singing bowl", 18.62], ["didgeridoo", 10.67]], null, [["music", 36.75], ["theremin", 18.08], ["didgeridoo", 11.95]], null, [["music", 24.71], ["fly, housefly", 7.44], ["speech", 6.86]], null, [["music", 67.98], ["ambient music", 6.51], ["synthesizer", 4.3]], null, [["music", 66.54], ["singing", 2.32], ["electronic music", 2.27]], null, [["music", 69.97], ["rock and roll", 3.87], ["roll", 1.73]], [["music", 87.89], ["rock and roll", 1.44], ["roll", 0.9]]], "duration": [1.93, 2.38, 2.18, 1.12, 0.9, 2.77, 1.48, 2.31, 1.44, 2.07, 0.62, 3.33, 0.65, 5.24, 0.58, 6.64, 4.6]} \ No newline at end of file diff --git a/annotations_1/M7CL4l-bu68_filtered.json b/annotations_1/M7CL4l-bu68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ef8ba8af562837a8912a5b1a000996ae3961a4f --- /dev/null +++ b/annotations_1/M7CL4l-bu68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.91], [4.0, 4.63], [17.0, 18.35], [19.0, 18.72], [22.0, 25.46], [28.0, 30.59], [36.0, 37.22], [46.0, 46.5], [51.0, 51.09], [59.0, 59.58], [64.0, 63.9], [67.0, 67.46], [69.0, 69.11], [73.0, 73.16], [75.0, 76.2], [78.0, 78.6], [80.0, 81.21], [82.0, 88.45], [89.0, 90.02], [112.0, 112.62], [115.0, 120.51], [121.0, 123.06], [125.0, 125.39], [126.0, 127.14], [129.0, 132.07], [133.0, 136.32], [140.0, 140.54], [142.0, 143.97], [147.0, 147.83], [150.0, 151.44], [152.0, 152.22], [153.0, 153.86], [154.0, 156.15], [157.0, 157.86], [159.0, 159.83], [161.0, 162.14], [162.0, 166.14], [172.0, 175.51], [176.0, 175.81], [177.0, 177.65], [184.0, 186.14], [188.0, 188.45], [197.0, 197.48], [199.0, 200.7], [201.0, 201.83], [203.0, 204.06]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.86, 40.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.8, 0.0, 0.0, 41.83, 46.83, 0.0, 0.0, 60.51, 60.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 58.13, 64.75, 0.0, 0.0, 90.95, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["noise", 14.19], ["radio", 9.89], ["effects unit", 6.8]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.78], ["music", 12.32], ["boing", 3.71]], null, null, [["music", 42.05], ["speech", 22.84], ["frog", 3.01]], [["music", 53.04], ["speech", 15.92], ["musical instrument", 3.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.09, 0.63, 1.35, -0.28, 3.46, 2.59, 1.22, 0.5, 0.09, 0.58, -0.1, 0.46, 0.11, 0.16, 1.2, 0.6, 1.21, 6.45, 1.02, 0.62, 5.51, 2.06, 0.39, 1.14, 3.07, 3.32, 0.54, 1.97, 0.83, 1.44, 0.22, 0.86, 2.15, 0.86, 0.83, 1.14, 4.14, 3.51, -0.19, 0.65, 2.14, 0.45, 0.48, 1.7, 0.83, 1.06]} \ No newline at end of file diff --git a/annotations_1/M8yhM7zXdSI_filtered.json b/annotations_1/M8yhM7zXdSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3a787121c7c8b79621e0152e3351faee8c4dad9 --- /dev/null +++ b/annotations_1/M8yhM7zXdSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.92], [6.0, 6.44], [10.0, 10.83], [12.0, 16.58], [21.0, 22.08], [23.0, 28.58], [29.0, 30.96], [34.0, 37.83], [40.0, 40.71], [41.0, 41.45], [50.0, 50.68], [52.0, 51.83], [54.0, 55.31], [57.0, 75.91], [77.0, 103.86], [106.0, 109.31], [113.0, 112.99], [115.0, 118.52], [121.0, 120.7], [125.0, 125.47], [133.0, 134.6], [135.0, 141.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 41.64, 0.0, 95.78, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 28.38, 28.41, 32.37, 0.0, 41.64, 0.0, 0.0, 0.0, 45.59], "audiomae_on_audioset": [null, null, null, [["speech", 49.57], ["hum", 19.61], ["mains hum", 3.7]], null, null, null, null, null, null, null, null, null, [["hum", 38.51], ["throbbing", 28.08], ["music", 13.48]], [["hum", 36.1], ["music", 26.69], ["mains hum", 14.03]], [["hum", 48.67], ["throbbing", 16.2], ["mains hum", 15.78]], null, [["speech", 69.25], ["fart", 3.3], ["beatboxing", 2.63]], null, null, null, [["speech", 33.08], ["hum", 13.04], ["mains hum", 12.02]]], "duration": [1.92, 0.44, 0.83, 4.58, 1.08, 5.58, 1.96, 3.83, 0.71, 0.45, 0.68, -0.17, 1.31, 18.91, 26.86, 3.31, -0.01, 3.52, -0.3, 0.47, 1.6, 6.39]} \ No newline at end of file diff --git a/annotations_1/M93XQJPV51c_filtered.json b/annotations_1/M93XQJPV51c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6a9cbcf1ad975f55c0c4cd14da4e09380293ee3 --- /dev/null +++ b/annotations_1/M93XQJPV51c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.52], [7.0, 8.5], [11.0, 11.85], [27.0, 26.99], [33.0, 35.31], [39.0, 43.16], [44.0, 47.41], [48.0, 49.65], [55.0, 55.07], [56.0, 58.31], [60.0, 60.37], [62.0, 63.0], [63.0, 64.05], [69.0, 75.22], [147.0, 148.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.51, 98.93, 97.54, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 49.45, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 61.65], ["musical instrument", 9.54], ["synthesizer", 5.12]], null, null, null, null, null, null, null, null, [["music", 43.56], ["speech", 27.89], ["grunt", 5.1]], null], "duration": [0.52, 1.5, 0.85, -0.01, 2.31, 4.16, 3.41, 1.65, 0.07, 2.31, 0.37, 1.0, 1.05, 6.22, 1.27]} \ No newline at end of file diff --git a/annotations_1/M9CgWWkwvdw_filtered.json b/annotations_1/M9CgWWkwvdw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e3eb079942dcbc712ddf5b22efb6525fced320d --- /dev/null +++ b/annotations_1/M9CgWWkwvdw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.73], [12.0, 12.63], [13.0, 15.57], [17.0, 17.69], [21.0, 21.64], [52.0, 51.85], [53.0, 53.2], [55.0, 54.89], [65.0, 65.65], [71.0, 71.37], [76.0, 75.74], [78.0, 78.19], [81.0, 81.46], [90.0, 90.93], [95.0, 96.13], [97.0, 97.51], [100.0, 100.75], [109.0, 109.54], [123.0, 122.99], [125.0, 126.37], [132.0, 147.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.3], ["livestock, farm animals, working animals", 15.28], ["throbbing", 7.26]]], "duration": [0.73, 0.63, 2.57, 0.69, 0.64, -0.15, 0.2, -0.11, 0.65, 0.37, -0.26, 0.19, 0.46, 0.93, 1.13, 0.51, 0.75, 0.54, -0.01, 1.37, 15.72]} \ No newline at end of file diff --git a/annotations_1/M9FAInQwCm0_filtered.json b/annotations_1/M9FAInQwCm0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..970b0981dc40067f62597a19e0501b95894e0d55 --- /dev/null +++ b/annotations_1/M9FAInQwCm0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.16], [12.0, 13.31], [16.0, 17.09], [18.0, 19.89], [21.0, 27.23], [28.0, 31.33], [33.0, 36.68], [37.0, 42.65], [44.0, 49.13], [51.0, 51.07], [54.0, 56.42], [58.0, 65.82], [67.0, 69.21], [70.0, 71.29], [72.0, 87.15], [90.0, 93.18], [96.0, 98.22], [101.0, 101.93], [107.0, 108.97], [114.0, 116.16], [119.0, 120.68], [122.0, 128.22], [129.0, 131.16], [132.0, 134.99], [138.0, 141.35], [146.0, 146.65]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 81.17, 97.92, 99.99, 42.39, 75.39, 0.0, 98.73, 96.77, 68.67, 0.0, 87.74, 99.44, 99.71, 0.0, 0.0, 78.72, 0.0, 99.84, 99.62, 75.07, 75.39, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 39.83], ["music", 15.23], ["fart", 10.23]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 1.31, 1.09, 1.89, 6.23, 3.33, 3.68, 5.65, 5.13, 0.07, 2.42, 7.82, 2.21, 1.29, 15.15, 3.18, 2.22, 0.93, 1.97, 2.16, 1.68, 6.22, 2.16, 2.99, 3.35, 0.65]} \ No newline at end of file diff --git a/annotations_1/MAi6B_AFhH8_filtered.json b/annotations_1/MAi6B_AFhH8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7a440b3cd32c3ac2d33e6a33cf6ada95b0801ca --- /dev/null +++ b/annotations_1/MAi6B_AFhH8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.96], [8.0, 9.39], [10.0, 11.13], [16.0, 16.53], [22.0, 22.35], [25.0, 26.43], [27.0, 27.84], [28.0, 29.49], [30.0, 30.45], [31.0, 32.09], [32.0, 34.37], [35.0, 37.84], [39.0, 44.71], [48.0, 49.3], [53.0, 53.22], [59.0, 69.69], [75.0, 78.85], [82.0, 85.99], [90.0, 90.59], [91.0, 92.87], [100.0, 101.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, true, true, false, false, false], "silence_prob": [46.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.43, 56.1, 39.34, 0.0, 0.0, 34.28, 43.43, 43.13, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 64.77], ["musical instrument", 14.49], ["guitar", 11.62]], null, null, null, null, null, null, null, null, null, [["speech", 21.53], ["creak", 17.08], ["radio", 12.56]], null, [["music", 40.64], ["speech", 10.71], ["guitar", 9.2]], null, null, [["music", 37.61], ["guitar", 14.17], ["bass guitar", 8.29]], [["music", 46.71], ["guitar", 11.63], ["bass guitar", 10.38]], [["music", 12.42], ["plucked string instrument", 9.37], ["guitar", 8.33]], null, null, null], "duration": [3.96, 1.39, 1.13, 0.53, 0.35, 1.43, 0.84, 1.49, 0.45, 1.09, 2.37, 2.84, 5.71, 1.3, 0.22, 10.69, 3.85, 3.99, 0.59, 1.87, 1.02]} \ No newline at end of file diff --git a/annotations_1/MBNiDwytFow_filtered.json b/annotations_1/MBNiDwytFow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7ac10bc473eaf8e77f222ef495e493947783aad --- /dev/null +++ b/annotations_1/MBNiDwytFow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [5.0, 6.22], [9.0, 8.85], [18.0, 18.42], [22.0, 22.91], [24.0, 26.3], [27.0, 28.21], [29.0, 29.64], [31.0, 31.36], [32.0, 32.91], [34.0, 35.38], [39.0, 40.81], [42.0, 49.35], [55.0, 58.62], [59.0, 59.16], [60.0, 69.94], [78.0, 89.97], [105.0, 105.71], [110.0, 113.26], [115.0, 115.84], [118.0, 119.77], [120.0, 122.05], [127.0, 132.14], [133.0, 137.34], [141.0, 142.47], [144.0, 146.1], [148.0, 148.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 100.0, 0.0, 47.12, 47.94, 0.0, 72.6, 0.0, 0.0, 88.64, 100.0, 100.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.3], ["speech", 20.18], ["beatboxing", 13.43]], [["cattle, bovinae", 20.33], ["livestock, farm animals, working animals", 14.53], ["moo", 9.84]], null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 1.22, -0.15, 0.42, 0.91, 2.3, 1.21, 0.64, 0.36, 0.91, 1.38, 1.81, 7.35, 3.62, 0.16, 9.94, 11.97, 0.71, 3.26, 0.84, 1.77, 2.05, 5.14, 4.34, 1.47, 2.1, 0.83]} \ No newline at end of file diff --git a/annotations_1/MBSxl8y36zg_filtered.json b/annotations_1/MBSxl8y36zg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05891cb401e3b8d55c9beb62c1afcd2ee6144de0 --- /dev/null +++ b/annotations_1/MBSxl8y36zg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.48], [8.0, 14.17], [19.0, 21.64], [24.0, 23.67], [25.0, 24.83], [31.0, 34.92], [36.0, 38.79], [40.0, 46.18], [48.0, 54.19], [57.0, 60.39], [61.0, 62.58], [70.0, 71.36], [73.0, 73.41], [80.0, 87.91], [89.0, 92.08], [93.0, 94.49], [95.0, 95.64], [98.0, 100.38], [101.0, 102.9], [104.0, 106.05], [110.0, 113.61], [115.0, 117.41], [120.0, 121.59], [123.0, 125.29], [128.0, 130.06], [132.0, 133.32], [140.0, 142.96], [144.0, 145.07], [150.0, 151.48], [153.0, 154.2]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 61.77, 53.72, 0.0, 0.0, 48.56, 56.78, 50.71, 53.91, 55.39, 0.0, 0.0, 0.0, 45.24, 45.27, 0.0, 0.0, 43.51, 0.0, 52.98, 58.72, 59.86, 0.0, 53.22, 42.58, 0.0, 60.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 25.69], ["music", 15.06], ["rumble", 6.63]], null, null, null, null, null, null, null, [["hum", 26.46], ["music", 19.34], ["throbbing", 8.23]], [["speech", 39.01], ["hum", 16.52], ["whale vocalization", 5.84]], null, null, [["music", 35.16], ["whale vocalization", 11.95], ["hum", 8.46]], null, null, null, null, null, null, [["speech", 44.94], ["music", 17.04], ["hum", 6.14]], null, null, null, null, null], "duration": [1.48, 6.17, 2.64, -0.33, -0.17, 3.92, 2.79, 6.18, 6.19, 3.39, 1.58, 1.36, 0.41, 7.91, 3.08, 1.49, 0.64, 2.38, 1.9, 2.05, 3.61, 2.41, 1.59, 2.29, 2.06, 1.32, 2.96, 1.07, 1.48, 1.2]} \ No newline at end of file diff --git a/annotations_1/MBeBFVoomg8_filtered.json b/annotations_1/MBeBFVoomg8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c36828180dc4c2297159830b38453701f8b596d --- /dev/null +++ b/annotations_1/MBeBFVoomg8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 25.46], [27.0, 27.43], [28.0, 28.78], [33.0, 34.06], [36.0, 53.25], [62.0, 62.29], [68.0, 68.5], [70.0, 70.95], [78.0, 81.55], [84.0, 85.89], [98.0, 101.61], [103.0, 132.53], [134.0, 155.09], [155.0, 156.78], [158.0, 158.25], [158.0, 159.09], [160.0, 161.22]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [34.37, 0.0, 0.0, 0.0, 31.84, 0.0, 0.0, 0.0, 34.89, 0.0, 66.63, 31.39, 29.82, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 35.22], ["hum", 23.55], ["music", 23.22]], null, null, null, [["music", 50.78], ["throbbing", 12.07], ["electronic music", 4.07]], null, null, null, [["explosion", 31.05], ["speech", 26.06], ["gunshot, gunfire", 8.58]], null, null, [["music", 80.22], ["animal", 6.68], ["musical instrument", 2.45]], [["speech", 24.91], ["music", 21.96], ["buzz", 10.64]], null, null, null, null], "duration": [6.46, 0.43, 0.78, 1.06, 17.25, 0.29, 0.5, 0.95, 3.55, 1.89, 3.61, 29.53, 21.09, 1.78, 0.25, 1.09, 1.22]} \ No newline at end of file diff --git a/annotations_1/MBgPSe_p1fk_filtered.json b/annotations_1/MBgPSe_p1fk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a01fbed66c4de6b093951f41929a11c332afa2b --- /dev/null +++ b/annotations_1/MBgPSe_p1fk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.42], [15.0, 22.72], [26.0, 37.2], [41.0, 41.88], [42.0, 44.63], [47.0, 46.68], [49.0, 51.68], [59.0, 61.38], [62.0, 97.56], [102.0, 115.16]], "keep_status": [false, false, true, false, true, false, true, true, false, true], "silence_prob": [40.43, 38.59, 30.43, 0.0, 30.01, 0.0, 31.44, 35.55, 0.0, 49.92], "audiomae_on_audioset": [[["speech", 58.26], ["music", 15.35], ["synthesizer", 4.98]], [["music", 69.15], ["synthesizer", 4.97], ["electronic music", 3.39]], [["music", 25.95], ["hum", 7.16], ["groan", 5.72]], null, [["civil defense siren", 23.36], ["speech", 13.57], ["music", 11.48]], null, [["music", 31.47], ["didgeridoo", 18.54], ["speech", 13.44]], [["fart", 44.89], ["music", 6.08], ["didgeridoo", 5.5]], null, [["music", 58.33], ["hum", 5.3], ["mains hum", 3.77]]], "duration": [3.42, 7.72, 11.2, 0.88, 2.63, -0.32, 2.68, 2.38, 35.56, 13.16]} \ No newline at end of file diff --git a/annotations_1/MBqT-UEySlI_filtered.json b/annotations_1/MBqT-UEySlI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a4ec4c4cb7473d5c662f71f8276a4238a2d3920 --- /dev/null +++ b/annotations_1/MBqT-UEySlI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 48.54], [51.0, 135.6], [137.0, 138.5], [141.0, 142.59], [144.0, 145.66], [147.0, 148.91], [150.0, 152.49], [155.0, 156.1]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [65.79, 0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [6.54, 84.6, 1.5, 1.59, 1.66, 1.91, 2.49, 1.1]} \ No newline at end of file diff --git a/annotations_1/MDG6JsXqaRA_filtered.json b/annotations_1/MDG6JsXqaRA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/MDG6JsXqaRA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/MFN2fMP05CI_filtered.json b/annotations_1/MFN2fMP05CI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76fd88988eb77e6ffdc988381ef284dd1968af35 --- /dev/null +++ b/annotations_1/MFN2fMP05CI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 26.32], [27.0, 28.75], [29.0, 31.56], [32.0, 33.05], [35.0, 35.8], [36.0, 37.99], [42.0, 45.15], [50.0, 50.35], [51.0, 51.48], [52.0, 56.66], [58.0, 67.19], [68.0, 70.56], [71.0, 83.49], [85.0, 101.75], [105.0, 112.92], [114.0, 118.13], [119.0, 121.39], [122.0, 123.92]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false], "silence_prob": [32.24, 0.0, 37.9, 0.0, 0.0, 0.0, 42.42, 0.0, 0.0, 39.47, 30.04, 31.35, 29.96, 35.69, 34.16, 40.57, 41.01, 0.0], "audiomae_on_audioset": [[["hum", 39.97], ["throbbing", 22.21], ["music", 10.03]], null, [["hum", 27.82], ["mains hum", 11.69], ["throbbing", 10.89]], null, null, null, [["moo", 30.05], ["cattle, bovinae", 26.44], ["livestock, farm animals, working animals", 14.79]], null, null, [["speech", 60.67], ["hum", 8.29], ["didgeridoo", 4.39]], [["speech", 75.13], ["music", 7.15], ["didgeridoo", 3.9]], [["hum", 50.94], ["throbbing", 23.43], ["mains hum", 7.45]], [["hum", 24.82], ["speech", 22.17], ["whale vocalization", 10.13]], [["hum", 22.2], ["frog", 10.09], ["mains hum", 8.59]], [["hum", 34.86], ["throbbing", 33.99], ["mains hum", 8.21]], [["hum", 39.51], ["throbbing", 20.82], ["mains hum", 18.51]], [["hum", 26.97], ["music", 16.35], ["mains hum", 9.29]], null], "duration": [17.32, 1.75, 2.56, 1.05, 0.8, 1.99, 3.15, 0.35, 0.48, 4.66, 9.19, 2.56, 12.49, 16.75, 7.92, 4.13, 2.39, 1.92]} \ No newline at end of file diff --git a/annotations_1/MF_RlYTOmco_filtered.json b/annotations_1/MF_RlYTOmco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b2b53ac6c2414ce07a51b709c0c1ed070a75987 --- /dev/null +++ b/annotations_1/MF_RlYTOmco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.1], [3.0, 3.01], [4.0, 4.56], [10.0, 10.98], [15.0, 15.8], [17.0, 18.5], [22.0, 24.07], [25.0, 25.44], [26.0, 27.84], [32.0, 32.24], [33.0, 33.52], [34.0, 34.82], [36.0, 36.56], [40.0, 43.65], [44.0, 44.74], [49.0, 51.0], [53.0, 53.43], [54.0, 54.77], [60.0, 65.55], [67.0, 68.25], [74.0, 74.87], [78.0, 81.48], [82.0, 82.58], [84.0, 84.92], [86.0, 86.81], [90.0, 93.46], [94.0, 95.96], [96.0, 96.85], [98.0, 98.78], [99.0, 101.76], [102.0, 103.05], [104.0, 107.05], [112.0, 115.62], [123.0, 123.62], [124.0, 125.1], [126.0, 127.11], [128.0, 129.95], [132.0, 133.2], [134.0, 134.54], [141.0, 141.67], [144.0, 144.75], [146.0, 146.91], [150.0, 150.11], [151.0, 152.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 57.01, 0.0, 0.0, 0.0, 77.36, 0.0, 0.0, 0.0, 41.42, 0.0, 95.37, 77.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 54.94], ["chirp tone", 16.47], ["sine wave", 13.22]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.1, 0.01, 0.56, 0.98, 0.8, 1.5, 2.07, 0.44, 1.84, 0.24, 0.52, 0.82, 0.56, 3.65, 0.74, 2.0, 0.43, 0.77, 5.55, 1.25, 0.87, 3.48, 0.58, 0.92, 0.81, 3.46, 1.96, 0.85, 0.78, 2.76, 1.05, 3.05, 3.62, 0.62, 1.1, 1.11, 1.95, 1.2, 0.54, 0.67, 0.75, 0.91, 0.11, 1.71]} \ No newline at end of file diff --git a/annotations_1/MFmLZibi7DE_filtered.json b/annotations_1/MFmLZibi7DE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1fb5fa9eff4b4746b58216eee081e16f690ea69f --- /dev/null +++ b/annotations_1/MFmLZibi7DE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.82], [18.0, 20.58], [22.0, 73.21], [74.0, 75.29], [76.0, 79.71], [80.0, 81.11], [82.0, 93.02], [93.0, 94.93], [98.0, 100.62], [102.0, 106.81], [107.0, 107.59], [108.0, 110.91], [112.0, 115.45], [116.0, 119.67], [120.0, 120.65], [121.0, 123.08], [125.0, 129.91], [133.0, 133.68], [137.0, 136.95], [137.0, 141.39], [142.0, 146.99], [148.0, 149.91], [151.0, 154.04], [155.0, 156.24], [157.0, 158.52], [162.0, 166.51], [172.0, 174.77]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 29.18, 0.0, 0.0, 58.89, 0.0, 53.16, 0.0, 69.47, 78.55, 0.0, 86.09, 99.52, 46.36, 0.0, 95.37, 96.17, 0.0, 0.0, 62.89, 47.31, 0.0, 67.76, 0.0, 0.0, 99.31, 99.98], "audiomae_on_audioset": [null, [["vehicle", 17.67], ["eruption", 13.77], ["explosion", 9.02]], null, null, null, null, null, null, null, null, null, null, null, [["radio", 14.8], ["speech", 11.64], ["noise", 9.36]], null, null, null, null, null, null, [["speech", 39.46], ["radio", 14.01], ["frog", 4.44]], null, null, null, null, null, null], "duration": [0.82, 2.58, 51.21, 1.29, 3.71, 1.11, 11.02, 1.93, 2.62, 4.81, 0.59, 2.91, 3.45, 3.67, 0.65, 2.08, 4.91, 0.68, -0.05, 4.39, 4.99, 1.91, 3.04, 1.24, 1.52, 4.51, 2.77]} \ No newline at end of file diff --git a/annotations_1/MGBHNeYbsbg_filtered.json b/annotations_1/MGBHNeYbsbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e9d6ab7368f3d38ca3f893e968afbe3b4da4909 --- /dev/null +++ b/annotations_1/MGBHNeYbsbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 26.42], [28.0, 28.63], [32.0, 32.22], [44.0, 44.52], [45.0, 47.7], [66.0, 68.34], [71.0, 70.95], [73.0, 72.72], [79.0, 79.79], [84.0, 84.33], [84.0, 84.77], [89.0, 96.6], [109.0, 130.67], [134.0, 134.0], [134.0, 134.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.88, 0.0, 0.0, 0.0, 47.9, 51.94, 0.0, 0.0, 0.0, 0.0, 0.0, 35.94, 33.19, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 30.48], ["music", 23.44], ["didgeridoo", 18.81]], null, null, null, [["music", 55.28], ["electric shaver, electric razor", 10.12], ["speech", 7.03]], null, null, null, null, null, null, [["music", 38.47], ["didgeridoo", 28.3], ["whimper", 6.12]], [["music", 48.71], ["theremin", 21.52], ["didgeridoo", 3.37]], null, null], "duration": [25.42, 0.63, 0.22, 0.52, 2.7, 2.34, -0.05, -0.28, 0.79, 0.33, 0.77, 7.6, 21.67, 0.0, 0.2]} \ No newline at end of file diff --git a/annotations_1/MGGGksL1ziM_filtered.json b/annotations_1/MGGGksL1ziM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..971ad6d894ccf183a9f289778786b7915eb3a9da --- /dev/null +++ b/annotations_1/MGGGksL1ziM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.4], [7.0, 8.56], [11.0, 12.45], [14.0, 14.27], [16.0, 16.06], [18.0, 19.67], [21.0, 21.76], [23.0, 27.53], [30.0, 30.96], [31.0, 33.39], [37.0, 41.35], [97.0, 104.11], [105.0, 106.68], [107.0, 107.94], [109.0, 109.58], [110.0, 110.73], [112.0, 116.02], [117.0, 125.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 70.58, 89.36, 97.73, 0.0, 0.0, 0.0, 0.0, 99.31, 98.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.4, 1.56, 1.45, 0.27, 0.06, 1.67, 0.76, 4.53, 0.96, 2.39, 4.35, 7.11, 1.68, 0.94, 0.58, 0.73, 4.02, 8.44]} \ No newline at end of file diff --git a/annotations_1/MGIjofJUXyo_filtered.json b/annotations_1/MGIjofJUXyo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcaf7e9ec08ff481d692c6d7d843df62865fc780 --- /dev/null +++ b/annotations_1/MGIjofJUXyo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 40.8], [44.0, 90.68], [92.0, 117.93], [120.0, 127.08], [129.0, 129.86]], "keep_status": [true, false, false, true, false], "silence_prob": [29.18, 0.0, 29.59, 30.09, 0.0], "audiomae_on_audioset": [[["music", 50.83], ["electronic music", 6.93], ["throbbing", 5.48]], null, [["music", 58.8], ["throbbing", 9.57], ["electronic music", 5.82]], [["music", 24.52], ["moo", 12.38], ["livestock, farm animals, working animals", 10.8]], null], "duration": [20.8, 46.68, 25.93, 7.08, 0.86]} \ No newline at end of file diff --git a/annotations_1/MGJlq-gjQj8_filtered.json b/annotations_1/MGJlq-gjQj8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e7fd2e50c9d314babfb6ba196a69ac59275a9e8 --- /dev/null +++ b/annotations_1/MGJlq-gjQj8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.6], [8.0, 29.1], [34.0, 36.78], [39.0, 50.97], [59.0, 61.13], [62.0, 63.02], [68.0, 69.35], [70.0, 72.27], [75.0, 79.96], [86.0, 88.35], [91.0, 135.84], [136.0, 148.83], [154.0, 155.41], [157.0, 157.74], [164.0, 164.69], [166.0, 175.95], [177.0, 177.43], [179.0, 179.56], [194.0, 202.14], [204.0, 204.89], [207.0, 218.91], [221.0, 223.77], [225.0, 228.14], [229.0, 229.29]], "keep_status": [true, false, true, true, false, false, false, true, true, true, false, true, false, false, false, true, false, false, true, false, false, true, false, false], "silence_prob": [30.32, 31.57, 46.26, 31.77, 42.86, 0.0, 0.0, 35.3, 31.85, 32.47, 0.0, 31.8, 0.0, 0.0, 0.0, 32.09, 0.0, 0.0, 33.34, 0.0, 35.89, 49.64, 56.48, 0.0], "audiomae_on_audioset": [[["music", 23.02], ["whale vocalization", 16.28], ["livestock, farm animals, working animals", 9.98]], [["speech", 39.11], ["music", 27.36], ["beatboxing", 9.06]], [["music", 50.58], ["synthesizer", 8.07], ["theremin", 5.89]], [["music", 49.53], ["hum", 10.15], ["mains hum", 4.06]], [["music", 57.06], ["synthesizer", 11.57], ["musical instrument", 2.62]], null, null, [["throbbing", 29.87], ["hum", 14.8], ["cattle, bovinae", 8.43]], [["music", 21.98], ["speech", 17.71], ["hum", 8.21]], [["music", 24.06], ["speech", 21.52], ["electric shaver, electric razor", 6.17]], null, [["speech", 41.42], ["music", 21.45], ["hum", 6.1]], null, null, null, [["speech", 34.18], ["music", 19.46], ["noise", 7.52]], null, null, [["music", 50.23], ["throbbing", 6.65], ["theremin", 5.2]], null, [["speech", 50.28], ["music", 17.43], ["fart", 4.99]], [["throbbing", 28.82], ["music", 28.04], ["hum", 12.55]], null, null], "duration": [2.6, 21.1, 2.78, 11.97, 2.13, 1.02, 1.35, 2.27, 4.96, 2.35, 44.84, 12.83, 1.41, 0.74, 0.69, 9.95, 0.43, 0.56, 8.14, 0.89, 11.91, 2.77, 3.14, 0.29]} \ No newline at end of file diff --git a/annotations_1/MGRJhDyY9ls_filtered.json b/annotations_1/MGRJhDyY9ls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..deba03231343a4248166b1b33bb8ef04571c711a --- /dev/null +++ b/annotations_1/MGRJhDyY9ls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.08], [26.0, 27.26], [32.0, 102.81], [103.0, 102.84], [103.0, 103.38], [103.0, 103.42], [110.0, 109.65], [110.0, 113.41], [117.0, 117.59], [119.0, 121.9], [126.0, 129.12], [130.0, 130.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 0.0, 99.65, 63.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.08, 1.26, 70.81, -0.16, 0.38, 0.42, -0.35, 3.41, 0.59, 2.9, 3.12, 0.98]} \ No newline at end of file diff --git a/annotations_1/MHPp7bN1kXI_filtered.json b/annotations_1/MHPp7bN1kXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8dbdbe07691a1eabf66eff24e20342582472b23c --- /dev/null +++ b/annotations_1/MHPp7bN1kXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.11], [6.0, 6.07], [7.0, 8.75], [12.0, 20.58], [21.0, 21.73], [22.0, 25.17], [26.0, 27.03], [32.0, 33.07], [36.0, 36.9], [38.0, 38.75], [40.0, 40.27], [41.0, 40.86], [43.0, 44.46], [47.0, 48.9], [50.0, 50.72], [71.0, 71.58], [82.0, 85.16], [90.0, 103.35], [108.0, 109.65], [110.0, 110.42], [111.0, 111.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 72.01, 0.0, 52.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.69, 30.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 86.63], ["electronic music", 1.8], ["house music", 1.73]], [["music", 88.57], ["swing music", 3.9], ["funny music", 1.65]], null, null, null], "duration": [0.11, 0.07, 1.75, 8.58, 0.73, 3.17, 1.03, 1.07, 0.9, 0.75, 0.27, -0.14, 1.46, 1.9, 0.72, 0.58, 3.16, 13.35, 1.65, 0.42, 0.7]} \ No newline at end of file diff --git a/annotations_1/MIZSWO65BXQ_filtered.json b/annotations_1/MIZSWO65BXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c8abb6fbd8db72c15d47eede9ffa66c6216344a --- /dev/null +++ b/annotations_1/MIZSWO65BXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.81], [13.0, 12.99], [27.0, 28.83], [30.0, 31.36], [41.0, 42.63], [45.0, 45.3], [46.0, 46.41], [53.0, 54.01], [55.0, 55.66], [60.0, 60.94], [73.0, 73.06], [75.0, 75.51], [92.0, 93.77], [98.0, 98.83], [101.0, 102.05], [106.0, 106.19], [109.0, 109.29], [120.0, 119.64], [126.0, 126.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, -0.01, 1.83, 1.36, 1.63, 0.3, 0.41, 1.01, 0.66, 0.94, 0.06, 0.51, 1.77, 0.83, 1.05, 0.19, 0.29, -0.36, 0.35]} \ No newline at end of file diff --git a/annotations_1/MLCZ_B7FKc8_filtered.json b/annotations_1/MLCZ_B7FKc8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2ba35ff77597f7947e2297d659705ba03845a90 --- /dev/null +++ b/annotations_1/MLCZ_B7FKc8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 44.44], [46.0, 46.72], [54.0, 54.9], [77.0, 78.7], [80.0, 91.44], [94.0, 98.04]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.0, 30.66], "audiomae_on_audioset": [null, null, null, null, [["music", 57.98], ["theremin", 8.81], ["speech", 3.36]], [["music", 76.39], ["synthesizer", 5.47], ["ambient music", 4.6]]], "duration": [1.44, 0.72, 0.9, 1.7, 11.44, 4.04]} \ No newline at end of file diff --git a/annotations_1/MLaMV6zQND4_filtered.json b/annotations_1/MLaMV6zQND4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f94a07bc5cefdb212cc719272348d570c8eefb8 --- /dev/null +++ b/annotations_1/MLaMV6zQND4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [9.0, 8.95], [18.0, 18.89], [25.0, 25.47], [27.0, 27.3], [34.0, 35.63], [48.0, 47.78], [62.0, 62.41], [64.0, 64.89], [66.0, 67.93], [69.0, 72.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.04, -0.05, 0.89, 0.47, 0.3, 1.63, -0.22, 0.41, 0.89, 1.93, 3.42]} \ No newline at end of file diff --git a/annotations_1/MM1no56lIjw_filtered.json b/annotations_1/MM1no56lIjw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6180786a897d09a16c16516abb7a676b2d9e7ea7 --- /dev/null +++ b/annotations_1/MM1no56lIjw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [6.0, 6.24], [7.0, 8.01], [10.0, 11.3], [12.0, 12.95], [14.0, 14.17], [17.0, 19.13], [20.0, 21.96], [23.0, 23.26], [25.0, 25.07], [26.0, 26.6], [30.0, 31.5], [33.0, 34.33], [36.0, 37.13], [51.0, 51.66], [54.0, 54.55], [57.0, 58.13], [60.0, 65.65], [72.0, 75.39], [78.0, 79.35], [81.0, 84.62], [85.0, 86.73], [87.0, 88.5], [93.0, 93.92], [99.0, 100.87], [104.0, 105.33], [107.0, 112.48], [114.0, 115.3], [117.0, 118.2], [122.0, 122.07], [124.0, 131.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.08, 99.87, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 98.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.24, 1.01, 1.3, 0.95, 0.17, 2.13, 1.96, 0.26, 0.07, 0.6, 1.5, 1.33, 1.13, 0.66, 0.55, 1.13, 5.65, 3.39, 1.35, 3.62, 1.73, 1.5, 0.92, 1.87, 1.33, 5.48, 1.3, 1.2, 0.07, 7.04]} \ No newline at end of file diff --git a/annotations_1/MMNICLfHE3M_filtered.json b/annotations_1/MMNICLfHE3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d44271ebaa96a0448069b31a47afc5af8c005f3 --- /dev/null +++ b/annotations_1/MMNICLfHE3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 108.94], [111.0, 121.34], [123.0, 139.11], [140.0, 143.92], [148.0, 149.47], [151.0, 151.21], [157.0, 157.94], [159.0, 159.39], [161.0, 160.79], [162.0, 162.01], [163.0, 163.19], [164.0, 164.3], [166.0, 166.97], [173.0, 173.48]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.43, 42.65, 50.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 71.81], ["quack", 4.0], ["musical instrument", 2.65]], [["theremin", 37.28], ["music", 25.23], ["gong", 6.85]], null, null, null, null, null, null, null, null, null, null, null], "duration": [51.94, 10.34, 16.11, 3.92, 1.47, 0.21, 0.94, 0.39, -0.21, 0.01, 0.19, 0.3, 0.97, 0.48]} \ No newline at end of file diff --git a/annotations_1/MMxE41xM9ic_filtered.json b/annotations_1/MMxE41xM9ic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1a5d15a715423109afc2558a337c2a84cc36a0d --- /dev/null +++ b/annotations_1/MMxE41xM9ic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 51.73], [53.0, 53.67], [54.0, 53.72], [54.0, 55.12], [60.0, 61.05], [67.0, 67.36], [69.0, 76.81], [78.0, 78.8], [85.0, 85.8], [88.0, 89.6], [90.0, 98.56], [111.0, 115.65], [116.0, 117.26], [119.0, 123.16], [130.0, 132.36], [136.0, 138.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.25, 0.0, 0.0, 0.0, 29.54, 38.51, 0.0, 33.94, 34.54, 39.4], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 52.49], ["throbbing", 22.4], ["mains hum", 11.02]], null, null, null, [["music", 53.48], ["theremin", 9.42], ["siren", 8.15]], [["speech", 24.96], ["sidetone", 21.07], ["music", 9.21]], null, [["sidetone", 40.59], ["music", 24.98], ["speech", 18.08]], [["throbbing", 37.8], ["hum", 36.82], ["music", 12.03]], [["speech", 39.66], ["hum", 13.65], ["siren", 10.03]]], "duration": [1.73, 0.67, -0.28, 1.12, 1.05, 0.36, 7.81, 0.8, 0.8, 1.6, 8.56, 4.65, 1.26, 4.16, 2.36, 2.35]} \ No newline at end of file diff --git a/annotations_1/MNQQS7QR9Vo_filtered.json b/annotations_1/MNQQS7QR9Vo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d38c881aabac4fa4266c52b9cd6290ab5c394b8 --- /dev/null +++ b/annotations_1/MNQQS7QR9Vo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.53], [11.0, 11.01], [12.0, 11.94], [14.0, 45.76], [50.0, 110.71], [113.0, 122.27], [126.0, 133.12]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 28.4, 28.56], "audiomae_on_audioset": [null, null, null, null, null, [["music", 75.46], ["speech", 6.27], ["thump, thud", 5.74]], [["music", 36.07], ["speech", 22.37], ["throbbing", 7.41]]], "duration": [0.53, 0.01, -0.06, 31.76, 60.71, 9.27, 7.12]} \ No newline at end of file diff --git a/annotations_1/MNmdm8voYFE_filtered.json b/annotations_1/MNmdm8voYFE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f81b1ae7c1466d155a64cef42eed330c913f898 --- /dev/null +++ b/annotations_1/MNmdm8voYFE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 63.26], [63.0, 69.09], [71.0, 76.17], [78.0, 79.35], [80.0, 83.3], [84.0, 83.64], [84.0, 84.77], [85.0, 84.94], [85.0, 87.37], [91.0, 101.41], [111.0, 113.49], [114.0, 115.74], [117.0, 118.5], [122.0, 123.6], [129.0, 131.04], [132.0, 171.12], [172.0, 172.66], [173.0, 180.94], [192.0, 209.19], [212.0, 218.32], [219.0, 226.4]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [31.88, 31.45, 35.71, 0.0, 32.43, 0.0, 0.0, 0.0, 32.15, 29.77, 82.07, 0.0, 0.0, 0.0, 33.69, 0.0, 0.0, 39.22, 32.61, 36.02, 53.47], "audiomae_on_audioset": [[["music", 72.62], ["didgeridoo", 7.38], ["musical instrument", 4.71]], [["speech", 30.47], ["music", 28.89], ["throbbing", 7.68]], [["throbbing", 29.21], ["hum", 26.57], ["music", 21.87]], null, [["music", 44.21], ["speech", 7.13], ["theremin", 5.81]], null, null, null, [["music", 61.59], ["didgeridoo", 5.24], ["musical instrument", 4.01]], [["music", 73.02], ["speech", 7.65], ["musical instrument", 2.78]], null, null, null, null, [["mains hum", 22.7], ["hum", 21.25], ["speech", 20.97]], null, null, [["music", 59.03], ["throbbing", 7.2], ["synthesizer", 2.53]], [["music", 46.42], ["throbbing", 14.31], ["theremin", 11.46]], [["music", 59.59], ["synthesizer", 8.94], ["theremin", 5.98]], null], "duration": [2.26, 6.09, 5.17, 1.35, 3.3, -0.36, 0.77, -0.06, 2.37, 10.41, 2.49, 1.74, 1.5, 1.6, 2.04, 39.12, 0.66, 7.94, 17.19, 6.32, 7.4]} \ No newline at end of file diff --git a/annotations_1/MODlCaeiT0M_filtered.json b/annotations_1/MODlCaeiT0M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6e82951a3d886b247f1e73ac4b1d8030e54116b --- /dev/null +++ b/annotations_1/MODlCaeiT0M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.78], [6.0, 6.15], [8.0, 9.61], [11.0, 12.09], [16.0, 16.77], [47.0, 47.09], [55.0, 56.08], [89.0, 89.13], [91.0, 91.25], [95.0, 95.45], [114.0, 114.22], [116.0, 139.04], [153.0, 154.99], [158.0, 161.77], [164.0, 173.94], [175.0, 185.9], [190.0, 204.33], [205.0, 205.5], [210.0, 216.85], [217.0, 216.94], [217.0, 239.03], [240.0, 241.81], [244.0, 244.11], [248.0, 249.51], [251.0, 255.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.38, 0.0, 42.19, 41.05, 41.18, 38.45, 0.0, 38.56, 0.0, 83.52, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 61.66], ["speech", 5.9], ["synthesizer", 4.72]], null, [["music", 75.65], ["synthesizer", 3.46], ["musical instrument", 2.36]], [["music", 60.95], ["synthesizer", 5.45], ["didgeridoo", 3.62]], [["music", 60.57], ["hum", 6.87], ["mains hum", 3.16]], [["music", 76.23], ["hum", 1.89], ["mains hum", 1.78]], null, [["music", 51.59], ["carnatic music", 11.9], ["musical instrument", 6.99]], null, null, null, null, null, null], "duration": [0.78, 0.15, 1.61, 1.09, 0.77, 0.09, 1.08, 0.13, 0.25, 0.45, 0.22, 23.04, 1.99, 3.77, 9.94, 10.9, 14.33, 0.5, 6.85, -0.06, 22.03, 1.81, 0.11, 1.51, 4.45]} \ No newline at end of file diff --git a/annotations_1/MOLAFbjjOl0_filtered.json b/annotations_1/MOLAFbjjOl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e0f38d3d98dc57f9c256f08ba6aa650ff44c86a --- /dev/null +++ b/annotations_1/MOLAFbjjOl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 32.8], [34.0, 34.32], [35.0, 39.09], [40.0, 40.29], [46.0, 57.96], [58.0, 58.51], [61.0, 72.28], [81.0, 81.13], [82.0, 84.11], [85.0, 85.72], [88.0, 88.7], [102.0, 102.56], [113.0, 113.49], [119.0, 120.11], [172.0, 172.3], [178.0, 179.63], [180.0, 186.44], [188.0, 189.63], [190.0, 190.88], [191.0, 191.73], [195.0, 195.61]], "keep_status": [false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [29.5, 0.0, 34.87, 0.0, 29.94, 0.0, 31.29, 0.0, 33.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 81.29], ["whack, thwack", 6.5], ["music", 2.13]], null, [["thunk", 23.02], ["music", 18.99], ["hum", 6.82]], null, [["music", 37.85], ["speech", 29.96], ["didgeridoo", 5.58]], null, [["music", 20.18], ["hum", 18.08], ["mains hum", 17.36]], null, [["music", 44.42], ["pulse", 9.63], ["speech", 8.9]], null, null, null, null, null, null, null, [["speech", 31.51], ["hum", 22.76], ["mains hum", 11.67]], null, null, null, null], "duration": [5.8, 0.32, 4.09, 0.29, 11.96, 0.51, 11.28, 0.13, 2.11, 0.72, 0.7, 0.56, 0.49, 1.11, 0.3, 1.63, 6.44, 1.63, 0.88, 0.73, 0.61]} \ No newline at end of file diff --git a/annotations_1/MP414NY4kfA_filtered.json b/annotations_1/MP414NY4kfA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4f91a7e8eed6ada0b78edfca22e0a03e6cb797b --- /dev/null +++ b/annotations_1/MP414NY4kfA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.18], [15.0, 20.78], [21.0, 22.54], [27.0, 28.11], [30.0, 30.23], [31.0, 32.05], [33.0, 46.9], [51.0, 51.07], [52.0, 51.76], [55.0, 55.24], [61.0, 61.33], [65.0, 71.15], [73.0, 73.95], [74.0, 76.01], [82.0, 83.02], [83.0, 86.8], [90.0, 91.27], [107.0, 109.93], [114.0, 116.02], [117.0, 117.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 54.5, 0.0, 0.0, 0.0, 0.0, 62.47, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0, 99.4, 0.0, 99.26, 0.0, 96.42, 77.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 5.78, 1.54, 1.11, 0.23, 1.05, 13.9, 0.07, -0.24, 0.24, 0.33, 6.15, 0.95, 2.01, 1.02, 3.8, 1.27, 2.93, 2.02, 0.93]} \ No newline at end of file diff --git a/annotations_1/MPQojemDuDo_filtered.json b/annotations_1/MPQojemDuDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f40c4c0de9169f941785135875cce20cbb4ab26c --- /dev/null +++ b/annotations_1/MPQojemDuDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.14], [10.0, 57.25], [58.0, 64.34], [68.0, 71.05], [74.0, 96.45], [97.0, 103.17], [104.0, 105.29]], "keep_status": [true, false, true, true, false, true, false], "silence_prob": [40.31, 0.0, 28.98, 29.68, 30.48, 30.07, 0.0], "audiomae_on_audioset": [[["music", 22.02], ["throbbing", 19.35], ["hum", 16.13]], null, [["sound effect", 11.06], ["vehicle", 9.2], ["whale vocalization", 7.63]], [["speech", 42.77], ["whale vocalization", 5.44], ["field recording", 5.41]], [["speech", 64.26], ["music", 8.16], ["whale vocalization", 4.67]], [["music", 50.95], ["mains hum", 10.63], ["hum", 6.36]], null], "duration": [2.14, 47.25, 6.34, 3.05, 22.45, 6.17, 1.29]} \ No newline at end of file diff --git a/annotations_1/MPhIzvgB31Y_filtered.json b/annotations_1/MPhIzvgB31Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f9b22bf2f4cdd225fbdb99cc1598cd4a46c1aed --- /dev/null +++ b/annotations_1/MPhIzvgB31Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.55], [32.0, 37.99], [42.0, 42.3], [44.0, 53.15], [60.0, 66.07], [67.0, 67.24], [69.0, 70.46], [89.0, 91.99], [92.0, 92.2], [100.0, 100.75], [107.0, 110.37], [120.0, 121.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 40.38, 0.0, 38.83, 35.0, 0.0, 0.0, 30.65, 0.0, 0.0, 45.18, 0.0], "audiomae_on_audioset": [null, [["music", 49.33], ["moo", 15.46], ["cattle, bovinae", 9.12]], null, [["cattle, bovinae", 36.12], ["moo", 32.62], ["music", 20.06]], [["music", 78.66], ["middle eastern music", 3.46], ["singing", 1.67]], null, null, [["cattle, bovinae", 36.48], ["moo", 25.84], ["livestock, farm animals, working animals", 11.46]], null, null, [["speech", 27.97], ["cattle, bovinae", 13.14], ["music", 12.57]], null], "duration": [1.55, 5.99, 0.3, 9.15, 6.07, 0.24, 1.46, 2.99, 0.2, 0.75, 3.37, 1.14]} \ No newline at end of file diff --git a/annotations_1/MQ1E_qYia9Q_filtered.json b/annotations_1/MQ1E_qYia9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0dbb1c93e10364e18394e1729bc19f2e48e20da3 --- /dev/null +++ b/annotations_1/MQ1E_qYia9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.71], [23.0, 24.04], [25.0, 25.64], [33.0, 34.15], [35.0, 35.51], [44.0, 43.83], [47.0, 47.11], [50.0, 54.46], [57.0, 58.58], [61.0, 61.62], [83.0, 83.1], [84.0, 84.4], [86.0, 86.43], [88.0, 89.4], [91.0, 91.77], [92.0, 92.92], [97.0, 97.39], [105.0, 105.44], [106.0, 112.99], [114.0, 119.92], [122.0, 125.15], [134.0, 137.81], [139.0, 143.29], [148.0, 148.85], [153.0, 153.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.65, 36.07, 73.51, 46.61, 61.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["moo", 37.34], ["livestock, farm animals, working animals", 31.82], ["cattle, bovinae", 29.38]], null, [["music", 47.74], ["speech", 23.83], ["guitar", 5.05]], null, null, null], "duration": [0.71, 1.04, 0.64, 1.15, 0.51, -0.17, 0.11, 4.46, 1.58, 0.62, 0.1, 0.4, 0.43, 1.4, 0.77, 0.92, 0.39, 0.44, 6.99, 5.92, 3.15, 3.81, 4.29, 0.85, 0.37]} \ No newline at end of file diff --git a/annotations_1/MQ2PrvpAT-k_filtered.json b/annotations_1/MQ2PrvpAT-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ba0ec89f70b3c6c4aa0fcff4be9cbe70b9cb09f --- /dev/null +++ b/annotations_1/MQ2PrvpAT-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 21.42], [23.0, 24.68], [26.0, 32.68], [35.0, 36.69], [39.0, 42.31], [44.0, 46.08], [49.0, 52.76], [55.0, 60.51], [63.0, 64.83], [69.0, 69.33], [70.0, 72.5], [74.0, 75.76], [76.0, 83.17], [84.0, 89.11], [90.0, 90.98], [92.0, 93.85], [101.0, 121.64], [128.0, 132.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [100.0, 0.0, 100.0, 0.0, 97.54, 77.87, 59.33, 100.0, 0.0, 0.0, 100.0, 0.0, 99.96, 96.66, 0.0, 0.0, 33.63, 65.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 24.42], ["music", 23.65], ["didgeridoo", 4.08]], null], "duration": [3.42, 1.68, 6.68, 1.69, 3.31, 2.08, 3.76, 5.51, 1.83, 0.33, 2.5, 1.76, 7.17, 5.11, 0.98, 1.85, 20.64, 4.04]} \ No newline at end of file diff --git a/annotations_1/MUEhAUpa7iA_filtered.json b/annotations_1/MUEhAUpa7iA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a94d214aaa1c4f14886551efc277c49050ecf893 --- /dev/null +++ b/annotations_1/MUEhAUpa7iA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.97], [15.0, 15.2], [16.0, 101.93], [104.0, 109.78], [110.0, 112.29], [113.0, 115.65], [117.0, 118.22], [119.0, 120.78], [122.0, 123.8]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 89.9, 97.92, 99.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.97, 0.2, 85.93, 5.78, 2.29, 2.65, 1.22, 1.78, 1.8]} \ No newline at end of file diff --git a/annotations_1/MUeKujlb6gc_filtered.json b/annotations_1/MUeKujlb6gc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f47d9a89b463eca8cb1a2cba0f65aeb1483dd24d --- /dev/null +++ b/annotations_1/MUeKujlb6gc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.97], [5.0, 8.02], [9.0, 10.69], [11.0, 12.73], [14.0, 16.31], [22.0, 22.23], [25.0, 25.57], [33.0, 35.72], [37.0, 37.64], [40.0, 40.54], [41.0, 43.31], [44.0, 46.13], [47.0, 47.56], [48.0, 58.19], [59.0, 60.3], [61.0, 64.94], [65.0, 67.27], [70.0, 87.42], [91.0, 90.93], [93.0, 94.05], [95.0, 96.79], [98.0, 98.36], [100.0, 104.87], [108.0, 109.09], [110.0, 110.24], [114.0, 114.44], [115.0, 115.84], [118.0, 119.16], [120.0, 120.68], [121.0, 123.01], [124.0, 132.54], [135.0, 136.39], [139.0, 152.49], [172.0, 171.75], [173.0, 173.28], [174.0, 175.54], [177.0, 179.05], [180.0, 180.5], [181.0, 182.38], [184.0, 184.4], [185.0, 185.85], [189.0, 191.24], [192.0, 193.43], [196.0, 196.97], [199.0, 199.88], [201.0, 201.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.51, 0.0, 0.0, 99.21, 0.0, 0.0, 60.89, 0.0, 0.0, 85.54, 99.68, 0.0, 80.64, 0.0, 92.8, 98.27, 79.07, 0.0, 0.0, 0.0, 0.0, 54.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.14, 73.21, 0.0, 61.87, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 3.02, 1.69, 1.73, 2.31, 0.23, 0.57, 2.72, 0.64, 0.54, 2.31, 2.13, 0.56, 10.19, 1.3, 3.94, 2.27, 17.42, -0.07, 1.05, 1.79, 0.36, 4.87, 1.09, 0.24, 0.44, 0.84, 1.16, 0.68, 2.01, 8.54, 1.39, 13.49, -0.25, 0.28, 1.54, 2.05, 0.5, 1.38, 0.4, 0.85, 2.24, 1.43, 0.97, 0.88, 0.99]} \ No newline at end of file diff --git a/annotations_1/MVRR0XlqA4g_filtered.json b/annotations_1/MVRR0XlqA4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5804195a1c7bc39774306ce79dddcf200e5eb68 --- /dev/null +++ b/annotations_1/MVRR0XlqA4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.81], [4.0, 4.94], [8.0, 9.09], [10.0, 12.01], [12.0, 14.2], [25.0, 24.95], [26.0, 26.43], [27.0, 27.89], [30.0, 30.7], [32.0, 33.13], [34.0, 34.26], [38.0, 38.64], [40.0, 41.57], [42.0, 42.77], [43.0, 44.86], [50.0, 50.94], [64.0, 64.07], [66.0, 66.85], [68.0, 69.53], [73.0, 73.2], [78.0, 78.6], [80.0, 80.92], [87.0, 88.11], [92.0, 91.94], [96.0, 96.38], [98.0, 98.96], [110.0, 110.49], [112.0, 112.6], [115.0, 120.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 72.46, 52.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 15.35], ["moo", 5.41], ["cattle, bovinae", 5.35]]], "duration": [1.81, 0.94, 1.09, 2.01, 2.2, -0.05, 0.43, 0.89, 0.7, 1.13, 0.26, 0.64, 1.57, 0.77, 1.86, 0.94, 0.07, 0.85, 1.53, 0.2, 0.6, 0.92, 1.11, -0.06, 0.38, 0.96, 0.49, 0.6, 5.12]} \ No newline at end of file diff --git a/annotations_1/MVY7ci-BTI4_filtered.json b/annotations_1/MVY7ci-BTI4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04abe372a00a03c1892d56156c667c9b72515308 --- /dev/null +++ b/annotations_1/MVY7ci-BTI4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.07], [16.0, 21.37], [23.0, 25.0], [26.0, 39.68], [41.0, 52.62], [56.0, 60.34], [62.0, 64.98], [66.0, 88.03], [92.0, 109.7], [111.0, 114.24], [115.0, 115.94], [118.0, 117.93], [119.0, 119.38], [122.0, 123.04], [124.0, 124.8], [125.0, 127.2], [134.0, 135.82], [138.0, 139.94], [144.0, 144.21], [150.0, 152.12], [154.0, 154.18], [155.0, 163.95]], "keep_status": [true, false, true, false, false, true, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [33.84, 33.49, 30.63, 30.46, 30.24, 30.58, 30.33, 30.91, 30.8, 32.45, 0.0, 0.0, 0.0, 0.0, 0.0, 34.46, 0.0, 0.0, 0.0, 31.76, 0.0, 33.1], "audiomae_on_audioset": [[["music", 25.77], ["sidetone", 24.9], ["speech", 12.68]], [["hum", 31.45], ["throbbing", 22.12], ["music", 18.59]], [["music", 26.21], ["synthesizer", 5.79], ["vehicle", 4.85]], [["speech", 40.83], ["music", 38.41], ["throbbing", 5.48]], [["music", 60.16], ["throbbing", 7.85], ["smash, crash", 4.04]], [["music", 41.28], ["throbbing", 11.94], ["hum", 7.42]], [["hum", 23.45], ["music", 19.31], ["mains hum", 15.49]], [["music", 35.44], ["hum", 23.61], ["throbbing", 22.58]], [["music", 62.97], ["throbbing", 7.66], ["hum", 4.05]], [["music", 11.85], ["gunshot, gunfire", 10.62], ["clang", 9.7]], null, null, null, null, null, [["throbbing", 40.36], ["sidetone", 13.11], ["music", 11.74]], null, null, null, [["music", 64.29], ["synthesizer", 6.9], ["theremin", 3.68]], null, [["throbbing", 34.9], ["hum", 26.29], ["music", 17.52]]], "duration": [2.07, 5.37, 2.0, 13.68, 11.62, 4.34, 2.98, 22.03, 17.7, 3.24, 0.94, -0.07, 0.38, 1.04, 0.8, 2.2, 1.82, 1.94, 0.21, 2.12, 0.18, 8.95]} \ No newline at end of file diff --git a/annotations_1/MVo83HAnysQ_filtered.json b/annotations_1/MVo83HAnysQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..feea4862e576053539a9b8cc52f78070c239b676 --- /dev/null +++ b/annotations_1/MVo83HAnysQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.71], [15.0, 15.09], [43.0, 44.96], [45.0, 45.81], [49.0, 49.2], [51.0, 51.49], [52.0, 54.65], [56.0, 58.87], [60.0, 60.88], [69.0, 70.21], [71.0, 73.31], [75.0, 75.22], [87.0, 87.51], [89.0, 89.48], [91.0, 92.01], [105.0, 105.61], [112.0, 112.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.55, 70.58, 0.0, 0.0, 33.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 59.91], ["speech", 18.17], ["boing", 4.55]], null, null, null, [["music", 47.5], ["speech", 20.8], ["boing", 10.15]], null, null, null, null, null, null], "duration": [0.71, 0.09, 1.96, 0.81, 0.2, 0.49, 2.65, 2.87, 0.88, 1.21, 2.31, 0.22, 0.51, 0.48, 1.01, 0.61, 0.26]} \ No newline at end of file diff --git a/annotations_1/MWAMJWYNpK8_filtered.json b/annotations_1/MWAMJWYNpK8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5013348c41f69b64a19b57d3a8e2fc2fc4e0e7e1 --- /dev/null +++ b/annotations_1/MWAMJWYNpK8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 17.96], [18.0, 18.94], [20.0, 21.1], [24.0, 24.27], [25.0, 40.61], [44.0, 71.17], [74.0, 106.35], [108.0, 108.01], [110.0, 121.54], [122.0, 121.58], [123.0, 122.74], [123.0, 122.89], [123.0, 123.01], [123.0, 123.04], [123.0, 151.93], [152.0, 152.59], [154.0, 154.43], [155.0, 178.31]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [34.51, 0.0, 0.0, 0.0, 29.51, 28.94, 0.0, 0.0, 30.16, 0.0, 0.0, 0.0, 0.0, 0.0, 31.26, 0.0, 0.0, 29.66], "audiomae_on_audioset": [[["whale vocalization", 74.39], ["hum", 4.21], ["stomach rumble", 2.63]], null, null, null, [["speech", 43.55], ["cacophony", 9.2], ["buzz", 7.15]], [["speech", 47.75], ["fart", 10.23], ["boom", 8.8]], null, null, [["clang", 54.12], ["ding", 24.93], ["speech", 7.51]], null, null, null, null, null, [["hum", 44.04], ["mains hum", 33.73], ["music", 8.39]], null, null, [["hum", 41.57], ["throbbing", 13.39], ["music", 10.02]]], "duration": [5.96, 0.94, 1.1, 0.27, 15.61, 27.17, 32.35, 0.01, 11.54, -0.42, -0.26, -0.11, 0.01, 0.04, 28.93, 0.59, 0.43, 23.31]} \ No newline at end of file diff --git a/annotations_1/MWc0I1-Sfj4_filtered.json b/annotations_1/MWc0I1-Sfj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f58f6df1bbe0d527c99ef3b0095fdc5da3a05f3 --- /dev/null +++ b/annotations_1/MWc0I1-Sfj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.81], [5.0, 6.86], [9.0, 9.88], [11.0, 10.79], [14.0, 14.18], [15.0, 15.31], [17.0, 17.09], [21.0, 22.64], [23.0, 34.11], [35.0, 34.91], [35.0, 35.24], [38.0, 38.79], [42.0, 51.29], [59.0, 59.71], [63.0, 64.52], [67.0, 67.66], [69.0, 70.19], [71.0, 71.93], [73.0, 74.8], [82.0, 83.1], [83.0, 83.27], [83.0, 97.34], [101.0, 102.64], [107.0, 110.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.42, 0.0, 0.0, 0.0, 45.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.21, 0.0, 30.57], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.79], ["didgeridoo", 6.54], ["sidetone", 5.9]], null, null, null, null, null, null, null, null, [["music", 25.45], ["insect", 17.14], ["fly, housefly", 10.74]], null, [["boing", 23.55], ["sound effect", 15.56], ["fart", 11.23]]], "duration": [-0.19, 1.86, 0.88, -0.21, 0.18, 0.31, 0.09, 1.64, 11.11, -0.09, 0.24, 0.79, 9.29, 0.71, 1.52, 0.66, 1.19, 0.93, 1.8, 1.1, 0.27, 14.34, 1.64, 3.46]} \ No newline at end of file diff --git a/annotations_1/MWxa84PirUc_filtered.json b/annotations_1/MWxa84PirUc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d706538a8144f0383e5629af62096d45f0861652 --- /dev/null +++ b/annotations_1/MWxa84PirUc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.34], [7.0, 7.94], [9.0, 16.46], [18.0, 18.99], [20.0, 20.83], [23.0, 24.29], [27.0, 29.61], [30.0, 29.74], [32.0, 36.76], [39.0, 39.09], [41.0, 42.4], [45.0, 46.87], [49.0, 67.83], [69.0, 78.61], [80.0, 80.69], [84.0, 85.06], [86.0, 86.49], [88.0, 89.48], [91.0, 91.72], [93.0, 95.55], [96.0, 100.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 99.52, 0.0, 0.0, 0.0, 99.99, 0.0, 100.0, 0.0, 0.0, 0.0, 83.34, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 48.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 68.62], ["hum", 9.53], ["music", 4.77]]], "duration": [5.34, 0.94, 7.46, 0.99, 0.83, 1.29, 2.61, -0.26, 4.76, 0.09, 1.4, 1.87, 18.83, 9.61, 0.69, 1.06, 0.49, 1.48, 0.72, 2.55, 4.95]} \ No newline at end of file diff --git a/annotations_1/MYErK-XLJv0_filtered.json b/annotations_1/MYErK-XLJv0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..827382a0fa32229b384e4a61c9e73caf7bac8f31 --- /dev/null +++ b/annotations_1/MYErK-XLJv0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.16], [14.0, 18.17], [23.0, 22.62], [23.0, 26.4], [31.0, 50.16], [52.0, 80.27], [81.0, 81.6], [82.0, 83.29], [84.0, 84.33], [86.0, 87.07], [89.0, 92.74], [93.0, 93.41], [100.0, 100.5], [101.0, 102.96], [104.0, 105.22], [106.0, 106.51], [108.0, 109.58], [110.0, 111.16], [115.0, 115.42], [117.0, 117.37], [118.0, 118.94], [122.0, 121.85], [124.0, 124.63], [128.0, 128.46], [129.0, 130.03], [131.0, 132.39], [136.0, 136.0], [139.0, 143.77], [148.0, 149.81]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.19, 0.0, 34.81, 35.23, 100.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0], "audiomae_on_audioset": [null, [["speech", 68.5], ["music", 2.74], ["explosion", 2.61]], null, [["speech", 54.48], ["thunk", 5.17], ["whack, thwack", 2.66]], [["speech", 79.57], ["explosion", 2.26], ["eruption", 2.22]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 4.17, -0.38, 3.4, 19.16, 28.27, 0.6, 1.29, 0.33, 1.07, 3.74, 0.41, 0.5, 1.96, 1.22, 0.51, 1.58, 1.16, 0.42, 0.37, 0.94, -0.15, 0.63, 0.46, 1.03, 1.39, 0.0, 4.77, 1.81]} \ No newline at end of file diff --git a/annotations_1/MYkSUEjYLc0_filtered.json b/annotations_1/MYkSUEjYLc0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..768a3e54734ebff3315bab40359358eb153d4f71 --- /dev/null +++ b/annotations_1/MYkSUEjYLc0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.59], [18.0, 27.9], [29.0, 32.91], [34.0, 50.79], [53.0, 113.98], [115.0, 115.13], [137.0, 157.01], [161.0, 161.52], [162.0, 162.08], [163.0, 164.79], [167.0, 167.37]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 93.13, 99.96, 95.51, 0.0, 0.0, 40.31, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 56.72], ["didgeridoo", 6.67], ["hum", 4.23]], null, null, null, null], "duration": [1.59, 9.9, 3.91, 16.79, 60.98, 0.13, 20.01, 0.52, 0.08, 1.79, 0.37]} \ No newline at end of file diff --git a/annotations_1/MZG1HbQ3KCE_filtered.json b/annotations_1/MZG1HbQ3KCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..493f8bae2affd62642ec19827181c3e594b50daa --- /dev/null +++ b/annotations_1/MZG1HbQ3KCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.41], [17.0, 18.25], [20.0, 36.78], [51.0, 66.33], [67.0, 66.93], [76.0, 77.06], [79.0, 93.87], [94.0, 101.26], [104.0, 106.1], [106.0, 115.86], [125.0, 134.23], [142.0, 182.16], [185.0, 186.29]], "keep_status": [false, false, false, false, false, false, true, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 30.86, 32.25, 0.0, 0.0, 31.82, 30.42, 33.11, 32.14, 30.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 70.35], ["carnatic music", 6.65], ["sitar", 1.88]], [["speech", 47.71], ["music", 31.21], ["synthesizer", 3.59]], null, null, [["fly, housefly", 28.38], ["insect", 20.76], ["buzz", 20.63]], [["cattle, bovinae", 24.85], ["moo", 24.47], ["livestock, farm animals, working animals", 16.86]], [["speech", 35.02], ["music", 30.89], ["crowd", 3.37]], [["buzz", 54.9], ["speech", 13.1], ["music", 9.18]], [["speech", 28.92], ["vehicle", 18.39], ["bee, wasp, etc.", 5.47]], null, null], "duration": [1.41, 1.25, 16.78, 15.33, -0.07, 1.06, 14.87, 7.26, 2.1, 9.86, 9.23, 40.16, 1.29]} \ No newline at end of file diff --git a/annotations_1/MZIPOu6WeGg_filtered.json b/annotations_1/MZIPOu6WeGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25718aa64ea78700f8ccc3e1096bd80865e3d35f --- /dev/null +++ b/annotations_1/MZIPOu6WeGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.95], [3.0, 5.12], [7.0, 8.18], [14.0, 17.78], [19.0, 19.87], [22.0, 23.4], [26.0, 27.19], [30.0, 31.36], [34.0, 83.79], [85.0, 87.45], [91.0, 107.79], [109.0, 109.63], [111.0, 111.74], [119.0, 120.09], [124.0, 124.23], [125.0, 125.63], [129.0, 130.13], [131.0, 132.43], [133.0, 134.76], [136.0, 135.89], [137.0, 137.74], [145.0, 146.08], [147.0, 148.31], [150.0, 153.01], [153.0, 154.16], [155.0, 155.9], [159.0, 159.29]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 32.46, 0.0, 39.8, 0.0, 0.0, 0.0, 0.0, 0.0, 36.84, 30.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.31, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 27.99], ["music", 14.11], ["vehicle", 10.28]], null, [["music", 42.41], ["hum", 11.5], ["throbbing", 9.54]], null, null, null, null, null, [["music", 44.39], ["throbbing", 14.99], ["speech", 11.29]], [["music", 46.71], ["hum", 20.06], ["scary music", 8.45]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.1], ["rumble", 11.16], ["whale vocalization", 7.05]], null, null, null], "duration": [0.95, 2.12, 1.18, 3.78, 0.87, 1.4, 1.19, 1.36, 49.79, 2.45, 16.79, 0.63, 0.74, 1.09, 0.23, 0.63, 1.13, 1.43, 1.76, -0.11, 0.74, 1.08, 1.31, 3.01, 1.16, 0.9, 0.29]} \ No newline at end of file diff --git a/annotations_1/MZXC37sbqUM_filtered.json b/annotations_1/MZXC37sbqUM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3164399463b5e07583fd00cdf4fd10f5b8fe0967 --- /dev/null +++ b/annotations_1/MZXC37sbqUM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [3.0, 8.21], [9.0, 10.54], [11.0, 12.07], [13.0, 14.35], [15.0, 15.63], [16.0, 16.48], [19.0, 22.59], [23.0, 24.29], [25.0, 26.86], [27.0, 29.69], [30.0, 31.7], [32.0, 34.7], [38.0, 38.99], [39.0, 40.37], [41.0, 40.88], [41.0, 49.91], [51.0, 51.48], [62.0, 62.46], [64.0, 64.71], [65.0, 67.22], [70.0, 70.53], [71.0, 72.71], [73.0, 75.74], [76.0, 79.44], [82.0, 83.64], [84.0, 87.61], [88.0, 91.32], [92.0, 94.15], [95.0, 102.39], [104.0, 104.95], [106.0, 107.81], [111.0, 113.27], [116.0, 123.03], [126.0, 128.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.35, 0.0, 0.0, 0.0, 0.0, 0.0, 76.04, 0.0, 0.0, 44.49, 0.0, 97.83, 0.0, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 64.29, 0.0, 0.0, 73.51, 99.73, 0.0, 82.61, 99.65, 47.16, 96.17, 0.0, 0.0, 67.51, 99.76, 99.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 55.73], ["sidetone", 33.18], ["radio", 4.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 39.07], ["speech", 33.91], ["whale vocalization", 11.74]], null, null, null, null, null, null], "duration": [1.01, 5.21, 1.54, 1.07, 1.35, 0.63, 0.48, 3.59, 1.29, 1.86, 2.69, 1.7, 2.7, 0.99, 1.37, -0.12, 8.91, 0.48, 0.46, 0.71, 2.22, 0.53, 1.71, 2.74, 3.44, 1.64, 3.61, 3.32, 2.15, 7.39, 0.95, 1.81, 2.27, 7.03, 2.24]} \ No newline at end of file diff --git a/annotations_1/MZaX-RbQ7ic_filtered.json b/annotations_1/MZaX-RbQ7ic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43f0c00f4ebeffe6fc8a76c35f956c8683fda2c4 --- /dev/null +++ b/annotations_1/MZaX-RbQ7ic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.54], [6.0, 7.45], [8.0, 8.26], [9.0, 9.88], [16.0, 18.87], [19.0, 42.13], [42.0, 45.81], [46.0, 51.0], [52.0, 56.07], [57.0, 62.46], [63.0, 108.36], [110.0, 123.63]], "keep_status": [false, false, false, false, true, true, true, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.66, 29.36, 37.55, 36.29, 31.92, 31.68, 0.0, 29.04], "audiomae_on_audioset": [null, null, null, null, [["music", 26.08], ["hum", 8.09], ["sonar", 7.63]], [["music", 43.81], ["speech", 17.2], ["whack, thwack", 6.8]], [["speech", 26.42], ["music", 26.3], ["musical instrument", 5.99]], [["speech", 28.95], ["bow-wow", 6.15], ["dog", 5.58]], [["thunk", 33.15], ["music", 21.73], ["synthesizer", 3.26]], [["speech", 48.17], ["rumble", 10.97], ["groan", 6.37]], null, [["speech", 57.26], ["beatboxing", 10.98], ["fart", 3.48]]], "duration": [0.54, 1.45, 0.26, 0.88, 2.87, 23.13, 3.81, 5.0, 4.07, 5.46, 45.36, 13.63]} \ No newline at end of file diff --git a/annotations_1/M_7k0PCONF0_filtered.json b/annotations_1/M_7k0PCONF0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c5487fa7aaf3180a8df234fbb65920d8b1d0d33 --- /dev/null +++ b/annotations_1/M_7k0PCONF0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.31], [9.0, 9.85], [12.0, 17.0], [19.0, 20.95], [25.0, 25.93], [27.0, 45.74], [46.0, 51.06], [52.0, 57.35], [61.0, 64.86], [66.0, 67.54], [70.0, 70.58], [71.0, 72.35], [75.0, 76.99], [80.0, 81.72], [82.0, 85.28], [88.0, 89.51], [90.0, 90.66], [91.0, 92.21], [95.0, 97.11], [98.0, 98.74], [99.0, 100.53], [104.0, 105.17], [108.0, 108.5], [116.0, 116.61], [120.0, 124.63], [125.0, 125.9], [126.0, 126.22], [127.0, 127.77], [129.0, 135.89], [144.0, 145.02], [150.0, 149.79], [150.0, 151.48], [154.0, 159.75], [162.0, 164.27], [166.0, 168.2]], "keep_status": [false, false, true, false, false, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 46.72, 0.0, 0.0, 45.49, 36.9, 35.41, 37.95, 0.0, 0.0, 0.0, 0.0, 0.0, 56.1, 0.0, 0.0, 0.0, 34.8, 0.0, 0.0, 0.0, 0.0, 0.0, 42.28, 0.0, 0.0, 0.0, 40.21, 0.0, 0.0, 0.0, 92.64, 97.83, 54.76], "audiomae_on_audioset": [null, null, [["music", 28.22], ["synthesizer", 7.64], ["speech", 6.38]], null, null, [["speech", 24.91], ["hum", 19.31], ["mains hum", 16.51]], [["music", 39.78], ["hum", 10.6], ["mains hum", 8.54]], [["music", 53.88], ["speech", 6.31], ["mains hum", 5.0]], [["music", 54.0], ["musical instrument", 6.45], ["guitar", 5.6]], null, null, null, null, null, null, null, null, null, [["music", 33.24], ["cough", 26.59], ["throat clearing", 14.22]], null, null, null, null, null, [["music", 51.18], ["hum", 6.8], ["throbbing", 6.49]], null, null, null, [["music", 25.27], ["thunk", 22.24], ["guitar", 7.62]], null, null, null, null, null, null], "duration": [0.31, 0.85, 5.0, 1.95, 0.93, 18.74, 5.06, 5.35, 3.86, 1.54, 0.58, 1.35, 1.99, 1.72, 3.28, 1.51, 0.66, 1.21, 2.11, 0.74, 1.53, 1.17, 0.5, 0.61, 4.63, 0.9, 0.22, 0.77, 6.89, 1.02, -0.21, 1.48, 5.75, 2.27, 2.2]} \ No newline at end of file diff --git a/annotations_1/MaSm7idHMtI_filtered.json b/annotations_1/MaSm7idHMtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a200c9939b521dc6e4fc046cbed14c19b59c912 --- /dev/null +++ b/annotations_1/MaSm7idHMtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.04], [8.0, 9.81], [12.0, 40.47], [41.0, 49.18], [50.0, 51.66], [53.0, 53.69], [55.0, 57.7], [60.0, 62.94], [67.0, 68.07], [82.0, 83.37], [87.0, 89.04], [90.0, 93.78], [96.0, 97.29], [99.0, 101.11], [103.0, 106.46], [108.0, 109.85], [121.0, 135.36], [139.0, 140.39], [141.0, 149.35], [152.0, 153.3], [156.0, 178.09], [180.0, 184.35], [186.0, 188.1], [190.0, 210.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.66, 0.0, 99.8, 98.66, 0.0, 0.0, 100.0, 98.44, 0.0, 0.0, 99.26, 99.31, 0.0, 95.91, 98.1, 0.0, 98.27, 0.0, 99.36, 0.0, 99.52, 99.76, 99.96, 98.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.04, 1.81, 28.47, 8.18, 1.66, 0.69, 2.7, 2.94, 1.07, 1.37, 2.04, 3.78, 1.29, 2.11, 3.46, 1.85, 14.36, 1.39, 8.35, 1.3, 22.09, 4.35, 2.1, 20.46]} \ No newline at end of file diff --git a/annotations_1/MaqzxDPwOB4_filtered.json b/annotations_1/MaqzxDPwOB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06bf0be9090b87eceb70ea4eb0479b0b1adb5cd1 --- /dev/null +++ b/annotations_1/MaqzxDPwOB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.3], [4.0, 5.88], [9.0, 11.48], [16.0, 24.41], [26.0, 27.24], [28.0, 44.42], [46.0, 46.28], [49.0, 61.32], [65.0, 67.15], [69.0, 69.26], [73.0, 73.2], [82.0, 83.93], [88.0, 87.96], [89.0, 90.12], [102.0, 103.99], [108.0, 108.08], [112.0, 112.24], [117.0, 117.49], [119.0, 118.91], [119.0, 122.08], [127.0, 128.55], [131.0, 131.55], [135.0, 135.94]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.47, 37.57, 0.0, 87.55, 0.0, 100.0, 74.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.14, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["boing", 39.12], ["speech", 12.33], ["groan", 10.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 1.88, 2.48, 8.41, 1.24, 16.42, 0.28, 12.32, 2.15, 0.26, 0.2, 1.93, -0.04, 1.12, 1.99, 0.08, 0.24, 0.49, -0.09, 3.08, 1.55, 0.55, 0.94]} \ No newline at end of file diff --git a/annotations_1/Mc_zp1s60NY_filtered.json b/annotations_1/Mc_zp1s60NY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db452466074c4ea1049a373eaf6ecd02a2ef0b41 --- /dev/null +++ b/annotations_1/Mc_zp1s60NY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.83], [19.0, 36.17], [38.0, 68.59], [69.0, 73.67], [75.0, 75.41], [77.0, 77.79], [81.0, 99.01], [99.0, 99.08]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [0.0, 34.71, 0.0, 35.96, 0.0, 0.0, 33.2, 0.0], "audiomae_on_audioset": [null, [["theremin", 57.57], ["music", 34.45], ["musical instrument", 1.87]], null, [["music", 52.33], ["didgeridoo", 7.64], ["scary music", 4.86]], null, null, [["music", 73.48], ["synthesizer", 4.47], ["musical instrument", 2.52]], null], "duration": [0.83, 17.17, 30.59, 4.67, 0.41, 0.79, 18.01, 0.08]} \ No newline at end of file diff --git a/annotations_1/Mcf2hNBzwqg_filtered.json b/annotations_1/Mcf2hNBzwqg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46ece7a7a1fdd45982ea6f92238c93602dbc6edc --- /dev/null +++ b/annotations_1/Mcf2hNBzwqg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.17], [4.0, 5.04], [5.0, 9.86], [11.0, 17.22], [20.0, 22.57], [27.0, 28.0], [33.0, 33.57], [40.0, 45.67], [48.0, 48.98], [50.0, 57.42], [59.0, 62.14], [63.0, 69.35], [70.0, 70.6], [71.0, 80.55], [81.0, 82.16], [83.0, 88.69], [89.0, 90.58], [91.0, 96.09], [96.0, 98.91], [101.0, 103.01], [105.0, 106.66], [108.0, 109.59], [111.0, 113.09], [114.0, 139.55]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 85.35, 45.98, 28.46, 0.0, 0.0, 28.89, 0.0, 90.78, 89.72, 97.73, 0.0, 97.22, 0.0, 94.66, 0.0, 98.01, 41.68, 99.62, 0.0, 0.0, 60.6, 94.95], "audiomae_on_audioset": [null, null, null, [["busy signal", 19.77], ["music", 13.36], ["radio", 11.25]], [["sidetone", 15.51], ["white noise", 10.87], ["radio", 10.41]], null, null, [["speech", 22.67], ["noise", 9.96], ["throbbing", 7.44]], null, null, null, null, null, null, null, null, null, null, [["frog", 21.63], ["whale vocalization", 19.76], ["speech", 7.54]], null, null, null, null, null], "duration": [0.17, 1.04, 4.86, 6.22, 2.57, 1.0, 0.57, 5.67, 0.98, 7.42, 3.14, 6.35, 0.6, 9.55, 1.16, 5.69, 1.58, 5.09, 2.91, 2.01, 1.66, 1.59, 2.09, 25.55]} \ No newline at end of file diff --git a/annotations_1/McmlPCS1kHc_filtered.json b/annotations_1/McmlPCS1kHc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b9014057a8588fa03d9506cce02af1bd0340745 --- /dev/null +++ b/annotations_1/McmlPCS1kHc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 48.05], [49.0, 51.66], [52.0, 67.07], [68.0, 76.45], [77.0, 83.2], [84.0, 85.68], [87.0, 93.99], [95.0, 105.6], [107.0, 107.45], [109.0, 115.08]], "keep_status": [false, false, true, true, true, false, true, false, false, false], "silence_prob": [0.0, 66.63, 39.4, 35.57, 32.24, 0.0, 32.29, 31.98, 0.0, 31.68], "audiomae_on_audioset": [null, null, [["buzz", 18.52], ["cattle, bovinae", 14.9], ["hum", 12.03]], [["whale vocalization", 45.69], ["music", 13.96], ["hum", 8.72]], [["whale vocalization", 14.33], ["music", 13.45], ["hum", 9.7]], null, [["whale vocalization", 18.19], ["hum", 17.55], ["music", 14.6]], [["livestock, farm animals, working animals", 40.53], ["cattle, bovinae", 21.34], ["moo", 13.32]], null, [["whale vocalization", 37.22], ["cattle, bovinae", 18.46], ["moo", 16.89]]], "duration": [38.05, 2.66, 15.07, 8.45, 6.2, 1.68, 6.99, 10.6, 0.45, 6.08]} \ No newline at end of file diff --git a/annotations_1/MczK8n5msJM_filtered.json b/annotations_1/MczK8n5msJM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..249777b6fca75d658db2fea29cbbb3c3eb614533 --- /dev/null +++ b/annotations_1/MczK8n5msJM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.41], [5.0, 11.04], [15.0, 16.39], [20.0, 20.55], [21.0, 24.07], [25.0, 26.79], [37.0, 37.42], [38.0, 40.8], [47.0, 65.91], [68.0, 68.25], [69.0, 71.02], [73.0, 93.43], [95.0, 103.42], [104.0, 119.7], [125.0, 129.44], [131.0, 131.18], [132.0, 144.66], [145.0, 154.25], [160.0, 162.36], [168.0, 170.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, true], "silence_prob": [0.0, 30.3, 0.0, 0.0, 30.52, 0.0, 0.0, 31.83, 30.45, 0.0, 31.47, 30.63, 31.06, 30.69, 30.59, 0.0, 30.51, 30.62, 32.64, 47.54], "audiomae_on_audioset": [null, [["speech", 69.14], ["vehicle", 11.55], ["car", 3.65]], null, null, [["speech", 51.51], ["music", 22.83], ["vehicle", 8.43]], null, null, [["mains hum", 27.27], ["hum", 26.97], ["music", 24.33]], [["music", 42.21], ["throbbing", 23.44], ["hum", 15.99]], null, [["music", 38.55], ["speech", 30.16], ["synthesizer", 5.86]], [["speech", 23.42], ["music", 22.06], ["hum", 12.01]], [["music", 47.29], ["speech", 14.36], ["throbbing", 10.06]], [["music", 22.19], ["throbbing", 17.43], ["vehicle", 17.13]], [["music", 28.73], ["speech", 25.61], ["throbbing", 12.2]], null, [["music", 69.16], ["throbbing", 6.11], ["speech", 5.54]], [["music", 74.32], ["speech", 7.79], ["buzz", 2.12]], [["livestock, farm animals, working animals", 62.44], ["cattle, bovinae", 18.31], ["moo", 7.92]], [["speech", 29.88], ["music", 12.16], ["hum", 7.29]]], "duration": [0.41, 6.04, 1.39, 0.55, 3.07, 1.79, 0.42, 2.8, 18.91, 0.25, 2.02, 20.43, 8.42, 15.7, 4.44, 0.18, 12.66, 9.25, 2.36, 2.45]} \ No newline at end of file diff --git a/annotations_1/MdI5DrJ6V3k_filtered.json b/annotations_1/MdI5DrJ6V3k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa25e9e742ecec055236f67725673e85f22c814f --- /dev/null +++ b/annotations_1/MdI5DrJ6V3k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.57], [9.0, 21.95], [24.0, 28.07], [30.0, 30.94], [32.0, 39.88], [42.0, 41.96], [43.0, 59.63], [63.0, 74.17], [76.0, 78.09], [78.0, 84.6]], "keep_status": [false, true, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 29.7, 30.48, 0.0, 31.8, 0.0, 28.81, 28.59, 29.99, 28.48], "audiomae_on_audioset": [null, [["speech", 25.87], ["music", 13.35], ["livestock, farm animals, working animals", 12.18]], [["mosquito", 26.26], ["whip", 8.49], ["music", 8.28]], null, [["speech", 48.37], ["music", 20.28], ["boat, water vehicle", 4.8]], null, [["clang", 23.33], ["smash, crash", 15.32], ["whack, thwack", 13.38]], [["music", 70.11], ["whack, thwack", 8.89], ["smash, crash", 5.38]], [["music", 33.77], ["throbbing", 29.22], ["hum", 14.64]], [["music", 32.0], ["hum", 24.09], ["throbbing", 21.83]]], "duration": [-0.43, 12.95, 4.07, 0.94, 7.88, -0.04, 16.63, 11.17, 2.09, 6.6]} \ No newline at end of file diff --git a/annotations_1/MdfwpCH1Ksk_filtered.json b/annotations_1/MdfwpCH1Ksk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b877c4e6be536352277b8eb1b2c4450fad8ecd4f --- /dev/null +++ b/annotations_1/MdfwpCH1Ksk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.38], [9.0, 9.85], [10.0, 10.52], [11.0, 17.31], [18.0, 20.53], [21.0, 23.36], [27.0, 29.83], [30.0, 32.04], [33.0, 34.35], [35.0, 36.26], [38.0, 39.11], [40.0, 40.71], [45.0, 47.87], [49.0, 50.57], [52.0, 54.78], [56.0, 58.19], [59.0, 63.73], [65.0, 67.78], [69.0, 71.9], [72.0, 74.56], [77.0, 80.55], [82.0, 83.24], [85.0, 85.72], [88.0, 89.55], [97.0, 99.98], [105.0, 108.18], [109.0, 111.08], [112.0, 112.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.4, 99.99, 99.9, 100.0, 75.23, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 99.76, 99.9, 99.84, 99.98, 93.6, 97.22, 99.97, 0.0, 0.0, 0.0, 99.88, 97.54, 88.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.38, 0.85, 0.52, 6.31, 2.53, 2.36, 2.83, 2.04, 1.35, 1.26, 1.11, 0.71, 2.87, 1.57, 2.78, 2.19, 4.73, 2.78, 2.9, 2.56, 3.55, 1.24, 0.72, 1.55, 2.98, 3.18, 2.08, 0.9]} \ No newline at end of file diff --git a/annotations_1/MdoBOoR576Y_filtered.json b/annotations_1/MdoBOoR576Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bcd1b33f98dc8d3a7821c644d9ed788ceaf8907 --- /dev/null +++ b/annotations_1/MdoBOoR576Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 34.92], [35.0, 35.95], [38.0, 38.06], [39.0, 39.92], [58.0, 57.97], [59.0, 59.54], [60.0, 60.29], [61.0, 62.56], [63.0, 64.96], [71.0, 72.86], [75.0, 76.03], [78.0, 80.16], [85.0, 85.02], [92.0, 95.98], [99.0, 101.11], [105.0, 112.53], [115.0, 117.64], [118.0, 118.99], [123.0, 123.04], [130.0, 130.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false], "silence_prob": [64.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 59.59, 30.37, 30.09, 31.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 15.82], ["music", 10.04], ["speech", 9.64]], [["music", 39.16], ["throbbing", 19.62], ["speech", 11.11]], [["speech", 43.33], ["music", 8.98], ["didgeridoo", 3.53]], null, null, null], "duration": [5.92, 0.95, 0.06, 0.92, -0.03, 0.54, 0.29, 1.56, 1.96, 1.86, 1.03, 2.16, 0.02, 3.98, 2.11, 7.53, 2.64, 0.99, 0.04, 0.45]} \ No newline at end of file diff --git a/annotations_1/Mdp4T_G0Xsc_filtered.json b/annotations_1/Mdp4T_G0Xsc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47e7e5b7a8027be7ef277fc702b4549daac0298f --- /dev/null +++ b/annotations_1/Mdp4T_G0Xsc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [4.0, 5.85], [9.0, 9.46], [11.0, 12.6], [15.0, 16.41], [18.0, 23.6], [26.0, 26.91], [28.0, 28.9], [33.0, 36.24], [39.0, 40.8], [43.0, 43.73], [44.0, 47.88], [51.0, 63.66], [65.0, 69.9], [72.0, 72.08], [74.0, 77.43], [78.0, 81.35], [83.0, 86.0], [87.0, 88.48], [90.0, 90.61], [93.0, 95.91], [98.0, 99.81], [101.0, 101.85], [103.0, 104.41], [105.0, 106.84], [108.0, 110.42], [112.0, 115.35], [116.0, 119.23], [121.0, 127.16], [128.0, 129.84], [131.0, 131.94], [133.0, 134.2], [135.0, 137.19], [138.0, 140.85], [142.0, 143.56], [145.0, 147.48], [149.0, 151.38], [152.0, 156.51], [157.0, 161.64], [163.0, 170.19], [171.0, 177.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 90.25, 0.0, 0.0, 62.37, 60.23, 48.78, 0.0, 51.39, 46.75, 52.33, 0.0, 0.0, 56.03, 0.0, 0.0, 0.0, 0.0, 43.74, 39.69, 54.3, 82.43, 0.0, 0.0, 0.0, 86.82, 81.89, 0.0, 88.46, 78.55, 68.41, 67.0, 72.31, 58.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 30.23], ["music", 25.16], ["mains hum", 16.54]], null, null, [["music", 29.69], ["speech", 18.44], ["hum", 15.93]], null, null, null, null, null, null, null, null, [["hum", 31.13], ["mains hum", 10.68], ["music", 9.04]], [["music", 25.35], ["speech", 23.83], ["hum", 20.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 1.85, 0.46, 1.6, 1.41, 5.6, 0.91, 0.9, 3.24, 1.8, 0.73, 3.88, 12.66, 4.9, 0.08, 3.43, 3.35, 3.0, 1.48, 0.61, 2.91, 1.81, 0.85, 1.41, 1.84, 2.42, 3.35, 3.23, 6.16, 1.84, 0.94, 1.2, 2.19, 2.85, 1.56, 2.48, 2.38, 4.51, 4.64, 7.19, 6.79]} \ No newline at end of file diff --git a/annotations_1/Me3eSvA2K9k_filtered.json b/annotations_1/Me3eSvA2K9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd39fdb014244de171a4d36186dfcaea21bfa01c --- /dev/null +++ b/annotations_1/Me3eSvA2K9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.17], [23.0, 24.76], [27.0, 28.8], [31.0, 31.45], [32.0, 33.15], [35.0, 38.13], [41.0, 47.48], [50.0, 56.22], [58.0, 60.47], [61.0, 68.03], [69.0, 76.49], [78.0, 79.84], [82.0, 82.22], [86.0, 85.82], [88.0, 88.5], [91.0, 91.89], [94.0, 94.83], [96.0, 98.31], [99.0, 100.06], [102.0, 103.6], [106.0, 106.3], [112.0, 115.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.17, 1.76, 1.8, 0.45, 1.15, 3.13, 6.48, 6.22, 2.47, 7.03, 7.49, 1.84, 0.22, -0.18, 0.5, 0.89, 0.83, 2.31, 1.06, 1.6, 0.3, 3.15]} \ No newline at end of file diff --git a/annotations_1/MevYeKlyQM8_filtered.json b/annotations_1/MevYeKlyQM8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae77fb3795235f610956ed8f7b1e51e70326976c --- /dev/null +++ b/annotations_1/MevYeKlyQM8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.96], [16.0, 18.42], [21.0, 22.82], [24.0, 28.04], [29.0, 30.43], [31.0, 32.75], [34.0, 35.73], [36.0, 39.75], [40.0, 41.18], [42.0, 43.55], [47.0, 53.74], [54.0, 54.57], [55.0, 64.25], [64.0, 67.27], [69.0, 70.38], [76.0, 89.78], [91.0, 93.46], [96.0, 97.78], [100.0, 103.28], [104.0, 104.92], [105.0, 109.02], [109.0, 109.63], [111.0, 113.02], [114.0, 115.91], [117.0, 117.44], [119.0, 121.54], [123.0, 125.41], [127.0, 129.64], [132.0, 132.44], [136.0, 138.62], [140.0, 140.51], [141.0, 142.25], [145.0, 145.74], [146.0, 147.43], [148.0, 149.28], [150.0, 152.37], [153.0, 160.49]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.73, 0.0, 78.21, 0.0, 0.0, 0.0, 47.08, 0.0, 0.0, 97.73, 0.0, 36.94, 43.45, 0.0, 43.1, 90.95, 0.0, 53.22, 0.0, 48.82, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 39.01], ["hum", 14.29], ["mains hum", 10.06]], null, null, null, null, [["speech", 35.71], ["hum", 30.45], ["mains hum", 8.67]], [["speech", 38.13], ["hum", 12.08], ["mains hum", 10.72]], null, [["fart", 34.15], ["explosion", 20.62], ["burst, pop", 3.49]], null, null, null, null, [["speech", 58.74], ["sine wave", 11.51], ["chirp tone", 8.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.96, 2.42, 1.82, 4.04, 1.43, 1.75, 1.73, 3.75, 1.18, 1.55, 6.74, 0.57, 9.25, 3.27, 1.38, 13.78, 2.46, 1.78, 3.28, 0.92, 4.02, 0.63, 2.02, 1.91, 0.44, 2.54, 2.41, 2.64, 0.44, 2.62, 0.51, 1.25, 0.74, 1.43, 1.28, 2.37, 7.49]} \ No newline at end of file diff --git a/annotations_1/MeyU68qSBMI_filtered.json b/annotations_1/MeyU68qSBMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e35e20942549d79cf460d5fb947e0ee77ebd92a5 --- /dev/null +++ b/annotations_1/MeyU68qSBMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.19]], "keep_status": [false], "silence_prob": [35.48], "audiomae_on_audioset": [[["speech", 50.24], ["music", 16.18], ["thunk", 14.47]]], "duration": [2.19]} \ No newline at end of file diff --git a/annotations_1/Mfcqb8DD400_filtered.json b/annotations_1/Mfcqb8DD400_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3366370b4ae37b2e775c51aa513abc9cc6c4e91 --- /dev/null +++ b/annotations_1/Mfcqb8DD400_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.32], [4.0, 5.0], [10.0, 11.1], [13.0, 13.9], [19.0, 18.89], [20.0, 26.32], [28.0, 27.84], [31.0, 31.35], [32.0, 32.91], [34.0, 34.87], [44.0, 48.03], [49.0, 49.18], [56.0, 60.08], [63.0, 63.63], [64.0, 64.72], [66.0, 66.24], [72.0, 72.32], [74.0, 82.68], [84.0, 84.59], [90.0, 92.77], [98.0, 99.99], [101.0, 107.84], [114.0, 115.4], [116.0, 118.83], [119.0, 120.73], [122.0, 122.91], [125.0, 127.55], [128.0, 130.03], [132.0, 133.1], [140.0, 154.14], [155.0, 155.88], [157.0, 157.81], [162.0, 162.43], [163.0, 164.61], [167.0, 167.17], [170.0, 173.99], [175.0, 176.42], [190.0, 192.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 63.85, 0.0, 93.45, 0.0, 0.0, 0.0, 0.0, 63.31, 0.0, 93.45, 0.0, 89.9, 0.0, 94.07, 0.0, 0.0, 51.39, 80.11, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 93.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 1.0, 1.1, 0.9, -0.11, 6.32, -0.16, 0.35, 0.91, 0.87, 4.03, 0.18, 4.08, 0.63, 0.72, 0.24, 0.32, 8.68, 0.59, 2.77, 1.99, 6.84, 1.4, 2.83, 1.73, 0.91, 2.55, 2.03, 1.1, 14.14, 0.88, 0.81, 0.43, 1.61, 0.17, 3.99, 1.42, 2.3]} \ No newline at end of file diff --git a/annotations_1/Mg0bvyIEHcs_filtered.json b/annotations_1/Mg0bvyIEHcs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/Mg0bvyIEHcs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/Mgc3y6p-Bys_filtered.json b/annotations_1/Mgc3y6p-Bys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4bef19f3b9b734266eb717ce4868f3d9fd64588 --- /dev/null +++ b/annotations_1/Mgc3y6p-Bys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.53], [36.0, 37.71], [39.0, 49.23], [50.0, 51.0], [52.0, 53.06], [56.0, 56.47], [60.0, 61.57], [64.0, 76.06], [79.0, 88.1], [90.0, 91.88], [93.0, 95.57], [97.0, 97.92], [98.0, 98.07], [98.0, 98.95], [100.0, 118.98], [120.0, 120.38], [121.0, 138.72], [139.0, 151.07], [152.0, 156.24], [158.0, 159.0], [160.0, 162.82], [164.0, 166.58]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, true, false, true, true], "silence_prob": [0.0, 0.0, 36.71, 0.0, 0.0, 0.0, 0.0, 30.37, 32.15, 0.0, 39.38, 0.0, 0.0, 0.0, 36.67, 0.0, 32.45, 35.26, 34.56, 0.0, 28.5, 29.57], "audiomae_on_audioset": [null, null, [["music", 38.16], ["sonar", 22.43], ["telephone bell ringing", 4.57]], null, null, null, null, [["hum", 61.26], ["mains hum", 16.67], ["throbbing", 11.14]], [["music", 30.07], ["speech", 21.97], ["door", 9.23]], null, [["music", 39.61], ["speech", 34.5], ["hum", 3.28]], null, null, null, [["hum", 24.96], ["music", 21.37], ["throbbing", 10.17]], null, [["whack, thwack", 24.88], ["thump, thud", 7.87], ["music", 5.31]], [["speech", 32.68], ["mechanisms", 24.17], ["gears", 16.15]], [["music", 22.02], ["creak", 10.57], ["theremin", 6.47]], null, [["electric shaver, electric razor", 9.26], ["sound effect", 8.38], ["buzz", 7.49]], [["whale vocalization", 21.51], ["cattle, bovinae", 8.07], ["white noise", 6.69]]], "duration": [0.53, 1.71, 10.23, 1.0, 1.06, 0.47, 1.57, 12.06, 9.1, 1.88, 2.57, 0.92, 0.07, 0.95, 18.98, 0.38, 17.72, 12.07, 4.24, 1.0, 2.82, 2.58]} \ No newline at end of file diff --git a/annotations_1/Mge3npvF4R0_filtered.json b/annotations_1/Mge3npvF4R0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c70cef04f29727f5a7b356b589f0f7f635c23396 --- /dev/null +++ b/annotations_1/Mge3npvF4R0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 77.16], [78.0, 126.47], [127.0, 132.09], [133.0, 133.0], [133.0, 133.74], [134.0, 136.29]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.93, 0.0, 0.0, 98.86], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [31.16, 48.47, 5.09, 0.0, 0.74, 2.29]} \ No newline at end of file diff --git a/annotations_1/Mh51HEise7Q_filtered.json b/annotations_1/Mh51HEise7Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f27c4ee8aa78e4eefe624a164a5341bfbaddbce --- /dev/null +++ b/annotations_1/Mh51HEise7Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.98], [20.0, 28.68], [29.0, 48.24], [51.0, 53.1], [54.0, 68.59], [70.0, 70.5], [72.0, 72.76], [77.0, 84.96], [87.0, 131.31], [133.0, 137.98], [140.0, 140.56], [147.0, 146.82], [149.0, 149.05], [152.0, 163.07]], "keep_status": [true, true, true, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [28.58, 29.29, 29.06, 28.59, 31.69, 0.0, 0.0, 37.69, 0.0, 31.34, 0.0, 0.0, 0.0, 29.35], "audiomae_on_audioset": [[["speech", 43.62], ["whoosh, swoosh, swish", 8.09], ["burst, pop", 7.91]], [["speech", 30.98], ["hum", 23.94], ["mains hum", 11.33]], [["hum", 32.52], ["music", 12.36], ["mains hum", 10.13]], [["vehicle", 46.82], ["car", 19.24], ["race car, auto racing", 9.76]], [["hum", 36.67], ["music", 23.45], ["mains hum", 16.54]], null, null, [["music", 31.79], ["synthesizer", 22.67], ["speech", 13.59]], null, [["music", 37.98], ["speech", 33.33], ["vehicle", 5.79]], null, null, null, [["music", 46.73], ["electronic music", 16.09], ["synthesizer", 5.55]]], "duration": [4.98, 8.68, 19.24, 2.1, 14.59, 0.5, 0.76, 7.96, 44.31, 4.98, 0.56, -0.18, 0.05, 11.07]} \ No newline at end of file diff --git a/annotations_1/MhS1b56Koxc_filtered.json b/annotations_1/MhS1b56Koxc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1fa90ce707cbaddfea5e2e24c063f6faf452541 --- /dev/null +++ b/annotations_1/MhS1b56Koxc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [6.0, 6.72], [14.0, 15.16], [18.0, 18.33], [19.0, 20.14], [23.0, 24.9], [26.0, 26.08], [27.0, 28.0], [31.0, 30.94], [34.0, 34.82], [41.0, 42.97], [45.0, 45.74], [47.0, 48.37], [49.0, 50.99], [54.0, 55.68], [60.0, 61.15], [65.0, 66.75], [68.0, 71.36], [74.0, 74.93], [75.0, 83.49], [86.0, 86.32], [88.0, 88.55], [91.0, 91.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.13, 0.0, 53.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 0.72, 1.16, 0.33, 1.14, 1.9, 0.08, 1.0, -0.06, 0.82, 1.97, 0.74, 1.37, 1.99, 1.68, 1.15, 1.75, 3.36, 0.93, 8.49, 0.32, 0.55, 0.49]} \ No newline at end of file diff --git a/annotations_1/Mi6CrAUhnzE_filtered.json b/annotations_1/Mi6CrAUhnzE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2344a5fabe6672b26a84a836bba94c19bc891e54 --- /dev/null +++ b/annotations_1/Mi6CrAUhnzE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 38.13], [38.0, 38.82], [39.0, 54.78], [56.0, 56.51], [58.0, 63.36], [65.0, 65.75], [76.0, 76.52], [81.0, 88.21], [89.0, 89.19], [90.0, 90.1], [90.0, 92.58], [103.0, 103.67], [107.0, 106.95], [108.0, 109.09], [119.0, 120.29], [121.0, 141.44]], "keep_status": [false, false, true, false, true, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.15, 0.0, 37.2, 0.0, 0.0, 36.42, 0.0, 0.0, 44.15, 0.0, 0.0, 0.0, 0.0, 35.1], "audiomae_on_audioset": [null, null, [["speech", 13.58], ["explosion", 9.85], ["outside, rural or natural", 5.83]], null, [["fly, housefly", 25.23], ["speech", 21.57], ["insect", 7.32]], null, null, [["moo", 19.71], ["speech", 13.36], ["cattle, bovinae", 12.92]], null, null, [["noise", 31.83], ["music", 14.0], ["speech", 6.58]], null, null, null, null, [["music", 71.41], ["hum", 9.1], ["throbbing", 8.81]]], "duration": [1.13, 0.82, 15.78, 0.51, 5.36, 0.75, 0.52, 7.21, 0.19, 0.1, 2.58, 0.67, -0.05, 1.09, 1.29, 20.44]} \ No newline at end of file diff --git a/annotations_1/MkNhAG2CUso_filtered.json b/annotations_1/MkNhAG2CUso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08d88e9e71ea964e64574ec1a39034de93fe4822 --- /dev/null +++ b/annotations_1/MkNhAG2CUso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.47], [12.0, 41.98], [44.0, 83.64], [86.0, 91.44], [94.0, 95.05], [96.0, 99.01], [104.0, 105.19], [108.0, 114.49], [115.0, 120.99], [123.0, 127.31], [129.0, 130.67], [132.0, 136.34], [138.0, 143.72], [144.0, 153.84], [159.0, 170.95], [173.0, 177.87]], "keep_status": [true, true, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [31.49, 29.91, 0.0, 35.53, 0.0, 55.74, 0.0, 48.78, 37.86, 41.28, 0.0, 40.97, 44.55, 54.3, 71.43, 45.85], "audiomae_on_audioset": [[["speech", 30.51], ["music", 22.93], ["throbbing", 4.16]], [["speech", 41.99], ["breaking", 5.56], ["music", 5.12]], null, [["speech", 33.18], ["music", 30.62], ["hum", 12.19]], null, null, null, [["music", 38.01], ["singing bowl", 13.68], ["burping, eructation", 10.52]], [["music", 70.14], ["speech", 5.51], ["electronic music", 4.94]], [["music", 40.63], ["speech", 34.59], ["grunt", 5.43]], null, [["music", 36.95], ["hum", 20.71], ["speech", 18.5]], [["speech", 36.06], ["music", 13.07], ["whale vocalization", 8.26]], null, null, [["throbbing", 39.02], ["hum", 25.66], ["music", 19.13]]], "duration": [4.47, 29.98, 39.64, 5.44, 1.05, 3.01, 1.19, 6.49, 5.99, 4.31, 1.67, 4.34, 5.72, 9.84, 11.95, 4.87]} \ No newline at end of file diff --git a/annotations_1/Mkkd7taPqEY_filtered.json b/annotations_1/Mkkd7taPqEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd8117e668f41749631b0bebe96e94840178d002 --- /dev/null +++ b/annotations_1/Mkkd7taPqEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.69], [11.0, 11.16], [11.0, 12.02], [12.0, 13.04], [16.0, 19.89], [21.0, 21.91], [24.0, 27.9], [48.0, 49.45], [64.0, 64.76], [69.0, 71.32], [78.0, 79.35], [83.0, 85.35], [87.0, 88.33], [90.0, 91.02], [93.0, 94.63], [95.0, 98.98], [103.0, 104.7], [105.0, 105.27], [107.0, 111.38]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 49.27, 0.0, 89.36, 0.0, 0.0, 93.13, 0.0, 84.25, 0.0, 0.0, 0.0, 46.86, 0.0, 0.0, 48.61], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 20.24], ["chirp tone", 10.79], ["throbbing", 8.3]], null, null, null, null, null, null, null, null, null, null, [["music", 47.44], ["speech", 12.88], ["synthesizer", 4.02]], null, null, [["music", 55.49], ["hum", 6.57], ["singing bowl", 5.98]]], "duration": [0.69, 0.16, 1.02, 1.04, 3.89, 0.91, 3.9, 1.45, 0.76, 2.32, 1.35, 2.35, 1.33, 1.02, 1.63, 3.98, 1.7, 0.27, 4.38]} \ No newline at end of file diff --git a/annotations_1/Mkn0Iji6g9w_filtered.json b/annotations_1/Mkn0Iji6g9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18e96503e69d8e64b152ec445370f584ec3b9ea5 --- /dev/null +++ b/annotations_1/Mkn0Iji6g9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.73], [6.0, 6.81], [14.0, 14.99], [17.0, 18.87], [20.0, 29.57], [30.0, 41.4], [42.0, 44.83], [46.0, 45.71], [47.0, 51.78], [57.0, 62.09], [64.0, 75.32], [78.0, 80.05], [81.0, 128.87]], "keep_status": [false, false, false, false, true, false, true, false, true, true, true, true, false], "silence_prob": [71.14, 0.0, 0.0, 0.0, 39.94, 40.71, 48.35, 0.0, 47.62, 40.86, 48.52, 47.78, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 32.94], ["speech", 14.75], ["sine wave", 4.56]], [["hum", 39.22], ["throbbing", 20.67], ["mains hum", 14.43]], [["music", 32.6], ["didgeridoo", 20.74], ["speech", 11.07]], null, [["hum", 18.83], ["mains hum", 11.61], ["music", 11.56]], [["hum", 22.59], ["music", 15.75], ["mains hum", 8.39]], [["music", 35.18], ["speech", 25.89], ["radio", 6.88]], [["speech", 39.97], ["music", 21.07], ["ambient music", 5.2]], null], "duration": [4.73, 0.81, 0.99, 1.87, 9.57, 11.4, 2.83, -0.29, 4.78, 5.09, 11.32, 2.05, 47.87]} \ No newline at end of file diff --git a/annotations_1/MlUEy_9s0D0_filtered.json b/annotations_1/MlUEy_9s0D0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..573792866c2da8b948959404bb42ca713385f040 --- /dev/null +++ b/annotations_1/MlUEy_9s0D0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.84], [4.0, 6.66], [9.0, 10.13], [16.0, 17.68], [19.0, 19.53], [24.0, 25.51], [28.0, 28.75], [43.0, 51.39], [53.0, 54.57], [58.0, 60.59], [62.0, 62.45], [63.0, 64.74], [66.0, 67.96], [71.0, 71.29], [72.0, 75.24], [81.0, 80.84], [81.0, 83.1], [104.0, 112.29], [113.0, 116.77], [117.0, 117.83], [118.0, 120.5], [123.0, 132.54], [140.0, 140.75], [143.0, 143.46]], "keep_status": [true, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [37.11, 33.91, 0.0, 0.0, 0.0, 0.0, 0.0, 41.32, 0.0, 47.43, 0.0, 0.0, 0.0, 0.0, 38.37, 0.0, 31.16, 59.86, 31.6, 0.0, 33.77, 32.93, 0.0, 0.0], "audiomae_on_audioset": [[["music", 11.59], ["speech", 10.83], ["animal", 6.49]], [["music", 30.23], ["musical instrument", 15.64], ["speech", 10.68]], null, null, null, null, null, [["grunt", 27.04], ["animal", 15.19], ["groan", 6.07]], null, [["music", 24.94], ["speech", 18.15], ["plop", 3.96]], null, null, null, null, [["music", 63.89], ["synthesizer", 8.74], ["musical instrument", 4.84]], null, [["music", 38.56], ["livestock, farm animals, working animals", 9.95], ["cattle, bovinae", 9.27]], null, [["moo", 41.05], ["cattle, bovinae", 37.95], ["whale vocalization", 6.97]], null, [["livestock, farm animals, working animals", 20.32], ["cattle, bovinae", 14.97], ["cowbell", 12.31]], [["boing", 68.42], ["music", 19.46], ["speech", 1.22]], null, null], "duration": [2.84, 2.66, 1.13, 1.68, 0.53, 1.51, 0.75, 8.39, 1.57, 2.59, 0.45, 1.74, 1.96, 0.29, 3.24, -0.16, 2.1, 8.29, 3.77, 0.83, 2.5, 9.54, 0.75, 0.46]} \ No newline at end of file diff --git a/annotations_1/Mm9Y9JEmekY_filtered.json b/annotations_1/Mm9Y9JEmekY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23d686f1729cd5ee5865b4e0b945014bff17b7e3 --- /dev/null +++ b/annotations_1/Mm9Y9JEmekY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.16], [22.0, 22.35], [32.0, 33.54], [36.0, 36.36], [42.0, 43.46], [47.0, 49.1], [52.0, 52.51], [54.0, 54.63], [55.0, 56.78], [59.0, 59.98], [76.0, 76.35], [90.0, 89.99], [92.0, 92.8], [102.0, 102.17], [107.0, 108.62], [109.0, 109.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 0.35, 1.54, 0.36, 1.46, 2.1, 0.51, 0.63, 1.78, 0.98, 0.35, -0.01, 0.8, 0.17, 1.62, 0.31]} \ No newline at end of file diff --git a/annotations_1/MmBx8AMHTxE_filtered.json b/annotations_1/MmBx8AMHTxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f0d069c9289aa1fdd286413d55e4540fa72b9ae --- /dev/null +++ b/annotations_1/MmBx8AMHTxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.79], [6.0, 11.18], [12.0, 12.77], [14.0, 33.64], [38.0, 39.06], [41.0, 63.05], [65.0, 98.64], [102.0, 109.78], [112.0, 113.12], [116.0, 116.67], [118.0, 177.94]], "keep_status": [false, true, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 27.92, 0.0, 28.43, 0.0, 28.09, 0.0, 29.02, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 24.09], ["vehicle", 11.1], ["car", 5.83]], null, [["music", 38.71], ["cacophony", 17.18], ["noise", 11.77]], null, [["music", 47.03], ["mains hum", 23.48], ["hum", 15.49]], null, [["speech", 28.33], ["buzz", 6.93], ["animal", 6.24]], null, null, null], "duration": [0.79, 5.18, 0.77, 19.64, 1.06, 22.05, 33.64, 7.78, 1.12, 0.67, 59.94]} \ No newline at end of file diff --git a/annotations_1/MmKlIGkxGyM_filtered.json b/annotations_1/MmKlIGkxGyM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fa154d9dcc3b555be7607798616db6072251082 --- /dev/null +++ b/annotations_1/MmKlIGkxGyM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.03], [16.0, 16.33], [17.0, 17.24], [21.0, 30.52], [31.0, 32.54], [34.0, 35.53], [36.0, 44.22], [45.0, 45.99], [48.0, 50.85], [52.0, 53.86], [58.0, 59.97], [61.0, 62.34], [63.0, 70.44], [72.0, 73.31], [74.0, 80.79], [85.0, 85.5], [92.0, 97.43], [99.0, 99.72], [101.0, 109.21], [110.0, 121.2], [122.0, 126.94], [129.0, 129.63], [133.0, 134.15], [137.0, 137.49], [140.0, 140.58], [141.0, 144.22], [146.0, 147.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [29.17, 0.0, 0.0, 29.64, 0.0, 0.0, 68.15, 0.0, 99.21, 0.0, 0.0, 0.0, 54.04, 0.0, 38.79, 0.0, 39.66, 0.0, 72.16, 51.88, 61.27, 0.0, 0.0, 0.0, 0.0, 35.87, 0.0], "audiomae_on_audioset": [[["mains hum", 38.7], ["hum", 21.81], ["music", 19.85]], null, null, [["music", 64.92], ["didgeridoo", 6.47], ["musical instrument", 4.89]], null, null, null, null, null, null, null, null, null, null, [["music", 56.32], ["theremin", 19.18], ["musical instrument", 4.86]], null, [["music", 53.34], ["theremin", 14.53], ["foghorn", 4.11]], null, null, null, null, null, null, null, null, [["speech", 30.49], ["music", 12.39], ["dog", 9.02]], null], "duration": [5.03, 0.33, 0.24, 9.52, 1.54, 1.53, 8.22, 0.99, 2.85, 1.86, 1.97, 1.34, 7.44, 1.31, 6.79, 0.5, 5.43, 0.72, 8.21, 11.2, 4.94, 0.63, 1.15, 0.49, 0.58, 3.22, 1.38]} \ No newline at end of file diff --git a/annotations_1/MnLvPe6VSTM_filtered.json b/annotations_1/MnLvPe6VSTM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79f0b4ff14d0ae498a180f265a3762e22a40ec4a --- /dev/null +++ b/annotations_1/MnLvPe6VSTM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 21.57], [27.0, 29.81], [35.0, 35.01], [36.0, 37.74], [46.0, 46.04], [49.0, 49.91], [50.0, 50.48], [52.0, 52.14], [57.0, 57.16], [60.0, 60.66], [65.0, 66.07], [67.0, 96.38], [111.0, 114.74], [121.0, 128.24]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [41.22, 43.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.38, 31.19, 31.28], "audiomae_on_audioset": [[["speech", 51.46], ["radio", 28.25], ["telephone", 3.34]], [["moo", 27.41], ["cattle, bovinae", 23.18], ["speech", 17.73]], null, null, null, null, null, null, null, null, null, [["music", 59.23], ["throbbing", 10.91], ["synthesizer", 8.62]], [["speech", 64.02], ["explosion", 10.04], ["music", 4.15]], [["speech", 9.2], ["boing", 7.71], ["music", 6.17]]], "duration": [4.57, 2.81, 0.01, 1.74, 0.04, 0.91, 0.48, 0.14, 0.16, 0.66, 1.07, 29.38, 3.74, 7.24]} \ No newline at end of file diff --git a/annotations_1/MpaMbLDTxyY_filtered.json b/annotations_1/MpaMbLDTxyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c836018af9a06bab9610f8ba6221b443b16c1620 --- /dev/null +++ b/annotations_1/MpaMbLDTxyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.24], [10.0, 10.98], [14.0, 18.0], [18.0, 20.39], [24.0, 23.97], [27.0, 28.34], [31.0, 31.51], [43.0, 42.9], [47.0, 47.63], [53.0, 53.1], [56.0, 56.44], [57.0, 57.55], [69.0, 69.35], [70.0, 71.81], [74.0, 75.22], [77.0, 77.09], [79.0, 79.03], [81.0, 80.81], [83.0, 92.6], [94.0, 93.88], [98.0, 101.98], [103.0, 103.92], [104.0, 106.15], [107.0, 110.51], [112.0, 114.91]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.9, 41.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.56, 0.0, 62.27, 0.0, 87.0, 62.17, 99.68], "audiomae_on_audioset": [null, null, [["speech", 24.0], ["fly, housefly", 15.8], ["noise", 7.55]], [["speech", 31.33], ["fly, housefly", 21.47], ["insect", 8.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 40.3], ["speech", 34.1], ["mains hum", 7.86]], null, null, null, null, null, null], "duration": [0.24, 0.98, 4.0, 2.39, -0.03, 1.34, 0.51, -0.1, 0.63, 0.1, 0.44, 0.55, 0.35, 1.81, 1.22, 0.09, 0.03, -0.19, 9.6, -0.12, 3.98, 0.92, 2.15, 3.51, 2.91]} \ No newline at end of file diff --git a/annotations_1/MqIJKnUkGLY_filtered.json b/annotations_1/MqIJKnUkGLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..665a3a36e6e193037aaf9c29c85fe767e9c08443 --- /dev/null +++ b/annotations_1/MqIJKnUkGLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.75], [6.0, 6.27], [7.0, 8.16], [10.0, 10.86], [14.0, 15.13], [16.0, 16.56], [20.0, 25.88], [27.0, 27.35], [29.0, 30.15], [36.0, 38.03], [41.0, 41.57], [45.0, 44.85], [47.0, 47.6], [49.0, 49.92], [58.0, 60.25], [61.0, 61.55], [64.0, 64.64], [67.0, 67.15], [69.0, 70.53], [71.0, 72.17], [74.0, 73.97], [75.0, 75.07], [76.0, 82.93], [84.0, 84.59], [90.0, 91.02], [92.0, 91.57], [95.0, 96.03], [96.0, 96.77], [101.0, 101.53], [104.0, 103.92], [109.0, 108.89], [117.0, 117.78], [120.0, 120.26], [122.0, 122.89], [127.0, 127.43], [129.0, 130.65], [131.0, 130.96], [131.0, 131.6], [132.0, 133.46], [134.0, 135.03], [139.0, 140.66], [146.0, 146.69], [153.0, 153.27], [165.0, 165.45], [166.0, 166.13], [167.0, 167.75], [168.0, 169.62], [173.0, 173.8], [178.0, 179.49], [183.0, 183.71], [201.0, 202.1], [218.0, 218.27], [218.0, 218.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 48.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 52.28], ["speech", 18.74], ["musical instrument", 4.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.75, 0.27, 1.16, 0.86, 1.13, 0.56, 5.88, 0.35, 1.15, 2.03, 0.57, -0.15, 0.6, 0.92, 2.25, 0.55, 0.64, 0.15, 1.53, 1.17, -0.03, 0.07, 6.93, 0.59, 1.02, -0.43, 1.03, 0.77, 0.53, -0.08, -0.11, 0.78, 0.26, 0.89, 0.43, 1.65, -0.04, 0.6, 1.46, 1.03, 1.66, 0.69, 0.27, 0.45, 0.13, 0.75, 1.62, 0.8, 1.49, 0.71, 1.1, 0.27, 0.3]} \ No newline at end of file diff --git a/annotations_1/MrWZWfsif3E_filtered.json b/annotations_1/MrWZWfsif3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f82874d474d18e003c49a2f535049e841f4c41e --- /dev/null +++ b/annotations_1/MrWZWfsif3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.55], [26.0, 26.64], [35.0, 35.21], [46.0, 52.02], [53.0, 54.09], [55.0, 55.93], [60.0, 62.63], [66.0, 70.28], [76.0, 76.81], [77.0, 78.38], [80.0, 83.57], [86.0, 87.44], [88.0, 89.4], [91.0, 91.56], [92.0, 92.48], [93.0, 98.91], [104.0, 105.48], [114.0, 114.1], [123.0, 123.77], [124.0, 125.19], [127.0, 130.94]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 60.89, 0.0, 0.0, 31.06, 35.67, 0.0, 0.0, 46.94, 0.0, 0.0, 0.0, 0.0, 99.44, 0.0, 0.0, 0.0, 0.0, 69.47], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 23.86], ["livestock, farm animals, working animals", 9.06], ["moo", 7.39]], [["fart", 17.68], ["throbbing", 16.97], ["whack, thwack", 8.87]], null, null, [["speech", 48.52], ["sidetone", 28.41], ["radio", 9.67]], null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 0.64, 0.21, 6.02, 1.09, 0.93, 2.63, 4.28, 0.81, 1.38, 3.57, 1.44, 1.4, 0.56, 0.48, 5.91, 1.48, 0.1, 0.77, 1.19, 3.94]} \ No newline at end of file diff --git a/annotations_1/MrhV0mA-bWg_filtered.json b/annotations_1/MrhV0mA-bWg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44a1d4472f1f8bdf7601aff32ddc20038884cecd --- /dev/null +++ b/annotations_1/MrhV0mA-bWg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.12], [11.0, 31.23], [31.0, 32.02], [35.0, 42.36], [44.0, 60.93], [64.0, 79.98], [83.0, 90.96], [96.0, 116.73], [123.0, 126.44], [130.0, 129.74], [130.0, 130.87], [132.0, 133.52], [135.0, 135.41], [138.0, 156.63], [159.0, 159.49], [161.0, 162.41], [163.0, 169.43], [174.0, 174.41], [180.0, 200.13]], "keep_status": [false, true, false, false, true, true, false, true, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [35.87, 30.08, 0.0, 29.72, 30.51, 31.12, 29.98, 29.86, 61.18, 0.0, 0.0, 0.0, 0.0, 30.55, 0.0, 0.0, 31.46, 0.0, 49.09], "audiomae_on_audioset": [[["music", 75.5], ["musical instrument", 4.03], ["synthesizer", 2.39]], [["livestock, farm animals, working animals", 27.76], ["animal", 17.11], ["music", 11.94]], null, [["livestock, farm animals, working animals", 38.4], ["cattle, bovinae", 19.87], ["moo", 12.76]], [["music", 32.07], ["speech", 8.94], ["animal", 7.6]], [["music", 21.95], ["whale vocalization", 10.82], ["sheep", 9.09]], [["music", 55.44], ["musical instrument", 11.66], ["drum", 3.02]], [["livestock, farm animals, working animals", 22.45], ["music", 17.82], ["moo", 12.29]], null, null, null, null, null, [["speech", 30.11], ["electric shaver, electric razor", 24.3], ["mains hum", 12.14]], null, null, [["fly, housefly", 23.72], ["music", 22.44], ["insect", 11.23]], null, [["music", 71.91], ["glass", 4.28], ["glockenspiel", 3.23]]], "duration": [3.12, 20.23, 1.02, 7.36, 16.93, 15.98, 7.96, 20.73, 3.44, -0.26, 0.87, 1.52, 0.41, 18.63, 0.49, 1.41, 6.43, 0.41, 20.13]} \ No newline at end of file diff --git a/annotations_1/MriW09XMJeo_filtered.json b/annotations_1/MriW09XMJeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80eb6e90029fe7ed7d7ff71a0b466376c81d05ed --- /dev/null +++ b/annotations_1/MriW09XMJeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.05], [22.0, 25.25], [30.0, 31.48], [37.0, 40.31], [53.0, 68.72], [70.0, 72.89], [95.0, 100.85], [105.0, 109.05], [111.0, 112.43], [119.0, 121.07], [127.0, 128.48], [130.0, 132.8], [137.0, 139.89], [147.0, 147.43], [156.0, 181.36], [185.0, 187.74], [190.0, 198.04], [202.0, 202.32]], "keep_status": [true, true, false, true, true, false, false, true, false, true, false, true, false, false, false, true, true, false], "silence_prob": [34.96, 45.21, 0.0, 36.43, 32.48, 76.2, 30.46, 35.18, 0.0, 35.28, 0.0, 33.53, 87.74, 0.0, 31.41, 38.7, 31.82, 0.0], "audiomae_on_audioset": [[["music", 47.82], ["livestock, farm animals, working animals", 8.07], ["ice cream truck, ice cream van", 5.65]], [["music", 61.19], ["singing", 3.36], ["musical instrument", 1.78]], null, [["music", 34.37], ["theremin", 6.74], ["didgeridoo", 4.28]], [["music", 63.61], ["synthesizer", 3.65], ["mains hum", 2.69]], null, [["boing", 40.71], ["music", 28.05], ["speech", 5.0]], [["speech", 28.04], ["fart", 18.04], ["fly, housefly", 7.06]], null, [["speech", 21.54], ["didgeridoo", 21.37], ["music", 11.4]], null, [["speech", 32.78], ["fly, housefly", 15.38], ["insect", 11.14]], null, null, [["music", 79.26], ["speech", 3.22], ["noise", 2.6]], [["music", 34.9], ["groan", 9.58], ["speech", 8.76]], [["music", 49.47], ["speech", 15.6], ["breaking", 3.37]], null], "duration": [5.05, 3.25, 1.48, 3.31, 15.72, 2.89, 5.85, 4.05, 1.43, 2.07, 1.48, 2.8, 2.89, 0.43, 25.36, 2.74, 8.04, 0.32]} \ No newline at end of file diff --git a/annotations_1/MrrYu07MIbk_filtered.json b/annotations_1/MrrYu07MIbk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7332cc9e637abb6f9f170cf961e8abc88267b30 --- /dev/null +++ b/annotations_1/MrrYu07MIbk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.55], [28.0, 28.07], [28.0, 28.21], [28.0, 28.29], [30.0, 58.95], [62.0, 66.33], [68.0, 68.84], [70.0, 71.07], [75.0, 84.96], [93.0, 94.54], [96.0, 104.67]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.25, 30.45, 0.0, 0.0, 28.61, 0.0, 29.93], "audiomae_on_audioset": [null, null, null, null, [["speech", 40.04], ["music", 19.71], ["fart", 13.72]], [["music", 51.5], ["hum", 4.9], ["sitar", 3.87]], null, null, [["throbbing", 44.77], ["hum", 32.94], ["music", 6.63]], null, [["music", 56.72], ["speech", 22.56], ["animal", 3.26]]], "duration": [0.55, 0.07, 0.21, 0.29, 28.95, 4.33, 0.84, 1.07, 9.96, 1.54, 8.67]} \ No newline at end of file diff --git a/annotations_1/MrtT-vOpAfc_filtered.json b/annotations_1/MrtT-vOpAfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2d93b79e4cd2c8ad2424563f1a5b9897494b38a --- /dev/null +++ b/annotations_1/MrtT-vOpAfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 50.08], [51.0, 86.97], [90.0, 92.52], [98.0, 103.77], [105.0, 105.49], [109.0, 111.94], [113.0, 115.5]], "keep_status": [false, false, true, false, false, true, false], "silence_prob": [77.36, 0.0, 48.19, 38.14, 0.0, 47.82, 51.6], "audiomae_on_audioset": [null, null, [["music", 18.89], ["foghorn", 16.29], ["hum", 14.67]], [["music", 73.47], ["throbbing", 6.31], ["hum", 4.46]], null, [["music", 53.38], ["theremin", 8.13], ["hum", 3.23]], null], "duration": [10.08, 35.97, 2.52, 5.77, 0.49, 2.94, 2.5]} \ No newline at end of file diff --git a/annotations_1/MsKaN_QrVT8_filtered.json b/annotations_1/MsKaN_QrVT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..576f728591c139057c845d25b6186c53c718ad2a --- /dev/null +++ b/annotations_1/MsKaN_QrVT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.26], [8.0, 8.33], [9.0, 9.19], [10.0, 15.97], [16.0, 16.8], [17.0, 17.71], [18.0, 18.74], [19.0, 20.16], [21.0, 22.59], [23.0, 33.45], [35.0, 39.7], [44.0, 46.4], [50.0, 50.03], [51.0, 51.27], [52.0, 59.76], [61.0, 63.64], [65.0, 68.98], [80.0, 81.11], [82.0, 82.78], [87.0, 87.42], [89.0, 90.22], [100.0, 100.41], [104.0, 104.25], [105.0, 105.43], [107.0, 107.59], [108.0, 108.7], [110.0, 111.45], [112.0, 112.68], [114.0, 115.32], [119.0, 119.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 95.64, 94.95, 99.84, 0.0, 0.0, 77.87, 57.32, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 0.33, 0.19, 5.97, 0.8, 0.71, 0.74, 1.16, 1.59, 10.45, 4.7, 2.4, 0.03, 0.27, 7.76, 2.64, 3.98, 1.11, 0.78, 0.42, 1.22, 0.41, 0.25, 0.43, 0.59, 0.7, 1.45, 0.68, 1.32, 0.57]} \ No newline at end of file diff --git a/annotations_1/MtRlOvoq9Ls_filtered.json b/annotations_1/MtRlOvoq9Ls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d00ee54567591c09335747a56a6ebccd57a3059 --- /dev/null +++ b/annotations_1/MtRlOvoq9Ls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.03], [4.0, 4.9], [8.0, 17.44], [18.0, 54.09], [56.0, 55.95], [58.0, 72.35], [73.0, 78.19], [81.0, 82.9], [89.0, 96.21], [98.0, 99.84], [101.0, 102.64], [104.0, 105.85], [107.0, 108.14], [109.0, 109.92], [111.0, 114.29], [115.0, 116.85], [123.0, 123.69]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 29.85, 0.0, 0.0, 31.07, 33.67, 0.0, 32.08, 0.0, 0.0, 0.0, 0.0, 0.0, 32.24, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 19.79], ["hum", 18.22], ["speech", 15.89]], null, null, [["music", 57.59], ["hum", 15.52], ["throbbing", 5.27]], [["music", 78.51], ["speech", 4.45], ["hum", 2.89]], null, [["music", 42.85], ["hum", 10.34], ["speech", 9.59]], null, null, null, null, null, [["music", 29.79], ["hum", 16.98], ["rumble", 8.87]], null, null], "duration": [0.03, 0.9, 9.44, 36.09, -0.05, 14.35, 5.19, 1.9, 7.21, 1.84, 1.64, 1.85, 1.14, 0.92, 3.29, 1.85, 0.69]} \ No newline at end of file diff --git a/annotations_1/MtyfXKbZUus_filtered.json b/annotations_1/MtyfXKbZUus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b90c80ce40a612d178f6f17dbb1c2c9c3399b6d9 --- /dev/null +++ b/annotations_1/MtyfXKbZUus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.45], [7.0, 7.4], [9.0, 12.99], [14.0, 25.46], [26.0, 31.9], [34.0, 34.08], [35.0, 41.22], [43.0, 44.14], [46.0, 48.03], [49.0, 53.82], [55.0, 61.48], [63.0, 73.7], [74.0, 75.59]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 47.35, 58.55, 75.07, 0.0, 57.32, 0.0, 67.25, 65.91, 53.53, 59.86, 0.0], "audiomae_on_audioset": [null, null, [["music", 33.87], ["foghorn", 10.98], ["speech", 8.7]], null, null, null, null, null, null, null, null, null, null], "duration": [1.45, 0.4, 3.99, 11.46, 5.9, 0.08, 6.22, 1.14, 2.03, 4.82, 6.48, 10.7, 1.59]} \ No newline at end of file diff --git a/annotations_1/MuG157PWMWI_filtered.json b/annotations_1/MuG157PWMWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c97275784537a89639f011425201271af5d636b --- /dev/null +++ b/annotations_1/MuG157PWMWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.9], [6.0, 15.9], [17.0, 21.54], [22.0, 29.74], [31.0, 32.04], [37.0, 37.81], [41.0, 41.79], [45.0, 47.04], [53.0, 53.38], [58.0, 60.29], [68.0, 69.04], [89.0, 92.91], [97.0, 103.5], [113.0, 116.36], [121.0, 120.93], [123.0, 123.8], [124.0, 124.77], [128.0, 129.2], [130.0, 131.26], [146.0, 146.5], [148.0, 148.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.52, 91.98, 48.23, 0.0, 0.0, 0.0, 81.53, 0.0, 94.37, 0.0, 32.78, 32.54, 37.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 61.61], ["theremin", 17.37], ["ambient music", 3.78]], null, null, null, null, null, null, null, [["cattle, bovinae", 51.36], ["moo", 42.97], ["livestock, farm animals, working animals", 5.54]], [["music", 32.39], ["speech", 14.29], ["fly, housefly", 8.3]], [["music", 70.0], ["musical instrument", 7.59], ["throbbing", 1.84]], null, null, null, null, null, null, null], "duration": [1.9, 9.9, 4.54, 7.74, 1.04, 0.81, 0.79, 2.04, 0.38, 2.29, 1.04, 3.91, 6.5, 3.36, -0.07, 0.8, 0.77, 1.2, 1.26, 0.5, 0.44]} \ No newline at end of file diff --git a/annotations_1/MuIkmspTRo0_filtered.json b/annotations_1/MuIkmspTRo0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d9b8e85734a06a6a4b1819dc87fb5e1c00fa0da --- /dev/null +++ b/annotations_1/MuIkmspTRo0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.95], [14.0, 25.25], [27.0, 34.25], [34.0, 81.6], [83.0, 120.7], [122.0, 139.73], [140.0, 156.24], [158.0, 175.86], [179.0, 193.18], [194.0, 193.94], [194.0, 194.0], [194.0, 194.49], [197.0, 207.0]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.47, 39.17, 0.0, 0.0, 30.55, 30.42, 30.57, 31.05, 0.0, 0.0, 0.0, 30.51], "audiomae_on_audioset": [null, [["music", 23.41], ["livestock, farm animals, working animals", 15.8], ["moo", 13.66]], [["music", 57.82], ["musical instrument", 9.8], ["guitar", 8.43]], null, null, [["music", 84.02], ["quack", 5.6], ["funny music", 2.25]], [["music", 84.54], ["musical instrument", 1.32], ["swing music", 1.3]], [["music", 70.39], ["trombone", 3.25], ["musical instrument", 2.76]], [["music", 61.41], ["clarinet", 6.9], ["musical instrument", 5.45]], null, null, null, [["music", 60.24], ["theremin", 9.37], ["trombone", 6.36]]], "duration": [0.95, 11.25, 7.25, 47.6, 37.7, 17.73, 16.24, 17.86, 14.18, -0.06, 0.0, 0.49, 10.0]} \ No newline at end of file diff --git a/annotations_1/MuW72eVCQno_filtered.json b/annotations_1/MuW72eVCQno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9cf9ad6c29a78f0c9510ea1bdfcf58a2a41153d5 --- /dev/null +++ b/annotations_1/MuW72eVCQno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.82], [16.0, 17.29], [18.0, 24.24], [26.0, 28.38], [30.0, 31.95], [36.0, 36.34], [38.0, 43.83], [45.0, 47.26], [59.0, 61.1], [62.0, 90.54], [95.0, 95.84], [99.0, 112.02], [115.0, 137.78], [138.0, 148.29], [150.0, 169.7], [171.0, 171.69], [180.0, 181.41], [184.0, 184.91], [189.0, 190.8]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.84, 28.71, 0.0, 0.0, 34.99, 59.33, 49.82, 31.28, 0.0, 51.39, 29.74, 40.24, 36.69, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.58], ["throbbing", 23.05], ["hum", 22.75]], [["music", 47.49], ["hum", 15.43], ["mains hum", 7.21]], null, null, [["hum", 39.59], ["throbbing", 17.72], ["mains hum", 9.94]], null, [["music", 53.54], ["speech", 26.17], ["quack", 2.97]], [["music", 33.76], ["hum", 23.25], ["speech", 8.15]], null, null, [["whack, thwack", 13.64], ["thunk", 12.92], ["music", 11.01]], [["throbbing", 24.19], ["sidetone", 16.86], ["speech", 14.38]], [["cattle, bovinae", 32.27], ["livestock, farm animals, working animals", 21.78], ["moo", 16.11]], null, null, null, null], "duration": [1.82, 1.29, 6.24, 2.38, 1.95, 0.34, 5.83, 2.26, 2.1, 28.54, 0.84, 13.02, 22.78, 10.29, 19.7, 0.69, 1.41, 0.91, 1.8]} \ No newline at end of file diff --git a/annotations_1/MuYLaaVqJf0_filtered.json b/annotations_1/MuYLaaVqJf0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdd56c427497cdd7d28f5a428946621d6c8510d4 --- /dev/null +++ b/annotations_1/MuYLaaVqJf0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.27], [16.0, 19.14], [22.0, 32.98], [39.0, 39.01], [43.0, 43.82], [48.0, 48.0], [49.0, 49.15], [57.0, 58.35], [59.0, 59.58], [82.0, 82.04]], "keep_status": [false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.64, 45.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 39.21], ["theremin", 11.35], ["synthesizer", 5.54]], [["music", 75.38], ["whale vocalization", 4.98], ["speech", 2.92]], null, null, null, null, null, null, null], "duration": [0.27, 3.14, 10.98, 0.01, 0.82, 0.0, 0.15, 1.35, 0.58, 0.04]} \ No newline at end of file diff --git a/annotations_1/MucDLDFYNDE_filtered.json b/annotations_1/MucDLDFYNDE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6a9ca99eeb7c61da0c907ae34e346c3b0e4b833 --- /dev/null +++ b/annotations_1/MucDLDFYNDE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.18], [19.0, 18.76], [30.0, 30.05], [42.0, 47.01], [49.0, 56.27], [61.0, 61.38], [62.0, 66.92], [68.0, 70.24], [71.0, 71.59], [102.0, 102.34], [109.0, 109.34], [111.0, 111.89], [114.0, 115.33], [117.0, 118.3], [123.0, 123.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.67, 64.41, 0.0, 55.6, 76.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 78.56], ["speech", 6.88], ["boing", 3.99]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, -0.24, 0.05, 5.01, 7.27, 0.38, 4.92, 2.24, 0.59, 0.34, 0.34, 0.89, 1.33, 1.3, 0.62]} \ No newline at end of file diff --git a/annotations_1/MvIqR1cMbv0_filtered.json b/annotations_1/MvIqR1cMbv0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..164d9d2008557891c1c3a2f4b1a56dc8a4ff8962 --- /dev/null +++ b/annotations_1/MvIqR1cMbv0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 20.68], [40.0, 40.81], [49.0, 49.33], [69.0, 69.58], [88.0, 90.17], [119.0, 119.96], [127.0, 127.03]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [35.77, 0.0, 0.0, 0.0, 28.59, 0.0, 0.0], "audiomae_on_audioset": [[["music", 65.79], ["hum", 8.79], ["synthesizer", 3.51]], null, null, null, [["music", 54.75], ["a capella", 4.1], ["outside, urban or manmade", 3.76]], null, null], "duration": [18.68, 0.81, 0.33, 0.58, 2.17, 0.96, 0.03]} \ No newline at end of file diff --git a/annotations_1/MvRfyxGjA90_filtered.json b/annotations_1/MvRfyxGjA90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..feff948729f594208edaab70ce38c8c450fe001c --- /dev/null +++ b/annotations_1/MvRfyxGjA90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [2.0, 4.97], [9.0, 9.29], [11.0, 12.19], [15.0, 15.65], [23.0, 24.56], [26.0, 27.4], [29.0, 29.13], [41.0, 42.06], [44.0, 44.63], [46.0, 46.52], [47.0, 49.84], [52.0, 52.62], [57.0, 58.08], [59.0, 60.71], [66.0, 66.12], [66.0, 66.58], [73.0, 73.82], [77.0, 78.58], [79.0, 78.66], [79.0, 78.7], [79.0, 79.0], [79.0, 79.08], [79.0, 79.12], [79.0, 80.5], [100.0, 100.2], [107.0, 107.67], [111.0, 111.38], [112.0, 112.9], [114.0, 120.85], [122.0, 125.58], [130.0, 130.87], [132.0, 133.07], [139.0, 139.01], [143.0, 143.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 97.22, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["grunt", 16.0], ["cattle, bovinae", 8.63], ["moo", 8.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 2.97, 0.29, 1.19, 0.65, 1.56, 1.4, 0.13, 1.06, 0.63, 0.52, 2.84, 0.62, 1.08, 1.71, 0.12, 0.58, 0.82, 1.58, -0.34, -0.3, 0.0, 0.08, 0.12, 1.5, 0.2, 0.67, 0.38, 0.9, 6.85, 3.58, 0.87, 1.07, 0.01, 0.46]} \ No newline at end of file diff --git a/annotations_1/MvkN3003iU4_filtered.json b/annotations_1/MvkN3003iU4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4bf50d15609d9aa5b47cf1b9a7cd58e8d0d40fb --- /dev/null +++ b/annotations_1/MvkN3003iU4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 28.09], [31.0, 45.4], [51.0, 54.75], [56.0, 71.68], [73.0, 73.97], [75.0, 76.25], [77.0, 78.65], [80.0, 80.72]], "keep_status": [false, true, true, false, false, false, false, false], "silence_prob": [31.2, 29.72, 30.62, 31.51, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 83.99], ["thunk", 3.91], ["thump, thud", 1.66]], [["speech", 39.73], ["music", 18.82], ["machine gun", 3.73]], [["music", 37.05], ["speech", 26.47], ["cattle, bovinae", 3.2]], [["music", 53.95], ["throbbing", 21.02], ["hum", 5.8]], null, null, null, null], "duration": [17.09, 14.4, 3.75, 15.68, 0.97, 1.25, 1.65, 0.72]} \ No newline at end of file diff --git a/annotations_1/MwcXLL103vE_filtered.json b/annotations_1/MwcXLL103vE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9659e5a5eebf218c73b984ba808e2c1ffd5e7e31 --- /dev/null +++ b/annotations_1/MwcXLL103vE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 40.59], [41.0, 43.36], [44.0, 44.52], [45.0, 45.79], [46.0, 63.76], [64.0, 65.45], [67.0, 73.47], [73.0, 74.26], [75.0, 114.2], [118.0, 118.2], [120.0, 120.83], [122.0, 137.37], [139.0, 143.23], [146.0, 152.69], [154.0, 154.65]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [32.36, 30.35, 0.0, 0.0, 30.0, 0.0, 31.42, 0.0, 0.0, 0.0, 0.0, 29.61, 34.39, 28.8, 0.0], "audiomae_on_audioset": [[["music", 73.25], ["theremin", 5.66], ["whale vocalization", 3.44]], [["fly, housefly", 13.27], ["didgeridoo", 8.89], ["frog", 7.34]], null, null, [["music", 36.33], ["hum", 20.88], ["throbbing", 14.77]], null, [["speech", 20.08], ["music", 19.8], ["sidetone", 13.13]], null, null, null, null, [["buzz", 44.07], ["music", 37.17], ["groan", 1.99]], [["music", 78.48], ["theremin", 5.2], ["scary music", 3.29]], [["music", 32.09], ["speech", 21.14], ["theremin", 8.56]], null], "duration": [17.59, 2.36, 0.52, 0.79, 17.76, 1.45, 6.47, 1.26, 39.2, 0.2, 0.83, 15.37, 4.23, 6.69, 0.65]} \ No newline at end of file diff --git a/annotations_1/MwjIdhPU43A_filtered.json b/annotations_1/MwjIdhPU43A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af764f0c008479c385d8c588ee4adc097ef64d42 --- /dev/null +++ b/annotations_1/MwjIdhPU43A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.85], [18.0, 19.63], [24.0, 24.98], [27.0, 27.43], [30.0, 29.56], [32.0, 32.95], [35.0, 35.8], [37.0, 38.58], [42.0, 43.9], [46.0, 56.03], [62.0, 63.19], [64.0, 65.45], [68.0, 68.37], [71.0, 70.77], [71.0, 71.88], [72.0, 73.16], [75.0, 74.97], [81.0, 81.01], [87.0, 88.94], [93.0, 96.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.85, 1.63, 0.98, 0.43, -0.44, 0.95, 0.8, 1.58, 1.9, 10.03, 1.19, 1.45, 0.37, -0.23, 0.88, 1.16, -0.03, 0.01, 1.94, 3.96]} \ No newline at end of file diff --git a/annotations_1/MxDtKTClKGI_filtered.json b/annotations_1/MxDtKTClKGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f99431d3dfc1b0dc615b2818f3c31cda4df91c76 --- /dev/null +++ b/annotations_1/MxDtKTClKGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.37], [4.0, 4.82], [7.0, 13.51], [14.0, 15.03], [18.0, 19.23], [22.0, 22.0], [25.0, 25.37], [30.0, 32.81], [37.0, 37.47], [39.0, 39.43], [46.0, 47.49], [49.0, 50.48], [52.0, 52.03], [53.0, 59.1], [77.0, 78.43], [80.0, 80.84], [91.0, 95.39], [96.0, 96.5], [98.0, 99.13], [100.0, 101.14], [102.0, 103.33], [105.0, 105.58], [111.0, 111.97], [112.0, 113.86], [115.0, 115.18], [117.0, 116.99], [118.0, 118.76], [119.0, 119.8], [120.0, 120.5], [123.0, 123.35], [124.0, 123.94], [125.0, 125.68], [126.0, 126.69], [130.0, 130.17], [130.0, 134.45], [137.0, 140.56], [144.0, 144.69]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [34.55, 0.0, 37.31, 0.0, 0.0, 0.0, 0.0, 41.54, 0.0, 0.0, 0.0, 0.0, 0.0, 31.42, 0.0, 0.0, 37.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.85, 39.58, 0.0], "audiomae_on_audioset": [[["speech", 59.72], ["radio", 7.18], ["shuffle", 5.66]], null, [["beatboxing", 48.83], ["music", 13.17], ["speech", 5.39]], null, null, null, null, [["noise", 22.24], ["radio", 12.52], ["music", 8.35]], null, null, null, null, null, [["cattle, bovinae", 25.67], ["moo", 16.61], ["groan", 10.43]], null, null, [["speech", 67.2], ["sidetone", 4.38], ["stomach rumble", 3.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 19.41], ["hum", 18.71], ["music", 16.28]], [["didgeridoo", 50.59], ["music", 12.02], ["foghorn", 3.53]], null], "duration": [2.37, 0.82, 6.51, 1.03, 1.23, 0.0, 0.37, 2.81, 0.47, 0.43, 1.49, 1.48, 0.03, 6.1, 1.43, 0.84, 4.39, 0.5, 1.13, 1.14, 1.33, 0.58, 0.97, 1.86, 0.18, -0.01, 0.76, 0.8, 0.5, 0.35, -0.06, 0.68, 0.69, 0.17, 4.45, 3.56, 0.69]} \ No newline at end of file diff --git a/annotations_1/MxMpRqQQ6o4_filtered.json b/annotations_1/MxMpRqQQ6o4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..980113d6f5d5ed00c180692ccb215d3804447225 --- /dev/null +++ b/annotations_1/MxMpRqQQ6o4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.06], [10.0, 11.82], [13.0, 12.72], [14.0, 14.62], [21.0, 22.92], [25.0, 25.52], [26.0, 27.82], [29.0, 29.89], [32.0, 33.72], [35.0, 36.44], [37.0, 36.76], [37.0, 36.8], [37.0, 37.03], [37.0, 37.35], [38.0, 38.92], [39.0, 40.19], [41.0, 41.3], [43.0, 44.49], [50.0, 52.27], [56.0, 61.64], [70.0, 69.72], [72.0, 79.37], [84.0, 85.11], [86.0, 86.46], [88.0, 93.19], [94.0, 95.03], [97.0, 98.71], [106.0, 107.3], [110.0, 110.98], [112.0, 112.62], [113.0, 113.27], [114.0, 114.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [56.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 94.37, 0.0, 54.36, 0.0, 0.0, 33.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 13.83], ["thunk", 12.92], ["synthesizer", 11.24]], null, null, null, null, null, null, null], "duration": [2.06, 1.82, -0.28, 0.62, 1.92, 0.52, 1.82, 0.89, 1.72, 1.44, -0.24, -0.2, 0.03, 0.35, 0.92, 1.19, 0.3, 1.49, 2.27, 5.64, -0.28, 7.37, 1.11, 0.46, 5.19, 1.03, 1.71, 1.3, 0.98, 0.62, 0.27, 0.71]} \ No newline at end of file diff --git a/annotations_1/My8kfz_Ddqg_filtered.json b/annotations_1/My8kfz_Ddqg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0941ed9412e237b73d8e558647fd1fe1a8b0eafd --- /dev/null +++ b/annotations_1/My8kfz_Ddqg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.07], [6.0, 9.58], [10.0, 11.33], [13.0, 16.78], [21.0, 21.37], [24.0, 26.11], [27.0, 27.38], [30.0, 32.78], [34.0, 37.05], [38.0, 42.63], [44.0, 46.79], [48.0, 49.96], [50.0, 51.68], [53.0, 55.24], [59.0, 68.61], [104.0, 105.22], [110.0, 110.37], [113.0, 113.73], [115.0, 115.96]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 34.0, 0.0, 42.74, 0.0, 30.62, 0.0, 43.71, 46.26, 36.36, 40.95, 0.0, 0.0, 36.26, 28.62, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 47.22], ["didgeridoo", 30.6], ["musical instrument", 2.6]], null, [["music", 18.61], ["gong", 14.04], ["didgeridoo", 9.03]], null, [["music", 62.44], ["speech", 10.74], ["musical instrument", 6.07]], null, [["music", 52.56], ["didgeridoo", 10.04], ["synthesizer", 5.87]], [["music", 67.14], ["synthesizer", 3.9], ["didgeridoo", 3.89]], [["music", 49.2], ["speech", 15.2], ["didgeridoo", 14.75]], [["music", 70.58], ["synthesizer", 5.04], ["musical instrument", 4.62]], null, null, [["music", 37.07], ["ambient music", 11.29], ["hum", 8.41]], [["music", 44.78], ["hum", 23.27], ["throbbing", 17.41]], null, null, null, null], "duration": [0.07, 3.58, 1.33, 3.78, 0.37, 2.11, 0.38, 2.78, 3.05, 4.63, 2.79, 1.96, 1.68, 2.24, 9.61, 1.22, 0.37, 0.73, 0.96]} \ No newline at end of file diff --git a/annotations_1/MzzWzX-HGbA_filtered.json b/annotations_1/MzzWzX-HGbA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7291daea40b8bc08edcf72864f6013f3bddcba36 --- /dev/null +++ b/annotations_1/MzzWzX-HGbA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.94], [5.0, 5.34], [17.0, 16.97], [27.0, 27.23], [30.0, 37.45], [38.0, 39.93], [44.0, 44.44], [45.0, 46.21], [47.0, 49.82], [52.0, 53.72], [57.0, 58.19], [59.0, 60.78], [63.0, 66.72], [69.0, 69.67], [73.0, 73.9], [74.0, 74.85], [76.0, 76.91], [78.0, 90.96], [91.0, 94.09], [95.0, 100.13], [101.0, 109.71], [112.0, 115.01], [116.0, 116.83], [127.0, 132.36], [134.0, 134.27], [135.0, 136.0], [137.0, 139.45], [145.0, 158.35], [159.0, 159.36], [160.0, 162.75], [164.0, 165.86]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, true, false, true, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.79, 0.0, 0.0, 0.0, 49.31, 0.0, 0.0, 0.0, 86.45, 0.0, 0.0, 0.0, 0.0, 33.63, 33.67, 37.37, 45.02, 46.02, 0.0, 29.53, 0.0, 0.0, 30.14, 30.3, 0.0, 46.94, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 34.6], ["music", 17.24], ["sidetone", 16.17]], null, null, null, [["music", 37.23], ["didgeridoo", 12.3], ["theremin", 8.7]], null, null, null, null, null, null, null, null, [["hum", 33.89], ["music", 22.73], ["mains hum", 14.55]], [["hum", 44.28], ["mains hum", 25.4], ["music", 14.02]], [["music", 32.77], ["hum", 20.98], ["throbbing", 10.02]], [["music", 30.97], ["hum", 10.92], ["buzz", 9.76]], [["sine wave", 13.67], ["sonar", 13.66], ["hum", 12.24]], null, [["rumble", 22.04], ["explosion", 9.27], ["speech", 7.18]], null, null, [["speech", 18.41], ["cattle, bovinae", 15.41], ["moo", 14.53]], [["music", 46.86], ["buzz", 10.5], ["hum", 5.52]], null, [["sidetone", 26.86], ["speech", 25.84], ["whale vocalization", 4.38]], null], "duration": [-0.06, 0.34, -0.03, 0.23, 7.45, 1.93, 0.44, 1.21, 2.82, 1.72, 1.19, 1.78, 3.72, 0.67, 0.9, 0.85, 0.91, 12.96, 3.09, 5.13, 8.71, 3.01, 0.83, 5.36, 0.27, 1.0, 2.45, 13.35, 0.36, 2.75, 1.86]} \ No newline at end of file diff --git a/annotations_1/N-ZFty2-G7I_filtered.json b/annotations_1/N-ZFty2-G7I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6928d82ab9edc291f17e9145483dd9affe574e18 --- /dev/null +++ b/annotations_1/N-ZFty2-G7I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.26], [5.0, 9.68], [11.0, 15.7], [17.0, 23.92], [25.0, 28.44], [29.0, 35.8], [37.0, 39.55], [41.0, 49.5], [52.0, 62.45], [62.0, 62.63], [63.0, 70.29], [70.0, 72.35], [72.0, 84.6], [85.0, 84.81], [86.0, 95.22], [98.0, 101.61], [102.0, 103.18], [104.0, 104.95], [106.0, 107.25], [110.0, 121.88], [124.0, 125.32]], "keep_status": [false, false, false, false, false, false, false, true, true, false, true, true, true, false, true, true, false, false, false, true, false], "silence_prob": [0.0, 94.52, 91.3, 58.47, 58.55, 53.84, 52.62, 31.76, 33.68, 0.0, 30.46, 31.24, 32.2, 0.0, 32.77, 34.68, 0.0, 0.0, 0.0, 33.42, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["cattle, bovinae", 29.94], ["moo", 20.06], ["livestock, farm animals, working animals", 19.97]], [["music", 47.36], ["speech", 7.96], ["hum", 5.41]], null, [["groan", 27.74], ["grunt", 23.64], ["music", 6.04]], [["speech", 26.13], ["music", 16.08], ["didgeridoo", 9.76]], [["animal", 11.19], ["music", 7.01], ["buzz", 6.48]], null, [["whale vocalization", 19.63], ["livestock, farm animals, working animals", 12.79], ["moo", 10.54]], [["whale vocalization", 55.34], ["music", 6.59], ["vehicle", 5.59]], null, null, null, [["hum", 19.26], ["music", 12.9], ["speech", 12.2]], null], "duration": [1.26, 4.68, 4.7, 6.92, 3.44, 6.8, 2.55, 8.5, 10.45, 0.63, 7.29, 2.35, 12.6, -0.19, 9.22, 3.61, 1.18, 0.95, 1.25, 11.88, 1.32]} \ No newline at end of file diff --git a/annotations_1/N-v-x6qmtcc_filtered.json b/annotations_1/N-v-x6qmtcc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3360d314dbedd485f562fc3e4ea040514aca467 --- /dev/null +++ b/annotations_1/N-v-x6qmtcc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 30.0], [32.0, 33.59], [35.0, 45.59], [47.0, 60.62], [63.0, 70.17], [74.0, 76.05], [76.0, 77.82], [79.0, 86.83], [91.0, 95.77], [96.0, 97.31], [98.0, 98.9], [100.0, 100.06], [101.0, 107.45], [112.0, 117.91], [121.0, 121.76], [122.0, 122.17], [124.0, 125.78], [128.0, 132.12]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, true, true, false, false, false, true], "silence_prob": [32.95, 0.0, 35.39, 47.01, 42.06, 43.33, 0.0, 42.48, 38.68, 0.0, 0.0, 0.0, 32.51, 33.17, 0.0, 0.0, 0.0, 35.17], "audiomae_on_audioset": [[["music", 53.28], ["speech", 19.71], ["thunk", 4.43]], null, [["music", 44.31], ["speech", 39.75], ["fart", 4.02]], [["music", 66.7], ["singing bowl", 3.36], ["theremin", 2.91]], [["music", 63.51], ["theremin", 14.77], ["musical instrument", 4.82]], [["music", 42.75], ["didgeridoo", 20.28], ["singing bowl", 6.71]], null, [["music", 28.68], ["singing bowl", 28.35], ["gong", 6.12]], [["livestock, farm animals, working animals", 44.57], ["moo", 26.11], ["cattle, bovinae", 25.59]], null, null, null, [["music", 23.44], ["speech", 10.57], ["insect", 7.89]], [["speech", 24.69], ["groan", 13.83], ["music", 13.08]], null, null, null, [["speech", 46.08], ["hum", 5.49], ["buzz", 3.66]]], "duration": [21.0, 1.59, 10.59, 13.62, 7.17, 2.05, 1.82, 7.83, 4.77, 1.31, 0.9, 0.06, 6.45, 5.91, 0.76, 0.17, 1.78, 4.12]} \ No newline at end of file diff --git a/annotations_1/N0gOaE92ogg_filtered.json b/annotations_1/N0gOaE92ogg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52a71fc1ce443f4a8ae21026741c41081d77e7ec --- /dev/null +++ b/annotations_1/N0gOaE92ogg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [3.0, 4.31], [5.0, 6.15], [8.0, 8.6], [10.0, 13.05], [15.0, 17.88], [19.0, 20.16], [24.0, 26.47], [33.0, 34.2], [34.0, 34.37], [34.0, 35.77], [43.0, 44.1], [45.0, 47.31], [71.0, 101.6], [102.0, 101.82], [102.0, 101.9], [114.0, 114.37], [116.0, 117.0], [118.0, 118.03], [123.0, 132.66], [133.0, 134.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.1, 96.29, 0.0, 89.9, 0.0, 0.0, 0.0, 0.0, 46.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 82.88], ["inside, small room", 2.81], ["sidetone", 2.26]], null, null, null, null, null, null, null, null], "duration": [0.5, 1.31, 1.15, 0.6, 3.05, 2.88, 1.16, 2.47, 1.2, 0.37, 1.77, 1.1, 2.31, 30.6, -0.18, -0.1, 0.37, 1.0, 0.03, 9.66, 1.55]} \ No newline at end of file diff --git a/annotations_1/N26K5UeOTPE_filtered.json b/annotations_1/N26K5UeOTPE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c7dcc3f2145966ffb62e35b0b14554159c62e37 --- /dev/null +++ b/annotations_1/N26K5UeOTPE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 20.65], [21.0, 43.65], [77.0, 77.25], [83.0, 83.39], [85.0, 86.37], [91.0, 92.7], [93.0, 100.43], [101.0, 110.67], [115.0, 116.09], [119.0, 119.48], [123.0, 123.45]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [32.22, 30.13, 0.0, 0.0, 0.0, 0.0, 30.38, 30.35, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 39.51], ["moo", 28.52], ["speech", 15.01]], [["cattle, bovinae", 35.22], ["moo", 26.84], ["livestock, farm animals, working animals", 23.78]], null, null, null, null, [["moo", 36.07], ["cattle, bovinae", 33.88], ["livestock, farm animals, working animals", 17.08]], [["speech", 36.34], ["livestock, farm animals, working animals", 10.7], ["sheep", 7.45]], null, null, null], "duration": [3.65, 22.65, 0.25, 0.39, 1.37, 1.7, 7.43, 9.67, 1.09, 0.48, 0.45]} \ No newline at end of file diff --git a/annotations_1/N27ZYQKRYnQ_filtered.json b/annotations_1/N27ZYQKRYnQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa41e1f1b3f61cbe29482097ee6c4ce455c31fff --- /dev/null +++ b/annotations_1/N27ZYQKRYnQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 20.31], [25.0, 25.03], [26.0, 28.38], [30.0, 31.01], [35.0, 61.43], [62.0, 77.25], [79.0, 93.6], [98.0, 98.1], [110.0, 111.43], [113.0, 117.12], [118.0, 118.99], [120.0, 120.26], [126.0, 126.08], [130.0, 130.71]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [29.53, 0.0, 29.52, 0.0, 29.47, 29.69, 29.88, 0.0, 0.0, 33.65, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 62.71], ["throbbing", 13.45], ["hum", 8.65]], null, [["music", 49.1], ["speech", 23.49], ["throbbing", 4.65]], null, [["music", 55.33], ["speech", 13.39], ["throbbing", 6.13]], [["music", 70.08], ["throbbing", 13.63], ["hum", 3.34]], [["music", 79.46], ["throbbing", 4.53], ["hum", 3.27]], null, null, [["music", 37.66], ["didgeridoo", 11.06], ["speech", 4.65]], null, null, null, null], "duration": [19.31, 0.03, 2.38, 1.01, 26.43, 15.25, 14.6, 0.1, 1.43, 4.12, 0.99, 0.26, 0.08, 0.71]} \ No newline at end of file diff --git a/annotations_1/N2s_Iij3Xfk_filtered.json b/annotations_1/N2s_Iij3Xfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..870aad1114da9843a3350891f94cce498427be02 --- /dev/null +++ b/annotations_1/N2s_Iij3Xfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.59], [8.0, 9.27], [10.0, 11.85], [12.0, 23.75], [26.0, 26.54], [27.0, 30.94], [32.0, 59.32], [60.0, 83.13], [84.0, 83.86], [84.0, 84.2], [85.0, 97.87], [99.0, 120.07]], "keep_status": [false, false, false, false, false, true, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 29.27, 0.0, 28.85, 28.38, 28.36, 0.0, 0.0, 28.61, 29.18], "audiomae_on_audioset": [null, null, null, [["music", 45.18], ["speech", 37.83], ["effects unit", 2.99]], null, [["cattle, bovinae", 21.03], ["moo", 15.1], ["livestock, farm animals, working animals", 11.74]], [["chainsaw", 12.97], ["speech", 11.43], ["livestock, farm animals, working animals", 8.11]], [["music", 32.4], ["groan", 9.63], ["livestock, farm animals, working animals", 7.91]], null, null, [["music", 56.05], ["musical instrument", 6.16], ["plucked string instrument", 4.26]], [["speech", 45.28], ["music", 22.67], ["civil defense siren", 4.03]]], "duration": [1.59, 1.27, 1.85, 11.75, 0.54, 3.94, 27.32, 23.13, -0.14, 0.2, 12.87, 21.07]} \ No newline at end of file diff --git a/annotations_1/N35FsMxEmSc_filtered.json b/annotations_1/N35FsMxEmSc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ae88ebc5b6e6e9d34726ad3b42908a9574d0c13 --- /dev/null +++ b/annotations_1/N35FsMxEmSc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.71], [20.0, 20.93], [22.0, 24.78], [25.0, 24.81], [29.0, 33.18], [34.0, 34.67], [36.0, 37.3], [38.0, 41.23], [42.0, 42.79], [46.0, 46.95], [48.0, 48.57], [49.0, 49.74], [63.0, 63.07], [65.0, 65.08], [66.0, 66.34], [69.0, 72.5], [74.0, 76.89], [78.0, 79.15], [81.0, 81.16], [84.0, 85.23], [92.0, 92.25], [93.0, 93.34], [94.0, 96.69], [98.0, 99.18], [99.0, 112.53], [113.0, 112.62], [113.0, 113.49], [114.0, 113.53], [114.0, 113.61], [114.0, 121.81], [125.0, 125.0], [125.0, 125.05], [129.0, 147.41], [152.0, 153.98], [155.0, 157.06], [168.0, 170.29], [172.0, 173.35], [175.0, 176.67], [178.0, 181.47], [183.0, 185.46], [186.0, 188.11], [189.0, 191.67], [193.0, 194.83]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 41.85, 0.0, 47.39, 0.0, 0.0, 30.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.69, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 30.6, 0.0, 30.83, 0.0, 0.0, 0.0, 0.0, 29.78, 0.0, 0.0, 33.6, 0.0, 63.21, 47.39, 0.0, 0.0, 44.57, 59.07, 56.48, 91.81, 0.0], "audiomae_on_audioset": [null, null, [["didgeridoo", 32.03], ["music", 25.7], ["speech", 24.44]], null, [["music", 52.03], ["didgeridoo", 14.95], ["musical instrument", 3.68]], null, null, [["throbbing", 28.37], ["music", 26.3], ["hum", 7.99]], null, null, null, null, null, null, null, [["breaking", 48.52], ["music", 19.35], ["glass", 7.05]], null, null, null, null, null, null, [["thunk", 34.86], ["music", 8.98], ["whack, thwack", 7.78]], null, [["throbbing", 24.7], ["music", 23.82], ["hum", 23.7]], null, null, null, null, [["music", 44.29], ["hum", 17.48], ["mains hum", 13.55]], null, null, [["music", 40.9], ["hum", 18.25], ["throbbing", 16.37]], null, null, [["throbbing", 37.19], ["hum", 35.22], ["heart sounds, heartbeat", 5.76]], null, null, [["music", 28.7], ["hum", 12.78], ["didgeridoo", 8.71]], null, null, null, null], "duration": [0.71, 0.93, 2.78, -0.19, 4.18, 0.67, 1.3, 3.23, 0.79, 0.95, 0.57, 0.74, 0.07, 0.08, 0.34, 3.5, 2.89, 1.15, 0.16, 1.23, 0.25, 0.34, 2.69, 1.18, 13.53, -0.38, 0.49, -0.47, -0.39, 7.81, 0.0, 0.05, 18.41, 1.98, 2.06, 2.29, 1.35, 1.67, 3.47, 2.46, 2.11, 2.67, 1.83]} \ No newline at end of file diff --git a/annotations_1/N45Gbn2AtWk_filtered.json b/annotations_1/N45Gbn2AtWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8e98fff07894922a533aea01fbc5e8d4c60cb9c --- /dev/null +++ b/annotations_1/N45Gbn2AtWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.8], [22.0, 31.31], [34.0, 35.21], [36.0, 39.97], [43.0, 43.43], [45.0, 45.23], [50.0, 52.2], [53.0, 53.82], [57.0, 59.16], [60.0, 64.77], [68.0, 69.35]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [54.7, 37.85, 0.0, 90.6, 0.0, 0.0, 56.93, 0.0, 90.08, 57.72, 0.0], "audiomae_on_audioset": [null, [["music", 36.14], ["animal", 7.58], ["sheep", 6.38]], null, null, null, null, null, null, null, null, null], "duration": [3.8, 9.31, 1.21, 3.97, 0.43, 0.23, 2.2, 0.82, 2.16, 4.77, 1.35]} \ No newline at end of file diff --git a/annotations_1/N6SPrarFcBA_filtered.json b/annotations_1/N6SPrarFcBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db031ec3ffaa041a06b891f2824cc2ee99fddf52 --- /dev/null +++ b/annotations_1/N6SPrarFcBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.34], [20.0, 20.58], [24.0, 24.48], [61.0, 61.37], [72.0, 74.88], [76.0, 75.9], [76.0, 81.5], [84.0, 123.82], [125.0, 128.6], [131.0, 130.92], [143.0, 143.48], [155.0, 155.07], [155.0, 155.11], [155.0, 155.14], [155.0, 155.17], [155.0, 155.21], [155.0, 155.24], [155.0, 155.28], [155.0, 157.17], [159.0, 162.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [36.16, 0.0, 0.0, 0.0, 31.0, 0.0, 30.72, 0.0, 29.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.78, 29.84], "audiomae_on_audioset": [[["speech", 45.44], ["humming", 38.3], ["music", 5.74]], null, null, null, [["music", 73.39], ["musical instrument", 6.21], ["theremin", 3.98]], null, [["music", 72.9], ["guitar", 7.43], ["musical instrument", 5.46]], null, [["music", 68.0], ["bass guitar", 9.07], ["guitar", 6.1]], null, null, null, null, null, null, null, null, null, [["music", 48.79], ["singing", 11.18], ["musical instrument", 5.1]], [["music", 57.21], ["carnatic music", 15.56], ["musical instrument", 5.93]]], "duration": [5.34, 0.58, 0.48, 0.37, 2.88, -0.1, 5.5, 39.82, 3.6, -0.08, 0.48, 0.07, 0.11, 0.14, 0.17, 0.21, 0.24, 0.28, 2.17, 3.36]} \ No newline at end of file diff --git a/annotations_1/N6bOUves6hI_filtered.json b/annotations_1/N6bOUves6hI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6d9e090f1606bd5959eae7bd9aecfd4dd108f3d --- /dev/null +++ b/annotations_1/N6bOUves6hI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.58], [8.0, 9.02], [12.0, 12.7], [14.0, 15.55], [21.0, 22.11], [24.0, 24.39], [28.0, 29.0], [33.0, 34.91], [42.0, 43.14], [47.0, 48.61], [50.0, 51.41], [53.0, 52.95], [56.0, 56.51], [65.0, 65.13], [65.0, 65.58], [68.0, 68.45], [70.0, 71.64], [88.0, 88.42], [102.0, 102.71], [111.0, 112.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.58, 1.02, 0.7, 1.55, 1.11, 0.39, 1.0, 1.91, 1.14, 1.61, 1.41, -0.05, 0.51, 0.13, 0.58, 0.45, 1.64, 0.42, 0.71, 1.9]} \ No newline at end of file diff --git a/annotations_1/N6jkWHo8D_s_filtered.json b/annotations_1/N6jkWHo8D_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d43d971968b9b934ebf0022c51c02ed21271bb9c --- /dev/null +++ b/annotations_1/N6jkWHo8D_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.01], [30.0, 31.21], [36.0, 36.19], [38.0, 39.31], [42.0, 43.5], [44.0, 44.61], [51.0, 53.62], [54.0, 64.07], [67.0, 70.28], [71.0, 71.56], [72.0, 72.79], [74.0, 76.4], [77.0, 83.44], [86.0, 87.47], [88.0, 88.4], [89.0, 89.85]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.78, 53.4, 42.91, 0.0, 0.0, 79.59, 55.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["mosquito", 47.73], ["fly, housefly", 21.9], ["insect", 9.15]], null, [["speech", 26.17], ["music", 20.74], ["synthesizer", 17.63]], null, null, null, null, null, null, null], "duration": [1.01, 1.21, 0.19, 1.31, 1.5, 0.61, 2.62, 10.07, 3.28, 0.56, 0.79, 2.4, 6.44, 1.47, 0.4, 0.85]} \ No newline at end of file diff --git a/annotations_1/N7i4yZhm6V0_filtered.json b/annotations_1/N7i4yZhm6V0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a15af7a82d15dbb8791d090baba11f717d24041 --- /dev/null +++ b/annotations_1/N7i4yZhm6V0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.57], [9.0, 9.8], [12.0, 12.09], [14.0, 15.31], [23.0, 23.9], [26.0, 25.74], [29.0, 30.4], [32.0, 32.59], [34.0, 37.32], [38.0, 38.96], [39.0, 44.63], [48.0, 51.02], [54.0, 54.35], [56.0, 56.59], [57.0, 57.64], [67.0, 84.0], [86.0, 89.61], [92.0, 93.33], [95.0, 96.16], [100.0, 101.06], [104.0, 105.92], [106.0, 107.97], [111.0, 113.27], [116.0, 116.73], [118.0, 118.91], [121.0, 121.91], [123.0, 124.63], [126.0, 130.27], [132.0, 132.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [65.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 53.28, 50.06, 0.0, 0.0, 0.0, 94.52, 65.67, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 0.0, 41.18, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.59], ["wild animals", 8.88], ["animal", 7.98]], null], "duration": [2.57, 0.8, 0.09, 1.31, 0.9, -0.26, 1.4, 0.59, 3.32, 0.96, 5.63, 3.02, 0.35, 0.59, 0.64, 17.0, 3.61, 1.33, 1.16, 1.06, 1.92, 1.97, 2.27, 0.73, 0.91, 0.91, 1.63, 4.27, 0.75]} \ No newline at end of file diff --git a/annotations_1/N7vSJzq1zAY_filtered.json b/annotations_1/N7vSJzq1zAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02b507fce763548b367ef6a12524a1fb396b6125 --- /dev/null +++ b/annotations_1/N7vSJzq1zAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 78.95], [80.0, 133.46], [135.0, 134.91], [141.0, 141.0], [142.0, 142.32], [150.0, 151.41], [156.0, 159.14], [161.0, 161.47], [163.0, 163.49], [165.0, 166.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.04, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.47], ["throbbing", 12.14], ["electronic music", 4.15]], null, null, null, null, null, null, null, null, null], "duration": [27.95, 53.46, -0.09, 0.0, 0.32, 1.41, 3.14, 0.47, 0.49, 1.62]} \ No newline at end of file diff --git a/annotations_1/N8QzCj1RdpU_filtered.json b/annotations_1/N8QzCj1RdpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07813ffe7d02bc5f2758bc377adc80de8ccb25f9 --- /dev/null +++ b/annotations_1/N8QzCj1RdpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 22.99], [24.0, 24.98], [26.0, 25.96], [28.0, 30.28], [31.0, 32.71], [33.0, 34.69], [36.0, 36.61], [37.0, 38.03], [40.0, 40.49], [41.0, 42.62], [43.0, 43.9], [45.0, 45.01], [45.0, 45.49], [46.0, 46.33], [54.0, 59.73], [61.0, 62.5], [63.0, 63.21], [65.0, 66.21], [67.0, 66.95], [67.0, 68.15], [69.0, 69.7], [78.0, 78.63], [79.0, 79.98], [80.0, 80.4], [81.0, 82.58], [83.0, 83.74], [84.0, 84.33], [84.0, 86.32], [88.0, 88.06], [89.0, 91.72], [94.0, 94.46], [96.0, 97.31], [99.0, 100.23], [103.0, 103.76], [106.0, 109.07], [111.0, 111.62], [112.0, 112.75], [115.0, 116.06], [116.0, 117.56], [118.0, 122.44], [123.0, 125.07], [127.0, 126.96], [128.0, 129.79], [132.0, 132.95], [133.0, 133.51], [134.0, 133.91], [135.0, 135.33], [138.0, 138.64], [142.0, 144.37], [145.0, 145.84], [147.0, 149.08], [152.0, 152.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.82, 0.0, 0.0, 34.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 76.04, 0.0, 0.0, 0.0, 0.0, 89.19, 91.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 94.22, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 41.22], ["livestock, farm animals, working animals", 28.18], ["moo", 23.75]], null, null, [["livestock, farm animals, working animals", 54.35], ["moo", 16.47], ["cattle, bovinae", 14.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [14.99, 0.98, -0.04, 2.28, 1.71, 1.69, 0.61, 1.03, 0.49, 1.62, 0.9, 0.01, 0.49, 0.33, 5.73, 1.5, 0.21, 1.21, -0.05, 1.15, 0.7, 0.63, 0.98, 0.4, 1.58, 0.74, 0.33, 2.32, 0.06, 2.72, 0.46, 1.31, 1.23, 0.76, 3.07, 0.62, 0.75, 1.06, 1.56, 4.44, 2.07, -0.04, 1.79, 0.95, 0.51, -0.09, 0.33, 0.64, 2.37, 0.84, 2.08, 0.71]} \ No newline at end of file diff --git a/annotations_1/N9EnEuH0Tgo_filtered.json b/annotations_1/N9EnEuH0Tgo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66a9b30d5e8aa48777a5eccfc56f3e9e60b7946c --- /dev/null +++ b/annotations_1/N9EnEuH0Tgo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.94], [14.0, 41.37]], "keep_status": [false, true], "silence_prob": [76.2, 30.04], "audiomae_on_audioset": [null, [["music", 36.77], ["theremin", 26.87], ["hum", 4.85]]], "duration": [4.94, 27.37]} \ No newline at end of file diff --git a/annotations_1/N9d-c9ooO7s_filtered.json b/annotations_1/N9d-c9ooO7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d178f25e723510246c198211434ee20491697e05 --- /dev/null +++ b/annotations_1/N9d-c9ooO7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [4.0, 4.36], [5.0, 5.61], [9.0, 8.87], [11.0, 12.16], [13.0, 14.27], [16.0, 15.84], [16.0, 20.68], [22.0, 21.63], [22.0, 23.03], [25.0, 24.92], [25.0, 26.06], [30.0, 30.65], [34.0, 34.45], [35.0, 36.54], [40.0, 40.12], [44.0, 45.01], [45.0, 48.52], [50.0, 50.38], [52.0, 52.2], [54.0, 54.48], [56.0, 57.01], [59.0, 59.27], [61.0, 61.21], [62.0, 64.02], [67.0, 67.66], [70.0, 70.33], [76.0, 76.5], [79.0, 80.3], [84.0, 84.54], [86.0, 86.46], [88.0, 88.03], [97.0, 97.11], [99.0, 99.6], [102.0, 102.44], [105.0, 105.21], [107.0, 107.6], [113.0, 114.15], [115.0, 115.13], [117.0, 121.83], [123.0, 123.53], [125.0, 125.64], [134.0, 134.65], [135.0, 136.49], [154.0, 154.87], [158.0, 158.57], [159.0, 159.92], [161.0, 162.9], [164.0, 164.88], [165.0, 169.62], [172.0, 174.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.58, 30.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.59], ["theremin", 26.76], ["didgeridoo", 22.18]], [["sidetone", 27.24], ["music", 22.82], ["didgeridoo", 8.67]]], "duration": [1.0, 0.36, 0.61, -0.13, 1.16, 1.27, -0.16, 4.68, -0.37, 1.03, -0.08, 1.06, 0.65, 0.45, 1.54, 0.12, 1.01, 3.52, 0.38, 0.2, 0.48, 1.01, 0.27, 0.21, 2.02, 0.66, 0.33, 0.5, 1.3, 0.54, 0.46, 0.03, 0.11, 0.6, 0.44, 0.21, 0.6, 1.15, 0.13, 4.83, 0.53, 0.64, 0.65, 1.49, 0.87, 0.57, 0.92, 1.9, 0.88, 4.62, 2.21]} \ No newline at end of file diff --git a/annotations_1/N9v6VJLZ8_I_filtered.json b/annotations_1/N9v6VJLZ8_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb945fff74270f168cb7272b9d5d4767c112844c --- /dev/null +++ b/annotations_1/N9v6VJLZ8_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 16.93], [20.0, 20.97], [23.0, 23.65], [25.0, 27.48], [30.0, 30.11], [34.0, 35.97], [37.0, 38.37], [40.0, 40.78], [51.0, 51.95], [54.0, 54.99], [56.0, 57.03], [59.0, 60.44], [63.0, 63.95], [65.0, 66.8], [68.0, 69.28], [71.0, 70.73], [72.0, 72.37], [76.0, 77.79], [79.0, 80.49], [81.0, 82.73], [85.0, 85.7], [88.0, 88.77], [91.0, 91.54], [94.0, 94.66], [97.0, 98.0], [101.0, 101.93], [103.0, 104.13], [106.0, 107.43], [109.0, 110.4], [112.0, 112.51], [115.0, 115.84], [117.0, 118.05], [118.0, 118.98], [123.0, 124.5], [126.0, 127.38], [131.0, 132.07], [135.0, 136.44], [138.0, 140.93], [144.0, 146.21], [152.0, 152.19], [154.0, 156.44]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [45.33, 0.0, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.34, 83.7, 0.0, 35.25], "audiomae_on_audioset": [[["music", 19.39], ["hum", 17.02], ["speech", 15.6]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.18], ["foghorn", 4.68], ["theremin", 3.98]], null, null, [["speech", 56.06], ["cattle, bovinae", 4.44], ["radio", 3.85]]], "duration": [11.93, 0.97, 0.65, 2.48, 0.11, 1.97, 1.37, 0.78, 0.95, 0.99, 1.03, 1.44, 0.95, 1.8, 1.28, -0.27, 0.37, 1.79, 1.49, 1.73, 0.7, 0.77, 0.54, 0.66, 1.0, 0.93, 1.13, 1.43, 1.4, 0.51, 0.84, 1.05, 0.98, 1.5, 1.38, 1.07, 1.44, 2.93, 2.21, 0.19, 2.44]} \ No newline at end of file diff --git a/annotations_1/NBY0l7A2uLA_filtered.json b/annotations_1/NBY0l7A2uLA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81ab8e6a98ddf14854743cdbe3faf9f9b01a8427 --- /dev/null +++ b/annotations_1/NBY0l7A2uLA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.92], [14.0, 17.37], [18.0, 18.96], [22.0, 21.84], [23.0, 23.41], [27.0, 27.21], [30.0, 30.45], [35.0, 40.46], [41.0, 54.55], [62.0, 78.68], [79.0, 81.04], [82.0, 84.57], [86.0, 100.31], [103.0, 114.44], [121.0, 122.64], [125.0, 125.63], [127.0, 128.11], [131.0, 136.09], [141.0, 151.33], [151.0, 155.44], [155.0, 164.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 72.01, 50.86, 68.54, 55.39, 47.7, 65.44, 0.0, 0.0, 0.0, 60.7, 66.76, 41.87, 48.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.38], ["siren", 5.68], ["throbbing", 5.49]], null, null, null, null, null, null, [["speech", 46.81], ["music", 17.03], ["hum", 4.42]], [["music", 62.46], ["throbbing", 12.42], ["door", 2.99]]], "duration": [0.92, 3.37, 0.96, -0.16, 0.41, 0.21, 0.45, 5.46, 13.55, 16.68, 2.04, 2.57, 14.31, 11.44, 1.64, 0.63, 1.11, 5.09, 10.33, 4.44, 9.39]} \ No newline at end of file diff --git a/annotations_1/NBYfDP0IO18_filtered.json b/annotations_1/NBYfDP0IO18_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..047ee1d2c48bf146db96eaeeaab2730dd86abc9f --- /dev/null +++ b/annotations_1/NBYfDP0IO18_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.06], [8.0, 16.73], [20.0, 29.67], [31.0, 31.43], [32.0, 64.18], [66.0, 96.55]], "keep_status": [false, true, true, false, false, false], "silence_prob": [0.0, 31.82, 29.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 38.94], ["throbbing", 21.7], ["rumble", 8.45]], [["hum", 27.67], ["music", 21.15], ["mains hum", 18.61]], null, null, null], "duration": [0.06, 8.73, 9.67, 0.43, 32.18, 30.55]} \ No newline at end of file diff --git a/annotations_1/NBfCeTdLDbQ_filtered.json b/annotations_1/NBfCeTdLDbQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4eb7618e9a5068d0589b28afcd855872f3f9851 --- /dev/null +++ b/annotations_1/NBfCeTdLDbQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.83], [14.0, 15.11], [21.0, 21.34], [22.0, 22.81], [24.0, 24.88], [27.0, 27.97], [29.0, 29.64], [31.0, 31.48], [33.0, 33.29], [36.0, 37.47], [39.0, 40.24], [42.0, 42.97], [44.0, 44.41], [46.0, 46.41], [49.0, 49.03], [51.0, 51.95], [56.0, 56.62], [60.0, 61.1], [67.0, 69.42], [70.0, 70.19], [76.0, 76.57], [81.0, 80.76], [82.0, 84.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.71, 0.0, 0.0, 0.0, 95.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 1.11, 0.34, 0.81, 0.88, 0.97, 0.64, 0.48, 0.29, 1.47, 1.24, 0.97, 0.41, 0.41, 0.03, 0.95, 0.62, 1.1, 2.42, 0.19, 0.57, -0.24, 2.55]} \ No newline at end of file diff --git a/annotations_1/NBxg8a4TAng_filtered.json b/annotations_1/NBxg8a4TAng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3395b9b13ebbf5fd8a474a32b321fd7472472d98 --- /dev/null +++ b/annotations_1/NBxg8a4TAng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.82], [27.0, 34.1], [35.0, 34.57], [35.0, 34.6], [35.0, 53.55], [58.0, 63.98], [64.0, 64.03], [64.0, 64.71], [65.0, 76.67]], "keep_status": [false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.97, 0.0, 0.0, 31.34, 31.31, 0.0, 0.0, 38.37], "audiomae_on_audioset": [null, [["music", 50.76], ["theremin", 10.51], ["hum", 7.49]], null, null, [["music", 39.42], ["animal", 22.19], ["livestock, farm animals, working animals", 12.42]], [["theremin", 64.93], ["music", 25.11], ["synthesizer", 0.85]], null, null, [["music", 44.36], ["theremin", 38.49], ["glass", 2.93]]], "duration": [0.82, 7.1, -0.43, -0.4, 18.55, 5.98, 0.03, 0.71, 11.67]} \ No newline at end of file diff --git a/annotations_1/NC34ce5BkWQ_filtered.json b/annotations_1/NC34ce5BkWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4501ca9d47a35db45cddc149e54fcfea7ed055ff --- /dev/null +++ b/annotations_1/NC34ce5BkWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [4.0, 4.48], [5.0, 5.39], [6.0, 6.4], [9.0, 9.61], [14.0, 13.95], [15.0, 20.56], [21.0, 22.22], [23.0, 24.39], [25.0, 26.22], [29.0, 29.44], [31.0, 32.14], [33.0, 35.41], [37.0, 37.13], [37.0, 39.16], [40.0, 40.64], [42.0, 44.17], [46.0, 47.11], [48.0, 55.85], [57.0, 61.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.12, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 64.41, 0.0, 61.08, 0.0, 47.58, 37.14], "audiomae_on_audioset": [null, null, null, null, null, null, [["livestock, farm animals, working animals", 30.58], ["moo", 24.85], ["cattle, bovinae", 24.78]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 41.73], ["mains hum", 24.38], ["music", 10.05]], [["theremin", 35.92], ["music", 33.87], ["didgeridoo", 4.45]]], "duration": [1.3, 0.48, 0.39, 0.4, 0.61, -0.05, 5.56, 1.22, 1.39, 1.22, 0.44, 1.14, 2.41, 0.13, 2.16, 0.64, 2.17, 1.11, 7.85, 4.11]} \ No newline at end of file diff --git a/annotations_1/NCUOJMkDAyI_filtered.json b/annotations_1/NCUOJMkDAyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a0fba3f87fe7c250cce4ded4a5b110b11777f31 --- /dev/null +++ b/annotations_1/NCUOJMkDAyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.1], [14.0, 14.13], [15.0, 16.07], [17.0, 17.86], [19.0, 22.22], [23.0, 28.19], [31.0, 31.01], [36.0, 36.48], [37.0, 37.99], [40.0, 40.59], [42.0, 42.57], [51.0, 52.37], [55.0, 55.41], [65.0, 66.8], [69.0, 70.7], [76.0, 80.59], [82.0, 82.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.27, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.93, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 82.57], ["hum", 2.18], ["sidetone", 1.67]], null], "duration": [0.1, 0.13, 1.07, 0.86, 3.22, 5.19, 0.01, 0.48, 0.99, 0.59, 0.57, 1.37, 0.41, 1.8, 1.7, 4.59, 0.44]} \ No newline at end of file diff --git a/annotations_1/NCi4QNKpVB8_filtered.json b/annotations_1/NCi4QNKpVB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af5a4a7cbc2e2c71a15280639469158ddcc86cf2 --- /dev/null +++ b/annotations_1/NCi4QNKpVB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.43], [17.0, 17.42], [20.0, 23.19], [26.0, 30.1], [34.0, 49.17], [51.0, 52.46], [54.0, 67.86], [77.0, 83.62], [87.0, 92.08], [93.0, 94.24], [96.0, 96.6], [101.0, 113.95], [114.0, 114.35], [114.0, 122.12]], "keep_status": [false, false, true, true, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 29.28, 29.28, 29.1, 0.0, 30.42, 32.64, 30.88, 0.0, 0.0, 29.38, 0.0, 29.73], "audiomae_on_audioset": [null, null, [["music", 22.1], ["cattle, bovinae", 8.66], ["moo", 8.63]], [["music", 29.36], ["breaking", 18.82], ["speech", 6.88]], [["music", 56.83], ["didgeridoo", 6.06], ["boing", 4.72]], null, [["music", 68.52], ["synthesizer", 4.57], ["throbbing", 2.74]], [["music", 54.51], ["speech", 12.19], ["throbbing", 5.66]], [["music", 62.45], ["speech", 15.43], ["boing", 11.58]], null, null, [["music", 67.67], ["didgeridoo", 8.32], ["throbbing", 4.91]], null, [["insect", 24.42], ["mosquito", 22.62], ["fly, housefly", 17.97]]], "duration": [0.43, 0.42, 3.19, 4.1, 15.17, 1.46, 13.86, 6.62, 5.08, 1.24, 0.6, 12.95, 0.35, 8.12]} \ No newline at end of file diff --git a/annotations_1/NCjjqtamXzU_filtered.json b/annotations_1/NCjjqtamXzU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1163174a2081ed665abb1e8a8fddd7d1e4bdeaf3 --- /dev/null +++ b/annotations_1/NCjjqtamXzU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.67], [12.0, 12.53], [15.0, 16.17], [18.0, 18.72], [23.0, 42.35], [58.0, 59.02], [59.0, 61.13], [62.0, 62.14], [66.0, 68.15], [71.0, 73.3], [96.0, 96.33], [100.0, 100.65], [106.0, 108.35], [112.0, 112.78], [120.0, 125.78]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 28.88, 0.0, 31.43, 0.0, 30.82, 29.19, 0.0, 0.0, 31.1, 0.0, 34.7], "audiomae_on_audioset": [null, null, null, null, [["music", 44.34], ["synthesizer", 16.76], ["electronic music", 7.83]], null, [["music", 44.13], ["techno", 8.8], ["speech", 6.26]], null, [["music", 64.73], ["speech", 8.11], ["techno", 3.66]], [["music", 64.1], ["speech", 17.52], ["vehicle", 2.92]], null, null, [["speech", 30.8], ["cattle, bovinae", 18.1], ["moo", 17.81]], null, [["music", 43.43], ["musical instrument", 7.04], ["theremin", 6.8]]], "duration": [0.67, 0.53, 1.17, 0.72, 19.35, 1.02, 2.13, 0.14, 2.15, 2.3, 0.33, 0.65, 2.35, 0.78, 5.78]} \ No newline at end of file diff --git a/annotations_1/NE6nLFq0eqc_filtered.json b/annotations_1/NE6nLFq0eqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71543aa94a1f38f2284abf10d02ebce70961571b --- /dev/null +++ b/annotations_1/NE6nLFq0eqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[95.0, 95.03], [103.0, 104.89], [106.0, 106.2], [107.0, 106.74], [110.0, 110.76]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.03, 1.89, 0.2, -0.26, 0.76]} \ No newline at end of file diff --git a/annotations_1/NFj82X1Fdh4_filtered.json b/annotations_1/NFj82X1Fdh4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdcf6725cbf34bb2e08c145da61e52f56eeb7b17 --- /dev/null +++ b/annotations_1/NFj82X1Fdh4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.58], [7.0, 8.33], [10.0, 11.62], [13.0, 14.84], [20.0, 20.51], [23.0, 24.54], [27.0, 27.13], [30.0, 30.11], [34.0, 35.53], [42.0, 42.79], [52.0, 53.23], [55.0, 56.69], [58.0, 61.57], [65.0, 67.05], [71.0, 72.52], [76.0, 81.23], [84.0, 90.96], [92.0, 94.56], [97.0, 109.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.58, 28.96, 0.0, 28.75, 46.4, 42.53, 31.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.82], ["hum", 18.66], ["mains hum", 18.66]], [["music", 18.91], ["rumble", 13.7], ["vehicle", 7.48]], null, [["buzz", 31.94], ["moo", 9.35], ["livestock, farm animals, working animals", 8.91]], [["music", 68.96], ["didgeridoo", 6.18], ["hum", 3.16]], [["music", 33.28], ["hum", 11.38], ["mains hum", 10.94]], [["music", 62.45], ["theremin", 13.96], ["synthesizer", 4.9]]], "duration": [1.58, 1.33, 1.62, 1.84, 0.51, 1.54, 0.13, 0.11, 1.53, 0.79, 1.23, 1.69, 3.57, 2.05, 1.52, 5.23, 6.96, 2.56, 12.04]} \ No newline at end of file diff --git a/annotations_1/NGkLen8TbHc_filtered.json b/annotations_1/NGkLen8TbHc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/NGkLen8TbHc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/NHg_SEfj38M_filtered.json b/annotations_1/NHg_SEfj38M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab820d804469a7d9f24add557f0eba7ea21f4537 --- /dev/null +++ b/annotations_1/NHg_SEfj38M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.27], [6.0, 6.57], [8.0, 8.8], [16.0, 16.23], [23.0, 23.06], [28.0, 29.76], [31.0, 31.04], [34.0, 35.77], [36.0, 37.22], [44.0, 47.63], [66.0, 69.9], [79.0, 78.85], [98.0, 106.81], [107.0, 120.34], [122.0, 129.59]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.46, 40.68, 0.0, 34.71, 35.97, 61.08], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 23.35], ["music", 17.66], ["fart", 10.41]], [["speech", 25.6], ["music", 10.03], ["mosquito", 6.4]], null, [["music", 64.13], ["synthesizer", 9.49], ["musical instrument", 5.89]], [["speech", 29.87], ["music", 22.75], ["buzz", 14.22]], null], "duration": [1.27, 0.57, 0.8, 0.23, 0.06, 1.76, 0.04, 1.77, 1.22, 3.63, 3.9, -0.15, 8.81, 13.34, 7.59]} \ No newline at end of file diff --git a/annotations_1/NIDabDkcS8o_filtered.json b/annotations_1/NIDabDkcS8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d720951574c07bb6aa1c972719f3b2d6ebb4cb1 --- /dev/null +++ b/annotations_1/NIDabDkcS8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.02], [14.0, 50.73], [52.0, 122.25], [123.0, 132.44]], "keep_status": [true, false, false, false], "silence_prob": [41.01, 0.0, 0.0, 29.23], "audiomae_on_audioset": [[["music", 45.62], ["cello", 10.43], ["double bass", 10.3]], null, null, [["music", 58.5], ["theremin", 13.98], ["buzz", 3.37]]], "duration": [4.02, 36.73, 70.25, 9.44]} \ No newline at end of file diff --git a/annotations_1/NIMWmy-1l4Y_filtered.json b/annotations_1/NIMWmy-1l4Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f0b5c7e9d2d7e98fb981e19b2c7ac8d6222402b --- /dev/null +++ b/annotations_1/NIMWmy-1l4Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.86], [11.0, 13.36], [17.0, 17.59], [23.0, 22.96], [25.0, 26.18], [28.0, 28.09], [31.0, 32.49], [33.0, 34.37], [37.0, 37.66], [40.0, 41.01], [42.0, 42.18], [43.0, 43.31], [49.0, 50.75], [53.0, 53.94], [57.0, 56.79], [58.0, 58.58], [59.0, 60.51], [66.0, 66.5], [71.0, 71.37], [76.0, 76.49], [80.0, 80.94], [81.0, 81.85], [115.0, 115.26], [118.0, 118.34], [125.0, 125.31], [128.0, 129.25], [131.0, 131.89], [135.0, 141.32], [149.0, 149.35], [159.0, 160.64], [176.0, 176.52], [179.0, 178.87], [179.0, 179.98], [189.0, 188.84], [191.0, 190.83], [193.0, 193.31], [195.0, 197.29], [200.0, 202.26], [204.0, 205.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [74.6, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 76.7, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.86, 2.36, 0.59, -0.04, 1.18, 0.09, 1.49, 1.37, 0.66, 1.01, 0.18, 0.31, 1.75, 0.94, -0.21, 0.58, 1.51, 0.5, 0.37, 0.49, 0.94, 0.85, 0.26, 0.34, 0.31, 1.25, 0.89, 6.32, 0.35, 1.64, 0.52, -0.13, 0.98, -0.16, -0.17, 0.31, 2.29, 2.26, 1.53]} \ No newline at end of file diff --git a/annotations_1/NInjsGq2yCA_filtered.json b/annotations_1/NInjsGq2yCA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80df588cce58fed845a45005e540810a3a8a4b4f --- /dev/null +++ b/annotations_1/NInjsGq2yCA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.47], [15.0, 72.42], [74.0, 80.16], [82.0, 98.49], [102.0, 109.46], [110.0, 110.86], [111.0, 113.02], [113.0, 113.63], [115.0, 115.28], [115.0, 115.57], [116.0, 119.72], [120.0, 120.36], [121.0, 130.17], [135.0, 173.94]], "keep_status": [false, false, true, false, true, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 30.32, 30.2, 42.55, 0.0, 48.95, 0.0, 0.0, 0.0, 45.08, 0.0, 36.31, 0.0], "audiomae_on_audioset": [null, null, [["speech", 28.37], ["fart", 7.88], ["music", 7.77]], [["speech", 62.67], ["music", 13.88], ["electronic music", 2.67]], [["whale vocalization", 20.49], ["music", 18.95], ["speech", 15.57]], null, [["singing bowl", 43.41], ["gong", 20.58], ["speech", 15.72]], null, null, null, [["speech", 36.54], ["music", 9.39], ["sine wave", 5.93]], null, [["music", 26.46], ["gong", 8.81], ["speech", 6.01]], null], "duration": [0.47, 57.42, 6.16, 16.49, 7.46, 0.86, 2.02, 0.63, 0.28, 0.57, 3.72, 0.36, 9.17, 38.94]} \ No newline at end of file diff --git a/annotations_1/NJNAE_e-gM0_filtered.json b/annotations_1/NJNAE_e-gM0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab8ffa526217722f5f0052ac920887a8335c1637 --- /dev/null +++ b/annotations_1/NJNAE_e-gM0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.75], [13.0, 20.38], [23.0, 28.75], [29.0, 29.29], [30.0, 31.46], [33.0, 47.85], [49.0, 68.35], [85.0, 86.14], [91.0, 92.04], [97.0, 96.96], [100.0, 100.67], [106.0, 106.51], [110.0, 110.17], [111.0, 112.68], [114.0, 114.05], [133.0, 133.83], [134.0, 135.55], [145.0, 146.8]], "keep_status": [false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.11, 30.25, 0.0, 0.0, 29.82, 30.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 30.74], ["fly, housefly", 15.76], ["insect", 9.54]], [["cattle, bovinae", 31.14], ["livestock, farm animals, working animals", 23.67], ["moo", 13.55]], null, null, [["cattle, bovinae", 16.38], ["music", 12.26], ["speech", 8.97]], [["cattle, bovinae", 35.12], ["crowd", 18.96], ["moo", 17.19]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 7.38, 5.75, 0.29, 1.46, 14.85, 19.35, 1.14, 1.04, -0.04, 0.67, 0.51, 0.17, 1.68, 0.05, 0.83, 1.55, 1.8]} \ No newline at end of file diff --git a/annotations_1/NKewr9uDDck_filtered.json b/annotations_1/NKewr9uDDck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a51a854748f477027e5ae2547195606f294ba7ea --- /dev/null +++ b/annotations_1/NKewr9uDDck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.56], [6.0, 7.59], [8.0, 9.05], [18.0, 22.72], [25.0, 25.52], [26.0, 27.57], [28.0, 32.93], [34.0, 34.79], [35.0, 37.94], [50.0, 59.19], [59.0, 59.26], [59.0, 61.06], [82.0, 82.48], [96.0, 97.36], [98.0, 98.81], [103.0, 103.18], [112.0, 113.78], [115.0, 116.41], [124.0, 127.65], [128.0, 128.85], [134.0, 136.04], [137.0, 138.47], [142.0, 143.43], [144.0, 146.06], [156.0, 156.12], [159.0, 162.58], [165.0, 165.16], [167.0, 167.88]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [39.8, 0.0, 0.0, 32.2, 0.0, 0.0, 42.96, 0.0, 36.51, 33.49, 0.0, 35.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.32, 0.0, 31.48, 0.0, 0.0, 33.19, 0.0, 36.1, 0.0, 0.0], "audiomae_on_audioset": [[["music", 56.12], ["marimba, xylophone", 7.03], ["musical instrument", 3.4]], null, null, [["speech", 45.32], ["grunt", 25.08], ["groan", 7.86]], null, null, [["music", 73.22], ["musical instrument", 5.15], ["synthesizer", 3.19]], null, [["speech", 26.09], ["music", 17.22], ["burping, eructation", 6.95]], [["speech", 61.47], ["music", 22.17], ["synthesizer", 3.83]], null, [["boing", 44.0], ["speech", 38.47], ["music", 2.04]], null, null, null, null, null, null, [["boing", 53.63], ["music", 24.69], ["cattle, bovinae", 2.96]], null, [["music", 32.08], ["boing", 26.02], ["speech", 17.91]], null, null, [["music", 58.3], ["theremin", 12.97], ["didgeridoo", 4.33]], null, [["speech", 32.95], ["chirp tone", 7.64], ["burping, eructation", 7.62]], null, null], "duration": [2.56, 1.59, 1.05, 4.72, 0.52, 1.57, 4.93, 0.79, 2.94, 9.19, 0.26, 2.06, 0.48, 1.36, 0.81, 0.18, 1.78, 1.41, 3.65, 0.85, 2.04, 1.47, 1.43, 2.06, 0.12, 3.58, 0.16, 0.88]} \ No newline at end of file diff --git a/annotations_1/NKhTArRP31Q_filtered.json b/annotations_1/NKhTArRP31Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bea158bdbcb902be56e93cd66ffe773a7c1c1b6b --- /dev/null +++ b/annotations_1/NKhTArRP31Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.02], [15.0, 24.02], [34.0, 33.94], [40.0, 43.04], [49.0, 51.31], [53.0, 58.36], [60.0, 108.72], [109.0, 115.62], [118.0, 119.1], [123.0, 122.91]], "keep_status": [false, true, false, true, false, false, false, false, false, false], "silence_prob": [32.04, 36.03, 0.0, 33.92, 49.18, 50.51, 0.0, 39.04, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 32.52], ["hum", 29.24], ["music", 18.77]], [["explosion", 26.28], ["music", 19.54], ["speech", 7.41]], null, [["music", 21.29], ["chink, clink", 13.66], ["didgeridoo", 12.42]], [["speech", 34.03], ["music", 31.68], ["hum", 6.14]], null, null, [["music", 86.17], ["musical instrument", 1.59], ["sitar", 1.5]], null, null], "duration": [6.02, 9.02, -0.06, 3.04, 2.31, 5.36, 48.72, 6.62, 1.1, -0.09]} \ No newline at end of file diff --git a/annotations_1/NKjZRRw3-Fs_filtered.json b/annotations_1/NKjZRRw3-Fs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cdbdb9d66cb6a650f5a690e6a5a94a75a891ef1 --- /dev/null +++ b/annotations_1/NKjZRRw3-Fs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.1], [30.0, 35.72], [37.0, 37.02], [40.0, 40.44], [40.0, 43.36], [45.0, 45.91], [48.0, 49.32], [50.0, 52.74], [54.0, 55.76], [57.0, 60.15], [61.0, 62.19], [63.0, 64.91], [66.0, 67.07], [74.0, 73.95], [76.0, 78.0], [80.0, 82.81], [85.0, 85.28], [91.0, 91.56], [92.0, 92.64], [96.0, 97.44], [104.0, 103.99], [105.0, 106.24], [108.0, 109.16], [110.0, 115.67], [117.0, 118.45], [120.0, 120.93], [121.0, 123.58], [127.0, 127.7], [138.0, 139.67], [140.0, 141.81], [146.0, 147.29], [149.0, 149.71], [152.0, 152.61], [156.0, 157.3], [159.0, 160.62], [165.0, 170.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.36, 0.0, 0.0, 89.19, 0.0, 0.0, 98.86, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 99.62, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 0.0, 65.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.1, 5.72, 0.02, 0.44, 3.36, 0.91, 1.32, 2.74, 1.76, 3.15, 1.19, 1.91, 1.07, -0.05, 2.0, 2.81, 0.28, 0.56, 0.64, 1.44, -0.01, 1.24, 1.16, 5.67, 1.45, 0.93, 2.58, 0.7, 1.67, 1.81, 1.29, 0.71, 0.61, 1.3, 1.62, 5.21]} \ No newline at end of file diff --git a/annotations_1/NLfY3XAZ6c0_filtered.json b/annotations_1/NLfY3XAZ6c0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5b17bfea27b80caacfd3fde8f7001f97a28af8c --- /dev/null +++ b/annotations_1/NLfY3XAZ6c0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.64], [20.0, 20.41], [39.0, 40.24], [63.0, 62.94], [83.0, 84.25], [88.0, 88.25]], "keep_status": [false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [2.64, 0.41, 1.24, -0.06, 1.25, 0.25]} \ No newline at end of file diff --git a/annotations_1/NM0WEaC8LcQ_filtered.json b/annotations_1/NM0WEaC8LcQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba2e5d0e5d0315bb16e5e0aaa649eb4212e6538b --- /dev/null +++ b/annotations_1/NM0WEaC8LcQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[58.0, 95.32], [100.0, 103.87], [107.0, 140.09], [141.0, 153.66]], "keep_status": [false, true, false, true], "silence_prob": [0.0, 31.18, 0.0, 34.49], "audiomae_on_audioset": [null, [["music", 48.49], ["throbbing", 10.55], ["hum", 7.0]], null, [["music", 40.58], ["brass instrument", 11.91], ["trombone", 8.23]]], "duration": [37.32, 3.87, 33.09, 12.66]} \ No newline at end of file diff --git a/annotations_1/NMbSKSzRvF8_filtered.json b/annotations_1/NMbSKSzRvF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4140fd63a29c1ad5121e20170ff6279408b9d36c --- /dev/null +++ b/annotations_1/NMbSKSzRvF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.08], [6.0, 6.17], [13.0, 13.81], [15.0, 16.98], [18.0, 36.51], [41.0, 47.49], [52.0, 52.14], [59.0, 59.26], [69.0, 69.28], [79.0, 79.74], [81.0, 81.82], [84.0, 85.82], [88.0, 87.88]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.74, 30.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 59.31], ["didgeridoo", 22.48], ["theremin", 6.12]], [["music", 39.57], ["fly, housefly", 7.56], ["insect", 4.69]], null, null, null, null, null, null, null], "duration": [1.08, 0.17, 0.81, 1.98, 18.51, 6.49, 0.14, 0.26, 0.28, 0.74, 0.82, 1.82, -0.12]} \ No newline at end of file diff --git a/annotations_1/NOACyJ1CYfo_filtered.json b/annotations_1/NOACyJ1CYfo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7ed3d763428242d383f876f204456a6b0efbff3 --- /dev/null +++ b/annotations_1/NOACyJ1CYfo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.95], [7.0, 8.51], [11.0, 10.94], [20.0, 20.43], [21.0, 23.55], [33.0, 33.86], [38.0, 44.1], [44.0, 44.29], [44.0, 44.85], [46.0, 46.41], [50.0, 50.46], [68.0, 72.52], [74.0, 81.9], [91.0, 95.12], [99.0, 105.26], [110.0, 110.27], [111.0, 120.51], [125.0, 125.1], [126.0, 126.2], [137.0, 138.43], [142.0, 156.88], [158.0, 159.98]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.33, 0.0, 29.59, 0.0, 0.0, 0.0, 0.0, 30.54, 29.87, 31.21, 29.0, 0.0, 29.27, 0.0, 0.0, 0.0, 29.43, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 48.71], ["didgeridoo", 10.95], ["musical instrument", 4.09]], null, [["speech", 53.91], ["music", 30.08], ["buzz", 2.89]], null, null, null, null, [["speech", 39.16], ["music", 30.22], ["whack, thwack", 4.67]], [["music", 43.55], ["livestock, farm animals, working animals", 10.26], ["boing", 6.42]], [["hum", 42.24], ["throbbing", 25.6], ["music", 11.14]], [["music", 79.22], ["speech", 7.54], ["throbbing", 1.66]], null, [["music", 52.39], ["speech", 27.71], ["buzz", 5.23]], null, null, null, [["throbbing", 30.91], ["music", 27.52], ["hum", 18.67]], null], "duration": [0.95, 1.51, -0.06, 0.43, 2.55, 0.86, 6.1, 0.29, 0.85, 0.41, 0.46, 4.52, 7.9, 4.12, 6.26, 0.27, 9.51, 0.1, 0.2, 1.43, 14.88, 1.98]} \ No newline at end of file diff --git a/annotations_1/NP2fSxIpvis_filtered.json b/annotations_1/NP2fSxIpvis_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbef5c6e33adaa24057310d3bee9fc669ee8a641 --- /dev/null +++ b/annotations_1/NP2fSxIpvis_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.78], [25.0, 24.85], [29.0, 61.74], [67.0, 74.17], [91.0, 106.12]], "keep_status": [false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 29.91, 36.23], "audiomae_on_audioset": [null, null, null, [["speech", 34.54], ["whale vocalization", 28.68], ["vehicle", 5.22]], [["speech", 46.27], ["music", 11.87], ["electric shaver, electric razor", 11.06]]], "duration": [0.78, -0.15, 32.74, 7.17, 15.12]} \ No newline at end of file diff --git a/annotations_1/NPY5Iq-tCvk_filtered.json b/annotations_1/NPY5Iq-tCvk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c26631d1251c1b4750509106c08576b2d0675d4 --- /dev/null +++ b/annotations_1/NPY5Iq-tCvk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.88], [7.0, 14.62], [16.0, 16.11], [18.0, 18.74], [20.0, 22.1], [23.0, 33.15], [34.0, 59.41], [61.0, 60.79], [67.0, 81.94], [83.0, 82.9], [83.0, 83.54], [87.0, 92.33], [93.0, 94.39], [101.0, 102.59], [104.0, 106.78], [108.0, 110.62], [112.0, 112.9], [114.0, 119.06], [120.0, 131.7], [133.0, 134.43]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 29.14, 0.0, 0.0, 32.33, 30.73, 29.45, 0.0, 29.69, 0.0, 0.0, 58.89, 0.0, 0.0, 95.09, 91.98, 0.0, 32.13, 39.27, 0.0], "audiomae_on_audioset": [null, [["music", 44.6], ["speech", 22.26], ["whack, thwack", 6.69]], null, null, [["music", 36.62], ["rumble", 12.28], ["hum", 10.03]], [["music", 43.21], ["hum", 8.17], ["sonar", 4.44]], [["speech", 67.55], ["music", 6.54], ["sound effect", 4.31]], null, [["music", 52.97], ["throbbing", 16.35], ["hum", 7.2]], null, null, null, null, null, null, null, null, [["thunk", 45.29], ["whack, thwack", 5.36], ["breaking", 5.24]], [["music", 51.24], ["speech", 30.69], ["buzz", 2.48]], null], "duration": [-0.12, 7.62, 0.11, 0.74, 2.1, 10.15, 25.41, -0.21, 14.94, -0.1, 0.54, 5.33, 1.39, 1.59, 2.78, 2.62, 0.9, 5.06, 11.7, 1.43]} \ No newline at end of file diff --git a/annotations_1/NPmAEqlzKqE_filtered.json b/annotations_1/NPmAEqlzKqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2be81f2489cdeeb60ded6fcef63e3caa7865934 --- /dev/null +++ b/annotations_1/NPmAEqlzKqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.91], [5.0, 5.04], [8.0, 9.0], [9.0, 13.04], [14.0, 44.66], [46.0, 46.74], [50.0, 54.24], [55.0, 69.25], [70.0, 79.66], [94.0, 95.23]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 59.51, 81.17, 34.09, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 16.91], ["speech", 10.64], ["screaming", 6.78]], null], "duration": [-0.09, 0.04, 1.0, 4.04, 30.66, 0.74, 4.24, 14.25, 9.66, 1.23]} \ No newline at end of file diff --git a/annotations_1/NQBMjZqgGEI_filtered.json b/annotations_1/NQBMjZqgGEI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b623206e53d5dcaf527b61ebb6cb7f86c404de6 --- /dev/null +++ b/annotations_1/NQBMjZqgGEI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.13], [26.0, 27.31], [28.0, 33.64], [41.0, 40.74], [74.0, 74.49], [83.0, 83.25], [85.0, 87.88], [91.0, 95.79], [97.0, 98.36]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 97.33, 44.69, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 46.25], ["music", 12.71], ["thunk", 3.81]], null], "duration": [0.13, 1.31, 5.64, -0.26, 0.49, 0.25, 2.88, 4.79, 1.36]} \ No newline at end of file diff --git a/annotations_1/NQcQ3bA_NXw_filtered.json b/annotations_1/NQcQ3bA_NXw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..568832c844e31d251123bae489802f7653f97a21 --- /dev/null +++ b/annotations_1/NQcQ3bA_NXw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.38], [13.0, 13.51], [19.0, 19.47], [30.0, 31.48], [39.0, 39.73], [48.0, 47.88], [56.0, 55.86], [61.0, 61.1], [70.0, 70.28], [82.0, 82.63], [84.0, 84.03], [96.0, 96.45], [113.0, 113.76], [116.0, 115.99], [124.0, 125.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 0.51, 0.47, 1.48, 0.73, -0.12, -0.14, 0.1, 0.28, 0.63, 0.03, 0.45, 0.76, -0.01, 1.29]} \ No newline at end of file diff --git a/annotations_1/NQgAVrZRz3o_filtered.json b/annotations_1/NQgAVrZRz3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10c45e1ce111fb16c1de01e81c85574cc6beb381 --- /dev/null +++ b/annotations_1/NQgAVrZRz3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.91], [9.0, 10.23], [11.0, 13.1], [17.0, 18.62], [27.0, 31.31], [37.0, 38.69], [42.0, 45.89], [47.0, 49.22], [50.0, 51.81], [53.0, 85.36], [86.0, 86.44], [87.0, 87.62], [89.0, 90.39], [91.0, 97.56], [101.0, 101.97], [108.0, 108.58], [111.0, 115.15]], "keep_status": [false, false, true, false, true, false, true, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 35.85, 0.0, 34.58, 0.0, 38.23, 44.72, 0.0, 0.0, 0.0, 0.0, 0.0, 34.78, 0.0, 0.0, 44.72], "audiomae_on_audioset": [null, null, [["vehicle", 21.77], ["music", 14.7], ["toot", 5.84]], null, [["hum", 24.21], ["rumble", 19.92], ["buzz", 15.35]], null, [["whale vocalization", 28.6], ["rumble", 21.18], ["music", 7.03]], [["rumble", 22.43], ["frog", 10.21], ["throbbing", 8.89]], null, null, null, null, null, [["hum", 46.1], ["mains hum", 35.3], ["whale vocalization", 5.0]], null, null, [["hum", 28.1], ["mains hum", 27.52], ["rumble", 10.02]]], "duration": [0.91, 1.23, 2.1, 1.62, 4.31, 1.69, 3.89, 2.22, 1.81, 32.36, 0.44, 0.62, 1.39, 6.56, 0.97, 0.58, 4.15]} \ No newline at end of file diff --git a/annotations_1/NQtL20JoP3Q_filtered.json b/annotations_1/NQtL20JoP3Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38721a957c1f06cc770ed8b00f73afa79788b741 --- /dev/null +++ b/annotations_1/NQtL20JoP3Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 34.55], [36.0, 41.25], [44.0, 44.2], [45.0, 45.94], [47.0, 49.1], [53.0, 54.48], [58.0, 58.6], [64.0, 64.93], [67.0, 67.86], [68.0, 67.91]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [39.77, 60.42, 0.0, 0.0, 58.47, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 11.11], ["music", 10.7], ["rumble", 9.04]], null, null, null, null, null, null, null, null, null], "duration": [10.55, 5.25, 0.2, 0.94, 2.1, 1.48, 0.6, 0.93, 0.86, -0.09]} \ No newline at end of file diff --git a/annotations_1/NQw5e3HJgfk_filtered.json b/annotations_1/NQw5e3HJgfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47bfa61f041aeec6786d2c68a0c338b95bee17a4 --- /dev/null +++ b/annotations_1/NQw5e3HJgfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.76], [20.0, 20.82], [30.0, 34.92], [37.0, 37.4], [44.0, 49.92], [51.0, 51.06], [52.0, 52.79], [60.0, 68.39], [73.0, 73.8], [79.0, 78.54], [83.0, 83.03]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 50.21, 0.0, 35.08, 0.0, 0.0, 30.73, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["livestock, farm animals, working animals", 55.02], ["cattle, bovinae", 19.87], ["moo", 15.94]], null, null, [["didgeridoo", 43.64], ["cattle, bovinae", 7.98], ["wind instrument, woodwind instrument", 7.13]], null, null, null], "duration": [1.76, 0.82, 4.92, 0.4, 5.92, 0.06, 0.79, 8.39, 0.8, -0.46, 0.03]} \ No newline at end of file diff --git a/annotations_1/NRBLTtDkQXU_filtered.json b/annotations_1/NRBLTtDkQXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8b70172fb766390498330410ee51c478fdfacee --- /dev/null +++ b/annotations_1/NRBLTtDkQXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.0], [13.0, 13.29], [14.0, 14.67], [17.0, 19.89], [21.0, 21.98], [23.0, 23.6], [26.0, 26.89], [28.0, 29.08], [31.0, 32.19], [34.0, 34.52], [35.0, 36.51], [39.0, 39.46], [52.0, 52.61], [56.0, 57.64], [58.0, 69.08], [69.0, 70.97], [72.0, 77.38], [81.0, 84.16], [85.0, 93.07], [100.0, 99.76], [100.0, 102.86], [106.0, 107.59], [116.0, 118.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.91, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 93.91, 100.0, 42.04, 0.0, 98.86, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 65.15], ["sidetone", 12.69], ["hum", 2.02]], null, null, null, null], "duration": [2.0, 0.29, 0.67, 2.89, 0.98, 0.6, 0.89, 1.08, 1.19, 0.52, 1.51, 0.46, 0.61, 1.64, 11.08, 1.97, 5.38, 3.16, 8.07, -0.24, 2.86, 1.59, 2.89]} \ No newline at end of file diff --git a/annotations_1/NSTXoI3j4ko_filtered.json b/annotations_1/NSTXoI3j4ko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..029e3816ae9dce4d674ca5b48c196f948701f5fa --- /dev/null +++ b/annotations_1/NSTXoI3j4ko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.81], [10.0, 13.51], [16.0, 19.65], [23.0, 33.0], [36.0, 38.85], [44.0, 44.31], [46.0, 47.17], [64.0, 66.88], [67.0, 71.79], [87.0, 89.18], [90.0, 125.56], [132.0, 132.36], [138.0, 139.33]], "keep_status": [false, true, false, true, true, false, false, true, true, true, false, false, false], "silence_prob": [0.0, 32.79, 31.22, 31.61, 33.31, 0.0, 0.0, 30.75, 35.09, 33.05, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 31.75], ["music", 9.2], ["cattle, bovinae", 8.23]], [["cattle, bovinae", 35.39], ["moo", 29.85], ["livestock, farm animals, working animals", 10.51]], [["music", 39.89], ["speech", 22.07], ["cattle, bovinae", 6.01]], [["music", 28.9], ["throbbing", 15.44], ["speech", 9.08]], null, null, [["crowd", 14.83], ["speech", 12.39], ["boing", 5.37]], [["fly, housefly", 35.28], ["insect", 15.09], ["frog", 9.35]], [["cattle, bovinae", 13.37], ["moo", 11.68], ["music", 11.57]], null, null, null], "duration": [0.81, 3.51, 3.65, 10.0, 2.85, 0.31, 1.17, 2.88, 4.79, 2.18, 35.56, 0.36, 1.33]} \ No newline at end of file diff --git a/annotations_1/NTdHPAY7rOE_filtered.json b/annotations_1/NTdHPAY7rOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adc7b945d4df683d8135aa8cc0fabb4cfe4992bc --- /dev/null +++ b/annotations_1/NTdHPAY7rOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.67], [19.0, 31.56], [35.0, 35.07], [37.0, 42.45], [43.0, 43.78], [47.0, 48.47], [50.0, 50.19], [52.0, 51.85], [60.0, 60.86], [61.0, 65.48], [74.0, 78.75], [84.0, 84.91], [104.0, 112.7], [113.0, 116.65], [119.0, 125.27], [129.0, 135.8], [139.0, 141.12], [143.0, 144.21], [149.0, 158.48], [160.0, 172.99], [175.0, 182.71], [185.0, 186.24], [189.0, 189.24], [194.0, 198.9], [200.0, 200.6], [201.0, 202.73]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, true, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [36.17, 29.86, 0.0, 76.7, 0.0, 0.0, 0.0, 0.0, 0.0, 43.28, 43.4, 0.0, 36.88, 31.91, 33.47, 40.29, 37.39, 0.0, 36.5, 34.69, 34.44, 0.0, 0.0, 35.03, 0.0, 0.0], "audiomae_on_audioset": [[["music", 66.03], ["didgeridoo", 4.12], ["theremin", 2.62]], [["music", 45.57], ["speech", 8.05], ["cacophony", 7.45]], null, null, null, null, null, null, null, [["sidetone", 44.71], ["music", 20.65], ["speech", 14.55]], [["music", 25.36], ["clang", 17.68], ["hum", 8.27]], null, [["fly, housefly", 39.42], ["mosquito", 26.05], ["insect", 14.51]], [["cattle, bovinae", 22.14], ["livestock, farm animals, working animals", 19.6], ["moo", 16.97]], [["music", 42.11], ["boing", 27.8], ["cacophony", 2.53]], [["music", 53.22], ["speech", 11.91], ["livestock, farm animals, working animals", 3.32]], [["music", 45.42], ["theremin", 10.01], ["breaking", 6.34]], null, [["music", 46.99], ["throbbing", 19.44], ["electronic music", 7.77]], [["music", 46.31], ["throbbing", 19.76], ["hum", 12.72]], [["music", 31.96], ["throbbing", 20.89], ["hum", 9.73]], null, null, [["music", 44.73], ["hum", 15.01], ["throbbing", 11.45]], null, null], "duration": [2.67, 12.56, 0.07, 5.45, 0.78, 1.47, 0.19, -0.15, 0.86, 4.48, 4.75, 0.91, 8.7, 3.65, 6.27, 6.8, 2.12, 1.21, 9.48, 12.99, 7.71, 1.24, 0.24, 4.9, 0.6, 1.73]} \ No newline at end of file diff --git a/annotations_1/NUmE-c4ym40_filtered.json b/annotations_1/NUmE-c4ym40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d01412523bb8f974166c964985179f8eeeae2611 --- /dev/null +++ b/annotations_1/NUmE-c4ym40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.46], [5.0, 20.29], [22.0, 24.88], [26.0, 26.11], [27.0, 30.3], [31.0, 32.9], [36.0, 36.71], [38.0, 38.79], [42.0, 45.94], [50.0, 52.88], [57.0, 58.04], [61.0, 69.69], [70.0, 73.01], [75.0, 75.68], [79.0, 79.19], [80.0, 80.65], [83.0, 83.46], [84.0, 83.52], [84.0, 83.62], [84.0, 83.69], [84.0, 83.73], [84.0, 83.76], [84.0, 87.0], [89.0, 89.34]], "keep_status": [false, true, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.13, 37.37, 36.52, 0.0, 47.01, 0.0, 0.0, 0.0, 43.45, 51.39, 0.0, 73.51, 65.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 0.0], "audiomae_on_audioset": [null, [["music", 52.57], ["speech", 6.4], ["radio", 4.09]], [["mains hum", 47.17], ["hum", 27.54], ["throbbing", 10.92]], null, [["didgeridoo", 34.24], ["music", 22.2], ["gong", 5.47]], null, null, null, [["music", 28.74], ["fart", 12.98], ["speech", 9.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.46, 15.29, 2.88, 0.11, 3.3, 1.9, 0.71, 0.79, 3.94, 2.88, 1.04, 8.69, 3.01, 0.68, 0.19, 0.65, 0.46, -0.48, -0.38, -0.31, -0.27, -0.24, 3.0, 0.34]} \ No newline at end of file diff --git a/annotations_1/NV9oKGj_CcU_filtered.json b/annotations_1/NV9oKGj_CcU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42aa59526fa2ee8c9370927a118715e3b022f729 --- /dev/null +++ b/annotations_1/NV9oKGj_CcU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.42], [3.0, 2.57], [3.0, 12.51], [16.0, 23.06], [28.0, 31.06], [31.0, 31.09], [31.0, 34.75], [38.0, 38.38], [41.0, 50.6], [51.0, 75.91], [79.0, 81.28], [83.0, 95.34]], "keep_status": [false, false, true, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 33.14, 32.13, 30.82, 0.0, 30.95, 0.0, 31.86, 31.84, 33.44, 32.88], "audiomae_on_audioset": [null, null, [["music", 48.19], ["clarinet", 9.68], ["musical instrument", 7.39]], [["music", 48.25], ["brass instrument", 12.65], ["saxophone", 10.75]], [["music", 58.23], ["theremin", 7.76], ["synthesizer", 6.92]], null, [["music", 45.7], ["musical instrument", 9.39], ["brass instrument", 7.86]], null, [["music", 45.89], ["brass instrument", 12.71], ["musical instrument", 8.56]], [["music", 42.38], ["theremin", 24.67], ["clarinet", 7.47]], [["music", 46.74], ["clarinet", 18.28], ["musical instrument", 5.48]], [["music", 66.84], ["musical instrument", 7.96], ["synthesizer", 5.85]]], "duration": [1.42, -0.43, 9.51, 7.06, 3.06, 0.09, 3.75, 0.38, 9.6, 24.91, 2.28, 12.34]} \ No newline at end of file diff --git a/annotations_1/NVXDwL6XG_c_filtered.json b/annotations_1/NVXDwL6XG_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..578f29b25d6d1ee674e0cf4fbf65ad454f93451a --- /dev/null +++ b/annotations_1/NVXDwL6XG_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 23.95]], "keep_status": [false], "silence_prob": [35.62], "audiomae_on_audioset": [[["music", 69.79], ["scary music", 7.81], ["hum", 6.11]]], "duration": [13.95]} \ No newline at end of file diff --git a/annotations_1/NWUxk3JPaqU_filtered.json b/annotations_1/NWUxk3JPaqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44f7bf218b6d9f72a31415b35a7ca2b96d3ba51a --- /dev/null +++ b/annotations_1/NWUxk3JPaqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.54], [4.0, 6.0], [13.0, 16.63], [17.0, 29.47], [30.0, 49.18], [51.0, 81.35], [86.0, 88.18], [90.0, 91.5], [94.0, 94.42], [96.0, 97.31], [99.0, 100.77], [105.0, 104.87]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.08, 77.36, 98.66, 29.79, 0.0, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 25.02], ["sine wave", 13.11], ["mains hum", 8.45]], null, null, [["speech", 36.9], ["music", 7.54], ["keys jangling", 5.54]], null, null, null, null, null, null, null], "duration": [0.54, 2.0, 3.63, 12.47, 19.18, 30.35, 2.18, 1.5, 0.42, 1.31, 1.77, -0.13]} \ No newline at end of file diff --git a/annotations_1/NWvUNDAsYqE_filtered.json b/annotations_1/NWvUNDAsYqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c72eee7ca5faa2c60fac5de96cebc47a059946c8 --- /dev/null +++ b/annotations_1/NWvUNDAsYqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.87], [26.0, 26.97], [28.0, 28.8], [30.0, 34.43], [37.0, 37.5], [46.0, 46.74], [50.0, 49.96], [51.0, 51.39], [53.0, 55.31], [56.0, 59.95], [63.0, 63.48], [65.0, 67.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 0.97, 0.8, 4.43, 0.5, 0.74, -0.04, 0.39, 2.31, 3.95, 0.48, 2.04]} \ No newline at end of file diff --git a/annotations_1/NX12Wu1uqbI_filtered.json b/annotations_1/NX12Wu1uqbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96550f7222eec290981c83ac476b7d0db4571483 --- /dev/null +++ b/annotations_1/NX12Wu1uqbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.15], [17.0, 20.36], [24.0, 25.62], [28.0, 31.41], [32.0, 32.68], [34.0, 52.35], [53.0, 58.87], [60.0, 62.29], [63.0, 65.31], [66.0, 67.9], [71.0, 75.41], [77.0, 79.39], [85.0, 88.47], [89.0, 92.48], [101.0, 103.57], [105.0, 108.4], [109.0, 109.92], [111.0, 111.57], [112.0, 112.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.66, 0.0, 95.51, 0.0, 95.37, 91.47, 97.33, 96.66, 0.0, 99.95, 87.37, 76.7, 99.99, 81.53, 97.43, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.15, 3.36, 1.62, 3.41, 0.68, 18.35, 5.87, 2.29, 2.31, 1.9, 4.41, 2.39, 3.47, 3.48, 2.57, 3.4, 0.92, 0.57, 0.14]} \ No newline at end of file diff --git a/annotations_1/NXTrMtrTjlI_filtered.json b/annotations_1/NXTrMtrTjlI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84aec80ffe1fbdf1cf2f6a7d182e8610de0927a6 --- /dev/null +++ b/annotations_1/NXTrMtrTjlI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.74], [10.0, 10.52], [12.0, 13.26], [15.0, 15.58], [19.0, 20.41], [21.0, 22.96], [25.0, 26.76], [31.0, 32.49], [34.0, 35.97], [40.0, 41.34], [42.0, 50.92], [51.0, 55.05], [57.0, 57.96], [61.0, 62.5], [66.0, 68.84], [76.0, 77.41], [83.0, 83.39], [87.0, 88.3], [91.0, 90.69], [93.0, 94.29], [97.0, 98.39], [99.0, 99.37], [100.0, 100.74], [102.0, 104.31], [105.0, 110.12], [116.0, 117.49], [119.0, 120.04], [125.0, 125.56], [131.0, 132.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.33, 91.47, 0.0, 0.0, 77.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 54.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.74, 0.52, 1.26, 0.58, 1.41, 1.96, 1.76, 1.49, 1.97, 1.34, 8.92, 4.05, 0.96, 1.5, 2.84, 1.41, 0.39, 1.3, -0.31, 1.29, 1.39, 0.37, 0.74, 2.31, 5.12, 1.49, 1.04, 0.56, 1.61]} \ No newline at end of file diff --git a/annotations_1/NY9q_Vfbi5Q_filtered.json b/annotations_1/NY9q_Vfbi5Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50228b21d0d9ecd285f5060ea209d0a887a83e59 --- /dev/null +++ b/annotations_1/NY9q_Vfbi5Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.0], [6.0, 7.35], [11.0, 12.07], [16.0, 18.66], [34.0, 46.38], [47.0, 80.87], [82.0, 103.18], [104.0, 105.34], [107.0, 168.05], [168.0, 168.27], [168.0, 168.37]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 46.43, 37.12, 0.0, 31.73, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 32.89], ["music", 20.95], ["hum", 11.25]], [["music", 36.42], ["hum", 21.94], ["mains hum", 13.2]], null, [["speech", 20.43], ["music", 19.77], ["smash, crash", 7.84]], null, null, null, null], "duration": [0.0, 1.35, 1.07, 2.66, 12.38, 33.87, 21.18, 1.34, 61.05, 0.27, 0.37]} \ No newline at end of file diff --git a/annotations_1/NYBMaVtMaEM_filtered.json b/annotations_1/NYBMaVtMaEM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db4ac7ae8fcf77f854d354ab8ab42d585296c249 --- /dev/null +++ b/annotations_1/NYBMaVtMaEM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 22.6], [24.0, 24.7], [27.0, 27.03], [34.0, 38.04], [40.0, 40.34], [46.0, 102.56], [103.0, 103.49], [110.0, 130.79]], "keep_status": [false, false, false, true, false, false, false, true], "silence_prob": [29.34, 0.0, 0.0, 29.54, 0.0, 0.0, 0.0, 29.82], "audiomae_on_audioset": [[["hum", 41.9], ["throbbing", 24.92], ["mains hum", 10.04]], null, null, [["music", 36.04], ["speech", 11.57], ["noise", 4.38]], null, null, null, [["music", 23.12], ["speech", 7.32], ["vehicle", 5.76]]], "duration": [17.6, 0.7, 0.03, 4.04, 0.34, 56.56, 0.49, 20.79]} \ No newline at end of file diff --git a/annotations_1/NYRHTYWWiGU_filtered.json b/annotations_1/NYRHTYWWiGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f658337c31cc2b8930814b3df8e9ab42b2a6c36d --- /dev/null +++ b/annotations_1/NYRHTYWWiGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.03], [16.0, 16.87], [41.0, 54.3], [62.0, 73.03], [76.0, 75.64], [77.0, 77.77], [84.0, 88.3], [89.0, 95.34], [110.0, 112.7], [117.0, 120.88], [121.0, 135.46], [136.0, 139.9], [142.0, 141.64]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 28.85, 28.97, 0.0, 0.0, 28.92, 28.88, 31.05, 28.99, 29.18, 60.23, 0.0], "audiomae_on_audioset": [null, null, [["music", 37.58], ["speech", 33.7], ["hum", 3.14]], [["music", 60.02], ["speech", 9.26], ["vehicle", 2.44]], null, null, [["music", 66.04], ["dubstep", 8.56], ["electronic music", 5.29]], [["music", 75.06], ["speech", 7.94], ["electronic music", 6.16]], [["music", 37.93], ["speech", 18.5], ["static", 5.96]], [["speech", 46.14], ["music", 21.96], ["electronic music", 4.7]], [["music", 43.34], ["breaking", 13.91], ["speech", 7.04]], null, null], "duration": [1.03, 0.87, 13.3, 11.03, -0.36, 0.77, 4.3, 6.34, 2.7, 3.88, 14.46, 3.9, -0.36]} \ No newline at end of file diff --git a/annotations_1/NZ-u1BXI0YQ_filtered.json b/annotations_1/NZ-u1BXI0YQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..994c5065d5b2ba09d7fec14dec2140c282c6b001 --- /dev/null +++ b/annotations_1/NZ-u1BXI0YQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.82], [18.0, 19.45], [20.0, 21.03], [21.0, 22.13], [26.0, 27.18], [29.0, 29.88], [34.0, 34.16], [47.0, 47.39], [50.0, 50.85], [57.0, 58.38], [62.0, 62.23], [63.0, 63.31], [64.0, 64.49], [65.0, 65.18], [68.0, 69.06], [71.0, 71.42], [72.0, 72.35], [75.0, 75.79], [77.0, 77.7], [80.0, 80.97], [99.0, 99.69], [102.0, 102.95], [106.0, 106.34], [109.0, 110.56], [115.0, 115.62], [120.0, 119.99], [123.0, 124.04], [128.0, 129.3], [135.0, 135.65], [141.0, 141.44], [144.0, 144.02], [146.0, 146.33], [156.0, 156.27], [165.0, 166.36], [166.0, 166.75], [199.0, 201.14], [204.0, 207.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 50.21], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.82, 1.45, 1.03, 1.13, 1.18, 0.88, 0.16, 0.39, 0.85, 1.38, 0.23, 0.31, 0.49, 0.18, 1.06, 0.42, 0.35, 0.79, 0.7, 0.97, 0.69, 0.95, 0.34, 1.56, 0.62, -0.01, 1.04, 1.3, 0.65, 0.44, 0.02, 0.33, 0.27, 1.36, 0.75, 2.14, 3.03]} \ No newline at end of file diff --git a/annotations_1/NZ2qhFm6LO8_filtered.json b/annotations_1/NZ2qhFm6LO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ad5d4cc2fe210d88b339a813517a4fba4b4ee33 --- /dev/null +++ b/annotations_1/NZ2qhFm6LO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.27], [4.0, 3.72], [7.0, 8.87], [11.0, 15.97], [17.0, 17.52], [19.0, 21.44], [23.0, 24.04], [27.0, 29.78], [30.0, 31.19], [33.0, 34.05], [36.0, 37.47], [39.0, 39.92], [43.0, 44.02], [45.0, 46.33], [48.0, 47.87], [49.0, 50.06], [52.0, 52.25], [54.0, 57.45], [59.0, 60.25], [68.0, 70.77], [72.0, 74.34], [76.0, 78.24], [79.0, 89.68], [94.0, 96.23], [96.0, 96.35], [97.0, 97.17], [97.0, 97.31], [98.0, 98.85], [101.0, 116.95], [118.0, 127.03], [128.0, 131.45], [135.0, 148.42], [149.0, 154.45], [154.0, 154.48]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, true, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.75, 0.0, 35.09, 0.0, 53.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.07, 0.0, 66.63, 76.37, 99.99, 30.46, 31.95, 0.0, 0.0, 0.0, 0.0, 31.18, 29.95, 30.11, 34.53, 35.42, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 19.77], ["speech", 14.36], ["music", 13.13]], null, [["music", 37.7], ["chirp tone", 7.28], ["whale vocalization", 7.09]], null, null, null, null, null, null, null, null, null, null, null, [["music", 41.55], ["speech", 15.84], ["whimper", 11.32]], null, null, null, null, [["animal", 31.26], ["music", 20.07], ["dog", 8.54]], [["cattle, bovinae", 20.31], ["livestock, farm animals, working animals", 17.37], ["moo", 12.64]], null, null, null, null, [["animal", 40.16], ["music", 9.67], ["speech", 8.28]], [["wild animals", 21.84], ["grunt", 19.03], ["buzz", 17.11]], [["music", 36.53], ["animal", 14.75], ["dog", 9.29]], [["music", 35.81], ["theremin", 24.17], ["musical instrument", 6.91]], [["music", 63.84], ["foghorn", 6.98], ["brass instrument", 5.06]], null], "duration": [0.27, -0.28, 1.87, 4.97, 0.52, 2.44, 1.04, 2.78, 1.19, 1.05, 1.47, 0.92, 1.02, 1.33, -0.13, 1.06, 0.25, 3.45, 1.25, 2.77, 2.34, 2.24, 10.68, 2.23, 0.35, 0.17, 0.31, 0.85, 15.95, 9.03, 3.45, 13.42, 5.45, 0.48]} \ No newline at end of file diff --git a/annotations_1/NZzeLRspnMg_filtered.json b/annotations_1/NZzeLRspnMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f235f998613efd37e9a6a2b6a4cd1ad0bb9d11e --- /dev/null +++ b/annotations_1/NZzeLRspnMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.43], [2.0, 3.43], [4.0, 4.56], [6.0, 6.3], [8.0, 9.93], [12.0, 12.46], [13.0, 13.86], [19.0, 19.92], [21.0, 21.93], [24.0, 24.88], [25.0, 25.86], [28.0, 28.9], [30.0, 30.23], [40.0, 40.19], [42.0, 42.06], [45.0, 44.96], [46.0, 46.48], [47.0, 46.77], [48.0, 49.55], [50.0, 50.77], [56.0, 57.01], [59.0, 59.43], [62.0, 62.95], [64.0, 64.76], [66.0, 67.07], [70.0, 71.0], [73.0, 73.13], [76.0, 76.55], [81.0, 81.68], [82.0, 83.37], [86.0, 87.39], [91.0, 92.3], [94.0, 93.8], [96.0, 96.4], [97.0, 97.58], [100.0, 100.48], [103.0, 104.18], [108.0, 108.14], [109.0, 110.96], [114.0, 114.96], [120.0, 121.14], [124.0, 125.44], [128.0, 129.0], [132.0, 133.0], [135.0, 137.57], [138.0, 138.62], [140.0, 140.86], [142.0, 144.12], [147.0, 147.68], [151.0, 152.2], [153.0, 154.84], [156.0, 156.59], [159.0, 159.33], [162.0, 162.21], [163.0, 163.85], [165.0, 166.9], [168.0, 169.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.27, 0.0, 0.0, 47.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.73], ["sidetone", 30.71], ["dial tone", 6.42]], null, null, null, null, null, null, null, null, null], "duration": [1.43, 1.43, 0.56, 0.3, 1.93, 0.46, 0.86, 0.92, 0.93, 0.88, 0.86, 0.9, 0.23, 0.19, 0.06, -0.04, 0.48, -0.23, 1.55, 0.77, 1.01, 0.43, 0.95, 0.76, 1.07, 1.0, 0.13, 0.55, 0.68, 1.37, 1.39, 1.3, -0.2, 0.4, 0.58, 0.48, 1.18, 0.14, 1.96, 0.96, 1.14, 1.44, 1.0, 1.0, 2.57, 0.62, 0.86, 2.12, 0.68, 1.2, 1.84, 0.59, 0.33, 0.21, 0.85, 1.9, 1.92]} \ No newline at end of file diff --git a/annotations_1/N_3_HB0AfdY_filtered.json b/annotations_1/N_3_HB0AfdY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67afa20f06caa7f4e272f940cd62aaa7118a4b0a --- /dev/null +++ b/annotations_1/N_3_HB0AfdY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.73], [12.0, 12.56], [14.0, 15.42], [19.0, 19.4], [21.0, 21.54], [23.0, 24.12], [27.0, 27.57], [31.0, 32.05], [38.0, 39.36], [42.0, 41.86], [44.0, 44.19], [45.0, 45.67], [57.0, 61.03], [76.0, 76.84], [81.0, 81.72], [87.0, 87.47], [104.0, 104.52], [106.0, 108.97], [113.0, 114.49], [117.0, 118.72], [126.0, 127.31], [130.0, 131.72], [133.0, 134.77], [135.0, 136.98], [138.0, 139.29], [141.0, 141.67], [143.0, 143.36], [144.0, 147.12], [148.0, 149.12], [156.0, 155.82], [160.0, 160.54], [163.0, 168.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [72.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.86, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.16, 0.0, 0.0, 0.0, 99.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.75], ["speech synthesizer", 10.98], ["sidetone", 2.0]], null, null, null, null], "duration": [4.73, 0.56, 1.42, 0.4, 0.54, 1.12, 0.57, 1.05, 1.36, -0.14, 0.19, 0.67, 4.03, 0.84, 0.72, 0.47, 0.52, 2.97, 1.49, 1.72, 1.31, 1.72, 1.77, 1.98, 1.29, 0.67, 0.36, 3.12, 1.12, -0.18, 0.54, 5.83]} \ No newline at end of file diff --git a/annotations_1/N_aPyfiVWEE_filtered.json b/annotations_1/N_aPyfiVWEE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc454851ef0663d2fccfd4c4cade8e114e5b4fbd --- /dev/null +++ b/annotations_1/N_aPyfiVWEE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.21], [5.0, 6.47], [12.0, 14.22], [25.0, 26.06], [29.0, 30.54], [38.0, 38.79], [41.0, 41.34], [50.0, 53.37], [63.0, 78.31], [83.0, 83.67], [87.0, 94.31], [97.0, 99.55], [109.0, 111.27], [112.0, 112.16], [118.0, 120.88], [122.0, 122.67], [125.0, 127.04], [129.0, 130.01], [133.0, 138.45]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, true, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 51.07, 0.0, 0.0, 0.0, 0.0, 33.76, 32.56, 0.0, 32.81, 31.6, 35.14, 0.0, 32.3, 0.0, 38.42, 0.0, 32.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 34.29], ["music", 14.51], ["sidetone", 7.74]], [["boing", 48.66], ["music", 8.14], ["speech", 7.33]], null, [["music", 69.1], ["speech", 19.2], ["thump, thud", 1.33]], [["speech", 20.23], ["throbbing", 11.31], ["crowd", 9.64]], [["music", 28.68], ["speech", 17.92], ["didgeridoo", 9.35]], null, [["cattle, bovinae", 45.53], ["moo", 34.52], ["livestock, farm animals, working animals", 14.6]], null, [["music", 50.16], ["speech", 14.44], ["throbbing", 3.95]], null, [["cattle, bovinae", 39.46], ["moo", 27.57], ["livestock, farm animals, working animals", 15.7]]], "duration": [0.21, 1.47, 2.22, 1.06, 1.54, 0.79, 0.34, 3.37, 15.31, 0.67, 7.31, 2.55, 2.27, 0.16, 2.88, 0.67, 2.04, 1.01, 5.45]} \ No newline at end of file diff --git a/annotations_1/N_c0y8BcKBU_filtered.json b/annotations_1/N_c0y8BcKBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0aab5767614aaf0a397eec07e810129533bb670a --- /dev/null +++ b/annotations_1/N_c0y8BcKBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.56], [11.0, 11.64]], "keep_status": [false, false], "silence_prob": [70.02, 0.0], "audiomae_on_audioset": [null, null], "duration": [6.56, 0.64]} \ No newline at end of file diff --git a/annotations_1/N_ooI6Wa0H0_filtered.json b/annotations_1/N_ooI6Wa0H0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed002b73107466443c0fe07eaae9854a6c8e45f7 --- /dev/null +++ b/annotations_1/N_ooI6Wa0H0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.2], [22.0, 23.6], [25.0, 27.06], [29.0, 30.4], [35.0, 37.62], [41.0, 42.15], [43.0, 45.23], [47.0, 48.14], [50.0, 51.68], [52.0, 54.55], [55.0, 57.43], [61.0, 111.92], [114.0, 131.14], [132.0, 153.13]], "keep_status": [false, false, false, false, true, false, true, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 51.77, 0.0, 48.39, 0.0, 39.49, 0.0, 0.0, 49.4, 44.49, 0.0, 29.79, 30.02], "audiomae_on_audioset": [null, null, null, null, [["music", 45.38], ["singing bowl", 16.35], ["didgeridoo", 5.05]], null, [["cattle, bovinae", 26.66], ["livestock, farm animals, working animals", 24.89], ["moo", 17.66]], null, null, [["speech", 42.64], ["rumble", 13.98], ["vehicle", 6.02]], [["music", 18.2], ["speech", 10.72], ["ambient music", 10.29]], null, [["music", 89.51], ["breaking", 2.73], ["theremin", 0.96]], [["music", 54.51], ["speech", 24.38], ["hum", 6.58]]], "duration": [1.2, 1.6, 2.06, 1.4, 2.62, 1.15, 2.23, 1.14, 1.68, 2.55, 2.43, 50.92, 17.14, 21.13]} \ No newline at end of file diff --git a/annotations_1/N_qIfvDbZjc_filtered.json b/annotations_1/N_qIfvDbZjc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e2a168920fa74e2ee0c766a1e6babcb13a3d763 --- /dev/null +++ b/annotations_1/N_qIfvDbZjc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.33], [25.0, 27.65], [31.0, 33.25], [35.0, 40.95], [42.0, 42.92], [44.0, 44.83], [47.0, 47.29], [54.0, 54.33], [56.0, 56.0], [57.0, 57.37], [60.0, 60.22], [62.0, 63.85], [64.0, 75.54], [94.0, 95.15], [98.0, 101.75], [103.0, 103.45], [104.0, 108.04], [109.0, 110.08], [118.0, 118.96], [120.0, 120.04], [121.0, 121.51], [125.0, 126.25], [128.0, 128.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 65.55, 64.75, 36.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.76, 0.0, 39.08, 0.0, 40.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 58.93], ["synthesizer", 11.05], ["hum", 6.64]], null, null, null, null, null, null, null, null, [["music", 74.16], ["didgeridoo", 3.66], ["musical instrument", 2.03]], null, [["music", 58.95], ["fly, housefly", 3.83], ["synthesizer", 3.17]], null, [["music", 78.33], ["boing", 3.58], ["theremin", 2.32]], null, null, null, null, null, null], "duration": [1.33, 2.65, 2.25, 5.95, 0.92, 0.83, 0.29, 0.33, 0.0, 0.37, 0.22, 1.85, 11.54, 1.15, 3.75, 0.45, 4.04, 1.08, 0.96, 0.04, 0.51, 1.25, 0.12]} \ No newline at end of file diff --git a/annotations_1/Na3loD5Xpew_filtered.json b/annotations_1/Na3loD5Xpew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14ce2f7fca8006eab2a7c611862db0a20dd61248 --- /dev/null +++ b/annotations_1/Na3loD5Xpew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.27], [13.0, 13.14], [15.0, 18.5], [19.0, 20.28], [22.0, 23.65], [28.0, 28.58], [30.0, 30.0], [33.0, 32.75], [35.0, 35.73], [42.0, 42.7], [43.0, 44.29], [45.0, 46.36], [48.0, 49.74], [51.0, 51.51], [60.0, 62.01], [63.0, 64.25], [65.0, 65.62], [67.0, 68.34], [71.0, 71.95], [73.0, 76.06], [79.0, 80.79], [89.0, 90.09], [96.0, 96.42], [98.0, 100.01], [102.0, 103.54], [105.0, 105.61], [107.0, 108.33], [110.0, 110.89], [112.0, 113.1], [114.0, 115.26], [118.0, 126.27], [129.0, 135.28], [137.0, 140.78], [143.0, 143.97], [146.0, 146.75], [148.0, 149.35], [150.0, 151.7], [153.0, 154.09], [155.0, 156.96], [159.0, 161.23], [162.0, 163.34], [165.0, 167.26], [168.0, 170.31], [176.0, 178.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 51.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.06, 0.0, 0.0, 0.0, 0.0, 36.1, 0.0, 0.0, 0.0, 36.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.37, 35.03, 42.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 55.67, 41.72, 45.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 31.44], ["mains hum", 30.47], ["music", 4.96]], null, null, null, null, [["hum", 31.42], ["throbbing", 16.18], ["music", 11.91]], null, null, null, [["music", 32.32], ["speech", 32.12], ["electronic music", 3.95]], null, null, null, null, null, null, [["fart", 17.62], ["hum", 11.47], ["didgeridoo", 9.01]], [["speech", 76.95], ["music", 8.07], ["boing", 2.28]], [["bouncing", 20.49], ["effects unit", 14.16], ["distortion", 9.59]], null, null, null, null, null, null, null, null, null, [["music", 31.82], ["didgeridoo", 21.57], ["musical instrument", 9.3]], [["hum", 20.05], ["throbbing", 15.01], ["music", 6.51]]], "duration": [0.27, 0.14, 3.5, 1.28, 1.65, 0.58, 0.0, -0.25, 0.73, 0.7, 1.29, 1.36, 1.74, 0.51, 2.01, 1.25, 0.62, 1.34, 0.95, 3.06, 1.79, 1.09, 0.42, 2.01, 1.54, 0.61, 1.33, 0.89, 1.1, 1.26, 8.27, 6.28, 3.78, 0.97, 0.75, 1.35, 1.7, 1.09, 1.96, 2.23, 1.34, 2.26, 2.31, 2.75]} \ No newline at end of file diff --git a/annotations_1/Na9qhz28ZWQ_filtered.json b/annotations_1/Na9qhz28ZWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e43209d6d5b157c79f56ffae6c9fadd2969cb279 --- /dev/null +++ b/annotations_1/Na9qhz28ZWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.95], [19.0, 20.76], [22.0, 22.59], [26.0, 26.11], [28.0, 27.89], [37.0, 37.45], [57.0, 57.27], [124.0, 124.53], [125.0, 126.42], [172.0, 173.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.95, 1.76, 0.59, 0.11, -0.11, 0.45, 0.27, 0.53, 1.42, 1.7]} \ No newline at end of file diff --git a/annotations_1/NadEkwOLA7k_filtered.json b/annotations_1/NadEkwOLA7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..361f1beb0bbe0a925db5b61619424f5017d003be --- /dev/null +++ b/annotations_1/NadEkwOLA7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.68], [11.0, 15.6], [19.0, 56.39], [60.0, 144.26], [146.0, 152.44], [155.0, 202.95]], "keep_status": [false, false, false, false, true, false], "silence_prob": [29.28, 31.77, 0.0, 0.0, 28.95, 0.0], "audiomae_on_audioset": [[["music", 64.52], ["throbbing", 7.76], ["electronic music", 7.74]], [["music", 70.75], ["electronic music", 4.83], ["throbbing", 3.19]], null, null, [["music", 13.08], ["explosion", 12.15], ["groan", 8.29]], null], "duration": [2.68, 4.6, 37.39, 84.26, 6.44, 47.95]} \ No newline at end of file diff --git a/annotations_1/NcMHcR5IzEY_filtered.json b/annotations_1/NcMHcR5IzEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ede333a60e32404308e0b13c3531e9692852413c --- /dev/null +++ b/annotations_1/NcMHcR5IzEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.01], [18.0, 18.25], [25.0, 119.13], [120.0, 122.64]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 28.32], "audiomae_on_audioset": [null, null, null, [["burst, pop", 17.63], ["explosion", 16.54], ["whoosh, swoosh, swish", 12.66]]], "duration": [1.01, 0.25, 94.13, 2.64]} \ No newline at end of file diff --git a/annotations_1/NclH5qEfL5c_filtered.json b/annotations_1/NclH5qEfL5c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae92c8ebba747d6e3d02ceb0d3a422f3030f3b5c --- /dev/null +++ b/annotations_1/NclH5qEfL5c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.34], [22.0, 22.62], [28.0, 28.26], [41.0, 41.13], [47.0, 47.49], [49.0, 49.94], [55.0, 81.18], [87.0, 115.84], [116.0, 133.15], [136.0, 142.26], [146.0, 159.65]], "keep_status": [false, false, false, false, false, false, true, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.18, 28.34, 28.26, 28.12, 28.29], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 20.99], ["livestock, farm animals, working animals", 5.0], ["hum", 4.81]], [["explosion", 19.94], ["speech", 18.33], ["music", 10.54]], [["music", 38.16], ["vehicle", 10.34], ["car", 8.29]], [["explosion", 32.23], ["burst, pop", 13.12], ["speech", 10.65]], [["speech", 68.27], ["music", 7.62], ["reverberation", 2.74]]], "duration": [1.34, 0.62, 0.26, 0.13, 0.49, 0.94, 26.18, 28.84, 17.15, 6.26, 13.65]} \ No newline at end of file diff --git a/annotations_1/NdGB1rnPcR0_filtered.json b/annotations_1/NdGB1rnPcR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..799d6c38bfb6ed1f56d5fb8b02d4a1a828fb3ac9 --- /dev/null +++ b/annotations_1/NdGB1rnPcR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.93], [2.0, 5.86], [6.0, 17.25], [18.0, 67.36], [68.0, 68.13], [70.0, 115.89], [116.0, 118.34]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [0.0, 58.55, 66.03, 0.0, 0.0, 0.0, 31.65], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 41.99], ["moo", 8.02], ["cattle, bovinae", 5.41]]], "duration": [-0.07, 3.86, 11.25, 49.36, 0.13, 45.89, 2.34]} \ No newline at end of file diff --git a/annotations_1/NdaWQm_UAF0_filtered.json b/annotations_1/NdaWQm_UAF0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9353ae3f8639a6bc7d8461176a729fa6d63b3691 --- /dev/null +++ b/annotations_1/NdaWQm_UAF0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[104.0, 106.83], [112.0, 114.17]], "keep_status": [true, true], "silence_prob": [29.48, 29.99], "audiomae_on_audioset": [[["grunt", 26.51], ["music", 16.97], ["moo", 14.03]], [["music", 22.26], ["groan", 10.56], ["whimper", 6.4]]], "duration": [2.83, 2.17]} \ No newline at end of file diff --git a/annotations_1/NdbZtOpgsUY_filtered.json b/annotations_1/NdbZtOpgsUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7352ceb745a07ec1364ef6b1784097501f713755 --- /dev/null +++ b/annotations_1/NdbZtOpgsUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 65.94], [67.0, 71.66], [72.0, 80.1], [80.0, 111.97], [113.0, 114.0]], "keep_status": [false, true, true, false, false], "silence_prob": [0.0, 39.57, 41.42, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 39.14], ["hum", 11.99], ["throbbing", 8.04]], [["whale vocalization", 32.52], ["hum", 15.3], ["music", 13.49]], null, null], "duration": [41.94, 4.66, 8.1, 31.97, 1.0]} \ No newline at end of file diff --git a/annotations_1/NePF08sMSDA_filtered.json b/annotations_1/NePF08sMSDA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee0e05b919fb1cbdd350c8eb51c97e10e3df171d --- /dev/null +++ b/annotations_1/NePF08sMSDA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.13], [15.0, 15.84], [18.0, 18.55], [23.0, 26.01], [30.0, 31.33], [32.0, 37.91], [52.0, 55.31], [56.0, 56.39], [65.0, 65.84], [70.0, 73.92], [76.0, 76.49], [79.0, 80.72], [82.0, 82.34], [86.0, 88.65], [89.0, 91.32], [94.0, 94.59], [95.0, 95.47], [97.0, 97.56], [100.0, 100.4], [101.0, 101.55], [102.0, 102.96], [104.0, 109.65], [110.0, 110.02], [112.0, 112.23], [116.0, 117.64], [119.0, 121.22], [122.0, 122.59]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 33.65, 0.0, 30.65, 31.77, 0.0, 0.0, 99.16, 0.0, 0.0, 0.0, 99.95, 48.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.77, 0.0, 0.0, 0.0, 31.5, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 50.42], ["boing", 15.52], ["sidetone", 14.8]], null, [["music", 31.39], ["foghorn", 17.1], ["trombone", 12.35]], [["speech", 60.25], ["zipper (clothing)", 13.56], ["fart", 3.77]], null, null, null, null, null, null, null, [["speech", 66.22], ["fart", 4.18], ["hum", 3.47]], null, null, null, null, null, null, [["speech", 69.99], ["whack, thwack", 6.63], ["hammer", 3.79]], null, null, null, [["boing", 27.15], ["speech", 26.75], ["cattle, bovinae", 8.05]], null], "duration": [1.13, 0.84, 0.55, 3.01, 1.33, 5.91, 3.31, 0.39, 0.84, 3.92, 0.49, 1.72, 0.34, 2.65, 2.32, 0.59, 0.47, 0.56, 0.4, 0.55, 0.96, 5.65, 0.02, 0.23, 1.64, 2.22, 0.59]} \ No newline at end of file diff --git a/annotations_1/NfDBhc__ntM_filtered.json b/annotations_1/NfDBhc__ntM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d090c5a484947a83fd54559895968b7cfcc0e17a --- /dev/null +++ b/annotations_1/NfDBhc__ntM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.09], [14.0, 16.01], [17.0, 18.62], [20.0, 21.36], [22.0, 24.39], [26.0, 34.42], [35.0, 35.58], [38.0, 38.69], [41.0, 42.04], [43.0, 43.44], [43.0, 43.48], [44.0, 43.95], [49.0, 49.79], [54.0, 54.7], [66.0, 67.32], [69.0, 69.47], [70.0, 71.04], [72.0, 72.93], [75.0, 75.81], [82.0, 83.2], [97.0, 98.63], [101.0, 101.17], [109.0, 111.92], [113.0, 120.77], [121.0, 122.57], [132.0, 132.73], [133.0, 133.68], [135.0, 135.85], [140.0, 141.17], [144.0, 144.42], [154.0, 155.26], [156.0, 159.49], [162.0, 162.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [46.33, 43.35, 0.0, 0.0, 38.03, 33.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.51, 46.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.4, 0.0], "audiomae_on_audioset": [[["music", 78.63], ["didgeridoo", 8.19], ["musical instrument", 1.84]], [["music", 59.95], ["didgeridoo", 13.9], ["musical instrument", 4.0]], null, null, [["sidetone", 95.2], ["mains hum", 1.29], ["hum", 0.89]], [["music", 52.4], ["didgeridoo", 29.21], ["musical instrument", 2.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.39], ["fly, housefly", 16.66], ["speech", 14.56]], [["hum", 26.26], ["music", 19.51], ["mains hum", 16.12]], null, null, null, null, null, null, null, [["speech", 74.56], ["music", 3.6], ["gunshot, gunfire", 2.95]], null], "duration": [4.09, 2.01, 1.62, 1.36, 2.39, 8.42, 0.58, 0.69, 1.04, 0.44, 0.48, -0.05, 0.79, 0.7, 1.32, 0.47, 1.04, 0.93, 0.81, 1.2, 1.63, 0.17, 2.92, 7.77, 1.57, 0.73, 0.68, 0.85, 1.17, 0.42, 1.26, 3.49, 0.51]} \ No newline at end of file diff --git a/annotations_1/NfQcD7ZLWL0_filtered.json b/annotations_1/NfQcD7ZLWL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c08d8f5f580212e8781319ee71549c6d0a957547 --- /dev/null +++ b/annotations_1/NfQcD7ZLWL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.38], [5.0, 6.86], [9.0, 9.76], [12.0, 14.52], [16.0, 16.82], [17.0, 33.42], [34.0, 34.77], [36.0, 38.03], [39.0, 40.63], [43.0, 43.23], [45.0, 46.38], [49.0, 51.06], [53.0, 55.53], [60.0, 62.7], [64.0, 64.57], [69.0, 69.47], [70.0, 81.38], [83.0, 83.15], [84.0, 84.03], [87.0, 102.54], [104.0, 107.99], [113.0, 113.9], [115.0, 115.42], [116.0, 116.85], [119.0, 119.91], [123.0, 123.82], [127.0, 127.92], [129.0, 129.91]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, true, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.52, 0.0, 41.16, 0.0, 83.16, 0.0, 0.0, 0.0, 32.38, 36.64, 40.17, 0.0, 0.0, 32.71, 0.0, 0.0, 35.28, 43.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 31.77], ["mains hum", 17.3], ["music", 16.47]], null, [["music", 57.41], ["theremin", 8.48], ["musical instrument", 4.0]], null, null, null, null, null, [["honk", 22.49], ["goose", 20.08], ["radio", 11.08]], [["cattle, bovinae", 19.96], ["moo", 17.53], ["livestock, farm animals, working animals", 17.4]], [["music", 45.79], ["throbbing", 12.79], ["didgeridoo", 6.49]], null, null, [["music", 28.65], ["fart", 27.62], ["speech", 7.28]], null, null, [["hum", 49.97], ["mains hum", 27.77], ["music", 10.86]], [["hum", 35.22], ["music", 20.09], ["throbbing", 16.92]], null, null, null, null, null, null, null], "duration": [1.38, 1.86, 0.76, 2.52, 0.82, 16.42, 0.77, 2.03, 1.63, 0.23, 1.38, 2.06, 2.53, 2.7, 0.57, 0.47, 11.38, 0.15, 0.03, 15.54, 3.99, 0.9, 0.42, 0.85, 0.91, 0.82, 0.92, 0.91]} \ No newline at end of file diff --git a/annotations_1/NgAjrtEmWxI_filtered.json b/annotations_1/NgAjrtEmWxI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d33336cca55c5a5224a1afb8e804643873d1f726 --- /dev/null +++ b/annotations_1/NgAjrtEmWxI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.9], [16.0, 28.56], [29.0, 29.69], [31.0, 46.67], [47.0, 51.7], [57.0, 58.4], [59.0, 59.78], [64.0, 68.18], [72.0, 74.92], [75.0, 79.83], [80.0, 85.09], [86.0, 87.08], [88.0, 91.22], [92.0, 93.21], [95.0, 95.71], [97.0, 97.24], [99.0, 100.77], [101.0, 101.29], [102.0, 103.49], [105.0, 108.19], [109.0, 109.86], [112.0, 112.24], [113.0, 113.88], [115.0, 114.98], [116.0, 115.97], [116.0, 117.29], [119.0, 119.06], [120.0, 120.56], [123.0, 124.58], [125.0, 126.82], [136.0, 137.24], [139.0, 139.6], [140.0, 141.99], [152.0, 155.21], [157.0, 156.96], [157.0, 157.77], [163.0, 163.53], [165.0, 165.67]], "keep_status": [false, true, false, true, true, false, false, true, true, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 31.12, 0.0, 29.0, 33.24, 0.0, 0.0, 34.89, 33.31, 34.55, 33.77, 0.0, 32.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.87, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 26.6], ["hum", 14.56], ["mains hum", 13.3]], null, [["speech", 28.32], ["music", 23.2], ["cacophony", 5.22]], [["music", 41.17], ["speech", 8.28], ["didgeridoo", 5.07]], null, null, [["bow-wow", 16.71], ["dog", 14.75], ["music", 11.23]], [["speech", 33.74], ["thunk", 7.63], ["music", 6.92]], [["music", 20.47], ["cattle, bovinae", 18.04], ["didgeridoo", 14.25]], [["music", 54.41], ["musical instrument", 4.94], ["guitar", 4.44]], null, [["fly, housefly", 40.17], ["mosquito", 13.03], ["insect", 10.75]], null, null, null, null, null, null, [["music", 73.55], ["groan", 4.3], ["whimper", 2.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 19.03], ["hum", 19.03], ["speech", 11.94]], null, null, null, null], "duration": [1.9, 12.56, 0.69, 15.67, 4.7, 1.4, 0.78, 4.18, 2.92, 4.83, 5.09, 1.08, 3.22, 1.21, 0.71, 0.24, 1.77, 0.29, 1.49, 3.19, 0.86, 0.24, 0.88, -0.02, -0.03, 1.29, 0.06, 0.56, 1.58, 1.82, 1.24, 0.6, 1.99, 3.21, -0.04, 0.77, 0.53, 0.67]} \ No newline at end of file diff --git a/annotations_1/Nhj2rSOUjwU_filtered.json b/annotations_1/Nhj2rSOUjwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d81425c6d6c3bab1c9482979b259d6c5b6df9df --- /dev/null +++ b/annotations_1/Nhj2rSOUjwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 30.18], [47.0, 66.45], [72.0, 82.78], [86.0, 89.21], [94.0, 115.45], [118.0, 123.36]], "keep_status": [false, false, false, false, false, true], "silence_prob": [29.36, 29.62, 29.73, 29.57, 29.83, 29.78], "audiomae_on_audioset": [[["music", 80.62], ["gospel music", 2.39], ["singing", 2.13]], [["music", 69.61], ["singing", 2.8], ["synthesizer", 2.09]], [["music", 82.94], ["musical instrument", 3.74], ["guitar", 1.68]], [["music", 61.06], ["musical instrument", 4.93], ["didgeridoo", 4.66]], [["moo", 39.77], ["cattle, bovinae", 28.79], ["livestock, farm animals, working animals", 27.81]], [["music", 52.47], ["singing", 4.85], ["jingle, tinkle", 2.39]]], "duration": [13.18, 19.45, 10.78, 3.21, 21.45, 5.36]} \ No newline at end of file diff --git a/annotations_1/NhtvtnrHon8_filtered.json b/annotations_1/NhtvtnrHon8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..363eab99b7abe132939241fa2814ecab6c10a855 --- /dev/null +++ b/annotations_1/NhtvtnrHon8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.11], [9.0, 9.75], [11.0, 18.27], [20.0, 48.9], [50.0, 50.62], [51.0, 53.08], [55.0, 92.08], [93.0, 103.99], [105.0, 105.38], [107.0, 120.45]], "keep_status": [false, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 33.45, 32.86, 0.0, 39.77, 0.0, 30.92, 0.0, 31.04], "audiomae_on_audioset": [null, null, [["hum", 42.63], ["mains hum", 20.59], ["throbbing", 18.29]], [["hum", 40.92], ["mains hum", 12.99], ["throbbing", 7.99]], null, [["music", 28.67], ["hum", 16.22], ["throbbing", 14.67]], null, [["music", 38.18], ["throbbing", 36.08], ["hum", 11.26]], null, [["speech", 43.28], ["music", 17.13], ["vehicle", 6.65]]], "duration": [1.11, 0.75, 7.27, 28.9, 0.62, 2.08, 37.08, 10.99, 0.38, 13.45]} \ No newline at end of file diff --git a/annotations_1/NieC8KA0EvI_filtered.json b/annotations_1/NieC8KA0EvI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3006eaa20ba156954d1e566a2b5d72d8ef9fa7e0 --- /dev/null +++ b/annotations_1/NieC8KA0EvI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.5], [9.0, 9.48], [19.0, 20.14], [26.0, 27.53], [50.0, 53.52], [61.0, 60.84], [66.0, 69.09], [73.0, 76.94], [80.0, 80.6], [83.0, 83.54], [84.0, 84.99], [92.0, 92.52], [109.0, 109.59], [110.0, 112.9], [120.0, 120.61], [135.0, 136.34], [138.0, 140.91], [145.0, 148.44], [150.0, 151.83], [177.0, 177.58], [179.0, 179.27], [179.0, 179.31], [182.0, 183.41], [183.0, 183.57], [184.0, 186.11], [189.0, 189.5], [190.0, 190.54], [193.0, 200.89], [209.0, 211.59], [230.0, 230.76], [241.0, 256.0], [259.0, 270.73], [271.0, 272.02]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 49.45, 0.0, 59.42, 68.02, 0.0, 0.0, 0.0, 0.0, 0.0, 32.75, 0.0, 0.0, 38.6, 49.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.2, 0.0, 0.0, 36.49, 32.41, 0.0, 32.24, 56.93, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 51.2], ["didgeridoo", 6.43], ["hum", 6.34]], null, null, null, null, null, null, null, null, [["music", 72.92], ["a capella", 3.91], ["singing", 2.98]], null, null, [["music", 74.12], ["carnatic music", 4.65], ["theremin", 2.87]], [["music", 56.01], ["mantra", 14.46], ["chant", 6.64]], null, null, null, null, null, null, [["music", 55.24], ["synthetic singing", 3.38], ["electronic music", 2.14]], null, null, [["music", 82.15], ["singing", 1.37], ["electronic music", 1.33]], [["music", 26.01], ["hum", 19.46], ["mains hum", 17.79]], null, [["music", 78.46], ["musical instrument", 5.37], ["carnatic music", 2.36]], null, null], "duration": [0.5, 0.48, 1.14, 1.53, 3.52, -0.16, 3.09, 3.94, 0.6, 0.54, 0.99, 0.52, 0.59, 2.9, 0.61, 1.34, 2.91, 3.44, 1.83, 0.58, 0.27, 0.31, 1.41, 0.57, 2.11, 0.5, 0.54, 7.89, 2.59, 0.76, 15.0, 11.73, 1.02]} \ No newline at end of file diff --git a/annotations_1/NipqouLNqAY_filtered.json b/annotations_1/NipqouLNqAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..857c8dd2f0c060ee16103548625634f954f9cf1b --- /dev/null +++ b/annotations_1/NipqouLNqAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.01], [18.0, 24.02], [29.0, 33.42], [40.0, 41.32], [42.0, 43.36], [45.0, 45.33], [47.0, 49.37], [51.0, 51.21], [52.0, 54.97], [57.0, 57.6], [61.0, 60.61], [64.0, 63.96], [68.0, 68.28], [69.0, 69.85], [71.0, 72.0], [74.0, 74.9], [80.0, 80.82], [84.0, 90.02], [92.0, 94.15], [96.0, 96.45], [98.0, 101.6], [118.0, 117.73], [119.0, 121.12], [127.0, 127.68], [130.0, 134.65], [139.0, 138.97], [161.0, 163.75], [166.0, 182.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 62.58, 70.44, 0.0, 0.0, 0.0, 89.36, 0.0, 57.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 78.89, 0.0, 69.61, 0.0, 57.01, 0.0, 45.59, 0.0, 29.16, 35.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 24.95], ["hum", 22.45], ["throbbing", 14.93]], null, [["music", 38.53], ["speech", 18.86], ["hum", 9.02]], [["groan", 21.19], ["sigh", 14.57], ["sound effect", 11.43]]], "duration": [1.01, 6.02, 4.42, 1.32, 1.36, 0.33, 2.37, 0.21, 2.97, 0.6, -0.39, -0.04, 0.28, 0.85, 1.0, 0.9, 0.82, 6.02, 2.15, 0.45, 3.6, -0.27, 2.12, 0.68, 4.65, -0.03, 2.75, 16.61]} \ No newline at end of file diff --git a/annotations_1/NirTc-GvKLk_filtered.json b/annotations_1/NirTc-GvKLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36777078015f6dab3d13a919b1381e93496cca8c --- /dev/null +++ b/annotations_1/NirTc-GvKLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.24], [25.0, 28.44], [29.0, 29.89], [34.0, 38.7], [41.0, 40.81]], "keep_status": [true, true, false, false, false], "silence_prob": [27.86, 27.76, 0.0, 28.69, 0.0], "audiomae_on_audioset": [[["speech", 34.15], ["screaming", 11.71], ["animal", 7.09]], [["speech", 61.92], ["baby cry, infant cry", 3.68], ["inside, small room", 3.67]], null, [["speech", 81.67], ["hum", 1.82], ["animal", 1.54]], null], "duration": [4.24, 3.44, 0.89, 4.7, -0.19]} \ No newline at end of file diff --git a/annotations_1/NizLAsFlvww_filtered.json b/annotations_1/NizLAsFlvww_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32dd922d2f85db2e1f5d3bf75cf65507d1c1c15a --- /dev/null +++ b/annotations_1/NizLAsFlvww_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.68], [2.0, 2.35], [2.0, 6.45], [7.0, 7.16], [28.0, 48.3], [52.0, 55.86], [57.0, 56.78], [61.0, 60.94], [63.0, 62.92]], "keep_status": [false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 29.53, 0.0, 29.29, 28.85, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 41.22], ["music", 17.35], ["synthesizer", 12.49]], null, [["music", 28.83], ["throbbing", 19.28], ["speech", 18.95]], [["music", 30.31], ["speech", 18.64], ["didgeridoo", 4.77]], null, null, null], "duration": [0.68, 0.35, 4.45, 0.16, 20.3, 3.86, -0.22, -0.06, -0.08]} \ No newline at end of file diff --git a/annotations_1/Nj61hQhTwW0_filtered.json b/annotations_1/Nj61hQhTwW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de8165c44fe1224517e700ae1f8924b0dddb2794 --- /dev/null +++ b/annotations_1/Nj61hQhTwW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.16], [5.0, 5.78], [12.0, 14.89], [16.0, 19.13], [21.0, 23.97], [29.0, 29.76], [31.0, 32.36], [41.0, 42.11], [43.0, 44.39], [46.0, 52.15], [57.0, 58.92], [62.0, 61.86], [63.0, 64.45], [65.0, 69.11], [70.0, 72.33], [75.0, 78.95], [80.0, 81.8], [82.0, 85.8], [87.0, 95.47], [96.0, 104.13], [105.0, 106.41], [109.0, 115.42], [118.0, 117.85], [119.0, 123.26], [124.0, 126.42], [128.0, 131.7], [132.0, 137.88], [139.0, 139.73], [141.0, 143.94], [145.0, 149.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 94.95, 92.64, 96.04, 0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 0.0, 0.0, 98.86, 97.0, 52.62, 0.0, 74.92, 94.95, 59.59, 0.0, 63.21, 0.0, 90.43, 97.11, 94.07, 84.43, 0.0, 73.36, 57.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.78, 2.89, 3.13, 2.97, 0.76, 1.36, 1.11, 1.39, 6.15, 1.92, -0.14, 1.45, 4.11, 2.33, 3.95, 1.8, 3.8, 8.47, 8.13, 1.41, 6.42, -0.15, 4.26, 2.42, 3.7, 5.88, 0.73, 2.94, 4.18]} \ No newline at end of file diff --git a/annotations_1/NjUtH1NBFyY_filtered.json b/annotations_1/NjUtH1NBFyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ec128de88c0c279a891bb93708ae57e9027bccb --- /dev/null +++ b/annotations_1/NjUtH1NBFyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.55], [8.0, 10.25], [12.0, 16.53], [18.0, 19.04], [20.0, 22.79], [28.0, 39.01], [41.0, 45.79], [48.0, 51.58], [53.0, 54.8], [55.0, 61.8], [68.0, 87.29], [88.0, 94.02], [102.0, 114.86], [128.0, 127.9], [132.0, 133.56], [140.0, 140.43]], "keep_status": [false, false, true, false, true, false, false, false, false, true, true, false, true, false, false, false], "silence_prob": [0.0, 33.15, 33.08, 0.0, 31.62, 29.06, 32.13, 32.76, 0.0, 30.23, 29.26, 30.44, 29.42, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 65.41], ["synthesizer", 4.31], ["musical instrument", 4.16]], [["music", 18.51], ["clang", 17.57], ["hum", 11.5]], null, [["music", 32.22], ["speech", 13.55], ["hum", 10.89]], [["cattle, bovinae", 44.41], ["moo", 30.49], ["livestock, farm animals, working animals", 22.22]], [["cattle, bovinae", 27.17], ["livestock, farm animals, working animals", 25.24], ["moo", 23.22]], [["livestock, farm animals, working animals", 33.6], ["moo", 27.1], ["cattle, bovinae", 24.31]], null, [["music", 25.23], ["boing", 21.4], ["whack, thwack", 16.64]], [["music", 36.67], ["speech", 13.93], ["throbbing", 9.27]], [["foghorn", 53.7], ["music", 19.51], ["speech", 10.91]], [["music", 26.17], ["speech", 8.11], ["livestock, farm animals, working animals", 6.85]], null, null, null], "duration": [0.55, 2.25, 4.53, 1.04, 2.79, 11.01, 4.79, 3.58, 1.8, 6.8, 19.29, 6.02, 12.86, -0.1, 1.56, 0.43]} \ No newline at end of file diff --git a/annotations_1/NjfviAKKVj4_filtered.json b/annotations_1/NjfviAKKVj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33a87b7bfaee79ced118f75deca6612079ec0106 --- /dev/null +++ b/annotations_1/NjfviAKKVj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.14], [13.0, 13.42], [16.0, 17.71], [26.0, 28.07], [31.0, 32.09], [34.0, 34.77], [36.0, 39.56], [41.0, 45.67], [47.0, 48.93], [49.0, 50.8], [52.0, 56.03], [57.0, 57.5], [59.0, 59.75], [63.0, 63.39], [66.0, 65.97], [71.0, 71.24], [72.0, 72.33], [75.0, 75.64], [76.0, 76.5], [78.0, 77.82], [80.0, 80.27], [85.0, 101.09], [102.0, 105.73], [106.0, 107.38], [108.0, 109.04], [110.0, 111.75], [114.0, 114.62], [117.0, 119.15], [120.0, 123.87], [124.0, 124.75], [127.0, 137.37], [140.0, 140.21], [141.0, 153.52], [154.0, 160.89], [163.0, 164.39], [165.0, 165.6], [169.0, 169.69], [171.0, 170.95], [172.0, 173.11], [174.0, 174.88], [176.0, 177.8]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.75, 0.0, 0.0, 98.1, 0.0, 0.0, 71.29, 47.16, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 99.95, 0.0, 0.0, 0.0, 0.0, 99.88, 99.93, 0.0, 90.43, 0.0, 100.0, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 38.71], ["hum", 13.55], ["mains hum", 12.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.14, 0.42, 1.71, 2.07, 1.09, 0.77, 3.56, 4.67, 1.93, 1.8, 4.03, 0.5, 0.75, 0.39, -0.03, 0.24, 0.33, 0.64, 0.5, -0.18, 0.27, 16.09, 3.73, 1.38, 1.04, 1.75, 0.62, 2.15, 3.87, 0.75, 10.37, 0.21, 12.52, 6.89, 1.39, 0.6, 0.69, -0.05, 1.11, 0.88, 1.8]} \ No newline at end of file diff --git a/annotations_1/NkhIROsY7Pg_filtered.json b/annotations_1/NkhIROsY7Pg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3147a4c0cbed7b12f70dcb411e2e983b0c20191e --- /dev/null +++ b/annotations_1/NkhIROsY7Pg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 53.86], [54.0, 100.68]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [47.86, 46.68]} \ No newline at end of file diff --git a/annotations_1/NkmUIQL4spM_filtered.json b/annotations_1/NkmUIQL4spM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..405d3cd1d2485d09f224521ee83f097e43c1ba51 --- /dev/null +++ b/annotations_1/NkmUIQL4spM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [7.0, 6.84], [9.0, 9.42], [11.0, 11.4], [13.0, 20.34], [31.0, 32.39], [36.0, 40.69], [43.0, 43.63], [56.0, 56.71], [59.0, 59.43], [61.0, 61.23], [64.0, 64.89], [67.0, 68.03], [70.0, 70.09], [72.0, 71.96], [73.0, 73.38], [74.0, 74.71], [76.0, 75.81], [79.0, 78.71], [80.0, 80.32], [87.0, 87.24], [88.0, 89.07], [90.0, 90.27], [92.0, 94.09], [95.0, 98.27], [99.0, 102.15], [103.0, 104.48], [107.0, 106.81], [108.0, 108.41], [109.0, 110.03], [111.0, 111.7], [116.0, 116.21], [118.0, 118.57], [122.0, 121.8], [124.0, 124.73], [126.0, 126.62], [128.0, 128.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 39.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 60.86], ["speech", 7.5], ["radio", 4.04]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, -0.16, 0.42, 0.4, 7.34, 1.39, 4.69, 0.63, 0.71, 0.43, 0.23, 0.89, 1.03, 0.09, -0.04, 0.38, 0.71, -0.19, -0.29, 0.32, 0.24, 1.07, 0.27, 2.09, 3.27, 3.15, 1.48, -0.19, 0.41, 1.03, 0.7, 0.21, 0.57, -0.2, 0.73, 0.62, 0.24]} \ No newline at end of file diff --git a/annotations_1/NkzG9RZBERE_filtered.json b/annotations_1/NkzG9RZBERE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ccd65a33d3a052ad1050a976182ee9251af4bfaa --- /dev/null +++ b/annotations_1/NkzG9RZBERE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.99], [9.0, 9.41], [10.0, 27.45], [29.0, 32.27], [33.0, 35.77], [37.0, 38.69], [41.0, 41.27], [49.0, 49.45], [51.0, 51.29], [54.0, 54.09], [56.0, 55.86], [64.0, 64.69], [76.0, 77.36], [91.0, 91.52], [97.0, 98.37], [98.0, 100.25], [101.0, 104.94], [108.0, 108.51], [117.0, 116.55], [121.0, 120.75], [124.0, 128.44], [130.0, 131.48], [134.0, 133.86], [134.0, 135.31], [142.0, 143.33], [146.0, 147.12], [149.0, 150.69], [153.0, 153.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.85, 0.0, 50.02, 89.54, 68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.39, 46.02, 0.0, 0.0, 0.0, 99.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 44.9], ["music", 21.54], ["hum", 6.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.97], ["radio", 18.32], ["fly, housefly", 1.62]], null, null, null, null, null, null, null, null, null, null, null], "duration": [4.99, 0.41, 17.45, 3.27, 2.77, 1.69, 0.27, 0.45, 0.29, 0.09, -0.14, 0.69, 1.36, 0.52, 1.37, 2.25, 3.94, 0.51, -0.45, -0.25, 4.44, 1.48, -0.14, 1.31, 1.33, 1.12, 1.69, 0.87]} \ No newline at end of file diff --git a/annotations_1/NlPC4ag5S54_filtered.json b/annotations_1/NlPC4ag5S54_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c58b115f9b406bf0adce7c0820dc16ae8837324d --- /dev/null +++ b/annotations_1/NlPC4ag5S54_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.13], [7.0, 7.62], [14.0, 26.11], [28.0, 34.94], [36.0, 54.53], [56.0, 75.76], [78.0, 87.3], [88.0, 89.28], [90.0, 93.23]], "keep_status": [false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.09, 29.96, 28.76, 30.21, 30.8, 0.0, 37.9], "audiomae_on_audioset": [null, null, [["speech", 55.69], ["electric shaver, electric razor", 9.0], ["animal", 7.03]], [["speech", 16.56], ["sidetone", 12.95], ["hum", 11.98]], [["speech", 58.62], ["music", 7.91], ["buzz", 5.17]], [["music", 36.3], ["didgeridoo", 31.51], ["throbbing", 6.69]], [["music", 69.51], ["explosion", 2.0], ["breaking", 1.46]], null, [["hum", 32.49], ["mains hum", 23.27], ["music", 15.33]]], "duration": [1.13, 0.62, 12.11, 6.94, 18.53, 19.76, 9.3, 1.28, 3.23]} \ No newline at end of file diff --git a/annotations_1/NlREC9TagHY_filtered.json b/annotations_1/NlREC9TagHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c575348b4dc91473336a6dffcd5aa6b459777f9e --- /dev/null +++ b/annotations_1/NlREC9TagHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.4], [9.0, 10.07], [24.0, 24.11], [26.0, 27.04], [29.0, 30.32], [57.0, 57.62], [78.0, 78.56], [80.0, 81.21], [91.0, 91.84], [94.0, 94.34], [96.0, 95.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 1.07, 0.11, 1.04, 1.32, 0.62, 0.56, 1.21, 0.84, 0.34, -0.14]} \ No newline at end of file diff --git a/annotations_1/NmSNUylSNvo_filtered.json b/annotations_1/NmSNUylSNvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f820b27753468435eafd9b76d90d52bdaf36f80 --- /dev/null +++ b/annotations_1/NmSNUylSNvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.62], [3.0, 4.16], [16.0, 18.33], [26.0, 26.33], [28.0, 28.02], [39.0, 39.23], [40.0, 40.46], [47.0, 50.09], [51.0, 52.59], [53.0, 56.15], [57.0, 58.7], [60.0, 65.28], [67.0, 68.25], [70.0, 70.71], [72.0, 73.09], [73.0, 73.72], [76.0, 77.41], [80.0, 80.86], [83.0, 83.34], [85.0, 88.26], [88.0, 90.51], [94.0, 94.39], [96.0, 97.36], [98.0, 101.04], [104.0, 106.64], [112.0, 113.16], [114.0, 114.74], [126.0, 126.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 76.86, 0.0, 0.0, 0.0, 0.0, 58.98, 0.0, 60.6, 0.0, 70.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 63.85, 0.0, 0.0, 66.76, 54.83, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 1.16, 2.33, 0.33, 0.02, 0.23, 0.46, 3.09, 1.59, 3.15, 1.7, 5.28, 1.25, 0.71, 1.09, 0.72, 1.41, 0.86, 0.34, 3.26, 2.51, 0.39, 1.36, 3.04, 2.64, 1.16, 0.74, 0.67]} \ No newline at end of file diff --git a/annotations_1/NnDKut3pxoU_filtered.json b/annotations_1/NnDKut3pxoU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..292d7691c53a2fefa6b4619192052d2509a3b4c1 --- /dev/null +++ b/annotations_1/NnDKut3pxoU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.47], [11.0, 12.5], [15.0, 21.9], [23.0, 30.11], [33.0, 36.88], [37.0, 97.04], [98.0, 168.4], [171.0, 171.34]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.99, 99.71, 90.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.47, 1.5, 6.9, 7.11, 3.88, 60.04, 70.4, 0.34]} \ No newline at end of file diff --git a/annotations_1/NpoB6-TCGWw_filtered.json b/annotations_1/NpoB6-TCGWw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cedaadb4b2e4469148a3f60a4b9e61d938e1388e --- /dev/null +++ b/annotations_1/NpoB6-TCGWw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [7.0, 14.22], [16.0, 30.45], [32.0, 42.75], [47.0, 52.71], [56.0, 64.08], [66.0, 66.9], [68.0, 68.82], [70.0, 83.93], [86.0, 127.94]], "keep_status": [false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 30.13, 30.8, 30.46, 40.02, 30.47, 0.0, 0.0, 31.6, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 49.79], ["mosquito", 22.51], ["insect", 15.54]], [["music", 19.63], ["speech", 16.37], ["machine gun", 14.39]], [["cacophony", 17.82], ["mains hum", 14.46], ["hum", 12.46]], [["music", 54.02], ["hum", 8.35], ["mains hum", 7.8]], [["music", 60.25], ["breaking", 5.47], ["crack", 5.41]], null, null, [["hum", 48.59], ["mains hum", 19.99], ["music", 15.91]], null], "duration": [0.57, 7.22, 14.45, 10.75, 5.71, 8.08, 0.9, 0.82, 13.93, 41.94]} \ No newline at end of file diff --git a/annotations_1/NpzigSg-YkI_filtered.json b/annotations_1/NpzigSg-YkI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2671476ba243c65759ce86beb36e80b1fc782154 --- /dev/null +++ b/annotations_1/NpzigSg-YkI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.93], [7.0, 12.04], [12.0, 16.21], [17.0, 17.17], [20.0, 20.33], [21.0, 21.15], [22.0, 24.34], [25.0, 26.43], [28.0, 28.09], [45.0, 45.12], [46.0, 48.17], [49.0, 50.84], [58.0, 60.69], [64.0, 64.18], [65.0, 69.21], [70.0, 72.47], [73.0, 73.7], [74.0, 75.9], [77.0, 77.85], [79.0, 79.35], [95.0, 101.56], [102.0, 103.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.09, 99.21, 92.48, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 97.73, 0.0, 93.45, 0.0, 81.53, 89.19, 0.0, 0.0, 0.0, 0.0, 95.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.93, 5.04, 4.21, 0.17, 0.33, 0.15, 2.34, 1.43, 0.09, 0.12, 2.17, 1.84, 2.69, 0.18, 4.21, 2.47, 0.7, 1.9, 0.85, 0.35, 6.56, 1.06]} \ No newline at end of file diff --git a/annotations_1/NqJ6llRZg-M_filtered.json b/annotations_1/NqJ6llRZg-M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d156bd290195fe04f8a11960d20bddb07a865a1 --- /dev/null +++ b/annotations_1/NqJ6llRZg-M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [9.0, 10.49], [11.0, 12.92], [14.0, 17.42], [21.0, 26.99], [27.0, 68.25]], "keep_status": [false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 45.02, 34.8, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 36.04], ["hum", 9.52], ["music", 8.06]], [["music", 39.1], ["speech", 14.45], ["whack, thwack", 4.53]], null], "duration": [0.5, 1.49, 1.92, 3.42, 5.99, 41.25]} \ No newline at end of file diff --git a/annotations_1/NqmZSSpvghU_filtered.json b/annotations_1/NqmZSSpvghU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb94840d52596674e61e7206d0448337e56462c5 --- /dev/null +++ b/annotations_1/NqmZSSpvghU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.68], [19.0, 19.2], [30.0, 31.01], [33.0, 33.64], [34.0, 35.02], [37.0, 37.96], [39.0, 39.77], [43.0, 43.63], [44.0, 46.4], [54.0, 82.29], [92.0, 92.2], [94.0, 94.59], [95.0, 98.96], [102.0, 102.91], [105.0, 105.6], [107.0, 118.71]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.62, 34.64, 0.0, 0.0, 51.28, 0.0, 0.0, 56.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 27.8], ["wood block", 10.66], ["bass guitar", 4.16]], [["music", 83.74], ["brass instrument", 0.96], ["musical instrument", 0.74]], null, null, null, null, null, null], "duration": [0.68, 0.2, 1.01, 0.64, 1.02, 0.96, 0.77, 0.63, 2.4, 28.29, 0.2, 0.59, 3.96, 0.91, 0.6, 11.71]} \ No newline at end of file diff --git a/annotations_1/Nqt6-rPGGEo_filtered.json b/annotations_1/Nqt6-rPGGEo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cceb3125340cb22f6675a1e35c312b289043b1ee --- /dev/null +++ b/annotations_1/Nqt6-rPGGEo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.54], [7.0, 10.52], [12.0, 12.51], [15.0, 15.13], [17.0, 17.32], [29.0, 30.65], [33.0, 34.65], [36.0, 36.36], [38.0, 110.32], [111.0, 112.6], [117.0, 117.66], [118.0, 118.57], [120.0, 122.93], [124.0, 127.21], [128.0, 131.26], [132.0, 132.75]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 48.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.7, 31.46, 37.25, 0.0], "audiomae_on_audioset": [null, [["music", 24.31], ["hum", 12.05], ["didgeridoo", 8.21]], null, null, null, null, null, null, null, null, null, null, [["hum", 32.29], ["music", 26.58], ["electronic music", 9.83]], [["hum", 33.37], ["whale vocalization", 14.51], ["mains hum", 10.68]], [["hum", 42.71], ["mains hum", 14.73], ["music", 12.98]], null], "duration": [1.54, 3.52, 0.51, 0.13, 0.32, 1.65, 1.65, 0.36, 72.32, 1.6, 0.66, 0.57, 2.93, 3.21, 3.26, 0.75]} \ No newline at end of file diff --git a/annotations_1/NrhBIkWlIfA_filtered.json b/annotations_1/NrhBIkWlIfA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..315285e50728775f132b53a4ff7f3cbcffc3e48a --- /dev/null +++ b/annotations_1/NrhBIkWlIfA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.97], [6.0, 6.93], [8.0, 9.39], [11.0, 13.2], [16.0, 16.26], [17.0, 18.57], [22.0, 24.33], [27.0, 28.26], [33.0, 33.96], [40.0, 42.18], [43.0, 46.4], [48.0, 49.27], [52.0, 56.84], [59.0, 63.27], [65.0, 65.45], [70.0, 73.53], [75.0, 79.12], [80.0, 82.85], [83.0, 101.01], [106.0, 106.61], [108.0, 110.91], [111.0, 113.8], [115.0, 117.12], [118.0, 123.63], [124.0, 126.84], [128.0, 137.54], [138.0, 148.47], [152.0, 152.54]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 49.97, 100.0, 0.0, 100.0, 100.0, 0.0, 100.0, 100.0, 100.0, 90.08, 0.0, 95.64, 79.76, 100.0, 87.19, 100.0, 85.72, 29.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 53.13], ["mouse", 4.7], ["clicking", 3.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 68.58], ["crowd", 17.94], ["cheering", 5.36]], null], "duration": [1.97, 0.93, 1.39, 2.2, 0.26, 1.57, 2.33, 1.26, 0.96, 2.18, 3.4, 1.27, 4.84, 4.27, 0.45, 3.53, 4.12, 2.85, 18.01, 0.61, 2.91, 2.8, 2.12, 5.63, 2.84, 9.54, 10.47, 0.54]} \ No newline at end of file diff --git a/annotations_1/NufzJ2YVJB4_filtered.json b/annotations_1/NufzJ2YVJB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dd324d311ccff4d7cceeafc3c36838f11225c78 --- /dev/null +++ b/annotations_1/NufzJ2YVJB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.91], [4.0, 6.0], [20.0, 20.46], [24.0, 24.51], [33.0, 34.87], [38.0, 38.65], [45.0, 45.99], [61.0, 61.45], [68.0, 68.13], [71.0, 70.93], [71.0, 81.21], [81.0, 88.08], [91.0, 100.77], [106.0, 106.59], [110.0, 111.18], [115.0, 116.09], [120.0, 121.63], [129.0, 129.0], [136.0, 135.78], [137.0, 137.22], [149.0, 150.04], [152.0, 153.62], [155.0, 156.29], [158.0, 160.89], [162.0, 165.77], [170.0, 176.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 58.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.96, 43.77, 51.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 72.75, 75.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.48], ["hum", 12.45], ["throbbing", 10.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.91, 2.0, 0.46, 0.51, 1.87, 0.65, 0.99, 0.45, 0.13, -0.07, 10.21, 7.08, 9.77, 0.59, 1.18, 1.09, 1.63, 0.0, -0.22, 0.22, 1.04, 1.62, 1.29, 2.89, 3.77, 6.39]} \ No newline at end of file diff --git a/annotations_1/NulXXh0cw4c_filtered.json b/annotations_1/NulXXh0cw4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd66841cde23f2a9e35891cfdd074d519cc241cc --- /dev/null +++ b/annotations_1/NulXXh0cw4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.15], [14.0, 14.17], [15.0, 15.04], [17.0, 20.93], [29.0, 29.37], [40.0, 41.23], [42.0, 42.4], [46.0, 46.38], [46.0, 49.44], [56.0, 57.08], [61.0, 61.32], [62.0, 64.03], [65.0, 65.08], [68.0, 72.28], [75.0, 109.56], [110.0, 117.49], [118.0, 117.53], [118.0, 121.71], [128.0, 138.27], [141.0, 144.85], [147.0, 160.78], [164.0, 164.51], [167.0, 167.44]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.99, 0.0, 0.0, 0.0, 0.0, 38.16, 0.0, 0.0, 66.51, 0.0, 30.0, 0.0, 30.96, 0.0, 33.83, 34.64, 36.85, 31.51, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 50.89], ["sonar", 15.47], ["hum", 8.52]], null, null, null, null, [["music", 23.7], ["moo", 19.88], ["cattle, bovinae", 14.59]], null, null, null, null, [["cattle, bovinae", 34.41], ["moo", 28.96], ["livestock, farm animals, working animals", 21.42]], null, [["music", 31.09], ["speech", 18.91], ["hum", 13.0]], null, [["music", 36.64], ["hum", 18.68], ["mains hum", 8.04]], [["hum", 30.61], ["music", 13.79], ["buzz", 5.87]], [["music", 62.24], ["buzz", 4.62], ["noise", 2.76]], [["speech", 59.82], ["music", 8.11], ["vehicle", 7.18]], null, null], "duration": [1.15, 0.17, 0.04, 3.93, 0.37, 1.23, 0.4, 0.38, 3.44, 1.08, 0.32, 2.03, 0.08, 4.28, 34.56, 7.49, -0.47, 3.71, 10.27, 3.85, 13.78, 0.51, 0.44]} \ No newline at end of file diff --git a/annotations_1/Nuwu9VTP3Ak_filtered.json b/annotations_1/Nuwu9VTP3Ak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be894863293c71d53eb03053dc445da3807617a8 --- /dev/null +++ b/annotations_1/Nuwu9VTP3Ak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.35], [8.0, 9.19], [12.0, 14.03], [15.0, 16.36], [17.0, 18.77], [23.0, 25.3], [28.0, 28.8], [32.0, 37.45], [40.0, 41.74], [43.0, 47.85], [50.0, 51.53], [53.0, 53.11], [62.0, 65.94], [70.0, 75.14], [75.0, 77.57], [78.0, 79.83], [83.0, 85.46], [88.0, 88.79], [94.0, 95.52], [96.0, 98.25], [101.0, 104.16], [111.0, 113.61], [117.0, 117.83], [121.0, 125.73]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [83.16, 0.0, 52.92, 0.0, 0.0, 47.66, 0.0, 84.8, 0.0, 88.83, 0.0, 0.0, 80.82, 50.86, 47.46, 0.0, 37.68, 0.0, 0.0, 73.51, 73.21, 78.72, 0.0, 69.2], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 24.74], ["radio", 22.48], ["sidetone", 17.99]], null, null, null, null, null, null, null, null, [["speech", 27.05], ["music", 18.12], ["hum", 9.29]], null, [["speech", 20.55], ["foghorn", 14.15], ["music", 8.91]], null, null, null, null, null, null, null], "duration": [2.35, 1.19, 2.03, 1.36, 1.77, 2.3, 0.8, 5.45, 1.74, 4.85, 1.53, 0.11, 3.94, 5.14, 2.57, 1.83, 2.46, 0.79, 1.52, 2.25, 3.16, 2.61, 0.83, 4.73]} \ No newline at end of file diff --git a/annotations_1/NvKYxRmWYEs_filtered.json b/annotations_1/NvKYxRmWYEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bcf301f0f2fc3821d049134df566f5b974bc018 --- /dev/null +++ b/annotations_1/NvKYxRmWYEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.77], [13.0, 13.29], [15.0, 16.17], [23.0, 23.85], [25.0, 25.62], [28.0, 27.8], [29.0, 29.37], [30.0, 32.85], [34.0, 35.95], [39.0, 38.8], [40.0, 41.25], [42.0, 43.53], [47.0, 48.81], [50.0, 56.2], [60.0, 68.54], [71.0, 71.47], [73.0, 74.48], [77.0, 78.26], [80.0, 80.3], [84.0, 85.55], [89.0, 89.53], [92.0, 93.53], [94.0, 95.45], [98.0, 99.22], [106.0, 109.56], [115.0, 116.11], [118.0, 118.86], [123.0, 123.7], [126.0, 126.54], [140.0, 140.24], [145.0, 148.49], [153.0, 156.12], [163.0, 163.7], [166.0, 166.97], [173.0, 173.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 41.26, 39.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13, 99.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.1], ["music", 31.58], ["theremin", 4.11]], [["speech", 27.35], ["music", 19.68], ["moo", 8.62]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.77, 0.29, 1.17, 0.85, 0.62, -0.2, 0.37, 2.85, 1.95, -0.2, 1.25, 1.53, 1.81, 6.2, 8.54, 0.47, 1.48, 1.26, 0.3, 1.55, 0.53, 1.53, 1.45, 1.22, 3.56, 1.11, 0.86, 0.7, 0.54, 0.24, 3.49, 3.12, 0.7, 0.97, 0.79]} \ No newline at end of file diff --git a/annotations_1/NvvU_4PsiKo_filtered.json b/annotations_1/NvvU_4PsiKo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f015b0341d30fe1e96d84db252fd3257cd3aaff --- /dev/null +++ b/annotations_1/NvvU_4PsiKo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.14], [8.0, 11.74], [13.0, 14.49], [15.0, 101.29]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 97.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.14, 3.74, 1.49, 86.29]} \ No newline at end of file diff --git a/annotations_1/Nwru3-Uif_Q_filtered.json b/annotations_1/Nwru3-Uif_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6eac21bebe98e865e60d32d546ed9d2aeb39ce0 --- /dev/null +++ b/annotations_1/Nwru3-Uif_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.69], [11.0, 16.41], [26.0, 26.16], [28.0, 28.41], [31.0, 30.87], [34.0, 38.13], [41.0, 46.31], [53.0, 55.93], [57.0, 58.99], [66.0, 67.27], [70.0, 71.81], [74.0, 74.51], [77.0, 77.65], [81.0, 83.07], [94.0, 98.39], [103.0, 103.5], [104.0, 107.3], [110.0, 110.47], [123.0, 126.89], [134.0, 134.5], [143.0, 143.23], [148.0, 147.65], [148.0, 151.56]], "keep_status": [false, true, false, false, false, true, false, true, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 33.3, 0.0, 0.0, 0.0, 33.65, 32.48, 36.98, 0.0, 0.0, 0.0, 0.0, 0.0, 39.0, 30.7, 0.0, 28.86, 0.0, 32.38, 0.0, 0.0, 0.0, 29.17], "audiomae_on_audioset": [null, [["didgeridoo", 26.3], ["speech", 21.11], ["music", 14.07]], null, null, null, [["theremin", 23.38], ["speech", 17.9], ["boing", 3.28]], [["moo", 47.06], ["cattle, bovinae", 23.04], ["music", 7.52]], [["music", 22.16], ["didgeridoo", 18.54], ["speech", 9.47]], null, null, null, null, null, [["moo", 40.88], ["cattle, bovinae", 29.39], ["speech", 14.96]], [["music", 17.63], ["theremin", 15.79], ["brass instrument", 13.71]], null, [["wind instrument, woodwind instrument", 25.66], ["shofar", 22.34], ["music", 11.77]], null, [["speech", 27.72], ["music", 6.23], ["animal", 5.65]], null, null, null, [["music", 52.09], ["didgeridoo", 20.73], ["musical instrument", 8.66]]], "duration": [0.69, 5.41, 0.16, 0.41, -0.13, 4.13, 5.31, 2.93, 1.99, 1.27, 1.81, 0.51, 0.65, 2.07, 4.39, 0.5, 3.3, 0.47, 3.89, 0.5, 0.23, -0.35, 3.56]} \ No newline at end of file diff --git a/annotations_1/NxCa0cVaxQo_filtered.json b/annotations_1/NxCa0cVaxQo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9048b1ab9d733a108d36aaab9ecbd2a0f2ea54a --- /dev/null +++ b/annotations_1/NxCa0cVaxQo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.46], [11.0, 10.99], [12.0, 14.72], [16.0, 16.31], [18.0, 20.34], [24.0, 24.76], [26.0, 26.59], [28.0, 29.61], [30.0, 31.19], [33.0, 33.84], [37.0, 37.2], [46.0, 46.36], [48.0, 50.04], [52.0, 52.27], [53.0, 54.58], [59.0, 59.64], [67.0, 66.8], [80.0, 81.24], [84.0, 88.97], [93.0, 93.28], [94.0, 94.66], [95.0, 96.03], [98.0, 97.66], [98.0, 98.66], [100.0, 100.82], [108.0, 108.53], [109.0, 109.65], [110.0, 126.87], [128.0, 128.63], [130.0, 130.52], [132.0, 136.8], [137.0, 140.76], [146.0, 148.88], [149.0, 151.14], [152.0, 154.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 85.72, 0.0, 53.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 31.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.65, 0.0, 0.0, 100.0, 79.24, 40.09, 62.68, 35.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 64.23], ["knock", 28.91], ["fart", 1.41]], null, null, null, null, null, null, null, null, [["speech", 42.29], ["frog", 12.57], ["insect", 8.13]], null, null, null, null, [["music", 24.2], ["speech", 11.71], ["cattle, bovinae", 9.54]], null, [["music", 34.19], ["ice cream truck, ice cream van", 9.63], ["speech", 6.79]]], "duration": [0.46, -0.01, 2.72, 0.31, 2.34, 0.76, 0.59, 1.61, 1.19, 0.84, 0.2, 0.36, 2.04, 0.27, 1.58, 0.64, -0.2, 1.24, 4.97, 0.28, 0.66, 1.03, -0.34, 0.66, 0.82, 0.53, 0.65, 16.87, 0.63, 0.52, 4.8, 3.76, 2.88, 2.14, 2.28]} \ No newline at end of file diff --git a/annotations_1/NxnafGrvcqU_filtered.json b/annotations_1/NxnafGrvcqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aeabed278272addaf1dbbf1ca9ce421e218478b8 --- /dev/null +++ b/annotations_1/NxnafGrvcqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.7], [13.0, 13.88], [15.0, 17.02], [20.0, 20.82], [22.0, 22.92], [26.0, 25.73], [26.0, 32.81], [34.0, 38.45], [39.0, 51.58], [55.0, 54.85], [58.0, 59.64], [61.0, 67.44], [69.0, 91.77], [93.0, 117.04]], "keep_status": [true, false, true, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [33.2, 0.0, 48.31, 0.0, 0.0, 0.0, 45.62, 43.43, 51.44, 0.0, 0.0, 41.91, 36.88, 33.63], "audiomae_on_audioset": [[["noise", 33.36], ["sidetone", 17.89], ["speech", 14.93]], null, [["mains hum", 25.85], ["hum", 25.77], ["music", 9.28]], null, null, null, [["creak", 22.56], ["fly, housefly", 18.37], ["mosquito", 13.39]], [["speech", 26.06], ["music", 19.97], ["musical instrument", 3.67]], null, null, null, [["speech", 52.94], ["whale vocalization", 24.56], ["music", 11.26]], [["theremin", 39.22], ["speech", 23.02], ["music", 16.78]], [["music", 66.09], ["synthesizer", 3.96], ["soundtrack music", 3.21]]], "duration": [5.7, 0.88, 2.02, 0.82, 0.92, -0.27, 6.81, 4.45, 12.58, -0.15, 1.64, 6.44, 22.77, 24.04]} \ No newline at end of file diff --git a/annotations_1/NyamI2ALbIA_filtered.json b/annotations_1/NyamI2ALbIA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7ba9af753126b6c45b38eb072b1cd00c557fabd --- /dev/null +++ b/annotations_1/NyamI2ALbIA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 13.73], [16.0, 18.62], [21.0, 22.23], [24.0, 25.19], [29.0, 39.41], [41.0, 58.31], [59.0, 59.71], [60.0, 81.01], [82.0, 86.86], [88.0, 91.59], [98.0, 100.25], [104.0, 128.51], [130.0, 143.99], [146.0, 198.22], [200.0, 221.88], [224.0, 225.91], [227.0, 227.28]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.08, 74.13, 0.0, 0.0, 49.36, 39.11, 0.0, 36.53, 65.09, 40.68, 41.3, 33.82, 32.07, 0.0, 38.84, 0.0, 0.0], "audiomae_on_audioset": [[["music", 19.28], ["gong", 17.24], ["synthesizer", 12.95]], null, null, null, [["music", 45.86], ["hum", 10.02], ["electronic music", 9.82]], [["music", 60.73], ["theremin", 11.84], ["musical instrument", 4.34]], null, [["music", 42.51], ["theremin", 36.95], ["didgeridoo", 4.8]], null, [["theremin", 75.69], ["music", 14.28], ["cello", 1.0]], [["music", 33.31], ["foghorn", 27.08], ["theremin", 12.31]], [["music", 57.89], ["clarinet", 7.48], ["brass instrument", 6.79]], [["music", 43.95], ["theremin", 36.38], ["musical instrument", 3.77]], null, [["music", 43.36], ["theremin", 33.2], ["wind instrument, woodwind instrument", 6.21]], null, null], "duration": [9.73, 2.62, 1.23, 1.19, 10.41, 17.31, 0.71, 21.01, 4.86, 3.59, 2.25, 24.51, 13.99, 52.22, 21.88, 1.91, 0.28]} \ No newline at end of file diff --git a/annotations_1/Nz4zu_fSHYY_filtered.json b/annotations_1/Nz4zu_fSHYY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..910068e5a8d15fa8c786adbc3be4676f64f8c11d --- /dev/null +++ b/annotations_1/Nz4zu_fSHYY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.52], [18.0, 19.23], [20.0, 21.68], [22.0, 23.19], [25.0, 34.75], [35.0, 39.23], [40.0, 48.95], [50.0, 56.47], [57.0, 65.26], [66.0, 83.08], [84.0, 85.08], [85.0, 97.8], [98.0, 106.34], [112.0, 125.95], [129.0, 134.35], [135.0, 135.5], [138.0, 138.57], [139.0, 143.13], [146.0, 152.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, true, true, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 74.29, 71.0, 71.29, 99.16, 99.97, 35.83, 0.0, 29.68, 34.3, 30.42, 29.6, 0.0, 0.0, 30.19, 30.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 58.65], ["musical instrument", 6.86], ["theremin", 5.39]], null, [["fireworks", 20.05], ["speech", 16.49], ["explosion", 13.88]], [["fart", 23.04], ["hum", 7.83], ["rumble", 6.1]], [["speech", 31.03], ["crowd", 9.59], ["music", 6.46]], [["cattle, bovinae", 28.41], ["moo", 20.11], ["livestock, farm animals, working animals", 6.66]], null, null, [["whale vocalization", 20.64], ["speech", 9.34], ["cattle, bovinae", 7.09]], [["cattle, bovinae", 32.09], ["moo", 23.96], ["livestock, farm animals, working animals", 13.83]]], "duration": [1.52, 1.23, 1.68, 1.19, 9.75, 4.23, 8.95, 6.47, 8.26, 17.08, 1.08, 12.8, 8.34, 13.95, 5.35, 0.5, 0.57, 4.13, 6.54]} \ No newline at end of file diff --git a/annotations_1/NzCTDwlquaQ_filtered.json b/annotations_1/NzCTDwlquaQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0147516d7f7cdacf5667caa23485728c3b70aecd --- /dev/null +++ b/annotations_1/NzCTDwlquaQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[76.0, 109.46], [113.0, 116.38], [120.0, 120.41], [124.0, 124.14], [125.0, 125.15]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 30.62, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 31.15], ["musical instrument", 8.99], ["classical music", 8.56]], null, null, null], "duration": [33.46, 3.38, 0.41, 0.14, 0.15]} \ No newline at end of file diff --git a/annotations_1/NzJH4towI_A_filtered.json b/annotations_1/NzJH4towI_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8ed8a04ca81c39e8112024835a5b0b94e94b25b --- /dev/null +++ b/annotations_1/NzJH4towI_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.57], [9.0, 8.8], [15.0, 15.8], [16.0, 23.67], [26.0, 26.0], [27.0, 28.09], [30.0, 34.01], [35.0, 36.19], [38.0, 38.58], [42.0, 42.63], [45.0, 45.2], [47.0, 48.9], [49.0, 55.34], [58.0, 58.06], [58.0, 59.05], [60.0, 60.98], [68.0, 69.67], [77.0, 81.08], [83.0, 83.46], [85.0, 85.89], [88.0, 88.42], [92.0, 91.98], [94.0, 94.58], [96.0, 97.16], [98.0, 99.59], [102.0, 104.79], [110.0, 111.11], [115.0, 123.8], [124.0, 134.1], [135.0, 135.19], [136.0, 137.62], [138.0, 140.61], [143.0, 145.98]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.91, 0.0, 0.0, 30.86, 0.0, 0.0, 0.0, 0.0, 0.0, 31.04, 0.0, 0.0, 0.0, 0.0, 30.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.81, 0.0, 45.05, 31.16, 0.0, 0.0, 37.39, 37.54], "audiomae_on_audioset": [null, null, null, [["music", 37.47], ["throbbing", 15.0], ["mains hum", 12.33]], null, null, [["hum", 25.82], ["mains hum", 17.67], ["music", 10.82]], null, null, null, null, null, [["music", 26.78], ["speech", 18.75], ["throbbing", 12.76]], null, null, null, null, [["music", 68.26], ["rumble", 5.03], ["hum", 3.09]], null, null, null, null, null, null, null, [["music", 22.82], ["crow", 9.99], ["caw", 9.07]], null, [["hum", 38.59], ["throbbing", 33.48], ["music", 11.02]], [["music", 24.9], ["speech", 24.9], ["hum", 16.75]], null, null, [["music", 60.91], ["hum", 5.27], ["sidetone", 5.19]], [["music", 32.96], ["throbbing", 25.17], ["hum", 14.94]]], "duration": [0.57, -0.2, 0.8, 7.67, 0.0, 1.09, 4.01, 1.19, 0.58, 0.63, 0.2, 1.9, 6.34, 0.06, 1.05, 0.98, 1.67, 4.08, 0.46, 0.89, 0.42, -0.02, 0.58, 1.16, 1.59, 2.79, 1.11, 8.8, 10.1, 0.19, 1.62, 2.61, 2.98]} \ No newline at end of file diff --git a/annotations_1/O-QaGllHqN0_filtered.json b/annotations_1/O-QaGllHqN0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0ef9e61d109ff6e97a47edcb11fcc1f60053df0 --- /dev/null +++ b/annotations_1/O-QaGllHqN0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.85], [12.0, 12.28], [13.0, 14.98], [17.0, 17.76], [19.0, 23.19], [25.0, 25.47], [28.0, 30.81], [34.0, 36.41], [39.0, 41.71], [47.0, 47.97], [49.0, 49.5], [57.0, 60.51], [61.0, 68.82], [72.0, 94.27]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.65, 0.0, 32.72, 30.69, 31.89, 0.0, 0.0, 36.29, 31.41, 31.38], "audiomae_on_audioset": [null, null, null, null, [["music", 36.41], ["hum", 21.78], ["mains hum", 19.15]], null, [["mains hum", 46.3], ["hum", 27.98], ["music", 10.72]], [["grunt", 24.83], ["whale vocalization", 7.75], ["music", 7.29]], [["music", 41.21], ["whale vocalization", 8.94], ["hum", 6.85]], null, null, [["music", 38.97], ["hum", 25.51], ["mains hum", 14.92]], [["hum", 59.61], ["mains hum", 34.74], ["throbbing", 3.08]], [["music", 34.22], ["livestock, farm animals, working animals", 9.03], ["cattle, bovinae", 8.42]]], "duration": [0.85, 0.28, 1.98, 0.76, 4.19, 0.47, 2.81, 2.41, 2.71, 0.97, 0.5, 3.51, 7.82, 22.27]} \ No newline at end of file diff --git a/annotations_1/O-W3C2RQduY_filtered.json b/annotations_1/O-W3C2RQduY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a3eb37f620c314101e43e5519667fa2a67feda2 --- /dev/null +++ b/annotations_1/O-W3C2RQduY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.13], [8.0, 8.73], [13.0, 15.53], [20.0, 21.57], [32.0, 32.44], [38.0, 44.73], [46.0, 53.03], [61.0, 61.37], [67.0, 68.77], [74.0, 74.55], [77.0, 79.46], [80.0, 87.24], [88.0, 110.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 36.03, 0.0, 0.0, 57.4, 30.85, 0.0, 0.0, 0.0, 31.01, 29.05, 29.07], "audiomae_on_audioset": [null, null, [["music", 59.69], ["throbbing", 9.95], ["hum", 4.97]], null, null, null, [["speech", 55.16], ["music", 11.05], ["sidetone", 6.04]], null, null, null, [["music", 58.43], ["theremin", 4.54], ["electronic music", 3.78]], [["speech", 22.72], ["electric shaver, electric razor", 20.34], ["throbbing", 12.02]], [["speech", 46.65], ["music", 27.41], ["throbbing", 6.2]]], "duration": [0.13, 0.73, 2.53, 1.57, 0.44, 6.73, 7.03, 0.37, 1.77, 0.55, 2.46, 7.24, 22.08]} \ No newline at end of file diff --git a/annotations_1/O0fQ_rrQedE_filtered.json b/annotations_1/O0fQ_rrQedE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..739c78d92c7f572739a87655df2d624effc7865e --- /dev/null +++ b/annotations_1/O0fQ_rrQedE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 16.04], [20.0, 20.88], [23.0, 25.22], [26.0, 29.91], [34.0, 34.06], [35.0, 37.4], [40.0, 40.09], [47.0, 48.0], [51.0, 55.43], [62.0, 77.28], [79.0, 86.68], [87.0, 88.28], [89.0, 89.77], [91.0, 92.16], [93.0, 93.21], [97.0, 101.76], [121.0, 125.86]], "keep_status": [false, false, false, true, false, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [29.4, 0.0, 30.24, 30.55, 0.0, 32.29, 0.0, 0.0, 39.01, 29.68, 30.4, 0.0, 0.0, 0.0, 0.0, 30.14, 32.03], "audiomae_on_audioset": [[["music", 76.83], ["didgeridoo", 3.01], ["singing", 2.46]], null, [["music", 65.87], ["hum", 3.97], ["throbbing", 3.13]], [["music", 54.78], ["speech", 6.07], ["didgeridoo", 5.48]], null, [["music", 30.21], ["cattle, bovinae", 18.33], ["moo", 13.9]], null, null, [["music", 33.45], ["speech", 15.74], ["hum", 14.77]], [["mains hum", 40.97], ["hum", 25.84], ["music", 9.52]], [["music", 63.51], ["speech", 12.82], ["musical instrument", 2.31]], null, null, null, null, [["music", 57.94], ["speech", 12.01], ["electronic music", 5.43]], [["music", 38.68], ["throbbing", 18.95], ["hum", 13.42]]], "duration": [11.04, 0.88, 2.22, 3.91, 0.06, 2.4, 0.09, 1.0, 4.43, 15.28, 7.68, 1.28, 0.77, 1.16, 0.21, 4.76, 4.86]} \ No newline at end of file diff --git a/annotations_1/O12Ve5AFu7o_filtered.json b/annotations_1/O12Ve5AFu7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18b403577c4faf48b2fdf42414f888934b73d0a6 --- /dev/null +++ b/annotations_1/O12Ve5AFu7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 58.41], [60.0, 75.98], [80.0, 104.18], [110.0, 111.1], [114.0, 115.75]], "keep_status": [false, false, true, false, false], "silence_prob": [32.33, 32.06, 31.29, 0.0, 0.0], "audiomae_on_audioset": [[["music", 39.42], ["speech", 26.39], ["groan", 13.53]], [["music", 65.79], ["didgeridoo", 13.54], ["musical instrument", 2.7]], [["fly, housefly", 23.38], ["music", 14.33], ["insect", 11.99]], null, null], "duration": [15.41, 15.98, 24.18, 1.1, 1.75]} \ No newline at end of file diff --git a/annotations_1/O2yNsybczj4_filtered.json b/annotations_1/O2yNsybczj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98c68c35b1298f8c7da46d84d604b164544c86df --- /dev/null +++ b/annotations_1/O2yNsybczj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.21], [14.0, 14.76], [16.0, 26.06], [27.0, 30.1], [31.0, 32.44], [34.0, 35.06], [37.0, 38.11], [40.0, 42.11], [47.0, 48.17], [50.0, 51.09], [54.0, 55.39], [57.0, 58.19], [60.0, 61.92], [63.0, 63.66], [66.0, 66.23], [67.0, 67.07], [68.0, 73.06], [74.0, 75.29], [78.0, 79.51], [81.0, 81.73], [84.0, 86.16], [87.0, 89.11], [90.0, 94.86], [99.0, 98.78], [100.0, 101.85], [104.0, 104.58], [105.0, 106.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 53.22, 94.22, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 100.0, 100.0, 41.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["crushing", 21.43], ["mains hum", 17.85], ["hum", 16.25]], null, null, null, null], "duration": [1.21, 0.76, 10.06, 3.1, 1.44, 1.06, 1.11, 2.11, 1.17, 1.09, 1.39, 1.19, 1.92, 0.66, 0.23, 0.07, 5.06, 1.29, 1.51, 0.73, 2.16, 2.11, 4.86, -0.22, 1.85, 0.58, 1.1]} \ No newline at end of file diff --git a/annotations_1/O3-W1ng-UWI_filtered.json b/annotations_1/O3-W1ng-UWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc8244ef2cc56c7dc09668ea425d64d2f33c97d6 --- /dev/null +++ b/annotations_1/O3-W1ng-UWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [4.0, 4.83], [5.0, 6.86], [9.0, 9.19], [15.0, 15.99], [17.0, 18.12], [19.0, 19.47], [28.0, 32.07], [32.0, 32.46], [34.0, 33.94], [38.0, 43.02], [51.0, 51.88], [55.0, 54.72], [57.0, 57.72], [67.0, 68.55], [73.0, 73.38], [78.0, 80.1], [85.0, 85.38], [97.0, 99.59], [101.0, 102.81], [104.0, 106.34], [107.0, 108.14], [111.0, 110.88], [112.0, 113.07], [133.0, 133.83], [138.0, 140.48], [141.0, 141.42], [142.0, 142.57], [144.0, 145.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.34, 0.0, 0.0, 58.3, 0.0, 0.0, 0.0, 0.0, 0.0, 53.72, 0.0, 41.72, 0.0, 82.79, 0.0, 0.0, 0.0, 0.0, 33.31, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 88.6], ["radio", 3.77], ["noise", 1.69]], null, null, null, null, null, null, null, null, null, null, [["speech", 82.85], ["telephone", 8.25], ["radio", 3.98]], null, null, null, null, null, null, [["speech", 29.08], ["music", 20.04], ["didgeridoo", 5.39]], null, null, null], "duration": [0.81, 0.83, 1.86, 0.19, 0.99, 1.12, 0.47, 4.07, 0.46, -0.06, 5.02, 0.88, -0.28, 0.72, 1.55, 0.38, 2.1, 0.38, 2.59, 1.81, 2.34, 1.14, -0.12, 1.07, 0.83, 2.48, 0.42, 0.57, 1.62]} \ No newline at end of file diff --git a/annotations_1/O4TmwflckcU_filtered.json b/annotations_1/O4TmwflckcU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7f145d66f78e6bbc4b009032f22d8d6a50f5b37 --- /dev/null +++ b/annotations_1/O4TmwflckcU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.34], [9.0, 10.03], [11.0, 11.77], [15.0, 15.57], [18.0, 17.79], [19.0, 19.58], [21.0, 32.26], [34.0, 33.94], [38.0, 38.96], [40.0, 40.32], [49.0, 49.64], [53.0, 54.28], [56.0, 56.03], [57.0, 59.76], [60.0, 61.03], [62.0, 63.31], [64.0, 66.41], [67.0, 69.04], [72.0, 71.95], [78.0, 78.68], [80.0, 80.87], [87.0, 89.77], [93.0, 93.66], [102.0, 102.42], [109.0, 114.96], [119.0, 119.16], [124.0, 124.17], [127.0, 134.0], [145.0, 147.16], [150.0, 150.15], [155.0, 155.7], [158.0, 158.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 92.31, 41.36, 0.0, 0.0, 0.0, 46.26, 0.0, 0.0, 33.86, 0.0, 0.0, 40.77, 32.63, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 45.21], ["throbbing", 18.44], ["hum", 17.22]], null, null, null, null, null, null, null, null, null, null, [["speech", 38.69], ["music", 33.95], ["didgeridoo", 3.85]], null, null, null, [["music", 45.46], ["synthesizer", 7.01], ["musical instrument", 6.96]], null, null, [["music", 44.93], ["speech", 20.62], ["foghorn", 12.69]], null, null, [["speech", 31.49], ["music", 24.72], ["foghorn", 15.87]], [["fly, housefly", 32.55], ["mosquito", 17.38], ["speech", 9.98]], null, null, null], "duration": [0.34, 1.03, 0.77, 0.57, -0.21, 0.58, 11.26, -0.06, 0.96, 0.32, 0.64, 1.28, 0.03, 2.76, 1.03, 1.31, 2.41, 2.04, -0.05, 0.68, 0.87, 2.77, 0.66, 0.42, 5.96, 0.16, 0.17, 7.0, 2.16, 0.15, 0.7, 0.33]} \ No newline at end of file diff --git a/annotations_1/O4brzUAaTS0_filtered.json b/annotations_1/O4brzUAaTS0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d2c2f2997cc2b4db0e431802d9c98c17c935cc9 --- /dev/null +++ b/annotations_1/O4brzUAaTS0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 32.16], [40.0, 41.89], [62.0, 61.96], [68.0, 68.77], [77.0, 83.08], [86.0, 91.4], [99.0, 102.42], [109.0, 112.16], [124.0, 124.17], [127.0, 128.16], [129.0, 130.17], [144.0, 143.99], [146.0, 145.86], [149.0, 157.72], [158.0, 159.48], [161.0, 165.97], [182.0, 191.32], [216.0, 216.11], [222.0, 222.66], [226.0, 226.67]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [33.24, 0.0, 0.0, 0.0, 35.33, 40.31, 33.8, 35.01, 0.0, 0.0, 0.0, 0.0, 0.0, 36.25, 0.0, 49.27, 41.07, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 47.41], ["music", 24.48], ["foghorn", 4.32]], null, null, null, [["music", 32.06], ["throbbing", 20.28], ["hum", 15.48]], [["music", 65.58], ["speech", 13.93], ["electronic music", 3.1]], [["throbbing", 33.15], ["hum", 19.24], ["music", 17.06]], [["music", 68.0], ["musical instrument", 6.31], ["buzz", 2.27]], null, null, null, null, null, [["music", 51.73], ["hum", 11.95], ["noise", 6.31]], null, [["music", 24.3], ["speech", 14.85], ["noise", 13.91]], [["music", 57.52], ["theremin", 14.87], ["synthesizer", 7.56]], null, null, null], "duration": [23.16, 1.89, -0.04, 0.77, 6.08, 5.4, 3.42, 3.16, 0.17, 1.16, 1.17, -0.01, -0.14, 8.72, 1.48, 4.97, 9.32, 0.11, 0.66, 0.67]} \ No newline at end of file diff --git a/annotations_1/O6Stx_mwAVY_filtered.json b/annotations_1/O6Stx_mwAVY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a23d37e99240f7fd7ccb0b6f1071e7b9cde884bb --- /dev/null +++ b/annotations_1/O6Stx_mwAVY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.22], [9.0, 9.46], [10.0, 10.61], [12.0, 12.7], [18.0, 19.18], [20.0, 21.41], [23.0, 23.16], [26.0, 26.7], [28.0, 28.71], [43.0, 44.1], [48.0, 56.12], [57.0, 59.04], [65.0, 65.87], [71.0, 73.7], [80.0, 80.52], [82.0, 83.51], [84.0, 86.34], [88.0, 88.13], [92.0, 93.12], [95.0, 97.14], [98.0, 104.53], [107.0, 108.89], [110.0, 111.05], [113.0, 118.02], [119.0, 122.98], [124.0, 127.23], [129.0, 128.95], [129.0, 129.34], [130.0, 134.5], [135.0, 135.77], [146.0, 152.64], [153.0, 156.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [51.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.96, 68.28, 0.0, 56.55, 0.0, 0.0, 58.22, 0.0, 0.0, 45.75, 56.78, 0.0, 0.0, 58.47, 33.37, 38.46, 0.0, 0.0, 45.59, 0.0, 59.07, 37.69], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.47], ["speech", 23.38], ["singing bowl", 20.14]], null, null, null, null, [["music", 49.07], ["speech", 14.51], ["throbbing", 5.71]], [["music", 28.53], ["speech", 26.34], ["hum", 5.09]], null, null, [["music", 53.34], ["speech", 31.33], ["electronic music", 2.26]], null, null, [["music", 57.88], ["speech", 25.81], ["hum", 2.88]]], "duration": [2.22, 0.46, 0.61, 0.7, 1.18, 1.41, 0.16, 0.7, 0.71, 1.1, 8.12, 2.04, 0.87, 2.7, 0.52, 1.51, 2.34, 0.13, 1.12, 2.14, 6.53, 1.89, 1.05, 5.02, 3.98, 3.23, -0.05, 0.34, 4.5, 0.77, 6.64, 3.96]} \ No newline at end of file diff --git a/annotations_1/O7S9X8e2uhA_filtered.json b/annotations_1/O7S9X8e2uhA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..563e9a48cf1cc7eadfffcd340728e6eb659871de --- /dev/null +++ b/annotations_1/O7S9X8e2uhA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.4], [4.0, 4.43], [4.0, 4.5], [5.0, 4.56], [5.0, 4.6], [5.0, 5.78], [8.0, 13.83], [19.0, 19.57], [20.0, 19.72], [20.0, 32.95], [37.0, 52.27], [54.0, 54.62], [56.0, 57.64], [64.0, 63.96], [65.0, 65.8], [66.0, 66.55], [76.0, 77.16], [86.0, 86.75], [89.0, 89.02], [91.0, 92.64], [94.0, 96.4], [97.0, 96.94], [97.0, 97.02], [97.0, 97.23], [99.0, 99.81], [104.0, 122.86], [126.0, 125.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.67, 0.0, 0.0, 30.51, 30.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.25, 0.0, 0.0, 0.0, 0.0, 31.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["cattle, bovinae", 36.45], ["livestock, farm animals, working animals", 29.44], ["moo", 17.72]], null, null, [["music", 63.0], ["didgeridoo", 21.19], ["musical instrument", 2.74]], [["speech", 41.79], ["music", 24.78], ["theremin", 4.03]], null, null, null, null, null, null, null, null, null, [["music", 64.76], ["synthesizer", 4.21], ["theremin", 2.74]], null, null, null, null, [["hum", 46.2], ["mains hum", 19.21], ["throbbing", 14.26]], null], "duration": [0.4, 0.43, 0.5, -0.44, -0.4, 0.78, 5.83, 0.57, -0.28, 12.95, 15.27, 0.62, 1.64, -0.04, 0.8, 0.55, 1.16, 0.75, 0.02, 1.64, 2.4, -0.06, 0.02, 0.23, 0.81, 18.86, -0.17]} \ No newline at end of file diff --git a/annotations_1/O7jHiw8IyxQ_filtered.json b/annotations_1/O7jHiw8IyxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd00766ce2c54e15a61f8d8d909af00a7a62e2a5 --- /dev/null +++ b/annotations_1/O7jHiw8IyxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.82], [20.0, 19.99], [20.0, 22.17], [26.0, 26.33], [34.0, 34.43], [40.0, 40.59], [42.0, 41.99], [51.0, 51.81], [58.0, 60.39], [68.0, 68.71], [70.0, 70.65], [85.0, 89.78], [93.0, 94.76], [98.0, 107.45], [110.0, 135.11], [136.0, 145.77]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 42.28, 0.0, 0.0, 0.0, 0.0, 0.0, 30.43, 0.0, 0.0, 29.96, 0.0, 29.95, 29.99, 30.59], "audiomae_on_audioset": [null, null, [["speech", 36.82], ["music", 24.99], ["synthesizer", 6.23]], null, null, null, null, null, [["music", 29.38], ["throbbing", 15.12], ["hum", 13.22]], null, null, [["music", 47.06], ["hum", 8.45], ["throbbing", 7.69]], null, [["hum", 34.7], ["music", 27.95], ["mains hum", 24.32]], [["music", 32.62], ["mains hum", 19.23], ["hum", 16.18]], [["music", 59.5], ["cacophony", 9.02], ["throbbing", 8.41]]], "duration": [0.82, -0.01, 2.17, 0.33, 0.43, 0.59, -0.01, 0.81, 2.39, 0.71, 0.65, 4.78, 1.76, 9.45, 25.11, 9.77]} \ No newline at end of file diff --git a/annotations_1/O7z6rV8Gdbs_filtered.json b/annotations_1/O7z6rV8Gdbs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2983bcf200dc0fb15d9858b06d2a5d107dfaf1cd --- /dev/null +++ b/annotations_1/O7z6rV8Gdbs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.09], [11.0, 42.2], [43.0, 73.63], [77.0, 78.31], [79.0, 87.35], [89.0, 93.36], [94.0, 94.44], [95.0, 119.72], [123.0, 138.87]], "keep_status": [true, false, false, false, true, false, false, true, true], "silence_prob": [28.78, 0.0, 0.0, 0.0, 30.71, 28.82, 0.0, 28.72, 28.65], "audiomae_on_audioset": [[["music", 23.31], ["whack, thwack", 13.58], ["fart", 10.85]], null, null, null, [["speech", 26.8], ["music", 23.45], ["hum", 9.62]], [["music", 73.32], ["speech", 7.19], ["throbbing", 5.8]], null, [["music", 27.3], ["hum", 23.16], ["throbbing", 14.15]], [["sound effect", 35.98], ["music", 11.14], ["whack, thwack", 5.33]]], "duration": [8.09, 31.2, 30.63, 1.31, 8.35, 4.36, 0.44, 24.72, 15.87]} \ No newline at end of file diff --git a/annotations_1/O9Q_5-rAw_k_filtered.json b/annotations_1/O9Q_5-rAw_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7de72c74ffd28e80731340c71c833139ee96d4ae --- /dev/null +++ b/annotations_1/O9Q_5-rAw_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.78], [9.0, 10.67], [11.0, 13.04], [13.0, 19.41], [21.0, 22.13], [24.0, 25.29], [27.0, 29.19], [29.0, 29.29], [29.0, 41.0], [41.0, 45.05], [47.0, 48.63], [50.0, 50.82], [59.0, 58.97], [60.0, 64.12], [65.0, 65.4], [72.0, 83.19], [84.0, 87.15], [90.0, 99.42], [102.0, 107.38], [115.0, 120.68], [125.0, 125.51], [127.0, 129.69], [131.0, 132.44], [133.0, 134.4], [142.0, 142.11], [142.0, 163.48], [166.0, 166.58], [168.0, 175.34]], "keep_status": [false, false, false, true, false, false, true, false, false, true, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [73.36, 0.0, 41.1, 35.28, 0.0, 0.0, 29.01, 0.0, 30.88, 36.02, 0.0, 0.0, 0.0, 32.52, 0.0, 29.28, 31.12, 29.69, 29.44, 29.66, 0.0, 54.23, 0.0, 0.0, 0.0, 29.42, 0.0, 31.04], "audiomae_on_audioset": [null, null, [["speech", 45.64], ["music", 42.53], ["throbbing", 0.98]], [["music", 28.37], ["hum", 18.7], ["throbbing", 17.57]], null, null, [["music", 57.77], ["throbbing", 4.28], ["motorcycle", 4.26]], null, [["music", 50.64], ["hum", 26.26], ["throbbing", 9.0]], [["music", 39.33], ["synthesizer", 5.59], ["inside, small room", 3.93]], null, null, null, [["music", 62.08], ["breaking", 9.4], ["whack, thwack", 6.67]], null, [["hum", 32.01], ["music", 31.86], ["throbbing", 16.46]], [["music", 55.2], ["crushing", 6.53], ["electronic music", 5.02]], [["music", 59.46], ["throbbing", 18.01], ["hum", 9.58]], [["music", 50.63], ["throbbing", 20.71], ["speech", 9.71]], [["music", 33.0], ["hum", 18.51], ["throbbing", 17.5]], null, null, null, null, null, [["music", 63.59], ["throbbing", 22.58], ["hum", 4.02]], null, [["breaking", 19.21], ["music", 16.37], ["smash, crash", 10.03]]], "duration": [5.78, 1.67, 2.04, 6.41, 1.13, 1.29, 2.19, 0.29, 12.0, 4.05, 1.63, 0.82, -0.03, 4.12, 0.4, 11.19, 3.15, 9.42, 5.38, 5.68, 0.51, 2.69, 1.44, 1.4, 0.11, 21.48, 0.58, 7.34]} \ No newline at end of file diff --git a/annotations_1/OArHd5pe8Ls_filtered.json b/annotations_1/OArHd5pe8Ls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b797a383e643be92a852860197d1311e6f77f57 --- /dev/null +++ b/annotations_1/OArHd5pe8Ls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.85], [5.0, 29.69], [30.0, 88.45], [89.0, 91.81], [92.0, 105.16], [107.0, 114.91], [115.0, 119.43], [126.0, 131.99]], "keep_status": [false, false, false, true, true, false, true, false], "silence_prob": [0.0, 30.46, 0.0, 34.1, 35.52, 35.09, 42.76, 31.39], "audiomae_on_audioset": [null, [["music", 80.86], ["theremin", 2.85], ["electronic music", 1.32]], null, [["music", 35.85], ["thunk", 10.52], ["carnatic music", 5.63]], [["music", 23.53], ["whack, thwack", 10.3], ["tuning fork", 8.12]], [["didgeridoo", 68.3], ["music", 18.75], ["mosquito", 2.73]], [["music", 34.99], ["theremin", 23.43], ["mosquito", 5.36]], [["didgeridoo", 35.43], ["theremin", 24.28], ["music", 16.78]]], "duration": [-0.15, 24.69, 58.45, 2.81, 13.16, 7.91, 4.43, 5.99]} \ No newline at end of file diff --git a/annotations_1/OAtwRoFSlOE_filtered.json b/annotations_1/OAtwRoFSlOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..722d3aaeb7785cedd992fd8b25cf4f4a103ba748 --- /dev/null +++ b/annotations_1/OAtwRoFSlOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.78], [14.0, 19.36], [21.0, 29.02], [30.0, 36.12], [37.0, 41.86], [42.0, 44.04], [45.0, 49.13], [50.0, 51.39], [52.0, 53.38], [54.0, 61.45], [62.0, 66.9], [68.0, 78.8], [80.0, 81.14], [82.0, 83.35], [85.0, 85.85], [86.0, 88.96], [90.0, 92.2], [94.0, 97.34], [100.0, 100.68], [106.0, 108.87], [110.0, 110.54], [112.0, 114.49], [117.0, 118.07], [119.0, 120.53], [123.0, 123.82], [125.0, 125.96], [126.0, 130.25], [132.0, 133.32], [136.0, 138.27], [143.0, 152.04], [154.0, 154.62], [156.0, 165.86]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 65.2, 70.16, 48.44, 89.54, 71.87, 97.64, 0.0, 0.0, 99.26, 48.23, 40.95, 0.0, 0.0, 0.0, 72.9, 60.7, 73.82, 0.0, 90.25, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 89.9, 0.0, 97.64, 38.55, 0.0, 33.4], "audiomae_on_audioset": [null, null, null, [["music", 23.44], ["throbbing", 11.74], ["synthesizer", 9.05]], null, null, null, null, null, null, [["chirp tone", 15.6], ["sine wave", 13.19], ["hum", 12.16]], [["whale vocalization", 19.13], ["grunt", 17.9], ["animal", 12.7]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["outside, rural or natural", 7.59], ["echo", 7.36], ["groan", 5.66]], null, [["speech", 26.47], ["noise", 15.55], ["sidetone", 9.46]]], "duration": [1.78, 5.36, 8.02, 6.12, 4.86, 2.04, 4.13, 1.39, 1.38, 7.45, 4.9, 10.8, 1.14, 1.35, 0.85, 2.96, 2.2, 3.34, 0.68, 2.87, 0.54, 2.49, 1.07, 1.53, 0.82, 0.96, 4.25, 1.32, 2.27, 9.04, 0.62, 9.86]} \ No newline at end of file diff --git a/annotations_1/OBXQr25dHQE_filtered.json b/annotations_1/OBXQr25dHQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd095c3fbf10d498208d42b29bb6c44a1d184e70 --- /dev/null +++ b/annotations_1/OBXQr25dHQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.13], [25.0, 29.79], [30.0, 33.78], [34.0, 37.79], [39.0, 51.51], [54.0, 78.14], [78.0, 90.73], [91.0, 106.89]], "keep_status": [false, true, false, false, false, false, false, true], "silence_prob": [0.0, 39.41, 38.36, 33.41, 72.46, 36.31, 30.77, 29.15], "audiomae_on_audioset": [null, [["music", 51.21], ["wind instrument, woodwind instrument", 9.67], ["musical instrument", 7.38]], [["cattle, bovinae", 33.73], ["moo", 23.23], ["livestock, farm animals, working animals", 14.72]], [["speech", 79.15], ["civil defense siren", 2.98], ["hum", 2.88]], null, [["music", 44.06], ["theremin", 38.51], ["wind instrument, woodwind instrument", 4.99]], [["music", 47.05], ["speech", 19.27], ["theremin", 11.18]], [["music", 34.75], ["livestock, farm animals, working animals", 15.19], ["cattle, bovinae", 6.79]]], "duration": [0.13, 4.79, 3.78, 3.79, 12.51, 24.14, 12.73, 15.89]} \ No newline at end of file diff --git a/annotations_1/OByY45anMr4_filtered.json b/annotations_1/OByY45anMr4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2d98ef30fc51030b4824ec9fa624dba7b5d1694 --- /dev/null +++ b/annotations_1/OByY45anMr4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.81], [15.0, 14.89], [16.0, 16.34], [17.0, 17.74], [19.0, 19.68], [20.0, 22.18], [24.0, 25.83], [27.0, 29.69], [31.0, 31.29], [33.0, 33.88], [35.0, 36.12], [37.0, 37.86], [39.0, 42.52], [43.0, 43.39], [48.0, 48.76], [54.0, 54.11], [55.0, 58.24], [60.0, 60.05], [64.0, 68.47], [69.0, 71.9], [74.0, 76.01], [77.0, 80.65], [81.0, 85.62], [93.0, 94.17], [95.0, 94.85], [97.0, 98.36], [101.0, 101.65], [102.0, 102.9], [104.0, 105.68], [107.0, 111.97], [112.0, 114.74], [115.0, 114.81], [115.0, 116.29], [117.0, 118.02], [118.0, 124.31], [125.0, 126.17], [127.0, 129.2], [133.0, 134.15], [135.0, 140.59], [141.0, 143.38], [144.0, 149.54], [150.0, 163.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.86, 0.0, 0.0, 0.0, 0.0, 53.78, 0.0, 55.67, 0.0, 0.0, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 78.04, 0.0, 79.07, 68.02, 81.89, 63.31, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 48.82, 0.0, 0.0, 0.0, 64.97, 0.0, 86.82, 0.0, 77.7, 94.07, 96.42, 74.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.74], ["speech", 28.25], ["hum", 3.79]], null, null, null, null, null, null, null, null, null, null, null], "duration": [8.81, -0.11, 0.34, 0.74, 0.68, 2.18, 1.83, 2.69, 0.29, 0.88, 1.12, 0.86, 3.52, 0.39, 0.76, 0.11, 3.24, 0.05, 4.47, 2.9, 2.01, 3.65, 4.62, 1.17, -0.15, 1.36, 0.65, 0.9, 1.68, 4.97, 2.74, -0.19, 1.29, 1.02, 6.31, 1.17, 2.2, 1.15, 5.59, 2.38, 5.54, 13.22]} \ No newline at end of file diff --git a/annotations_1/ODIZKyevVxQ_filtered.json b/annotations_1/ODIZKyevVxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f7e9640704e428f98f2bb1bf4bffb0867f8d6a6 --- /dev/null +++ b/annotations_1/ODIZKyevVxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.13], [16.0, 16.66], [22.0, 22.33], [23.0, 24.22], [29.0, 29.46], [33.0, 35.33], [38.0, 38.69], [40.0, 41.01], [42.0, 43.5], [46.0, 53.81], [57.0, 64.22], [70.0, 73.4], [74.0, 75.24], [78.0, 88.82], [90.0, 91.23], [93.0, 94.49], [96.0, 98.98], [99.0, 100.13], [102.0, 103.54], [104.0, 104.8], [106.0, 109.04], [111.0, 111.59], [112.0, 113.46], [121.0, 123.94], [124.0, 126.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [29.37, 0.0, 0.0, 0.0, 0.0, 29.24, 0.0, 0.0, 0.0, 30.61, 28.96, 29.38, 0.0, 30.4, 0.0, 0.0, 29.02, 0.0, 0.0, 0.0, 29.99, 0.0, 0.0, 28.58, 28.75], "audiomae_on_audioset": [[["speech", 34.59], ["music", 31.67], ["hum", 5.94]], null, null, null, null, [["speech", 57.84], ["fixed-wing aircraft, airplane", 11.62], ["aircraft", 9.08]], null, null, null, [["music", 38.37], ["hum", 24.9], ["mains hum", 13.3]], [["mains hum", 30.19], ["speech", 17.52], ["sidetone", 15.1]], [["hum", 13.59], ["aircraft", 11.47], ["mains hum", 11.26]], null, [["buzz", 18.1], ["music", 12.89], ["hum", 9.88]], null, null, [["music", 40.87], ["mains hum", 9.91], ["pulse", 5.8]], null, null, null, [["vehicle", 19.55], ["aircraft", 11.47], ["fixed-wing aircraft, airplane", 9.14]], null, null, [["speech", 63.75], ["explosion", 11.79], ["vehicle", 5.48]], [["speech", 72.29], ["field recording", 2.91], ["vehicle", 2.25]]], "duration": [8.13, 0.66, 0.33, 1.22, 0.46, 2.33, 0.69, 1.01, 1.5, 7.81, 7.22, 3.4, 1.24, 10.82, 1.23, 1.49, 2.98, 1.13, 1.54, 0.8, 3.04, 0.59, 1.46, 2.94, 2.42]} \ No newline at end of file diff --git a/annotations_1/ODeWs0Eu8n0_filtered.json b/annotations_1/ODeWs0Eu8n0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30809103841a87a56ffc264c69158e6df662720d --- /dev/null +++ b/annotations_1/ODeWs0Eu8n0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.74], [8.0, 12.66], [14.0, 17.63], [19.0, 36.96], [38.0, 40.34], [41.0, 43.55], [44.0, 45.3], [46.0, 47.46], [48.0, 50.6], [51.0, 53.08], [57.0, 58.09], [59.0, 59.95], [63.0, 84.64], [85.0, 88.38], [90.0, 92.06], [93.0, 92.72], [93.0, 92.91], [95.0, 94.78], [96.0, 99.59], [100.0, 101.41], [103.0, 104.89], [106.0, 110.64], [117.0, 118.59], [136.0, 137.69], [147.0, 146.85], [147.0, 146.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [94.37, 99.99, 99.44, 99.99, 99.8, 84.43, 0.0, 0.0, 99.85, 54.36, 0.0, 0.0, 70.58, 41.76, 39.43, 0.0, 0.0, 0.0, 42.44, 0.0, 0.0, 36.85, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.09], ["door", 6.91], ["inside, small room", 3.95]], [["speech", 43.0], ["thunk", 16.91], ["music", 7.3]], null, null, null, [["speech", 42.24], ["music", 19.88], ["mains hum", 7.08]], null, null, [["music", 46.24], ["didgeridoo", 12.95], ["speech", 7.81]], null, null, null, null], "duration": [2.74, 4.66, 3.63, 17.96, 2.34, 2.55, 1.3, 1.46, 2.6, 2.08, 1.09, 0.95, 21.64, 3.38, 2.06, -0.28, -0.09, -0.22, 3.59, 1.41, 1.89, 4.64, 1.59, 1.69, -0.15, -0.03]} \ No newline at end of file diff --git a/annotations_1/OE7aSKZDjTo_filtered.json b/annotations_1/OE7aSKZDjTo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2beb916cec2ec95f4345822e9a58a2d3c00257d6 --- /dev/null +++ b/annotations_1/OE7aSKZDjTo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 51.97], [53.0, 53.43], [55.0, 55.71], [59.0, 59.71], [63.0, 68.39], [72.0, 72.74], [74.0, 84.18], [85.0, 85.95], [88.0, 88.55], [90.0, 90.44], [91.0, 91.5], [98.0, 99.33], [100.0, 101.43], [104.0, 113.0], [114.0, 115.8], [117.0, 118.13], [119.0, 120.5], [123.0, 124.11], [127.0, 128.75], [130.0, 133.25], [135.0, 142.94], [147.0, 166.97], [169.0, 176.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [33.18, 0.0, 0.0, 0.0, 64.29, 0.0, 35.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.59, 0.0, 0.0, 0.0, 0.0, 0.0, 59.15, 51.88, 44.04, 42.98], "audiomae_on_audioset": [[["music", 47.81], ["theremin", 28.7], ["scary music", 3.81]], null, null, null, null, null, [["music", 64.66], ["speech", 20.07], ["grunt", 5.18]], null, null, null, null, null, null, [["music", 33.65], ["speech", 15.21], ["gong", 11.05]], null, null, null, null, null, null, null, [["theremin", 68.53], ["music", 21.21], ["synthesizer", 2.19]], [["music", 41.1], ["ambient music", 10.86], ["theremin", 9.93]]], "duration": [7.97, 0.43, 0.71, 0.71, 5.39, 0.74, 10.18, 0.95, 0.55, 0.44, 0.5, 1.33, 1.43, 9.0, 1.8, 1.13, 1.5, 1.11, 1.75, 3.25, 7.94, 19.97, 7.89]} \ No newline at end of file diff --git a/annotations_1/OFDJnI4RczY_filtered.json b/annotations_1/OFDJnI4RczY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fa9266c04a383e65fe8cd5b5f36b554fc72e96e --- /dev/null +++ b/annotations_1/OFDJnI4RczY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.63], [2.0, 3.06], [5.0, 5.09], [7.0, 7.67], [9.0, 9.39], [15.0, 15.38], [16.0, 19.26], [21.0, 22.72], [24.0, 24.41], [25.0, 26.4], [30.0, 33.0], [42.0, 43.58], [46.0, 45.98], [47.0, 50.16], [53.0, 53.67], [54.0, 55.34], [56.0, 56.51], [57.0, 58.29], [59.0, 62.24], [70.0, 72.3], [73.0, 73.45], [75.0, 75.32], [76.0, 76.23], [79.0, 79.51], [80.0, 79.57], [80.0, 81.33], [82.0, 83.03], [83.0, 83.67], [87.0, 89.63], [91.0, 91.27], [92.0, 93.45], [98.0, 98.47], [104.0, 106.19], [111.0, 111.06], [114.0, 115.25], [123.0, 124.23], [130.0, 133.29], [137.0, 143.14], [144.0, 144.58], [148.0, 148.66], [154.0, 156.69], [157.0, 159.11]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.43, 0.0, 0.0, 0.0, 55.96, 0.0, 0.0, 33.53, 0.0, 0.0, 0.0, 0.0, 81.53, 82.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.43, 0.0, 0.0, 0.0, 43.25, 0.0, 0.0, 0.0, 79.94, 49.13, 0.0, 0.0, 54.56, 45.49], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 33.34], ["sidetone", 15.05], ["fly, housefly", 10.88]], null, null, null, null, null, null, [["speech", 55.53], ["mains hum", 12.55], ["hum", 8.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.47], ["hum", 26.49], ["heart sounds, heartbeat", 5.53]], null, null, null, [["music", 40.75], ["quack", 11.52], ["musical instrument", 6.39]], null, null, null, null, [["music", 57.17], ["hum", 6.25], ["mains hum", 3.08]], null, null, null, [["music", 74.18], ["boing", 5.25], ["musical instrument", 2.29]]], "duration": [0.63, 1.06, 0.09, 0.67, 0.39, 0.38, 3.26, 1.72, 0.41, 1.4, 3.0, 1.58, -0.02, 3.16, 0.67, 1.34, 0.51, 1.29, 3.24, 2.3, 0.45, 0.32, 0.23, 0.51, -0.43, 1.33, 1.03, 0.67, 2.63, 0.27, 1.45, 0.47, 2.19, 0.06, 1.25, 1.23, 3.29, 6.14, 0.58, 0.66, 2.69, 2.11]} \ No newline at end of file diff --git a/annotations_1/OFJKL2POF5I_filtered.json b/annotations_1/OFJKL2POF5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b618b92ea07db96f60deb6d15679d342056c76e3 --- /dev/null +++ b/annotations_1/OFJKL2POF5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.77], [6.0, 6.45], [7.0, 11.37], [14.0, 14.99], [17.0, 16.9], [18.0, 18.28], [19.0, 29.94], [32.0, 33.4], [37.0, 43.56], [45.0, 55.61], [59.0, 63.59], [64.0, 64.4], [66.0, 67.24], [71.0, 74.8], [81.0, 82.17], [84.0, 87.1], [89.0, 96.08], [107.0, 108.9]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 42.04, 0.0, 0.0, 0.0, 45.82, 0.0, 55.53, 43.9, 41.14, 0.0, 0.0, 37.76, 0.0, 39.77, 38.83, 0.0], "audiomae_on_audioset": [null, null, [["speech", 54.4], ["sidetone", 15.28], ["music", 6.7]], null, null, null, [["music", 64.4], ["speech", 7.91], ["didgeridoo", 5.57]], null, null, [["music", 44.2], ["mains hum", 10.44], ["speech", 8.25]], [["hum", 26.57], ["music", 23.36], ["mains hum", 20.15]], null, null, [["music", 76.01], ["didgeridoo", 6.85], ["speech", 3.28]], null, [["music", 33.4], ["hum", 4.21], ["sound effect", 3.41]], [["music", 49.23], ["didgeridoo", 12.68], ["speech", 12.03]], null], "duration": [0.77, 0.45, 4.37, 0.99, -0.1, 0.28, 10.94, 1.4, 6.56, 10.61, 4.59, 0.4, 1.24, 3.8, 1.17, 3.1, 7.08, 1.9]} \ No newline at end of file diff --git a/annotations_1/OGEfW_fV9ZI_filtered.json b/annotations_1/OGEfW_fV9ZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ede5645b8d449db1cf2289fb4e215f5ac305a68a --- /dev/null +++ b/annotations_1/OGEfW_fV9ZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.45], [19.0, 19.84], [22.0, 24.09], [25.0, 27.67], [29.0, 28.97], [30.0, 30.6], [33.0, 33.57], [36.0, 36.44], [37.0, 37.25], [41.0, 41.18], [45.0, 45.08], [46.0, 47.8], [53.0, 53.43], [55.0, 55.31], [56.0, 56.29], [58.0, 58.16], [61.0, 61.84], [63.0, 63.17], [64.0, 64.3], [65.0, 65.31], [66.0, 66.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 76.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.84, 2.09, 2.67, -0.03, 0.6, 0.57, 0.44, 0.25, 0.18, 0.08, 1.8, 0.43, 0.31, 0.29, 0.16, 0.84, 0.17, 0.3, 0.31, 0.9]} \ No newline at end of file diff --git a/annotations_1/OHCVQcnqGcY_filtered.json b/annotations_1/OHCVQcnqGcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37ac68adb1285095088709b02633c88aeb45bee9 --- /dev/null +++ b/annotations_1/OHCVQcnqGcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 45.52], [53.0, 72.28], [72.0, 79.35], [83.0, 92.79], [94.0, 93.93], [95.0, 95.47], [102.0, 102.79], [104.0, 103.99], [111.0, 110.61], [112.0, 113.34], [126.0, 129.27], [134.0, 134.54], [136.0, 136.63], [137.0, 137.39], [138.0, 138.1], [144.0, 144.88], [147.0, 147.9], [149.0, 148.95], [152.0, 153.89], [155.0, 156.12], [157.0, 157.49], [159.0, 161.77], [165.0, 165.5]], "keep_status": [true, true, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.6, 31.47, 33.71, 33.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.76, 0.0], "audiomae_on_audioset": [[["hum", 23.33], ["whack, thwack", 11.1], ["music", 10.14]], [["music", 35.1], ["speech", 7.81], ["whack, thwack", 7.6]], [["hum", 27.52], ["didgeridoo", 15.23], ["mains hum", 14.32]], [["hum", 30.55], ["music", 9.6], ["sidetone", 9.47]], null, null, null, null, null, null, [["animal", 12.82], ["cattle, bovinae", 11.18], ["speech", 10.84]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.52, 19.28, 7.35, 9.79, -0.07, 0.47, 0.79, -0.01, -0.39, 1.34, 3.27, 0.54, 0.63, 0.39, 0.1, 0.88, 0.9, -0.05, 1.89, 1.12, 0.49, 2.77, 0.5]} \ No newline at end of file diff --git a/annotations_1/OIf1BFh8UwA_filtered.json b/annotations_1/OIf1BFh8UwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8870663568b54ced962963d0f073f6f635a7340b --- /dev/null +++ b/annotations_1/OIf1BFh8UwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.29], [29.0, 30.55], [34.0, 34.2], [38.0, 37.69], [41.0, 41.84], [43.0, 49.77], [52.0, 52.14], [53.0, 54.33], [55.0, 55.05], [57.0, 58.77], [69.0, 69.77], [86.0, 85.82], [87.0, 90.51], [96.0, 103.0], [107.0, 109.86], [111.0, 114.89], [125.0, 127.03], [131.0, 135.14], [136.0, 137.84], [141.0, 147.45], [150.0, 157.18], [160.0, 173.21], [174.0, 173.65], [174.0, 173.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 41.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.85, 30.99, 39.67, 29.65, 32.22, 30.12, 0.0, 30.66, 33.84, 29.37, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 53.39], ["music", 19.38], ["didgeridoo", 9.35]], null, null, null, null, null, null, [["rumble", 23.74], ["hum", 23.67], ["music", 15.88]], [["music", 72.59], ["synthesizer", 3.82], ["throbbing", 3.6]], [["music", 66.02], ["synthesizer", 6.42], ["mains hum", 4.2]], [["mains hum", 41.05], ["hum", 27.98], ["throbbing", 13.43]], [["music", 30.63], ["hum", 21.6], ["mains hum", 20.35]], [["cattle, bovinae", 13.75], ["moo", 13.68], ["music", 11.66]], null, [["music", 18.31], ["fly, housefly", 17.02], ["mosquito", 14.46]], [["didgeridoo", 77.28], ["music", 7.41], ["throbbing", 6.5]], [["music", 39.4], ["speech", 20.51], ["synthesizer", 4.37]], null, null], "duration": [0.29, 1.55, 0.2, -0.31, 0.84, 6.77, 0.14, 1.33, 0.05, 1.77, 0.77, -0.18, 3.51, 7.0, 2.86, 3.89, 2.03, 4.14, 1.84, 6.45, 7.18, 13.21, -0.35, -0.25]} \ No newline at end of file diff --git a/annotations_1/OJyRbpjlrmA_filtered.json b/annotations_1/OJyRbpjlrmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7035069589d16f0889fd2b450eb4ab6edba8d45 --- /dev/null +++ b/annotations_1/OJyRbpjlrmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.46], [7.0, 7.03], [12.0, 13.47], [15.0, 17.04], [19.0, 19.43], [27.0, 27.06], [31.0, 31.28], [33.0, 34.03], [42.0, 43.63], [44.0, 45.37], [47.0, 47.55], [49.0, 50.18], [52.0, 53.06], [62.0, 61.6], [65.0, 65.45], [66.0, 67.15], [72.0, 73.48], [86.0, 85.95], [88.0, 88.21], [105.0, 105.51], [107.0, 107.45], [116.0, 116.75], [118.0, 124.73], [126.0, 126.44], [127.0, 127.75], [128.0, 128.65], [133.0, 133.79], [135.0, 136.49], [137.0, 139.58], [140.0, 143.38], [144.0, 145.52], [146.0, 146.75], [148.0, 148.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.72, 0.0, 0.0, 0.0, 0.0, 0.0, 75.72, 78.38, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 41.11], ["animal", 14.41], ["speech", 11.1]], null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 0.03, 1.47, 2.04, 0.43, 0.06, 0.28, 1.03, 1.63, 1.37, 0.55, 1.18, 1.06, -0.4, 0.45, 1.15, 1.48, -0.05, 0.21, 0.51, 0.45, 0.75, 6.73, 0.44, 0.75, 0.65, 0.79, 1.49, 2.58, 3.38, 1.52, 0.75, 0.78]} \ No newline at end of file diff --git a/annotations_1/OLZhL2R4cfg_filtered.json b/annotations_1/OLZhL2R4cfg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..907f98b5eafadc513c03bdaa5c8a1394fa268128 --- /dev/null +++ b/annotations_1/OLZhL2R4cfg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.47], [12.0, 12.7], [26.0, 26.23], [40.0, 41.17], [42.0, 43.16], [45.0, 46.35], [52.0, 52.25], [65.0, 64.72], [82.0, 87.86], [92.0, 91.98], [95.0, 97.85], [100.0, 110.44], [111.0, 112.06], [113.0, 115.25], [120.0, 125.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, true, true], "silence_prob": [37.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 0.0, 45.3, 32.22, 0.0, 39.27, 30.75], "audiomae_on_audioset": [[["music", 48.93], ["speech", 18.0], ["synthesizer", 9.13]], null, null, null, null, null, null, null, null, null, [["music", 50.46], ["throbbing", 7.14], ["hum", 6.21]], [["music", 34.28], ["speech", 19.37], ["didgeridoo", 13.08]], null, [["music", 46.36], ["synthesizer", 13.76], ["musical instrument", 5.87]], [["speech", 28.99], ["music", 26.47], ["didgeridoo", 6.51]]], "duration": [2.47, 0.7, 0.23, 1.17, 1.16, 1.35, 0.25, -0.28, 5.86, -0.02, 2.85, 10.44, 1.06, 2.25, 5.95]} \ No newline at end of file diff --git a/annotations_1/ONRzdzRMVsQ_filtered.json b/annotations_1/ONRzdzRMVsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3351f223f0068550d29a4155ab33b8caafba1606 --- /dev/null +++ b/annotations_1/ONRzdzRMVsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.62], [7.0, 7.53], [8.0, 14.25], [16.0, 16.71], [17.0, 18.06], [21.0, 22.05], [23.0, 23.89], [25.0, 26.03], [26.0, 27.35], [28.0, 33.22], [37.0, 42.25], [46.0, 46.45], [51.0, 51.9], [55.0, 54.97], [57.0, 57.47], [59.0, 59.37], [61.0, 61.69], [62.0, 63.02], [63.0, 64.56], [65.0, 65.7], [66.0, 66.83], [69.0, 69.8], [70.0, 71.95], [74.0, 74.82], [76.0, 79.71], [81.0, 81.3], [82.0, 82.44], [83.0, 83.56], [85.0, 86.21], [90.0, 90.56], [93.0, 93.92], [95.0, 95.08], [98.0, 98.05], [99.0, 103.45], [106.0, 107.54], [110.0, 110.52], [113.0, 114.32], [117.0, 128.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 90.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 0.0, 0.0, 83.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 0.53, 6.25, 0.71, 1.06, 1.05, 0.89, 1.03, 1.35, 5.22, 5.25, 0.45, 0.9, -0.03, 0.47, 0.37, 0.69, 1.02, 1.56, 0.7, 0.83, 0.8, 1.95, 0.82, 3.71, 0.3, 0.44, 0.56, 1.21, 0.56, 0.92, 0.08, 0.05, 4.45, 1.54, 0.52, 1.32, 11.95]} \ No newline at end of file diff --git a/annotations_1/OO4LqRUxinE_filtered.json b/annotations_1/OO4LqRUxinE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d17a12f82b98549dfe9834d440faeefdd172540f --- /dev/null +++ b/annotations_1/OO4LqRUxinE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 33.64], [35.0, 50.13], [52.0, 64.93], [67.0, 68.98], [78.0, 87.44], [91.0, 92.16], [96.0, 98.78], [101.0, 112.36], [117.0, 130.74], [133.0, 143.6], [144.0, 148.64], [154.0, 154.68]], "keep_status": [false, true, true, false, true, false, true, true, true, true, true, false], "silence_prob": [0.0, 29.52, 29.02, 0.0, 28.95, 0.0, 31.62, 29.2, 29.55, 28.77, 28.8, 0.0], "audiomae_on_audioset": [null, [["music", 46.3], ["speech", 15.01], ["vehicle", 6.54]], [["speech", 46.48], ["music", 12.63], ["explosion", 10.81]], null, [["speech", 46.16], ["music", 17.86], ["eruption", 3.59]], null, [["music", 27.56], ["fly, housefly", 7.82], ["hum", 3.69]], [["music", 45.28], ["speech", 10.16], ["outside, rural or natural", 4.49]], [["foghorn", 19.48], ["music", 17.47], ["vehicle", 7.31]], [["speech", 47.31], ["music", 17.44], ["outside, urban or manmade", 3.5]], [["music", 42.71], ["speech", 13.11], ["crowd", 6.7]], null], "duration": [0.64, 15.13, 12.93, 1.98, 9.44, 1.16, 2.78, 11.36, 13.74, 10.6, 4.64, 0.68]} \ No newline at end of file diff --git a/annotations_1/OPuOk309lSE_filtered.json b/annotations_1/OPuOk309lSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edcbdb759ea2f6969808ce29b99943aabeaf246c --- /dev/null +++ b/annotations_1/OPuOk309lSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.52], [9.0, 11.33], [20.0, 21.64], [23.0, 24.39], [26.0, 27.16], [30.0, 30.67], [32.0, 32.73], [38.0, 39.33], [47.0, 49.11], [56.0, 77.33], [78.0, 81.01], [83.0, 84.27], [89.0, 90.58], [91.0, 92.87], [97.0, 98.31], [103.0, 103.87], [105.0, 110.13], [112.0, 113.37], [116.0, 116.23], [117.0, 118.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 99.93, 77.53, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 2.33, 1.64, 1.39, 1.16, 0.67, 0.73, 1.33, 2.11, 21.33, 3.01, 1.27, 1.58, 1.87, 1.31, 0.87, 5.13, 1.37, 0.23, 1.23]} \ No newline at end of file diff --git a/annotations_1/ORV1uYzvZzo_filtered.json b/annotations_1/ORV1uYzvZzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de3880aec17769b84c25a28bf95ccf29826fbe68 --- /dev/null +++ b/annotations_1/ORV1uYzvZzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.51], [5.0, 6.15], [7.0, 7.11], [8.0, 8.38], [10.0, 10.76], [18.0, 18.2], [20.0, 20.73], [32.0, 32.34], [37.0, 37.66], [41.0, 41.44], [46.0, 45.82], [47.0, 47.53], [48.0, 48.19], [49.0, 49.77], [52.0, 51.93], [62.0, 64.07], [67.0, 67.73], [69.0, 69.92], [72.0, 73.9], [75.0, 75.69], [77.0, 77.46], [79.0, 82.61], [83.0, 84.23], [86.0, 86.21], [89.0, 89.67], [91.0, 92.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 1.15, 0.11, 0.38, 0.76, 0.2, 0.73, 0.34, 0.66, 0.44, -0.18, 0.53, 0.19, 0.77, -0.07, 2.07, 0.73, 0.92, 1.9, 0.69, 0.46, 3.61, 1.23, 0.21, 0.67, 1.15]} \ No newline at end of file diff --git a/annotations_1/ORrQKFliVLM_filtered.json b/annotations_1/ORrQKFliVLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91229571674995508506aa0ccdcf843dc6aa65e3 --- /dev/null +++ b/annotations_1/ORrQKFliVLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.84], [4.0, 5.31], [10.0, 17.59], [19.0, 25.24], [28.0, 29.1], [31.0, 32.78], [34.0, 48.15], [51.0, 51.36], [57.0, 80.37], [82.0, 121.98], [124.0, 134.81], [137.0, 177.5], [182.0, 184.59], [185.0, 185.48], [187.0, 190.0], [192.0, 219.6], [225.0, 228.63], [231.0, 247.68], [249.0, 264.83]], "keep_status": [false, false, true, true, false, false, false, false, true, false, false, false, true, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 29.23, 29.27, 0.0, 0.0, 30.3, 0.0, 28.83, 0.0, 28.57, 0.0, 29.41, 0.0, 29.42, 29.46, 29.93, 28.94, 29.17], "audiomae_on_audioset": [null, null, [["music", 18.44], ["smash, crash", 12.62], ["whack, thwack", 12.6]], [["speech", 37.77], ["music", 24.98], ["explosion", 4.69]], null, null, [["speech", 34.44], ["music", 31.95], ["throbbing", 4.44]], null, [["speech", 27.4], ["music", 25.56], ["vehicle", 6.51]], null, [["music", 70.92], ["speech", 11.65], ["electronic music", 2.77]], null, [["music", 42.86], ["speech", 15.9], ["rumble", 5.77]], null, [["music", 65.08], ["speech", 15.51], ["smash, crash", 3.7]], [["music", 24.61], ["speech", 22.94], ["hum", 8.26]], [["speech", 64.53], ["music", 6.5], ["whack, thwack", 5.91]], [["speech", 36.05], ["explosion", 17.24], ["eruption", 5.63]], [["music", 30.16], ["speech", 14.5], ["foghorn", 5.68]]], "duration": [1.84, 1.31, 7.59, 6.24, 1.1, 1.78, 14.15, 0.36, 23.37, 39.98, 10.81, 40.5, 2.59, 0.48, 3.0, 27.6, 3.63, 16.68, 15.83]} \ No newline at end of file diff --git a/annotations_1/OS0rZQtDsoc_filtered.json b/annotations_1/OS0rZQtDsoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..179ffba532d4d345218eaafb3c37c685347cc779 --- /dev/null +++ b/annotations_1/OS0rZQtDsoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[101.0, 103.87]], "keep_status": [true], "silence_prob": [45.02], "audiomae_on_audioset": [[["music", 35.3], ["hum", 15.33], ["sonar", 9.23]]], "duration": [2.87]} \ No newline at end of file diff --git a/annotations_1/OSkFsRL177o_filtered.json b/annotations_1/OSkFsRL177o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a02160107bb82046a666ca2d58b74ce9bdaa8ccc --- /dev/null +++ b/annotations_1/OSkFsRL177o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.8], [10.0, 10.61], [12.0, 12.29], [14.0, 15.09], [18.0, 29.2], [31.0, 32.88], [34.0, 34.65], [37.0, 39.04], [40.0, 42.13], [43.0, 46.53], [48.0, 107.64], [108.0, 108.28], [110.0, 114.61], [117.0, 118.5], [122.0, 125.42], [129.0, 131.72], [133.0, 161.67], [166.0, 168.4], [170.0, 171.46], [173.0, 173.87]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.67, 0.0, 0.0, 48.27, 37.37, 45.95, 0.0, 0.0, 38.64, 0.0, 32.57, 40.24, 29.32, 63.96, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 76.61], ["ambient music", 5.34], ["electronic music", 3.9]], null, null, [["music", 46.29], ["electronic music", 4.48], ["rumble", 3.57]], [["music", 36.63], ["whale vocalization", 6.65], ["theremin", 3.61]], [["speech", 65.59], ["hum", 3.17], ["vehicle", 3.08]], null, null, [["music", 43.11], ["hum", 8.73], ["scary music", 8.34]], null, [["music", 44.57], ["hum", 22.68], ["mains hum", 13.15]], [["music", 61.2], ["hum", 3.38], ["noise", 2.84]], [["music", 57.31], ["hum", 10.83], ["buzz", 5.87]], null, null, null], "duration": [1.8, 0.61, 0.29, 1.09, 11.2, 1.88, 0.65, 2.04, 2.13, 3.53, 59.64, 0.28, 4.61, 1.5, 3.42, 2.72, 28.67, 2.4, 1.46, 0.87]} \ No newline at end of file diff --git a/annotations_1/OT61p6s77_U_filtered.json b/annotations_1/OT61p6s77_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4219abbea2fd17caeff51f14eedde180525297bd --- /dev/null +++ b/annotations_1/OT61p6s77_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.73], [8.0, 9.29], [10.0, 10.86], [11.0, 16.8], [17.0, 26.62], [29.0, 30.87], [31.0, 34.2], [36.0, 38.23], [41.0, 42.38], [42.0, 43.55], [44.0, 45.96], [51.0, 51.53], [52.0, 56.34], [59.0, 60.25], [61.0, 63.26], [67.0, 70.63], [71.0, 72.4], [75.0, 75.74], [76.0, 77.19], [80.0, 82.49], [83.0, 85.5], [88.0, 97.12], [98.0, 102.78], [104.0, 112.56], [116.0, 133.07], [135.0, 134.79], [146.0, 151.61], [152.0, 152.1], [154.0, 164.84], [167.0, 167.1], [171.0, 193.78], [194.0, 193.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, true, false, false, false, true, true, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.04, 51.23, 0.0, 58.38, 49.54, 0.0, 0.0, 0.0, 0.0, 47.31, 0.0, 39.57, 34.44, 0.0, 0.0, 0.0, 29.43, 33.2, 66.03, 66.88, 36.38, 30.71, 0.0, 33.11, 0.0, 30.09, 0.0, 29.05, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 16.53], ["music", 12.56], ["hum", 2.83]], null, null, null, null, [["hum", 24.28], ["mains hum", 20.5], ["speech", 8.73]], null, [["hum", 26.41], ["mains hum", 23.41], ["speech", 11.91]], [["speech", 34.74], ["mains hum", 19.85], ["hum", 12.05]], null, null, null, [["animal", 23.5], ["fart", 18.15], ["speech", 10.63]], [["speech", 58.26], ["didgeridoo", 5.01], ["music", 4.89]], null, null, [["speech", 37.93], ["thunk", 23.03], ["hum", 8.53]], [["hum", 45.15], ["mains hum", 22.51], ["music", 11.27]], null, [["music", 16.28], ["knock", 9.89], ["throbbing", 7.27]], null, [["hum", 34.62], ["mains hum", 26.79], ["speech", 9.45]], null, [["whale vocalization", 69.27], ["music", 7.84], ["hum", 3.82]], null], "duration": [-0.27, 1.29, 0.86, 5.8, 9.62, 1.87, 3.2, 2.23, 1.38, 1.55, 1.96, 0.53, 4.34, 1.25, 2.26, 3.63, 1.4, 0.74, 1.19, 2.49, 2.5, 9.12, 4.78, 8.56, 17.07, -0.21, 5.61, 0.1, 10.84, 0.1, 22.78, -0.06]} \ No newline at end of file diff --git a/annotations_1/OXUmjMKCR_c_filtered.json b/annotations_1/OXUmjMKCR_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7fc8e872a35ee6b01abbebe8d9e4c0eaa4607b1 --- /dev/null +++ b/annotations_1/OXUmjMKCR_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.32], [14.0, 14.15], [16.0, 16.63], [18.0, 20.75], [22.0, 21.88], [23.0, 24.12], [26.0, 27.23], [29.0, 29.79], [31.0, 31.62], [33.0, 34.28], [37.0, 38.11], [39.0, 39.56], [44.0, 44.76], [48.0, 52.17], [53.0, 55.22], [56.0, 56.17], [60.0, 60.45], [63.0, 63.42], [69.0, 70.51], [71.0, 72.64], [73.0, 74.38], [78.0, 78.14], [79.0, 79.69], [86.0, 87.44], [91.0, 92.55], [97.0, 97.93], [109.0, 110.13], [113.0, 113.21], [114.0, 114.61], [120.0, 120.87], [130.0, 136.21], [137.0, 138.65], [143.0, 144.22], [145.0, 147.92], [150.0, 150.45], [151.0, 151.75], [152.0, 156.83], [158.0, 159.22], [160.0, 162.73], [164.0, 166.82], [170.0, 171.41]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.14, 90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 100.0, 0.0, 0.0, 84.62, 0.0, 96.04, 99.97, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 19.8], ["burping, eructation", 11.1], ["speech", 7.04]], null, null, null, null, null, null, null, null, null, [["music", 30.24], ["noise", 6.0], ["stomach rumble", 4.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 0.15, 0.63, 2.75, -0.12, 1.12, 1.23, 0.79, 0.62, 1.28, 1.11, 0.56, 0.76, 4.17, 2.22, 0.17, 0.45, 0.42, 1.51, 1.64, 1.38, 0.14, 0.69, 1.44, 1.55, 0.93, 1.13, 0.21, 0.61, 0.87, 6.21, 1.65, 1.22, 2.92, 0.45, 0.75, 4.83, 1.22, 2.73, 2.82, 1.41]} \ No newline at end of file diff --git a/annotations_1/Oa6OoTVXG6E_filtered.json b/annotations_1/Oa6OoTVXG6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2296801b111f6356ded0ac846c2e13f475f3cf6 --- /dev/null +++ b/annotations_1/Oa6OoTVXG6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.24], [9.0, 9.9], [14.0, 14.22], [18.0, 19.38], [23.0, 24.8], [28.0, 35.16], [48.0, 48.24], [52.0, 56.37], [63.0, 63.64], [70.0, 70.9], [72.0, 73.33], [76.0, 76.23], [77.0, 79.3], [82.0, 83.46], [85.0, 85.9], [87.0, 91.88], [101.0, 102.98], [111.0, 117.59], [118.0, 128.38], [131.0, 135.75], [142.0, 143.38], [153.0, 154.13], [165.0, 170.02], [172.0, 172.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.87, 0.0, 42.22, 0.0, 0.0, 0.0, 0.0, 35.5, 0.0, 0.0, 38.38, 0.0, 34.61, 39.96, 37.75, 0.0, 0.0, 34.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 56.17], ["carnatic music", 12.9], ["didgeridoo", 12.55]], null, [["speech", 34.17], ["music", 26.77], ["brass instrument", 12.71]], null, null, null, null, [["moo", 17.24], ["music", 15.12], ["carnatic music", 12.24]], null, null, [["music", 34.76], ["animal", 7.99], ["dog", 7.5]], null, [["music", 68.37], ["theremin", 6.74], ["musical instrument", 2.21]], [["music", 37.31], ["trombone", 20.3], ["brass instrument", 17.42]], [["music", 60.43], ["theremin", 7.86], ["clarinet", 4.39]], null, null, [["speech", 37.56], ["music", 20.04], ["mosquito", 5.08]], null], "duration": [1.24, 0.9, 0.22, 1.38, 1.8, 7.16, 0.24, 4.37, 0.64, 0.9, 1.33, 0.23, 2.3, 1.46, 0.9, 4.88, 1.98, 6.59, 10.38, 4.75, 1.38, 1.13, 5.02, 0.4]} \ No newline at end of file diff --git a/annotations_1/ObCiRECeCdM_filtered.json b/annotations_1/ObCiRECeCdM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..123cf33dfbd09020b563b32167728fdb7dd7fe8d --- /dev/null +++ b/annotations_1/ObCiRECeCdM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 28.53], [29.0, 54.01], [54.0, 112.08], [113.0, 124.53], [125.0, 125.61], [127.0, 138.72]], "keep_status": [true, false, false, true, false, false], "silence_prob": [37.36, 34.08, 0.0, 41.66, 0.0, 57.81], "audiomae_on_audioset": [[["music", 23.74], ["hum", 18.35], ["mains hum", 11.72]], [["speech", 67.99], ["fire", 12.14], ["music", 3.7]], null, [["animal", 26.43], ["clip-clop", 16.4], ["horse", 10.68]], null, null], "duration": [21.53, 25.01, 58.08, 11.53, 0.61, 11.72]} \ No newline at end of file diff --git a/annotations_1/Oe_cBDzqBUI_filtered.json b/annotations_1/Oe_cBDzqBUI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b925ef425670703683fb45ec41454e46e65fbe1f --- /dev/null +++ b/annotations_1/Oe_cBDzqBUI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.96], [14.0, 18.99], [20.0, 26.74], [28.0, 29.47], [35.0, 35.94], [37.0, 38.4], [42.0, 43.01], [43.0, 44.86], [47.0, 48.93], [51.0, 70.97], [82.0, 91.37], [94.0, 94.46], [96.0, 96.04], [97.0, 98.68], [99.0, 109.31], [111.0, 111.67], [112.0, 124.07], [126.0, 127.47]], "keep_status": [true, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [33.54, 37.86, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.17, 29.64, 0.0, 0.0, 0.0, 30.46, 0.0, 30.54, 0.0], "audiomae_on_audioset": [[["speech", 31.66], ["hum", 19.9], ["music", 14.32]], [["cough", 20.43], ["music", 15.37], ["hum", 11.42]], null, null, null, null, null, null, null, [["hum", 48.74], ["throbbing", 17.58], ["mains hum", 14.99]], [["music", 21.95], ["smash, crash", 17.05], ["thump, thud", 8.93]], null, null, null, [["music", 59.57], ["didgeridoo", 23.45], ["throbbing", 6.09]], null, [["hum", 34.73], ["speech", 24.68], ["mains hum", 15.12]], null], "duration": [8.96, 4.99, 6.74, 1.47, 0.94, 1.4, 1.01, 1.86, 1.93, 19.97, 9.37, 0.46, 0.04, 1.68, 10.31, 0.67, 12.07, 1.47]} \ No newline at end of file diff --git a/annotations_1/OeknFyEHaMw_filtered.json b/annotations_1/OeknFyEHaMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80bb6efc65bf17a15970778e420284ac109959bb --- /dev/null +++ b/annotations_1/OeknFyEHaMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.92], [12.0, 12.5], [13.0, 17.81], [18.0, 19.35], [26.0, 28.49], [29.0, 33.13], [35.0, 37.3], [51.0, 54.58], [56.0, 63.09], [64.0, 69.47], [75.0, 75.2], [76.0, 76.57], [77.0, 77.9], [80.0, 79.95], [86.0, 89.82], [95.0, 95.27], [97.0, 98.81], [100.0, 103.11]], "keep_status": [false, false, true, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.8, 0.0, 29.02, 28.66, 30.68, 30.12, 28.69, 28.33, 0.0, 0.0, 0.0, 0.0, 30.15, 0.0, 0.0, 35.28], "audiomae_on_audioset": [null, null, [["music", 22.31], ["whack, thwack", 18.1], ["speech", 7.76]], null, [["music", 28.76], ["fly, housefly", 12.39], ["throbbing", 7.24]], [["throbbing", 9.66], ["hum", 9.55], ["mains hum", 6.88]], [["speech", 32.21], ["whale vocalization", 12.82], ["sidetone", 7.26]], [["throbbing", 48.56], ["fly, housefly", 19.24], ["music", 7.07]], [["music", 71.52], ["throbbing", 6.26], ["mosquito", 2.35]], [["throbbing", 49.02], ["hum", 33.32], ["mains hum", 3.19]], null, null, null, null, [["cattle, bovinae", 37.45], ["moo", 21.79], ["livestock, farm animals, working animals", 15.95]], null, null, [["music", 52.56], ["didgeridoo", 17.35], ["speech", 12.28]]], "duration": [-0.08, 0.5, 4.81, 1.35, 2.49, 4.13, 2.3, 3.58, 7.09, 5.47, 0.2, 0.57, 0.9, -0.05, 3.82, 0.27, 1.81, 3.11]} \ No newline at end of file diff --git a/annotations_1/OfLhd_wJux8_filtered.json b/annotations_1/OfLhd_wJux8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dd14833867e01ed241542a68bef0c9614a5d7d9 --- /dev/null +++ b/annotations_1/OfLhd_wJux8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.31], [12.0, 12.45], [13.0, 13.81], [14.0, 19.21], [24.0, 47.53], [71.0, 82.11], [94.0, 98.56], [102.0, 114.1], [115.0, 116.23], [119.0, 122.49], [123.0, 124.23], [126.0, 159.83], [161.0, 172.29], [173.0, 188.32]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.66, 32.02, 35.09, 41.81, 37.97, 0.0, 39.77, 0.0, 0.0, 51.71, 42.93], "audiomae_on_audioset": [null, null, null, [["speech", 44.62], ["music", 12.97], ["theremin", 6.58]], [["music", 45.72], ["didgeridoo", 12.94], ["throbbing", 5.45]], [["theremin", 72.48], ["music", 20.65], ["didgeridoo", 1.55]], [["music", 68.67], ["electronic music", 4.71], ["ambient music", 3.31]], [["music", 70.68], ["theremin", 5.71], ["quack", 3.75]], null, [["theremin", 49.71], ["music", 33.99], ["musical instrument", 3.41]], null, null, null, [["music", 63.76], ["musical instrument", 5.5], ["synthesizer", 5.07]]], "duration": [0.31, 0.45, 0.81, 5.21, 23.53, 11.11, 4.56, 12.1, 1.23, 3.49, 1.23, 33.83, 11.29, 15.32]} \ No newline at end of file diff --git a/annotations_1/OfXLQt6B8v4_filtered.json b/annotations_1/OfXLQt6B8v4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5ff1a05886528d87daa02b979566edab6e21579 --- /dev/null +++ b/annotations_1/OfXLQt6B8v4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 37.23], [37.0, 39.95], [44.0, 84.18], [84.0, 107.27], [110.0, 112.18], [117.0, 144.32], [145.0, 152.14], [154.0, 154.2], [159.0, 158.97], [159.0, 160.32]], "keep_status": [true, true, false, false, true, false, true, false, false, false], "silence_prob": [31.92, 29.75, 0.0, 31.16, 33.05, 28.59, 29.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 31.96], ["music", 31.22], ["hum", 3.76]], [["speech", 38.5], ["vehicle", 5.14], ["music", 3.96]], null, [["hum", 34.31], ["music", 20.29], ["mains hum", 16.17]], [["music", 21.64], ["mains hum", 21.0], ["hum", 11.38]], [["hum", 33.6], ["music", 25.96], ["mains hum", 24.34]], [["hum", 25.8], ["throbbing", 14.86], ["whale vocalization", 11.67]], null, null, null], "duration": [12.23, 2.95, 40.18, 23.27, 2.18, 27.32, 7.14, 0.2, -0.03, 1.32]} \ No newline at end of file diff --git a/annotations_1/Ofkb_7EnunM_filtered.json b/annotations_1/Ofkb_7EnunM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f81c8eeb126cc3c3890e7fc73eb05546bc24d0ce --- /dev/null +++ b/annotations_1/Ofkb_7EnunM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.08], [4.0, 6.0], [7.0, 11.1], [12.0, 13.34], [17.0, 18.74], [20.0, 19.94], [22.0, 22.2], [23.0, 24.06], [25.0, 24.87], [28.0, 29.76], [31.0, 32.66], [33.0, 34.2], [37.0, 37.52], [39.0, 39.41], [41.0, 41.64], [47.0, 49.79], [52.0, 53.25], [54.0, 55.44], [57.0, 57.54], [59.0, 62.73], [64.0, 65.13], [68.0, 68.99], [70.0, 70.43], [71.0, 71.49], [73.0, 73.63], [75.0, 75.14], [82.0, 82.7], [86.0, 86.53], [90.0, 90.85], [92.0, 93.16], [94.0, 94.49], [102.0, 102.84], [105.0, 106.07], [110.0, 111.11], [112.0, 112.16], [115.0, 116.73], [118.0, 120.28], [121.0, 122.12], [125.0, 125.22], [127.0, 128.8], [130.0, 131.67], [135.0, 136.26], [139.0, 145.18], [146.0, 147.29], [150.0, 163.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 74.92, 43.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.89, 0.0, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 95.78], "audiomae_on_audioset": [null, null, [["speech", 62.96], ["radio", 10.3], ["sidetone", 5.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 2.0, 4.1, 1.34, 1.74, -0.06, 0.2, 1.06, -0.13, 1.76, 1.66, 1.2, 0.52, 0.41, 0.64, 2.79, 1.25, 1.44, 0.54, 3.73, 1.13, 0.99, 0.43, 0.49, 0.63, 0.14, 0.7, 0.53, 0.85, 1.16, 0.49, 0.84, 1.07, 1.11, 0.16, 1.73, 2.28, 1.12, 0.22, 1.8, 1.67, 1.26, 6.18, 1.29, 13.27]} \ No newline at end of file diff --git a/annotations_1/OflOQW_pkvc_filtered.json b/annotations_1/OflOQW_pkvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf24d29b01b8f0f392f9fe19f33f0f5beaba2854 --- /dev/null +++ b/annotations_1/OflOQW_pkvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 23.3], [24.0, 26.59], [27.0, 27.85], [28.0, 28.76], [33.0, 34.06], [36.0, 38.55], [43.0, 49.86], [51.0, 51.7], [52.0, 52.59], [53.0, 89.92], [96.0, 97.58], [98.0, 103.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [42.98, 73.82, 0.0, 0.0, 0.0, 100.0, 47.78, 0.0, 0.0, 0.0, 0.0, 40.31], "audiomae_on_audioset": [[["sidetone", 51.48], ["noise", 22.43], ["microwave oven", 4.76]], null, null, null, null, null, [["arrow", 51.23], ["speech", 15.09], ["whack, thwack", 12.97]], null, null, null, null, [["speech", 39.25], ["fly, housefly", 7.57], ["mains hum", 6.25]]], "duration": [4.3, 2.59, 0.85, 0.76, 1.06, 2.55, 6.86, 0.7, 0.59, 36.92, 1.58, 5.52]} \ No newline at end of file diff --git a/annotations_1/OfnIw7Y8IUY_filtered.json b/annotations_1/OfnIw7Y8IUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8df84886f593996ac03934cb04e854ab724398c2 --- /dev/null +++ b/annotations_1/OfnIw7Y8IUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.79], [9.0, 18.99], [19.0, 20.71], [24.0, 40.66], [42.0, 77.79], [78.0, 79.07], [80.0, 82.92], [84.0, 87.27], [89.0, 92.04], [99.0, 100.68], [101.0, 102.49], [104.0, 104.16], [106.0, 107.43], [108.0, 121.12], [122.0, 124.07], [124.0, 124.21], [124.0, 124.41], [126.0, 129.78], [130.0, 131.41]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, false, true, false, false, false, true, false], "silence_prob": [30.05, 30.23, 0.0, 29.9, 0.0, 0.0, 31.43, 31.13, 31.2, 0.0, 0.0, 0.0, 0.0, 29.57, 30.71, 0.0, 0.0, 29.9, 0.0], "audiomae_on_audioset": [[["music", 45.83], ["hum", 21.03], ["throbbing", 13.51]], [["speech", 44.16], ["music", 24.43], ["gunshot, gunfire", 6.0]], null, [["music", 76.26], ["cacophony", 2.51], ["throbbing", 2.42]], null, null, [["music", 53.11], ["synthesizer", 6.89], ["musical instrument", 4.57]], [["music", 31.83], ["hum", 16.83], ["throbbing", 10.0]], [["music", 36.85], ["hum", 10.72], ["throbbing", 8.82]], null, null, null, null, [["music", 33.27], ["whack, thwack", 6.09], ["sound effect", 5.32]], [["music", 61.56], ["musical instrument", 13.29], ["guitar", 5.94]], null, null, [["breaking", 23.1], ["sound effect", 10.82], ["music", 9.32]], null], "duration": [2.79, 9.99, 1.71, 16.66, 35.79, 1.07, 2.92, 3.27, 3.04, 1.68, 1.49, 0.16, 1.43, 13.12, 2.07, 0.21, 0.41, 3.78, 1.41]} \ No newline at end of file diff --git a/annotations_1/Oh0635HLx5s_filtered.json b/annotations_1/Oh0635HLx5s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ce883a8e3d8e877274f29df05743085a4feec33 --- /dev/null +++ b/annotations_1/Oh0635HLx5s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.62], [6.0, 5.93], [7.0, 13.83], [21.0, 27.67], [29.0, 29.83], [32.0, 32.21], [35.0, 35.16], [36.0, 36.29], [37.0, 38.03], [38.0, 39.23], [43.0, 43.88], [47.0, 48.29], [52.0, 53.65], [56.0, 56.44], [58.0, 58.36], [61.0, 61.47], [64.0, 65.03], [66.0, 66.82], [67.0, 67.96], [69.0, 69.28], [72.0, 72.37], [76.0, 76.35], [79.0, 79.91], [83.0, 83.69], [104.0, 104.97], [106.0, 106.73], [110.0, 114.29], [122.0, 122.88], [126.0, 126.62], [127.0, 127.52], [128.0, 128.95], [131.0, 132.09], [132.0, 133.47], [137.0, 137.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.92, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, -0.07, 6.83, 6.67, 0.83, 0.21, 0.16, 0.29, 1.03, 1.23, 0.88, 1.29, 1.65, 0.44, 0.36, 0.47, 1.03, 0.82, 0.96, 0.28, 0.37, 0.35, 0.91, 0.69, 0.97, 0.73, 4.29, 0.88, 0.62, 0.52, 0.95, 1.09, 1.47, 0.4]} \ No newline at end of file diff --git a/annotations_1/OiJ8mt6Nn5s_filtered.json b/annotations_1/OiJ8mt6Nn5s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..457a7f3b78a36121c009cf5a2dd9a267ed86a718 --- /dev/null +++ b/annotations_1/OiJ8mt6Nn5s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.03], [7.0, 41.91], [43.0, 53.97], [55.0, 55.63], [57.0, 63.46], [64.0, 71.44], [74.0, 75.15], [75.0, 75.2], [75.0, 75.27], [75.0, 75.49], [76.0, 76.38], [78.0, 81.99], [83.0, 87.86], [89.0, 139.13], [140.0, 140.75], [142.0, 159.36]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [48.91, 0.0, 43.4, 0.0, 47.12, 44.96, 0.0, 0.0, 0.0, 0.0, 0.0, 32.94, 47.98, 0.0, 0.0, 33.26], "audiomae_on_audioset": [[["cattle, bovinae", 41.37], ["livestock, farm animals, working animals", 29.06], ["moo", 28.94]], null, [["hum", 47.67], ["mains hum", 16.47], ["sidetone", 9.66]], null, [["hum", 41.31], ["mains hum", 18.83], ["throbbing", 8.06]], [["hum", 34.35], ["mains hum", 22.4], ["rumble", 7.12]], null, null, null, null, null, [["music", 45.11], ["hum", 9.5], ["synthesizer", 8.43]], [["hum", 59.66], ["mains hum", 12.75], ["music", 6.45]], null, null, [["music", 47.3], ["theremin", 26.69], ["throbbing", 4.57]]], "duration": [2.03, 34.91, 10.97, 0.63, 6.46, 7.44, 1.15, 0.2, 0.27, 0.49, 0.38, 3.99, 4.86, 50.13, 0.75, 17.36]} \ No newline at end of file diff --git a/annotations_1/Oj8S0fNum9g_filtered.json b/annotations_1/Oj8S0fNum9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3915162b28de505fbb3f54a7a1789ba8b03c7a80 --- /dev/null +++ b/annotations_1/Oj8S0fNum9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.18], [9.0, 11.1], [15.0, 16.16], [18.0, 20.22], [23.0, 23.03], [28.0, 28.53], [30.0, 31.13], [33.0, 36.95], [43.0, 47.56], [51.0, 54.67], [59.0, 59.32], [63.0, 63.42], [64.0, 83.46], [86.0, 87.45], [89.0, 91.3], [93.0, 94.31], [98.0, 100.82], [104.0, 120.51]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 0.0, 99.82, 0.0, 0.0, 0.0, 37.38, 42.79, 33.16, 0.0, 0.0, 45.59, 0.0, 100.0, 0.0, 97.92, 78.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 22.95], ["hum", 18.07], ["sidetone", 8.22]], [["speech", 37.51], ["music", 17.78], ["glass", 6.5]], [["speech", 62.02], ["sidetone", 11.32], ["music", 8.04]], null, null, [["sidetone", 51.45], ["speech", 37.58], ["hum", 1.59]], null, null, null, null, null], "duration": [0.18, 2.1, 1.16, 2.22, 0.03, 0.53, 1.13, 3.95, 4.56, 3.67, 0.32, 0.42, 19.46, 1.45, 2.3, 1.31, 2.82, 16.51]} \ No newline at end of file diff --git a/annotations_1/OjDuQ7O9XUo_filtered.json b/annotations_1/OjDuQ7O9XUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ee9485ec3c95205e41445c218ed78a13011d0a7 --- /dev/null +++ b/annotations_1/OjDuQ7O9XUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.76], [5.0, 16.66], [20.0, 22.65], [31.0, 32.31], [34.0, 137.39], [139.0, 158.43], [158.0, 159.07], [162.0, 164.42], [168.0, 194.16], [203.0, 223.06], [225.0, 233.36], [234.0, 238.32], [241.0, 243.51], [247.0, 247.82], [261.0, 262.3], [263.0, 264.12], [265.0, 266.62], [275.0, 279.34], [283.0, 283.39], [287.0, 288.2]], "keep_status": [false, true, true, false, false, false, false, true, true, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 34.56, 49.18, 0.0, 0.0, 29.71, 0.0, 31.93, 31.91, 29.98, 30.41, 32.11, 37.3, 0.0, 0.0, 0.0, 0.0, 28.79, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 33.71], ["speech", 15.94], ["fart", 8.59]], [["didgeridoo", 30.47], ["music", 22.16], ["musical instrument", 6.22]], null, null, [["music", 60.22], ["speech", 13.23], ["sidetone", 5.59]], null, [["music", 31.04], ["foghorn", 18.02], ["trombone", 9.54]], [["speech", 44.93], ["music", 10.65], ["vehicle", 10.08]], [["music", 55.42], ["hum", 3.24], ["horse", 3.17]], [["music", 44.82], ["brass instrument", 17.02], ["trombone", 14.55]], [["music", 63.65], ["trombone", 5.49], ["brass instrument", 4.38]], [["hum", 44.85], ["throbbing", 42.73], ["heart sounds, heartbeat", 4.35]], null, null, null, null, [["speech", 18.99], ["music", 18.34], ["hum", 7.71]], null, null], "duration": [0.76, 11.66, 2.65, 1.31, 103.39, 19.43, 1.07, 2.42, 26.16, 20.06, 8.36, 4.32, 2.51, 0.82, 1.3, 1.12, 1.62, 4.34, 0.39, 1.2]} \ No newline at end of file diff --git a/annotations_1/OjkIBSE3yfY_filtered.json b/annotations_1/OjkIBSE3yfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab2e81576cd43645d7c9fc600149f775fb597283 --- /dev/null +++ b/annotations_1/OjkIBSE3yfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [6.0, 6.57], [14.0, 21.83], [26.0, 26.32], [27.0, 28.31], [29.0, 30.2], [31.0, 33.13], [44.0, 44.85], [46.0, 47.8], [50.0, 53.57], [58.0, 61.64], [63.0, 68.79], [70.0, 70.82], [72.0, 72.67], [77.0, 81.99], [110.0, 113.0], [117.0, 117.53], [119.0, 119.23], [123.0, 123.58]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.2, 0.0, 0.0, 0.0, 96.29, 0.0, 0.0, 42.6, 58.55, 36.76, 0.0, 0.0, 49.59, 80.82, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 38.07], ["livestock, farm animals, working animals", 12.36], ["speech", 9.23]], null, null, null, null, null, null, [["sidetone", 27.23], ["speech", 26.7], ["music", 13.29]], null, [["music", 61.32], ["speech", 11.78], ["boing", 4.17]], null, null, [["music", 70.56], ["speech", 6.93], ["musical instrument", 2.6]], null, null, null, null], "duration": [0.34, 0.57, 7.83, 0.32, 1.31, 1.2, 2.13, 0.85, 1.8, 3.57, 3.64, 5.79, 0.82, 0.67, 4.99, 3.0, 0.53, 0.23, 0.58]} \ No newline at end of file diff --git a/annotations_1/Ok3_qMNWAo0_filtered.json b/annotations_1/Ok3_qMNWAo0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..514e8327f448371cccb7094f8e6d90c573332cba --- /dev/null +++ b/annotations_1/Ok3_qMNWAo0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 48.54], [50.0, 56.35], [57.0, 59.09], [63.0, 72.76], [78.0, 78.88], [80.0, 81.7], [82.0, 89.7], [93.0, 93.8], [94.0, 95.37], [98.0, 99.86], [100.0, 104.25], [106.0, 109.21], [113.0, 116.61], [118.0, 121.49], [123.0, 124.61]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 64.29, 40.06, 92.97, 0.0, 0.0, 58.38, 0.0, 0.0, 0.0, 66.88, 38.3, 93.76, 56.33, 0.0], "audiomae_on_audioset": [null, null, [["music", 35.44], ["didgeridoo", 7.49], ["synthesizer", 5.75]], null, null, null, null, null, null, null, null, [["music", 36.46], ["whale vocalization", 7.18], ["didgeridoo", 7.07]], null, null, null], "duration": [40.54, 6.35, 2.09, 9.76, 0.88, 1.7, 7.7, 0.8, 1.37, 1.86, 4.25, 3.21, 3.61, 3.49, 1.61]} \ No newline at end of file diff --git a/annotations_1/OkBaZLq7gnU_filtered.json b/annotations_1/OkBaZLq7gnU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..641afa9c74584dfe6f7c9b88b6ecda623f592ffa --- /dev/null +++ b/annotations_1/OkBaZLq7gnU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 30.05], [36.0, 36.85], [39.0, 39.21], [43.0, 43.17], [46.0, 49.64], [51.0, 66.87], [73.0, 72.72], [73.0, 72.94], [78.0, 79.3], [114.0, 125.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.38, 0.0, 0.0, 0.0, 43.2, 29.82, 0.0, 0.0, 0.0, 39.58], "audiomae_on_audioset": [[["music", 42.05], ["didgeridoo", 36.59], ["speech", 5.98]], null, null, null, [["speech", 64.34], ["telephone", 4.49], ["radio", 3.71]], [["music", 66.21], ["speech", 27.08], ["throbbing", 0.58]], null, null, null, [["music", 77.11], ["thunk", 10.35], ["synthesizer", 3.58]]], "duration": [9.05, 0.85, 0.21, 0.17, 3.64, 15.87, -0.28, -0.06, 1.3, 11.07]} \ No newline at end of file diff --git a/annotations_1/OlLMqN-vjKk_filtered.json b/annotations_1/OlLMqN-vjKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f753e33afecc9bdf40cb8831cf80967657821bc4 --- /dev/null +++ b/annotations_1/OlLMqN-vjKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.83], [9.0, 11.55], [13.0, 14.86], [22.0, 22.54], [24.0, 26.23], [27.0, 27.78], [29.0, 29.52], [30.0, 30.45], [32.0, 65.57], [70.0, 93.75]], "keep_status": [false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 42.55, 0.0, 0.0, 48.23, 0.0, 0.0, 0.0, 0.0, 33.48], "audiomae_on_audioset": [null, [["music", 21.57], ["fly, housefly", 11.23], ["didgeridoo", 10.92]], null, null, [["hum", 11.46], ["mains hum", 7.59], ["fly, housefly", 6.39]], null, null, null, null, [["hum", 68.93], ["mains hum", 16.79], ["throbbing", 3.48]]], "duration": [0.83, 2.55, 1.86, 0.54, 2.23, 0.78, 0.52, 0.45, 33.57, 23.75]} \ No newline at end of file diff --git a/annotations_1/OliOEVSIsmY_filtered.json b/annotations_1/OliOEVSIsmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7d95f7efe26e72d00a6ca51b62924b6bb774a97 --- /dev/null +++ b/annotations_1/OliOEVSIsmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.02], [12.0, 19.5], [63.0, 63.36], [68.0, 68.62], [70.0, 70.09]], "keep_status": [false, false, false, false, false], "silence_prob": [30.15, 28.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["moo", 39.91], ["cattle, bovinae", 30.91], ["livestock, farm animals, working animals", 26.24]], [["music", 74.4], ["electronic music", 4.09], ["house music", 3.21]], null, null, null], "duration": [3.02, 7.5, 0.36, 0.62, 0.09]} \ No newline at end of file diff --git a/annotations_1/Omdvu0f-Wuw_filtered.json b/annotations_1/Omdvu0f-Wuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dba8684b8c233d9435c76d172c21823a1e5c9f03 --- /dev/null +++ b/annotations_1/Omdvu0f-Wuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.8], [27.0, 27.41], [28.0, 28.17], [30.0, 29.96], [48.0, 56.84], [92.0, 92.8], [94.0, 96.85], [103.0, 103.5], [106.0, 105.83], [106.0, 107.23], [113.0, 112.82], [115.0, 115.48], [131.0, 131.5], [172.0, 172.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 43.25, 0.0, 35.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["fart", 68.99], ["speech", 15.49], ["music", 5.73]], null, [["speech", 58.81], ["sidetone", 19.06], ["telephone", 7.23]], null, null, null, null, null, null, null], "duration": [0.8, 0.41, 0.17, -0.04, 8.84, 0.8, 2.85, 0.5, -0.17, 1.23, -0.18, 0.48, 0.5, 0.3]} \ No newline at end of file diff --git a/annotations_1/Omewqh9iivg_filtered.json b/annotations_1/Omewqh9iivg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3069bcd92b651dd7061709b8c86bb1d11ad7f3d --- /dev/null +++ b/annotations_1/Omewqh9iivg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 19.72], [21.0, 22.08], [24.0, 24.92], [27.0, 28.43], [32.0, 42.67], [47.0, 48.32], [50.0, 56.52], [67.0, 71.58], [72.0, 74.73], [83.0, 85.73], [90.0, 90.56], [96.0, 97.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.33, 0.0, 0.0, 0.0, 67.0, 0.0, 51.77, 53.4, 55.67, 54.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.72, 1.08, 0.92, 1.43, 10.67, 1.32, 6.52, 4.58, 2.73, 2.73, 0.56, 1.38]} \ No newline at end of file diff --git a/annotations_1/OnJAp2emJ4U_filtered.json b/annotations_1/OnJAp2emJ4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38f5c6104c3d1d8c5f5bca651e26b977f2fac9d4 --- /dev/null +++ b/annotations_1/OnJAp2emJ4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 15.96], [22.0, 22.76], [35.0, 36.24], [61.0, 62.01], [80.0, 80.99], [85.0, 88.65], [91.0, 92.26]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 32.07], ["music", 21.91], ["throbbing", 6.35]], null], "duration": [-0.04, 0.76, 1.24, 1.01, 0.99, 3.65, 1.26]} \ No newline at end of file diff --git a/annotations_1/Oo67jMp9UbI_filtered.json b/annotations_1/Oo67jMp9UbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b22ae775b94fe2ee17f6ffd83ad63acdce6ff9d --- /dev/null +++ b/annotations_1/Oo67jMp9UbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [5.0, 5.05], [7.0, 7.06], [7.0, 7.8], [12.0, 12.26], [14.0, 13.58], [22.0, 22.59], [24.0, 23.8], [25.0, 25.07], [32.0, 33.72], [37.0, 39.95], [42.0, 42.65], [46.0, 48.47], [49.0, 56.46], [57.0, 59.04], [59.0, 61.08], [64.0, 64.81], [66.0, 66.11], [68.0, 69.4], [84.0, 85.09], [97.0, 172.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.9, 0.0, 60.42, 44.37, 38.19, 41.5, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 12.5], ["music", 8.9], ["sine wave", 8.38]], null, null, [["music", 53.22], ["rumble", 3.42], ["hum", 3.26]], [["hum", 40.98], ["throbbing", 21.74], ["music", 10.07]], [["hum", 35.18], ["music", 17.27], ["mains hum", 16.79]], null, null, null, null, null], "duration": [0.64, 0.05, 0.06, 0.8, 0.26, -0.42, 0.59, -0.2, 0.07, 1.72, 2.95, 0.65, 2.47, 7.46, 2.04, 2.08, 0.81, 0.11, 1.4, 1.09, 75.74]} \ No newline at end of file diff --git a/annotations_1/Ooiw8ZYnzdU_filtered.json b/annotations_1/Ooiw8ZYnzdU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3cea66d1ef9232caec5dfc3ed7b65ab3b2e7f29 --- /dev/null +++ b/annotations_1/Ooiw8ZYnzdU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.67], [15.0, 15.7], [17.0, 46.5], [47.0, 48.02], [50.0, 61.94], [67.0, 71.64], [82.0, 91.27], [102.0, 150.3], [151.0, 151.71], [156.0, 163.0], [164.0, 174.18], [176.0, 175.69], [178.0, 181.68], [183.0, 183.34], [185.0, 184.69]], "keep_status": [true, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [29.4, 0.0, 29.33, 0.0, 29.41, 29.77, 29.45, 0.0, 0.0, 29.19, 60.89, 0.0, 81.71, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 44.6], ["crowd", 4.59], ["vehicle", 4.56]], null, [["music", 70.5], ["electronic music", 7.34], ["drum machine", 3.75]], null, [["music", 74.6], ["didgeridoo", 3.91], ["electronic music", 3.76]], [["music", 25.98], ["didgeridoo", 22.47], ["beatboxing", 14.67]], [["music", 75.67], ["didgeridoo", 16.85], ["electronic music", 1.25]], null, null, [["speech", 21.39], ["livestock, farm animals, working animals", 21.2], ["moo", 10.13]], null, null, null, null, null], "duration": [6.67, 0.7, 29.5, 1.02, 11.94, 4.64, 9.27, 48.3, 0.71, 7.0, 10.18, -0.31, 3.68, 0.34, -0.31]} \ No newline at end of file diff --git a/annotations_1/OosAKayGMj4_filtered.json b/annotations_1/OosAKayGMj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c87519dcb698d121ab0fdb1a387f65e630655db8 --- /dev/null +++ b/annotations_1/OosAKayGMj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.02], [18.0, 26.45], [27.0, 26.7], [28.0, 28.83], [30.0, 33.0], [34.0, 35.28], [39.0, 43.73], [44.0, 45.6], [46.0, 47.41], [48.0, 49.15], [50.0, 50.6], [52.0, 52.51], [54.0, 69.42], [75.0, 75.22], [76.0, 77.01], [78.0, 78.83], [80.0, 80.55], [83.0, 83.96], [85.0, 87.76], [90.0, 91.42], [94.0, 102.57], [105.0, 105.11], [106.0, 107.01], [108.0, 109.86], [110.0, 111.2]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.35, 0.0, 0.0, 73.06, 0.0, 45.59, 0.0, 0.0, 0.0, 0.0, 0.0, 45.14, 0.0, 0.0, 0.0, 0.0, 0.0, 55.39, 0.0, 83.34, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 83.25], ["electric shaver, electric razor", 3.33], ["boing", 2.88]], null, null, null, null, [["whale vocalization", 24.69], ["speech", 16.59], ["moo", 9.87]], null, null, null, null, null, [["speech", 76.3], ["radio", 3.81], ["noise", 2.73]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.02, 8.45, -0.3, 0.83, 3.0, 1.28, 4.73, 1.6, 1.41, 1.15, 0.6, 0.51, 15.42, 0.22, 1.01, 0.83, 0.55, 0.96, 2.76, 1.42, 8.57, 0.11, 1.01, 1.86, 1.2]} \ No newline at end of file diff --git a/annotations_1/OpAEdqIIWpY_filtered.json b/annotations_1/OpAEdqIIWpY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ac09aab61ad109f36650e99350a09d751250c16 --- /dev/null +++ b/annotations_1/OpAEdqIIWpY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[141.0, 164.69], [170.0, 178.31]], "keep_status": [true, true], "silence_prob": [33.12, 48.82], "audiomae_on_audioset": [[["whack, thwack", 15.28], ["crack", 14.64], ["sound effect", 12.5]], [["music", 32.81], ["speech", 25.13], ["sidetone", 8.46]]], "duration": [23.69, 8.31]} \ No newline at end of file diff --git a/annotations_1/OpwYfz6uFaQ_filtered.json b/annotations_1/OpwYfz6uFaQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68904449ef5cc16a5f88d1eab9f73dcf7dfeb751 --- /dev/null +++ b/annotations_1/OpwYfz6uFaQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.67], [8.0, 9.04], [10.0, 10.67], [15.0, 15.67], [26.0, 26.92], [27.0, 28.61], [33.0, 34.6], [37.0, 37.69], [38.0, 38.7], [42.0, 43.6], [64.0, 64.66], [68.0, 69.53], [70.0, 73.89], [75.0, 76.92], [79.0, 81.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.72, 0.0, 57.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.44], ["sidetone", 10.83], ["music", 9.18]], null, null], "duration": [-0.33, 1.04, 0.67, 0.67, 0.92, 1.61, 1.6, 0.69, 0.7, 1.6, 0.66, 1.53, 3.89, 1.92, 2.31]} \ No newline at end of file diff --git a/annotations_1/OqGw-1_vIWk_filtered.json b/annotations_1/OqGw-1_vIWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c378500b6bd2535ff59d9a1ba4252fc3ca0ec95 --- /dev/null +++ b/annotations_1/OqGw-1_vIWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.23], [9.0, 9.09], [11.0, 11.84], [13.0, 37.47], [44.0, 45.23], [46.0, 54.36], [57.0, 58.41], [63.0, 73.74], [76.0, 98.52], [102.0, 114.71], [121.0, 124.21], [126.0, 137.91], [139.0, 149.81], [150.0, 158.14], [160.0, 160.66], [163.0, 163.43], [164.0, 170.24], [173.0, 177.31], [179.0, 190.32], [194.0, 194.0]], "keep_status": [false, false, false, false, false, true, false, false, true, true, true, false, false, true, false, false, false, false, false, false], "silence_prob": [28.8, 0.0, 0.0, 28.56, 0.0, 28.64, 0.0, 28.69, 28.49, 28.54, 30.35, 28.56, 28.51, 28.36, 0.0, 0.0, 28.43, 28.51, 29.72, 0.0], "audiomae_on_audioset": [[["mains hum", 54.54], ["hum", 20.25], ["speech", 8.21]], null, null, [["mains hum", 32.64], ["hum", 22.05], ["music", 19.43]], null, [["music", 31.98], ["speech", 25.96], ["sidetone", 10.63]], null, [["mains hum", 42.7], ["music", 25.01], ["hum", 17.9]], [["music", 48.1], ["speech", 10.56], ["cacophony", 3.99]], [["music", 18.86], ["buzz", 14.3], ["hum", 13.36]], [["hum", 36.6], ["mains hum", 19.69], ["throbbing", 13.57]], [["music", 50.58], ["didgeridoo", 16.34], ["hum", 11.08]], [["hum", 30.89], ["mains hum", 27.5], ["music", 15.86]], [["speech", 55.18], ["music", 7.36], ["outside, rural or natural", 3.5]], null, null, [["speech", 58.47], ["music", 14.51], ["electric shaver, electric razor", 4.29]], [["mains hum", 35.19], ["music", 23.38], ["hum", 15.55]], [["hum", 41.61], ["mains hum", 18.36], ["music", 13.86]], null], "duration": [4.23, 0.09, 0.84, 24.47, 1.23, 8.36, 1.41, 10.74, 22.52, 12.71, 3.21, 11.91, 10.81, 8.14, 0.66, 0.43, 6.24, 4.31, 11.32, 0.0]} \ No newline at end of file diff --git a/annotations_1/OqgFY6ZhOfQ_filtered.json b/annotations_1/OqgFY6ZhOfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df48c52f496a15b78089010d9d793ca86f8fd449 --- /dev/null +++ b/annotations_1/OqgFY6ZhOfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.72], [16.0, 16.97], [20.0, 20.01], [25.0, 24.93], [26.0, 26.99], [29.0, 34.28], [37.0, 38.11], [39.0, 39.51], [40.0, 40.54], [43.0, 42.92], [45.0, 45.44], [46.0, 47.04], [49.0, 49.94], [52.0, 53.15], [55.0, 54.95], [55.0, 55.49], [57.0, 57.37], [59.0, 72.18], [74.0, 74.16], [78.0, 83.27], [89.0, 91.1], [93.0, 97.24], [98.0, 104.01], [105.0, 106.52], [108.0, 115.16]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true], "silence_prob": [35.51, 0.0, 0.0, 0.0, 0.0, 33.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.32, 0.0, 30.21, 32.35, 31.09, 31.06, 0.0, 31.39], "audiomae_on_audioset": [[["music", 14.07], ["reverberation", 10.87], ["echo", 8.76]], null, null, null, null, [["chirp tone", 13.65], ["sine wave", 13.06], ["radio", 10.42]], null, null, null, null, null, null, null, null, null, null, null, [["noise", 73.69], ["music", 6.06], ["didgeridoo", 2.89]], null, [["music", 56.13], ["echo", 6.44], ["musical instrument", 4.65]], [["speech", 28.12], ["music", 5.28], ["siren", 3.57]], [["music", 55.1], ["speech", 16.28], ["double bass", 4.24]], [["music", 63.88], ["synthesizer", 9.42], ["musical instrument", 6.2]], null, [["music", 37.01], ["musical instrument", 6.47], ["boing", 6.37]]], "duration": [3.72, 0.97, 0.01, -0.07, 0.99, 5.28, 1.11, 0.51, 0.54, -0.08, 0.44, 1.04, 0.94, 1.15, -0.05, 0.49, 0.37, 13.18, 0.16, 5.27, 2.1, 4.24, 6.01, 1.52, 7.16]} \ No newline at end of file diff --git a/annotations_1/OqvD4NC-s9E_filtered.json b/annotations_1/OqvD4NC-s9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c68b13222a1321033f41b15b6228ad7b7a35a024 --- /dev/null +++ b/annotations_1/OqvD4NC-s9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.41], [19.0, 20.83], [90.0, 91.62], [101.0, 104.25], [113.0, 113.56], [114.0, 117.76], [118.0, 138.2], [140.0, 145.54], [151.0, 151.17], [153.0, 156.59], [158.0, 160.08], [161.0, 164.66], [165.0, 165.62], [167.0, 169.43], [173.0, 176.08], [181.0, 181.31]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 37.11, 0.0, 36.41, 31.37, 30.91, 0.0, 36.61, 98.19, 46.29, 0.0, 44.2, 40.34, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 49.4], ["didgeridoo", 4.54], ["musical instrument", 4.51]], null, [["speech", 74.76], ["busy signal", 3.06], ["groan", 2.38]], [["music", 75.6], ["electronic music", 2.58], ["speech", 1.28]], [["music", 66.01], ["singing", 3.24], ["rattle (instrument)", 2.84]], null, [["music", 48.15], ["cello", 7.83], ["singing", 3.74]], null, [["music", 23.76], ["mains hum", 19.01], ["hum", 10.03]], null, [["music", 36.84], ["mains hum", 17.09], ["hum", 9.65]], [["mains hum", 24.2], ["music", 20.31], ["buzz", 17.76]], null], "duration": [0.41, 1.83, 1.62, 3.25, 0.56, 3.76, 20.2, 5.54, 0.17, 3.59, 2.08, 3.66, 0.62, 2.43, 3.08, 0.31]} \ No newline at end of file diff --git a/annotations_1/OqyvMY1fcr4_filtered.json b/annotations_1/OqyvMY1fcr4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0dd208a12cdf6d10dcd8f6acbd898392015f46bd --- /dev/null +++ b/annotations_1/OqyvMY1fcr4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.03], [7.0, 8.33], [15.0, 16.75], [20.0, 20.36], [35.0, 37.02], [41.0, 41.1], [43.0, 50.92], [52.0, 53.22], [57.0, 57.81], [58.0, 59.66], [60.0, 61.86], [65.0, 65.91], [69.0, 70.04], [73.0, 74.07], [76.0, 77.67], [90.0, 90.1], [91.0, 101.78], [107.0, 119.03], [120.0, 120.26], [125.0, 127.35], [130.0, 130.62]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.04, 0.0, 32.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.97, 31.78, 0.0, 31.44, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 56.9], ["speech", 6.16], ["musical instrument", 4.37]], null, [["music", 80.28], ["speech", 4.01], ["synthesizer", 2.04]], null, null, null, null, null, null, null, null, null, [["music", 87.11], ["singing", 1.44], ["humming", 0.85]], [["music", 75.01], ["theremin", 3.69], ["funk", 2.06]], null, [["music", 75.24], ["musical instrument", 4.11], ["guitar", 2.7]], null], "duration": [1.03, 1.33, 1.75, 0.36, 2.02, 0.1, 7.92, 1.22, 0.81, 1.66, 1.86, 0.91, 1.04, 1.07, 1.67, 0.1, 10.78, 12.03, 0.26, 2.35, 0.62]} \ No newline at end of file diff --git a/annotations_1/OqzgxMFTQfU_filtered.json b/annotations_1/OqzgxMFTQfU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..475cdc12a0a560102c297136ea0d5d166eca5e60 --- /dev/null +++ b/annotations_1/OqzgxMFTQfU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 21.17], [24.0, 26.01], [26.0, 27.08], [33.0, 34.23], [35.0, 35.31], [36.0, 39.92], [46.0, 46.9], [47.0, 48.49], [50.0, 52.57], [54.0, 55.61], [56.0, 56.52], [58.0, 58.19], [60.0, 60.0], [60.0, 60.44], [61.0, 61.48], [62.0, 62.85], [63.0, 64.81], [66.0, 66.72], [67.0, 68.07], [69.0, 70.7], [77.0, 78.53], [81.0, 81.13], [84.0, 84.72], [86.0, 86.81], [91.0, 91.84], [95.0, 94.9]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.56, 39.15, 0.0, 0.0, 0.0, 44.87, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.36], ["breaking", 13.36], ["glass", 12.16]], [["speech", 48.41], ["glass", 16.41], ["breaking", 10.35]], null, null, null, [["speech", 12.72], ["animal", 9.33], ["livestock, farm animals, working animals", 6.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [17.17, 2.01, 1.08, 1.23, 0.31, 3.92, 0.9, 1.49, 2.57, 1.61, 0.52, 0.19, 0.0, 0.44, 0.48, 0.85, 1.81, 0.72, 1.07, 1.7, 1.53, 0.13, 0.72, 0.81, 0.84, -0.1]} \ No newline at end of file diff --git a/annotations_1/Or4t1d_h0Y0_filtered.json b/annotations_1/Or4t1d_h0Y0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c4886984fc98fbc56b23524fdbd2cd39a1d5175 --- /dev/null +++ b/annotations_1/Or4t1d_h0Y0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.47], [23.0, 29.74], [32.0, 33.08], [34.0, 34.72], [36.0, 36.64], [38.0, 38.72], [40.0, 40.49], [46.0, 48.36], [50.0, 50.65], [53.0, 54.13], [56.0, 57.84], [58.0, 60.1], [61.0, 62.61], [65.0, 67.14], [69.0, 70.73], [73.0, 75.68], [82.0, 82.27], [87.0, 87.15], [88.0, 88.1], [89.0, 88.94], [90.0, 95.86], [100.0, 100.6], [108.0, 108.48], [124.0, 124.9], [125.0, 125.63], [137.0, 137.71], [139.0, 138.67], [142.0, 142.7], [144.0, 145.25], [149.0, 148.9], [154.0, 154.21], [156.0, 157.17], [158.0, 161.99]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [44.09, 70.02, 0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 0.0, 0.0, 0.0, 41.7, 0.0, 99.8, 0.0, 84.98, 0.0, 0.0, 0.0, 0.0, 62.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.31], "audiomae_on_audioset": [[["speech", 31.42], ["arrow", 25.13], ["firecracker", 4.37]], null, null, null, null, null, null, null, null, null, null, [["speech", 37.5], ["busy signal", 21.47], ["sidetone", 11.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 21.09], ["livestock, farm animals, working animals", 16.63], ["cattle, bovinae", 11.42]]], "duration": [2.47, 6.74, 1.08, 0.72, 0.64, 0.72, 0.49, 2.36, 0.65, 1.13, 1.84, 2.1, 1.61, 2.14, 1.73, 2.68, 0.27, 0.15, 0.1, -0.06, 5.86, 0.6, 0.48, 0.9, 0.63, 0.71, -0.33, 0.7, 1.25, -0.1, 0.21, 1.17, 3.99]} \ No newline at end of file diff --git a/annotations_1/OroiRWIR2gQ_filtered.json b/annotations_1/OroiRWIR2gQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe67ed60f0a4694fffd0b2e82fb62dae2c9d30b7 --- /dev/null +++ b/annotations_1/OroiRWIR2gQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [10.0, 11.6], [12.0, 13.88], [16.0, 18.93], [21.0, 21.63], [24.0, 26.28], [30.0, 31.78], [34.0, 34.53], [41.0, 51.58], [53.0, 53.99], [58.0, 58.01], [61.0, 63.54], [66.0, 74.06], [86.0, 87.66], [89.0, 90.02], [98.0, 99.03], [102.0, 102.3], [103.0, 103.23], [106.0, 106.66], [108.0, 115.32], [118.0, 118.39], [119.0, 119.35], [119.0, 153.82], [154.0, 156.19], [158.0, 157.77], [161.0, 165.87], [182.0, 182.38], [183.0, 183.05], [183.0, 184.27], [190.0, 192.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 88.28, 0.0, 92.97, 0.0, 0.0, 99.99, 0.0, 0.0, 58.38, 32.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.89, 0.0, 0.0, 0.0, 65.2, 0.0, 33.92, 0.0, 0.0, 0.0, 60.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 41.61], ["moo", 21.48], ["livestock, farm animals, working animals", 17.82]], null, null, null, null, null, null, [["carnatic music", 46.5], ["music", 19.34], ["moo", 7.24]], null, null, null, null, null, [["fly, housefly", 27.22], ["mosquito", 16.6], ["insect", 16.36]], null, null, null, null], "duration": [1.56, 1.6, 1.88, 2.93, 0.63, 2.28, 1.78, 0.53, 10.58, 0.99, 0.01, 2.54, 8.06, 1.66, 1.02, 1.03, 0.3, 0.23, 0.66, 7.32, 0.39, 0.35, 34.82, 2.19, -0.23, 4.87, 0.38, 0.05, 1.27, 2.06]} \ No newline at end of file diff --git a/annotations_1/OstLbMEQM4Q_filtered.json b/annotations_1/OstLbMEQM4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d30940ea8850d13598d629d4eeba9e16189db942 --- /dev/null +++ b/annotations_1/OstLbMEQM4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.2], [11.0, 14.71], [18.0, 19.03], [21.0, 21.51], [22.0, 24.16], [29.0, 29.56], [32.0, 31.9], [33.0, 46.04], [47.0, 48.52], [59.0, 59.7], [76.0, 88.3], [90.0, 93.75], [96.0, 101.75], [102.0, 103.79], [107.0, 107.94], [115.0, 116.11], [118.0, 118.49], [119.0, 118.52], [119.0, 125.74], [126.0, 127.52], [129.0, 130.17], [131.0, 131.6], [133.0, 134.2], [135.0, 136.97], [140.0, 141.86], [143.0, 143.04], [144.0, 144.14], [145.0, 146.37], [150.0, 150.31], [155.0, 155.49], [156.0, 156.63], [158.0, 158.48], [160.0, 160.69], [163.0, 163.27], [167.0, 168.02], [172.0, 172.69]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.67, 0.0, 0.0, 30.44, 0.0, 0.0, 29.46, 0.0, 0.0, 34.19, 82.43, 77.2, 0.0, 0.0, 0.0, 0.0, 0.0, 34.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 66.63], ["synthesizer", 7.64], ["ambient music", 4.34]], null, null, [["music", 58.13], ["theremin", 14.88], ["musical instrument", 7.49]], null, null, [["music", 27.63], ["speech", 21.06], ["sidetone", 12.35]], null, null, [["gong", 53.81], ["gunshot, gunfire", 11.95], ["machine gun", 7.97]], null, null, null, null, null, null, null, [["music", 22.07], ["whale vocalization", 9.94], ["chant", 9.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.2, 3.71, 1.03, 0.51, 2.16, 0.56, -0.1, 13.04, 1.52, 0.7, 12.3, 3.75, 5.75, 1.79, 0.94, 1.11, 0.49, -0.48, 6.74, 1.52, 1.17, 0.6, 1.2, 1.97, 1.86, 0.04, 0.14, 1.37, 0.31, 0.49, 0.63, 0.48, 0.69, 0.27, 1.02, 0.69]} \ No newline at end of file diff --git a/annotations_1/OtjQUwKlR0U_filtered.json b/annotations_1/OtjQUwKlR0U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be319d7cdd513c355c3c06018cdeeddb4eb1c659 --- /dev/null +++ b/annotations_1/OtjQUwKlR0U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.21], [9.0, 20.56], [22.0, 23.08], [25.0, 32.04], [33.0, 35.55], [39.0, 41.37], [42.0, 46.9], [48.0, 52.27], [54.0, 66.12], [69.0, 70.88], [72.0, 75.42], [75.0, 75.49], [79.0, 88.03], [89.0, 90.95], [91.0, 91.22], [93.0, 93.45], [94.0, 98.78], [100.0, 101.44], [103.0, 103.96], [112.0, 112.68], [113.0, 113.9]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.76, 48.91, 0.0, 93.29, 91.13, 81.89, 92.15, 92.15, 70.86, 0.0, 70.86, 0.0, 69.74, 0.0, 0.0, 0.0, 64.29, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["sidetone", 25.69], ["music", 20.16], ["speech", 17.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.21, 11.56, 1.08, 7.04, 2.55, 2.37, 4.9, 4.27, 12.12, 1.88, 3.42, 0.49, 9.03, 1.95, 0.22, 0.45, 4.78, 1.44, 0.96, 0.68, 0.9]} \ No newline at end of file diff --git a/annotations_1/OuQTes47k14_filtered.json b/annotations_1/OuQTes47k14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df23b265ca85ca60fcb85e1f1a71ec7e33f47894 --- /dev/null +++ b/annotations_1/OuQTes47k14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.2], [35.0, 35.09], [35.0, 35.4], [44.0, 44.27], [56.0, 59.56], [61.0, 63.98], [66.0, 66.63], [67.0, 67.44], [68.0, 67.81], [68.0, 68.08], [70.0, 82.93], [84.0, 86.91], [88.0, 88.52], [89.0, 94.71], [98.0, 97.8], [98.0, 98.07], [98.0, 101.26], [101.0, 101.51], [102.0, 101.6], [102.0, 111.57], [121.0, 127.45], [131.0, 131.26], [138.0, 143.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.12, 38.82, 0.0, 0.0, 0.0, 0.0, 53.28, 39.75, 0.0, 39.74, 0.0, 0.0, 33.84, 0.0, 0.0, 33.07, 41.7, 0.0, 31.15], "audiomae_on_audioset": [null, null, null, null, [["music", 46.21], ["speech", 34.01], ["bleat", 4.77]], [["speech", 63.98], ["music", 8.86], ["speech synthesizer", 7.58]], null, null, null, null, null, [["music", 35.3], ["theremin", 13.77], ["cello", 5.33]], null, [["music", 73.26], ["mantra", 2.88], ["singing", 1.96]], null, null, [["moo", 28.37], ["cattle, bovinae", 26.7], ["livestock, farm animals, working animals", 12.28]], null, null, [["music", 63.68], ["speech", 7.0], ["theremin", 3.2]], [["speech", 38.25], ["sidetone", 33.64], ["music", 6.91]], null, [["music", 33.73], ["vehicle", 8.57], ["speech", 6.46]]], "duration": [0.2, 0.09, 0.4, 0.27, 3.56, 2.98, 0.63, 0.44, -0.19, 0.08, 12.93, 2.91, 0.52, 5.71, -0.2, 0.07, 3.26, 0.51, -0.4, 9.57, 6.45, 0.26, 5.23]} \ No newline at end of file diff --git a/annotations_1/Oui5yj3OvxQ_filtered.json b/annotations_1/Oui5yj3OvxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..530bb9c0c06656b10134adafd79d5e4ce776fb08 --- /dev/null +++ b/annotations_1/Oui5yj3OvxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.15], [19.0, 19.18], [36.0, 40.95], [51.0, 58.06], [62.0, 62.5], [64.0, 67.98], [68.0, 71.95], [79.0, 85.16], [86.0, 92.21], [95.0, 100.97], [110.0, 110.67], [112.0, 112.14], [121.0, 121.17], [126.0, 126.69], [127.0, 130.99], [141.0, 144.59], [145.0, 145.42], [146.0, 154.79], [157.0, 161.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.01, 0.0, 42.72, 41.42, 0.0, 44.87, 40.79, 46.36, 41.28, 41.32, 0.0, 0.0, 0.0, 0.0, 39.15, 34.74, 0.0, 35.37, 35.74], "audiomae_on_audioset": [null, null, [["music", 69.22], ["swing music", 2.84], ["singing", 2.77]], [["music", 86.01], ["musical instrument", 0.98], ["singing", 0.88]], null, [["music", 70.4], ["male singing", 1.96], ["yodeling", 1.84]], [["music", 71.6], ["singing", 4.88], ["guitar", 2.7]], [["music", 72.82], ["singing", 3.08], ["musical instrument", 2.81]], [["music", 78.65], ["singing", 1.97], ["christmas music", 0.87]], [["music", 84.14], ["carnatic music", 3.32], ["musical instrument", 1.63]], null, null, null, null, [["music", 72.96], ["singing", 3.57], ["humming", 2.1]], [["music", 68.02], ["singing", 4.79], ["musical instrument", 2.3]], null, [["music", 78.82], ["singing", 3.35], ["musical instrument", 2.53]], [["music", 69.09], ["singing", 3.56], ["musical instrument", 2.86]]], "duration": [3.15, 0.18, 4.95, 7.06, 0.5, 3.98, 3.95, 6.16, 6.21, 5.97, 0.67, 0.14, 0.17, 0.69, 3.99, 3.59, 0.42, 8.79, 4.62]} \ No newline at end of file diff --git a/annotations_1/Ov2ErYiFemg_filtered.json b/annotations_1/Ov2ErYiFemg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d58a2b0066e12c1ef03c75a3f588e863ca11217 --- /dev/null +++ b/annotations_1/Ov2ErYiFemg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 14.34], [19.0, 54.38], [57.0, 71.05], [76.0, 80.94], [83.0, 92.67], [93.0, 93.78], [94.0, 95.01], [95.0, 95.94], [97.0, 97.73], [101.0, 101.01], [101.0, 104.4], [106.0, 107.05], [109.0, 109.97]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.03, 0.0, 53.59, 50.91, 47.43, 0.0, 0.0, 0.0, 0.0, 0.0, 34.44, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 28.76], ["mosquito", 24.31], ["insect", 16.65]], null, null, null, [["hum", 57.67], ["mains hum", 25.7], ["throbbing", 5.32]], null, null, null, null, null, [["speech", 60.94], ["vehicle", 5.05], ["music", 4.74]], null, null], "duration": [11.34, 35.38, 14.05, 4.94, 9.67, 0.78, 1.01, 0.94, 0.73, 0.01, 3.4, 1.05, 0.97]} \ No newline at end of file diff --git a/annotations_1/Ov6nBKuu6pI_filtered.json b/annotations_1/Ov6nBKuu6pI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9514cbc002f23d39a50d9144d3e961d4831827f8 --- /dev/null +++ b/annotations_1/Ov6nBKuu6pI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 48.83], [50.0, 53.27], [55.0, 56.84], [62.0, 68.03], [69.0, 69.9], [70.0, 69.94], [70.0, 91.76], [104.0, 114.62], [118.0, 127.26], [128.0, 138.18], [142.0, 175.95], [184.0, 188.89]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 85.54, 0.0, 99.62, 0.0, 0.0, 35.19, 52.92, 31.74, 30.49, 0.0, 31.76], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 67.71], ["didgeridoo", 9.33], ["theremin", 3.38]], null, [["sidetone", 44.36], ["speech", 18.55], ["music", 18.52]], [["hum", 21.6], ["mains hum", 17.33], ["music", 12.69]], null, [["speech", 39.97], ["sidetone", 20.48], ["music", 15.97]]], "duration": [0.83, 3.27, 1.84, 6.03, 0.9, -0.06, 21.76, 10.62, 9.26, 10.18, 33.95, 4.89]} \ No newline at end of file diff --git a/annotations_1/OvQctA3xsoE_filtered.json b/annotations_1/OvQctA3xsoE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d619c45533829bb354ec6076026e21cfb7166439 --- /dev/null +++ b/annotations_1/OvQctA3xsoE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.61], [14.0, 14.37], [17.0, 18.71], [21.0, 21.3], [22.0, 22.37], [22.0, 22.44], [23.0, 22.59], [23.0, 22.99], [24.0, 24.76], [30.0, 30.15], [30.0, 30.18], [32.0, 36.98], [39.0, 40.36], [43.0, 43.01], [49.0, 53.32], [57.0, 58.01], [63.0, 63.42], [69.0, 69.97], [77.0, 78.41], [79.0, 80.6], [100.0, 100.77], [105.0, 105.65], [107.0, 110.24], [115.0, 115.84], [116.0, 117.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.39, 0.0, 0.0, 73.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.89, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 0.37, 1.71, 0.3, 0.37, 0.44, -0.41, -0.01, 0.76, 0.15, 0.18, 4.98, 1.36, 0.01, 4.32, 1.01, 0.42, 0.97, 1.41, 1.6, 0.77, 0.65, 3.24, 0.84, 1.05]} \ No newline at end of file diff --git a/annotations_1/Ovyfd29a1ik_filtered.json b/annotations_1/Ovyfd29a1ik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb848c5d072ea92944c2922d3a00285e32b195cb --- /dev/null +++ b/annotations_1/Ovyfd29a1ik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.73], [4.0, 4.21], [5.0, 5.49], [7.0, 8.02], [12.0, 14.76], [18.0, 19.16], [21.0, 21.81], [24.0, 24.73], [27.0, 29.22], [30.0, 33.32], [34.0, 34.05], [35.0, 39.41], [40.0, 41.13], [41.0, 42.11], [43.0, 43.93], [45.0, 45.25], [46.0, 46.33], [48.0, 51.31], [52.0, 54.09], [57.0, 58.11], [61.0, 61.57], [64.0, 64.15], [65.0, 65.1], [66.0, 66.14], [68.0, 69.11], [70.0, 74.06], [77.0, 78.85], [81.0, 81.57], [83.0, 84.91], [86.0, 92.16], [93.0, 94.14], [96.0, 96.63], [100.0, 100.2], [102.0, 102.9], [105.0, 116.24], [117.0, 117.71], [120.0, 134.55], [135.0, 139.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 0.0, 0.0, 89.54, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 68.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 90.78, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 95.37, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.21, 0.49, 1.02, 2.76, 1.16, 0.81, 0.73, 2.22, 3.32, 0.05, 4.41, 1.13, 1.11, 0.93, 0.25, 0.33, 3.31, 2.09, 1.11, 0.57, 0.15, 0.1, 0.14, 1.11, 4.06, 1.85, 0.57, 1.91, 6.16, 1.14, 0.63, 0.2, 0.9, 11.24, 0.71, 14.55, 4.97]} \ No newline at end of file diff --git a/annotations_1/OwG27DvQf68_filtered.json b/annotations_1/OwG27DvQf68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac12e45329fdb69543d0f13521bb6eae1f3fa135 --- /dev/null +++ b/annotations_1/OwG27DvQf68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.75], [2.0, 2.83], [18.0, 18.79], [23.0, 23.3], [23.0, 23.46], [25.0, 30.47], [43.0, 49.94], [54.0, 58.75], [67.0, 73.55], [77.0, 82.66], [90.0, 97.44], [101.0, 100.97], [106.0, 106.84], [114.0, 118.32], [144.0, 145.4], [150.0, 150.28], [151.0, 152.76], [154.0, 154.5], [155.0, 155.73], [157.0, 157.49], [160.0, 159.85], [161.0, 161.06]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.57, 28.34, 34.37, 29.54, 29.04, 30.79, 0.0, 0.0, 28.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 61.96], ["burst, pop", 11.28], ["speech", 4.24]], [["music", 52.68], ["speech", 16.47], ["electronic music", 3.11]], [["music", 60.87], ["speech", 6.38], ["hum", 5.57]], [["music", 46.47], ["speech", 39.83], ["boing", 3.17]], [["music", 35.12], ["speech", 19.08], ["electronic music", 4.73]], [["music", 56.04], ["speech", 16.0], ["synthesizer", 3.19]], null, null, [["music", 15.19], ["sound effect", 10.65], ["groan", 10.04]], null, null, null, null, null, null, null, null], "duration": [0.75, 0.83, 0.79, 0.3, 0.46, 5.47, 6.94, 4.75, 6.55, 5.66, 7.44, -0.03, 0.84, 4.32, 1.4, 0.28, 1.76, 0.5, 0.73, 0.49, -0.15, 0.06]} \ No newline at end of file diff --git a/annotations_1/OwfT8yTBPYs_filtered.json b/annotations_1/OwfT8yTBPYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74313e53d4e6ac7dc30b86ee09c3dab18665fe5e --- /dev/null +++ b/annotations_1/OwfT8yTBPYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [8.0, 8.34], [9.0, 9.24], [10.0, 10.88], [12.0, 13.09], [17.0, 54.87], [62.0, 62.94], [65.0, 66.04], [71.0, 71.59], [72.0, 71.69], [72.0, 72.01], [74.0, 91.94], [92.0, 92.1], [92.0, 102.39], [107.0, 107.87], [111.0, 114.84], [118.0, 119.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.13, 0.0, 30.94, 0.0, 30.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 21.49], ["livestock, farm animals, working animals", 13.78], ["cattle, bovinae", 13.76]], null, [["speech", 46.3], ["buzz", 17.04], ["music", 7.56]], null, [["speech", 30.05], ["buzzer", 9.55], ["music", 8.58]], null], "duration": [1.14, 0.34, 0.24, 0.88, 1.09, 37.87, 0.94, 1.04, 0.59, -0.31, 0.01, 17.94, 0.1, 10.39, 0.87, 3.84, 1.04]} \ No newline at end of file diff --git a/annotations_1/OxBd2RQI4eQ_filtered.json b/annotations_1/OxBd2RQI4eQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19decbea8dbd6cdb959e77356ee7e35e9f1ce0e0 --- /dev/null +++ b/annotations_1/OxBd2RQI4eQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.06], [8.0, 24.78], [25.0, 27.24], [28.0, 32.0], [33.0, 33.4], [36.0, 37.08], [38.0, 39.29], [42.0, 43.8], [46.0, 64.12], [68.0, 69.23], [70.0, 70.28], [72.0, 94.1], [95.0, 95.89], [97.0, 97.68], [100.0, 114.91], [115.0, 118.1], [119.0, 119.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false], "silence_prob": [0.0, 29.8, 34.46, 31.73, 0.0, 0.0, 0.0, 0.0, 31.38, 0.0, 0.0, 30.05, 0.0, 0.0, 29.25, 30.23, 0.0], "audiomae_on_audioset": [null, [["music", 54.47], ["hum", 12.85], ["electronic music", 7.76]], [["sidetone", 38.2], ["speech", 22.41], ["music", 9.75]], [["whale vocalization", 51.59], ["music", 23.1], ["hum", 5.16]], null, null, null, null, [["music", 33.67], ["speech", 30.26], ["hum", 9.13]], null, null, [["music", 27.26], ["noise", 10.9], ["ambient music", 10.87]], null, null, [["music", 20.43], ["synthesizer", 10.75], ["hum", 8.72]], [["music", 39.08], ["foghorn", 14.25], ["speech", 6.61]], null], "duration": [1.06, 16.78, 2.24, 4.0, 0.4, 1.08, 1.29, 1.8, 18.12, 1.23, 0.28, 22.1, 0.89, 0.68, 14.91, 3.1, 0.84]} \ No newline at end of file diff --git a/annotations_1/OxEcQFG6U4g_filtered.json b/annotations_1/OxEcQFG6U4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..900d5afb19e63e786a8a1e6f09dceccbb8429b7b --- /dev/null +++ b/annotations_1/OxEcQFG6U4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.72], [8.0, 8.53], [10.0, 10.64], [12.0, 12.45], [15.0, 15.85], [17.0, 19.48], [22.0, 25.51], [33.0, 43.12], [46.0, 47.28], [50.0, 53.97], [57.0, 57.13], [58.0, 74.95], [75.0, 76.54], [77.0, 78.88], [85.0, 85.55], [102.0, 102.51], [103.0, 103.57], [108.0, 108.04], [109.0, 110.62], [114.0, 114.42], [126.0, 128.04], [130.0, 130.3], [136.0, 136.41], [152.0, 152.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 100.0, 62.89, 0.0, 75.72, 0.0, 40.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 59.79], ["speech", 12.8], ["musical instrument", 3.16]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.72, 0.53, 0.64, 0.45, 0.85, 2.48, 3.51, 10.12, 1.28, 3.97, 0.13, 16.95, 1.54, 1.88, 0.55, 0.51, 0.57, 0.04, 1.62, 0.42, 2.04, 0.3, 0.41, 0.93]} \ No newline at end of file diff --git a/annotations_1/OxKXKwijH_g_filtered.json b/annotations_1/OxKXKwijH_g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56c528f4627fd6a66f5b3e0dfc3d5f8123900339 --- /dev/null +++ b/annotations_1/OxKXKwijH_g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.99], [17.0, 16.92], [18.0, 17.85], [20.0, 20.11], [26.0, 27.03], [28.0, 29.47], [30.0, 31.77], [32.0, 33.56], [34.0, 34.45], [35.0, 35.83], [38.0, 50.23], [56.0, 57.43], [63.0, 62.73], [64.0, 65.92], [66.0, 67.27], [67.0, 70.34], [71.0, 71.71], [90.0, 93.29], [98.0, 98.22], [102.0, 102.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [50.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.06, 0.0, 0.0, 0.0, 0.0, 40.55, 0.0, 34.31, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["dial tone", 22.26], ["bouncing", 19.02], ["telephone", 14.26]], null, null, null, null, [["sidetone", 56.71], ["speech", 8.07], ["hum", 6.97]], null, [["speech", 81.94], ["radio", 2.36], ["music", 1.33]], null, null], "duration": [7.99, -0.08, -0.15, 0.11, 1.03, 1.47, 1.77, 1.56, 0.45, 0.83, 12.23, 1.43, -0.27, 1.92, 1.27, 3.34, 0.71, 3.29, 0.22, 0.51]} \ No newline at end of file diff --git a/annotations_1/OxLmmTv6CTs_filtered.json b/annotations_1/OxLmmTv6CTs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..daf4150df281ae0d253575e9e573d678639a9e07 --- /dev/null +++ b/annotations_1/OxLmmTv6CTs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.33], [2.0, 2.47], [8.0, 15.21], [17.0, 17.78], [19.0, 26.65], [34.0, 35.26], [38.0, 39.18], [41.0, 45.62], [46.0, 48.29], [49.0, 49.33], [49.0, 49.77], [50.0, 49.94], [50.0, 50.11], [50.0, 50.31], [53.0, 54.24], [55.0, 65.74], [67.0, 69.47], [81.0, 90.39], [92.0, 92.99], [95.0, 96.89], [98.0, 99.17], [101.0, 101.14], [102.0, 102.74], [111.0, 112.26], [113.0, 113.97], [122.0, 123.6], [125.0, 128.85], [130.0, 141.07], [145.0, 145.64], [148.0, 148.37], [151.0, 150.96], [153.0, 153.01], [154.0, 155.38], [158.0, 158.68], [160.0, 161.3], [164.0, 164.02], [166.0, 167.81], [169.0, 170.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 59.24, 0.0, 58.72, 0.0, 0.0, 99.96, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 99.97, 74.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7, 53.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 0.47, 7.21, 0.78, 7.65, 1.26, 1.18, 4.62, 2.29, 0.33, 0.77, -0.06, 0.11, 0.31, 1.24, 10.74, 2.47, 9.39, 0.99, 1.89, 1.17, 0.14, 0.74, 1.26, 0.97, 1.6, 3.85, 11.07, 0.64, 0.37, -0.04, 0.01, 1.38, 0.68, 1.3, 0.02, 1.81, 1.5]} \ No newline at end of file diff --git a/annotations_1/Oy9R8mpKSmM_filtered.json b/annotations_1/Oy9R8mpKSmM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3280450de6afbf90c39127e4d5b931493670d96a --- /dev/null +++ b/annotations_1/Oy9R8mpKSmM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[88.0, 88.05], [89.0, 111.67], [113.0, 133.54]], "keep_status": [false, true, false], "silence_prob": [0.0, 29.8, 45.59], "audiomae_on_audioset": [null, [["music", 41.98], ["car", 17.34], ["vehicle", 10.35]], [["throbbing", 43.99], ["hum", 30.96], ["heart sounds, heartbeat", 5.73]]], "duration": [0.05, 22.67, 20.54]} \ No newline at end of file diff --git a/annotations_1/OyziGbUQBIc_filtered.json b/annotations_1/OyziGbUQBIc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd7bf9db5eb476b4e0c22a137e22310e681a482a --- /dev/null +++ b/annotations_1/OyziGbUQBIc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 45.2], [46.0, 47.48], [53.0, 61.06], [61.0, 63.58], [67.0, 88.42], [89.0, 90.54], [92.0, 111.03], [119.0, 120.66], [126.0, 126.2], [126.0, 126.25], [127.0, 127.31], [130.0, 129.64], [131.0, 132.31], [134.0, 134.76], [142.0, 142.47]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [98.66, 0.0, 80.64, 70.72, 32.2, 0.0, 43.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 73.62], ["electronic music", 6.74], ["house music", 6.42]], null, [["music", 28.78], ["speech", 15.28], ["musical instrument", 5.05]], null, null, null, null, null, null, null, null], "duration": [4.2, 1.48, 8.06, 2.58, 21.42, 1.54, 19.03, 1.66, 0.2, 0.25, 0.31, -0.36, 1.31, 0.76, 0.47]} \ No newline at end of file diff --git a/annotations_1/OzliqFzK36E_filtered.json b/annotations_1/OzliqFzK36E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..723e1332794a841b4f438c754c9218e74751badd --- /dev/null +++ b/annotations_1/OzliqFzK36E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 39.19], [40.0, 55.14]], "keep_status": [false, false], "silence_prob": [30.3, 29.09], "audiomae_on_audioset": [[["music", 48.74], ["hum", 16.89], ["electronic music", 7.93]], [["music", 45.1], ["speech", 22.19], ["throbbing", 7.43]]], "duration": [22.19, 15.14]} \ No newline at end of file diff --git a/annotations_1/P-KZ7N30lFY_filtered.json b/annotations_1/P-KZ7N30lFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95cb9fab9f02e05e190ea7be02356d5f6372ac6e --- /dev/null +++ b/annotations_1/P-KZ7N30lFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.84], [16.0, 16.77], [18.0, 18.2], [18.0, 27.46], [28.0, 28.9], [29.0, 29.94], [31.0, 34.18], [34.0, 37.03], [38.0, 39.09], [40.0, 40.53], [41.0, 42.09], [43.0, 44.1], [48.0, 48.27], [49.0, 54.35], [64.0, 64.96], [68.0, 100.82], [105.0, 106.19], [110.0, 123.18], [132.0, 134.1]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 44.01, 0.0, 0.0, 87.0, 45.27, 0.0, 0.0, 0.0, 0.0, 0.0, 28.67, 0.0, 0.0, 0.0, 29.1, 31.65], "audiomae_on_audioset": [null, null, null, [["livestock, farm animals, working animals", 36.94], ["cattle, bovinae", 34.99], ["moo", 24.76]], null, null, null, [["speech", 50.72], ["whale vocalization", 7.44], ["sine wave", 4.79]], null, null, null, null, null, [["speech", 65.95], ["vehicle", 13.65], ["music", 3.74]], null, null, null, [["music", 61.94], ["buzz", 20.96], ["electronic music", 2.41]], [["speech", 24.62], ["bee, wasp, etc.", 15.48], ["fly, housefly", 14.47]]], "duration": [0.84, 0.77, 0.2, 9.46, 0.9, 0.94, 3.18, 3.03, 1.09, 0.53, 1.09, 1.1, 0.27, 5.35, 0.96, 32.82, 1.19, 13.18, 2.1]} \ No newline at end of file diff --git a/annotations_1/P-mT2D6iM5k_filtered.json b/annotations_1/P-mT2D6iM5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1401a7e2bba4a71a5e9679c36be8de8e1ca92555 --- /dev/null +++ b/annotations_1/P-mT2D6iM5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 32.39], [34.0, 44.34], [49.0, 50.09], [55.0, 55.22], [59.0, 83.15], [84.0, 85.02], [87.0, 89.16], [90.0, 99.42]], "keep_status": [true, true, false, false, false, false, true, true], "silence_prob": [29.65, 29.96, 0.0, 0.0, 28.92, 0.0, 30.77, 29.19], "audiomae_on_audioset": [[["music", 32.16], ["hum", 16.32], ["speech", 12.25]], [["music", 25.54], ["speech", 18.21], ["hum", 5.09]], null, null, [["speech", 43.84], ["music", 29.55], ["throbbing", 6.02]], null, [["boing", 14.47], ["music", 13.01], ["drum", 7.75]], [["speech", 30.96], ["vehicle", 17.05], ["music", 9.82]]], "duration": [14.39, 10.34, 1.09, 0.22, 24.15, 1.02, 2.16, 9.42]} \ No newline at end of file diff --git a/annotations_1/P20hrE8pmoI_filtered.json b/annotations_1/P20hrE8pmoI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a6815fed41e8c830459faf6a8889929c61f58ce --- /dev/null +++ b/annotations_1/P20hrE8pmoI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [3.0, 3.91], [8.0, 12.36], [15.0, 16.77], [23.0, 23.65], [25.0, 26.57], [29.0, 29.22], [30.0, 29.81], [30.0, 32.24], [34.0, 34.01], [34.0, 34.64], [35.0, 35.82], [37.0, 37.61], [39.0, 40.54], [46.0, 49.2], [50.0, 52.25], [54.0, 55.02], [55.0, 57.55], [59.0, 59.02], [60.0, 59.75], [63.0, 69.26], [70.0, 71.34], [77.0, 81.38], [86.0, 109.59], [111.0, 111.23], [112.0, 112.36]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 36.02, 0.0, 0.0, 0.0, 0.0, 0.0, 54.5, 0.0, 0.0, 0.0, 0.0, 0.0, 64.07, 75.07, 0.0, 49.78, 0.0, 0.0, 40.28, 0.0, 32.36, 32.87, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 28.88], ["cattle, bovinae", 14.23], ["livestock, farm animals, working animals", 13.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 29.8], ["insect", 17.42], ["music", 10.87]], null, null, [["speech", 55.85], ["sidetone", 19.73], ["radio", 4.56]], null, [["livestock, farm animals, working animals", 19.03], ["ding", 14.08], ["clang", 8.81]], [["fart", 55.58], ["speech", 14.73], ["buzz", 7.48]], null, null], "duration": [0.53, 0.91, 4.36, 1.77, 0.65, 1.57, 0.22, -0.19, 2.24, 0.01, 0.64, 0.82, 0.61, 1.54, 3.2, 2.25, 1.02, 2.55, 0.02, -0.25, 6.26, 1.34, 4.38, 23.59, 0.23, 0.36]} \ No newline at end of file diff --git a/annotations_1/P27sTXSGrhQ_filtered.json b/annotations_1/P27sTXSGrhQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3524f2c4e4245797985a3a2601e46f54f79773c8 --- /dev/null +++ b/annotations_1/P27sTXSGrhQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 41.34], [43.0, 43.58], [50.0, 54.09], [60.0, 70.95], [72.0, 75.34]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.99, 99.93, 99.73], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.34, 0.58, 4.09, 10.95, 3.34]} \ No newline at end of file diff --git a/annotations_1/P2rpcVDPZEY_filtered.json b/annotations_1/P2rpcVDPZEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7ed04fc8ad9fcd240cffeb842b260e157ba5b26 --- /dev/null +++ b/annotations_1/P2rpcVDPZEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [16.0, 15.92], [21.0, 21.93], [28.0, 28.93], [39.0, 39.26], [45.0, 44.74], [46.0, 47.39], [54.0, 54.09], [57.0, 57.55], [61.0, 61.5], [69.0, 69.62], [71.0, 71.1], [78.0, 88.89], [92.0, 92.79], [97.0, 96.77], [104.0, 104.75], [108.0, 108.77], [115.0, 114.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, -0.08, 0.93, 0.93, 0.26, -0.26, 1.39, 0.09, 0.55, 0.5, 0.62, 0.1, 10.89, 0.79, -0.23, 0.75, 0.77, -0.01]} \ No newline at end of file diff --git a/annotations_1/P3Mo5t61kO4_filtered.json b/annotations_1/P3Mo5t61kO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b33317dc4150d312ddee548d112fddc990cf57d --- /dev/null +++ b/annotations_1/P3Mo5t61kO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.29], [12.0, 12.02], [16.0, 16.23], [17.0, 17.63], [19.0, 18.86], [22.0, 22.52], [23.0, 26.55], [33.0, 33.69], [38.0, 39.65], [42.0, 43.56], [44.0, 45.12], [49.0, 49.1], [56.0, 56.83], [59.0, 59.34], [62.0, 68.0], [69.0, 72.67], [74.0, 74.93], [76.0, 77.45], [80.0, 80.7], [83.0, 82.75], [88.0, 88.87], [91.0, 91.3], [91.0, 91.49], [92.0, 92.75], [94.0, 94.63], [97.0, 96.89], [97.0, 98.25], [100.0, 101.61], [103.0, 103.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.77, 37.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 26.55], ["mains hum", 22.1], ["frog", 6.55]], [["frog", 75.61], ["croak", 20.65], ["sidetone", 0.72]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 0.02, 0.23, 0.63, -0.14, 0.52, 3.55, 0.69, 1.65, 1.56, 1.12, 0.1, 0.83, 0.34, 6.0, 3.67, 0.93, 1.45, 0.7, -0.25, 0.87, 0.3, 0.49, 0.75, 0.63, -0.11, 1.25, 1.61, 0.67]} \ No newline at end of file diff --git a/annotations_1/P4aGofKtJsA_filtered.json b/annotations_1/P4aGofKtJsA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3938f22d1e631819b2e9ee02c63c4f4cd2f4fdbd --- /dev/null +++ b/annotations_1/P4aGofKtJsA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.8], [14.0, 14.55], [17.0, 20.04], [23.0, 22.87], [27.0, 28.54], [34.0, 35.02], [36.0, 36.66], [37.0, 38.11], [39.0, 40.39], [47.0, 46.7], [56.0, 56.83], [68.0, 68.22], [83.0, 84.06], [89.0, 89.75], [103.0, 103.76], [105.0, 105.33], [115.0, 117.53], [122.0, 122.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 32.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.82, 0.0], "audiomae_on_audioset": [null, null, [["music", 73.25], ["rock and roll", 3.78], ["roll", 2.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.39], ["whip", 24.03], ["boing", 5.21]], null], "duration": [0.8, 0.55, 3.04, -0.13, 1.54, 1.02, 0.66, 1.11, 1.39, -0.3, 0.83, 0.22, 1.06, 0.75, 0.76, 0.33, 2.53, 0.23]} \ No newline at end of file diff --git a/annotations_1/P5kDAUzl-T4_filtered.json b/annotations_1/P5kDAUzl-T4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af8c177506d43ab8bfdc898ed1f734c4b7ec029f --- /dev/null +++ b/annotations_1/P5kDAUzl-T4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 85.68], [86.0, 94.19], [99.0, 106.22], [108.0, 119.97]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 87.92, 60.89, 31.84], "audiomae_on_audioset": [null, null, null, [["speech", 37.44], ["music", 9.11], ["mains hum", 7.54]]], "duration": [65.68, 8.19, 7.22, 11.97]} \ No newline at end of file diff --git a/annotations_1/P6c_kQL3ZdU_filtered.json b/annotations_1/P6c_kQL3ZdU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27a182abdb2595eb245a55c7babd97868921af0e --- /dev/null +++ b/annotations_1/P6c_kQL3ZdU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.64], [12.0, 14.52], [15.0, 18.13], [20.0, 20.02], [21.0, 21.34], [22.0, 22.38], [24.0, 24.53], [26.0, 27.3], [29.0, 29.37], [32.0, 32.8], [51.0, 51.24], [65.0, 65.15], [68.0, 69.48], [85.0, 85.89], [95.0, 96.42], [107.0, 108.18], [109.0, 110.54], [113.0, 113.93], [116.0, 117.59], [121.0, 123.45], [125.0, 126.72], [130.0, 132.14], [133.0, 135.04], [135.0, 140.51], [143.0, 147.83], [149.0, 149.44], [150.0, 154.95]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, true, false, true], "silence_prob": [31.04, 57.97, 29.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.54, 0.0, 42.51, 29.72, 29.82, 30.45, 0.0, 29.67], "audiomae_on_audioset": [[["music", 17.08], ["thunk", 15.05], ["synthesizer", 10.9]], null, [["whale vocalization", 23.37], ["music", 11.53], ["hum", 7.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.06], ["hum", 4.52], ["singing bowl", 2.86]], null, [["hum", 32.71], ["mains hum", 13.03], ["music", 9.61]], [["music", 34.02], ["speech", 31.28], ["whip", 5.12]], [["music", 41.48], ["throbbing", 13.48], ["speech", 6.99]], [["speech", 25.09], ["whale vocalization", 23.08], ["music", 5.92]], null, [["music", 34.19], ["whale vocalization", 23.33], ["electronic music", 5.8]]], "duration": [2.64, 2.52, 3.13, 0.02, 0.34, 0.38, 0.53, 1.3, 0.37, 0.8, 0.24, 0.15, 1.48, 0.89, 1.42, 1.18, 1.54, 0.93, 1.59, 2.45, 1.72, 2.14, 2.04, 5.51, 4.83, 0.44, 4.95]} \ No newline at end of file diff --git a/annotations_1/P7-rs7H1CAE_filtered.json b/annotations_1/P7-rs7H1CAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a070f31d5e436ffa2d933966425f5e552ba5727 --- /dev/null +++ b/annotations_1/P7-rs7H1CAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.91], [12.0, 12.53], [15.0, 17.15], [18.0, 18.17], [19.0, 19.35], [20.0, 21.36], [24.0, 25.64], [28.0, 27.65], [28.0, 27.73], [34.0, 34.8], [35.0, 38.91], [41.0, 55.48], [59.0, 64.03], [66.0, 68.0], [69.0, 70.04], [77.0, 77.48], [77.0, 78.58], [80.0, 92.26], [92.0, 92.42], [93.0, 92.8], [93.0, 92.85], [93.0, 93.07], [94.0, 94.1], [97.0, 97.66], [98.0, 108.19], [111.0, 110.98], [111.0, 111.89], [114.0, 116.75], [123.0, 124.95]], "keep_status": [true, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [33.08, 0.0, 33.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.76, 32.1, 35.2, 35.88, 0.0, 0.0, 0.0, 35.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.79, 0.0, 0.0, 33.99, 0.0], "audiomae_on_audioset": [[["music", 26.36], ["sidetone", 23.3], ["speech", 20.2]], null, [["music", 28.84], ["crowd", 6.55], ["speech", 6.52]], null, null, null, null, null, null, null, [["speech", 16.6], ["music", 14.99], ["hum", 10.92]], [["speech", 51.82], ["music", 16.52], ["vehicle", 8.48]], [["music", 38.71], ["throbbing", 10.03], ["sidetone", 9.87]], [["music", 67.14], ["speech", 4.68], ["boing", 3.62]], null, null, null, [["music", 52.37], ["speech", 15.75], ["animal", 2.18]], null, null, null, null, null, null, [["speech", 41.95], ["music", 24.78], ["fart", 3.43]], null, null, [["music", 28.1], ["speech", 23.26], ["hum", 6.05]], null], "duration": [5.91, 0.53, 2.15, 0.17, 0.35, 1.36, 1.64, -0.35, -0.27, 0.8, 3.91, 14.48, 5.03, 2.0, 1.04, 0.48, 1.58, 12.26, 0.42, -0.2, -0.15, 0.07, 0.1, 0.66, 10.19, -0.02, 0.89, 2.75, 1.95]} \ No newline at end of file diff --git a/annotations_1/P8ZCZJpluDA_filtered.json b/annotations_1/P8ZCZJpluDA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca246ab37b7d58eef7cf48e61dae03640fc1c7e6 --- /dev/null +++ b/annotations_1/P8ZCZJpluDA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.88], [7.0, 12.28], [19.0, 19.74], [22.0, 23.26], [25.0, 25.29], [26.0, 26.91], [31.0, 30.81], [36.0, 36.49], [43.0, 44.46], [48.0, 48.47], [55.0, 58.02], [59.0, 60.02], [65.0, 66.19], [67.0, 67.74], [69.0, 76.79], [82.0, 83.49], [85.0, 85.16], [86.0, 86.14], [89.0, 89.85], [92.0, 92.13], [98.0, 100.06], [108.0, 108.67], [114.0, 114.94], [120.0, 120.11], [120.0, 121.44], [123.0, 125.73], [130.0, 130.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.95, 0.0, 0.0, 0.0, 35.8, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["burping, eructation", 28.39], ["music", 13.41], ["hum", 8.28]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.88, 5.28, 0.74, 1.26, 0.29, 0.91, -0.19, 0.49, 1.46, 0.47, 3.02, 1.02, 1.19, 0.74, 7.79, 1.49, 0.16, 0.14, 0.85, 0.13, 2.06, 0.67, 0.94, 0.11, 1.44, 2.73, 0.42]} \ No newline at end of file diff --git a/annotations_1/P94mqkWtfxU_filtered.json b/annotations_1/P94mqkWtfxU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6d916a68db4f5113cf3bb32cc179c18ae444b9f --- /dev/null +++ b/annotations_1/P94mqkWtfxU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 25.44], [34.0, 35.6], [40.0, 52.64], [55.0, 54.82], [58.0, 64.61], [65.0, 66.77], [67.0, 84.82], [92.0, 97.92], [100.0, 103.05], [103.0, 103.87], [104.0, 120.09], [121.0, 124.75], [126.0, 130.86], [135.0, 155.51], [166.0, 165.96]], "keep_status": [false, false, false, false, true, false, false, true, false, false, true, true, true, true, false], "silence_prob": [31.86, 0.0, 31.5, 0.0, 36.11, 0.0, 34.11, 37.27, 33.99, 0.0, 33.1, 35.62, 33.4, 33.06, 0.0], "audiomae_on_audioset": [[["music", 63.71], ["hum", 5.97], ["throbbing", 3.54]], null, [["speech", 50.57], ["fart", 19.74], ["music", 5.21]], null, [["music", 28.72], ["throbbing", 17.87], ["boing", 10.5]], null, [["music", 47.33], ["speech", 25.53], ["didgeridoo", 8.29]], [["chirp tone", 28.72], ["hum", 10.43], ["music", 6.91]], [["groan", 39.2], ["music", 25.83], ["noise", 8.47]], null, [["music", 39.52], ["groan", 25.11], ["speech", 5.01]], [["music", 54.14], ["fart", 7.51], ["speech", 4.71]], [["throbbing", 27.62], ["hum", 16.81], ["speech", 15.47]], [["music", 42.79], ["fly, housefly", 8.03], ["throbbing", 6.63]], null], "duration": [14.44, 1.6, 12.64, -0.18, 6.61, 1.77, 17.82, 5.92, 3.05, 0.87, 16.09, 3.75, 4.86, 20.51, -0.04]} \ No newline at end of file diff --git a/annotations_1/P9jJ6Bejayg_filtered.json b/annotations_1/P9jJ6Bejayg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ae4b1989f55a52beeb90acbe0462e19c9991379 --- /dev/null +++ b/annotations_1/P9jJ6Bejayg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 28.86], [35.0, 35.6], [41.0, 41.4], [49.0, 76.2], [78.0, 104.01], [105.0, 112.26], [116.0, 116.9], [121.0, 122.12], [134.0, 135.77], [136.0, 137.47], [138.0, 138.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.1, 30.23, 31.33, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["mains hum", 39.08], ["hum", 36.44], ["electric shaver, electric razor", 5.83]], [["music", 44.65], ["throbbing", 22.28], ["hum", 16.95]], [["hum", 46.39], ["throbbing", 31.86], ["music", 8.13]], null, null, null, null, null], "duration": [-0.14, 0.6, 0.4, 27.2, 26.01, 7.26, 0.9, 1.12, 1.77, 1.47, 0.94]} \ No newline at end of file diff --git a/annotations_1/PAw7vAf6HMg_filtered.json b/annotations_1/PAw7vAf6HMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1842ea5468d88f63e63d96b499cffaca17e40ca --- /dev/null +++ b/annotations_1/PAw7vAf6HMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.26], [5.0, 7.26], [8.0, 8.55], [14.0, 15.09], [16.0, 16.7], [37.0, 37.83], [39.0, 39.93], [42.0, 42.85], [44.0, 44.49], [48.0, 48.66], [54.0, 54.58], [89.0, 89.58], [90.0, 90.78], [93.0, 93.83], [94.0, 94.96], [96.0, 97.19], [99.0, 99.06], [100.0, 100.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.26, 2.26, 0.55, 1.09, 0.7, 0.83, 0.93, 0.85, 0.49, 0.66, 0.58, 0.58, 0.78, 0.83, 0.96, 1.19, 0.06, 0.87]} \ No newline at end of file diff --git a/annotations_1/PB-KpT4zhWo_filtered.json b/annotations_1/PB-KpT4zhWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fa3d37c4df86500dddaca59b37e33c46eda2c71 --- /dev/null +++ b/annotations_1/PB-KpT4zhWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 18.81], [20.0, 22.86], [24.0, 24.83], [32.0, 45.55], [47.0, 48.76], [49.0, 53.3], [54.0, 54.89], [58.0, 59.07], [61.0, 62.29], [64.0, 64.17], [64.0, 69.38], [70.0, 72.45], [80.0, 81.58], [82.0, 84.0], [86.0, 89.53], [90.0, 97.51], [98.0, 100.3], [102.0, 103.01], [104.0, 153.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false], "silence_prob": [100.0, 98.8, 0.0, 81.53, 0.0, 33.15, 0.0, 0.0, 0.0, 0.0, 68.93, 34.15, 0.0, 32.85, 37.67, 31.18, 39.35, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 54.16], ["thunk", 21.87], ["music", 3.99]], null, null, null, null, null, [["speech", 45.93], ["music", 17.84], ["rumble", 7.72]], null, [["music", 47.9], ["sidetone", 6.04], ["effects unit", 5.46]], [["speech", 34.91], ["sidetone", 12.5], ["music", 10.63]], [["speech", 59.13], ["machine gun", 6.26], ["gunshot, gunfire", 5.56]], [["music", 17.36], ["gasp", 10.33], ["synthesizer", 9.08]], null, null], "duration": [12.81, 2.86, 0.83, 13.55, 1.76, 4.3, 0.89, 1.07, 1.29, 0.17, 5.38, 2.45, 1.58, 2.0, 3.53, 7.51, 2.3, 1.01, 49.57]} \ No newline at end of file diff --git a/annotations_1/PBHYbeg2nao_filtered.json b/annotations_1/PBHYbeg2nao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f4bb5cdab1616c4d85ceedf687ece230b2c9f30 --- /dev/null +++ b/annotations_1/PBHYbeg2nao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.37], [7.0, 7.77], [9.0, 9.49], [11.0, 11.92], [13.0, 14.54], [15.0, 15.7], [16.0, 16.29], [23.0, 23.08], [34.0, 35.36], [36.0, 36.39], [39.0, 39.9], [44.0, 45.0], [57.0, 58.06], [59.0, 59.88], [60.0, 60.51], [61.0, 61.47], [65.0, 65.57], [71.0, 72.2], [76.0, 76.38], [81.0, 81.11], [83.0, 83.61], [84.0, 84.47], [86.0, 87.17], [88.0, 88.4], [90.0, 92.52], [93.0, 94.88], [107.0, 107.94], [117.0, 118.29], [120.0, 121.24], [122.0, 122.2], [129.0, 130.89], [133.0, 132.81], [158.0, 158.38], [176.0, 176.42], [177.0, 177.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.37, 0.77, 0.49, 0.92, 1.54, 0.7, 0.29, 0.08, 1.36, 0.39, 0.9, 1.0, 1.06, 0.88, 0.51, 0.47, 0.57, 1.2, 0.38, 0.11, 0.61, 0.47, 1.17, 0.4, 2.52, 1.88, 0.94, 1.29, 1.24, 0.2, 1.89, -0.19, 0.38, 0.42, 0.23]} \ No newline at end of file diff --git a/annotations_1/PBVW7az0PkM_filtered.json b/annotations_1/PBVW7az0PkM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fefdea1ea67fea9a9a8ef61ea802098d37a5eb8 --- /dev/null +++ b/annotations_1/PBVW7az0PkM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [11.0, 11.16], [14.0, 14.37], [16.0, 18.69], [19.0, 28.51], [33.0, 33.49], [38.0, 39.01], [44.0, 45.12], [46.0, 49.52], [58.0, 58.23], [61.0, 61.26], [64.0, 65.06], [65.0, 68.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 69.61, 57.89, 0.0, 0.0, 0.0, 49.04, 0.0, 0.0, 0.0, 65.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 57.23], ["sidetone", 20.05], ["radio", 2.9]], null, null, null, null], "duration": [0.84, 0.16, 0.37, 2.69, 9.51, 0.49, 1.01, 1.12, 3.52, 0.23, 0.26, 1.06, 3.05]} \ No newline at end of file diff --git a/annotations_1/PBaQezez_UU_filtered.json b/annotations_1/PBaQezez_UU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6226b4da4a9863fc3b94caeda687e08ec3c36b0 --- /dev/null +++ b/annotations_1/PBaQezez_UU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.4], [7.0, 8.61], [9.0, 13.78], [16.0, 18.22], [19.0, 19.58], [20.0, 22.22], [24.0, 24.07], [26.0, 26.25], [27.0, 29.37], [32.0, 32.34], [35.0, 35.43], [37.0, 37.2], [41.0, 41.99], [43.0, 44.27], [46.0, 46.41], [48.0, 48.46], [53.0, 52.96], [57.0, 62.83], [64.0, 74.85], [78.0, 81.82], [82.0, 91.29], [94.0, 118.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 49.92, 91.81, 0.0, 84.62, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.34, 75.07, 90.78, 35.07, 29.24], "audiomae_on_audioset": [null, null, [["speech", 49.5], ["hum", 16.28], ["mains hum", 7.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.85], ["glass", 9.89], ["music", 6.28]], [["speech", 74.26], ["whack, thwack", 14.42], ["music", 2.44]]], "duration": [0.4, 1.61, 4.78, 2.22, 0.58, 2.22, 0.07, 0.25, 2.37, 0.34, 0.43, 0.2, 0.99, 1.27, 0.41, 0.46, -0.04, 5.83, 10.85, 3.82, 9.29, 24.03]} \ No newline at end of file diff --git a/annotations_1/PCn1uAs_0VQ_filtered.json b/annotations_1/PCn1uAs_0VQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8985a339c29d3eb9750b8817cd131ce3da8b19a8 --- /dev/null +++ b/annotations_1/PCn1uAs_0VQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.14], [25.0, 28.27], [29.0, 28.71], [29.0, 30.3], [31.0, 33.49], [34.0, 40.0], [40.0, 40.46], [52.0, 69.36], [71.0, 71.47], [73.0, 83.03], [84.0, 88.82], [91.0, 128.39], [129.0, 129.44]], "keep_status": [false, false, false, false, true, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 53.47, 0.0, 0.0, 39.02, 34.94, 0.0, 65.91, 0.0, 49.73, 36.24, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 28.37], ["livestock, farm animals, working animals", 25.89], ["cattle, bovinae", 12.86]], [["grunt", 38.92], ["groan", 14.43], ["outside, rural or natural", 6.45]], null, null, null, [["music", 34.37], ["hum", 17.5], ["throbbing", 14.24]], [["speech", 51.66], ["music", 11.31], ["hum", 8.47]], null, null], "duration": [1.14, 3.27, -0.29, 1.3, 2.49, 6.0, 0.46, 17.36, 0.47, 10.03, 4.82, 37.39, 0.44]} \ No newline at end of file diff --git a/annotations_1/PD4Gq5GPcN8_filtered.json b/annotations_1/PD4Gq5GPcN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b425761326d31c539972375e5f7d4f16359d4d80 --- /dev/null +++ b/annotations_1/PD4Gq5GPcN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.4], [10.0, 15.47], [16.0, 17.78], [19.0, 25.66], [28.0, 71.71], [76.0, 76.6], [80.0, 83.64], [87.0, 87.83], [92.0, 93.28], [100.0, 101.19]], "keep_status": [false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 48.65, 0.0, 36.84, 0.0, 0.0, 51.66, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 29.73], ["music", 21.3], ["animal", 6.46]], null, [["music", 17.86], ["hum", 11.18], ["fowl", 10.9]], null, null, null, null, null, null], "duration": [1.4, 5.47, 1.78, 6.66, 43.71, 0.6, 3.64, 0.83, 1.28, 1.19]} \ No newline at end of file diff --git a/annotations_1/PDnA3LOm-xY_filtered.json b/annotations_1/PDnA3LOm-xY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..251e737076b8c8a91b3944629289e1605564d7ea --- /dev/null +++ b/annotations_1/PDnA3LOm-xY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.24], [16.0, 16.9], [19.0, 20.87], [23.0, 22.69], [27.0, 27.11], [31.0, 31.75], [41.0, 41.28], [44.0, 44.42], [48.0, 48.07], [49.0, 49.65], [58.0, 58.28], [62.0, 62.61], [64.0, 64.84], [69.0, 69.35], [72.0, 73.38], [75.0, 77.67], [81.0, 92.57], [98.0, 98.71], [101.0, 101.7], [103.0, 103.18], [137.0, 138.23], [139.0, 139.68], [140.0, 140.66], [141.0, 141.79], [155.0, 158.63], [160.0, 160.25], [178.0, 178.44], [180.0, 181.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.69, 37.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 32.53], ["hum", 17.78], ["music", 5.72]], [["throbbing", 38.14], ["hum", 34.1], ["music", 14.02]], null, null, null, null, null, null, null, [["clang", 35.21], ["ding", 31.56], ["coin (dropping)", 5.2]], null, null, null], "duration": [0.24, 0.9, 1.87, -0.31, 0.11, 0.75, 0.28, 0.42, 0.07, 0.65, 0.28, 0.61, 0.84, 0.35, 1.38, 2.67, 11.57, 0.71, 0.7, 0.18, 1.23, 0.68, 0.66, 0.79, 3.63, 0.25, 0.44, 1.55]} \ No newline at end of file diff --git a/annotations_1/PECLt8uCcRk_filtered.json b/annotations_1/PECLt8uCcRk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b14e09c045cb0414ebf2bc86e4c84d0b8fe2f8c5 --- /dev/null +++ b/annotations_1/PECLt8uCcRk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [5.0, 5.8], [7.0, 8.04], [9.0, 9.24], [15.0, 15.82], [17.0, 17.59], [19.0, 19.01], [21.0, 22.01], [23.0, 22.6], [23.0, 22.79], [23.0, 22.92], [23.0, 23.08], [24.0, 24.54], [25.0, 26.97], [30.0, 34.13], [35.0, 35.73], [37.0, 38.94], [40.0, 41.89], [49.0, 51.11], [61.0, 62.38], [63.0, 66.63], [67.0, 72.79], [73.0, 75.42], [77.0, 77.14], [79.0, 79.46], [81.0, 82.11], [84.0, 101.22], [102.0, 111.82], [113.0, 116.55], [121.0, 145.71], [146.0, 145.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.7, 0.0, 0.0, 0.0, 35.56, 0.0, 34.91, 65.67, 75.23, 0.0, 0.0, 0.0, 30.14, 32.2, 54.7, 36.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.52], ["music", 19.51], ["mains hum", 6.11]], null, null, null, [["chirp tone", 27.75], ["hum", 13.66], ["sine wave", 10.3]], null, [["speech", 12.36], ["music", 12.29], ["hum", 10.5]], null, null, null, null, null, [["whack, thwack", 25.85], ["whip", 11.57], ["thump, thud", 9.67]], [["hum", 31.17], ["throbbing", 29.06], ["speech", 8.85]], null, [["music", 56.66], ["hum", 12.33], ["throbbing", 6.23]], null], "duration": [0.6, 0.8, 1.04, 0.24, 0.82, 0.59, 0.01, 1.01, -0.4, -0.21, -0.08, 0.08, 0.54, 1.97, 4.13, 0.73, 1.94, 1.89, 2.11, 1.38, 3.63, 5.79, 2.42, 0.14, 0.46, 1.11, 17.22, 9.82, 3.55, 24.71, -0.06]} \ No newline at end of file diff --git a/annotations_1/PF2hIgWupGU_filtered.json b/annotations_1/PF2hIgWupGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be1b6b8207cf43cc70d349051bd8f4ce7c8c08e2 --- /dev/null +++ b/annotations_1/PF2hIgWupGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.87], [4.0, 3.91], [4.0, 3.94], [8.0, 9.02], [10.0, 14.86], [18.0, 28.68], [32.0, 35.75], [42.0, 50.01], [55.0, 56.02], [64.0, 64.4], [66.0, 66.31], [66.0, 66.34], [66.0, 72.4], [74.0, 90.19], [96.0, 96.47], [98.0, 98.44]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.9, 32.04, 33.27, 32.22, 0.0, 0.0, 0.0, 0.0, 51.07, 36.96, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 67.46], ["musical instrument", 3.56], ["throbbing", 1.81]], [["music", 57.88], ["speech", 4.25], ["electronic music", 2.96]], [["music", 67.54], ["electronic music", 3.3], ["throbbing", 3.21]], [["music", 45.58], ["hum", 11.96], ["didgeridoo", 7.97]], null, null, null, null, null, [["music", 57.03], ["hum", 9.67], ["mains hum", 7.34]], null, null], "duration": [0.87, -0.09, -0.06, 1.02, 4.86, 10.68, 3.75, 8.01, 1.02, 0.4, 0.31, 0.34, 6.4, 16.19, 0.47, 0.44]} \ No newline at end of file diff --git a/annotations_1/PGbBz0m0pTc_filtered.json b/annotations_1/PGbBz0m0pTc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..694fcc7d0677f73ae7ba13474d225e5ec3ef858e --- /dev/null +++ b/annotations_1/PGbBz0m0pTc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 40.73], [41.0, 43.24], [44.0, 44.66], [52.0, 53.59], [54.0, 55.83], [60.0, 59.73], [61.0, 61.91], [64.0, 64.64], [66.0, 66.24], [67.0, 68.01], [69.0, 69.57], [71.0, 71.73], [74.0, 75.29], [77.0, 137.62], [139.0, 139.24], [142.0, 143.73], [144.0, 148.32], [149.0, 157.65], [159.0, 159.65], [162.0, 162.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.79, 70.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.03, 72.46, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 49.15], ["hum", 35.6], ["music", 4.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [26.73, 2.24, 0.66, 1.59, 1.83, -0.27, 0.91, 0.64, 0.24, 1.01, 0.57, 0.73, 1.29, 60.62, 0.24, 1.73, 4.32, 8.65, 0.65, 0.48]} \ No newline at end of file diff --git a/annotations_1/PHJisUS7KSg_filtered.json b/annotations_1/PHJisUS7KSg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b62e269d79138449986aef8f08abc88adeb64c49 --- /dev/null +++ b/annotations_1/PHJisUS7KSg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 18.25], [21.0, 68.99], [70.0, 71.74], [72.0, 80.3], [83.0, 87.22], [90.0, 93.61], [94.0, 95.23], [96.0, 97.95], [101.0, 104.8], [110.0, 168.98], [170.0, 191.44]], "keep_status": [false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [32.7, 0.0, 0.0, 30.47, 29.14, 28.97, 0.0, 0.0, 28.76, 0.0, 29.47], "audiomae_on_audioset": [[["hum", 29.44], ["throbbing", 29.04], ["music", 23.32]], null, null, [["music", 56.29], ["hum", 17.86], ["throbbing", 9.1]], [["music", 40.95], ["throbbing", 25.14], ["hum", 12.39]], [["music", 37.46], ["speech", 16.29], ["throbbing", 11.5]], null, null, [["music", 31.27], ["electronic music", 6.58], ["throbbing", 5.37]], null, [["throbbing", 24.42], ["hum", 22.98], ["music", 18.67]]], "duration": [4.25, 47.99, 1.74, 8.3, 4.22, 3.61, 1.23, 1.95, 3.8, 58.98, 21.44]} \ No newline at end of file diff --git a/annotations_1/PI35KfPB7nM_filtered.json b/annotations_1/PI35KfPB7nM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a65cd8875cb340e7c6bafd670b53c0097c5bd54 --- /dev/null +++ b/annotations_1/PI35KfPB7nM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.77], [9.0, 9.63], [13.0, 17.1], [18.0, 21.42], [22.0, 37.76], [38.0, 38.2], [38.0, 38.26], [38.0, 38.91], [39.0, 40.17], [41.0, 43.43], [45.0, 48.05], [49.0, 50.43], [51.0, 67.02], [68.0, 81.48], [82.0, 87.02], [89.0, 90.68], [92.0, 93.5], [94.0, 98.39], [101.0, 104.43], [106.0, 108.19], [113.0, 118.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 100.0, 99.76, 99.87, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 99.99, 99.85, 100.0, 0.0, 0.0, 100.0, 34.07, 39.88, 39.08], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["snicker", 19.63], ["baby laughter", 8.94], ["chuckle, chortle", 7.51]], [["didgeridoo", 44.04], ["music", 13.48], ["inside, small room", 4.23]], [["snicker", 39.55], ["chuckle, chortle", 15.87], ["laughter", 11.23]]], "duration": [1.77, 0.63, 4.1, 3.42, 15.76, 0.2, 0.26, 0.91, 1.17, 2.43, 3.05, 1.43, 16.02, 13.48, 5.02, 1.68, 1.5, 4.39, 3.43, 2.19, 5.32]} \ No newline at end of file diff --git a/annotations_1/PI6Q87pjO0o_filtered.json b/annotations_1/PI6Q87pjO0o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2851bf68a6e58085321e293fb9434361bb7e95a8 --- /dev/null +++ b/annotations_1/PI6Q87pjO0o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [4.0, 4.41], [5.0, 7.43], [8.0, 8.88], [14.0, 14.13], [16.0, 17.27], [20.0, 20.34], [21.0, 22.59], [25.0, 26.54], [28.0, 29.0], [40.0, 42.3], [43.0, 44.78], [47.0, 47.49], [51.0, 51.61], [58.0, 59.22], [62.0, 62.16], [66.0, 66.77]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.15], ["speech", 13.81], ["sitar", 4.88]], null, null, null, null, null, null, null, [["music", 43.44], ["mains hum", 9.7], ["whip", 8.58]], null, null, null, null, null, null], "duration": [0.52, 0.41, 2.43, 0.88, 0.13, 1.27, 0.34, 1.59, 1.54, 1.0, 2.3, 1.78, 0.49, 0.61, 1.22, 0.16, 0.77]} \ No newline at end of file diff --git a/annotations_1/PI8G4wCa8m4_filtered.json b/annotations_1/PI8G4wCa8m4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70711e77247f5546282f9457773d5606c08128e6 --- /dev/null +++ b/annotations_1/PI8G4wCa8m4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [0.0, 0.3], [4.0, 6.1], [9.0, 10.07], [13.0, 12.9], [19.0, 28.86], [33.0, 33.51], [34.0, 40.49], [44.0, 45.3], [47.0, 47.87], [48.0, 48.36], [49.0, 52.0], [54.0, 54.78], [59.0, 60.12], [62.0, 62.99], [64.0, 67.96], [69.0, 69.89], [72.0, 72.94], [75.0, 76.54], [82.0, 82.86], [83.0, 82.92], [84.0, 84.16], [105.0, 106.89], [108.0, 109.43], [112.0, 113.66], [115.0, 115.23], [116.0, 120.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 44.18, 0.0, 0.0, 43.08, 0.0, 61.77, 0.0, 0.0, 0.0, 74.92, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.03], "audiomae_on_audioset": [null, null, [["thunk", 66.76], ["door", 5.6], ["creak", 3.28]], null, null, [["thunk", 86.96], ["speech", 3.61], ["breaking", 1.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 15.04], ["fart", 10.06], ["sound effect", 8.14]]], "duration": [0.04, 0.3, 2.1, 1.07, -0.1, 9.86, 0.51, 6.49, 1.3, 0.87, 0.36, 3.0, 0.78, 1.12, 0.99, 3.96, 0.89, 0.94, 1.54, 0.86, -0.08, 0.16, 1.89, 1.43, 1.66, 0.23, 4.16]} \ No newline at end of file diff --git a/annotations_1/PIHPbvviS2w_filtered.json b/annotations_1/PIHPbvviS2w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..030295a16abb2a38203bbac863de3c7f7a47d1cb --- /dev/null +++ b/annotations_1/PIHPbvviS2w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.39], [3.0, 3.5], [6.0, 7.35], [13.0, 16.04], [17.0, 17.05], [18.0, 18.25], [20.0, 19.95], [22.0, 24.61], [25.0, 25.56], [30.0, 30.94], [31.0, 31.58], [32.0, 32.22], [35.0, 35.99], [37.0, 44.81], [53.0, 54.41], [59.0, 61.57], [66.0, 66.31], [70.0, 70.73], [75.0, 75.0], [77.0, 80.87], [83.0, 87.3], [91.0, 91.94], [92.0, 96.48], [98.0, 102.69], [105.0, 109.05], [110.0, 115.77], [119.0, 122.1], [123.0, 127.5], [133.0, 133.76], [139.0, 139.55], [141.0, 142.94], [143.0, 144.88], [146.0, 148.2], [149.0, 154.63], [157.0, 160.74], [162.0, 167.39], [170.0, 172.84], [173.0, 173.52], [175.0, 194.73], [195.0, 196.47], [198.0, 197.55], [200.0, 200.38], [203.0, 205.87], [212.0, 212.7], [216.0, 217.16], [219.0, 219.28], [219.0, 220.18], [223.0, 224.29], [226.0, 226.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, true, true, false, false, false, false, true, true, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 61.97, 0.0, 0.0, 0.0, 54.36, 0.0, 0.0, 0.0, 0.0, 0.0, 46.75, 0.0, 34.43, 0.0, 0.0, 0.0, 35.23, 51.82, 0.0, 40.19, 43.13, 46.86, 43.56, 46.22, 32.18, 0.0, 0.0, 0.0, 0.0, 40.02, 38.4, 46.12, 37.56, 48.48, 0.0, 33.36, 0.0, 0.0, 0.0, 80.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.9], ["guitar", 14.4], ["musical instrument", 11.29]], null, [["music", 58.23], ["singing", 5.38], ["guitar", 4.07]], null, null, null, [["music", 49.29], ["speech", 12.82], ["guitar", 11.84]], null, null, [["music", 49.52], ["keyboard (musical)", 7.82], ["musical instrument", 7.47]], [["music", 55.34], ["electric piano", 10.83], ["keyboard (musical)", 5.44]], [["music", 46.4], ["musical instrument", 8.46], ["keyboard (musical)", 3.48]], [["music", 63.12], ["electric piano", 7.8], ["keyboard (musical)", 4.32]], [["music", 34.05], ["synthesizer", 8.37], ["effects unit", 8.33]], [["music", 56.84], ["musical instrument", 4.65], ["mantra", 3.2]], null, null, null, null, [["music", 55.07], ["musical instrument", 7.94], ["keyboard (musical)", 6.71]], [["music", 45.09], ["musical instrument", 12.26], ["guitar", 4.72]], [["music", 46.48], ["piano", 8.39], ["musical instrument", 7.54]], [["music", 54.03], ["electric piano", 14.52], ["keyboard (musical)", 6.76]], [["music", 53.42], ["chorus effect", 10.29], ["effects unit", 4.14]], null, [["music", 24.93], ["synthesizer", 15.78], ["effects unit", 9.79]], null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 0.5, 1.35, 3.04, 0.05, 0.25, -0.05, 2.61, 0.56, 0.94, 0.58, 0.22, 0.99, 7.81, 1.41, 2.57, 0.31, 0.73, 0.0, 3.87, 4.3, 0.94, 4.48, 4.69, 4.05, 5.77, 3.1, 4.5, 0.76, 0.55, 1.94, 1.88, 2.2, 5.63, 3.74, 5.39, 2.84, 0.52, 19.73, 1.47, -0.45, 0.38, 2.87, 0.7, 1.16, 0.28, 1.18, 1.29, 0.15]} \ No newline at end of file diff --git a/annotations_1/PJTb9EdYZDg_filtered.json b/annotations_1/PJTb9EdYZDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b27ece2a9e1e479ec3011a3d81a18d84cc6a13c --- /dev/null +++ b/annotations_1/PJTb9EdYZDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 94.1], [96.0, 100.8], [102.0, 105.27], [107.0, 107.55], [112.0, 115.89]], "keep_status": [false, true, true, false, true], "silence_prob": [0.0, 36.39, 37.53, 0.0, 36.02], "audiomae_on_audioset": [null, [["music", 42.46], ["throbbing", 12.4], ["hum", 11.53]], [["music", 53.24], ["throbbing", 7.36], ["hum", 5.78]], null, [["speech", 27.46], ["hum", 18.0], ["mains hum", 12.7]]], "duration": [41.1, 4.8, 3.27, 0.55, 3.89]} \ No newline at end of file diff --git a/annotations_1/PLOSA5L0dxE_filtered.json b/annotations_1/PLOSA5L0dxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c12a0f6c94a2de4c7ece363d1b54fc77a48d73c0 --- /dev/null +++ b/annotations_1/PLOSA5L0dxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.6], [4.0, 15.18], [19.0, 20.95], [22.0, 24.56], [31.0, 32.71], [35.0, 36.68], [39.0, 41.61], [44.0, 44.32], [47.0, 48.0], [49.0, 51.8], [53.0, 54.24], [54.0, 54.28], [54.0, 55.16], [56.0, 57.48], [59.0, 62.51], [69.0, 69.65], [77.0, 78.81], [83.0, 85.31], [87.0, 89.24], [91.0, 93.78], [96.0, 98.61], [105.0, 105.21], [106.0, 105.92], [112.0, 113.98], [116.0, 117.0], [121.0, 122.74], [127.0, 127.47], [131.0, 136.05], [149.0, 152.64], [157.0, 160.44], [161.0, 165.06]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, true, false, true], "silence_prob": [38.66, 48.02, 0.0, 62.68, 0.0, 0.0, 79.76, 0.0, 0.0, 83.7, 0.0, 0.0, 0.0, 0.0, 56.03, 0.0, 0.0, 53.84, 40.52, 35.33, 35.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.28, 39.19, 51.71, 38.88], "audiomae_on_audioset": [[["speech", 27.62], ["hum", 24.26], ["throbbing", 13.3]], [["crushing", 22.98], ["walk, footsteps", 10.25], ["thunk", 9.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["gong", 38.48], ["music", 16.4], ["singing bowl", 10.37]], [["singing bowl", 29.21], ["music", 24.81], ["gong", 9.55]], [["music", 40.66], ["singing bowl", 18.02], ["electronic music", 7.58]], null, null, null, null, null, null, [["hum", 40.8], ["mains hum", 19.43], ["music", 11.61]], [["music", 19.64], ["singing bowl", 19.31], ["speech", 11.22]], null, [["music", 27.75], ["hum", 21.39], ["electronic music", 9.63]]], "duration": [2.6, 11.18, 1.95, 2.56, 1.71, 1.68, 2.61, 0.32, 1.0, 2.8, 1.24, 0.28, 1.16, 1.48, 3.51, 0.65, 1.81, 2.31, 2.24, 2.78, 2.61, 0.21, -0.08, 1.98, 1.0, 1.74, 0.47, 5.05, 3.64, 3.44, 4.06]} \ No newline at end of file diff --git a/annotations_1/PLgNzEctkO4_filtered.json b/annotations_1/PLgNzEctkO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3ae4623817927b1157fa5851ffdd45126ea0a7f --- /dev/null +++ b/annotations_1/PLgNzEctkO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 59.48], [60.0, 70.51], [71.0, 78.38], [79.0, 104.63], [110.0, 113.07], [115.0, 153.0], [161.0, 162.82]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [97.64, 99.85, 91.47, 99.99, 99.96, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [14.48, 10.51, 7.38, 25.63, 3.07, 38.0, 1.82]} \ No newline at end of file diff --git a/annotations_1/PLr1f84fj8U_filtered.json b/annotations_1/PLr1f84fj8U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..518104cfc4e2b72f79c94909b85ccb24c938f00b --- /dev/null +++ b/annotations_1/PLr1f84fj8U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 76.98], [77.0, 101.22], [102.0, 102.22], [105.0, 108.68], [112.0, 167.95]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 31.31, 0.0, 35.1, 0.0], "audiomae_on_audioset": [null, [["music", 48.77], ["mains hum", 12.07], ["hum", 11.75]], null, [["music", 38.16], ["animal", 21.81], ["theremin", 11.39]], null], "duration": [38.98, 24.22, 0.22, 3.68, 55.95]} \ No newline at end of file diff --git a/annotations_1/PM8-Hmfy6OU_filtered.json b/annotations_1/PM8-Hmfy6OU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73eee6315889b8ac1a835b51faa8d1452f8170ab --- /dev/null +++ b/annotations_1/PM8-Hmfy6OU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.31], [10.0, 16.23], [18.0, 24.38], [28.0, 28.02], [30.0, 29.98], [34.0, 36.22], [50.0, 54.19], [55.0, 57.16], [60.0, 61.32], [62.0, 63.32], [66.0, 66.68], [68.0, 69.11], [70.0, 72.17], [74.0, 75.93], [81.0, 85.26], [88.0, 142.57]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 29.77, 28.62, 0.0, 0.0, 42.88, 37.53, 52.56, 0.0, 0.0, 0.0, 0.0, 43.77, 0.0, 30.3, 0.0], "audiomae_on_audioset": [null, [["hum", 43.44], ["mains hum", 21.44], ["music", 17.95]], [["music", 68.89], ["synthesizer", 5.58], ["noise", 2.82]], null, null, [["hum", 29.01], ["music", 14.95], ["sidetone", 14.23]], [["music", 69.07], ["didgeridoo", 6.42], ["musical instrument", 4.92]], null, null, null, null, null, [["animal", 27.67], ["domestic animals, pets", 10.2], ["dog", 7.6]], null, [["fly, housefly", 10.27], ["livestock, farm animals, working animals", 8.93], ["cattle, bovinae", 7.72]], null], "duration": [0.31, 6.23, 6.38, 0.02, -0.02, 2.22, 4.19, 2.16, 1.32, 1.32, 0.68, 1.11, 2.17, 1.93, 4.26, 54.57]} \ No newline at end of file diff --git a/annotations_1/PMjbPEGDJ7w_filtered.json b/annotations_1/PMjbPEGDJ7w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b553c06e404b150683ed5530fa816ae317653c1f --- /dev/null +++ b/annotations_1/PMjbPEGDJ7w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.38], [13.0, 18.79], [19.0, 27.55], [30.0, 30.52], [34.0, 41.66], [42.0, 47.76], [58.0, 60.86], [68.0, 73.03], [74.0, 78.24], [80.0, 80.57], [84.0, 85.33], [86.0, 86.59], [88.0, 94.15], [97.0, 102.05], [103.0, 105.71], [106.0, 128.09], [128.0, 135.82], [141.0, 185.67], [187.0, 188.64], [189.0, 194.76], [195.0, 195.44], [196.0, 197.19], [200.0, 200.45], [202.0, 203.18]], "keep_status": [true, true, false, false, false, false, false, false, true, false, false, false, true, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [29.21, 29.21, 30.53, 0.0, 28.69, 29.47, 30.82, 29.25, 30.63, 0.0, 0.0, 0.0, 29.11, 30.18, 28.77, 31.43, 40.22, 0.0, 0.0, 36.02, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["animal", 19.24], ["wild animals", 19.0], ["groan", 12.31]], [["music", 55.45], ["throbbing", 4.33], ["sound effect", 3.35]], [["speech", 49.86], ["whack, thwack", 21.44], ["music", 6.2]], null, [["hum", 41.48], ["music", 22.17], ["speech", 12.27]], [["whale vocalization", 44.81], ["music", 19.81], ["livestock, farm animals, working animals", 6.5]], [["hum", 30.86], ["mains hum", 24.32], ["throbbing", 18.87]], [["hum", 32.91], ["mains hum", 25.66], ["music", 14.75]], [["speech", 23.89], ["throbbing", 19.0], ["music", 18.98]], null, null, null, [["music", 20.24], ["throbbing", 19.39], ["whack, thwack", 11.67]], [["hum", 59.66], ["mains hum", 20.88], ["throbbing", 17.43]], [["whale vocalization", 18.72], ["vehicle", 13.03], ["motorcycle", 10.12]], [["speech", 51.44], ["hum", 14.32], ["throbbing", 9.35]], [["speech", 18.17], ["fly, housefly", 14.8], ["music", 9.36]], null, null, [["music", 59.74], ["synthesizer", 11.27], ["hum", 7.51]], null, null, null, null], "duration": [8.38, 5.79, 8.55, 0.52, 7.66, 5.76, 2.86, 5.03, 4.24, 0.57, 1.33, 0.59, 6.15, 5.05, 2.71, 22.09, 7.82, 44.67, 1.64, 5.76, 0.44, 1.19, 0.45, 1.18]} \ No newline at end of file diff --git a/annotations_1/POu3JnhEmT4_filtered.json b/annotations_1/POu3JnhEmT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f053f7e26b754498a1fdd15d1be4b8948bfe5c4f --- /dev/null +++ b/annotations_1/POu3JnhEmT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.32], [15.0, 19.3], [28.0, 29.15], [37.0, 37.39], [38.0, 38.77], [52.0, 52.37], [55.0, 56.1], [60.0, 60.98], [66.0, 66.34], [69.0, 69.94], [77.0, 77.04], [78.0, 78.34], [82.0, 82.75], [88.0, 88.15], [93.0, 93.06], [96.0, 96.3], [103.0, 104.03], [109.0, 109.53], [113.0, 113.31], [116.0, 116.23], [117.0, 118.99], [119.0, 120.24], [121.0, 121.31], [123.0, 123.25], [131.0, 131.84], [139.0, 139.16], [144.0, 144.85], [146.0, 147.82], [150.0, 150.65], [151.0, 151.82], [153.0, 154.16], [161.0, 168.69], [169.0, 169.4], [170.0, 170.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["rowboat, canoe, kayak", 33.78], ["boat, water vehicle", 6.69], ["bouncing", 6.42]], null, null], "duration": [0.32, 4.3, 1.15, 0.39, 0.77, 0.37, 1.1, 0.98, 0.34, 0.94, 0.04, 0.34, 0.75, 0.15, 0.06, 0.3, 1.03, 0.53, 0.31, 0.23, 1.99, 1.24, 0.31, 0.25, 0.84, 0.16, 0.85, 1.82, 0.65, 0.82, 1.16, 7.69, 0.4, 0.01]} \ No newline at end of file diff --git a/annotations_1/PPhxsJho48c_filtered.json b/annotations_1/PPhxsJho48c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78fb5ee6c5a322aa9748f9a96d66c61a18b05f8c --- /dev/null +++ b/annotations_1/PPhxsJho48c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.89], [9.0, 9.68], [13.0, 13.22], [14.0, 15.36], [16.0, 16.63], [19.0, 19.25], [22.0, 22.74], [31.0, 33.74], [35.0, 35.53], [49.0, 49.99], [54.0, 54.62], [61.0, 74.82], [79.0, 86.73], [92.0, 92.97], [95.0, 97.53], [98.0, 99.03], [100.0, 100.13], [101.0, 101.58], [102.0, 103.15], [104.0, 106.91], [120.0, 120.65], [122.0, 122.66], [124.0, 124.65], [135.0, 135.03], [135.0, 139.62], [144.0, 147.02], [148.0, 147.85], [149.0, 150.08], [151.0, 163.0], [165.0, 167.61], [173.0, 173.96], [175.0, 175.8], [176.0, 176.18], [178.0, 178.61], [181.0, 181.11]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [32.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.56, 0.0, 0.0, 0.0, 33.68, 44.78, 0.0, 35.68, 0.0, 0.0, 0.0, 0.0, 34.06, 0.0, 0.0, 0.0, 0.0, 51.99, 32.21, 0.0, 0.0, 32.27, 37.55, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 34.84], ["radio", 24.46], ["speech", 5.65]], null, null, null, null, null, null, null, null, null, null, [["speech", 53.59], ["music", 32.76], ["harmonica", 2.63]], [["hum", 13.57], ["fly, housefly", 13.26], ["speech", 11.93]], null, [["whale vocalization", 20.63], ["mains hum", 17.44], ["hum", 7.9]], null, null, null, null, [["speech", 61.67], ["music", 9.88], ["radio", 2.67]], null, null, null, null, null, [["music", 33.3], ["musical instrument", 13.82], ["brass instrument", 13.01]], null, null, [["music", 49.07], ["musical instrument", 11.1], ["saxophone", 10.63]], [["music", 50.13], ["clarinet", 26.55], ["wind instrument, woodwind instrument", 5.5]], null, null, null, null, null], "duration": [2.89, 0.68, 0.22, 1.36, 0.63, 0.25, 0.74, 2.74, 0.53, 0.99, 0.62, 13.82, 7.73, 0.97, 2.53, 1.03, 0.13, 0.58, 1.15, 2.91, 0.65, 0.66, 0.65, 0.03, 4.62, 3.02, -0.15, 1.08, 12.0, 2.61, 0.96, 0.8, 0.18, 0.61, 0.11]} \ No newline at end of file diff --git a/annotations_1/PQ3Qc8bOqlY_filtered.json b/annotations_1/PQ3Qc8bOqlY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3da89916cd3719857f507deabdc3cfb68ccdd188 --- /dev/null +++ b/annotations_1/PQ3Qc8bOqlY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 44.12], [44.0, 45.03], [46.0, 47.28], [50.0, 132.9], [134.0, 138.81], [140.0, 140.91], [142.0, 143.67], [147.0, 150.25], [153.0, 161.25], [161.0, 166.35], [168.0, 172.74], [174.0, 177.23]], "keep_status": [false, false, false, false, true, false, false, true, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.61, 0.0, 0.0, 38.51, 35.71, 37.66, 32.2, 34.38], "audiomae_on_audioset": [null, null, null, null, [["music", 46.27], ["speech", 10.11], ["hum", 9.11]], null, null, [["speech", 25.74], ["music", 11.79], ["mains hum", 11.43]], [["music", 23.51], ["hum", 23.16], ["throbbing", 11.38]], [["grunt", 30.13], ["music", 18.96], ["sound effect", 11.4]], [["music", 50.83], ["whale vocalization", 28.08], ["scrape", 1.85]], [["music", 25.9], ["whale vocalization", 22.95], ["grunt", 8.59]]], "duration": [0.12, 1.03, 1.28, 82.9, 4.81, 0.91, 1.67, 3.25, 8.25, 5.35, 4.74, 3.23]} \ No newline at end of file diff --git a/annotations_1/PQbyl1vsn1o_filtered.json b/annotations_1/PQbyl1vsn1o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54635f9c7e1aa3658982975a979f01e5926a8acd --- /dev/null +++ b/annotations_1/PQbyl1vsn1o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.99], [15.0, 21.32], [32.0, 31.92], [33.0, 34.05], [36.0, 36.59], [39.0, 40.32], [43.0, 43.23], [45.0, 46.26], [50.0, 49.98], [52.0, 54.73], [56.0, 56.42], [58.0, 59.48], [60.0, 61.45], [64.0, 69.09], [69.0, 73.75], [74.0, 79.25], [80.0, 87.0], [88.0, 89.23], [90.0, 92.4], [95.0, 97.88], [100.0, 101.16], [102.0, 107.13], [108.0, 109.44], [111.0, 111.25], [112.0, 114.44], [116.0, 116.26], [118.0, 117.9], [119.0, 120.93], [127.0, 127.43], [128.0, 129.17], [131.0, 132.27], [134.0, 135.82], [137.0, 139.28], [141.0, 143.45], [144.0, 145.44], [146.0, 148.17], [151.0, 152.93], [154.0, 156.34], [157.0, 159.58], [163.0, 164.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.28, 0.0, 0.0, 0.0, 73.51, 50.36, 99.26, 57.4, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 100.0, 0.0, 100.0, 99.44, 0.0], "audiomae_on_audioset": [null, [["speech", 54.25], ["vehicle", 15.2], ["car", 6.49]], null, null, null, null, null, null, null, [["speech", 49.13], ["hum", 14.89], ["mains hum", 7.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.99, 6.32, -0.08, 1.05, 0.59, 1.32, 0.23, 1.26, -0.02, 2.73, 0.42, 1.48, 1.45, 5.09, 4.75, 5.25, 7.0, 1.23, 2.4, 2.88, 1.16, 5.13, 1.44, 0.25, 2.44, 0.26, -0.1, 1.93, 0.43, 1.17, 1.27, 1.82, 2.28, 2.45, 1.44, 2.17, 1.93, 2.34, 2.58, 1.59]} \ No newline at end of file diff --git a/annotations_1/PRk69Z74hPs_filtered.json b/annotations_1/PRk69Z74hPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcbc067c1b5d466b354bf6f44bdd4b4a66429c44 --- /dev/null +++ b/annotations_1/PRk69Z74hPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.86]], "keep_status": [true], "silence_prob": [34.05], "audiomae_on_audioset": [[["music", 26.82], ["cacophony", 7.49], ["hum", 7.2]]], "duration": [2.86]} \ No newline at end of file diff --git a/annotations_1/PSW5cd8WVwM_filtered.json b/annotations_1/PSW5cd8WVwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ebd65f1acddc3f5609bd8bafca48cb94b1ca87d --- /dev/null +++ b/annotations_1/PSW5cd8WVwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 17.54], [19.0, 19.28], [20.0, 19.53], [20.0, 19.84], [20.0, 56.27], [59.0, 67.17], [69.0, 69.3], [70.0, 70.58], [71.0, 74.41], [76.0, 96.55], [98.0, 98.37], [102.0, 103.96], [110.0, 110.51], [111.0, 113.61], [114.0, 120.85], [129.0, 132.88], [134.0, 136.41]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [29.99, 0.0, 0.0, 0.0, 0.0, 32.78, 0.0, 0.0, 32.68, 29.71, 0.0, 0.0, 0.0, 29.92, 29.97, 31.73, 30.08], "audiomae_on_audioset": [[["music", 25.65], ["hum", 16.27], ["speech", 13.11]], null, null, null, null, [["hum", 37.52], ["music", 25.2], ["throbbing", 13.26]], null, null, [["hum", 62.14], ["mains hum", 19.06], ["throbbing", 5.93]], [["music", 37.52], ["throbbing", 21.1], ["hum", 17.5]], null, null, null, [["breaking", 66.87], ["music", 13.26], ["whack, thwack", 9.05]], [["music", 42.47], ["breaking", 20.8], ["hum", 9.09]], [["mains hum", 23.91], ["noise", 19.93], ["hum", 19.24]], [["music", 22.37], ["throbbing", 19.05], ["hum", 9.53]]], "duration": [12.54, 0.28, -0.47, -0.16, 36.27, 8.17, 0.3, 0.58, 3.41, 20.55, 0.37, 1.96, 0.51, 2.61, 6.85, 3.88, 2.41]} \ No newline at end of file diff --git a/annotations_1/PSWgZzUr_Yw_filtered.json b/annotations_1/PSWgZzUr_Yw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa0046f61865fdc3abbe4a5ca1442803e5bcd5e1 --- /dev/null +++ b/annotations_1/PSWgZzUr_Yw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.85], [7.0, 7.62], [8.0, 10.12], [11.0, 11.28], [13.0, 13.86], [16.0, 17.31], [18.0, 17.74], [18.0, 17.81], [18.0, 17.85], [18.0, 17.88], [26.0, 29.46], [33.0, 36.56], [38.0, 44.79], [45.0, 49.1], [57.0, 58.83], [64.0, 67.47], [68.0, 68.61], [69.0, 91.5], [95.0, 97.48], [102.0, 102.64], [111.0, 112.4], [118.0, 119.18], [119.0, 119.25], [129.0, 129.74], [140.0, 146.7], [152.0, 151.88], [152.0, 152.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.0, 40.4, 98.86, 33.41, 0.0, 33.26, 0.0, 35.68, 84.98, 0.0, 0.0, 0.0, 0.0, 0.0, 31.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 45.88], ["mosquito", 22.82], ["insect", 21.22]], null, [["noise", 24.64], ["music", 17.63], ["moo", 16.34]], null, [["music", 48.77], ["speech", 5.78], ["whale vocalization", 5.26]], null, [["music", 37.37], ["whale vocalization", 6.5], ["animal", 6.32]], null, null, null, null, null, null, [["speech", 27.47], ["hum", 13.03], ["music", 7.5]], null, null], "duration": [0.85, 0.62, 2.12, 0.28, 0.86, 1.31, -0.26, -0.19, -0.15, -0.12, 3.46, 3.56, 6.79, 4.1, 1.83, 3.47, 0.61, 22.5, 2.48, 0.64, 1.4, 1.18, 0.25, 0.74, 6.7, -0.12, 0.31]} \ No newline at end of file diff --git a/annotations_1/PTQLBv8sgDI_filtered.json b/annotations_1/PTQLBv8sgDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..796829317189a48cb51acd942baef63696192d8a --- /dev/null +++ b/annotations_1/PTQLBv8sgDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.16], [10.0, 10.37], [11.0, 15.11], [16.0, 15.87], [16.0, 16.77], [21.0, 21.63], [22.0, 28.88], [30.0, 37.08], [39.0, 39.82], [40.0, 41.5], [43.0, 43.16], [45.0, 59.98], [60.0, 60.69], [62.0, 62.43], [65.0, 67.9], [68.0, 70.29], [72.0, 73.92], [75.0, 76.0], [77.0, 77.41], [80.0, 81.08], [82.0, 83.73], [84.0, 91.03], [92.0, 93.39], [94.0, 102.71], [104.0, 106.69], [108.0, 114.81], [115.0, 117.71], [119.0, 120.02], [123.0, 123.47], [124.0, 125.42], [127.0, 126.84], [130.0, 130.33], [131.0, 132.06], [134.0, 138.01], [139.0, 139.87], [140.0, 142.53], [144.0, 147.29], [148.0, 162.19], [164.0, 169.7], [171.0, 177.25], [180.0, 180.77], [181.0, 182.26], [183.0, 184.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.42, 0.0, 78.55, 0.0, 0.0, 0.0, 55.04, 73.51, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 99.98, 62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 83.16, 78.89, 85.54, 44.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 0.0, 71.72, 100.0, 97.92, 88.64, 99.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 78.79], ["sidetone", 6.38], ["dial tone", 5.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.16, 0.37, 4.11, -0.13, 0.77, 0.63, 6.88, 7.08, 0.82, 1.5, 0.16, 14.98, 0.69, 0.43, 2.9, 2.29, 1.92, 1.0, 0.41, 1.08, 1.73, 7.03, 1.39, 8.71, 2.69, 6.81, 2.71, 1.02, 0.47, 1.42, -0.16, 0.33, 1.06, 4.01, 0.87, 2.53, 3.29, 14.19, 5.7, 6.25, 0.77, 1.26, 1.47]} \ No newline at end of file diff --git a/annotations_1/PUFwiKDWxUo_filtered.json b/annotations_1/PUFwiKDWxUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d8cd0be6c060c79bf42e9654b69f9cedbd6b209 --- /dev/null +++ b/annotations_1/PUFwiKDWxUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 25.51], [26.0, 35.87], [37.0, 42.63], [45.0, 46.58], [64.0, 68.08], [73.0, 83.69], [92.0, 95.62], [106.0, 106.78]], "keep_status": [false, false, false, false, true, true, true, false], "silence_prob": [29.41, 28.99, 30.77, 0.0, 28.41, 28.97, 31.47, 0.0], "audiomae_on_audioset": [[["music", 49.43], ["speech", 14.3], ["didgeridoo", 11.93]], [["speech", 40.9], ["music", 38.24], ["musical instrument", 3.37]], [["music", 41.08], ["speech", 28.86], ["synthesizer", 3.79]], null, [["music", 20.93], ["speech", 8.23], ["livestock, farm animals, working animals", 7.79]], [["speech", 39.56], ["music", 15.16], ["livestock, farm animals, working animals", 11.42]], [["speech", 24.63], ["hum", 13.22], ["throbbing", 9.43]], null], "duration": [12.51, 9.87, 5.63, 1.58, 4.08, 10.69, 3.62, 0.78]} \ No newline at end of file diff --git a/annotations_1/PVEIr4MGaT8_filtered.json b/annotations_1/PVEIr4MGaT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cd3e33f97e9b20ffb9ca588f3f6a374c121dcdd --- /dev/null +++ b/annotations_1/PVEIr4MGaT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.24], [9.0, 26.35], [28.0, 60.94], [61.0, 61.33], [61.0, 114.49], [116.0, 124.06], [125.0, 127.6], [129.0, 131.87], [133.0, 134.76], [136.0, 140.59], [142.0, 142.89]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [49.31, 37.49, 0.0, 0.0, 0.0, 92.8, 79.59, 99.65, 0.0, 88.28, 0.0], "audiomae_on_audioset": [[["music", 28.71], ["foghorn", 14.41], ["mains hum", 10.84]], [["mains hum", 22.52], ["hum", 19.47], ["music", 17.78]], null, null, null, null, null, null, null, null, null], "duration": [3.24, 17.35, 32.94, 0.33, 53.49, 8.06, 2.6, 2.87, 1.76, 4.59, 0.89]} \ No newline at end of file diff --git a/annotations_1/PW20LbwAmng_filtered.json b/annotations_1/PW20LbwAmng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d9b58573b6ff905f1dc880dc7f45ea610019de1 --- /dev/null +++ b/annotations_1/PW20LbwAmng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [4.0, 5.54], [8.0, 10.12], [11.0, 13.66], [14.0, 14.66], [15.0, 16.48], [18.0, 19.11], [21.0, 25.78], [26.0, 35.92], [37.0, 40.32], [43.0, 57.45], [61.0, 64.45], [65.0, 71.32], [82.0, 86.04], [88.0, 89.41], [91.0, 92.25], [99.0, 100.87], [103.0, 103.06], [104.0, 105.04], [109.0, 110.03], [111.0, 112.77], [115.0, 116.51], [118.0, 118.67], [120.0, 123.09], [123.0, 126.06], [127.0, 128.75], [131.0, 142.21], [146.0, 145.94], [146.0, 149.99], [153.0, 153.69], [154.0, 155.82], [157.0, 158.46], [162.0, 172.96], [173.0, 173.03], [174.0, 179.15], [181.0, 183.41], [185.0, 185.41], [189.0, 189.63], [190.0, 195.94], [197.0, 197.83], [198.0, 200.92], [210.0, 211.38]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 87.0, 99.44, 0.0, 0.0, 0.0, 60.98, 33.6, 44.04, 34.37, 43.45, 95.91, 56.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 68.8, 0.0, 88.1, 0.0, 44.46, 0.0, 0.0, 0.0, 38.28, 0.0, 39.09, 48.19, 0.0, 0.0, 35.87, 0.0, 32.03, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 22.2], ["music", 21.88], ["mains hum", 11.24]], [["hum", 16.21], ["speech", 11.84], ["mains hum", 7.94]], [["hum", 53.77], ["throbbing", 22.32], ["mains hum", 10.16]], [["hum", 37.73], ["music", 21.39], ["mains hum", 9.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.17], ["hum", 19.41], ["mains hum", 9.92]], null, null, null, [["speech", 44.07], ["sidetone", 35.93], ["hum", 7.52]], null, [["speech", 43.49], ["throbbing", 20.27], ["sidetone", 9.54]], [["speech", 26.68], ["hum", 15.54], ["stomach rumble", 10.88]], null, null, [["sidetone", 78.39], ["speech", 13.73], ["whale vocalization", 2.36]], null, [["speech", 61.54], ["sidetone", 9.97], ["music", 9.2]], null], "duration": [1.08, 1.54, 2.12, 2.66, 0.66, 1.48, 1.11, 4.78, 9.92, 3.32, 14.45, 3.45, 6.32, 4.04, 1.41, 1.25, 1.87, 0.06, 1.04, 1.03, 1.77, 1.51, 0.67, 3.09, 3.06, 1.75, 11.21, -0.06, 3.99, 0.69, 1.82, 1.46, 10.96, 0.03, 5.15, 2.41, 0.41, 0.63, 5.94, 0.83, 2.92, 1.38]} \ No newline at end of file diff --git a/annotations_1/PW3WxPo74c8_filtered.json b/annotations_1/PW3WxPo74c8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0879945ccf4f28de5b2e3173bd44a688f13ff194 --- /dev/null +++ b/annotations_1/PW3WxPo74c8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 79.32], [80.0, 98.17], [99.0, 120.66], [123.0, 123.45], [123.0, 136.54]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 38.59, 90.43, 0.0, 91.98], "audiomae_on_audioset": [null, [["speech", 89.08], ["fart", 1.59], ["beatboxing", 1.5]], null, null, null], "duration": [51.32, 18.17, 21.66, 0.45, 13.54]} \ No newline at end of file diff --git a/annotations_1/PWz21cujw28_filtered.json b/annotations_1/PWz21cujw28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5e29a60c77a7ff0851c86d43bd2023ede762710 --- /dev/null +++ b/annotations_1/PWz21cujw28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.25], [20.0, 21.56], [29.0, 29.15], [42.0, 41.82], [45.0, 46.14], [50.0, 53.28], [62.0, 62.77], [64.0, 64.66], [66.0, 67.85], [70.0, 70.34], [71.0, 79.62], [84.0, 88.45], [89.0, 94.26], [95.0, 95.86], [99.0, 100.74], [107.0, 108.85], [110.0, 111.15], [112.0, 113.61], [119.0, 119.92]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.42, 0.0, 0.0, 0.0, 0.0, 62.27, 89.36, 65.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 20.37], ["burping, eructation", 10.46], ["fart", 8.52]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.25, 1.56, 0.15, -0.18, 1.14, 3.28, 0.77, 0.66, 1.85, 0.34, 8.62, 4.45, 5.26, 0.86, 1.74, 1.85, 1.15, 1.61, 0.92]} \ No newline at end of file diff --git a/annotations_1/PX3By_Y0jTA_filtered.json b/annotations_1/PX3By_Y0jTA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba554c3b7d4f129bedbf87a3f6183f4410a89679 --- /dev/null +++ b/annotations_1/PX3By_Y0jTA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.63], [11.0, 11.74], [14.0, 14.77], [16.0, 26.05], [33.0, 48.24], [50.0, 51.16], [52.0, 51.97], [53.0, 63.81], [66.0, 67.0], [70.0, 92.74], [101.0, 116.6]], "keep_status": [false, false, false, false, true, false, false, false, false, true, true], "silence_prob": [29.52, 0.0, 0.0, 29.0, 31.22, 0.0, 0.0, 30.19, 0.0, 29.35, 29.46], "audiomae_on_audioset": [[["music", 61.14], ["scary music", 6.95], ["electronic music", 4.14]], null, null, [["music", 65.45], ["theremin", 6.03], ["musical instrument", 4.11]], [["noise", 19.64], ["hum", 18.46], ["mains hum", 17.6]], null, null, [["music", 60.87], ["speech", 13.74], ["hum", 7.82]], null, [["music", 28.96], ["buzz", 13.27], ["explosion", 5.06]], [["music", 21.61], ["hum", 14.66], ["mains hum", 10.99]]], "duration": [4.63, 0.74, 0.77, 10.05, 15.24, 1.16, -0.03, 10.81, 1.0, 22.74, 15.6]} \ No newline at end of file diff --git a/annotations_1/PX5QjCErMgU_filtered.json b/annotations_1/PX5QjCErMgU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..578fde6bc0e59c3bcb741fc07e34be126d022282 --- /dev/null +++ b/annotations_1/PX5QjCErMgU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 45.77], [58.0, 59.95], [62.0, 63.73], [66.0, 66.36], [82.0, 83.35], [91.0, 92.82], [93.0, 94.27], [106.0, 109.19], [111.0, 112.31]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [47.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.91, 0.0], "audiomae_on_audioset": [[["speech", 86.7], ["radio", 2.88], ["speech synthesizer", 1.39]], null, null, null, null, null, null, [["speech", 45.69], ["boing", 8.0], ["stomach rumble", 5.84]], null], "duration": [2.77, 1.95, 1.73, 0.36, 1.35, 1.82, 1.27, 3.19, 1.31]} \ No newline at end of file diff --git a/annotations_1/PXMASW5YQl8_filtered.json b/annotations_1/PXMASW5YQl8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9759a2c3655132b3bfa96c8ff451cfb4e18126a9 --- /dev/null +++ b/annotations_1/PXMASW5YQl8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 25.73], [27.0, 33.96]], "keep_status": [false, false], "silence_prob": [98.59, 88.64], "audiomae_on_audioset": [null, null], "duration": [3.73, 6.96]} \ No newline at end of file diff --git a/annotations_1/PXSMKQqZjaE_filtered.json b/annotations_1/PXSMKQqZjaE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33e60307d182b64733467a0b9951cafe4e1e60b3 --- /dev/null +++ b/annotations_1/PXSMKQqZjaE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 32.02], [32.0, 32.83], [34.0, 47.55], [48.0, 49.42], [53.0, 53.77], [57.0, 74.07], [78.0, 91.54], [92.0, 97.8], [111.0, 111.69], [113.0, 118.0], [121.0, 130.25]], "keep_status": [false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [36.16, 0.0, 32.44, 0.0, 0.0, 31.83, 32.52, 30.79, 0.0, 38.82, 30.77], "audiomae_on_audioset": [[["music", 54.17], ["throbbing", 15.5], ["hum", 7.71]], null, [["music", 75.36], ["buzz", 3.53], ["hum", 2.96]], null, null, [["music", 57.84], ["speech", 12.18], ["didgeridoo", 4.24]], [["music", 71.44], ["synthesizer", 3.75], ["theremin", 3.33]], [["speech", 23.68], ["music", 21.0], ["explosion", 10.96]], null, [["music", 49.83], ["synthesizer", 9.77], ["hum", 5.84]], [["animal", 34.56], ["music", 20.4], ["speech", 9.74]]], "duration": [2.02, 0.83, 13.55, 1.42, 0.77, 17.07, 13.54, 5.8, 0.69, 5.0, 9.25]} \ No newline at end of file diff --git a/annotations_1/PXaE-weoKCo_filtered.json b/annotations_1/PXaE-weoKCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afeefa577acdeabf9ab7aa1c3755086065b0fc70 --- /dev/null +++ b/annotations_1/PXaE-weoKCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.0], [2.0, 3.0], [3.0, 3.87], [5.0, 6.07], [8.0, 10.54], [13.0, 14.4], [15.0, 28.19], [29.0, 30.18], [33.0, 33.17], [34.0, 34.42], [35.0, 35.6], [36.0, 36.53], [37.0, 38.97], [40.0, 40.27], [41.0, 41.98], [46.0, 46.18], [48.0, 49.15], [59.0, 59.91], [60.0, 64.35], [66.0, 67.46], [70.0, 70.58], [75.0, 76.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.78, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.42], ["boing", 15.07], ["speech", 2.14]], null, null, null], "duration": [0.0, 1.0, 0.87, 1.07, 2.54, 1.4, 13.19, 1.18, 0.17, 0.42, 0.6, 0.53, 1.97, 0.27, 0.98, 0.18, 1.15, 0.91, 4.35, 1.46, 0.58, 1.49]} \ No newline at end of file diff --git a/annotations_1/PYkBs86HnUc_filtered.json b/annotations_1/PYkBs86HnUc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f965d495c95f96742bb5b8d3b212176fcb35c05 --- /dev/null +++ b/annotations_1/PYkBs86HnUc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.11], [8.0, 13.12], [14.0, 14.57], [20.0, 25.51], [28.0, 31.72], [32.0, 67.76], [69.0, 83.78], [85.0, 88.33], [90.0, 93.39], [94.0, 103.47], [108.0, 108.33], [109.0, 117.14], [134.0, 135.94], [137.0, 138.33], [139.0, 141.54]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 46.33, 0.0, 41.09, 35.12, 0.0, 32.12, 45.24, 39.09, 30.85, 0.0, 30.87, 0.0, 0.0, 39.21], "audiomae_on_audioset": [null, [["music", 58.85], ["throbbing", 10.22], ["hum", 4.53]], null, [["music", 61.97], ["throbbing", 10.65], ["croak", 3.66]], [["music", 50.63], ["speech", 15.13], ["sonar", 7.81]], null, [["music", 40.91], ["cattle, bovinae", 25.16], ["moo", 17.84]], [["throbbing", 29.32], ["music", 26.61], ["hum", 14.11]], [["didgeridoo", 30.46], ["music", 23.48], ["hum", 8.61]], [["music", 57.73], ["throbbing", 19.47], ["hum", 7.25]], null, [["music", 54.88], ["speech", 6.63], ["electronic music", 5.35]], null, null, [["bee, wasp, etc.", 45.36], ["speech", 19.33], ["fly, housefly", 6.09]]], "duration": [0.11, 5.12, 0.57, 5.51, 3.72, 35.76, 14.78, 3.33, 3.39, 9.47, 0.33, 8.14, 1.94, 1.33, 2.54]} \ No newline at end of file diff --git a/annotations_1/PZBy1m-MmlQ_filtered.json b/annotations_1/PZBy1m-MmlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff589b74f23e40859dcf62f99ddc90159a27bf9a --- /dev/null +++ b/annotations_1/PZBy1m-MmlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 30.84], [32.0, 34.11], [35.0, 37.22], [38.0, 40.05], [43.0, 82.75]], "keep_status": [false, false, true, true, false], "silence_prob": [29.36, 28.71, 29.86, 29.25, 0.0], "audiomae_on_audioset": [[["speech", 41.48], ["music", 27.38], ["hum", 4.02]], [["livestock, farm animals, working animals", 33.52], ["cattle, bovinae", 26.87], ["cowbell", 10.07]], [["music", 30.32], ["speech", 10.42], ["breaking", 5.91]], [["fly, housefly", 26.3], ["insect", 12.53], ["mosquito", 7.86]], null], "duration": [25.84, 2.11, 2.22, 2.05, 39.75]} \ No newline at end of file diff --git a/annotations_1/PZeVTlloWxw_filtered.json b/annotations_1/PZeVTlloWxw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31c02851e69b83f3fef6e2f501c6f013b27e0255 --- /dev/null +++ b/annotations_1/PZeVTlloWxw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.4], [8.0, 8.43], [11.0, 12.19], [16.0, 22.57], [23.0, 25.81], [27.0, 27.45], [28.0, 29.25], [31.0, 31.95], [33.0, 34.08], [37.0, 38.35], [39.0, 40.1], [42.0, 42.11], [45.0, 44.96], [48.0, 48.76], [49.0, 49.6], [52.0, 53.52], [55.0, 55.98], [57.0, 61.89], [63.0, 63.19], [66.0, 66.48], [71.0, 77.11], [78.0, 80.69], [82.0, 83.93], [85.0, 86.61], [87.0, 90.42], [92.0, 92.75], [97.0, 97.97], [105.0, 106.32], [111.0, 111.87], [113.0, 115.7], [117.0, 118.5], [122.0, 123.36], [124.0, 124.87], [125.0, 125.93], [127.0, 127.9], [128.0, 131.31], [133.0, 136.44], [138.0, 150.94], [153.0, 159.7], [162.0, 163.76], [164.0, 166.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 74.29, 99.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.06, 0.0, 0.0, 100.0, 93.6, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 96.42, 63.64, 100.0, 0.0, 98.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.4, 0.43, 1.19, 6.57, 2.81, 0.45, 1.25, 0.95, 1.08, 1.35, 1.1, 0.11, -0.04, 0.76, 0.6, 1.52, 0.98, 4.89, 0.19, 0.48, 6.11, 2.69, 1.93, 1.61, 3.42, 0.75, 0.97, 1.32, 0.87, 2.7, 1.5, 1.36, 0.87, 0.93, 0.9, 3.31, 3.44, 12.94, 6.7, 1.76, 2.31]} \ No newline at end of file diff --git a/annotations_1/P_Iz-WhpmXY_filtered.json b/annotations_1/P_Iz-WhpmXY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4701e2465b8e11e319a4dc4a0c614f41f2a4c7c2 --- /dev/null +++ b/annotations_1/P_Iz-WhpmXY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.42], [12.0, 13.64], [15.0, 15.25], [15.0, 19.38], [25.0, 25.66], [26.0, 30.1], [35.0, 37.02], [41.0, 41.23], [49.0, 49.5], [53.0, 53.22], [56.0, 56.37], [59.0, 59.29], [60.0, 61.28], [65.0, 65.94], [66.0, 67.91], [70.0, 71.37], [73.0, 73.62], [75.0, 76.22], [77.0, 78.11], [80.0, 82.17], [83.0, 83.88], [85.0, 86.53], [89.0, 89.77], [92.0, 93.36], [94.0, 95.1], [99.0, 100.74], [102.0, 106.02], [117.0, 119.96], [122.0, 124.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [83.88, 0.0, 0.0, 62.58, 0.0, 84.8, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 95.23, 98.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.42, 1.64, 0.25, 4.38, 0.66, 4.1, 2.02, 0.23, 0.5, 0.22, 0.37, 0.29, 1.28, 0.94, 1.91, 1.37, 0.62, 1.22, 1.11, 2.17, 0.88, 1.53, 0.77, 1.36, 1.1, 1.74, 4.02, 2.96, 2.29]} \ No newline at end of file diff --git a/annotations_1/PahRJMVNho0_filtered.json b/annotations_1/PahRJMVNho0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a58bbf6719d6a1f3e56d3ca1631bd3a2245055ae --- /dev/null +++ b/annotations_1/PahRJMVNho0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.86], [7.0, 7.43], [10.0, 10.54], [19.0, 20.56], [25.0, 25.52], [31.0, 31.24], [39.0, 40.34], [42.0, 42.92], [44.0, 44.63], [45.0, 45.25], [47.0, 48.15], [50.0, 53.3], [54.0, 55.22], [58.0, 57.79], [60.0, 60.24], [66.0, 68.61], [88.0, 90.49], [91.0, 91.69], [95.0, 95.86], [99.0, 100.03], [102.0, 102.57], [104.0, 105.51], [106.0, 109.17], [109.0, 110.46], [112.0, 113.29], [115.0, 117.69], [127.0, 131.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.31, 0.0, 0.0, 0.0, 31.95, 41.14, 0.0, 0.0, 0.0, 0.0, 0.0, 33.19, 0.0, 0.0, 43.87, 32.41], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.58], ["carnatic music", 4.03], ["singing", 2.53]], [["music", 83.23], ["musical instrument", 1.29], ["didgeridoo", 0.91]], null, null, null, null, null, [["music", 55.12], ["shofar", 11.85], ["wind instrument, woodwind instrument", 6.83]], null, null, [["music", 60.53], ["quack", 22.43], ["duck", 2.99]], [["music", 65.07], ["mosquito", 4.02], ["musical instrument", 2.54]]], "duration": [0.86, 0.43, 0.54, 1.56, 0.52, 0.24, 1.34, 0.92, 0.63, 0.25, 1.15, 3.3, 1.22, -0.21, 0.24, 2.61, 2.49, 0.69, 0.86, 1.03, 0.57, 1.51, 3.17, 1.46, 1.29, 2.69, 4.57]} \ No newline at end of file diff --git a/annotations_1/PaqNqocHJ-o_filtered.json b/annotations_1/PaqNqocHJ-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05530c81893415e604e5974965c1d44debab8477 --- /dev/null +++ b/annotations_1/PaqNqocHJ-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[88.0, 90.64], [95.0, 119.03], [121.0, 130.06], [143.0, 143.07], [144.0, 146.94], [148.0, 152.52], [153.0, 157.67], [159.0, 158.9], [161.0, 168.99], [172.0, 181.4], [184.0, 185.31], [189.0, 189.84], [191.0, 193.04]], "keep_status": [true, true, true, false, false, true, false, false, false, false, false, false, true], "silence_prob": [31.88, 31.79, 31.11, 0.0, 44.26, 38.74, 33.19, 0.0, 29.94, 42.91, 0.0, 0.0, 49.45], "audiomae_on_audioset": [[["speech", 34.32], ["music", 17.82], ["mains hum", 8.36]], [["music", 22.64], ["hum", 13.31], ["throbbing", 12.6]], [["speech", 41.08], ["music", 17.94], ["throbbing", 4.52]], null, [["hum", 44.3], ["mains hum", 24.58], ["throbbing", 15.39]], [["music", 37.88], ["hum", 20.03], ["mains hum", 8.1]], [["mains hum", 53.18], ["hum", 26.94], ["music", 7.04]], null, [["cacophony", 27.94], ["music", 26.98], ["speech", 15.18]], [["throbbing", 57.94], ["hum", 22.5], ["music", 6.54]], null, null, [["speech", 24.39], ["clip-clop", 16.55], ["horse", 11.02]]], "duration": [2.64, 24.03, 9.06, 0.07, 2.94, 4.52, 4.67, -0.1, 7.99, 9.4, 1.31, 0.84, 2.04]} \ No newline at end of file diff --git a/annotations_1/PbC7alhpFBE_filtered.json b/annotations_1/PbC7alhpFBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8223000af86c894f8c0c2ea54e9d270a8bdf84d1 --- /dev/null +++ b/annotations_1/PbC7alhpFBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.19], [27.0, 27.33], [27.0, 27.45], [27.0, 33.44], [37.0, 37.52], [39.0, 41.15], [42.0, 44.19], [47.0, 48.49], [50.0, 51.9], [53.0, 54.55], [57.0, 65.53], [66.0, 67.76], [71.0, 76.0], [96.0, 98.56], [105.0, 107.33], [111.0, 113.17], [116.0, 117.83], [120.0, 120.92], [122.0, 124.36], [125.0, 127.08], [131.0, 132.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 92.64, 0.0, 87.92, 98.73, 0.0, 0.0, 0.0, 95.23, 0.0, 96.04, 77.36, 87.92, 99.56, 0.0, 0.0, 60.6, 97.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 0.33, 0.45, 6.44, 0.52, 2.15, 2.19, 1.49, 1.9, 1.55, 8.53, 1.76, 5.0, 2.56, 2.33, 2.17, 1.83, 0.92, 2.36, 2.08, 1.39]} \ No newline at end of file diff --git a/annotations_1/PdgSo4Ts7D4_filtered.json b/annotations_1/PdgSo4Ts7D4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..864e7f31f3f7f002a7eb0459361c679083aa39f4 --- /dev/null +++ b/annotations_1/PdgSo4Ts7D4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 34.94], [37.0, 145.27]], "keep_status": [false, false], "silence_prob": [29.97, 0.0], "audiomae_on_audioset": [[["fly, housefly", 38.48], ["insect", 34.62], ["mosquito", 6.38]], null], "duration": [13.94, 108.27]} \ No newline at end of file diff --git a/annotations_1/PdmlJSk6QAk_filtered.json b/annotations_1/PdmlJSk6QAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5ae8d3f592fc3c27f101a903d59889b9baab21f --- /dev/null +++ b/annotations_1/PdmlJSk6QAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 69.13], [70.0, 71.47], [73.0, 87.93], [89.0, 97.68], [98.0, 103.79], [106.0, 108.45], [110.0, 117.15], [118.0, 132.88], [134.0, 138.21], [139.0, 162.51]], "keep_status": [true, false, true, true, false, false, false, false, false, true], "silence_prob": [34.94, 0.0, 31.07, 37.08, 34.51, 35.14, 38.4, 37.49, 41.81, 31.71], "audiomae_on_audioset": [[["hum", 25.42], ["music", 16.81], ["throbbing", 11.93]], null, [["gunshot, gunfire", 32.99], ["machine gun", 16.03], ["speech", 10.86]], [["hum", 23.25], ["single-lens reflex camera", 20.54], ["throbbing", 10.45]], [["speech", 36.23], ["rumble", 28.21], ["hum", 9.87]], [["speech", 75.48], ["hum", 5.0], ["rumble", 2.96]], [["music", 56.55], ["throbbing", 8.18], ["hum", 7.7]], [["hum", 35.89], ["throbbing", 20.28], ["speech", 14.8]], [["music", 61.63], ["hum", 11.56], ["throbbing", 8.66]], [["music", 27.28], ["throbbing", 22.62], ["hum", 16.73]]], "duration": [16.13, 1.47, 14.93, 8.68, 5.79, 2.45, 7.15, 14.88, 4.21, 23.51]} \ No newline at end of file diff --git a/annotations_1/PdzjDn5zVXo_filtered.json b/annotations_1/PdzjDn5zVXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fcd3ae9a83260b02920ddb0fa8f37cd9401c24da --- /dev/null +++ b/annotations_1/PdzjDn5zVXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.09], [9.0, 10.0], [15.0, 30.92], [34.0, 34.65], [35.0, 50.09], [53.0, 55.26], [56.0, 62.97], [67.0, 67.44], [72.0, 96.26], [104.0, 118.17], [121.0, 135.99], [138.0, 138.52], [148.0, 154.79], [157.0, 157.52], [168.0, 173.08], [173.0, 173.23], [173.0, 173.3], [173.0, 173.45]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 37.04, 0.0, 30.56, 33.51, 33.2, 0.0, 48.52, 32.11, 31.1, 0.0, 30.35, 0.0, 30.93, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 69.1], ["sonar", 6.94], ["foghorn", 3.52]], null, [["music", 79.01], ["brass instrument", 2.26], ["musical instrument", 1.89]], [["music", 40.97], ["hum", 7.71], ["mains hum", 6.63]], [["music", 49.37], ["theremin", 31.12], ["musical instrument", 4.95]], null, [["music", 72.56], ["theremin", 10.13], ["ambient music", 3.62]], [["music", 54.45], ["speech", 11.29], ["sidetone", 3.79]], [["vehicle", 29.81], ["skidding", 18.33], ["speech", 16.54]], null, [["music", 44.27], ["speech", 15.91], ["hum", 4.62]], null, [["music", 28.13], ["cattle, bovinae", 15.94], ["moo", 14.12]], null, null, null], "duration": [1.09, 1.0, 15.92, 0.65, 15.09, 2.26, 6.97, 0.44, 24.26, 14.17, 14.99, 0.52, 6.79, 0.52, 5.08, 0.23, 0.3, 0.45]} \ No newline at end of file diff --git a/annotations_1/Pe5eL8LQdY0_filtered.json b/annotations_1/Pe5eL8LQdY0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f764506ff39f8b8f62535448d00623b5cdce4da2 --- /dev/null +++ b/annotations_1/Pe5eL8LQdY0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [6.0, 6.61], [8.0, 8.23], [9.0, 9.09], [10.0, 10.49], [12.0, 13.76], [14.0, 17.25], [20.0, 26.54], [32.0, 32.44], [36.0, 36.04], [38.0, 38.8], [39.0, 46.45], [48.0, 48.63], [50.0, 49.98], [51.0, 51.39], [59.0, 67.59], [69.0, 69.82], [73.0, 73.63], [74.0, 74.97], [77.0, 76.86], [81.0, 87.45], [91.0, 120.66]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.76, 37.55, 0.0, 0.0, 0.0, 30.56, 0.0, 0.0, 0.0, 35.85, 0.0, 0.0, 0.0, 0.0, 28.39, 28.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 32.95], ["hum", 11.69], ["mains hum", 10.99]], null, null, null, [["music", 30.72], ["whale vocalization", 29.91], ["speech", 7.18]], null, null, null, [["music", 50.74], ["theremin", 36.85], ["musical instrument", 2.05]], null, null, null, null, [["music", 26.54], ["fly, housefly", 21.98], ["mosquito", 10.7]], [["speech", 44.29], ["boat, water vehicle", 13.32], ["vehicle", 9.53]]], "duration": [0.75, 0.61, 0.23, 0.09, 0.49, 1.76, 3.25, 6.54, 0.44, 0.04, 0.8, 7.45, 0.63, -0.02, 0.39, 8.59, 0.82, 0.63, 0.97, -0.14, 6.45, 29.66]} \ No newline at end of file diff --git a/annotations_1/Pf2LbcDDW5E_filtered.json b/annotations_1/Pf2LbcDDW5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/Pf2LbcDDW5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/PhLfIqO2SLI_filtered.json b/annotations_1/PhLfIqO2SLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58b722d0d9e38de86a4e4e06f7052ade510e3de5 --- /dev/null +++ b/annotations_1/PhLfIqO2SLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.08], [9.0, 11.23], [15.0, 18.01], [21.0, 21.91], [22.0, 22.99], [24.0, 24.65], [38.0, 38.99], [40.0, 44.41], [44.0, 44.44], [45.0, 52.86], [56.0, 68.22], [69.0, 69.18], [70.0, 100.3], [101.0, 102.36], [105.0, 106.35], [108.0, 108.01], [109.0, 131.58], [133.0, 134.06], [136.0, 137.17], [140.0, 144.54], [145.0, 147.93], [151.0, 153.4], [156.0, 157.54], [158.0, 159.07], [166.0, 172.39], [174.0, 174.48]], "keep_status": [true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [29.91, 30.07, 29.74, 0.0, 0.0, 0.0, 0.0, 30.55, 0.0, 38.27, 34.23, 0.0, 0.0, 0.0, 0.0, 0.0, 30.02, 0.0, 0.0, 64.18, 77.2, 85.9, 0.0, 0.0, 30.12, 0.0], "audiomae_on_audioset": [[["speech", 38.7], ["music", 7.5], ["cattle, bovinae", 4.7]], [["music", 25.34], ["mains hum", 24.36], ["hum", 18.63]], [["music", 65.52], ["synthesizer", 6.49], ["musical instrument", 5.61]], null, null, null, null, [["music", 19.93], ["groan", 17.57], ["didgeridoo", 9.15]], null, [["music", 64.94], ["hum", 6.28], ["speech", 5.83]], [["music", 46.31], ["hum", 20.42], ["mains hum", 12.92]], null, null, null, null, null, [["music", 41.03], ["hum", 16.91], ["buzz", 7.76]], null, null, null, null, null, null, null, [["music", 56.65], ["throbbing", 18.36], ["hum", 3.48]], null], "duration": [4.08, 2.23, 3.01, 0.91, 0.99, 0.65, 0.99, 4.41, 0.44, 7.86, 12.22, 0.18, 30.3, 1.36, 1.35, 0.01, 22.58, 1.06, 1.17, 4.54, 2.93, 2.4, 1.54, 1.07, 6.39, 0.48]} \ No newline at end of file diff --git a/annotations_1/PhRyzmcEOVA_filtered.json b/annotations_1/PhRyzmcEOVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5070cf146bb6a6f9020537906f52ebb81b01e32f --- /dev/null +++ b/annotations_1/PhRyzmcEOVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.28], [20.0, 20.43], [20.0, 20.48], [20.0, 52.57], [53.0, 54.87], [59.0, 73.01], [74.0, 74.07], [74.0, 74.51], [78.0, 82.63], [83.0, 82.88], [83.0, 84.38], [88.0, 91.89], [93.0, 93.12], [94.0, 94.2], [95.0, 99.42], [99.0, 99.55], [100.0, 106.19], [107.0, 109.14], [110.0, 115.13], [119.0, 119.91], [120.0, 122.13], [122.0, 123.85], [127.0, 127.01], [128.0, 141.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 42.35, 0.0, 0.0, 36.11, 0.0, 0.0, 57.4, 0.0, 0.0, 44.34, 0.0, 35.67, 40.06, 38.82, 0.0, 47.12, 0.0, 0.0, 37.21], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 63.69], ["music", 7.17], ["sidetone", 6.63]], null, null, [["speech", 50.34], ["boing", 15.7], ["cattle, bovinae", 4.76]], null, null, null, null, null, [["speech", 68.63], ["music", 11.3], ["electric shaver, electric razor", 5.6]], null, [["speech", 45.32], ["boing", 27.78], ["laughter", 2.86]], [["speech", 47.99], ["whale vocalization", 17.31], ["music", 6.8]], [["grunt", 25.2], ["speech", 19.57], ["burping, eructation", 6.58]], null, [["moo", 33.91], ["cattle, bovinae", 20.74], ["livestock, farm animals, working animals", 17.25]], null, null, [["music", 41.32], ["speech", 24.24], ["didgeridoo", 11.65]]], "duration": [0.28, 0.43, 0.48, 32.57, 1.87, 14.01, 0.07, 0.51, 4.63, -0.12, 1.38, 3.89, 0.12, 0.2, 4.42, 0.55, 6.19, 2.14, 5.13, 0.91, 2.13, 1.85, 0.01, 13.07]} \ No newline at end of file diff --git a/annotations_1/PhkGK4ga-Gs_filtered.json b/annotations_1/PhkGK4ga-Gs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..142f878148c61e019180fe3610d63669c5cf74e0 --- /dev/null +++ b/annotations_1/PhkGK4ga-Gs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.42], [10.0, 10.76], [12.0, 12.36], [16.0, 15.9], [18.0, 18.82], [19.0, 19.72], [31.0, 31.29], [32.0, 32.64], [36.0, 36.93], [40.0, 40.39], [41.0, 41.94], [48.0, 48.17], [51.0, 53.89], [55.0, 55.98], [56.0, 57.57], [59.0, 68.84], [74.0, 74.63], [82.0, 81.89], [83.0, 83.44], [85.0, 90.0], [92.0, 92.82], [94.0, 94.14], [107.0, 106.79], [108.0, 108.28], [110.0, 111.37], [112.0, 119.1], [120.0, 120.65], [122.0, 122.42], [125.0, 124.78], [127.0, 130.59], [132.0, 132.51], [134.0, 138.11], [139.0, 140.21], [141.0, 141.15], [143.0, 143.88], [145.0, 145.4], [150.0, 150.43], [162.0, 165.35], [169.0, 169.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 46.64, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.16, 0.0, 68.8, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 26.61], ["livestock, farm animals, working animals", 17.05], ["sheep", 9.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 0.76, 0.36, -0.1, 0.82, 0.72, 0.29, 0.64, 0.93, 0.39, 0.94, 0.17, 2.89, 0.98, 1.57, 9.84, 0.63, -0.11, 0.44, 5.0, 0.82, 0.14, -0.21, 0.28, 1.37, 7.1, 0.65, 0.42, -0.22, 3.59, 0.51, 4.11, 1.21, 0.15, 0.88, 0.4, 0.43, 3.35, 0.79]} \ No newline at end of file diff --git a/annotations_1/PiL1okP-jbc_filtered.json b/annotations_1/PiL1okP-jbc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d0f5257352ed4c5ac743ee5139b508592cf63ef --- /dev/null +++ b/annotations_1/PiL1okP-jbc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.9], [15.0, 24.81], [41.0, 51.22], [53.0, 59.98], [63.0, 91.0], [93.0, 102.36], [104.0, 111.79], [118.0, 117.9], [118.0, 118.1], [118.0, 131.43], [138.0, 144.48], [147.0, 148.27], [150.0, 149.91], [150.0, 150.53]], "keep_status": [true, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [28.27, 28.43, 31.18, 29.96, 28.7, 29.21, 29.21, 0.0, 0.0, 29.61, 28.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.72], ["breaking", 4.4], ["sound effect", 3.04]], [["music", 68.7], ["speech", 12.57], ["synthesizer", 3.05]], [["music", 45.54], ["speech", 31.37], ["synthesizer", 6.3]], [["foghorn", 33.62], ["fly, housefly", 19.49], ["music", 17.97]], [["speech", 62.46], ["music", 14.88], ["vehicle", 2.69]], [["music", 33.96], ["speech", 25.17], ["outside, rural or natural", 3.63]], [["music", 82.4], ["synthesizer", 2.18], ["musical instrument", 1.98]], null, null, [["music", 57.72], ["speech", 18.64], ["electronic music", 3.3]], [["music", 51.44], ["didgeridoo", 5.97], ["synthesizer", 5.34]], null, null, null], "duration": [3.9, 9.81, 10.22, 6.98, 28.0, 9.36, 7.79, -0.1, 0.1, 13.43, 6.48, 1.27, -0.09, 0.53]} \ No newline at end of file diff --git a/annotations_1/PitkS4aYur8_filtered.json b/annotations_1/PitkS4aYur8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..150b8e918e60235f4ca4e63c12e86dcf517d87e9 --- /dev/null +++ b/annotations_1/PitkS4aYur8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.44], [16.0, 16.71], [39.0, 41.08], [53.0, 54.67], [67.0, 67.49], [89.0, 90.29], [119.0, 120.33], [135.0, 149.45], [150.0, 151.19], [174.0, 175.85], [177.0, 177.92], [179.0, 179.07], [183.0, 183.9], [185.0, 186.12], [192.0, 201.99], [203.0, 205.34]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.93, 0.0, 31.41, 0.0, 0.0, 0.0, 0.0, 30.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.69, 67.0], "audiomae_on_audioset": [[["hum", 43.26], ["music", 21.86], ["mains hum", 14.21]], null, [["explosion", 23.79], ["speech", 13.35], ["burst, pop", 10.6]], null, null, null, null, [["hum", 46.1], ["mains hum", 17.9], ["music", 12.48]], null, null, null, null, null, null, [["music", 39.36], ["speech", 31.89], ["hum", 6.9]], null], "duration": [6.44, 0.71, 2.08, 1.67, 0.49, 1.29, 1.33, 14.45, 1.19, 1.85, 0.92, 0.07, 0.9, 1.12, 9.99, 2.34]} \ No newline at end of file diff --git a/annotations_1/Pj2K4FrqTmw_filtered.json b/annotations_1/Pj2K4FrqTmw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40f50fd279ffceed942b7a8ce4e214a9c7587c00 --- /dev/null +++ b/annotations_1/Pj2K4FrqTmw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 13.8], [15.0, 15.75], [19.0, 19.67], [21.0, 22.38], [24.0, 25.03], [28.0, 28.76], [30.0, 31.24], [36.0, 37.2], [38.0, 39.19], [41.0, 42.18], [44.0, 45.45], [47.0, 49.37], [50.0, 54.75], [57.0, 57.89], [62.0, 62.68], [65.0, 66.63], [69.0, 69.31], [73.0, 74.16], [75.0, 75.59], [77.0, 89.13], [91.0, 92.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 59.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [13.8, 0.75, 0.67, 1.38, 1.03, 0.76, 1.24, 1.2, 1.19, 1.18, 1.45, 2.37, 4.75, 0.89, 0.68, 1.63, 0.31, 1.16, 0.59, 12.13, 1.7]} \ No newline at end of file diff --git a/annotations_1/Pk-vHw-mstI_filtered.json b/annotations_1/Pk-vHw-mstI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4f576da2697f228cd04d84a86e5a047d262289f --- /dev/null +++ b/annotations_1/Pk-vHw-mstI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[82.0, 113.19], [119.0, 119.42], [126.0, 139.65], [140.0, 141.44], [142.0, 143.85], [146.0, 150.25], [152.0, 154.63], [156.0, 181.97]], "keep_status": [false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 47.2, 0.0, 0.0, 53.04, 55.89, 36.82], "audiomae_on_audioset": [null, null, [["music", 45.74], ["synthesizer", 10.75], ["throbbing", 7.81]], null, null, null, null, [["hum", 27.37], ["mains hum", 16.57], ["rumble", 8.39]]], "duration": [31.19, 0.42, 13.65, 1.44, 1.85, 4.25, 2.63, 25.97]} \ No newline at end of file diff --git a/annotations_1/Pk-zBUDgesM_filtered.json b/annotations_1/Pk-zBUDgesM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13964cad4495f21119f23d051924b3b38451989d --- /dev/null +++ b/annotations_1/Pk-zBUDgesM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [11.0, 15.99], [20.0, 20.66], [22.0, 23.55], [32.0, 31.99], [34.0, 37.39], [38.0, 38.57], [41.0, 42.16], [43.0, 44.0], [54.0, 53.72], [55.0, 57.23], [62.0, 62.18], [62.0, 65.11], [70.0, 70.11], [74.0, 74.92], [77.0, 78.44], [83.0, 82.95], [96.0, 97.01], [98.0, 98.24], [104.0, 105.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 70.86, 0.0, 0.0, 0.0, 79.41, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.14, 4.99, 0.66, 1.55, -0.01, 3.39, 0.57, 1.16, 1.0, -0.28, 2.23, 0.18, 3.11, 0.11, 0.92, 1.44, -0.05, 1.01, 0.24, 1.11]} \ No newline at end of file diff --git a/annotations_1/PkCxda_9xRc_filtered.json b/annotations_1/PkCxda_9xRc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a5b5aed918af459f040c170e61c224add7e47f4 --- /dev/null +++ b/annotations_1/PkCxda_9xRc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.09], [7.0, 7.45], [8.0, 11.87], [16.0, 19.3], [21.0, 21.34], [24.0, 24.75], [26.0, 26.15], [33.0, 32.91], [34.0, 34.65], [37.0, 37.5], [39.0, 38.99], [40.0, 40.37], [45.0, 48.9], [56.0, 62.88], [65.0, 68.1], [69.0, 69.45], [73.0, 83.22], [85.0, 87.0], [87.0, 88.53], [90.0, 91.37], [92.0, 96.4], [97.0, 97.48], [99.0, 99.05], [102.0, 104.9], [106.0, 107.99], [108.0, 108.87], [111.0, 113.29], [114.0, 114.84], [116.0, 139.78], [140.0, 140.19], [143.0, 145.0], [150.0, 151.53], [153.0, 168.3], [172.0, 172.67], [173.0, 178.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 37.55, 57.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.26, 48.31, 54.83, 0.0, 69.88, 89.19, 0.0, 0.0, 40.4, 0.0, 0.0, 74.13, 0.0, 0.0, 84.98, 0.0, 34.07, 0.0, 32.91, 0.0, 34.85, 0.0, 31.47], "audiomae_on_audioset": [null, null, [["speech", 66.71], ["thunk", 5.09], ["boing", 5.07]], null, null, null, null, null, null, null, null, null, [["speech", 48.34], ["radio", 11.04], ["animal", 7.07]], [["speech", 41.87], ["sidetone", 13.15], ["animal", 5.48]], null, null, null, null, null, null, [["speech", 53.73], ["radio", 23.68], ["sidetone", 8.2]], null, null, null, null, null, null, null, [["speech", 67.94], ["sidetone", 4.49], ["telephone", 3.76]], null, [["didgeridoo", 22.18], ["throbbing", 13.57], ["hum", 10.34]], null, [["fly, housefly", 32.64], ["insect", 15.63], ["mosquito", 11.18]], null, [["music", 42.63], ["speech", 22.22], ["quack", 8.82]]], "duration": [0.09, 0.45, 3.87, 3.3, 0.34, 0.75, 0.15, -0.09, 0.65, 0.5, -0.01, 0.37, 3.9, 6.88, 3.1, 0.45, 10.22, 2.0, 1.53, 1.37, 4.4, 0.48, 0.05, 2.9, 1.99, 0.87, 2.29, 0.84, 23.78, 0.19, 2.0, 1.53, 15.3, 0.67, 5.6]} \ No newline at end of file diff --git a/annotations_1/PkLpd8Eaah0_filtered.json b/annotations_1/PkLpd8Eaah0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..244a9cdead8a04c268df7909f3e438af6cfb22f3 --- /dev/null +++ b/annotations_1/PkLpd8Eaah0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 42.35], [60.0, 62.88], [65.0, 72.4], [73.0, 83.78], [85.0, 85.46], [96.0, 97.9], [99.0, 99.89], [101.0, 102.17], [105.0, 106.1], [108.0, 109.95], [122.0, 123.01], [127.0, 127.89], [131.0, 135.95], [138.0, 138.64], [139.0, 139.67], [140.0, 145.59], [148.0, 158.63]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [32.47, 32.85, 32.11, 32.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.79, 0.0, 0.0, 33.45, 33.29], "audiomae_on_audioset": [[["music", 40.87], ["brass instrument", 16.94], ["musical instrument", 12.09]], [["insect", 28.83], ["fly, housefly", 21.95], ["livestock, farm animals, working animals", 9.69]], [["music", 35.76], ["theremin", 8.78], ["musical instrument", 6.51]], [["music", 34.08], ["brass instrument", 21.43], ["trombone", 14.75]], null, null, null, null, null, null, null, null, [["music", 32.0], ["brass instrument", 22.13], ["musical instrument", 12.22]], null, null, [["music", 34.27], ["brass instrument", 27.25], ["musical instrument", 10.59]], [["brass instrument", 35.62], ["music", 26.3], ["saxophone", 17.01]]], "duration": [11.35, 2.88, 7.4, 10.78, 0.46, 1.9, 0.89, 1.17, 1.1, 1.95, 1.01, 0.89, 4.95, 0.64, 0.67, 5.59, 10.63]} \ No newline at end of file diff --git a/annotations_1/PkUS3Y9bR9s_filtered.json b/annotations_1/PkUS3Y9bR9s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..265d1f6e2d647876a46d88e4de164454be6d8d3c --- /dev/null +++ b/annotations_1/PkUS3Y9bR9s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 28.51], [31.0, 40.88], [42.0, 42.96], [43.0, 45.1], [47.0, 54.45], [56.0, 140.98], [142.0, 143.04]], "keep_status": [false, false, false, true, false, false, false], "silence_prob": [55.89, 76.2, 0.0, 37.89, 46.57, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 21.53], ["gong", 20.94], ["music", 14.46]], [["hum", 60.76], ["mains hum", 13.12], ["rumble", 7.48]], null, null], "duration": [9.51, 9.88, 0.96, 2.1, 7.45, 84.98, 1.04]} \ No newline at end of file diff --git a/annotations_1/Pku1UxtmkLM_filtered.json b/annotations_1/Pku1UxtmkLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1706daeee6d9198f82907866de3e6fa3c524ea3 --- /dev/null +++ b/annotations_1/Pku1UxtmkLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.06], [24.0, 31.23], [33.0, 59.95], [65.0, 76.13]], "keep_status": [true, true, true, true], "silence_prob": [37.24, 35.37, 39.15, 29.96], "audiomae_on_audioset": [[["music", 37.0], ["speech", 24.79], ["singing bowl", 4.65]], [["music", 60.55], ["didgeridoo", 2.61], ["fly, housefly", 2.28]], [["music", 45.7], ["hum", 12.15], ["didgeridoo", 7.29]], [["hum", 42.18], ["music", 13.38], ["throbbing", 12.48]]], "duration": [2.06, 7.23, 26.95, 11.13]} \ No newline at end of file diff --git a/annotations_1/Pl1dl--4OBE_filtered.json b/annotations_1/Pl1dl--4OBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dc9539f2a225e039a5b6b728b52aad479c8849c --- /dev/null +++ b/annotations_1/Pl1dl--4OBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.61], [21.0, 26.97], [28.0, 29.51], [31.0, 34.23], [39.0, 42.92], [44.0, 44.81], [46.0, 48.49], [56.0, 57.57], [59.0, 60.76], [62.0, 62.75], [63.0, 67.58], [69.0, 103.59]], "keep_status": [false, true, false, true, true, false, true, false, false, false, false, false], "silence_prob": [29.1, 28.86, 0.0, 30.46, 29.72, 0.0, 31.22, 0.0, 0.0, 0.0, 29.38, 0.0], "audiomae_on_audioset": [[["music", 34.56], ["throbbing", 20.29], ["hum", 16.42]], [["speech", 59.79], ["music", 4.98], ["vehicle", 4.9]], null, [["music", 33.58], ["foghorn", 9.87], ["hum", 7.94]], [["speech", 22.09], ["hum", 18.9], ["music", 14.07]], null, [["throbbing", 27.72], ["hum", 26.75], ["music", 10.23]], null, null, null, [["speech", 28.49], ["throbbing", 26.04], ["hum", 21.94]], null], "duration": [2.61, 5.97, 1.51, 3.23, 3.92, 0.81, 2.49, 1.57, 1.76, 0.75, 4.58, 34.59]} \ No newline at end of file diff --git a/annotations_1/Pl8E_9CTS1Y_filtered.json b/annotations_1/Pl8E_9CTS1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32a21f008a1af532121aac098d96eba183175c71 --- /dev/null +++ b/annotations_1/Pl8E_9CTS1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.39], [6.0, 7.05], [7.0, 7.86], [14.0, 14.81], [17.0, 17.88], [19.0, 20.53], [22.0, 21.91], [24.0, 28.07], [30.0, 29.83], [34.0, 36.09], [38.0, 40.73], [43.0, 44.73], [47.0, 48.39], [52.0, 52.52], [56.0, 56.66], [58.0, 58.75], [67.0, 67.61], [77.0, 77.33], [79.0, 79.3], [88.0, 89.01], [90.0, 90.22], [91.0, 91.61], [93.0, 93.28], [94.0, 95.0], [107.0, 116.18], [117.0, 117.81], [123.0, 126.4], [128.0, 128.24]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.01, 0.0, 56.33, 40.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 94.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 45.49], ["gong", 6.52], ["noise", 6.34]], null, null, [["music", 41.22], ["clarinet", 11.28], ["musical instrument", 8.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 1.05, 0.86, 0.81, 0.88, 1.53, -0.09, 4.07, -0.17, 2.09, 2.73, 1.73, 1.39, 0.52, 0.66, 0.75, 0.61, 0.33, 0.3, 1.01, 0.22, 0.61, 0.28, 1.0, 9.18, 0.81, 3.4, 0.24]} \ No newline at end of file diff --git a/annotations_1/PlJ-x-JNEj8_filtered.json b/annotations_1/PlJ-x-JNEj8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa579d1f5b5f2f602409676e40b1d762436d19c3 --- /dev/null +++ b/annotations_1/PlJ-x-JNEj8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.7], [27.0, 27.13], [34.0, 39.8], [46.0, 50.75], [52.0, 64.56], [68.0, 67.64], [73.0, 74.9], [80.0, 82.07], [83.0, 103.32], [108.0, 117.0]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.59, 29.84, 29.24, 0.0, 0.0, 30.96, 30.39, 30.43], "audiomae_on_audioset": [null, null, [["music", 30.75], ["speech", 24.0], ["whack, thwack", 11.34]], [["livestock, farm animals, working animals", 36.93], ["moo", 19.27], ["cattle, bovinae", 17.48]], [["music", 76.11], ["speech", 9.14], ["electric shaver, electric razor", 1.41]], null, null, [["music", 50.77], ["throbbing", 20.91], ["hum", 5.66]], [["music", 50.26], ["speech", 40.58], ["whale vocalization", 1.74]], [["speech", 51.47], ["music", 21.65], ["hum", 6.58]]], "duration": [1.7, 0.13, 5.8, 4.75, 12.56, -0.36, 1.9, 2.07, 20.32, 9.0]} \ No newline at end of file diff --git a/annotations_1/PlKDQqKh03Y_filtered.json b/annotations_1/PlKDQqKh03Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a568271cf60cf059e1a6c845e725a49167206ff6 --- /dev/null +++ b/annotations_1/PlKDQqKh03Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.08], [5.0, 12.33], [14.0, 31.48], [32.0, 34.2], [39.0, 39.93], [41.0, 41.25], [43.0, 43.95], [46.0, 46.79], [48.0, 48.3], [49.0, 50.13], [51.0, 51.44], [56.0, 55.9], [60.0, 63.98], [65.0, 66.29], [67.0, 68.44], [71.0, 71.47], [73.0, 72.86], [78.0, 78.76], [80.0, 80.18], [83.0, 83.76], [87.0, 88.15], [90.0, 91.17], [92.0, 93.66], [95.0, 96.52], [97.0, 99.1], [101.0, 101.39], [102.0, 102.96], [104.0, 106.22], [107.0, 107.87], [123.0, 123.21], [128.0, 129.0], [130.0, 130.0], [131.0, 133.61], [134.0, 135.89], [147.0, 147.58], [168.0, 169.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.59, 97.92, 97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.21, 0.0, 0.0, 35.39, 0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.47], ["music", 12.97], ["beatboxing", 7.87]], null, null, null, null, null, null, null, null], "duration": [0.08, 7.33, 17.48, 2.2, 0.93, 0.25, 0.95, 0.79, 0.3, 1.13, 0.44, -0.1, 3.98, 1.29, 1.44, 0.47, -0.14, 0.76, 0.18, 0.76, 1.15, 1.17, 1.66, 1.52, 2.1, 0.39, 0.96, 2.22, 0.87, 0.21, 1.0, 0.0, 2.61, 1.89, 0.58, 1.92]} \ No newline at end of file diff --git a/annotations_1/PlkvQ0NbjUs_filtered.json b/annotations_1/PlkvQ0NbjUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..038b92b261d1992acdeaf4c83a0c588f5dc4b09c --- /dev/null +++ b/annotations_1/PlkvQ0NbjUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.61], [16.0, 16.36], [20.0, 22.11], [24.0, 25.0], [35.0, 34.74], [36.0, 36.58], [39.0, 39.43], [46.0, 46.33], [50.0, 50.97], [52.0, 52.49], [56.0, 56.05], [59.0, 60.57], [62.0, 62.23], [65.0, 65.45], [66.0, 67.15], [68.0, 68.93], [70.0, 71.58], [75.0, 75.71], [80.0, 81.3], [83.0, 84.79], [86.0, 87.27], [90.0, 90.78], [95.0, 95.23], [98.0, 98.25], [101.0, 108.57], [110.0, 110.93], [118.0, 118.99], [120.0, 122.89], [123.0, 124.66], [127.0, 126.94], [129.0, 136.29], [138.0, 143.5], [146.0, 149.93], [160.0, 161.74], [163.0, 163.98], [168.0, 170.26], [171.0, 172.15], [173.0, 175.22], [177.0, 180.03], [183.0, 183.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.59, 0.0, 0.0, 30.51, 30.29, 96.54, 0.0, 0.0, 94.37, 0.0, 96.66, 99.48, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.87], ["hum", 26.63], ["mains hum", 9.33]], [["whip", 31.38], ["gong", 14.95], ["music", 11.69]], null, null, null, null, null, null, null, null], "duration": [5.61, 0.36, 2.11, 1.0, -0.26, 0.58, 0.43, 0.33, 0.97, 0.49, 0.05, 1.57, 0.23, 0.45, 1.15, 0.93, 1.58, 0.71, 1.3, 1.79, 1.27, 0.78, 0.23, 0.25, 7.57, 0.93, 0.99, 2.89, 1.66, -0.06, 7.29, 5.5, 3.93, 1.74, 0.98, 2.26, 1.15, 2.22, 3.03, 0.56]} \ No newline at end of file diff --git a/annotations_1/PmYdvwAqwDg_filtered.json b/annotations_1/PmYdvwAqwDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd0f54f7044bf8477be41100b1478b9a91b6afee --- /dev/null +++ b/annotations_1/PmYdvwAqwDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.43], [6.0, 7.5], [10.0, 11.42], [17.0, 17.91], [21.0, 21.73], [22.0, 24.87], [26.0, 50.01], [54.0, 54.94], [56.0, 56.17], [58.0, 58.02], [62.0, 77.13], [78.0, 84.92], [86.0, 87.37], [88.0, 88.96]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 40.36, 29.15, 0.0, 0.0, 0.0, 29.79, 64.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 58.15], ["speech", 17.74], ["theremin", 2.51]], [["music", 62.06], ["timpani", 2.75], ["hum", 2.63]], null, null, null, [["theremin", 30.12], ["music", 28.86], ["noise", 6.56]], null, null, null], "duration": [0.43, 1.5, 1.42, 0.91, 0.73, 2.87, 24.01, 0.94, 0.17, 0.02, 15.13, 6.92, 1.37, 0.96]} \ No newline at end of file diff --git a/annotations_1/Pm_7ga5bxeI_filtered.json b/annotations_1/Pm_7ga5bxeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d933ab21f5262046cfc3a17e8594cd1bc59773b --- /dev/null +++ b/annotations_1/Pm_7ga5bxeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[96.0, 102.52], [104.0, 108.5], [109.0, 129.37]], "keep_status": [true, true, false], "silence_prob": [41.16, 45.92, 34.89], "audiomae_on_audioset": [[["music", 50.6], ["hum", 6.87], ["mains hum", 5.92]], [["music", 53.91], ["singing bowl", 11.35], ["didgeridoo", 3.8]], [["music", 54.13], ["ambient music", 9.29], ["singing bowl", 7.46]]], "duration": [6.52, 4.5, 20.37]} \ No newline at end of file diff --git a/annotations_1/PoAxZJMYRWE_filtered.json b/annotations_1/PoAxZJMYRWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8da001e80c113aeffc9531a0b0a7e3115ee0ebfc --- /dev/null +++ b/annotations_1/PoAxZJMYRWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.16], [8.0, 12.6], [14.0, 14.13], [17.0, 16.8], [18.0, 18.52], [19.0, 20.02], [21.0, 22.62], [25.0, 25.37], [27.0, 27.55], [38.0, 38.43], [42.0, 41.89], [45.0, 45.99], [50.0, 51.88], [52.0, 56.35], [60.0, 61.42], [64.0, 65.37], [66.0, 69.26], [70.0, 72.17], [74.0, 75.52], [78.0, 80.37], [87.0, 87.66], [89.0, 102.95], [104.0, 106.19], [112.0, 120.55], [122.0, 122.81], [125.0, 124.68], [126.0, 125.9], [126.0, 125.96], [126.0, 126.08], [126.0, 127.58], [128.0, 128.8], [139.0, 138.87], [147.0, 148.42], [165.0, 164.96], [166.0, 166.94], [177.0, 178.43], [180.0, 183.61], [187.0, 187.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 93.45, 69.34, 0.0, 97.0, 0.0, 32.83, 47.98, 31.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 27.57], ["clang", 20.01], ["ding", 9.68]], [["music", 14.63], ["speech", 10.36], ["boing", 8.59]], [["livestock, farm animals, working animals", 15.54], ["cattle, bovinae", 14.71], ["whack, thwack", 9.01]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 4.6, 0.13, -0.2, 0.52, 1.02, 1.62, 0.37, 0.55, 0.43, -0.11, 0.99, 1.88, 4.35, 1.42, 1.37, 3.26, 2.17, 1.52, 2.37, 0.66, 13.95, 2.19, 8.55, 0.81, -0.32, -0.1, -0.04, 0.08, 1.58, 0.8, -0.13, 1.42, -0.04, 0.94, 1.43, 3.61, 0.12]} \ No newline at end of file diff --git a/annotations_1/PoIuiCAepLU_filtered.json b/annotations_1/PoIuiCAepLU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..804870574f9c38b0a02a340e64b5f3ccbff784db --- /dev/null +++ b/annotations_1/PoIuiCAepLU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [6.0, 8.07], [9.0, 10.37], [41.0, 41.45], [52.0, 52.69], [54.0, 54.16], [57.0, 60.49], [63.0, 63.78], [71.0, 72.54], [74.0, 82.97], [88.0, 88.53], [94.0, 94.69], [100.0, 100.84], [103.0, 106.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 78.89, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 56.7, 0.0, 0.0, 0.0, 45.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["moo", 18.35], ["cattle, bovinae", 17.19], ["speech", 16.64]]], "duration": [0.29, 2.07, 1.37, 0.45, 0.69, 0.16, 3.49, 0.78, 1.54, 8.97, 0.53, 0.69, 0.84, 3.0]} \ No newline at end of file diff --git a/annotations_1/PomVYrPHoAg_filtered.json b/annotations_1/PomVYrPHoAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01a86cee78d2131b8158fe01b5d793cb11603394 --- /dev/null +++ b/annotations_1/PomVYrPHoAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.46], [14.0, 14.93], [111.0, 113.66], [129.0, 128.68]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 99.97, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.46, 0.93, 2.66, -0.32]} \ No newline at end of file diff --git a/annotations_1/PpxLYsi1Yk4_filtered.json b/annotations_1/PpxLYsi1Yk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da56692813266523150a346187bf2f70f6f7c57e --- /dev/null +++ b/annotations_1/PpxLYsi1Yk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.83], [10.0, 10.89], [13.0, 14.13], [15.0, 18.47], [22.0, 27.18], [32.0, 36.44], [42.0, 43.26], [49.0, 60.72], [61.0, 73.94], [78.0, 81.9], [83.0, 88.53]], "keep_status": [false, false, false, true, true, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 48.23, 49.59, 37.16, 0.0, 34.32, 30.56, 31.13, 32.88], "audiomae_on_audioset": [null, null, null, [["music", 39.05], ["speech", 20.51], ["ambient music", 2.36]], [["hum", 27.72], ["music", 24.06], ["mains hum", 8.01]], [["music", 39.04], ["speech", 31.02], ["didgeridoo", 6.8]], null, [["music", 89.21], ["soundtrack music", 2.28], ["throbbing", 1.36]], [["music", 43.04], ["speech", 14.18], ["didgeridoo", 4.09]], [["speech", 51.79], ["horse", 13.76], ["animal", 9.83]], [["music", 25.16], ["hum", 21.02], ["speech", 14.43]]], "duration": [0.83, 0.89, 1.13, 3.47, 5.18, 4.44, 1.26, 11.72, 12.94, 3.9, 5.53]} \ No newline at end of file diff --git a/annotations_1/PqOlbM-zmuI_filtered.json b/annotations_1/PqOlbM-zmuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d51976061fc7b2068767b5c6759334f2ea741ac --- /dev/null +++ b/annotations_1/PqOlbM-zmuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.05], [11.0, 11.85], [13.0, 17.74], [20.0, 24.68], [26.0, 27.3], [29.0, 30.32], [32.0, 32.53], [45.0, 46.57], [51.0, 52.05], [55.0, 55.93], [58.0, 58.58], [59.0, 60.61], [67.0, 67.1], [79.0, 79.46], [80.0, 80.54], [90.0, 90.98], [99.0, 99.47], [108.0, 115.11], [116.0, 117.76], [119.0, 118.76], [119.0, 120.46], [122.0, 122.42], [123.0, 122.67], [127.0, 127.3], [129.0, 129.37], [130.0, 130.42], [131.0, 130.54], [131.0, 134.08], [136.0, 136.27], [137.0, 138.06]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 31.4, 38.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.02, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["rumble", 27.97], ["speech", 23.57], ["whack, thwack", 13.17]], [["music", 15.53], ["single-lens reflex camera", 9.85], ["coin (dropping)", 8.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.7], ["speech", 11.06], ["fly, housefly", 6.12]], null, null, null, null, null, null, null, null, null, [["speech", 29.88], ["inside, small room", 5.1], ["breaking", 3.52]], null, null], "duration": [1.05, 0.85, 4.74, 4.68, 1.3, 1.32, 0.53, 1.57, 1.05, 0.93, 0.58, 1.61, 0.1, 0.46, 0.54, 0.98, 0.47, 7.11, 1.76, -0.24, 1.46, 0.42, -0.33, 0.3, 0.37, 0.42, -0.46, 3.08, 0.27, 1.06]} \ No newline at end of file diff --git a/annotations_1/PrBVgtAeNhE_filtered.json b/annotations_1/PrBVgtAeNhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28d26c7e5ce85ca2a9cf7c222493223b8f436d16 --- /dev/null +++ b/annotations_1/PrBVgtAeNhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.88], [16.0, 16.92], [20.0, 20.7], [22.0, 22.4], [23.0, 24.21], [30.0, 30.94], [36.0, 35.97], [39.0, 39.36], [49.0, 49.23], [53.0, 53.3], [66.0, 65.97], [69.0, 69.35], [91.0, 91.44], [98.0, 98.86], [101.0, 101.53], [103.0, 103.64], [115.0, 115.48], [124.0, 124.24], [127.0, 127.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.12, 0.92, 0.7, 0.4, 1.21, 0.94, -0.03, 0.36, 0.23, 0.3, -0.03, 0.35, 0.44, 0.86, 0.53, 0.64, 0.48, 0.24, 0.63]} \ No newline at end of file diff --git a/annotations_1/Ps3MsEdfpAw_filtered.json b/annotations_1/Ps3MsEdfpAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18e2b1c6a800b3b512fa2a892689b6caa1605e9b --- /dev/null +++ b/annotations_1/Ps3MsEdfpAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.94], [18.0, 27.82], [30.0, 33.76], [37.0, 46.8], [48.0, 49.1], [51.0, 62.31], [64.0, 67.1], [72.0, 72.33], [74.0, 74.7], [76.0, 77.23], [89.0, 90.44], [92.0, 95.98], [99.0, 113.66], [115.0, 115.96], [121.0, 121.47], [124.0, 129.52], [137.0, 152.74], [162.0, 164.05], [177.0, 177.84], [183.0, 183.36], [187.0, 190.31]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [31.11, 31.37, 33.91, 30.78, 0.0, 31.36, 37.31, 0.0, 0.0, 0.0, 0.0, 34.51, 32.15, 0.0, 0.0, 34.64, 30.52, 31.98, 0.0, 0.0, 35.8], "audiomae_on_audioset": [[["music", 64.45], ["electronic music", 3.91], ["techno", 3.42]], [["music", 61.74], ["livestock, farm animals, working animals", 6.13], ["speech", 5.86]], [["music", 33.79], ["hum", 19.72], ["throbbing", 18.5]], [["music", 81.97], ["grunt", 2.54], ["throbbing", 1.11]], null, [["music", 28.28], ["speech", 18.61], ["outside, rural or natural", 5.34]], [["speech", 58.72], ["music", 7.57], ["hiccup", 2.86]], null, null, null, null, [["boing", 26.66], ["speech", 16.43], ["groan", 15.16]], [["music", 75.86], ["sampler", 3.66], ["electronic music", 2.71]], null, null, [["music", 57.09], ["hum", 8.49], ["throbbing", 7.91]], [["music", 56.13], ["synthesizer", 9.21], ["electronic music", 7.84]], [["music", 17.62], ["speech", 17.45], ["vehicle", 3.92]], null, null, [["cattle, bovinae", 44.95], ["moo", 41.88], ["livestock, farm animals, working animals", 10.16]]], "duration": [9.94, 9.82, 3.76, 9.8, 1.1, 11.31, 3.1, 0.33, 0.7, 1.23, 1.44, 3.98, 14.66, 0.96, 0.47, 5.52, 15.74, 2.05, 0.84, 0.36, 3.31]} \ No newline at end of file diff --git a/annotations_1/PsRTAWDrNYo_filtered.json b/annotations_1/PsRTAWDrNYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f8e78850bdd8b68699b6d310825f3bb363d3ea8 --- /dev/null +++ b/annotations_1/PsRTAWDrNYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.61], [10.0, 33.67], [35.0, 35.29], [38.0, 65.69], [66.0, 122.01], [124.0, 123.69], [133.0, 136.66]], "keep_status": [true, false, false, true, false, false, true], "silence_prob": [32.95, 28.62, 0.0, 28.36, 0.0, 0.0, 30.54], "audiomae_on_audioset": [[["music", 31.17], ["hum", 26.77], ["electronic music", 7.56]], [["whale vocalization", 33.0], ["music", 20.41], ["hum", 19.82]], null, [["whale vocalization", 18.8], ["sound effect", 17.96], ["music", 10.17]], null, null, [["music", 28.42], ["cacophony", 11.38], ["synthesizer", 8.77]]], "duration": [3.61, 23.67, 0.29, 27.69, 56.01, -0.31, 3.66]} \ No newline at end of file diff --git a/annotations_1/Pt6VzQ_0k_I_filtered.json b/annotations_1/Pt6VzQ_0k_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74a2e17081375e596a8e9618735ab6ec45a67ade --- /dev/null +++ b/annotations_1/Pt6VzQ_0k_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 41.08], [42.0, 41.93], [44.0, 48.44], [57.0, 59.12], [64.0, 169.1], [171.0, 171.29], [171.0, 179.85], [183.0, 204.58], [206.0, 206.42], [207.0, 206.79]], "keep_status": [false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 32.0, 36.16, 0.0, 0.0, 32.77, 29.83, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 49.16], ["mains hum", 18.44], ["hum", 12.07]], [["music", 31.97], ["speech", 9.92], ["fly, housefly", 5.02]], null, null, [["music", 73.05], ["speech", 10.56], ["groan", 1.89]], [["mains hum", 32.3], ["hum", 17.9], ["buzz", 17.13]], null, null], "duration": [32.08, -0.07, 4.44, 2.12, 105.1, 0.29, 8.85, 21.58, 0.42, -0.21]} \ No newline at end of file diff --git a/annotations_1/Pu8AnCsWdiM_filtered.json b/annotations_1/Pu8AnCsWdiM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be07c8ec80f7d295c8f89e24c0fa4146a1f0f544 --- /dev/null +++ b/annotations_1/Pu8AnCsWdiM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[89.0, 92.52], [94.0, 94.68], [95.0, 96.15], [96.0, 97.51]], "keep_status": [false, false, false, false], "silence_prob": [60.23, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [3.52, 0.68, 1.15, 1.51]} \ No newline at end of file diff --git a/annotations_1/Pui9t9vPUTc_filtered.json b/annotations_1/Pui9t9vPUTc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..695c26aeb8d83ac0e26d5689ac1dcff115251b14 --- /dev/null +++ b/annotations_1/Pui9t9vPUTc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.85], [12.0, 13.27], [14.0, 14.84], [17.0, 16.65], [17.0, 20.73], [24.0, 38.2], [39.0, 40.26], [41.0, 42.82], [51.0, 51.33], [53.0, 54.4], [60.0, 84.55], [97.0, 106.74]], "keep_status": [true, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [34.21, 0.0, 0.0, 0.0, 29.53, 30.09, 0.0, 0.0, 0.0, 0.0, 29.55, 29.78], "audiomae_on_audioset": [[["music", 43.27], ["middle eastern music", 12.14], ["synthetic singing", 5.81]], null, null, null, [["fly, housefly", 48.5], ["mosquito", 17.07], ["insect", 13.57]], [["music", 49.85], ["trombone", 4.94], ["buzz", 4.16]], null, null, null, null, [["music", 35.59], ["whale vocalization", 25.74], ["sound effect", 3.8]], [["music", 51.76], ["cacophony", 37.74], ["noise", 1.4]]], "duration": [2.85, 1.27, 0.84, -0.35, 3.73, 14.2, 1.26, 1.82, 0.33, 1.4, 24.55, 9.74]} \ No newline at end of file diff --git a/annotations_1/PurV6BzV3fI_filtered.json b/annotations_1/PurV6BzV3fI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95df3a06d74db937d484799aea030df9a56f7fd8 --- /dev/null +++ b/annotations_1/PurV6BzV3fI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.28], [11.0, 11.94], [24.0, 25.78], [29.0, 29.81], [33.0, 35.23], [36.0, 37.54], [40.0, 41.62], [44.0, 44.39], [53.0, 53.72], [56.0, 56.76], [63.0, 64.18], [67.0, 68.01], [70.0, 71.19], [79.0, 80.84], [81.0, 81.45], [83.0, 83.47], [84.0, 84.7], [86.0, 88.75], [100.0, 102.44], [115.0, 115.82], [116.0, 122.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.07, 32.51, 0.0, 42.24], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hoot", 37.75], ["speech", 33.44], ["owl", 12.05]], [["speech", 42.46], ["burping, eructation", 19.94], ["animal", 10.19]], null, [["speech", 48.37], ["animal", 7.16], ["fly, housefly", 6.04]]], "duration": [1.28, 0.94, 1.78, 0.81, 2.23, 1.54, 1.62, 0.39, 0.72, 0.76, 1.18, 1.01, 1.19, 1.84, 0.45, 0.47, 0.7, 2.75, 2.44, 0.82, 6.42]} \ No newline at end of file diff --git a/annotations_1/Pv70ImW-l3s_filtered.json b/annotations_1/Pv70ImW-l3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f693dce042f012c0910d1a62a20c253a07498a9d --- /dev/null +++ b/annotations_1/Pv70ImW-l3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 156.79], [158.0, 173.21]], "keep_status": [false, false], "silence_prob": [0.0, 52.98], "audiomae_on_audioset": [null, null], "duration": [145.79, 15.21]} \ No newline at end of file diff --git a/annotations_1/PvEongWRs5Q_filtered.json b/annotations_1/PvEongWRs5Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21082a1d8e0829ad2a80ffb9a3b49093430d23ff --- /dev/null +++ b/annotations_1/PvEongWRs5Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 119.58], [122.0, 122.52], [124.0, 125.34], [127.0, 127.5]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [48.58, 0.52, 1.34, 0.5]} \ No newline at end of file diff --git a/annotations_1/PvMk6sjZlTU_filtered.json b/annotations_1/PvMk6sjZlTU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1fcec4d3f37c01a7f79817e9c590f586b19f653 --- /dev/null +++ b/annotations_1/PvMk6sjZlTU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 21.96], [23.0, 23.58], [24.0, 25.22], [26.0, 37.99], [44.0, 55.56], [65.0, 65.23], [84.0, 83.93], [93.0, 94.73], [106.0, 105.92], [110.0, 109.83], [115.0, 116.26], [127.0, 127.09], [132.0, 134.77], [136.0, 136.04], [137.0, 138.38]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [29.22, 0.0, 0.0, 29.87, 29.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.06, 0.0, 0.0], "audiomae_on_audioset": [[["music", 80.09], ["cacophony", 2.27], ["singing", 1.78]], null, null, [["music", 63.2], ["speech", 23.16], ["sidetone", 2.72]], [["music", 45.42], ["breaking", 9.28], ["cacophony", 8.29]], null, null, null, null, null, null, null, [["sidetone", 29.25], ["speech", 23.88], ["music", 7.48]], null, null], "duration": [10.96, 0.58, 1.22, 11.99, 11.56, 0.23, -0.07, 1.73, -0.08, -0.17, 1.26, 0.09, 2.77, 0.04, 1.38]} \ No newline at end of file diff --git a/annotations_1/Pve6cemkiDg_filtered.json b/annotations_1/Pve6cemkiDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7aa8525ceaae292c5ba09042f517cd064f142a01 --- /dev/null +++ b/annotations_1/Pve6cemkiDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 50.01], [50.0, 98.96], [101.0, 112.11], [113.0, 150.96], [153.0, 169.7], [170.0, 174.92], [175.0, 175.59]], "keep_status": [false, false, true, false, true, false, false], "silence_prob": [28.68, 0.0, 30.42, 0.0, 32.61, 43.98, 0.0], "audiomae_on_audioset": [[["music", 54.89], ["speech", 13.67], ["cattle, bovinae", 3.69]], null, [["whack, thwack", 25.33], ["groan", 21.69], ["music", 12.11]], null, [["music", 51.55], ["groan", 8.68], ["thump, thud", 3.8]], [["didgeridoo", 48.77], ["music", 26.77], ["speech", 5.63]], null], "duration": [9.01, 48.96, 11.11, 37.96, 16.7, 4.92, 0.59]} \ No newline at end of file diff --git a/annotations_1/PvoBUI7uz-w_filtered.json b/annotations_1/PvoBUI7uz-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af6175ca3e4df765620417b2360d2e0a4826dddd --- /dev/null +++ b/annotations_1/PvoBUI7uz-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.05], [4.0, 8.16], [10.0, 18.4], [21.0, 39.7], [40.0, 46.4], [47.0, 48.03], [49.0, 58.67], [66.0, 66.29], [67.0, 78.34], [80.0, 95.86], [104.0, 104.72], [106.0, 108.78], [110.0, 109.81], [111.0, 111.74], [112.0, 112.53], [113.0, 113.19], [114.0, 115.1], [116.0, 116.46], [118.0, 119.62], [120.0, 121.37], [122.0, 174.51]], "keep_status": [false, true, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.09, 30.74, 37.27, 58.22, 0.0, 41.66, 0.0, 35.91, 31.25, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 26.07], ["moo", 18.08], ["speech", 11.44]], [["speech", 38.2], ["music", 35.55], ["hum", 4.19]], [["hum", 38.79], ["mains hum", 25.09], ["music", 14.72]], null, null, [["music", 30.65], ["didgeridoo", 21.2], ["livestock, farm animals, working animals", 4.82]], null, [["hum", 55.72], ["mains hum", 9.51], ["cattle, bovinae", 6.09]], [["music", 62.5], ["musical instrument", 3.84], ["didgeridoo", 3.62]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.05, 4.16, 8.4, 18.7, 6.4, 1.03, 9.67, 0.29, 11.34, 15.86, 0.72, 2.78, -0.19, 0.74, 0.53, 0.19, 1.1, 0.46, 1.62, 1.37, 52.51]} \ No newline at end of file diff --git a/annotations_1/PvqQnJ7Fvz4_filtered.json b/annotations_1/PvqQnJ7Fvz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2b73914e6af1e78cef6273cead4eeca2ddca077 --- /dev/null +++ b/annotations_1/PvqQnJ7Fvz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.46], [3.0, 3.2], [10.0, 11.55], [15.0, 15.99], [18.0, 19.21], [23.0, 24.31], [29.0, 28.76], [30.0, 30.89], [34.0, 34.67], [35.0, 37.37], [47.0, 48.0], [54.0, 55.48], [59.0, 60.39], [68.0, 68.44], [70.0, 70.98], [77.0, 84.23], [87.0, 87.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 0.2, 1.55, 0.99, 1.21, 1.31, -0.24, 0.89, 0.67, 2.37, 1.0, 1.48, 1.39, 0.44, 0.98, 7.23, 0.45]} \ No newline at end of file diff --git a/annotations_1/Pvva0sdUEkc_filtered.json b/annotations_1/Pvva0sdUEkc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5c49dc3d0bb6fdca79e8bfa04db426cb1931824 --- /dev/null +++ b/annotations_1/Pvva0sdUEkc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.53], [15.0, 23.21], [28.0, 28.76], [37.0, 46.53], [47.0, 49.18], [51.0, 53.6], [55.0, 56.27], [59.0, 68.07], [68.0, 68.17], [68.0, 75.27], [76.0, 81.4], [82.0, 102.49], [104.0, 103.82], [106.0, 120.78], [121.0, 125.79], [129.0, 132.31], [133.0, 147.11], [149.0, 149.72], [155.0, 157.57], [161.0, 166.28], [169.0, 170.04], [170.0, 170.55]], "keep_status": [false, true, false, true, false, true, false, true, false, true, false, false, false, true, false, true, true, false, false, true, false, false], "silence_prob": [0.0, 32.09, 0.0, 32.69, 31.45, 31.26, 0.0, 32.57, 0.0, 33.84, 30.72, 31.24, 0.0, 33.11, 35.29, 32.21, 31.62, 0.0, 33.3, 36.81, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 30.2], ["honk", 13.8], ["music", 13.19]], null, [["fowl", 24.33], ["honk", 22.7], ["music", 17.13]], [["music", 52.95], ["speech", 18.41], ["musical instrument", 3.45]], [["speech", 25.17], ["music", 10.03], ["whale vocalization", 5.11]], null, [["fly, housefly", 21.4], ["insect", 16.79], ["buzz", 14.03]], null, [["music", 39.48], ["hum", 13.38], ["mains hum", 5.34]], [["hum", 45.86], ["mains hum", 18.47], ["throbbing", 11.55]], [["throbbing", 40.68], ["music", 32.73], ["hum", 14.16]], null, [["music", 25.31], ["hum", 15.54], ["mains hum", 12.11]], [["mains hum", 27.42], ["music", 23.67], ["hum", 23.27]], [["music", 44.44], ["speech", 17.86], ["hum", 4.99]], [["fly, housefly", 18.07], ["mains hum", 14.23], ["hum", 14.04]], null, [["mosquito", 60.45], ["fly, housefly", 28.38], ["insect", 4.77]], [["noise", 33.03], ["music", 14.83], ["mosquito", 5.4]], null, null], "duration": [0.53, 8.21, 0.76, 9.53, 2.18, 2.6, 1.27, 9.07, 0.17, 7.27, 5.4, 20.49, -0.18, 14.78, 4.79, 3.31, 14.11, 0.72, 2.57, 5.28, 1.04, 0.55]} \ No newline at end of file diff --git a/annotations_1/PwgxGA6pLhc_filtered.json b/annotations_1/PwgxGA6pLhc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66fc474c55336a7ec9cceef22c848f46552309a8 --- /dev/null +++ b/annotations_1/PwgxGA6pLhc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.45], [8.0, 8.36], [10.0, 21.71], [22.0, 26.69], [27.0, 28.78], [29.0, 38.13], [38.0, 51.49], [52.0, 52.51], [55.0, 71.46], [74.0, 75.73], [77.0, 81.03], [82.0, 83.17], [84.0, 84.21], [84.0, 102.83], [104.0, 111.67]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 55.18, 49.31, 0.0, 39.54, 40.54, 0.0, 36.37, 0.0, 50.56, 0.0, 0.0, 42.93, 39.99], "audiomae_on_audioset": [null, null, null, [["music", 48.49], ["whale vocalization", 12.04], ["mains hum", 3.82]], null, [["music", 61.97], ["electric shaver, electric razor", 5.0], ["skateboard", 3.21]], [["music", 68.76], ["animal", 9.38], ["grunt", 2.17]], null, [["grunt", 56.16], ["music", 26.58], ["groan", 3.55]], null, null, null, null, [["music", 54.0], ["speech", 4.72], ["hum", 4.52]], [["speech", 71.48], ["electric shaver, electric razor", 6.02], ["burping, eructation", 2.09]]], "duration": [0.45, 0.36, 11.71, 4.69, 1.78, 9.13, 13.49, 0.51, 16.46, 1.73, 4.03, 1.17, 0.21, 18.83, 7.67]} \ No newline at end of file diff --git a/annotations_1/Px2L96GVrKs_filtered.json b/annotations_1/Px2L96GVrKs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c883e0cb95dea63f8d37bc650abc04e14c22306 --- /dev/null +++ b/annotations_1/Px2L96GVrKs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.87], [6.0, 8.77], [10.0, 11.01], [13.0, 14.64], [16.0, 17.41], [20.0, 21.19], [22.0, 58.94], [60.0, 61.45]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [58.89, 61.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [2.87, 2.77, 1.01, 1.64, 1.41, 1.19, 36.94, 1.45]} \ No newline at end of file diff --git a/annotations_1/PxKcm6wWUJ0_filtered.json b/annotations_1/PxKcm6wWUJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fc9c622960ff52ba374192d70c3dcf15c6b321a --- /dev/null +++ b/annotations_1/PxKcm6wWUJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [6.0, 9.26], [11.0, 12.26], [13.0, 14.03], [15.0, 15.48], [16.0, 17.78], [19.0, 25.35], [26.0, 29.57], [32.0, 32.48], [38.0, 40.22], [49.0, 49.5], [52.0, 53.72], [64.0, 68.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 99.1, 99.97, 0.0, 100.0, 0.0, 0.0, 98.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 3.26, 1.26, 1.03, 0.48, 1.78, 6.35, 3.57, 0.48, 2.22, 0.5, 1.72, 4.0]} \ No newline at end of file diff --git a/annotations_1/PxuQ1n3xaRQ_filtered.json b/annotations_1/PxuQ1n3xaRQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bd337b130fbca5729ef027f2363513562f4e3f0 --- /dev/null +++ b/annotations_1/PxuQ1n3xaRQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[69.0, 69.92], [71.0, 71.47], [74.0, 118.74], [119.0, 126.77]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.18], "audiomae_on_audioset": [null, null, null, [["hum", 45.46], ["music", 18.03], ["mains hum", 8.16]]], "duration": [0.92, 0.47, 44.74, 7.77]} \ No newline at end of file diff --git a/annotations_1/PyUqYOB4ey8_filtered.json b/annotations_1/PyUqYOB4ey8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..634ebc129a4ecd3ec291e74ba5a3e032bba8826c --- /dev/null +++ b/annotations_1/PyUqYOB4ey8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.65], [8.0, 8.73], [19.0, 21.29], [35.0, 36.81], [40.0, 42.11], [44.0, 44.98], [45.0, 46.67], [47.0, 51.0], [59.0, 59.53], [70.0, 74.65]], "keep_status": [false, false, true, false, true, false, false, true, false, true], "silence_prob": [30.07, 0.0, 29.77, 0.0, 30.48, 0.0, 0.0, 29.29, 0.0, 29.17], "audiomae_on_audioset": [[["sidetone", 39.76], ["music", 24.33], ["speech", 19.34]], null, [["music", 26.93], ["speech", 13.41], ["boing", 6.8]], null, [["music", 62.19], ["speech", 4.64], ["vehicle", 2.05]], null, null, [["music", 27.81], ["vehicle", 17.68], ["speech", 10.39]], null, [["music", 44.36], ["vehicle", 6.61], ["crowd", 5.64]]], "duration": [2.65, 0.73, 2.29, 1.81, 2.11, 0.98, 1.67, 4.0, 0.53, 4.65]} \ No newline at end of file diff --git a/annotations_1/PywpJSG1dTM_filtered.json b/annotations_1/PywpJSG1dTM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..318e59354b3c084e67c8f16720c0273e0fd26f8b --- /dev/null +++ b/annotations_1/PywpJSG1dTM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 61.77], [67.0, 71.44], [72.0, 84.45], [85.0, 104.46], [104.0, 104.62], [105.0, 105.29], [106.0, 122.32], [123.0, 135.23], [137.0, 140.68], [142.0, 169.25], [170.0, 170.45], [171.0, 171.93], [172.0, 177.82], [178.0, 179.05]], "keep_status": [true, false, false, true, false, false, true, false, true, false, false, false, true, false], "silence_prob": [35.98, 33.01, 31.81, 30.63, 0.0, 0.0, 32.0, 29.58, 29.17, 29.36, 0.0, 0.0, 40.86, 0.0], "audiomae_on_audioset": [[["music", 42.76], ["insect", 8.39], ["synthesizer", 6.07]], [["music", 45.85], ["mains hum", 12.4], ["hum", 11.88]], [["hum", 42.18], ["mains hum", 29.72], ["music", 15.64]], [["throbbing", 28.17], ["hum", 22.49], ["speech", 15.88]], null, null, [["didgeridoo", 33.71], ["hum", 16.35], ["music", 12.77]], [["throbbing", 33.59], ["siren", 23.51], ["hum", 15.06]], [["music", 21.78], ["throbbing", 21.44], ["speech", 19.34]], [["music", 41.46], ["hum", 21.06], ["throbbing", 15.51]], null, null, [["hum", 30.42], ["throbbing", 10.37], ["mains hum", 6.38]], null], "duration": [4.77, 4.44, 12.45, 19.46, 0.62, 0.29, 16.32, 12.23, 3.68, 27.25, 0.45, 0.93, 5.82, 1.05]} \ No newline at end of file diff --git a/annotations_1/PzTICfN0A-4_filtered.json b/annotations_1/PzTICfN0A-4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fa5f9dd06335dfa79909285e641e4278ebeb210 --- /dev/null +++ b/annotations_1/PzTICfN0A-4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.61], [9.0, 10.56], [13.0, 14.72], [17.0, 20.78], [24.0, 25.66], [27.0, 28.44], [29.0, 33.27], [34.0, 36.17], [37.0, 38.08], [43.0, 53.49], [55.0, 56.86], [58.0, 60.57], [61.0, 63.37], [65.0, 74.09], [75.0, 79.93], [80.0, 84.27], [85.0, 86.9], [88.0, 92.35], [93.0, 97.55], [100.0, 102.14], [108.0, 119.26], [125.0, 127.06], [129.0, 134.72], [135.0, 135.9], [137.0, 138.01], [139.0, 142.89], [145.0, 146.75], [149.0, 149.79], [152.0, 152.73], [155.0, 158.87], [160.0, 168.37], [170.0, 169.97], [175.0, 185.4]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 61.67, 0.0, 0.0, 48.61, 43.85, 0.0, 55.81, 0.0, 58.89, 47.62, 55.11, 55.74, 36.42, 0.0, 56.7, 48.02, 57.97, 51.18, 53.53, 35.8, 0.0, 0.0, 58.13, 0.0, 0.0, 0.0, 51.39, 54.23, 0.0, 42.15], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 35.08], ["hum", 17.27], ["rumble", 8.82]], [["speech", 65.37], ["whale vocalization", 18.24], ["music", 5.45]], null, null, null, null, [["speech", 25.8], ["music", 24.05], ["guitar", 8.35]], null, null, [["speech", 87.08], ["whale vocalization", 5.3], ["rumble", 1.92]], null, null, [["whale vocalization", 40.14], ["rumble", 24.43], ["hiccup", 10.57]], null, null, null, [["fly, housefly", 22.3], ["speech", 20.72], ["music", 11.43]], null, null, null, null, null, null, null, null, null, [["speech", 14.14], ["heart sounds, heartbeat", 9.37], ["whale vocalization", 5.29]]], "duration": [1.61, 1.56, 1.72, 3.78, 1.66, 1.44, 4.27, 2.17, 1.08, 10.49, 1.86, 2.57, 2.37, 9.09, 4.93, 4.27, 1.9, 4.35, 4.55, 2.14, 11.26, 2.06, 5.72, 0.9, 1.01, 3.89, 1.75, 0.79, 0.73, 3.87, 8.37, -0.03, 10.4]} \ No newline at end of file diff --git a/annotations_1/Q-ABzsALkYs_filtered.json b/annotations_1/Q-ABzsALkYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bc6b1502911ea0e432532c32716191e8a69d33d --- /dev/null +++ b/annotations_1/Q-ABzsALkYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 16.83], [32.0, 31.92], [39.0, 39.77], [42.0, 54.16], [58.0, 58.51], [61.0, 61.11], [64.0, 70.09], [72.0, 75.42], [116.0, 117.86], [125.0, 125.14]], "keep_status": [false, false, false, true, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.85, 0.0, 0.0, 29.06, 28.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 43.41], ["hum", 9.03], ["speech", 4.65]], null, null, [["speech", 36.42], ["electric shaver, electric razor", 14.22], ["music", 6.88]], [["livestock, farm animals, working animals", 20.71], ["cattle, bovinae", 14.52], ["moo", 14.08]], null, null], "duration": [-0.17, -0.08, 0.77, 12.16, 0.51, 0.11, 6.09, 3.42, 1.86, 0.14]} \ No newline at end of file diff --git a/annotations_1/Q0IHL6WGFY0_filtered.json b/annotations_1/Q0IHL6WGFY0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a54f98dade625a911a1c898abd5a6d11220d56df --- /dev/null +++ b/annotations_1/Q0IHL6WGFY0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.68], [16.0, 15.6], [22.0, 22.82], [24.0, 24.27], [25.0, 27.51], [28.0, 30.0], [31.0, 32.49], [34.0, 54.28], [57.0, 57.27], [63.0, 71.31], [80.0, 80.18], [86.0, 91.34], [92.0, 92.91], [95.0, 98.9], [100.0, 101.95], [106.0, 106.47], [109.0, 115.55], [117.0, 146.37]], "keep_status": [false, false, false, false, false, true, false, true, false, true, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 43.43, 41.52, 0.0, 28.86, 0.0, 30.47, 0.0, 43.93, 0.0, 62.68, 0.0, 0.0, 39.72, 40.52], "audiomae_on_audioset": [null, null, null, null, [["music", 63.92], ["electronic music", 6.17], ["hum", 5.26]], [["didgeridoo", 26.83], ["music", 25.36], ["hum", 11.54]], null, [["music", 45.33], ["didgeridoo", 6.31], ["quack", 3.76]], null, [["speech", 35.54], ["hum", 11.3], ["music", 8.92]], null, [["music", 26.02], ["hum", 12.55], ["arrow", 8.08]], null, null, null, null, [["music", 36.67], ["speech", 17.03], ["hum", 14.11]], [["speech", 48.12], ["music", 33.98], ["whale vocalization", 4.71]]], "duration": [0.68, -0.4, 0.82, 0.27, 2.51, 2.0, 1.49, 20.28, 0.27, 8.31, 0.18, 5.34, 0.91, 3.9, 1.95, 0.47, 6.55, 29.37]} \ No newline at end of file diff --git a/annotations_1/Q0IQ3GHGXdM_filtered.json b/annotations_1/Q0IQ3GHGXdM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5951a8d6bf108b1622b7acbd5a69f57ab625d81e --- /dev/null +++ b/annotations_1/Q0IQ3GHGXdM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 31.87], [38.0, 38.55], [45.0, 46.36], [51.0, 56.42], [57.0, 56.62], [57.0, 60.0], [60.0, 62.67], [63.0, 65.75], [71.0, 79.47], [80.0, 81.16], [82.0, 88.8], [89.0, 91.94], [93.0, 93.29], [95.0, 96.06], [97.0, 99.12], [116.0, 116.34], [117.0, 117.96], [120.0, 120.65], [126.0, 126.79], [128.0, 128.65], [132.0, 133.76], [150.0, 151.11], [153.0, 152.78], [178.0, 178.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [71.29, 0.0, 0.0, 40.21, 0.0, 81.0, 52.74, 70.02, 94.07, 0.0, 92.97, 79.07, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 44.7], ["music", 36.18], ["beatboxing", 3.91]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.87, 0.55, 1.36, 5.42, -0.38, 3.0, 2.67, 2.75, 8.47, 1.16, 6.8, 2.94, 0.29, 1.06, 2.12, 0.34, 0.96, 0.65, 0.79, 0.65, 1.76, 1.11, -0.22, 0.82]} \ No newline at end of file diff --git a/annotations_1/Q0gx_D--iDw_filtered.json b/annotations_1/Q0gx_D--iDw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..637400307da6f0b821fb83acedaa8c07397eddeb --- /dev/null +++ b/annotations_1/Q0gx_D--iDw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [5.0, 6.15], [8.0, 8.46], [18.0, 18.35], [21.0, 21.1], [24.0, 29.07], [34.0, 38.45], [42.0, 52.96], [53.0, 53.01], [53.0, 59.41], [60.0, 63.59], [68.0, 67.66], [71.0, 72.25], [73.0, 76.94], [81.0, 87.61], [88.0, 87.64], [88.0, 87.67], [88.0, 87.91], [88.0, 87.94], [88.0, 87.98], [88.0, 107.1], [108.0, 110.27], [111.0, 112.97], [114.0, 115.87], [117.0, 129.9], [131.0, 131.67], [132.0, 149.45], [150.0, 153.18], [154.0, 156.07], [157.0, 159.22], [161.0, 162.7], [165.0, 165.92]], "keep_status": [false, false, false, false, false, true, true, true, false, false, true, false, false, true, true, false, false, false, false, false, true, false, false, false, true, false, false, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.21, 28.46, 29.44, 0.0, 33.74, 28.83, 0.0, 0.0, 31.79, 29.85, 0.0, 0.0, 0.0, 0.0, 0.0, 29.42, 33.8, 0.0, 0.0, 37.81, 0.0, 32.0, 35.49, 34.48, 29.11, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["livestock, farm animals, working animals", 25.4], ["cattle, bovinae", 19.96], ["speech", 8.48]], [["livestock, farm animals, working animals", 17.47], ["cattle, bovinae", 8.36], ["groan", 8.24]], [["speech", 20.08], ["outside, rural or natural", 6.44], ["whack, thwack", 5.68]], null, [["livestock, farm animals, working animals", 50.48], ["cattle, bovinae", 31.45], ["moo", 11.82]], [["speech", 28.38], ["livestock, farm animals, working animals", 13.73], ["animal", 9.43]], null, null, [["speech", 44.48], ["fart", 7.49], ["field recording", 5.92]], [["breaking", 20.33], ["speech", 10.41], ["fly, housefly", 9.35]], null, null, null, null, null, [["livestock, farm animals, working animals", 38.09], ["animal", 7.78], ["buzz", 5.59]], [["music", 44.09], ["speech", 34.63], ["electronic music", 1.8]], null, null, [["music", 22.33], ["crushing", 20.68], ["glass", 10.44]], null, [["music", 67.78], ["didgeridoo", 20.71], ["speech", 1.98]], [["music", 59.08], ["breaking", 5.61], ["theremin", 3.38]], [["music", 24.67], ["speech", 16.56], ["didgeridoo", 7.87]], [["speech", 58.46], ["smash, crash", 4.44], ["music", 4.05]], null, null], "duration": [0.34, 1.15, 0.46, 0.35, 0.1, 5.07, 4.45, 10.96, 0.01, 6.41, 3.59, -0.34, 1.25, 3.94, 6.61, -0.36, -0.33, -0.09, -0.06, -0.02, 19.1, 2.27, 1.97, 1.87, 12.9, 0.67, 17.45, 3.18, 2.07, 2.22, 1.7, 0.92]} \ No newline at end of file diff --git a/annotations_1/Q0okgIEkRJM_filtered.json b/annotations_1/Q0okgIEkRJM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11d3dadf681f3240c49528f37c1f5665b33603e8 --- /dev/null +++ b/annotations_1/Q0okgIEkRJM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 20.61], [22.0, 22.42], [24.0, 23.9], [25.0, 28.65], [29.0, 29.96], [33.0, 37.5], [40.0, 43.65], [46.0, 47.66], [51.0, 56.59], [59.0, 68.71], [74.0, 75.42], [79.0, 83.49], [89.0, 91.42], [100.0, 102.36], [107.0, 110.34]], "keep_status": [false, false, false, true, false, false, false, false, true, true, false, true, true, true, true], "silence_prob": [28.89, 0.0, 0.0, 30.38, 0.0, 28.74, 28.61, 0.0, 29.14, 29.44, 0.0, 30.38, 32.22, 28.55, 29.96], "audiomae_on_audioset": [[["speech", 69.13], ["explosion", 6.26], ["eruption", 4.79]], null, null, [["music", 29.8], ["throbbing", 12.26], ["speech", 9.23]], null, [["speech", 67.34], ["music", 10.32], ["burst, pop", 4.43]], [["machine gun", 38.84], ["speech", 30.11], ["music", 14.45]], null, [["speech", 25.53], ["music", 22.32], ["mains hum", 9.07]], [["mains hum", 24.03], ["music", 20.3], ["hum", 16.69]], null, [["music", 26.54], ["mains hum", 16.6], ["speech", 15.28]], [["music", 36.08], ["speech", 11.24], ["hum", 9.67]], [["music", 24.21], ["whack, thwack", 14.37], ["breaking", 9.42]], [["hum", 22.18], ["breaking", 18.87], ["mains hum", 18.72]]], "duration": [7.61, 0.42, -0.1, 3.65, 0.96, 4.5, 3.65, 1.66, 5.59, 9.71, 1.42, 4.49, 2.42, 2.36, 3.34]} \ No newline at end of file diff --git a/annotations_1/Q1khILbP8yU_filtered.json b/annotations_1/Q1khILbP8yU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c290437026cf600d9f7775c52689b9d92be9f34 --- /dev/null +++ b/annotations_1/Q1khILbP8yU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 96.97], [98.0, 130.81], [134.0, 135.48], [136.0, 150.4], [151.0, 152.0], [154.0, 164.17], [164.0, 164.51], [165.0, 164.84]], "keep_status": [false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.89, 0.0, 34.04, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 33.79], ["speech", 24.94], ["whack, thwack", 7.57]], null, [["music", 49.38], ["didgeridoo", 6.51], ["hum", 4.92]], null, null], "duration": [62.97, 32.81, 1.48, 14.4, 1.0, 10.17, 0.51, -0.16]} \ No newline at end of file diff --git a/annotations_1/Q2-4x2KuRqE_filtered.json b/annotations_1/Q2-4x2KuRqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac178b16f6e0fb04588ed5e42ce75b0b5aebb82e --- /dev/null +++ b/annotations_1/Q2-4x2KuRqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 31.83], [33.0, 39.56], [40.0, 52.34], [54.0, 57.47], [58.0, 66.12], [67.0, 70.66], [76.0, 76.45], [78.0, 78.53], [81.0, 81.14], [93.0, 105.21], [108.0, 113.88], [114.0, 117.8], [118.0, 119.33], [120.0, 121.68], [127.0, 128.43], [129.0, 129.98], [133.0, 133.66], [136.0, 136.95], [138.0, 138.82], [143.0, 144.05], [145.0, 145.2], [146.0, 165.96], [167.0, 175.95]], "keep_status": [true, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.63, 79.59, 32.73, 33.41, 42.48, 58.55, 0.0, 0.0, 0.0, 36.33, 50.46, 48.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.23, 36.97], "audiomae_on_audioset": [[["rumble", 28.44], ["speech", 10.02], ["music", 9.8]], null, [["mosquito", 20.81], ["insect", 16.44], ["fly, housefly", 14.15]], [["music", 33.37], ["didgeridoo", 10.32], ["animal", 10.06]], [["hum", 34.69], ["throbbing", 31.13], ["music", 12.5]], null, null, null, null, [["music", 32.2], ["speech", 23.62], ["throbbing", 15.07]], null, [["fly, housefly", 18.42], ["insect", 10.05], ["mosquito", 8.73]], null, null, null, null, null, null, null, null, null, [["speech", 50.1], ["hum", 12.44], ["throbbing", 11.49]], [["hum", 47.62], ["music", 23.48], ["throbbing", 14.33]]], "duration": [5.83, 6.56, 12.34, 3.47, 8.12, 3.66, 0.45, 0.53, 0.14, 12.21, 5.88, 3.8, 1.33, 1.68, 1.43, 0.98, 0.66, 0.95, 0.82, 1.05, 0.2, 19.96, 8.95]} \ No newline at end of file diff --git a/annotations_1/Q2gFrTuZhFM_filtered.json b/annotations_1/Q2gFrTuZhFM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ba085c7d3784d4cde73fb90cd66ae0c6fe0012a --- /dev/null +++ b/annotations_1/Q2gFrTuZhFM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.59], [2.0, 5.09], [8.0, 8.31], [9.0, 9.69], [11.0, 12.14], [13.0, 37.57], [39.0, 45.18], [47.0, 49.33], [56.0, 56.32], [57.0, 75.47], [77.0, 80.81], [83.0, 88.8], [92.0, 103.94], [109.0, 110.62]], "keep_status": [false, true, false, false, false, false, true, true, false, false, true, true, true, false], "silence_prob": [0.0, 41.68, 0.0, 0.0, 0.0, 28.52, 29.06, 28.19, 0.0, 28.16, 28.18, 30.21, 28.23, 0.0], "audiomae_on_audioset": [null, [["music", 24.72], ["sonar", 22.22], ["hum", 9.55]], null, null, null, [["speech", 71.61], ["music", 4.35], ["hum", 2.38]], [["speech", 41.92], ["music", 12.02], ["vehicle", 6.59]], [["vehicle", 24.38], ["music", 19.94], ["car", 8.6]], null, [["music", 50.1], ["speech", 29.68], ["fart", 4.71]], [["noise", 14.15], ["fixed-wing aircraft, airplane", 14.05], ["vehicle", 10.67]], [["music", 51.19], ["speech", 10.37], ["hum", 6.59]], [["music", 37.47], ["cacophony", 16.12], ["noise", 7.14]], null], "duration": [0.59, 3.09, 0.31, 0.69, 1.14, 24.57, 6.18, 2.33, 0.32, 18.47, 3.81, 5.8, 11.94, 1.62]} \ No newline at end of file diff --git a/annotations_1/Q37sWrXU39s_filtered.json b/annotations_1/Q37sWrXU39s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c254fc146e2bea14d1cf7f35fc1220c3ad5a40ba --- /dev/null +++ b/annotations_1/Q37sWrXU39s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 27.23], [27.0, 42.33], [43.0, 45.82], [47.0, 47.83], [51.0, 59.83], [62.0, 77.67], [78.0, 79.14], [83.0, 84.11], [88.0, 93.28], [95.0, 98.63], [100.0, 145.32], [146.0, 146.33], [147.0, 201.18]], "keep_status": [true, false, true, false, true, false, false, false, true, true, false, false, false], "silence_prob": [34.03, 33.0, 34.01, 0.0, 33.23, 32.92, 0.0, 0.0, 31.19, 31.38, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 26.99], ["music", 23.52], ["mains hum", 14.61]], [["music", 53.39], ["throbbing", 22.0], ["hum", 12.47]], [["music", 55.9], ["techno", 4.51], ["electronic music", 4.5]], null, [["music", 23.41], ["trance music", 15.82], ["hum", 12.08]], [["throbbing", 43.95], ["hum", 30.43], ["music", 13.84]], null, null, [["music", 46.89], ["speech", 16.84], ["throbbing", 4.8]], [["music", 40.84], ["fly, housefly", 5.74], ["hum", 4.27]], null, null, null], "duration": [17.23, 15.33, 2.82, 0.83, 8.83, 15.67, 1.14, 1.11, 5.28, 3.63, 45.32, 0.33, 54.18]} \ No newline at end of file diff --git a/annotations_1/Q3JqdmUTsLI_filtered.json b/annotations_1/Q3JqdmUTsLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca8eb97fe8345ff6da10705fed500149bf814a9b --- /dev/null +++ b/annotations_1/Q3JqdmUTsLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.74], [15.0, 15.99], [18.0, 19.13], [19.0, 23.57], [26.0, 26.32], [29.0, 29.27], [37.0, 38.69], [40.0, 40.78], [46.0, 46.65], [48.0, 49.81], [58.0, 58.89], [60.0, 60.3], [62.0, 66.83], [68.0, 68.13], [69.0, 69.33], [72.0, 71.96], [73.0, 74.41], [75.0, 76.79], [81.0, 83.94], [85.0, 86.73], [100.0, 100.7], [101.0, 106.34], [108.0, 108.77], [110.0, 110.86], [113.0, 121.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 58.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.41, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 0.0, 0.0, 35.58, 0.0, 0.0, 38.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.31], ["fly, housefly", 27.63], ["insect", 11.62]], null, null, [["speech", 28.07], ["music", 22.29], ["didgeridoo", 14.37]]], "duration": [0.74, 0.99, 1.13, 4.57, 0.32, 0.27, 1.69, 0.78, 0.65, 1.81, 0.89, 0.3, 4.83, 0.13, 0.33, -0.04, 1.41, 1.79, 2.94, 1.73, 0.7, 5.34, 0.77, 0.86, 8.44]} \ No newline at end of file diff --git a/annotations_1/Q3n3k6XRQ8s_filtered.json b/annotations_1/Q3n3k6XRQ8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6446b5d64380a55e4244d4d3429f3e167eff58fc --- /dev/null +++ b/annotations_1/Q3n3k6XRQ8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.13], [14.0, 14.01], [17.0, 17.83], [21.0, 32.7], [41.0, 41.0], [42.0, 41.76]], "keep_status": [false, false, false, true, false, false], "silence_prob": [38.16, 0.0, 0.0, 36.81, 0.0, 0.0], "audiomae_on_audioset": [[["music", 73.57], ["musical instrument", 4.5], ["guitar", 3.97]], null, null, [["music", 29.48], ["whack, thwack", 18.2], ["boing", 15.33]], null, null], "duration": [3.13, 0.01, 0.83, 11.7, 0.0, -0.24]} \ No newline at end of file diff --git a/annotations_1/Q49KVa7jotI_filtered.json b/annotations_1/Q49KVa7jotI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e578a5d79b80ebd7bfa2edfe6752a3737a4c026 --- /dev/null +++ b/annotations_1/Q49KVa7jotI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.67], [16.0, 16.71], [28.0, 33.88], [34.0, 35.46], [37.0, 39.11], [43.0, 44.83], [46.0, 50.99], [65.0, 65.42], [67.0, 69.67], [72.0, 72.66], [73.0, 76.45], [77.0, 79.39], [83.0, 85.65], [86.0, 86.34], [90.0, 90.75], [92.0, 98.31], [99.0, 101.06], [101.0, 102.61], [103.0, 106.25], [107.0, 118.84], [119.0, 121.12], [126.0, 127.55], [134.0, 135.04], [136.0, 136.97], [137.0, 140.8], [142.0, 142.3], [143.0, 143.6], [145.0, 145.45], [147.0, 147.07]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [48.52, 0.0, 76.04, 0.0, 92.48, 0.0, 64.52, 0.0, 96.89, 0.0, 84.43, 96.54, 56.78, 0.0, 0.0, 58.72, 80.29, 0.0, 55.81, 46.61, 45.21, 0.0, 0.0, 0.0, 46.4, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 56.42], ["synthesizer", 5.7], ["speech", 5.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.49], ["theremin", 26.51], ["musical instrument", 4.17]], [["music", 17.63], ["musical instrument", 8.58], ["cattle, bovinae", 5.3]], null, null, null, [["music", 24.52], ["mosquito", 8.13], ["didgeridoo", 6.26]], null, null, null, null], "duration": [7.67, 0.71, 5.88, 1.46, 2.11, 1.83, 4.99, 0.42, 2.67, 0.66, 3.45, 2.39, 2.65, 0.34, 0.75, 6.31, 2.06, 1.61, 3.25, 11.84, 2.12, 1.55, 1.04, 0.97, 3.8, 0.3, 0.6, 0.45, 0.07]} \ No newline at end of file diff --git a/annotations_1/Q4KRYWe3ngs_filtered.json b/annotations_1/Q4KRYWe3ngs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9cff22613c4e76b9cb2fd7582265ba0ee15b999 --- /dev/null +++ b/annotations_1/Q4KRYWe3ngs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [8.0, 38.18], [39.0, 40.56], [42.0, 43.65], [49.0, 50.21], [54.0, 54.38], [60.0, 62.01], [66.0, 67.93], [70.0, 72.2], [73.0, 75.57], [78.0, 78.9], [86.0, 86.54], [88.0, 89.46], [92.0, 94.51], [97.0, 97.39], [102.0, 103.59], [107.0, 108.4], [109.0, 110.98], [112.0, 112.46], [115.0, 116.34], [120.0, 120.6], [121.0, 121.71], [125.0, 125.15], [126.0, 126.87], [127.0, 127.41], [129.0, 131.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0, 46.33, 93.29, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.21], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 70.57], ["hiccup", 2.1], ["gasp", 1.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.7, 30.18, 1.56, 1.65, 1.21, 0.38, 2.01, 1.93, 2.2, 2.57, 0.9, 0.54, 1.46, 2.51, 0.39, 1.59, 1.4, 1.98, 0.46, 1.34, 0.6, 0.71, 0.15, 0.87, 0.41, 2.84]} \ No newline at end of file diff --git a/annotations_1/Q4r4jGPegHs_filtered.json b/annotations_1/Q4r4jGPegHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4407694f826159064dc96a6a63bc0683bd63a04a --- /dev/null +++ b/annotations_1/Q4r4jGPegHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.77], [4.0, 10.62], [12.0, 16.66], [17.0, 18.86], [21.0, 24.29], [25.0, 26.99], [28.0, 32.02], [33.0, 34.65], [36.0, 37.47], [38.0, 40.31], [41.0, 43.61], [49.0, 50.4], [51.0, 54.99], [57.0, 56.79], [58.0, 60.62], [62.0, 67.81], [69.0, 79.93], [85.0, 85.63], [86.0, 87.37], [91.0, 92.7], [94.0, 94.85], [96.0, 96.5], [97.0, 101.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 76.7, 68.54, 0.0, 99.36, 0.0, 85.35, 0.0, 0.0, 69.2, 50.46, 0.0, 54.76, 0.0, 50.66, 46.19, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 52.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.13], ["singing bowl", 15.48], ["speech", 9.08]], null, null, null, null, null, null, null], "duration": [0.77, 6.62, 4.66, 1.86, 3.29, 1.99, 4.02, 1.65, 1.47, 2.31, 2.61, 1.4, 3.99, -0.21, 2.62, 5.81, 10.93, 0.63, 1.37, 1.7, 0.85, 0.5, 4.33]} \ No newline at end of file diff --git a/annotations_1/Q54GdrlgRoQ_filtered.json b/annotations_1/Q54GdrlgRoQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a0c010f5f0ce625546241a88f0a50455b996852 --- /dev/null +++ b/annotations_1/Q54GdrlgRoQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.7], [1.0, 3.5], [8.0, 11.11], [14.0, 15.48], [17.0, 19.53], [25.0, 26.28], [29.0, 35.46], [39.0, 40.27], [45.0, 45.54], [46.0, 48.61], [49.0, 49.57], [52.0, 98.27], [106.0, 105.66], [106.0, 106.51], [114.0, 114.79], [117.0, 127.18], [127.0, 127.26], [128.0, 128.41], [129.0, 129.27], [135.0, 146.62], [147.0, 147.99], [148.0, 148.69], [151.0, 151.56], [155.0, 156.24], [159.0, 159.39], [161.0, 162.89]], "keep_status": [false, true, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 30.93, 31.37, 0.0, 32.32, 0.0, 31.28, 0.0, 0.0, 33.54, 0.0, 0.0, 0.0, 0.0, 0.0, 28.56, 0.0, 0.0, 0.0, 29.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 24.42], ["mains hum", 15.21], ["throbbing", 5.16]], [["vehicle", 19.86], ["speech", 8.67], ["buzz", 6.55]], null, [["hum", 18.33], ["throbbing", 10.5], ["fly, housefly", 6.62]], null, [["fly, housefly", 32.33], ["insect", 27.34], ["bee, wasp, etc.", 12.28]], null, null, [["mains hum", 15.36], ["hum", 12.95], ["speech", 12.61]], null, null, null, null, null, [["music", 46.71], ["throbbing", 17.55], ["speech", 13.04]], null, null, null, [["music", 20.59], ["throbbing", 18.56], ["hum", 18.35]], null, null, null, null, null, null], "duration": [-0.3, 2.5, 3.11, 1.48, 2.53, 1.28, 6.46, 1.27, 0.54, 2.61, 0.57, 46.27, -0.34, 0.51, 0.79, 10.18, 0.26, 0.41, 0.27, 11.62, 0.99, 0.69, 0.56, 1.24, 0.39, 1.89]} \ No newline at end of file diff --git a/annotations_1/Q6jbNsSNxf4_filtered.json b/annotations_1/Q6jbNsSNxf4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a03dd7dec860550ba01a7d04a29b6d3b5673158 --- /dev/null +++ b/annotations_1/Q6jbNsSNxf4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 67.66], [68.0, 132.02], [134.0, 146.72]], "keep_status": [false, false, false], "silence_prob": [29.56, 0.0, 31.91], "audiomae_on_audioset": [[["music", 61.02], ["didgeridoo", 8.11], ["hum", 4.67]], null, [["speech", 30.91], ["hum", 30.5], ["sidetone", 12.63]]], "duration": [7.66, 64.02, 12.72]} \ No newline at end of file diff --git a/annotations_1/Q7--4JW6y6E_filtered.json b/annotations_1/Q7--4JW6y6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4923404192f2a858178d2cbac823dccae55ad4cd --- /dev/null +++ b/annotations_1/Q7--4JW6y6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.31], [6.0, 6.02], [7.0, 20.22], [22.0, 86.75], [87.0, 90.26], [96.0, 96.77], [98.0, 102.22], [104.0, 107.86], [110.0, 112.5], [115.0, 116.78], [119.0, 132.92]], "keep_status": [false, false, true, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 29.09, 0.0, 33.46, 0.0, 31.21, 28.04, 28.4, 0.0, 34.55], "audiomae_on_audioset": [null, null, [["sonar", 40.94], ["rumble", 8.34], ["music", 7.9]], null, [["music", 40.1], ["hum", 15.78], ["mains hum", 14.37]], null, [["mains hum", 23.76], ["hum", 17.75], ["music", 15.06]], [["music", 66.38], ["synthesizer", 4.81], ["effects unit", 4.25]], [["vehicle", 26.3], ["car", 4.74], ["music", 4.11]], null, [["music", 56.97], ["hum", 7.34], ["electronic music", 7.08]]], "duration": [1.31, 0.02, 13.22, 64.75, 3.26, 0.77, 4.22, 3.86, 2.5, 1.78, 13.92]} \ No newline at end of file diff --git a/annotations_1/Q7r3HIkBJcg_filtered.json b/annotations_1/Q7r3HIkBJcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b626587401361d85af0663152922841a11d9417 --- /dev/null +++ b/annotations_1/Q7r3HIkBJcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.2], [17.0, 18.89], [21.0, 21.05], [21.0, 21.17], [24.0, 25.3], [27.0, 28.41], [29.0, 32.59], [42.0, 44.02], [48.0, 48.73], [55.0, 55.16], [58.0, 59.71], [63.0, 63.76], [70.0, 71.71], [73.0, 74.29], [75.0, 77.6], [79.0, 80.37], [82.0, 82.58], [88.0, 88.28], [91.0, 95.42], [105.0, 106.81], [111.0, 111.48], [115.0, 117.68], [123.0, 131.3], [133.0, 152.91], [154.0, 155.95], [160.0, 162.09], [169.0, 169.15], [182.0, 182.36], [197.0, 198.88]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.2, 89.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.1, 0.0, 0.0, 0.0, 77.36, 0.0, 0.0, 31.98, 35.31, 32.61, 0.0, 33.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 27.77], ["music", 17.7], ["fart", 4.89]], null, null, null, null, null, null, null, [["speech", 43.49], ["music", 29.54], ["breaking", 5.55]], null, null, null, null, null, null, [["groan", 32.39], ["sound effect", 11.92], ["music", 6.09]], [["throbbing", 24.23], ["music", 23.95], ["hum", 9.69]], [["music", 44.55], ["fart", 5.18], ["speech", 4.99]], null, [["moo", 31.6], ["cattle, bovinae", 26.54], ["livestock, farm animals, working animals", 23.48]], null, null, null], "duration": [0.2, 1.89, 0.05, 0.17, 1.3, 1.41, 3.59, 2.02, 0.73, 0.16, 1.71, 0.76, 1.71, 1.29, 2.6, 1.37, 0.58, 0.28, 4.42, 1.81, 0.48, 2.68, 8.3, 19.91, 1.95, 2.09, 0.15, 0.36, 1.88]} \ No newline at end of file diff --git a/annotations_1/Q85twbu-Vvk_filtered.json b/annotations_1/Q85twbu-Vvk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d0978d4f7a2c1dfa8dedb8a85d61719523fecbc --- /dev/null +++ b/annotations_1/Q85twbu-Vvk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 40.83], [47.0, 48.52], [53.0, 54.03], [55.0, 56.44], [58.0, 60.88], [62.0, 66.7], [77.0, 82.22], [85.0, 84.67], [87.0, 90.26], [92.0, 96.5], [102.0, 102.9], [113.0, 114.1], [117.0, 117.44], [126.0, 126.3], [128.0, 143.94], [145.0, 150.15], [151.0, 156.81]], "keep_status": [true, false, false, false, false, true, true, false, false, false, false, false, false, false, true, true, false], "silence_prob": [31.8, 0.0, 0.0, 0.0, 62.89, 35.0, 31.54, 0.0, 37.1, 31.69, 0.0, 0.0, 0.0, 0.0, 30.36, 46.02, 33.97], "audiomae_on_audioset": [[["music", 26.05], ["gong", 15.74], ["theremin", 7.89]], null, null, null, null, [["speech", 33.08], ["whale vocalization", 15.14], ["hum", 4.61]], [["speech", 49.58], ["music", 9.46], ["cattle, bovinae", 6.56]], null, [["livestock, farm animals, working animals", 31.18], ["moo", 25.8], ["cattle, bovinae", 16.28]], [["music", 44.43], ["speech", 14.18], ["electronic music", 13.8]], null, null, null, null, [["speech", 22.44], ["throbbing", 17.0], ["music", 15.28]], [["music", 30.62], ["mains hum", 19.66], ["hum", 17.02]], [["music", 58.88], ["ambient music", 23.77], ["electronic music", 3.86]]], "duration": [14.83, 1.52, 1.03, 1.44, 2.88, 4.7, 5.22, -0.33, 3.26, 4.5, 0.9, 1.1, 0.44, 0.3, 15.94, 5.15, 5.81]} \ No newline at end of file diff --git a/annotations_1/Q9Vl1VGj0LE_filtered.json b/annotations_1/Q9Vl1VGj0LE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9753ba4a4db57c78b47a0371409461d065f7e54d --- /dev/null +++ b/annotations_1/Q9Vl1VGj0LE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.22], [19.0, 21.1], [24.0, 25.08], [27.0, 33.25], [39.0, 39.12], [40.0, 40.86], [43.0, 46.47], [48.0, 49.0], [50.0, 53.13], [56.0, 59.41], [61.0, 69.72], [71.0, 71.81], [73.0, 73.63], [90.0, 123.11], [126.0, 126.33], [129.0, 131.03], [131.0, 132.06], [138.0, 138.1], [141.0, 141.44], [144.0, 144.8], [146.0, 146.97], [148.0, 148.98], [150.0, 152.81], [154.0, 155.04], [156.0, 157.67], [159.0, 160.95], [167.0, 168.37], [172.0, 180.01]], "keep_status": [false, true, false, true, false, false, true, false, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.11, 0.0, 39.75, 0.0, 0.0, 40.19, 0.0, 40.92, 34.93, 35.68, 0.0, 0.0, 0.0, 0.0, 38.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 0.0, 0.0, 83.16], "audiomae_on_audioset": [null, [["whale vocalization", 37.28], ["hum", 9.49], ["sine wave", 7.75]], null, [["hum", 31.09], ["rumble", 24.63], ["mains hum", 9.96]], null, null, [["whale vocalization", 22.87], ["hum", 21.06], ["sine wave", 13.51]], null, [["hum", 26.99], ["chirp tone", 20.62], ["sine wave", 16.93]], [["sidetone", 36.61], ["speech", 19.95], ["whale vocalization", 12.0]], [["hum", 45.04], ["throbbing", 21.42], ["mains hum", 14.32]], null, null, null, null, [["speech", 33.17], ["sidetone", 29.83], ["creak", 3.25]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.22, 2.1, 1.08, 6.25, 0.12, 0.86, 3.47, 1.0, 3.13, 3.41, 8.72, 0.81, 0.63, 33.11, 0.33, 2.03, 1.06, 0.1, 0.44, 0.8, 0.97, 0.98, 2.81, 1.04, 1.67, 1.95, 1.37, 8.01]} \ No newline at end of file diff --git a/annotations_1/QAO6uTkGpjM_filtered.json b/annotations_1/QAO6uTkGpjM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa8155810028fd987cd0f0af6a9498bfa10356a0 --- /dev/null +++ b/annotations_1/QAO6uTkGpjM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.16], [5.0, 10.79], [13.0, 14.23], [15.0, 16.78], [18.0, 19.28], [21.0, 24.22], [26.0, 26.06], [33.0, 35.29], [39.0, 38.96], [46.0, 46.35], [51.0, 51.68], [55.0, 55.73], [60.0, 60.45], [61.0, 61.79], [65.0, 89.87], [91.0, 105.53], [106.0, 108.6], [109.0, 112.02], [113.0, 113.93], [115.0, 139.92], [144.0, 158.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 52.98, 0.0, 0.0, 0.0, 92.64, 0.0, 61.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.05, 33.72, 47.2, 85.54, 0.0, 30.65, 33.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.69], ["hum", 8.17], ["throbbing", 7.87]], [["speech", 26.43], ["gong", 20.78], ["music", 5.63]], [["music", 17.25], ["hum", 12.39], ["throbbing", 9.1]], null, null, [["hum", 24.76], ["mains hum", 22.2], ["music", 12.19]], [["music", 48.36], ["speech", 19.42], ["didgeridoo", 4.54]]], "duration": [0.16, 5.79, 1.23, 1.78, 1.28, 3.22, 0.06, 2.29, -0.04, 0.35, 0.68, 0.73, 0.45, 0.79, 24.87, 14.53, 2.6, 3.02, 0.93, 24.92, 14.26]} \ No newline at end of file diff --git a/annotations_1/QAiVcQifKfE_filtered.json b/annotations_1/QAiVcQifKfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5047899d3b95d9f209dba714ff8618d47ca8573 --- /dev/null +++ b/annotations_1/QAiVcQifKfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.49], [16.0, 16.24], [17.0, 20.06], [22.0, 29.81], [30.0, 30.86], [32.0, 34.01], [35.0, 38.35], [39.0, 40.74], [41.0, 48.03], [48.0, 51.49], [52.0, 65.03], [66.0, 70.06], [72.0, 76.82], [78.0, 80.37], [82.0, 83.49], [92.0, 96.48], [99.0, 98.95], [99.0, 99.37], [106.0, 106.59], [110.0, 110.67], [113.0, 114.71], [116.0, 117.71], [118.0, 120.34], [122.0, 125.12], [127.0, 129.57], [132.0, 138.33], [139.0, 139.16], [147.0, 149.84], [151.0, 153.0]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 86.09, 63.64, 0.0, 77.7, 77.7, 0.0, 46.79, 65.44, 67.38, 86.09, 87.55, 54.36, 0.0, 63.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.44, 60.89, 44.93, 44.78, 0.0, 68.54, 80.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 38.77], ["sidetone", 11.72], ["telephone", 7.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 77.33], ["sidetone", 3.21], ["boing", 2.73]], null, [["sidetone", 52.23], ["speech", 10.23], ["radio", 7.96]], [["sidetone", 94.9], ["speech", 3.16], ["hum", 0.34]], null, null, null], "duration": [1.49, 0.24, 3.06, 7.81, 0.86, 2.01, 3.35, 1.74, 7.03, 3.49, 13.03, 4.06, 4.82, 2.37, 1.49, 4.48, -0.05, 0.37, 0.59, 0.67, 1.71, 1.71, 2.34, 3.12, 2.57, 6.33, 0.16, 2.84, 2.0]} \ No newline at end of file diff --git a/annotations_1/QB9AY9Em4To_filtered.json b/annotations_1/QB9AY9Em4To_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88f597e4760ca9eea809edf1d2f06962601970b7 --- /dev/null +++ b/annotations_1/QB9AY9Em4To_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 59.31], [62.0, 80.43], [82.0, 106.29], [107.0, 139.8], [140.0, 140.64], [141.0, 142.03], [143.0, 143.63], [144.0, 144.36], [146.0, 149.55], [151.0, 153.67], [155.0, 198.34], [201.0, 202.83], [205.0, 206.24], [208.0, 215.81], [217.0, 218.03], [219.0, 222.74]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.94, 31.39, 0.0, 0.0, 0.0, 0.0, 0.0, 35.48, 32.97, 0.0, 0.0, 0.0, 38.19, 0.0, 36.84], "audiomae_on_audioset": [null, [["music", 77.79], ["throbbing", 5.03], ["ambient music", 2.3]], [["throbbing", 45.54], ["hum", 38.29], ["music", 7.72]], null, null, null, null, null, [["speech", 21.59], ["music", 21.32], ["throbbing", 18.22]], [["music", 70.89], ["timpani", 8.65], ["musical instrument", 3.49]], null, null, null, [["music", 61.89], ["throbbing", 11.51], ["hum", 10.42]], null, [["music", 82.32], ["throbbing", 3.54], ["synthesizer", 3.4]]], "duration": [44.31, 18.43, 24.29, 32.8, 0.64, 1.03, 0.63, 0.36, 3.55, 2.67, 43.34, 1.83, 1.24, 7.81, 1.03, 3.74]} \ No newline at end of file diff --git a/annotations_1/QBUTO2RVjXU_filtered.json b/annotations_1/QBUTO2RVjXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd3df78ada93c528e69a91d487260edbccb83fde --- /dev/null +++ b/annotations_1/QBUTO2RVjXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.23], [19.0, 21.93], [23.0, 24.48], [28.0, 30.11], [31.0, 30.96], [32.0, 38.91], [41.0, 46.52], [48.0, 52.0], [56.0, 68.76]], "keep_status": [true, true, false, true, false, false, true, true, true], "silence_prob": [44.87, 43.74, 0.0, 42.26, 0.0, 35.14, 44.52, 45.36, 42.62], "audiomae_on_audioset": [[["noise", 27.82], ["mains hum", 23.68], ["hum", 14.78]], [["sonar", 32.86], ["sidetone", 10.74], ["throbbing", 10.72]], null, [["croak", 19.89], ["frog", 11.36], ["hum", 9.37]], null, [["hum", 38.4], ["mains hum", 23.11], ["speech", 17.78]], [["hum", 25.28], ["music", 9.64], ["rumble", 8.57]], [["whale vocalization", 23.42], ["rumble", 20.78], ["hum", 19.35]], [["rumble", 22.78], ["frog", 16.88], ["speech", 12.03]]], "duration": [8.23, 2.93, 1.48, 2.11, -0.04, 6.91, 5.52, 4.0, 12.76]} \ No newline at end of file diff --git a/annotations_1/QC0kTcAlf64_filtered.json b/annotations_1/QC0kTcAlf64_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0889d4d36855a6d86038eb0c6b8accbbc73efdf4 --- /dev/null +++ b/annotations_1/QC0kTcAlf64_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.92], [22.0, 22.23], [29.0, 29.57], [53.0, 54.68], [58.0, 61.13], [63.0, 66.97], [74.0, 74.68], [79.0, 79.95], [84.0, 84.33], [85.0, 85.56], [92.0, 92.1], [96.0, 99.08], [105.0, 105.49], [111.0, 112.5], [135.0, 135.24], [139.0, 142.79], [152.0, 152.56], [168.0, 170.23], [170.0, 171.58], [177.0, 179.47]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.15, 28.55, 0.0, 0.0, 0.0, 0.0, 0.0, 29.65, 0.0, 0.0, 0.0, 29.12, 0.0, 30.87, 0.0, 28.68], "audiomae_on_audioset": [null, null, null, null, [["hum", 27.89], ["speech", 21.23], ["mains hum", 21.11]], [["music", 23.01], ["speech", 18.41], ["didgeridoo", 12.14]], null, null, null, null, null, [["fly, housefly", 16.98], ["mosquito", 16.77], ["moo", 15.88]], null, null, null, [["livestock, farm animals, working animals", 36.79], ["moo", 34.53], ["cattle, bovinae", 25.94]], null, [["speech", 15.45], ["crying, sobbing", 6.59], ["hoot", 6.0]], null, [["music", 32.84], ["buzz", 5.22], ["explosion", 4.41]]], "duration": [0.92, 0.23, 0.57, 1.68, 3.13, 3.97, 0.68, 0.95, 0.33, 0.56, 0.1, 3.08, 0.49, 1.5, 0.24, 3.79, 0.56, 2.23, 1.58, 2.47]} \ No newline at end of file diff --git a/annotations_1/QC5re6k5nLk_filtered.json b/annotations_1/QC5re6k5nLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a34fef4a556a98bd267424b9ca882030ea65e608 --- /dev/null +++ b/annotations_1/QC5re6k5nLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 36.48], [46.0, 47.58], [48.0, 50.23], [51.0, 52.56], [54.0, 56.25]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.1, 0.0, 54.83], "audiomae_on_audioset": [null, null, null, null, null], "duration": [1.48, 1.58, 2.23, 1.56, 2.25]} \ No newline at end of file diff --git a/annotations_1/QCsjm6QI4WM_filtered.json b/annotations_1/QCsjm6QI4WM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e15ccf603efaaf319f53ee9dcb14b79d5d3272d7 --- /dev/null +++ b/annotations_1/QCsjm6QI4WM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.68], [6.0, 5.93], [6.0, 7.94], [20.0, 21.22], [22.0, 22.98], [26.0, 26.65], [33.0, 34.05], [35.0, 35.46], [38.0, 38.82], [41.0, 42.35], [43.0, 43.51], [44.0, 43.55], [45.0, 45.42], [47.0, 47.68], [49.0, 50.08], [51.0, 52.07], [57.0, 58.7], [60.0, 60.3], [61.0, 61.79], [65.0, 65.28], [66.0, 68.39], [71.0, 72.67], [76.0, 76.3], [87.0, 94.83], [99.0, 99.54], [110.0, 110.39], [111.0, 111.97], [113.0, 114.07], [127.0, 131.92], [133.0, 140.22], [144.0, 143.65], [145.0, 145.44], [147.0, 148.19], [149.0, 153.64], [154.0, 154.45], [155.0, 157.22], [170.0, 169.75], [171.0, 171.36], [174.0, 174.46], [175.0, 175.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.18, 0.0, 0.0, 69.88, 0.0, 0.0, 0.0, 0.0, 44.66, 46.26, 0.0, 0.0, 0.0, 38.76, 0.0, 36.66, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 75.25], ["music", 14.39], ["musical instrument", 1.97]], null, null, null, null, null, null, null, [["door", 20.91], ["music", 10.59], ["effects unit", 8.32]], [["wood", 16.02], ["crushing", 14.37], ["speech", 12.33]], null, null, null, [["speech", 74.0], ["bouncing", 5.18], ["fart", 4.32]], null, [["music", 27.57], ["speech", 27.37], ["mosquito", 4.29]], null, null, null, null], "duration": [1.68, -0.07, 1.94, 1.22, 0.98, 0.65, 1.05, 0.46, 0.82, 1.35, 0.51, -0.45, 0.42, 0.68, 1.08, 1.07, 1.7, 0.3, 0.79, 0.28, 2.39, 1.67, 0.3, 7.83, 0.54, 0.39, 0.97, 1.07, 4.92, 7.22, -0.35, 0.44, 1.19, 4.64, 0.45, 2.22, -0.25, 0.36, 0.46, 0.07]} \ No newline at end of file diff --git a/annotations_1/QDARBy0jCgs_filtered.json b/annotations_1/QDARBy0jCgs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c50f058b525b621b8b80ff149484b29d3fe6e02 --- /dev/null +++ b/annotations_1/QDARBy0jCgs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.46], [18.0, 18.01], [19.0, 22.28], [36.0, 36.44], [39.0, 39.28], [48.0, 85.68], [86.0, 90.49], [91.0, 91.59], [92.0, 94.93], [98.0, 98.79], [101.0, 101.12], [102.0, 103.03], [103.0, 105.51], [107.0, 108.04], [111.0, 112.46], [122.0, 124.63], [126.0, 126.32], [129.0, 130.27], [138.0, 139.09], [149.0, 148.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 43.18, 0.0, 0.0, 0.0, 40.11, 0.0, 99.26, 0.0, 0.0, 0.0, 53.16, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 76.26], ["boing", 3.01], ["sidetone", 1.86]], null, null, null, [["speech", 62.42], ["dishes, pots, and pans", 6.44], ["cutlery, silverware", 5.87]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 0.01, 3.28, 0.44, 0.28, 37.68, 4.49, 0.59, 2.93, 0.79, 0.12, 1.03, 2.51, 1.04, 1.46, 2.63, 0.32, 1.27, 1.09, -0.07]} \ No newline at end of file diff --git a/annotations_1/QDroSLQiSRI_filtered.json b/annotations_1/QDroSLQiSRI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ee9939f1853d65958693ae4593d6755e616d6bb --- /dev/null +++ b/annotations_1/QDroSLQiSRI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.55], [10.0, 13.74], [17.0, 18.08], [18.0, 21.54], [22.0, 23.11], [23.0, 29.74], [30.0, 35.18], [35.0, 38.96], [46.0, 46.6], [47.0, 49.35], [50.0, 52.76], [54.0, 55.21], [56.0, 65.52], [66.0, 73.18], [74.0, 74.24], [75.0, 75.15], [76.0, 80.32], [82.0, 84.74], [86.0, 87.03], [87.0, 88.91], [90.0, 95.49], [99.0, 103.74], [106.0, 108.21], [109.0, 118.71], [121.0, 126.49], [129.0, 131.13]], "keep_status": [false, true, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.89, 0.0, 33.48, 0.0, 48.82, 58.38, 34.32, 0.0, 33.59, 33.52, 0.0, 58.22, 97.73, 0.0, 0.0, 89.36, 100.0, 0.0, 0.0, 98.73, 100.0, 99.98, 97.33, 98.73, 100.0], "audiomae_on_audioset": [null, [["speech", 36.41], ["music", 24.85], ["hum", 5.67]], null, [["music", 14.29], ["hum", 14.05], ["speech", 13.42]], null, [["telephone", 72.76], ["speech", 8.97], ["telephone dialing, dtmf", 8.34]], null, [["music", 26.06], ["throbbing", 25.49], ["tuning fork", 13.42]], null, [["throbbing", 36.1], ["hum", 19.62], ["music", 14.75]], [["speech", 20.12], ["didgeridoo", 15.47], ["music", 15.22]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 3.74, 1.08, 3.54, 1.11, 6.74, 5.18, 3.96, 0.6, 2.35, 2.76, 1.21, 9.52, 7.18, 0.24, 0.15, 4.32, 2.74, 1.03, 1.91, 5.49, 4.74, 2.21, 9.71, 5.49, 2.13]} \ No newline at end of file diff --git a/annotations_1/QEfuINMgcnI_filtered.json b/annotations_1/QEfuINMgcnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..510f992a00213d71ce354e11c67b0e278cb7b7e1 --- /dev/null +++ b/annotations_1/QEfuINMgcnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.12], [15.0, 15.74], [17.0, 17.68], [19.0, 22.03], [23.0, 23.58], [24.0, 23.72], [24.0, 23.77], [25.0, 29.15], [31.0, 31.36], [33.0, 34.74], [36.0, 47.71], [48.0, 49.33], [50.0, 54.85], [56.0, 56.54], [58.0, 70.97], [73.0, 73.89], [75.0, 77.43], [79.0, 78.83], [80.0, 86.56], [87.0, 87.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 46.19, 0.0, 0.0, 0.0, 46.97, 0.0, 0.0, 42.17, 0.0, 37.96, 0.0, 33.0, 0.0, 50.56, 0.0, 30.54, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 41.54], ["didgeridoo", 40.42], ["musical instrument", 1.78]], null, null, null, [["music", 63.74], ["throbbing", 14.97], ["hum", 5.21]], null, null, [["throbbing", 32.03], ["music", 27.26], ["hum", 24.95]], null, [["music", 68.62], ["throbbing", 4.16], ["techno", 1.73]], null, [["music", 51.46], ["throbbing", 14.26], ["speech", 11.57]], null, null, null, [["speech", 51.0], ["hum", 7.71], ["music", 5.47]], null], "duration": [0.12, 0.74, 0.68, 3.03, 0.58, -0.28, -0.23, 4.15, 0.36, 1.74, 11.71, 1.33, 4.85, 0.54, 12.97, 0.89, 2.43, -0.17, 6.56, 0.59]} \ No newline at end of file diff --git a/annotations_1/QEv3zzKyiFQ_filtered.json b/annotations_1/QEv3zzKyiFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..652bfe7dcf7433e3524b5726d4b8bc800e763b7a --- /dev/null +++ b/annotations_1/QEv3zzKyiFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 87.44], [89.0, 93.39], [95.0, 102.19], [105.0, 105.66]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 37.25, 36.11, 0.0], "audiomae_on_audioset": [null, [["hum", 44.76], ["mains hum", 28.24], ["eruption", 5.48]], [["hum", 54.07], ["mains hum", 31.89], ["music", 4.01]], null], "duration": [30.44, 4.39, 7.19, 0.66]} \ No newline at end of file diff --git a/annotations_1/QFDZTfWnWGg_filtered.json b/annotations_1/QFDZTfWnWGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d72736ac1a4718b3dc162142674a359f8957fe1b --- /dev/null +++ b/annotations_1/QFDZTfWnWGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 49.72], [51.0, 53.15], [54.0, 172.44], [174.0, 185.11]], "keep_status": [false, false, false, false], "silence_prob": [86.82, 99.88, 0.0, 94.07], "audiomae_on_audioset": [null, null, null, null], "duration": [6.72, 2.15, 118.44, 11.11]} \ No newline at end of file diff --git a/annotations_1/QH2Z3rBA9C4_filtered.json b/annotations_1/QH2Z3rBA9C4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fb4810cf87ea197bc7109009b74278d69798f6a --- /dev/null +++ b/annotations_1/QH2Z3rBA9C4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 30.75], [32.0, 32.49], [34.0, 59.64], [61.0, 83.84], [85.0, 92.94], [94.0, 103.99], [109.0, 131.03]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [29.47, 0.0, 29.37, 29.37, 29.67, 29.61, 29.44], "audiomae_on_audioset": [[["music", 74.01], ["didgeridoo", 6.16], ["rock and roll", 2.51]], null, [["music", 85.18], ["didgeridoo", 6.42], ["musical instrument", 1.37]], [["music", 68.75], ["speech", 5.21], ["electronic music", 3.48]], [["music", 73.84], ["speech", 6.61], ["static", 1.14]], [["music", 52.13], ["speech", 11.17], ["throbbing", 7.97]], [["music", 30.45], ["speech", 19.59], ["didgeridoo", 8.23]]], "duration": [6.75, 0.49, 25.64, 22.84, 7.94, 9.99, 22.03]} \ No newline at end of file diff --git a/annotations_1/QHU65AAx6uk_filtered.json b/annotations_1/QHU65AAx6uk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53bab0bd303db2b2138712e40f6bd1967eb96921 --- /dev/null +++ b/annotations_1/QHU65AAx6uk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 33.05], [35.0, 37.61], [38.0, 38.64], [39.0, 42.4], [44.0, 44.22], [48.0, 48.2], [56.0, 57.91], [62.0, 61.96], [64.0, 74.16], [75.0, 83.07], [84.0, 83.91], [85.0, 151.88], [156.0, 168.27]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 95.78, 0.0, 99.1, 0.0, 0.0, 0.0, 0.0, 34.0, 32.11, 0.0, 0.0, 29.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 48.23], ["piano", 8.68], ["electric piano", 7.52]], [["music", 46.04], ["speech", 20.51], ["musical instrument", 8.87]], null, null, [["music", 61.56], ["musical instrument", 3.8], ["maraca", 2.5]]], "duration": [1.05, 2.61, 0.64, 3.4, 0.22, 0.2, 1.91, -0.04, 10.16, 8.07, -0.09, 66.88, 12.27]} \ No newline at end of file diff --git a/annotations_1/QIIE8CobvEU_filtered.json b/annotations_1/QIIE8CobvEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f778d04bb96dcc3804a490981aefd265dd2faa32 --- /dev/null +++ b/annotations_1/QIIE8CobvEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[86.0, 86.29], [87.0, 93.21], [95.0, 102.96], [107.0, 107.06], [108.0, 135.24], [137.0, 138.21], [139.0, 147.45], [150.0, 163.54]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 64.29, 58.98, 0.0, 48.91, 0.0, 38.28, 51.02], "audiomae_on_audioset": [null, null, null, null, [["hum", 34.48], ["mains hum", 25.57], ["music", 23.51]], null, [["mains hum", 37.71], ["hum", 30.28], ["music", 6.98]], null], "duration": [0.29, 6.21, 7.96, 0.06, 27.24, 1.21, 8.45, 13.54]} \ No newline at end of file diff --git a/annotations_1/QJX3XvkTJQk_filtered.json b/annotations_1/QJX3XvkTJQk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d30a0522b85a138ce31dd63c3001c6846d61cfc --- /dev/null +++ b/annotations_1/QJX3XvkTJQk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 30.32], [32.0, 36.14], [37.0, 37.61], [38.0, 39.38], [40.0, 40.29], [41.0, 41.5], [46.0, 47.31], [48.0, 49.47], [51.0, 51.7], [52.0, 53.13], [54.0, 55.7], [74.0, 74.31], [75.0, 75.52], [78.0, 79.76], [81.0, 82.29], [86.0, 86.73], [90.0, 90.26], [93.0, 93.09], [95.0, 99.05], [101.0, 102.07], [104.0, 104.21], [107.0, 106.95], [110.0, 111.47], [113.0, 113.85], [118.0, 121.36], [122.0, 123.53], [124.0, 126.35], [132.0, 133.29], [134.0, 135.3], [137.0, 137.47], [140.0, 142.91], [144.0, 147.36], [150.0, 151.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.19, 52.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.31, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 0.0, 66.51, 0.0, 0.0, 0.0, 73.82, 78.38, 0.0], "audiomae_on_audioset": [[["hum", 28.57], ["music", 27.8], ["mains hum", 15.08]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [16.32, 4.14, 0.61, 1.38, 0.29, 0.5, 1.31, 1.47, 0.7, 1.13, 1.7, 0.31, 0.52, 1.76, 1.29, 0.73, 0.26, 0.09, 4.05, 1.07, 0.21, -0.05, 1.47, 0.85, 3.36, 1.53, 2.35, 1.29, 1.3, 0.47, 2.91, 3.36, 1.68]} \ No newline at end of file diff --git a/annotations_1/QKbA0PxeoaM_filtered.json b/annotations_1/QKbA0PxeoaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7dc251932e8df89568d6d0d4aaffece9095436b5 --- /dev/null +++ b/annotations_1/QKbA0PxeoaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 33.74], [35.0, 59.48], [60.0, 62.72], [67.0, 69.03], [73.0, 75.41]], "keep_status": [false, false, false, false, false], "silence_prob": [80.29, 94.22, 92.8, 91.13, 99.92], "audiomae_on_audioset": [null, null, null, null, null], "duration": [19.74, 24.48, 2.72, 2.03, 2.41]} \ No newline at end of file diff --git a/annotations_1/QLTlJDjPfHI_filtered.json b/annotations_1/QLTlJDjPfHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48bb10f05fd66d4b3f26d73c43c913571a5f1c4a --- /dev/null +++ b/annotations_1/QLTlJDjPfHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 25.93], [28.0, 42.85], [48.0, 48.41], [58.0, 58.29], [64.0, 65.15], [67.0, 109.97], [110.0, 136.29], [140.0, 140.02], [147.0, 147.46], [149.0, 150.15], [151.0, 152.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [28.54, 28.27, 0.0, 0.0, 0.0, 0.0, 28.23, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 89.56], ["electronic music", 1.68], ["throbbing", 1.67]], [["music", 65.34], ["speech", 6.43], ["throbbing", 2.05]], null, null, null, null, [["hum", 40.05], ["mains hum", 20.49], ["throbbing", 15.32]], null, null, null, null], "duration": [22.93, 14.85, 0.41, 0.29, 1.15, 42.97, 26.29, 0.02, 0.46, 1.15, 1.71]} \ No newline at end of file diff --git a/annotations_1/QLkt-SfsCsQ_filtered.json b/annotations_1/QLkt-SfsCsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94f15c4d44c6e33c33c1029669845bce327238e9 --- /dev/null +++ b/annotations_1/QLkt-SfsCsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.41], [6.0, 7.03], [9.0, 11.52], [13.0, 16.82], [17.0, 18.47], [19.0, 23.67], [25.0, 28.78], [29.0, 29.86], [32.0, 33.05], [34.0, 41.76], [43.0, 46.35], [50.0, 66.01], [69.0, 69.82], [71.0, 71.61], [73.0, 75.66], [77.0, 80.33], [82.0, 82.61], [83.0, 86.16], [87.0, 87.64], [89.0, 89.67], [90.0, 97.98], [99.0, 99.47], [100.0, 100.25], [102.0, 103.22], [108.0, 109.46], [110.0, 111.21], [112.0, 115.28], [116.0, 120.75], [123.0, 126.94], [128.0, 130.13], [131.0, 132.63], [133.0, 135.03], [136.0, 145.47], [146.0, 147.77], [149.0, 151.06], [156.0, 158.06], [159.0, 163.46], [166.0, 166.56], [167.0, 172.81], [177.0, 178.92], [180.0, 180.89], [182.0, 183.73], [185.0, 185.85], [187.0, 188.15], [189.0, 189.3], [190.0, 190.78], [192.0, 192.37], [193.0, 198.32], [201.0, 202.09]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 95.64, 95.78, 0.0, 58.72, 45.05, 0.0, 0.0, 94.66, 96.89, 94.81, 0.0, 0.0, 91.81, 97.43, 0.0, 62.17, 0.0, 0.0, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 98.51, 95.91, 91.64, 0.0, 79.07, 90.95, 0.0, 78.38, 88.1, 84.43, 0.0, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 31.09], ["music", 14.06], ["didgeridoo", 10.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.41, 1.03, 2.52, 3.82, 1.47, 4.67, 3.78, 0.86, 1.05, 7.76, 3.35, 16.01, 0.82, 0.61, 2.66, 3.33, 0.61, 3.16, 0.64, 0.67, 7.98, 0.47, 0.25, 1.22, 1.46, 1.21, 3.28, 4.75, 3.94, 2.13, 1.63, 2.03, 9.47, 1.77, 2.06, 2.06, 4.46, 0.56, 5.81, 1.92, 0.89, 1.73, 0.85, 1.15, 0.3, 0.78, 0.37, 5.32, 1.09]} \ No newline at end of file diff --git a/annotations_1/QM8StMC7V6Y_filtered.json b/annotations_1/QM8StMC7V6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2312e5e379491bae4da4e8e09cb6a1e01eb3512d --- /dev/null +++ b/annotations_1/QM8StMC7V6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.29], [7.0, 9.56], [15.0, 16.7], [19.0, 24.14]], "keep_status": [false, false, false, false], "silence_prob": [59.96, 42.04, 0.0, 61.27], "audiomae_on_audioset": [null, [["speech", 82.46], ["sidetone", 5.11], ["arrow", 1.14]], null, null], "duration": [5.29, 2.56, 1.7, 5.14]} \ No newline at end of file diff --git a/annotations_1/QMBLWE0pu8U_filtered.json b/annotations_1/QMBLWE0pu8U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ca87161e59aceef28d8196a2b4b5740d47910d4 --- /dev/null +++ b/annotations_1/QMBLWE0pu8U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 105.95], [108.0, 113.16], [115.0, 118.34], [119.0, 136.48], [138.0, 147.53], [149.0, 149.77], [151.0, 151.58], [152.0, 153.32], [154.0, 154.47], [157.0, 164.4], [165.0, 165.5], [167.0, 168.54], [169.0, 168.98], [169.0, 169.62]], "keep_status": [false, true, true, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 44.34, 32.5, 31.03, 31.62, 0.0, 0.0, 0.0, 0.0, 28.52, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 33.3], ["theremin", 11.66], ["hum", 11.0]], [["music", 32.87], ["mains hum", 7.3], ["musical instrument", 6.03]], [["music", 24.19], ["mains hum", 10.77], ["hum", 9.62]], [["buzz", 43.04], ["speech", 22.27], ["music", 8.66]], null, null, null, null, [["music", 30.02], ["reverberation", 7.93], ["explosion", 6.04]], null, null, null, null], "duration": [81.95, 5.16, 3.34, 17.48, 9.53, 0.77, 0.58, 1.32, 0.47, 7.4, 0.5, 1.54, -0.02, 0.62]} \ No newline at end of file diff --git a/annotations_1/QMmxxD7h5-Y_filtered.json b/annotations_1/QMmxxD7h5-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e4c8d287c2c6d38b87ba54641aee9a9d1fc367e --- /dev/null +++ b/annotations_1/QMmxxD7h5-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.2], [6.0, 6.94], [17.0, 17.02], [18.0, 20.43], [21.0, 22.35], [25.0, 27.33], [30.0, 31.26], [34.0, 45.82], [50.0, 52.46], [56.0, 57.43], [60.0, 63.81], [65.0, 71.02], [73.0, 76.62], [77.0, 82.44], [85.0, 87.39], [91.0, 93.12], [96.0, 96.82], [101.0, 102.76], [106.0, 107.59], [112.0, 114.03], [117.0, 118.66], [121.0, 121.41], [131.0, 132.97], [134.0, 134.27], [137.0, 138.37], [140.0, 141.34], [142.0, 144.1], [148.0, 148.47], [150.0, 151.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [54.1, 0.0, 0.0, 81.0, 0.0, 84.8, 0.0, 97.92, 92.8, 0.0, 100.0, 100.0, 100.0, 88.64, 99.91, 100.0, 0.0, 0.0, 0.0, 89.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.2, 0.94, 0.02, 2.43, 1.35, 2.33, 1.26, 11.82, 2.46, 1.43, 3.81, 6.02, 3.62, 5.44, 2.39, 2.12, 0.82, 1.76, 1.59, 2.03, 1.66, 0.41, 1.97, 0.27, 1.37, 1.34, 2.1, 0.47, 1.71]} \ No newline at end of file diff --git a/annotations_1/QN8ln3Hx1mc_filtered.json b/annotations_1/QN8ln3Hx1mc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d998c0d0de129876583099d674cbb1847b981c9e --- /dev/null +++ b/annotations_1/QN8ln3Hx1mc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.82], [15.0, 16.24], [17.0, 18.2], [20.0, 20.75], [28.0, 29.17], [30.0, 33.79], [34.0, 35.73], [36.0, 39.58], [41.0, 42.38], [49.0, 50.8], [51.0, 51.85], [53.0, 54.58], [57.0, 57.97], [59.0, 60.03], [63.0, 65.75], [67.0, 67.46], [69.0, 69.67], [78.0, 77.7], [78.0, 79.14], [83.0, 84.52], [87.0, 87.84], [92.0, 92.72], [93.0, 95.2], [100.0, 101.7], [103.0, 103.84], [109.0, 111.13], [113.0, 117.69], [118.0, 119.91], [121.0, 121.59], [123.0, 124.09], [128.0, 129.05], [130.0, 130.65], [132.0, 132.93], [135.0, 136.59], [137.0, 137.67], [139.0, 138.89], [142.0, 143.04], [145.0, 145.61], [147.0, 149.5], [151.0, 151.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 87.74, 0.0, 84.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 0.0, 85.54, 72.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.92], ["didgeridoo", 22.98], ["cello", 4.27]], null], "duration": [0.82, 1.24, 1.2, 0.75, 1.17, 3.79, 1.73, 3.58, 1.38, 1.8, 0.85, 1.58, 0.97, 1.03, 2.75, 0.46, 0.67, -0.3, 1.14, 1.52, 0.84, 0.72, 2.2, 1.7, 0.84, 2.13, 4.69, 1.91, 0.59, 1.09, 1.05, 0.65, 0.93, 1.59, 0.67, -0.11, 1.04, 0.61, 2.5, 0.14]} \ No newline at end of file diff --git a/annotations_1/QNUbwijCKfw_filtered.json b/annotations_1/QNUbwijCKfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82f85d6cb4db965607ce65dfd5dd6540fcf2563f --- /dev/null +++ b/annotations_1/QNUbwijCKfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.82], [5.0, 7.32], [9.0, 9.24], [14.0, 14.55], [19.0, 19.09], [21.0, 22.25], [30.0, 29.66], [34.0, 34.75], [36.0, 36.66], [38.0, 37.69], [39.0, 47.17], [50.0, 50.7], [54.0, 54.35], [61.0, 61.25], [64.0, 65.33], [72.0, 76.72], [77.0, 77.58], [79.0, 80.89], [84.0, 84.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 67.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 39.8, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 39.68], ["speech", 26.37], ["whack, thwack", 4.97]], null, null, null], "duration": [0.82, 2.32, 0.24, 0.55, 0.09, 1.25, -0.34, 0.75, 0.66, -0.31, 8.17, 0.7, 0.35, 0.25, 1.33, 4.72, 0.58, 1.89, 0.25]} \ No newline at end of file diff --git a/annotations_1/QNlazlRan6A_filtered.json b/annotations_1/QNlazlRan6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87c09cce513bbc3468c268a533af1027b5f92740 --- /dev/null +++ b/annotations_1/QNlazlRan6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.05], [4.0, 5.49], [7.0, 7.26], [12.0, 15.18], [17.0, 19.26], [26.0, 28.05], [29.0, 45.06], [46.0, 47.29], [48.0, 52.54], [54.0, 56.07], [58.0, 58.67], [61.0, 65.77], [66.0, 72.3], [73.0, 100.87], [103.0, 106.2], [110.0, 129.49], [131.0, 132.26], [133.0, 137.12], [138.0, 140.73], [141.0, 141.88], [146.0, 147.41], [149.0, 155.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 71.57, 76.2, 85.54, 47.98, 0.0, 68.41, 73.36, 0.0, 33.48, 33.34, 33.25, 35.6, 32.84, 0.0, 31.6, 31.88, 0.0, 0.0, 39.94], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 63.2], ["ambient music", 10.68], ["synthesizer", 4.39]], null, null, null, null, [["music", 62.49], ["speech", 9.21], ["musical instrument", 3.11]], [["music", 48.92], ["speech", 21.9], ["didgeridoo", 13.83]], [["music", 68.17], ["didgeridoo", 13.29], ["throbbing", 2.15]], [["hum", 24.16], ["mains hum", 14.08], ["whale vocalization", 13.63]], [["music", 60.32], ["didgeridoo", 19.35], ["speech", 5.94]], null, [["music", 71.0], ["throbbing", 12.37], ["hum", 3.7]], [["music", 42.28], ["speech", 13.74], ["hum", 10.04]], null, null, [["speech", 49.57], ["music", 13.58], ["theremin", 4.24]]], "duration": [0.05, 1.49, 0.26, 3.18, 2.26, 2.05, 16.06, 1.29, 4.54, 2.07, 0.67, 4.77, 6.3, 27.87, 3.2, 19.49, 1.26, 4.12, 2.73, 0.88, 1.41, 6.43]} \ No newline at end of file diff --git a/annotations_1/QO0gZrQw9KU_filtered.json b/annotations_1/QO0gZrQw9KU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e60ba021bdade785456020a0cfe8a1e90ccd53b3 --- /dev/null +++ b/annotations_1/QO0gZrQw9KU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.57], [10.0, 10.47], [11.0, 13.02], [17.0, 23.85], [25.0, 26.25], [27.0, 31.18], [32.0, 67.88], [69.0, 69.18], [74.0, 75.79], [76.0, 77.21], [79.0, 90.12], [90.0, 90.36], [91.0, 90.73], [91.0, 91.29], [92.0, 92.53], [94.0, 100.36], [103.0, 107.7], [108.0, 108.41], [109.0, 110.47], [112.0, 156.51], [157.0, 156.54], [157.0, 157.45], [158.0, 157.91], [158.0, 179.44]], "keep_status": [true, false, false, true, false, true, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [38.1, 0.0, 52.86, 33.45, 0.0, 31.87, 0.0, 0.0, 0.0, 0.0, 28.92, 0.0, 0.0, 0.0, 0.0, 29.18, 31.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.37], "audiomae_on_audioset": [[["hum", 26.53], ["mechanisms", 11.29], ["mains hum", 11.09]], null, null, [["hum", 24.18], ["gong", 21.89], ["mains hum", 13.11]], null, [["speech", 18.82], ["sine wave", 18.68], ["chink, clink", 8.13]], null, null, null, null, [["speech", 28.54], ["music", 17.02], ["animal", 6.95]], null, null, null, null, [["speech", 28.98], ["music", 22.67], ["screaming", 11.96]], [["thunk", 29.87], ["speech", 11.43], ["music", 8.25]], null, null, null, null, null, null, [["speech", 71.25], ["music", 6.14], ["whack, thwack", 3.63]]], "duration": [2.57, 0.47, 2.02, 6.85, 1.25, 4.18, 35.88, 0.18, 1.79, 1.21, 11.12, 0.36, -0.27, 0.29, 0.53, 6.36, 4.7, 0.41, 1.47, 44.51, -0.46, 0.45, -0.09, 21.44]} \ No newline at end of file diff --git a/annotations_1/QP3Pzr7UFE4_filtered.json b/annotations_1/QP3Pzr7UFE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..051f201acf1fe4b84313a34a72d03ed008f07655 --- /dev/null +++ b/annotations_1/QP3Pzr7UFE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.07], [14.0, 24.61], [29.0, 30.16], [31.0, 51.9], [54.0, 56.44], [58.0, 59.34], [63.0, 64.25], [65.0, 65.57], [66.0, 72.27], [75.0, 77.58], [85.0, 85.26], [93.0, 98.59], [100.0, 101.34], [102.0, 102.66], [103.0, 104.13], [108.0, 110.84], [112.0, 112.82], [114.0, 114.61], [118.0, 119.74], [121.0, 123.9], [124.0, 126.74], [130.0, 140.56], [142.0, 144.04], [145.0, 160.14], [162.0, 162.6]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, true, false, true, false], "silence_prob": [0.0, 55.39, 0.0, 50.06, 88.46, 0.0, 0.0, 0.0, 66.76, 41.01, 0.0, 40.64, 0.0, 0.0, 0.0, 41.16, 0.0, 0.0, 0.0, 45.4, 40.09, 40.61, 39.5, 35.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 56.92], ["throbbing", 7.32], ["cacophony", 4.31]], null, [["music", 64.95], ["didgeridoo", 11.8], ["hum", 3.4]], null, null, null, [["music", 61.37], ["didgeridoo", 13.83], ["speech", 6.0]], null, null, null, [["music", 40.26], ["hum", 12.59], ["mains hum", 9.89]], [["music", 49.97], ["speech", 11.92], ["hum", 5.91]], [["music", 28.35], ["moo", 20.39], ["cattle, bovinae", 12.17]], [["music", 60.66], ["throbbing", 6.35], ["musical instrument", 3.28]], [["speech", 30.14], ["hum", 20.33], ["sidetone", 10.14]], null], "duration": [1.07, 10.61, 1.16, 20.9, 2.44, 1.34, 1.25, 0.57, 6.27, 2.58, 0.26, 5.59, 1.34, 0.66, 1.13, 2.84, 0.82, 0.61, 1.74, 2.9, 2.74, 10.56, 2.04, 15.14, 0.6]} \ No newline at end of file diff --git a/annotations_1/QPDuZ_Wq7ZA_filtered.json b/annotations_1/QPDuZ_Wq7ZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4127305451c768c2c13bca442a1dd0eeae1089bd --- /dev/null +++ b/annotations_1/QPDuZ_Wq7ZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.95], [8.0, 8.99], [11.0, 11.74], [12.0, 13.85], [18.0, 18.89], [25.0, 24.92], [26.0, 26.06], [28.0, 28.02], [32.0, 32.68], [38.0, 39.43], [45.0, 48.02], [56.0, 56.51], [65.0, 66.33], [67.0, 71.85], [74.0, 77.28], [77.0, 77.82], [78.0, 78.36], [78.0, 78.49], [100.0, 103.4], [104.0, 107.54], [108.0, 111.05], [118.0, 120.65], [123.0, 136.36], [137.0, 137.24], [140.0, 150.08], [151.0, 151.85], [154.0, 154.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.64, 0.0, 0.0, 34.08, 38.88, 0.0, 0.0, 0.0, 31.79, 30.23, 30.31, 31.69, 32.91, 0.0, 34.14, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 49.57], ["theremin", 21.4], ["didgeridoo", 5.91]], null, null, [["music", 48.13], ["humming", 11.1], ["mantra", 3.69]], [["music", 58.68], ["carnatic music", 9.44], ["musical instrument", 6.0]], null, null, null, [["music", 76.98], ["theremin", 3.78], ["effects unit", 2.7]], [["music", 63.29], ["carnatic music", 14.76], ["musical instrument", 3.32]], [["music", 65.32], ["musical instrument", 5.48], ["guitar", 3.72]], [["music", 64.52], ["musical instrument", 4.59], ["theremin", 3.51]], [["music", 52.82], ["mantra", 11.2], ["lullaby", 8.82]], null, [["music", 34.13], ["theremin", 16.56], ["humming", 12.78]], null, null], "duration": [1.95, 0.99, 0.74, 1.85, 0.89, -0.08, 0.06, 0.02, 0.68, 1.43, 3.02, 0.51, 1.33, 4.85, 3.28, 0.82, 0.36, 0.49, 3.4, 3.54, 3.05, 2.65, 13.36, 0.24, 10.08, 0.85, 0.77]} \ No newline at end of file diff --git a/annotations_1/QP_o0yWJYKM_filtered.json b/annotations_1/QP_o0yWJYKM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1fd95a9908d903e1dedd77cdec23c3321f0d9cf7 --- /dev/null +++ b/annotations_1/QP_o0yWJYKM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.39], [3.0, 5.58], [8.0, 9.49], [11.0, 12.38], [19.0, 20.6], [22.0, 26.22], [28.0, 34.32], [35.0, 37.47], [39.0, 51.88], [53.0, 54.31], [55.0, 55.66], [57.0, 56.83], [58.0, 72.13], [74.0, 75.41], [81.0, 85.14], [86.0, 91.29], [93.0, 94.63], [99.0, 104.35], [106.0, 106.19], [108.0, 108.48], [113.0, 115.64], [120.0, 120.18], [123.0, 123.43], [125.0, 125.49], [132.0, 132.75], [136.0, 137.69], [140.0, 140.58], [141.0, 140.7], [141.0, 140.8], [141.0, 140.85], [141.0, 144.83], [150.0, 151.01], [154.0, 154.55], [156.0, 157.35], [158.0, 162.24], [163.0, 165.97], [168.0, 169.15], [173.0, 177.9], [178.0, 177.94], [178.0, 177.97], [178.0, 178.01], [179.0, 179.42], [181.0, 181.36], [183.0, 184.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.99, 0.0, 0.0, 0.0, 85.9, 85.54, 99.52, 84.98, 0.0, 0.0, 0.0, 73.21, 0.0, 43.77, 81.17, 0.0, 48.02, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.33, 0.0, 0.0, 0.0, 63.96, 63.64, 0.0, 50.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.25], ["music", 26.0], ["sidetone", 4.94]], null, null, [["speech", 55.26], ["music", 20.33], ["sidetone", 3.76]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.03], ["music", 24.8], ["sidetone", 5.41]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 2.58, 1.49, 1.38, 1.6, 4.22, 6.32, 2.47, 12.88, 1.31, 0.66, -0.17, 14.13, 1.41, 4.14, 5.29, 1.63, 5.35, 0.19, 0.48, 2.64, 0.18, 0.43, 0.49, 0.75, 1.69, 0.58, -0.3, -0.2, -0.15, 3.83, 1.01, 0.55, 1.35, 4.24, 2.97, 1.15, 4.9, -0.06, -0.03, 0.01, 0.42, 0.36, 1.57]} \ No newline at end of file diff --git a/annotations_1/QPaP-XRQeM8_filtered.json b/annotations_1/QPaP-XRQeM8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea6cebef49f3a71f8198b7b1e6f2dc50c37a0cf9 --- /dev/null +++ b/annotations_1/QPaP-XRQeM8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.38], [7.0, 7.59], [11.0, 12.26], [15.0, 15.8], [20.0, 20.68], [23.0, 27.58], [34.0, 35.26], [37.0, 37.64], [40.0, 41.05], [51.0, 52.68], [61.0, 64.25], [66.0, 87.99], [93.0, 94.2], [104.0, 104.5], [111.0, 112.89], [118.0, 118.05], [123.0, 123.35], [124.0, 124.16], [125.0, 126.06], [131.0, 132.17]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.31, 0.0, 0.0, 0.0, 0.0, 29.43, 31.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["breaking", 37.62], ["glass", 17.68], ["music", 7.08]], null, null, null, null, [["hum", 15.59], ["shatter", 10.96], ["mains hum", 10.36]], [["music", 64.0], ["sheep", 5.34], ["speech", 4.2]], null, null, null, null, null, null, null, null], "duration": [0.38, 0.59, 1.26, 0.8, 0.68, 4.58, 1.26, 0.64, 1.05, 1.68, 3.25, 21.99, 1.2, 0.5, 1.89, 0.05, 0.35, 0.16, 1.06, 1.17]} \ No newline at end of file diff --git a/annotations_1/QPbUj6Ks8j4_filtered.json b/annotations_1/QPbUj6Ks8j4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9f5eae8882cfcc32cdcc2bcf3ebbb60b104dc1a --- /dev/null +++ b/annotations_1/QPbUj6Ks8j4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.92], [18.0, 18.15], [19.0, 19.89], [27.0, 30.05], [32.0, 33.12], [40.0, 40.2], [44.0, 49.33], [50.0, 51.27], [52.0, 52.3], [59.0, 74.43], [79.0, 90.8], [92.0, 91.94], [95.0, 95.5], [96.0, 102.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [89.19, 0.0, 0.0, 91.64, 0.0, 0.0, 74.13, 0.0, 0.0, 73.51, 46.97, 0.0, 0.0, 60.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 58.76], ["boing", 11.58], ["speech", 4.3]], null, null, null], "duration": [7.92, 0.15, 0.89, 3.05, 1.12, 0.2, 5.33, 1.27, 0.3, 15.43, 11.8, -0.06, 0.5, 6.12]} \ No newline at end of file diff --git a/annotations_1/QQaLVYSCwrc_filtered.json b/annotations_1/QQaLVYSCwrc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96d4427989a4dc84d787f636062a35e883141a62 --- /dev/null +++ b/annotations_1/QQaLVYSCwrc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.37], [7.0, 7.7], [15.0, 15.77], [17.0, 17.24], [55.0, 54.89], [69.0, 69.62], [84.0, 88.96], [90.0, 96.21], [104.0, 108.11]], "keep_status": [false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.83, 37.66, 38.36], "audiomae_on_audioset": [null, null, null, null, null, null, [["livestock, farm animals, working animals", 41.41], ["cattle, bovinae", 16.23], ["moo", 12.97]], [["music", 51.47], ["speech", 14.54], ["sheep", 3.26]], [["speech", 63.39], ["insect", 3.6], ["fly, housefly", 2.53]]], "duration": [1.37, 0.7, 0.77, 0.24, -0.11, 0.62, 4.96, 6.21, 4.11]} \ No newline at end of file diff --git a/annotations_1/QR6Ds-Tvd1g_filtered.json b/annotations_1/QR6Ds-Tvd1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02d22a347a452d0ace9595801f0a4cadc24734b5 --- /dev/null +++ b/annotations_1/QR6Ds-Tvd1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 48.78], [49.0, 60.62], [64.0, 91.2]], "keep_status": [false, true, false], "silence_prob": [0.0, 30.33, 29.18], "audiomae_on_audioset": [null, [["music", 30.34], ["whack, thwack", 8.09], ["fart", 5.79]], [["music", 47.06], ["buzz", 15.56], ["speech", 14.35]]], "duration": [-0.22, 11.62, 27.2]} \ No newline at end of file diff --git a/annotations_1/QRoWiTcO7dk_filtered.json b/annotations_1/QRoWiTcO7dk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f450a6de72fcc12a0e4f16c1f1d4c446d3ef983 --- /dev/null +++ b/annotations_1/QRoWiTcO7dk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [17.0, 31.75], [35.0, 36.48], [38.0, 43.75], [48.0, 51.02], [54.0, 55.46], [82.0, 85.65], [91.0, 96.5], [110.0, 122.98], [125.0, 127.82], [132.0, 132.56], [139.0, 147.31], [154.0, 157.27], [163.0, 175.09], [182.0, 197.23], [199.0, 199.76], [203.0, 208.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 29.41, 0.0, 29.61, 29.66, 0.0, 29.07, 28.82, 29.59, 29.5, 0.0, 28.87, 28.96, 28.59, 28.88, 0.0, 28.64], "audiomae_on_audioset": [null, [["music", 82.52], ["funk", 3.35], ["middle eastern music", 0.99]], null, [["music", 87.85], ["sampler", 1.4], ["funk", 0.93]], [["music", 66.35], ["sampler", 2.85], ["drum machine", 2.82]], null, [["music", 62.52], ["speech", 5.35], ["boing", 3.52]], [["music", 95.21], ["singing", 0.73], ["independent music", 0.17]], [["music", 86.99], ["didgeridoo", 0.7], ["funk", 0.61]], [["music", 81.61], ["singing", 1.96], ["folk music", 1.25]], null, [["music", 57.56], ["didgeridoo", 15.4], ["musical instrument", 2.97]], [["music", 58.86], ["drum and bass", 3.66], ["static", 3.09]], [["music", 86.74], ["singing", 2.15], ["musical instrument", 0.88]], [["music", 82.12], ["sitar", 3.86], ["theremin", 1.07]], null, [["music", 79.36], ["rattle (instrument)", 2.44], ["singing", 1.32]]], "duration": [0.35, 14.75, 1.48, 5.75, 3.02, 1.46, 3.65, 5.5, 12.98, 2.82, 0.56, 8.31, 3.27, 12.09, 15.23, 0.76, 5.92]} \ No newline at end of file diff --git a/annotations_1/QS3UyqLs5KY_filtered.json b/annotations_1/QS3UyqLs5KY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50c78a15c98cbab8080c260c0559a6750868ce5e --- /dev/null +++ b/annotations_1/QS3UyqLs5KY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.85], [3.0, 7.03], [8.0, 8.99], [10.0, 10.86], [13.0, 14.03], [15.0, 17.85], [21.0, 21.32], [24.0, 25.59], [30.0, 30.84], [32.0, 32.93], [35.0, 35.75], [43.0, 44.07], [47.0, 47.93], [49.0, 50.19], [51.0, 52.34], [54.0, 56.49], [58.0, 59.46], [61.0, 61.57], [63.0, 64.89], [66.0, 66.58], [68.0, 69.36], [71.0, 73.36], [76.0, 76.84], [78.0, 79.24], [81.0, 80.89], [83.0, 83.64], [89.0, 89.61], [91.0, 93.19], [94.0, 105.53], [106.0, 107.94], [109.0, 109.22], [109.0, 109.9], [115.0, 124.5], [125.0, 132.38], [133.0, 133.76], [135.0, 140.81], [143.0, 143.7], [145.0, 146.53], [148.0, 149.89], [150.0, 150.97], [151.0, 155.01], [155.0, 155.55], [156.0, 162.09], [163.0, 163.16], [164.0, 166.63], [167.0, 167.86], [169.0, 171.21], [174.0, 175.78], [176.0, 176.28], [178.0, 178.55], [181.0, 181.8], [182.0, 183.44], [185.0, 187.91], [188.0, 192.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 63.85, 0.0, 0.0, 0.0, 55.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 77.53, 0.0, 0.0, 0.0, 35.43, 99.71, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 95.78, 0.0, 99.36, 0.0, 98.51, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.2, 29.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.66], ["theremin", 8.96], ["musical instrument", 7.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.01], ["groan", 17.97], ["screaming", 13.18]]], "duration": [0.85, 4.03, 0.99, 0.86, 1.03, 2.85, 0.32, 1.59, 0.84, 0.93, 0.75, 1.07, 0.93, 1.19, 1.34, 2.49, 1.46, 0.57, 1.89, 0.58, 1.36, 2.36, 0.84, 1.24, -0.11, 0.64, 0.61, 2.19, 11.53, 1.94, 0.22, 0.9, 9.5, 7.38, 0.76, 5.81, 0.7, 1.53, 1.89, 0.97, 4.01, 0.55, 6.09, 0.16, 2.63, 0.86, 2.21, 1.78, 0.28, 0.55, 0.8, 1.44, 2.91, 4.62]} \ No newline at end of file diff --git a/annotations_1/QS8fJMeJqsQ_filtered.json b/annotations_1/QS8fJMeJqsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0450065f2646640793fc66a9ea3a575aea415fd --- /dev/null +++ b/annotations_1/QS8fJMeJqsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 46.21], [46.0, 48.39], [49.0, 50.55], [51.0, 51.31], [51.0, 51.36], [51.0, 51.44], [51.0, 52.19], [54.0, 58.46], [64.0, 64.93], [66.0, 78.6], [80.0, 84.5], [86.0, 94.12], [95.0, 126.5], [128.0, 129.88], [131.0, 131.3], [134.0, 135.36], [137.0, 137.76], [138.0, 158.09], [159.0, 159.09]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.85, 32.07, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 0.0, 94.22, 98.8, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0], "audiomae_on_audioset": [[["speech", 31.47], ["screaming", 11.6], ["rumble", 7.35]], [["speech", 9.92], ["hum", 9.13], ["throbbing", 5.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.21, 2.39, 1.55, 0.31, 0.36, 0.44, 1.19, 4.46, 0.93, 12.6, 4.5, 8.12, 31.5, 1.88, 0.3, 1.36, 0.76, 20.09, 0.09]} \ No newline at end of file diff --git a/annotations_1/QSqUVzkUvj8_filtered.json b/annotations_1/QSqUVzkUvj8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37006896b1bc35641c5a50b3bbea06b077e67fcd --- /dev/null +++ b/annotations_1/QSqUVzkUvj8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 105.9], [111.0, 119.7], [124.0, 127.45], [130.0, 169.18], [170.0, 170.23], [171.0, 175.9], [180.0, 182.49], [185.0, 184.74]], "keep_status": [false, false, false, false, false, true, true, false], "silence_prob": [0.0, 68.8, 60.79, 0.0, 0.0, 44.23, 48.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["groan", 21.36], ["speech", 17.64], ["mosquito", 7.85]], [["animal", 31.15], ["roaring cats (lions, tigers)", 10.74], ["moo", 9.16]], null], "duration": [89.9, 8.7, 3.45, 39.18, 0.23, 4.9, 2.49, -0.26]} \ No newline at end of file diff --git a/annotations_1/QT1Tl6npLic_filtered.json b/annotations_1/QT1Tl6npLic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e106c048c260ddba98412086d2d4262e2ac76304 --- /dev/null +++ b/annotations_1/QT1Tl6npLic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.37], [7.0, 7.67], [16.0, 21.24], [25.0, 24.98], [28.0, 28.21], [30.0, 30.59], [33.0, 33.64], [34.0, 33.74], [34.0, 33.91], [39.0, 39.12], [46.0, 48.57], [54.0, 57.27], [59.0, 60.64], [62.0, 61.91], [66.0, 66.24], [69.0, 68.94], [75.0, 76.0], [78.0, 79.25], [81.0, 80.82], [89.0, 90.8], [94.0, 96.43], [98.0, 99.27], [104.0, 107.22], [109.0, 112.36], [114.0, 114.54], [115.0, 115.55], [119.0, 121.34], [124.0, 127.33], [129.0, 130.35], [131.0, 132.14], [133.0, 134.25], [135.0, 136.32], [137.0, 137.91], [145.0, 146.53], [151.0, 152.49], [154.0, 158.3], [161.0, 170.19], [171.0, 172.79], [174.0, 173.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.48, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.74, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.25, 0.0, 88.28, 63.1, 0.0, 0.0, 82.97, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.74, 85.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.37, 0.67, 5.24, -0.02, 0.21, 0.59, 0.64, -0.26, -0.09, 0.12, 2.57, 3.27, 1.64, -0.09, 0.24, -0.06, 1.0, 1.25, -0.18, 1.8, 2.43, 1.27, 3.22, 3.36, 0.54, 0.55, 2.34, 3.33, 1.35, 1.14, 1.25, 1.32, 0.91, 1.53, 1.49, 4.3, 9.19, 1.79, -0.33]} \ No newline at end of file diff --git a/annotations_1/QT2Anb4MY38_filtered.json b/annotations_1/QT2Anb4MY38_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea11c385ee0af87cd2937c6b83912c3465d9ce64 --- /dev/null +++ b/annotations_1/QT2Anb4MY38_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.48], [10.0, 10.52], [14.0, 15.25], [19.0, 18.57], [19.0, 18.98], [22.0, 23.23], [26.0, 26.0], [27.0, 30.6], [31.0, 32.61], [34.0, 34.67], [36.0, 37.56], [39.0, 42.09], [42.0, 42.89], [45.0, 48.27], [49.0, 52.29], [53.0, 54.8], [56.0, 57.05], [58.0, 60.94], [65.0, 66.26], [66.0, 68.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [36.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.77, 0.0, 0.0, 0.0, 29.22, 0.0, 35.47, 37.89, 0.0, 0.0, 36.55, 0.0, 35.44], "audiomae_on_audioset": [[["hum", 34.14], ["throbbing", 23.62], ["music", 20.95]], null, null, null, null, null, null, [["mains hum", 42.28], ["hum", 41.34], ["speech", 3.62]], null, null, null, [["speech", 42.62], ["music", 24.41], ["tabla", 5.28]], null, [["hum", 30.0], ["speech", 26.04], ["throbbing", 17.95]], [["hum", 40.15], ["throbbing", 29.56], ["whale vocalization", 7.08]], null, null, [["music", 30.78], ["speech", 21.53], ["didgeridoo", 10.18]], null, [["music", 49.77], ["hum", 12.53], ["throbbing", 6.86]]], "duration": [2.48, 0.52, 1.25, -0.43, -0.02, 1.23, 0.0, 3.6, 1.61, 0.67, 1.56, 3.09, 0.89, 3.27, 3.29, 1.8, 1.05, 2.94, 1.26, 2.74]} \ No newline at end of file diff --git a/annotations_1/QUI-9FAwA8w_filtered.json b/annotations_1/QUI-9FAwA8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c385a20bd890811449d548d1879371f3fce7a33e --- /dev/null +++ b/annotations_1/QUI-9FAwA8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.06], [17.0, 17.31], [18.0, 18.57], [33.0, 32.68], [34.0, 35.23], [36.0, 37.0], [40.0, 40.73], [48.0, 48.88], [50.0, 50.7], [54.0, 53.77], [63.0, 63.48], [66.0, 67.61], [68.0, 69.33], [70.0, 71.2], [72.0, 72.37], [76.0, 77.87], [79.0, 93.16], [98.0, 97.7], [103.0, 103.42], [104.0, 109.14], [110.0, 110.78], [112.0, 112.78], [115.0, 120.75], [122.0, 122.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.16, 0.0, 0.0, 34.27, 0.0, 0.0, 40.02, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 80.15], ["musical instrument", 1.64], ["guitar", 1.5]], null, null, [["music", 61.98], ["speech", 10.07], ["sidetone", 5.8]], null, null, [["mains hum", 35.19], ["hum", 18.3], ["music", 18.13]], null], "duration": [1.06, 0.31, 0.57, -0.32, 1.23, 1.0, 0.73, 0.88, 0.7, -0.23, 0.48, 1.61, 1.33, 1.2, 0.37, 1.87, 14.16, -0.3, 0.42, 5.14, 0.78, 0.78, 5.75, 0.2]} \ No newline at end of file diff --git a/annotations_1/QWiJ8VQXJzY_filtered.json b/annotations_1/QWiJ8VQXJzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b002ea77e10a1a9f2799501ff42b8bb2902de321 --- /dev/null +++ b/annotations_1/QWiJ8VQXJzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.9], [6.0, 6.86], [8.0, 9.0], [10.0, 11.33], [15.0, 16.95], [19.0, 27.53], [29.0, 31.8], [33.0, 36.63], [38.0, 40.09], [43.0, 51.17], [56.0, 57.33], [61.0, 61.28], [64.0, 65.04], [68.0, 69.97], [71.0, 72.98], [74.0, 74.44], [75.0, 75.57], [78.0, 77.89], [82.0, 89.6], [94.0, 97.88], [100.0, 102.05], [105.0, 107.35], [108.0, 111.81], [112.0, 113.78], [115.0, 116.41], [120.0, 123.53], [127.0, 127.18], [130.0, 130.32], [132.0, 133.66], [135.0, 137.96], [139.0, 140.12], [141.0, 141.84], [144.0, 145.4], [151.0, 152.14], [155.0, 156.41], [157.0, 157.79], [159.0, 160.81], [162.0, 164.47], [165.0, 172.64], [176.0, 178.14], [182.0, 186.0], [192.0, 192.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 100.0, 86.09, 71.29, 33.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.17, 31.41, 30.31, 58.72, 85.72, 0.0, 0.0, 56.25, 0.0, 0.0, 0.0, 42.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.56, 32.75, 83.34, 37.23, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 60.06], ["hum", 6.3], ["didgeridoo", 5.98]], null, null, null, null, null, null, null, null, [["music", 69.62], ["electronic music", 6.32], ["ambient music", 4.19]], [["hum", 26.19], ["mains hum", 22.29], ["speech", 15.47]], [["music", 32.32], ["noise", 13.04], ["explosion", 6.88]], null, null, null, null, null, null, null, null, [["whale vocalization", 93.78], ["sound effect", 0.95], ["music", 0.83]], null, null, null, null, null, null, null, [["music", 24.06], ["speech", 18.79], ["hum", 11.18]], [["music", 49.82], ["synthesizer", 9.98], ["musical instrument", 6.84]], null, [["hum", 21.41], ["mains hum", 14.15], ["music", 9.35]], null], "duration": [-0.1, 0.86, 1.0, 1.33, 1.95, 8.53, 2.8, 3.63, 2.09, 8.17, 1.33, 0.28, 1.04, 1.97, 1.98, 0.44, 0.57, -0.11, 7.6, 3.88, 2.05, 2.35, 3.81, 1.78, 1.41, 3.53, 0.18, 0.32, 1.66, 2.96, 1.12, 0.84, 1.4, 1.14, 1.41, 0.79, 1.81, 2.47, 7.64, 2.14, 4.0, 0.92]} \ No newline at end of file diff --git a/annotations_1/QXeYlaZJ64k_filtered.json b/annotations_1/QXeYlaZJ64k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d25ce3765118bace60d9c1f95ed6f94d65e6414d --- /dev/null +++ b/annotations_1/QXeYlaZJ64k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 43.29], [44.0, 49.94], [51.0, 70.73], [73.0, 87.93], [89.0, 89.55], [92.0, 94.41], [98.0, 101.12], [103.0, 123.77]], "keep_status": [false, true, false, false, false, true, false, false], "silence_prob": [37.56, 30.25, 33.53, 33.06, 0.0, 30.19, 30.41, 30.61], "audiomae_on_audioset": [[["music", 75.59], ["smash, crash", 6.33], ["mechanisms", 2.71]], [["music", 53.39], ["sonar", 6.5], ["musical instrument", 2.91]], [["music", 48.02], ["hum", 16.31], ["throbbing", 6.08]], [["music", 47.96], ["speech", 27.2], ["fart", 2.4]], null, [["music", 30.46], ["throbbing", 11.56], ["hum", 11.44]], [["throbbing", 45.2], ["music", 24.96], ["hum", 7.09]], [["music", 59.91], ["throbbing", 15.41], ["hum", 4.88]]], "duration": [24.29, 5.94, 19.73, 14.93, 0.55, 2.41, 3.12, 20.77]} \ No newline at end of file diff --git a/annotations_1/QXruKKf3my4_filtered.json b/annotations_1/QXruKKf3my4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c62333147c77746bf44c1cb1b53f8f6db8ac88a6 --- /dev/null +++ b/annotations_1/QXruKKf3my4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.58], [5.0, 5.43], [8.0, 8.28], [9.0, 8.9], [13.0, 13.2], [19.0, 20.36], [23.0, 23.9], [25.0, 26.49], [32.0, 33.08], [34.0, 34.77], [44.0, 49.0], [50.0, 51.07], [52.0, 52.84], [56.0, 56.44], [62.0, 69.87], [71.0, 80.82], [82.0, 82.22], [86.0, 86.19], [87.0, 87.88], [89.0, 98.47], [101.0, 101.41], [114.0, 114.15], [117.0, 118.44], [126.0, 126.69], [130.0, 131.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 0.0, 34.74, 31.91, 0.0, 0.0, 0.0, 45.18, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 14.92], ["mosquito", 13.7], ["buzz", 11.43]], [["livestock, farm animals, working animals", 8.94], ["crowd", 7.5], ["cattle, bovinae", 6.99]], null, null, null, [["speech", 52.48], ["thunk", 5.28], ["electric shaver, electric razor", 3.46]], null, null, null, null, null], "duration": [0.58, 0.43, 0.28, -0.1, 0.2, 1.36, 0.9, 1.49, 1.08, 0.77, 5.0, 1.07, 0.84, 0.44, 7.87, 9.82, 0.22, 0.19, 0.88, 9.47, 0.41, 0.15, 1.44, 0.69, 1.3]} \ No newline at end of file diff --git a/annotations_1/QYUhwlQe0IU_filtered.json b/annotations_1/QYUhwlQe0IU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b1337e2c4652aa98f3e12ccbbe8f74ced7e98d8 --- /dev/null +++ b/annotations_1/QYUhwlQe0IU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.53], [12.0, 43.28], [44.0, 47.04], [51.0, 57.92], [59.0, 62.43], [64.0, 66.45], [68.0, 88.45], [90.0, 91.15], [92.0, 95.13], [96.0, 118.07], [119.0, 144.12], [145.0, 146.03], [147.0, 149.49], [150.0, 163.14]], "keep_status": [false, false, true, true, true, true, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 36.49, 41.07, 44.72, 46.5, 31.93, 0.0, 38.72, 31.38, 30.09, 0.0, 31.39, 29.22], "audiomae_on_audioset": [null, null, [["music", 46.67], ["hum", 11.27], ["electronic music", 9.0]], [["hum", 23.67], ["music", 23.22], ["whale vocalization", 18.12]], [["hum", 25.37], ["speech", 24.44], ["mains hum", 14.86]], [["hum", 22.87], ["mains hum", 18.52], ["music", 9.11]], [["music", 47.34], ["throbbing", 15.21], ["hum", 12.25]], null, [["music", 45.58], ["throbbing", 24.18], ["hum", 10.23]], [["music", 50.0], ["hum", 13.3], ["throbbing", 11.72]], [["throbbing", 38.88], ["hum", 26.73], ["music", 17.93]], null, [["music", 46.03], ["hum", 4.68], ["electronic music", 4.13]], [["music", 53.85], ["hum", 7.45], ["speech", 7.06]]], "duration": [-0.47, 31.28, 3.04, 6.92, 3.43, 2.45, 20.45, 1.15, 3.13, 22.07, 25.12, 1.03, 2.49, 13.14]} \ No newline at end of file diff --git a/annotations_1/Q_GqOe9HFRY_filtered.json b/annotations_1/Q_GqOe9HFRY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83ac97686ec07e5db11c0211dcbcd2fc1071a3dc --- /dev/null +++ b/annotations_1/Q_GqOe9HFRY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.44], [15.0, 22.89], [24.0, 25.07], [26.0, 27.82], [28.0, 29.0], [34.0, 35.09], [36.0, 36.8], [37.0, 38.67], [39.0, 39.78], [42.0, 42.82], [44.0, 44.88], [46.0, 46.99], [48.0, 51.16], [55.0, 55.44], [56.0, 56.4], [60.0, 60.17], [62.0, 62.29], [63.0, 63.86], [75.0, 76.96], [80.0, 80.82], [83.0, 83.73], [89.0, 89.21], [90.0, 90.46], [95.0, 95.71], [100.0, 100.43], [101.0, 101.63], [102.0, 102.73], [104.0, 106.61], [111.0, 111.33], [113.0, 113.27], [115.0, 121.02], [122.0, 122.22], [124.0, 123.9], [126.0, 127.28], [129.0, 130.67], [132.0, 133.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [37.11, 84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.2, 0.0, 0.0, 39.94, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["animal", 32.78], ["speech", 31.89], ["bow-wow", 6.84]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["crushing", 30.46], ["glass", 23.24], ["clang", 9.98]], null, null, null, null, null], "duration": [3.44, 7.89, 1.07, 1.82, 1.0, 1.09, 0.8, 1.67, 0.78, 0.82, 0.88, 0.99, 3.16, 0.44, 0.4, 0.17, 0.29, 0.86, 1.96, 0.82, 0.73, 0.21, 0.46, 0.71, 0.43, 0.63, 0.73, 2.61, 0.33, 0.27, 6.02, 0.22, -0.1, 1.28, 1.67, 1.64]} \ No newline at end of file diff --git a/annotations_1/Q_UdYBBk9XI_filtered.json b/annotations_1/Q_UdYBBk9XI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d23e983338d47616731edbe8674e8715ee733361 --- /dev/null +++ b/annotations_1/Q_UdYBBk9XI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.29], [16.0, 16.68], [18.0, 22.62], [23.0, 61.92], [65.0, 67.88], [71.0, 81.55], [82.0, 98.02], [98.0, 103.28], [106.0, 106.1], [106.0, 108.5], [112.0, 111.91]], "keep_status": [false, false, false, false, true, true, true, true, false, false, false], "silence_prob": [30.06, 0.0, 29.97, 0.0, 30.31, 30.79, 32.88, 33.99, 0.0, 65.2, 0.0], "audiomae_on_audioset": [[["music", 77.21], ["musical instrument", 6.09], ["didgeridoo", 2.91]], null, [["music", 62.07], ["musical instrument", 9.23], ["didgeridoo", 3.55]], null, [["music", 26.29], ["speech", 12.98], ["vehicle", 9.16]], [["music", 49.84], ["crowd", 7.46], ["hum", 4.09]], [["whale vocalization", 18.96], ["animal", 18.08], ["civil defense siren", 10.38]], [["livestock, farm animals, working animals", 17.47], ["frog", 16.38], ["bee, wasp, etc.", 7.22]], null, null, null], "duration": [4.29, 0.68, 4.62, 38.92, 2.88, 10.55, 16.02, 5.28, 0.1, 2.5, -0.09]} \ No newline at end of file diff --git a/annotations_1/QaUjGv3GLeg_filtered.json b/annotations_1/QaUjGv3GLeg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a72e4250cbd370b8a8111829a70fb262c003c84 --- /dev/null +++ b/annotations_1/QaUjGv3GLeg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 27.43], [30.0, 35.45], [38.0, 44.95], [46.0, 47.85], [48.0, 49.96], [51.0, 53.69], [59.0, 64.2], [68.0, 68.18], [70.0, 72.69], [73.0, 75.34], [79.0, 79.78], [82.0, 84.48], [86.0, 96.96], [98.0, 99.94], [104.0, 105.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.9, 91.64, 79.59, 0.0, 0.0, 93.29, 54.1, 0.0, 53.28, 78.38, 0.0, 90.78, 66.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [19.43, 5.45, 6.95, 1.85, 1.96, 2.69, 5.2, 0.18, 2.69, 2.34, 0.78, 2.48, 10.96, 1.94, 1.38]} \ No newline at end of file diff --git a/annotations_1/QbJIRG4T680_filtered.json b/annotations_1/QbJIRG4T680_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cff014255bec962718d40be803586980159cf23 --- /dev/null +++ b/annotations_1/QbJIRG4T680_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [7.0, 8.14], [9.0, 10.13], [11.0, 13.95], [16.0, 19.79], [22.0, 25.98], [32.0, 33.74], [34.0, 35.99], [38.0, 40.19], [42.0, 42.55], [46.0, 46.97], [52.0, 52.46], [58.0, 58.73], [80.0, 80.4], [82.0, 82.54], [89.0, 89.78], [92.0, 93.12], [102.0, 102.05], [113.0, 114.18], [117.0, 119.43], [125.0, 127.11], [131.0, 132.85], [135.0, 148.63], [150.0, 152.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 54.5, 70.44, 54.43, 0.0, 0.0, 37.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.74, 54.17, 0.0, 51.82, 67.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 39.1], ["music", 26.33], ["didgeridoo", 5.82]], null, null, null, null, null, null, null, null, null, null, [["music", 35.8], ["singing bowl", 9.5], ["didgeridoo", 8.81]], null, null, null, null], "duration": [0.54, 1.14, 1.13, 2.95, 3.79, 3.98, 1.74, 1.99, 2.19, 0.55, 0.97, 0.46, 0.73, 0.4, 0.54, 0.78, 1.12, 0.05, 1.18, 2.43, 2.11, 1.85, 13.63, 2.41]} \ No newline at end of file diff --git a/annotations_1/QbOo_FctFu4_filtered.json b/annotations_1/QbOo_FctFu4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e84dc5502420de54de9683a3a2ab2f34001ab663 --- /dev/null +++ b/annotations_1/QbOo_FctFu4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.61], [14.0, 15.74], [17.0, 24.22], [26.0, 32.41], [38.0, 54.38], [55.0, 55.81], [57.0, 57.52], [59.0, 58.97], [61.0, 61.59], [66.0, 74.28], [76.0, 76.03]], "keep_status": [false, false, false, true, true, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 44.52, 33.02, 29.93, 0.0, 0.0, 0.0, 0.0, 44.78, 0.0], "audiomae_on_audioset": [null, null, [["music", 48.06], ["effects unit", 15.56], ["guitar", 9.1]], [["music", 19.36], ["buzz", 13.63], ["effects unit", 11.27]], [["music", 34.29], ["effects unit", 10.49], ["buzz", 7.9]], null, null, null, null, [["music", 29.03], ["synthesizer", 22.01], ["musical instrument", 12.81]], null], "duration": [0.61, 1.74, 7.22, 6.41, 16.38, 0.81, 0.52, -0.03, 0.59, 8.28, 0.03]} \ No newline at end of file diff --git a/annotations_1/Qc-E0u_1Ei4_filtered.json b/annotations_1/Qc-E0u_1Ei4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b44ba51bf66721f528714ea9cee954c7d32dbc9 --- /dev/null +++ b/annotations_1/Qc-E0u_1Ei4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.11], [19.0, 19.62], [20.0, 26.97], [27.0, 27.01], [29.0, 29.78], [30.0, 33.59], [44.0, 43.77], [55.0, 57.25], [62.0, 63.81], [73.0, 73.35], [82.0, 84.42], [91.0, 91.57], [92.0, 116.58], [118.0, 118.66], [128.0, 128.58], [129.0, 129.47], [130.0, 131.97], [132.0, 135.36], [136.0, 140.86], [141.0, 142.67]], "keep_status": [false, false, true, false, false, true, false, false, false, false, true, false, true, false, false, false, false, false, true, false], "silence_prob": [30.01, 0.0, 29.46, 0.0, 0.0, 28.74, 0.0, 30.28, 0.0, 0.0, 36.44, 0.0, 29.57, 0.0, 0.0, 0.0, 0.0, 29.02, 29.98, 0.0], "audiomae_on_audioset": [[["music", 54.79], ["speech", 16.68], ["foghorn", 9.07]], null, [["music", 11.72], ["fart", 11.29], ["moo", 10.03]], null, null, [["music", 46.04], ["sound effect", 18.18], ["musical instrument", 5.69]], null, [["speech", 42.11], ["music", 29.35], ["boing", 1.7]], null, null, [["vehicle", 31.76], ["car", 23.22], ["race car, auto racing", 7.14]], null, [["music", 24.76], ["speech", 17.18], ["groan", 13.56]], null, null, null, null, [["cattle, bovinae", 49.94], ["moo", 29.79], ["livestock, farm animals, working animals", 17.03]], [["speech", 15.51], ["music", 12.98], ["explosion", 12.34]], null], "duration": [4.11, 0.62, 6.97, 0.01, 0.78, 3.59, -0.23, 2.25, 1.81, 0.35, 2.42, 0.57, 24.58, 0.66, 0.58, 0.47, 1.97, 3.36, 4.86, 1.67]} \ No newline at end of file diff --git a/annotations_1/Qc3voNxG1NM_filtered.json b/annotations_1/Qc3voNxG1NM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e4f7a8907b4edb2aef3deaa45a2a1015432e6b1 --- /dev/null +++ b/annotations_1/Qc3voNxG1NM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 29.57], [32.0, 36.15], [40.0, 44.24], [45.0, 46.09], [48.0, 49.18], [51.0, 53.3], [60.0, 61.53], [62.0, 64.99], [66.0, 73.03]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.59, 99.99, 0.0, 0.0, 90.08, 0.0, 62.89, 75.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.57, 4.15, 4.24, 1.09, 1.18, 2.3, 1.53, 2.99, 7.03]} \ No newline at end of file diff --git a/annotations_1/Qc9eycqDJKk_filtered.json b/annotations_1/Qc9eycqDJKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edce6000937ad30854c358de6127270bd2848821 --- /dev/null +++ b/annotations_1/Qc9eycqDJKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.46], [6.0, 7.13], [8.0, 13.07], [14.0, 14.28], [30.0, 30.5], [31.0, 33.67], [35.0, 40.53], [46.0, 46.06], [55.0, 57.86], [59.0, 59.93], [60.0, 70.92], [75.0, 74.95], [76.0, 76.54], [80.0, 80.06], [87.0, 86.73], [87.0, 89.14], [92.0, 126.22]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.66, 0.0, 0.0, 48.56, 64.18, 0.0, 29.14, 0.0, 31.73, 0.0, 0.0, 0.0, 0.0, 28.63, 0.0], "audiomae_on_audioset": [null, null, [["speech", 16.13], ["hum", 13.39], ["mains hum", 10.5]], null, null, [["speech", 42.33], ["sidetone", 25.32], ["dial tone", 7.29]], null, null, [["music", 57.37], ["speech", 8.19], ["boing", 6.83]], null, [["speech", 56.39], ["music", 36.59], ["boing", 1.37]], null, null, null, null, [["music", 45.46], ["didgeridoo", 28.57], ["speech", 10.4]], null], "duration": [1.46, 1.13, 5.07, 0.28, 0.5, 2.67, 5.53, 0.06, 2.86, 0.93, 10.92, -0.05, 0.54, 0.06, -0.27, 2.14, 34.22]} \ No newline at end of file diff --git a/annotations_1/Qch6oK4qX2k_filtered.json b/annotations_1/Qch6oK4qX2k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd363fbd3a305be58a47332cbc0c9b308acebf9a --- /dev/null +++ b/annotations_1/Qch6oK4qX2k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.37], [22.0, 32.51], [40.0, 45.98], [47.0, 46.65], [47.0, 48.32], [48.0, 53.18], [57.0, 66.18], [68.0, 71.0], [71.0, 71.29], [73.0, 83.25], [84.0, 94.22], [94.0, 94.26], [94.0, 94.29], [94.0, 94.49], [95.0, 94.53], [95.0, 94.56], [95.0, 94.59], [95.0, 94.63], [95.0, 94.66], [95.0, 94.73], [100.0, 103.55], [105.0, 106.51], [108.0, 108.14], [110.0, 109.93], [111.0, 113.26], [114.0, 117.69], [119.0, 119.42], [122.0, 122.05], [124.0, 124.65], [127.0, 127.31], [129.0, 129.91], [132.0, 133.81], [141.0, 152.66], [153.0, 153.32], [154.0, 158.41]], "keep_status": [false, true, true, false, false, true, true, true, false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 32.43, 36.19, 0.0, 0.0, 38.88, 32.08, 32.9, 0.0, 31.68, 43.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.36, 0.0, 0.0, 0.0, 78.04, 66.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.32, 0.0, 31.85], "audiomae_on_audioset": [null, [["music", 34.19], ["trombone", 22.64], ["brass instrument", 11.09]], [["music", 38.69], ["brass instrument", 20.45], ["foghorn", 8.55]], null, null, [["music", 31.94], ["cello", 19.02], ["musical instrument", 11.18]], [["music", 46.0], ["brass instrument", 10.04], ["trombone", 6.79]], [["music", 49.49], ["trombone", 8.97], ["musical instrument", 6.93]], null, [["music", 43.94], ["brass instrument", 8.75], ["musical instrument", 5.86]], [["music", 50.71], ["cello", 6.16], ["musical instrument", 4.34]], null, null, null, null, null, null, null, null, null, [["music", 35.53], ["brass instrument", 6.97], ["hum", 6.56]], null, null, null, null, null, null, null, null, null, null, null, [["music", 39.84], ["foghorn", 8.53], ["cello", 8.27]], null, [["music", 32.73], ["trombone", 16.29], ["brass instrument", 14.0]]], "duration": [1.37, 10.51, 5.98, -0.35, 1.32, 5.18, 9.18, 3.0, 0.29, 10.25, 10.22, 0.26, 0.29, 0.49, -0.47, -0.44, -0.41, -0.37, -0.34, -0.27, 3.55, 1.51, 0.14, -0.07, 2.26, 3.69, 0.42, 0.05, 0.65, 0.31, 0.91, 1.81, 11.66, 0.32, 4.41]} \ No newline at end of file diff --git a/annotations_1/Qe2m1wxb5_w_filtered.json b/annotations_1/Qe2m1wxb5_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d652f9688a16f883dbf7e40daaa6d56acddaaa66 --- /dev/null +++ b/annotations_1/Qe2m1wxb5_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.61], [18.0, 18.98], [22.0, 21.96], [30.0, 32.51], [37.0, 39.39], [44.0, 45.96], [55.0, 55.75], [85.0, 85.77], [93.0, 93.68], [95.0, 95.59], [98.0, 101.41], [104.0, 104.25], [113.0, 114.93], [120.0, 121.09], [121.0, 121.49], [124.0, 128.17], [145.0, 146.4], [167.0, 173.94]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 41.44, 34.71, 0.0, 0.0, 0.0, 0.0, 0.0, 33.1, 0.0, 0.0, 0.0, 0.0, 31.29, 0.0, 71.29], "audiomae_on_audioset": [null, null, null, [["music", 53.88], ["carnatic music", 5.07], ["plucked string instrument", 4.4]], [["music", 74.83], ["musical instrument", 1.67], ["country", 1.07]], null, null, null, null, null, [["music", 56.57], ["bass guitar", 3.69], ["musical instrument", 2.96]], null, null, null, null, [["music", 72.51], ["dubstep", 4.84], ["electronic music", 2.26]], null, null], "duration": [1.61, 0.98, -0.04, 2.51, 2.39, 1.96, 0.75, 0.77, 0.68, 0.59, 3.41, 0.25, 1.93, 1.09, 0.49, 4.17, 1.4, 6.94]} \ No newline at end of file diff --git a/annotations_1/QeWifFsvr8o_filtered.json b/annotations_1/QeWifFsvr8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d56a40ca18453e5bcdef2ddfa3d17ab439c750f4 --- /dev/null +++ b/annotations_1/QeWifFsvr8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.79], [9.0, 13.24], [14.0, 15.28], [15.0, 19.53], [20.0, 25.61], [28.0, 30.13], [31.0, 31.43], [32.0, 42.7], [44.0, 46.09], [49.0, 51.06], [52.0, 54.18], [56.0, 57.65], [62.0, 65.89], [68.0, 72.54], [79.0, 82.12], [83.0, 84.87], [87.0, 88.84], [95.0, 97.29], [98.0, 100.48], [101.0, 102.03], [104.0, 105.24], [108.0, 108.72], [110.0, 113.64], [117.0, 120.06], [121.0, 126.15], [129.0, 129.91], [139.0, 142.72], [145.0, 147.5], [148.0, 148.56], [150.0, 150.28], [156.0, 158.55], [160.0, 161.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 95.78, 99.8, 99.93, 0.0, 99.99, 100.0, 100.0, 99.97, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0, 99.98, 98.73, 0.0, 0.0, 0.0, 100.0, 99.82, 99.16, 0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 4.24, 1.28, 4.53, 5.61, 2.13, 0.43, 10.7, 2.09, 2.06, 2.18, 1.65, 3.89, 4.54, 3.12, 1.87, 1.84, 2.29, 2.48, 1.03, 1.24, 0.72, 3.64, 3.06, 5.15, 0.91, 3.72, 2.5, 0.56, 0.28, 2.55, 1.5]} \ No newline at end of file diff --git a/annotations_1/QfSL-PSHTkQ_filtered.json b/annotations_1/QfSL-PSHTkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09509188e2af39312b3c57569a14e67ab0c3a888 --- /dev/null +++ b/annotations_1/QfSL-PSHTkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.05], [3.0, 5.41], [7.0, 8.36], [10.0, 10.76], [11.0, 12.68], [14.0, 15.57], [18.0, 19.25], [21.0, 21.98], [24.0, 25.79], [28.0, 29.15], [31.0, 32.61], [37.0, 37.4], [41.0, 48.93], [51.0, 51.98], [54.0, 56.88], [60.0, 60.98], [62.0, 63.49], [65.0, 67.76], [69.0, 76.35], [81.0, 81.73], [83.0, 83.88], [85.0, 86.36], [87.0, 91.57], [94.0, 94.24], [97.0, 98.39], [103.0, 104.48], [106.0, 106.61], [108.0, 108.68], [110.0, 110.44], [112.0, 112.8], [114.0, 114.94], [119.0, 120.02], [122.0, 123.53], [127.0, 127.52], [129.0, 130.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.76, 0.0, 30.39, 0.0, 0.0, 86.27, 30.48, 0.0, 0.0, 0.0, 34.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 64.56], ["musical instrument", 7.42], ["guitar", 5.88]], null, null, null, null, null, null, null, null, null, null, [["explosion", 81.56], ["eruption", 8.44], ["burst, pop", 3.79]], null, [["reverberation", 21.58], ["music", 20.02], ["echo", 13.23]], null, null, null, [["music", 41.28], ["effects unit", 9.2], ["reverberation", 6.27]], null, null, null, [["speech", 76.79], ["sidetone", 5.71], ["echo", 2.53]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 2.41, 1.36, 0.76, 1.68, 1.57, 1.25, 0.98, 1.79, 1.15, 1.61, 0.4, 7.93, 0.98, 2.88, 0.98, 1.49, 2.76, 7.35, 0.73, 0.88, 1.36, 4.57, 0.24, 1.39, 1.48, 0.61, 0.68, 0.44, 0.8, 0.94, 1.02, 1.53, 0.52, 1.13]} \ No newline at end of file diff --git a/annotations_1/Qf_EPkVA31c_filtered.json b/annotations_1/Qf_EPkVA31c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c417dd8c1da1edfba26061537e8918b1da8b3543 --- /dev/null +++ b/annotations_1/Qf_EPkVA31c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.36], [12.0, 12.19], [13.0, 13.83], [16.0, 17.12], [20.0, 20.01], [22.0, 22.54], [27.0, 27.35], [31.0, 31.11], [32.0, 32.81], [35.0, 34.77], [36.0, 36.46], [37.0, 37.27], [37.0, 38.01], [39.0, 39.04], [43.0, 43.9], [46.0, 45.89], [48.0, 48.88], [49.0, 50.11], [55.0, 56.27], [57.0, 57.25], [58.0, 58.73], [62.0, 61.75], [63.0, 64.07], [66.0, 66.06], [66.0, 72.18], [74.0, 75.2], [77.0, 77.11], [79.0, 79.42], [80.0, 80.84], [86.0, 86.64], [87.0, 88.48], [89.0, 90.0], [94.0, 94.14], [95.0, 94.86], [96.0, 96.74], [97.0, 96.8], [98.0, 102.32], [103.0, 103.35], [104.0, 104.35], [105.0, 104.99], [106.0, 107.77], [109.0, 110.05], [112.0, 113.07], [113.0, 113.68], [116.0, 116.34], [118.0, 118.93], [120.0, 121.29], [122.0, 122.77], [124.0, 124.51], [127.0, 127.01], [128.0, 128.09], [129.0, 128.85], [132.0, 133.73], [137.0, 137.47], [141.0, 142.32], [145.0, 145.2], [146.0, 146.28], [153.0, 154.47], [155.0, 156.46], [157.0, 157.57], [160.0, 160.32], [161.0, 161.37], [161.0, 164.32], [165.0, 167.53], [169.0, 170.55], [171.0, 171.46], [172.0, 172.12], [173.0, 178.09], [181.0, 182.21], [183.0, 183.51], [184.0, 184.15], [185.0, 187.05], [188.0, 188.77], [190.0, 189.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.82, 42.28, 0.0, 0.0, 0.0, 35.52, 0.0, 0.0, 0.0, 45.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 29.76], ["insect", 23.13], ["mosquito", 9.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 25.2], ["fly, housefly", 10.8], ["frog", 8.88]], [["cattle, bovinae", 34.78], ["moo", 28.22], ["livestock, farm animals, working animals", 22.05]], null, null, null, [["animal", 24.84], ["pig", 17.01], ["frog", 8.37]], null, null, null, [["livestock, farm animals, working animals", 38.7], ["moo", 33.58], ["cattle, bovinae", 20.88]], null, null], "duration": [0.36, 0.19, 0.83, 1.12, 0.01, 0.54, 0.35, 0.11, 0.81, -0.23, 0.46, 0.27, 1.01, 0.04, 0.9, -0.11, 0.88, 1.11, 1.27, 0.25, 0.73, -0.25, 1.07, 0.06, 6.18, 1.2, 0.11, 0.42, 0.84, 0.64, 1.48, 1.0, 0.14, -0.14, 0.74, -0.2, 4.32, 0.35, 0.35, -0.01, 1.77, 1.05, 1.07, 0.68, 0.34, 0.93, 1.29, 0.77, 0.51, 0.01, 0.09, -0.15, 1.73, 0.47, 1.32, 0.2, 0.28, 1.47, 1.46, 0.57, 0.32, 0.37, 3.32, 2.53, 1.55, 0.46, 0.12, 5.09, 1.21, 0.51, 0.15, 2.05, 0.77, -0.03]} \ No newline at end of file diff --git a/annotations_1/Qfv31xWBgGI_filtered.json b/annotations_1/Qfv31xWBgGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d7329906e4cb4e8a970ad305efd628ca11655c0 --- /dev/null +++ b/annotations_1/Qfv31xWBgGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.65], [8.0, 9.73], [10.0, 10.91], [12.0, 13.39], [15.0, 18.64], [19.0, 19.84], [21.0, 22.92], [23.0, 24.27], [25.0, 26.35], [27.0, 29.22], [32.0, 32.78], [34.0, 35.06], [35.0, 36.36], [37.0, 37.07], [38.0, 39.43], [42.0, 42.72], [44.0, 45.15], [47.0, 50.53], [52.0, 52.15], [54.0, 54.13], [61.0, 61.52], [62.0, 63.75], [66.0, 65.99], [69.0, 69.5], [71.0, 71.59], [73.0, 74.02], [75.0, 76.45], [81.0, 82.0], [84.0, 86.14], [94.0, 96.25], [98.0, 99.84], [101.0, 101.22], [105.0, 105.44], [106.0, 106.62], [107.0, 107.7], [108.0, 114.52], [117.0, 117.78], [119.0, 119.8], [121.0, 122.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 0.0, 0.0, 0.0, 90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 50.36, 0.0, 0.0, 0.0, 0.0, 0.0, 45.59, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.3], ["music", 7.0], ["buzz", 4.63]], null, null, null], "duration": [0.65, 1.73, 0.91, 1.39, 3.64, 0.84, 1.92, 1.27, 1.35, 2.22, 0.78, 1.06, 1.36, 0.07, 1.43, 0.72, 1.15, 3.53, 0.15, 0.13, 0.52, 1.75, -0.01, 0.5, 0.59, 1.02, 1.45, 1.0, 2.14, 2.25, 1.84, 0.22, 0.44, 0.62, 0.7, 6.52, 0.78, 0.8, 1.01]} \ No newline at end of file diff --git a/annotations_1/QgqXAXhRvYU_filtered.json b/annotations_1/QgqXAXhRvYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33aaae1c2eab6b7cb6e1439541f89a2f0c4b9eba --- /dev/null +++ b/annotations_1/QgqXAXhRvYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.09], [14.0, 15.3], [18.0, 18.23], [23.0, 27.03], [34.0, 35.41], [45.0, 44.79], [59.0, 61.32], [67.0, 68.05], [74.0, 74.12], [86.0, 86.14], [88.0, 101.68], [105.0, 123.57], [129.0, 151.83], [157.0, 160.61], [163.0, 163.29], [165.0, 167.0], [169.0, 169.53]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 64.63, 0.0, 0.0, 41.85, 0.0, 0.0, 0.0, 40.45, 31.78, 30.98, 30.68, 0.0, 31.93, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 19.53], ["throat clearing", 7.65], ["beatboxing", 5.8]], null, null, null, [["hum", 62.4], ["mains hum", 21.22], ["throbbing", 12.79]], [["scary music", 34.4], ["music", 34.31], ["hum", 11.27]], [["speech", 29.27], ["didgeridoo", 24.02], ["music", 17.33]], [["speech", 39.54], ["music", 10.39], ["fly, housefly", 3.38]], null, [["music", 27.85], ["speech", 12.79], ["fly, housefly", 6.07]], null], "duration": [1.09, 1.3, 0.23, 4.03, 1.41, -0.21, 2.32, 1.05, 0.12, 0.14, 13.68, 18.57, 22.83, 3.61, 0.29, 2.0, 0.53]} \ No newline at end of file diff --git a/annotations_1/Qgx38Vxw7Bc_filtered.json b/annotations_1/Qgx38Vxw7Bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22321ce09f184ec660dc27dfc2565cdc9a64a9ba --- /dev/null +++ b/annotations_1/Qgx38Vxw7Bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.94], [11.0, 11.16], [15.0, 15.45], [17.0, 17.98], [20.0, 26.25], [31.0, 33.37], [35.0, 34.89], [45.0, 45.4], [50.0, 50.7], [53.0, 54.14], [56.0, 57.72], [60.0, 61.43], [62.0, 62.68], [63.0, 64.1], [68.0, 68.99], [72.0, 71.96], [72.0, 75.14], [79.0, 80.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.62, 0.0, 0.0, 0.0, 75.23, 48.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 87.0], ["radio", 9.08], ["sidetone", 0.92]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.94, 0.16, 0.45, 0.98, 6.25, 2.37, -0.11, 0.4, 0.7, 1.14, 1.72, 1.43, 0.68, 1.1, 0.99, -0.04, 3.14, 1.81]} \ No newline at end of file diff --git a/annotations_1/QhZbpE7mdoU_filtered.json b/annotations_1/QhZbpE7mdoU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c78a79eb64893cf5dfc1237b0f3e344a0c215baa --- /dev/null +++ b/annotations_1/QhZbpE7mdoU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.48], [31.0, 32.0], [34.0, 34.67], [35.0, 36.86], [38.0, 86.54]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.48, 1.0, 0.67, 1.86, 48.54]} \ No newline at end of file diff --git a/annotations_1/QiCNpDYavbg_filtered.json b/annotations_1/QiCNpDYavbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af063c7ba99da23f8393217779afb7cd626875dc --- /dev/null +++ b/annotations_1/QiCNpDYavbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 35.06], [42.0, 52.96], [56.0, 56.15], [59.0, 60.78], [64.0, 66.29], [67.0, 78.33], [79.0, 89.6], [91.0, 92.4], [93.0, 96.65], [98.0, 99.57], [104.0, 104.45], [110.0, 112.68], [118.0, 119.21], [120.0, 121.04], [123.0, 124.07], [127.0, 127.55], [131.0, 132.85], [134.0, 134.87], [137.0, 140.43], [142.0, 145.03], [151.0, 154.72], [156.0, 165.47], [166.0, 167.43], [169.0, 168.93], [170.0, 174.16], [175.0, 181.74], [183.0, 184.06], [185.0, 189.5], [192.0, 193.14], [195.0, 196.55], [202.0, 203.35], [208.0, 210.0], [212.0, 212.79], [214.0, 215.7], [217.0, 218.66]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [46.09, 98.99, 0.0, 0.0, 99.96, 99.56, 88.28, 0.0, 82.79, 0.0, 0.0, 90.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 77.2, 84.98, 70.3, 0.0, 0.0, 65.44, 46.79, 0.0, 40.48, 0.0, 0.0, 0.0, 65.67, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 47.74], ["ambient music", 6.08], ["hum", 4.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 36.24], ["music", 32.45], ["speech", 5.5]], null, [["music", 42.2], ["harp", 6.3], ["singing bowl", 4.91]], null, null, null, null, null, null, null], "duration": [29.06, 10.96, 0.15, 1.78, 2.29, 11.33, 10.6, 1.4, 3.65, 1.57, 0.45, 2.68, 1.21, 1.04, 1.07, 0.55, 1.85, 0.87, 3.43, 3.03, 3.72, 9.47, 1.43, -0.07, 4.16, 6.74, 1.06, 4.5, 1.14, 1.55, 1.35, 2.0, 0.79, 1.7, 1.66]} \ No newline at end of file diff --git a/annotations_1/QiT-jk74QMw_filtered.json b/annotations_1/QiT-jk74QMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ed50260ea65711993ff770519993de709567264 --- /dev/null +++ b/annotations_1/QiT-jk74QMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 64.03], [65.0, 65.92], [68.0, 72.08], [74.0, 77.19], [79.0, 82.95], [84.0, 85.46], [87.0, 92.01], [94.0, 94.46], [96.0, 98.63], [99.0, 113.14], [114.0, 114.45], [118.0, 120.12], [124.0, 124.75], [128.0, 129.49], [130.0, 130.33]], "keep_status": [true, false, true, false, true, false, true, false, false, true, false, true, false, false, false], "silence_prob": [34.92, 0.0, 43.28, 50.26, 48.1, 0.0, 37.04, 0.0, 33.77, 31.32, 0.0, 32.93, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 24.32], ["mains hum", 18.34], ["speech", 16.58]], null, [["music", 27.74], ["speech", 25.82], ["mains hum", 8.21]], null, [["didgeridoo", 21.83], ["music", 19.57], ["speech", 17.84]], null, [["music", 25.6], ["thunk", 14.16], ["hum", 11.62]], null, [["music", 64.63], ["musical instrument", 5.94], ["guitar", 3.4]], [["hum", 32.94], ["mains hum", 20.34], ["whack, thwack", 7.92]], null, [["music", 20.81], ["didgeridoo", 10.47], ["hum", 8.92]], null, null, null], "duration": [8.03, 0.92, 4.08, 3.19, 3.95, 1.46, 5.01, 0.46, 2.63, 14.14, 0.45, 2.12, 0.75, 1.49, 0.33]} \ No newline at end of file diff --git a/annotations_1/QjZUS2455z8_filtered.json b/annotations_1/QjZUS2455z8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17c3f5f62340053a638a013ea27e465ad89e3c06 --- /dev/null +++ b/annotations_1/QjZUS2455z8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.8], [12.0, 19.31], [20.0, 20.92], [21.0, 22.57], [23.0, 26.25], [30.0, 34.16], [37.0, 38.87], [49.0, 50.63], [58.0, 65.2], [67.0, 72.76], [81.0, 85.87], [88.0, 88.28], [91.0, 91.67], [92.0, 92.5], [93.0, 93.53], [94.0, 94.39], [95.0, 94.86], [96.0, 96.99]], "keep_status": [false, true, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.86, 0.0, 0.0, 54.23, 32.91, 0.0, 0.0, 52.1, 34.51, 39.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 28.36], ["mosquito", 7.09], ["fly, housefly", 6.12]], null, null, null, [["speech", 43.89], ["sidetone", 17.63], ["quack", 7.87]], null, null, null, [["speech", 29.86], ["fart", 14.8], ["whale vocalization", 5.49]], [["animal", 13.05], ["grunt", 6.52], ["livestock, farm animals, working animals", 5.45]], null, null, null, null, null, null, null], "duration": [-0.2, 7.31, 0.92, 1.57, 3.25, 4.16, 1.87, 1.63, 7.2, 5.76, 4.87, 0.28, 0.67, 0.5, 0.53, 0.39, -0.14, 0.99]} \ No newline at end of file diff --git a/annotations_1/Qk1y1yVQkJQ_filtered.json b/annotations_1/Qk1y1yVQkJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fc62ca1f2b3f35809f0b0f10c5b7a2fbdf805d5 --- /dev/null +++ b/annotations_1/Qk1y1yVQkJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.9], [17.0, 18.08], [21.0, 21.98], [34.0, 35.97], [43.0, 45.1], [55.0, 60.57], [69.0, 97.46], [104.0, 115.91], [118.0, 118.42]], "keep_status": [false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.37, 33.06, 34.87, 39.49, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 10.54], ["music", 10.16], ["mains hum", 3.7]], [["crowd", 13.53], ["cheering", 12.62], ["speech", 12.06]], [["music", 61.26], ["theremin", 11.88], ["synthesizer", 8.88]], [["music", 69.58], ["didgeridoo", 8.45], ["musical instrument", 1.59]], null], "duration": [1.9, 1.08, 0.98, 1.97, 2.1, 5.57, 28.46, 11.91, 0.42]} \ No newline at end of file diff --git a/annotations_1/QkKXJ82vfJU_filtered.json b/annotations_1/QkKXJ82vfJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/QkKXJ82vfJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/QkrYlP8-Cmo_filtered.json b/annotations_1/QkrYlP8-Cmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52ddf67849c6122c454524e9869eb65cdc2dc85f --- /dev/null +++ b/annotations_1/QkrYlP8-Cmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 34.62], [37.0, 37.07], [38.0, 38.6], [44.0, 48.71], [56.0, 76.37], [78.0, 85.82], [89.0, 90.93], [92.0, 112.28], [116.0, 127.25], [132.0, 141.51], [143.0, 143.6], [146.0, 147.61], [149.0, 149.55], [151.0, 155.61], [156.0, 179.58], [185.0, 185.75], [186.0, 187.68], [189.0, 195.78]], "keep_status": [false, false, false, true, true, false, false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.6, 34.36, 32.14, 0.0, 30.24, 33.34, 43.93, 0.0, 0.0, 0.0, 36.44, 34.61, 0.0, 0.0, 30.16], "audiomae_on_audioset": [null, null, null, [["music", 39.44], ["speech", 13.72], ["quack", 7.53]], [["speech", 25.44], ["fly, housefly", 17.74], ["insect", 10.99]], [["music", 59.39], ["didgeridoo", 9.04], ["musical instrument", 4.78]], null, [["music", 65.13], ["throbbing", 3.36], ["electronic music", 3.02]], [["music", 43.23], ["whack, thwack", 8.23], ["speech", 5.27]], [["music", 43.66], ["speech", 30.57], ["hum", 3.76]], null, null, null, [["music", 43.13], ["thunk", 12.53], ["speech", 11.82]], [["music", 61.62], ["didgeridoo", 23.24], ["musical instrument", 3.09]], null, null, [["music", 47.22], ["speech", 17.15], ["whack, thwack", 7.16]]], "duration": [1.62, 0.07, 0.6, 4.71, 20.37, 7.82, 1.93, 20.28, 11.25, 9.51, 0.6, 1.61, 0.55, 4.61, 23.58, 0.75, 1.68, 6.78]} \ No newline at end of file diff --git a/annotations_1/QlDqtuo10fA_filtered.json b/annotations_1/QlDqtuo10fA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c754599a120c6064260662cd060b750a58311255 --- /dev/null +++ b/annotations_1/QlDqtuo10fA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.28], [9.0, 8.8], [17.0, 17.44], [21.0, 21.05], [25.0, 25.32], [28.0, 28.48], [32.0, 34.01], [35.0, 35.6], [36.0, 37.39], [39.0, 42.08], [43.0, 51.16], [52.0, 52.96], [54.0, 54.63], [56.0, 57.08], [67.0, 69.38], [73.0, 73.63], [75.0, 75.32], [77.0, 81.63], [83.0, 84.64], [86.0, 87.08], [88.0, 105.44], [112.0, 115.62], [119.0, 120.73], [123.0, 126.69], [127.0, 127.77], [131.0, 132.44]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, false, true, false, false, true, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.49, 0.0, 0.0, 33.39, 36.39, 0.0, 0.0, 0.0, 31.69, 0.0, 0.0, 31.34, 0.0, 0.0, 29.69, 30.51, 0.0, 30.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["synthesizer", 25.91], ["music", 19.14], ["whale vocalization", 10.99]], null, null, [["music", 44.94], ["hum", 19.96], ["mains hum", 10.27]], [["music", 37.66], ["hum", 16.7], ["throbbing", 14.83]], null, null, null, [["music", 48.38], ["throbbing", 11.07], ["noise", 5.35]], null, null, [["music", 53.95], ["boom", 5.13], ["smash, crash", 4.55]], null, null, [["hum", 22.16], ["music", 20.56], ["mains hum", 8.96]], [["livestock, farm animals, working animals", 10.91], ["music", 6.14], ["throbbing", 6.13]], null, [["throbbing", 20.48], ["music", 19.09], ["speech", 14.72]], null, null], "duration": [0.28, -0.2, 0.44, 0.05, 0.32, 0.48, 2.01, 0.6, 1.39, 3.08, 8.16, 0.96, 0.63, 1.08, 2.38, 0.63, 0.32, 4.63, 1.64, 1.08, 17.44, 3.62, 1.73, 3.69, 0.77, 1.44]} \ No newline at end of file diff --git a/annotations_1/QmEz0udgJsA_filtered.json b/annotations_1/QmEz0udgJsA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddfcf98c94a3a5a27103afeba0dc8399aebe904b --- /dev/null +++ b/annotations_1/QmEz0udgJsA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.62], [9.0, 9.75], [10.0, 62.28], [64.0, 65.87], [67.0, 70.51], [72.0, 89.19], [92.0, 115.92], [117.0, 117.42], [119.0, 124.29], [128.0, 132.19]], "keep_status": [false, false, false, false, true, false, false, false, false, false], "silence_prob": [58.05, 0.0, 0.0, 0.0, 48.91, 36.92, 34.34, 0.0, 53.72, 72.6], "audiomae_on_audioset": [null, null, null, null, [["speech", 57.52], ["music", 6.02], ["inside, small room", 3.24]], [["mains hum", 36.55], ["hum", 33.69], ["electric shaver, electric razor", 3.54]], [["music", 46.33], ["throbbing", 13.86], ["hum", 12.54]], null, null, null], "duration": [2.62, 0.75, 52.28, 1.87, 3.51, 17.19, 23.92, 0.42, 5.29, 4.19]} \ No newline at end of file diff --git a/annotations_1/QnDgw7XXaOU_filtered.json b/annotations_1/QnDgw7XXaOU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a184d81216fdbe09031e3294f358aeea81e0a085 --- /dev/null +++ b/annotations_1/QnDgw7XXaOU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.16], [20.0, 21.36], [23.0, 29.0], [31.0, 32.85], [35.0, 35.95], [37.0, 40.8], [41.0, 46.23], [47.0, 49.13], [50.0, 52.68], [54.0, 56.39], [57.0, 58.43], [59.0, 59.48], [62.0, 62.9], [65.0, 66.75], [68.0, 69.62], [73.0, 73.68], [74.0, 76.59], [78.0, 79.56], [83.0, 82.7], [83.0, 83.66], [86.0, 86.95], [87.0, 94.76], [96.0, 97.68], [102.0, 104.11], [110.0, 110.52], [112.0, 113.39], [116.0, 119.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.97, 0.0, 0.0, 65.09, 76.2, 99.9, 99.05, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.29, 0.0, 0.0, 0.0, 0.0, 72.75, 0.0, 94.37, 0.0, 0.0, 71.57], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 1.36, 6.0, 1.85, 0.95, 3.8, 5.23, 2.13, 2.68, 2.39, 1.43, 0.48, 0.9, 1.75, 1.62, 0.68, 2.59, 1.56, -0.3, 0.66, 0.95, 7.76, 1.68, 2.11, 0.52, 1.39, 3.1]} \ No newline at end of file diff --git a/annotations_1/QnX-Xgbi37I_filtered.json b/annotations_1/QnX-Xgbi37I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b46c462f01ca03936536a249591f1d5e84152fa5 --- /dev/null +++ b/annotations_1/QnX-Xgbi37I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 43.9], [45.0, 45.62], [47.0, 101.51]], "keep_status": [false, false, false], "silence_prob": [31.32, 0.0, 0.0], "audiomae_on_audioset": [[["music", 81.17], ["scary music", 5.36], ["grunt", 2.98]], null, null], "duration": [7.9, 0.62, 54.51]} \ No newline at end of file diff --git a/annotations_1/QoWIRCVeXBc_filtered.json b/annotations_1/QoWIRCVeXBc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f6241d80755cf20b9889125a9b13186db5ce6ce --- /dev/null +++ b/annotations_1/QoWIRCVeXBc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.42], [10.0, 10.08], [15.0, 14.99], [20.0, 21.09], [26.0, 28.71], [32.0, 36.27], [37.0, 37.96], [40.0, 40.74], [42.0, 43.19], [47.0, 47.65], [48.0, 49.25], [52.0, 54.23], [55.0, 55.78], [57.0, 57.28], [59.0, 59.46], [60.0, 60.86], [62.0, 62.92], [64.0, 66.41], [67.0, 68.96], [69.0, 71.49], [72.0, 79.17], [100.0, 100.18], [103.0, 103.47], [105.0, 106.34], [109.0, 109.12], [110.0, 110.56], [112.0, 112.89], [116.0, 116.45], [119.0, 119.15], [119.0, 121.64], [124.0, 124.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 64.63, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 65.32, 0.0, 99.9, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.91, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 0.08, -0.01, 1.09, 2.71, 4.27, 0.96, 0.74, 1.19, 0.65, 1.25, 2.23, 0.78, 0.28, 0.46, 0.86, 0.92, 2.41, 1.96, 2.49, 7.17, 0.18, 0.47, 1.34, 0.12, 0.56, 0.89, 0.45, 0.15, 2.64, 0.68]} \ No newline at end of file diff --git a/annotations_1/QpmECKEHSQs_filtered.json b/annotations_1/QpmECKEHSQs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..278d2078b3fdafb15f68ec19687b65ad990e7560 --- /dev/null +++ b/annotations_1/QpmECKEHSQs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.37], [20.0, 23.33], [24.0, 24.81], [26.0, 26.16], [30.0, 55.73], [58.0, 58.02], [62.0, 71.49], [72.0, 73.79], [74.0, 78.0], [79.0, 80.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.74, 0.0, 0.0, 28.92, 0.0, 99.16, 0.0, 55.74, 0.0], "audiomae_on_audioset": [null, [["music", 60.53], ["didgeridoo", 18.25], ["musical instrument", 5.78]], null, null, [["music", 69.04], ["didgeridoo", 14.0], ["electronic music", 3.35]], null, null, null, null, null], "duration": [0.37, 3.33, 0.81, 0.16, 25.73, 0.02, 9.49, 1.79, 4.0, 1.5]} \ No newline at end of file diff --git a/annotations_1/QqFuGUbvgnQ_filtered.json b/annotations_1/QqFuGUbvgnQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..303f81972dea049eb50287ff730d578a1f15e5ff --- /dev/null +++ b/annotations_1/QqFuGUbvgnQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.17], [9.0, 14.45], [16.0, 18.3], [21.0, 24.87], [32.0, 36.66], [39.0, 47.34], [49.0, 49.4], [55.0, 63.0], [74.0, 83.67], [86.0, 102.12], [104.0, 103.69], [104.0, 106.24], [109.0, 109.46], [110.0, 140.68], [143.0, 150.74], [154.0, 168.79]], "keep_status": [true, false, true, true, true, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [31.27, 33.38, 41.5, 34.93, 34.46, 41.01, 0.0, 38.11, 30.17, 29.19, 0.0, 29.03, 0.0, 0.0, 39.64, 33.67], "audiomae_on_audioset": [[["music", 37.62], ["theremin", 9.31], ["hum", 4.9]], [["music", 62.66], ["speech", 4.01], ["hum", 3.55]], [["music", 19.52], ["speech", 6.87], ["throbbing", 6.07]], [["music", 28.82], ["hum", 20.83], ["throbbing", 10.93]], [["music", 50.27], ["speech", 9.35], ["sidetone", 8.35]], [["music", 38.74], ["throbbing", 20.84], ["hum", 19.43]], null, [["speech", 26.47], ["music", 20.89], ["sheep", 6.24]], [["music", 74.19], ["electronic music", 2.56], ["throbbing", 2.51]], [["music", 54.81], ["throbbing", 14.5], ["speech", 10.07]], null, [["music", 57.2], ["electronic music", 5.66], ["throbbing", 4.97]], null, null, [["throbbing", 34.77], ["music", 29.8], ["hum", 6.62]], [["music", 64.03], ["throbbing", 5.4], ["electronic music", 5.3]]], "duration": [2.17, 5.45, 2.3, 3.87, 4.66, 8.34, 0.4, 8.0, 9.67, 16.12, -0.31, 2.24, 0.46, 30.68, 7.74, 14.79]} \ No newline at end of file diff --git a/annotations_1/QqQYNj15OfI_filtered.json b/annotations_1/QqQYNj15OfI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6624e578b26792c991b1b37ac6edc10647e7e058 --- /dev/null +++ b/annotations_1/QqQYNj15OfI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.8], [13.0, 22.82], [23.0, 27.04], [37.0, 38.13], [42.0, 42.08], [57.0, 60.45], [64.0, 83.1], [85.0, 85.58], [89.0, 89.87], [93.0, 94.02], [95.0, 96.85], [102.0, 103.25], [117.0, 119.01], [121.0, 121.95], [127.0, 127.47], [131.0, 131.9], [138.0, 139.48], [141.0, 143.41], [145.0, 145.86], [151.0, 152.12], [157.0, 158.65], [160.0, 161.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.34, 54.5, 90.78, 0.0, 0.0, 100.0, 45.98, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["cattle, bovinae", 33.06], ["moo", 31.15], ["livestock, farm animals, working animals", 21.52]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.8, 9.82, 4.04, 1.13, 0.08, 3.45, 19.1, 0.58, 0.87, 1.02, 1.85, 1.25, 2.01, 0.95, 0.47, 0.9, 1.48, 2.41, 0.86, 1.12, 1.65, 1.77]} \ No newline at end of file diff --git a/annotations_1/QsCBiq5cET4_filtered.json b/annotations_1/QsCBiq5cET4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b19ad733b34f24321e69cf91afba305064085b8b --- /dev/null +++ b/annotations_1/QsCBiq5cET4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 16.95], [18.0, 25.59], [26.0, 33.96], [35.0, 36.26], [41.0, 42.55], [46.0, 47.22], [48.0, 50.62], [52.0, 54.18], [56.0, 57.08], [59.0, 64.05], [67.0, 67.74], [70.0, 70.39], [72.0, 71.81]], "keep_status": [false, false, false, false, false, false, true, true, false, true, false, false, false], "silence_prob": [48.23, 42.88, 37.06, 0.0, 0.0, 0.0, 43.61, 49.0, 0.0, 37.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 65.36], ["synthesizer", 12.87], ["musical instrument", 4.38]], [["music", 68.76], ["chirp tone", 6.41], ["electronic music", 2.23]], [["music", 64.06], ["musical instrument", 5.57], ["guitar", 4.98]], null, null, null, [["music", 24.52], ["dog", 12.72], ["animal", 12.6]], [["music", 51.02], ["speech", 13.28], ["electronic music", 3.52]], null, [["music", 54.33], ["speech", 9.06], ["animal", 3.64]], null, null, null], "duration": [11.95, 7.59, 7.96, 1.26, 1.55, 1.22, 2.62, 2.18, 1.08, 5.05, 0.74, 0.39, -0.19]} \ No newline at end of file diff --git a/annotations_1/QsP5Y1-eUIM_filtered.json b/annotations_1/QsP5Y1-eUIM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fcb9efd9aeacf27a75bb183847304a5e743d0da --- /dev/null +++ b/annotations_1/QsP5Y1-eUIM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.26], [6.0, 6.56], [7.0, 10.07], [11.0, 11.08], [12.0, 12.31], [13.0, 13.61], [20.0, 21.51], [22.0, 23.36], [25.0, 26.49], [27.0, 33.94], [37.0, 37.79], [40.0, 42.42], [51.0, 71.34], [84.0, 112.73], [124.0, 127.3], [131.0, 134.06], [136.0, 174.63], [178.0, 178.36], [181.0, 182.07]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [41.98, 0.0, 33.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.63, 0.0, 34.98, 29.32, 29.3, 29.09, 29.1, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 16.7], ["sidetone", 15.77], ["music", 11.55]], null, [["music", 74.92], ["synthesizer", 6.8], ["musical instrument", 4.33]], null, null, null, null, null, null, [["music", 79.39], ["musical instrument", 2.7], ["sampler", 1.36]], null, [["music", 76.42], ["electronic music", 3.71], ["synthesizer", 2.88]], [["music", 79.82], ["throbbing", 2.26], ["speech", 1.92]], [["music", 81.43], ["didgeridoo", 2.04], ["sampler", 1.52]], [["music", 73.82], ["sampler", 2.6], ["musical instrument", 1.97]], [["music", 62.33], ["sampler", 4.12], ["throbbing", 2.64]], null, null, null], "duration": [3.26, 0.56, 3.07, 0.08, 0.31, 0.61, 1.51, 1.36, 1.49, 6.94, 0.79, 2.42, 20.34, 28.73, 3.3, 3.06, 38.63, 0.36, 1.07]} \ No newline at end of file diff --git a/annotations_1/QsSD6_V2IYk_filtered.json b/annotations_1/QsSD6_V2IYk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6623917795f2a2aeaefcca3e2e77e9033d309a13 --- /dev/null +++ b/annotations_1/QsSD6_V2IYk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.85], [11.0, 11.82], [13.0, 15.8], [16.0, 17.88], [19.0, 20.28], [21.0, 22.01], [24.0, 24.41], [26.0, 28.14], [29.0, 29.93], [33.0, 34.59], [38.0, 39.21], [42.0, 44.51], [46.0, 47.36], [48.0, 48.09], [48.0, 49.05], [53.0, 61.37], [63.0, 63.81], [67.0, 71.39], [74.0, 74.8], [76.0, 76.96], [81.0, 81.67], [87.0, 87.69], [92.0, 94.88], [95.0, 101.95], [102.0, 104.16], [105.0, 115.03], [117.0, 117.24], [119.0, 119.13], [121.0, 121.93], [125.0, 126.1], [129.0, 129.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.44, 0.0, 60.7, 0.0, 0.0, 0.0, 0.0, 68.93, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 37.09, 0.0, 37.53, 0.0, 0.0, 0.0, 0.0, 78.21, 38.63, 39.86, 53.04, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.67], ["music", 15.26], ["sidetone", 14.31]], null, [["music", 46.26], ["speech", 38.4], ["musical instrument", 3.15]], null, null, null, null, null, [["music", 41.79], ["speech", 18.43], ["guitar", 12.18]], [["speech", 35.79], ["music", 24.43], ["musical instrument", 12.3]], null, null, null, null, null, null], "duration": [2.85, 0.82, 2.8, 1.88, 1.28, 1.01, 0.41, 2.14, 0.93, 1.59, 1.21, 2.51, 1.36, 0.09, 1.05, 8.37, 0.81, 4.39, 0.8, 0.96, 0.67, 0.69, 2.88, 6.95, 2.16, 10.03, 0.24, 0.13, 0.93, 1.1, 0.54]} \ No newline at end of file diff --git a/annotations_1/Qt6F9WCle9k_filtered.json b/annotations_1/Qt6F9WCle9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79b8e5604f72ed2460d134a37dc5fbbe107be46d --- /dev/null +++ b/annotations_1/Qt6F9WCle9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.51], [8.0, 9.53], [11.0, 15.04], [16.0, 16.04], [16.0, 18.06], [24.0, 25.39], [28.0, 28.93], [30.0, 31.95], [34.0, 44.24], [46.0, 46.65], [48.0, 57.16], [57.0, 59.24], [61.0, 61.03], [70.0, 71.31], [72.0, 77.57], [80.0, 80.54], [81.0, 84.59], [85.0, 88.37], [89.0, 89.43], [90.0, 90.63], [91.0, 92.37], [94.0, 96.72], [99.0, 101.48], [105.0, 112.63], [115.0, 117.88], [119.0, 120.53], [122.0, 126.25], [128.0, 132.24], [134.0, 136.98], [140.0, 150.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.4, 0.0, 99.31, 0.0, 0.0, 0.0, 60.7, 0.0, 99.82, 77.87, 0.0, 0.0, 47.31, 0.0, 81.17, 56.4, 0.0, 0.0, 0.0, 99.87, 99.84, 72.46, 98.86, 0.0, 99.96, 99.95, 78.55, 99.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 52.14], ["tuning fork", 26.83], ["chirp tone", 4.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 1.53, 4.04, 0.04, 2.06, 1.39, 0.93, 1.95, 10.24, 0.65, 9.16, 2.24, 0.03, 1.31, 5.57, 0.54, 3.59, 3.37, 0.43, 0.63, 1.37, 2.72, 2.48, 7.63, 2.88, 1.53, 4.25, 4.24, 2.98, 10.04]} \ No newline at end of file diff --git a/annotations_1/QtQpMjuyHnM_filtered.json b/annotations_1/QtQpMjuyHnM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3a69d68336330915d35658afbd2c4e1b04e2202 --- /dev/null +++ b/annotations_1/QtQpMjuyHnM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 39.06], [44.0, 44.17], [47.0, 55.12], [56.0, 129.52], [132.0, 133.25]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 32.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 34.53], ["buzz", 6.17], ["speech", 4.79]], null, null], "duration": [36.06, 0.17, 8.12, 73.52, 1.25]} \ No newline at end of file diff --git a/annotations_1/QtVEk0oKtkM_filtered.json b/annotations_1/QtVEk0oKtkM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3581c424114c3d46c0a18b2876ed67107748181 --- /dev/null +++ b/annotations_1/QtVEk0oKtkM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.12], [13.0, 13.88], [15.0, 17.56], [23.0, 25.69], [27.0, 27.84], [31.0, 32.93], [34.0, 34.96], [36.0, 37.15], [39.0, 39.75], [43.0, 46.79], [48.0, 52.95], [54.0, 56.52], [58.0, 62.7], [63.0, 64.64], [67.0, 70.19], [72.0, 73.26], [75.0, 75.47], [76.0, 76.72], [78.0, 82.8], [87.0, 90.37], [91.0, 92.16], [93.0, 95.0], [96.0, 97.87], [100.0, 101.22], [102.0, 103.62], [105.0, 111.15], [112.0, 113.04], [114.0, 116.55], [118.0, 119.4], [120.0, 121.54], [122.0, 125.68], [126.0, 133.89], [135.0, 135.68], [137.0, 138.38], [139.0, 142.01], [143.0, 145.56], [147.0, 148.26], [149.0, 150.6], [151.0, 152.04], [153.0, 153.45], [156.0, 161.65]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.28, 0.0, 45.88, 36.66, 0.0, 0.0, 0.0, 0.0, 0.0, 51.44, 56.1, 56.48, 74.6, 0.0, 63.74, 0.0, 0.0, 0.0, 51.66, 61.37, 0.0, 59.07, 0.0, 0.0, 0.0, 58.55, 0.0, 49.59, 0.0, 0.0, 52.92, 42.86, 0.0, 0.0, 37.17, 46.43, 0.0, 0.0, 0.0, 0.0, 52.1], "audiomae_on_audioset": [[["music", 32.45], ["hum", 24.95], ["whale vocalization", 7.37]], null, [["music", 25.29], ["hum", 21.73], ["electronic music", 8.27]], [["speech", 44.63], ["music", 13.25], ["hum", 12.22]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.27], ["quack", 26.28], ["duck", 10.89]], null, null, null, [["music", 35.37], ["speech", 24.98], ["hum", 12.96]], null, null, [["music", 57.31], ["hum", 7.02], ["pulse", 5.96]], [["hum", 45.03], ["mains hum", 14.97], ["throbbing", 13.42]], null, null, null, null, null], "duration": [9.12, 0.88, 2.56, 2.69, 0.84, 1.93, 0.96, 1.15, 0.75, 3.79, 4.95, 2.52, 4.7, 1.64, 3.19, 1.26, 0.47, 0.72, 4.8, 3.37, 1.16, 2.0, 1.87, 1.22, 1.62, 6.15, 1.04, 2.55, 1.4, 1.54, 3.68, 7.89, 0.68, 1.38, 3.01, 2.56, 1.26, 1.6, 1.04, 0.45, 5.65]} \ No newline at end of file diff --git a/annotations_1/QuZ_ak2qxeE_filtered.json b/annotations_1/QuZ_ak2qxeE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddebae36a1e66e6db8f7dc8795a35f9ae59e9d1b --- /dev/null +++ b/annotations_1/QuZ_ak2qxeE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.41], [7.0, 8.26], [9.0, 10.79], [11.0, 11.67], [14.0, 14.79], [16.0, 16.83], [18.0, 18.84], [22.0, 23.38], [24.0, 24.19], [26.0, 26.16], [29.0, 30.0], [31.0, 31.41], [32.0, 33.72], [35.0, 35.82], [38.0, 38.77], [43.0, 43.53], [44.0, 45.67], [46.0, 48.64], [50.0, 51.65], [55.0, 55.93], [57.0, 57.33], [58.0, 58.36], [63.0, 63.58], [69.0, 69.77], [71.0, 70.92], [73.0, 73.21], [74.0, 75.57], [76.0, 77.09], [78.0, 81.08], [82.0, 83.86], [84.0, 87.13], [88.0, 89.31], [91.0, 92.01], [94.0, 98.74], [100.0, 100.8], [101.0, 102.41], [105.0, 106.12], [108.0, 108.21], [111.0, 111.77], [117.0, 118.4], [120.0, 121.26], [123.0, 123.13], [124.0, 129.3], [130.0, 130.81], [132.0, 132.75], [136.0, 137.78], [138.0, 138.97], [141.0, 141.3], [143.0, 144.83], [146.0, 146.55], [148.0, 152.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11, 0.0, 84.8, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.12], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.33], ["musical instrument", 6.81], ["theremin", 6.74]], null, null, null, null, null, null, null, [["fly, housefly", 25.61], ["mosquito", 16.17], ["insect", 8.2]]], "duration": [0.41, 1.26, 1.79, 0.67, 0.79, 0.83, 0.84, 1.38, 0.19, 0.16, 1.0, 0.41, 1.72, 0.82, 0.77, 0.53, 1.67, 2.64, 1.65, 0.93, 0.33, 0.36, 0.58, 0.77, -0.08, 0.21, 1.57, 1.09, 3.08, 1.86, 3.13, 1.31, 1.01, 4.74, 0.8, 1.41, 1.12, 0.21, 0.77, 1.4, 1.26, 0.13, 5.3, 0.81, 0.75, 1.78, 0.97, 0.3, 1.83, 0.55, 4.22]} \ No newline at end of file diff --git a/annotations_1/QvVUxPcMZQE_filtered.json b/annotations_1/QvVUxPcMZQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1621878715d58f68ef4cc731cc57ff02823c8ba5 --- /dev/null +++ b/annotations_1/QvVUxPcMZQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.44], [4.0, 8.24], [17.0, 17.39], [19.0, 19.94], [28.0, 29.61], [30.0, 31.94], [34.0, 44.78], [51.0, 51.56], [55.0, 55.44], [57.0, 64.07], [66.0, 72.25], [73.0, 74.33], [76.0, 80.52], [85.0, 94.85], [95.0, 96.3]], "keep_status": [false, true, false, false, false, false, true, false, false, true, false, false, true, true, false], "silence_prob": [0.0, 38.0, 0.0, 0.0, 0.0, 0.0, 36.43, 0.0, 0.0, 32.98, 29.6, 0.0, 35.43, 33.45, 0.0], "audiomae_on_audioset": [null, [["speech", 31.97], ["music", 24.65], ["guitar", 9.0]], null, null, null, null, [["speech", 37.89], ["music", 10.41], ["hum", 8.61]], null, null, [["hum", 23.07], ["mains hum", 22.18], ["music", 9.18]], [["breaking", 47.66], ["speech", 33.3], ["smash, crash", 6.67]], null, [["speech", 52.88], ["hum", 6.94], ["mains hum", 4.8]], [["speech", 54.5], ["music", 7.15], ["noise", 4.94]], null], "duration": [1.44, 4.24, 0.39, 0.94, 1.61, 1.94, 10.78, 0.56, 0.44, 7.07, 6.25, 1.33, 4.52, 9.85, 1.3]} \ No newline at end of file diff --git a/annotations_1/QvdszN3x7M4_filtered.json b/annotations_1/QvdszN3x7M4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c883903f174c6f2a1b242c579c7a22ae6994c54 --- /dev/null +++ b/annotations_1/QvdszN3x7M4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 24.68], [26.0, 27.57], [28.0, 29.74], [31.0, 32.07], [33.0, 34.8], [36.0, 49.15], [49.0, 64.86], [71.0, 76.5], [77.0, 125.79], [127.0, 130.15], [131.0, 140.78], [141.0, 144.76], [145.0, 145.83]], "keep_status": [true, false, false, false, false, true, true, true, false, false, false, true, false], "silence_prob": [43.69, 0.0, 0.0, 0.0, 0.0, 38.62, 34.62, 39.58, 0.0, 31.33, 30.58, 29.3, 0.0], "audiomae_on_audioset": [[["speech", 20.75], ["thunk", 11.16], ["hum", 8.92]], null, null, null, null, [["animal", 22.66], ["speech", 16.16], ["dog", 6.22]], [["animal", 47.02], ["dog", 8.83], ["livestock, farm animals, working animals", 5.93]], [["speech", 55.94], ["fart", 8.02], ["music", 4.83]], null, [["music", 57.68], ["noise", 14.92], ["didgeridoo", 4.29]], [["music", 39.92], ["fart", 22.28], ["didgeridoo", 20.9]], [["music", 52.46], ["breaking", 7.84], ["reverberation", 3.77]], null], "duration": [4.68, 1.57, 1.74, 1.07, 1.8, 13.15, 15.86, 5.5, 48.79, 3.15, 9.78, 3.76, 0.83]} \ No newline at end of file diff --git a/annotations_1/QvfcWxGZv9M_filtered.json b/annotations_1/QvfcWxGZv9M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5062e650c906e7178fec74d0d2801aa7ba6da0f2 --- /dev/null +++ b/annotations_1/QvfcWxGZv9M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.89], [11.0, 14.25], [15.0, 15.01], [16.0, 16.83], [19.0, 21.34], [29.0, 30.05], [36.0, 49.38], [51.0, 51.85], [53.0, 57.11], [63.0, 64.79], [68.0, 68.49], [69.0, 71.96], [75.0, 78.6], [96.0, 95.99], [100.0, 104.35], [108.0, 108.3], [109.0, 109.39], [110.0, 113.0], [115.0, 114.57], [123.0, 128.11], [131.0, 132.07], [143.0, 143.67], [144.0, 144.21], [148.0, 150.06], [152.0, 152.64], [155.0, 156.78], [158.0, 159.54], [160.0, 163.09], [166.0, 167.36]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 45.46, 0.0, 0.0, 34.21, 0.0, 34.07, 0.0, 33.81, 0.0, 0.0, 37.64, 58.38, 0.0, 43.15, 0.0, 0.0, 91.64, 0.0, 34.65, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 43.61, 0.0], "audiomae_on_audioset": [null, [["music", 25.24], ["grunt", 15.55], ["fart", 4.82]], null, null, [["music", 32.42], ["fart", 22.85], ["speech", 17.0]], null, [["music", 52.78], ["groan", 11.67], ["whack, thwack", 8.59]], null, [["music", 38.54], ["fart", 17.14], ["mosquito", 11.83]], null, null, [["animal", 39.94], ["sheep", 22.61], ["livestock, farm animals, working animals", 15.43]], null, null, [["speech", 77.4], ["animal", 2.44], ["crushing", 2.3]], null, null, null, null, [["livestock, farm animals, working animals", 32.09], ["moo", 15.3], ["cattle, bovinae", 12.69]], null, null, null, null, null, null, null, [["music", 38.98], ["guitar", 6.52], ["plucked string instrument", 5.65]], null], "duration": [0.89, 3.25, 0.01, 0.83, 2.34, 1.05, 13.38, 0.85, 4.11, 1.79, 0.49, 2.96, 3.6, -0.01, 4.35, 0.3, 0.39, 3.0, -0.43, 5.11, 1.07, 0.67, 0.21, 2.06, 0.64, 1.78, 1.54, 3.09, 1.36]} \ No newline at end of file diff --git a/annotations_1/QwkW-Rbo3kE_filtered.json b/annotations_1/QwkW-Rbo3kE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f90e1d6f92924e37d6cec0e19f34025c2c66546b --- /dev/null +++ b/annotations_1/QwkW-Rbo3kE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.73], [3.0, 3.65], [6.0, 7.21], [17.0, 23.23], [24.0, 24.73], [29.0, 30.08], [31.0, 33.17], [36.0, 35.94], [39.0, 39.23], [41.0, 41.03], [45.0, 45.89], [47.0, 56.03], [56.0, 59.07], [63.0, 65.26], [66.0, 66.56], [67.0, 67.83], [72.0, 73.03], [76.0, 76.13], [78.0, 78.71], [82.0, 82.05], [83.0, 83.4], [95.0, 95.49], [101.0, 101.58], [102.0, 103.32], [106.0, 107.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.55, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 0.0, 90.08, 99.88, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 40.11], ["creak", 39.69], ["electric shaver, electric razor", 2.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.65, 1.21, 6.23, 0.73, 1.08, 2.17, -0.06, 0.23, 0.03, 0.89, 9.03, 3.07, 2.26, 0.56, 0.83, 1.03, 0.13, 0.71, 0.05, 0.4, 0.49, 0.58, 1.32, 1.28]} \ No newline at end of file diff --git a/annotations_1/Qwr539L6kCI_filtered.json b/annotations_1/Qwr539L6kCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a35e748977c39dbee694ddf5c37703abc0d6535a --- /dev/null +++ b/annotations_1/Qwr539L6kCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.24], [19.0, 18.84], [22.0, 22.05], [23.0, 24.24], [31.0, 30.87], [37.0, 38.28], [49.0, 52.17], [56.0, 58.33], [59.0, 59.83], [66.0, 66.04], [69.0, 69.92]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.41, 29.35, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["frog", 31.01], ["insect", 22.34], ["mosquito", 13.75]], [["fire alarm", 48.94], ["music", 8.99], ["buzzer", 6.15]], null, null, null], "duration": [1.24, -0.16, 0.05, 1.24, -0.13, 1.28, 3.17, 2.33, 0.83, 0.04, 0.92]} \ No newline at end of file diff --git a/annotations_1/Qwx9wZgxUoQ_filtered.json b/annotations_1/Qwx9wZgxUoQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..995d8000b2e474b0843193c729a0f71982750206 --- /dev/null +++ b/annotations_1/Qwx9wZgxUoQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 69.67]], "keep_status": [false], "silence_prob": [29.98], "audiomae_on_audioset": [[["music", 62.2], ["hum", 8.3], ["synthesizer", 6.78]]], "duration": [9.67]} \ No newline at end of file diff --git a/annotations_1/QxReNyiIprw_filtered.json b/annotations_1/QxReNyiIprw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ceac4e9f41d61dd21da234566ecdcc0bd78e6cef --- /dev/null +++ b/annotations_1/QxReNyiIprw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.88], [22.0, 21.91], [24.0, 30.89], [31.0, 30.94], [31.0, 55.98], [63.0, 63.09], [64.0, 74.48], [77.0, 77.41], [79.0, 133.15], [135.0, 136.65], [139.0, 139.09], [140.0, 141.13], [142.0, 153.49], [155.0, 154.99], [156.0, 158.01], [161.0, 172.3], [174.0, 179.56], [180.0, 182.17]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 30.64, 0.0, 28.88, 0.0, 29.04, 0.0, 0.0, 0.0, 0.0, 0.0, 34.69, 0.0, 31.5, 30.12, 31.25, 31.01], "audiomae_on_audioset": [null, null, [["speech", 28.6], ["music", 25.87], ["hum", 10.47]], null, [["music", 29.62], ["mains hum", 22.64], ["hum", 22.12]], null, [["sidetone", 31.97], ["mains hum", 19.62], ["hum", 19.34]], null, null, null, null, null, [["sidetone", 35.39], ["speech", 32.92], ["music", 10.64]], null, [["speech", 35.95], ["music", 24.36], ["didgeridoo", 6.69]], [["music", 48.49], ["throbbing", 17.18], ["hum", 16.36]], [["speech", 25.78], ["music", 17.27], ["bagpipes", 3.38]], [["mosquito", 17.23], ["music", 16.6], ["cattle, bovinae", 10.26]]], "duration": [-0.12, -0.09, 6.89, -0.06, 24.98, 0.09, 10.48, 0.41, 54.15, 1.65, 0.09, 1.13, 11.49, -0.01, 2.01, 11.3, 5.56, 2.17]} \ No newline at end of file diff --git a/annotations_1/QxrBZStJOGk_filtered.json b/annotations_1/QxrBZStJOGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d82be3ac86d0a09c4c3637b0460b40f33a03cdd9 --- /dev/null +++ b/annotations_1/QxrBZStJOGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.83], [20.0, 20.33], [25.0, 26.33], [27.0, 27.77], [28.0, 29.62], [30.0, 31.72], [32.0, 32.48], [34.0, 34.43], [39.0, 39.43], [41.0, 41.28], [47.0, 48.3], [50.0, 50.5], [51.0, 51.16], [54.0, 56.29], [57.0, 56.88], [57.0, 58.01], [59.0, 61.91], [73.0, 74.48], [83.0, 84.62], [87.0, 86.76], [89.0, 88.94], [92.0, 92.03], [96.0, 96.74], [99.0, 99.22], [104.0, 106.15], [107.0, 109.19], [112.0, 112.13], [114.0, 116.11], [119.0, 120.55], [125.0, 126.06], [127.0, 127.58], [129.0, 129.83], [132.0, 132.02], [134.0, 135.65], [138.0, 143.63], [144.0, 146.53], [147.0, 148.41], [149.0, 149.55], [153.0, 155.55], [157.0, 159.66], [161.0, 163.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 99.99, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.64, 40.77, 0.0, 0.0, 42.51, 49.5, 45.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 24.99], ["hum", 21.79], ["thunk", 10.65]], [["music", 44.12], ["speech", 24.5], ["musical instrument", 1.63]], null, null, [["speech", 37.73], ["music", 15.16], ["singing bowl", 12.5]], [["gong", 84.35], ["music", 4.65], ["singing bowl", 3.87]], [["music", 31.81], ["mains hum", 8.47], ["synthesizer", 5.24]]], "duration": [1.83, 0.33, 1.33, 0.77, 1.62, 1.72, 0.48, 0.43, 0.43, 0.28, 1.3, 0.5, 0.16, 2.29, -0.12, 1.01, 2.91, 1.48, 1.62, -0.24, -0.06, 0.03, 0.74, 0.22, 2.15, 2.19, 0.13, 2.11, 1.55, 1.06, 0.58, 0.83, 0.02, 1.65, 5.63, 2.53, 1.41, 0.55, 2.55, 2.66, 2.65]} \ No newline at end of file diff --git a/annotations_1/QyeYgwO4ADg_filtered.json b/annotations_1/QyeYgwO4ADg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7311a64f866d50c3621dc90e973ff0be3ee1ab59 --- /dev/null +++ b/annotations_1/QyeYgwO4ADg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 33.45], [34.0, 46.16], [48.0, 48.73], [50.0, 50.79], [53.0, 54.6], [55.0, 56.59], [58.0, 58.95], [59.0, 59.37], [61.0, 61.25], [62.0, 63.12], [64.0, 64.5], [68.0, 68.98], [71.0, 77.6], [79.0, 84.45], [86.0, 86.8], [91.0, 91.71], [96.0, 96.69], [101.0, 102.25], [110.0, 111.62], [117.0, 116.94], [118.0, 118.83], [120.0, 120.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [70.02, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [25.45, 12.16, 0.73, 0.79, 1.6, 1.59, 0.95, 0.37, 0.25, 1.12, 0.5, 0.98, 6.6, 5.45, 0.8, 0.71, 0.69, 1.25, 1.62, -0.06, 0.83, 0.56]} \ No newline at end of file diff --git a/annotations_1/QyvbqZqQ0xI_filtered.json b/annotations_1/QyvbqZqQ0xI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..614dfb04ae40f96444bb981ece24d7323def8f7a --- /dev/null +++ b/annotations_1/QyvbqZqQ0xI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.74], [7.0, 8.14], [10.0, 10.56], [12.0, 13.12], [14.0, 15.13], [15.0, 18.44], [20.0, 25.19], [26.0, 28.0], [29.0, 28.88], [34.0, 35.63], [39.0, 39.28], [44.0, 44.95], [47.0, 47.63], [49.0, 49.32], [50.0, 50.94], [57.0, 58.13], [59.0, 58.85], [61.0, 61.26], [75.0, 75.95], [77.0, 79.03], [80.0, 80.87], [81.0, 81.85], [83.0, 84.05], [85.0, 88.01], [89.0, 90.26], [91.0, 92.15], [93.0, 96.11], [98.0, 98.93], [101.0, 101.01], [103.0, 124.8], [126.0, 137.57], [138.0, 145.02], [146.0, 147.51], [148.0, 148.69], [152.0, 152.19], [153.0, 153.67], [157.0, 157.3], [158.0, 160.17], [161.0, 163.17], [164.0, 164.91], [165.0, 165.75], [167.0, 167.14], [169.0, 170.95], [172.0, 176.37], [177.0, 179.95], [184.0, 185.9], [187.0, 187.0], [187.0, 192.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 88.83, 100.0, 58.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.31, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 99.31, 49.87, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 100.0, 0.0, 0.0, 0.0, 0.0, 90.78, 61.97, 0.0, 0.0, 71.14], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 29.39], ["speech", 13.02], ["dog", 5.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.74, 1.14, 0.56, 1.12, 1.13, 3.44, 5.19, 2.0, -0.12, 1.63, 0.28, 0.95, 0.63, 0.32, 0.94, 1.13, -0.15, 0.26, 0.95, 2.03, 0.87, 0.85, 1.05, 3.01, 1.26, 1.15, 3.11, 0.93, 0.01, 21.8, 11.57, 7.02, 1.51, 0.69, 0.19, 0.67, 0.3, 2.17, 2.17, 0.91, 0.75, 0.14, 1.95, 4.37, 2.95, 1.9, 0.0, 5.47]} \ No newline at end of file diff --git a/annotations_1/QzcXi2irovs_filtered.json b/annotations_1/QzcXi2irovs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5f8b0215cde8d8949d4a77f88da056756faae27 --- /dev/null +++ b/annotations_1/QzcXi2irovs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.93], [27.0, 28.81], [30.0, 31.09], [33.0, 33.71], [35.0, 36.49], [44.0, 44.56], [46.0, 49.57], [50.0, 51.76], [52.0, 59.37], [60.0, 61.72], [62.0, 64.12], [66.0, 72.66], [73.0, 80.16], [81.0, 90.15], [91.0, 91.86], [93.0, 100.6], [101.0, 119.38], [123.0, 123.47], [159.0, 158.82]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.08, 0.0, 31.5, 0.0, 33.61, 30.23, 30.41, 30.75, 0.0, 34.31, 29.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 51.48], ["speech", 8.93], ["throbbing", 5.04]], null, [["music", 69.69], ["sampler", 2.06], ["electronic music", 2.06]], null, [["music", 54.42], ["speech", 7.29], ["electronic music", 4.95]], [["music", 69.58], ["electronic music", 5.72], ["techno", 2.75]], [["music", 72.16], ["electronic music", 3.27], ["speech", 2.76]], [["music", 34.88], ["hum", 25.43], ["throbbing", 19.17]], null, [["music", 29.15], ["hum", 26.66], ["throbbing", 24.53]], [["throbbing", 42.32], ["music", 32.67], ["hum", 12.77]], null, null], "duration": [0.93, 1.81, 1.09, 0.71, 1.49, 0.56, 3.57, 1.76, 7.37, 1.72, 2.12, 6.66, 7.16, 9.15, 0.86, 7.6, 18.38, 0.47, -0.18]} \ No newline at end of file diff --git a/annotations_1/Qzf3SFbaODw_filtered.json b/annotations_1/Qzf3SFbaODw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3022b4d377ccd28b7e6754bf6c0fbeaa713fe0d1 --- /dev/null +++ b/annotations_1/Qzf3SFbaODw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.88], [14.0, 13.95], [15.0, 15.31], [19.0, 19.36], [20.0, 65.3], [70.0, 71.51], [79.0, 85.87], [87.0, 94.59], [97.0, 106.41], [107.0, 108.21], [109.0, 110.19], [111.0, 111.45], [112.0, 111.59], [113.0, 117.14], [120.0, 136.11]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, false, true, true], "silence_prob": [28.75, 0.0, 0.0, 0.0, 0.0, 0.0, 33.2, 35.79, 30.65, 0.0, 0.0, 0.0, 0.0, 30.12, 31.89], "audiomae_on_audioset": [[["explosion", 57.98], ["burst, pop", 12.46], ["speech", 5.78]], null, null, null, null, null, [["music", 16.11], ["speech", 14.55], ["explosion", 9.66]], [["music", 20.55], ["mains hum", 19.57], ["hum", 13.88]], [["speech", 38.97], ["hum", 15.68], ["animal", 5.56]], null, null, null, null, [["rumble", 28.26], ["sound effect", 11.88], ["fart", 10.11]], [["music", 24.89], ["hum", 15.47], ["buzz", 11.54]]], "duration": [11.88, -0.05, 0.31, 0.36, 45.3, 1.51, 6.87, 7.59, 9.41, 1.21, 1.19, 0.45, -0.41, 4.14, 16.11]} \ No newline at end of file diff --git a/annotations_1/QzgJIF00Xdw_filtered.json b/annotations_1/QzgJIF00Xdw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aea5d23d207ebbf3f524e5407f8a219f7b8d10ed --- /dev/null +++ b/annotations_1/QzgJIF00Xdw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.88], [9.0, 11.77], [15.0, 16.97], [21.0, 34.45], [35.0, 36.39], [37.0, 42.55], [45.0, 46.21], [48.0, 52.52], [54.0, 60.57], [61.0, 62.8], [65.0, 64.57], [65.0, 68.28], [69.0, 70.41], [71.0, 74.9], [76.0, 86.49], [87.0, 87.78], [91.0, 104.23], [106.0, 109.54], [110.0, 109.59], [110.0, 110.07], [110.0, 112.26], [114.0, 116.01], [118.0, 120.72], [124.0, 129.88], [130.0, 132.12], [133.0, 134.37], [136.0, 143.63], [144.0, 154.01], [154.0, 155.12], [161.0, 161.65], [163.0, 165.3], [167.0, 167.41], [169.0, 177.23], [179.0, 183.95], [187.0, 188.72], [191.0, 194.66], [198.0, 206.81], [207.0, 206.88], [207.0, 207.12], [208.0, 215.99], [217.0, 221.32], [223.0, 227.42], [229.0, 239.26], [241.0, 241.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [31.93, 30.97, 0.0, 29.82, 0.0, 31.18, 0.0, 31.28, 30.23, 0.0, 0.0, 30.84, 0.0, 30.49, 30.5, 0.0, 30.04, 31.58, 0.0, 0.0, 30.45, 32.21, 31.84, 29.71, 30.78, 0.0, 30.22, 30.23, 0.0, 0.0, 31.91, 0.0, 32.0, 31.64, 0.0, 32.14, 30.27, 0.0, 0.0, 30.12, 30.36, 30.41, 30.17, 0.0], "audiomae_on_audioset": [[["music", 87.49], ["synthesizer", 2.34], ["musical instrument", 2.04]], [["music", 66.43], ["rock and roll", 2.73], ["reggae", 2.1]], null, [["music", 78.13], ["middle eastern music", 4.71], ["reggae", 1.01]], null, [["music", 79.83], ["musical instrument", 1.39], ["keyboard (musical)", 1.26]], null, [["music", 76.04], ["reggae", 6.12], ["sampler", 3.98]], [["music", 77.57], ["reggae", 2.43], ["rock and roll", 2.14]], null, null, [["music", 74.85], ["didgeridoo", 4.43], ["musical instrument", 2.29]], null, [["music", 58.63], ["musical instrument", 4.57], ["guitar", 2.83]], [["music", 81.66], ["swing music", 3.75], ["reggae", 3.41]], null, [["music", 89.54], ["musical instrument", 2.0], ["carnatic music", 0.75]], [["music", 49.32], ["throbbing", 8.74], ["didgeridoo", 4.38]], null, null, [["music", 40.04], ["didgeridoo", 7.57], ["sound effect", 3.57]], [["music", 70.84], ["musical instrument", 2.46], ["throbbing", 1.91]], [["music", 69.07], ["drum machine", 8.0], ["sampler", 3.32]], [["music", 63.22], ["rock and roll", 2.61], ["roll", 2.21]], [["music", 67.44], ["musical instrument", 3.7], ["synthesizer", 2.23]], null, [["music", 73.76], ["carnatic music", 4.17], ["sitar", 2.77]], [["music", 86.04], ["reggae", 1.64], ["echo", 1.08]], null, null, [["music", 76.14], ["swing music", 2.88], ["musical instrument", 1.98]], null, [["music", 70.88], ["guitar", 5.64], ["musical instrument", 2.99]], [["music", 78.3], ["reggae", 4.05], ["didgeridoo", 2.51]], null, [["music", 68.12], ["musical instrument", 2.53], ["brass instrument", 2.51]], [["music", 68.9], ["throbbing", 7.92], ["reggae", 3.78]], null, null, [["music", 86.91], ["rock and roll", 0.88], ["roll", 0.76]], [["music", 75.49], ["throbbing", 6.85], ["electronic music", 1.02]], [["music", 52.78], ["throbbing", 12.74], ["electronic music", 3.19]], [["music", 69.52], ["speech", 12.92], ["throbbing", 2.09]], null], "duration": [2.88, 2.77, 1.97, 13.45, 1.39, 5.55, 1.21, 4.52, 6.57, 1.8, -0.43, 3.28, 1.41, 3.9, 10.49, 0.78, 13.23, 3.54, -0.41, 0.07, 2.26, 2.01, 2.72, 5.88, 2.12, 1.37, 7.63, 10.01, 1.12, 0.65, 2.3, 0.41, 8.23, 4.95, 1.72, 3.66, 8.81, -0.12, 0.12, 7.99, 4.32, 4.42, 10.26, 0.54]} \ No newline at end of file diff --git a/annotations_1/R-wQWw1geBM_filtered.json b/annotations_1/R-wQWw1geBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c21847b39a614063b53e4965723e967efc3ed5e --- /dev/null +++ b/annotations_1/R-wQWw1geBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.27], [14.0, 14.45], [16.0, 17.0], [20.0, 20.95], [23.0, 35.55], [41.0, 65.64], [69.0, 70.97], [73.0, 73.33], [74.0, 74.36]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.27, 33.34, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 36.72], ["speech", 16.47], ["synthesizer", 5.28]], [["music", 69.41], ["speech", 9.02], ["hum", 2.09]], null, null, null], "duration": [1.27, 0.45, 1.0, 0.95, 12.55, 24.64, 1.97, 0.33, 0.36]} \ No newline at end of file diff --git a/annotations_1/R0CN7Enq4Rg_filtered.json b/annotations_1/R0CN7Enq4Rg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da20a00c0e22612a7afdd1099936b8dae642ddc6 --- /dev/null +++ b/annotations_1/R0CN7Enq4Rg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.39], [32.0, 33.32], [38.0, 38.26], [40.0, 53.42], [56.0, 56.13], [60.0, 79.61], [83.0, 92.21], [99.0, 106.02], [111.0, 114.64], [116.0, 116.07], [117.0, 118.29], [124.0, 125.0], [127.0, 128.87], [143.0, 151.06], [151.0, 155.11], [159.0, 161.2], [162.0, 174.39], [177.0, 188.64], [189.0, 189.92], [191.0, 193.38], [194.0, 195.57], [197.0, 198.07]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.2, 0.0, 32.69, 32.93, 32.87, 31.98, 0.0, 0.0, 0.0, 0.0, 34.89, 34.19, 45.82, 33.13, 34.16, 0.0, 36.11, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 52.05], ["brass instrument", 12.82], ["musical instrument", 9.46]], null, [["music", 61.12], ["synthesizer", 8.22], ["musical instrument", 3.97]], [["music", 54.34], ["cacophony", 5.05], ["synthesizer", 4.6]], [["music", 63.57], ["hum", 6.47], ["throbbing", 5.38]], [["speech", 14.59], ["music", 14.54], ["boing", 10.36]], null, null, null, null, [["music", 70.51], ["brass instrument", 7.59], ["trombone", 4.51]], [["music", 56.44], ["musical instrument", 6.88], ["brass instrument", 5.23]], [["music", 43.53], ["speech", 16.41], ["foghorn", 9.79]], [["music", 42.75], ["brass instrument", 13.42], ["trombone", 8.66]], [["music", 51.81], ["speech", 8.51], ["brass instrument", 4.96]], null, [["foghorn", 43.09], ["music", 21.22], ["speech", 7.53]], null, null], "duration": [1.39, 1.32, 0.26, 13.42, 0.13, 19.61, 9.21, 7.02, 3.64, 0.07, 1.29, 1.0, 1.87, 8.06, 4.11, 2.2, 12.39, 11.64, 0.92, 2.38, 1.57, 1.07]} \ No newline at end of file diff --git a/annotations_1/R0HGeVmyI5I_filtered.json b/annotations_1/R0HGeVmyI5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a52758751ae6356c8fbf4c55f6271aa9bf8c03e --- /dev/null +++ b/annotations_1/R0HGeVmyI5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.86], [11.0, 11.23], [17.0, 18.45], [21.0, 22.3], [24.0, 24.83], [26.0, 27.46], [29.0, 29.84], [31.0, 32.46], [35.0, 35.82], [43.0, 43.11], [48.0, 48.68], [96.0, 101.6], [104.0, 104.67], [105.0, 112.56], [114.0, 114.89], [118.0, 118.27], [119.0, 119.57], [127.0, 127.84], [131.0, 131.6], [134.0, 135.41], [141.0, 141.39], [143.0, 144.73], [151.0, 151.23], [156.0, 166.68], [170.0, 171.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 0.0, 67.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 39.52], ["moo", 15.84], ["cattle, bovinae", 13.41]], null], "duration": [1.86, 0.23, 1.45, 1.3, 0.83, 1.46, 0.84, 1.46, 0.82, 0.11, 0.68, 5.6, 0.67, 7.56, 0.89, 0.27, 0.57, 0.84, 0.6, 1.41, 0.39, 1.73, 0.23, 10.68, 1.36]} \ No newline at end of file diff --git a/annotations_1/R1GZ5ajb_xc_filtered.json b/annotations_1/R1GZ5ajb_xc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05a05aaf230faf7de40234b1d88df43d1bb44873 --- /dev/null +++ b/annotations_1/R1GZ5ajb_xc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 21.25], [22.0, 27.08], [28.0, 28.71], [65.0, 64.67], [68.0, 68.91], [74.0, 73.74], [74.0, 79.47], [80.0, 81.7], [89.0, 92.43], [93.0, 94.49], [96.0, 109.04], [114.0, 114.86], [120.0, 125.17], [126.0, 125.59], [127.0, 141.07], [182.0, 182.97], [184.0, 186.49]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [34.47, 37.83, 0.0, 0.0, 0.0, 0.0, 38.21, 0.0, 54.43, 0.0, 78.38, 0.0, 33.75, 0.0, 33.77, 0.0, 59.07], "audiomae_on_audioset": [[["music", 58.41], ["throbbing", 9.89], ["scary music", 8.52]], [["sidetone", 21.52], ["music", 18.1], ["speech", 16.36]], null, null, null, null, [["boing", 46.68], ["music", 17.96], ["speech", 14.98]], null, null, null, null, null, [["music", 41.29], ["hum", 14.04], ["mains hum", 13.38]], null, [["music", 71.59], ["didgeridoo", 13.13], ["musical instrument", 1.35]], null, null], "duration": [4.25, 5.08, 0.71, -0.33, 0.91, -0.26, 5.47, 1.7, 3.43, 1.49, 13.04, 0.86, 5.17, -0.41, 14.07, 0.97, 2.49]} \ No newline at end of file diff --git a/annotations_1/R1eDE5bXCds_filtered.json b/annotations_1/R1eDE5bXCds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f4885923c0e5f0e283c8fec3ae1c0dd77d7433f --- /dev/null +++ b/annotations_1/R1eDE5bXCds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.8], [12.0, 24.14], [24.0, 27.16], [29.0, 31.95], [34.0, 37.77], [42.0, 55.51], [58.0, 60.45], [61.0, 61.96], [74.0, 77.48], [89.0, 89.43], [90.0, 90.32], [92.0, 92.37], [98.0, 98.04], [98.0, 99.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.19, 57.81, 79.07, 55.04, 79.76, 52.22, 0.0, 91.81, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.2, 12.14, 3.16, 2.95, 3.77, 13.51, 2.45, 0.96, 3.48, 0.43, 0.32, 0.37, 0.04, 1.32]} \ No newline at end of file diff --git a/annotations_1/R1hh6MVyQYg_filtered.json b/annotations_1/R1hh6MVyQYg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da24f615fb001e8c269d2666e799bdfbfed78f68 --- /dev/null +++ b/annotations_1/R1hh6MVyQYg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 14.81], [16.0, 17.96], [19.0, 19.82], [23.0, 32.51], [33.0, 34.05], [39.0, 39.99], [41.0, 41.08], [45.0, 45.87], [47.0, 47.95], [50.0, 51.12], [54.0, 55.05], [61.0, 61.37], [66.0, 66.34], [68.0, 69.21], [71.0, 71.22], [73.0, 73.23], [73.0, 74.11], [74.0, 74.65], [76.0, 76.79], [78.0, 79.54], [81.0, 82.24], [83.0, 84.11], [88.0, 89.11], [91.0, 91.54], [93.0, 96.26], [99.0, 99.35], [100.0, 100.74], [104.0, 106.14], [107.0, 106.81], [112.0, 112.13], [115.0, 115.7], [117.0, 118.13], [118.0, 118.67], [120.0, 120.65], [121.0, 122.59], [123.0, 123.48], [124.0, 127.75], [128.0, 129.0], [130.0, 130.06], [131.0, 133.46], [135.0, 136.0], [137.0, 137.76], [138.0, 138.45], [139.0, 140.97], [142.0, 143.87], [145.0, 145.5], [147.0, 147.19], [152.0, 153.93], [156.0, 156.44], [159.0, 159.93], [161.0, 161.67], [164.0, 164.62], [166.0, 166.4], [170.0, 170.55], [175.0, 175.47], [178.0, 179.63], [180.0, 180.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.16, 0.0, 0.0, 42.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.7, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 47.38], ["theremin", 22.95], ["musical instrument", 5.16]], null, null, [["music", 46.61], ["theremin", 42.39], ["musical instrument", 3.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.81, 1.96, 0.82, 9.51, 1.05, 0.99, 0.08, 0.87, 0.95, 1.12, 1.05, 0.37, 0.34, 1.21, 0.22, 0.23, 1.11, 0.65, 0.79, 1.54, 1.24, 1.11, 1.11, 0.54, 3.26, 0.35, 0.74, 2.14, -0.19, 0.13, 0.7, 1.13, 0.67, 0.65, 1.59, 0.48, 3.75, 1.0, 0.06, 2.46, 1.0, 0.76, 0.45, 1.97, 1.87, 0.5, 0.19, 1.93, 0.44, 0.93, 0.67, 0.62, 0.4, 0.55, 0.47, 1.63, 0.15]} \ No newline at end of file diff --git a/annotations_1/R1zRKVLsmrM_filtered.json b/annotations_1/R1zRKVLsmrM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f22f4afc7680973c617946506a7bb49ce1869d35 --- /dev/null +++ b/annotations_1/R1zRKVLsmrM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.89], [27.0, 27.3], [31.0, 31.01], [54.0, 61.13], [62.0, 64.15], [77.0, 76.77], [84.0, 84.37], [102.0, 102.78], [104.0, 104.45]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [32.56, 0.0, 0.0, 35.96, 36.2, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["wind instrument, woodwind instrument", 52.22], ["shofar", 38.85], ["animal", 1.64]], null, null, [["music", 63.09], ["reggae", 4.54], ["swing music", 4.41]], [["music", 38.93], ["cattle, bovinae", 12.39], ["moo", 12.0]], null, null, null, null], "duration": [4.89, 0.3, 0.01, 7.13, 2.15, -0.23, 0.37, 0.78, 0.45]} \ No newline at end of file diff --git a/annotations_1/R2DhcfXooy8_filtered.json b/annotations_1/R2DhcfXooy8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c59ae85eb05cf67ce8834a2cf23fb4d19b2c9748 --- /dev/null +++ b/annotations_1/R2DhcfXooy8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 24.83], [26.0, 26.1], [30.0, 31.68], [33.0, 33.3], [36.0, 36.05], [45.0, 46.06], [48.0, 48.29], [50.0, 50.25], [57.0, 57.91], [61.0, 60.76], [69.0, 69.8], [71.0, 72.22], [75.0, 75.07], [76.0, 76.13], [77.0, 77.4], [79.0, 79.81], [80.0, 86.49], [88.0, 87.67], [88.0, 90.81], [92.0, 100.79], [102.0, 104.21], [104.0, 104.28], [104.0, 105.36], [107.0, 107.86], [109.0, 110.56], [112.0, 113.29], [114.0, 114.64], [118.0, 118.71], [120.0, 120.9], [121.0, 121.8], [123.0, 122.96], [123.0, 123.74], [124.0, 129.39], [131.0, 132.56], [134.0, 142.05], [147.0, 147.41], [148.0, 148.71], [150.0, 151.24], [156.0, 156.63], [158.0, 157.84], [159.0, 159.78], [163.0, 163.95], [164.0, 166.83], [168.0, 168.93], [169.0, 170.9], [172.0, 171.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 0.0, 42.04, 34.64, 36.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.31, 0.0, 86.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 50.62], ["wild animals", 8.15], ["animal", 6.4]], [["music", 52.4], ["throbbing", 11.82], ["hum", 11.7]], [["music", 64.33], ["speech", 5.08], ["musical instrument", 3.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.17, 0.1, 1.68, 0.3, 0.05, 1.06, 0.29, 0.25, 0.91, -0.24, 0.8, 1.22, 0.07, 0.13, 0.4, 0.81, 6.49, -0.33, 2.81, 8.79, 2.21, 0.28, 1.36, 0.86, 1.56, 1.29, 0.64, 0.71, 0.9, 0.8, -0.04, 0.74, 5.39, 1.56, 8.05, 0.41, 0.71, 1.24, 0.63, -0.16, 0.78, 0.95, 2.83, 0.93, 1.9, -0.19]} \ No newline at end of file diff --git a/annotations_1/R2lhQCxKx_Y_filtered.json b/annotations_1/R2lhQCxKx_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16eca9a93786ca151c8712643559d61272b32531 --- /dev/null +++ b/annotations_1/R2lhQCxKx_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.0], [16.0, 16.6], [26.0, 26.03], [28.0, 28.56], [46.0, 45.77], [49.0, 49.77], [63.0, 62.83], [66.0, 66.55], [76.0, 77.16], [82.0, 82.24], [85.0, 84.86], [89.0, 90.24], [92.0, 93.12], [94.0, 95.23], [99.0, 99.94], [103.0, 106.2], [107.0, 107.84], [110.0, 111.6], [118.0, 119.4], [120.0, 140.32], [141.0, 143.41], [146.0, 145.84], [150.0, 151.28], [153.0, 154.33], [155.0, 156.39], [165.0, 166.5], [170.0, 171.02], [174.0, 175.53], [178.0, 180.62], [182.0, 183.52], [184.0, 185.41], [192.0, 193.36], [195.0, 195.17], [200.0, 200.48], [202.0, 206.95], [208.0, 214.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 50.41, 40.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.14, 0.0, 0.0, 0.0, 0.0, 0.0, 29.71, 30.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 71.31], ["speech", 6.85], ["boing", 4.45]], null, null, null, null, null, null, null, [["music", 72.83], ["singing", 2.08], ["speech", 1.53]], null, null, null, null, null, [["music", 58.14], ["theme music", 2.37], ["didgeridoo", 2.28]], [["music", 77.04], ["singing", 2.47], ["country", 1.99]]], "duration": [1.0, 0.6, 0.03, 0.56, -0.23, 0.77, -0.17, 0.55, 1.16, 0.24, -0.14, 1.24, 1.12, 1.23, 0.94, 3.2, 0.84, 1.6, 1.4, 20.32, 2.41, -0.16, 1.28, 1.33, 1.39, 1.5, 1.02, 1.53, 2.62, 1.52, 1.41, 1.36, 0.17, 0.48, 4.95, 6.76]} \ No newline at end of file diff --git a/annotations_1/R3KOKpvoLIo_filtered.json b/annotations_1/R3KOKpvoLIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c1baf4640078da57de269068a74cbaa12362613 --- /dev/null +++ b/annotations_1/R3KOKpvoLIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.07], [37.0, 61.06], [62.0, 75.15], [78.0, 102.63]], "keep_status": [false, true, false, true], "silence_prob": [0.0, 29.63, 30.06, 30.16], "audiomae_on_audioset": [null, [["speech", 47.05], ["music", 9.22], ["vehicle", 7.47]], [["music", 64.69], ["whack, thwack", 13.16], ["boing", 2.24]], [["music", 21.79], ["throbbing", 12.98], ["speech", 7.42]]], "duration": [0.07, 24.06, 13.15, 24.63]} \ No newline at end of file diff --git a/annotations_1/R5a3sZiNuu4_filtered.json b/annotations_1/R5a3sZiNuu4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89327824db8035d004a17f2b787fb2234d40b69f --- /dev/null +++ b/annotations_1/R5a3sZiNuu4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 26.76], [27.0, 40.96], [42.0, 56.15], [58.0, 62.9], [75.0, 75.24], [83.0, 87.35], [87.0, 88.5], [89.0, 91.0], [92.0, 94.31], [96.0, 97.14], [99.0, 105.27], [107.0, 108.21], [110.0, 123.42], [125.0, 125.81], [127.0, 128.51], [129.0, 130.82], [133.0, 133.05], [135.0, 135.24], [137.0, 138.2], [139.0, 143.13], [144.0, 166.01]], "keep_status": [true, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, true, true], "silence_prob": [27.85, 27.89, 27.98, 28.76, 0.0, 31.31, 0.0, 40.86, 38.83, 0.0, 48.91, 0.0, 27.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.85, 28.49], "audiomae_on_audioset": [[["whack, thwack", 10.26], ["explosion", 9.82], ["burst, pop", 9.75]], [["music", 15.13], ["animal", 13.53], ["livestock, farm animals, working animals", 11.1]], [["music", 67.14], ["throbbing", 4.62], ["sound effect", 3.9]], [["speech", 48.39], ["music", 42.59], ["boing", 1.08]], null, [["speech", 36.85], ["music", 34.73], ["hum", 3.83]], null, [["music", 24.99], ["hum", 14.34], ["mains hum", 9.76]], [["music", 65.4], ["speech", 6.59], ["animal", 4.19]], null, [["music", 27.23], ["livestock, farm animals, working animals", 9.39], ["cattle, bovinae", 8.41]], null, [["music", 58.27], ["hum", 9.86], ["mains hum", 3.93]], null, null, null, null, null, null, [["music", 39.64], ["hum", 15.23], ["mains hum", 9.56]], [["foghorn", 23.52], ["music", 18.6], ["speech", 12.56]]], "duration": [18.76, 13.96, 14.15, 4.9, 0.24, 4.35, 1.5, 2.0, 2.31, 1.14, 6.27, 1.21, 13.42, 0.81, 1.51, 1.82, 0.05, 0.24, 1.2, 4.13, 22.01]} \ No newline at end of file diff --git a/annotations_1/R5wXxo6yIU4_filtered.json b/annotations_1/R5wXxo6yIU4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28964461848caaef72f1acc0c911e8927ba4d384 --- /dev/null +++ b/annotations_1/R5wXxo6yIU4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.21], [4.0, 4.85], [10.0, 10.12], [13.0, 13.26], [15.0, 14.76], [17.0, 16.95], [18.0, 19.35], [21.0, 23.03], [27.0, 28.21], [29.0, 30.52], [34.0, 35.99], [39.0, 41.57], [42.0, 45.54], [46.0, 50.46], [51.0, 53.74], [55.0, 57.2], [61.0, 61.94], [63.0, 64.62], [68.0, 68.61], [70.0, 70.48], [73.0, 73.63], [75.0, 75.69], [80.0, 80.15], [82.0, 82.83], [84.0, 84.75], [86.0, 87.25], [88.0, 89.61], [91.0, 93.72], [95.0, 95.99], [97.0, 97.02], [102.0, 103.06], [106.0, 106.71], [109.0, 109.73], [112.0, 113.56], [116.0, 121.86], [122.0, 123.28], [125.0, 126.72], [128.0, 131.36]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.28, 0.0, 0.0, 0.0, 40.24, 46.61, 48.06, 42.74, 53.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.07, 0.0, 0.0, 45.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["radio", 25.18], ["hum", 14.49], ["single-lens reflex camera", 7.27]], null, null, null, [["insect", 50.81], ["fly, housefly", 27.18], ["bee, wasp, etc.", 6.43]], [["fly, housefly", 33.46], ["insect", 33.32], ["frog", 7.87]], [["fly, housefly", 18.12], ["insect", 16.06], ["sidetone", 15.74]], [["frog", 38.7], ["fart", 11.84], ["croak", 11.58]], null, null, null, null, null, null, null, null, null, null, null, null, [["frog", 23.34], ["speech", 15.01], ["croak", 8.56]], null, null, null, null, null, null, null, null, null, [["frog", 59.91], ["croak", 13.98], ["radio", 4.81]]], "duration": [1.21, 0.85, 0.12, 0.26, -0.24, -0.05, 1.35, 2.03, 1.21, 1.52, 1.99, 2.57, 3.54, 4.46, 2.74, 2.2, 0.94, 1.62, 0.61, 0.48, 0.63, 0.69, 0.15, 0.83, 0.75, 1.25, 1.61, 2.72, 0.99, 0.02, 1.06, 0.71, 0.73, 1.56, 5.86, 1.28, 1.72, 3.36]} \ No newline at end of file diff --git a/annotations_1/R6nZpcweYXw_filtered.json b/annotations_1/R6nZpcweYXw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9d0aec6f5d31100c5404057995858d846031b88 --- /dev/null +++ b/annotations_1/R6nZpcweYXw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.3], [12.0, 13.0], [15.0, 17.1], [35.0, 36.12], [38.0, 41.12], [43.0, 43.92], [45.0, 45.22], [47.0, 51.43], [52.0, 54.57], [59.0, 61.25], [64.0, 67.05], [69.0, 70.24], [71.0, 72.45], [74.0, 92.33], [94.0, 94.83], [97.0, 114.67], [117.0, 118.32], [119.0, 132.6], [137.0, 157.23], [158.0, 184.94], [186.0, 186.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, false], "silence_prob": [45.95, 0.0, 59.24, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 88.28, 99.71, 0.0, 0.0, 33.55, 0.0, 31.51, 0.0, 35.21, 34.43, 32.38, 0.0], "audiomae_on_audioset": [[["moo", 43.28], ["cattle, bovinae", 33.07], ["livestock, farm animals, working animals", 23.42]], null, null, null, null, null, null, null, null, null, null, null, null, [["boing", 45.15], ["music", 29.5], ["whack, thwack", 4.98]], null, [["music", 26.37], ["whip", 20.41], ["speech", 20.07]], null, [["music", 28.71], ["sidetone", 25.56], ["boing", 14.53]], [["music", 29.87], ["boing", 11.11], ["moo", 10.81]], [["boing", 29.42], ["music", 20.28], ["fly, housefly", 15.6]], null], "duration": [5.3, 1.0, 2.1, 1.12, 3.12, 0.92, 0.22, 4.43, 2.57, 2.25, 3.05, 1.24, 1.45, 18.33, 0.83, 17.67, 1.32, 13.6, 20.23, 26.94, 0.61]} \ No newline at end of file diff --git a/annotations_1/R76ux4iCRzI_filtered.json b/annotations_1/R76ux4iCRzI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86b1d86953a694eb6400fbe0dce2295723f9b7e7 --- /dev/null +++ b/annotations_1/R76ux4iCRzI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [5.0, 5.98], [7.0, 8.43], [9.0, 11.75], [12.0, 15.16], [17.0, 17.78], [20.0, 20.95], [22.0, 23.99], [26.0, 26.11], [27.0, 52.78], [54.0, 63.58], [66.0, 69.33], [71.0, 70.87], [71.0, 71.36], [76.0, 76.89], [79.0, 80.7], [83.0, 88.72], [90.0, 93.92], [96.0, 100.53], [102.0, 105.93], [107.0, 107.7], [109.0, 152.04], [157.0, 160.95], [161.0, 162.3]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 47.16, 47.01, 0.0, 0.0, 0.0, 0.0, 30.73, 42.62, 44.04, 0.0, 0.0, 0.0, 0.0, 46.36, 45.95, 47.46, 47.43, 0.0, 0.0, 31.27, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 29.99], ["speech", 16.09], ["chirp tone", 15.52]], [["music", 32.8], ["speech", 31.76], ["chirp tone", 6.01]], null, null, null, null, [["music", 39.74], ["speech", 39.34], ["musical instrument", 2.23]], [["hum", 47.74], ["throbbing", 27.81], ["mains hum", 20.43]], [["rumble", 21.24], ["hum", 14.37], ["whale vocalization", 14.17]], null, null, null, null, [["hum", 40.96], ["rumble", 17.74], ["speech", 15.92]], [["music", 36.44], ["hum", 15.26], ["ambient music", 11.3]], [["sonar", 31.35], ["music", 18.36], ["hum", 10.05]], [["hum", 29.44], ["whale vocalization", 19.52], ["rumble", 13.11]], null, null, [["speech", 21.54], ["hum", 21.07], ["music", 17.48]], null], "duration": [0.33, 0.98, 1.43, 2.75, 3.16, 0.78, 0.95, 1.99, 0.11, 25.78, 9.58, 3.33, -0.13, 0.36, 0.89, 1.7, 5.72, 3.92, 4.53, 3.93, 0.7, 43.04, 3.95, 1.3]} \ No newline at end of file diff --git a/annotations_1/R7P5OWV436c_filtered.json b/annotations_1/R7P5OWV436c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..223a816b5b7239c6d92a15f2758a5483ad5c3927 --- /dev/null +++ b/annotations_1/R7P5OWV436c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [9.0, 9.21], [12.0, 12.36], [14.0, 14.45], [18.0, 19.68], [21.0, 22.59], [23.0, 23.35], [27.0, 28.17], [29.0, 29.59], [31.0, 69.36], [72.0, 73.85], [78.0, 78.78], [80.0, 79.81], [81.0, 83.0], [84.0, 88.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 41.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 65.16], ["alarm", 7.2], ["fire alarm", 6.58]]], "duration": [0.49, 0.21, 0.36, 0.45, 1.68, 1.59, 0.35, 1.17, 0.59, 38.36, 1.85, 0.78, -0.19, 2.0, 4.62]} \ No newline at end of file diff --git a/annotations_1/R7vFG7jQZGY_filtered.json b/annotations_1/R7vFG7jQZGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ca2dea9545312458e05c85a2a71852b5954b16c --- /dev/null +++ b/annotations_1/R7vFG7jQZGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.83], [22.0, 23.13], [23.0, 24.06], [26.0, 27.67], [28.0, 31.55], [32.0, 34.05], [35.0, 36.83], [38.0, 39.02], [40.0, 40.24], [41.0, 42.13], [43.0, 54.11], [55.0, 56.98], [60.0, 75.25], [79.0, 87.0], [89.0, 93.97], [94.0, 94.44], [94.0, 95.22], [98.0, 99.28], [101.0, 101.46], [102.0, 111.08], [114.0, 123.09], [125.0, 126.45], [129.0, 132.11], [133.0, 135.19], [136.0, 137.91], [138.0, 145.23], [147.0, 149.28]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false, true, true, true, false, false, false, false, true, true, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 41.26, 39.14, 0.0, 0.0, 0.0, 0.0, 30.08, 0.0, 32.96, 33.92, 36.2, 0.0, 0.0, 0.0, 0.0, 34.61, 37.84, 0.0, 40.22, 32.4, 0.0, 30.84, 36.65], "audiomae_on_audioset": [null, null, null, null, [["hum", 40.5], ["throbbing", 13.21], ["sidetone", 9.3]], [["speech", 44.18], ["groan", 9.25], ["music", 8.7]], null, null, null, null, [["hum", 51.07], ["mains hum", 14.01], ["throbbing", 9.64]], null, [["speech", 26.8], ["hum", 19.23], ["music", 18.8]], [["music", 23.22], ["speech", 12.3], ["noise", 8.73]], [["speech", 33.38], ["music", 28.96], ["fart", 5.21]], null, null, null, null, [["music", 34.14], ["speech", 15.15], ["hum", 11.24]], [["music", 39.26], ["hum", 19.24], ["ambient music", 8.98]], null, [["music", 43.82], ["gong", 10.67], ["ambient music", 10.18]], [["hum", 27.29], ["mains hum", 14.02], ["throbbing", 12.11]], null, [["speech", 25.43], ["hum", 20.58], ["music", 12.59]], [["music", 54.78], ["synthesizer", 8.32], ["ambient music", 7.16]]], "duration": [1.83, 1.13, 1.06, 1.67, 3.55, 2.05, 1.83, 1.02, 0.24, 1.13, 11.11, 1.98, 15.25, 8.0, 4.97, 0.44, 1.22, 1.28, 0.46, 9.08, 9.09, 1.45, 3.11, 2.19, 1.91, 7.23, 2.28]} \ No newline at end of file diff --git a/annotations_1/R81ZAKQzJ5Q_filtered.json b/annotations_1/R81ZAKQzJ5Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..946ed8783699cc4285f5134f92b54a1421f3d91c --- /dev/null +++ b/annotations_1/R81ZAKQzJ5Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.43], [15.0, 15.09], [16.0, 16.11], [17.0, 18.44], [19.0, 19.5], [21.0, 23.79], [28.0, 36.9], [37.0, 37.93], [41.0, 42.47], [43.0, 44.12], [44.0, 47.51], [49.0, 49.32], [50.0, 51.02], [52.0, 53.25], [55.0, 60.29], [62.0, 62.36], [67.0, 67.74], [69.0, 70.07], [73.0, 75.07], [76.0, 78.14], [79.0, 79.15], [82.0, 82.92], [83.0, 85.6], [86.0, 86.41], [87.0, 89.85], [92.0, 97.88], [103.0, 109.32], [111.0, 113.21], [114.0, 116.55]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [50.91, 0.0, 0.0, 0.0, 0.0, 45.46, 54.76, 0.0, 0.0, 0.0, 45.05, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 87.37, 75.88, 0.0, 0.0, 33.4, 0.0, 70.16, 35.07, 45.56, 51.88, 64.41], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 26.93], ["grunt", 16.89], ["music", 10.57]], null, null, null, null, [["speech", 33.95], ["throbbing", 15.53], ["hum", 13.32]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.37], ["sidetone", 18.63], ["crackle", 5.31]], null, null, [["crushing", 55.72], ["fart", 13.39], ["breaking", 2.47]], [["fly, housefly", 62.43], ["mosquito", 10.82], ["insect", 9.36]], null, null], "duration": [9.43, 0.09, 0.11, 1.44, 0.5, 2.79, 8.9, 0.93, 1.47, 1.12, 3.51, 0.32, 1.02, 1.25, 5.29, 0.36, 0.74, 1.07, 2.07, 2.14, 0.15, 0.92, 2.6, 0.41, 2.85, 5.88, 6.32, 2.21, 2.55]} \ No newline at end of file diff --git a/annotations_1/R8JjTOsPHo4_filtered.json b/annotations_1/R8JjTOsPHo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff24a3af05980eca67647504adb8f6537c1f64bc --- /dev/null +++ b/annotations_1/R8JjTOsPHo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 24.0], [25.0, 42.11], [44.0, 45.33], [47.0, 48.02], [49.0, 78.61], [81.0, 81.21], [83.0, 84.3], [90.0, 91.44], [94.0, 94.71], [97.0, 99.2], [99.0, 158.67], [159.0, 164.1], [165.0, 164.94], [165.0, 208.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.58, 30.83, 0.0, 0.0, 30.61, 0.0, 0.0, 0.0, 0.0, 30.96, 0.0, 30.52, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 42.85], ["mains hum", 18.57], ["speech", 14.26]], [["music", 59.8], ["throbbing", 10.01], ["didgeridoo", 9.49]], null, null, [["music", 55.29], ["didgeridoo", 11.91], ["synthesizer", 4.4]], null, null, null, null, [["mains hum", 31.86], ["hum", 30.76], ["throbbing", 10.93]], null, [["hum", 27.64], ["throbbing", 24.7], ["music", 23.94]], null, null], "duration": [21.0, 17.11, 1.33, 1.02, 29.61, 0.21, 1.3, 1.44, 0.71, 2.2, 59.67, 5.1, -0.06, 43.45]} \ No newline at end of file diff --git a/annotations_1/R9l_adCi74g_filtered.json b/annotations_1/R9l_adCi74g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f35133d0b40c8b534fc6ba26e15632cecb3a4dfb --- /dev/null +++ b/annotations_1/R9l_adCi74g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.34], [11.0, 14.86], [16.0, 16.65], [20.0, 21.36], [22.0, 41.25], [42.0, 59.19], [61.0, 65.52], [67.0, 69.45], [71.0, 79.66], [80.0, 81.26], [86.0, 85.87], [90.0, 91.08], [92.0, 93.21], [95.0, 95.76], [97.0, 98.0], [104.0, 108.19], [109.0, 109.07], [114.0, 117.58], [128.0, 130.33]], "keep_status": [false, true, false, false, true, true, true, true, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 31.47, 0.0, 0.0, 29.72, 33.33, 32.5, 29.89, 34.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.07, 0.0, 49.87, 36.75], "audiomae_on_audioset": [null, [["throbbing", 37.52], ["speech", 23.07], ["heart sounds, heartbeat", 8.78]], null, null, [["music", 25.45], ["sidetone", 20.57], ["throbbing", 18.94]], [["hum", 35.97], ["speech", 8.42], ["mains hum", 8.22]], [["speech", 21.63], ["hum", 16.49], ["music", 14.81]], [["speech", 35.19], ["baby cry, infant cry", 22.39], ["whimper", 3.32]], [["groan", 71.88], ["speech", 9.67], ["whimper", 3.3]], null, null, null, null, null, null, [["music", 26.69], ["groan", 17.78], ["speech", 7.07]], null, [["hum", 34.97], ["throbbing", 26.07], ["music", 13.21]], [["music", 20.76], ["sheep", 20.46], ["bleat", 17.45]]], "duration": [1.34, 3.86, 0.65, 1.36, 19.25, 17.19, 4.52, 2.45, 8.66, 1.26, -0.13, 1.08, 1.21, 0.76, 1.0, 4.19, 0.07, 3.58, 2.33]} \ No newline at end of file diff --git a/annotations_1/RAsK38Vdep4_filtered.json b/annotations_1/RAsK38Vdep4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39095af2d81494b6f7ddf2bf63452dbfb69f87da --- /dev/null +++ b/annotations_1/RAsK38Vdep4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [5.0, 7.99], [15.0, 15.87], [16.0, 17.09], [19.0, 19.25], [20.0, 21.09], [28.0, 28.97], [30.0, 32.21], [38.0, 38.94], [39.0, 40.9], [41.0, 41.64], [51.0, 54.09], [70.0, 71.93], [81.0, 81.13], [89.0, 89.7], [92.0, 91.99], [95.0, 95.99], [97.0, 100.57], [101.0, 104.84], [106.0, 109.65], [110.0, 112.82], [114.0, 117.46], [119.0, 121.07], [123.0, 123.94], [129.0, 130.35], [131.0, 132.88], [134.0, 135.08], [136.0, 136.17], [137.0, 137.02], [137.0, 137.19], [137.0, 137.44]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 35.26, 0.0, 0.0, 0.0, 54.36, 0.0, 0.0, 0.0, 0.0, 0.0, 58.3, 51.99, 52.56, 53.78, 60.42, 60.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["cacophony", 9.86], ["noise", 7.1], ["vehicle", 6.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 2.99, 0.87, 1.09, 0.25, 1.09, 0.97, 2.21, 0.94, 1.9, 0.64, 3.09, 1.93, 0.13, 0.7, -0.01, 0.99, 3.57, 3.84, 3.65, 2.82, 3.46, 2.07, 0.94, 1.35, 1.88, 1.08, 0.17, 0.02, 0.19, 0.44]} \ No newline at end of file diff --git a/annotations_1/RDBywHkU6Wg_filtered.json b/annotations_1/RDBywHkU6Wg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2c2d0da6ea3d421220152074f28970880171ad4 --- /dev/null +++ b/annotations_1/RDBywHkU6Wg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 17.83], [21.0, 22.33], [23.0, 45.96], [47.0, 51.51], [53.0, 67.83], [69.0, 69.84], [73.0, 160.73]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [30.88, 0.0, 28.95, 36.52, 31.88, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 31.92], ["music", 29.05], ["throbbing", 21.81]], null, [["speech", 60.75], ["music", 13.63], ["throbbing", 2.32]], [["music", 67.83], ["mains hum", 8.75], ["hum", 7.77]], [["music", 43.94], ["hum", 8.94], ["mains hum", 7.99]], null, null], "duration": [5.83, 1.33, 22.96, 4.51, 14.83, 0.84, 87.73]} \ No newline at end of file diff --git a/annotations_1/REWaiDiKDIE_filtered.json b/annotations_1/REWaiDiKDIE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88458c9c29849eeef6022c4b944d31b3adb07c49 --- /dev/null +++ b/annotations_1/REWaiDiKDIE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.84], [7.0, 7.32], [7.0, 10.54], [11.0, 10.88], [12.0, 11.77], [18.0, 18.93], [22.0, 22.87], [40.0, 39.77], [42.0, 43.16], [44.0, 45.93], [46.0, 47.48], [51.0, 53.45], [55.0, 59.19], [60.0, 61.64], [63.0, 64.94], [67.0, 72.39], [75.0, 76.77], [77.0, 81.9], [83.0, 84.38], [86.0, 87.52], [89.0, 90.12], [92.0, 92.8], [94.0, 95.34], [102.0, 102.19], [106.0, 108.45], [110.0, 112.46], [114.0, 119.57], [122.0, 122.13], [123.0, 123.23], [123.0, 125.0], [126.0, 128.17], [132.0, 133.74], [146.0, 146.11], [146.0, 146.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 28.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.81, 99.76, 0.0, 0.0, 99.87, 0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 95.91, 98.51, 0.0, 0.0, 98.99, 79.94, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 46.98], ["music", 19.84], ["boing", 9.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.16, 0.32, 3.54, -0.12, -0.23, 0.93, 0.87, -0.23, 1.16, 1.93, 1.48, 2.45, 4.19, 1.64, 1.94, 5.39, 1.77, 4.9, 1.38, 1.52, 1.12, 0.8, 1.34, 0.19, 2.45, 2.46, 5.57, 0.13, 0.23, 2.0, 2.17, 1.74, 0.11, 0.53]} \ No newline at end of file diff --git a/annotations_1/REwimg6y1Cg_filtered.json b/annotations_1/REwimg6y1Cg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aea9a4f56d4637fa6bb06fc1daf83e344378b44a --- /dev/null +++ b/annotations_1/REwimg6y1Cg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.67], [9.0, 10.25], [20.0, 45.12], [46.0, 47.78], [48.0, 62.97], [66.0, 66.78], [67.0, 67.98], [70.0, 74.97], [75.0, 81.31], [84.0, 84.89], [86.0, 89.4], [91.0, 91.35], [93.0, 93.9], [102.0, 102.25], [103.0, 103.79], [105.0, 105.38], [106.0, 112.65], [114.0, 118.42]], "keep_status": [false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.72, 0.0, 36.68, 0.0, 0.0, 36.17, 41.64, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 71.43], "audiomae_on_audioset": [null, null, [["music", 36.31], ["hum", 9.81], ["mains hum", 8.09]], null, [["fly, housefly", 36.36], ["mosquito", 25.76], ["insect", 18.59]], null, null, [["speech", 40.33], ["music", 9.47], ["fly, housefly", 7.31]], [["speech", 17.14], ["music", 16.97], ["buzz", 12.4]], null, null, null, null, null, null, null, [["hum", 61.85], ["mains hum", 25.68], ["throbbing", 3.41]], null], "duration": [0.67, 1.25, 25.12, 1.78, 14.97, 0.78, 0.98, 4.97, 6.31, 0.89, 3.4, 0.35, 0.9, 0.25, 0.79, 0.38, 6.65, 4.42]} \ No newline at end of file diff --git a/annotations_1/RFAiq0Qr6uQ_filtered.json b/annotations_1/RFAiq0Qr6uQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..814c44f7e8a76419213720c886f76f0fe51413ee --- /dev/null +++ b/annotations_1/RFAiq0Qr6uQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.13], [14.0, 14.1], [17.0, 18.01], [29.0, 29.2], [46.0, 46.14], [47.0, 47.02], [91.0, 92.6], [96.0, 96.38], [104.0, 104.45], [106.0, 106.95], [108.0, 107.92], [120.0, 120.12], [122.0, 122.03], [123.0, 123.47], [124.0, 129.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.13, 0.1, 1.01, 0.2, 0.14, 0.02, 1.6, 0.38, 0.45, 0.95, -0.08, 0.12, 0.03, 0.47, 5.36]} \ No newline at end of file diff --git a/annotations_1/RFBlDixa33k_filtered.json b/annotations_1/RFBlDixa33k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d610dd1c1a0a3dcbf1f6eddfa594c975d5ec2a8 --- /dev/null +++ b/annotations_1/RFBlDixa33k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.21], [12.0, 13.93], [16.0, 39.95], [44.0, 53.94], [54.0, 57.89], [59.0, 59.8], [61.0, 61.79], [66.0, 66.55], [74.0, 75.88], [80.0, 80.16], [94.0, 95.2], [96.0, 100.31], [105.0, 105.26], [116.0, 116.28], [117.0, 119.96], [121.0, 121.0], [122.0, 122.76], [126.0, 127.38], [130.0, 130.57], [131.0, 143.48], [146.0, 167.88], [168.0, 173.97], [175.0, 183.14]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, true, false], "silence_prob": [34.86, 0.0, 32.3, 45.3, 69.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.65, 0.0, 0.0, 35.49, 0.0, 0.0, 0.0, 0.0, 32.22, 32.54, 35.14, 60.23], "audiomae_on_audioset": [[["music", 54.51], ["theremin", 11.92], ["synthesizer", 5.71]], null, [["music", 61.13], ["hum", 10.17], ["throbbing", 5.65]], [["music", 48.62], ["hum", 13.01], ["mains hum", 3.89]], null, null, null, null, null, null, null, [["music", 33.51], ["speech", 19.9], ["didgeridoo", 6.15]], null, null, [["music", 83.31], ["musical instrument", 2.8], ["effects unit", 2.22]], null, null, null, null, [["music", 47.78], ["synthesizer", 7.8], ["hum", 4.16]], [["music", 46.28], ["fly, housefly", 6.89], ["sound effect", 6.05]], [["fart", 18.21], ["music", 11.82], ["didgeridoo", 8.47]], null], "duration": [2.21, 1.93, 23.95, 9.94, 3.89, 0.8, 0.79, 0.55, 1.88, 0.16, 1.2, 4.31, 0.26, 0.28, 2.96, 0.0, 0.76, 1.38, 0.57, 12.48, 21.88, 5.97, 8.14]} \ No newline at end of file diff --git a/annotations_1/RFR3AJ-jE88_filtered.json b/annotations_1/RFR3AJ-jE88_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..401e2ab8bb0957b8a2f9f0a06f6f0f883c90db40 --- /dev/null +++ b/annotations_1/RFR3AJ-jE88_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.46], [25.0, 26.82], [28.0, 30.84], [34.0, 35.38], [37.0, 42.45], [44.0, 52.35], [53.0, 63.26], [65.0, 70.93], [76.0, 76.57], [80.0, 80.6], [82.0, 83.17], [84.0, 89.99], [91.0, 90.95], [96.0, 97.73], [99.0, 100.06], [101.0, 104.13], [109.0, 110.0], [112.0, 116.48], [119.0, 131.3]], "keep_status": [true, false, false, false, true, true, false, true, false, false, false, true, false, false, false, true, false, false, true], "silence_prob": [42.0, 0.0, 68.67, 0.0, 43.25, 41.4, 44.23, 43.96, 0.0, 0.0, 0.0, 31.08, 0.0, 0.0, 0.0, 32.61, 0.0, 36.47, 36.58], "audiomae_on_audioset": [[["music", 29.85], ["synthesizer", 12.59], ["speech", 9.63]], null, null, null, [["speech", 31.08], ["music", 26.61], ["hum", 5.8]], [["music", 52.97], ["hum", 6.55], ["throbbing", 4.23]], [["music", 44.41], ["boing", 34.19], ["throbbing", 2.19]], [["music", 28.61], ["sine wave", 6.33], ["speech", 4.77]], null, null, null, [["music", 34.1], ["didgeridoo", 24.9], ["noise", 9.48]], null, null, null, [["music", 40.58], ["speech", 15.47], ["thunk", 8.54]], null, [["music", 30.41], ["throbbing", 23.31], ["hum", 20.07]], [["music", 54.47], ["speech", 6.78], ["theremin", 3.71]]], "duration": [4.46, 1.82, 2.84, 1.38, 5.45, 8.35, 10.26, 5.93, 0.57, 0.6, 1.17, 5.99, -0.05, 1.73, 1.06, 3.13, 1.0, 4.48, 12.3]} \ No newline at end of file diff --git a/annotations_1/RFtZAVgf1Yg_filtered.json b/annotations_1/RFtZAVgf1Yg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfce4b085572a3e0ae714d1843fbb26763797711 --- /dev/null +++ b/annotations_1/RFtZAVgf1Yg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[82.0, 85.77], [87.0, 87.67]], "keep_status": [false, false], "silence_prob": [42.76, 0.0], "audiomae_on_audioset": [[["mains hum", 41.31], ["hum", 37.74], ["throbbing", 2.93]], null], "duration": [3.77, 0.67]} \ No newline at end of file diff --git a/annotations_1/RGaBXM3EHUo_filtered.json b/annotations_1/RGaBXM3EHUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a150ed93f5cf3bb1934024d22032559dfaf7c49 --- /dev/null +++ b/annotations_1/RGaBXM3EHUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.12], [14.0, 15.18], [16.0, 18.22], [20.0, 21.61], [23.0, 98.58], [99.0, 100.75], [102.0, 104.87]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [94.66, 0.0, 76.2, 0.0, 0.0, 0.0, 93.6], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [2.12, 1.18, 2.22, 1.61, 75.58, 1.75, 2.87]} \ No newline at end of file diff --git a/annotations_1/RHVyIHN6qOE_filtered.json b/annotations_1/RHVyIHN6qOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5792732f2f65f27fd53fb39373d4e9f1e5cedd8c --- /dev/null +++ b/annotations_1/RHVyIHN6qOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.59], [8.0, 7.89], [9.0, 11.01], [12.0, 12.45], [14.0, 16.5], [18.0, 18.33], [22.0, 24.8], [26.0, 29.61], [30.0, 30.01], [31.0, 33.17], [34.0, 35.88], [50.0, 50.73], [51.0, 52.78], [58.0, 58.5], [64.0, 63.98], [71.0, 74.02], [75.0, 75.3], [77.0, 76.87], [81.0, 81.5]], "keep_status": [false, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 43.74, 0.0, 45.72, 0.0, 40.54, 38.97, 0.0, 41.05, 0.0, 0.0, 0.0, 0.0, 0.0, 32.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 39.53], ["throbbing", 9.03], ["theremin", 6.13]], null, [["music", 66.55], ["didgeridoo", 8.09], ["musical instrument", 4.95]], null, [["music", 41.77], ["didgeridoo", 15.61], ["hum", 7.58]], [["hum", 26.92], ["throbbing", 26.74], ["music", 18.17]], null, [["speech", 21.29], ["throbbing", 18.88], ["hum", 15.68]], null, null, null, null, null, [["throbbing", 60.14], ["hum", 24.76], ["music", 5.09]], null, null, null], "duration": [0.59, -0.11, 2.01, 0.45, 2.5, 0.33, 2.8, 3.61, 0.01, 2.17, 1.88, 0.73, 1.78, 0.5, -0.02, 3.02, 0.3, -0.13, 0.5]} \ No newline at end of file diff --git a/annotations_1/RHlGpxG_-wM_filtered.json b/annotations_1/RHlGpxG_-wM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ac4f075c7b94247ce79617f7615da79b99dad20 --- /dev/null +++ b/annotations_1/RHlGpxG_-wM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.26], [11.0, 13.54], [17.0, 18.25], [30.0, 37.22], [40.0, 40.9], [49.0, 53.65], [60.0, 79.81], [83.0, 84.21], [100.0, 107.87], [111.0, 111.89], [115.0, 116.13], [119.0, 119.79], [122.0, 122.99], [127.0, 128.82]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [69.34, 33.21, 0.0, 35.52, 0.0, 31.24, 30.55, 0.0, 31.89, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 11.51], ["rumble", 8.37], ["music", 6.97]], null, [["music", 57.14], ["speech", 28.99], ["boing", 1.92]], null, [["music", 41.33], ["throbbing", 5.9], ["sound effect", 4.41]], [["speech", 60.87], ["music", 22.24], ["didgeridoo", 3.49]], null, [["speech", 69.01], ["music", 18.12], ["cacophony", 1.73]], null, null, null, null, null], "duration": [3.26, 2.54, 1.25, 7.22, 0.9, 4.65, 19.81, 1.21, 7.87, 0.89, 1.13, 0.79, 0.99, 1.82]} \ No newline at end of file diff --git a/annotations_1/RHmp-rhCrLo_filtered.json b/annotations_1/RHmp-rhCrLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..581e2cd3ed0df51b36c540a32bab30e090f5939f --- /dev/null +++ b/annotations_1/RHmp-rhCrLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.65], [25.0, 26.4], [28.0, 28.46], [31.0, 38.87], [41.0, 45.49], [46.0, 45.52], [46.0, 52.24], [54.0, 57.59], [59.0, 59.44], [61.0, 69.89], [74.0, 77.04], [78.0, 79.39], [81.0, 80.77], [83.0, 83.4], [85.0, 97.12], [98.0, 110.39], [111.0, 111.32], [116.0, 116.65], [118.0, 118.79], [120.0, 120.95], [125.0, 126.71]], "keep_status": [false, false, false, false, true, false, true, true, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.91, 0.0, 0.0, 29.47, 30.94, 0.0, 29.56, 31.08, 0.0, 33.0, 31.65, 0.0, 0.0, 0.0, 30.21, 31.36, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 31.23], ["moo", 20.72], ["livestock, farm animals, working animals", 19.48]], null, null, [["music", 70.31], ["electronic music", 2.26], ["hum", 1.56]], [["whale vocalization", 24.6], ["cattle, bovinae", 10.61], ["moo", 9.87]], null, [["music", 52.25], ["livestock, farm animals, working animals", 5.69], ["cattle, bovinae", 4.86]], [["livestock, farm animals, working animals", 22.91], ["moo", 17.72], ["cattle, bovinae", 14.8]], null, [["cattle, bovinae", 21.19], ["moo", 17.99], ["livestock, farm animals, working animals", 17.5]], [["livestock, farm animals, working animals", 27.92], ["speech", 13.51], ["moo", 12.24]], null, null, null, [["music", 77.1], ["shout", 2.03], ["theremin", 1.98]], [["music", 66.11], ["theremin", 8.07], ["speech", 3.13]], null, null, null, null, null], "duration": [4.65, 1.4, 0.46, 7.87, 4.49, -0.48, 6.24, 3.59, 0.44, 8.89, 3.04, 1.39, -0.23, 0.4, 12.12, 12.39, 0.32, 0.65, 0.79, 0.95, 1.71]} \ No newline at end of file diff --git a/annotations_1/RHz9rXVt3cQ_filtered.json b/annotations_1/RHz9rXVt3cQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbcf0cf4d0bc538f6747e9c72f2eb151f70282ca --- /dev/null +++ b/annotations_1/RHz9rXVt3cQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.42], [9.0, 9.05], [11.0, 12.75], [14.0, 17.2], [22.0, 22.84], [29.0, 29.24], [31.0, 33.56], [35.0, 35.21], [36.0, 38.23], [39.0, 39.23], [41.0, 41.28], [54.0, 53.84], [56.0, 56.51], [58.0, 58.78], [64.0, 64.52], [65.0, 66.26], [88.0, 88.53], [104.0, 108.33], [143.0, 160.96], [164.0, 169.59], [170.0, 170.72], [171.0, 193.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 99.1, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 99.97, 99.85, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 0.05, 1.75, 3.2, 0.84, 0.24, 2.56, 0.21, 2.23, 0.23, 0.28, -0.16, 0.51, 0.78, 0.52, 1.26, 0.53, 4.33, 17.96, 5.59, 0.72, 22.31]} \ No newline at end of file diff --git a/annotations_1/RIInmRkYOXc_filtered.json b/annotations_1/RIInmRkYOXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4e9d149c73f5d530d9007a3a4681d8c5e841f43 --- /dev/null +++ b/annotations_1/RIInmRkYOXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [4.0, 4.85], [6.0, 6.37], [9.0, 9.27], [11.0, 11.38], [12.0, 22.76], [23.0, 26.01], [27.0, 27.95], [29.0, 31.89], [32.0, 34.47], [35.0, 36.49], [40.0, 41.07], [42.0, 43.17], [44.0, 45.22], [46.0, 46.68], [55.0, 62.92], [63.0, 64.27], [64.0, 64.88], [65.0, 72.12], [74.0, 75.32], [78.0, 79.3], [80.0, 83.03], [84.0, 86.43], [88.0, 87.93], [93.0, 93.11], [95.0, 94.98], [97.0, 102.07], [108.0, 109.16], [113.0, 116.55], [117.0, 118.44], [119.0, 120.23], [142.0, 145.23], [145.0, 145.32], [146.0, 148.2], [150.0, 152.2], [155.0, 156.22], [157.0, 156.76], [158.0, 159.97], [160.0, 161.89], [163.0, 163.8], [166.0, 172.29], [174.0, 175.0], [176.0, 177.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 52.33, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.97, 0.0, 0.0, 74.76, 0.0, 0.0, 81.53, 100.0, 0.0, 0.0, 0.0, 41.38, 0.0, 100.0, 0.0, 0.0, 40.64, 0.0, 37.85, 67.51, 0.0, 0.0, 0.0, 0.0, 0.0, 47.16, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 87.25], ["male speech, man speaking", 1.41], ["inside, small room", 0.68]], null, null, null, null, null, null, null, null, null, null, [["thunk", 41.35], ["wood", 12.18], ["speech", 11.23]], null, null, null, null, [["speech", 93.08], ["sidetone", 1.82], ["boing", 1.66]], null, [["speech", 61.26], ["arrow", 5.81], ["telephone", 5.31]], null, null, null, null, null, null, [["speech", 59.69], ["thunk", 17.13], ["doorbell", 6.47]], null, null], "duration": [0.74, 0.85, 0.37, 0.27, 0.38, 10.76, 3.01, 0.95, 2.89, 2.47, 1.49, 1.07, 1.17, 1.22, 0.68, 7.92, 1.27, 0.88, 7.12, 1.32, 1.3, 3.03, 2.43, -0.07, 0.11, -0.02, 5.07, 1.16, 3.55, 1.44, 1.23, 3.23, 0.32, 2.2, 2.2, 1.22, -0.24, 1.97, 1.89, 0.8, 6.29, 1.0, 1.3]} \ No newline at end of file diff --git a/annotations_1/RIzrkbF1-SU_filtered.json b/annotations_1/RIzrkbF1-SU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b38fb9f28f5ee8e6254b2e1d57a19cafdde515c --- /dev/null +++ b/annotations_1/RIzrkbF1-SU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.76], [40.0, 39.87], [42.0, 48.02], [50.0, 60.93], [62.0, 77.09], [80.0, 81.18], [92.0, 92.85], [95.0, 95.67], [120.0, 122.59]], "keep_status": [false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 78.89, 39.8, 40.95, 0.0, 0.0, 0.0, 43.28], "audiomae_on_audioset": [null, null, null, [["explosion", 31.34], ["music", 19.59], ["speech", 12.99]], [["singing bowl", 34.14], ["music", 22.03], ["speech", 16.0]], null, null, null, [["speech", 27.97], ["music", 26.44], ["ambient music", 4.36]]], "duration": [0.76, -0.13, 6.02, 10.93, 15.09, 1.18, 0.85, 0.67, 2.59]} \ No newline at end of file diff --git a/annotations_1/RJEoUwZdwfk_filtered.json b/annotations_1/RJEoUwZdwfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7adede47e38dbfbd37cf48dc58d20ba5c5aab141 --- /dev/null +++ b/annotations_1/RJEoUwZdwfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 47.58], [49.0, 58.09], [59.0, 60.39], [61.0, 83.07], [84.0, 84.86], [89.0, 89.78], [95.0, 96.35], [103.0, 103.74], [123.0, 136.12], [140.0, 150.69]], "keep_status": [true, true, false, true, false, false, false, false, true, true], "silence_prob": [30.42, 30.23, 0.0, 30.77, 0.0, 0.0, 0.0, 0.0, 30.06, 29.45], "audiomae_on_audioset": [[["cattle, bovinae", 15.54], ["fly, housefly", 14.14], ["moo", 14.04]], [["speech", 23.91], ["music", 21.51], ["sidetone", 20.4]], null, [["wild animals", 22.26], ["animal", 16.18], ["speech", 12.05]], null, null, null, null, [["buzz", 23.05], ["speech", 15.44], ["hum", 7.24]], [["music", 29.01], ["smash, crash", 15.25], ["car", 5.39]]], "duration": [4.58, 9.09, 1.39, 22.07, 0.86, 0.78, 1.35, 0.74, 13.12, 10.69]} \ No newline at end of file diff --git a/annotations_1/RLbry-3z8yQ_filtered.json b/annotations_1/RLbry-3z8yQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72874a5af953dc55034a214fba4d5d1f154c4453 --- /dev/null +++ b/annotations_1/RLbry-3z8yQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.16], [5.0, 6.17], [9.0, 13.95], [19.0, 19.8], [32.0, 44.32], [45.0, 45.91], [47.0, 70.16], [73.0, 73.14], [73.0, 73.18], [74.0, 75.71], [78.0, 85.9], [87.0, 87.51], [91.0, 91.52], [94.0, 94.44], [102.0, 103.38], [104.0, 105.66], [106.0, 106.84], [112.0, 115.65], [118.0, 119.1], [123.0, 123.4], [124.0, 125.93], [129.0, 129.47], [130.0, 131.14], [133.0, 135.78], [138.0, 138.6], [144.0, 144.88], [156.0, 157.42], [164.0, 166.11], [168.0, 169.08]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.38, 0.0, 33.98, 0.0, 32.79, 0.0, 0.0, 0.0, 35.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.35, 0.0, 0.0, 0.0, 0.0, 0.0, 42.19, 0.0, 0.0, 0.0, 52.22, 0.0], "audiomae_on_audioset": [null, null, [["music", 17.75], ["hum", 6.39], ["mains hum", 4.56]], null, [["music", 47.67], ["boing", 32.97], ["speech", 5.52]], null, [["music", 52.0], ["speech", 21.89], ["boing", 3.76]], null, null, null, [["music", 81.12], ["synthesizer", 3.6], ["didgeridoo", 3.17]], null, null, null, null, null, null, [["speech", 40.24], ["music", 20.24], ["mains hum", 6.21]], null, null, null, null, null, [["music", 18.34], ["buzz", 8.92], ["didgeridoo", 8.0]], null, null, null, null, null], "duration": [1.16, 1.17, 4.95, 0.8, 12.32, 0.91, 23.16, 0.14, 0.18, 1.71, 7.9, 0.51, 0.52, 0.44, 1.38, 1.66, 0.84, 3.65, 1.1, 0.4, 1.93, 0.47, 1.14, 2.78, 0.6, 0.88, 1.42, 2.11, 1.08]} \ No newline at end of file diff --git a/annotations_1/RM0NW8MF9wY_filtered.json b/annotations_1/RM0NW8MF9wY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e09d602a6256de733d240f4c6f6fec08c5ab4c09 --- /dev/null +++ b/annotations_1/RM0NW8MF9wY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.37], [8.0, 15.52], [17.0, 22.94], [24.0, 36.64], [41.0, 48.37], [49.0, 52.27], [61.0, 70.26], [76.0, 95.18], [98.0, 98.56], [103.0, 117.34], [120.0, 148.61], [149.0, 151.36], [155.0, 155.51], [159.0, 159.17]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, true, false, false], "silence_prob": [93.13, 72.75, 46.75, 30.0, 29.25, 29.24, 29.3, 29.38, 0.0, 28.83, 30.0, 40.02, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["fly, housefly", 52.16], ["insect", 27.01], ["bee, wasp, etc.", 4.57]], [["vehicle", 18.48], ["car", 9.8], ["race car, auto racing", 9.54]], [["music", 40.53], ["sidetone", 32.54], ["speech", 7.78]], [["music", 79.63], ["didgeridoo", 4.53], ["musical instrument", 1.03]], [["music", 63.26], ["synthetic singing", 18.31], ["rock and roll", 1.74]], [["music", 89.03], ["didgeridoo", 1.96], ["speech", 1.04]], null, [["music", 73.2], ["musical instrument", 2.52], ["funny music", 2.41]], [["music", 41.44], ["cattle, bovinae", 10.12], ["livestock, farm animals, working animals", 10.1]], [["sidetone", 21.65], ["mosquito", 10.71], ["music", 8.71]], null, null], "duration": [5.37, 7.52, 5.94, 12.64, 7.37, 3.27, 9.26, 19.18, 0.56, 14.34, 28.61, 2.36, 0.51, 0.17]} \ No newline at end of file diff --git a/annotations_1/RMWfAkUhGCM_filtered.json b/annotations_1/RMWfAkUhGCM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49e13cec0f5da6c6af010252fb809fe2fb4fe5a4 --- /dev/null +++ b/annotations_1/RMWfAkUhGCM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 24.06], [28.0, 79.93], [82.0, 93.65], [102.0, 113.61], [114.0, 117.15], [119.0, 121.49], [122.0, 126.64], [132.0, 131.9], [133.0, 133.44], [137.0, 138.91]], "keep_status": [true, false, false, true, false, false, false, false, false, false], "silence_prob": [30.16, 0.0, 60.42, 36.82, 84.8, 91.3, 48.48, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.45], ["foghorn", 7.81], ["speech", 6.13]], null, null, [["music", 42.84], ["hum", 9.16], ["rumble", 5.82]], null, null, [["music", 74.57], ["synthesizer", 6.3], ["drum machine", 3.34]], null, null, null], "duration": [7.06, 51.93, 11.65, 11.61, 3.15, 2.49, 4.64, -0.1, 0.44, 1.91]} \ No newline at end of file diff --git a/annotations_1/RMaNfwSn-pw_filtered.json b/annotations_1/RMaNfwSn-pw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1a2970057fff8a2dc75392f6b1a84aedebdc971 --- /dev/null +++ b/annotations_1/RMaNfwSn-pw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.84], [10.0, 10.03], [17.0, 17.32], [26.0, 27.14], [29.0, 29.59], [31.0, 33.45], [39.0, 48.79], [50.0, 49.79], [50.0, 58.77], [62.0, 65.75], [70.0, 70.11], [71.0, 71.12], [78.0, 78.6], [88.0, 103.03], [109.0, 108.95], [110.0, 124.53], [126.0, 139.28], [141.0, 147.77], [160.0, 161.03], [162.0, 162.36], [169.0, 176.55], [177.0, 176.59]], "keep_status": [false, false, false, false, false, true, false, false, true, true, false, false, false, true, false, true, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 49.45, 53.72, 0.0, 33.65, 42.26, 0.0, 0.0, 0.0, 39.5, 0.0, 45.56, 46.19, 39.93, 0.0, 0.0, 47.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 37.57], ["pulse", 8.64], ["rumble", 6.38]], null, null, [["speech", 25.72], ["music", 15.01], ["groan", 8.65]], [["music", 30.07], ["rumble", 14.62], ["hum", 13.37]], null, null, null, [["speech", 14.19], ["siren", 11.29], ["whale vocalization", 10.73]], null, [["hum", 29.83], ["mains hum", 20.98], ["breaking", 6.56]], [["mains hum", 38.87], ["hum", 21.97], ["speech", 4.88]], [["noise", 18.39], ["speech", 11.4], ["hum", 11.03]], null, null, [["speech", 39.92], ["bee, wasp, etc.", 12.27], ["insect", 11.66]], null], "duration": [1.84, 0.03, 0.32, 1.14, 0.59, 2.45, 9.79, -0.21, 8.77, 3.75, 0.11, 0.12, 0.6, 15.03, -0.05, 14.53, 13.28, 6.77, 1.03, 0.36, 7.55, -0.41]} \ No newline at end of file diff --git a/annotations_1/RNJ7CL89IFM_filtered.json b/annotations_1/RNJ7CL89IFM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed58f08354ad5a14cf9063565ee908b61b4ad4b9 --- /dev/null +++ b/annotations_1/RNJ7CL89IFM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.48], [35.0, 35.92], [38.0, 40.42], [41.0, 41.89], [42.0, 43.7], [45.0, 45.5], [48.0, 48.98], [49.0, 49.6], [50.0, 52.34], [57.0, 58.13], [60.0, 60.81], [64.0, 65.15], [67.0, 68.74], [70.0, 74.21], [76.0, 91.17], [91.0, 98.83], [100.0, 103.28], [105.0, 105.36], [108.0, 113.05], [114.0, 119.55], [121.0, 122.42], [125.0, 127.06], [128.0, 129.37], [132.0, 133.71], [135.0, 137.74], [141.0, 143.11], [143.0, 145.57], [147.0, 150.97], [152.0, 176.81], [177.0, 180.01], [182.0, 183.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 41.44, 62.47, 59.59, 97.0, 0.0, 94.52, 99.73, 0.0, 96.66, 0.0, 0.0, 69.61, 87.19, 72.9, 77.2, 51.07, 61.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.62], ["speech", 29.38], ["guitar", 5.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 0.92, 2.42, 0.89, 1.7, 0.5, 0.98, 0.6, 2.34, 1.13, 0.81, 1.15, 1.74, 4.21, 15.17, 7.83, 3.28, 0.36, 5.05, 5.55, 1.42, 2.06, 1.37, 1.71, 2.74, 2.11, 2.57, 3.97, 24.81, 3.01, 1.41]} \ No newline at end of file diff --git a/annotations_1/RNPPrvhTKuc_filtered.json b/annotations_1/RNPPrvhTKuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..deb89996208b6fad5b12f0da77657d32dc39c946 --- /dev/null +++ b/annotations_1/RNPPrvhTKuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 26.69], [32.0, 65.06], [66.0, 66.78], [69.0, 71.25], [74.0, 77.18], [78.0, 78.58], [80.0, 81.7], [84.0, 85.06], [87.0, 89.14], [91.0, 94.95], [96.0, 98.22], [102.0, 115.28], [120.0, 122.18], [123.0, 123.53], [125.0, 126.2], [129.0, 129.69], [131.0, 130.92]], "keep_status": [false, false, false, true, true, false, false, false, true, false, false, true, true, false, false, false, false], "silence_prob": [35.12, 0.0, 0.0, 44.99, 38.16, 0.0, 0.0, 0.0, 42.88, 86.64, 35.15, 31.72, 32.83, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.13], ["synthesizer", 4.87], ["hum", 4.28]], null, null, [["speech", 42.39], ["music", 20.06], ["sonar", 4.64]], [["music", 22.82], ["bell", 8.32], ["reverberation", 8.08]], null, null, null, [["noise", 29.95], ["radio", 23.37], ["mains hum", 11.35]], null, [["speech", 62.21], ["busy signal", 24.81], ["dial tone", 3.27]], [["speech", 53.39], ["sidetone", 8.27], ["electric shaver, electric razor", 5.87]], [["speech", 38.91], ["radio", 12.41], ["fire alarm", 5.14]], null, null, null, null], "duration": [16.69, 33.06, 0.78, 2.25, 3.18, 0.58, 1.7, 1.06, 2.14, 3.95, 2.22, 13.28, 2.18, 0.53, 1.2, 0.69, -0.08]} \ No newline at end of file diff --git a/annotations_1/ROXLPqlbJck_filtered.json b/annotations_1/ROXLPqlbJck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e01ee3ec446fa1c5d9bd18df00cd78fdaf1ec9a --- /dev/null +++ b/annotations_1/ROXLPqlbJck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[55.0, 65.08], [66.0, 67.74], [69.0, 78.21], [84.0, 103.76], [106.0, 121.56], [123.0, 135.43], [138.0, 150.58]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [71.72, 0.0, 81.0, 59.33, 29.59, 30.55, 47.2], "audiomae_on_audioset": [null, null, null, null, [["hum", 27.46], ["mains hum", 25.98], ["music", 17.03]], [["music", 60.93], ["hum", 8.92], ["electronic music", 4.68]], [["music", 50.74], ["hum", 5.52], ["ambient music", 5.08]]], "duration": [10.08, 1.74, 9.21, 19.76, 15.56, 12.43, 12.58]} \ No newline at end of file diff --git a/annotations_1/ROeFmcvZRf8_filtered.json b/annotations_1/ROeFmcvZRf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff40844042c98382c43cf9dc1354c3f7cfe4e4d5 --- /dev/null +++ b/annotations_1/ROeFmcvZRf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.22], [28.0, 27.99], [32.0, 37.99], [40.0, 41.05], [45.0, 48.0], [51.0, 64.94], [73.0, 78.22], [78.0, 78.26], [79.0, 90.63], [91.0, 91.62], [92.0, 93.48], [94.0, 99.89], [101.0, 103.6], [104.0, 108.8], [112.0, 119.64], [124.0, 125.37], [126.0, 128.04], [134.0, 143.4], [147.0, 146.84], [148.0, 186.09], [188.0, 195.47], [196.0, 195.94]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false], "silence_prob": [69.34, 0.0, 55.11, 0.0, 40.52, 29.91, 29.11, 0.0, 32.58, 0.0, 0.0, 30.43, 32.99, 30.67, 30.14, 0.0, 33.28, 30.84, 0.0, 0.0, 31.46, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 37.86], ["music", 23.91], ["sidetone", 5.35]], [["music", 40.31], ["speech", 30.18], ["didgeridoo", 2.8]], [["music", 38.49], ["speech", 34.18], ["whack, thwack", 5.03]], null, [["music", 67.29], ["sidetone", 11.79], ["throbbing", 3.97]], null, null, [["music", 32.15], ["speech", 27.72], ["throbbing", 11.18]], [["speech", 19.78], ["sidetone", 19.0], ["hum", 12.64]], [["thunk", 42.77], ["speech", 11.69], ["whack, thwack", 8.06]], [["music", 47.81], ["speech", 25.28], ["throbbing", 5.4]], null, [["throbbing", 38.19], ["hum", 29.85], ["music", 14.2]], [["music", 29.41], ["whack, thwack", 24.4], ["speech", 5.57]], null, null, [["hum", 41.75], ["mains hum", 24.77], ["throbbing", 14.92]], null], "duration": [2.22, -0.01, 5.99, 1.05, 3.0, 13.94, 5.22, 0.26, 11.63, 0.62, 1.48, 5.89, 2.6, 4.8, 7.64, 1.37, 2.04, 9.4, -0.16, 38.09, 7.47, -0.06]} \ No newline at end of file diff --git a/annotations_1/ROlSjAgE93Q_filtered.json b/annotations_1/ROlSjAgE93Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..146be2ed38bc3d300337c73ce827b767a111b13d --- /dev/null +++ b/annotations_1/ROlSjAgE93Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 10.94], [11.0, 11.97], [19.0, 19.6], [24.0, 25.47], [31.0, 34.21], [36.0, 36.75], [38.0, 40.37], [46.0, 54.97], [59.0, 60.51], [63.0, 64.81]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [41.68, 0.0, 0.0, 0.0, 59.42, 0.0, 47.12, 46.86, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 50.83], ["speech", 17.15], ["throbbing", 12.9]], null, null, null, null, null, [["hum", 43.21], ["music", 11.48], ["throbbing", 9.1]], [["music", 62.83], ["hum", 12.79], ["mains hum", 6.97]], null, null], "duration": [9.94, 0.97, 0.6, 1.47, 3.21, 0.75, 2.37, 8.97, 1.51, 1.81]} \ No newline at end of file diff --git a/annotations_1/ROqfvY68ijM_filtered.json b/annotations_1/ROqfvY68ijM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5b3ff16adae812269cfba9fd558befb0a458faf --- /dev/null +++ b/annotations_1/ROqfvY68ijM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[76.0, 78.14], [78.0, 81.53], [84.0, 86.97], [88.0, 91.69], [96.0, 101.56], [103.0, 120.33], [121.0, 122.13], [126.0, 128.11]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [88.46, 99.73, 99.99, 83.16, 99.93, 99.1, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [2.14, 3.53, 2.97, 3.69, 5.56, 17.33, 1.13, 2.11]} \ No newline at end of file diff --git a/annotations_1/RPW4sx3UYjU_filtered.json b/annotations_1/RPW4sx3UYjU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fa7659f4686125dc11465d1a2441843ef15d276 --- /dev/null +++ b/annotations_1/RPW4sx3UYjU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.77], [5.0, 6.25], [10.0, 14.34], [20.0, 21.54], [22.0, 23.94], [24.0, 24.93], [25.0, 25.44], [27.0, 29.46], [31.0, 31.8], [33.0, 40.42], [42.0, 43.06], [44.0, 44.78], [47.0, 48.42], [51.0, 52.37], [56.0, 56.91], [57.0, 58.13], [58.0, 60.05], [61.0, 61.84], [63.0, 63.04], [64.0, 65.7], [68.0, 67.61], [69.0, 70.06], [72.0, 73.06], [73.0, 73.57], [74.0, 78.58], [81.0, 103.1], [104.0, 104.79], [105.0, 105.71], [109.0, 109.43], [113.0, 113.32], [115.0, 115.62], [119.0, 120.14], [123.0, 125.2], [140.0, 140.1], [145.0, 145.17], [157.0, 157.23], [159.0, 159.24], [162.0, 163.04], [168.0, 168.86], [171.0, 170.78]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 65.44, 0.0, 0.0, 0.0, 0.0, 47.82, 0.0, 50.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 74.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["creak", 12.63], ["hum", 11.16], ["music", 9.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.77, 1.25, 4.34, 1.54, 1.94, 0.93, 0.44, 2.46, 0.8, 7.42, 1.06, 0.78, 1.42, 1.37, 0.91, 1.13, 2.05, 0.84, 0.04, 1.7, -0.39, 1.06, 1.06, 0.57, 4.58, 22.1, 0.79, 0.71, 0.43, 0.32, 0.62, 1.14, 2.2, 0.1, 0.17, 0.23, 0.24, 1.04, 0.86, -0.22]} \ No newline at end of file diff --git a/annotations_1/RRDbQPvtAxY_filtered.json b/annotations_1/RRDbQPvtAxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7103a30af1266cdacf767146f86bdf62b2f94b2f --- /dev/null +++ b/annotations_1/RRDbQPvtAxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.04], [7.0, 8.61], [10.0, 11.91], [12.0, 12.87], [15.0, 16.77], [17.0, 21.63], [25.0, 24.73], [27.0, 27.9], [28.0, 28.36], [45.0, 45.1], [46.0, 50.04], [54.0, 63.1], [64.0, 64.52], [66.0, 74.17], [78.0, 80.03], [81.0, 81.57], [82.0, 82.39], [83.0, 86.31], [95.0, 96.43], [102.0, 102.36], [111.0, 111.1]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.78, 0.0, 0.0, 0.0, 0.0, 32.39, 33.27, 0.0, 31.96, 32.05, 0.0, 0.0, 32.44, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["animal", 23.51], ["music", 19.03], ["cattle, bovinae", 8.28]], null, null, null, null, [["music", 55.61], ["whale vocalization", 6.58], ["cacophony", 3.31]], [["music", 27.27], ["livestock, farm animals, working animals", 10.75], ["moo", 9.36]], null, [["mosquito", 35.23], ["music", 21.81], ["fly, housefly", 17.85]], [["speech", 19.72], ["music", 16.87], ["sound effect", 5.36]], null, null, [["music", 65.0], ["musical instrument", 5.65], ["carnatic music", 2.02]], null, null, null], "duration": [0.04, 1.61, 1.91, 0.87, 1.77, 4.63, -0.27, 0.9, 0.36, 0.1, 4.04, 9.1, 0.52, 8.17, 2.03, 0.57, 0.39, 3.31, 1.43, 0.36, 0.1]} \ No newline at end of file diff --git a/annotations_1/RRDzDy5wLh4_filtered.json b/annotations_1/RRDzDy5wLh4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bdff26eb9beccc03c7853fb7327431b990e0c55 --- /dev/null +++ b/annotations_1/RRDzDy5wLh4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 21.73], [30.0, 30.64], [34.0, 34.1], [37.0, 41.77], [49.0, 49.38], [50.0, 53.25], [58.0, 89.06], [93.0, 94.8], [100.0, 103.42], [104.0, 104.55], [111.0, 127.94], [130.0, 133.73], [138.0, 142.96], [145.0, 151.71], [157.0, 164.0], [168.0, 180.28], [188.0, 188.79], [190.0, 190.48], [192.0, 192.55]], "keep_status": [false, false, false, true, false, true, false, false, true, false, false, true, true, false, false, false, false, false, false], "silence_prob": [33.9, 0.0, 0.0, 35.46, 0.0, 33.24, 0.0, 0.0, 36.82, 0.0, 34.35, 34.6, 31.77, 32.36, 32.96, 32.21, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 77.3], ["theremin", 2.83], ["hum", 2.32]], null, null, [["music", 38.59], ["mains hum", 11.76], ["theremin", 9.97]], null, [["music", 45.56], ["boing", 13.76], ["speech", 3.87]], null, null, [["speech", 37.76], ["music", 18.79], ["vehicle", 8.55]], null, [["music", 43.34], ["speech", 25.52], ["musical instrument", 2.64]], [["music", 50.83], ["hum", 10.71], ["mains hum", 6.92]], [["vehicle", 26.64], ["music", 12.41], ["car", 6.59]], [["speech", 36.47], ["music", 32.87], ["theremin", 14.67]], [["speech", 61.05], ["sidetone", 10.55], ["music", 7.83]], [["music", 78.44], ["musical instrument", 3.68], ["trombone", 2.38]], null, null, null], "duration": [18.73, 0.64, 0.1, 4.77, 0.38, 3.25, 31.06, 1.8, 3.42, 0.55, 16.94, 3.73, 4.96, 6.71, 7.0, 12.28, 0.79, 0.48, 0.55]} \ No newline at end of file diff --git a/annotations_1/RSl6bwZabjA_filtered.json b/annotations_1/RSl6bwZabjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e026f5f18349e0790b3dcb7cb09ae7677404526 --- /dev/null +++ b/annotations_1/RSl6bwZabjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.03], [9.0, 9.29], [10.0, 10.54], [12.0, 16.39], [17.0, 20.44], [22.0, 28.97], [30.0, 31.45], [34.0, 36.21], [39.0, 40.12], [42.0, 44.41], [50.0, 51.88], [53.0, 74.34], [76.0, 76.91], [78.0, 79.95], [82.0, 90.37], [91.0, 98.81], [99.0, 104.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.74, 0.0, 0.0, 53.53, 86.09, 68.28, 0.0, 77.03, 0.0, 50.41, 0.0, 71.0, 0.0, 0.0, 55.25, 73.06, 62.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.03, 0.29, 0.54, 4.39, 3.44, 6.97, 1.45, 2.21, 1.12, 2.41, 1.88, 21.34, 0.91, 1.95, 8.37, 7.81, 5.55]} \ No newline at end of file diff --git a/annotations_1/RU2IP_oUqyc_filtered.json b/annotations_1/RU2IP_oUqyc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cef16b3d1da4a92752621b17fb83588631197f1 --- /dev/null +++ b/annotations_1/RU2IP_oUqyc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.39], [17.0, 20.14], [22.0, 32.37], [34.0, 36.05], [38.0, 42.47], [51.0, 52.54], [53.0, 54.77], [55.0, 70.21], [74.0, 84.97], [91.0, 91.66], [93.0, 93.36], [98.0, 98.78], [100.0, 103.49], [106.0, 106.98], [108.0, 116.36], [119.0, 122.69], [124.0, 126.0], [128.0, 137.35], [140.0, 141.12], [143.0, 156.42], [162.0, 161.74]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, true, false, true, true, true, true, false, false, false], "silence_prob": [47.31, 45.27, 29.34, 36.72, 29.61, 0.0, 0.0, 40.93, 55.25, 0.0, 0.0, 0.0, 33.61, 0.0, 43.05, 35.93, 37.78, 42.44, 0.0, 29.28, 0.0], "audiomae_on_audioset": [[["music", 33.93], ["hum", 6.53], ["mains hum", 4.24]], [["music", 55.6], ["frog", 10.1], ["croak", 4.36]], [["speech", 52.47], ["music", 14.39], ["vehicle", 5.29]], [["speech", 64.62], ["vehicle", 7.14], ["motorcycle", 3.24]], [["speech", 68.68], ["vehicle", 4.51], ["music", 4.3]], null, null, [["music", 37.14], ["speech", 14.42], ["hum", 12.29]], null, null, null, null, [["hum", 30.37], ["mains hum", 26.45], ["music", 10.53]], null, [["crushing", 25.74], ["music", 16.39], ["hum", 16.37]], [["speech", 58.53], ["music", 4.29], ["hum", 3.1]], [["music", 52.62], ["theremin", 9.07], ["synthesizer", 3.54]], [["hum", 24.16], ["noise", 16.8], ["mains hum", 14.11]], null, [["music", 82.19], ["scary music", 5.6], ["soundtrack music", 2.22]], null], "duration": [2.39, 3.14, 10.37, 2.05, 4.47, 1.54, 1.77, 15.21, 10.97, 0.66, 0.36, 0.78, 3.49, 0.98, 8.36, 3.69, 2.0, 9.35, 1.12, 13.42, -0.26]} \ No newline at end of file diff --git a/annotations_1/RUUhcK3Pt14_filtered.json b/annotations_1/RUUhcK3Pt14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01dacc03f3a81a287a65281cf628803439ce1cbf --- /dev/null +++ b/annotations_1/RUUhcK3Pt14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 19.6], [24.0, 23.79], [36.0, 36.46], [45.0, 45.49], [46.0, 46.45], [48.0, 49.17], [50.0, 56.39], [60.0, 60.1], [61.0, 61.89], [65.0, 65.57], [74.0, 74.92], [79.0, 79.91], [81.0, 82.61], [89.0, 89.92], [93.0, 94.96], [97.0, 97.83], [101.0, 100.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.4, -0.21, 0.46, 0.49, 0.45, 1.17, 6.39, 0.1, 0.89, 0.57, 0.92, 0.91, 1.61, 0.92, 1.96, 0.83, -0.1]} \ No newline at end of file diff --git a/annotations_1/RV0EbFEZpT8_filtered.json b/annotations_1/RV0EbFEZpT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d3e7c4a7e4dbdc77b8a617fb8e0b1e84e37272b --- /dev/null +++ b/annotations_1/RV0EbFEZpT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.57], [11.0, 20.68], [22.0, 26.18], [27.0, 30.45], [31.0, 31.65], [33.0, 33.27], [36.0, 44.81], [46.0, 48.1], [49.0, 49.52], [51.0, 51.24], [53.0, 53.77], [55.0, 56.39], [57.0, 73.08], [78.0, 81.75], [82.0, 81.85], [82.0, 81.94], [82.0, 96.23], [101.0, 112.63], [113.0, 114.44], [114.0, 129.14]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, true, true, false, false, true, true, false, false], "silence_prob": [73.82, 58.22, 60.05, 81.35, 0.0, 0.0, 35.76, 49.68, 0.0, 0.0, 0.0, 0.0, 36.31, 41.18, 0.0, 0.0, 34.98, 33.07, 0.0, 32.56], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 36.87], ["boat, water vehicle", 9.28], ["outside, rural or natural", 6.56]], [["speech", 24.32], ["fly, housefly", 17.04], ["bee, wasp, etc.", 6.81]], null, null, null, null, [["speech", 32.93], ["vehicle", 14.94], ["car", 6.49]], [["hum", 33.67], ["mains hum", 18.4], ["throbbing", 11.54]], null, null, [["speech", 25.61], ["hum", 15.0], ["buzz", 10.08]], [["speech", 33.77], ["vehicle", 25.2], ["car", 7.93]], null, [["mains hum", 33.41], ["music", 24.92], ["hum", 21.85]]], "duration": [2.57, 9.68, 4.18, 3.45, 0.65, 0.27, 8.81, 2.1, 0.52, 0.24, 0.77, 1.39, 16.08, 3.75, -0.15, -0.06, 14.23, 11.63, 1.44, 15.14]} \ No newline at end of file diff --git a/annotations_1/RWYM4Npp9rI_filtered.json b/annotations_1/RWYM4Npp9rI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4308b9dac9617bd017d07fdc93a5888fb1948970 --- /dev/null +++ b/annotations_1/RWYM4Npp9rI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.71], [23.0, 24.61], [28.0, 28.22], [31.0, 34.05], [34.0, 35.11], [39.0, 38.77], [39.0, 80.72], [83.0, 82.97], [84.0, 84.82], [91.0, 92.31], [95.0, 95.1], [97.0, 96.75], [99.0, 99.08], [100.0, 100.26], [103.0, 108.46], [110.0, 109.8], [110.0, 110.3], [111.0, 113.37], [116.0, 127.43], [128.0, 129.14], [130.0, 131.25], [134.0, 135.3], [138.0, 147.43], [149.0, 157.54], [161.0, 196.99], [197.0, 202.66]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [32.25, 0.0, 0.0, 30.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.62, 0.0, 0.0, 71.0, 31.88, 0.0, 0.0, 0.0, 30.4, 30.55, 0.0, 32.93], "audiomae_on_audioset": [[["animal", 40.79], ["dog", 18.36], ["bow-wow", 14.7]], null, null, [["speech", 23.3], ["music", 22.6], ["wind instrument, woodwind instrument", 6.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.7], ["hum", 7.31], ["mains hum", 3.71]], null, null, null, [["speech", 73.64], ["music", 8.06], ["bleat", 2.9]], [["speech", 45.06], ["music", 19.13], ["buzz", 3.08]], null, [["speech", 52.92], ["music", 19.3], ["breaking", 4.91]]], "duration": [6.71, 1.61, 0.22, 3.05, 1.11, -0.23, 41.72, -0.03, 0.82, 1.31, 0.1, -0.25, 0.08, 0.26, 5.46, -0.2, 0.3, 2.37, 11.43, 1.14, 1.25, 1.3, 9.43, 8.54, 35.99, 5.66]} \ No newline at end of file diff --git a/annotations_1/RWfQwm_BgZY_filtered.json b/annotations_1/RWfQwm_BgZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95b6d951128d94986df146d7f09700c61889f5a3 --- /dev/null +++ b/annotations_1/RWfQwm_BgZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.17], [24.0, 34.21], [57.0, 57.16], [64.0, 64.69], [69.0, 68.61], [72.0, 73.99], [77.0, 76.84], [98.0, 100.62], [134.0, 135.35], [136.0, 136.51], [139.0, 139.45], [144.0, 145.74], [146.0, 148.14], [150.0, 154.94], [162.0, 170.75], [173.0, 183.95]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [43.96, 38.2, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 49.59, 30.74, 29.59, 29.86], "audiomae_on_audioset": [[["speech", 11.99], ["pig", 8.64], ["animal", 6.62]], [["speech", 65.75], ["whale vocalization", 9.46], ["beatboxing", 2.17]], null, null, null, null, null, null, null, null, null, null, [["speech", 32.51], ["hum", 8.96], ["music", 6.8]], [["cattle, bovinae", 40.99], ["livestock, farm animals, working animals", 31.36], ["moo", 19.84]], [["speech", 57.16], ["animal", 13.46], ["livestock, farm animals, working animals", 4.71]], [["music", 51.31], ["speech", 15.26], ["cattle, bovinae", 1.94]]], "duration": [2.17, 10.21, 0.16, 0.69, -0.39, 1.99, -0.16, 2.62, 1.35, 0.51, 0.45, 1.74, 2.14, 4.94, 8.75, 10.95]} \ No newline at end of file diff --git a/annotations_1/RY1FQGd1Bb4_filtered.json b/annotations_1/RY1FQGd1Bb4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..635f32e9a559be62d448bb9c1e4bdf3e0f774f60 --- /dev/null +++ b/annotations_1/RY1FQGd1Bb4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.95], [11.0, 13.04], [16.0, 16.75], [19.0, 31.21], [32.0, 32.29], [34.0, 34.75], [39.0, 38.72], [42.0, 42.18], [62.0, 62.78], [67.0, 68.49], [70.0, 70.28], [76.0, 77.99], [80.0, 80.92], [82.0, 83.47], [84.0, 83.66], [84.0, 83.91], [94.0, 94.12], [95.0, 95.98], [102.0, 101.8], [103.0, 104.5], [109.0, 108.95], [113.0, 113.61], [120.0, 122.3], [123.0, 125.42], [128.0, 129.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.71, 0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 56.33, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.95, 2.04, 0.75, 12.21, 0.29, 0.75, -0.28, 0.18, 0.78, 1.49, 0.28, 1.99, 0.92, 1.47, -0.34, -0.09, 0.12, 0.98, -0.2, 1.5, -0.05, 0.61, 2.3, 2.42, 1.27]} \ No newline at end of file diff --git a/annotations_1/RYP_NSi9g3Y_filtered.json b/annotations_1/RYP_NSi9g3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e04a84d60552cccf3d497dc1636c4a5d20859b67 --- /dev/null +++ b/annotations_1/RYP_NSi9g3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 22.91], [24.0, 42.33], [54.0, 56.44], [57.0, 57.33], [64.0, 64.44], [65.0, 65.26], [68.0, 72.81], [76.0, 78.56], [79.0, 78.6], [83.0, 82.73], [83.0, 87.42]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [31.47, 31.59, 34.04, 0.0, 0.0, 0.0, 43.82, 29.97, 0.0, 0.0, 31.78], "audiomae_on_audioset": [[["speech", 54.3], ["helicopter", 20.27], ["vehicle", 12.46]], [["music", 21.69], ["electronic music", 21.53], ["hum", 17.05]], [["music", 77.46], ["musical instrument", 4.25], ["theremin", 1.99]], null, null, null, [["music", 45.43], ["guitar", 11.37], ["musical instrument", 9.28]], [["music", 67.93], ["piano", 4.3], ["musical instrument", 3.87]], null, null, [["music", 66.19], ["theremin", 6.23], ["musical instrument", 2.83]]], "duration": [4.91, 18.33, 2.44, 0.33, 0.44, 0.26, 4.81, 2.56, -0.4, -0.27, 4.42]} \ No newline at end of file diff --git a/annotations_1/RY_D9rFoWLo_filtered.json b/annotations_1/RY_D9rFoWLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e8ab8d964697fc8167757271477ebe3c73b1d6a --- /dev/null +++ b/annotations_1/RY_D9rFoWLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 41.74], [48.0, 53.42], [54.0, 70.06], [72.0, 95.69], [97.0, 157.69]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 75.72, 38.16, 31.49, 0.0], "audiomae_on_audioset": [null, null, [["speech", 43.85], ["music", 17.16], ["throbbing", 2.61]], [["speech", 45.81], ["music", 23.43], ["throbbing", 7.46]], null], "duration": [-0.26, 5.42, 16.06, 23.69, 60.69]} \ No newline at end of file diff --git a/annotations_1/RZKKrQ8y_Uw_filtered.json b/annotations_1/RZKKrQ8y_Uw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db4485e8f81797a354e464409306d31c29f63a4f --- /dev/null +++ b/annotations_1/RZKKrQ8y_Uw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.55], [13.0, 16.21], [18.0, 19.63], [21.0, 30.3], [31.0, 32.58], [33.0, 48.42], [49.0, 67.8], [68.0, 70.43], [75.0, 80.62], [85.0, 85.21], [87.0, 90.64], [92.0, 92.35], [96.0, 95.74], [96.0, 107.82], [110.0, 119.94], [125.0, 126.25], [128.0, 134.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.61, 98.99, 0.0, 99.26, 0.0, 79.76, 77.53, 83.34, 99.44, 0.0, 97.83, 0.0, 0.0, 62.47, 55.46, 0.0, 45.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.98], ["brass instrument", 9.37], ["trombone", 8.18]]], "duration": [2.55, 3.21, 1.63, 9.3, 1.58, 15.42, 18.8, 2.43, 5.62, 0.21, 3.64, 0.35, -0.26, 11.82, 9.94, 1.25, 6.47]} \ No newline at end of file diff --git a/annotations_1/RZdQIbRXNCU_filtered.json b/annotations_1/RZdQIbRXNCU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5034e1e74631ba56e1d57ce7c685512e9276ef8 --- /dev/null +++ b/annotations_1/RZdQIbRXNCU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.7], [13.0, 16.01], [20.0, 26.16], [30.0, 33.86], [60.0, 61.11], [66.0, 66.09], [83.0, 83.94], [101.0, 102.19], [126.0, 130.4]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.97, 42.28, 45.3, 0.0, 0.0, 0.0, 0.0, 40.12], "audiomae_on_audioset": [null, null, [["sidetone", 37.78], ["speech", 35.78], ["fly, housefly", 5.7]], [["music", 60.46], ["speech", 11.51], ["sidetone", 5.44]], null, null, null, null, [["music", 56.57], ["throbbing", 15.24], ["hum", 4.78]]], "duration": [1.7, 3.01, 6.16, 3.86, 1.11, 0.09, 0.94, 1.19, 4.4]} \ No newline at end of file diff --git a/annotations_1/R_4_btP862g_filtered.json b/annotations_1/R_4_btP862g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6b16a9028e990c3c9262732402617b3fb70b6be --- /dev/null +++ b/annotations_1/R_4_btP862g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.13], [9.0, 9.36], [30.0, 34.92], [39.0, 40.29], [49.0, 49.1], [51.0, 53.89], [56.0, 57.35], [62.0, 66.82], [68.0, 69.31], [80.0, 86.1], [91.0, 91.49], [95.0, 95.35], [96.0, 122.37], [131.0, 131.75], [139.0, 143.6], [149.0, 151.02]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 30.34, 0.0, 0.0, 48.27, 0.0, 35.37, 0.0, 28.95, 0.0, 0.0, 29.36, 0.0, 30.95, 68.67], "audiomae_on_audioset": [null, null, [["music", 35.26], ["buzz", 5.11], ["theremin", 4.71]], null, null, [["music", 63.13], ["hum", 8.75], ["throbbing", 4.74]], null, [["music", 60.97], ["didgeridoo", 8.39], ["speech", 5.49]], null, [["music", 63.6], ["speech", 13.73], ["throbbing", 3.38]], null, null, [["buzz", 26.71], ["speech", 14.15], ["vehicle", 11.04]], null, [["speech", 49.54], ["whack, thwack", 15.64], ["thunk", 4.07]], null], "duration": [1.13, 0.36, 4.92, 1.29, 0.1, 2.89, 1.35, 4.82, 1.31, 6.1, 0.49, 0.35, 26.37, 0.75, 4.6, 2.02]} \ No newline at end of file diff --git a/annotations_1/R_moIp38Fk8_filtered.json b/annotations_1/R_moIp38Fk8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b8383e0113dcde9942d8ca31eedc1573eb11fa9 --- /dev/null +++ b/annotations_1/R_moIp38Fk8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 26.15], [27.0, 36.0], [37.0, 40.81], [43.0, 47.71], [49.0, 49.62], [50.0, 58.14], [62.0, 65.85], [68.0, 72.23], [73.0, 89.9], [92.0, 92.26], [93.0, 94.58], [106.0, 106.46], [107.0, 108.01], [109.0, 109.81], [111.0, 112.89], [115.0, 115.15], [116.0, 118.79], [121.0, 122.18], [123.0, 123.7]], "keep_status": [false, false, true, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.08, 29.96, 30.49, 30.81, 0.0, 30.86, 30.49, 32.74, 31.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.43, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 74.36], ["music", 3.32], ["buzz", 3.23]], [["music", 80.15], ["breaking", 7.29], ["speech", 4.44]], [["music", 25.87], ["gunshot, gunfire", 17.32], ["thump, thud", 6.78]], [["music", 50.8], ["speech", 26.74], ["boing", 4.94]], null, [["music", 31.91], ["throbbing", 14.48], ["sidetone", 13.93]], [["music", 50.66], ["speech", 35.1], ["hum", 1.5]], [["music", 54.46], ["speech", 7.54], ["whip", 4.06]], [["music", 22.95], ["speech", 17.74], ["throbbing", 15.49]], null, null, null, null, null, null, null, null, null, null], "duration": [22.15, 9.0, 3.81, 4.71, 0.62, 8.14, 3.85, 4.23, 16.9, 0.26, 1.58, 0.46, 1.01, 0.81, 1.89, 0.15, 2.79, 1.18, 0.7]} \ No newline at end of file diff --git a/annotations_1/Ra7oqFqj9uU_filtered.json b/annotations_1/Ra7oqFqj9uU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/Ra7oqFqj9uU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/RaicjdiN8ag_filtered.json b/annotations_1/RaicjdiN8ag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b5168145691ac767f66a96348569a840cc44ceb --- /dev/null +++ b/annotations_1/RaicjdiN8ag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.32], [5.0, 5.95], [6.0, 6.78], [14.0, 14.4], [17.0, 18.42], [22.0, 22.08], [28.0, 28.97], [35.0, 37.42], [41.0, 40.71], [42.0, 43.41], [45.0, 45.98], [46.0, 47.12], [50.0, 50.7], [56.0, 56.96], [61.0, 62.21], [66.0, 67.49], [84.0, 83.73], [86.0, 87.83], [93.0, 94.0], [101.0, 100.99], [102.0, 104.67], [109.0, 111.18], [117.0, 118.2], [146.0, 147.23], [148.0, 149.32], [151.0, 152.86], [157.0, 159.88], [160.0, 160.76], [165.0, 165.52], [168.0, 168.37], [170.0, 170.14], [171.0, 171.78], [173.0, 173.91], [175.0, 175.19], [175.0, 175.85], [176.0, 177.8], [179.0, 179.64], [181.0, 183.12], [184.0, 184.15], [188.0, 187.88], [193.0, 193.38], [200.0, 205.63], [206.0, 206.44], [207.0, 220.26]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.13, 36.48, 0.0, 0.0, 0.0, 0.0, 40.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 0.0, 0.0, 39.46, 0.0, 30.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 38.66], ["sidetone", 9.9], ["chirp tone", 7.09]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 18.57], ["echo", 14.72], ["beatboxing", 12.57]], [["beatboxing", 38.21], ["didgeridoo", 14.01], ["music", 11.72]], null, null, null, null, [["speech", 68.2], ["sidetone", 6.72], ["echo", 4.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.82], ["speech", 34.41], ["sidetone", 13.53]], null, [["music", 54.53], ["hum", 8.68], ["throbbing", 8.08]]], "duration": [0.32, 0.95, 0.78, 0.4, 1.42, 0.08, 0.97, 2.42, -0.29, 1.41, 0.98, 1.12, 0.7, 0.96, 1.21, 1.49, -0.27, 1.83, 1.0, -0.01, 2.67, 2.18, 1.2, 1.23, 1.32, 1.86, 2.88, 0.76, 0.52, 0.37, 0.14, 0.78, 0.91, 0.19, 0.85, 1.8, 0.64, 2.12, 0.15, -0.12, 0.38, 5.63, 0.44, 13.26]} \ No newline at end of file diff --git a/annotations_1/RbdGl6wRKDc_filtered.json b/annotations_1/RbdGl6wRKDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ffcc6a75152c51faf0b3a1f46c5bc1f5a00bf03 --- /dev/null +++ b/annotations_1/RbdGl6wRKDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.71], [7.0, 21.49], [22.0, 27.23], [28.0, 28.41], [29.0, 31.87], [33.0, 37.44], [39.0, 50.75], [53.0, 77.8], [79.0, 79.79], [82.0, 92.45], [94.0, 102.36], [103.0, 104.23], [105.0, 130.94], [131.0, 132.33], [133.0, 133.41], [134.0, 137.83], [138.0, 142.15], [144.0, 146.85], [147.0, 150.84], [151.0, 157.1], [158.0, 158.19], [159.0, 159.54], [160.0, 160.44]], "keep_status": [false, false, false, false, true, true, true, false, false, false, true, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.18, 35.57, 0.0, 28.75, 28.48, 29.62, 29.17, 0.0, 28.85, 31.97, 0.0, 33.89, 0.0, 0.0, 33.99, 35.08, 40.88, 35.26, 52.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 65.72], ["synthesizer", 8.22], ["throbbing", 6.46]], [["music", 49.46], ["didgeridoo", 17.09], ["foghorn", 10.43]], null, [["speech", 19.35], ["foghorn", 15.99], ["music", 15.01]], [["hum", 24.57], ["mains hum", 15.6], ["throbbing", 9.51]], [["music", 30.12], ["breaking", 9.8], ["animal", 7.7]], [["music", 43.86], ["whack, thwack", 26.75], ["didgeridoo", 6.64]], null, [["speech", 48.18], ["music", 19.32], ["vehicle", 4.97]], [["speech", 44.56], ["vehicle", 14.23], ["keys jangling", 5.1]], null, [["music", 52.26], ["hum", 10.08], ["theremin", 4.65]], null, null, [["fly, housefly", 12.83], ["insect", 11.68], ["music", 9.52]], [["fly, housefly", 48.99], ["insect", 22.87], ["mains hum", 6.36]], [["fly, housefly", 51.91], ["insect", 31.78], ["mosquito", 8.69]], [["fly, housefly", 48.18], ["insect", 21.37], ["bee, wasp, etc.", 3.1]], null, null, null, null], "duration": [1.71, 14.49, 5.23, 0.41, 2.87, 4.44, 11.75, 24.8, 0.79, 10.45, 8.36, 1.23, 25.94, 1.33, 0.41, 3.83, 4.15, 2.85, 3.84, 6.1, 0.19, 0.54, 0.44]} \ No newline at end of file diff --git a/annotations_1/RbsNzYdNM5I_filtered.json b/annotations_1/RbsNzYdNM5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1ea5b5192fd5f1fce11d2dd7e34b564d3012e7d --- /dev/null +++ b/annotations_1/RbsNzYdNM5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.69], [11.0, 14.08], [18.0, 29.12], [34.0, 48.95], [49.0, 69.87], [71.0, 71.85], [74.0, 80.01], [86.0, 88.55], [91.0, 95.12]], "keep_status": [false, true, true, false, false, false, false, true, true], "silence_prob": [0.0, 35.62, 31.26, 29.76, 29.4, 0.0, 30.45, 29.74, 29.55], "audiomae_on_audioset": [null, [["music", 27.14], ["thunk", 23.43], ["speech", 5.38]], [["music", 16.74], ["whack, thwack", 16.04], ["fly, housefly", 15.44]], [["music", 60.6], ["speech", 23.27], ["boing", 4.29]], [["music", 64.53], ["trombone", 3.88], ["speech", 3.88]], null, [["music", 31.99], ["boing", 29.02], ["throbbing", 12.52]], [["music", 44.53], ["smash, crash", 14.38], ["whack, thwack", 7.49]], [["music", 30.36], ["throbbing", 18.03], ["hum", 12.62]]], "duration": [1.69, 3.08, 11.12, 14.95, 20.87, 0.85, 6.01, 2.55, 4.12]} \ No newline at end of file diff --git a/annotations_1/RcC6K2k6cwk_filtered.json b/annotations_1/RcC6K2k6cwk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d17338984c574b86b67d0ae2e1dbf89d3233d647 --- /dev/null +++ b/annotations_1/RcC6K2k6cwk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 75.41], [78.0, 84.27], [86.0, 104.45], [104.0, 104.5], [105.0, 104.57], [108.0, 109.78], [112.0, 116.85], [119.0, 120.33], [124.0, 127.13], [128.0, 163.56], [165.0, 168.44]], "keep_status": [false, true, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 28.8, 28.91, 0.0, 0.0, 0.0, 29.54, 0.0, 32.23, 0.0, 29.47], "audiomae_on_audioset": [null, [["music", 25.46], ["musical instrument", 4.77], ["didgeridoo", 4.37]], [["music", 60.36], ["didgeridoo", 9.89], ["speech", 8.12]], null, null, null, [["speech", 67.94], ["music", 6.7], ["roar", 4.58]], null, [["music", 38.49], ["mains hum", 3.9], ["rumble", 3.41]], null, [["fart", 25.15], ["groan", 16.75], ["grunt", 16.12]]], "duration": [62.41, 6.27, 18.45, 0.5, -0.43, 1.78, 4.85, 1.33, 3.13, 35.56, 3.44]} \ No newline at end of file diff --git a/annotations_1/RcZo8hHZqkY_filtered.json b/annotations_1/RcZo8hHZqkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97b13d0d4af6d84ef4035a7771e43c66ea80f2c7 --- /dev/null +++ b/annotations_1/RcZo8hHZqkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [4.0, 5.59], [6.0, 7.57], [9.0, 8.77], [9.0, 10.35], [12.0, 12.5], [16.0, 17.51], [19.0, 20.51], [22.0, 22.76], [25.0, 28.34], [30.0, 32.17], [33.0, 34.38], [35.0, 35.78], [36.0, 36.41], [41.0, 41.82], [46.0, 48.29], [50.0, 50.89], [53.0, 53.62], [57.0, 57.89], [59.0, 59.43], [60.0, 61.1], [63.0, 63.0], [65.0, 69.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 97.73, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 50.82], ["hum", 42.25], ["whale vocalization", 0.64]]], "duration": [1.01, 1.59, 1.57, -0.23, 1.35, 0.5, 1.51, 1.51, 0.76, 3.34, 2.17, 1.38, 0.78, 0.41, 0.82, 2.29, 0.89, 0.62, 0.89, 0.43, 1.1, 0.0, 4.53]} \ No newline at end of file diff --git a/annotations_1/RdG9KwpjxA0_filtered.json b/annotations_1/RdG9KwpjxA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aef24770c4d3254ff5e7830c5ac4a28c3e658bce --- /dev/null +++ b/annotations_1/RdG9KwpjxA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 41.74], [43.0, 43.92], [46.0, 50.21], [51.0, 75.14], [76.0, 79.24], [80.0, 81.03], [82.0, 87.2], [97.0, 98.49], [108.0, 109.46], [111.0, 111.62], [112.0, 112.16], [113.0, 113.9], [115.0, 115.13], [116.0, 117.34], [122.0, 122.22], [128.0, 134.76], [137.0, 137.84], [138.0, 139.48], [140.0, 140.44], [150.0, 152.42], [155.0, 163.36]], "keep_status": [true, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [40.29, 0.0, 38.75, 36.97, 35.37, 0.0, 31.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.32, 0.0, 0.0, 0.0, 32.52, 34.36], "audiomae_on_audioset": [[["hum", 48.28], ["throbbing", 13.33], ["whale vocalization", 7.08]], null, [["hum", 44.05], ["mains hum", 23.69], ["speech", 4.09]], [["music", 28.38], ["speech", 26.87], ["mains hum", 3.98]], [["speech", 26.48], ["music", 23.98], ["quack", 13.89]], null, [["speech", 24.03], ["music", 23.78], ["didgeridoo", 18.21]], null, null, null, null, null, null, null, null, [["fart", 41.09], ["speech", 31.75], ["fly, housefly", 4.42]], null, null, null, [["speech", 44.06], ["music", 5.21], ["frog", 1.7]], [["speech", 83.91], ["electric shaver, electric razor", 2.27], ["inside, small room", 1.61]]], "duration": [7.74, 0.92, 4.21, 24.14, 3.24, 1.03, 5.2, 1.49, 1.46, 0.62, 0.16, 0.9, 0.13, 1.34, 0.22, 6.76, 0.84, 1.48, 0.44, 2.42, 8.36]} \ No newline at end of file diff --git a/annotations_1/RdTIzSuw-nI_filtered.json b/annotations_1/RdTIzSuw-nI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ab785b05438ef98da768a045e0efba855b70d46 --- /dev/null +++ b/annotations_1/RdTIzSuw-nI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.49], [13.0, 15.6], [16.0, 16.8], [17.0, 23.19], [25.0, 33.4], [35.0, 61.37], [62.0, 62.72], [63.0, 63.42], [64.0, 68.99], [74.0, 75.81], [77.0, 77.57], [78.0, 80.11]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 51.28, 0.0, 32.68, 31.82, 31.33, 0.0, 0.0, 57.32, 0.0, 0.0, 88.83], "audiomae_on_audioset": [null, null, null, [["music", 27.7], ["speech", 24.07], ["musical instrument", 5.98]], [["music", 41.12], ["speech", 31.37], ["throbbing", 3.61]], [["speech", 20.82], ["mains hum", 9.21], ["music", 7.83]], null, null, null, null, null, null], "duration": [0.49, 2.6, 0.8, 6.19, 8.4, 26.37, 0.72, 0.42, 4.99, 1.81, 0.57, 2.11]} \ No newline at end of file diff --git a/annotations_1/RdpvBc4bahI_filtered.json b/annotations_1/RdpvBc4bahI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..660bd12c5c64a95851e3900dfbe34d30da0f2f44 --- /dev/null +++ b/annotations_1/RdpvBc4bahI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.74], [4.0, 4.94], [5.0, 5.88], [6.0, 6.83], [8.0, 9.53], [10.0, 10.57], [13.0, 13.34], [15.0, 15.72], [17.0, 17.22], [18.0, 17.93], [19.0, 19.52], [20.0, 44.79], [46.0, 46.31], [47.0, 47.48], [49.0, 53.01], [55.0, 55.58], [56.0, 60.89], [62.0, 62.43], [65.0, 77.84], [79.0, 80.54], [82.0, 84.05], [86.0, 86.95], [88.0, 89.04], [92.0, 98.02], [99.0, 99.67], [100.0, 104.46], [105.0, 109.36], [119.0, 129.91], [130.0, 131.72], [136.0, 136.93], [139.0, 139.36], [143.0, 143.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.8, 0.0, 0.0, 85.35, 0.0, 68.67, 0.0, 94.07, 0.0, 99.95, 0.0, 0.0, 97.54, 0.0, 98.73, 34.29, 28.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["animal", 13.21], ["sine wave", 12.03], ["dial tone", 5.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.71], ["dial tone", 18.36], ["sidetone", 13.56]], [["cattle, bovinae", 34.76], ["livestock, farm animals, working animals", 32.95], ["moo", 28.98]], null, null, null, null], "duration": [1.74, 0.94, 0.88, 0.83, 1.53, 0.57, 0.34, 0.72, 0.22, -0.07, 0.52, 24.79, 0.31, 0.48, 4.01, 0.58, 4.89, 0.43, 12.84, 1.54, 2.05, 0.95, 1.04, 6.02, 0.67, 4.46, 4.36, 10.91, 1.72, 0.93, 0.36, 0.43]} \ No newline at end of file diff --git a/annotations_1/Rfl2M8B9WA8_filtered.json b/annotations_1/Rfl2M8B9WA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..181d2ac6c29dbdee4048e26512316be323ee1ee9 --- /dev/null +++ b/annotations_1/Rfl2M8B9WA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.75], [10.0, 12.41], [14.0, 15.9], [17.0, 17.09], [18.0, 17.69], [20.0, 20.22], [22.0, 21.78], [38.0, 40.41], [42.0, 42.94], [46.0, 47.46], [50.0, 52.35], [53.0, 53.97], [55.0, 57.97], [59.0, 60.03], [61.0, 62.38], [68.0, 68.64], [71.0, 71.09], [72.0, 74.07], [84.0, 83.88], [84.0, 90.95], [91.0, 91.27], [91.0, 91.34], [99.0, 99.87], [105.0, 105.48], [108.0, 108.84], [111.0, 113.61], [117.0, 116.9], [118.0, 122.77], [125.0, 127.7], [128.0, 128.16], [129.0, 128.66], [129.0, 128.71], [129.0, 129.44], [130.0, 131.8], [136.0, 136.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 64.86, 0.0, 0.0, 73.21, 0.0, 89.72, 0.0, 0.0, 0.0, 0.0, 53.59, 0.0, 41.62, 0.0, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 45.24, 55.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.06], ["speech", 24.78], ["sidetone", 4.72]], null, null, null, null, null, null, null, [["music", 45.31], ["speech", 9.7], ["didgeridoo", 6.75]], null, null, null, null, null, null, null], "duration": [0.75, 2.41, 1.9, 0.09, -0.31, 0.22, -0.22, 2.41, 0.94, 1.46, 2.35, 0.97, 2.97, 1.03, 1.38, 0.64, 0.09, 2.07, -0.12, 6.95, 0.27, 0.34, 0.87, 0.48, 0.84, 2.61, -0.1, 4.77, 2.7, 0.16, -0.34, -0.29, 0.44, 1.8, 0.48]} \ No newline at end of file diff --git a/annotations_1/RgPuswoKZtw_filtered.json b/annotations_1/RgPuswoKZtw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9a06f76024e181d4dcda3323954d7af17d9815e --- /dev/null +++ b/annotations_1/RgPuswoKZtw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.16], [16.0, 16.55], [18.0, 18.64], [22.0, 23.58], [24.0, 24.46], [25.0, 25.47], [27.0, 30.16], [31.0, 31.35], [34.0, 33.66], [42.0, 43.23], [44.0, 45.12], [52.0, 52.08], [57.0, 57.79], [60.0, 60.45], [65.0, 65.01], [78.0, 86.75], [88.0, 93.29], [95.0, 96.25], [97.0, 97.98], [100.0, 101.06], [102.0, 102.57], [105.0, 105.71], [107.0, 109.78], [110.0, 110.67], [113.0, 113.66], [116.0, 124.02]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.02, 34.57, 0.0, 0.0, 0.0, 0.0, 0.0, 32.09, 0.0, 0.0, 36.68], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 36.48], ["music", 20.76], ["didgeridoo", 6.92]], null, null, null, null, null, null, null, null, [["music", 74.29], ["throbbing", 7.05], ["hum", 4.47]], [["music", 53.23], ["hum", 8.66], ["speech", 8.66]], null, null, null, null, null, [["speech", 35.41], ["livestock, farm animals, working animals", 12.24], ["whale vocalization", 7.08]], null, null, [["music", 37.48], ["throbbing", 21.98], ["speech", 15.29]]], "duration": [1.16, 0.55, 0.64, 1.58, 0.46, 0.47, 3.16, 0.35, -0.34, 1.23, 1.12, 0.08, 0.79, 0.45, 0.01, 8.75, 5.29, 1.25, 0.98, 1.06, 0.57, 0.71, 2.78, 0.67, 0.66, 8.02]} \ No newline at end of file diff --git a/annotations_1/RgubwsCVg1o_filtered.json b/annotations_1/RgubwsCVg1o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..382b8834eaf04912bd7e859d5caddb39dd161117 --- /dev/null +++ b/annotations_1/RgubwsCVg1o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [11.0, 16.29], [17.0, 17.2], [18.0, 18.13], [19.0, 18.55], [19.0, 18.94], [20.0, 21.68], [33.0, 34.08], [39.0, 39.7], [40.0, 91.44], [94.0, 107.11], [109.0, 109.26], [112.0, 114.08], [118.0, 119.31], [124.0, 138.91], [139.0, 139.77], [141.0, 145.76], [147.0, 149.59], [156.0, 155.97], [158.0, 160.56], [161.0, 162.4], [174.0, 174.99]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 43.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.17, 0.0, 38.35, 0.0, 31.02, 0.0, 40.28, 36.91, 0.0, 32.98, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 26.18], ["mains hum", 15.67], ["music", 13.67]], null, null, null, null, null, null, null, null, [["music", 50.93], ["smash, crash", 18.18], ["whack, thwack", 8.19]], null, [["speech", 61.09], ["music", 18.05], ["crow", 2.48]], null, [["music", 36.31], ["mains hum", 26.87], ["hum", 19.69]], null, [["speech", 81.63], ["grunt", 2.6], ["caw", 1.93]], [["fly, housefly", 10.87], ["livestock, farm animals, working animals", 10.1], ["music", 9.91]], null, [["speech", 36.59], ["music", 4.72], ["inside, small room", 2.97]], null, null], "duration": [0.35, 5.29, 0.2, 0.13, -0.45, -0.06, 1.68, 1.08, 0.7, 51.44, 13.11, 0.26, 2.08, 1.31, 14.91, 0.77, 4.76, 2.59, -0.03, 2.56, 1.4, 0.99]} \ No newline at end of file diff --git a/annotations_1/RjDv_swo0rY_filtered.json b/annotations_1/RjDv_swo0rY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..214b00b30205a00c06ca72d55c8e38292e6fc286 --- /dev/null +++ b/annotations_1/RjDv_swo0rY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.78], [8.0, 7.55], [10.0, 11.08], [14.0, 15.38], [18.0, 18.71], [20.0, 21.69], [23.0, 23.82], [27.0, 29.24], [34.0, 35.67], [40.0, 40.44], [49.0, 51.88], [53.0, 81.36], [85.0, 85.55], [88.0, 89.24]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.46, 0.0, 0.0, 38.03, 29.41, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 32.65], ["throbbing", 18.71], ["rumble", 7.28]], null, null, [["hum", 42.59], ["mains hum", 24.33], ["speech", 9.34]], [["music", 68.53], ["musical instrument", 5.05], ["swing music", 2.83]], null, null], "duration": [0.78, -0.45, 1.08, 1.38, 0.71, 1.69, 0.82, 2.24, 1.67, 0.44, 2.88, 28.36, 0.55, 1.24]} \ No newline at end of file diff --git a/annotations_1/RmEZwxFSsWE_filtered.json b/annotations_1/RmEZwxFSsWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c1faffef3374d0cc2c9cd00b93b639d201827e1 --- /dev/null +++ b/annotations_1/RmEZwxFSsWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.67], [44.0, 44.56], [47.0, 47.83], [51.0, 50.97], [63.0, 67.14], [67.0, 67.91], [69.0, 69.72], [77.0, 78.06], [83.0, 91.74], [111.0, 111.67], [115.0, 114.94], [128.0, 130.22], [131.0, 130.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 46.86, 0.0, 0.0, 0.0, 37.05, 0.0, 0.0, 62.99, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 62.09], ["boing", 9.21], ["musical instrument", 3.53]], null, null, null, [["music", 56.37], ["speech", 21.77], ["guitar", 4.24]], null, null, null, null], "duration": [0.67, 0.56, 0.83, -0.03, 4.14, 0.91, 0.72, 1.06, 8.74, 0.67, -0.06, 2.22, -0.02]} \ No newline at end of file diff --git a/annotations_1/RmkFsYUz4cs_filtered.json b/annotations_1/RmkFsYUz4cs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a85fc297152dfb0302180d779427a3bfbb0a2124 --- /dev/null +++ b/annotations_1/RmkFsYUz4cs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 18.32], [19.0, 19.95], [21.0, 25.32], [26.0, 27.33], [28.0, 28.38], [30.0, 31.19], [39.0, 40.86], [43.0, 44.85], [48.0, 49.47], [50.0, 51.14], [55.0, 57.27], [60.0, 61.84], [70.0, 72.86], [74.0, 75.17], [77.0, 77.3], [91.0, 91.61], [96.0, 96.13], [100.0, 102.81], [108.0, 115.57], [116.0, 116.24], [119.0, 122.64], [124.0, 137.46], [139.0, 139.6], [141.0, 141.4], [142.0, 144.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [55.04, 0.0, 99.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 40.22, 31.92, 0.0, 31.28, 30.68, 0.0, 0.0, 56.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.57], ["bass guitar", 5.58], ["electric shaver, electric razor", 4.11]], [["livestock, farm animals, working animals", 21.37], ["music", 17.27], ["cattle, bovinae", 15.7]], null, [["moo", 48.17], ["cattle, bovinae", 39.27], ["livestock, farm animals, working animals", 11.9]], [["music", 79.91], ["fireworks", 4.13], ["cacophony", 1.63]], null, null, null], "duration": [5.32, 0.95, 4.32, 1.33, 0.38, 1.19, 1.86, 1.85, 1.47, 1.14, 2.27, 1.84, 2.86, 1.17, 0.3, 0.61, 0.13, 2.81, 7.57, 0.24, 3.64, 13.46, 0.6, 0.4, 2.05]} \ No newline at end of file diff --git a/annotations_1/RmxqK1np7rY_filtered.json b/annotations_1/RmxqK1np7rY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69ff3e9fef71ff2093065ded9a308e376f843bdf --- /dev/null +++ b/annotations_1/RmxqK1np7rY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 17.37], [18.0, 35.13], [35.0, 46.36], [47.0, 67.42], [68.0, 69.21], [70.0, 71.19], [72.0, 72.45], [77.0, 78.54], [82.0, 84.11], [85.0, 88.03], [90.0, 92.2], [97.0, 100.06], [102.0, 103.15], [104.0, 105.53], [110.0, 111.21], [114.0, 115.25], [116.0, 117.61], [119.0, 123.62], [130.0, 132.68], [133.0, 134.92], [137.0, 139.11], [140.0, 142.87], [145.0, 144.83], [146.0, 150.92], [152.0, 153.05], [153.0, 157.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.78, 86.27, 99.48, 99.99, 0.0, 0.0, 0.0, 0.0, 100.0, 99.98, 99.9, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 100.0, 0.0, 99.94, 98.73, 0.0, 68.93, 0.0, 82.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.37, 17.13, 11.36, 20.42, 1.21, 1.19, 0.45, 1.54, 2.11, 3.03, 2.2, 3.06, 1.15, 1.53, 1.21, 1.25, 1.61, 4.62, 2.68, 1.92, 2.11, 2.87, -0.17, 4.92, 1.05, 4.89]} \ No newline at end of file diff --git a/annotations_1/Rn0Qk4aHYfs_filtered.json b/annotations_1/Rn0Qk4aHYfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9d091a55aeca9cd5add0d7e13e1f156be3bc835 --- /dev/null +++ b/annotations_1/Rn0Qk4aHYfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [13.0, 13.39], [14.0, 20.83], [27.0, 56.12], [62.0, 61.87], [63.0, 90.66]], "keep_status": [false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 37.3, 31.34, 0.0, 30.87], "audiomae_on_audioset": [null, null, [["mains hum", 24.25], ["hum", 21.81], ["electric shaver, electric razor", 13.97]], [["music", 31.95], ["speech", 10.55], ["hum", 10.45]], null, [["speech", 46.56], ["music", 12.13], ["explosion", 9.72]]], "duration": [0.56, 0.39, 6.83, 29.12, -0.13, 27.66]} \ No newline at end of file diff --git a/annotations_1/Rp8A7gf0dZ8_filtered.json b/annotations_1/Rp8A7gf0dZ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9bacdde4d2d617f026010533d2b1b339428b7ed --- /dev/null +++ b/annotations_1/Rp8A7gf0dZ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.51], [6.0, 6.99], [8.0, 9.12], [11.0, 18.77], [20.0, 24.07], [27.0, 29.76], [33.0, 36.22], [55.0, 55.86], [59.0, 59.48], [60.0, 63.61], [64.0, 74.63], [77.0, 77.58], [80.0, 80.23], [82.0, 106.61], [112.0, 164.94]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 31.65, 35.88, 36.37, 31.04, 0.0, 0.0, 31.43, 30.96, 0.0, 0.0, 31.83, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 39.29], ["cattle, bovinae", 24.41], ["moo", 20.12]], [["music", 66.27], ["didgeridoo", 6.06], ["throbbing", 4.53]], [["music", 46.52], ["speech", 15.45], ["boing", 3.1]], [["music", 45.32], ["didgeridoo", 19.06], ["sidetone", 13.88]], null, null, [["music", 50.73], ["sidetone", 10.52], ["speech", 6.19]], [["music", 51.69], ["speech", 13.2], ["throbbing", 7.77]], null, null, [["hum", 40.81], ["throbbing", 15.91], ["music", 12.03]], null], "duration": [1.51, 0.99, 1.12, 7.77, 4.07, 2.76, 3.22, 0.86, 0.48, 3.61, 10.63, 0.58, 0.23, 24.61, 52.94]} \ No newline at end of file diff --git a/annotations_1/Rpt-fbpiTU8_filtered.json b/annotations_1/Rpt-fbpiTU8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a23a6759b44d7a4899f3015010c57749ab83c0e --- /dev/null +++ b/annotations_1/Rpt-fbpiTU8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.37], [6.0, 6.24], [12.0, 12.31], [37.0, 37.76], [63.0, 63.12], [65.0, 67.59], [72.0, 72.6], [78.0, 78.6], [81.0, 81.03], [81.0, 81.13], [89.0, 90.19], [92.0, 92.53], [102.0, 102.36], [104.0, 104.73], [108.0, 109.31], [111.0, 116.92], [117.0, 121.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.73, 58.05], "audiomae_on_audioset": [null, null, null, null, null, [["thunk", 38.51], ["speech", 26.58], ["whack, thwack", 12.75]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.37, 0.24, 0.31, 0.76, 0.12, 2.59, 0.6, 0.6, 0.03, 0.13, 1.19, 0.53, 0.36, 0.73, 1.31, 5.92, 4.95]} \ No newline at end of file diff --git a/annotations_1/Rq3xZDyJtMk_filtered.json b/annotations_1/Rq3xZDyJtMk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8700258e67479f685291a1316cf208790b83bcc6 --- /dev/null +++ b/annotations_1/Rq3xZDyJtMk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.19], [6.0, 7.69], [18.0, 20.46], [30.0, 30.64], [32.0, 32.37], [41.0, 40.81], [50.0, 49.94], [52.0, 52.37], [59.0, 59.36], [75.0, 80.2]], "keep_status": [true, false, false, false, false, false, false, false, false, true], "silence_prob": [45.18, 0.0, 39.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.49], "audiomae_on_audioset": [[["speech", 17.83], ["animal", 7.85], ["hum", 7.55]], null, [["speech", 68.03], ["hum", 5.58], ["fly, housefly", 3.27]], null, null, null, null, null, null, [["music", 37.89], ["theremin", 15.26], ["speech", 7.96]]], "duration": [2.19, 1.69, 2.46, 0.64, 0.37, -0.19, -0.06, 0.37, 0.36, 5.2]} \ No newline at end of file diff --git a/annotations_1/RsJmRjseSzo_filtered.json b/annotations_1/RsJmRjseSzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..462d7411793c65e4e3437435da21f1a2bd737bbc --- /dev/null +++ b/annotations_1/RsJmRjseSzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.13], [25.0, 27.72], [37.0, 37.54], [40.0, 40.63], [41.0, 41.0], [41.0, 41.25], [45.0, 49.87], [50.0, 49.91], [50.0, 49.99], [55.0, 57.6], [61.0, 62.73], [70.0, 98.15], [100.0, 100.21], [102.0, 102.37], [104.0, 104.94], [106.0, 106.17], [108.0, 113.24]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false], "silence_prob": [51.82, 54.83, 0.0, 0.0, 0.0, 0.0, 38.1, 0.0, 0.0, 42.28, 0.0, 35.13, 0.0, 0.0, 0.0, 0.0, 28.92], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 21.02], ["music", 17.37], ["mains hum", 15.81]], null, null, [["hum", 27.28], ["mains hum", 13.92], ["throbbing", 12.58]], null, [["music", 18.12], ["hum", 17.58], ["mains hum", 16.91]], null, null, null, null, [["speech", 63.71], ["vehicle", 11.88], ["outside, urban or manmade", 2.46]]], "duration": [3.13, 2.72, 0.54, 0.63, 0.0, 0.25, 4.87, -0.09, -0.01, 2.6, 1.73, 28.15, 0.21, 0.37, 0.94, 0.17, 5.24]} \ No newline at end of file diff --git a/annotations_1/RsSltFwkLPE_filtered.json b/annotations_1/RsSltFwkLPE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9679c7cc033c3c81a01f24414ddcec0543aaba61 --- /dev/null +++ b/annotations_1/RsSltFwkLPE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 62.78], [64.0, 79.02], [83.0, 83.69]], "keep_status": [true, false, false], "silence_prob": [35.8, 77.03, 0.0], "audiomae_on_audioset": [[["thunk", 60.75], ["door", 4.92], ["arrow", 3.97]], null, null], "duration": [20.78, 15.02, 0.69]} \ No newline at end of file diff --git a/annotations_1/Rt3u4bU6EMU_filtered.json b/annotations_1/Rt3u4bU6EMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e77e9ab933710d2798aa0e4001e7b546f28e5d6 --- /dev/null +++ b/annotations_1/Rt3u4bU6EMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.56], [9.0, 12.09], [16.0, 15.82], [19.0, 20.75], [26.0, 26.74], [28.0, 28.68], [33.0, 33.52], [37.0, 36.96], [42.0, 44.54], [45.0, 50.14], [52.0, 56.3], [58.0, 57.94], [62.0, 82.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.07, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.97, 95.51, 0.0, 30.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 51.65], ["hum", 37.89], ["speech", 3.98]]], "duration": [2.56, 3.09, -0.18, 1.75, 0.74, 0.68, 0.52, -0.04, 2.54, 5.14, 4.3, -0.06, 20.73]} \ No newline at end of file diff --git a/annotations_1/RtRffVRFz6M_filtered.json b/annotations_1/RtRffVRFz6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7742e18acc093234b88d0e41caf560af03ae767 --- /dev/null +++ b/annotations_1/RtRffVRFz6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.29], [11.0, 12.18], [14.0, 14.5], [16.0, 20.46], [22.0, 23.09], [25.0, 26.38], [27.0, 32.29], [40.0, 41.03], [50.0, 49.84], [55.0, 93.63], [97.0, 126.18], [127.0, 136.11], [152.0, 153.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 53.59, 0.0, 0.0, 0.0, 32.86, 43.3, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 19.47], ["speech", 15.86], ["whack, thwack", 15.47]], [["music", 26.38], ["hum", 12.67], ["synthesizer", 10.93]], null], "duration": [0.29, 1.18, 0.5, 4.46, 1.09, 1.38, 5.29, 1.03, -0.16, 38.63, 29.18, 9.11, 1.15]} \ No newline at end of file diff --git a/annotations_1/RtxMw4sua3Q_filtered.json b/annotations_1/RtxMw4sua3Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec4dcb0ca3ae1dc3a024bc110bec7e330916641c --- /dev/null +++ b/annotations_1/RtxMw4sua3Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 54.65], [63.0, 63.21], [64.0, 68.44], [70.0, 98.64], [100.0, 102.39]], "keep_status": [false, false, true, false, true], "silence_prob": [0.0, 0.0, 29.93, 30.1, 31.21], "audiomae_on_audioset": [null, null, [["music", 33.72], ["speech", 17.36], ["hum", 9.77]], [["music", 78.89], ["electronic music", 3.98], ["sound effect", 3.26]], [["music", 21.9], ["throbbing", 14.34], ["vehicle", 9.61]]], "duration": [1.65, 0.21, 4.44, 28.64, 2.39]} \ No newline at end of file diff --git a/annotations_1/RuFd7DELPYc_filtered.json b/annotations_1/RuFd7DELPYc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e7a7aa9b92e32811bd33a8651900cc73ed90492 --- /dev/null +++ b/annotations_1/RuFd7DELPYc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 20.21], [20.0, 21.93], [25.0, 33.71], [35.0, 67.19], [68.0, 74.7], [81.0, 89.51], [90.0, 105.14], [108.0, 114.84], [118.0, 122.3], [123.0, 127.72]], "keep_status": [true, false, false, false, true, false, false, true, false, false], "silence_prob": [34.18, 0.0, 30.31, 0.0, 30.79, 30.01, 29.94, 36.55, 85.17, 92.15], "audiomae_on_audioset": [[["music", 24.54], ["sidetone", 19.12], ["siren", 11.12]], null, [["music", 75.4], ["electronic music", 4.79], ["speech", 1.21]], null, [["music", 56.24], ["electronic music", 8.11], ["throbbing", 3.71]], [["music", 77.58], ["electronic music", 2.38], ["speech", 2.17]], [["music", 52.39], ["throbbing", 16.95], ["hum", 6.92]], [["speech", 25.36], ["hum", 14.33], ["buzz", 9.5]], null, null], "duration": [3.21, 1.93, 8.71, 32.19, 6.7, 8.51, 15.14, 6.84, 4.3, 4.72]} \ No newline at end of file diff --git a/annotations_1/RuOjVbqLiZU_filtered.json b/annotations_1/RuOjVbqLiZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7bde3cbae42afdfcb65d34ddd56c3f68a3d2014 --- /dev/null +++ b/annotations_1/RuOjVbqLiZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.45], [5.0, 4.78], [7.0, 8.95], [12.0, 13.96], [15.0, 17.04], [25.0, 26.33], [27.0, 27.36], [28.0, 28.53], [35.0, 35.61], [44.0, 45.03], [51.0, 51.85], [53.0, 53.05], [58.0, 59.24], [61.0, 62.63], [63.0, 64.17], [66.0, 66.61], [74.0, 75.76], [78.0, 80.52], [95.0, 95.61], [96.0, 96.85], [97.0, 97.6], [98.0, 99.18], [108.0, 111.57], [112.0, 112.5], [113.0, 113.14], [113.0, 117.36], [121.0, 121.71], [122.0, 125.42], [127.0, 127.14], [127.0, 128.29], [129.0, 130.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 53.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.69, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 0.0, 49.54, 0.0, 42.96, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.72], ["cattle, bovinae", 22.76], ["moo", 20.92]], null, null, null, null, null, null, null, [["mains hum", 25.56], ["hum", 15.71], ["fly, housefly", 11.61]], null, [["music", 63.58], ["guitar", 11.81], ["musical instrument", 10.07]], null, null, null], "duration": [0.45, -0.22, 1.95, 1.96, 2.04, 1.33, 0.36, 0.53, 0.61, 1.03, 0.85, 0.05, 1.24, 1.63, 1.17, 0.61, 1.76, 2.52, 0.61, 0.85, 0.6, 1.18, 3.57, 0.5, 0.14, 4.36, 0.71, 3.42, 0.14, 1.29, 1.11]} \ No newline at end of file diff --git a/annotations_1/Ru_KziPyopw_filtered.json b/annotations_1/Ru_KziPyopw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d628bb60a115c83ddb3971204b391f123e0bbddc --- /dev/null +++ b/annotations_1/Ru_KziPyopw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.39], [8.0, 12.92], [17.0, 22.03], [24.0, 35.8], [38.0, 45.3], [52.0, 53.87], [60.0, 62.6], [67.0, 71.9], [76.0, 76.38], [78.0, 83.12], [86.0, 88.21], [90.0, 92.4], [99.0, 102.61], [107.0, 109.68], [115.0, 114.98], [116.0, 117.46], [134.0, 134.76], [138.0, 140.0], [148.0, 150.06], [157.0, 162.19], [171.0, 171.36], [174.0, 174.97]], "keep_status": [true, false, true, false, false, false, true, false, false, false, true, true, true, true, false, false, false, false, false, false, false, false], "silence_prob": [41.42, 33.12, 33.08, 32.01, 33.12, 0.0, 38.84, 33.29, 0.0, 33.93, 38.87, 40.9, 34.56, 39.18, 0.0, 0.0, 0.0, 52.62, 64.97, 37.2, 0.0, 0.0], "audiomae_on_audioset": [[["music", 61.06], ["musical instrument", 3.01], ["glockenspiel", 2.41]], [["music", 43.79], ["speech", 24.72], ["musical instrument", 5.13]], [["music", 35.46], ["fart", 24.66], ["didgeridoo", 5.54]], [["music", 50.39], ["theremin", 14.04], ["didgeridoo", 9.27]], [["music", 70.53], ["didgeridoo", 1.84], ["zither", 1.74]], null, [["music", 47.38], ["boing", 4.23], ["didgeridoo", 3.93]], [["music", 73.15], ["zither", 3.12], ["singing", 2.18]], null, [["music", 72.91], ["bass guitar", 2.46], ["didgeridoo", 2.42]], [["music", 36.33], ["speech", 10.86], ["guitar", 10.78]], [["music", 35.82], ["mains hum", 7.23], ["hum", 6.51]], [["music", 40.78], ["livestock, farm animals, working animals", 5.84], ["guitar", 5.01]], [["music", 56.69], ["fly, housefly", 4.42], ["guitar", 2.81]], null, null, null, null, null, [["music", 43.01], ["speech", 28.53], ["foghorn", 4.25]], null, null], "duration": [2.39, 4.92, 5.03, 11.8, 7.3, 1.87, 2.6, 4.9, 0.38, 5.12, 2.21, 2.4, 3.61, 2.68, -0.02, 1.46, 0.76, 2.0, 2.06, 5.19, 0.36, 0.97]} \ No newline at end of file diff --git a/annotations_1/RwMgEM9FNhE_filtered.json b/annotations_1/RwMgEM9FNhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71ea2aac671fbd494c81fddf87d6f1b45fdf4b61 --- /dev/null +++ b/annotations_1/RwMgEM9FNhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.0], [6.0, 8.48], [11.0, 11.72], [14.0, 15.47], [17.0, 22.45], [24.0, 24.54], [26.0, 26.74], [27.0, 29.2], [32.0, 32.31], [36.0, 47.11], [49.0, 51.46], [54.0, 55.78], [58.0, 58.62], [61.0, 62.29], [64.0, 64.49], [66.0, 66.8], [70.0, 70.31], [72.0, 77.01], [80.0, 79.62], [82.0, 82.9], [86.0, 87.88], [92.0, 92.18], [93.0, 93.82], [95.0, 95.72], [111.0, 114.25]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 31.55, 0.0, 0.0, 34.57, 0.0, 0.0, 62.27, 0.0, 34.22, 53.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.47], "audiomae_on_audioset": [null, [["speech", 36.11], ["music", 7.94], ["echo", 5.73]], null, null, [["speech", 50.0], ["telephone", 7.85], ["radio", 4.19]], null, null, null, null, [["speech", 78.75], ["fart", 7.86], ["radio", 2.04]], null, null, null, null, null, null, null, [["boing", 14.53], ["speech", 13.09], ["animal", 7.35]], null, null, null, null, null, null, [["noise", 11.88], ["roar", 10.47], ["boing", 6.81]]], "duration": [0.0, 2.48, 0.72, 1.47, 5.45, 0.54, 0.74, 2.2, 0.31, 11.11, 2.46, 1.78, 0.62, 1.29, 0.49, 0.8, 0.31, 5.01, -0.38, 0.9, 1.88, 0.18, 0.82, 0.72, 3.25]} \ No newline at end of file diff --git a/annotations_1/RxEkm4dDAL4_filtered.json b/annotations_1/RxEkm4dDAL4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01b1e2a6b20c528de1f2facbb1d349993dc6a884 --- /dev/null +++ b/annotations_1/RxEkm4dDAL4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.3], [3.0, 18.03], [20.0, 23.55], [25.0, 25.2], [27.0, 27.13], [29.0, 30.89], [33.0, 33.45], [35.0, 61.53], [66.0, 66.78], [76.0, 76.01], [80.0, 82.8], [98.0, 104.36], [105.0, 105.95], [106.0, 108.23], [112.0, 113.81], [115.0, 117.34], [118.0, 132.98], [134.0, 135.53], [137.0, 138.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 76.86, 99.92, 0.0, 0.0, 0.0, 0.0, 54.04, 0.0, 0.0, 54.23, 56.1, 0.0, 75.23, 0.0, 88.83, 99.31, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 15.03, 3.55, 0.2, 0.13, 1.89, 0.45, 26.53, 0.78, 0.01, 2.8, 6.36, 0.95, 2.23, 1.81, 2.34, 14.98, 1.53, 1.37]} \ No newline at end of file diff --git a/annotations_1/RxLb-Iqyqps_filtered.json b/annotations_1/RxLb-Iqyqps_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82386e88a0f540fb367200575699f4c08a02a349 --- /dev/null +++ b/annotations_1/RxLb-Iqyqps_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.9], [7.0, 7.86], [9.0, 12.29], [12.0, 13.31], [16.0, 19.14], [21.0, 22.55], [24.0, 36.27], [37.0, 38.94], [41.0, 49.44], [51.0, 51.21], [52.0, 53.01], [55.0, 55.86], [58.0, 60.03], [62.0, 62.63], [65.0, 67.46], [69.0, 73.28], [74.0, 76.59], [78.0, 80.27], [81.0, 81.87], [84.0, 85.67], [86.0, 87.3], [88.0, 91.2], [92.0, 92.97], [95.0, 95.86], [97.0, 98.86], [100.0, 102.29], [102.0, 106.54], [108.0, 110.59], [112.0, 115.13], [116.0, 117.64], [119.0, 120.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.01, 0.0, 97.22, 0.0, 99.94, 0.0, 97.64, 0.0, 96.89, 0.0, 0.0, 0.0, 100.0, 0.0, 72.31, 99.95, 95.51, 100.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 99.99, 98.1, 99.52, 99.99, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.9, 0.86, 3.29, 1.31, 3.14, 1.55, 12.27, 1.94, 8.44, 0.21, 1.01, 0.86, 2.03, 0.63, 2.46, 4.28, 2.59, 2.27, 0.87, 1.67, 1.3, 3.2, 0.97, 0.86, 1.86, 2.29, 4.54, 2.59, 3.13, 1.64, 1.48]} \ No newline at end of file diff --git a/annotations_1/RxwUv1BcPwg_filtered.json b/annotations_1/RxwUv1BcPwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..019087ab928458c8d7ff71daba7fceef43512a54 --- /dev/null +++ b/annotations_1/RxwUv1BcPwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 16.39], [17.0, 28.66], [33.0, 32.85], [35.0, 55.92], [60.0, 65.42], [70.0, 70.16], [72.0, 73.62], [75.0, 75.42], [81.0, 87.66], [92.0, 97.44], [98.0, 97.83], [99.0, 108.09]], "keep_status": [true, true, false, false, true, false, false, false, true, true, false, false], "silence_prob": [31.65, 34.16, 0.0, 31.33, 29.64, 0.0, 0.0, 0.0, 34.73, 31.13, 0.0, 32.32], "audiomae_on_audioset": [[["music", 51.2], ["musical instrument", 4.78], ["scary music", 3.27]], [["music", 45.86], ["brass instrument", 12.06], ["trombone", 7.31]], null, [["speech", 50.36], ["music", 19.69], ["vehicle", 8.53]], [["hum", 20.34], ["music", 16.67], ["mains hum", 10.14]], null, null, null, [["speech", 38.18], ["hum", 15.28], ["mains hum", 9.62]], [["speech", 33.5], ["vehicle", 14.76], ["car", 14.44]], null, [["speech", 60.08], ["music", 10.74], ["vehicle", 4.87]]], "duration": [6.39, 11.66, -0.15, 20.92, 5.42, 0.16, 1.62, 0.42, 6.66, 5.44, -0.17, 9.09]} \ No newline at end of file diff --git a/annotations_1/RxyMbaDX22g_filtered.json b/annotations_1/RxyMbaDX22g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..241505379aa28b41123d95136bde787493823034 --- /dev/null +++ b/annotations_1/RxyMbaDX22g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.05], [8.0, 9.41], [12.0, 13.63], [17.0, 20.43], [25.0, 29.29], [31.0, 31.14], [32.0, 40.78], [43.0, 44.66], [46.0, 46.95], [52.0, 53.5], [55.0, 55.53], [57.0, 72.71], [77.0, 77.72], [82.0, 83.57], [85.0, 89.55], [92.0, 100.47], [104.0, 112.45], [114.0, 117.81], [118.0, 121.0], [122.0, 122.4], [125.0, 126.98]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, true, false, false, true, false, false, true, false, false, false], "silence_prob": [31.05, 0.0, 0.0, 34.3, 38.54, 0.0, 29.76, 0.0, 0.0, 0.0, 0.0, 29.47, 0.0, 0.0, 32.21, 30.22, 32.73, 31.97, 40.61, 0.0, 0.0], "audiomae_on_audioset": [[["music", 32.21], ["throbbing", 20.8], ["hum", 6.11]], null, null, [["music", 57.85], ["speech", 7.87], ["electronic music", 4.74]], [["music", 50.51], ["synthesizer", 8.44], ["speech", 6.42]], null, [["mosquito", 24.66], ["music", 20.75], ["fly, housefly", 19.3]], null, null, null, null, [["music", 45.65], ["speech", 13.0], ["throbbing", 5.39]], null, null, [["music", 34.89], ["whack, thwack", 20.44], ["sound effect", 7.4]], [["music", 64.0], ["synthesizer", 7.83], ["theremin", 5.27]], [["music", 60.42], ["whack, thwack", 10.05], ["didgeridoo", 4.56]], [["music", 34.92], ["speech", 24.91], ["whack, thwack", 5.55]], [["music", 41.18], ["speech", 37.12], ["quack", 1.76]], null, null], "duration": [2.05, 1.41, 1.63, 3.43, 4.29, 0.14, 8.78, 1.66, 0.95, 1.5, 0.53, 15.71, 0.72, 1.57, 4.55, 8.47, 8.45, 3.81, 3.0, 0.4, 1.98]} \ No newline at end of file diff --git a/annotations_1/RyZ-saoiIzY_filtered.json b/annotations_1/RyZ-saoiIzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a39aa155c1ccb7d6f1aa4723a846cb0608c60572 --- /dev/null +++ b/annotations_1/RyZ-saoiIzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 20.49], [22.0, 21.78], [23.0, 24.98], [27.0, 27.87], [31.0, 34.28], [36.0, 76.28], [84.0, 154.03], [156.0, 174.38]], "keep_status": [true, false, false, false, true, false, false, false], "silence_prob": [29.6, 0.0, 0.0, 0.0, 32.02, 0.0, 0.0, 29.43], "audiomae_on_audioset": [[["electric shaver, electric razor", 22.87], ["mains hum", 17.53], ["hum", 14.29]], null, null, null, [["speech", 24.48], ["hum", 20.53], ["throbbing", 18.76]], null, null, [["livestock, farm animals, working animals", 47.41], ["cattle, bovinae", 19.12], ["moo", 9.07]]], "duration": [12.49, -0.22, 1.98, 0.87, 3.28, 40.28, 70.03, 18.38]} \ No newline at end of file diff --git a/annotations_1/RybQmyBoWEQ_filtered.json b/annotations_1/RybQmyBoWEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7e734fbec45490edee18155f61482a3fef8366a --- /dev/null +++ b/annotations_1/RybQmyBoWEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 23.09], [26.0, 31.77], [33.0, 33.84], [36.0, 39.23], [42.0, 44.25], [45.0, 49.13], [50.0, 52.44], [54.0, 56.42], [59.0, 61.26], [65.0, 66.97], [69.0, 69.42], [71.0, 71.9], [78.0, 79.54], [81.0, 81.82], [82.0, 83.54], [85.0, 84.89], [87.0, 90.96]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.24, 48.44, 0.0, 82.43, 75.55, 92.15, 96.42, 99.84, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.73], "audiomae_on_audioset": [[["speech", 60.22], ["explosion", 3.98], ["fireworks", 3.9]], [["speech", 52.99], ["sheep", 3.91], ["bleat", 3.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [19.09, 5.77, 0.84, 3.23, 2.25, 4.13, 2.44, 2.42, 2.26, 1.97, 0.42, 0.9, 1.54, 0.82, 1.54, -0.11, 3.96]} \ No newline at end of file diff --git a/annotations_1/S-EfnfP_cGY_filtered.json b/annotations_1/S-EfnfP_cGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b67f60ec0a312b6709fe9e0de4879255aa5a91ab --- /dev/null +++ b/annotations_1/S-EfnfP_cGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.53], [11.0, 12.07], [15.0, 15.75], [22.0, 22.6], [27.0, 29.2], [31.0, 32.48], [37.0, 38.84], [40.0, 44.12], [46.0, 74.95], [76.0, 89.75], [93.0, 93.65], [97.0, 99.12], [101.0, 111.27], [114.0, 114.89], [117.0, 117.66], [123.0, 123.67], [126.0, 128.16], [129.0, 130.96], [132.0, 133.81], [137.0, 138.48], [140.0, 141.84], [150.0, 151.71], [155.0, 169.11], [170.0, 171.53], [175.0, 176.62], [179.0, 179.93], [182.0, 182.73], [187.0, 191.0], [194.0, 201.14], [204.0, 207.44], [209.0, 210.39], [214.0, 214.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [88.46, 0.0, 0.0, 0.0, 70.58, 0.0, 0.0, 76.04, 32.24, 52.1, 0.0, 80.29, 70.02, 0.0, 0.0, 0.0, 51.5, 0.0, 0.0, 0.0, 0.0, 0.0, 49.64, 0.0, 0.0, 0.0, 0.0, 54.5, 82.79, 46.19, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 33.65], ["hum", 30.06], ["mains hum", 20.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 37.25], ["music", 33.39], ["whale vocalization", 6.9]], null, null, null, null, null, null, [["music", 49.31], ["ambient music", 10.79], ["synthesizer", 9.77]], null, null], "duration": [5.53, 1.07, 0.75, 0.6, 2.2, 1.48, 1.84, 4.12, 28.95, 13.75, 0.65, 2.12, 10.27, 0.89, 0.66, 0.67, 2.16, 1.96, 1.81, 1.48, 1.84, 1.71, 14.11, 1.53, 1.62, 0.93, 0.73, 4.0, 7.14, 3.44, 1.39, 0.61]} \ No newline at end of file diff --git a/annotations_1/S-M0BOzttdg_filtered.json b/annotations_1/S-M0BOzttdg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54e414d5def9200cb408dbe7fe54e99c1f6ae299 --- /dev/null +++ b/annotations_1/S-M0BOzttdg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.59], [2.0, 5.19], [10.0, 13.66], [15.0, 16.75], [18.0, 19.82], [22.0, 22.54], [23.0, 25.91], [28.0, 30.92], [31.0, 32.49], [38.0, 38.01], [39.0, 40.68], [41.0, 60.18], [61.0, 63.1], [65.0, 67.09], [71.0, 85.94], [87.0, 89.73], [93.0, 93.61], [95.0, 114.13], [116.0, 117.24], [118.0, 119.23], [121.0, 123.09], [124.0, 130.99], [135.0, 139.77], [141.0, 143.48], [145.0, 145.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, true, false, false, false, true, false, true, false], "silence_prob": [0.0, 53.47, 50.76, 0.0, 0.0, 0.0, 50.86, 57.72, 0.0, 0.0, 0.0, 31.92, 32.32, 33.86, 37.06, 58.05, 0.0, 43.85, 0.0, 0.0, 43.3, 40.29, 50.81, 42.19, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 29.5], ["music", 15.82], ["insect", 9.6]], [["hum", 27.11], ["music", 18.91], ["throbbing", 16.66]], [["music", 68.23], ["electronic music", 3.98], ["musical instrument", 3.28]], [["music", 28.79], ["hum", 14.58], ["rumble", 13.64]], null, null, [["speech", 30.11], ["hum", 25.0], ["mains hum", 10.02]], null, null, [["hum", 35.94], ["throbbing", 26.8], ["music", 13.77]], [["music", 25.16], ["hum", 15.18], ["mains hum", 13.65]], null, [["fly, housefly", 16.43], ["hum", 13.43], ["noise", 9.16]], null], "duration": [1.59, 3.19, 3.66, 1.75, 1.82, 0.54, 2.91, 2.92, 1.49, 0.01, 1.68, 19.18, 2.1, 2.09, 14.94, 2.73, 0.61, 19.13, 1.24, 1.23, 2.09, 6.99, 4.77, 2.48, 0.47]} \ No newline at end of file diff --git a/annotations_1/S-WVZ-d28yg_filtered.json b/annotations_1/S-WVZ-d28yg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22fcba4560ee8429421a109b52921063273ab2f8 --- /dev/null +++ b/annotations_1/S-WVZ-d28yg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 15.67], [18.0, 18.27], [28.0, 30.7], [32.0, 35.95], [41.0, 44.79], [48.0, 49.13], [50.0, 49.77], [55.0, 63.9], [68.0, 70.06], [76.0, 89.41], [91.0, 92.48], [101.0, 128.56], [130.0, 138.27], [140.0, 141.27], [142.0, 142.42]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [30.9, 0.0, 30.58, 31.04, 30.31, 0.0, 0.0, 30.63, 34.93, 30.4, 0.0, 30.58, 32.84, 0.0, 0.0], "audiomae_on_audioset": [[["music", 77.61], ["cacophony", 2.69], ["synthesizer", 2.23]], null, [["music", 14.35], ["fly, housefly", 8.32], ["mains hum", 8.19]], [["music", 71.34], ["musical instrument", 5.78], ["trombone", 1.69]], [["music", 78.2], ["musical instrument", 3.59], ["cacophony", 3.25]], null, null, [["music", 64.67], ["cacophony", 6.74], ["throbbing", 2.23]], [["music", 72.17], ["throbbing", 3.99], ["electronic music", 3.09]], [["music", 73.71], ["cacophony", 18.63], ["buzz", 1.66]], null, [["music", 18.32], ["buzz", 16.76], ["hum", 16.13]], [["music", 27.92], ["hum", 21.83], ["mains hum", 15.64]], null, null], "duration": [13.67, 0.27, 2.7, 3.95, 3.79, 1.13, -0.23, 8.9, 2.06, 13.41, 1.48, 27.56, 8.27, 1.27, 0.42]} \ No newline at end of file diff --git a/annotations_1/S-pmcO6U8eg_filtered.json b/annotations_1/S-pmcO6U8eg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51287407e4cda79939250db31dc471d61b35e8d0 --- /dev/null +++ b/annotations_1/S-pmcO6U8eg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 13.74], [15.0, 15.77], [17.0, 21.98], [23.0, 23.08], [24.0, 24.41], [25.0, 25.59], [26.0, 28.21], [29.0, 29.39], [33.0, 32.76], [34.0, 34.47], [38.0, 38.28], [39.0, 40.93], [41.0, 42.23], [43.0, 42.94], [44.0, 44.93], [46.0, 46.79], [47.0, 49.6], [50.0, 51.97], [55.0, 55.24], [67.0, 69.04], [69.0, 70.02], [71.0, 71.37], [72.0, 72.82], [81.0, 81.04], [84.0, 84.03], [87.0, 87.27], [89.0, 88.75], [93.0, 93.51], [96.0, 97.6], [98.0, 98.17], [100.0, 100.48], [103.0, 103.42], [105.0, 105.44], [108.0, 108.04], [110.0, 110.47], [114.0, 114.0], [117.0, 117.54], [119.0, 119.5], [123.0, 123.96], [126.0, 126.64], [128.0, 128.65], [131.0, 131.46], [134.0, 134.35], [135.0, 135.77], [137.0, 137.07], [137.0, 137.67]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.36, 0.0, 52.16, 0.0, 0.0, 0.0, 39.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.69, 0.0, 0.0, 89.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 19.4], ["radio", 17.79], ["frog", 9.51]], null, null, null, null, null, [["speech", 47.34], ["telephone", 11.13], ["sidetone", 10.5]], null, null, null, null, null, null, null, null, null, [["speech", 68.89], ["insect", 9.53], ["radio", 3.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.74, 0.77, 4.98, 0.08, 0.41, 0.59, 2.21, 0.39, -0.24, 0.47, 0.28, 1.93, 1.23, -0.06, 0.93, 0.79, 2.6, 1.97, 0.24, 2.04, 1.02, 0.37, 0.82, 0.04, 0.03, 0.27, -0.25, 0.51, 1.6, 0.17, 0.48, 0.42, 0.44, 0.04, 0.47, 0.0, 0.54, 0.5, 0.96, 0.64, 0.65, 0.46, 0.35, 0.77, 0.07, 0.67]} \ No newline at end of file diff --git a/annotations_1/S04wIhoGYQY_filtered.json b/annotations_1/S04wIhoGYQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..acdd9caa0b6325e3e12ed6d80bd781363c1c38a6 --- /dev/null +++ b/annotations_1/S04wIhoGYQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.47], [24.0, 24.66], [26.0, 26.94], [30.0, 30.38], [33.0, 34.38], [36.0, 37.52], [40.0, 40.58], [44.0, 43.75], [56.0, 60.25], [68.0, 71.61], [72.0, 71.64], [72.0, 72.5], [73.0, 72.54], [73.0, 72.72], [73.0, 72.93], [73.0, 72.96], [73.0, 72.99], [77.0, 77.84], [81.0, 88.59], [91.0, 90.85], [99.0, 99.1], [105.0, 106.49], [114.0, 114.12], [115.0, 115.35], [116.0, 116.34], [121.0, 124.09], [125.0, 125.1], [132.0, 134.27], [138.0, 138.59], [150.0, 150.65], [152.0, 151.95], [153.0, 154.01], [156.0, 156.64], [161.0, 164.34], [177.0, 179.07], [189.0, 190.54]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.53, 39.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.46, 0.0, 32.41, 0.0, 0.0, 0.0, 0.0, 0.0, 37.07, 34.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 26.41], ["hum", 16.81], ["speech", 11.61]], null, null, null, null, null, null, null, null, [["speech", 37.36], ["music", 19.54], ["hum", 12.75]], null, null, null, null, null, null, [["cattle, bovinae", 47.14], ["moo", 30.78], ["livestock, farm animals, working animals", 19.73]], null, [["music", 34.47], ["speech", 30.71], ["musical instrument", 2.11]], null, null, null, null, null, [["music", 35.77], ["speech", 33.09], ["boing", 3.47]], [["cattle, bovinae", 32.95], ["moo", 27.77], ["livestock, farm animals, working animals", 18.03]], null], "duration": [1.47, 0.66, 0.94, 0.38, 1.38, 1.52, 0.58, -0.25, 4.25, 3.61, -0.36, 0.5, -0.46, -0.28, -0.07, -0.04, -0.01, 0.84, 7.59, -0.15, 0.1, 1.49, 0.12, 0.35, 0.34, 3.09, 0.1, 2.27, 0.59, 0.65, -0.05, 1.01, 0.64, 3.34, 2.07, 1.54]} \ No newline at end of file diff --git a/annotations_1/S0IfbNVCoCE_filtered.json b/annotations_1/S0IfbNVCoCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9c2b9c882b896c866b1db6fdbb638e39e1b3693 --- /dev/null +++ b/annotations_1/S0IfbNVCoCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.38], [10.0, 11.85], [13.0, 14.15], [17.0, 20.95], [22.0, 23.48], [25.0, 25.91], [27.0, 28.68], [30.0, 32.9], [33.0, 36.96], [38.0, 38.85], [40.0, 41.59], [42.0, 45.22], [47.0, 49.86], [52.0, 53.37], [55.0, 55.95], [56.0, 58.53], [61.0, 62.87], [64.0, 65.52], [68.0, 68.96], [70.0, 73.74], [75.0, 76.49], [78.0, 78.22], [86.0, 86.32], [88.0, 87.99], [90.0, 91.05], [93.0, 93.83], [95.0, 95.81], [98.0, 98.9], [100.0, 100.45], [103.0, 106.44], [108.0, 109.81], [115.0, 114.81], [117.0, 117.68], [122.0, 122.47], [124.0, 124.26], [129.0, 130.47], [131.0, 132.97], [134.0, 135.67], [139.0, 139.21], [142.0, 142.94], [145.0, 149.81], [150.0, 150.63], [151.0, 153.08], [157.0, 157.86], [161.0, 161.94], [163.0, 170.92], [172.0, 177.82], [179.0, 179.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [78.89, 0.0, 0.0, 99.1, 0.0, 0.0, 0.0, 94.66, 72.46, 0.0, 0.0, 82.97, 99.36, 0.0, 0.0, 44.49, 0.0, 0.0, 0.0, 61.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.14, 0.0, 99.82, 0.0, 0.0, 53.72, 58.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 38.41], ["livestock, farm animals, working animals", 37.86], ["moo", 22.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 16.79], ["mains hum", 11.83], ["caw", 5.18]], null, null, null, null, null, null, null], "duration": [3.38, 1.85, 1.15, 3.95, 1.48, 0.91, 1.68, 2.9, 3.96, 0.85, 1.59, 3.22, 2.86, 1.37, 0.95, 2.53, 1.87, 1.52, 0.96, 3.74, 1.49, 0.22, 0.32, -0.01, 1.05, 0.83, 0.81, 0.9, 0.45, 3.44, 1.81, -0.19, 0.68, 0.47, 0.26, 1.47, 1.97, 1.67, 0.21, 0.94, 4.81, 0.63, 2.08, 0.86, 0.94, 7.92, 5.82, 0.07]} \ No newline at end of file diff --git a/annotations_1/S0LBIxKRCHw_filtered.json b/annotations_1/S0LBIxKRCHw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb6b14b774007bdccb512651358fa59d4f979cce --- /dev/null +++ b/annotations_1/S0LBIxKRCHw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.21], [6.0, 6.52], [8.0, 8.65], [13.0, 13.02], [24.0, 25.46], [29.0, 29.22], [35.0, 36.78], [38.0, 38.45], [49.0, 50.01], [54.0, 54.5], [55.0, 55.9], [59.0, 59.59], [62.0, 62.53], [66.0, 67.19], [79.0, 80.33], [83.0, 83.4], [84.0, 85.31], [87.0, 88.06], [90.0, 91.49], [92.0, 92.23], [99.0, 99.86], [100.0, 100.9], [105.0, 110.78], [112.0, 112.38], [114.0, 114.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 0.52, 0.65, 0.02, 1.46, 0.22, 1.78, 0.45, 1.01, 0.5, 0.9, 0.59, 0.53, 1.19, 1.33, 0.4, 1.31, 1.06, 1.49, 0.23, 0.86, 0.9, 5.78, 0.38, 0.89]} \ No newline at end of file diff --git a/annotations_1/S0X0KScmHvo_filtered.json b/annotations_1/S0X0KScmHvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62d34cc3ff33ac9160b880c20b2f3dd10bbc55bb --- /dev/null +++ b/annotations_1/S0X0KScmHvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 31.51], [33.0, 33.32], [36.0, 36.27], [40.0, 41.23], [45.0, 56.81], [57.0, 73.08], [75.0, 82.85], [84.0, 108.38], [113.0, 113.76], [116.0, 116.33]], "keep_status": [true, false, false, false, true, true, true, false, false, false], "silence_prob": [28.78, 0.0, 0.0, 0.0, 34.56, 43.56, 33.38, 30.79, 0.0, 0.0], "audiomae_on_audioset": [[["music", 26.09], ["throbbing", 23.24], ["speech", 12.85]], null, null, null, [["music", 29.49], ["animal", 25.17], ["hum", 6.48]], [["music", 32.76], ["speech", 26.32], ["hum", 6.49]], [["music", 48.74], ["hum", 12.73], ["speech", 8.13]], [["music", 67.96], ["speech", 9.31], ["fart", 5.6]], null, null], "duration": [7.51, 0.32, 0.27, 1.23, 11.81, 16.08, 7.85, 24.38, 0.76, 0.33]} \ No newline at end of file diff --git a/annotations_1/S0pCBDjC9Wk_filtered.json b/annotations_1/S0pCBDjC9Wk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..591f0f441cf2ca72da0e210c80c5358216d462b6 --- /dev/null +++ b/annotations_1/S0pCBDjC9Wk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [9.0, 9.78], [18.0, 24.54], [27.0, 29.56], [31.0, 36.15], [51.0, 51.73], [59.0, 59.41], [62.0, 62.38], [67.0, 67.47], [75.0, 75.52]], "keep_status": [false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.36, 49.64, 33.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 42.16], ["speech", 21.15], ["music for children", 5.31]], [["music", 47.66], ["synthesizer", 6.88], ["boing", 4.99]], [["boing", 48.4], ["music", 19.28], ["speech", 11.89]], null, null, null, null, null], "duration": [0.5, 0.78, 6.54, 2.56, 5.15, 0.73, 0.41, 0.38, 0.47, 0.52]} \ No newline at end of file diff --git a/annotations_1/S0ymo6QHMc0_filtered.json b/annotations_1/S0ymo6QHMc0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd4c752ba48463c22aaf12a5d01ef8c49bf757e8 --- /dev/null +++ b/annotations_1/S0ymo6QHMc0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 42.33], [44.0, 45.82], [49.0, 51.04], [54.0, 55.26], [56.0, 57.79], [58.0, 59.48], [62.0, 65.74], [66.0, 68.3], [71.0, 71.63], [72.0, 73.92], [75.0, 79.76], [84.0, 85.11], [86.0, 86.31], [87.0, 135.14], [137.0, 136.97], [139.0, 141.05], [144.0, 144.85], [147.0, 149.62], [151.0, 160.02], [160.0, 161.1], [161.0, 162.04], [167.0, 169.01], [169.0, 169.25], [169.0, 169.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [37.27, 0.0, 34.62, 0.0, 0.0, 0.0, 40.36, 39.69, 0.0, 0.0, 36.29, 0.0, 0.0, 0.0, 0.0, 43.98, 0.0, 69.88, 42.93, 0.0, 0.0, 33.32, 0.0, 0.0], "audiomae_on_audioset": [[["music", 71.18], ["singing bowl", 8.04], ["didgeridoo", 6.54]], null, [["music", 38.21], ["hum", 26.47], ["throbbing", 10.2]], null, null, null, [["music", 62.24], ["hum", 9.18], ["mains hum", 4.74]], [["music", 28.78], ["didgeridoo", 28.02], ["speech", 24.16]], null, null, [["music", 65.31], ["hum", 7.3], ["musical instrument", 4.63]], null, null, null, null, [["music", 41.24], ["whale vocalization", 4.94], ["hum", 4.45]], null, null, [["music", 35.76], ["hum", 27.77], ["mains hum", 11.91]], null, null, [["music", 42.57], ["foghorn", 8.49], ["musical instrument", 5.26]], null, null], "duration": [2.33, 1.82, 2.04, 1.26, 1.79, 1.48, 3.74, 2.3, 0.63, 1.92, 4.76, 1.11, 0.31, 48.14, -0.03, 2.05, 0.85, 2.62, 9.02, 1.1, 1.04, 2.01, 0.25, 0.32]} \ No newline at end of file diff --git a/annotations_1/S1Kbym7WYzs_filtered.json b/annotations_1/S1Kbym7WYzs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c24c7a7dd12c3d221df41cf302a31df9992bb63c --- /dev/null +++ b/annotations_1/S1Kbym7WYzs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.51], [23.0, 43.29], [45.0, 54.21], [58.0, 68.42], [74.0, 77.09], [82.0, 82.97], [84.0, 110.07], [111.0, 111.38], [111.0, 111.48], [112.0, 113.0], [115.0, 138.13], [141.0, 140.95], [143.0, 172.99], [181.0, 185.23], [188.0, 213.92], [215.0, 215.99]], "keep_status": [false, true, false, false, false, false, true, false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 28.89, 28.9, 28.85, 32.43, 0.0, 29.24, 0.0, 0.0, 0.0, 28.59, 0.0, 28.42, 28.49, 28.66, 0.0], "audiomae_on_audioset": [null, [["speech", 31.16], ["music", 17.69], ["hum", 11.48]], [["music", 36.24], ["speech", 32.61], ["throbbing", 10.55]], [["music", 68.54], ["throbbing", 10.9], ["hum", 8.14]], [["hum", 39.37], ["throbbing", 36.42], ["mains hum", 8.38]], null, [["hum", 17.05], ["rumble", 12.78], ["speech", 10.97]], null, null, null, [["music", 14.86], ["speech", 12.87], ["hum", 9.17]], null, [["music", 27.59], ["speech", 16.63], ["explosion", 12.37]], [["music", 19.62], ["throbbing", 14.15], ["hum", 11.5]], [["music", 46.16], ["speech", 29.7], ["electronic music", 4.02]], null], "duration": [1.51, 20.29, 9.21, 10.42, 3.09, 0.97, 26.07, 0.38, 0.48, 1.0, 23.13, -0.05, 29.99, 4.23, 25.92, 0.99]} \ No newline at end of file diff --git a/annotations_1/S1NFRvZE3FA_filtered.json b/annotations_1/S1NFRvZE3FA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e856d5139e65c530452ea9fbdec33975521949c --- /dev/null +++ b/annotations_1/S1NFRvZE3FA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[59.0, 68.45], [70.0, 79.46], [81.0, 84.3], [85.0, 106.79], [114.0, 114.66], [115.0, 115.18]], "keep_status": [true, false, false, false, false, false], "silence_prob": [42.6, 53.4, 71.0, 39.18, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 26.63], ["hum", 17.58], ["buzz", 11.69]], null, null, [["music", 53.38], ["hum", 11.45], ["mains hum", 5.63]], null, null], "duration": [9.45, 9.46, 3.3, 21.79, 0.66, 0.18]} \ No newline at end of file diff --git a/annotations_1/S1UpuPvAUss_filtered.json b/annotations_1/S1UpuPvAUss_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3436c03fd80da7ffb98cc6a2133c96660a88705c --- /dev/null +++ b/annotations_1/S1UpuPvAUss_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.25], [3.0, 3.99], [5.0, 7.4], [15.0, 14.72], [16.0, 17.25], [19.0, 19.52], [20.0, 21.22], [25.0, 27.06], [28.0, 33.12], [37.0, 36.76], [37.0, 38.18], [42.0, 41.98], [45.0, 44.69], [49.0, 51.44], [53.0, 60.54], [62.0, 61.94], [62.0, 63.76], [65.0, 71.36], [85.0, 85.92], [97.0, 97.98], [104.0, 105.36], [107.0, 114.91], [116.0, 115.8], [118.0, 122.84], [123.0, 122.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.93, 0.0, 0.0, 0.0, 0.0, 94.07, 33.22, 0.0, 0.0, 0.0, 0.0, 85.35, 99.97, 0.0, 0.0, 52.92, 0.0, 0.0, 0.0, 46.97, 0.0, 95.37, 0.0], "audiomae_on_audioset": [null, null, [["speech", 72.82], ["fart", 5.84], ["electric shaver, electric razor", 1.83]], null, null, null, null, null, [["speech", 83.9], ["grunt", 2.57], ["music", 1.74]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.06], ["sidetone", 17.37], ["hum", 7.81]], null, null, null], "duration": [0.25, 0.99, 2.4, -0.28, 1.25, 0.52, 1.22, 2.06, 5.12, -0.24, 1.18, -0.02, -0.31, 2.44, 7.54, -0.06, 1.76, 6.36, 0.92, 0.98, 1.36, 7.91, -0.2, 4.84, -0.06]} \ No newline at end of file diff --git a/annotations_1/S1Xm1jBc84U_filtered.json b/annotations_1/S1Xm1jBc84U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36021a4b11266ea3decb2d2359f2c3e42f2453fd --- /dev/null +++ b/annotations_1/S1Xm1jBc84U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.95], [7.0, 27.09], [28.0, 29.1], [29.0, 39.01], [42.0, 43.06], [44.0, 52.37], [60.0, 66.19], [70.0, 74.09], [77.0, 79.76], [85.0, 110.52]], "keep_status": [false, false, false, false, false, false, true, false, true, false], "silence_prob": [59.07, 32.79, 0.0, 35.97, 0.0, 36.55, 39.57, 37.58, 39.54, 35.91], "audiomae_on_audioset": [null, [["music", 41.46], ["speech", 37.35], ["hum", 3.6]], null, [["music", 73.54], ["musical instrument", 5.24], ["hum", 3.71]], null, [["music", 81.62], ["musical instrument", 2.18], ["ambient music", 1.78]], [["music", 52.75], ["musical instrument", 7.36], ["didgeridoo", 5.32]], [["music", 66.68], ["synthesizer", 6.56], ["musical instrument", 4.0]], [["music", 29.16], ["effects unit", 9.59], ["bass guitar", 8.79]], [["music", 72.58], ["synthesizer", 9.65], ["theremin", 2.84]]], "duration": [2.95, 20.09, 1.1, 10.01, 1.06, 8.37, 6.19, 4.09, 2.76, 25.52]} \ No newline at end of file diff --git a/annotations_1/S1_AkfEVPpI_filtered.json b/annotations_1/S1_AkfEVPpI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a38224174d4b5a5123d1f064390accd0d17eeeea --- /dev/null +++ b/annotations_1/S1_AkfEVPpI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.45], [8.0, 8.92], [11.0, 11.57], [12.0, 12.88], [14.0, 14.84], [15.0, 15.6], [16.0, 18.32], [19.0, 19.9], [38.0, 39.23], [44.0, 44.47], [45.0, 46.23], [48.0, 52.83], [54.0, 54.36], [55.0, 55.63], [58.0, 59.68], [62.0, 69.55], [71.0, 92.77], [93.0, 93.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [61.37, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 0.0, 0.0, 0.0, 0.0, 35.92, 0.0, 0.0, 0.0, 34.63, 36.84, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 68.35], ["music", 3.42], ["radio", 2.76]], null, null, null, [["speech", 32.8], ["fly, housefly", 12.94], ["mains hum", 5.93]], [["music", 73.24], ["hum", 13.69], ["throbbing", 2.71]], null], "duration": [2.45, 0.92, 0.57, 0.88, 0.84, 0.6, 2.32, 0.9, 1.23, 0.47, 1.23, 4.83, 0.36, 0.63, 1.68, 7.55, 21.77, 0.01]} \ No newline at end of file diff --git a/annotations_1/S1sbKYDgyWA_filtered.json b/annotations_1/S1sbKYDgyWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c03b0d21bdfb37950cd4b2a56c841b35e56c5f0 --- /dev/null +++ b/annotations_1/S1sbKYDgyWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 19.67], [20.0, 27.45], [30.0, 31.51], [33.0, 34.72], [38.0, 38.85], [41.0, 42.36], [46.0, 47.71], [51.0, 52.62], [56.0, 56.42], [61.0, 61.84], [64.0, 64.02], [66.0, 67.0], [68.0, 69.4], [70.0, 83.4], [85.0, 85.09], [97.0, 98.64], [103.0, 114.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.74, 38.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.14, 0.0, 0.0, 33.16], "audiomae_on_audioset": [null, [["mains hum", 64.75], ["hum", 18.63], ["speech", 6.36]], null, null, null, null, null, null, null, null, null, null, null, [["music", 48.67], ["fart", 16.52], ["speech", 6.75]], null, null, [["music", 72.47], ["speech", 8.2], ["throbbing", 2.8]]], "duration": [9.67, 7.45, 1.51, 1.72, 0.85, 1.36, 1.71, 1.62, 0.42, 0.84, 0.02, 1.0, 1.4, 13.4, 0.09, 1.64, 11.74]} \ No newline at end of file diff --git a/annotations_1/S3-atF715Mg_filtered.json b/annotations_1/S3-atF715Mg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3c3c72f15e4cdf36255b0a4b6a847df2b20527a --- /dev/null +++ b/annotations_1/S3-atF715Mg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.46], [11.0, 12.23], [12.0, 13.09], [14.0, 15.48], [17.0, 16.98], [19.0, 20.38], [23.0, 33.18], [34.0, 35.23], [39.0, 43.61], [47.0, 49.11], [51.0, 51.95], [53.0, 53.86], [55.0, 62.95], [70.0, 71.0], [72.0, 72.81], [73.0, 74.11], [82.0, 83.83], [87.0, 86.63], [87.0, 87.54], [89.0, 90.59], [97.0, 99.33], [101.0, 104.99], [106.0, 106.39], [113.0, 113.8]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 0.0, 60.6, 41.24, 0.0, 0.0, 39.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.19, 31.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 32.49], ["sidetone", 21.74], ["glass", 6.06]], null, null, [["hum", 20.03], ["speech", 15.83], ["music", 12.09]], null, null, [["speech", 38.54], ["mains hum", 18.62], ["hum", 13.7]], null, null, null, null, null, null, null, [["music", 27.39], ["speech", 21.31], ["static", 5.12]], [["speech", 47.29], ["music", 13.35], ["throbbing", 4.73]], null, null], "duration": [1.46, 1.23, 1.09, 1.48, -0.02, 1.38, 10.18, 1.23, 4.61, 2.11, 0.95, 0.86, 7.95, 1.0, 0.81, 1.11, 1.83, -0.37, 0.54, 1.59, 2.33, 3.99, 0.39, 0.8]} \ No newline at end of file diff --git a/annotations_1/S3MGT2fahAY_filtered.json b/annotations_1/S3MGT2fahAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f41cc6a5a6662c4905e6cb22425df02c40d4c093 --- /dev/null +++ b/annotations_1/S3MGT2fahAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.17], [12.0, 13.29], [14.0, 16.92], [17.0, 20.34], [31.0, 31.45], [33.0, 37.89], [39.0, 40.34], [47.0, 52.0], [52.0, 52.84], [53.0, 54.89], [55.0, 54.92], [55.0, 54.95], [55.0, 55.04], [55.0, 55.11], [55.0, 55.14], [55.0, 55.17], [55.0, 55.21], [55.0, 55.24], [55.0, 55.27], [55.0, 55.31], [55.0, 55.34], [55.0, 55.38], [55.0, 55.41], [55.0, 55.49], [56.0, 55.54], [56.0, 55.83], [56.0, 56.96], [58.0, 58.33], [63.0, 63.59], [66.0, 66.75], [71.0, 73.3], [74.0, 75.63], [77.0, 77.94], [79.0, 80.7], [81.0, 82.46], [87.0, 88.87], [90.0, 92.11], [96.0, 98.68], [99.0, 100.48], [105.0, 105.78], [106.0, 106.66], [107.0, 111.57], [112.0, 114.08], [116.0, 116.4], [117.0, 120.04], [123.0, 123.5], [125.0, 125.44], [129.0, 129.05], [129.0, 138.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, true, true, false, true, false, false, false, true], "silence_prob": [65.2, 0.0, 62.58, 33.77, 0.0, 30.83, 0.0, 30.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.04, 0.0, 0.0, 0.0, 0.0, 0.0, 48.39, 57.32, 0.0, 0.0, 0.0, 49.68, 48.78, 0.0, 31.21, 0.0, 0.0, 0.0, 29.57], "audiomae_on_audioset": [null, null, null, [["mains hum", 31.04], ["hum", 27.08], ["music", 18.41]], null, [["music", 76.48], ["throbbing", 8.06], ["electronic music", 2.18]], null, [["music", 72.91], ["sidetone", 4.34], ["speech", 3.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["dog", 9.54], ["animal", 8.91], ["whack, thwack", 5.16]], null, null, null, null, null, [["music", 28.45], ["hum", 21.45], ["throbbing", 8.25]], null, null, null, null, [["music", 44.71], ["hum", 12.71], ["ambient music", 10.55]], [["music", 23.52], ["hum", 15.19], ["throbbing", 9.69]], null, [["gong", 12.07], ["music", 11.01], ["didgeridoo", 9.4]], null, null, null, [["music", 16.26], ["speech", 8.8], ["sound effect", 6.6]]], "duration": [5.17, 1.29, 2.92, 3.34, 0.45, 4.89, 1.34, 5.0, 0.84, 1.89, -0.08, -0.05, 0.04, 0.11, 0.14, 0.17, 0.21, 0.24, 0.27, 0.31, 0.34, 0.38, 0.41, 0.49, -0.46, -0.17, 0.96, 0.33, 0.59, 0.75, 2.3, 1.63, 0.94, 1.7, 1.46, 1.87, 2.11, 2.68, 1.48, 0.78, 0.66, 4.57, 2.08, 0.4, 3.04, 0.5, 0.44, 0.05, 9.37]} \ No newline at end of file diff --git a/annotations_1/S3Po0Tld8Po_filtered.json b/annotations_1/S3Po0Tld8Po_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e87ac54dbbc5563cfd2358ceb9ddf5edf6b4adb0 --- /dev/null +++ b/annotations_1/S3Po0Tld8Po_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.74], [24.0, 24.33], [25.0, 26.1], [28.0, 28.97], [30.0, 29.84], [30.0, 36.64], [38.0, 39.18], [40.0, 40.02], [40.0, 41.05], [42.0, 42.08], [44.0, 44.81], [45.0, 45.72], [46.0, 47.07], [48.0, 48.9], [49.0, 49.71], [52.0, 55.17], [56.0, 56.94], [58.0, 58.87], [60.0, 61.87], [64.0, 65.82], [66.0, 66.61], [67.0, 66.82], [67.0, 67.9], [74.0, 73.79], [74.0, 75.52], [76.0, 77.65], [80.0, 81.4], [84.0, 85.23], [105.0, 106.41], [108.0, 107.96], [109.0, 109.92], [111.0, 112.02], [113.0, 114.37], [116.0, 116.04], [117.0, 117.63], [119.0, 120.68], [123.0, 124.01], [126.0, 126.23], [128.0, 127.85], [134.0, 135.73], [138.0, 138.7], [140.0, 142.05], [143.0, 143.55], [162.0, 162.77], [164.0, 164.44], [167.0, 167.83], [170.0, 181.94]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 30.47], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 35.64], ["hum", 15.65], ["mains hum", 12.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.49], ["livestock, farm animals, working animals", 7.08], ["whack, thwack", 6.41]]], "duration": [0.74, 0.33, 1.1, 0.97, -0.16, 6.64, 1.18, 0.02, 1.05, 0.08, 0.81, 0.72, 1.07, 0.9, 0.71, 3.17, 0.94, 0.87, 1.87, 1.82, 0.61, -0.18, 0.9, -0.21, 1.52, 1.65, 1.4, 1.23, 1.41, -0.04, 0.92, 1.02, 1.37, 0.04, 0.63, 1.68, 1.01, 0.23, -0.15, 1.73, 0.7, 2.05, 0.55, 0.77, 0.44, 0.83, 11.94]} \ No newline at end of file diff --git a/annotations_1/S3moqQqx3Nk_filtered.json b/annotations_1/S3moqQqx3Nk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43f8fbb1d36323c436934c2841720dfbc3f7dd01 --- /dev/null +++ b/annotations_1/S3moqQqx3Nk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.44], [7.0, 12.72], [14.0, 29.15], [32.0, 45.08], [47.0, 47.09], [49.0, 71.51], [72.0, 97.6], [100.0, 107.18]], "keep_status": [false, true, false, true, false, false, false, false], "silence_prob": [0.0, 28.25, 28.77, 28.55, 0.0, 28.2, 28.33, 28.66], "audiomae_on_audioset": [null, [["music", 28.02], ["speech", 22.53], ["vehicle", 6.78]], [["music", 45.58], ["speech", 23.45], ["didgeridoo", 3.67]], [["buzz", 27.26], ["speech", 15.54], ["music", 8.95]], null, [["music", 69.59], ["hum", 6.05], ["musical instrument", 4.74]], [["music", 37.82], ["hum", 23.16], ["mains hum", 16.77]], [["music", 76.34], ["speech", 4.67], ["buzz", 1.73]]], "duration": [1.44, 5.72, 15.15, 13.08, 0.09, 22.51, 25.6, 7.18]} \ No newline at end of file diff --git a/annotations_1/S4WqfcnVT2g_filtered.json b/annotations_1/S4WqfcnVT2g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e675cafc9afb529f799b6cf1bc1c1a4051eef91 --- /dev/null +++ b/annotations_1/S4WqfcnVT2g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.95], [10.0, 20.6], [25.0, 25.29], [27.0, 27.7], [32.0, 50.3], [59.0, 64.66], [66.0, 66.8], [69.0, 69.7], [75.0, 78.49], [93.0, 104.26], [105.0, 120.18], [121.0, 149.94], [150.0, 150.26], [150.0, 195.98], [197.0, 197.99]], "keep_status": [false, true, false, false, true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [53.22, 30.49, 0.0, 0.0, 30.33, 31.23, 0.0, 0.0, 38.06, 35.37, 35.72, 38.54, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["cacophony", 14.37], ["gong", 13.43], ["music", 13.24]], null, null, [["music", 45.34], ["cacophony", 15.23], ["noise", 4.9]], [["music", 88.15], ["musical instrument", 2.86], ["synthesizer", 1.47]], null, null, [["music", 74.4], ["throbbing", 3.62], ["musical instrument", 2.34]], [["music", 73.89], ["musical instrument", 5.95], ["didgeridoo", 4.98]], [["music", 40.59], ["hum", 11.92], ["throbbing", 8.38]], [["music", 53.39], ["hum", 7.7], ["effects unit", 5.01]], null, null, null], "duration": [4.95, 10.6, 0.29, 0.7, 18.3, 5.66, 0.8, 0.7, 3.49, 11.26, 15.18, 28.94, 0.26, 45.98, 0.99]} \ No newline at end of file diff --git a/annotations_1/S60NRfBYTl4_filtered.json b/annotations_1/S60NRfBYTl4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e7dd5456b292c4ab1c6ce3eb00649f4b7716084 --- /dev/null +++ b/annotations_1/S60NRfBYTl4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 18.42], [19.0, 33.37], [35.0, 36.49], [38.0, 39.11], [49.0, 52.96], [57.0, 59.56], [61.0, 61.7], [63.0, 64.3], [68.0, 68.67], [70.0, 71.0], [72.0, 75.3], [83.0, 83.3], [88.0, 89.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.23, 85.9, 0.0, 0.0, 36.64, 86.82, 0.0, 0.0, 0.0, 0.0, 76.53, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 85.02], ["speech synthesizer", 6.62], ["male speech, man speaking", 1.02]], null, null, null, null, null, null, null, null], "duration": [9.42, 14.37, 1.49, 1.11, 3.96, 2.56, 0.7, 1.3, 0.67, 1.0, 3.3, 0.3, 1.85]} \ No newline at end of file diff --git a/annotations_1/S64LeYg3Tg4_filtered.json b/annotations_1/S64LeYg3Tg4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d439185018cb88932068456f273ac50537ad8138 --- /dev/null +++ b/annotations_1/S64LeYg3Tg4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.83], [16.0, 16.63], [23.0, 23.43], [27.0, 27.18], [29.0, 29.84], [31.0, 34.2], [36.0, 40.69], [42.0, 42.16], [44.0, 49.92], [50.0, 51.93], [55.0, 57.94], [59.0, 64.03], [66.0, 67.39], [71.0, 71.54], [75.0, 76.0], [80.0, 82.31], [85.0, 85.13], [86.0, 86.51], [95.0, 96.7], [98.0, 101.31], [102.0, 107.99], [110.0, 115.23], [116.0, 118.07], [125.0, 125.93], [134.0, 134.45], [141.0, 140.81], [150.0, 149.62], [151.0, 151.07], [153.0, 153.45], [157.0, 157.05], [160.0, 160.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 97.22, 99.84, 0.0, 72.16, 0.0, 70.3, 100.0, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 96.89, 99.16, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 0.63, 0.43, 0.18, 0.84, 3.2, 4.69, 0.16, 5.92, 1.93, 2.94, 5.03, 1.39, 0.54, 1.0, 2.31, 0.13, 0.51, 1.7, 3.31, 5.99, 5.23, 2.07, 0.93, 0.45, -0.19, -0.38, 0.07, 0.45, 0.05, 0.03]} \ No newline at end of file diff --git a/annotations_1/S6iFW-HoFwc_filtered.json b/annotations_1/S6iFW-HoFwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f862b0bcec1685b93960ec0bc45c849f77c973f5 --- /dev/null +++ b/annotations_1/S6iFW-HoFwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.45], [8.0, 8.43], [11.0, 11.28], [12.0, 12.78], [15.0, 15.3], [16.0, 16.98], [18.0, 18.12], [20.0, 20.75], [22.0, 22.54], [23.0, 22.67], [23.0, 22.77], [23.0, 22.81], [24.0, 24.17], [27.0, 27.87], [29.0, 30.77], [33.0, 34.99], [36.0, 36.98], [37.0, 39.21], [41.0, 42.28], [43.0, 43.51], [44.0, 46.18], [46.0, 47.92], [48.0, 49.87], [55.0, 55.76], [57.0, 57.64], [60.0, 71.95], [73.0, 76.4], [77.0, 83.35], [84.0, 84.33], [86.0, 86.46], [87.0, 92.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.24, 0.0, 0.0, 82.25, 0.0, 0.0, 0.0, 0.0, 49.22, 55.04, 39.41, 0.0, 0.0, 33.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 62.77], ["theremin", 8.68], ["cello", 5.39]], null, [["fly, housefly", 20.43], ["hum", 19.51], ["mains hum", 15.97]], null, null, [["speech", 39.66], ["buzz", 11.3], ["electric shaver, electric razor", 10.37]]], "duration": [1.45, 0.43, 0.28, 0.78, 0.3, 0.98, 0.12, 0.75, 0.54, -0.33, -0.23, -0.19, 0.17, 0.87, 1.77, 1.99, 0.98, 2.21, 1.28, 0.51, 2.18, 1.92, 1.87, 0.76, 0.64, 11.95, 3.4, 6.35, 0.33, 0.46, 5.96]} \ No newline at end of file diff --git a/annotations_1/S6yZ-K4SHJU_filtered.json b/annotations_1/S6yZ-K4SHJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e3581de22214ebc9f878d0434e3c38b38820b6a --- /dev/null +++ b/annotations_1/S6yZ-K4SHJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.13], [18.0, 29.74], [35.0, 50.01], [53.0, 59.63]], "keep_status": [false, false, true, true], "silence_prob": [0.0, 29.08, 36.11, 45.72], "audiomae_on_audioset": [null, [["speech", 71.39], ["boing", 6.57], ["music", 4.97]], [["hum", 42.0], ["throbbing", 9.18], ["mains hum", 5.91]], [["speech", 41.93], ["grunt", 8.28], ["frog", 3.7]]], "duration": [1.13, 11.74, 15.01, 6.63]} \ No newline at end of file diff --git a/annotations_1/S76Oq-NDyvw_filtered.json b/annotations_1/S76Oq-NDyvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a391c4d6804ba73d2932d98d35e5dd92aed3ec7b --- /dev/null +++ b/annotations_1/S76Oq-NDyvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.12], [7.0, 7.43], [20.0, 22.15], [47.0, 48.59], [73.0, 77.33], [80.0, 83.13], [89.0, 94.86]], "keep_status": [false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 32.66, 0.0, 31.83, 31.47, 45.08], "audiomae_on_audioset": [null, null, [["music", 54.13], ["didgeridoo", 23.76], ["musical instrument", 6.01]], null, [["music", 61.84], ["electronic music", 4.12], ["musical instrument", 2.2]], [["music", 50.93], ["musical instrument", 6.06], ["cacophony", 3.68]], [["music", 62.87], ["boing", 7.83], ["synthetic singing", 3.69]]], "duration": [1.12, 0.43, 2.15, 1.59, 4.33, 3.13, 5.86]} \ No newline at end of file diff --git a/annotations_1/S7A0JYPGklw_filtered.json b/annotations_1/S7A0JYPGklw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bdea8fcb040c9ead16fec70aefa5c7975eeae4d --- /dev/null +++ b/annotations_1/S7A0JYPGklw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.58], [5.0, 6.91], [7.0, 9.58], [10.0, 15.45], [19.0, 26.57], [30.0, 38.06], [39.0, 40.83], [42.0, 45.03], [45.0, 49.6], [53.0, 60.59], [62.0, 63.71], [66.0, 67.26], [68.0, 77.72], [81.0, 82.02], [83.0, 83.89], [84.0, 86.07], [88.0, 87.99], [89.0, 90.9], [93.0, 102.81]], "keep_status": [false, false, true, false, false, true, false, true, true, false, false, false, true, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 45.62, 36.72, 39.55, 42.48, 0.0, 33.77, 38.02, 32.55, 0.0, 0.0, 41.1, 0.0, 0.0, 44.66, 0.0, 0.0, 30.7], "audiomae_on_audioset": [null, null, [["music", 31.3], ["speech", 14.12], ["hum", 10.03]], [["hum", 33.16], ["mains hum", 24.24], ["speech", 14.41]], [["hum", 45.83], ["mains hum", 23.83], ["throbbing", 22.31]], [["hum", 24.13], ["mains hum", 21.04], ["throbbing", 20.22]], null, [["hum", 24.94], ["mains hum", 17.07], ["music", 16.04]], [["hum", 33.89], ["music", 17.57], ["throbbing", 14.5]], [["music", 42.94], ["speech", 22.12], ["hum", 7.78]], null, null, [["speech", 32.16], ["hum", 18.15], ["music", 12.41]], null, null, [["speech", 35.39], ["music", 24.89], ["hum", 9.31]], null, null, [["music", 29.69], ["hum", 19.6], ["mains hum", 7.86]]], "duration": [0.58, 1.91, 2.58, 5.45, 7.57, 8.06, 1.83, 3.03, 4.6, 7.59, 1.71, 1.26, 9.72, 1.02, 0.89, 2.07, -0.01, 1.9, 9.81]} \ No newline at end of file diff --git a/annotations_1/S7iDxRJpDZU_filtered.json b/annotations_1/S7iDxRJpDZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0aa63c601f7c0358b727fcd33c875ee35e02e6c5 --- /dev/null +++ b/annotations_1/S7iDxRJpDZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 57.45], [61.0, 66.14], [69.0, 69.52], [70.0, 71.63], [73.0, 86.73], [90.0, 111.89], [113.0, 116.8]], "keep_status": [false, false, false, false, false, true, true], "silence_prob": [40.79, 65.32, 0.0, 0.0, 32.39, 30.23, 43.96], "audiomae_on_audioset": [[["mains hum", 40.79], ["hum", 20.0], ["buzz", 16.51]], null, null, null, [["music", 61.42], ["buzz", 7.23], ["hum", 4.29]], [["speech", 35.15], ["music", 10.83], ["hum", 8.97]], [["music", 33.24], ["speech", 5.29], ["electronic music", 4.91]]], "duration": [8.45, 5.14, 0.52, 1.63, 13.73, 21.89, 3.8]} \ No newline at end of file diff --git a/annotations_1/S989EXPoZKs_filtered.json b/annotations_1/S989EXPoZKs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12644afc87d77d4fa6f676d0bf0edcc6e8420853 --- /dev/null +++ b/annotations_1/S989EXPoZKs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.81], [13.0, 13.41], [15.0, 20.09], [33.0, 36.1], [37.0, 42.26], [45.0, 46.11], [50.0, 50.5], [56.0, 57.15], [58.0, 58.7], [61.0, 62.48], [63.0, 64.79], [67.0, 66.87], [72.0, 75.42], [76.0, 79.98], [82.0, 82.17], [84.0, 84.65], [96.0, 95.88], [97.0, 103.52], [106.0, 106.46], [109.0, 110.74], [111.0, 118.37], [120.0, 124.5], [126.0, 127.08], [135.0, 136.73], [138.0, 139.01], [141.0, 144.53], [146.0, 148.34], [150.0, 151.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 71.57, 100.0, 88.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.16, 0.0, 0.0, 0.0, 44.4, 0.0, 0.0, 38.19, 40.54, 0.0, 0.0, 0.0, 93.91, 99.84, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.84], ["ambient music", 5.04], ["musical instrument", 4.71]], null, null, [["music", 70.04], ["bass guitar", 9.25], ["musical instrument", 3.54]], [["music", 58.43], ["speech", 12.28], ["bass guitar", 3.08]], null, null, null, null, null, null], "duration": [-0.19, 0.41, 5.09, 3.1, 5.26, 1.11, 0.5, 1.15, 0.7, 1.48, 1.79, -0.13, 3.42, 3.98, 0.17, 0.65, -0.12, 6.52, 0.46, 1.74, 7.37, 4.5, 1.08, 1.73, 1.01, 3.53, 2.34, 1.44]} \ No newline at end of file diff --git a/annotations_1/S99xKAAo43k_filtered.json b/annotations_1/S99xKAAo43k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c0d3047c019ad47320af165cf69a9cf6c811d41 --- /dev/null +++ b/annotations_1/S99xKAAo43k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 22.01], [22.0, 22.79], [25.0, 26.4], [28.0, 33.42], [35.0, 44.9], [46.0, 47.97], [48.0, 48.96], [51.0, 51.16], [53.0, 53.18], [55.0, 55.68], [56.0, 56.54], [57.0, 57.57], [67.0, 67.78], [74.0, 92.5], [94.0, 95.0], [100.0, 100.74], [102.0, 102.25], [103.0, 103.3], [104.0, 105.14], [106.0, 106.66], [118.0, 118.72], [120.0, 120.73], [124.0, 124.85], [126.0, 128.73]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [32.51, 0.0, 0.0, 34.49, 33.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.05], "audiomae_on_audioset": [[["music", 50.21], ["throbbing", 15.32], ["didgeridoo", 12.34]], null, null, [["music", 42.81], ["throbbing", 16.1], ["hum", 3.94]], [["music", 40.59], ["throbbing", 10.02], ["hum", 5.97]], null, null, null, null, null, null, null, null, [["music", 59.94], ["speech", 18.03], ["throbbing", 6.87]], null, null, null, null, null, null, null, null, null, [["music", 18.92], ["hum", 13.83], ["speech", 11.34]]], "duration": [8.01, 0.79, 1.4, 5.42, 9.9, 1.97, 0.96, 0.16, 0.18, 0.68, 0.54, 0.57, 0.78, 18.5, 1.0, 0.74, 0.25, 0.3, 1.14, 0.66, 0.72, 0.73, 0.85, 2.73]} \ No newline at end of file diff --git a/annotations_1/S9EIFSWUoOc_filtered.json b/annotations_1/S9EIFSWUoOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e0722c06a71db06e19b7767c8ac1af73deedda5 --- /dev/null +++ b/annotations_1/S9EIFSWUoOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 25.15], [27.0, 28.59], [31.0, 31.24], [32.0, 31.7], [32.0, 33.05], [37.0, 37.71], [44.0, 44.12], [45.0, 45.87], [46.0, 47.06], [50.0, 50.11], [53.0, 53.06], [62.0, 62.65], [71.0, 70.87], [72.0, 72.3], [74.0, 74.29], [81.0, 82.07], [83.0, 83.27], [90.0, 96.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [62.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [19.15, 1.59, 0.24, -0.3, 1.05, 0.71, 0.12, 0.87, 1.06, 0.11, 0.06, 0.65, -0.13, 0.3, 0.29, 1.07, 0.27, 6.9]} \ No newline at end of file diff --git a/annotations_1/S9U3ajjpH5A_filtered.json b/annotations_1/S9U3ajjpH5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b16e27872fa0df3a92d7daece72b233ecfb0b33 --- /dev/null +++ b/annotations_1/S9U3ajjpH5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.16], [2.0, 2.15], [3.0, 5.71], [6.0, 6.91], [8.0, 12.11], [22.0, 31.87], [33.0, 40.78]], "keep_status": [false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 35.2, 0.0, 30.5, 49.97, 32.67], "audiomae_on_audioset": [null, null, [["speech", 48.79], ["music", 16.68], ["sidetone", 15.18]], null, [["breaking", 42.21], ["glass", 13.35], ["music", 7.99]], [["hum", 17.52], ["stomach rumble", 8.88], ["music", 6.71]], [["breaking", 22.96], ["music", 11.54], ["thunk", 10.87]]], "duration": [0.16, 0.15, 2.71, 0.91, 4.11, 9.87, 7.78]} \ No newline at end of file diff --git a/annotations_1/SCR9s8egrmo_filtered.json b/annotations_1/SCR9s8egrmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52619f2e98cb522901748e358bfc92560b8257d7 --- /dev/null +++ b/annotations_1/SCR9s8egrmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.04], [6.0, 6.79], [11.0, 11.16], [17.0, 17.32], [19.0, 19.53], [27.0, 26.92], [29.0, 29.24], [30.0, 30.25], [32.0, 34.64], [35.0, 36.24], [37.0, 40.85], [42.0, 44.44], [45.0, 46.99], [51.0, 53.6], [54.0, 56.27], [58.0, 58.31], [63.0, 63.98], [68.0, 68.35], [75.0, 75.51], [76.0, 77.67], [79.0, 81.45], [82.0, 82.21], [84.0, 85.85], [87.0, 91.18], [92.0, 94.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.19, 0.0, 37.02, 63.64, 0.0, 99.05, 54.7, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0, 0.0, 91.47, 79.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 72.05], ["speech", 4.34], ["boing", 4.01]], null, [["music", 74.35], ["boing", 6.42], ["musical instrument", 5.06]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.79, 0.16, 0.32, 0.53, -0.08, 0.24, 0.25, 2.64, 1.24, 3.85, 2.44, 1.99, 2.6, 2.27, 0.31, 0.98, 0.35, 0.51, 1.67, 2.45, 0.21, 1.85, 4.18, 2.83]} \ No newline at end of file diff --git a/annotations_1/SCn7SurOKdw_filtered.json b/annotations_1/SCn7SurOKdw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24528c37c63881e9eaf18ed95652e1889b50b5da --- /dev/null +++ b/annotations_1/SCn7SurOKdw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.77], [15.0, 15.38], [19.0, 20.02], [26.0, 26.96], [30.0, 30.87], [37.0, 37.5], [40.0, 40.54], [45.0, 45.4], [46.0, 47.39], [49.0, 49.03], [68.0, 69.57], [70.0, 72.55], [74.0, 74.38], [76.0, 76.4], [78.0, 78.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [40.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.36, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.76], ["didgeridoo", 27.32], ["speech", 4.51]], null, null, null, null, null, null, null, null, null, null, [["music", 29.72], ["speech", 26.05], ["theremin", 10.86]], null, null, null], "duration": [2.77, 0.38, 1.02, 0.96, 0.87, 0.5, 0.54, 0.4, 1.39, 0.03, 1.57, 2.55, 0.38, 0.4, 0.39]} \ No newline at end of file diff --git a/annotations_1/SD0eJL4D6q0_filtered.json b/annotations_1/SD0eJL4D6q0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af2d53d7f77ece3db6560dadc7046f0bd2a6b956 --- /dev/null +++ b/annotations_1/SD0eJL4D6q0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.5], [19.0, 33.79], [34.0, 39.23], [43.0, 42.97], [48.0, 53.54], [54.0, 74.51], [76.0, 99.93], [101.0, 108.6], [111.0, 111.2]], "keep_status": [true, false, true, false, false, false, true, true, false], "silence_prob": [29.76, 32.16, 31.22, 0.0, 34.43, 35.14, 30.23, 29.06, 0.0], "audiomae_on_audioset": [[["music", 31.91], ["hum", 20.2], ["mains hum", 10.84]], [["hum", 56.24], ["throbbing", 16.24], ["music", 16.11]], [["music", 40.29], ["electronic music", 10.01], ["singing bowl", 7.0]], null, [["music", 40.41], ["speech", 22.65], ["singing bowl", 12.34]], [["music", 42.69], ["hum", 20.62], ["mains hum", 9.16]], [["music", 25.59], ["singing bowl", 16.69], ["insect", 12.38]], [["music", 42.39], ["hum", 13.16], ["mains hum", 7.62]], null], "duration": [4.5, 14.79, 5.23, -0.03, 5.54, 20.51, 23.93, 7.6, 0.2]} \ No newline at end of file diff --git a/annotations_1/SDIk9DOro4A_filtered.json b/annotations_1/SDIk9DOro4A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efaa07bed41cf4355f025b406cb2ddd4c41c3edf --- /dev/null +++ b/annotations_1/SDIk9DOro4A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.05], [11.0, 10.99], [19.0, 19.5], [27.0, 55.63], [57.0, 63.27], [74.0, 74.29], [75.0, 79.57], [82.0, 86.83], [90.0, 95.44], [96.0, 96.79], [105.0, 105.24], [116.0, 120.39], [121.0, 125.95], [131.0, 131.03], [136.0, 136.19], [141.0, 142.18], [145.0, 150.03], [152.0, 151.98], [155.0, 156.63], [159.0, 160.22], [161.0, 161.22], [168.0, 168.4], [172.0, 173.26], [175.0, 179.04], [181.0, 181.77], [188.0, 190.32], [192.0, 192.84], [197.0, 196.69], [197.0, 199.72]], "keep_status": [false, false, false, true, true, false, true, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.37, 37.65, 0.0, 44.23, 36.89, 37.24, 0.0, 0.0, 44.01, 89.72, 0.0, 0.0, 0.0, 35.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 86.27, 0.0, 0.0, 58.81], "audiomae_on_audioset": [null, null, null, [["music", 41.58], ["livestock, farm animals, working animals", 14.86], ["moo", 7.64]], [["hum", 33.23], ["mains hum", 16.41], ["music", 15.77]], null, [["speech", 20.22], ["whack, thwack", 10.89], ["bouncing", 9.47]], [["speech", 85.92], ["beatboxing", 7.41], ["fart", 1.81]], [["speech", 21.45], ["music", 19.83], ["boing", 12.17]], null, null, [["thunk", 42.78], ["music", 14.91], ["whack, thwack", 6.1]], null, null, null, null, [["music", 24.17], ["laughter", 10.79], ["belly laugh", 7.65]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.05, -0.01, 0.5, 28.63, 6.27, 0.29, 4.57, 4.83, 5.44, 0.79, 0.24, 4.39, 4.95, 0.03, 0.19, 1.18, 5.03, -0.02, 1.63, 1.22, 0.22, 0.4, 1.26, 4.04, 0.77, 2.32, 0.84, -0.31, 2.72]} \ No newline at end of file diff --git a/annotations_1/SDq_ZTxHLh4_filtered.json b/annotations_1/SDq_ZTxHLh4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42447c6861ac7561dce8b1ceeae3745cf1ab4bbd --- /dev/null +++ b/annotations_1/SDq_ZTxHLh4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.66], [8.0, 8.58], [16.0, 16.48], [17.0, 19.04], [20.0, 20.33], [23.0, 23.65], [29.0, 29.42], [32.0, 32.48], [33.0, 33.57], [36.0, 36.42], [47.0, 48.02], [49.0, 49.49], [50.0, 51.27], [52.0, 74.16], [78.0, 78.9], [88.0, 88.11], [92.0, 92.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.49, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.34], ["synthesizer", 10.21], ["didgeridoo", 5.25]], null, null, null], "duration": [-0.34, 0.58, 0.48, 2.04, 0.33, 0.65, 0.42, 0.48, 0.57, 0.42, 1.02, 0.49, 1.27, 22.16, 0.9, 0.11, 0.37]} \ No newline at end of file diff --git a/annotations_1/SELFeneZL04_filtered.json b/annotations_1/SELFeneZL04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf48aaa609fd33d7c927c46342843212da08989a --- /dev/null +++ b/annotations_1/SELFeneZL04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.34], [7.0, 7.87], [13.0, 13.51], [16.0, 18.1], [19.0, 20.41], [26.0, 26.62], [27.0, 28.54], [31.0, 31.75], [33.0, 37.05], [38.0, 40.0], [41.0, 44.56], [45.0, 47.93], [48.0, 49.92], [51.0, 66.8], [69.0, 69.92], [71.0, 75.46], [80.0, 87.94], [89.0, 91.23], [94.0, 97.24], [106.0, 110.71], [112.0, 115.69], [116.0, 116.99], [120.0, 120.31], [123.0, 123.92], [126.0, 129.05]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 73.06, 0.0, 0.0, 0.0, 0.0, 48.82, 78.38, 79.59, 84.62, 0.0, 67.76, 0.0, 34.06, 33.34, 32.93, 32.64, 31.17, 30.65, 0.0, 0.0, 0.0, 58.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 11.16], ["rumble", 10.27], ["goat", 5.61]], null, null, null, null, null, null, [["music", 74.21], ["singing", 5.4], ["musical instrument", 2.34]], [["music", 66.76], ["didgeridoo", 11.88], ["singing", 2.14]], [["music", 64.68], ["musical instrument", 5.54], ["guitar", 5.44]], [["music", 63.81], ["didgeridoo", 7.19], ["synthesizer", 2.98]], [["music", 69.29], ["musical instrument", 3.97], ["clarinet", 1.88]], [["music", 64.95], ["musical instrument", 5.14], ["sitar", 2.41]], null, null, null, null], "duration": [1.34, 0.87, 0.51, 2.1, 1.41, 0.62, 1.54, 0.75, 4.05, 2.0, 3.56, 2.93, 1.92, 15.8, 0.92, 4.46, 7.94, 2.23, 3.24, 4.71, 3.69, 0.99, 0.31, 0.92, 3.05]} \ No newline at end of file diff --git a/annotations_1/SF5EacV4NI0_filtered.json b/annotations_1/SF5EacV4NI0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21af10b44e14b0cbf4fc640e7e95e39fb704cf17 --- /dev/null +++ b/annotations_1/SF5EacV4NI0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 22.15], [26.0, 26.06], [26.0, 29.27], [47.0, 47.49], [50.0, 50.06], [51.0, 51.71], [54.0, 57.03], [59.0, 64.18], [65.0, 65.6], [70.0, 77.7], [107.0, 111.7], [112.0, 112.58]], "keep_status": [false, false, false, false, false, false, true, true, false, true, true, false], "silence_prob": [38.86, 0.0, 32.61, 0.0, 0.0, 0.0, 44.4, 40.17, 0.0, 42.55, 39.43, 0.0], "audiomae_on_audioset": [[["music", 31.1], ["speech", 24.91], ["animal", 15.14]], null, [["speech", 59.08], ["horse", 11.43], ["clip-clop", 7.97]], null, null, null, [["moo", 17.39], ["cattle, bovinae", 15.9], ["livestock, farm animals, working animals", 11.66]], [["speech", 20.01], ["cattle, bovinae", 18.44], ["moo", 15.0]], null, [["radio", 21.77], ["speech", 20.79], ["cattle, bovinae", 11.53]], [["cattle, bovinae", 21.64], ["livestock, farm animals, working animals", 17.87], ["music", 16.03]], null], "duration": [18.15, 0.06, 3.27, 0.49, 0.06, 0.71, 3.03, 5.18, 0.6, 7.7, 4.7, 0.58]} \ No newline at end of file diff --git a/annotations_1/SHaByZZvfFE_filtered.json b/annotations_1/SHaByZZvfFE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7959618578a4464e10df4fd84efabf17c3a72602 --- /dev/null +++ b/annotations_1/SHaByZZvfFE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 49.2], [50.0, 50.3], [59.0, 60.93], [66.0, 72.86], [75.0, 76.18], [79.0, 79.19], [81.0, 87.07], [88.0, 95.77], [102.0, 104.21]], "keep_status": [false, false, false, true, false, false, true, true, true], "silence_prob": [30.1, 0.0, 0.0, 29.78, 0.0, 0.0, 29.65, 30.32, 32.58], "audiomae_on_audioset": [[["whale vocalization", 52.08], ["music", 28.18], ["speech", 2.34]], null, null, [["music", 27.01], ["throbbing", 26.09], ["hum", 5.02]], null, null, [["buzz", 14.44], ["insect", 12.03], ["music", 11.55]], [["music", 23.45], ["speech", 20.19], ["fly, housefly", 7.35]], [["mains hum", 18.63], ["music", 17.04], ["hum", 11.01]]], "duration": [17.2, 0.3, 1.93, 6.86, 1.18, 0.19, 6.07, 7.77, 2.21]} \ No newline at end of file diff --git a/annotations_1/SJ1_epc6q2E_filtered.json b/annotations_1/SJ1_epc6q2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b0c973df16747ffa268607d4e12ae6664626658 --- /dev/null +++ b/annotations_1/SJ1_epc6q2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.43], [12.0, 15.25], [18.0, 19.95], [21.0, 21.83], [25.0, 26.52], [28.0, 31.06], [33.0, 33.74], [35.0, 41.17], [42.0, 43.38], [44.0, 46.16], [48.0, 49.15], [50.0, 52.69], [53.0, 55.88], [57.0, 58.09], [59.0, 59.85], [61.0, 62.65], [64.0, 65.04], [67.0, 67.91], [70.0, 71.09], [76.0, 77.55], [78.0, 80.01], [81.0, 83.02], [84.0, 85.48], [86.0, 87.15], [88.0, 88.01], [93.0, 93.02], [93.0, 101.24], [102.0, 103.28], [105.0, 106.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.44, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 95.23, 0.0, 100.0, 98.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, 3.25, 1.95, 0.83, 1.52, 3.06, 0.74, 6.17, 1.38, 2.16, 1.15, 2.69, 2.88, 1.09, 0.85, 1.65, 1.04, 0.91, 1.09, 1.55, 2.01, 2.02, 1.48, 1.15, 0.01, 0.02, 8.24, 1.28, 1.42]} \ No newline at end of file diff --git a/annotations_1/SJSDO3IHsrs_filtered.json b/annotations_1/SJSDO3IHsrs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd111b2dca3de7e540b52adff087a8899015ba85 --- /dev/null +++ b/annotations_1/SJSDO3IHsrs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.09], [10.0, 14.15], [17.0, 26.4], [40.0, 51.06], [52.0, 67.05], [75.0, 75.36], [77.0, 80.0], [87.0, 89.14], [93.0, 100.99], [112.0, 113.27], [124.0, 125.44], [131.0, 133.91], [136.0, 136.56], [140.0, 142.11], [146.0, 153.44], [155.0, 155.44]], "keep_status": [false, false, true, false, true, false, false, true, false, false, false, true, false, true, true, false], "silence_prob": [44.81, 35.1, 32.25, 30.61, 30.89, 0.0, 39.09, 29.45, 33.69, 0.0, 0.0, 48.52, 0.0, 37.61, 31.48, 0.0], "audiomae_on_audioset": [[["music", 69.17], ["didgeridoo", 12.56], ["musical instrument", 4.65]], [["music", 35.28], ["whale vocalization", 34.26], ["musical instrument", 5.3]], [["music", 25.86], ["fly, housefly", 12.42], ["insect", 7.9]], [["music", 70.72], ["hum", 4.92], ["throbbing", 3.34]], [["music", 51.7], ["speech", 9.59], ["rumble", 4.46]], null, [["music", 64.19], ["hum", 5.71], ["scary music", 4.96]], [["music", 17.94], ["hum", 10.08], ["eruption", 6.25]], [["music", 54.43], ["didgeridoo", 14.96], ["quack", 2.42]], null, null, [["hum", 21.95], ["music", 18.55], ["mains hum", 8.18]], null, [["music", 24.19], ["speech", 15.63], ["hum", 15.52]], [["music", 46.72], ["scary music", 12.3], ["bell", 5.43]], null], "duration": [3.09, 4.15, 9.4, 11.06, 15.05, 0.36, 3.0, 2.14, 7.99, 1.27, 1.44, 2.91, 0.56, 2.11, 7.44, 0.44]} \ No newline at end of file diff --git a/annotations_1/SJdUJZ7odoU_filtered.json b/annotations_1/SJdUJZ7odoU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0502e0837d09d75b12330dd016f5c709f3cf8055 --- /dev/null +++ b/annotations_1/SJdUJZ7odoU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 17.66], [19.0, 21.41], [22.0, 22.55], [25.0, 25.42], [27.0, 26.96], [28.0, 28.85], [31.0, 32.75], [35.0, 37.03], [38.0, 37.99], [39.0, 41.27], [42.0, 44.71], [45.0, 46.94], [53.0, 53.84], [56.0, 56.79], [58.0, 59.49], [61.0, 63.64], [64.0, 77.58], [78.0, 81.53], [82.0, 83.3], [85.0, 86.51], [88.0, 92.75], [93.0, 101.31], [102.0, 104.08], [105.0, 106.12], [107.0, 112.9]], "keep_status": [false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [37.05, 35.36, 0.0, 0.0, 0.0, 0.0, 0.0, 37.07, 0.0, 36.96, 37.54, 0.0, 0.0, 0.0, 0.0, 42.65, 28.38, 29.2, 0.0, 0.0, 31.9, 31.85, 30.98, 0.0, 29.37], "audiomae_on_audioset": [[["hum", 43.12], ["mains hum", 39.34], ["music", 7.22]], [["sine wave", 40.69], ["speech", 20.78], ["music", 9.73]], null, null, null, null, null, [["hum", 25.38], ["mains hum", 21.69], ["music", 12.58]], null, [["music", 43.92], ["gong", 9.73], ["hum", 9.7]], [["music", 55.46], ["electronic music", 7.72], ["gong", 5.76]], null, null, null, null, [["music", 46.92], ["hum", 16.9], ["electronic music", 6.81]], [["speech", 49.62], ["music", 15.75], ["burst, pop", 4.48]], [["speech", 30.12], ["burst, pop", 10.89], ["explosion", 8.93]], null, null, [["throbbing", 74.37], ["hum", 14.0], ["music", 5.46]], [["hum", 34.96], ["throbbing", 30.73], ["speech", 18.0]], [["music", 86.11], ["throbbing", 2.88], ["electronic music", 1.65]], null, [["music", 76.1], ["hum", 4.55], ["didgeridoo", 3.32]]], "duration": [15.66, 2.41, 0.55, 0.42, -0.04, 0.85, 1.75, 2.03, -0.01, 2.27, 2.71, 1.94, 0.84, 0.79, 1.49, 2.64, 13.58, 3.53, 1.3, 1.51, 4.75, 8.31, 2.08, 1.12, 5.9]} \ No newline at end of file diff --git a/annotations_1/SK4l-e7UvRs_filtered.json b/annotations_1/SK4l-e7UvRs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d47952aa85fd35b6062e32509a903ff1d4be093b --- /dev/null +++ b/annotations_1/SK4l-e7UvRs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.55], [6.0, 6.67], [9.0, 9.24], [11.0, 15.94], [29.0, 33.84]], "keep_status": [false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 33.06, 34.4], "audiomae_on_audioset": [null, null, null, [["livestock, farm animals, working animals", 20.49], ["canidae, dogs, wolves", 10.98], ["cattle, bovinae", 7.36]], [["cheering", 25.26], ["crowd", 19.39], ["music", 5.68]]], "duration": [0.55, 0.67, 0.24, 4.94, 4.84]} \ No newline at end of file diff --git a/annotations_1/SKC8iPeIvEA_filtered.json b/annotations_1/SKC8iPeIvEA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed2805f09bcddc7c91fb297c35210fbc0b6f9b51 --- /dev/null +++ b/annotations_1/SKC8iPeIvEA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.32], [11.0, 12.02], [18.0, 19.26], [32.0, 33.44], [52.0, 52.46], [123.0, 124.11]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.32, 1.02, 1.26, 1.44, 0.46, 1.11]} \ No newline at end of file diff --git a/annotations_1/SKDX-qJaJ08_filtered.json b/annotations_1/SKDX-qJaJ08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f62621e13f240b8258a5425b5e4f39cb1cb3a83 --- /dev/null +++ b/annotations_1/SKDX-qJaJ08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.59], [17.0, 19.04], [36.0, 37.13], [39.0, 39.33], [42.0, 44.86], [46.0, 50.14], [51.0, 52.12], [53.0, 55.41], [56.0, 57.11], [57.0, 57.28], [57.0, 57.54], [58.0, 59.41], [62.0, 63.1], [64.0, 68.13], [69.0, 69.77], [71.0, 71.17], [73.0, 74.14], [75.0, 88.91], [89.0, 92.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.93, 97.22, 0.0, 0.0, 92.64, 88.83, 0.0, 62.78, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 100.0, 46.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 61.18], ["speech", 15.87], ["moo", 5.42]]], "duration": [3.59, 2.04, 1.13, 0.33, 2.86, 4.14, 1.12, 2.41, 1.11, 0.28, 0.54, 1.41, 1.1, 4.13, 0.77, 0.17, 1.14, 13.91, 3.67]} \ No newline at end of file diff --git a/annotations_1/SKTvxXjJ_MU_filtered.json b/annotations_1/SKTvxXjJ_MU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..173c43267ed3e6352d35e535f1cb75719f3289dd --- /dev/null +++ b/annotations_1/SKTvxXjJ_MU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.75], [9.0, 10.76], [11.0, 13.8], [16.0, 16.46], [18.0, 18.23], [19.0, 25.35], [26.0, 26.05], [26.0, 27.09], [29.0, 28.83], [31.0, 36.63], [42.0, 42.94], [43.0, 44.17], [45.0, 48.19], [51.0, 52.2], [68.0, 69.99], [73.0, 73.65], [81.0, 85.45], [99.0, 99.54], [105.0, 107.81], [123.0, 123.62], [125.0, 137.39], [141.0, 148.78], [153.0, 153.35], [155.0, 157.11], [158.0, 158.87], [171.0, 175.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, true, false, true, false, true], "silence_prob": [37.28, 0.0, 33.5, 0.0, 0.0, 32.56, 0.0, 0.0, 0.0, 29.62, 0.0, 0.0, 29.81, 0.0, 0.0, 0.0, 31.44, 0.0, 31.37, 0.0, 30.55, 29.42, 0.0, 32.28, 0.0, 37.78], "audiomae_on_audioset": [[["hum", 30.29], ["throbbing", 28.63], ["music", 15.62]], null, [["mains hum", 36.81], ["hum", 31.06], ["sidetone", 9.12]], null, null, [["throbbing", 39.21], ["hum", 32.92], ["mains hum", 12.44]], null, null, null, [["hum", 44.12], ["throbbing", 21.07], ["mains hum", 19.38]], null, null, [["throbbing", 31.45], ["hum", 11.5], ["music", 11.31]], null, null, null, [["music", 36.03], ["boing", 12.2], ["buzz", 10.78]], null, [["music", 49.38], ["percussion", 5.17], ["throbbing", 2.96]], null, [["livestock, farm animals, working animals", 50.03], ["music", 13.48], ["cattle, bovinae", 9.46]], [["music", 18.68], ["livestock, farm animals, working animals", 13.56], ["cattle, bovinae", 7.73]], null, [["music", 43.85], ["didgeridoo", 7.59], ["theremin", 6.85]], null, [["music", 29.77], ["hum", 16.03], ["foghorn", 9.1]]], "duration": [4.75, 1.76, 2.8, 0.46, 0.23, 6.35, 0.05, 1.09, -0.17, 5.63, 0.94, 1.17, 3.19, 1.2, 1.99, 0.65, 4.45, 0.54, 2.81, 0.62, 12.39, 7.78, 0.35, 2.11, 0.87, 4.14]} \ No newline at end of file diff --git a/annotations_1/SLC0omm3N98_filtered.json b/annotations_1/SLC0omm3N98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a07a5460fd57e5df2805aaee6f917d89ecbc2d4f --- /dev/null +++ b/annotations_1/SLC0omm3N98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.46], [21.0, 21.66], [22.0, 22.76], [25.0, 26.42], [27.0, 27.57], [30.0, 32.31], [34.0, 34.94], [38.0, 40.04], [42.0, 42.92], [44.0, 45.87], [48.0, 49.69], [52.0, 51.75], [52.0, 53.13], [53.0, 55.36], [56.0, 56.46], [57.0, 58.5], [60.0, 60.88], [62.0, 66.48], [68.0, 69.09], [69.0, 70.87], [71.0, 72.5], [73.0, 73.63], [75.0, 75.56], [77.0, 78.11], [83.0, 86.9], [88.0, 89.75], [91.0, 93.24], [94.0, 93.87], [95.0, 96.33], [97.0, 98.44], [104.0, 104.33], [106.0, 117.58], [120.0, 122.62], [123.0, 123.7], [124.0, 124.95], [128.0, 128.76], [132.0, 132.09], [135.0, 135.06], [143.0, 142.55], [145.0, 146.47], [147.0, 147.93], [149.0, 149.22], [150.0, 150.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.52, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 0.66, 0.76, 1.42, 0.57, 2.31, 0.94, 2.04, 0.92, 1.87, 1.69, -0.25, 1.13, 2.36, 0.46, 1.5, 0.88, 4.48, 1.09, 1.87, 1.5, 0.63, 0.56, 1.11, 3.9, 1.75, 2.24, -0.13, 1.33, 1.44, 0.33, 11.58, 2.62, 0.7, 0.95, 0.76, 0.09, 0.06, -0.45, 1.47, 0.93, 0.22, 0.5]} \ No newline at end of file diff --git a/annotations_1/SLL5ziDWc6k_filtered.json b/annotations_1/SLL5ziDWc6k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6d43b3c7a62d9360f1516ee9464d73065cbe02b --- /dev/null +++ b/annotations_1/SLL5ziDWc6k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.38], [5.0, 12.99], [18.0, 18.06], [21.0, 21.3], [24.0, 24.6], [26.0, 25.98], [27.0, 39.12], [40.0, 40.34], [45.0, 47.97], [51.0, 52.59], [54.0, 53.91], [68.0, 83.27], [84.0, 94.07], [96.0, 97.88], [99.0, 100.52], [103.0, 102.95], [106.0, 108.03], [110.0, 110.71]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 35.75, 0.0, 0.0, 0.0, 0.0, 29.07, 0.0, 69.2, 0.0, 0.0, 29.2, 42.62, 0.0, 0.0, 0.0, 69.47, 0.0], "audiomae_on_audioset": [null, [["speech", 49.4], ["music", 23.41], ["hum", 6.41]], null, null, null, null, [["music", 49.29], ["smash, crash", 10.27], ["whack, thwack", 7.03]], null, null, null, null, [["music", 63.67], ["hum", 11.25], ["mains hum", 3.27]], [["speech", 35.04], ["arrow", 7.41], ["groan", 7.12]], null, null, null, null, null], "duration": [1.38, 7.99, 0.06, 0.3, 0.6, -0.02, 12.12, 0.34, 2.97, 1.59, -0.09, 15.27, 10.07, 1.88, 1.52, -0.05, 2.03, 0.71]} \ No newline at end of file diff --git a/annotations_1/SM2LxRKqYR8_filtered.json b/annotations_1/SM2LxRKqYR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39265c7b6db9154eda5acecbff729a7eccdcc06c --- /dev/null +++ b/annotations_1/SM2LxRKqYR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 28.75], [32.0, 50.75], [51.0, 57.01], [58.0, 59.8], [63.0, 65.04], [66.0, 67.19], [70.0, 73.87], [75.0, 75.32], [79.0, 80.33], [81.0, 82.24], [86.0, 85.87], [117.0, 122.0], [122.0, 124.5], [125.0, 128.36], [131.0, 137.49], [140.0, 149.84], [150.0, 151.04], [152.0, 157.81], [159.0, 163.85], [165.0, 168.08], [171.0, 173.84], [175.0, 178.01], [178.0, 178.26], [178.0, 178.33], [179.0, 178.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.86, 99.21, 99.99, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [20.75, 18.75, 6.01, 1.8, 2.04, 1.19, 3.87, 0.32, 1.33, 1.24, -0.13, 5.0, 2.5, 3.36, 6.49, 9.84, 1.04, 5.81, 4.85, 3.08, 2.84, 3.01, 0.26, 0.33, -0.42]} \ No newline at end of file diff --git a/annotations_1/SMaYCguBHAA_filtered.json b/annotations_1/SMaYCguBHAA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ba38b0ac9a17d5ad26805cd9cbe7a110a757e00 --- /dev/null +++ b/annotations_1/SMaYCguBHAA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.36], [6.0, 6.76], [8.0, 8.95], [18.0, 19.58], [28.0, 28.12], [28.0, 29.59], [31.0, 35.87], [37.0, 37.49], [39.0, 39.14], [40.0, 40.47], [43.0, 42.7], [44.0, 45.3], [49.0, 51.11], [52.0, 52.3], [64.0, 64.27], [79.0, 79.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 0.0, 0.0, 61.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.76, 0.95, 1.58, 0.12, 1.59, 4.87, 0.49, 0.14, 0.47, -0.3, 1.3, 2.11, 0.3, 0.27, 0.2]} \ No newline at end of file diff --git a/annotations_1/SN8buDY-7LM_filtered.json b/annotations_1/SN8buDY-7LM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b470bc469948123c8cc11f5e154e8e90e8e2e02 --- /dev/null +++ b/annotations_1/SN8buDY-7LM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.28], [15.0, 18.28], [19.0, 22.38], [23.0, 26.38], [27.0, 34.82], [37.0, 40.54], [42.0, 43.78], [45.0, 51.49], [54.0, 58.43], [59.0, 67.74], [71.0, 102.46], [105.0, 113.95], [115.0, 120.83], [121.0, 122.13], [123.0, 135.23], [136.0, 137.13], [140.0, 144.68], [146.0, 149.18], [150.0, 151.02], [155.0, 160.64], [161.0, 165.43], [167.0, 170.26], [172.0, 173.2], [174.0, 175.85], [176.0, 181.6], [185.0, 186.14], [189.0, 189.68], [191.0, 194.12], [195.0, 195.42], [196.0, 196.64], [197.0, 197.38], [198.0, 199.57], [201.0, 201.85], [202.0, 202.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [65.79, 61.37, 61.67, 61.08, 76.37, 93.29, 0.0, 64.75, 67.38, 62.89, 0.0, 65.32, 79.24, 0.0, 64.18, 0.0, 95.51, 91.3, 0.0, 64.29, 40.48, 89.19, 0.0, 0.0, 78.72, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 27.8], ["ping", 5.75], ["synthesizer", 4.44]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.28, 3.28, 3.38, 3.38, 7.82, 3.54, 1.78, 6.49, 4.43, 8.74, 31.46, 8.95, 5.83, 1.13, 12.23, 1.13, 4.68, 3.18, 1.02, 5.64, 4.43, 3.26, 1.2, 1.85, 5.6, 1.14, 0.68, 3.12, 0.42, 0.64, 0.38, 1.57, 0.85, 0.41]} \ No newline at end of file diff --git a/annotations_1/SOR9UOc-alI_filtered.json b/annotations_1/SOR9UOc-alI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de860f837a0434405a3ac03c937efcc9337a0e10 --- /dev/null +++ b/annotations_1/SOR9UOc-alI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 34.62], [35.0, 37.1], [38.0, 39.53], [40.0, 42.58], [44.0, 44.61], [46.0, 46.41], [48.0, 47.78], [54.0, 54.5], [57.0, 58.18], [59.0, 59.21], [61.0, 64.84], [67.0, 68.93], [70.0, 71.29], [73.0, 77.8], [79.0, 79.51], [80.0, 85.51], [88.0, 92.28], [93.0, 94.0], [94.0, 101.21], [103.0, 104.48], [114.0, 114.72], [115.0, 116.14], [121.0, 121.22], [124.0, 124.24], [125.0, 126.4], [128.0, 130.59], [136.0, 140.34], [141.0, 143.61], [147.0, 151.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.89, 78.21, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 0.0, 59.77, 0.0, 96.77, 97.64, 0.0, 35.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 100.0, 99.84, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 79.33], ["breaking", 11.86], ["inside, small room", 2.11]], null, null, null, null, null, null, null, null, null, null], "duration": [8.62, 2.1, 1.53, 2.58, 0.61, 0.41, -0.22, 0.5, 1.18, 0.21, 3.84, 1.93, 1.29, 4.8, 0.51, 5.51, 4.28, 1.0, 7.21, 1.48, 0.72, 1.14, 0.22, 0.24, 1.4, 2.59, 4.34, 2.61, 4.7]} \ No newline at end of file diff --git a/annotations_1/SOwJJPZKIys_filtered.json b/annotations_1/SOwJJPZKIys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e8e7413f21510c8711ff7296609f4b846e6b21e --- /dev/null +++ b/annotations_1/SOwJJPZKIys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.55], [28.0, 29.15], [36.0, 36.0], [37.0, 37.64], [40.0, 41.22], [44.0, 46.26], [53.0, 52.93], [65.0, 65.6], [70.0, 69.84], [73.0, 74.58], [92.0, 93.82], [96.0, 96.18], [101.0, 136.29], [139.0, 157.76], [164.0, 166.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.07, 31.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 72.05], ["didgeridoo", 3.67], ["throbbing", 2.47]], [["roar", 19.77], ["whale vocalization", 12.57], ["animal", 9.09]]], "duration": [0.55, 1.15, 0.0, 0.64, 1.22, 2.26, -0.07, 0.6, -0.16, 1.58, 1.82, 0.18, 35.29, 18.76, 2.55]} \ No newline at end of file diff --git a/annotations_1/SPMpDCxhKGU_filtered.json b/annotations_1/SPMpDCxhKGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1c321c09d53763d5c5423ed75e09d3f3579f676 --- /dev/null +++ b/annotations_1/SPMpDCxhKGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.97], [11.0, 11.53], [13.0, 12.99], [15.0, 15.4], [17.0, 20.51], [22.0, 24.75], [36.0, 37.94], [38.0, 39.5], [40.0, 41.5], [50.0, 52.34], [53.0, 53.15], [53.0, 53.4], [58.0, 62.97], [66.0, 67.36], [71.0, 86.04], [89.0, 92.75], [93.0, 102.14], [103.0, 108.13], [110.0, 119.84], [121.0, 127.4], [128.0, 129.02], [130.0, 131.31], [132.0, 134.42], [140.0, 167.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.99, 99.8, 0.0, 0.0, 0.0, 55.31, 0.0, 0.0, 32.05, 0.0, 35.96, 68.15, 31.67, 76.37, 32.87, 31.91, 0.0, 0.0, 75.72, 33.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["groan", 25.9], ["wail, moan", 12.41], ["cattle, bovinae", 8.82]], null, [["speech", 21.98], ["cattle, bovinae", 11.83], ["livestock, farm animals, working animals", 11.62]], null, [["groan", 29.72], ["music", 18.56], ["speech", 17.67]], null, [["music", 21.35], ["speech", 12.7], ["animal", 4.96]], [["boing", 27.47], ["whack, thwack", 21.76], ["music", 18.0]], null, null, null, [["music", 55.43], ["throbbing", 6.66], ["electronic music", 5.06]]], "duration": [0.97, 0.53, -0.01, 0.4, 3.51, 2.75, 1.94, 1.5, 1.5, 2.34, 0.15, 0.4, 4.97, 1.36, 15.04, 3.75, 9.14, 5.13, 9.84, 6.4, 1.02, 1.31, 2.42, 27.53]} \ No newline at end of file diff --git a/annotations_1/SQH8if7dbqw_filtered.json b/annotations_1/SQH8if7dbqw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ef272b7ba880168a96b99bd98f92de257d96d05 --- /dev/null +++ b/annotations_1/SQH8if7dbqw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.47], [8.0, 8.28], [9.0, 11.42], [13.0, 13.2], [17.0, 27.7], [34.0, 36.1], [44.0, 50.82], [52.0, 62.45], [64.0, 64.59], [69.0, 101.26], [110.0, 111.33], [112.0, 113.1], [114.0, 114.4], [116.0, 121.58], [124.0, 125.52]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 32.98, 0.0, 28.86, 29.21, 32.0, 29.49, 0.0, 0.0, 0.0, 0.0, 0.0, 44.87, 0.0], "audiomae_on_audioset": [null, null, [["music", 59.84], ["breaking", 17.25], ["glass", 5.41]], null, [["music", 38.1], ["speech", 36.51], ["didgeridoo", 3.65]], [["music", 54.03], ["throbbing", 7.5], ["hum", 3.83]], [["music", 60.57], ["didgeridoo", 9.38], ["hum", 6.3]], [["throbbing", 25.48], ["hum", 16.55], ["music", 12.39]], null, null, null, null, null, [["music", 27.55], ["speech", 14.64], ["hum", 5.58]], null], "duration": [0.47, 0.28, 2.42, 0.2, 10.7, 2.1, 6.82, 10.45, 0.59, 32.26, 1.33, 1.1, 0.4, 5.58, 1.52]} \ No newline at end of file diff --git a/annotations_1/SRy397r355A_filtered.json b/annotations_1/SRy397r355A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ec7c3cde0cfb878063579df4b5e5f3d1252334a --- /dev/null +++ b/annotations_1/SRy397r355A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.93], [6.0, 7.59], [8.0, 9.04], [10.0, 11.2], [12.0, 15.03], [19.0, 22.65], [24.0, 26.11], [30.0, 30.72], [32.0, 33.74], [34.0, 35.51], [37.0, 38.04], [39.0, 40.22], [41.0, 42.23], [43.0, 43.8], [45.0, 47.48], [48.0, 48.66], [49.0, 50.11], [52.0, 52.08], [53.0, 53.13], [56.0, 56.24], [57.0, 57.28], [66.0, 66.12], [67.0, 67.95], [70.0, 80.16], [82.0, 82.86], [88.0, 88.87], [90.0, 90.48], [93.0, 93.7], [100.0, 101.36], [102.0, 106.02], [109.0, 109.31], [117.0, 117.44], [119.0, 119.06], [122.0, 122.4], [129.0, 129.3], [130.0, 130.22], [132.0, 132.81], [137.0, 137.59], [138.0, 143.78], [144.0, 148.53], [150.0, 150.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 90.08, 98.73, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.87, 0.0, 0.0, 0.0, 0.0, 0.0, 53.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 98.01, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.36], ["boing", 13.36], ["speech", 3.52]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.93, 1.59, 1.04, 1.2, 3.03, 3.65, 2.11, 0.72, 1.74, 1.51, 1.04, 1.22, 1.23, 0.8, 2.48, 0.66, 1.11, 0.08, 0.13, 0.24, 0.28, 0.12, 0.95, 10.16, 0.86, 0.87, 0.48, 0.7, 1.36, 4.02, 0.31, 0.44, 0.06, 0.4, 0.3, 0.22, 0.81, 0.59, 5.78, 4.53, 0.69]} \ No newline at end of file diff --git a/annotations_1/SSQJIBb_9gw_filtered.json b/annotations_1/SSQJIBb_9gw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2a63c4e5ec4256e4e4f3daa0a39aa85ee7590fe --- /dev/null +++ b/annotations_1/SSQJIBb_9gw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.22], [19.0, 19.92], [22.0, 22.76], [23.0, 26.37], [27.0, 28.02], [29.0, 29.35], [29.0, 32.48], [34.0, 43.36], [46.0, 46.21], [48.0, 48.1], [49.0, 54.06], [54.0, 59.04], [62.0, 62.31], [63.0, 66.72], [70.0, 70.65], [74.0, 74.8], [75.0, 75.61], [76.0, 78.31], [79.0, 79.46], [80.0, 80.33], [87.0, 87.81], [88.0, 88.48], [93.0, 93.8], [95.0, 97.31], [98.0, 98.29], [99.0, 101.24], [102.0, 104.8], [108.0, 110.03], [110.0, 111.65], [114.0, 114.89]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, false, false], "silence_prob": [90.25, 0.0, 0.0, 39.49, 0.0, 0.0, 32.66, 31.52, 0.0, 0.0, 30.52, 29.55, 0.0, 29.84, 0.0, 0.0, 0.0, 30.68, 0.0, 0.0, 0.0, 0.0, 0.0, 31.89, 0.0, 34.9, 31.11, 31.74, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 43.32], ["noise", 18.84], ["theremin", 5.02]], null, null, [["livestock, farm animals, working animals", 59.52], ["cattle, bovinae", 16.5], ["moo", 15.34]], [["music", 45.21], ["screaming", 9.69], ["speech", 7.55]], null, null, [["music", 51.92], ["cattle, bovinae", 11.24], ["speech", 7.46]], [["music", 20.95], ["speech", 12.96], ["moo", 10.8]], null, [["speech", 60.79], ["music", 6.62], ["whale vocalization", 5.4]], null, null, null, [["music", 44.96], ["speech", 33.99], ["theremin", 7.18]], null, null, null, null, null, [["music", 48.23], ["speech", 7.42], ["crying, sobbing", 4.57]], null, [["speech", 33.21], ["baby laughter", 16.25], ["baby cry, infant cry", 11.36]], [["music", 31.7], ["wail, moan", 25.24], ["speech", 9.47]], [["groan", 15.29], ["crying, sobbing", 12.25], ["whimper", 5.66]], null, null], "duration": [2.22, 0.92, 0.76, 3.37, 1.02, 0.35, 3.48, 9.36, 0.21, 0.1, 5.06, 5.04, 0.31, 3.72, 0.65, 0.8, 0.61, 2.31, 0.46, 0.33, 0.81, 0.48, 0.8, 2.31, 0.29, 2.24, 2.8, 2.03, 1.65, 0.89]} \ No newline at end of file diff --git a/annotations_1/SSY6_T2oAow_filtered.json b/annotations_1/SSY6_T2oAow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce0fe891a728917bd526b9fe6ae887fbb103c31a --- /dev/null +++ b/annotations_1/SSY6_T2oAow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 60.49], [61.0, 61.74], [62.0, 62.55], [64.0, 65.62], [67.0, 101.38], [115.0, 116.77]], "keep_status": [true, false, false, false, false, false], "silence_prob": [35.4, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 47.8], ["whip", 6.65], ["smash, crash", 5.99]], null, null, null, null, null], "duration": [20.49, 0.74, 0.55, 1.62, 34.38, 1.77]} \ No newline at end of file diff --git a/annotations_1/STfoetR9Su8_filtered.json b/annotations_1/STfoetR9Su8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0ddf0aed35d0e8a83197ae818c8f78f46baf435 --- /dev/null +++ b/annotations_1/STfoetR9Su8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.96], [18.0, 59.64], [61.0, 61.23], [62.0, 83.67], [84.0, 84.86], [94.0, 96.25]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 29.84, 0.0, 30.56], "audiomae_on_audioset": [null, null, null, [["music", 82.15], ["cacophony", 10.58], ["throbbing", 0.84]], null, [["music", 38.81], ["throbbing", 15.78], ["hum", 7.45]]], "duration": [1.96, 41.64, 0.23, 21.67, 0.86, 2.25]} \ No newline at end of file diff --git a/annotations_1/STh780YGgIo_filtered.json b/annotations_1/STh780YGgIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6ec572ba6fa6c0021e3a74a1c4159bad9c1d049 --- /dev/null +++ b/annotations_1/STh780YGgIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 34.47], [37.0, 39.68], [40.0, 41.79], [43.0, 45.32], [47.0, 63.8], [67.0, 81.04], [82.0, 83.62], [84.0, 84.91], [86.0, 86.22], [90.0, 93.55], [94.0, 97.97], [99.0, 101.95], [103.0, 106.37], [107.0, 119.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 62.27, 0.0, 80.11, 33.64, 57.01, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 79.07, 99.78], "audiomae_on_audioset": [null, null, null, null, [["music", 75.51], ["ambient music", 4.67], ["tick-tock", 3.06]], null, null, null, null, null, null, null, null, null], "duration": [1.47, 2.68, 1.79, 2.32, 16.8, 14.04, 1.62, 0.91, 0.22, 3.55, 3.97, 2.95, 3.37, 12.4]} \ No newline at end of file diff --git a/annotations_1/STl0s9g_FwA_filtered.json b/annotations_1/STl0s9g_FwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2fdd34b9692b3660d64f629cce019c08a456a849 --- /dev/null +++ b/annotations_1/STl0s9g_FwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.13], [5.0, 11.7], [14.0, 14.44], [16.0, 16.87], [30.0, 30.37], [32.0, 32.39], [38.0, 38.16], [39.0, 39.65], [41.0, 41.07], [43.0, 43.77], [48.0, 49.67], [62.0, 62.36], [73.0, 73.79], [75.0, 75.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 62.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, 6.7, 0.44, 0.87, 0.37, 0.39, 0.16, 0.65, 0.07, 0.77, 1.67, 0.36, 0.79, 0.59]} \ No newline at end of file diff --git a/annotations_1/STqJ_Up4iFg_filtered.json b/annotations_1/STqJ_Up4iFg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b06309aa94863e15327ce01625076f89638e9abd --- /dev/null +++ b/annotations_1/STqJ_Up4iFg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.85], [9.0, 10.17], [14.0, 19.36], [22.0, 24.56], [26.0, 26.49], [29.0, 30.33], [33.0, 33.93], [35.0, 36.02], [41.0, 44.14], [55.0, 55.51], [59.0, 62.46], [67.0, 80.2], [83.0, 83.15], [84.0, 85.75], [93.0, 94.04], [97.0, 99.98], [106.0, 106.37], [113.0, 112.94], [113.0, 135.51], [137.0, 140.04], [141.0, 141.44], [143.0, 149.13], [151.0, 152.04], [152.0, 157.08], [160.0, 160.25]], "keep_status": [false, false, true, true, false, false, false, false, true, false, true, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 48.14, 43.79, 0.0, 0.0, 0.0, 0.0, 32.12, 0.0, 31.4, 32.65, 0.0, 0.0, 0.0, 33.28, 0.0, 0.0, 40.17, 40.97, 0.0, 37.84, 0.0, 80.46, 0.0], "audiomae_on_audioset": [null, null, [["whale vocalization", 38.2], ["music", 20.47], ["theremin", 7.73]], [["music", 20.03], ["hum", 7.54], ["mains hum", 5.41]], null, null, null, null, [["music", 60.7], ["smash, crash", 4.17], ["musical instrument", 2.9]], null, [["music", 39.5], ["boing", 10.67], ["fly, housefly", 6.41]], [["music", 85.52], ["throbbing", 4.9], ["hum", 1.76]], null, null, null, [["music", 43.98], ["fly, housefly", 7.05], ["mosquito", 3.76]], null, null, [["speech", 28.46], ["whack, thwack", 25.1], ["boing", 14.17]], [["speech", 56.68], ["thunk", 11.17], ["breaking", 3.5]], null, [["speech", 37.11], ["music", 35.98], ["whack, thwack", 8.08]], null, null, null], "duration": [0.85, 1.17, 5.36, 2.56, 0.49, 1.33, 0.93, 1.02, 3.14, 0.51, 3.46, 13.2, 0.15, 1.75, 1.04, 2.98, 0.37, -0.06, 22.51, 3.04, 0.44, 6.13, 1.04, 5.08, 0.25]} \ No newline at end of file diff --git a/annotations_1/SUKdlcCiE60_filtered.json b/annotations_1/SUKdlcCiE60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..548164e661347fb0b771d9fa016add4e52e96abf --- /dev/null +++ b/annotations_1/SUKdlcCiE60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [6.0, 7.64], [9.0, 9.56], [12.0, 13.49], [15.0, 15.55], [18.0, 20.31], [23.0, 23.87], [26.0, 26.18], [27.0, 27.28], [31.0, 31.94], [33.0, 32.97], [33.0, 33.12], [33.0, 35.01], [37.0, 38.15], [42.0, 43.07], [47.0, 48.66], [51.0, 52.2], [53.0, 53.57], [65.0, 65.72], [67.0, 70.38], [72.0, 72.3], [77.0, 77.55], [81.0, 81.06], [84.0, 85.43], [92.0, 93.18], [98.0, 99.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.64, 0.56, 1.49, 0.55, 2.31, 0.87, 0.18, 0.28, 0.94, -0.03, 0.12, 2.01, 1.15, 1.07, 1.66, 1.2, 0.57, 0.72, 3.38, 0.3, 0.55, 0.06, 1.43, 1.18, 1.22]} \ No newline at end of file diff --git a/annotations_1/SUfo49TsWOQ_filtered.json b/annotations_1/SUfo49TsWOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6886bbf6cb8d1bbc0a3548ae44eeafadc7bc4611 --- /dev/null +++ b/annotations_1/SUfo49TsWOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.79], [6.0, 6.17], [7.0, 8.13], [9.0, 9.49], [12.0, 19.89], [23.0, 23.65], [24.0, 27.99], [29.0, 30.23], [36.0, 36.02], [37.0, 37.72], [39.0, 39.38], [40.0, 40.34], [41.0, 40.88], [44.0, 43.73], [45.0, 47.33], [48.0, 49.25], [52.0, 53.37], [55.0, 55.71], [61.0, 62.06], [67.0, 68.2], [70.0, 70.65], [72.0, 74.12], [79.0, 79.47], [81.0, 82.31], [83.0, 84.4], [85.0, 86.12], [87.0, 89.65], [92.0, 94.36], [96.0, 97.19], [99.0, 100.79], [106.0, 107.03], [108.0, 109.88], [111.0, 114.03], [118.0, 119.23], [121.0, 121.59], [125.0, 129.69], [131.0, 131.99], [134.0, 134.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 99.26, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 83.16, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 0.17, 1.13, 0.49, 7.89, 0.65, 3.99, 1.23, 0.02, 0.72, 0.38, 0.34, -0.12, -0.27, 2.33, 1.25, 1.37, 0.71, 1.06, 1.2, 0.65, 2.12, 0.47, 1.31, 1.4, 1.12, 2.65, 2.36, 1.19, 1.79, 1.03, 1.88, 3.03, 1.23, 0.59, 4.69, 0.99, 0.96]} \ No newline at end of file diff --git a/annotations_1/SUr7fu-LXj4_filtered.json b/annotations_1/SUr7fu-LXj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c6a04761451deaa4e8f44b4bcdf5cb8f939b7e9 --- /dev/null +++ b/annotations_1/SUr7fu-LXj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 1.0], [1.0, 1.11], [1.0, 1.49], [2.0, 2.25], [9.0, 26.49], [39.0, 44.02], [52.0, 55.39], [68.0, 71.15], [72.0, 71.85], [78.0, 80.59], [81.0, 81.82], [84.0, 84.48], [90.0, 95.39], [105.0, 179.95], [188.0, 188.01], [188.0, 188.94], [189.0, 191.56], [193.0, 202.07], [203.0, 204.53]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.42, 30.53, 35.15, 31.48, 0.0, 32.49, 0.0, 0.0, 32.54, 0.0, 0.0, 0.0, 31.23, 32.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 77.27], ["didgeridoo", 5.37], ["speech", 3.01]], [["music", 41.07], ["speech", 7.51], ["crowd", 3.2]], [["music", 71.77], ["brass instrument", 6.7], ["trombone", 6.56]], [["music", 46.78], ["didgeridoo", 19.83], ["musical instrument", 4.94]], null, [["music", 66.75], ["didgeridoo", 13.28], ["musical instrument", 2.54]], null, null, [["music", 58.29], ["didgeridoo", 22.98], ["musical instrument", 5.19]], null, null, null, [["music", 85.08], ["didgeridoo", 1.09], ["speech", 0.96]], [["music", 38.37], ["chime", 14.07], ["cacophony", 6.95]], null], "duration": [0.5, 0.0, 0.11, 0.49, 0.25, 17.49, 5.02, 3.39, 3.15, -0.15, 2.59, 0.82, 0.48, 5.39, 74.95, 0.01, 0.94, 2.56, 9.07, 1.53]} \ No newline at end of file diff --git a/annotations_1/SV8jbzudYJ8_filtered.json b/annotations_1/SV8jbzudYJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bbe31ac99547624ff6b01599a2bd7f20fff8c8f --- /dev/null +++ b/annotations_1/SV8jbzudYJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.02], [3.0, 7.06], [9.0, 11.37], [15.0, 16.92], [18.0, 20.51], [24.0, 26.64], [30.0, 32.46], [37.0, 40.44], [42.0, 45.39], [46.0, 51.24], [51.0, 55.22], [56.0, 59.44], [61.0, 71.86], [74.0, 78.43], [82.0, 83.62], [85.0, 94.02], [95.0, 99.13], [101.0, 105.65], [108.0, 112.08], [113.0, 114.42], [116.0, 118.94], [120.0, 124.01], [125.0, 127.63], [129.0, 131.45], [132.0, 135.03], [136.0, 141.74], [142.0, 146.55], [147.0, 148.24], [150.0, 153.05], [158.0, 159.85], [163.0, 163.43], [170.0, 171.58], [182.0, 187.44], [190.0, 191.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.39, 100.0, 0.0, 83.7, 99.26, 99.85, 100.0, 45.95, 62.17, 57.32, 99.05, 53.65, 55.96, 0.0, 58.3, 70.72, 99.98, 100.0, 0.0, 66.39, 100.0, 100.0, 96.54, 45.88, 65.79, 42.39, 0.0, 88.83, 0.0, 0.0, 0.0, 85.72, 0.0], "audiomae_on_audioset": [null, [["sidetone", 69.37], ["speech", 9.23], ["chirp tone", 3.44]], null, null, null, null, null, null, [["speech", 49.79], ["sine wave", 13.23], ["chirp tone", 12.01]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.71], ["hum", 9.62], ["sidetone", 5.59]], null, [["sidetone", 66.42], ["speech", 12.16], ["music", 7.17]], null, null, null, null, null, null, null], "duration": [1.02, 4.06, 2.37, 1.92, 2.51, 2.64, 2.46, 3.44, 3.39, 5.24, 4.22, 3.44, 10.86, 4.43, 1.62, 9.02, 4.13, 4.65, 4.08, 1.42, 2.94, 4.01, 2.63, 2.45, 3.03, 5.74, 4.55, 1.24, 3.05, 1.85, 0.43, 1.58, 5.44, 1.74]} \ No newline at end of file diff --git a/annotations_1/SVQDD7TK-qA_filtered.json b/annotations_1/SVQDD7TK-qA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f412523f856c167669ed5a9046a93b76111382eb --- /dev/null +++ b/annotations_1/SVQDD7TK-qA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.1], [5.0, 13.86], [15.0, 15.55], [17.0, 18.25], [20.0, 25.14], [25.0, 25.32], [25.0, 32.16], [33.0, 36.04], [41.0, 43.17], [46.0, 57.2], [62.0, 62.36], [64.0, 64.3], [75.0, 80.92], [83.0, 85.02], [91.0, 100.26], [105.0, 109.43], [112.0, 112.5], [113.0, 114.44], [115.0, 114.79], [118.0, 120.01], [121.0, 123.11], [129.0, 130.62], [133.0, 154.04], [155.0, 156.51], [158.0, 173.03]], "keep_status": [false, true, false, false, true, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 31.63, 0.0, 0.0, 30.53, 0.0, 31.5, 38.56, 36.59, 50.97, 0.0, 0.0, 41.76, 98.44, 88.1, 69.47, 0.0, 0.0, 0.0, 84.25, 37.16, 0.0, 32.96, 0.0, 31.85], "audiomae_on_audioset": [null, [["speech", 38.76], ["noise", 11.37], ["scratching (performance technique)", 10.43]], null, null, [["speech", 27.38], ["whack, thwack", 13.76], ["animal", 11.23]], null, [["speech", 43.75], ["breaking", 8.46], ["whack, thwack", 7.16]], [["speech", 36.96], ["fart", 17.7], ["animal", 6.63]], [["speech", 37.59], ["music", 12.86], ["throbbing", 4.35]], null, null, null, [["cattle, bovinae", 37.91], ["livestock, farm animals, working animals", 29.3], ["moo", 22.16]], null, null, null, null, null, null, null, [["speech", 42.25], ["sidetone", 12.69], ["eruption", 7.1]], null, [["speech", 32.38], ["music", 18.25], ["hum", 8.77]], null, [["breaking", 35.19], ["whack, thwack", 21.33], ["music", 15.36]]], "duration": [0.1, 8.86, 0.55, 1.25, 5.14, 0.32, 7.16, 3.04, 2.17, 11.2, 0.36, 0.3, 5.92, 2.02, 9.26, 4.43, 0.5, 1.44, -0.21, 2.01, 2.11, 1.62, 21.04, 1.51, 15.03]} \ No newline at end of file diff --git a/annotations_1/SVSzVDnvkHw_filtered.json b/annotations_1/SVSzVDnvkHw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..003524951293d714098ea36edfdb0bc4105eeb93 --- /dev/null +++ b/annotations_1/SVSzVDnvkHw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.03], [21.0, 21.29], [22.0, 22.5], [24.0, 27.53], [30.0, 37.03], [38.0, 38.55], [46.0, 46.58], [47.0, 47.76], [58.0, 58.94], [60.0, 60.29], [61.0, 62.41], [67.0, 67.44], [69.0, 69.23], [70.0, 71.59], [79.0, 79.3], [81.0, 81.92], [90.0, 92.42], [93.0, 93.51], [99.0, 99.37], [100.0, 101.87], [116.0, 117.21], [124.0, 124.55], [125.0, 131.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.22, 34.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.79, 0.0, 0.0, 0.0, 0.0, 0.0, 32.31], "audiomae_on_audioset": [null, null, null, [["gong", 62.34], ["speech", 14.06], ["music", 8.39]], [["music", 40.56], ["speech", 27.54], ["synthesizer", 6.16]], null, null, null, null, null, null, null, null, null, null, null, [["shofar", 26.05], ["sine wave", 14.46], ["wind instrument, woodwind instrument", 9.74]], null, null, null, null, null, [["music", 35.25], ["speech", 31.45], ["theremin", 3.76]]], "duration": [1.03, 0.29, 0.5, 3.53, 7.03, 0.55, 0.58, 0.76, 0.94, 0.29, 1.41, 0.44, 0.23, 1.59, 0.3, 0.92, 2.42, 0.51, 0.37, 1.87, 1.21, 0.55, 6.31]} \ No newline at end of file diff --git a/annotations_1/SVTxvLaac6A_filtered.json b/annotations_1/SVTxvLaac6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26188c8bec6d6b7041d3aaf8ff09f93936ac1dde --- /dev/null +++ b/annotations_1/SVTxvLaac6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 14.55], [15.0, 31.28], [32.0, 36.61], [37.0, 44.96], [46.0, 57.3], [58.0, 61.94], [64.0, 64.61], [68.0, 70.58], [72.0, 74.16], [80.0, 81.01], [82.0, 83.78], [89.0, 92.96], [98.0, 97.95], [98.0, 99.81], [103.0, 129.56], [132.0, 136.11], [137.0, 137.2], [144.0, 147.07], [149.0, 150.01]], "keep_status": [false, true, false, false, true, false, false, true, false, false, false, true, false, false, true, true, false, true, false], "silence_prob": [65.32, 35.28, 60.42, 46.09, 39.25, 55.39, 0.0, 30.43, 46.94, 0.0, 0.0, 32.73, 0.0, 0.0, 31.19, 31.15, 0.0, 29.34, 0.0], "audiomae_on_audioset": [null, [["music", 44.1], ["throbbing", 11.76], ["hum", 7.32]], null, [["music", 33.74], ["speech", 29.81], ["thunk", 15.06]], [["music", 42.97], ["speech", 8.02], ["singing bowl", 7.8]], null, null, [["speech", 56.62], ["music", 5.89], ["static", 4.79]], [["music", 63.24], ["guitar", 4.02], ["inside, small room", 3.66]], null, null, [["boing", 19.3], ["speech", 17.79], ["music", 17.31]], null, null, [["speech", 30.36], ["livestock, farm animals, working animals", 9.26], ["explosion", 8.97]], [["fly, housefly", 29.05], ["insect", 15.83], ["mosquito", 15.4]], null, [["didgeridoo", 34.38], ["speech", 21.29], ["music", 12.46]], null], "duration": [11.55, 16.28, 4.61, 7.96, 11.3, 3.94, 0.61, 2.58, 2.16, 1.01, 1.78, 3.96, -0.05, 1.81, 26.56, 4.11, 0.2, 3.07, 1.01]} \ No newline at end of file diff --git a/annotations_1/SV_eLd8wm70_filtered.json b/annotations_1/SV_eLd8wm70_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcc02b160f2c2deaf0dfc34d3ec9cf1787731d1f --- /dev/null +++ b/annotations_1/SV_eLd8wm70_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.23], [5.0, 7.96], [9.0, 10.61], [13.0, 14.77], [19.0, 24.34], [26.0, 26.05], [27.0, 27.78], [31.0, 32.53], [34.0, 35.58], [36.0, 38.37], [39.0, 39.02], [42.0, 42.6], [44.0, 44.86], [49.0, 49.59], [57.0, 56.98], [57.0, 58.72], [60.0, 61.03], [65.0, 65.5], [67.0, 84.86], [86.0, 86.63], [88.0, 102.84], [104.0, 106.3], [106.0, 106.47], [107.0, 110.47], [112.0, 113.98], [117.0, 118.0], [122.0, 122.35], [124.0, 124.48], [126.0, 126.76]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 39.55, 0.0, 0.0, 31.24, 0.0, 0.0, 0.0, 0.0, 31.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.26, 0.0, 28.91, 66.15, 0.0, 43.2, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 38.81], ["music", 7.09], ["sidetone", 4.93]], null, null, [["speech", 54.98], ["music", 24.38], ["electronic music", 3.68]], null, null, null, null, [["speech", 33.22], ["music", 33.12], ["thunk", 3.47]], null, null, null, null, null, null, null, null, [["music", 83.54], ["throbbing", 4.27], ["hum", 1.44]], null, [["speech", 31.82], ["music", 31.34], ["electric shaver, electric razor", 5.88]], null, null, [["thunk", 28.13], ["music", 16.09], ["hum", 7.73]], null, null, null, null, null], "duration": [1.23, 2.96, 1.61, 1.77, 5.34, 0.05, 0.78, 1.53, 1.58, 2.37, 0.02, 0.6, 0.86, 0.59, -0.02, 1.72, 1.03, 0.5, 17.86, 0.63, 14.84, 2.3, 0.47, 3.47, 1.98, 1.0, 0.35, 0.48, 0.76]} \ No newline at end of file diff --git a/annotations_1/SW-1sk_U8vU_filtered.json b/annotations_1/SW-1sk_U8vU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..577c1366b7852fcc41d5eb054677d6c6a810ef1f --- /dev/null +++ b/annotations_1/SW-1sk_U8vU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [6.0, 8.97], [13.0, 13.24], [16.0, 18.39], [24.0, 25.3], [30.0, 43.75], [45.0, 49.55], [52.0, 55.53], [57.0, 57.96], [63.0, 65.6], [71.0, 72.98], [76.0, 77.9], [81.0, 85.9], [94.0, 96.62], [99.0, 99.39], [100.0, 101.31], [103.0, 102.86], [109.0, 109.73], [112.0, 112.36], [114.0, 114.56], [115.0, 116.26], [118.0, 122.69], [123.0, 124.56], [126.0, 126.59], [137.0, 137.73], [150.0, 150.87], [153.0, 154.79], [160.0, 160.3], [166.0, 167.26], [170.0, 171.76], [178.0, 180.57], [182.0, 183.42], [192.0, 193.73], [195.0, 197.02], [198.0, 203.1]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 89.01, 0.0, 49.4, 0.0, 40.5, 59.15, 56.78, 0.0, 90.6, 0.0, 0.0, 81.0, 98.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 0.0, 0.0, 37.71, 36.66], "audiomae_on_audioset": [null, null, null, [["music", 34.33], ["speech", 13.19], ["singing bowl", 6.52]], null, [["ambient music", 27.63], ["music", 22.27], ["singing bowl", 11.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.2], ["music", 15.39], ["hum", 4.74]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 20.82], ["music", 18.64], ["hum", 12.12]], [["music", 23.3], ["hum", 16.28], ["throbbing", 10.84]]], "duration": [0.7, 2.97, 0.24, 2.39, 1.3, 13.75, 4.55, 3.53, 0.96, 2.6, 1.98, 1.9, 4.9, 2.62, 0.39, 1.31, -0.14, 0.73, 0.36, 0.56, 1.26, 4.69, 1.56, 0.59, 0.73, 0.87, 1.79, 0.3, 1.26, 1.76, 2.57, 1.42, 1.73, 2.02, 5.1]} \ No newline at end of file diff --git a/annotations_1/SW5_v_8r9VA_filtered.json b/annotations_1/SW5_v_8r9VA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60fc78cc5253e46b3b57e3c376a26baf89fb215f --- /dev/null +++ b/annotations_1/SW5_v_8r9VA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.77], [9.0, 9.49], [10.0, 9.63], [17.0, 19.2], [21.0, 62.16], [62.0, 69.48], [71.0, 71.44], [73.0, 80.67], [86.0, 93.66], [95.0, 96.9]], "keep_status": [false, false, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.63, 0.0, 35.57, 0.0, 30.37, 31.33, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 29.79], ["cattle, bovinae", 13.12], ["moo", 12.52]], null, [["music", 37.67], ["speech", 33.36], ["breaking", 7.63]], null, [["music", 37.55], ["throbbing", 26.78], ["speech", 15.35]], [["ding", 21.22], ["clang", 19.07], ["music", 7.39]], null], "duration": [-0.23, 0.49, -0.37, 2.2, 41.16, 7.48, 0.44, 7.67, 7.66, 1.9]} \ No newline at end of file diff --git a/annotations_1/SWKDbfvyZMU_filtered.json b/annotations_1/SWKDbfvyZMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..182b9ae5f132020472bc7cee8f0bda99d2b9e6bd --- /dev/null +++ b/annotations_1/SWKDbfvyZMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.19], [9.0, 11.37], [13.0, 13.73], [14.0, 19.03], [24.0, 24.16], [25.0, 27.92], [30.0, 33.17], [34.0, 42.4], [43.0, 47.63], [50.0, 51.09], [56.0, 56.42], [67.0, 68.23], [69.0, 70.46], [72.0, 72.96], [74.0, 76.86], [81.0, 81.7], [83.0, 83.42], [88.0, 89.18], [92.0, 98.12], [98.0, 99.0], [102.0, 105.24], [111.0, 118.86], [127.0, 130.65], [133.0, 133.81], [136.0, 139.97], [141.0, 142.99], [145.0, 148.68]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [99.99, 48.69, 0.0, 60.89, 0.0, 97.73, 52.45, 88.64, 78.55, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 30.16, 0.0, 31.86, 33.36, 51.5, 0.0, 80.64, 0.0, 75.39], "audiomae_on_audioset": [null, [["clang", 40.27], ["speech", 18.35], ["ding", 8.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.43], ["music", 6.23], ["applause", 4.37]], null, [["speech", 54.46], ["vehicle", 6.71], ["car", 5.53]], [["speech", 58.86], ["vehicle", 8.86], ["music", 6.56]], null, null, null, null, null], "duration": [2.19, 2.37, 0.73, 5.03, 0.16, 2.92, 3.17, 8.4, 4.63, 1.09, 0.42, 1.23, 1.46, 0.96, 2.86, 0.7, 0.42, 1.18, 6.12, 1.0, 3.24, 7.86, 3.65, 0.81, 3.97, 1.99, 3.68]} \ No newline at end of file diff --git a/annotations_1/SWgcv5EwMgI_filtered.json b/annotations_1/SWgcv5EwMgI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f4a7207c5e83e0508378a1d74f66bd1a5c94ed8 --- /dev/null +++ b/annotations_1/SWgcv5EwMgI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 43.6], [46.0, 48.19], [49.0, 51.8], [57.0, 61.03], [64.0, 65.25], [66.0, 72.47], [73.0, 121.14]], "keep_status": [false, true, false, false, false, true, false], "silence_prob": [37.82, 44.26, 37.3, 40.5, 0.0, 45.78, 0.0], "audiomae_on_audioset": [[["music", 40.71], ["didgeridoo", 24.23], ["theremin", 7.81]], [["music", 36.06], ["hum", 11.5], ["fly, housefly", 7.29]], [["music", 53.32], ["didgeridoo", 13.16], ["speech", 4.87]], [["music", 76.33], ["musical instrument", 2.58], ["electronic music", 2.5]], null, [["music", 25.0], ["shuffling cards", 17.93], ["speech", 7.96]], null], "duration": [2.6, 2.19, 2.8, 4.03, 1.25, 6.47, 48.14]} \ No newline at end of file diff --git a/annotations_1/SWl87YF_hHQ_filtered.json b/annotations_1/SWl87YF_hHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb87e86fd80065b22cdc48abdf337fb87cd40d28 --- /dev/null +++ b/annotations_1/SWl87YF_hHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.69], [15.0, 23.46], [24.0, 24.71], [29.0, 29.78], [35.0, 38.08], [40.0, 42.11], [45.0, 52.07], [55.0, 55.54], [57.0, 56.64], [57.0, 64.67], [68.0, 83.4], [84.0, 83.94]], "keep_status": [true, true, false, false, true, true, true, false, false, true, false, false], "silence_prob": [29.65, 30.3, 0.0, 0.0, 30.56, 30.11, 30.17, 0.0, 0.0, 29.23, 28.76, 0.0], "audiomae_on_audioset": [[["buzz", 28.36], ["music", 13.67], ["hum", 11.07]], [["music", 16.36], ["speech", 14.77], ["insect", 9.48]], null, null, [["speech", 33.6], ["boing", 19.07], ["music", 8.93]], [["mains hum", 22.8], ["hum", 21.05], ["music", 16.58]], [["music", 50.75], ["theremin", 6.29], ["synthesizer", 5.89]], null, null, [["speech", 45.65], ["music", 13.35], ["groan", 10.82]], [["music", 61.78], ["theremin", 16.18], ["buzz", 4.03]], null], "duration": [7.69, 8.46, 0.71, 0.78, 3.08, 2.11, 7.07, 0.54, -0.36, 7.67, 15.4, -0.06]} \ No newline at end of file diff --git a/annotations_1/SWlYiOtP5mI_filtered.json b/annotations_1/SWlYiOtP5mI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38a2b6490e14794bc4006bb2efb67a00875e30fe --- /dev/null +++ b/annotations_1/SWlYiOtP5mI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.98], [14.0, 14.15], [19.0, 19.6], [21.0, 23.41], [28.0, 29.1], [30.0, 32.63], [35.0, 35.72], [37.0, 37.44], [53.0, 54.4], [62.0, 63.59], [65.0, 69.75], [73.0, 73.63], [83.0, 85.26], [95.0, 96.42], [99.0, 101.26], [104.0, 105.39], [107.0, 108.85], [111.0, 111.87], [112.0, 113.14], [123.0, 124.09], [124.0, 126.59], [129.0, 128.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 75.55, 0.0, 61.18, 0.0, 0.0, 0.0, 0.0, 47.74, 0.0, 42.76, 0.0, 39.63, 0.0, 0.0, 0.0, 0.0, 0.0, 44.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 39.63], ["theremin", 8.62], ["synthesizer", 6.95]], null, [["music", 36.37], ["cello", 13.98], ["violin, fiddle", 12.21]], null, [["speech", 49.39], ["sidetone", 30.5], ["chirp tone", 3.7]], null, null, null, null, null, [["sidetone", 56.61], ["speech", 16.92], ["singing bowl", 9.68]], null], "duration": [0.98, 0.15, 0.6, 2.41, 1.1, 2.63, 0.72, 0.44, 1.4, 1.59, 4.75, 0.63, 2.26, 1.42, 2.26, 1.39, 1.85, 0.87, 1.14, 1.09, 2.59, -0.03]} \ No newline at end of file diff --git a/annotations_1/SXVUCgoOcfs_filtered.json b/annotations_1/SXVUCgoOcfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc4be882f7549023dc168d006065f836ef00c2ca --- /dev/null +++ b/annotations_1/SXVUCgoOcfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 17.78], [19.0, 20.41], [27.0, 28.75], [30.0, 30.97], [33.0, 37.44], [41.0, 70.09], [71.0, 74.29], [76.0, 76.96], [79.0, 92.65], [95.0, 104.14]], "keep_status": [false, false, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.67, 30.36, 30.17, 0.0, 30.73, 38.02], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 85.01], ["music", 2.89], ["mosquito", 2.16]], [["music", 15.89], ["livestock, farm animals, working animals", 11.98], ["horse", 9.15]], [["music", 15.36], ["fly, housefly", 11.53], ["didgeridoo", 5.87]], null, [["hum", 34.02], ["mains hum", 25.77], ["music", 12.31]], [["music", 25.99], ["speech", 20.77], ["theremin", 6.29]]], "duration": [-0.22, 1.41, 1.75, 0.97, 4.44, 29.09, 3.29, 0.96, 13.65, 9.14]} \ No newline at end of file diff --git a/annotations_1/SY40M1lhknY_filtered.json b/annotations_1/SY40M1lhknY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b7e08d371e3d8c70fb16ec533b63544c6ce4ac1 --- /dev/null +++ b/annotations_1/SY40M1lhknY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.83], [8.0, 9.26], [20.0, 20.44], [25.0, 31.33], [32.0, 33.83], [34.0, 37.74], [41.0, 46.14], [46.0, 130.94], [134.0, 135.08], [136.0, 146.84], [159.0, 159.49], [165.0, 165.13], [166.0, 165.74], [168.0, 189.46], [190.0, 195.51], [200.0, 200.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 62.99, 0.0, 64.52, 81.53, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 99.16, 70.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 1.26, 0.44, 6.33, 1.83, 3.74, 5.14, 84.94, 1.08, 10.84, 0.49, 0.13, -0.26, 21.46, 5.51, 0.42]} \ No newline at end of file diff --git a/annotations_1/SYffGozxMbU_filtered.json b/annotations_1/SYffGozxMbU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b6b9d6f65f6886af0fb11bf746f89f41ecaa63c --- /dev/null +++ b/annotations_1/SYffGozxMbU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.42], [16.0, 17.29], [18.0, 19.11], [21.0, 22.52], [23.0, 28.0], [29.0, 36.98], [47.0, 48.39], [50.0, 50.48], [53.0, 52.81], [61.0, 60.86], [79.0, 84.23], [87.0, 90.51], [93.0, 94.68], [99.0, 100.38], [102.0, 103.59], [105.0, 125.27]], "keep_status": [true, false, false, false, true, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [39.38, 0.0, 0.0, 0.0, 32.68, 33.71, 0.0, 0.0, 0.0, 0.0, 34.58, 33.77, 0.0, 0.0, 0.0, 32.1], "audiomae_on_audioset": [[["music", 41.1], ["whale vocalization", 15.14], ["theremin", 9.96]], null, null, null, [["groan", 21.8], ["animal", 10.52], ["whale vocalization", 5.87]], [["music", 43.89], ["theremin", 36.63], ["whale vocalization", 6.51]], null, null, null, null, [["fly, housefly", 23.98], ["speech", 11.99], ["hum", 11.92]], [["whip", 48.47], ["music", 19.22], ["speech", 7.56]], null, null, null, [["music", 31.65], ["cacophony", 16.32], ["speech", 11.46]]], "duration": [6.42, 1.29, 1.11, 1.52, 5.0, 7.98, 1.39, 0.48, -0.19, -0.14, 5.23, 3.51, 1.68, 1.38, 1.59, 20.27]} \ No newline at end of file diff --git a/annotations_1/SZ3oe7dJdMc_filtered.json b/annotations_1/SZ3oe7dJdMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58b55937a234a406008a914ab6d45f77d0090395 --- /dev/null +++ b/annotations_1/SZ3oe7dJdMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.14], [19.0, 20.55], [22.0, 26.28], [29.0, 31.35], [33.0, 34.92], [36.0, 40.2], [41.0, 40.95], [41.0, 47.12], [48.0, 85.31], [87.0, 92.4], [93.0, 120.26], [122.0, 183.64], [184.0, 195.94], [198.0, 207.54], [208.0, 222.15]], "keep_status": [false, false, true, true, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 42.72, 39.58, 0.0, 35.33, 0.0, 29.96, 0.0, 46.5, 43.48, 0.0, 30.14, 29.58, 29.33], "audiomae_on_audioset": [null, null, [["music", 45.91], ["buzz", 10.76], ["mains hum", 8.68]], [["hum", 14.95], ["buzz", 11.75], ["mains hum", 8.32]], null, [["music", 37.5], ["throbbing", 10.75], ["gears", 7.77]], null, [["livestock, farm animals, working animals", 20.35], ["music", 17.31], ["hum", 15.12]], null, [["music", 61.94], ["musical instrument", 8.48], ["guitar", 8.31]], [["music", 70.89], ["effects unit", 6.76], ["guitar", 6.47]], null, [["music", 84.2], ["musical instrument", 2.22], ["didgeridoo", 1.8]], [["music", 65.98], ["throbbing", 5.54], ["musical instrument", 3.45]], [["music", 66.03], ["throbbing", 12.29], ["hum", 3.32]]], "duration": [1.14, 1.55, 4.28, 2.35, 1.92, 4.2, -0.05, 6.12, 37.31, 5.4, 27.26, 61.64, 11.94, 9.54, 14.15]} \ No newline at end of file diff --git a/annotations_1/S_QFbRtEF7I_filtered.json b/annotations_1/S_QFbRtEF7I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..074cd37425858baa51fdc3417feb1182ceb8c813 --- /dev/null +++ b/annotations_1/S_QFbRtEF7I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 21.0], [22.0, 24.73], [26.0, 30.01], [31.0, 35.16], [36.0, 41.91], [43.0, 43.88], [46.0, 60.76], [61.0, 68.0], [74.0, 75.1], [76.0, 84.67], [86.0, 91.57]], "keep_status": [true, false, false, false, false, false, true, false, false, true, true], "silence_prob": [49.18, 53.65, 55.81, 68.41, 34.09, 0.0, 33.65, 29.53, 0.0, 30.29, 31.04], "audiomae_on_audioset": [[["music", 42.14], ["synthesizer", 11.21], ["sonar", 6.35]], null, null, null, [["music", 41.65], ["breaking", 20.28], ["smash, crash", 13.35]], null, [["music", 47.65], ["whale vocalization", 11.03], ["didgeridoo", 7.5]], [["speech", 65.6], ["music", 18.22], ["whack, thwack", 5.35]], null, [["throbbing", 10.25], ["whack, thwack", 9.8], ["hum", 7.93]], [["hum", 16.49], ["music", 12.03], ["mains hum", 7.98]]], "duration": [17.0, 2.73, 4.01, 4.16, 5.91, 0.88, 14.76, 7.0, 1.1, 8.67, 5.57]} \ No newline at end of file diff --git a/annotations_1/S_lcxLCaxAw_filtered.json b/annotations_1/S_lcxLCaxAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cab67862db8ebc1ff9376575abc434c4995d03e --- /dev/null +++ b/annotations_1/S_lcxLCaxAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.46], [11.0, 11.03], [12.0, 15.82], [20.0, 20.98], [22.0, 24.04], [30.0, 30.74], [33.0, 34.91], [37.0, 40.34], [41.0, 41.84], [43.0, 44.0], [45.0, 45.84], [47.0, 48.41], [50.0, 49.94], [53.0, 55.56], [56.0, 62.67], [67.0, 68.2], [69.0, 69.5]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 45.3, 0.0, 78.38, 0.0, 0.0, 35.48, 0.0, 0.0, 0.0, 0.0, 0.0, 84.62, 33.01, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["whale vocalization", 37.34], ["moo", 17.68], ["cattle, bovinae", 14.84]], null, null, null, null, [["fly, housefly", 26.14], ["frog", 16.24], ["insect", 13.04]], null, null, null, null, null, null, [["speech", 38.1], ["music", 7.58], ["fly, housefly", 6.47]], null, null], "duration": [0.46, 0.03, 3.82, 0.98, 2.04, 0.74, 1.91, 3.34, 0.84, 1.0, 0.84, 1.41, -0.06, 2.56, 6.67, 1.2, 0.5]} \ No newline at end of file diff --git a/annotations_1/SaUYfjxV8Ic_filtered.json b/annotations_1/SaUYfjxV8Ic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c64433cdebc7c3cf57e37d4c937ed6d52115aa3 --- /dev/null +++ b/annotations_1/SaUYfjxV8Ic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.67], [5.0, 7.92], [9.0, 17.91], [20.0, 30.15], [33.0, 33.81], [40.0, 41.45], [45.0, 45.39], [49.0, 49.86], [51.0, 51.24], [57.0, 57.32], [59.0, 63.32], [64.0, 65.04], [67.0, 69.15], [69.0, 70.73], [72.0, 84.94], [85.0, 88.69], [89.0, 93.45], [95.0, 95.34], [98.0, 98.02], [99.0, 100.6], [101.0, 103.45], [105.0, 107.42], [108.0, 109.14], [123.0, 131.79], [134.0, 133.86], [135.0, 136.27], [138.0, 138.89], [139.0, 143.46]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 42.84, 42.72, 35.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0, 78.21, 0.0, 47.39, 40.93, 56.63, 0.0, 0.0, 0.0, 72.46, 67.13, 0.0, 36.64, 0.0, 0.0, 0.0, 38.72], "audiomae_on_audioset": [null, [["speech", 37.84], ["music", 20.71], ["guitar", 4.4]], [["music", 58.81], ["theremin", 19.08], ["musical instrument", 1.2]], [["music", 44.95], ["speech", 36.04], ["hum", 2.25]], null, null, null, null, null, null, null, null, null, null, [["hum", 29.85], ["mains hum", 22.2], ["music", 17.33]], [["speech", 25.17], ["music", 17.59], ["singing bowl", 13.8]], null, null, null, null, null, null, null, [["theremin", 49.71], ["music", 26.7], ["musical instrument", 2.64]], null, null, null, [["speech", 38.05], ["music", 26.62], ["synthesizer", 5.18]]], "duration": [1.67, 2.92, 8.91, 10.15, 0.81, 1.45, 0.39, 0.86, 0.24, 0.32, 4.32, 1.04, 2.15, 1.73, 12.94, 3.69, 4.45, 0.34, 0.02, 1.6, 2.45, 2.42, 1.14, 8.79, -0.14, 1.27, 0.89, 4.46]} \ No newline at end of file diff --git a/annotations_1/SaaTUj7m8e4_filtered.json b/annotations_1/SaaTUj7m8e4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c6d158c51d5f37a4ce6cd22556df6848bedb6a5 --- /dev/null +++ b/annotations_1/SaaTUj7m8e4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 18.0], [20.0, 27.92], [28.0, 30.23], [31.0, 46.25], [60.0, 62.34], [64.0, 64.54], [65.0, 70.75], [72.0, 72.52], [78.0, 79.2], [80.0, 81.5], [83.0, 84.01], [89.0, 89.97], [93.0, 94.0], [97.0, 97.29]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [63.85, 80.64, 42.91, 54.7, 75.72, 0.0, 47.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 59.82], ["chirp tone", 5.51], ["inside, small room", 5.51]], null, null, null, [["speech", 40.99], ["stomach rumble", 9.19], ["sine wave", 7.28]], null, null, null, null, null, null, null], "duration": [4.0, 7.92, 2.23, 15.25, 2.34, 0.54, 5.75, 0.52, 1.2, 1.5, 1.01, 0.97, 1.0, 0.29]} \ No newline at end of file diff --git a/annotations_1/Saz3f-zPYeI_filtered.json b/annotations_1/Saz3f-zPYeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de18de8249bee5b58cef5a2aa0550df0c134b3b0 --- /dev/null +++ b/annotations_1/Saz3f-zPYeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.59], [5.0, 5.29], [6.0, 7.01], [10.0, 10.45], [13.0, 14.77], [17.0, 18.12], [20.0, 21.36], [25.0, 25.51], [28.0, 28.34], [33.0, 33.35], [43.0, 43.95], [49.0, 49.03], [66.0, 73.06], [90.0, 90.68], [94.0, 94.27], [97.0, 103.82], [104.0, 105.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.72, 0.0, 0.0, 28.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["crowd", 43.28], ["cheering", 36.25], ["children shouting", 4.55]], null, null, [["clatter", 17.1], ["crowd", 7.42], ["speech", 6.93]], null], "duration": [0.59, 0.29, 1.01, 0.45, 1.77, 1.12, 1.36, 0.51, 0.34, 0.35, 0.95, 0.03, 7.06, 0.68, 0.27, 6.82, 1.14]} \ No newline at end of file diff --git a/annotations_1/Sb8ufI6z0zM_filtered.json b/annotations_1/Sb8ufI6z0zM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ea0ffa897296e2197f05edb09030ecb64d58062 --- /dev/null +++ b/annotations_1/Sb8ufI6z0zM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [1.0, 6.45], [12.0, 29.69], [30.0, 54.11], [56.0, 56.64], [59.0, 66.21], [66.0, 66.72], [77.0, 77.9], [85.0, 86.76], [88.0, 88.87], [91.0, 91.93], [93.0, 93.75], [98.0, 98.37], [106.0, 114.13], [115.0, 130.5], [131.0, 131.87]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 29.0, 30.17, 29.75, 0.0, 32.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.57, 29.03, 0.0], "audiomae_on_audioset": [null, [["buzz", 33.56], ["music", 12.27], ["speech", 11.65]], [["music", 45.59], ["throbbing", 29.34], ["hum", 6.49]], [["music", 63.57], ["speech", 4.34], ["whip", 2.57]], null, [["speech", 35.64], ["music", 18.01], ["thunk", 17.6]], null, null, null, null, null, null, null, [["music", 40.25], ["speech", 23.55], ["throbbing", 15.86]], [["music", 58.95], ["throbbing", 5.88], ["animal", 2.98]], null], "duration": [0.0, 5.45, 17.69, 24.11, 0.64, 7.21, 0.72, 0.9, 1.76, 0.87, 0.93, 0.75, 0.37, 8.13, 15.5, 0.87]} \ No newline at end of file diff --git a/annotations_1/SbP_EGRp9Kw_filtered.json b/annotations_1/SbP_EGRp9Kw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24f5bcfc70bd1eb8e60f81446328efd3697b4d75 --- /dev/null +++ b/annotations_1/SbP_EGRp9Kw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 36.58], [37.0, 40.42], [42.0, 44.12], [46.0, 50.92], [51.0, 53.76], [59.0, 60.2], [62.0, 64.23], [65.0, 70.26], [72.0, 78.46], [79.0, 80.13], [86.0, 87.3], [89.0, 96.3], [98.0, 100.53], [104.0, 143.11], [146.0, 146.47], [148.0, 149.01], [150.0, 156.27], [158.0, 159.58], [160.0, 163.7], [164.0, 167.17], [168.0, 186.71], [188.0, 202.74]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.18, 45.24, 64.75, 98.44, 53.16, 0.0, 96.77, 48.65, 45.36, 0.0, 0.0, 99.82, 83.16, 0.0, 0.0, 0.0, 97.83, 0.0, 90.95, 100.0, 82.97, 88.46], "audiomae_on_audioset": [[["speech", 58.86], ["sidetone", 10.28], ["dial tone", 3.6]], [["noise", 14.57], ["music", 11.73], ["sidetone", 11.38]], null, null, null, null, null, [["speech", 50.29], ["sidetone", 12.91], ["whale vocalization", 8.38]], [["speech", 54.5], ["sidetone", 11.42], ["noise", 7.39]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.58, 3.42, 2.12, 4.92, 2.76, 1.2, 2.23, 5.26, 6.46, 1.13, 1.3, 7.3, 2.53, 39.11, 0.47, 1.01, 6.27, 1.58, 3.7, 3.17, 18.71, 14.74]} \ No newline at end of file diff --git a/annotations_1/Sbtm5uE3cCQ_filtered.json b/annotations_1/Sbtm5uE3cCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a93e1ecc16efad30f8ce1849221e310ee52b0db --- /dev/null +++ b/annotations_1/Sbtm5uE3cCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 17.42], [20.0, 21.59], [23.0, 27.3], [30.0, 43.06], [49.0, 53.06], [54.0, 57.74], [58.0, 57.77], [65.0, 69.16], [74.0, 76.81], [80.0, 80.33], [83.0, 82.92], [88.0, 88.74], [92.0, 92.31], [93.0, 93.07], [103.0, 104.87], [108.0, 108.13], [109.0, 109.98], [112.0, 112.01], [116.0, 116.9], [119.0, 118.69], [120.0, 121.31], [122.0, 123.5], [127.0, 127.6], [131.0, 131.45], [132.0, 132.43], [135.0, 136.58], [141.0, 140.91], [141.0, 141.84], [143.0, 144.21], [152.0, 153.08], [155.0, 155.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.85, 0.0, 61.87, 51.02, 54.43, 47.86, 0.0, 42.79, 33.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.72], ["theremin", 34.78], ["musical instrument", 1.98]], null, null, null, null, [["speech", 53.64], ["music", 14.24], ["thunk", 3.63]], null, [["music", 66.12], ["musical instrument", 4.36], ["synthesizer", 3.94]], [["music", 70.15], ["musical instrument", 7.81], ["didgeridoo", 6.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.42, 1.59, 4.3, 13.06, 4.06, 3.74, -0.23, 4.16, 2.81, 0.33, -0.08, 0.74, 0.31, 0.07, 1.87, 0.13, 0.98, 0.01, 0.9, -0.31, 1.31, 1.5, 0.6, 0.45, 0.43, 1.58, -0.09, 0.84, 1.21, 1.08, 0.46]} \ No newline at end of file diff --git a/annotations_1/ScJijQn6RyI_filtered.json b/annotations_1/ScJijQn6RyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfb44d3f5faa226d23bf356dcb1262540eded36f --- /dev/null +++ b/annotations_1/ScJijQn6RyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.79], [9.0, 15.06], [17.0, 17.19], [19.0, 20.76], [22.0, 31.5], [32.0, 33.64], [37.0, 37.84], [39.0, 38.97], [44.0, 44.91], [48.0, 48.66], [51.0, 52.22], [57.0, 57.59], [62.0, 63.73], [64.0, 64.08], [67.0, 67.95], [69.0, 70.19], [71.0, 70.88], [72.0, 72.72], [79.0, 81.77], [84.0, 84.65], [102.0, 102.51], [103.0, 104.16], [106.0, 105.92], [110.0, 119.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.88, 0.0, 0.0, 52.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.71, 0.0, 0.0, 0.0, 0.0, 32.09], "audiomae_on_audioset": [null, [["speech", 47.03], ["sidetone", 30.5], ["radio", 8.49]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 82.94], ["radio", 4.46], ["telephone", 2.68]], null, null, null, null, [["speech", 70.04], ["boing", 9.5], ["radio", 2.85]]], "duration": [0.79, 6.06, 0.19, 1.76, 9.5, 1.64, 0.84, -0.03, 0.91, 0.66, 1.22, 0.59, 1.73, 0.08, 0.95, 1.19, -0.12, 0.72, 2.77, 0.65, 0.51, 1.16, -0.08, 9.57]} \ No newline at end of file diff --git a/annotations_1/SccBZYmyjxE_filtered.json b/annotations_1/SccBZYmyjxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a184dbc39dd886f0e956d7442829b94663571208 --- /dev/null +++ b/annotations_1/SccBZYmyjxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 41.88], [45.0, 57.11], [59.0, 72.72], [75.0, 81.4], [85.0, 87.59], [89.0, 89.94], [92.0, 93.02], [94.0, 94.2], [95.0, 95.84], [98.0, 98.24], [98.0, 105.71], [107.0, 109.63], [119.0, 119.6], [122.0, 122.82]], "keep_status": [false, false, true, true, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 51.44, 42.24, 40.43, 39.25, 0.0, 0.0, 0.0, 0.0, 0.0, 37.11, 39.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 25.46], ["hum", 22.28], ["mains hum", 20.65]], [["music", 37.37], ["hum", 13.33], ["speech", 9.41]], [["music", 39.96], ["speech", 22.74], ["trance music", 7.38]], null, null, null, null, null, [["music", 34.42], ["throbbing", 15.73], ["hum", 15.56]], [["music", 47.38], ["hum", 11.58], ["mains hum", 7.79]], null, null], "duration": [-0.12, 12.11, 13.72, 6.4, 2.59, 0.94, 1.02, 0.2, 0.84, 0.24, 7.71, 2.63, 0.6, 0.82]} \ No newline at end of file diff --git a/annotations_1/Sd4y4XC-qvw_filtered.json b/annotations_1/Sd4y4XC-qvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c74ab30212aa7bd39825bf75af8a3839e4f901b8 --- /dev/null +++ b/annotations_1/Sd4y4XC-qvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 59.53], [60.0, 62.14], [63.0, 71.54], [73.0, 76.13], [85.0, 88.86], [93.0, 94.0], [97.0, 106.2], [111.0, 112.13], [113.0, 119.69], [121.0, 122.39], [124.0, 155.17]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 99.82, 49.18, 35.62, 44.57, 0.0, 32.04, 0.0, 45.02, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 75.97], ["crow", 3.18], ["hum", 2.47]], [["music", 34.55], ["electric shaver, electric razor", 3.93], ["moo", 2.42]], [["speech", 52.75], ["music", 20.81], ["sonar", 4.08]], null, [["music", 30.82], ["mains hum", 10.64], ["hum", 7.96]], null, [["music", 68.54], ["scary music", 4.58], ["rumble", 2.16]], null, null], "duration": [33.53, 2.14, 8.54, 3.13, 3.86, 1.0, 9.2, 1.13, 6.69, 1.39, 31.17]} \ No newline at end of file diff --git a/annotations_1/SdFZEeR8a2s_filtered.json b/annotations_1/SdFZEeR8a2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8984db0a9deaea36a52df889181a228cc5e4a2a4 --- /dev/null +++ b/annotations_1/SdFZEeR8a2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 67.32], [72.0, 72.55], [74.0, 82.34], [88.0, 88.7], [89.0, 88.74], [89.0, 100.68], [102.0, 113.95], [118.0, 117.85], [126.0, 126.49], [129.0, 129.71], [136.0, 152.17], [157.0, 160.64], [167.0, 168.49], [177.0, 177.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.36, 0.0, 0.0, 72.75, 55.67, 0.0, 0.0, 0.0, 38.52, 38.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 47.18], ["speech", 18.39], ["hum", 11.06]], [["music", 40.34], ["speech", 37.26], ["scary music", 5.64]], null, null], "duration": [34.32, 0.55, 8.34, 0.7, -0.26, 11.68, 11.95, -0.15, 0.49, 0.71, 16.17, 3.64, 1.49, 0.63]} \ No newline at end of file diff --git a/annotations_1/Se2zCvUqqWw_filtered.json b/annotations_1/Se2zCvUqqWw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f31fc98041e878cb6ff31424af80cf64cf6950a --- /dev/null +++ b/annotations_1/Se2zCvUqqWw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.51], [17.0, 24.8], [26.0, 26.49], [37.0, 36.98], [38.0, 38.84], [39.0, 39.09], [39.0, 39.78], [47.0, 48.37], [53.0, 60.2], [69.0, 76.0], [81.0, 90.95], [92.0, 93.24], [100.0, 99.98], [100.0, 100.26], [103.0, 103.01], [103.0, 103.94], [108.0, 108.04], [109.0, 116.26], [117.0, 117.19], [119.0, 124.58], [125.0, 137.84]], "keep_status": [false, true, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 29.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.15, 30.25, 36.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.34, 0.0, 30.64, 30.59], "audiomae_on_audioset": [null, [["music", 34.87], ["didgeridoo", 13.74], ["speech", 7.67]], null, null, null, null, null, null, [["whip", 43.46], ["speech", 9.41], ["whack, thwack", 8.99]], [["speech", 19.45], ["cattle, bovinae", 10.75], ["music", 9.88]], [["speech", 39.5], ["fly, housefly", 9.13], ["insect", 8.88]], null, null, null, null, null, null, [["speech", 34.28], ["music", 26.81], ["groan", 5.11]], null, [["music", 22.67], ["cattle, bovinae", 15.55], ["livestock, farm animals, working animals", 13.37]], [["speech", 24.68], ["music", 23.88], ["groan", 22.7]]], "duration": [0.51, 7.8, 0.49, -0.02, 0.84, 0.09, 0.78, 1.37, 7.2, 7.0, 9.95, 1.24, -0.02, 0.26, 0.01, 0.94, 0.04, 7.26, 0.19, 5.58, 12.84]} \ No newline at end of file diff --git a/annotations_1/Se38Z08pYS0_filtered.json b/annotations_1/Se38Z08pYS0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1eaac3c464a560c6b49a55d8647e9adfd3e250e --- /dev/null +++ b/annotations_1/Se38Z08pYS0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.57], [8.0, 8.56], [21.0, 21.57], [23.0, 23.55], [25.0, 27.84], [29.0, 30.97], [32.0, 34.03], [34.0, 51.44], [53.0, 57.5], [59.0, 59.16], [60.0, 62.33], [64.0, 64.45], [66.0, 68.28], [70.0, 70.46], [71.0, 71.44], [72.0, 72.47], [73.0, 73.31], [75.0, 75.24], [82.0, 83.4], [89.0, 89.14], [91.0, 91.69]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 86.27, 30.21, 33.48, 0.0, 32.33, 0.0, 31.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 19.07], ["speech", 11.73], ["electric shaver, electric razor", 11.51]], [["speech", 50.56], ["wail, moan", 21.73], ["music", 12.02]], null, [["music", 21.21], ["speech", 18.47], ["reverberation", 7.44]], null, [["groan", 17.59], ["grunt", 15.64], ["sound effect", 6.24]], null, null, null, null, null, null, null, null], "duration": [1.57, 0.56, 0.57, 0.55, 2.84, 1.97, 2.03, 17.44, 4.5, 0.16, 2.33, 0.45, 2.28, 0.46, 0.44, 0.47, 0.31, 0.24, 1.4, 0.14, 0.69]} \ No newline at end of file diff --git a/annotations_1/SeYgMYijdz4_filtered.json b/annotations_1/SeYgMYijdz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5232c6265e621b0bff51f4e2824f79288de57faa --- /dev/null +++ b/annotations_1/SeYgMYijdz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.04], [4.0, 5.63], [8.0, 9.73], [12.0, 18.99], [22.0, 25.34], [31.0, 31.72], [33.0, 33.84], [37.0, 39.01], [39.0, 39.45], [39.0, 39.48], [39.0, 39.51], [40.0, 39.68], [40.0, 39.72], [40.0, 39.75], [40.0, 39.78], [45.0, 79.03], [80.0, 80.99], [82.0, 87.72], [88.0, 91.03], [101.0, 120.11], [124.0, 166.09]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.92, 31.43, 0.0, 0.0, 28.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.1, 29.0, 28.73, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 40.69], ["reverberation", 15.91], ["sound effect", 7.46]], [["cattle, bovinae", 22.75], ["whale vocalization", 22.4], ["moo", 19.3]], null, null, [["groan", 21.69], ["speech", 13.14], ["sound effect", 9.05]], null, null, null, null, null, null, null, null, null, [["hum", 35.76], ["throbbing", 30.09], ["music", 19.13]], [["music", 28.27], ["speech", 8.42], ["hum", 8.14]], [["music", 53.6], ["whale vocalization", 12.87], ["noise", 4.05]], null], "duration": [0.04, 1.63, 1.73, 6.99, 3.34, 0.72, 0.84, 2.01, 0.45, 0.48, 0.51, -0.32, -0.28, -0.25, -0.22, 34.03, 0.99, 5.72, 3.03, 19.11, 42.09]} \ No newline at end of file diff --git a/annotations_1/Sf47YRUStx8_filtered.json b/annotations_1/Sf47YRUStx8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b9fc622b1d3cca31d8faaad6fa053975fe73e85 --- /dev/null +++ b/annotations_1/Sf47YRUStx8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.07], [14.0, 14.2], [16.0, 16.43], [21.0, 24.29], [25.0, 25.69], [36.0, 36.71], [44.0, 46.52], [47.0, 49.17], [50.0, 50.28], [53.0, 53.74], [65.0, 66.26], [69.0, 74.22], [75.0, 77.77], [79.0, 79.78], [81.0, 82.41], [83.0, 83.08], [85.0, 84.77], [86.0, 86.51], [90.0, 91.18], [102.0, 109.81], [113.0, 113.43], [114.0, 113.98], [116.0, 116.68], [117.0, 117.49], [118.0, 117.68], [121.0, 121.58], [123.0, 124.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 55.18, 0.0, 0.0, 99.71, 83.88, 0.0, 0.0, 0.0, 43.98, 66.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 21.96], ["music", 17.77], ["moo", 15.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.07, 0.2, 0.43, 3.29, 0.69, 0.71, 2.52, 2.17, 0.28, 0.74, 1.26, 5.22, 2.77, 0.78, 1.41, 0.08, -0.23, 0.51, 1.18, 7.81, 0.43, -0.02, 0.68, 0.49, -0.32, 0.58, 1.06]} \ No newline at end of file diff --git a/annotations_1/SfMSiaxLslA_filtered.json b/annotations_1/SfMSiaxLslA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7cb778fd2c2a190e1d5c2dda38c7a11a5ea054a --- /dev/null +++ b/annotations_1/SfMSiaxLslA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.39], [6.0, 8.41], [12.0, 12.68], [14.0, 15.65], [17.0, 23.28], [24.0, 25.03], [27.0, 28.7], [32.0, 33.27], [34.0, 35.16], [38.0, 38.26], [41.0, 42.94], [44.0, 45.69], [47.0, 47.33], [49.0, 50.68], [53.0, 53.6], [56.0, 57.47], [58.0, 59.22], [67.0, 67.96], [77.0, 78.88], [80.0, 81.35], [84.0, 84.35], [86.0, 86.83], [89.0, 89.94], [93.0, 96.53], [99.0, 99.84], [103.0, 103.67], [110.0, 110.84], [114.0, 114.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.56, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 2.41, 0.68, 1.65, 6.28, 1.03, 1.7, 1.27, 1.16, 0.26, 1.94, 1.69, 0.33, 1.68, 0.6, 1.47, 1.22, 0.96, 1.88, 1.35, 0.35, 0.83, 0.94, 3.53, 0.84, 0.67, 0.84, 0.39]} \ No newline at end of file diff --git a/annotations_1/SiY9kPYOZuM_filtered.json b/annotations_1/SiY9kPYOZuM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9358eabfba5770232a0d89b25368fe8c958ff5fb --- /dev/null +++ b/annotations_1/SiY9kPYOZuM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.11], [13.0, 13.12], [14.0, 15.52], [16.0, 15.99], [17.0, 16.7], [26.0, 27.4], [35.0, 37.47], [43.0, 43.51], [45.0, 46.18], [46.0, 46.41], [46.0, 46.65], [47.0, 46.79], [49.0, 50.11], [53.0, 54.68], [56.0, 77.16], [80.0, 91.13], [92.0, 92.62], [94.0, 97.77], [105.0, 117.26], [119.0, 119.67], [122.0, 125.14], [126.0, 126.45], [127.0, 126.71]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.98, 31.43, 0.0, 32.57, 31.81, 0.0, 34.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["boing", 42.97], ["thunk", 15.79], ["speech", 9.64]], null, null, null, null, null, null, null, [["speech", 31.36], ["hum", 12.04], ["mains hum", 7.0]], [["hum", 16.45], ["speech", 12.99], ["mains hum", 12.78]], null, [["speech", 52.67], ["music", 22.38], ["sidetone", 8.0]], [["speech", 82.12], ["animal", 2.97], ["fart", 1.7]], null, [["speech", 41.76], ["music", 23.69], ["sidetone", 9.99]], null, null], "duration": [0.11, 0.12, 1.52, -0.01, -0.3, 1.4, 2.47, 0.51, 1.18, 0.41, 0.65, -0.21, 1.11, 1.68, 21.16, 11.13, 0.62, 3.77, 12.26, 0.67, 3.14, 0.45, -0.29]} \ No newline at end of file diff --git a/annotations_1/SjF_DpHczjE_filtered.json b/annotations_1/SjF_DpHczjE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3994515ffcd88bcf194d469caf2bca519d98d68 --- /dev/null +++ b/annotations_1/SjF_DpHczjE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.16], [42.0, 42.09], [88.0, 88.3]], "keep_status": [true, false, false], "silence_prob": [29.1, 0.0, 0.0], "audiomae_on_audioset": [[["music", 50.17], ["throbbing", 10.23], ["electronic music", 5.45]], null, null], "duration": [7.16, 0.09, 0.3]} \ No newline at end of file diff --git a/annotations_1/SmMmQHR_F4Y_filtered.json b/annotations_1/SmMmQHR_F4Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0790e709df23c14441fd8e596709e5872e01fa1e --- /dev/null +++ b/annotations_1/SmMmQHR_F4Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.23], [13.0, 149.44], [150.0, 150.87], [152.0, 152.15], [153.0, 154.3], [155.0, 155.92], [157.0, 160.71], [164.0, 163.97], [168.0, 170.24], [173.0, 183.2]], "keep_status": [false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.02, 0.0, 59.07, 32.13], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 11.53], ["hum", 10.19], ["throbbing", 9.9]], null, null, [["speech", 14.81], ["gong", 10.59], ["music", 9.44]]], "duration": [0.23, 136.44, 0.87, 0.15, 1.3, 0.92, 3.71, -0.03, 2.24, 10.2]} \ No newline at end of file diff --git a/annotations_1/SmrdaRhZJt4_filtered.json b/annotations_1/SmrdaRhZJt4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e4dfd3d84cf6613e9410eecb9de9d4f603cd3b5 --- /dev/null +++ b/annotations_1/SmrdaRhZJt4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.77], [6.0, 7.43], [9.0, 9.71], [11.0, 11.11], [12.0, 22.08], [24.0, 24.38], [26.0, 27.89], [32.0, 32.93], [34.0, 35.36], [37.0, 38.13], [40.0, 40.07], [43.0, 44.19], [48.0, 49.33], [52.0, 53.43], [55.0, 56.51], [61.0, 66.18], [67.0, 68.07], [70.0, 71.14], [75.0, 76.6], [80.0, 80.99], [81.0, 81.24], [86.0, 87.39], [91.0, 94.07], [96.0, 97.71], [100.0, 100.8], [103.0, 104.57], [105.0, 108.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 41.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.87, 0.0, 0.0, 0.0, 36.96], "audiomae_on_audioset": [null, null, null, null, [["music", 48.19], ["guitar", 12.56], ["speech", 12.21]], null, null, null, null, null, null, null, null, null, null, [["music", 53.86], ["theremin", 8.32], ["musical instrument", 6.14]], null, null, null, null, null, null, [["music", 63.34], ["didgeridoo", 9.11], ["theremin", 4.78]], null, null, null, [["music", 73.77], ["effects unit", 9.19], ["guitar", 3.61]]], "duration": [0.77, 1.43, 0.71, 0.11, 10.08, 0.38, 1.89, 0.93, 1.36, 1.13, 0.07, 1.19, 1.33, 1.43, 1.51, 5.18, 1.07, 1.14, 1.6, 0.99, 0.24, 1.39, 3.07, 1.71, 0.8, 1.57, 3.26]} \ No newline at end of file diff --git a/annotations_1/Snbbz0C_ZiA_filtered.json b/annotations_1/Snbbz0C_ZiA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f1d430cf7acd3a1405ebbdfdf2f20dd8ec6304f --- /dev/null +++ b/annotations_1/Snbbz0C_ZiA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.28], [14.0, 18.79], [19.0, 28.29], [29.0, 30.05], [31.0, 31.65], [32.0, 33.17], [36.0, 40.02], [42.0, 45.18], [46.0, 47.92], [49.0, 58.16], [59.0, 60.96], [62.0, 63.41], [64.0, 66.82], [72.0, 73.38], [75.0, 78.0], [81.0, 82.12], [86.0, 86.88], [89.0, 89.77], [92.0, 94.49], [103.0, 108.6], [111.0, 117.09], [118.0, 122.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [85.17, 94.07, 83.88, 0.0, 0.0, 0.0, 90.6, 87.19, 0.0, 89.9, 0.0, 0.0, 77.53, 0.0, 84.43, 0.0, 0.0, 0.0, 98.1, 98.93, 40.75, 73.06], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.88], ["synthesizer", 4.41], ["dog", 4.32]], null], "duration": [3.28, 4.79, 9.29, 1.05, 0.65, 1.17, 4.02, 3.18, 1.92, 9.16, 1.96, 1.41, 2.82, 1.38, 3.0, 1.12, 0.88, 0.77, 2.49, 5.6, 6.09, 4.42]} \ No newline at end of file diff --git a/annotations_1/SpOd7BwzlMU_filtered.json b/annotations_1/SpOd7BwzlMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..272da7ffb683184684a3627764019f57375fbeb8 --- /dev/null +++ b/annotations_1/SpOd7BwzlMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 43.58], [44.0, 55.93], [56.0, 57.4], [59.0, 62.92], [65.0, 85.8], [86.0, 89.7], [90.0, 90.95], [92.0, 93.04], [93.0, 99.49]], "keep_status": [false, false, false, true, false, true, false, false, false], "silence_prob": [39.15, 30.17, 0.0, 31.01, 30.09, 30.88, 0.0, 0.0, 53.84], "audiomae_on_audioset": [[["music", 29.6], ["hum", 27.21], ["throbbing", 26.28]], [["music", 49.58], ["speech", 13.92], ["throbbing", 9.36]], null, [["sidetone", 19.29], ["speech", 15.55], ["music", 12.4]], [["speech", 42.37], ["music", 19.0], ["throbbing", 18.34]], [["clang", 24.9], ["throbbing", 17.0], ["hum", 13.82]], null, null, null], "duration": [18.58, 11.93, 1.4, 3.92, 20.8, 3.7, 0.95, 1.04, 6.49]} \ No newline at end of file diff --git a/annotations_1/Sq7RMukT_sY_filtered.json b/annotations_1/Sq7RMukT_sY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb6027576df978c48d021209e2f08b3816c25089 --- /dev/null +++ b/annotations_1/Sq7RMukT_sY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.04], [26.0, 26.77], [28.0, 29.25], [38.0, 40.14], [42.0, 42.5], [43.0, 42.55], [43.0, 46.77], [48.0, 52.32], [53.0, 54.77], [57.0, 57.82], [60.0, 61.03], [65.0, 64.81], [69.0, 71.17], [72.0, 86.75], [88.0, 88.91], [92.0, 92.8], [106.0, 108.31], [109.0, 113.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.45, 0.0, 0.0, 96.29, 0.0, 0.0, 87.19, 87.37, 0.0, 0.0, 0.0, 0.0, 95.23, 94.81, 0.0, 0.0, 78.55, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.04, 0.77, 1.25, 2.14, 0.5, -0.45, 3.77, 4.32, 1.77, 0.82, 1.03, -0.19, 2.17, 14.75, 0.91, 0.8, 2.31, 4.04]} \ No newline at end of file diff --git a/annotations_1/SqFAf6aGTtw_filtered.json b/annotations_1/SqFAf6aGTtw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18a9452bae63be0d4986d04d754d64b15a2ed494 --- /dev/null +++ b/annotations_1/SqFAf6aGTtw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.75], [5.0, 5.32], [7.0, 7.86], [9.0, 9.54], [12.0, 13.95], [17.0, 23.35], [26.0, 46.75], [53.0, 53.92], [56.0, 56.81], [58.0, 58.68]], "keep_status": [false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.85, 30.84, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 22.91], ["explosion", 17.86], ["burst, pop", 16.51]], [["speech", 21.4], ["music", 14.21], ["crowd", 9.72]], null, null, null], "duration": [0.75, 0.32, 0.86, 0.54, 1.95, 6.35, 20.75, 0.92, 0.81, 0.68]} \ No newline at end of file diff --git a/annotations_1/SqQmfQfAzzg_filtered.json b/annotations_1/SqQmfQfAzzg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f35d112ba35a07a80bec59cad4efefb71faa78ce --- /dev/null +++ b/annotations_1/SqQmfQfAzzg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.05], [7.0, 7.82], [11.0, 12.16], [15.0, 16.56], [17.0, 19.33], [27.0, 28.38], [30.0, 30.86], [34.0, 37.29], [39.0, 42.94], [44.0, 45.35], [47.0, 48.12], [50.0, 52.22], [53.0, 53.25], [61.0, 64.17]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 57.64, 0.0, 0.0, 48.35, 47.31, 0.0, 0.0, 51.39, 0.0, 58.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 66.95], ["musical instrument", 7.91], ["guitar", 3.59]], [["music", 56.94], ["ambient music", 6.12], ["hum", 5.99]], null, null, null, null, null], "duration": [1.05, 0.82, 1.16, 1.56, 2.33, 1.38, 0.86, 3.29, 3.94, 1.35, 1.12, 2.22, 0.25, 3.17]} \ No newline at end of file diff --git a/annotations_1/SqSZ5RSaT8k_filtered.json b/annotations_1/SqSZ5RSaT8k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47177e0c6e3ae63e962f0b4b7e0a9e310607e084 --- /dev/null +++ b/annotations_1/SqSZ5RSaT8k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.97], [8.0, 8.65], [16.0, 16.41], [20.0, 20.58], [24.0, 24.76], [25.0, 25.42], [27.0, 26.84], [27.0, 28.07], [30.0, 31.16], [32.0, 32.43], [35.0, 36.69], [38.0, 39.53], [41.0, 41.12], [42.0, 43.29], [51.0, 51.54], [54.0, 54.87], [61.0, 63.31], [63.0, 64.29], [66.0, 66.72], [67.0, 68.81], [84.0, 84.27], [91.0, 91.0], [92.0, 93.77], [99.0, 102.95], [108.0, 108.94], [110.0, 112.01], [114.0, 115.26], [116.0, 116.65], [118.0, 118.79], [120.0, 121.64], [136.0, 136.51], [141.0, 141.35], [144.0, 144.8], [147.0, 147.19], [156.0, 156.93], [159.0, 160.69], [165.0, 165.82], [167.0, 168.94], [171.0, 172.08], [180.0, 181.11], [182.0, 181.9], [183.0, 184.59], [185.0, 185.23], [191.0, 191.73], [193.0, 193.99], [207.0, 207.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.52, 0.0, 45.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.81], ["music", 11.52], ["sound effect", 3.64]], null, null, null, null, null, null, [["speech", 8.8], ["hum", 8.16], ["sidetone", 5.29]], null, [["rumble", 16.37], ["noise", 13.87], ["microwave oven", 7.08]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.97, 0.65, 0.41, 0.58, 0.76, 0.42, -0.16, 1.07, 1.16, 0.43, 1.69, 1.53, 0.12, 1.29, 0.54, 0.87, 2.31, 1.29, 0.72, 1.81, 0.27, 0.0, 1.77, 3.95, 0.94, 2.01, 1.26, 0.65, 0.79, 1.64, 0.51, 0.35, 0.8, 0.19, 0.93, 1.69, 0.82, 1.94, 1.08, 1.11, -0.1, 1.59, 0.23, 0.73, 0.99, 0.6]} \ No newline at end of file diff --git a/annotations_1/Sqnrzd0HCRY_filtered.json b/annotations_1/Sqnrzd0HCRY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..338f95715dade8e8fc5cc564e49e764836048eb7 --- /dev/null +++ b/annotations_1/Sqnrzd0HCRY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 61.3], [63.0, 63.0], [66.0, 84.75], [91.0, 106.3], [109.0, 109.38], [111.0, 112.35], [112.0, 118.44]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 28.42, 28.75, 0.0, 0.0, 29.85], "audiomae_on_audioset": [null, null, [["music", 42.9], ["speech", 37.21], ["hum", 2.72]], [["music", 71.99], ["didgeridoo", 3.7], ["throbbing", 2.55]], null, null, [["music", 11.22], ["didgeridoo", 8.48], ["sound effect", 6.01]]], "duration": [1.3, 0.0, 18.75, 15.3, 0.38, 1.35, 6.44]} \ No newline at end of file diff --git a/annotations_1/SrNNEi50cl4_filtered.json b/annotations_1/SrNNEi50cl4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2683f8d9f2ceaf7c6603b0184fe5292fc01e24e9 --- /dev/null +++ b/annotations_1/SrNNEi50cl4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.97], [8.0, 8.01], [8.0, 8.04], [8.0, 8.07], [8.0, 8.11], [8.0, 8.14], [8.0, 8.18], [25.0, 27.28], [32.0, 32.31], [32.0, 32.34], [32.0, 33.34], [37.0, 37.44], [40.0, 41.84], [45.0, 50.09], [50.0, 53.82], [61.0, 69.89], [72.0, 73.99], [75.0, 79.27], [80.0, 84.42], [89.0, 94.27], [98.0, 103.67], [107.0, 107.0], [111.0, 111.4], [117.0, 117.02], [122.0, 122.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [52.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 43.2, 85.35, 51.71, 0.0, 100.0, 48.31, 56.03, 36.95, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.67], ["cowbell", 17.52], ["music", 4.86]], null, null, null, null, [["hum", 18.12], ["speech", 12.9], ["fart", 6.49]], null, [["livestock, farm animals, working animals", 30.35], ["moo", 18.44], ["cattle, bovinae", 15.7]], null, null, null, null], "duration": [3.97, 0.01, 0.04, 0.07, 0.11, 0.14, 0.18, 2.28, 0.31, 0.34, 1.34, 0.44, 1.84, 5.09, 3.82, 8.89, 1.99, 4.27, 4.42, 5.27, 5.67, 0.0, 0.4, 0.02, 0.74]} \ No newline at end of file diff --git a/annotations_1/SroZoan9faw_filtered.json b/annotations_1/SroZoan9faw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02d61670724bb6699a184fa1e12cd642f69167e6 --- /dev/null +++ b/annotations_1/SroZoan9faw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.52], [24.0, 23.55], [24.0, 23.58], [24.0, 23.62], [24.0, 23.72], [24.0, 49.5], [51.0, 52.2], [52.0, 70.56], [74.0, 78.06], [83.0, 192.2], [193.0, 218.44]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.1, 0.0, 36.54, 32.17, 0.0, 29.14], "audiomae_on_audioset": [null, null, null, null, null, [["music", 41.5], ["theremin", 22.91], ["throbbing", 3.49]], null, [["theremin", 44.17], ["music", 30.65], ["whale vocalization", 9.72]], [["theremin", 34.69], ["music", 33.31], ["musical instrument", 9.45]], null, [["music", 28.35], ["speech", 9.69], ["hum", 8.28]]], "duration": [0.52, -0.45, -0.42, -0.38, -0.28, 25.5, 1.2, 18.56, 4.06, 109.2, 25.44]} \ No newline at end of file diff --git a/annotations_1/SrqVUFbk_sE_filtered.json b/annotations_1/SrqVUFbk_sE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b114a81a796a4d5cb02d754d504d444b0f68e11 --- /dev/null +++ b/annotations_1/SrqVUFbk_sE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.81], [11.0, 12.04], [14.0, 14.45], [15.0, 16.44], [18.0, 19.8], [21.0, 21.63], [22.0, 23.99], [26.0, 26.89], [27.0, 27.53], [30.0, 32.19], [32.0, 34.69], [37.0, 38.37], [40.0, 41.89], [46.0, 47.29], [49.0, 49.38], [51.0, 53.27], [57.0, 57.06], [58.0, 58.83], [62.0, 62.8], [68.0, 70.6], [72.0, 75.54], [76.0, 79.44], [80.0, 86.27], [87.0, 89.31], [90.0, 94.05], [95.0, 96.85], [98.0, 104.94], [107.0, 110.83], [111.0, 115.3], [116.0, 119.4], [121.0, 122.45], [123.0, 126.96], [128.0, 136.07], [136.0, 138.57], [139.0, 165.42], [167.0, 171.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 98.1, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 77.87, 53.78, 77.53, 93.76, 94.37, 84.07, 0.0, 90.6, 98.99, 59.68, 99.82, 0.0, 90.6, 98.51, 70.3, 98.01, 99.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 24.52], ["dial tone", 11.77], ["sidetone", 11.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.81, 1.04, 0.45, 1.44, 1.8, 0.63, 1.99, 0.89, 0.53, 2.19, 2.69, 1.37, 1.89, 1.29, 0.38, 2.27, 0.06, 0.83, 0.8, 2.6, 3.54, 3.44, 6.27, 2.31, 4.05, 1.85, 6.94, 3.83, 4.3, 3.4, 1.45, 3.96, 8.07, 2.57, 26.42, 4.19]} \ No newline at end of file diff --git a/annotations_1/SrvRkUwIFfk_filtered.json b/annotations_1/SrvRkUwIFfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9337632cc8aa912547544a491d9601516ea0f123 --- /dev/null +++ b/annotations_1/SrvRkUwIFfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.65], [21.0, 24.19], [26.0, 26.28], [28.0, 28.26], [28.0, 28.41], [29.0, 31.16], [32.0, 33.27], [37.0, 42.26], [42.0, 42.58], [43.0, 47.04], [47.0, 77.97], [78.0, 79.66], [80.0, 91.91], [95.0, 95.35], [97.0, 97.12], [99.0, 103.0], [103.0, 104.95], [106.0, 106.44], [108.0, 128.43], [129.0, 130.54], [131.0, 133.05], [140.0, 143.85], [147.0, 148.66], [154.0, 155.34], [164.0, 165.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.13, 99.4, 0.0, 0.0, 0.0, 99.99, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 99.96, 0.0, 0.0, 99.68, 0.0, 0.0, 94.37, 0.0, 88.1, 68.15, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.65, 3.19, 0.28, 0.26, 0.41, 2.16, 1.27, 5.26, 0.58, 4.04, 30.97, 1.66, 11.91, 0.35, 0.12, 4.0, 1.95, 0.44, 20.43, 1.54, 2.05, 3.85, 1.66, 1.34, 1.94]} \ No newline at end of file diff --git a/annotations_1/Ss5HAL8j7p8_filtered.json b/annotations_1/Ss5HAL8j7p8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e21b8c1ee845b28b8b9b13cc7ea534eb9a5819b --- /dev/null +++ b/annotations_1/Ss5HAL8j7p8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 29.13], [31.0, 33.37], [36.0, 106.88], [108.0, 110.96], [115.0, 118.47]], "keep_status": [true, true, false, true, true], "silence_prob": [31.31, 34.3, 0.0, 39.77, 38.1], "audiomae_on_audioset": [[["music", 35.2], ["throbbing", 10.36], ["electronic music", 7.66]], [["music", 29.78], ["throbbing", 12.73], ["hum", 10.22]], null, [["cattle, bovinae", 23.0], ["moo", 13.29], ["speech", 8.3]], [["speech", 37.37], ["music", 14.12], ["didgeridoo", 9.92]]], "duration": [2.13, 2.37, 70.88, 2.96, 3.47]} \ No newline at end of file diff --git a/annotations_1/StUN1G5filU_filtered.json b/annotations_1/StUN1G5filU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ecccd05b502d63586e1c81f4e186e852ee73085 --- /dev/null +++ b/annotations_1/StUN1G5filU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 27.73], [34.0, 34.45], [45.0, 46.68], [49.0, 55.88], [58.0, 58.53], [64.0, 64.74], [72.0, 72.13], [102.0, 102.42], [105.0, 106.03], [110.0, 110.03], [125.0, 126.06]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 23.6], ["didgeridoo", 23.55], ["livestock, farm animals, working animals", 11.35]], null, null, null, null, null, null, null], "duration": [-0.27, 0.45, 1.68, 6.88, 0.53, 0.74, 0.13, 0.42, 1.03, 0.03, 1.06]} \ No newline at end of file diff --git a/annotations_1/StoThowf7Y4_filtered.json b/annotations_1/StoThowf7Y4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f1737d93e7b50bb08088fdc1349df3a0d5347b2 --- /dev/null +++ b/annotations_1/StoThowf7Y4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.88], [18.0, 18.89], [19.0, 20.95], [23.0, 26.67], [30.0, 40.27], [43.0, 46.97], [48.0, 57.81], [61.0, 61.86], [67.0, 68.55], [71.0, 72.74], [78.0, 77.58], [80.0, 80.69], [83.0, 84.45], [88.0, 88.2], [91.0, 90.88], [93.0, 92.97], [97.0, 98.05], [99.0, 102.9], [104.0, 104.01], [107.0, 107.32], [111.0, 111.03], [117.0, 117.49], [118.0, 118.81], [121.0, 122.3], [124.0, 124.48], [126.0, 134.27], [137.0, 137.54]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [79.41, 0.0, 0.0, 33.02, 32.06, 33.26, 31.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.97, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 74.03], ["theremin", 5.95], ["synthesizer", 5.43]], [["hum", 46.31], ["throbbing", 14.56], ["mains hum", 12.05]], [["music", 27.17], ["throbbing", 11.85], ["hum", 11.35]], [["music", 49.48], ["throbbing", 24.9], ["hum", 11.18]], null, null, null, null, null, null, null, null, null, null, [["hum", 22.84], ["whale vocalization", 18.99], ["music", 13.65]], null, null, null, null, null, null, null, [["throbbing", 32.96], ["hum", 25.26], ["music", 15.74]], null], "duration": [4.88, 0.89, 1.95, 3.67, 10.27, 3.97, 9.81, 0.86, 1.55, 1.74, -0.42, 0.69, 1.45, 0.2, -0.12, -0.03, 1.05, 3.9, 0.01, 0.32, 0.03, 0.49, 0.81, 1.3, 0.48, 8.27, 0.54]} \ No newline at end of file diff --git a/annotations_1/StvrI9z9kLY_filtered.json b/annotations_1/StvrI9z9kLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5448fe18ea8fbe4dc03367f43415299ca7a37a92 --- /dev/null +++ b/annotations_1/StvrI9z9kLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 16.17], [17.0, 32.53], [33.0, 34.74], [37.0, 37.22], [43.0, 43.46], [44.0, 44.51], [48.0, 55.31], [56.0, 63.1], [64.0, 64.89], [66.0, 66.95], [72.0, 72.89], [80.0, 81.3], [90.0, 89.9], [91.0, 91.13], [92.0, 92.33], [96.0, 96.99], [103.0, 103.89], [113.0, 113.9], [115.0, 115.37], [118.0, 118.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.33, 50.56, 0.0, 0.0, 0.0, 0.0, 62.47, 39.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 75.64], ["musical instrument", 3.12], ["clarinet", 1.78]], null, null, null, null, null, null, [["music", 68.2], ["theremin", 9.77], ["cello", 2.87]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [13.17, 15.53, 1.74, 0.22, 0.46, 0.51, 7.31, 7.1, 0.89, 0.95, 0.89, 1.3, -0.1, 0.13, 0.33, 0.99, 0.89, 0.9, 0.37, 0.81]} \ No newline at end of file diff --git a/annotations_1/SuEt5n-k0e8_filtered.json b/annotations_1/SuEt5n-k0e8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d15a8bcdbd473683f0c1b5b936a2caa6a4154f46 --- /dev/null +++ b/annotations_1/SuEt5n-k0e8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 19.8], [23.0, 22.99], [30.0, 31.46], [37.0, 37.89], [40.0, 40.1], [43.0, 46.55], [49.0, 49.64], [53.0, 53.42], [58.0, 58.75], [65.0, 65.3], [67.0, 68.01], [69.0, 71.19], [72.0, 73.11], [75.0, 75.57], [80.0, 80.79], [81.0, 82.22], [83.0, 84.08], [88.0, 90.1], [91.0, 94.14], [98.0, 99.01], [100.0, 101.46], [107.0, 107.03], [109.0, 110.22], [111.0, 112.4], [113.0, 113.95], [115.0, 116.72], [118.0, 118.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.55, 0.0, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 0.0, 0.0, 0.0, 60.51, 0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.8, -0.01, 1.46, 0.89, 0.1, 3.55, 0.64, 0.42, 0.75, 0.3, 1.01, 2.19, 1.11, 0.57, 0.79, 1.22, 1.08, 2.1, 3.14, 1.01, 1.46, 0.03, 1.22, 1.4, 0.95, 1.72, 0.47]} \ No newline at end of file diff --git a/annotations_1/SuSUwDgtq1g_filtered.json b/annotations_1/SuSUwDgtq1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0fb2319730918ab90b8f003b0074615a5db4eca --- /dev/null +++ b/annotations_1/SuSUwDgtq1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 16.73], [23.0, 23.63], [35.0, 35.19], [49.0, 48.81], [51.0, 51.31], [54.0, 53.76], [56.0, 56.59], [60.0, 59.66], [61.0, 61.84], [68.0, 69.06], [71.0, 72.59], [79.0, 79.73], [82.0, 82.39], [86.0, 87.03], [104.0, 105.41], [110.0, 110.22], [121.0, 122.54], [123.0, 123.94], [125.0, 125.71], [138.0, 139.58], [143.0, 144.27], [146.0, 146.57], [151.0, 151.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.73, 0.63, 0.19, -0.19, 0.31, -0.24, 0.59, -0.34, 0.84, 1.06, 1.59, 0.73, 0.39, 1.03, 1.41, 0.22, 1.54, 0.94, 0.71, 1.58, 1.27, 0.57, 0.33]} \ No newline at end of file diff --git a/annotations_1/Sv-BxH3SVS8_filtered.json b/annotations_1/Sv-BxH3SVS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6188c0f75a23784697fc6b7d9e8cc2896ae676c --- /dev/null +++ b/annotations_1/Sv-BxH3SVS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [6.0, 9.05], [11.0, 12.04], [18.0, 20.31], [29.0, 31.63], [35.0, 36.54], [42.0, 44.81], [48.0, 51.66], [70.0, 71.22], [74.0, 79.71], [96.0, 96.85], [99.0, 100.33], [105.0, 107.43], [135.0, 135.04], [135.0, 137.76], [156.0, 159.33], [188.0, 188.97], [192.0, 192.33], [193.0, 195.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 93.91, 0.0, 65.55, 75.23, 0.0, 54.3, 48.74, 0.0, 29.41, 0.0, 0.0, 29.77, 0.0, 29.19, 30.69, 0.0, 0.0, 29.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 61.21], ["theremin", 7.33], ["speech", 7.08]], null, [["music", 58.59], ["theremin", 19.21], ["carnatic music", 5.36]], null, null, [["boing", 28.5], ["music", 25.6], ["singing", 5.51]], null, [["music", 45.05], ["mosquito", 7.13], ["singing", 2.95]], [["music", 68.12], ["foghorn", 8.4], ["singing", 1.77]], null, null, [["music", 22.46], ["boing", 10.09], ["carnatic music", 8.46]]], "duration": [0.66, 3.05, 1.04, 2.31, 2.63, 1.54, 2.81, 3.66, 1.22, 5.71, 0.85, 1.33, 2.43, 0.04, 2.76, 3.33, 0.97, 0.33, 2.47]} \ No newline at end of file diff --git a/annotations_1/Sw4pvbkQ-jk_filtered.json b/annotations_1/Sw4pvbkQ-jk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/Sw4pvbkQ-jk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/SwCNp21CKes_filtered.json b/annotations_1/SwCNp21CKes_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0b822b84d554a3ae515a4ca4380233acb43f2ed --- /dev/null +++ b/annotations_1/SwCNp21CKes_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [4.0, 4.51], [11.0, 12.48], [28.0, 28.22], [34.0, 36.09], [62.0, 62.04], [77.0, 82.54], [87.0, 87.4]], "keep_status": [false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.66, 0.0, 41.3, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 34.42], ["music", 4.81], ["cattle, bovinae", 4.78]], null, [["music", 45.9], ["sonar", 14.38], ["hum", 8.52]], null], "duration": [0.74, 0.51, 1.48, 0.22, 2.09, 0.04, 5.54, 0.4]} \ No newline at end of file diff --git a/annotations_1/SwarL21fqj0_filtered.json b/annotations_1/SwarL21fqj0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4c71c4b6f07961366dd53ece0e7e5e13c3d0ef1 --- /dev/null +++ b/annotations_1/SwarL21fqj0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.75], [10.0, 10.71], [13.0, 12.61], [14.0, 15.9], [17.0, 38.74], [41.0, 54.53], [59.0, 62.85], [66.0, 89.23], [91.0, 93.61], [94.0, 109.32]], "keep_status": [true, false, false, false, true, false, false, false, false, false], "silence_prob": [33.46, 0.0, 0.0, 0.0, 31.08, 30.73, 30.94, 29.43, 28.59, 30.53], "audiomae_on_audioset": [[["breaking", 26.09], ["whack, thwack", 11.01], ["crack", 6.79]], null, null, null, [["music", 38.26], ["throbbing", 16.86], ["whack, thwack", 11.19]], [["music", 62.89], ["speech", 6.2], ["crack", 3.81]], [["music", 40.92], ["throbbing", 21.95], ["hum", 15.33]], [["music", 43.17], ["throbbing", 25.01], ["hum", 12.76]], [["music", 64.24], ["throbbing", 8.26], ["hum", 8.25]], [["throbbing", 41.68], ["hum", 24.6], ["music", 22.46]]], "duration": [2.75, 0.71, -0.39, 1.9, 21.74, 13.53, 3.85, 23.23, 2.61, 15.32]} \ No newline at end of file diff --git a/annotations_1/SwjKQrYpe-g_filtered.json b/annotations_1/SwjKQrYpe-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48801f7b2191a2b83644ba15197090cdebce0b77 --- /dev/null +++ b/annotations_1/SwjKQrYpe-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.31], [6.0, 6.66], [19.0, 19.87], [30.0, 35.61], [36.0, 37.57], [41.0, 42.58], [43.0, 44.56], [45.0, 49.03], [51.0, 51.29], [52.0, 51.85], [52.0, 56.29], [59.0, 60.51], [64.0, 78.48], [80.0, 80.1], [81.0, 83.37], [85.0, 87.18], [88.0, 89.09], [90.0, 90.95], [92.0, 111.75], [112.0, 118.94], [120.0, 128.66], [129.0, 153.37], [157.0, 165.0]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false, true, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 30.42, 0.0, 0.0, 0.0, 33.54, 0.0, 0.0, 29.3, 0.0, 29.85, 0.0, 32.57, 36.66, 0.0, 0.0, 29.26, 29.31, 37.19, 29.38, 28.47], "audiomae_on_audioset": [null, null, null, [["whack, thwack", 52.01], ["ding", 8.75], ["breaking", 4.0]], null, null, null, [["music", 51.16], ["speech", 15.11], ["boing", 10.85]], null, null, [["whack, thwack", 23.16], ["whip", 9.59], ["music", 9.05]], null, [["music", 50.63], ["didgeridoo", 7.91], ["whack, thwack", 7.44]], null, [["music", 41.61], ["crack", 9.62], ["thunk", 8.62]], [["music", 40.58], ["speech", 33.93], ["boing", 3.11]], null, null, [["whack, thwack", 86.14], ["music", 5.17], ["thunk", 0.91]], [["beatboxing", 20.86], ["speech", 20.37], ["whack, thwack", 16.72]], [["music", 21.36], ["groan", 19.14], ["cattle, bovinae", 7.6]], [["whack, thwack", 32.29], ["music", 21.2], ["breaking", 4.88]], [["whack, thwack", 35.15], ["music", 19.02], ["speech", 11.53]]], "duration": [1.31, 0.66, 0.87, 5.61, 1.57, 1.58, 1.56, 4.03, 0.29, -0.15, 4.29, 1.51, 14.48, 0.1, 2.37, 2.18, 1.09, 0.95, 19.75, 6.94, 8.66, 24.37, 8.0]} \ No newline at end of file diff --git a/annotations_1/SxJcAxTBKOk_filtered.json b/annotations_1/SxJcAxTBKOk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d0828dfe96f15eca8189f6b1d756b740527ee4d --- /dev/null +++ b/annotations_1/SxJcAxTBKOk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.97], [13.0, 13.49], [15.0, 15.72], [17.0, 17.56], [23.0, 23.72], [29.0, 31.02], [31.0, 31.09], [32.0, 32.58], [36.0, 36.75], [50.0, 58.4], [63.0, 70.7], [87.0, 102.34], [104.0, 106.79], [108.0, 115.1], [117.0, 122.22]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, true, false], "silence_prob": [30.52, 0.0, 0.0, 0.0, 0.0, 32.24, 0.0, 0.0, 0.0, 31.12, 30.31, 29.38, 46.5, 44.52, 63.96], "audiomae_on_audioset": [[["music", 52.83], ["hum", 18.29], ["thunk", 6.11]], null, null, null, null, [["music", 40.98], ["throbbing", 30.81], ["hum", 5.83]], null, null, null, [["didgeridoo", 26.09], ["speech", 23.05], ["music", 19.62]], [["speech", 46.42], ["whack, thwack", 9.71], ["thunk", 7.0]], [["speech", 69.65], ["helicopter", 20.45], ["music", 4.24]], [["speech", 47.57], ["music", 8.43], ["walk, footsteps", 6.49]], [["telephone dialing, dtmf", 35.64], ["music", 12.2], ["sidetone", 8.41]], null], "duration": [3.97, 0.49, 0.72, 0.56, 0.72, 2.02, 0.09, 0.58, 0.75, 8.4, 7.7, 15.34, 2.79, 7.1, 5.22]} \ No newline at end of file diff --git a/annotations_1/Sy_thm1fviY_filtered.json b/annotations_1/Sy_thm1fviY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ee5725e630b64e43e6dce63d4925f45512a48ae --- /dev/null +++ b/annotations_1/Sy_thm1fviY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 24.56], [26.0, 29.0], [31.0, 41.88], [44.0, 74.36], [75.0, 79.41], [83.0, 83.34], [84.0, 106.84], [107.0, 109.44], [112.0, 114.67], [117.0, 118.54], [119.0, 128.44], [129.0, 130.32]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [54.83, 65.55, 65.55, 0.0, 60.05, 0.0, 64.18, 47.78, 56.48, 0.0, 30.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["whale vocalization", 32.56], ["music", 8.08], ["sonar", 7.27]], null, null, [["speech", 74.95], ["boing", 3.47], ["sound effect", 2.69]], null], "duration": [14.56, 3.0, 10.88, 30.36, 4.41, 0.34, 22.84, 2.44, 2.67, 1.54, 9.44, 1.32]} \ No newline at end of file diff --git a/annotations_1/SzVC7ErC8RY_filtered.json b/annotations_1/SzVC7ErC8RY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79cfea2ac0fb8afdd237f570a1c0f14e1260e62d --- /dev/null +++ b/annotations_1/SzVC7ErC8RY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 27.7], [40.0, 41.34], [44.0, 44.49], [61.0, 64.39], [65.0, 66.41], [69.0, 71.44], [72.0, 73.41], [76.0, 76.05], [78.0, 80.43], [83.0, 84.05], [89.0, 89.63], [90.0, 94.54], [95.0, 99.47], [102.0, 116.18], [131.0, 131.45], [137.0, 136.75], [139.0, 139.53], [144.0, 145.93], [151.0, 152.0], [154.0, 153.82], [161.0, 161.87], [163.0, 164.74], [166.0, 169.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 99.98, 0.0, 0.0, 74.6, 88.83, 51.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.7, 1.34, 0.49, 3.39, 1.41, 2.44, 1.41, 0.05, 2.43, 1.05, 0.63, 4.54, 4.47, 14.18, 0.45, -0.25, 0.53, 1.93, 1.0, -0.18, 0.87, 1.74, 3.62]} \ No newline at end of file diff --git a/annotations_1/SzlHzRvw-MI_filtered.json b/annotations_1/SzlHzRvw-MI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fd7b737570a406ab4619110b37b44baafee1d88 --- /dev/null +++ b/annotations_1/SzlHzRvw-MI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.32], [4.0, 5.14], [6.0, 7.03], [8.0, 8.7], [11.0, 11.03], [12.0, 19.53], [21.0, 23.45], [24.0, 24.9], [29.0, 29.74], [30.0, 31.53], [32.0, 33.86], [34.0, 35.55], [39.0, 42.09], [43.0, 44.93], [46.0, 53.47], [55.0, 57.11], [62.0, 63.26], [64.0, 65.06], [66.0, 67.05], [74.0, 79.02], [82.0, 87.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 70.86, 100.0, 0.0, 0.0, 0.0, 80.82, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 1.14, 1.03, 0.7, 0.03, 7.53, 2.45, 0.9, 0.74, 1.53, 1.86, 1.55, 3.09, 1.93, 7.47, 2.11, 1.26, 1.06, 1.05, 5.02, 5.44]} \ No newline at end of file diff --git a/annotations_1/T-ELiRFK_v0_filtered.json b/annotations_1/T-ELiRFK_v0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14330c9f3f0c0417de9a4d12756e453e795df48f --- /dev/null +++ b/annotations_1/T-ELiRFK_v0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.91], [7.0, 7.16], [8.0, 8.43], [17.0, 17.15], [19.0, 20.34], [21.0, 21.68], [27.0, 27.55], [30.0, 39.18]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 32.79], ["whale vocalization", 15.95], ["mains hum", 7.77]]], "duration": [1.91, 0.16, 0.43, 0.15, 1.34, 0.68, 0.55, 9.18]} \ No newline at end of file diff --git a/annotations_1/T1IyMJOC0JM_filtered.json b/annotations_1/T1IyMJOC0JM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..076c6cc24d8f5cda939b11b4ca8aea77a47bfce9 --- /dev/null +++ b/annotations_1/T1IyMJOC0JM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.11], [16.0, 18.39], [22.0, 26.59], [31.0, 32.88], [52.0, 52.37], [65.0, 65.18], [69.0, 70.71], [74.0, 76.06], [79.0, 79.42], [87.0, 87.02], [92.0, 95.23], [101.0, 106.68], [114.0, 115.35], [116.0, 127.97], [130.0, 129.83], [133.0, 152.0], [154.0, 161.06], [163.0, 192.01]], "keep_status": [true, true, true, false, false, false, false, true, false, false, false, false, false, true, false, false, true, true], "silence_prob": [37.89, 43.2, 29.61, 0.0, 0.0, 0.0, 0.0, 33.05, 0.0, 0.0, 29.93, 30.83, 0.0, 30.26, 0.0, 29.23, 30.13, 29.23], "audiomae_on_audioset": [[["music", 41.27], ["fly, housefly", 8.29], ["mosquito", 7.16]], [["music", 42.14], ["speech", 11.86], ["hum", 4.46]], [["explosion", 22.4], ["music", 18.2], ["burst, pop", 11.43]], null, null, null, null, [["sound effect", 19.99], ["fly, housefly", 8.98], ["music", 8.01]], null, null, [["cattle, bovinae", 36.67], ["livestock, farm animals, working animals", 28.93], ["moo", 20.82]], [["music", 71.97], ["groan", 6.46], ["speech", 5.24]], null, [["fly, housefly", 30.11], ["mosquito", 16.87], ["insect", 13.41]], null, [["music", 39.66], ["speech", 36.78], ["vehicle", 2.87]], [["music", 49.32], ["brass instrument", 5.13], ["trombone", 4.55]], [["music", 34.21], ["theremin", 10.97], ["didgeridoo", 4.54]]], "duration": [4.11, 2.39, 4.59, 1.88, 0.37, 0.18, 1.71, 2.06, 0.42, 0.02, 3.23, 5.68, 1.35, 11.97, -0.17, 19.0, 7.06, 29.01]} \ No newline at end of file diff --git a/annotations_1/T2ph28ghuEU_filtered.json b/annotations_1/T2ph28ghuEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf132990167a16faabe26d6501d35b8d37930a52 --- /dev/null +++ b/annotations_1/T2ph28ghuEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.23], [9.0, 36.8], [38.0, 39.04], [40.0, 61.99], [65.0, 66.31], [71.0, 114.94], [115.0, 182.87], [185.0, 211.42]], "keep_status": [false, true, false, true, false, false, false, false], "silence_prob": [0.0, 30.88, 0.0, 35.67, 0.0, 0.0, 0.0, 33.19], "audiomae_on_audioset": [null, [["music", 57.54], ["electronic music", 2.67], ["buzz", 2.57]], null, [["speech", 20.82], ["fly, housefly", 13.98], ["music", 11.12]], null, null, null, [["music", 87.3], ["electronic music", 1.16], ["video game music", 0.94]]], "duration": [1.23, 27.8, 1.04, 21.99, 1.31, 43.94, 67.87, 26.42]} \ No newline at end of file diff --git a/annotations_1/T31h3L_egm8_filtered.json b/annotations_1/T31h3L_egm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..431981d1d974b7ce186f32c67cfa50286f5a2682 --- /dev/null +++ b/annotations_1/T31h3L_egm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.92], [4.0, 4.38], [7.0, 6.64], [11.0, 11.48], [12.0, 12.88], [13.0, 13.49], [16.0, 17.05], [17.0, 19.21], [21.0, 23.92], [25.0, 26.23], [27.0, 27.6], [35.0, 34.84], [36.0, 40.81], [44.0, 53.99], [58.0, 58.46], [68.0, 68.59], [74.0, 108.48], [110.0, 114.62], [117.0, 120.06], [121.0, 122.49], [124.0, 125.27], [128.0, 128.17], [132.0, 133.12], [135.0, 135.01], [136.0, 136.88], [138.0, 137.89], [139.0, 140.27], [145.0, 146.31], [150.0, 150.85], [152.0, 152.27], [157.0, 157.38], [159.0, 160.34], [160.0, 162.26], [164.0, 169.97], [171.0, 173.4]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.49, 46.75, 0.0, 0.0, 0.0, 40.36, 45.75, 0.0, 0.0, 0.0, 42.11, 44.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.36, 38.2, 60.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 26.75], ["mains hum", 13.21], ["throbbing", 12.87]], [["music", 65.24], ["throbbing", 3.07], ["synthesizer", 3.03]], null, null, null, [["hum", 22.88], ["music", 21.32], ["throbbing", 15.77]], [["music", 38.41], ["hum", 23.79], ["throbbing", 7.68]], null, null, null, [["theremin", 68.86], ["hum", 15.78], ["music", 5.23]], [["civil defense siren", 17.9], ["singing bowl", 11.74], ["music", 10.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 26.95], ["mains hum", 22.38], ["music", 7.36]], null], "duration": [0.92, 0.38, -0.36, 0.48, 0.88, 0.49, 1.05, 2.21, 2.92, 1.23, 0.6, -0.16, 4.81, 9.99, 0.46, 0.59, 34.48, 4.62, 3.06, 1.49, 1.27, 0.17, 1.12, 0.01, 0.88, -0.11, 1.27, 1.31, 0.85, 0.27, 0.38, 1.34, 2.26, 5.97, 2.4]} \ No newline at end of file diff --git a/annotations_1/T3zIklxWw44_filtered.json b/annotations_1/T3zIklxWw44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b284422ef5ef7892ab4d09aa25b824f126a3117 --- /dev/null +++ b/annotations_1/T3zIklxWw44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [13.0, 14.57], [15.0, 14.71], [15.0, 16.73], [18.0, 20.22], [22.0, 24.56], [25.0, 28.39], [30.0, 30.89], [31.0, 33.83], [36.0, 38.35], [39.0, 44.36], [45.0, 45.98], [49.0, 49.32], [51.0, 53.08], [57.0, 58.06], [65.0, 66.78], [67.0, 67.61], [69.0, 69.97], [71.0, 80.1], [81.0, 85.99], [87.0, 89.75], [91.0, 91.61], [96.0, 98.14], [99.0, 101.49], [105.0, 105.9], [108.0, 108.3], [112.0, 112.78], [114.0, 116.53], [118.0, 118.18], [119.0, 121.93], [123.0, 125.44], [126.0, 127.55], [128.0, 135.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.87, 100.0, 91.98, 0.0, 94.66, 100.0, 99.82, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.9, 100.0, 100.0, 0.0, 97.54, 79.07, 0.0, 0.0, 0.0, 100.0, 0.0, 86.64, 100.0, 0.0, 99.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 1.57, -0.29, 1.73, 2.22, 2.56, 3.39, 0.89, 2.83, 2.35, 5.36, 0.98, 0.32, 2.08, 1.06, 1.78, 0.61, 0.97, 9.1, 4.99, 2.75, 0.61, 2.14, 2.49, 0.9, 0.3, 0.78, 2.53, 0.18, 2.93, 2.44, 1.55, 7.7]} \ No newline at end of file diff --git a/annotations_1/T4WNCHc_MmQ_filtered.json b/annotations_1/T4WNCHc_MmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39b34f140e5d50b5c7ac1b02f7da93c37f566f7c --- /dev/null +++ b/annotations_1/T4WNCHc_MmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 39.8], [41.0, 44.44], [46.0, 130.23], [132.0, 149.96], [150.0, 150.03], [151.0, 180.69]], "keep_status": [false, false, false, false, false, false], "silence_prob": [28.77, 33.22, 0.0, 29.22, 0.0, 28.52], "audiomae_on_audioset": [[["music", 27.46], ["hum", 27.11], ["mains hum", 19.46]], [["music", 35.1], ["hum", 24.35], ["throbbing", 13.44]], null, [["mains hum", 32.61], ["music", 23.69], ["hum", 22.49]], null, [["throbbing", 38.89], ["music", 30.88], ["hum", 5.96]]], "duration": [10.8, 3.44, 84.23, 17.96, 0.03, 29.69]} \ No newline at end of file diff --git a/annotations_1/T5CoWL_wdC4_filtered.json b/annotations_1/T5CoWL_wdC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5afde7deb613c74dae826bc1cf2c63d7826e197 --- /dev/null +++ b/annotations_1/T5CoWL_wdC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.13], [3.0, 11.2], [11.0, 11.72], [16.0, 18.06], [25.0, 28.39], [31.0, 35.61], [38.0, 40.93], [42.0, 42.7], [44.0, 44.36], [45.0, 46.33], [49.0, 50.41], [64.0, 74.65], [79.0, 80.62], [84.0, 103.42], [109.0, 110.64], [115.0, 121.31], [122.0, 121.95]], "keep_status": [false, false, false, true, true, false, true, false, false, false, false, true, false, true, false, true, false], "silence_prob": [0.0, 33.83, 0.0, 34.61, 31.16, 37.83, 33.34, 0.0, 0.0, 0.0, 0.0, 29.9, 0.0, 28.99, 0.0, 47.9, 0.0], "audiomae_on_audioset": [null, [["music", 50.76], ["hum", 12.0], ["mains hum", 7.55]], null, [["music", 30.32], ["speech", 14.44], ["didgeridoo", 11.13]], [["music", 21.47], ["hum", 10.99], ["mains hum", 10.52]], [["didgeridoo", 26.69], ["music", 24.86], ["grunt", 22.09]], [["hum", 38.16], ["speech", 18.74], ["throbbing", 11.81]], null, null, null, null, [["music", 34.11], ["speech", 7.94], ["buzz", 6.29]], null, [["music", 30.11], ["quack", 9.42], ["groan", 7.12]], null, [["music", 44.81], ["theremin", 6.86], ["musical instrument", 3.9]], null], "duration": [0.13, 8.2, 0.72, 2.06, 3.39, 4.61, 2.93, 0.7, 0.36, 1.33, 1.41, 10.65, 1.62, 19.42, 1.64, 6.31, -0.05]} \ No newline at end of file diff --git a/annotations_1/T5KjTcbQVMs_filtered.json b/annotations_1/T5KjTcbQVMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca8dd2bac9b4af9307ad4182f21d1b6a5f71d0bb --- /dev/null +++ b/annotations_1/T5KjTcbQVMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.63], [5.0, 14.25], [19.0, 20.66], [21.0, 22.87], [25.0, 25.81], [28.0, 29.0], [30.0, 34.45], [35.0, 36.12], [40.0, 80.38], [81.0, 90.44], [95.0, 110.3], [112.0, 113.19], [116.0, 116.55], [119.0, 123.65], [126.0, 126.66], [127.0, 127.77], [129.0, 130.91], [137.0, 138.18], [140.0, 141.47], [146.0, 149.34], [151.0, 153.89], [155.0, 160.64], [161.0, 169.32], [171.0, 172.67], [174.0, 175.44], [179.0, 180.79], [184.0, 186.11], [189.0, 192.84], [195.0, 198.19], [202.0, 202.44], [205.0, 205.65]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 36.73, 0.0, 0.0, 0.0, 0.0, 30.78, 0.0, 0.0, 40.62, 33.0, 0.0, 0.0, 32.93, 0.0, 0.0, 0.0, 0.0, 0.0, 52.86, 58.05, 30.15, 30.77, 0.0, 0.0, 0.0, 29.69, 28.88, 29.07, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 59.56], ["whale vocalization", 4.86], ["animal", 3.98]], null, null, null, null, [["speech", 37.35], ["hum", 17.68], ["sidetone", 13.93]], null, null, [["thunk", 38.19], ["music", 36.73], ["tap", 3.53]], [["music", 40.21], ["speech", 39.35], ["whale vocalization", 2.96]], null, null, [["music", 26.99], ["speech", 15.37], ["whale vocalization", 8.51]], null, null, null, null, null, null, null, [["speech", 45.4], ["music", 16.27], ["cattle, bovinae", 7.42]], [["throbbing", 29.01], ["hum", 25.97], ["music", 19.96]], null, null, null, [["music", 16.79], ["speech", 12.89], ["vehicle", 7.67]], [["livestock, farm animals, working animals", 50.74], ["cattle, bovinae", 24.44], ["moo", 18.26]], [["music", 34.05], ["throbbing", 4.46], ["hum", 3.64]], null, null], "duration": [1.63, 9.25, 1.66, 1.87, 0.81, 1.0, 4.45, 1.12, 40.38, 9.44, 15.3, 1.19, 0.55, 4.65, 0.66, 0.77, 1.91, 1.18, 1.47, 3.34, 2.89, 5.64, 8.32, 1.67, 1.44, 1.79, 2.11, 3.84, 3.19, 0.44, 0.65]} \ No newline at end of file diff --git a/annotations_1/T5cFTmim4Rw_filtered.json b/annotations_1/T5cFTmim4Rw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebb45ae22d97f8c4f50342d2f800458a94f3b870 --- /dev/null +++ b/annotations_1/T5cFTmim4Rw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[64.0, 99.96], [101.0, 112.77]], "keep_status": [false, true], "silence_prob": [0.0, 31.01], "audiomae_on_audioset": [null, [["buzz", 15.56], ["fly, housefly", 9.45], ["music", 7.83]]], "duration": [35.96, 11.77]} \ No newline at end of file diff --git a/annotations_1/T5p0IaOt3tQ_filtered.json b/annotations_1/T5p0IaOt3tQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc1752f2747f67cb3291696799966127885bbf0a --- /dev/null +++ b/annotations_1/T5p0IaOt3tQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.51], [3.0, 4.41], [8.0, 9.51], [10.0, 10.0], [12.0, 12.31], [19.0, 19.14], [20.0, 27.33], [27.0, 28.75], [30.0, 30.43], [31.0, 32.32], [36.0, 36.56], [52.0, 52.86], [61.0, 60.79], [68.0, 68.74], [69.0, 69.55], [73.0, 73.67], [74.0, 74.95], [78.0, 78.27], [79.0, 79.14], [80.0, 80.62], [83.0, 88.45], [95.0, 95.64], [96.0, 96.48], [105.0, 105.07], [105.0, 106.15], [109.0, 108.67], [113.0, 113.61], [119.0, 119.38], [120.0, 121.0], [122.0, 122.62], [130.0, 132.9], [134.0, 142.08], [142.0, 153.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.67, 36.86, 35.87], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 79.44], ["noise", 6.22], ["beatboxing", 2.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.27], ["sidetone", 20.06], ["telephone", 11.2]], null, null, null, null, null, null, null, null, null, null, [["music", 37.57], ["musical instrument", 8.74], ["synthesizer", 6.95]], [["music", 54.58], ["brass instrument", 7.55], ["musical instrument", 7.4]]], "duration": [1.51, 1.41, 1.51, 0.0, 0.31, 0.14, 7.33, 1.75, 0.43, 1.32, 0.56, 0.86, -0.21, 0.74, 0.55, 0.67, 0.95, 0.27, 0.14, 0.62, 5.45, 0.64, 0.48, 0.07, 1.15, -0.33, 0.61, 0.38, 1.0, 0.62, 2.9, 8.08, 11.27]} \ No newline at end of file diff --git a/annotations_1/T5rzOU-4Bkc_filtered.json b/annotations_1/T5rzOU-4Bkc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89ec3100714cf98854554649cefd331f2553cb04 --- /dev/null +++ b/annotations_1/T5rzOU-4Bkc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.48], [7.0, 14.93], [17.0, 32.09], [34.0, 33.98], [38.0, 38.15], [40.0, 43.98], [45.0, 46.11], [50.0, 50.31], [52.0, 53.99], [55.0, 55.73], [58.0, 59.04], [65.0, 65.87], [68.0, 72.98], [88.0, 87.83], [90.0, 94.69], [95.0, 95.71], [97.0, 96.82], [98.0, 99.71], [101.0, 100.84], [105.0, 109.61], [111.0, 111.84], [113.0, 125.71], [127.0, 133.12], [134.0, 133.66], [134.0, 133.69], [134.0, 133.73], [134.0, 133.76], [134.0, 162.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.44, 30.75, 54.23, 0.0, 0.0, 91.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 81.35, 0.0, 0.0, 0.0, 0.0, 98.73, 0.0, 82.79, 65.67, 0.0, 0.0, 0.0, 0.0, 76.37], "audiomae_on_audioset": [[["music", 50.88], ["didgeridoo", 24.2], ["theremin", 3.0]], [["music", 49.29], ["throbbing", 14.74], ["electronic music", 10.98]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.48, 7.93, 15.09, -0.02, 0.15, 3.98, 1.11, 0.31, 1.99, 0.73, 1.04, 0.87, 4.98, -0.17, 4.69, 0.71, -0.18, 1.71, -0.16, 4.61, 0.84, 12.71, 6.12, -0.34, -0.31, -0.27, -0.24, 28.68]} \ No newline at end of file diff --git a/annotations_1/T69FlogsAGI_filtered.json b/annotations_1/T69FlogsAGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a695c17cd4cc7f9fc09b524427a856ba3940f9f --- /dev/null +++ b/annotations_1/T69FlogsAGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.11], [8.0, 8.55], [11.0, 18.42], [22.0, 23.18], [27.0, 62.63], [63.0, 65.03], [66.0, 66.87], [68.0, 68.45], [69.0, 69.67], [70.0, 71.04], [72.0, 73.18], [75.0, 77.52], [79.0, 80.84], [82.0, 89.55], [90.0, 92.35], [93.0, 93.51], [94.0, 94.91], [95.0, 95.81], [97.0, 97.09], [98.0, 98.37], [99.0, 99.84], [100.0, 101.07], [102.0, 102.37], [103.0, 103.59], [104.0, 122.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 61.47, 0.0, 0.0, 63.1, 0.0, 0.0, 0.0, 0.0, 0.0, 88.64, 0.0, 56.63, 52.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.22], ["noise", 10.97], ["synthesizer", 7.89]]], "duration": [1.11, 0.55, 7.42, 1.18, 35.63, 2.03, 0.87, 0.45, 0.67, 1.04, 1.18, 2.52, 1.84, 7.55, 2.35, 0.51, 0.91, 0.81, 0.09, 0.37, 0.84, 1.07, 0.37, 0.59, 18.44]} \ No newline at end of file diff --git a/annotations_1/T7kklmGWLDk_filtered.json b/annotations_1/T7kklmGWLDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bf88b0f40eded9982ad3bc20584d3ab829f4ea7 --- /dev/null +++ b/annotations_1/T7kklmGWLDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.44], [13.0, 16.73], [19.0, 20.02], [21.0, 33.88], [35.0, 36.51], [38.0, 40.59], [42.0, 42.96], [45.0, 45.82], [48.0, 49.55], [52.0, 55.46], [57.0, 58.16], [60.0, 60.86], [65.0, 67.78], [71.0, 76.98], [79.0, 79.52], [80.0, 82.59], [87.0, 88.33], [90.0, 91.07], [92.0, 92.7], [94.0, 94.36], [99.0, 100.75], [109.0, 108.78], [112.0, 111.89], [123.0, 123.33], [140.0, 143.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 73.51, 0.0, 42.08, 0.0, 64.29, 0.0, 0.0, 0.0, 94.95, 0.0, 0.0, 35.64, 65.32, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.47], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 55.72], ["mosquito", 23.51], ["insect", 8.8]], null, null, null, null, null, null, null, null, [["fart", 29.52], ["fly, housefly", 7.21], ["speech", 6.81]], null, null, null, null, null, null, null, null, null, null, null, [["laughter", 34.84], ["snicker", 14.31], ["chuckle, chortle", 11.77]]], "duration": [1.44, 3.73, 1.02, 12.88, 1.51, 2.59, 0.96, 0.82, 1.55, 3.46, 1.16, 0.86, 2.78, 5.98, 0.52, 2.59, 1.33, 1.07, 0.7, 0.36, 1.75, -0.22, -0.11, 0.33, 3.82]} \ No newline at end of file diff --git a/annotations_1/T8KFieVkVkU_filtered.json b/annotations_1/T8KFieVkVkU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a0f80ebe1f594f5811b2f0d5e599d08a187980a --- /dev/null +++ b/annotations_1/T8KFieVkVkU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [13.0, 15.08], [21.0, 21.59], [23.0, 25.19], [41.0, 41.67], [46.0, 45.86], [49.0, 50.63], [56.0, 56.52], [58.0, 59.93], [62.0, 66.63], [69.0, 69.31], [70.0, 71.66]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.86, 0.0, 31.73, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["buzzer", 26.33], ["sliding door", 6.49], ["telephone", 5.33]], null, null, null, null, null, null, null, null], "duration": [0.64, 2.08, 0.59, 2.19, 0.67, -0.14, 1.63, 0.52, 1.93, 4.63, 0.31, 1.66]} \ No newline at end of file diff --git a/annotations_1/TAK8DeL_w00_filtered.json b/annotations_1/TAK8DeL_w00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcc8473f93332ed220672d244740dd4aa62c8c64 --- /dev/null +++ b/annotations_1/TAK8DeL_w00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.55], [24.0, 24.36], [25.0, 26.28], [27.0, 28.05], [29.0, 30.45], [35.0, 36.75], [38.0, 39.63], [46.0, 50.82], [60.0, 61.28], [63.0, 64.42], [65.0, 66.41], [77.0, 79.95], [86.0, 86.46], [100.0, 104.21], [110.0, 114.0], [125.0, 125.54], [128.0, 130.38], [134.0, 134.59], [136.0, 141.25], [151.0, 152.54], [157.0, 163.11], [164.0, 169.59], [170.0, 172.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 99.93, 0.0, 65.55, 84.43, 0.0, 77.7, 0.0, 73.36, 0.0, 78.55, 74.76, 97.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 0.36, 1.28, 1.05, 1.45, 1.75, 1.63, 4.82, 1.28, 1.42, 1.41, 2.95, 0.46, 4.21, 4.0, 0.54, 2.38, 0.59, 5.25, 1.54, 6.11, 5.59, 2.29]} \ No newline at end of file diff --git a/annotations_1/TBHjt3AyALw_filtered.json b/annotations_1/TBHjt3AyALw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec1428d446cdeb59cf6d30ff07cc981b2676d730 --- /dev/null +++ b/annotations_1/TBHjt3AyALw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.61], [6.0, 6.66], [13.0, 13.59], [15.0, 16.34], [17.0, 17.2], [18.0, 20.36], [21.0, 21.93], [22.0, 22.67], [23.0, 23.35], [25.0, 25.76], [27.0, 27.18], [29.0, 29.19], [30.0, 30.4], [32.0, 32.75], [36.0, 36.14], [41.0, 40.88], [48.0, 50.45], [52.0, 54.31], [55.0, 57.86], [59.0, 59.76], [63.0, 63.27], [67.0, 71.88], [73.0, 74.55], [76.0, 79.84], [80.0, 80.92], [82.0, 83.27], [87.0, 87.51], [88.0, 88.89], [92.0, 92.25], [94.0, 97.65], [100.0, 102.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.69, 100.0, 99.91, 0.0, 0.0, 60.79, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.45], ["electronic music", 6.03], ["sidetone", 4.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 0.66, 0.59, 1.34, 0.2, 2.36, 0.93, 0.67, 0.35, 0.76, 0.18, 0.19, 0.4, 0.75, 0.14, -0.12, 2.45, 2.31, 2.86, 0.76, 0.27, 4.88, 1.55, 3.84, 0.92, 1.27, 0.51, 0.89, 0.25, 3.65, 2.52]} \ No newline at end of file diff --git a/annotations_1/TC41JxKq_xQ_filtered.json b/annotations_1/TC41JxKq_xQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..977d6fe3f7f4826f1e84186a7d6b86126c2babb1 --- /dev/null +++ b/annotations_1/TC41JxKq_xQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.48], [10.0, 16.02], [18.0, 19.4], [22.0, 30.5], [34.0, 35.53], [37.0, 38.52], [40.0, 41.64], [42.0, 43.78], [46.0, 48.2], [48.0, 53.62], [56.0, 57.5], [62.0, 63.88], [64.0, 78.21], [84.0, 84.5], [85.0, 88.92], [92.0, 98.46], [109.0, 124.78], [126.0, 126.06], [129.0, 138.03]], "keep_status": [false, true, false, true, false, false, false, false, true, true, false, false, false, false, false, false, true, false, true], "silence_prob": [32.57, 32.79, 0.0, 31.66, 0.0, 0.0, 0.0, 0.0, 30.56, 31.39, 0.0, 0.0, 31.4, 0.0, 31.06, 31.91, 31.12, 0.0, 43.51], "audiomae_on_audioset": [[["speech", 47.52], ["music", 26.08], ["animal", 3.45]], [["music", 36.3], ["mosquito", 7.09], ["speech", 7.04]], null, [["music", 39.0], ["speech", 8.98], ["fly, housefly", 5.84]], null, null, null, null, [["siren", 31.86], ["civil defense siren", 25.92], ["whir", 4.57]], [["boing", 51.7], ["music", 9.32], ["buzz", 4.63]], null, null, [["music", 62.0], ["speech", 15.39], ["synthesizer", 5.38]], null, [["music", 63.61], ["speech", 6.73], ["cattle, bovinae", 5.97]], [["music", 62.39], ["speech", 8.34], ["fart", 2.15]], [["music", 58.66], ["speech", 4.79], ["musical instrument", 3.0]], null, [["whale vocalization", 28.83], ["music", 15.89], ["sidetone", 6.2]]], "duration": [3.48, 6.02, 1.4, 8.5, 1.53, 1.52, 1.64, 1.78, 2.2, 5.62, 1.5, 1.88, 14.21, 0.5, 3.92, 6.46, 15.78, 0.06, 9.03]} \ No newline at end of file diff --git a/annotations_1/TChg5dQ36WM_filtered.json b/annotations_1/TChg5dQ36WM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b79cc68902b4435e20a1ed28b300b4fd0cd1b0a1 --- /dev/null +++ b/annotations_1/TChg5dQ36WM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.59], [15.0, 15.26], [16.0, 16.9], [17.0, 18.39], [27.0, 27.55], [33.0, 34.45], [35.0, 35.01], [37.0, 38.33], [39.0, 40.47], [53.0, 53.81], [55.0, 56.05], [69.0, 69.33], [76.0, 76.23], [78.0, 78.98], [80.0, 81.94], [82.0, 83.69], [87.0, 88.87], [96.0, 97.9], [99.0, 100.75], [103.0, 103.76], [104.0, 106.24], [110.0, 110.74], [119.0, 121.47], [122.0, 149.57], [154.0, 159.78], [160.0, 162.13], [163.0, 163.7], [166.0, 166.83], [169.0, 169.89], [171.0, 177.43], [178.0, 183.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.67, 0.0, 95.91, 82.61, 87.74, 47.74, 0.0, 0.0, 0.0, 81.71, 57.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.81], ["hum", 11.12], ["sine wave", 9.07]], null, null, null, null, null], "duration": [0.59, 0.26, 0.9, 1.39, 0.55, 1.45, 0.01, 1.33, 1.47, 0.81, 1.05, 0.33, 0.23, 0.98, 1.94, 1.69, 1.87, 1.9, 1.75, 0.76, 2.24, 0.74, 2.47, 27.57, 5.78, 2.13, 0.7, 0.83, 0.89, 6.43, 5.46]} \ No newline at end of file diff --git a/annotations_1/TEZq-_XkcRA_filtered.json b/annotations_1/TEZq-_XkcRA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2f203d5fba1f3071d2215f3f03e9f9a935278e8 --- /dev/null +++ b/annotations_1/TEZq-_XkcRA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.77], [12.0, 12.14], [13.0, 15.08], [19.0, 20.56], [23.0, 34.25], [36.0, 37.61], [43.0, 44.86], [48.0, 47.82], [50.0, 51.38], [53.0, 54.3], [55.0, 58.09], [60.0, 80.54], [82.0, 82.53], [85.0, 85.77], [87.0, 87.83], [93.0, 94.69], [96.0, 96.82], [99.0, 109.24], [112.0, 119.74], [123.0, 125.81]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 57.01, 0.0, 45.59, 0.0, 0.0, 0.0, 0.0, 0.0, 56.86, 43.15, 0.0, 0.0, 0.0, 0.0, 0.0, 30.67, 45.69, 49.27], "audiomae_on_audioset": [null, null, null, null, [["rumble", 14.83], ["creak", 12.27], ["hum", 11.21]], null, null, null, null, null, null, [["hum", 40.09], ["throbbing", 12.68], ["mains hum", 10.55]], null, null, null, null, null, [["music", 56.11], ["musical instrument", 4.22], ["hum", 2.95]], [["hum", 23.14], ["mains hum", 19.76], ["music", 15.46]], [["hum", 26.25], ["throbbing", 21.42], ["mains hum", 5.35]]], "duration": [1.77, 0.14, 2.08, 1.56, 11.25, 1.61, 1.86, -0.18, 1.38, 1.3, 3.09, 20.54, 0.53, 0.77, 0.83, 1.69, 0.82, 10.24, 7.74, 2.81]} \ No newline at end of file diff --git a/annotations_1/TEvVc1vsO2U_filtered.json b/annotations_1/TEvVc1vsO2U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/TEvVc1vsO2U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/TFDiCTUAJuE_filtered.json b/annotations_1/TFDiCTUAJuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..038c93fb128727fb4bd89f884523159aa00c210b --- /dev/null +++ b/annotations_1/TFDiCTUAJuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.94], [5.0, 5.98], [6.0, 7.74], [14.0, 14.52], [16.0, 17.71], [34.0, 34.25], [40.0, 40.98], [53.0, 54.92], [56.0, 56.61], [71.0, 72.96], [79.0, 81.51], [83.0, 83.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.06, 0.98, 1.74, 0.52, 1.71, 0.25, 0.98, 1.92, 0.61, 1.96, 2.51, 0.74]} \ No newline at end of file diff --git a/annotations_1/TGghm3K1NXQ_filtered.json b/annotations_1/TGghm3K1NXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e143db7f22a8ca1248604028bcc455c1339ed3f3 --- /dev/null +++ b/annotations_1/TGghm3K1NXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.08], [14.0, 22.15], [29.0, 34.45], [37.0, 43.46], [48.0, 49.59], [55.0, 56.64], [60.0, 60.83], [61.0, 62.61], [73.0, 75.73], [77.0, 79.91], [84.0, 86.19], [88.0, 116.92], [131.0, 133.02], [139.0, 140.09], [141.0, 142.15], [148.0, 150.45]], "keep_status": [true, true, true, true, false, false, false, false, true, true, true, true, false, false, false, true], "silence_prob": [28.14, 33.5, 29.06, 29.44, 0.0, 0.0, 0.0, 0.0, 44.34, 43.98, 43.35, 33.9, 30.88, 0.0, 0.0, 28.24], "audiomae_on_audioset": [[["speech", 35.57], ["explosion", 15.21], ["burst, pop", 5.8]], [["music", 28.39], ["hum", 27.64], ["mains hum", 9.04]], [["speech", 16.51], ["throbbing", 16.49], ["hum", 12.01]], [["speech", 22.64], ["whip", 20.29], ["music", 6.28]], null, null, null, null, [["music", 38.18], ["theremin", 9.23], ["hum", 8.45]], [["music", 27.49], ["throbbing", 10.71], ["hum", 6.44]], [["music", 27.19], ["didgeridoo", 26.18], ["hum", 5.47]], [["speech", 24.7], ["fly, housefly", 19.06], ["insect", 9.12]], [["music", 38.16], ["speech", 26.46], ["boing", 6.68]], null, null, [["eruption", 20.03], ["explosion", 12.54], ["hum", 8.08]]], "duration": [2.08, 8.15, 5.45, 6.46, 1.59, 1.64, 0.83, 1.61, 2.73, 2.91, 2.19, 28.92, 2.02, 1.09, 1.15, 2.45]} \ No newline at end of file diff --git a/annotations_1/TGqOd_3mrr4_filtered.json b/annotations_1/TGqOd_3mrr4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea68b9f53e28b1c3235691e90dca97f0eca9e314 --- /dev/null +++ b/annotations_1/TGqOd_3mrr4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.24], [7.0, 9.83], [12.0, 61.6], [68.0, 68.64], [69.0, 74.22], [75.0, 78.51], [79.0, 83.74], [84.0, 84.32], [85.0, 85.73], [87.0, 87.25], [87.0, 91.57], [95.0, 95.89], [101.0, 101.88], [103.0, 104.55], [107.0, 107.62], [111.0, 112.29], [115.0, 116.01], [119.0, 118.88], [122.0, 122.1], [133.0, 134.74], [147.0, 147.6], [163.0, 164.91], [167.0, 167.7], [169.0, 170.24], [173.0, 176.91], [179.0, 181.7]], "keep_status": [false, false, false, false, true, true, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [99.95, 99.99, 0.0, 0.0, 43.33, 40.52, 43.74, 0.0, 0.0, 0.0, 39.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.78, 40.16], "audiomae_on_audioset": [null, null, null, null, [["music", 31.68], ["speech", 23.94], ["hum", 11.1]], [["speech", 28.55], ["music", 21.87], ["mains hum", 10.5]], [["music", 45.01], ["speech", 14.29], ["didgeridoo", 9.4]], null, null, null, [["speech", 24.51], ["music", 23.33], ["musical instrument", 3.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 23.55], ["speech", 13.35], ["didgeridoo", 7.95]], [["music", 51.11], ["throbbing", 7.5], ["hum", 6.39]]], "duration": [2.24, 2.83, 49.6, 0.64, 5.22, 3.51, 4.74, 0.32, 0.73, 0.25, 4.57, 0.89, 0.88, 1.55, 0.62, 1.29, 1.01, -0.12, 0.1, 1.74, 0.6, 1.91, 0.7, 1.24, 3.91, 2.7]} \ No newline at end of file diff --git a/annotations_1/THuOIvlbIjM_filtered.json b/annotations_1/THuOIvlbIjM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6806c9bea95cea745e07110567d4f0c57add2ae7 --- /dev/null +++ b/annotations_1/THuOIvlbIjM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.08], [16.0, 17.76], [19.0, 20.31], [21.0, 25.56], [27.0, 31.6], [32.0, 34.57], [37.0, 42.33], [43.0, 44.46], [45.0, 47.01], [48.0, 48.96], [49.0, 50.5], [52.0, 54.06], [55.0, 56.57], [58.0, 62.88], [64.0, 68.66], [71.0, 76.55], [78.0, 78.85], [79.0, 81.01], [82.0, 84.59], [86.0, 86.41], [89.0, 89.38], [90.0, 91.44], [100.0, 102.03], [103.0, 103.59], [107.0, 111.62], [112.0, 114.25], [115.0, 115.4], [120.0, 176.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [99.96, 0.0, 0.0, 99.82, 99.96, 64.18, 99.94, 0.0, 100.0, 0.0, 0.0, 99.36, 0.0, 98.36, 95.37, 91.47, 0.0, 92.31, 94.66, 0.0, 0.0, 0.0, 44.57, 0.0, 35.73, 56.03, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.01], ["whimper", 6.05], ["speech", 5.05]], null, [["cattle, bovinae", 23.28], ["moo", 16.67], ["livestock, farm animals, working animals", 11.5]], null, null, null], "duration": [2.08, 1.76, 1.31, 4.56, 4.6, 2.57, 5.33, 1.46, 2.01, 0.96, 1.5, 2.06, 1.57, 4.88, 4.66, 5.55, 0.85, 2.01, 2.59, 0.41, 0.38, 1.44, 2.03, 0.59, 4.62, 2.25, 0.4, 56.76]} \ No newline at end of file diff --git a/annotations_1/TIEtN-jVDbg_filtered.json b/annotations_1/TIEtN-jVDbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..553995988b94b27f6c58ce93fd8dd1207685d8a4 --- /dev/null +++ b/annotations_1/TIEtN-jVDbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[132.0, 133.2], [134.0, 139.45], [140.0, 142.82], [144.0, 146.28]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 34.63, 35.53, 37.45], "audiomae_on_audioset": [null, [["hum", 45.76], ["throbbing", 37.94], ["mains hum", 3.87]], [["music", 47.27], ["speech", 25.69], ["electronic music", 3.92]], [["hum", 62.59], ["throbbing", 26.04], ["mains hum", 7.69]]], "duration": [1.2, 5.45, 2.82, 2.28]} \ No newline at end of file diff --git a/annotations_1/TIu_CYwemFo_filtered.json b/annotations_1/TIu_CYwemFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32877ad131e5468368f79f0a7914f7ae5c5abdb3 --- /dev/null +++ b/annotations_1/TIu_CYwemFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.32], [5.0, 4.94], [5.0, 6.91], [10.0, 11.91], [14.0, 15.15], [17.0, 17.61], [19.0, 20.04], [28.0, 28.78], [29.0, 29.78], [33.0, 33.62], [38.0, 38.37], [40.0, 40.71], [41.0, 41.72], [43.0, 44.02], [45.0, 46.6], [48.0, 48.3], [50.0, 50.9], [54.0, 55.17], [70.0, 70.58], [78.0, 78.58], [84.0, 84.45], [91.0, 91.98], [96.0, 97.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["owl", 64.35], ["hoot", 20.73], ["sidetone", 2.48]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.32, -0.06, 1.91, 1.91, 1.15, 0.61, 1.04, 0.78, 0.78, 0.62, 0.37, 0.71, 0.72, 1.02, 1.6, 0.3, 0.9, 1.17, 0.58, 0.58, 0.45, 0.98, 1.34]} \ No newline at end of file diff --git a/annotations_1/TJa_A5cVd-w_filtered.json b/annotations_1/TJa_A5cVd-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/TJa_A5cVd-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/TKszvumsyFY_filtered.json b/annotations_1/TKszvumsyFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b60cbed4fe1298cf9a7e1c3b83b20d6ed51ae568 --- /dev/null +++ b/annotations_1/TKszvumsyFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 38.75], [40.0, 41.62], [46.0, 47.56], [48.0, 50.82], [51.0, 51.54], [52.0, 53.49], [55.0, 55.92], [57.0, 76.99], [80.0, 133.03]], "keep_status": [false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 35.9, 0.0, 0.0, 0.0, 31.7, 0.0], "audiomae_on_audioset": [null, null, null, [["throbbing", 25.49], ["hum", 17.12], ["mains hum", 15.62]], null, null, null, [["music", 55.66], ["hum", 7.07], ["buzz", 6.07]], null], "duration": [0.75, 1.62, 1.56, 2.82, 0.54, 1.49, 0.92, 19.99, 53.03]} \ No newline at end of file diff --git a/annotations_1/TLOD07LZw90_filtered.json b/annotations_1/TLOD07LZw90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2460243c68ef40f422a767844b553b2fb0ad2b99 --- /dev/null +++ b/annotations_1/TLOD07LZw90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 32.73], [43.0, 68.44], [71.0, 123.7], [129.0, 130.6], [137.0, 147.92], [152.0, 152.91], [154.0, 154.94]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [36.62, 30.77, 0.0, 0.0, 65.79, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 12.11], ["music", 11.46], ["throbbing", 7.51]], [["music", 81.82], ["musical instrument", 3.03], ["guitar", 1.05]], null, null, null, null, null], "duration": [6.73, 25.44, 52.7, 1.6, 10.92, 0.91, 0.94]} \ No newline at end of file diff --git a/annotations_1/TMe71Lvy1lA_filtered.json b/annotations_1/TMe71Lvy1lA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e74b0121098da1c8c0cbe7a5d423f0586703449 --- /dev/null +++ b/annotations_1/TMe71Lvy1lA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 108.41], [109.0, 110.0], [113.0, 137.02], [137.0, 137.64], [140.0, 153.12], [154.0, 154.52], [158.0, 158.01], [162.0, 164.1], [171.0, 171.0], [171.0, 173.42]], "keep_status": [false, false, true, false, true, false, false, true, false, true], "silence_prob": [0.0, 0.0, 28.87, 0.0, 31.53, 0.0, 0.0, 32.91, 0.0, 32.46], "audiomae_on_audioset": [null, null, [["music", 25.63], ["cacophony", 16.67], ["noise", 6.79]], null, [["speech", 20.76], ["music", 11.28], ["hum", 9.5]], null, null, [["didgeridoo", 42.19], ["music", 23.21], ["cattle, bovinae", 3.84]], null, [["music", 26.13], ["frog", 17.03], ["fly, housefly", 13.46]]], "duration": [33.41, 1.0, 24.02, 0.64, 13.12, 0.52, 0.01, 2.1, 0.0, 2.42]} \ No newline at end of file diff --git a/annotations_1/TMeiAg1kXKs_filtered.json b/annotations_1/TMeiAg1kXKs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d920c66b446c3d039a3ec4d59355d24e36f05c09 --- /dev/null +++ b/annotations_1/TMeiAg1kXKs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.59], [21.0, 22.47], [29.0, 31.82], [36.0, 39.61], [40.0, 41.28], [52.0, 52.62], [54.0, 55.32], [56.0, 56.57], [58.0, 60.94], [65.0, 72.64], [75.0, 75.59], [77.0, 81.4], [87.0, 87.81], [97.0, 97.66], [105.0, 105.78], [108.0, 109.04], [112.0, 112.65], [117.0, 117.95], [119.0, 124.44], [125.0, 126.42], [130.0, 132.19], [135.0, 137.57], [141.0, 142.42], [145.0, 149.76], [151.0, 164.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.8, 0.0, 78.89, 56.4, 0.0, 0.0, 0.0, 0.0, 49.09, 52.22, 0.0, 74.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.85, 0.0, 86.09, 79.07, 0.0, 71.29, 83.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 45.39], ["whale vocalization", 20.98], ["radio", 5.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.59, 1.47, 2.82, 3.61, 1.28, 0.62, 1.32, 0.57, 2.94, 7.64, 0.59, 4.4, 0.81, 0.66, 0.78, 1.04, 0.65, 0.95, 5.44, 1.42, 2.19, 2.57, 1.42, 4.76, 13.42]} \ No newline at end of file diff --git a/annotations_1/TPDKmRQddq0_filtered.json b/annotations_1/TPDKmRQddq0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e110a64ad2d557927eac693d0bcca559ad48d0a --- /dev/null +++ b/annotations_1/TPDKmRQddq0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 75.76], [77.0, 80.96], [83.0, 83.3], [84.0, 120.12], [121.0, 121.31], [123.0, 178.38], [180.0, 190.66]], "keep_status": [true, true, false, false, false, false, false], "silence_prob": [32.23, 31.32, 0.0, 0.0, 0.0, 0.0, 41.83], "audiomae_on_audioset": [[["hum", 15.78], ["fly, housefly", 13.01], ["mains hum", 8.75]], [["speech", 51.59], ["motorboat, speedboat", 6.72], ["vehicle", 5.64]], null, null, null, null, [["music", 57.9], ["hum", 12.38], ["mains hum", 4.22]]], "duration": [9.76, 3.96, 0.3, 36.12, 0.31, 55.38, 10.66]} \ No newline at end of file diff --git a/annotations_1/TRCSLhYz9CA_filtered.json b/annotations_1/TRCSLhYz9CA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2855872d2b55470b3866af6f6b48268bf37d090f --- /dev/null +++ b/annotations_1/TRCSLhYz9CA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 34.43], [36.0, 38.8], [43.0, 59.05], [61.0, 105.33], [106.0, 106.86], [111.0, 126.86]], "keep_status": [false, true, false, false, false, false], "silence_prob": [34.23, 36.59, 32.73, 0.0, 0.0, 31.42], "audiomae_on_audioset": [[["music", 60.04], ["didgeridoo", 20.18], ["hum", 1.91]], [["hum", 41.86], ["throbbing", 12.8], ["music", 12.55]], [["music", 66.89], ["theremin", 14.16], ["glass", 2.18]], null, null, [["music", 38.87], ["buzz", 32.88], ["hum", 8.41]]], "duration": [9.43, 2.8, 16.05, 44.33, 0.86, 15.86]} \ No newline at end of file diff --git a/annotations_1/TSAdyzdX4eA_filtered.json b/annotations_1/TSAdyzdX4eA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6b6b6bbfaf1daeb113c80e01804d247a976e4bf --- /dev/null +++ b/annotations_1/TSAdyzdX4eA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.82], [16.0, 16.7], [19.0, 21.1], [26.0, 26.87], [28.0, 28.44], [36.0, 36.51], [37.0, 38.58], [40.0, 40.91], [47.0, 49.47], [51.0, 53.79], [57.0, 57.99], [59.0, 60.88], [63.0, 67.58], [70.0, 71.61], [95.0, 95.37], [114.0, 115.13], [117.0, 118.99], [124.0, 126.77], [139.0, 139.28], [148.0, 148.58], [153.0, 152.85], [154.0, 153.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.01, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61, 78.38, 0.0, 0.0, 51.94, 0.0, 0.0, 0.0, 0.0, 42.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 79.12], ["speech", 13.09], ["whale vocalization", 1.04]], null, null, null, null], "duration": [-0.18, 0.7, 2.1, 0.87, 0.44, 0.51, 1.58, 0.91, 2.47, 2.79, 0.99, 1.88, 4.58, 1.61, 0.37, 1.13, 1.99, 2.77, 0.28, 0.58, -0.15, -0.13]} \ No newline at end of file diff --git a/annotations_1/TSCcj7mYuhc_filtered.json b/annotations_1/TSCcj7mYuhc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a835340f586b06b4ac7a165b8e713897cfeac22 --- /dev/null +++ b/annotations_1/TSCcj7mYuhc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.32], [4.0, 5.66], [7.0, 9.24], [10.0, 11.91], [12.0, 13.32], [14.0, 14.27], [16.0, 16.28], [30.0, 30.91], [32.0, 31.78], [33.0, 33.2], [34.0, 36.15], [42.0, 42.52], [49.0, 49.91], [55.0, 56.07], [57.0, 57.13], [59.0, 61.69], [64.0, 64.76], [68.0, 68.64], [71.0, 71.56], [74.0, 74.43], [77.0, 77.53], [80.0, 80.82], [82.0, 82.75], [83.0, 84.0], [85.0, 85.11], [85.0, 85.82], [87.0, 87.71], [89.0, 89.68], [97.0, 104.06], [108.0, 109.11], [110.0, 110.79], [116.0, 117.91], [119.0, 120.23], [120.0, 121.66], [125.0, 127.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 1.66, 2.24, 1.91, 1.32, 0.27, 0.28, 0.91, -0.22, 0.2, 2.15, 0.52, 0.91, 1.07, 0.13, 2.69, 0.76, 0.64, 0.56, 0.43, 0.53, 0.82, 0.75, 1.0, 0.11, 0.82, 0.71, 0.68, 7.06, 1.11, 0.79, 1.91, 1.23, 1.66, 2.38]} \ No newline at end of file diff --git a/annotations_1/TSPaaPqteCU_filtered.json b/annotations_1/TSPaaPqteCU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34d97fba559fed6de9a9d55a0b9ce0814ba8e79f --- /dev/null +++ b/annotations_1/TSPaaPqteCU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 16.01], [17.0, 23.3], [28.0, 28.95], [29.0, 30.08], [31.0, 32.59], [38.0, 40.83], [44.0, 45.87], [49.0, 52.98], [59.0, 68.76], [73.0, 76.52], [78.0, 79.61], [81.0, 82.39], [83.0, 89.97], [94.0, 98.09], [101.0, 109.04], [110.0, 112.65], [113.0, 113.68], [115.0, 117.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [60.98, 60.98, 0.0, 0.0, 0.0, 77.2, 0.0, 54.17, 72.9, 79.59, 0.0, 0.0, 50.11, 41.09, 38.02, 34.43, 0.0, 33.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.39], ["violin, fiddle", 9.42], ["musical instrument", 8.77]], [["music", 69.83], ["theremin", 11.21], ["middle eastern music", 2.21]], [["music", 61.91], ["theremin", 6.55], ["musical instrument", 4.57]], null, [["music", 47.73], ["theremin", 13.21], ["bowed string instrument", 6.23]]], "duration": [15.01, 6.3, 0.95, 1.08, 1.59, 2.83, 1.87, 3.98, 9.76, 3.52, 1.61, 1.39, 6.97, 4.09, 8.04, 2.65, 0.68, 2.95]} \ No newline at end of file diff --git a/annotations_1/TSQ770iqDgY_filtered.json b/annotations_1/TSQ770iqDgY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a35effa3720f89dc63df052dab1a815e29811f0 --- /dev/null +++ b/annotations_1/TSQ770iqDgY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.81], [4.0, 5.83], [6.0, 8.72], [12.0, 12.39], [16.0, 17.02], [21.0, 21.84], [24.0, 25.35], [33.0, 35.14], [36.0, 37.81], [39.0, 45.33], [47.0, 49.37], [51.0, 53.28], [62.0, 76.17], [79.0, 80.7], [92.0, 92.52], [95.0, 95.93], [101.0, 102.91], [104.0, 104.48], [117.0, 117.64], [154.0, 153.93], [168.0, 176.76], [183.0, 183.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 60.23, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 86.64, 92.8, 54.5, 61.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 26.15], ["sidetone", 18.79], ["radio", 17.36]], null], "duration": [-0.19, 1.83, 2.72, 0.39, 1.02, 0.84, 1.35, 2.14, 1.81, 6.33, 2.37, 2.28, 14.17, 1.7, 0.52, 0.93, 1.91, 0.48, 0.64, -0.07, 8.76, 0.46]} \ No newline at end of file diff --git a/annotations_1/TSclZRaacyA_filtered.json b/annotations_1/TSclZRaacyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d91f5906c06fbc69087c6d90105cd29470c1d2db --- /dev/null +++ b/annotations_1/TSclZRaacyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [3.0, 4.55], [5.0, 5.46], [6.0, 8.73], [10.0, 12.46], [13.0, 16.11], [19.0, 21.07], [25.0, 25.95], [28.0, 29.59], [32.0, 36.37], [42.0, 42.9], [43.0, 43.41], [44.0, 44.95], [45.0, 47.14], [49.0, 49.35], [53.0, 53.54], [56.0, 60.72], [66.0, 65.92], [69.0, 68.67], [71.0, 72.3], [74.0, 86.36], [88.0, 117.34], [118.0, 119.62], [121.0, 124.36], [125.0, 129.25], [132.0, 135.06], [137.0, 137.35], [141.0, 142.65], [145.0, 144.66], [145.0, 146.82], [148.0, 148.2], [149.0, 149.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 70.44, 99.68, 99.92, 62.78, 0.0, 0.0, 71.14, 0.0, 0.0, 0.0, 46.05, 0.0, 0.0, 46.57, 0.0, 0.0, 0.0, 41.24, 30.58, 0.0, 99.95, 63.96, 59.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 22.81], ["music", 11.36], ["inside, small room", 9.56]], null, null, [["music", 23.96], ["crushing", 13.55], ["hum", 13.52]], null, null, null, [["hum", 51.02], ["music", 19.87], ["mains hum", 13.66]], [["hum", 42.16], ["music", 21.96], ["mains hum", 12.8]], null, null, null, null, null, null, null, null, null, null], "duration": [0.35, 1.55, 0.46, 2.73, 2.46, 3.11, 2.07, 0.95, 1.59, 4.37, 0.9, 0.41, 0.95, 2.14, 0.35, 0.54, 4.72, -0.08, -0.33, 1.3, 12.36, 29.34, 1.62, 3.36, 4.25, 3.06, 0.35, 1.65, -0.34, 1.82, 0.2, 0.66]} \ No newline at end of file diff --git a/annotations_1/TSnlLU5k9lU_filtered.json b/annotations_1/TSnlLU5k9lU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..726dc686cfe60cc2df5366946ae040b58f686cfc --- /dev/null +++ b/annotations_1/TSnlLU5k9lU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.44], [7.0, 35.01], [38.0, 46.35], [48.0, 90.59], [92.0, 93.65], [95.0, 97.83], [99.0, 101.11], [102.0, 104.84], [106.0, 124.88], [126.0, 128.29]], "keep_status": [false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.98, 57.17, 0.0, 0.0, 94.37, 58.38, 95.09, 88.28, 90.95], "audiomae_on_audioset": [null, [["music", 33.5], ["sheep", 21.34], ["speech", 13.42]], null, null, null, null, null, null, null, null], "duration": [1.44, 28.01, 8.35, 42.59, 1.65, 2.83, 2.11, 2.84, 18.88, 2.29]} \ No newline at end of file diff --git a/annotations_1/TTOlRTmEdoY_filtered.json b/annotations_1/TTOlRTmEdoY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4763cc72c90d5edab270698a62110da4d8310485 --- /dev/null +++ b/annotations_1/TTOlRTmEdoY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.31], [15.0, 15.31], [35.0, 36.41], [38.0, 39.19], [44.0, 44.22], [46.0, 46.47], [48.0, 47.95], [49.0, 50.41], [53.0, 54.95], [56.0, 57.35], [59.0, 60.49], [63.0, 65.43], [66.0, 73.28], [74.0, 74.6], [81.0, 82.95], [86.0, 87.89], [91.0, 91.49], [94.0, 94.47], [117.0, 116.73], [149.0, 149.59], [150.0, 149.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.28, 56.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 0.31, 1.41, 1.19, 0.22, 0.47, -0.05, 1.41, 1.95, 1.35, 1.49, 2.43, 7.28, 0.6, 1.95, 1.89, 0.49, 0.47, -0.27, 0.59, -0.26]} \ No newline at end of file diff --git a/annotations_1/TUMru_xqvMU_filtered.json b/annotations_1/TUMru_xqvMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfe150923efa60e2572d179e62729fe4bcdd03d4 --- /dev/null +++ b/annotations_1/TUMru_xqvMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.16], [6.0, 6.07], [13.0, 13.69], [15.0, 16.26], [16.0, 17.25], [19.0, 19.16], [21.0, 23.9], [24.0, 26.89], [28.0, 28.86], [29.0, 30.0], [34.0, 34.5], [39.0, 38.96], [40.0, 40.41], [42.0, 42.9], [43.0, 44.37], [46.0, 46.18], [48.0, 48.17], [50.0, 50.09], [51.0, 50.8], [51.0, 51.41], [52.0, 52.59], [55.0, 60.4], [64.0, 66.43], [68.0, 79.96], [81.0, 82.22], [85.0, 85.08], [86.0, 85.95], [86.0, 86.7], [87.0, 88.3], [88.0, 88.42], [88.0, 88.45], [89.0, 88.65], [100.0, 100.79], [101.0, 101.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.43, 73.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.76, 44.23, 37.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["cattle, bovinae", 33.91], ["livestock, farm animals, working animals", 31.11], ["moo", 26.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.76], ["telephone", 20.66], ["radio", 3.35]], [["snicker", 17.28], ["laughter", 10.83], ["chuckle, chortle", 10.51]], [["speech", 40.46], ["radio", 4.83], ["whack, thwack", 4.69]], null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 0.07, 0.69, 1.26, 1.25, 0.16, 2.9, 2.89, 0.86, 1.0, 0.5, -0.04, 0.41, 0.9, 1.37, 0.18, 0.17, 0.09, -0.2, 0.41, 0.59, 5.4, 2.43, 11.96, 1.22, 0.08, -0.05, 0.7, 1.3, 0.42, 0.45, -0.35, 0.79, 0.83]} \ No newline at end of file diff --git a/annotations_1/TVViHShXqC4_filtered.json b/annotations_1/TVViHShXqC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1bbeb6f28304a9f034a3a8915b5c226a7ea6952 --- /dev/null +++ b/annotations_1/TVViHShXqC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [4.0, 5.14], [9.0, 10.45], [12.0, 14.44], [16.0, 17.85], [22.0, 22.71], [24.0, 27.73], [29.0, 30.77], [31.0, 32.81], [33.0, 34.4], [35.0, 35.94], [37.0, 45.67], [47.0, 49.0], [50.0, 50.85], [53.0, 54.36], [67.0, 88.82], [90.0, 90.32], [91.0, 91.98], [92.0, 93.19], [95.0, 97.16], [99.0, 100.47], [101.0, 102.63], [103.0, 104.68], [106.0, 106.24], [107.0, 108.68], [110.0, 113.27]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 46.5, 0.0, 0.0, 88.64, 0.0, 0.0, 0.0, 0.0, 42.04, 58.64, 0.0, 0.0, 42.81, 0.0, 0.0, 0.0, 67.63, 0.0, 0.0, 0.0, 0.0, 0.0, 55.6], "audiomae_on_audioset": [null, null, null, [["music", 40.33], ["gobble", 7.89], ["turkey", 7.49]], null, null, null, null, null, null, null, [["theremin", 42.32], ["music", 32.12], ["synthesizer", 3.32]], null, null, null, [["clarinet", 34.5], ["music", 33.51], ["wind instrument, woodwind instrument", 14.98]], null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 1.14, 1.45, 2.44, 1.85, 0.71, 3.73, 1.77, 1.81, 1.4, 0.94, 8.67, 2.0, 0.85, 1.36, 21.82, 0.32, 0.98, 1.19, 2.16, 1.47, 1.63, 1.68, 0.24, 1.68, 3.27]} \ No newline at end of file diff --git a/annotations_1/TXAJapM6E-U_filtered.json b/annotations_1/TXAJapM6E-U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d463cee2f8ba647ef4b363387880020fc9a3a39f --- /dev/null +++ b/annotations_1/TXAJapM6E-U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.63], [11.0, 18.57], [19.0, 20.51], [21.0, 22.98], [25.0, 26.47], [29.0, 29.27], [31.0, 30.99], [32.0, 37.35], [42.0, 41.99], [43.0, 44.71], [46.0, 46.82], [54.0, 54.18], [55.0, 58.02], [59.0, 71.0], [74.0, 95.08], [100.0, 101.41], [109.0, 109.59], [111.0, 112.29], [112.0, 114.89], [116.0, 119.42], [120.0, 120.61], [121.0, 122.57], [124.0, 128.44], [129.0, 130.0], [131.0, 131.57]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.08, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 0.0, 0.0, 0.0, 0.0, 68.28, 33.85, 30.97, 0.0, 0.0, 0.0, 37.43, 97.33, 0.0, 0.0, 94.81, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 28.56], ["whack, thwack", 13.0], ["fly, housefly", 11.5]], null, null, null, null, null, null, null, null, null, null, null, [["music", 53.93], ["hum", 11.57], ["mains hum", 6.48]], [["speech", 33.37], ["cattle, bovinae", 14.18], ["moo", 11.28]], null, null, null, [["speech", 56.98], ["thunk", 12.14], ["music", 4.35]], null, null, null, null, null, null], "duration": [0.63, 7.57, 1.51, 1.98, 1.47, 0.27, -0.01, 5.35, -0.01, 1.71, 0.82, 0.18, 3.02, 12.0, 21.08, 1.41, 0.59, 1.29, 2.89, 3.42, 0.61, 1.57, 4.44, 1.0, 0.57]} \ No newline at end of file diff --git a/annotations_1/TXRHf6Hzg0g_filtered.json b/annotations_1/TXRHf6Hzg0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..230dab2dd90f95fab2479cae33c97afacf72f697 --- /dev/null +++ b/annotations_1/TXRHf6Hzg0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 40.81], [41.0, 51.07], [53.0, 54.19], [57.0, 57.42], [60.0, 59.83], [64.0, 79.51], [82.0, 95.84], [97.0, 97.6], [100.0, 100.4], [102.0, 102.34], [106.0, 106.64], [108.0, 108.75], [110.0, 114.96], [117.0, 117.0]], "keep_status": [false, true, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.49, 0.0, 0.0, 0.0, 29.15, 29.63, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0], "audiomae_on_audioset": [null, [["rumble", 28.28], ["whack, thwack", 15.13], ["speech", 5.64]], null, null, null, [["buzz", 19.51], ["vehicle", 15.84], ["music", 14.5]], [["music", 32.09], ["sound effect", 13.33], ["grunt", 9.8]], null, null, null, null, null, null, null], "duration": [-0.19, 10.07, 1.19, 0.42, -0.17, 15.51, 13.84, 0.6, 0.4, 0.34, 0.64, 0.75, 4.96, 0.0]} \ No newline at end of file diff --git a/annotations_1/TXlioVAN41o_filtered.json b/annotations_1/TXlioVAN41o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afe122a83eb825f2a44b9648b78ca0519e299594 --- /dev/null +++ b/annotations_1/TXlioVAN41o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.94], [10.0, 14.27], [18.0, 18.76], [20.0, 21.3], [22.0, 23.38], [24.0, 25.19], [26.0, 27.03], [30.0, 31.62], [34.0, 41.93], [42.0, 53.59], [55.0, 62.26], [64.0, 64.88], [66.0, 66.73], [68.0, 94.17], [96.0, 96.45], [97.0, 97.38], [105.0, 112.21], [114.0, 114.02], [115.0, 115.42], [118.0, 118.23], [119.0, 121.73], [124.0, 125.36]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 85.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 44.72, 62.68, 0.0, 0.0, 46.43, 0.0, 0.0, 57.01, 0.0, 0.0, 0.0, 81.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 44.83], ["fly, housefly", 11.12], ["music", 10.34]], null, null, null, [["throbbing", 36.74], ["hum", 26.22], ["music", 16.52]], null, null, null, null, null, null, null, null], "duration": [1.94, 4.27, 0.76, 1.3, 1.38, 1.19, 1.03, 1.62, 7.93, 11.59, 7.26, 0.88, 0.73, 26.17, 0.45, 0.38, 7.21, 0.02, 0.42, 0.23, 2.73, 1.36]} \ No newline at end of file diff --git a/annotations_1/TYA75RnDMGI_filtered.json b/annotations_1/TYA75RnDMGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0802deeb6ea62872f0e3a25ed4db034779ae5a77 --- /dev/null +++ b/annotations_1/TYA75RnDMGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.57], [34.0, 34.53], [52.0, 56.73], [59.0, 92.52], [93.0, 142.3], [149.0, 149.62], [151.0, 153.15], [162.0, 162.21], [167.0, 167.75], [169.0, 169.32]], "keep_status": [false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 29.74, 0.0, 0.0, 0.0, 49.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 23.03], ["throbbing", 16.79], ["music", 13.89]], null, null, null, [["speech", 34.1], ["hum", 10.18], ["mains hum", 6.67]], null, null, null], "duration": [0.57, 0.53, 4.73, 33.52, 49.3, 0.62, 2.15, 0.21, 0.75, 0.32]} \ No newline at end of file diff --git a/annotations_1/TYJ-1E4hKAU_filtered.json b/annotations_1/TYJ-1E4hKAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da831929b13629864675ed7fa1db28baaa62993f --- /dev/null +++ b/annotations_1/TYJ-1E4hKAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.61], [15.0, 15.35], [19.0, 24.92], [27.0, 27.72], [29.0, 30.3], [31.0, 31.94], [32.0, 32.31], [32.0, 32.37], [33.0, 33.96], [50.0, 49.81], [51.0, 137.24], [140.0, 157.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 53.56], ["speech", 9.74], ["trombone", 4.94]]], "duration": [1.61, 0.35, 5.92, 0.72, 1.3, 0.94, 0.31, 0.37, 0.96, -0.19, 86.24, 17.65]} \ No newline at end of file diff --git a/annotations_1/TZ9xan53wuA_filtered.json b/annotations_1/TZ9xan53wuA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2ea1cdfdc1fdb5d17221db7662cde6054c8fd0d --- /dev/null +++ b/annotations_1/TZ9xan53wuA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.21], [6.0, 8.01], [9.0, 12.06], [17.0, 21.27], [23.0, 26.15], [28.0, 30.0], [32.0, 33.22], [35.0, 35.31], [39.0, 43.14], [45.0, 53.89], [55.0, 57.82], [62.0, 67.12], [70.0, 78.73], [80.0, 84.65], [86.0, 104.41], [105.0, 106.47], [108.0, 116.58], [119.0, 120.19], [121.0, 121.83], [123.0, 130.77], [131.0, 138.3], [139.0, 141.52]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [67.51, 91.81, 46.72, 70.72, 66.27, 49.04, 0.0, 0.0, 56.78, 75.72, 51.71, 45.02, 31.35, 48.82, 32.58, 0.0, 54.1, 0.0, 0.0, 46.9, 52.62, 59.68], "audiomae_on_audioset": [null, null, [["speech", 34.35], ["music", 18.21], ["theremin", 12.52]], null, null, [["music", 26.06], ["whale vocalization", 13.03], ["hum", 11.3]], null, null, null, null, null, [["music", 26.31], ["hum", 25.87], ["throbbing", 10.62]], [["hum", 30.98], ["mains hum", 29.13], ["throbbing", 12.35]], [["music", 39.2], ["speech", 19.46], ["hum", 14.16]], [["music", 21.56], ["hum", 19.47], ["whack, thwack", 9.03]], null, null, null, null, [["speech", 32.47], ["music", 25.57], ["hum", 17.06]], null, null], "duration": [3.21, 2.01, 3.06, 4.27, 3.15, 2.0, 1.22, 0.31, 4.14, 8.89, 2.82, 5.12, 8.73, 4.65, 18.41, 1.47, 8.58, 1.19, 0.83, 7.77, 7.3, 2.52]} \ No newline at end of file diff --git a/annotations_1/TZdCMfr0Um8_filtered.json b/annotations_1/TZdCMfr0Um8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fb52c5c154e5a4de8b12d5cfc69641b76e5f319 --- /dev/null +++ b/annotations_1/TZdCMfr0Um8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.98], [4.0, 4.28], [5.0, 7.08], [8.0, 10.76], [11.0, 13.64], [16.0, 19.6], [20.0, 24.51], [26.0, 38.26], [39.0, 47.83], [49.0, 63.14], [65.0, 67.76], [70.0, 70.77], [71.0, 76.67], [78.0, 78.19], [81.0, 81.87], [85.0, 88.92], [91.0, 93.21], [96.0, 98.44], [99.0, 100.41], [101.0, 128.31], [134.0, 143.18], [144.0, 145.77], [148.0, 148.22], [149.0, 151.24], [152.0, 153.86], [163.0, 174.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.52, 99.94, 85.54, 95.91, 87.0, 71.87, 78.21, 74.92, 98.27, 0.0, 81.89, 0.0, 0.0, 81.35, 91.64, 61.37, 0.0, 68.41, 55.46, 0.0, 0.0, 58.47, 0.0, 44.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 70.3], ["hum", 9.33], ["throbbing", 5.09]]], "duration": [1.98, 0.28, 2.08, 2.76, 2.64, 3.6, 4.51, 12.26, 8.83, 14.14, 2.76, 0.77, 5.67, 0.19, 0.87, 3.92, 2.21, 2.44, 1.41, 27.31, 9.18, 1.77, 0.22, 2.24, 1.86, 11.34]} \ No newline at end of file diff --git a/annotations_1/TZyl-21DgPo_filtered.json b/annotations_1/TZyl-21DgPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad813e6bc0c9c65c725fc0949f63adebe624b774 --- /dev/null +++ b/annotations_1/TZyl-21DgPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.39], [5.0, 5.63], [7.0, 11.92], [13.0, 13.46], [14.0, 15.21], [17.0, 18.15], [19.0, 20.34], [21.0, 24.81], [27.0, 27.77], [30.0, 30.89], [34.0, 34.47], [35.0, 35.8], [38.0, 44.27], [49.0, 51.9], [56.0, 57.01], [58.0, 59.0], [62.0, 69.55], [70.0, 71.2], [72.0, 72.84], [75.0, 75.15], [77.0, 85.29], [87.0, 87.86], [89.0, 90.04], [92.0, 101.61], [103.0, 111.37], [113.0, 113.7], [116.0, 115.97], [117.0, 118.67], [120.0, 120.77], [122.0, 128.01], [129.0, 129.78], [132.0, 133.0], [134.0, 149.44], [150.0, 150.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 88.28, 100.0, 0.0, 0.0, 73.97, 0.0, 0.0, 0.0, 79.41, 0.0, 0.0, 73.21, 83.34, 0.0, 0.0, 0.0, 0.0, 38.83, 0.0, 0.0, 80.82, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.59], ["speech", 5.1], ["didgeridoo", 5.06]], null, null, null, null], "duration": [0.39, 0.63, 4.92, 0.46, 1.21, 1.15, 1.34, 3.81, 0.77, 0.89, 0.47, 0.8, 6.27, 2.9, 1.01, 1.0, 7.55, 1.2, 0.84, 0.15, 8.29, 0.86, 1.04, 9.61, 8.37, 0.7, -0.03, 1.67, 0.77, 6.01, 0.78, 1.0, 15.44, 0.36]} \ No newline at end of file diff --git a/annotations_1/T_pKvfMT5ck_filtered.json b/annotations_1/T_pKvfMT5ck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e089866b2ae02dd2e7b3beb62ad6797c672f3522 --- /dev/null +++ b/annotations_1/T_pKvfMT5ck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 80.94], [83.0, 82.95], [87.0, 104.68], [107.0, 115.55], [116.0, 128.06]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 30.13, 29.27, 29.6], "audiomae_on_audioset": [null, null, [["music", 71.3], ["throbbing", 4.47], ["boing", 2.23]], [["music", 45.46], ["cattle, bovinae", 5.07], ["vehicle", 4.68]], [["music", 71.68], ["electronic music", 3.17], ["synthesizer", 2.25]]], "duration": [30.94, -0.05, 17.68, 8.55, 12.06]} \ No newline at end of file diff --git a/annotations_1/Tazw08OZpwU_filtered.json b/annotations_1/Tazw08OZpwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96a9c47e53b0c832075adfb058fac857535e951c --- /dev/null +++ b/annotations_1/Tazw08OZpwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.51], [3.0, 3.1], [4.0, 4.6], [6.0, 9.69], [12.0, 12.6], [13.0, 20.41], [23.0, 31.82], [35.0, 41.22], [45.0, 45.71], [47.0, 47.44], [56.0, 56.4], [58.0, 58.77], [60.0, 63.95], [68.0, 74.06], [75.0, 76.57], [79.0, 80.01], [82.0, 82.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.99, 0.0, 82.25, 99.8, 99.99, 0.0, 0.0, 0.0, 0.0, 92.97, 88.83, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 0.1, 0.6, 3.69, 0.6, 7.41, 8.82, 6.22, 0.71, 0.44, 0.4, 0.77, 3.95, 6.06, 1.57, 1.01, 0.61]} \ No newline at end of file diff --git a/annotations_1/Tc7e-4kbDto_filtered.json b/annotations_1/Tc7e-4kbDto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4ccc70086d70359f6c118ba2e29ad825121b77e --- /dev/null +++ b/annotations_1/Tc7e-4kbDto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 37.35], [38.0, 85.18], [88.0, 103.64], [104.0, 110.73], [114.0, 114.2]], "keep_status": [false, false, true, true, false], "silence_prob": [0.0, 0.0, 29.84, 30.33, 0.0], "audiomae_on_audioset": [null, null, [["music", 55.57], ["artillery fire", 6.46], ["gunshot, gunfire", 3.99]], [["gunshot, gunfire", 16.0], ["music", 13.58], ["explosion", 12.04]], null], "duration": [1.35, 47.18, 15.64, 6.73, 0.2]} \ No newline at end of file diff --git a/annotations_1/TcBlM3VLePM_filtered.json b/annotations_1/TcBlM3VLePM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f2bff34fd0afca67004ae67264f345708f7e9a4 --- /dev/null +++ b/annotations_1/TcBlM3VLePM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.67], [11.0, 15.21], [22.0, 22.42], [29.0, 33.15], [35.0, 38.6], [39.0, 39.53], [41.0, 44.61], [49.0, 49.62], [51.0, 57.87], [59.0, 58.9], [63.0, 63.73], [70.0, 70.73], [76.0, 77.11], [78.0, 78.31], [84.0, 83.81], [85.0, 85.9], [90.0, 90.15], [92.0, 92.15], [93.0, 93.46], [95.0, 96.38], [110.0, 116.07]], "keep_status": [false, false, false, true, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.52, 36.61, 0.0, 30.6, 34.57, 0.0, 37.41, 0.0, 43.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.86], "audiomae_on_audioset": [[["hum", 47.65], ["mains hum", 19.39], ["speech", 10.59]], [["livestock, farm animals, working animals", 42.04], ["moo", 15.42], ["cattle, bovinae", 12.89]], null, [["speech", 49.72], ["fart", 5.92], ["electric shaver, electric razor", 5.72]], [["didgeridoo", 45.87], ["speech", 11.95], ["livestock, farm animals, working animals", 8.55]], null, [["didgeridoo", 41.1], ["music", 19.73], ["theremin", 5.55]], null, [["speech", 40.56], ["sidetone", 8.82], ["mains hum", 7.04]], null, null, null, null, null, null, null, null, null, null, null, [["music", 44.18], ["speech", 32.64], ["crowd", 4.96]]], "duration": [3.67, 4.21, 0.42, 4.15, 3.6, 0.53, 3.61, 0.62, 6.87, -0.1, 0.73, 0.73, 1.11, 0.31, -0.19, 0.9, 0.15, 0.15, 0.46, 1.38, 6.07]} \ No newline at end of file diff --git a/annotations_1/TcJjhnPrM9o_filtered.json b/annotations_1/TcJjhnPrM9o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e6b72deb88cd91339eee4fc2fb0eae1c09245b0 --- /dev/null +++ b/annotations_1/TcJjhnPrM9o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.01], [5.0, 17.31], [17.0, 19.18], [21.0, 20.82], [22.0, 24.53], [25.0, 28.51], [31.0, 31.06], [32.0, 53.08], [54.0, 56.76], [58.0, 58.89], [60.0, 61.94], [62.0, 63.31], [68.0, 89.51], [91.0, 93.66], [95.0, 97.56], [99.0, 137.49], [138.0, 144.07]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 38.31, 53.16, 0.0, 60.05, 93.76, 0.0, 32.93, 39.04, 0.0, 0.0, 0.0, 48.44, 65.79, 98.19, 0.0, 93.76], "audiomae_on_audioset": [null, [["speech", 71.0], ["slap, smack", 6.57], ["hum", 4.06]], null, null, null, null, null, [["speech", 49.28], ["hum", 18.05], ["music", 8.3]], [["speech", 40.23], ["fly, housefly", 9.64], ["radio", 4.12]], null, null, null, [["speech", 46.81], ["fly, housefly", 8.86], ["insect", 5.75]], null, null, null, null], "duration": [0.01, 12.31, 2.18, -0.18, 2.53, 3.51, 0.06, 21.08, 2.76, 0.89, 1.94, 1.31, 21.51, 2.66, 2.56, 38.49, 6.07]} \ No newline at end of file diff --git a/annotations_1/TcaAWs46kog_filtered.json b/annotations_1/TcaAWs46kog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78a1f6b3debf688894d5307584972c14094c2a4f --- /dev/null +++ b/annotations_1/TcaAWs46kog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.67], [19.0, 21.61], [23.0, 35.41], [37.0, 44.69], [48.0, 48.57], [49.0, 49.77], [51.0, 52.39], [54.0, 54.08], [57.0, 57.97], [58.0, 59.78], [61.0, 64.86], [66.0, 66.55], [69.0, 69.6], [71.0, 72.91], [75.0, 74.7], [77.0, 77.5], [79.0, 90.51], [92.0, 91.72], [95.0, 100.72], [101.0, 110.96], [112.0, 119.1], [120.0, 120.33], [120.0, 122.01], [131.0, 131.55], [134.0, 135.28], [140.0, 141.02], [142.0, 142.72], [144.0, 144.07], [146.0, 147.68]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, false, true, false, false, false, false, false, false], "silence_prob": [54.76, 57.97, 32.57, 37.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.78, 0.0, 0.0, 0.0, 0.0, 0.0, 43.4, 0.0, 42.17, 46.22, 37.77, 0.0, 33.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 41.11], ["speech", 11.33], ["effects unit", 9.99]], [["music", 39.16], ["quack", 17.12], ["duck", 15.77]], null, null, null, null, null, null, null, null, null, null, null, null, [["quack", 25.58], ["music", 18.31], ["duck", 14.67]], null, [["music", 25.17], ["speech", 10.7], ["didgeridoo", 8.82]], [["music", 39.91], ["singing bowl", 13.67], ["speech", 9.7]], [["speech", 37.67], ["animal", 22.41], ["fart", 2.68]], null, [["speech", 22.57], ["owl", 11.35], ["animal", 9.24]], null, null, null, null, null, null], "duration": [5.67, 2.61, 12.41, 7.69, 0.57, 0.77, 1.39, 0.08, 0.97, 1.78, 3.86, 0.55, 0.6, 1.91, -0.3, 0.5, 11.51, -0.28, 5.72, 9.96, 7.1, 0.33, 2.01, 0.55, 1.28, 1.02, 0.72, 0.07, 1.68]} \ No newline at end of file diff --git a/annotations_1/TcndF9QpYAU_filtered.json b/annotations_1/TcndF9QpYAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28b4364a2026881dab1e5267fe50cc557cb2023b --- /dev/null +++ b/annotations_1/TcndF9QpYAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.32], [16.0, 18.01], [24.0, 27.99], [30.0, 29.86], [41.0, 41.47], [55.0, 54.92], [60.0, 60.0], [65.0, 65.62], [69.0, 69.03], [71.0, 72.99], [75.0, 76.57], [78.0, 78.98], [79.0, 80.74], [83.0, 84.57], [86.0, 87.76], [90.0, 90.76], [95.0, 97.48], [98.0, 103.0], [104.0, 108.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 70.86, 51.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 94.07, 97.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 2.01, 3.99, -0.14, 0.47, -0.08, 0.0, 0.62, 0.03, 1.99, 1.57, 0.98, 1.74, 1.57, 1.76, 0.76, 2.48, 5.0, 4.46]} \ No newline at end of file diff --git a/annotations_1/Td3qZIf5Swg_filtered.json b/annotations_1/Td3qZIf5Swg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efc2358da21292b862eb7f95858858d1ab5f5e16 --- /dev/null +++ b/annotations_1/Td3qZIf5Swg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.76], [4.0, 7.25], [8.0, 8.29], [9.0, 12.87], [14.0, 14.86], [19.0, 20.04], [21.0, 22.91], [25.0, 26.22], [30.0, 33.56], [35.0, 36.53], [43.0, 46.55], [48.0, 51.02], [53.0, 66.26], [68.0, 137.39], [140.0, 139.95], [141.0, 141.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 51.23, 0.0, 52.16, 0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 35.91, 39.66, 33.61, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 43.49], ["speech", 12.94], ["didgeridoo", 9.88]], [["music", 53.55], ["synthesizer", 13.51], ["musical instrument", 8.35]], [["music", 62.57], ["brass instrument", 6.82], ["musical instrument", 6.06]], null, null, null], "duration": [0.76, 3.25, 0.29, 3.87, 0.86, 1.04, 1.91, 1.22, 3.56, 1.53, 3.55, 3.02, 13.26, 69.39, -0.05, 0.29]} \ No newline at end of file diff --git a/annotations_1/Te32eYR3jo4_filtered.json b/annotations_1/Te32eYR3jo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..999174effe192ec3c2a4cc163aea67ff11a93f4f --- /dev/null +++ b/annotations_1/Te32eYR3jo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.67], [5.0, 5.53], [6.0, 11.16], [13.0, 16.87], [18.0, 23.16], [24.0, 36.96], [39.0, 57.48], [60.0, 81.03], [84.0, 91.91], [95.0, 99.22], [105.0, 105.87], [107.0, 106.96], [107.0, 107.0], [107.0, 107.32], [107.0, 108.75], [116.0, 116.04], [120.0, 123.16], [125.0, 125.68], [126.0, 126.6], [128.0, 132.56], [135.0, 135.92], [137.0, 140.81], [142.0, 142.6], [144.0, 146.43], [150.0, 150.2], [154.0, 161.97]], "keep_status": [false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 75.23, 36.03, 36.31, 32.5, 29.37, 29.39, 33.8, 48.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.75, 0.0, 0.0, 39.57, 0.0, 72.9, 0.0, 32.52, 0.0, 30.37], "audiomae_on_audioset": [null, null, null, [["music", 34.15], ["throbbing", 10.73], ["speech", 6.63]], [["music", 24.17], ["didgeridoo", 21.66], ["throbbing", 6.07]], [["hum", 55.5], ["mains hum", 17.11], ["throbbing", 10.93]], [["music", 71.33], ["throbbing", 6.79], ["theremin", 5.53]], [["music", 64.88], ["didgeridoo", 25.5], ["animal", 3.01]], [["cattle, bovinae", 23.88], ["animal", 16.37], ["moo", 16.01]], [["animal", 65.68], ["speech", 15.54], ["domestic animals, pets", 5.37]], null, null, null, null, null, null, [["speech", 29.12], ["mains hum", 12.36], ["hum", 10.53]], null, null, [["fire", 28.81], ["speech", 21.78], ["animal", 7.67]], null, null, null, [["speech", 28.16], ["fly, housefly", 10.77], ["insect", 9.0]], null, [["animal", 25.36], ["domestic animals, pets", 18.87], ["dog", 17.25]]], "duration": [1.67, 0.53, 5.16, 3.87, 5.16, 12.96, 18.48, 21.03, 7.91, 4.22, 0.87, -0.04, 0.0, 0.32, 1.75, 0.04, 3.16, 0.68, 0.6, 4.56, 0.92, 3.81, 0.6, 2.43, 0.2, 7.97]} \ No newline at end of file diff --git a/annotations_1/TeSzBaedb2Y_filtered.json b/annotations_1/TeSzBaedb2Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62d2367a31a5709e065350a05cc5d7751816691e --- /dev/null +++ b/annotations_1/TeSzBaedb2Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.41], [19.0, 21.05], [24.0, 28.0], [31.0, 30.97], [33.0, 33.59], [36.0, 42.26], [47.0, 48.24], [50.0, 58.01], [65.0, 65.75], [66.0, 66.73], [72.0, 72.71], [76.0, 76.71], [83.0, 84.28], [85.0, 86.54], [87.0, 96.11], [98.0, 159.11], [161.0, 163.63], [165.0, 164.62], [165.0, 166.48], [168.0, 169.13]], "keep_status": [true, true, true, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [32.38, 36.97, 30.33, 0.0, 0.0, 29.8, 0.0, 29.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.47, 0.0, 29.61, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["groan", 19.28], ["grunt", 14.71], ["sound effect", 13.46]], [["speech", 51.68], ["busy signal", 4.4], ["grunt", 3.3]], [["sound effect", 26.58], ["speech", 16.67], ["fart", 6.99]], null, null, [["music", 57.14], ["speech", 22.34], ["grunt", 3.39]], null, [["speech", 37.67], ["music", 22.73], ["groan", 6.83]], null, null, null, null, null, null, [["music", 31.41], ["livestock, farm animals, working animals", 14.17], ["cattle, bovinae", 10.83]], null, [["speech", 30.67], ["music", 22.85], ["hum", 10.66]], null, null, null], "duration": [3.41, 2.05, 4.0, -0.03, 0.59, 6.26, 1.24, 8.01, 0.75, 0.73, 0.71, 0.71, 1.28, 1.54, 9.11, 61.11, 2.63, -0.38, 1.48, 1.13]} \ No newline at end of file diff --git a/annotations_1/TeeNLFHot1Q_filtered.json b/annotations_1/TeeNLFHot1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..721a70d4666f193a47145c7216b42aabb369ae37 --- /dev/null +++ b/annotations_1/TeeNLFHot1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.07], [11.0, 11.43], [12.0, 12.8], [13.0, 14.0], [16.0, 19.3], [20.0, 21.63], [28.0, 28.78], [33.0, 40.86], [45.0, 45.54], [46.0, 46.45], [52.0, 52.56], [66.0, 67.05], [68.0, 68.76], [69.0, 70.38], [72.0, 72.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 41.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 45.45], ["mains hum", 17.07], ["music", 12.19]], null, null, null, null, null, null, null], "duration": [1.07, 0.43, 0.8, 1.0, 3.3, 1.63, 0.78, 7.86, 0.54, 0.45, 0.56, 1.05, 0.76, 1.38, 0.66]} \ No newline at end of file diff --git a/annotations_1/TfbuiIc3pME_filtered.json b/annotations_1/TfbuiIc3pME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b867decdf19ad2f83fffb95f62b79af0b9263d96 --- /dev/null +++ b/annotations_1/TfbuiIc3pME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.39], [25.0, 64.37], [66.0, 77.06], [80.0, 103.79], [109.0, 114.78], [119.0, 132.11], [147.0, 147.58], [148.0, 148.68], [154.0, 155.09]], "keep_status": [true, false, true, false, true, true, false, false, false], "silence_prob": [29.46, 0.0, 28.46, 28.72, 40.14, 34.74, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 22.54], ["hum", 18.98], ["throbbing", 18.75]], null, [["hum", 24.13], ["music", 22.07], ["throbbing", 19.5]], [["mains hum", 44.05], ["hum", 27.25], ["music", 17.31]], [["hum", 31.69], ["mains hum", 25.01], ["throbbing", 11.41]], [["hum", 27.77], ["cough", 13.43], ["throbbing", 11.01]], null, null, null], "duration": [2.39, 39.37, 11.06, 23.79, 5.78, 13.11, 0.58, 0.68, 1.09]} \ No newline at end of file diff --git a/annotations_1/TffPDHIwQtc_filtered.json b/annotations_1/TffPDHIwQtc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e156c982d41cbf0a513a8e56664d408ffa9d5d7 --- /dev/null +++ b/annotations_1/TffPDHIwQtc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.34], [9.0, 9.14], [14.0, 29.89], [30.0, 30.13], [33.0, 36.91], [38.0, 53.94], [55.0, 55.27], [56.0, 56.0], [56.0, 56.86], [60.0, 75.09], [80.0, 102.32], [103.0, 105.27]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [34.22, 0.0, 38.11, 0.0, 49.45, 51.77, 0.0, 0.0, 0.0, 78.89, 37.65, 38.05], "audiomae_on_audioset": [[["hum", 15.42], ["speech", 9.3], ["vehicle", 6.08]], null, [["hum", 39.48], ["throbbing", 27.11], ["mains hum", 12.31]], null, [["fly, housefly", 24.04], ["insect", 20.59], ["hum", 8.21]], null, null, null, null, null, [["hum", 42.47], ["mains hum", 23.9], ["buzz", 10.01]], [["mains hum", 48.78], ["hum", 38.55], ["fly, housefly", 2.96]]], "duration": [3.34, 0.14, 15.89, 0.13, 3.91, 15.94, 0.27, 0.0, 0.86, 15.09, 22.32, 2.27]} \ No newline at end of file diff --git a/annotations_1/TfsGgp4go6k_filtered.json b/annotations_1/TfsGgp4go6k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35b5f1cfd2534dfa583210cbab9e90598913d175 --- /dev/null +++ b/annotations_1/TfsGgp4go6k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.94], [7.0, 7.03], [14.0, 14.1], [16.0, 17.42], [22.0, 22.37], [23.0, 23.92], [41.0, 41.44], [47.0, 46.89], [47.0, 47.24], [63.0, 66.9], [71.0, 73.04], [74.0, 75.42], [83.0, 83.56], [100.0, 105.53], [106.0, 106.59], [118.0, 119.2], [120.0, 120.73]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.65, 96.17, 0.0, 0.0, 31.65, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["fly, housefly", 29.95], ["speech", 18.0], ["insect", 11.68]], null, null, null, [["music", 36.24], ["sidetone", 23.18], ["drum machine", 5.82]], null, null, null], "duration": [1.94, 0.03, 0.1, 1.42, 0.37, 0.92, 0.44, -0.11, 0.24, 3.9, 2.04, 1.42, 0.56, 5.53, 0.59, 1.2, 0.73]} \ No newline at end of file diff --git a/annotations_1/TgujxmrRUlw_filtered.json b/annotations_1/TgujxmrRUlw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abe2315de430fa5f133f4a0f19169deb34253fa0 --- /dev/null +++ b/annotations_1/TgujxmrRUlw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.06], [27.0, 27.46], [29.0, 29.71], [35.0, 39.87], [47.0, 47.19], [56.0, 56.59], [74.0, 74.78], [75.0, 76.55], [82.0, 82.07], [93.0, 105.16], [107.0, 108.63], [114.0, 115.26], [116.0, 117.59], [120.0, 120.53]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.03, 0.0, 0.0, 0.0, 0.0, 0.0, 30.11, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 36.65], ["music", 27.25], ["horse", 3.96]], null, null, null, null, null, [["music", 41.37], ["speech", 25.73], ["crowd", 11.98]], null, null, null, null], "duration": [0.06, 0.46, 0.71, 4.87, 0.19, 0.59, 0.78, 1.55, 0.07, 12.16, 1.63, 1.26, 1.59, 0.53]} \ No newline at end of file diff --git a/annotations_1/TgzbVMwrr7s_filtered.json b/annotations_1/TgzbVMwrr7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..380b9518564417d2edd067eb972a6037308ff173 --- /dev/null +++ b/annotations_1/TgzbVMwrr7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.14], [13.0, 15.2], [25.0, 26.15], [27.0, 28.07], [35.0, 36.8], [45.0, 45.72], [47.0, 47.12], [47.0, 48.44], [55.0, 55.63], [57.0, 58.06], [61.0, 61.82], [64.0, 65.72], [69.0, 89.33], [90.0, 91.84], [93.0, 93.24], [97.0, 97.77], [103.0, 104.41], [107.0, 109.11], [113.0, 124.61], [125.0, 130.94], [132.0, 148.34], [152.0, 152.12], [153.0, 154.99], [159.0, 160.35], [162.0, 162.01], [163.0, 164.08], [167.0, 172.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.31, 0.0, 0.0, 0.0, 0.0, 96.17, 66.76, 42.3, 45.49, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.5], ["hum", 19.19], ["speech", 4.9]], [["music", 42.7], ["hum", 26.24], ["mains hum", 10.17]], null, null, null, null, null, null], "duration": [1.14, 2.2, 1.15, 1.07, 1.8, 0.72, 0.12, 1.44, 0.63, 1.06, 0.82, 1.72, 20.33, 1.84, 0.24, 0.77, 1.41, 2.11, 11.61, 5.94, 16.34, 0.12, 1.99, 1.35, 0.01, 1.08, 5.0]} \ No newline at end of file diff --git a/annotations_1/ThCnJ2m0exo_filtered.json b/annotations_1/ThCnJ2m0exo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c1711af8a092dc08a0205c954848e970bfb5f0b --- /dev/null +++ b/annotations_1/ThCnJ2m0exo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 55.05], [55.0, 57.28], [58.0, 74.56]], "keep_status": [false, true, true], "silence_prob": [29.52, 30.78, 33.1], "audiomae_on_audioset": [[["music", 70.89], ["noise", 6.43], ["cacophony", 5.74]], [["music", 39.59], ["electronic music", 3.3], ["cattle, bovinae", 2.9]], [["hum", 28.06], ["throbbing", 16.19], ["music", 13.47]]], "duration": [16.05, 2.28, 16.56]} \ No newline at end of file diff --git a/annotations_1/ThIBEo7fsSQ_filtered.json b/annotations_1/ThIBEo7fsSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d5456687f464fee13c62349aa4bec31f320d7b3 --- /dev/null +++ b/annotations_1/ThIBEo7fsSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.85], [2.0, 3.55], [5.0, 5.27], [7.0, 7.32], [8.0, 9.81], [11.0, 12.46], [14.0, 14.81], [16.0, 17.74], [50.0, 50.36], [63.0, 64.99], [70.0, 71.83], [74.0, 74.61], [78.0, 81.58], [99.0, 99.93], [102.0, 103.11], [105.0, 104.87], [128.0, 128.98], [140.0, 139.85], [157.0, 157.0], [159.0, 159.31], [165.0, 166.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.85, 1.55, 0.27, 0.32, 1.81, 1.46, 0.81, 1.74, 0.36, 1.99, 1.83, 0.61, 3.58, 0.93, 1.11, -0.13, 0.98, -0.15, 0.0, 0.31, 1.24]} \ No newline at end of file diff --git a/annotations_1/ThWvubM3qSs_filtered.json b/annotations_1/ThWvubM3qSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/ThWvubM3qSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/ThdpcnGKsVY_filtered.json b/annotations_1/ThdpcnGKsVY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4ef6a3328b0f1f31b29f934eeb2f8101a3e04a6 --- /dev/null +++ b/annotations_1/ThdpcnGKsVY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 13.56], [17.0, 30.84], [33.0, 35.43], [36.0, 37.72], [42.0, 45.06], [46.0, 47.21], [50.0, 51.46], [53.0, 53.69], [54.0, 62.48], [64.0, 65.03], [66.0, 76.32], [78.0, 92.8], [96.0, 106.57], [109.0, 109.0], [109.0, 114.15], [116.0, 137.22], [141.0, 143.29], [146.0, 147.6], [152.0, 153.72]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [44.9, 46.68, 30.41, 0.0, 65.44, 0.0, 0.0, 0.0, 46.97, 0.0, 45.95, 31.33, 30.89, 0.0, 34.94, 38.25, 33.92, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 29.18], ["mains hum", 25.89], ["music", 20.05]], [["music", 63.98], ["theremin", 10.22], ["ambient music", 4.02]], [["music", 31.62], ["carnatic music", 9.72], ["mantra", 6.12]], null, null, null, null, null, [["speech", 65.93], ["music", 10.52], ["sheep", 7.76]], null, [["music", 52.21], ["hum", 13.47], ["mains hum", 6.4]], [["music", 82.05], ["scary music", 3.72], ["theremin", 2.98]], [["music", 69.02], ["theremin", 6.26], ["ambient music", 6.22]], null, [["music", 49.25], ["ambient music", 23.17], ["theremin", 4.86]], [["music", 81.82], ["scary music", 4.01], ["ambient music", 2.75]], [["music", 59.62], ["mantra", 4.22], ["foghorn", 3.72]], null, null], "duration": [10.56, 13.84, 2.43, 1.72, 3.06, 1.21, 1.46, 0.69, 8.48, 1.03, 10.32, 14.8, 10.57, 0.0, 5.15, 21.22, 2.29, 1.6, 1.72]} \ No newline at end of file diff --git a/annotations_1/Tht98G49dos_filtered.json b/annotations_1/Tht98G49dos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3356d48f35f9f6e68f3ce2c479eeee6dbcb360ea --- /dev/null +++ b/annotations_1/Tht98G49dos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.19], [9.0, 9.17], [26.0, 31.5], [32.0, 33.88], [64.0, 64.02], [70.0, 73.23], [78.0, 78.33], [79.0, 79.91], [82.0, 82.97], [88.0, 88.74], [92.0, 92.45], [96.0, 96.09], [107.0, 107.69], [129.0, 132.75], [137.0, 136.78]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.11, 0.0, 0.0, 31.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.82, 0.0], "audiomae_on_audioset": [null, null, [["music", 52.4], ["drum", 6.35], ["speech", 4.3]], null, null, [["music", 69.9], ["speech", 4.3], ["electronic music", 3.88]], null, null, null, null, null, null, null, [["cattle, bovinae", 33.72], ["moo", 32.42], ["livestock, farm animals, working animals", 24.03]], null], "duration": [0.19, 0.17, 5.5, 1.88, 0.02, 3.23, 0.33, 0.91, 0.97, 0.74, 0.45, 0.09, 0.69, 3.75, -0.22]} \ No newline at end of file diff --git a/annotations_1/TiJBxtM5iKw_filtered.json b/annotations_1/TiJBxtM5iKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2897804c023b18dc86f7bc393c98a62891d108b3 --- /dev/null +++ b/annotations_1/TiJBxtM5iKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 61.3], [66.0, 78.44], [79.0, 79.91], [83.0, 106.98], [108.0, 123.99], [126.0, 126.47], [129.0, 143.46], [144.0, 151.38], [152.0, 152.93], [154.0, 161.54]], "keep_status": [false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 29.43, 0.0, 29.59, 29.24, 0.0, 29.32, 45.18, 0.0, 29.98], "audiomae_on_audioset": [null, [["music", 66.12], ["trance music", 7.05], ["electronic music", 6.57]], null, [["music", 60.8], ["livestock, farm animals, working animals", 6.9], ["throbbing", 5.93]], [["theremin", 56.61], ["music", 29.98], ["whale vocalization", 1.46]], null, [["music", 33.83], ["throbbing", 9.54], ["whip", 7.17]], [["speech", 32.19], ["coin (dropping)", 8.03], ["mechanisms", 6.29]], null, [["speech", 67.78], ["explosion", 7.31], ["music", 6.09]]], "duration": [0.3, 12.44, 0.91, 23.98, 15.99, 0.47, 14.46, 7.38, 0.93, 7.54]} \ No newline at end of file diff --git a/annotations_1/TiQaVmutQwg_filtered.json b/annotations_1/TiQaVmutQwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a395fd831c8d185c5ff7e4555360c84c32bcd6c8 --- /dev/null +++ b/annotations_1/TiQaVmutQwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 45.96], [47.0, 48.74], [51.0, 51.43], [53.0, 53.69], [54.0, 65.6], [67.0, 75.12], [77.0, 77.3], [78.0, 78.75], [80.0, 80.59], [81.0, 82.14], [83.0, 83.35], [84.0, 90.12]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.26, 40.21, 0.0, 0.0, 0.0, 0.0, 0.0, 29.43], "audiomae_on_audioset": [null, null, null, null, [["music", 30.34], ["splash, splatter", 8.08], ["frog", 7.66]], [["speech", 23.03], ["music", 18.59], ["radio", 7.11]], null, null, null, null, null, [["speech", 37.41], ["music", 7.1], ["buzz", 6.09]]], "duration": [0.96, 1.74, 0.43, 0.69, 11.6, 8.12, 0.3, 0.75, 0.59, 1.14, 0.35, 6.12]} \ No newline at end of file diff --git a/annotations_1/Tid44iy6Rjs_filtered.json b/annotations_1/Tid44iy6Rjs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8447c57920ca73a9b439a595680be48ba507ec22 --- /dev/null +++ b/annotations_1/Tid44iy6Rjs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.09], [14.0, 14.57], [20.0, 21.3], [23.0, 23.84], [28.0, 28.97], [30.0, 30.72], [31.0, 31.99], [41.0, 41.74], [44.0, 44.27], [65.0, 70.46], [71.0, 73.26], [73.0, 77.58], [79.0, 79.24], [81.0, 82.14], [85.0, 85.16], [90.0, 91.72], [95.0, 95.22], [107.0, 108.48], [110.0, 110.03], [113.0, 114.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 87.37, 60.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.09, 0.57, 1.3, 0.84, 0.97, 0.72, 0.99, 0.74, 0.27, 5.46, 2.26, 4.58, 0.24, 1.14, 0.16, 1.72, 0.22, 1.48, 0.03, 1.02]} \ No newline at end of file diff --git a/annotations_1/Tiz3eN3KJRQ_filtered.json b/annotations_1/Tiz3eN3KJRQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3b289549a0ab761a060786f6a8048b0cfde4cf3 --- /dev/null +++ b/annotations_1/Tiz3eN3KJRQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.68], [23.0, 36.49], [44.0, 43.88], [44.0, 62.01], [64.0, 65.45], [67.0, 67.47], [72.0, 76.77], [77.0, 136.12], [137.0, 139.01], [141.0, 144.29], [145.0, 146.16], [147.0, 155.9]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 43.66, 0.0, 45.98, 0.0, 0.0, 31.77, 0.0, 34.25, 30.46, 0.0, 46.09], "audiomae_on_audioset": [null, [["speech", 44.07], ["animal", 21.89], ["horse", 3.99]], null, [["music", 66.14], ["animal", 4.13], ["mouse", 3.53]], null, null, [["fart", 58.97], ["music", 17.28], ["didgeridoo", 16.07]], null, [["mosquito", 52.85], ["fly, housefly", 17.28], ["insect", 15.95]], [["music", 17.51], ["speech", 10.51], ["fart", 5.87]], null, [["music", 65.11], ["theremin", 4.21], ["musical instrument", 4.0]]], "duration": [1.68, 13.49, -0.12, 18.01, 1.45, 0.47, 4.77, 59.12, 2.01, 3.29, 1.16, 8.9]} \ No newline at end of file diff --git a/annotations_1/TjY8crETM6s_filtered.json b/annotations_1/TjY8crETM6s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f98b53f6b2a0d9a7aa7857f9d519fb5a5fd16952 --- /dev/null +++ b/annotations_1/TjY8crETM6s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.4], [9.0, 12.78], [14.0, 14.4], [15.0, 16.5], [24.0, 32.12], [37.0, 37.47], [40.0, 48.74], [52.0, 67.86], [70.0, 101.68], [107.0, 109.19]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [32.85, 33.59, 0.0, 0.0, 29.5, 0.0, 29.7, 28.64, 0.0, 31.47], "audiomae_on_audioset": [[["music", 67.03], ["speech", 5.89], ["throbbing", 2.5]], [["speech", 44.07], ["rumble", 25.29], ["mains hum", 4.41]], null, null, [["speech", 51.62], ["hum", 14.03], ["mains hum", 10.55]], null, [["hum", 28.58], ["music", 27.78], ["throbbing", 27.46]], [["speech", 46.28], ["hum", 9.23], ["whack, thwack", 5.94]], null, [["speech", 60.15], ["music", 5.47], ["vehicle", 4.7]]], "duration": [3.4, 3.78, 0.4, 1.5, 8.12, 0.47, 8.74, 15.86, 31.68, 2.19]} \ No newline at end of file diff --git a/annotations_1/TjvHy-IYET8_filtered.json b/annotations_1/TjvHy-IYET8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..267796e640721c1a2c28b809acedafd6e9938490 --- /dev/null +++ b/annotations_1/TjvHy-IYET8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 22.91], [28.0, 28.56], [30.0, 31.08], [33.0, 34.15], [36.0, 36.22], [37.0, 37.69], [40.0, 50.36], [51.0, 53.15], [55.0, 56.08], [59.0, 62.33], [63.0, 75.32], [78.0, 78.66], [80.0, 81.95], [82.0, 83.0]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.38, 35.49, 0.0, 57.56, 40.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 24.28], ["hum", 17.18], ["throbbing", 13.67]], [["speech", 19.46], ["music", 18.57], ["echo", 18.26]], null, null, [["music", 62.78], ["hum", 5.96], ["speech", 5.68]], null, null, null], "duration": [-0.09, 0.56, 1.08, 1.15, 0.22, 0.69, 10.36, 2.15, 1.08, 3.33, 12.32, 0.66, 1.95, 1.0]} \ No newline at end of file diff --git a/annotations_1/Tkjw0XB9Xuc_filtered.json b/annotations_1/Tkjw0XB9Xuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..653c89cedc463b8135e9ccbc313806e89b8ab038 --- /dev/null +++ b/annotations_1/Tkjw0XB9Xuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 13.63], [14.0, 14.72], [16.0, 15.94], [17.0, 21.76], [22.0, 21.95], [22.0, 50.14], [51.0, 73.41], [74.0, 83.08], [84.0, 101.36], [106.0, 107.32], [109.0, 111.69], [115.0, 124.9], [128.0, 130.13], [134.0, 138.33]], "keep_status": [true, false, false, true, false, true, true, true, true, false, true, true, true, true], "silence_prob": [29.1, 0.0, 0.0, 28.44, 0.0, 28.66, 30.02, 28.27, 29.01, 0.0, 29.15, 28.6, 28.48, 29.31], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 37.45], ["cattle, bovinae", 21.01], ["music", 9.3]], null, null, [["cattle, bovinae", 13.41], ["speech", 11.42], ["moo", 11.17]], null, [["music", 32.68], ["boom", 7.55], ["explosion", 6.85]], [["music", 41.64], ["hum", 15.31], ["speech", 5.05]], [["music", 25.65], ["cattle, bovinae", 16.88], ["speech", 8.38]], [["electric shaver, electric razor", 7.78], ["animal", 7.09], ["music", 7.04]], null, [["breaking", 21.4], ["livestock, farm animals, working animals", 7.87], ["sound effect", 7.76]], [["music", 51.42], ["buzz", 9.77], ["speech", 5.57]], [["speech", 22.44], ["music", 15.65], ["whoosh, swoosh, swish", 8.81]], [["music", 26.79], ["cowbell", 17.47], ["boing", 7.21]]], "duration": [9.63, 0.72, -0.06, 4.76, -0.05, 28.14, 22.41, 9.08, 17.36, 1.32, 2.69, 9.9, 2.13, 4.33]} \ No newline at end of file diff --git a/annotations_1/TknTP23YYFI_filtered.json b/annotations_1/TknTP23YYFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76f19c47aa641fbf053eeb692118db6e7358ce9d --- /dev/null +++ b/annotations_1/TknTP23YYFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 14.22], [15.0, 15.03], [15.0, 19.94], [23.0, 27.63], [28.0, 29.74], [30.0, 29.88], [30.0, 35.58], [43.0, 44.14], [50.0, 51.27], [59.0, 59.36], [62.0, 61.99], [67.0, 67.09], [70.0, 70.16], [74.0, 75.27], [79.0, 79.91], [85.0, 85.16], [86.0, 87.18], [89.0, 96.09], [101.0, 107.52], [109.0, 109.71], [115.0, 117.64], [121.0, 121.07], [124.0, 125.9], [127.0, 127.84], [132.0, 132.41], [140.0, 143.09], [146.0, 146.16], [149.0, 149.88], [162.0, 163.11], [165.0, 167.26], [170.0, 172.88], [177.0, 176.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.31, 0.0, 45.65, 53.28, 0.0, 0.0, 58.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 100.0, 0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 94.52, 93.13, 0.0], "audiomae_on_audioset": [null, null, [["music", 37.53], ["speech", 21.7], ["sidetone", 19.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.22, 0.03, 4.94, 4.63, 1.74, -0.12, 5.58, 1.14, 1.27, 0.36, -0.01, 0.09, 0.16, 1.27, 0.91, 0.16, 1.18, 7.09, 6.52, 0.71, 2.64, 0.07, 1.9, 0.84, 0.41, 3.09, 0.16, 0.88, 1.11, 2.26, 2.88, -0.01]} \ No newline at end of file diff --git a/annotations_1/TlyHBaAJVbk_filtered.json b/annotations_1/TlyHBaAJVbk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bca76febc1a12bc5ab3b766993d48bb988a082a9 --- /dev/null +++ b/annotations_1/TlyHBaAJVbk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 103.98], [105.0, 107.52], [109.0, 109.98], [111.0, 145.62]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 55.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [53.98, 2.52, 0.98, 34.62]} \ No newline at end of file diff --git a/annotations_1/TmALN8vdU0s_filtered.json b/annotations_1/TmALN8vdU0s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c29803263aaa41515099aef59337d03fe125247 --- /dev/null +++ b/annotations_1/TmALN8vdU0s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.97], [5.0, 25.73], [29.0, 29.42], [30.0, 60.64], [61.0, 67.68], [68.0, 73.14], [74.0, 78.44], [79.0, 84.18], [86.0, 86.71], [89.0, 96.99], [98.0, 98.64], [100.0, 100.63], [102.0, 102.61], [104.0, 104.14], [108.0, 108.09], [113.0, 113.95], [120.0, 119.91], [120.0, 124.31]], "keep_status": [false, false, false, false, true, true, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 77.03, 0.0, 0.0, 28.88, 44.84, 32.31, 29.53, 0.0, 74.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.48], "audiomae_on_audioset": [null, null, null, null, [["music", 25.72], ["didgeridoo", 9.52], ["fart", 8.75]], [["music", 22.19], ["hum", 11.03], ["mains hum", 9.07]], [["music", 22.81], ["hum", 13.85], ["buzz", 6.86]], [["speech", 25.71], ["didgeridoo", 22.17], ["radio", 10.2]], null, null, null, null, null, null, null, null, null, [["speech", 80.34], ["sidetone", 5.77], ["breaking", 1.83]]], "duration": [-0.03, 20.73, 0.42, 30.64, 6.68, 5.14, 4.44, 5.18, 0.71, 7.99, 0.64, 0.63, 0.61, 0.14, 0.09, 0.95, -0.09, 4.31]} \ No newline at end of file diff --git a/annotations_1/TmTq2M6xgEs_filtered.json b/annotations_1/TmTq2M6xgEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2110ec23f5c9dd3f572eb40687eea475f5ba9b54 --- /dev/null +++ b/annotations_1/TmTq2M6xgEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.55], [8.0, 10.49], [12.0, 15.57], [18.0, 20.95], [23.0, 26.25], [28.0, 31.83], [33.0, 34.25], [36.0, 37.25], [39.0, 47.24], [55.0, 56.37], [62.0, 84.01], [85.0, 89.78], [96.0, 95.67], [99.0, 102.81], [105.0, 105.48], [108.0, 110.61], [112.0, 113.05], [122.0, 124.29]], "keep_status": [false, true, false, false, true, false, false, false, false, false, true, false, false, true, false, true, false, true], "silence_prob": [0.0, 45.85, 61.67, 52.05, 48.44, 61.08, 0.0, 0.0, 37.35, 0.0, 32.77, 32.67, 0.0, 31.04, 0.0, 29.86, 0.0, 33.68], "audiomae_on_audioset": [null, [["hum", 19.02], ["music", 18.81], ["throbbing", 16.24]], null, null, [["music", 55.48], ["hum", 7.64], ["mains hum", 5.6]], null, null, null, [["music", 55.69], ["scary music", 16.38], ["hum", 3.9]], null, [["hum", 27.87], ["music", 22.29], ["mains hum", 7.64]], [["music", 35.63], ["speech", 20.92], ["hum", 18.19]], null, [["music", 49.48], ["speech", 8.94], ["throbbing", 7.29]], null, [["whack, thwack", 17.41], ["thump, thud", 13.11], ["breaking", 12.32]], null, [["fly, housefly", 28.29], ["mosquito", 26.99], ["insect", 6.63]]], "duration": [1.55, 2.49, 3.57, 2.95, 3.25, 3.83, 1.25, 1.25, 8.24, 1.37, 22.01, 4.78, -0.33, 3.81, 0.48, 2.61, 1.05, 2.29]} \ No newline at end of file diff --git a/annotations_1/Tn44a8_14LU_filtered.json b/annotations_1/Tn44a8_14LU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00d2b624558a86960294febf0704e2248cc62aa5 --- /dev/null +++ b/annotations_1/Tn44a8_14LU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.36], [16.0, 17.32], [20.0, 24.04], [24.0, 26.37], [29.0, 29.54], [31.0, 31.21], [37.0, 42.3], [43.0, 54.62], [56.0, 56.67], [67.0, 69.69], [73.0, 73.62], [75.0, 75.39], [76.0, 77.13], [83.0, 84.37], [85.0, 84.99], [85.0, 85.95], [86.0, 87.12], [88.0, 88.92], [96.0, 99.23], [126.0, 129.12], [130.0, 131.79], [133.0, 134.65], [136.0, 136.53], [138.0, 156.17]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 65.55, 46.9, 0.0, 0.0, 77.2, 71.72, 0.0, 51.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.9, 32.76, 0.0, 0.0, 0.0, 28.37], "audiomae_on_audioset": [null, null, null, [["speech", 27.82], ["sine wave", 17.9], ["sidetone", 9.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 28.39], ["speech", 18.66], ["boing", 11.21]], [["music", 77.98], ["didgeridoo", 8.41], ["musical instrument", 4.23]], null, null, null, [["music", 86.83], ["musical instrument", 3.91], ["guitar", 1.51]]], "duration": [1.36, 1.32, 4.04, 2.37, 0.54, 0.21, 5.3, 11.62, 0.67, 2.69, 0.62, 0.39, 1.13, 1.37, -0.01, 0.95, 1.12, 0.92, 3.23, 3.12, 1.79, 1.65, 0.53, 18.17]} \ No newline at end of file diff --git a/annotations_1/ToF0U78xIyA_filtered.json b/annotations_1/ToF0U78xIyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a3e77b11412e38aa04d36285306f25da9779ab2 --- /dev/null +++ b/annotations_1/ToF0U78xIyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.12], [9.0, 11.35], [12.0, 13.14], [16.0, 18.22], [21.0, 26.67], [29.0, 30.81], [35.0, 36.54], [38.0, 38.47], [43.0, 48.32], [57.0, 58.65], [64.0, 65.26], [67.0, 68.13], [78.0, 78.81], [80.0, 81.36], [82.0, 81.94], [84.0, 85.45], [87.0, 88.67], [90.0, 90.56], [92.0, 95.89], [97.0, 97.63], [98.0, 98.07], [98.0, 100.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [63.42, 71.14, 0.0, 64.63, 92.31, 0.0, 0.0, 0.0, 31.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 38.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 37.85], ["breaking", 23.26], ["whack, thwack", 9.62]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.35], ["throbbing", 9.5], ["hum", 5.53]]], "duration": [2.12, 2.35, 1.14, 2.22, 5.67, 1.81, 1.54, 0.47, 5.32, 1.65, 1.26, 1.13, 0.81, 1.36, -0.06, 1.45, 1.67, 0.56, 3.89, 0.63, 0.07, 2.84]} \ No newline at end of file diff --git a/annotations_1/Tp9iK2u30qQ_filtered.json b/annotations_1/Tp9iK2u30qQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06c05d2efdb9da19dc36773d5165cdb1053bd045 --- /dev/null +++ b/annotations_1/Tp9iK2u30qQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.67], [11.0, 12.46], [15.0, 16.17], [19.0, 19.85], [23.0, 23.99], [26.0, 53.7], [56.0, 62.53], [64.0, 65.5], [72.0, 101.34], [102.0, 107.01], [109.0, 130.2], [134.0, 143.94], [149.0, 154.45], [155.0, 163.44], [164.0, 164.2], [164.0, 165.6]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.94, 29.37, 0.0, 48.06, 53.53, 36.84, 36.44, 36.29, 37.27, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 40.1], ["music", 27.7], ["mains hum", 19.16]], [["hum", 18.13], ["throbbing", 8.41], ["music", 8.25]], null, [["speech", 57.91], ["music", 14.41], ["breaking", 8.11]], null, [["music", 69.9], ["ambient music", 13.43], ["electronic music", 3.17]], [["music", 54.99], ["speech", 13.06], ["ambient music", 8.53]], [["scary music", 57.03], ["music", 37.98], ["soundtrack music", 1.04]], [["music", 58.53], ["scary music", 17.89], ["speech", 7.6]], null, null], "duration": [1.67, 1.46, 1.17, 0.85, 0.99, 27.7, 6.53, 1.5, 29.34, 5.01, 21.2, 9.94, 5.45, 8.44, 0.2, 1.6]} \ No newline at end of file diff --git a/annotations_1/TpNPIxWdZgY_filtered.json b/annotations_1/TpNPIxWdZgY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cb4155ea6e3387aa2ef344dbe228b8259a97b5f --- /dev/null +++ b/annotations_1/TpNPIxWdZgY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.96], [16.0, 24.17], [26.0, 27.4], [28.0, 29.93], [31.0, 32.16], [36.0, 36.91], [38.0, 42.96], [44.0, 55.92], [56.0, 58.33], [60.0, 61.82], [64.0, 66.33], [68.0, 68.42], [69.0, 71.22], [74.0, 75.1], [77.0, 78.06], [79.0, 81.67], [83.0, 86.31], [88.0, 88.45], [89.0, 91.35], [96.0, 121.53], [123.0, 124.83], [125.0, 127.75], [129.0, 131.01], [135.0, 136.31], [140.0, 141.18], [143.0, 144.91], [148.0, 149.05], [150.0, 151.92], [153.0, 154.8], [156.0, 157.27], [158.0, 159.24], [161.0, 161.81], [162.0, 166.58], [168.0, 168.98], [171.0, 172.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.73, 99.99, 0.0, 0.0, 0.0, 0.0, 88.64, 60.79, 54.04, 0.0, 81.71, 0.0, 87.37, 0.0, 0.0, 68.02, 88.46, 0.0, 86.27, 68.8, 0.0, 58.13, 62.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.04, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.96, 8.17, 1.4, 1.93, 1.16, 0.91, 4.96, 11.92, 2.33, 1.82, 2.33, 0.42, 2.22, 1.1, 1.06, 2.67, 3.31, 0.45, 2.35, 25.53, 1.83, 2.75, 2.01, 1.31, 1.18, 1.91, 1.05, 1.92, 1.8, 1.27, 1.24, 0.81, 4.58, 0.98, 1.13]} \ No newline at end of file diff --git a/annotations_1/Tq9zhCo-PTQ_filtered.json b/annotations_1/Tq9zhCo-PTQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57732faeccadb9638168d053bb8450f90c441f2b --- /dev/null +++ b/annotations_1/Tq9zhCo-PTQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.86], [6.0, 8.51], [11.0, 13.32], [16.0, 15.9], [18.0, 18.57], [24.0, 24.34], [25.0, 24.88], [26.0, 27.48], [28.0, 28.48], [36.0, 60.72], [66.0, 67.53], [70.0, 77.84], [85.0, 87.91], [93.0, 97.93], [99.0, 111.59], [113.0, 116.45], [117.0, 118.18], [119.0, 119.33], [122.0, 131.25], [135.0, 137.0], [139.0, 141.24], [145.0, 147.63], [152.0, 164.13], [166.0, 168.72], [171.0, 174.55], [175.0, 175.88], [177.0, 181.36], [182.0, 187.0], [188.0, 188.27], [189.0, 194.05], [194.0, 199.25], [200.0, 203.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, true, false, false, false, false, true, true, true], "silence_prob": [0.0, 73.51, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.96, 0.0, 51.23, 66.88, 59.33, 41.38, 65.55, 0.0, 0.0, 36.04, 37.93, 40.95, 71.87, 78.72, 92.15, 44.12, 0.0, 93.13, 80.64, 0.0, 40.24, 40.16, 43.69], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 77.99], ["musical instrument", 3.99], ["singing", 2.11]], null, null, null, null, [["music", 16.2], ["cello", 10.75], ["speech", 8.57]], null, null, null, [["speech", 40.07], ["music", 29.69], ["didgeridoo", 8.53]], [["didgeridoo", 20.0], ["moo", 14.86], ["cattle, bovinae", 13.8]], [["speech", 30.2], ["fly, housefly", 14.99], ["music", 13.51]], null, null, null, [["speech", 41.96], ["radio", 8.35], ["noise", 7.19]], null, null, null, null, [["music", 29.04], ["speech", 11.38], ["musical instrument", 4.67]], [["music", 42.38], ["theremin", 12.21], ["speech", 8.83]], [["music", 46.38], ["musical instrument", 7.6], ["theremin", 7.39]]], "duration": [0.86, 2.51, 2.32, -0.1, 0.57, 0.34, -0.12, 1.48, 0.48, 24.72, 1.53, 7.84, 2.91, 4.93, 12.59, 3.45, 1.18, 0.33, 9.25, 2.0, 2.24, 2.63, 12.13, 2.72, 3.55, 0.88, 4.36, 5.0, 0.27, 5.05, 5.25, 3.03]} \ No newline at end of file diff --git a/annotations_1/Tr3_HOXg4Ug_filtered.json b/annotations_1/Tr3_HOXg4Ug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..766ab34bda2cbe6b7448c801afbe8e8609f539e6 --- /dev/null +++ b/annotations_1/Tr3_HOXg4Ug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.69], [15.0, 29.76], [31.0, 31.11], [32.0, 38.2], [39.0, 38.97], [39.0, 39.18], [39.0, 40.81], [42.0, 43.68], [45.0, 58.29]], "keep_status": [true, false, false, true, false, false, false, false, true], "silence_prob": [31.13, 31.63, 0.0, 30.57, 0.0, 0.0, 0.0, 0.0, 39.49], "audiomae_on_audioset": [[["music", 32.45], ["throbbing", 13.11], ["mains hum", 9.21]], [["music", 65.07], ["musical instrument", 4.64], ["speech", 3.92]], null, [["speech", 39.87], ["mains hum", 12.35], ["music", 12.17]], null, null, null, null, [["music", 31.02], ["didgeridoo", 19.45], ["whack, thwack", 4.4]]], "duration": [5.69, 14.76, 0.11, 6.2, -0.03, 0.18, 1.81, 1.68, 13.29]} \ No newline at end of file diff --git a/annotations_1/TrvXqosqkls_filtered.json b/annotations_1/TrvXqosqkls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0a4a10ef1a318b5cd16266f0ce8678ef636b0f8 --- /dev/null +++ b/annotations_1/TrvXqosqkls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.11], [14.0, 13.83], [18.0, 26.81], [28.0, 55.98], [59.0, 102.69], [105.0, 108.78], [111.0, 111.4], [113.0, 134.47], [137.0, 138.99], [140.0, 140.64], [142.0, 147.88], [149.0, 153.71], [156.0, 156.73], [159.0, 159.87], [162.0, 165.67], [168.0, 170.7], [172.0, 175.02], [176.0, 176.88], [178.0, 185.89], [187.0, 187.62], [191.0, 192.3], [194.0, 215.22], [218.0, 250.32], [251.0, 253.88], [255.0, 266.67], [268.0, 273.1], [276.0, 279.51], [281.0, 282.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, true, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 28.93, 28.68, 0.0, 29.27, 0.0, 29.26, 0.0, 0.0, 29.42, 29.39, 0.0, 0.0, 30.02, 29.34, 29.44, 0.0, 29.21, 0.0, 0.0, 28.95, 0.0, 34.6, 38.58, 59.77, 73.21, 0.0], "audiomae_on_audioset": [null, null, [["music", 81.27], ["synthesizer", 5.61], ["didgeridoo", 2.07]], [["hum", 34.95], ["mains hum", 27.97], ["music", 21.53]], null, [["music", 72.34], ["theremin", 7.58], ["musical instrument", 4.47]], null, [["music", 50.72], ["hum", 20.45], ["throbbing", 9.01]], null, null, [["music", 54.69], ["musical instrument", 7.32], ["synthesizer", 5.48]], [["music", 43.22], ["synthesizer", 5.08], ["electronic music", 4.11]], null, null, [["music", 40.87], ["synthesizer", 24.35], ["musical instrument", 7.62]], [["music", 34.5], ["speech", 16.15], ["noise", 6.81]], [["music", 33.27], ["musical instrument", 10.63], ["brass instrument", 5.44]], null, [["music", 46.29], ["speech", 20.92], ["sidetone", 2.53]], null, null, [["music", 41.61], ["speech", 23.55], ["foghorn", 5.65]], null, [["hum", 38.18], ["mains hum", 16.21], ["music", 12.58]], [["rumble", 45.79], ["hum", 25.99], ["mains hum", 8.64]], null, null, null], "duration": [1.11, -0.17, 8.81, 27.98, 43.69, 3.78, 0.4, 21.47, 1.99, 0.64, 5.88, 4.71, 0.73, 0.87, 3.67, 2.7, 3.02, 0.88, 7.89, 0.62, 1.3, 21.22, 32.32, 2.88, 11.67, 5.1, 3.51, 1.66]} \ No newline at end of file diff --git a/annotations_1/Trx5K54MNp8_filtered.json b/annotations_1/Trx5K54MNp8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6dd3989d38cb5c50e18f85adc8014ecbbd26ffb2 --- /dev/null +++ b/annotations_1/Trx5K54MNp8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 30.77], [32.0, 57.64], [59.0, 83.74], [90.0, 112.6], [118.0, 121.64], [122.0, 123.74], [129.0, 160.27], [161.0, 161.74], [162.0, 163.83]], "keep_status": [false, true, true, true, true, false, false, false, false], "silence_prob": [43.03, 38.88, 37.0, 29.67, 32.45, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 57.23], ["speech", 7.29], ["stomach rumble", 6.85]], [["livestock, farm animals, working animals", 35.31], ["cattle, bovinae", 12.89], ["moo", 6.9]], [["speech", 36.01], ["glass", 5.83], ["rumble", 5.8]], [["animal", 16.81], ["livestock, farm animals, working animals", 9.76], ["sheep", 7.62]], [["animal", 25.54], ["speech", 20.13], ["dog", 14.37]], null, null, null, null], "duration": [28.77, 25.64, 24.74, 22.6, 3.64, 1.74, 31.27, 0.74, 1.83]} \ No newline at end of file diff --git a/annotations_1/Ts8WRHAQvk4_filtered.json b/annotations_1/Ts8WRHAQvk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..847b7c4e3fcdb973f67550f422b952c8cb6c82b1 --- /dev/null +++ b/annotations_1/Ts8WRHAQvk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [4.0, 4.85], [7.0, 7.86], [10.0, 10.27], [11.0, 11.37], [13.0, 13.29], [14.0, 15.42], [19.0, 19.35], [20.0, 21.07], [25.0, 26.37], [27.0, 28.09], [30.0, 31.51], [33.0, 33.91], [37.0, 37.62], [50.0, 50.35], [58.0, 58.09], [77.0, 77.68], [86.0, 86.14], [92.0, 106.41], [108.0, 108.28], [110.0, 111.38], [116.0, 118.35], [120.0, 121.98], [126.0, 128.09], [130.0, 130.87], [133.0, 133.69], [135.0, 134.64], [138.0, 140.48], [146.0, 158.04], [159.0, 160.52], [162.0, 163.07], [165.0, 166.4], [176.0, 176.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.03, 0.0, 0.0, 50.86, 0.0, 47.82, 0.0, 0.0, 0.0, 53.4, 37.82, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.03], ["rumble", 16.54], ["whale vocalization", 14.91]], null, null, null, null, [["music", 28.53], ["rumble", 5.37], ["throbbing", 4.21]], null, null, null, null, [["throbbing", 24.06], ["music", 14.76], ["hum", 11.56]], null, null, null, null], "duration": [0.54, 0.85, 0.86, 0.27, 0.37, 0.29, 1.42, 0.35, 1.07, 1.37, 1.09, 1.51, 0.91, 0.62, 0.35, 0.09, 0.68, 0.14, 14.41, 0.28, 1.38, 2.35, 1.98, 2.09, 0.87, 0.69, -0.36, 2.48, 12.04, 1.52, 1.07, 1.4, 0.57]} \ No newline at end of file diff --git a/annotations_1/Tt-GdLwV4dA_filtered.json b/annotations_1/Tt-GdLwV4dA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee2a0f919e4f0641ab38d141cf92a6ce044a7df4 --- /dev/null +++ b/annotations_1/Tt-GdLwV4dA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 13.17], [15.0, 20.21], [22.0, 42.33], [53.0, 59.7], [60.0, 60.84], [70.0, 73.58], [79.0, 79.59], [81.0, 97.65]], "keep_status": [true, false, true, true, false, false, false, true], "silence_prob": [33.01, 35.25, 31.16, 31.79, 0.0, 30.76, 0.0, 30.9], "audiomae_on_audioset": [[["music", 51.41], ["noise", 7.73], ["cacophony", 3.27]], [["music", 53.24], ["didgeridoo", 13.76], ["sidetone", 9.12]], [["music", 42.91], ["boing", 5.77], ["speech", 5.38]], [["music", 40.05], ["glockenspiel", 9.97], ["mallet percussion", 7.11]], null, [["moo", 34.21], ["cattle, bovinae", 31.45], ["livestock, farm animals, working animals", 23.38]], null, [["music", 32.16], ["boing", 12.39], ["theremin", 8.29]]], "duration": [9.17, 5.21, 20.33, 6.7, 0.84, 3.58, 0.59, 16.65]} \ No newline at end of file diff --git a/annotations_1/Tt2oL1sVVhM_filtered.json b/annotations_1/Tt2oL1sVVhM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..302c819786fda107d2e067fec7db976cabe4c970 --- /dev/null +++ b/annotations_1/Tt2oL1sVVhM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.42], [12.0, 14.23], [14.0, 14.45], [16.0, 18.08], [19.0, 20.17], [21.0, 45.28], [47.0, 85.75], [88.0, 108.55], [112.0, 119.28]], "keep_status": [false, true, false, false, false, true, false, true, true], "silence_prob": [31.92, 32.02, 0.0, 32.91, 0.0, 31.27, 0.0, 31.23, 30.32], "audiomae_on_audioset": [[["hum", 40.07], ["speech", 21.83], ["mains hum", 10.64]], [["speech", 43.64], ["eruption", 10.16], ["vehicle", 4.55]], null, [["speech", 33.51], ["hum", 22.79], ["mains hum", 16.4]], null, [["speech", 26.57], ["music", 17.92], ["hum", 12.94]], null, [["speech", 40.79], ["music", 17.96], ["eruption", 2.51]], [["speech", 19.05], ["music", 6.79], ["vehicle", 6.48]]], "duration": [5.42, 2.23, 0.45, 2.08, 1.17, 24.28, 38.75, 20.55, 7.28]} \ No newline at end of file diff --git a/annotations_1/Tt7qQmpLA2U_filtered.json b/annotations_1/Tt7qQmpLA2U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..892b8872653ebf532661ce3ab206fc8d7de04f0d --- /dev/null +++ b/annotations_1/Tt7qQmpLA2U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.35], [5.0, 6.61], [10.0, 10.77], [12.0, 11.85], [15.0, 20.31], [21.0, 21.2], [22.0, 23.16], [24.0, 42.99], [52.0, 64.76], [67.0, 69.69], [75.0, 79.03], [81.0, 99.94], [102.0, 102.81], [111.0, 113.59], [121.0, 120.88]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.1, 0.0, 0.0, 30.92, 30.6, 29.58, 29.42, 29.55, 0.0, 29.37, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 67.9], ["throbbing", 6.36], ["electronic music", 6.15]], null, null, [["music", 71.74], ["throbbing", 2.68], ["drum machine", 2.32]], [["music", 59.53], ["speech", 19.41], ["electronic music", 2.34]], [["music", 62.4], ["speech", 4.32], ["electronic music", 3.28]], [["music", 56.6], ["drum machine", 8.24], ["synthesizer", 7.79]], [["music", 69.28], ["throbbing", 6.27], ["hum", 3.04]], null, [["music", 75.85], ["electronic music", 3.93], ["drum machine", 3.06]], null], "duration": [1.35, 1.61, 0.77, -0.15, 5.31, 0.2, 1.16, 18.99, 12.76, 2.69, 4.03, 18.94, 0.81, 2.59, -0.12]} \ No newline at end of file diff --git a/annotations_1/TtALqoM5hkY_filtered.json b/annotations_1/TtALqoM5hkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3465818e2c9de8860c8bb214c145596dd140f04d --- /dev/null +++ b/annotations_1/TtALqoM5hkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 101.48], [103.0, 103.17], [104.0, 103.98], [108.0, 108.36], [111.0, 112.21], [113.0, 114.29], [115.0, 115.47], [116.0, 116.51], [118.0, 118.98], [124.0, 126.66], [128.0, 128.49], [129.0, 129.3], [155.0, 155.36], [165.0, 164.64], [168.0, 168.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [94.48, 0.17, -0.02, 0.36, 1.21, 1.29, 0.47, 0.51, 0.98, 2.66, 0.49, 0.3, 0.36, -0.36, 0.42]} \ No newline at end of file diff --git a/annotations_1/TuBXSOUS-U4_filtered.json b/annotations_1/TuBXSOUS-U4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f33ca4a22e3d49b3625183e4bcef6709a8c4e63 --- /dev/null +++ b/annotations_1/TuBXSOUS-U4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.27], [13.0, 13.86], [14.0, 14.13], [17.0, 17.39], [18.0, 22.92], [23.0, 24.09], [32.0, 31.99], [37.0, 53.45], [58.0, 78.8], [85.0, 94.51], [95.0, 98.24]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [38.04, 0.0, 0.0, 0.0, 35.8, 0.0, 0.0, 31.66, 33.36, 60.98, 60.98], "audiomae_on_audioset": [[["music", 78.42], ["musical instrument", 5.98], ["guitar", 4.05]], null, null, null, [["music", 49.35], ["speech", 16.22], ["whack, thwack", 11.72]], null, null, [["music", 37.2], ["speech", 10.41], ["didgeridoo", 8.99]], [["glass", 53.38], ["music", 14.53], ["breaking", 7.48]], null, null], "duration": [2.27, 0.86, 0.13, 0.39, 4.92, 1.09, -0.01, 16.45, 20.8, 9.51, 3.24]} \ No newline at end of file diff --git a/annotations_1/TunbuB_bBb8_filtered.json b/annotations_1/TunbuB_bBb8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd79923286b1b9ee40cc4adeb73b144e53867ee7 --- /dev/null +++ b/annotations_1/TunbuB_bBb8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.22], [10.0, 11.94], [20.0, 21.61], [22.0, 22.32], [22.0, 22.62], [24.0, 23.72], [27.0, 39.24], [40.0, 42.3], [50.0, 50.62], [52.0, 51.92], [54.0, 55.63], [57.0, 60.37], [67.0, 66.72], [68.0, 68.99], [71.0, 71.14], [80.0, 85.58], [87.0, 87.52], [88.0, 93.55], [99.0, 99.13], [114.0, 118.25], [119.0, 129.05], [139.0, 144.88], [147.0, 148.78], [151.0, 152.34], [157.0, 157.67], [165.0, 166.21], [184.0, 184.76], [188.0, 188.22], [189.0, 191.03], [191.0, 195.24]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.27, 48.35, 0.0, 0.0, 0.0, 28.9, 0.0, 0.0, 0.0, 33.36, 0.0, 30.81, 0.0, 89.9, 81.35, 84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.83, 36.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 23.68], ["chirp tone", 15.06], ["sine wave", 9.68]], null, null, null, [["speech", 54.93], ["music", 22.23], ["explosion", 7.93]], null, null, null, [["music", 36.59], ["throbbing", 20.14], ["hum", 17.33]], null, [["music", 51.24], ["speech", 24.14], ["hum", 3.21]], null, null, null, null, null, null, null, null, null, null, [["speech", 47.88], ["mains hum", 11.27], ["hum", 9.25]], [["speech", 36.75], ["music", 27.79], ["theremin", 8.77]]], "duration": [0.22, 1.94, 1.61, 0.32, 0.62, -0.28, 12.24, 2.3, 0.62, -0.08, 1.63, 3.37, -0.28, 0.99, 0.14, 5.58, 0.52, 5.55, 0.13, 4.25, 10.05, 5.88, 1.78, 1.34, 0.67, 1.21, 0.76, 0.22, 2.03, 4.24]} \ No newline at end of file diff --git a/annotations_1/Tv5BC6yJ61o_filtered.json b/annotations_1/Tv5BC6yJ61o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05af3461d7fc94a51a4ca7cc3e9301e35dbf85e3 --- /dev/null +++ b/annotations_1/Tv5BC6yJ61o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.37], [5.0, 5.24], [6.0, 6.72], [8.0, 8.61], [11.0, 10.98], [12.0, 13.63], [17.0, 19.2], [23.0, 23.45], [26.0, 26.47], [27.0, 27.68], [31.0, 32.05], [33.0, 36.0], [38.0, 39.18], [40.0, 41.59], [44.0, 46.67], [48.0, 53.08], [57.0, 59.8], [62.0, 64.52], [68.0, 69.3], [70.0, 73.55], [75.0, 78.56], [80.0, 85.9], [87.0, 98.36], [99.0, 99.5], [100.0, 155.01], [156.0, 168.84], [172.0, 171.95], [173.0, 174.09], [175.0, 176.15], [179.0, 180.33], [184.0, 184.27], [195.0, 196.53], [198.0, 199.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.66, 0.0, 0.0, 0.0, 0.0, 38.94, 0.0, 0.0, 44.04, 47.46, 68.28, 61.97, 0.0, 72.75, 58.81, 71.72, 36.72, 0.0, 0.0, 42.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.23], ["sidetone", 33.96], ["music", 11.35]], null, null, [["music", 51.64], ["theremin", 24.65], ["musical instrument", 4.24]], [["music", 58.98], ["theremin", 8.13], ["musical instrument", 7.54]], null, null, null, null, null, null, [["sine wave", 43.14], ["tuning fork", 22.09], ["chirp tone", 20.93]], null, null, [["hum", 30.9], ["mains hum", 23.53], ["music", 14.83]], null, null, null, null, null, null, null], "duration": [1.37, 0.24, 0.72, 0.61, -0.02, 1.63, 2.2, 0.45, 0.47, 0.68, 1.05, 3.0, 1.18, 1.59, 2.67, 5.08, 2.8, 2.52, 1.3, 3.55, 3.56, 5.9, 11.36, 0.5, 55.01, 12.84, -0.05, 1.09, 1.15, 1.33, 0.27, 1.53, 1.4]} \ No newline at end of file diff --git a/annotations_1/TvFCzrDQrD8_filtered.json b/annotations_1/TvFCzrDQrD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88ac8cefe26e8aac137b13307977ea7814fd82ad --- /dev/null +++ b/annotations_1/TvFCzrDQrD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.91], [24.0, 30.42], [34.0, 35.33], [37.0, 37.77], [38.0, 39.01], [40.0, 41.17], [42.0, 42.82], [44.0, 44.81], [46.0, 47.73], [49.0, 49.33], [50.0, 51.33], [54.0, 54.35], [56.0, 59.8], [62.0, 61.87], [62.0, 63.05], [77.0, 77.48], [79.0, 79.71], [82.0, 84.38], [85.0, 90.64], [92.0, 93.97], [95.0, 97.02], [98.0, 98.95], [100.0, 105.31], [108.0, 108.63], [110.0, 112.67], [115.0, 115.91]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 34.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.17, 0.0, 0.0, 0.0, 0.0, 90.95, 83.34, 0.0, 84.43, 0.0, 89.19, 0.0, 47.66, 0.0], "audiomae_on_audioset": [null, [["speech", 29.71], ["music", 14.81], ["hum", 10.31]], null, null, null, null, null, null, null, null, null, null, [["music", 25.68], ["hum", 12.1], ["singing bowl", 5.9]], null, null, null, null, null, null, null, null, null, null, null, [["music", 39.02], ["singing bowl", 7.73], ["hum", 7.59]], null], "duration": [0.91, 6.42, 1.33, 0.77, 1.01, 1.17, 0.82, 0.81, 1.73, 0.33, 1.33, 0.35, 3.8, -0.13, 1.05, 0.48, 0.71, 2.38, 5.64, 1.97, 2.02, 0.95, 5.31, 0.63, 2.67, 0.91]} \ No newline at end of file diff --git a/annotations_1/TwnfJ8d9NqY_filtered.json b/annotations_1/TwnfJ8d9NqY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f2ced682cd57de6b1746667ef66d8a552199b32 --- /dev/null +++ b/annotations_1/TwnfJ8d9NqY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 57.81], [60.0, 61.77], [67.0, 81.77], [83.0, 82.9], [84.0, 84.82], [88.0, 90.27], [92.0, 92.25], [93.0, 93.23], [94.0, 94.27], [95.0, 95.47], [98.0, 98.52], [100.0, 100.75]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [66.39, 0.0, 34.75, 0.0, 0.0, 94.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 46.92], ["gunshot, gunfire", 13.65], ["music", 8.82]], null, null, null, null, null, null, null, null, null], "duration": [9.81, 1.77, 14.77, -0.1, 0.82, 2.27, 0.25, 0.23, 0.27, 0.47, 0.52, 0.75]} \ No newline at end of file diff --git a/annotations_1/TxvqZhVwrSY_filtered.json b/annotations_1/TxvqZhVwrSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9e45a5db427e55d3bf9b2d0433d873af9ba5655 --- /dev/null +++ b/annotations_1/TxvqZhVwrSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 33.34], [34.0, 39.04], [43.0, 45.01], [49.0, 51.93], [55.0, 55.19], [57.0, 58.21], [64.0, 64.12], [68.0, 68.66], [71.0, 71.96], [77.0, 78.9], [81.0, 87.81], [88.0, 90.46], [92.0, 92.45], [104.0, 103.76], [108.0, 110.13], [111.0, 112.08], [113.0, 138.38], [140.0, 141.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false], "silence_prob": [28.61, 28.55, 30.18, 29.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.82, 32.45, 0.0, 0.0, 36.66, 0.0, 29.57, 0.0], "audiomae_on_audioset": [[["throbbing", 29.91], ["hum", 27.58], ["speech", 14.03]], [["throbbing", 40.82], ["music", 24.46], ["hum", 15.73]], [["throbbing", 56.73], ["hum", 29.98], ["mains hum", 3.73]], [["throbbing", 45.39], ["music", 20.37], ["hum", 19.7]], null, null, null, null, null, null, [["music", 20.0], ["whack, thwack", 16.16], ["grunt", 7.92]], [["music", 10.71], ["hum", 9.82], ["mains hum", 8.75]], null, null, [["didgeridoo", 67.34], ["music", 17.11], ["hum", 3.11]], null, [["hum", 13.99], ["breaking", 12.29], ["whack, thwack", 10.98]], null], "duration": [11.34, 5.04, 2.01, 2.93, 0.19, 1.21, 0.12, 0.66, 0.96, 1.9, 6.81, 2.46, 0.45, -0.24, 2.13, 1.08, 25.38, 1.35]} \ No newline at end of file diff --git a/annotations_1/TyS98_jQIA0_filtered.json b/annotations_1/TyS98_jQIA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc5a1e9662a7ac32058e8376a479683b21bc91e0 --- /dev/null +++ b/annotations_1/TyS98_jQIA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.92], [13.0, 13.41], [19.0, 19.87], [20.0, 20.88], [25.0, 25.69], [29.0, 30.79], [33.0, 34.15], [37.0, 39.07], [43.0, 43.07], [50.0, 51.16], [54.0, 54.85], [58.0, 58.28], [59.0, 61.65], [63.0, 65.52], [72.0, 72.45], [88.0, 90.49], [93.0, 94.09], [95.0, 96.62], [98.0, 99.06], [101.0, 101.9], [103.0, 104.08], [108.0, 112.48], [114.0, 115.64], [117.0, 118.98], [122.0, 123.57], [124.0, 125.66], [126.0, 129.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0, 0.0, 0.0, 0.0, 87.55, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 0.41, 0.87, 0.88, 0.69, 1.79, 1.15, 2.07, 0.07, 1.16, 0.85, 0.28, 2.65, 2.52, 0.45, 2.49, 1.09, 1.62, 1.06, 0.9, 1.08, 4.48, 1.64, 1.98, 1.57, 1.66, 3.15]} \ No newline at end of file diff --git a/annotations_1/TzNPYPp_v78_filtered.json b/annotations_1/TzNPYPp_v78_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cebcf4a86d1a35a0530791609d7ccb95f2321142 --- /dev/null +++ b/annotations_1/TzNPYPp_v78_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.95], [11.0, 11.58], [14.0, 37.23], [38.0, 58.85], [60.0, 76.96], [77.0, 79.52], [80.0, 80.2], [81.0, 83.05], [84.0, 86.7], [88.0, 88.87], [90.0, 90.9], [98.0, 98.05], [99.0, 100.38], [101.0, 104.38], [106.0, 106.68]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.84, 44.75, 35.65, 70.16, 0.0, 91.98, 81.89, 0.0, 0.0, 0.0, 0.0, 58.05, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 48.22], ["theremin", 24.45], ["wind instrument, woodwind instrument", 7.09]], [["music", 42.86], ["theremin", 11.25], ["musical instrument", 6.34]], null, null, null, null, null, null, null, null, null, null], "duration": [0.95, 0.58, 23.23, 20.85, 16.96, 2.52, 0.2, 2.05, 2.7, 0.87, 0.9, 0.05, 1.38, 3.38, 0.68]} \ No newline at end of file diff --git a/annotations_1/TzRrEgkfhG8_filtered.json b/annotations_1/TzRrEgkfhG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59e63624f392b71f1b518d138cacda3caabeff3e --- /dev/null +++ b/annotations_1/TzRrEgkfhG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 42.45], [46.0, 84.55], [87.0, 89.36], [91.0, 91.71], [94.0, 95.01]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [35.45, 38.55, 2.36, 0.71, 1.01]} \ No newline at end of file diff --git a/annotations_1/U-7MSowBlG8_filtered.json b/annotations_1/U-7MSowBlG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..335da67d753cf45db28266d45ff8b7524929a0f2 --- /dev/null +++ b/annotations_1/U-7MSowBlG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.27], [8.0, 8.8], [12.0, 17.69], [18.0, 18.47], [23.0, 23.65], [28.0, 28.81], [35.0, 36.81], [39.0, 40.36], [41.0, 43.24], [54.0, 54.18], [57.0, 63.24], [65.0, 69.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0, 74.44, 46.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 36.9], ["speech", 11.21], ["musical instrument", 6.6]]], "duration": [0.27, 0.8, 5.69, 0.47, 0.65, 0.81, 1.81, 1.36, 2.24, 0.18, 6.24, 4.03]} \ No newline at end of file diff --git a/annotations_1/U-R21NaE91o_filtered.json b/annotations_1/U-R21NaE91o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fabbb9b3e3b6c009cfdfdc9d28559a15e310e1e4 --- /dev/null +++ b/annotations_1/U-R21NaE91o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [5.0, 7.06], [9.0, 18.37], [19.0, 18.79], [23.0, 27.28], [29.0, 30.97], [32.0, 37.59], [45.0, 45.77], [49.0, 53.7], [60.0, 60.27], [67.0, 77.13], [79.0, 83.15], [85.0, 87.96], [95.0, 96.5], [97.0, 97.7], [102.0, 102.51], [110.0, 110.4], [111.0, 167.8]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 30.6, 31.49, 0.0, 33.33, 0.0, 30.25, 0.0, 30.17, 0.0, 30.44, 28.93, 30.17, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 36.6], ["burping, eructation", 16.45], ["hum", 8.39]], [["speech", 41.63], ["mains hum", 22.63], ["hum", 22.28]], null, [["hum", 46.25], ["throbbing", 33.19], ["mains hum", 16.47]], null, [["music", 33.96], ["throbbing", 28.56], ["hum", 13.67]], null, [["music", 52.54], ["hum", 13.43], ["throbbing", 12.56]], null, [["music", 35.56], ["throbbing", 31.53], ["hum", 12.5]], [["music", 43.59], ["speech", 26.55], ["dubstep", 4.99]], [["music", 55.14], ["burping, eructation", 8.16], ["throbbing", 6.62]], null, null, null, null, null], "duration": [0.98, 2.06, 9.37, -0.21, 4.28, 1.97, 5.59, 0.77, 4.7, 0.27, 10.13, 4.15, 2.96, 1.5, 0.7, 0.51, 0.4, 56.8]} \ No newline at end of file diff --git a/annotations_1/U-Sqe0DN_E8_filtered.json b/annotations_1/U-Sqe0DN_E8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..395a565bc661701098949adb2af7db96cb6a905e --- /dev/null +++ b/annotations_1/U-Sqe0DN_E8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.52], [8.0, 10.45], [14.0, 14.22], [15.0, 15.25], [16.0, 17.83], [19.0, 20.24], [26.0, 26.6], [27.0, 29.0], [30.0, 36.34], [39.0, 39.33], [41.0, 42.74], [46.0, 47.28], [48.0, 49.28], [50.0, 51.8], [53.0, 53.49], [54.0, 54.85], [58.0, 58.23], [63.0, 66.01], [67.0, 68.76], [72.0, 72.4], [76.0, 77.3], [78.0, 79.1], [80.0, 80.6], [84.0, 84.43], [86.0, 89.23], [90.0, 97.8], [99.0, 100.2], [103.0, 105.29], [109.0, 108.65], [119.0, 120.36], [121.0, 122.34], [124.0, 125.68], [127.0, 128.34], [129.0, 132.51], [135.0, 137.13], [139.0, 139.45], [145.0, 145.2], [147.0, 147.53], [149.0, 149.12], [151.0, 163.7], [166.0, 172.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 72.75, 0.0, 0.0, 0.0, 0.0, 0.0, 86.64, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 93.6, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 92.97, 0.0, 0.0, 0.0, 0.0, 89.19, 60.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.52, 2.45, 0.22, 0.25, 1.83, 1.24, 0.6, 2.0, 6.34, 0.33, 1.74, 1.28, 1.28, 1.8, 0.49, 0.85, 0.23, 3.01, 1.76, 0.4, 1.3, 1.1, 0.6, 0.43, 3.23, 7.8, 1.2, 2.29, -0.35, 1.36, 1.34, 1.68, 1.34, 3.51, 2.13, 0.45, 0.2, 0.53, 0.12, 12.7, 6.83]} \ No newline at end of file diff --git a/annotations_1/U0HHhK_MrWg_filtered.json b/annotations_1/U0HHhK_MrWg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..477b0751404497c5f9b284ccb677e7a22745d165 --- /dev/null +++ b/annotations_1/U0HHhK_MrWg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [7.0, 8.6], [20.0, 21.3], [23.0, 23.5], [26.0, 25.81], [27.0, 27.68], [30.0, 30.43], [37.0, 37.59], [40.0, 40.59], [43.0, 43.01], [45.0, 45.52], [48.0, 48.12], [53.0, 53.5], [56.0, 58.85], [59.0, 64.94], [67.0, 69.11], [70.0, 70.48], [78.0, 79.78], [81.0, 82.07], [83.0, 83.35], [92.0, 92.6], [94.0, 94.37], [96.0, 97.36], [101.0, 101.56], [105.0, 109.29], [112.0, 112.11], [114.0, 114.49], [116.0, 116.78], [119.0, 121.05], [124.0, 141.49], [147.0, 147.66], [152.0, 152.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 47.46, 76.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.67, 0.0, 0.0, 0.0, 77.03, 71.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 35.62], ["music", 25.41], ["didgeridoo", 7.17]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 1.6, 1.3, 0.5, -0.19, 0.68, 0.43, 0.59, 0.59, 0.01, 0.52, 0.12, 0.5, 2.85, 5.94, 2.11, 0.48, 1.78, 1.07, 0.35, 0.6, 0.37, 1.36, 0.56, 4.29, 0.11, 0.49, 0.78, 2.05, 17.49, 0.66, 0.68]} \ No newline at end of file diff --git a/annotations_1/U1GUJMTmoMY_filtered.json b/annotations_1/U1GUJMTmoMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3847af50d7555d2f2b557c4410b74da6134ab23 --- /dev/null +++ b/annotations_1/U1GUJMTmoMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.09], [9.0, 9.83], [18.0, 18.96], [26.0, 26.15], [28.0, 28.14], [29.0, 29.84], [33.0, 33.47], [35.0, 35.29], [41.0, 41.52], [55.0, 55.21], [63.0, 63.85], [68.0, 68.07], [70.0, 70.88], [77.0, 77.45], [81.0, 82.09], [88.0, 95.86], [98.0, 98.68], [99.0, 99.67], [109.0, 109.26], [114.0, 114.51], [118.0, 118.45], [121.0, 123.62], [130.0, 130.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [34.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0, 0.0, 0.0, 0.0, 0.0, 36.34, 0.0], "audiomae_on_audioset": [[["music", 44.06], ["didgeridoo", 35.21], ["ambient music", 3.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.45], ["dial tone", 9.05], ["sidetone", 7.14]], null], "duration": [4.09, 0.83, 0.96, 0.15, 0.14, 0.84, 0.47, 0.29, 0.52, 0.21, 0.85, 0.07, 0.88, 0.45, 1.09, 7.86, 0.68, 0.67, 0.26, 0.51, 0.45, 2.62, 0.5]} \ No newline at end of file diff --git a/annotations_1/U1_VGnnMle8_filtered.json b/annotations_1/U1_VGnnMle8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58358d795f4565433da4a92140025b405e735642 --- /dev/null +++ b/annotations_1/U1_VGnnMle8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.02], [8.0, 16.02], [20.0, 21.34], [28.0, 28.68], [31.0, 31.26], [38.0, 41.25], [54.0, 54.31], [55.0, 66.88], [70.0, 69.97], [71.0, 71.14], [73.0, 73.13], [76.0, 76.5], [81.0, 81.57], [93.0, 93.26], [108.0, 107.76], [117.0, 118.77], [130.0, 131.57], [133.0, 133.86], [150.0, 150.31], [152.0, 152.36], [158.0, 160.46], [163.0, 164.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.11, 0.0, 0.0, 0.0, 39.43, 0.0, 33.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.36, 0.0], "audiomae_on_audioset": [null, [["whack, thwack", 35.81], ["speech", 28.37], ["clang", 7.81]], null, null, null, [["throbbing", 46.95], ["hum", 28.73], ["speech", 5.42]], null, [["fart", 47.8], ["speech", 22.33], ["music", 22.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.02, 8.02, 1.34, 0.68, 0.26, 3.25, 0.31, 11.88, -0.03, 0.14, 0.13, 0.5, 0.57, 0.26, -0.24, 1.77, 1.57, 0.86, 0.31, 0.36, 2.46, 1.88]} \ No newline at end of file diff --git a/annotations_1/U22aGOTlIy8_filtered.json b/annotations_1/U22aGOTlIy8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..294d75786a28dc7e9ce42f63d9a70109bd2b3517 --- /dev/null +++ b/annotations_1/U22aGOTlIy8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 60.39], [65.0, 71.07], [75.0, 81.35], [82.0, 82.7], [86.0, 89.83], [91.0, 91.83], [93.0, 93.72], [96.0, 96.82], [98.0, 98.85], [99.0, 102.64], [103.0, 104.16], [107.0, 108.77], [110.0, 117.0], [118.0, 120.46], [122.0, 122.28], [123.0, 126.3], [128.0, 133.98], [136.0, 138.11], [146.0, 152.73], [154.0, 161.62], [164.0, 165.2]], "keep_status": [false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 30.18, 30.44, 0.0, 30.35, 0.0, 0.0, 0.0, 0.0, 31.03, 0.0, 0.0, 31.28, 33.53, 0.0, 32.67, 30.81, 31.02, 30.73, 30.43, 0.0], "audiomae_on_audioset": [null, [["music", 46.28], ["hum", 14.38], ["throbbing", 12.51]], [["music", 55.9], ["didgeridoo", 8.26], ["speech", 4.41]], null, [["speech", 21.92], ["music", 16.66], ["hum", 16.4]], null, null, null, null, [["music", 33.59], ["throbbing", 9.28], ["speech", 8.7]], null, null, [["music", 37.08], ["throbbing", 26.36], ["hum", 11.62]], [["music", 68.81], ["synthesizer", 2.44], ["didgeridoo", 2.24]], null, [["music", 41.45], ["speech", 31.0], ["animal", 4.94]], [["music", 30.5], ["mains hum", 17.68], ["hum", 17.54]], [["mains hum", 21.46], ["speech", 15.95], ["music", 15.24]], [["music", 56.3], ["throbbing", 12.09], ["didgeridoo", 5.66]], [["music", 50.55], ["speech", 22.63], ["whale vocalization", 1.75]], null], "duration": [49.39, 6.07, 6.35, 0.7, 3.83, 0.83, 0.72, 0.82, 0.85, 3.64, 1.16, 1.77, 7.0, 2.46, 0.28, 3.3, 5.98, 2.11, 6.73, 7.62, 1.2]} \ No newline at end of file diff --git a/annotations_1/U2HWD9dymUk_filtered.json b/annotations_1/U2HWD9dymUk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d468e00de77ad8e90477dd922bf2a36180522e43 --- /dev/null +++ b/annotations_1/U2HWD9dymUk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 19.9], [20.0, 19.94], [21.0, 20.71], [21.0, 28.81], [31.0, 31.95], [33.0, 44.78], [45.0, 50.14], [51.0, 50.87], [53.0, 80.13], [81.0, 83.59], [85.0, 91.4], [104.0, 108.65], [109.0, 112.72], [114.0, 132.29], [134.0, 144.61]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 71.72, 0.0, 50.71, 76.7, 0.0, 56.63, 47.58, 44.69, 47.78, 56.93, 46.33, 40.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 34.13], ["wind instrument, woodwind instrument", 19.78], ["flute", 14.03]], [["music", 62.08], ["clock", 7.96], ["ice cream truck, ice cream van", 7.84]], [["music", 74.02], ["soundtrack music", 2.67], ["hum", 2.28]], null, [["music", 80.24], ["theremin", 1.54], ["scary music", 1.43]], [["music", 44.14], ["organ", 13.9], ["theremin", 13.05]]], "duration": [-0.1, -0.06, -0.29, 7.81, 0.95, 11.78, 5.14, -0.13, 27.13, 2.59, 6.4, 4.65, 3.72, 18.29, 10.61]} \ No newline at end of file diff --git a/annotations_1/U2SdWVntd-o_filtered.json b/annotations_1/U2SdWVntd-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5f51eeb1ad4a4a5106f29ae26f5279f499d0f31 --- /dev/null +++ b/annotations_1/U2SdWVntd-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 55.41], [57.0, 58.11], [62.0, 62.02], [64.0, 115.21], [119.0, 123.26], [124.0, 125.29], [127.0, 126.98], [128.0, 132.0], [134.0, 145.0], [146.0, 152.78]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.84, 0.0, 0.0, 49.78, 28.99, 28.09], "audiomae_on_audioset": [null, null, null, null, [["music", 55.35], ["didgeridoo", 8.0], ["synthesizer", 6.75]], null, null, [["music", 64.23], ["mantra", 4.33], ["gong", 1.78]], [["hum", 43.12], ["music", 16.36], ["mains hum", 9.78]], [["music", 46.26], ["speech", 15.72], ["electronic music", 8.44]]], "duration": [53.41, 1.11, 0.02, 51.21, 4.26, 1.29, -0.02, 4.0, 11.0, 6.78]} \ No newline at end of file diff --git a/annotations_1/U4fnEAu1--0_filtered.json b/annotations_1/U4fnEAu1--0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee69e3968dd22b5279677db2ab4a106afcc26f54 --- /dev/null +++ b/annotations_1/U4fnEAu1--0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.03], [4.0, 5.61], [7.0, 8.58], [10.0, 11.08], [19.0, 25.08], [35.0, 37.25], [38.0, 42.57], [43.0, 45.08], [49.0, 49.1], [50.0, 63.0], [65.0, 80.94], [81.0, 82.59], [83.0, 84.91], [88.0, 90.58], [95.0, 97.11], [99.0, 101.88], [103.0, 104.46], [108.0, 112.58], [113.0, 114.56], [116.0, 116.9], [117.0, 120.36], [121.0, 132.53], [134.0, 140.9], [143.0, 145.3], [146.0, 148.68], [150.0, 150.9], [153.0, 157.38], [159.0, 162.26], [166.0, 166.24], [170.0, 171.88], [172.0, 173.52], [176.0, 178.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [81.17, 0.0, 0.0, 0.0, 81.71, 88.64, 95.78, 85.35, 0.0, 31.15, 32.68, 0.0, 0.0, 70.58, 99.97, 83.16, 0.0, 70.72, 0.0, 0.0, 100.0, 99.78, 96.04, 99.48, 96.66, 0.0, 78.55, 30.73, 0.0, 0.0, 0.0, 99.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 45.12], ["music", 41.43], ["whack, thwack", 1.78]], [["music", 77.93], ["throbbing", 4.65], ["hum", 2.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 29.35], ["speech", 18.92], ["music", 15.56]], null, null, null, null], "duration": [2.03, 1.61, 1.58, 1.08, 6.08, 2.25, 4.57, 2.08, 0.1, 13.0, 15.94, 1.59, 1.91, 2.58, 2.11, 2.88, 1.46, 4.58, 1.56, 0.9, 3.36, 11.53, 6.9, 2.3, 2.68, 0.9, 4.38, 3.26, 0.24, 1.88, 1.52, 2.33]} \ No newline at end of file diff --git a/annotations_1/U5EKQ63wREM_filtered.json b/annotations_1/U5EKQ63wREM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98c1470cf9af7008a44002636044e6971600f208 --- /dev/null +++ b/annotations_1/U5EKQ63wREM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[72.0, 73.14], [73.0, 79.62], [82.0, 122.89], [126.0, 127.06], [129.0, 129.86], [132.0, 133.12], [136.0, 142.35], [144.0, 147.04], [148.0, 149.15]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.4, 0.0, 0.0, 0.0, 0.0, 86.64, 88.1, 0.0], "audiomae_on_audioset": [null, [["music", 64.69], ["throbbing", 3.64], ["synthesizer", 3.43]], null, null, null, null, null, null, null], "duration": [1.14, 6.62, 40.89, 1.06, 0.86, 1.12, 6.35, 3.04, 1.15]} \ No newline at end of file diff --git a/annotations_1/U6GY91u1I_c_filtered.json b/annotations_1/U6GY91u1I_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44f11ab6cd6abe72d8c19a315c9d2ade448ee09c --- /dev/null +++ b/annotations_1/U6GY91u1I_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.62], [15.0, 16.41], [20.0, 33.67], [34.0, 35.23], [40.0, 54.94], [55.0, 55.04], [56.0, 61.59], [62.0, 63.24], [72.0, 76.25], [80.0, 94.47], [98.0, 110.46], [118.0, 118.47], [120.0, 128.07], [130.0, 134.37], [136.0, 137.79], [142.0, 145.42], [146.0, 149.47], [154.0, 154.03], [158.0, 158.63], [163.0, 169.62], [174.0, 186.56], [190.0, 203.27]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true], "silence_prob": [29.34, 0.0, 28.85, 0.0, 29.12, 0.0, 28.99, 0.0, 28.77, 28.88, 29.25, 0.0, 29.87, 35.92, 0.0, 53.91, 36.54, 0.0, 0.0, 29.72, 28.74, 29.57], "audiomae_on_audioset": [[["music", 59.73], ["throbbing", 7.15], ["electronic music", 3.95]], null, [["hum", 20.72], ["electric shaver, electric razor", 11.76], ["mains hum", 11.29]], null, [["cattle, bovinae", 23.01], ["music", 19.51], ["livestock, farm animals, working animals", 18.0]], null, [["speech", 47.49], ["music", 22.08], ["whack, thwack", 3.31]], null, [["speech", 72.41], ["burst, pop", 6.48], ["explosion", 5.99]], [["music", 65.51], ["speech", 12.09], ["buzz", 3.72]], [["music", 51.14], ["hum", 13.44], ["throbbing", 8.93]], null, [["music", 46.69], ["speech", 21.05], ["breaking", 4.22]], [["music", 40.54], ["speech", 8.83], ["beep, bleep", 7.19]], null, null, [["theremin", 35.67], ["music", 26.45], ["speech", 13.19]], null, null, [["music", 42.0], ["speech", 36.2], ["whack, thwack", 2.98]], [["music", 41.98], ["speech", 23.17], ["outside, rural or natural", 2.11]], [["speech", 34.69], ["music", 30.86], ["eruption", 3.74]]], "duration": [3.62, 1.41, 13.67, 1.23, 14.94, 0.04, 5.59, 1.24, 4.25, 14.47, 12.46, 0.47, 8.07, 4.37, 1.79, 3.42, 3.47, 0.03, 0.63, 6.62, 12.56, 13.27]} \ No newline at end of file diff --git a/annotations_1/U714emx9EJQ_filtered.json b/annotations_1/U714emx9EJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0287f67275abf240023968425439091f44ffc8e --- /dev/null +++ b/annotations_1/U714emx9EJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [4.0, 9.78], [15.0, 17.88], [23.0, 36.54], [38.0, 59.86], [61.0, 74.44], [78.0, 78.83], [84.0, 89.82]], "keep_status": [false, false, true, false, true, true, false, true], "silence_prob": [0.0, 31.36, 43.03, 41.24, 31.56, 29.78, 0.0, 31.36], "audiomae_on_audioset": [null, [["speech", 57.31], ["music", 13.88], ["musical instrument", 4.83]], [["music", 21.36], ["hum", 15.36], ["throbbing", 10.53]], [["music", 37.27], ["speech", 30.19], ["mains hum", 8.1]], [["music", 47.78], ["hum", 13.51], ["mains hum", 6.77]], [["explosion", 15.32], ["music", 13.34], ["smash, crash", 7.46]], null, [["music", 24.9], ["thunk", 22.36], ["firecracker", 10.43]]], "duration": [0.57, 5.78, 2.88, 13.54, 21.86, 13.44, 0.83, 5.82]} \ No newline at end of file diff --git a/annotations_1/U74NUVSKuP0_filtered.json b/annotations_1/U74NUVSKuP0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57e51d7eeef4f27ae910748a31afe8f4405843ea --- /dev/null +++ b/annotations_1/U74NUVSKuP0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 31.63], [34.0, 38.1], [41.0, 68.94], [69.0, 96.94], [100.0, 108.36], [110.0, 131.94]], "keep_status": [false, true, false, true, false, true], "silence_prob": [30.32, 29.6, 36.99, 30.41, 35.08, 28.96], "audiomae_on_audioset": [[["mains hum", 48.2], ["hum", 27.65], ["gong", 4.19]], [["music", 28.73], ["explosion", 19.21], ["hum", 4.23]], [["music", 48.05], ["hum", 18.0], ["throbbing", 5.8]], [["music", 56.24], ["hum", 6.51], ["mains hum", 4.98]], [["music", 44.87], ["throbbing", 20.08], ["hum", 16.81]], [["music", 39.1], ["throbbing", 19.63], ["hum", 9.07]]], "duration": [5.63, 4.1, 27.94, 27.94, 8.36, 21.94]} \ No newline at end of file diff --git a/annotations_1/U7HxeKhKgwM_filtered.json b/annotations_1/U7HxeKhKgwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..844fff09b433d1e60a33e2ea1e51e31713d44b25 --- /dev/null +++ b/annotations_1/U7HxeKhKgwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 55.54], [59.0, 63.05], [63.0, 71.34], [73.0, 95.25], [97.0, 99.0], [102.0, 121.61], [124.0, 128.29], [129.0, 136.93], [138.0, 148.91], [149.0, 149.12]], "keep_status": [false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 55.18, 30.36, 31.34, 96.42, 87.92, 63.85, 33.66, 36.57, 0.0], "audiomae_on_audioset": [null, null, [["speech", 46.48], ["machine gun", 28.45], ["gunshot, gunfire", 4.74]], [["speech", 30.29], ["music", 15.65], ["smash, crash", 12.38]], null, null, null, [["music", 56.21], ["speech", 17.34], ["noise", 4.09]], [["music", 37.79], ["fly, housefly", 26.09], ["mosquito", 18.85]], null], "duration": [34.54, 4.05, 8.34, 22.25, 2.0, 19.61, 4.29, 7.93, 10.91, 0.12]} \ No newline at end of file diff --git a/annotations_1/U7jlC1QNaUM_filtered.json b/annotations_1/U7jlC1QNaUM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cab3599edca894289ceef98984e4afa71202aa79 --- /dev/null +++ b/annotations_1/U7jlC1QNaUM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[52.0, 67.02], [69.0, 70.09], [72.0, 74.14], [74.0, 107.45], [109.0, 123.38], [128.0, 138.3], [139.0, 155.16], [156.0, 167.51], [170.0, 176.08]], "keep_status": [false, false, false, false, true, true, false, false, false], "silence_prob": [52.51, 0.0, 53.1, 0.0, 45.95, 45.75, 65.32, 56.86, 57.48], "audiomae_on_audioset": [null, null, null, null, [["music", 24.59], ["hum", 15.57], ["throbbing", 14.19]], [["music", 36.74], ["hum", 15.96], ["mains hum", 11.83]], null, null, null], "duration": [15.02, 1.09, 2.14, 33.45, 14.38, 10.3, 16.16, 11.51, 6.08]} \ No newline at end of file diff --git a/annotations_1/U8fgto8IZLM_filtered.json b/annotations_1/U8fgto8IZLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80a7f34ddf7e8cb637033d66a289bf71afe6346a --- /dev/null +++ b/annotations_1/U8fgto8IZLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.87], [10.0, 11.25], [12.0, 12.48], [15.0, 18.59], [27.0, 31.36], [33.0, 33.91], [37.0, 38.74], [40.0, 43.29], [47.0, 48.03], [53.0, 54.38], [56.0, 67.41], [69.0, 69.8], [74.0, 74.41], [77.0, 77.03], [79.0, 81.33], [94.0, 94.74], [95.0, 97.36], [98.0, 99.0], [108.0, 109.32], [109.0, 109.38], [111.0, 110.94], [112.0, 112.38], [113.0, 113.07], [114.0, 115.86], [117.0, 119.91], [121.0, 121.46], [160.0, 161.05], [164.0, 164.1], [166.0, 166.36]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 58.22, 43.28, 0.0, 0.0, 30.21, 0.0, 0.0, 30.53, 0.0, 0.0, 0.0, 91.98, 0.0, 73.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 61.03], ["speech", 4.25], ["throbbing", 2.69]], null, null, [["moo", 45.9], ["cattle, bovinae", 39.18], ["livestock, farm animals, working animals", 9.98]], null, null, [["music", 43.99], ["cattle, bovinae", 14.33], ["moo", 9.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 1.25, 0.48, 3.59, 4.36, 0.91, 1.74, 3.29, 1.03, 1.38, 11.41, 0.8, 0.41, 0.03, 2.33, 0.74, 2.36, 1.0, 1.32, 0.38, -0.06, 0.38, 0.07, 1.86, 2.91, 0.46, 1.05, 0.1, 0.36]} \ No newline at end of file diff --git a/annotations_1/U9WHLcpvVz0_filtered.json b/annotations_1/U9WHLcpvVz0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..861458abf3ccd9a8455430e5871350c4580ae923 --- /dev/null +++ b/annotations_1/U9WHLcpvVz0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.43], [8.0, 8.09], [13.0, 13.64], [28.0, 34.7], [38.0, 49.74], [51.0, 53.84], [55.0, 56.66], [59.0, 59.64], [67.0, 71.27], [80.0, 80.16], [92.0, 102.63], [106.0, 113.86], [116.0, 120.56]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 34.68, 29.59, 35.91, 0.0, 0.0, 31.12, 0.0, 31.3, 30.55, 32.3], "audiomae_on_audioset": [null, null, null, [["music", 60.65], ["hum", 7.29], ["gong", 5.43]], [["hum", 43.88], ["mains hum", 19.47], ["throbbing", 11.3]], [["music", 33.32], ["hum", 19.66], ["throbbing", 12.68]], null, null, [["music", 27.56], ["throbbing", 20.88], ["hum", 16.33]], null, [["music", 71.82], ["throbbing", 4.58], ["synthesizer", 4.07]], [["music", 60.78], ["musical instrument", 5.02], ["didgeridoo", 2.23]], [["music", 48.02], ["speech", 10.78], ["fart", 4.31]]], "duration": [0.43, 0.09, 0.64, 6.7, 11.74, 2.84, 1.66, 0.64, 4.27, 0.16, 10.63, 7.86, 4.56]} \ No newline at end of file diff --git a/annotations_1/U9t_bzEKBnA_filtered.json b/annotations_1/U9t_bzEKBnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6edbf9f72eedc8a649c8bacbe71be1164505b8a3 --- /dev/null +++ b/annotations_1/U9t_bzEKBnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.05], [26.0, 26.42], [28.0, 28.71], [33.0, 34.89], [36.0, 36.48], [37.0, 38.96], [40.0, 41.15], [42.0, 44.19], [45.0, 48.98], [50.0, 50.52], [63.0, 63.32], [70.0, 70.01], [71.0, 72.86], [78.0, 79.12], [80.0, 80.25], [81.0, 81.08], [82.0, 82.98], [83.0, 84.23], [87.0, 87.13], [90.0, 90.36], [91.0, 95.5], [96.0, 99.76], [100.0, 102.69], [103.0, 105.83], [111.0, 112.89], [115.0, 116.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 70.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 71.72, 58.3, 67.63, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 0.42, 0.71, 1.89, 0.48, 1.96, 1.15, 2.19, 3.98, 0.52, 0.32, 0.01, 1.86, 1.12, 0.25, 0.08, 0.98, 1.23, 0.13, 0.36, 4.5, 3.76, 2.69, 2.83, 1.89, 1.87]} \ No newline at end of file diff --git a/annotations_1/UAoJ_mv0Pqo_filtered.json b/annotations_1/UAoJ_mv0Pqo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d39dd79f9f70d48a1f064b04dd2deb6145089993 --- /dev/null +++ b/annotations_1/UAoJ_mv0Pqo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 16.77], [17.0, 21.52], [24.0, 25.17], [29.0, 29.05], [33.0, 34.11], [36.0, 38.18], [40.0, 40.44], [42.0, 42.6], [44.0, 56.42], [58.0, 58.11], [59.0, 60.4], [63.0, 63.69], [64.0, 65.45], [67.0, 67.39], [68.0, 99.87], [101.0, 103.81], [105.0, 106.14], [108.0, 125.86], [128.0, 138.15], [139.0, 149.17]], "keep_status": [false, true, false, false, false, true, false, false, true, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [33.04, 41.83, 0.0, 0.0, 0.0, 32.1, 0.0, 0.0, 33.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.17, 0.0, 32.66, 30.43, 30.95], "audiomae_on_audioset": [[["hum", 49.23], ["mains hum", 20.0], ["throbbing", 13.09]], [["throbbing", 24.24], ["speech", 18.12], ["hum", 12.58]], null, null, null, [["hum", 16.41], ["eruption", 11.74], ["mains hum", 7.7]], null, null, [["music", 25.18], ["speech", 16.73], ["mains hum", 8.63]], null, null, null, null, null, null, [["speech", 20.3], ["music", 12.78], ["hum", 12.6]], null, [["music", 31.83], ["mains hum", 20.49], ["hum", 20.23]], [["speech", 39.59], ["music", 13.6], ["hum", 12.37]], [["hum", 34.96], ["mains hum", 32.47], ["music", 9.2]]], "duration": [8.77, 4.52, 1.17, 0.05, 1.11, 2.18, 0.44, 0.6, 12.42, 0.11, 1.4, 0.69, 1.45, 0.39, 31.87, 2.81, 1.14, 17.86, 10.15, 10.17]} \ No newline at end of file diff --git a/annotations_1/UB1xsj0ZiKA_filtered.json b/annotations_1/UB1xsj0ZiKA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07099374584f459743b3f91e9a0eda3329f5fbf8 --- /dev/null +++ b/annotations_1/UB1xsj0ZiKA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.66], [11.0, 18.5], [24.0, 25.59], [33.0, 40.26], [45.0, 49.79], [59.0, 62.73], [71.0, 72.45], [75.0, 78.6], [86.0, 87.24], [89.0, 90.1], [92.0, 93.16], [95.0, 97.43], [100.0, 106.79], [117.0, 117.0], [120.0, 123.13], [127.0, 128.11], [143.0, 144.1], [148.0, 161.3], [166.0, 194.32]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [28.9, 29.56, 0.0, 29.13, 28.59, 29.94, 0.0, 29.25, 0.0, 0.0, 0.0, 29.91, 29.05, 0.0, 29.99, 0.0, 0.0, 28.88, 28.85], "audiomae_on_audioset": [[["hum", 48.04], ["music", 14.67], ["mains hum", 8.35]], [["music", 35.06], ["throbbing", 23.88], ["hum", 21.7]], null, [["music", 34.17], ["throbbing", 13.41], ["hum", 12.38]], [["speech", 45.93], ["music", 20.57], ["ship", 6.63]], [["music", 34.84], ["mains hum", 18.16], ["hum", 12.2]], null, [["mains hum", 33.42], ["hum", 32.45], ["throbbing", 11.76]], null, null, null, [["music", 29.57], ["ambient music", 16.96], ["synthesizer", 7.5]], [["music", 54.45], ["ambient music", 15.1], ["synthesizer", 9.08]], null, [["music", 40.67], ["mains hum", 18.71], ["hum", 11.47]], null, null, [["music", 74.72], ["ambient music", 10.03], ["soundtrack music", 1.99]], [["music", 48.98], ["didgeridoo", 14.94], ["hum", 9.45]]], "duration": [3.66, 7.5, 1.59, 7.26, 4.79, 3.73, 1.45, 3.6, 1.24, 1.1, 1.16, 2.43, 6.79, 0.0, 3.13, 1.11, 1.1, 13.3, 28.32]} \ No newline at end of file diff --git a/annotations_1/UBOcWFBBB04_filtered.json b/annotations_1/UBOcWFBBB04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f85135a3e47e20db0426a69808dcf8cfa10a72a --- /dev/null +++ b/annotations_1/UBOcWFBBB04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.62], [12.0, 11.65], [20.0, 20.46], [21.0, 21.56], [23.0, 24.93], [26.0, 26.86], [28.0, 28.73], [33.0, 34.48], [39.0, 39.46], [48.0, 48.73], [53.0, 53.86], [56.0, 57.1], [71.0, 70.85], [74.0, 75.41], [79.0, 79.64], [81.0, 81.92], [85.0, 85.33], [86.0, 86.29], [90.0, 91.15], [93.0, 93.01], [95.0, 97.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.62, -0.35, 0.46, 0.56, 1.93, 0.86, 0.73, 1.48, 0.46, 0.73, 0.86, 1.1, -0.15, 1.41, 0.64, 0.92, 0.33, 0.29, 1.15, 0.01, 2.87]} \ No newline at end of file diff --git a/annotations_1/UBWIoJF2X4A_filtered.json b/annotations_1/UBWIoJF2X4A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ccfe8d9faf9e9b0255d31ca0662abfc235c628f0 --- /dev/null +++ b/annotations_1/UBWIoJF2X4A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 18.86], [22.0, 27.48], [29.0, 29.4], [40.0, 52.57], [54.0, 69.77]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 33.34, 0.0, 28.96, 28.75], "audiomae_on_audioset": [null, [["music", 60.85], ["speech", 7.64], ["fireworks", 2.59]], null, [["music", 77.49], ["speech", 5.59], ["electronic music", 2.06]], [["music", 71.45], ["livestock, farm animals, working animals", 3.49], ["moo", 3.32]]], "duration": [-0.14, 5.48, 0.4, 12.57, 15.77]} \ No newline at end of file diff --git a/annotations_1/UBmxdy6C4JI_filtered.json b/annotations_1/UBmxdy6C4JI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..372f82a9fd0a1212f77efd3a296811fc37ab15e4 --- /dev/null +++ b/annotations_1/UBmxdy6C4JI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.2], [22.0, 24.73], [29.0, 29.96], [35.0, 40.19], [41.0, 41.59], [42.0, 42.57], [44.0, 44.56], [46.0, 46.75], [50.0, 55.85], [58.0, 60.79], [64.0, 64.35], [67.0, 79.86], [81.0, 81.75], [86.0, 93.04], [101.0, 105.9], [107.0, 111.11], [115.0, 132.26], [139.0, 141.24], [142.0, 142.84], [143.0, 149.99], [154.0, 159.81], [163.0, 168.27], [172.0, 176.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.54, 0.0, 31.93, 0.0, 0.0, 0.0, 0.0, 31.45, 31.92, 0.0, 31.1, 0.0, 31.95, 32.66, 33.38, 31.58, 33.48, 0.0, 30.59, 31.34, 31.63, 47.01], "audiomae_on_audioset": [null, [["music", 73.25], ["musical instrument", 4.85], ["guitar", 4.21]], null, [["music", 84.83], ["musical instrument", 4.74], ["guitar", 4.12]], null, null, null, null, [["music", 75.01], ["musical instrument", 4.05], ["cacophony", 3.95]], [["music", 86.91], ["musical instrument", 3.93], ["guitar", 3.32]], null, [["music", 78.01], ["musical instrument", 5.57], ["guitar", 4.2]], null, [["music", 81.19], ["speech", 9.72], ["musical instrument", 2.6]], [["music", 60.57], ["cacophony", 5.66], ["musical instrument", 5.42]], [["music", 62.36], ["throbbing", 8.78], ["hum", 4.78]], [["music", 86.22], ["musical instrument", 4.2], ["guitar", 3.16]], [["music", 80.65], ["throbbing", 2.93], ["musical instrument", 2.37]], null, [["music", 57.52], ["speech", 12.8], ["noise", 8.29]], [["music", 80.12], ["whack, thwack", 2.69], ["fart", 1.41]], [["music", 89.71], ["musical instrument", 2.85], ["cacophony", 1.24]], [["music", 39.7], ["throbbing", 26.01], ["hum", 12.47]]], "duration": [0.2, 2.73, 0.96, 5.19, 0.59, 0.57, 0.56, 0.75, 5.85, 2.79, 0.35, 12.86, 0.75, 7.04, 4.9, 4.11, 17.26, 2.24, 0.84, 6.99, 5.81, 5.27, 4.67]} \ No newline at end of file diff --git a/annotations_1/UBnufwe-p_c_filtered.json b/annotations_1/UBnufwe-p_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00a45198798e81ac45127cb491122306ceff2b0e --- /dev/null +++ b/annotations_1/UBnufwe-p_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.17], [9.0, 24.87], [29.0, 29.3], [30.0, 33.03], [35.0, 35.13], [36.0, 36.64], [39.0, 41.01], [42.0, 42.69], [44.0, 52.74], [57.0, 57.37], [60.0, 61.55], [65.0, 69.26], [71.0, 72.23], [72.0, 74.53], [79.0, 83.19], [84.0, 84.72], [91.0, 91.35], [94.0, 104.75], [105.0, 109.27], [110.0, 110.51], [111.0, 142.48]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [29.18, 28.59, 0.0, 32.19, 0.0, 0.0, 31.87, 0.0, 28.62, 0.0, 0.0, 28.72, 0.0, 28.62, 29.65, 0.0, 0.0, 28.92, 29.86, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 41.22], ["throbbing", 36.59], ["mains hum", 9.53]], [["vehicle", 28.53], ["car", 18.8], ["music", 17.3]], null, [["throbbing", 46.34], ["music", 25.21], ["hum", 13.34]], null, null, [["throbbing", 43.64], ["hum", 21.74], ["music", 20.0]], null, [["vehicle", 23.94], ["skidding", 23.29], ["music", 16.23]], null, null, [["music", 44.64], ["vehicle", 15.77], ["car", 7.37]], null, [["music", 30.51], ["speech", 9.12], ["throbbing", 9.05]], [["hum", 42.29], ["throbbing", 25.18], ["music", 9.01]], null, null, [["music", 57.57], ["hum", 17.88], ["throbbing", 10.68]], [["hum", 48.7], ["throbbing", 31.48], ["music", 9.9]], null, null], "duration": [4.17, 15.87, 0.3, 3.03, 0.13, 0.64, 2.01, 0.69, 8.74, 0.37, 1.55, 4.26, 1.23, 2.53, 4.19, 0.72, 0.35, 10.75, 4.27, 0.51, 31.48]} \ No newline at end of file diff --git a/annotations_1/UC6sKTqfgg8_filtered.json b/annotations_1/UC6sKTqfgg8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62512428a8fd4754b1c45fe1df7c8c910e997bda --- /dev/null +++ b/annotations_1/UC6sKTqfgg8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.41], [27.0, 50.77], [53.0, 53.5], [59.0, 64.42], [67.0, 71.36], [74.0, 73.8], [75.0, 75.51], [76.0, 76.4], [78.0, 78.51], [80.0, 80.87], [82.0, 82.16], [84.0, 91.57], [93.0, 93.18], [95.0, 100.5], [104.0, 105.95], [108.0, 110.69], [112.0, 116.14], [119.0, 122.54], [126.0, 126.23], [128.0, 144.51], [145.0, 144.64], [145.0, 145.0], [145.0, 145.67]], "keep_status": [false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.96, 0.0, 39.89, 49.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 93.91, 0.0, 59.68, 90.95, 76.04, 0.0, 39.88, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 41.37], ["didgeridoo", 19.08], ["speech", 9.21]], null, [["fly, housefly", 14.67], ["noise", 10.7], ["hum", 10.55]], [["fly, housefly", 28.51], ["bee, wasp, etc.", 17.52], ["insect", 14.11]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 36.9], ["music", 29.92], ["speech", 18.5]], null, null, null], "duration": [0.41, 23.77, 0.5, 5.42, 4.36, -0.2, 0.51, 0.4, 0.51, 0.87, 0.16, 7.57, 0.18, 5.5, 1.95, 2.69, 4.14, 3.54, 0.23, 16.51, -0.36, 0.0, 0.67]} \ No newline at end of file diff --git a/annotations_1/UCCkKfTVEy4_filtered.json b/annotations_1/UCCkKfTVEy4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb8372968cc99f9c5e62ecd6bf21b6e56455f070 --- /dev/null +++ b/annotations_1/UCCkKfTVEy4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 14.72], [18.0, 20.38], [26.0, 27.6], [30.0, 34.32], [51.0, 51.7], [60.0, 61.33], [62.0, 78.54], [86.0, 86.76], [89.0, 95.94], [110.0, 114.64], [120.0, 124.39], [128.0, 128.26], [139.0, 150.03]], "keep_status": [false, true, false, true, false, false, false, false, true, true, true, false, true], "silence_prob": [28.96, 34.33, 0.0, 30.77, 0.0, 0.0, 28.88, 0.0, 29.49, 30.21, 29.18, 0.0, 28.66], "audiomae_on_audioset": [[["buzz", 43.14], ["music", 33.82], ["vehicle", 3.35]], [["hum", 18.71], ["mains hum", 16.13], ["throbbing", 13.43]], null, [["noise", 29.73], ["music", 16.37], ["cacophony", 4.73]], null, null, [["music", 58.71], ["buzz", 9.21], ["mains hum", 4.43]], null, [["music", 51.43], ["hum", 9.67], ["throbbing", 7.61]], [["speech", 22.44], ["music", 16.4], ["foghorn", 12.53]], [["music", 25.79], ["vehicle", 6.1], ["electronic music", 5.77]], null, [["music", 45.18], ["throbbing", 7.89], ["hum", 7.64]]], "duration": [11.72, 2.38, 1.6, 4.32, 0.7, 1.33, 16.54, 0.76, 6.94, 4.64, 4.39, 0.26, 11.03]} \ No newline at end of file diff --git a/annotations_1/UCGdsPwcKKg_filtered.json b/annotations_1/UCGdsPwcKKg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7697d798fa64ea6f590a3e84c125b6356dbfe892 --- /dev/null +++ b/annotations_1/UCGdsPwcKKg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.37], [23.0, 24.17], [30.0, 30.48], [32.0, 67.49], [71.0, 73.18], [81.0, 88.75], [90.0, 112.72], [113.0, 118.5], [121.0, 160.42], [161.0, 161.5], [162.0, 177.21], [177.0, 179.95]], "keep_status": [false, false, false, false, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.05, 41.83, 33.43, 32.61, 0.0, 0.0, 28.59, 33.39], "audiomae_on_audioset": [null, null, null, null, [["speech", 61.87], ["radio", 6.5], ["hum", 5.06]], [["hum", 54.26], ["throbbing", 16.48], ["mains hum", 13.54]], [["music", 30.1], ["sound effect", 10.53], ["speech", 6.06]], [["speech", 31.79], ["music", 21.96], ["throbbing", 13.7]], null, null, [["music", 43.86], ["didgeridoo", 10.46], ["speech", 8.8]], [["speech", 64.56], ["music", 4.16], ["hum", 2.56]]], "duration": [0.37, 1.17, 0.48, 35.49, 2.18, 7.75, 22.72, 5.5, 39.42, 0.5, 15.21, 2.95]} \ No newline at end of file diff --git a/annotations_1/UCac6K5YWns_filtered.json b/annotations_1/UCac6K5YWns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b336771390aa97aeb50eaa384f2b17d36bc46d20 --- /dev/null +++ b/annotations_1/UCac6K5YWns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 27.7], [30.0, 32.29], [39.0, 39.8], [41.0, 41.55], [42.0, 45.89], [47.0, 47.85], [48.0, 47.88], [48.0, 48.93], [53.0, 59.1], [62.0, 62.29], [64.0, 66.56], [69.0, 69.97], [73.0, 74.31], [77.0, 77.23], [79.0, 80.03], [82.0, 121.29], [127.0, 128.28], [131.0, 131.01], [134.0, 135.85], [137.0, 139.62], [142.0, 142.65], [149.0, 171.32]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.16, 36.74, 0.0, 0.0, 43.53, 0.0, 0.0, 0.0, 29.3, 0.0, 94.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.01, 0.0, 78.04], "audiomae_on_audioset": [[["music", 45.53], ["speech", 15.37], ["explosion", 10.87]], [["music", 36.97], ["hum", 18.66], ["mains hum", 10.63]], null, null, [["music", 73.93], ["hum", 3.15], ["ambient music", 2.57]], null, null, null, [["music", 26.64], ["theremin", 19.16], ["hum", 15.11]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [22.7, 2.29, 0.8, 0.55, 3.89, 0.85, -0.12, 0.93, 6.1, 0.29, 2.56, 0.97, 1.31, 0.23, 1.03, 39.29, 1.28, 0.01, 1.85, 2.62, 0.65, 22.32]} \ No newline at end of file diff --git a/annotations_1/UDINZf4W4mw_filtered.json b/annotations_1/UDINZf4W4mw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9be885bdcb9836bb489a09ea3f2ebd1beb6945b --- /dev/null +++ b/annotations_1/UDINZf4W4mw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.34], [11.0, 11.75], [12.0, 12.78], [18.0, 21.69], [25.0, 24.92], [29.0, 29.2], [32.0, 32.73], [37.0, 39.09], [43.0, 42.85], [50.0, 56.64], [59.0, 59.71], [66.0, 66.43], [69.0, 69.57], [71.0, 84.35], [85.0, 92.74]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 45.59, 0.0, 30.21, 0.0, 0.0, 0.0, 31.18, 32.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 21.35], ["music", 12.89], ["fly, housefly", 5.27]], null, [["hum", 36.84], ["music", 8.64], ["mains hum", 8.35]], null, null, null, [["music", 48.68], ["hum", 9.86], ["mains hum", 3.16]], [["speech", 23.11], ["music", 21.3], ["hum", 12.03]]], "duration": [0.34, 0.75, 0.78, 3.69, -0.08, 0.2, 0.73, 2.09, -0.15, 6.64, 0.71, 0.43, 0.57, 13.35, 7.74]} \ No newline at end of file diff --git a/annotations_1/UDhWyFDDrUg_filtered.json b/annotations_1/UDhWyFDDrUg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a93d529f28ae2bfb8b15ff85256e2b9d9757521 --- /dev/null +++ b/annotations_1/UDhWyFDDrUg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.28], [4.0, 4.38], [7.0, 42.16], [47.0, 54.8], [60.0, 69.25], [73.0, 88.47], [89.0, 95.17], [98.0, 104.57], [105.0, 106.32], [109.0, 112.77], [114.0, 116.16], [116.0, 117.66], [120.0, 120.72], [122.0, 122.91], [124.0, 125.04], [127.0, 130.27], [131.0, 132.73], [137.0, 136.8], [138.0, 138.91], [141.0, 141.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.45, 31.72, 29.61, 39.44, 47.27, 0.0, 56.78, 50.51, 0.0, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 56.78], ["speech", 20.27], ["throbbing", 9.82]], [["hum", 31.04], ["music", 27.67], ["throbbing", 27.12]], [["music", 39.33], ["speech", 32.19], ["hum", 3.98]], [["music", 43.09], ["speech", 19.41], ["rumble", 8.87]], [["music", 69.21], ["scary music", 15.9], ["ambient music", 2.67]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 0.38, 35.16, 7.8, 9.25, 15.47, 6.17, 6.57, 1.32, 3.77, 2.16, 1.66, 0.72, 0.91, 1.04, 3.27, 1.73, -0.2, 0.91, 0.54]} \ No newline at end of file diff --git a/annotations_1/UDq-H6B36g8_filtered.json b/annotations_1/UDq-H6B36g8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23437bc01253c910615f0ba71b766fd6b35af561 --- /dev/null +++ b/annotations_1/UDq-H6B36g8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.52], [11.0, 13.53], [21.0, 21.79], [23.0, 24.29], [26.0, 40.31], [42.0, 48.59], [51.0, 51.97], [53.0, 53.91], [56.0, 57.48], [59.0, 59.37], [61.0, 61.2], [64.0, 64.1], [72.0, 73.04], [74.0, 74.97], [81.0, 81.77], [84.0, 84.37], [85.0, 85.82], [88.0, 89.8], [100.0, 100.31], [107.0, 107.67], [116.0, 116.55], [123.0, 124.24], [125.0, 126.39], [128.0, 129.88], [131.0, 131.89], [132.0, 133.79], [135.0, 135.72], [137.0, 138.4]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.45, 41.24, 0.0, 0.0, 33.03, 32.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 15.76], ["hum", 12.36], ["vehicle", 6.57]], [["throbbing", 23.91], ["music", 10.62], ["hum", 10.55]], null, null, [["music", 62.61], ["timpani", 7.85], ["throbbing", 4.78]], [["music", 54.68], ["theremin", 28.79], ["musical instrument", 2.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.52, 2.53, 0.79, 1.29, 14.31, 6.59, 0.97, 0.91, 1.48, 0.37, 0.2, 0.1, 1.04, 0.97, 0.77, 0.37, 0.82, 1.8, 0.31, 0.67, 0.55, 1.24, 1.39, 1.88, 0.89, 1.79, 0.72, 1.4]} \ No newline at end of file diff --git a/annotations_1/UECge-Vi8VA_filtered.json b/annotations_1/UECge-Vi8VA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94a42bbd2690e08fa0ff905703df03bd45058bad --- /dev/null +++ b/annotations_1/UECge-Vi8VA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.31], [19.0, 24.48], [26.0, 26.57], [29.0, 29.56], [30.0, 31.18], [33.0, 34.33], [35.0, 38.6], [40.0, 47.43], [56.0, 59.16], [61.0, 61.67], [62.0, 62.94], [67.0, 67.46], [75.0, 75.29], [81.0, 82.36], [85.0, 85.36], [91.0, 91.5], [94.0, 94.32], [104.0, 104.38], [106.0, 105.7], [108.0, 107.92], [111.0, 111.96], [117.0, 120.41], [122.0, 124.77], [131.0, 131.01], [134.0, 134.18], [139.0, 139.21], [156.0, 156.88], [158.0, 158.21], [158.0, 158.82], [165.0, 166.26], [167.0, 171.58], [172.0, 174.53], [175.0, 175.34], [181.0, 182.55], [188.0, 188.5], [195.0, 195.2], [210.0, 214.61], [217.0, 217.98]], "keep_status": [true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [31.48, 38.52, 0.0, 0.0, 0.0, 0.0, 37.18, 35.19, 35.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.09, 65.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.83, 42.42, 0.0, 0.0, 0.0, 0.0, 36.54, 0.0], "audiomae_on_audioset": [[["music", 32.78], ["sonar", 14.76], ["gong", 7.59]], [["speech", 64.23], ["music", 7.16], ["hum", 3.45]], null, null, null, null, [["beatboxing", 21.87], ["wail, moan", 21.06], ["speech", 10.7]], [["music", 31.71], ["chirp tone", 21.97], ["effects unit", 10.55]], [["music", 39.98], ["speech", 25.03], ["effects unit", 6.02]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.67], ["thunk", 6.82], ["sonar", 3.03]], [["speech", 47.71], ["hum", 8.84], ["busy signal", 6.38]], null, null, null, null, [["music", 69.63], ["synthesizer", 11.38], ["electronic music", 3.18]], null], "duration": [4.31, 5.48, 0.57, 0.56, 1.18, 1.33, 3.6, 7.43, 3.16, 0.67, 0.94, 0.46, 0.29, 1.36, 0.36, 0.5, 0.32, 0.38, -0.3, -0.08, 0.96, 3.41, 2.77, 0.01, 0.18, 0.21, 0.88, 0.21, 0.82, 1.26, 4.58, 2.53, 0.34, 1.55, 0.5, 0.2, 4.61, 0.98]} \ No newline at end of file diff --git a/annotations_1/UF2c01_glHU_filtered.json b/annotations_1/UF2c01_glHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b46b020d410bed004dc9f15cfd580abd1ebefeb5 --- /dev/null +++ b/annotations_1/UF2c01_glHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.48], [7.0, 8.68], [9.0, 10.77], [23.0, 22.89], [29.0, 29.74], [31.0, 31.16], [32.0, 33.39], [36.0, 36.27], [37.0, 37.98], [39.0, 41.03], [42.0, 52.98], [53.0, 56.05], [57.0, 58.6], [59.0, 67.54], [68.0, 71.69], [73.0, 74.01], [75.0, 75.24], [78.0, 79.74], [81.0, 85.95], [86.0, 86.64], [87.0, 90.22], [91.0, 92.04], [102.0, 144.14], [145.0, 154.45], [156.0, 164.96], [166.0, 168.22], [169.0, 170.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.7, 55.18, 49.36, 0.0, 38.27, 53.72, 0.0, 0.0, 0.0, 43.64, 0.0, 39.24, 0.0, 0.0, 38.37, 30.81, 52.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 18.79], ["speech", 17.39], ["music", 14.61]], null, [["music", 30.91], ["speech", 29.39], ["whimper", 12.44]], null, null, null, null, [["frog", 58.92], ["croak", 16.08], ["music", 6.05]], null, [["buzzer", 31.18], ["music", 12.56], ["fire alarm", 8.66]], null, null, [["hum", 56.51], ["mains hum", 22.45], ["buzz", 6.54]], [["livestock, farm animals, working animals", 40.62], ["cattle, bovinae", 15.36], ["music", 8.7]], null, null], "duration": [2.48, 1.68, 1.77, -0.11, 0.74, 0.16, 1.39, 0.27, 0.98, 2.03, 10.98, 3.05, 1.6, 8.54, 3.69, 1.01, 0.24, 1.74, 4.95, 0.64, 3.22, 1.04, 42.14, 9.45, 8.96, 2.22, 1.46]} \ No newline at end of file diff --git a/annotations_1/UFFWH8N9SLk_filtered.json b/annotations_1/UFFWH8N9SLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd1084159a9d1f436bc9c4e66a6a914baf0ea913 --- /dev/null +++ b/annotations_1/UFFWH8N9SLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.7], [7.0, 8.7], [9.0, 11.65], [13.0, 15.16], [17.0, 18.28], [20.0, 20.85], [22.0, 26.42], [29.0, 30.5], [32.0, 34.38], [39.0, 39.87], [42.0, 42.65], [44.0, 46.41], [50.0, 52.1], [54.0, 60.03], [61.0, 63.63], [65.0, 70.66], [77.0, 79.91], [86.0, 87.96], [90.0, 90.85], [95.0, 97.23], [99.0, 101.36], [104.0, 105.92], [109.0, 110.52], [113.0, 117.26], [122.0, 124.93], [128.0, 128.16], [131.0, 133.73], [137.0, 137.3], [141.0, 142.42], [151.0, 151.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 72.9, 98.19, 0.0, 0.0, 59.24, 0.0, 68.67, 0.0, 0.0, 81.71, 99.1, 99.82, 99.95, 82.61, 44.69, 0.0, 0.0, 55.74, 42.67, 0.0, 0.0, 41.87, 50.81, 0.0, 43.2, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.92], ["singing bowl", 8.54], ["vocal music", 4.39]], null, null, null, [["music", 47.2], ["singing bowl", 10.72], ["effects unit", 5.59]], null, null, [["music", 60.54], ["didgeridoo", 15.39], ["musical instrument", 5.12]], null, null, [["music", 50.55], ["didgeridoo", 24.82], ["effects unit", 3.51]], null, null, null], "duration": [0.7, 1.7, 2.65, 2.16, 1.28, 0.85, 4.42, 1.5, 2.38, 0.87, 0.65, 2.41, 2.1, 6.03, 2.63, 5.66, 2.91, 1.96, 0.85, 2.23, 2.36, 1.92, 1.52, 4.26, 2.93, 0.16, 2.73, 0.3, 1.42, 0.58]} \ No newline at end of file diff --git a/annotations_1/UFiKhV_Ay70_filtered.json b/annotations_1/UFiKhV_Ay70_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c296416c1001ea222448cdffd67733154d8ac1f --- /dev/null +++ b/annotations_1/UFiKhV_Ay70_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.99], [11.0, 12.66], [20.0, 20.61], [25.0, 25.71], [28.0, 28.95], [30.0, 31.36], [32.0, 33.51], [37.0, 37.93], [51.0, 52.14], [55.0, 58.45], [76.0, 76.13], [81.0, 82.8], [84.0, 88.99], [90.0, 100.16], [109.0, 116.45], [119.0, 120.41], [120.0, 120.46], [130.0, 131.67], [137.0, 137.13], [140.0, 141.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.44, 0.0, 0.0, 61.87, 94.37, 98.01, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.99, 1.66, 0.61, 0.71, 0.95, 1.36, 1.51, 0.93, 1.14, 3.45, 0.13, 1.8, 4.99, 10.16, 7.45, 1.41, 0.46, 1.67, 0.13, 1.17]} \ No newline at end of file diff --git a/annotations_1/UFo40MSG5Ss_filtered.json b/annotations_1/UFo40MSG5Ss_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0f7440bf89c3b10fd850d75a102534423ce1d90 --- /dev/null +++ b/annotations_1/UFo40MSG5Ss_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 24.8], [25.0, 29.61], [33.0, 81.75], [82.0, 115.8], [120.0, 121.47], [122.0, 123.25]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 33.19, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 62.68], ["didgeridoo", 13.91], ["musical instrument", 4.83]], null, null, null, null], "duration": [-0.2, 4.61, 48.75, 33.8, 1.47, 1.25]} \ No newline at end of file diff --git a/annotations_1/UFuxiZFwDPs_filtered.json b/annotations_1/UFuxiZFwDPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98f3ab198abaf5c2b6381738fc1a600a30119f20 --- /dev/null +++ b/annotations_1/UFuxiZFwDPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 27.11], [28.0, 29.62], [31.0, 33.08], [35.0, 41.57], [43.0, 43.92], [45.0, 51.78], [53.0, 53.84], [62.0, 63.32], [66.0, 67.14], [68.0, 76.6], [77.0, 83.56], [88.0, 89.29], [95.0, 97.83], [99.0, 100.62], [105.0, 106.14], [107.0, 108.63], [110.0, 116.23], [123.0, 125.36], [132.0, 142.92], [147.0, 150.03], [151.0, 151.31], [152.0, 157.08], [159.0, 161.27]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true, false, true, false, false, false, true, true, false, false, false, true, true], "silence_prob": [35.28, 0.0, 38.35, 36.91, 0.0, 40.54, 0.0, 0.0, 0.0, 41.44, 39.19, 0.0, 41.46, 0.0, 0.0, 0.0, 40.77, 42.98, 41.89, 42.79, 0.0, 42.42, 41.42], "audiomae_on_audioset": [[["hum", 38.43], ["mains hum", 31.42], ["music", 9.78]], null, [["hum", 45.89], ["mains hum", 17.66], ["throbbing", 9.31]], [["throbbing", 46.31], ["hum", 29.81], ["music", 4.58]], null, [["music", 26.73], ["throbbing", 8.25], ["heart sounds, heartbeat", 8.21]], null, null, null, [["hum", 30.67], ["music", 12.79], ["throbbing", 12.23]], [["whale vocalization", 46.12], ["hum", 14.1], ["speech", 9.37]], null, [["hum", 25.36], ["throbbing", 23.75], ["music", 12.33]], null, null, null, [["hum", 23.59], ["music", 19.25], ["throbbing", 12.3]], [["music", 33.32], ["hum", 13.37], ["mains hum", 7.39]], [["hum", 29.72], ["throbbing", 28.69], ["sidetone", 15.65]], [["hum", 46.57], ["mains hum", 27.84], ["throbbing", 12.72]], null, [["throbbing", 30.1], ["hum", 19.69], ["heart sounds, heartbeat", 8.62]], [["hum", 32.4], ["throbbing", 14.8], ["whale vocalization", 11.6]]], "duration": [26.11, 1.62, 2.08, 6.57, 0.92, 6.78, 0.84, 1.32, 1.14, 8.6, 6.56, 1.29, 2.83, 1.62, 1.14, 1.63, 6.23, 2.36, 10.92, 3.03, 0.31, 5.08, 2.27]} \ No newline at end of file diff --git a/annotations_1/UGfYt2Ufipw_filtered.json b/annotations_1/UGfYt2Ufipw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d17e361fb5f310e04de5b864ecc573ee8ca01865 --- /dev/null +++ b/annotations_1/UGfYt2Ufipw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.72], [4.0, 5.34], [7.0, 7.01], [7.0, 7.72], [9.0, 9.86], [24.0, 26.25], [27.0, 27.68], [32.0, 31.9], [33.0, 34.21], [37.0, 40.49], [46.0, 45.74], [47.0, 47.31], [48.0, 49.74], [54.0, 54.31], [64.0, 66.77], [72.0, 75.17], [76.0, 76.37], [77.0, 77.63], [78.0, 83.12], [84.0, 85.19]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.29, 0.0, 0.0, 0.0, 41.64, 0.0, 0.0, 0.0, 0.0, 37.77, 42.3, 0.0, 0.0, 40.01, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["animal", 24.92], ["dog", 9.59], ["speech", 8.06]], null, null, null, [["music", 26.19], ["frog", 12.56], ["boing", 7.16]], null, null, null, null, [["music", 37.91], ["speech", 15.3], ["sidetone", 2.42]], [["music", 52.61], ["bird", 4.32], ["bird vocalization, bird call, bird song", 3.56]], null, null, [["music", 65.8], ["synthesizer", 7.16], ["boing", 5.17]], null], "duration": [1.72, 1.34, 0.01, 0.72, 0.86, 2.25, 0.68, -0.1, 1.21, 3.49, -0.26, 0.31, 1.74, 0.31, 2.77, 3.17, 0.37, 0.63, 5.12, 1.19]} \ No newline at end of file diff --git a/annotations_1/UHaEsAcQQ6k_filtered.json b/annotations_1/UHaEsAcQQ6k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d4b13ac625dc5f0ab1f1701d4943605f188b3bc --- /dev/null +++ b/annotations_1/UHaEsAcQQ6k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.88], [13.0, 13.34], [17.0, 33.71], [42.0, 42.5], [49.0, 55.86], [56.0, 56.44], [57.0, 78.21], [82.0, 83.27], [88.0, 97.19], [114.0, 118.89], [120.0, 124.77], [128.0, 129.73]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [33.16, 0.0, 31.69, 0.0, 32.1, 0.0, 31.95, 0.0, 32.83, 35.2, 31.82, 0.0], "audiomae_on_audioset": [[["music", 54.26], ["musical instrument", 5.9], ["guitar", 4.76]], null, [["music", 70.15], ["synthesizer", 5.81], ["musical instrument", 3.39]], null, [["music", 55.25], ["speech", 26.11], ["sidetone", 7.29]], null, [["music", 47.36], ["speech", 27.66], ["musical instrument", 5.36]], null, [["music", 65.98], ["speech", 12.42], ["didgeridoo", 7.38]], [["music", 72.76], ["didgeridoo", 7.29], ["speech", 6.05]], [["music", 56.86], ["piano", 5.34], ["musical instrument", 5.15]], null], "duration": [8.88, 0.34, 16.71, 0.5, 6.86, 0.44, 21.21, 1.27, 9.19, 4.89, 4.77, 1.73]} \ No newline at end of file diff --git a/annotations_1/UIxwyNULzdk_filtered.json b/annotations_1/UIxwyNULzdk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..800174df0a3bdadfa088ba63269db605bf540975 --- /dev/null +++ b/annotations_1/UIxwyNULzdk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.71], [15.0, 20.26], [22.0, 23.36], [26.0, 26.92], [31.0, 33.44], [34.0, 35.14], [37.0, 37.5], [38.0, 39.04], [40.0, 40.64], [42.0, 43.24], [44.0, 46.65], [51.0, 51.76], [55.0, 55.78], [57.0, 56.84], [58.0, 58.41], [59.0, 75.32], [77.0, 77.94], [80.0, 83.27], [85.0, 89.55], [92.0, 99.69], [100.0, 102.68], [105.0, 105.88], [110.0, 117.54], [122.0, 131.9], [134.0, 141.3], [151.0, 155.43], [157.0, 171.42], [175.0, 175.61], [179.0, 179.39], [185.0, 201.04], [202.0, 207.94], [210.0, 218.15], [219.0, 220.24], [221.0, 221.75], [222.0, 222.79], [224.0, 223.99], [228.0, 228.01], [235.0, 235.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, true, false, true, false, true, false, false, false, false, true, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 53.28, 0.0, 0.0, 53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 48.61, 0.0, 0.0, 0.0, 0.0, 36.32, 0.0, 89.72, 96.29, 33.13, 35.04, 0.0, 32.55, 33.37, 32.38, 34.7, 33.06, 0.0, 0.0, 33.75, 30.83, 32.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 36.22], ["music", 18.89], ["synthesizer", 11.75]], null, null, null, null, [["music", 38.26], ["speech", 22.93], ["ambient music", 7.56]], null, null, null, [["music", 34.56], ["shofar", 33.49], ["wind instrument, woodwind instrument", 8.93]], [["music", 27.66], ["theremin", 25.43], ["ambient music", 8.16]], null, [["speech", 43.15], ["music", 15.12], ["civil defense siren", 2.53]], [["hum", 49.98], ["mains hum", 13.4], ["music", 10.84]], [["fly, housefly", 33.48], ["mosquito", 16.64], ["music", 9.42]], [["music", 40.68], ["throbbing", 29.66], ["hum", 12.2]], [["music", 69.2], ["speech", 4.51], ["throbbing", 2.83]], null, null, [["music", 30.01], ["theremin", 12.97], ["mosquito", 6.9]], [["speech", 39.1], ["vehicle", 10.65], ["music", 5.48]], [["music", 33.03], ["speech", 15.36], ["didgeridoo", 10.64]], null, null, null, null, null, null], "duration": [1.71, 5.26, 1.36, 0.92, 2.44, 1.14, 0.5, 1.04, 0.64, 1.24, 2.65, 0.76, 0.78, -0.16, 0.41, 16.32, 0.94, 3.27, 4.55, 7.69, 2.68, 0.88, 7.54, 9.9, 7.3, 4.43, 14.42, 0.61, 0.39, 16.04, 5.94, 8.15, 1.24, 0.75, 0.79, -0.01, 0.01, 0.38]} \ No newline at end of file diff --git a/annotations_1/UJQvNi4m4LM_filtered.json b/annotations_1/UJQvNi4m4LM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc03753527c48ded946011525dda1c6508b7b2da --- /dev/null +++ b/annotations_1/UJQvNi4m4LM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.76], [7.0, 8.56], [9.0, 10.45], [13.0, 15.38], [16.0, 17.14], [18.0, 19.4], [24.0, 24.95], [26.0, 35.23], [36.0, 37.86], [40.0, 42.45], [43.0, 43.77], [48.0, 49.84], [50.0, 52.15], [53.0, 54.48], [55.0, 55.59], [58.0, 58.82], [62.0, 63.83], [65.0, 66.18], [69.0, 73.43], [78.0, 79.93], [82.0, 87.27], [91.0, 91.42], [93.0, 94.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 99.84, 0.0, 99.76, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 0.0, 0.0, 84.25, 0.0, 95.37, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.76, 1.56, 1.45, 2.38, 1.14, 1.4, 0.95, 9.23, 1.86, 2.45, 0.77, 1.84, 2.15, 1.48, 0.59, 0.82, 1.83, 1.18, 4.43, 1.93, 5.27, 0.42, 1.36]} \ No newline at end of file diff --git a/annotations_1/UJ_zLBr1NxE_filtered.json b/annotations_1/UJ_zLBr1NxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..617e55b38098d08cf5801524d7e07faf0a250f53 --- /dev/null +++ b/annotations_1/UJ_zLBr1NxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.93], [4.0, 16.46], [18.0, 33.13], [34.0, 45.54], [55.0, 57.86], [62.0, 61.72], [63.0, 91.02], [92.0, 93.45], [96.0, 118.84], [119.0, 118.94], [119.0, 146.45], [147.0, 150.82], [151.0, 169.74]], "keep_status": [true, false, true, true, true, false, true, false, true, false, true, true, false], "silence_prob": [40.24, 30.68, 36.46, 29.06, 29.68, 0.0, 29.11, 0.0, 28.71, 0.0, 28.74, 29.38, 29.03], "audiomae_on_audioset": [[["music", 32.19], ["whale vocalization", 6.5], ["noise", 5.42]], [["speech", 58.69], ["music", 18.1], ["hum", 4.25]], [["hum", 13.98], ["rumble", 10.31], ["thunk", 8.74]], [["speech", 23.08], ["eruption", 15.44], ["explosion", 12.8]], [["speech", 27.34], ["music", 12.76], ["mains hum", 7.7]], null, [["speech", 32.63], ["music", 11.04], ["buzz", 8.82]], null, [["vehicle", 13.98], ["eruption", 9.27], ["livestock, farm animals, working animals", 4.39]], null, [["music", 48.15], ["boom", 10.24], ["speech", 5.99]], [["speech", 46.65], ["explosion", 7.84], ["eruption", 7.1]], [["music", 82.13], ["cacophony", 2.69], ["electronic music", 1.6]]], "duration": [2.93, 12.46, 15.13, 11.54, 2.86, -0.28, 28.02, 1.45, 22.84, -0.06, 27.45, 3.82, 18.74]} \ No newline at end of file diff --git a/annotations_1/UK-vT8iapA8_filtered.json b/annotations_1/UK-vT8iapA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..495401675729c5bdb00e8f7aac02633cf3a30669 --- /dev/null +++ b/annotations_1/UK-vT8iapA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.46], [2.0, 2.35], [2.0, 3.25], [6.0, 6.44], [12.0, 13.41], [23.0, 26.81], [31.0, 37.02], [41.0, 41.57], [46.0, 48.24], [49.0, 50.04], [52.0, 53.11], [59.0, 60.47], [64.0, 65.2], [71.0, 72.1], [73.0, 74.14], [79.0, 79.81], [82.0, 83.15], [84.0, 83.93], [88.0, 88.74], [92.0, 93.31], [96.0, 97.17], [99.0, 100.57], [112.0, 112.53], [115.0, 122.35], [124.0, 124.75], [126.0, 146.38], [149.0, 149.84], [159.0, 158.95], [164.0, 164.91], [166.0, 168.18]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.41, 33.38, 0.0, 38.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0, 0.0, 30.54, 0.0, 0.0, 0.0, 96.54], "audiomae_on_audioset": [null, null, null, null, null, [["music", 66.48], ["fart", 5.25], ["whip", 4.69]], [["music", 61.67], ["guitar", 2.38], ["plucked string instrument", 2.25]], null, [["music", 62.19], ["boing", 1.93], ["cattle, bovinae", 1.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.91], ["carnatic music", 9.04], ["fly, housefly", 4.25]], null, [["music", 48.8], ["speech", 29.49], ["hum", 2.77]], null, null, null, null], "duration": [0.46, 0.35, 1.25, 0.44, 1.41, 3.81, 6.02, 0.57, 2.24, 1.04, 1.11, 1.47, 1.2, 1.1, 1.14, 0.81, 1.15, -0.07, 0.74, 1.31, 1.17, 1.57, 0.53, 7.35, 0.75, 20.38, 0.84, -0.05, 0.91, 2.18]} \ No newline at end of file diff --git a/annotations_1/UK0wGi3JHrY_filtered.json b/annotations_1/UK0wGi3JHrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c5818acddbb40c0672ef50292f456c86c878f02 --- /dev/null +++ b/annotations_1/UK0wGi3JHrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.72], [8.0, 8.88], [18.0, 18.45], [20.0, 19.87], [21.0, 24.63], [26.0, 26.52], [27.0, 27.18], [29.0, 31.23], [35.0, 38.23], [40.0, 44.0], [54.0, 58.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 99.9, 99.95, 99.36, 94.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 0.88, 0.45, -0.13, 3.63, 0.52, 0.18, 2.23, 3.23, 4.0, 4.21]} \ No newline at end of file diff --git a/annotations_1/UN5YOny_U8g_filtered.json b/annotations_1/UN5YOny_U8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..170745a54b4c26cd901c856a322935e9e49ec069 --- /dev/null +++ b/annotations_1/UN5YOny_U8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [3.0, 7.3], [10.0, 10.47], [12.0, 12.72], [14.0, 14.13], [15.0, 16.46], [17.0, 18.13], [22.0, 22.05], [23.0, 23.48], [25.0, 26.97], [29.0, 29.54], [35.0, 37.35], [38.0, 39.18], [41.0, 43.12], [45.0, 45.74], [50.0, 51.17], [53.0, 53.74], [58.0, 58.26], [60.0, 61.45], [67.0, 67.15], [69.0, 69.45], [77.0, 77.87], [79.0, 79.88], [81.0, 81.43], [82.0, 85.5], [90.0, 91.18], [92.0, 93.21], [94.0, 94.47], [100.0, 101.87], [103.0, 103.76], [104.0, 104.43], [112.0, 112.8], [113.0, 115.72], [117.0, 120.43], [122.0, 124.26]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 44.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.99, 0.0, 44.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.9, 31.84, 30.92], "audiomae_on_audioset": [null, [["hum", 38.82], ["mains hum", 13.77], ["throbbing", 13.34]], null, null, null, null, null, null, null, null, null, [["music", 35.82], ["sidetone", 25.22], ["speech", 22.87]], null, [["sidetone", 18.83], ["whale vocalization", 18.25], ["music", 16.3]], null, null, null, null, null, null, null, null, null, null, [["speech", 19.39], ["livestock, farm animals, working animals", 14.05], ["cattle, bovinae", 13.67]], null, null, null, null, null, null, null, [["speech", 38.29], ["music", 24.8], ["didgeridoo", 7.51]], [["radio", 24.64], ["whale vocalization", 13.39], ["livestock, farm animals, working animals", 6.59]], [["radio", 18.04], ["livestock, farm animals, working animals", 13.32], ["animal", 9.89]]], "duration": [0.5, 4.3, 0.47, 0.72, 0.13, 1.46, 1.13, 0.05, 0.48, 1.97, 0.54, 2.35, 1.18, 2.12, 0.74, 1.17, 0.74, 0.26, 1.45, 0.15, 0.45, 0.87, 0.88, 0.43, 3.5, 1.18, 1.21, 0.47, 1.87, 0.76, 0.43, 0.8, 2.72, 3.43, 2.26]} \ No newline at end of file diff --git a/annotations_1/UNLFpS_xEZI_filtered.json b/annotations_1/UNLFpS_xEZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24e212ad03d3f170bd7f59da811dd8047efecc5a --- /dev/null +++ b/annotations_1/UNLFpS_xEZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.21], [26.0, 29.88], [32.0, 34.42], [36.0, 43.55], [49.0, 49.11], [51.0, 53.6], [55.0, 55.59], [56.0, 57.15], [62.0, 71.37], [72.0, 73.75], [74.0, 75.95], [77.0, 78.49], [79.0, 81.78], [83.0, 84.94], [85.0, 87.1], [88.0, 88.74]], "keep_status": [false, true, true, true, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 31.75, 32.12, 30.4, 0.0, 35.91, 0.0, 0.0, 54.76, 0.0, 0.0, 0.0, 62.47, 0.0, 48.82, 0.0], "audiomae_on_audioset": [null, [["music", 47.46], ["speech", 8.25], ["drum machine", 5.54]], [["music", 51.96], ["thunk", 6.67], ["boing", 4.85]], [["music", 57.55], ["boing", 6.28], ["speech", 6.01]], null, [["music", 20.72], ["speech", 16.69], ["throbbing", 10.41]], null, null, null, null, null, null, null, null, [["hum", 20.75], ["throbbing", 17.68], ["speech", 16.59]], null], "duration": [0.21, 3.88, 2.42, 7.55, 0.11, 2.6, 0.59, 1.15, 9.37, 1.75, 1.95, 1.49, 2.78, 1.94, 2.1, 0.74]} \ No newline at end of file diff --git a/annotations_1/UNYBtjHAuSA_filtered.json b/annotations_1/UNYBtjHAuSA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07d7b44fe8111732caebbcf459fa6bb3ed6e6eb4 --- /dev/null +++ b/annotations_1/UNYBtjHAuSA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.29], [6.0, 6.62], [9.0, 14.5], [16.0, 29.39], [31.0, 34.42], [36.0, 37.27], [39.0, 44.29], [47.0, 47.31], [49.0, 60.32], [64.0, 65.15], [67.0, 68.18], [71.0, 71.68]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 46.12, 39.44, 38.37, 0.0, 48.27, 0.0, 38.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["mains hum", 33.04], ["music", 19.58], ["hum", 17.6]], [["music", 68.31], ["musical instrument", 5.05], ["theremin", 3.49]], [["music", 69.14], ["musical instrument", 6.21], ["theremin", 5.53]], null, [["music", 51.09], ["wind instrument, woodwind instrument", 5.56], ["clarinet", 5.53]], null, [["music", 41.87], ["theremin", 32.76], ["hum", 5.22]], null, null, null], "duration": [1.29, 0.62, 5.5, 13.39, 3.42, 1.27, 5.29, 0.31, 11.32, 1.15, 1.18, 0.68]} \ No newline at end of file diff --git a/annotations_1/UP6UWl1Y1-Q_filtered.json b/annotations_1/UP6UWl1Y1-Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6899c1b4d8023a5f17412689d38f1a941442f508 --- /dev/null +++ b/annotations_1/UP6UWl1Y1-Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.86], [5.0, 6.42], [7.0, 10.89], [12.0, 13.46], [14.0, 14.69], [19.0, 20.68], [23.0, 23.97], [26.0, 26.7], [29.0, 31.4], [34.0, 35.61], [38.0, 39.8], [42.0, 43.71], [47.0, 49.65], [53.0, 54.41], [55.0, 55.83], [56.0, 58.06], [60.0, 60.69], [66.0, 65.96], [73.0, 73.31], [77.0, 78.44], [80.0, 81.8], [85.0, 86.32], [88.0, 89.87], [92.0, 92.21], [96.0, 96.4], [100.0, 101.44], [104.0, 104.38], [105.0, 107.92], [108.0, 111.55], [114.0, 115.23], [116.0, 118.03], [119.0, 120.31], [121.0, 124.23], [132.0, 133.66], [135.0, 135.99], [138.0, 139.11], [140.0, 140.98], [146.0, 148.64], [150.0, 150.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 0.0, 0.0, 54.43, 0.0, 0.0, 0.0, 91.13, 0.0, 0.0, 63.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37, 74.29, 0.0, 84.98, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 50.06, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 1.42, 3.89, 1.46, 0.69, 1.68, 0.97, 0.7, 2.4, 1.61, 1.8, 1.71, 2.65, 1.41, 0.83, 2.06, 0.69, -0.04, 0.31, 1.44, 1.8, 1.32, 1.87, 0.21, 0.4, 1.44, 0.38, 2.92, 3.55, 1.23, 2.03, 1.31, 3.23, 1.66, 0.99, 1.11, 0.98, 2.64, 0.16]} \ No newline at end of file diff --git a/annotations_1/UPAs32xduAM_filtered.json b/annotations_1/UPAs32xduAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6d82e2618a61661e1ad69f317ac04ba4eeb70a5 --- /dev/null +++ b/annotations_1/UPAs32xduAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.52], [15.0, 15.42], [20.0, 20.71], [22.0, 23.01], [28.0, 29.42], [31.0, 31.95], [36.0, 36.63], [38.0, 38.15], [42.0, 47.31], [47.0, 47.34], [49.0, 63.24], [65.0, 76.44], [77.0, 83.62], [85.0, 88.16], [91.0, 91.27], [92.0, 93.73], [95.0, 96.65], [98.0, 99.2], [99.0, 101.87], [103.0, 105.11], [106.0, 107.96], [109.0, 113.51], [114.0, 117.24], [118.0, 120.07], [123.0, 125.27], [126.0, 129.52], [131.0, 133.2]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, true, true, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.56, 0.0, 44.72, 48.06, 41.26, 43.2, 0.0, 0.0, 0.0, 0.0, 44.99, 60.51, 0.0, 54.1, 59.86, 52.05, 50.31, 41.54, 40.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 48.67], ["speech", 5.87], ["didgeridoo", 3.89]], null, [["music", 58.12], ["didgeridoo", 11.92], ["musical instrument", 8.85]], [["music", 34.11], ["fly, housefly", 15.92], ["mosquito", 13.7]], [["speech", 40.69], ["music", 13.53], ["hum", 7.8]], [["music", 45.26], ["didgeridoo", 5.99], ["effects unit", 4.92]], null, null, null, null, [["music", 39.13], ["speech", 12.43], ["musical instrument", 11.83]], null, null, null, null, null, null, [["speech", 65.59], ["sidetone", 15.7], ["music", 5.95]], [["speech", 35.4], ["music", 20.29], ["didgeridoo", 4.8]]], "duration": [1.52, 0.42, 0.71, 1.01, 1.42, 0.95, 0.63, 0.15, 5.31, 0.34, 14.24, 11.44, 6.62, 3.16, 0.27, 1.73, 1.65, 1.2, 2.87, 2.11, 1.96, 4.51, 3.24, 2.07, 2.27, 3.52, 2.2]} \ No newline at end of file diff --git a/annotations_1/UPIr8vb7OeI_filtered.json b/annotations_1/UPIr8vb7OeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..431c346e65f76dd12097a62e5285af8875968961 --- /dev/null +++ b/annotations_1/UPIr8vb7OeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.78], [17.0, 17.12], [18.0, 19.85], [21.0, 20.78], [27.0, 27.26], [28.0, 30.0], [32.0, 34.8], [42.0, 42.06], [46.0, 46.31], [50.0, 52.74], [53.0, 54.55], [56.0, 56.15], [57.0, 57.94], [60.0, 59.9], [65.0, 65.48], [66.0, 66.39], [75.0, 75.32], [82.0, 82.32], [84.0, 84.47], [88.0, 89.21], [90.0, 90.91], [91.0, 94.12], [96.0, 96.09], [104.0, 104.62], [105.0, 108.94], [114.0, 115.3], [117.0, 118.13], [119.0, 122.57], [124.0, 124.7], [126.0, 126.71], [129.0, 137.46], [139.0, 138.87], [140.0, 144.81], [147.0, 147.28], [153.0, 153.27], [154.0, 155.92], [160.0, 160.57], [163.0, 165.23], [173.0, 175.19], [184.0, 184.3], [188.0, 188.64], [192.0, 192.94]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [50.41, 0.0, 0.0, 0.0, 0.0, 57.01, 85.35, 0.0, 0.0, 35.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.65, 0.0, 0.0, 34.68, 0.0, 0.0, 33.17, 0.0, 0.0, 32.73, 0.0, 33.39, 0.0, 0.0, 0.0, 0.0, 33.22, 73.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 28.66], ["didgeridoo", 23.26], ["speech", 12.94]], null, null, null, null, null, null, null, null, null, null, null, [["music", 58.13], ["musical instrument", 6.82], ["theremin", 3.81]], null, null, [["music", 51.34], ["speech", 21.64], ["didgeridoo", 5.21]], null, null, [["music", 30.78], ["foghorn", 12.82], ["theremin", 11.45]], null, null, [["music", 64.87], ["didgeridoo", 5.97], ["musical instrument", 4.08]], null, [["music", 41.04], ["synthesizer", 16.15], ["musical instrument", 7.38]], null, null, null, null, [["music", 36.28], ["synthesizer", 6.96], ["electronic music", 6.53]], null, null, null, null], "duration": [2.78, 0.12, 1.85, -0.22, 0.26, 2.0, 2.8, 0.06, 0.31, 2.74, 1.55, 0.15, 0.94, -0.1, 0.48, 0.39, 0.32, 0.32, 0.47, 1.21, 0.91, 3.12, 0.09, 0.62, 3.94, 1.3, 1.13, 3.57, 0.7, 0.71, 8.46, -0.13, 4.81, 0.28, 0.27, 1.92, 0.57, 2.23, 2.19, 0.3, 0.64, 0.94]} \ No newline at end of file diff --git a/annotations_1/UPhZaK9jxYs_filtered.json b/annotations_1/UPhZaK9jxYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a805b72166123051c257a92930693accf4d88f11 --- /dev/null +++ b/annotations_1/UPhZaK9jxYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.02], [10.0, 10.71], [11.0, 24.95], [30.0, 49.76], [51.0, 52.39], [54.0, 61.25], [64.0, 64.23], [65.0, 65.64], [66.0, 66.55], [67.0, 67.64], [73.0, 75.41], [76.0, 77.48], [80.0, 80.96], [85.0, 86.27], [87.0, 86.8], [87.0, 89.8], [94.0, 94.24], [95.0, 99.67], [101.0, 102.79], [104.0, 105.44], [107.0, 108.5], [111.0, 114.25], [116.0, 123.77], [127.0, 130.13], [131.0, 136.36], [138.0, 140.09], [142.0, 152.44]], "keep_status": [true, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.72, 0.0, 45.3, 55.67, 0.0, 46.19, 0.0, 0.0, 0.0, 0.0, 46.9, 0.0, 0.0, 0.0, 0.0, 67.63, 0.0, 70.02, 0.0, 0.0, 0.0, 60.79, 87.74, 94.81, 34.78, 89.19, 42.98], "audiomae_on_audioset": [[["speech", 45.66], ["hum", 10.76], ["mains hum", 6.56]], null, [["fly, housefly", 23.35], ["insect", 12.69], ["animal", 8.02]], null, null, [["speech", 24.5], ["bouncing", 12.27], ["hum", 9.99]], null, null, null, null, [["speech", 53.47], ["hum", 6.5], ["inside, small room", 5.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.21], ["glass", 9.69], ["breaking", 7.55]], null, [["music", 70.86], ["theremin", 3.95], ["musical instrument", 3.11]]], "duration": [3.02, 0.71, 13.95, 19.76, 1.39, 7.25, 0.23, 0.64, 0.55, 0.64, 2.41, 1.48, 0.96, 1.27, -0.2, 2.8, 0.24, 4.67, 1.79, 1.44, 1.5, 3.25, 7.77, 3.13, 5.36, 2.09, 10.44]} \ No newline at end of file diff --git a/annotations_1/UQ15FRltlsY_filtered.json b/annotations_1/UQ15FRltlsY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0d0811006902d3c8a1657c5157ffa79f54fc9cb --- /dev/null +++ b/annotations_1/UQ15FRltlsY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.91], [13.0, 14.22], [15.0, 15.97], [19.0, 19.38], [20.0, 20.78], [24.0, 24.29], [25.0, 25.24], [30.0, 31.14], [32.0, 35.63], [37.0, 37.23], [38.0, 42.84], [44.0, 46.3], [51.0, 53.06], [55.0, 55.75], [56.0, 58.67], [59.0, 59.91], [65.0, 66.12], [69.0, 69.74], [70.0, 70.83], [73.0, 75.73], [77.0, 77.84], [91.0, 92.35], [100.0, 101.33], [102.0, 102.64], [104.0, 104.87], [105.0, 106.98], [108.0, 108.95], [110.0, 111.13], [112.0, 116.73], [118.0, 121.17], [122.0, 129.25], [132.0, 136.58], [137.0, 138.38], [140.0, 140.24], [141.0, 141.56], [143.0, 143.73], [145.0, 148.69], [149.0, 151.09], [153.0, 157.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 99.82, 97.64, 51.66, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.13, 69.74, 99.99, 99.52, 0.0, 0.0, 0.0, 0.0, 98.1, 42.46, 87.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.18], ["music", 15.05], ["mains hum", 6.61]], null], "duration": [-0.09, 1.22, 0.97, 0.38, 0.78, 0.29, 0.24, 1.14, 3.63, 0.23, 4.84, 2.3, 2.06, 0.75, 2.67, 0.91, 1.12, 0.74, 0.83, 2.73, 0.84, 1.35, 1.33, 0.64, 0.87, 1.98, 0.95, 1.13, 4.73, 3.17, 7.25, 4.58, 1.38, 0.24, 0.56, 0.73, 3.69, 2.09, 4.44]} \ No newline at end of file diff --git a/annotations_1/UQes95Ouciw_filtered.json b/annotations_1/UQes95Ouciw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7de111a968727ce1e2e5dc206947732fd50564c --- /dev/null +++ b/annotations_1/UQes95Ouciw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 37.44], [39.0, 45.27], [46.0, 45.64], [46.0, 50.48], [52.0, 54.89], [57.0, 58.92], [62.0, 63.36], [69.0, 72.47], [74.0, 78.54], [79.0, 84.91], [87.0, 93.46], [94.0, 98.51], [100.0, 108.45], [110.0, 122.49], [123.0, 133.95], [136.0, 137.62], [138.0, 154.11], [154.0, 155.7], [156.0, 159.27], [160.0, 162.95], [164.0, 164.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.59, 72.46, 0.0, 75.55, 75.55, 0.0, 0.0, 85.9, 72.9, 78.55, 89.01, 55.04, 71.14, 73.82, 88.28, 0.0, 40.64, 0.0, 55.81, 86.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 41.18], ["speech", 30.32], ["mains hum", 7.28]], null, null, null, null], "duration": [3.44, 6.27, -0.36, 4.48, 2.89, 1.92, 1.36, 3.47, 4.54, 5.91, 6.46, 4.51, 8.45, 12.49, 10.95, 1.62, 16.11, 1.7, 3.27, 2.95, 0.62]} \ No newline at end of file diff --git a/annotations_1/UQmQ7d-wXQE_filtered.json b/annotations_1/UQmQ7d-wXQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4fd429bd4b2f44fb45da967f37d1370a8a2891f --- /dev/null +++ b/annotations_1/UQmQ7d-wXQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.85], [17.0, 57.77], [60.0, 60.25], [63.0, 72.91], [79.0, 79.39], [82.0, 82.85]], "keep_status": [false, false, false, false, false, false], "silence_prob": [43.1, 0.0, 0.0, 52.1, 0.0, 0.0], "audiomae_on_audioset": [[["theremin", 45.93], ["music", 29.41], ["musical instrument", 2.76]], null, null, null, null, null], "duration": [5.85, 40.77, 0.25, 9.91, 0.39, 0.85]} \ No newline at end of file diff --git a/annotations_1/URDzGjLruJU_filtered.json b/annotations_1/URDzGjLruJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b97035058d9af633c9b05931b181eb31cfc3415a --- /dev/null +++ b/annotations_1/URDzGjLruJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.07], [14.0, 15.94], [16.0, 16.6], [17.0, 41.22], [42.0, 44.32], [46.0, 46.3], [47.0, 47.82], [48.0, 80.38], [84.0, 101.6], [103.0, 108.04], [110.0, 125.46], [126.0, 126.23], [127.0, 133.64], [138.0, 139.58]], "keep_status": [false, false, false, false, false, false, false, false, true, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 31.97, 32.53, 0.0, 0.0, 0.0, 34.02, 37.17, 31.18, 0.0, 31.13, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 57.57], ["theremin", 17.08], ["musical instrument", 3.3]], [["music", 43.47], ["theremin", 17.39], ["speech", 10.47]], null, null, null, [["music", 36.79], ["theremin", 16.43], ["hum", 8.07]], [["music", 44.43], ["theremin", 13.48], ["musical instrument", 6.45]], [["music", 39.82], ["cello", 14.81], ["double bass", 10.42]], null, [["music", 52.27], ["theremin", 13.15], ["musical instrument", 3.97]], null], "duration": [0.07, 1.94, 0.6, 24.22, 2.32, 0.3, 0.82, 32.38, 17.6, 5.04, 15.46, 0.23, 6.64, 1.58]} \ No newline at end of file diff --git a/annotations_1/USWXF1XW2zo_filtered.json b/annotations_1/USWXF1XW2zo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60b2a180447f9fc33ccf9c87ac4dc83b7ffa5268 --- /dev/null +++ b/annotations_1/USWXF1XW2zo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.66], [26.0, 26.69], [28.0, 28.81], [30.0, 31.02], [41.0, 41.59], [42.0, 42.77], [45.0, 45.37], [48.0, 48.3], [50.0, 51.09], [52.0, 52.88], [60.0, 61.82], [67.0, 67.42], [70.0, 70.29], [86.0, 86.9], [88.0, 88.79], [92.0, 92.03], [97.0, 97.29], [98.0, 99.1], [102.0, 102.44], [106.0, 106.29], [122.0, 121.81], [124.0, 125.29], [127.0, 127.43], [127.0, 127.47], [133.0, 133.27], [135.0, 135.55], [138.0, 139.67], [141.0, 142.26], [144.0, 144.75], [147.0, 147.53], [149.0, 150.08], [154.0, 153.84], [156.0, 156.74], [160.0, 160.51], [161.0, 160.76], [163.0, 163.8], [167.0, 168.24], [170.0, 172.32], [172.0, 172.57], [175.0, 175.9], [183.0, 184.62], [187.0, 187.68], [191.0, 192.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.59, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.43], ["music", 9.42], ["ice cream truck, ice cream van", 3.67]], null, null, null, null, null], "duration": [0.66, 0.69, 0.81, 1.02, 0.59, 0.77, 0.37, 0.3, 1.09, 0.88, 1.82, 0.42, 0.29, 0.9, 0.79, 0.03, 0.29, 1.1, 0.44, 0.29, -0.19, 1.29, 0.43, 0.47, 0.27, 0.55, 1.67, 1.26, 0.75, 0.53, 1.08, -0.16, 0.74, 0.51, -0.24, 0.8, 1.24, 2.32, 0.57, 0.9, 1.62, 0.68, 1.3]} \ No newline at end of file diff --git a/annotations_1/UUAQ3T09_os_filtered.json b/annotations_1/UUAQ3T09_os_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..604f98dd253b3cc04d4f6786853a6c95e7f32018 --- /dev/null +++ b/annotations_1/UUAQ3T09_os_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.96], [6.0, 6.51], [12.0, 12.16], [14.0, 14.12], [15.0, 15.9], [17.0, 18.2], [19.0, 19.48], [27.0, 26.94], [31.0, 31.51], [33.0, 35.92], [37.0, 50.7], [51.0, 51.95], [53.0, 63.44], [68.0, 68.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 30.39, 0.0, 39.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 65.2], ["music", 20.16], ["whack, thwack", 2.43]], null, [["speech", 57.27], ["music", 13.47], ["sidetone", 4.3]], null], "duration": [-0.04, 0.51, 0.16, 0.12, 0.9, 1.2, 0.48, -0.06, 0.51, 2.92, 13.7, 0.95, 10.44, 0.79]} \ No newline at end of file diff --git a/annotations_1/UVDRpF027l0_filtered.json b/annotations_1/UVDRpF027l0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02e1724a21aaff1f4bb31fadf25bd744587d8414 --- /dev/null +++ b/annotations_1/UVDRpF027l0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 37.25], [41.0, 52.07], [52.0, 60.05], [61.0, 62.06], [63.0, 71.56], [75.0, 120.93], [124.0, 151.46], [161.0, 171.56], [178.0, 181.03], [185.0, 195.17]], "keep_status": [false, true, false, false, false, false, true, true, true, false], "silence_prob": [32.0, 32.09, 32.82, 0.0, 30.91, 0.0, 30.73, 30.67, 32.17, 32.09], "audiomae_on_audioset": [[["music", 73.49], ["speech", 3.44], ["throbbing", 2.98]], [["music", 58.49], ["synthesizer", 4.58], ["keyboard (musical)", 2.68]], [["music", 75.51], ["synthesizer", 3.16], ["singing", 2.09]], null, [["fly, housefly", 48.79], ["mosquito", 37.03], ["insect", 12.43]], null, [["music", 38.16], ["breaking", 8.85], ["whack, thwack", 6.79]], [["music", 50.0], ["groan", 6.07], ["outside, rural or natural", 5.61]], [["music", 36.02], ["speech", 24.04], ["hum", 9.57]], [["music", 47.27], ["speech", 25.4], ["foghorn", 6.12]]], "duration": [8.25, 11.07, 8.05, 1.06, 8.56, 45.93, 27.46, 10.56, 3.03, 10.17]} \ No newline at end of file diff --git a/annotations_1/UVOJk8TFwpQ_filtered.json b/annotations_1/UVOJk8TFwpQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0c37d9d43659e4146cfc8b36a1e39a733341c5a --- /dev/null +++ b/annotations_1/UVOJk8TFwpQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.11], [7.0, 7.25], [9.0, 9.34], [16.0, 25.32], [29.0, 29.57], [31.0, 31.14], [32.0, 32.98], [42.0, 42.47], [46.0, 46.74], [58.0, 58.73], [63.0, 63.9], [70.0, 70.83], [77.0, 77.6], [96.0, 96.5], [112.0, 112.95], [123.0, 123.25], [127.0, 127.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 63.51], ["musical instrument", 8.31], ["cacophony", 3.37]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.11, 0.25, 0.34, 9.32, 0.57, 0.14, 0.98, 0.47, 0.74, 0.73, 0.9, 0.83, 0.6, 0.5, 0.95, 0.25, 0.45]} \ No newline at end of file diff --git a/annotations_1/UVXRswx8I8g_filtered.json b/annotations_1/UVXRswx8I8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d1fc9e00514d359a63c3af6a1116193777880a6 --- /dev/null +++ b/annotations_1/UVXRswx8I8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.24], [16.0, 16.78], [21.0, 22.89], [30.0, 34.01], [40.0, 40.41], [42.0, 42.9], [44.0, 44.27], [47.0, 47.51], [50.0, 52.3], [62.0, 64.03], [71.0, 72.15], [73.0, 73.87], [98.0, 98.69], [105.0, 105.83], [108.0, 109.34], [112.0, 113.19], [116.0, 121.12], [128.0, 135.99], [143.0, 147.01]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 30.69, 0.0, 0.0, 0.0, 0.0, 32.9, 35.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.48, 35.57, 37.76], "audiomae_on_audioset": [null, null, null, [["speech", 65.81], ["applause", 20.75], ["crowd", 2.62]], null, null, null, null, [["applause", 23.62], ["speech", 17.09], ["crowd", 12.04]], [["music", 37.3], ["speech", 21.04], ["guitar", 4.34]], null, null, null, null, null, null, [["applause", 26.23], ["music", 20.34], ["musical instrument", 4.53]], [["music", 53.93], ["guitar", 9.99], ["musical instrument", 9.59]], [["music", 47.97], ["musical instrument", 7.17], ["bass guitar", 6.95]]], "duration": [1.24, 0.78, 1.89, 4.01, 0.41, 0.9, 0.27, 0.51, 2.3, 2.03, 1.15, 0.87, 0.69, 0.83, 1.34, 1.19, 5.12, 7.99, 4.01]} \ No newline at end of file diff --git a/annotations_1/UWS3FOpdFMU_filtered.json b/annotations_1/UWS3FOpdFMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c93a74ae754235d6c148f9f676a270354ad6c43 --- /dev/null +++ b/annotations_1/UWS3FOpdFMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 49.45]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.45]} \ No newline at end of file diff --git a/annotations_1/UWlxRKXD6sY_filtered.json b/annotations_1/UWlxRKXD6sY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ed06f6fae21dc55e0cf55952d0a6bca4300a611 --- /dev/null +++ b/annotations_1/UWlxRKXD6sY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.59], [14.0, 16.34], [46.0, 46.3], [56.0, 56.71], [69.0, 69.82], [71.0, 72.05], [83.0, 87.0], [89.0, 90.88], [92.0, 94.12], [95.0, 96.9], [109.0, 109.39], [114.0, 114.2], [119.0, 119.35], [122.0, 123.96], [136.0, 136.8], [144.0, 145.17], [147.0, 148.68], [154.0, 155.78], [159.0, 159.17], [159.0, 162.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 53.53, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.26], ["speech", 13.11], ["mains hum", 5.42]]], "duration": [0.59, 2.34, 0.3, 0.71, 0.82, 1.05, 4.0, 1.88, 2.12, 1.9, 0.39, 0.2, 0.35, 1.96, 0.8, 1.17, 1.68, 1.78, 0.17, 3.36]} \ No newline at end of file diff --git a/annotations_1/UWtFueVeqHc_filtered.json b/annotations_1/UWtFueVeqHc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10aa11a439947f4240b80559b6c0d6d8451b492a --- /dev/null +++ b/annotations_1/UWtFueVeqHc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.5], [5.0, 44.54], [48.0, 72.03], [73.0, 120.24], [120.0, 128.02], [130.0, 130.96], [132.0, 136.59], [137.0, 138.89], [141.0, 142.11], [144.0, 144.64], [146.0, 148.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 89.72, 0.0, 64.29, 0.0, 68.02, 0.0, 0.0, 0.0, 77.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.5, 39.54, 24.03, 47.24, 8.02, 0.96, 4.59, 1.89, 1.11, 0.64, 2.37]} \ No newline at end of file diff --git a/annotations_1/UX1-VvE01iw_filtered.json b/annotations_1/UX1-VvE01iw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f34e9b8fa346e6a672d61ea884427aca03c8d6a --- /dev/null +++ b/annotations_1/UX1-VvE01iw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[89.0, 90.49], [91.0, 92.91], [94.0, 162.43], [164.0, 172.88], [173.0, 174.46], [178.0, 178.95]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 50.56], ["noise", 10.61], ["hum", 10.43]], null, null], "duration": [1.49, 1.91, 68.43, 8.88, 1.46, 0.95]} \ No newline at end of file diff --git a/annotations_1/UXldWskFeFY_filtered.json b/annotations_1/UXldWskFeFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03354354ca482d8f38e3d4d8d3d1a8931a439381 --- /dev/null +++ b/annotations_1/UXldWskFeFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 25.34], [28.0, 76.82], [77.0, 77.6], [78.0, 82.75], [83.0, 98.02], [115.0, 144.66], [154.0, 155.31], [166.0, 168.59], [174.0, 176.99], [180.0, 180.89], [186.0, 193.19], [193.0, 207.5], [212.0, 213.26], [215.0, 214.98], [221.0, 224.75], [239.0, 239.41], [241.0, 241.84], [243.0, 249.07], [250.0, 256.83], [258.0, 259.31], [262.0, 262.8], [268.0, 268.64], [279.0, 283.32], [285.0, 287.34]], "keep_status": [false, false, false, false, true, true, false, true, true, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [41.68, 0.0, 0.0, 46.33, 48.95, 30.68, 0.0, 30.81, 30.66, 0.0, 32.43, 50.36, 0.0, 0.0, 87.74, 0.0, 0.0, 45.46, 33.83, 0.0, 0.0, 0.0, 36.47, 35.93], "audiomae_on_audioset": [[["music", 44.86], ["hum", 13.59], ["ambient music", 12.02]], null, null, [["music", 55.46], ["synthesizer", 22.88], ["musical instrument", 2.86]], [["music", 43.54], ["throbbing", 18.38], ["hum", 5.85]], [["music", 45.05], ["hum", 9.64], ["throbbing", 8.75]], null, [["music", 33.79], ["hum", 5.2], ["electronic music", 4.54]], [["music", 42.23], ["quack", 13.41], ["didgeridoo", 10.44]], null, [["music", 52.18], ["synthesizer", 11.76], ["hum", 5.25]], null, null, null, null, null, null, [["music", 23.0], ["speech", 7.9], ["synthesizer", 7.76]], [["music", 35.51], ["boing", 17.71], ["wind instrument, woodwind instrument", 9.35]], null, null, null, [["mosquito", 63.23], ["fly, housefly", 14.85], ["insect", 7.25]], [["music", 68.55], ["speech", 10.25], ["quack", 5.67]]], "duration": [17.34, 48.82, 0.6, 4.75, 15.02, 29.66, 1.31, 2.59, 2.99, 0.89, 7.19, 14.5, 1.26, -0.02, 3.75, 0.41, 0.84, 6.07, 6.83, 1.31, 0.8, 0.64, 4.32, 2.34]} \ No newline at end of file diff --git a/annotations_1/UY0nYr-dXEI_filtered.json b/annotations_1/UY0nYr-dXEI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc042c4b0ac6430eed1d69453cc72c9cf9db22db --- /dev/null +++ b/annotations_1/UY0nYr-dXEI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.55], [5.0, 6.45], [7.0, 8.67], [9.0, 10.17], [10.0, 10.91], [12.0, 16.09], [19.0, 20.16], [21.0, 21.78], [23.0, 25.66], [27.0, 28.16], [32.0, 32.43], [33.0, 35.06], [36.0, 37.27], [40.0, 39.95], [41.0, 42.13], [43.0, 44.0], [45.0, 45.69], [46.0, 47.26], [50.0, 50.79], [51.0, 109.78], [116.0, 117.83], [119.0, 121.37], [123.0, 123.13], [131.0, 134.37], [135.0, 134.97], [137.0, 137.86], [141.0, 141.24], [151.0, 151.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 0.0, 100.0, 0.0, 0.0, 79.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.8, 0.0, 34.7, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 82.76], ["speech synthesizer", 6.0], ["grunt", 2.53]], null, null, null, null], "duration": [0.55, 1.45, 1.67, 1.17, 0.91, 4.09, 1.16, 0.78, 2.66, 1.16, 0.43, 2.06, 1.27, -0.05, 1.13, 1.0, 0.69, 1.26, 0.79, 58.78, 1.83, 2.37, 0.13, 3.37, -0.03, 0.86, 0.24, 0.77]} \ No newline at end of file diff --git a/annotations_1/UYYIYehBS_s_filtered.json b/annotations_1/UYYIYehBS_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4376f272b2298c38537fbbe155c6a5bc6b699e42 --- /dev/null +++ b/annotations_1/UYYIYehBS_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.14], [29.0, 29.3], [32.0, 32.56], [35.0, 42.8], [49.0, 49.0], [51.0, 55.95], [64.0, 68.54], [88.0, 99.64], [104.0, 107.28], [110.0, 113.12], [114.0, 114.54], [120.0, 128.36], [130.0, 130.11]], "keep_status": [false, false, false, true, false, true, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 48.44, 0.0, 45.33, 46.22, 46.86, 93.6, 90.43, 0.0, 78.04, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 36.08], ["trombone", 19.32], ["brass instrument", 12.53]], null, [["music", 61.44], ["speech", 3.28], ["brass instrument", 2.14]], [["music", 41.99], ["speech", 15.77], ["trombone", 8.5]], [["music", 22.39], ["moo", 18.37], ["cattle, bovinae", 14.68]], null, null, null, null, null], "duration": [1.14, 0.3, 0.56, 7.8, 0.0, 4.95, 4.54, 11.64, 3.28, 3.12, 0.54, 8.36, 0.11]} \ No newline at end of file diff --git a/annotations_1/UZ2IjJCsxxo_filtered.json b/annotations_1/UZ2IjJCsxxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b2b08c4b9bd4e527291247fb2dbba1d91b37d00 --- /dev/null +++ b/annotations_1/UZ2IjJCsxxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.64], [12.0, 13.37], [22.0, 22.22], [31.0, 36.27], [37.0, 53.0], [55.0, 60.4], [63.0, 63.41], [73.0, 75.34], [78.0, 79.0], [81.0, 83.0], [86.0, 93.83], [99.0, 99.79], [102.0, 110.4], [111.0, 111.6], [112.0, 112.29], [113.0, 113.39], [114.0, 125.25], [127.0, 129.39]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false, false, true, false, false, false, true, false], "silence_prob": [86.09, 0.0, 0.0, 34.08, 33.62, 34.85, 0.0, 31.71, 0.0, 36.18, 38.05, 0.0, 34.1, 0.0, 0.0, 0.0, 33.69, 38.55], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 32.19], ["mosquito", 17.95], ["insect", 14.08]], [["music", 34.19], ["animal", 12.9], ["domestic animals, pets", 4.99]], [["music", 74.79], ["smash, crash", 4.39], ["theremin", 2.14]], null, [["music", 39.63], ["speech", 21.95], ["cattle, bovinae", 6.12]], null, [["sheep", 33.66], ["speech", 27.43], ["bleat", 18.56]], [["fly, housefly", 72.35], ["mosquito", 13.94], ["insect", 8.83]], null, [["speech", 49.05], ["music", 10.41], ["clip-clop", 5.85]], null, null, null, [["cattle, bovinae", 19.64], ["moo", 17.14], ["livestock, farm animals, working animals", 17.06]], [["fly, housefly", 41.9], ["mosquito", 39.32], ["insect", 13.85]]], "duration": [2.64, 1.37, 0.22, 5.27, 16.0, 5.4, 0.41, 2.34, 1.0, 2.0, 7.83, 0.79, 8.4, 0.6, 0.29, 0.39, 11.25, 2.39]} \ No newline at end of file diff --git a/annotations_1/UZnkAElIe_c_filtered.json b/annotations_1/UZnkAElIe_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94d1413cfd43f4145e0c4436312341c76e6ce535 --- /dev/null +++ b/annotations_1/UZnkAElIe_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [6.0, 6.47], [8.0, 9.09], [15.0, 15.2], [19.0, 31.63]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.13], "audiomae_on_audioset": [null, null, null, null, [["throbbing", 32.76], ["hum", 30.54], ["music", 27.37]]], "duration": [0.72, 0.47, 1.09, 0.2, 12.63]} \ No newline at end of file diff --git a/annotations_1/U_MNiopwFxs_filtered.json b/annotations_1/U_MNiopwFxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b7599f906410a685ff0260a018543c06078d6f9 --- /dev/null +++ b/annotations_1/U_MNiopwFxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.58], [6.0, 9.15], [10.0, 11.91], [12.0, 14.22], [19.0, 19.55], [21.0, 23.4], [25.0, 26.18], [27.0, 28.31], [34.0, 34.52], [38.0, 39.28], [42.0, 44.44], [48.0, 48.57], [49.0, 61.77], [67.0, 68.89], [74.0, 75.12], [78.0, 78.43], [82.0, 107.92], [110.0, 111.69], [114.0, 117.04]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 35.71, 0.0, 43.05, 0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 88.83, 0.0, 30.41, 0.0, 0.0, 0.0, 29.89, 0.0, 34.36], "audiomae_on_audioset": [null, [["rumble", 11.22], ["throbbing", 9.04], ["music", 8.41]], null, [["speech", 40.4], ["music", 14.25], ["musical instrument", 3.22]], null, null, null, null, null, null, null, null, [["music", 66.2], ["throbbing", 9.03], ["electronic music", 5.8]], null, null, null, [["throbbing", 30.25], ["music", 26.6], ["speech", 12.77]], null, [["music", 23.64], ["gong", 19.49], ["timpani", 10.13]]], "duration": [0.58, 3.15, 1.91, 2.22, 0.55, 2.4, 1.18, 1.31, 0.52, 1.28, 2.44, 0.57, 12.77, 1.89, 1.12, 0.43, 25.92, 1.69, 3.04]} \ No newline at end of file diff --git a/annotations_1/Ua4pj7Sxy-8_filtered.json b/annotations_1/Ua4pj7Sxy-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a6ec532151c1512eef60c68eefc270c539baeb0 --- /dev/null +++ b/annotations_1/Ua4pj7Sxy-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.44], [19.0, 19.57], [21.0, 21.88], [27.0, 27.77], [29.0, 29.34], [32.0, 32.46], [35.0, 35.38], [40.0, 40.41], [45.0, 47.43], [52.0, 52.79], [63.0, 63.75], [69.0, 70.16], [71.0, 73.4], [76.0, 75.98], [78.0, 80.0], [83.0, 85.51], [94.0, 95.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 0.0, 94.52, 0.0, 76.7, 72.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 0.57, 0.88, 0.77, 0.34, 0.46, 0.38, 0.41, 2.43, 0.79, 0.75, 1.16, 2.4, -0.02, 2.0, 2.51, 1.2]} \ No newline at end of file diff --git a/annotations_1/UayJYYeMANA_filtered.json b/annotations_1/UayJYYeMANA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39b7a5c52cfb597cca9770c29e52b7b0cc206891 --- /dev/null +++ b/annotations_1/UayJYYeMANA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.05], [10.0, 10.81], [13.0, 16.04], [21.0, 23.85], [27.0, 28.22], [29.0, 29.94], [33.0, 33.08], [37.0, 37.2], [39.0, 40.24], [42.0, 53.99], [54.0, 54.5], [55.0, 55.11], [60.0, 60.51], [62.0, 66.16], [67.0, 68.15], [70.0, 71.36], [73.0, 83.07], [84.0, 85.33], [87.0, 94.32]], "keep_status": [false, false, true, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [37.44, 0.0, 31.28, 37.19, 0.0, 0.0, 0.0, 0.0, 0.0, 35.51, 0.0, 0.0, 0.0, 55.53, 0.0, 0.0, 37.59, 0.0, 34.34], "audiomae_on_audioset": [[["throbbing", 31.76], ["hum", 20.6], ["speech", 20.04]], null, [["music", 42.95], ["speech", 9.92], ["cacophony", 4.04]], [["trombone", 24.73], ["music", 22.19], ["foghorn", 20.58]], null, null, null, null, null, [["music", 32.89], ["speech", 17.07], ["throbbing", 5.24]], null, null, null, null, null, null, [["music", 32.05], ["fly, housefly", 29.03], ["insect", 7.21]], null, [["music", 41.29], ["throbbing", 22.13], ["speech", 18.82]]], "duration": [4.05, 0.81, 3.04, 2.85, 1.22, 0.94, 0.08, 0.2, 1.24, 11.99, 0.5, 0.11, 0.51, 4.16, 1.15, 1.36, 10.07, 1.33, 7.32]} \ No newline at end of file diff --git a/annotations_1/Ub88RPZnHQM_filtered.json b/annotations_1/Ub88RPZnHQM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29575dd2165a5de2d5134455c5856f9a7e663a3a --- /dev/null +++ b/annotations_1/Ub88RPZnHQM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.69], [4.0, 5.46], [6.0, 6.47], [11.0, 17.0], [20.0, 20.78], [22.0, 21.9], [26.0, 26.91], [32.0, 32.44], [34.0, 34.55], [36.0, 41.66], [45.0, 45.62], [49.0, 49.57], [59.0, 60.34], [61.0, 62.41], [65.0, 68.01], [70.0, 71.14], [76.0, 76.35], [80.0, 81.19], [82.0, 84.38], [85.0, 85.73], [87.0, 89.61], [91.0, 91.72], [93.0, 95.62], [97.0, 99.23], [100.0, 108.09], [108.0, 110.51], [114.0, 114.89], [117.0, 117.91], [119.0, 119.31], [119.0, 119.62], [120.0, 120.45], [125.0, 125.1], [127.0, 127.65], [130.0, 131.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 97.73, 0.0, 99.85, 0.0, 92.15, 60.89, 73.67, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.31, 1.46, 0.47, 6.0, 0.78, -0.1, 0.91, 0.44, 0.55, 5.66, 0.62, 0.57, 1.34, 1.41, 3.01, 1.14, 0.35, 1.19, 2.38, 0.73, 2.61, 0.72, 2.62, 2.23, 8.09, 2.51, 0.89, 0.91, 0.31, 0.62, 0.45, 0.1, 0.65, 1.06]} \ No newline at end of file diff --git a/annotations_1/Ubb88WMrdmo_filtered.json b/annotations_1/Ubb88WMrdmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21a2a5b3e6b74251543e711411b13fb83ad6ecbf --- /dev/null +++ b/annotations_1/Ubb88WMrdmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.12], [14.0, 14.82], [17.0, 17.58], [21.0, 20.87], [28.0, 28.93], [40.0, 41.96], [44.0, 44.0], [47.0, 54.9], [60.0, 73.38], [75.0, 75.61], [77.0, 78.38], [78.0, 80.06], [82.0, 83.47], [86.0, 88.43], [90.0, 90.27], [91.0, 90.66], [98.0, 100.03], [102.0, 102.19], [104.0, 106.34], [107.0, 138.6], [142.0, 142.37], [142.0, 152.31], [161.0, 160.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.19, 41.16, 0.0, 0.0, 59.51, 0.0, 54.76, 0.0, 0.0, 69.34, 0.0, 65.55, 0.0, 0.0, 29.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["cattle, bovinae", 42.83], ["moo", 37.43], ["livestock, farm animals, working animals", 19.64]], [["moo", 27.17], ["cattle, bovinae", 24.83], ["livestock, farm animals, working animals", 24.6]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 16.34], ["speech", 14.97], ["gunshot, gunfire", 8.07]], null], "duration": [0.12, 0.82, 0.58, -0.13, 0.93, 1.96, 0.0, 7.9, 13.38, 0.61, 1.38, 2.06, 1.47, 2.43, 0.27, -0.34, 2.03, 0.19, 2.34, 31.6, 0.37, 10.31, -0.21]} \ No newline at end of file diff --git a/annotations_1/UbwxGgR-EAM_filtered.json b/annotations_1/UbwxGgR-EAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1b3cbba209ce6b3fcf324d857b840fb81827eb4 --- /dev/null +++ b/annotations_1/UbwxGgR-EAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.81], [15.0, 14.76], [18.0, 18.67], [25.0, 25.47], [29.0, 29.74], [35.0, 35.95], [40.0, 39.66], [49.0, 50.57], [51.0, 52.08], [55.0, 55.12], [58.0, 58.01], [65.0, 66.26], [69.0, 69.15], [76.0, 77.3], [86.0, 88.6], [91.0, 92.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, -0.24, 0.67, 0.47, 0.74, 0.95, -0.34, 1.57, 1.08, 0.12, 0.01, 1.26, 0.15, 1.3, 2.6, 1.25]} \ No newline at end of file diff --git a/annotations_1/Uc--n6RoIgw_filtered.json b/annotations_1/Uc--n6RoIgw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38c0381a880dd69f3fc71fd002c25b6a39cf3d0d --- /dev/null +++ b/annotations_1/Uc--n6RoIgw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.0], [4.0, 4.78], [5.0, 5.48], [7.0, 10.17], [15.0, 15.97], [17.0, 18.99], [21.0, 22.17], [23.0, 39.83], [41.0, 41.81], [43.0, 53.94], [57.0, 57.62], [58.0, 60.27], [63.0, 63.71], [65.0, 91.05], [93.0, 94.93], [95.0, 95.03], [97.0, 99.5], [102.0, 137.71], [139.0, 140.14], [142.0, 143.48], [148.0, 148.44], [151.0, 152.42], [153.0, 154.03], [156.0, 156.3], [158.0, 158.72], [163.0, 174.5], [177.0, 176.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.01, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 41.58, 0.0, 43.93, 0.0, 40.5, 0.0, 31.95, 0.0, 0.0, 28.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.6, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 41.68], ["theremin", 26.79], ["musical instrument", 9.02]], null, [["music", 49.58], ["musical instrument", 13.15], ["tabla", 7.76]], null, [["music", 65.72], ["keyboard (musical)", 3.48], ["musical instrument", 2.92]], null, [["mains hum", 30.02], ["music", 18.14], ["hum", 18.03]], null, null, [["music", 34.07], ["breaking", 12.18], ["didgeridoo", 10.08]], null, null, null, null, null, null, null, null, [["music", 40.49], ["speech", 24.57], ["didgeridoo", 5.91]], null], "duration": [2.0, 0.78, 0.48, 3.17, 0.97, 1.99, 1.17, 16.83, 0.81, 10.94, 0.62, 2.27, 0.71, 26.05, 1.93, 0.03, 2.5, 35.71, 1.14, 1.48, 0.44, 1.42, 1.03, 0.3, 0.72, 11.5, -0.06]} \ No newline at end of file diff --git a/annotations_1/UciEIYZ-Eos_filtered.json b/annotations_1/UciEIYZ-Eos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5937e9304b5258d0c4b61b08387d5f93b4124c84 --- /dev/null +++ b/annotations_1/UciEIYZ-Eos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.27], [10.0, 10.98], [12.0, 16.61], [24.0, 28.32], [31.0, 32.98], [35.0, 36.83], [41.0, 44.91], [56.0, 57.96], [60.0, 61.28], [69.0, 69.63], [79.0, 82.9], [84.0, 86.85], [91.0, 93.45], [94.0, 100.89], [107.0, 107.74], [110.0, 124.9], [160.0, 163.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 73.21, 66.51, 0.0, 0.0, 41.24, 0.0, 0.0, 0.0, 50.41, 49.0, 51.18, 36.93, 0.0, 36.27, 30.35], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 62.33], ["pulse", 8.42], ["throbbing", 2.07]], null, null, null, null, [["music", 64.82], ["boing", 22.85], ["musical instrument", 2.2]], null, [["music", 36.79], ["fly, housefly", 17.72], ["speech", 6.89]], null, [["music", 61.23], ["theremin", 11.74], ["synthesizer", 5.56]], [["music", 46.64], ["moo", 7.78], ["cattle, bovinae", 5.58]]], "duration": [0.27, 0.98, 4.61, 4.32, 1.98, 1.83, 3.91, 1.96, 1.28, 0.63, 3.9, 2.85, 2.45, 6.89, 0.74, 14.9, 3.68]} \ No newline at end of file diff --git a/annotations_1/UeV6eAtHp0M_filtered.json b/annotations_1/UeV6eAtHp0M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63735001682ba086149d5f4cd85323c8df8b2577 --- /dev/null +++ b/annotations_1/UeV6eAtHp0M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.33], [21.0, 20.85], [24.0, 25.57], [27.0, 29.59], [33.0, 35.4], [39.0, 40.51], [42.0, 48.17], [49.0, 50.6], [53.0, 56.27], [58.0, 58.31], [60.0, 60.24], [62.0, 62.83], [63.0, 69.63], [72.0, 72.05], [76.0, 78.17], [81.0, 85.18], [88.0, 89.63], [91.0, 95.03], [100.0, 99.96], [102.0, 104.28], [105.0, 105.73], [107.0, 109.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.85, 99.96, 0.0, 83.88, 0.0, 98.51, 0.0, 0.0, 0.0, 98.66, 0.0, 99.36, 97.33, 0.0, 100.0, 0.0, 97.22, 0.0, 98.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, -0.15, 1.57, 2.59, 2.4, 1.51, 6.17, 1.6, 3.27, 0.31, 0.24, 0.83, 6.63, 0.05, 2.17, 4.18, 1.63, 4.03, -0.04, 2.28, 0.73, 2.05]} \ No newline at end of file diff --git a/annotations_1/UeeK-Fgup9w_filtered.json b/annotations_1/UeeK-Fgup9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e15cbb47c41a8486acad9d429330165aca7d2e6 --- /dev/null +++ b/annotations_1/UeeK-Fgup9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.34], [14.0, 14.44], [15.0, 17.93], [20.0, 44.78], [48.0, 78.87], [80.0, 95.28], [97.0, 125.47], [127.0, 147.72], [157.0, 157.74], [163.0, 165.2]], "keep_status": [false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 33.84, 29.28, 0.0, 30.86, 31.1, 33.56, 0.0, 40.7], "audiomae_on_audioset": [null, null, [["music", 31.45], ["hum", 20.3], ["mains hum", 7.28]], [["hum", 34.62], ["throbbing", 28.1], ["music", 22.64]], null, [["hum", 37.91], ["music", 24.26], ["throbbing", 17.15]], [["hum", 49.11], ["throbbing", 26.09], ["music", 15.81]], [["hum", 33.13], ["music", 24.34], ["mains hum", 12.69]], null, [["throbbing", 25.89], ["hum", 19.06], ["music", 7.49]]], "duration": [0.34, 0.44, 2.93, 24.78, 30.87, 15.28, 28.47, 20.72, 0.74, 2.2]} \ No newline at end of file diff --git a/annotations_1/UepHO767tO8_filtered.json b/annotations_1/UepHO767tO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04b231f2cf9061cc84e331c7ab12013d130180f1 --- /dev/null +++ b/annotations_1/UepHO767tO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 80.54], [81.0, 82.71], [85.0, 86.54], [87.0, 96.45], [102.0, 124.28], [125.0, 188.05]], "keep_status": [false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 31.88, 31.81, 0.0], "audiomae_on_audioset": [null, null, null, [["cowbell", 22.34], ["speech", 17.42], ["livestock, farm animals, working animals", 17.05]], [["music", 17.22], ["hum", 11.62], ["whack, thwack", 9.69]], null], "duration": [78.54, 1.71, 1.54, 9.45, 22.28, 63.05]} \ No newline at end of file diff --git a/annotations_1/Ueq8bUwdm80_filtered.json b/annotations_1/Ueq8bUwdm80_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20f90c283408dca301cb3e285c59a6344b899cb0 --- /dev/null +++ b/annotations_1/Ueq8bUwdm80_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.16], [25.0, 35.46], [36.0, 37.56], [40.0, 40.0], [41.0, 41.45], [45.0, 45.6], [49.0, 49.62], [51.0, 50.85], [56.0, 57.0], [60.0, 62.55], [69.0, 69.28], [71.0, 71.09], [74.0, 75.1], [83.0, 83.83], [86.0, 88.8], [96.0, 98.64], [100.0, 100.25], [100.0, 104.7], [107.0, 107.69], [112.0, 113.58], [118.0, 119.55], [121.0, 124.07], [129.0, 133.08], [136.0, 137.15], [137.0, 138.28], [139.0, 140.22], [146.0, 147.95], [151.0, 151.5], [153.0, 153.23], [160.0, 160.66], [162.0, 196.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 100.0, 40.36, 0.0, 50.36, 0.0, 0.0, 0.0, 31.57, 35.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 36.55], ["music", 28.09], ["theremin", 4.48]], null, null, null, null, null, [["fly, housefly", 24.88], ["whale vocalization", 16.21], ["insect", 12.93]], [["music", 33.14], ["fart", 26.44], ["boing", 13.55]], null, null, null, null, null, null, null, null], "duration": [1.16, 10.46, 1.56, 0.0, 0.45, 0.6, 0.62, -0.15, 1.0, 2.55, 0.28, 0.09, 1.1, 0.83, 2.8, 2.64, 0.25, 4.7, 0.69, 1.58, 1.55, 3.07, 4.08, 1.15, 1.28, 1.22, 1.95, 0.5, 0.23, 0.66, 34.52]} \ No newline at end of file diff --git a/annotations_1/UfoHq1-vpss_filtered.json b/annotations_1/UfoHq1-vpss_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f21c6064758ab7ac0eafce49e18c180d895f1f0e --- /dev/null +++ b/annotations_1/UfoHq1-vpss_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [7.0, 9.0], [15.0, 16.36], [18.0, 18.66], [21.0, 21.15], [32.0, 32.95], [35.0, 36.26], [52.0, 55.11], [56.0, 56.24], [62.0, 62.9], [65.0, 66.24], [87.0, 88.91], [90.0, 91.44], [96.0, 96.21], [97.0, 97.95], [100.0, 101.38], [102.0, 104.03], [116.0, 119.15], [120.0, 120.63], [130.0, 129.96], [158.0, 158.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 77.7, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19, 88.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 2.0, 1.36, 0.66, 0.15, 0.95, 1.26, 3.11, 0.24, 0.9, 1.24, 1.91, 1.44, 0.21, 0.95, 1.38, 2.03, 3.15, 0.63, -0.04, 0.84]} \ No newline at end of file diff --git a/annotations_1/Ufv54teYXAw_filtered.json b/annotations_1/Ufv54teYXAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d09fc80b473d734ddab963cfa59f431c9f634b0 --- /dev/null +++ b/annotations_1/Ufv54teYXAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.25], [5.0, 4.85], [6.0, 6.62], [10.0, 10.12], [12.0, 15.96], [17.0, 17.63]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.19, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.25, -0.15, 0.62, 0.12, 3.96, 0.63]} \ No newline at end of file diff --git a/annotations_1/Ug6yhGuDcUQ_filtered.json b/annotations_1/Ug6yhGuDcUQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2b3d9aeae409ab388887e18d8bd192b529253e6 --- /dev/null +++ b/annotations_1/Ug6yhGuDcUQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.5], [15.0, 17.69], [21.0, 26.77], [29.0, 29.94], [30.0, 41.07], [42.0, 43.92], [45.0, 45.62], [47.0, 48.29], [50.0, 51.66], [56.0, 65.72], [67.0, 72.47], [76.0, 112.5], [118.0, 122.66], [123.0, 124.29], [126.0, 128.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.96, 64.52, 0.0, 39.27, 0.0, 0.0, 0.0, 0.0, 90.43, 66.51, 0.0, 39.31, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 40.74], ["speech", 29.75], ["music", 8.02]], null, null, null, null, null, null, null, [["moo", 52.36], ["cattle, bovinae", 35.03], ["livestock, farm animals, working animals", 9.18]], null, null], "duration": [1.5, 2.69, 5.77, 0.94, 11.07, 1.92, 0.62, 1.29, 1.66, 9.72, 5.47, 36.5, 4.66, 1.29, 2.44]} \ No newline at end of file diff --git a/annotations_1/UgSVWM44JBE_filtered.json b/annotations_1/UgSVWM44JBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b9d47ca7fc32eb7288ee57adbedef11b7d5a8ee --- /dev/null +++ b/annotations_1/UgSVWM44JBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.16], [8.0, 9.51], [12.0, 12.65], [18.0, 18.17], [37.0, 36.88], [43.0, 51.14], [54.0, 54.58], [57.0, 57.52], [58.0, 57.75], [62.0, 62.18], [63.0, 64.49], [68.0, 69.13], [76.0, 76.44], [80.0, 91.83], [92.0, 103.98], [111.0, 112.21], [113.0, 114.52], [116.0, 117.71], [123.0, 123.99], [125.0, 125.69], [135.0, 134.87], [137.0, 136.83], [144.0, 144.64], [149.0, 150.3], [154.0, 154.68], [155.0, 157.32], [159.0, 161.69], [164.0, 165.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.17, 41.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.16, 83.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.97], ["throbbing", 5.69], ["scary music", 2.18]], [["speech", 34.39], ["hum", 13.46], ["sonar", 10.0]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 1.51, 0.65, 0.17, -0.12, 8.14, 0.58, 0.52, -0.25, 0.18, 1.49, 1.13, 0.44, 11.83, 11.98, 1.21, 1.52, 1.71, 0.99, 0.69, -0.13, -0.17, 0.64, 1.3, 0.68, 2.32, 2.69, 1.54]} \ No newline at end of file diff --git a/annotations_1/UgiK8333Np0_filtered.json b/annotations_1/UgiK8333Np0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..920e055e9eff13c83a42bc10e1cc7b684a31659d --- /dev/null +++ b/annotations_1/UgiK8333Np0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.9], [5.0, 5.61], [12.0, 15.28], [22.0, 28.21], [29.0, 36.56], [39.0, 40.19], [42.0, 42.99], [43.0, 53.59], [60.0, 71.88], [73.0, 88.72], [96.0, 96.74], [97.0, 99.64]], "keep_status": [false, false, true, true, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 33.28, 33.25, 32.66, 0.0, 0.0, 34.74, 38.47, 47.16, 0.0, 45.85], "audiomae_on_audioset": [null, null, [["music", 16.96], ["sheep", 12.3], ["livestock, farm animals, working animals", 10.97]], [["music", 37.79], ["speech", 16.78], ["fly, housefly", 8.22]], [["speech", 26.15], ["sidetone", 21.49], ["music", 19.09]], null, null, [["music", 54.48], ["speech", 34.13], ["boing", 1.32]], [["music", 35.54], ["gong", 13.77], ["synthesizer", 11.32]], [["theremin", 56.83], ["music", 21.36], ["boing", 5.14]], null, [["speech", 67.43], ["boing", 9.66], ["music", 5.28]]], "duration": [0.9, 0.61, 3.28, 6.21, 7.56, 1.19, 0.99, 10.59, 11.88, 15.72, 0.74, 2.64]} \ No newline at end of file diff --git a/annotations_1/UglfLjHUNbU_filtered.json b/annotations_1/UglfLjHUNbU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43949100f63dd21e925a8c6b4274df4df3cde9da --- /dev/null +++ b/annotations_1/UglfLjHUNbU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [5.0, 45.32], [47.0, 50.09], [55.0, 59.48], [60.0, 98.61]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 63.64, 52.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.5, 40.32, 3.09, 4.48, 38.61]} \ No newline at end of file diff --git a/annotations_1/UgtSRZHvyWY_filtered.json b/annotations_1/UgtSRZHvyWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7d7d6b8b8d8b5110d0f2f4a963112633af730b9 --- /dev/null +++ b/annotations_1/UgtSRZHvyWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 45.15], [46.0, 46.77], [50.0, 51.16], [54.0, 54.67], [60.0, 64.0], [65.0, 67.05], [69.0, 70.71], [71.0, 72.25], [73.0, 100.38], [102.0, 115.08]], "keep_status": [true, false, false, false, false, false, false, false, true, false], "silence_prob": [46.43, 0.0, 0.0, 0.0, 63.42, 76.04, 0.0, 0.0, 38.59, 61.18], "audiomae_on_audioset": [[["speech", 26.16], ["insect", 9.55], ["fly, housefly", 7.71]], null, null, null, null, null, null, null, [["hum", 33.84], ["throbbing", 20.14], ["heart sounds, heartbeat", 8.95]], null], "duration": [11.15, 0.77, 1.16, 0.67, 4.0, 2.05, 1.71, 1.25, 27.38, 13.08]} \ No newline at end of file diff --git a/annotations_1/UhL24j9G3tc_filtered.json b/annotations_1/UhL24j9G3tc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41753f53abc6985fff588c354cfcb2a007e83cef --- /dev/null +++ b/annotations_1/UhL24j9G3tc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.31], [16.0, 17.22], [19.0, 19.47], [23.0, 24.81], [28.0, 30.43], [33.0, 34.86], [35.0, 35.5], [36.0, 36.95], [37.0, 37.56], [41.0, 44.42], [48.0, 51.11], [53.0, 54.85], [58.0, 58.24], [60.0, 60.57], [62.0, 63.53], [65.0, 68.49], [69.0, 68.71], [69.0, 70.85], [71.0, 77.77], [85.0, 87.71], [90.0, 96.47], [100.0, 100.82], [114.0, 114.42], [116.0, 116.31], [127.0, 128.24], [157.0, 158.08]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, true, true, false, false, false, false, false], "silence_prob": [40.88, 0.0, 0.0, 0.0, 33.2, 0.0, 0.0, 0.0, 0.0, 41.42, 38.35, 0.0, 0.0, 0.0, 0.0, 43.71, 0.0, 0.0, 41.78, 33.57, 34.12, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 31.74], ["synthesizer", 14.94], ["boing", 9.27]], null, null, null, [["music", 35.12], ["boing", 28.31], ["speech", 10.75]], null, null, null, null, [["music", 49.18], ["boing", 5.08], ["music for children", 4.46]], [["boing", 47.92], ["music", 27.02], ["music for children", 5.0]], null, null, null, null, [["music", 55.05], ["boing", 8.69], ["musical instrument", 2.36]], null, null, [["music", 31.26], ["speech", 15.59], ["music for children", 8.09]], [["grunt", 32.9], ["music", 24.07], ["pig", 7.71]], [["livestock, farm animals, working animals", 24.48], ["music", 18.87], ["cattle, bovinae", 12.38]], null, null, null, null, null], "duration": [3.31, 1.22, 0.47, 1.81, 2.43, 1.86, 0.5, 0.95, 0.56, 3.42, 3.11, 1.85, 0.24, 0.57, 1.53, 3.49, -0.29, 1.85, 6.77, 2.71, 6.47, 0.82, 0.42, 0.31, 1.24, 1.08]} \ No newline at end of file diff --git a/annotations_1/UiQdZRBhBAE_filtered.json b/annotations_1/UiQdZRBhBAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..120001ebe47f03464a281ca143b455f636ff9c92 --- /dev/null +++ b/annotations_1/UiQdZRBhBAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 19.3], [26.0, 25.91], [28.0, 29.3], [30.0, 30.94], [33.0, 34.43], [36.0, 37.84], [39.0, 42.23], [43.0, 54.14], [55.0, 56.49], [59.0, 107.89], [110.0, 112.4], [112.0, 112.43], [114.0, 113.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 95.09, 0.0, 0.0, 74.92, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [18.3, -0.09, 1.3, 0.94, 1.43, 1.84, 3.23, 11.14, 1.49, 48.89, 2.4, 0.43, -0.02]} \ No newline at end of file diff --git a/annotations_1/UinILaRACDA_filtered.json b/annotations_1/UinILaRACDA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9dfc443f4fbbdb28098f8e6a484d1dfbf2ef08d7 --- /dev/null +++ b/annotations_1/UinILaRACDA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.41], [17.0, 18.64], [20.0, 20.49], [22.0, 22.5], [24.0, 28.54], [29.0, 29.91], [35.0, 51.16], [52.0, 52.68], [54.0, 53.97], [55.0, 55.46], [59.0, 80.1], [81.0, 82.44], [83.0, 83.71], [88.0, 89.73], [91.0, 97.34], [98.0, 100.16], [101.0, 101.76], [103.0, 103.91], [105.0, 106.12], [108.0, 108.33], [115.0, 118.34], [119.0, 124.7], [128.0, 130.62], [132.0, 133.47], [134.0, 135.06], [137.0, 138.25], [139.0, 139.31], [140.0, 140.22], [142.0, 142.25], [144.0, 144.8], [157.0, 157.6], [162.0, 163.75], [165.0, 166.68], [167.0, 169.13], [171.0, 173.5], [183.0, 182.93], [184.0, 185.31], [186.0, 188.64], [189.0, 190.24], [191.0, 192.48]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.63, 0.0, 0.0, 0.0, 37.72, 0.0, 35.65, 0.0, 0.0, 0.0, 37.65, 0.0, 0.0, 0.0, 99.98, 70.58, 0.0, 0.0, 0.0, 0.0, 99.95, 59.33, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 88.83, 0.0, 0.0, 73.06, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 41.14], ["synthesizer", 7.77], ["didgeridoo", 5.34]], null, [["music", 73.22], ["electronic music", 5.94], ["ambient music", 4.59]], null, null, null, [["speech", 48.14], ["music", 21.66], ["hum", 6.91]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.41, 1.64, 0.49, 0.5, 4.54, 0.91, 16.16, 0.68, -0.03, 0.46, 21.1, 1.44, 0.71, 1.73, 6.34, 2.16, 0.76, 0.91, 1.12, 0.33, 3.34, 5.7, 2.62, 1.47, 1.06, 1.25, 0.31, 0.22, 0.25, 0.8, 0.6, 1.75, 1.68, 2.13, 2.5, -0.07, 1.31, 2.64, 1.24, 1.48]} \ No newline at end of file diff --git a/annotations_1/Uiqk92r4luQ_filtered.json b/annotations_1/Uiqk92r4luQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf8fb1226071f254e078aa9015a8c5e82926549f --- /dev/null +++ b/annotations_1/Uiqk92r4luQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.58], [16.0, 40.53], [44.0, 44.58], [48.0, 48.32], [50.0, 50.77], [51.0, 51.44], [59.0, 58.77], [59.0, 59.81], [60.0, 65.94], [70.0, 70.14], [85.0, 85.75], [87.0, 99.12], [100.0, 100.92], [113.0, 113.75], [117.0, 116.9], [119.0, 122.01], [123.0, 131.92], [133.0, 140.49], [141.0, 141.37], [149.0, 149.05], [150.0, 152.88], [158.0, 158.38], [165.0, 165.96], [170.0, 170.72], [180.0, 179.93], [183.0, 184.25], [194.0, 193.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.88, 37.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.4, 0.0, 0.0, 36.57, 0.0, 0.0, 0.0, 44.04, 39.33, 40.93, 0.0, 0.0, 41.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 64.66], ["didgeridoo", 10.59], ["speech", 9.9]], [["sidetone", 49.85], ["music", 39.46], ["speech", 2.14]], null, null, null, null, null, null, [["music", 74.75], ["speech", 5.26], ["didgeridoo", 4.88]], null, null, [["music", 55.07], ["musical instrument", 6.99], ["didgeridoo", 6.26]], null, null, null, [["music", 75.83], ["musical instrument", 6.61], ["guitar", 1.8]], [["music", 58.59], ["sidetone", 13.03], ["didgeridoo", 6.56]], [["music", 72.23], ["speech", 7.51], ["didgeridoo", 3.79]], null, null, [["music", 81.45], ["speech", 5.11], ["musical instrument", 2.12]], null, null, null, null, null, null], "duration": [8.58, 24.53, 0.58, 0.32, 0.77, 0.44, -0.23, 0.81, 5.94, 0.14, 0.75, 12.12, 0.92, 0.75, -0.1, 3.01, 8.92, 7.49, 0.37, 0.05, 2.88, 0.38, 0.96, 0.72, -0.07, 1.25, -0.03]} \ No newline at end of file diff --git a/annotations_1/Uj6eiUsNwvU_filtered.json b/annotations_1/Uj6eiUsNwvU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84d8bfbf6df876829090b13cc4b3d598edc6c113 --- /dev/null +++ b/annotations_1/Uj6eiUsNwvU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.4], [19.0, 19.77], [23.0, 28.8], [29.0, 29.4], [30.0, 33.35], [43.0, 47.04], [51.0, 54.41], [55.0, 57.15], [58.0, 69.18], [70.0, 80.4], [93.0, 98.52], [107.0, 115.33], [122.0, 123.94], [131.0, 133.89], [139.0, 140.32], [142.0, 147.19], [148.0, 157.94], [165.0, 168.1], [169.0, 174.68], [181.0, 195.25]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 38.22, 0.0, 32.24, 30.81, 29.88, 29.07, 29.44, 29.92, 29.28, 29.47, 0.0, 30.17, 0.0, 29.4, 29.64, 29.08, 29.58, 29.23], "audiomae_on_audioset": [null, null, [["throbbing", 39.92], ["music", 27.8], ["hum", 14.13]], null, [["music", 55.52], ["speech", 7.2], ["boing", 4.82]], [["music", 63.88], ["electronic music", 10.59], ["dubstep", 4.65]], [["speech", 53.93], ["music", 9.98], ["groan", 8.44]], [["sidetone", 36.96], ["speech", 26.64], ["music", 12.13]], [["music", 63.06], ["speech", 11.49], ["cacophony", 3.82]], [["music", 58.09], ["speech", 11.23], ["throbbing", 6.72]], [["music", 57.59], ["hum", 14.74], ["throbbing", 10.15]], [["music", 69.98], ["electronic music", 6.93], ["techno", 2.17]], null, [["music", 45.33], ["throbbing", 23.73], ["hum", 10.94]], null, [["cattle, bovinae", 33.44], ["moo", 23.76], ["livestock, farm animals, working animals", 16.51]], [["music", 56.72], ["speech", 10.24], ["cacophony", 7.35]], [["music", 64.69], ["hum", 6.19], ["throbbing", 5.96]], [["music", 55.13], ["speech", 8.31], ["burst, pop", 5.19]], [["music", 60.79], ["electronic music", 7.14], ["throbbing", 6.19]]], "duration": [1.4, 0.77, 5.8, 0.4, 3.35, 4.04, 3.41, 2.15, 11.18, 10.4, 5.52, 8.33, 1.94, 2.89, 1.32, 5.19, 9.94, 3.1, 5.68, 14.25]} \ No newline at end of file diff --git a/annotations_1/UjOJ-AMtAzY_filtered.json b/annotations_1/UjOJ-AMtAzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c9b914cf41a846d40b2cffdd6c36c1e2ec65d1c --- /dev/null +++ b/annotations_1/UjOJ-AMtAzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 57.15], [61.0, 87.89], [89.0, 91.72], [95.0, 101.63], [102.0, 121.64], [123.0, 146.92], [148.0, 148.26], [149.0, 159.46], [162.0, 163.27]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 89.72, 99.59, 94.52, 88.83, 87.19, 0.0, 58.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [53.15, 26.89, 2.72, 6.63, 19.64, 23.92, 0.26, 10.46, 1.27]} \ No newline at end of file diff --git a/annotations_1/Uk1MJFwGMjI_filtered.json b/annotations_1/Uk1MJFwGMjI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dcb590266393cb0333d14ef2a0d83ace8808986 --- /dev/null +++ b/annotations_1/Uk1MJFwGMjI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.04], [9.0, 9.96], [12.0, 14.66], [15.0, 16.17], [22.0, 35.6], [36.0, 41.39], [49.0, 52.0], [53.0, 53.97], [55.0, 56.07], [57.0, 58.48], [59.0, 70.04], [71.0, 73.55], [75.0, 77.79], [78.0, 80.54], [82.0, 83.32], [85.0, 85.56], [87.0, 97.71], [98.0, 98.76], [107.0, 107.05], [108.0, 112.35], [114.0, 117.81], [119.0, 120.02], [121.0, 122.89], [124.0, 124.66], [126.0, 126.39], [127.0, 130.23], [131.0, 131.73], [133.0, 134.65], [136.0, 137.08], [139.0, 145.12]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 95.64, 0.0, 34.26, 37.21, 87.19, 0.0, 0.0, 0.0, 87.74, 92.15, 94.66, 89.9, 0.0, 0.0, 90.08, 0.0, 0.0, 94.95, 94.81, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 0.0, 0.0, 51.5], "audiomae_on_audioset": [null, null, null, null, [["music", 44.91], ["speech", 15.9], ["foghorn", 4.76]], [["livestock, farm animals, working animals", 31.94], ["moo", 21.47], ["music", 16.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.96, 2.66, 1.17, 13.6, 5.39, 3.0, 0.97, 1.07, 1.48, 11.04, 2.55, 2.79, 2.54, 1.32, 0.56, 10.71, 0.76, 0.05, 4.35, 3.81, 1.02, 1.89, 0.66, 0.39, 3.23, 0.73, 1.65, 1.08, 6.12]} \ No newline at end of file diff --git a/annotations_1/UkH65BsZg_g_filtered.json b/annotations_1/UkH65BsZg_g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e61c540d70c9be6971df4c432df9923cd1c9b2b1 --- /dev/null +++ b/annotations_1/UkH65BsZg_g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.18], [5.0, 5.43], [7.0, 9.44], [18.0, 18.23], [24.0, 24.27], [25.0, 26.06], [27.0, 27.67], [28.0, 29.12], [32.0, 32.59], [34.0, 40.14], [42.0, 44.29], [47.0, 47.95], [49.0, 49.33], [52.0, 54.21], [61.0, 64.71], [69.0, 69.62], [74.0, 73.79], [79.0, 80.96], [81.0, 85.55], [92.0, 93.58], [95.0, 95.49], [99.0, 100.33], [103.0, 103.25], [106.0, 109.48], [110.0, 110.98], [114.0, 114.56], [120.0, 126.98], [129.0, 129.19], [130.0, 139.85], [141.0, 142.1], [147.0, 147.38], [150.0, 150.13], [154.0, 159.02], [160.0, 160.42], [161.0, 161.28], [163.0, 163.76], [165.0, 166.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 87.19, 0.0, 0.0, 78.21, 62.47, 0.0, 0.0, 0.0, 55.74, 0.0, 0.0, 0.0, 0.0, 59.68, 0.0, 0.0, 69.61, 0.0, 62.07, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 0.43, 2.44, 0.23, 0.27, 1.06, 0.67, 1.12, 0.59, 6.14, 2.29, 0.95, 0.33, 2.21, 3.71, 0.62, -0.21, 1.96, 4.55, 1.58, 0.49, 1.33, 0.25, 3.48, 0.98, 0.56, 6.98, 0.19, 9.85, 1.1, 0.38, 0.13, 5.02, 0.42, 0.28, 0.76, 1.09]} \ No newline at end of file diff --git a/annotations_1/UkIwAAKv_iA_filtered.json b/annotations_1/UkIwAAKv_iA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7ef62301741a5ade470ef04d0572079170f6068 --- /dev/null +++ b/annotations_1/UkIwAAKv_iA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.92], [10.0, 10.88], [15.0, 15.23], [16.0, 16.53], [29.0, 33.83], [34.0, 34.97], [36.0, 36.66], [39.0, 40.74], [43.0, 43.34], [47.0, 51.24], [57.0, 57.1], [63.0, 63.69], [65.0, 66.45], [68.0, 68.89], [73.0, 82.09], [83.0, 84.7], [85.0, 86.07], [88.0, 102.95]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 51.12, 0.0, 0.0, 0.0, 0.0, 33.82, 0.0, 0.0, 0.0, 0.0, 49.64, 0.0, 0.0, 94.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 25.78], ["breaking", 11.19], ["laughter", 9.31]], null, null, null, null, [["speech", 46.57], ["fly, housefly", 13.57], ["insect", 8.45]], null, null, null], "duration": [-0.08, 0.88, 0.23, 0.53, 4.83, 0.97, 0.66, 1.74, 0.34, 4.24, 0.1, 0.69, 1.45, 0.89, 9.09, 1.7, 1.07, 14.95]} \ No newline at end of file diff --git a/annotations_1/UkPkaNawTUw_filtered.json b/annotations_1/UkPkaNawTUw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0a9b038cf338ef838352613c15c6bdb1c38e2a7 --- /dev/null +++ b/annotations_1/UkPkaNawTUw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 19.5], [21.0, 36.53], [39.0, 45.62], [46.0, 47.12], [49.0, 54.28], [55.0, 63.58], [64.0, 65.31], [67.0, 78.68], [82.0, 83.79], [84.0, 85.31]], "keep_status": [true, true, true, false, true, false, false, false, false, false], "silence_prob": [39.05, 40.02, 33.3, 0.0, 41.5, 32.78, 0.0, 32.37, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 14.21], ["noise", 8.5], ["electric shaver, electric razor", 8.28]], [["speech", 15.2], ["sidetone", 10.97], ["music", 10.37]], [["throbbing", 32.93], ["hum", 21.35], ["heart sounds, heartbeat", 13.18]], null, [["hum", 44.74], ["throbbing", 15.09], ["mains hum", 9.38]], [["speech", 66.29], ["hum", 7.6], ["throbbing", 7.53]], null, [["speech", 74.8], ["whack, thwack", 7.14], ["livestock, farm animals, working animals", 1.72]], null, null], "duration": [16.5, 15.53, 6.62, 1.12, 5.28, 8.58, 1.31, 11.68, 1.79, 1.31]} \ No newline at end of file diff --git a/annotations_1/UkamBJTqN8c_filtered.json b/annotations_1/UkamBJTqN8c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38f056bd61632a689d28c3a8018c3bd1c0a9d132 --- /dev/null +++ b/annotations_1/UkamBJTqN8c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.07], [14.0, 21.91], [23.0, 23.57], [25.0, 35.65], [40.0, 42.45], [43.0, 47.6], [48.0, 65.7], [69.0, 79.35], [82.0, 82.61], [84.0, 85.08], [87.0, 97.06], [98.0, 114.54], [115.0, 143.43], [144.0, 144.54], [145.0, 145.35], [150.0, 173.65]], "keep_status": [false, false, false, false, true, true, true, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 32.81, 0.0, 31.89, 33.56, 39.41, 40.97, 44.18, 0.0, 0.0, 34.64, 40.88, 32.51, 0.0, 0.0, 32.22], "audiomae_on_audioset": [null, [["hum", 44.7], ["throbbing", 25.16], ["music", 11.6]], null, [["music", 37.42], ["hum", 27.2], ["mains hum", 12.02]], [["music", 55.24], ["mains hum", 6.87], ["synthesizer", 5.61]], [["hum", 32.61], ["mains hum", 24.9], ["music", 10.35]], [["music", 37.07], ["synthesizer", 11.61], ["theremin", 8.49]], [["music", 61.44], ["didgeridoo", 8.53], ["synthesizer", 5.53]], null, null, [["hum", 40.62], ["music", 19.77], ["throbbing", 9.57]], [["hum", 52.41], ["mains hum", 14.35], ["speech", 12.71]], [["speech", 45.7], ["music", 28.36], ["shout", 4.76]], null, null, [["livestock, farm animals, working animals", 29.14], ["music", 16.63], ["cattle, bovinae", 11.58]]], "duration": [1.07, 7.91, 0.57, 10.65, 2.45, 4.6, 17.7, 10.35, 0.61, 1.08, 10.06, 16.54, 28.43, 0.54, 0.35, 23.65]} \ No newline at end of file diff --git a/annotations_1/UlxZ06150xI_filtered.json b/annotations_1/UlxZ06150xI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..416bebf4197bc540c51782971644ce5c656ebbea --- /dev/null +++ b/annotations_1/UlxZ06150xI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [8.0, 12.26], [13.0, 18.45], [19.0, 26.0], [30.0, 30.67], [32.0, 36.26], [38.0, 38.65], [39.0, 40.59], [45.0, 45.28], [46.0, 47.02], [48.0, 48.3], [49.0, 57.84], [62.0, 73.65], [81.0, 81.21], [85.0, 89.58], [91.0, 91.54], [93.0, 93.68], [94.0, 95.18], [97.0, 97.28], [98.0, 98.66], [101.0, 101.58], [104.0, 104.3], [110.0, 111.54], [112.0, 113.21], [129.0, 130.11], [131.0, 131.92], [135.0, 137.2], [141.0, 153.99], [155.0, 155.56], [157.0, 157.79], [159.0, 174.75], [175.0, 174.78], [175.0, 176.3]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 30.93, 30.46, 29.81, 0.0, 29.03, 0.0, 0.0, 0.0, 0.0, 0.0, 32.18, 30.87, 0.0, 85.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.56, 30.65, 0.0, 0.0, 31.52, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 41.42], ["throbbing", 12.28], ["smash, crash", 9.85]], [["speech", 40.71], ["music", 37.31], ["electronic music", 3.49]], [["music", 16.17], ["hum", 15.75], ["speech", 15.65]], null, [["speech", 33.38], ["music", 27.78], ["smash, crash", 9.05]], null, null, null, null, null, [["music", 29.82], ["breaking", 23.17], ["hum", 6.18]], [["explosion", 17.97], ["speech", 16.58], ["music", 15.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 20.44], ["whack, thwack", 12.74], ["music", 11.65]], [["speech", 75.98], ["explosion", 2.71], ["machine gun", 2.6]], null, null, [["music", 41.88], ["explosion", 18.54], ["burst, pop", 5.78]], null, null], "duration": [0.56, 4.26, 5.45, 7.0, 0.67, 4.26, 0.65, 1.59, 0.28, 1.02, 0.3, 8.84, 11.65, 0.21, 4.58, 0.54, 0.68, 1.18, 0.28, 0.66, 0.58, 0.3, 1.54, 1.21, 1.11, 0.92, 2.2, 12.99, 0.56, 0.79, 15.75, -0.22, 1.3]} \ No newline at end of file diff --git a/annotations_1/UmRkYrYgnN4_filtered.json b/annotations_1/UmRkYrYgnN4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c058da779d417f73a486c3690c96c89937a61f3a --- /dev/null +++ b/annotations_1/UmRkYrYgnN4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 34.01], [35.0, 38.92], [40.0, 40.02], [43.0, 43.48], [45.0, 49.37], [50.0, 53.1], [55.0, 83.17], [84.0, 87.51], [90.0, 93.39], [94.0, 96.25], [97.0, 99.57], [100.0, 101.43], [102.0, 102.37], [104.0, 116.4], [116.0, 117.12], [118.0, 119.94], [120.0, 120.21], [121.0, 122.74], [124.0, 124.01]], "keep_status": [true, true, false, false, true, true, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [39.04, 40.09, 0.0, 0.0, 38.47, 38.05, 50.11, 42.19, 59.24, 67.63, 43.43, 0.0, 0.0, 37.22, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 29.45], ["music", 25.08], ["throbbing", 7.6]], [["hum", 32.37], ["mains hum", 28.6], ["fly, housefly", 5.38]], null, null, [["music", 31.88], ["whale vocalization", 8.37], ["hum", 7.99]], [["music", 26.99], ["speech", 25.44], ["hum", 5.51]], null, [["music", 81.66], ["musical instrument", 2.13], ["ambient music", 1.86]], null, null, [["music", 20.38], ["hum", 17.97], ["sonar", 16.99]], null, null, [["hum", 35.9], ["mains hum", 23.95], ["throbbing", 6.2]], null, null, null, null, null], "duration": [17.01, 3.92, 0.02, 0.48, 4.37, 3.1, 28.17, 3.51, 3.39, 2.25, 2.57, 1.43, 0.37, 12.4, 1.12, 1.94, 0.21, 1.74, 0.01]} \ No newline at end of file diff --git a/annotations_1/UmynxNlSRaE_filtered.json b/annotations_1/UmynxNlSRaE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b35d4097d3ae72f456fa1eb17b35abb83688f21e --- /dev/null +++ b/annotations_1/UmynxNlSRaE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 63.51], [69.0, 72.5]], "keep_status": [true, true], "silence_prob": [47.98, 49.59], "audiomae_on_audioset": [[["music", 44.91], ["effects unit", 6.96], ["musical instrument", 6.93]], [["music", 27.12], ["gong", 25.15], ["musical instrument", 5.45]]], "duration": [23.51, 3.5]} \ No newline at end of file diff --git a/annotations_1/UnllAPMRnKE_filtered.json b/annotations_1/UnllAPMRnKE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43d6a0ff7ce6a8da20d25cb8d7c914c99245c3d5 --- /dev/null +++ b/annotations_1/UnllAPMRnKE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.68], [10.0, 10.27], [16.0, 15.8], [27.0, 28.54], [30.0, 31.41], [32.0, 32.88], [56.0, 56.52], [57.0, 57.43], [58.0, 58.36], [68.0, 69.8], [73.0, 73.8], [75.0, 74.85], [75.0, 75.56], [82.0, 82.26], [83.0, 85.04], [100.0, 100.4], [102.0, 103.42], [105.0, 106.14], [108.0, 109.44], [111.0, 114.81], [118.0, 120.28], [122.0, 125.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 86.45, 75.55, 65.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 0.27, -0.2, 1.54, 1.41, 0.88, 0.52, 0.43, 0.36, 1.8, 0.8, -0.15, 0.56, 0.26, 2.04, 0.4, 1.42, 1.14, 1.44, 3.81, 2.28, 3.95]} \ No newline at end of file diff --git a/annotations_1/Uo1FfULMJ5E_filtered.json b/annotations_1/Uo1FfULMJ5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/Uo1FfULMJ5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/UoMiVPjDb10_filtered.json b/annotations_1/UoMiVPjDb10_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c247a49199c060e18d847eb67b1f65f96b2b1c3a --- /dev/null +++ b/annotations_1/UoMiVPjDb10_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.22], [22.0, 23.23], [24.0, 27.16], [37.0, 42.26], [43.0, 43.8], [48.0, 48.36], [50.0, 50.55], [51.0, 52.03], [54.0, 65.1], [68.0, 70.6], [71.0, 72.47], [74.0, 76.92], [77.0, 78.16], [79.0, 79.95], [83.0, 82.58], [84.0, 85.14], [87.0, 87.62], [90.0, 93.92], [100.0, 99.86], [101.0, 101.48], [103.0, 105.46], [107.0, 107.5], [108.0, 109.32], [114.0, 115.52], [123.0, 124.51], [130.0, 135.43], [136.0, 136.83], [137.0, 137.54], [145.0, 145.61], [148.0, 148.31]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 42.42, 35.55, 0.0, 0.0, 0.0, 0.0, 37.07, 39.24, 0.0, 42.55, 0.0, 0.0, 0.0, 0.0, 0.0, 38.64, 0.0, 0.0, 39.44, 0.0, 0.0, 0.0, 0.0, 56.03, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["insect", 20.14], ["fly, housefly", 18.06], ["bee, wasp, etc.", 10.71]], [["cattle, bovinae", 40.04], ["livestock, farm animals, working animals", 37.64], ["moo", 22.21]], null, null, null, null, [["music", 57.58], ["theremin", 12.95], ["buzz", 2.5]], [["music", 36.6], ["foghorn", 6.63], ["theremin", 6.29]], null, [["foghorn", 66.31], ["music", 9.77], ["didgeridoo", 2.88]], null, null, null, null, null, [["music", 44.9], ["hum", 10.63], ["mains hum", 5.91]], null, null, [["music", 34.52], ["musical instrument", 4.84], ["crushing", 4.09]], null, null, null, null, null, null, null, null, null], "duration": [1.22, 1.23, 3.16, 5.26, 0.8, 0.36, 0.55, 1.03, 11.1, 2.6, 1.47, 2.92, 1.16, 0.95, -0.42, 1.14, 0.62, 3.92, -0.14, 0.48, 2.46, 0.5, 1.32, 1.52, 1.51, 5.43, 0.83, 0.54, 0.61, 0.31]} \ No newline at end of file diff --git a/annotations_1/Uovtut2ckMg_filtered.json b/annotations_1/Uovtut2ckMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3d120837d357e7f2cf2ca98e761fb93ca5dac11 --- /dev/null +++ b/annotations_1/Uovtut2ckMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.31], [15.0, 23.55], [27.0, 29.3], [38.0, 38.01], [45.0, 47.01], [52.0, 53.49], [62.0, 63.88], [67.0, 71.61], [73.0, 73.87], [82.0, 83.22], [85.0, 84.94], [86.0, 86.46], [92.0, 92.43], [98.0, 99.05], [110.0, 113.0], [120.0, 120.38], [122.0, 125.29]], "keep_status": [false, true, true, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.62, 44.37, 0.0, 47.12, 0.0, 0.0, 33.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 0.0, 59.33], "audiomae_on_audioset": [null, [["animal", 51.98], ["sheep", 9.15], ["livestock, farm animals, working animals", 7.21]], [["speech", 32.53], ["fly, housefly", 14.85], ["music", 9.21]], null, [["speech", 39.12], ["music", 15.5], ["hum", 4.85]], null, null, [["whale vocalization", 28.6], ["noise", 20.42], ["music", 7.54]], null, null, null, null, null, null, null, null, null], "duration": [0.31, 8.55, 2.3, 0.01, 2.01, 1.49, 1.88, 4.61, 0.87, 1.22, -0.06, 0.46, 0.43, 1.05, 3.0, 0.38, 3.29]} \ No newline at end of file diff --git a/annotations_1/Up7TU2t7_8g_filtered.json b/annotations_1/Up7TU2t7_8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0168b32ba6859f716e31e3064df125f383afa0f3 --- /dev/null +++ b/annotations_1/Up7TU2t7_8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 15.11], [16.0, 26.38], [32.0, 77.46], [80.0, 144.73], [147.0, 170.87], [173.0, 177.23]], "keep_status": [true, true, false, false, true, true], "silence_prob": [29.3, 29.16, 0.0, 0.0, 28.94, 29.34], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 30.69], ["cattle, bovinae", 12.81], ["music", 7.8]], [["music", 38.66], ["vehicle", 10.87], ["car", 6.43]], null, null, [["speech", 34.49], ["music", 15.85], ["buzz", 7.59]], [["music", 33.5], ["hum", 8.12], ["buzz", 6.45]]], "duration": [11.11, 10.38, 45.46, 64.73, 23.87, 4.23]} \ No newline at end of file diff --git a/annotations_1/UpgP8aA8ABE_filtered.json b/annotations_1/UpgP8aA8ABE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6de4ad785ba46e7dc2048b44f7596defa1110114 --- /dev/null +++ b/annotations_1/UpgP8aA8ABE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 34.96], [39.0, 39.28], [45.0, 46.23], [47.0, 49.44], [61.0, 66.65], [67.0, 69.87], [76.0, 87.56], [93.0, 97.38], [103.0, 104.14], [110.0, 110.91], [114.0, 114.4], [116.0, 116.67], [118.0, 119.2], [121.0, 122.17], [126.0, 126.5], [128.0, 130.65], [131.0, 133.22], [134.0, 137.37], [139.0, 140.39], [143.0, 144.22], [150.0, 161.16]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.9, 0.0, 0.0, 35.25, 42.6, 33.74, 34.61, 46.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.78, 94.37, 99.05, 0.0, 0.0, 69.07], "audiomae_on_audioset": [[["music", 81.17], ["speech", 3.02], ["boing", 2.71]], null, null, [["music", 59.41], ["throbbing", 7.03], ["whack, thwack", 5.46]], [["whistle", 22.68], ["music", 19.88], ["speech", 7.92]], [["music", 66.59], ["frog", 5.6], ["speech", 3.23]], [["music", 36.1], ["boing", 11.88], ["speech", 3.79]], [["music", 59.43], ["guitar", 8.5], ["bass guitar", 6.38]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [29.96, 0.28, 1.23, 2.44, 5.65, 2.87, 11.56, 4.38, 1.14, 0.91, 0.4, 0.67, 1.2, 1.17, 0.5, 2.65, 2.22, 3.37, 1.39, 1.22, 11.16]} \ No newline at end of file diff --git a/annotations_1/UrCi_k2TXOA_filtered.json b/annotations_1/UrCi_k2TXOA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c4ad2a82313caa86dcad3a9cde484687c698505 --- /dev/null +++ b/annotations_1/UrCi_k2TXOA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.31], [4.0, 5.17], [13.0, 13.59], [15.0, 15.09], [16.0, 16.75], [18.0, 18.69], [20.0, 20.61], [26.0, 32.85], [34.0, 34.87], [38.0, 41.27], [44.0, 44.09], [46.0, 48.22], [49.0, 50.23], [51.0, 71.74], [72.0, 73.6], [74.0, 76.82], [79.0, 81.38], [83.0, 83.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.73, 0.0, 99.59, 0.0, 48.1, 0.0, 41.14, 0.0, 99.85, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 59.08], ["blender", 8.28], ["radio", 5.22]], null, null, null, [["inside, small room", 10.85], ["knock", 7.52], ["dial tone", 6.84]], null, [["chirp tone", 28.25], ["speech", 8.6], ["hum", 7.79]], null, null, null, null], "duration": [0.31, 1.17, 0.59, 0.09, 0.75, 0.69, 0.61, 6.85, 0.87, 3.27, 0.09, 2.22, 1.23, 20.74, 1.6, 2.82, 2.38, 0.54]} \ No newline at end of file diff --git a/annotations_1/Us1MxXdSHw8_filtered.json b/annotations_1/Us1MxXdSHw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c33cca6bdb5d87a07be6c5b89d789d321bdbc4c --- /dev/null +++ b/annotations_1/Us1MxXdSHw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.56], [7.0, 13.98], [14.0, 16.48], [20.0, 21.66], [23.0, 24.43], [25.0, 26.42], [28.0, 30.21], [32.0, 34.5], [36.0, 36.05], [40.0, 40.83], [42.0, 42.67], [43.0, 43.39], [44.0, 44.76], [46.0, 46.77], [47.0, 47.56], [48.0, 49.32], [50.0, 51.11], [52.0, 52.71], [54.0, 55.98], [57.0, 57.05], [58.0, 59.39], [70.0, 71.25], [73.0, 73.33], [74.0, 74.56], [75.0, 77.36], [79.0, 80.69], [82.0, 84.7], [86.0, 87.96], [91.0, 102.74], [104.0, 117.76], [119.0, 118.99], [121.0, 122.13], [124.0, 124.92], [127.0, 127.48], [130.0, 130.0], [150.0, 154.72]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.63, 38.9, 0.0, 0.0, 0.0, 67.25, 30.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.08, 0.0, 32.15, 0.0, 29.7, 28.88, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0], "audiomae_on_audioset": [null, [["music", 43.8], ["hum", 11.16], ["mains hum", 8.5]], [["music", 45.95], ["speech", 10.06], ["sidetone", 6.45]], null, null, null, null, [["speech", 41.69], ["knock", 6.89], ["thunk", 4.72]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.03], ["animal", 12.42], ["whale vocalization", 6.86]], null, [["music", 25.59], ["synthesizer", 8.52], ["musical instrument", 6.55]], null, [["music", 37.69], ["piano", 17.58], ["keyboard (musical)", 16.93]], [["piano", 30.21], ["music", 25.1], ["musical instrument", 17.22]], null, null, null, null, null, [["music", 52.88], ["musical instrument", 12.38], ["piano", 4.88]]], "duration": [1.56, 6.98, 2.48, 1.66, 1.43, 1.42, 2.21, 2.5, 0.05, 0.83, 0.67, 0.39, 0.76, 0.77, 0.56, 1.32, 1.11, 0.71, 1.98, 0.05, 1.39, 1.25, 0.33, 0.56, 2.36, 1.69, 2.7, 1.96, 11.74, 13.76, -0.01, 1.13, 0.92, 0.48, 0.0, 4.72]} \ No newline at end of file diff --git a/annotations_1/UsM7OBEMqnk_filtered.json b/annotations_1/UsM7OBEMqnk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..124abe1dbd393b43457fd1f32b57b89b3247c10b --- /dev/null +++ b/annotations_1/UsM7OBEMqnk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 27.35], [29.0, 33.51], [36.0, 40.32], [40.0, 49.06], [51.0, 61.79], [62.0, 85.04], [85.0, 85.77], [87.0, 91.17], [99.0, 98.64]], "keep_status": [false, false, false, false, true, true, false, false, false], "silence_prob": [29.84, 30.83, 29.7, 29.88, 30.11, 30.44, 0.0, 36.59, 0.0], "audiomae_on_audioset": [[["music", 81.09], ["didgeridoo", 2.92], ["musical instrument", 2.55]], [["music", 69.13], ["breaking", 10.62], ["smash, crash", 6.05]], [["speech", 38.19], ["music", 37.32], ["didgeridoo", 3.39]], [["music", 70.0], ["speech", 8.01], ["breaking", 5.32]], [["music", 31.75], ["boing", 19.83], ["speech", 4.61]], [["music", 54.55], ["speech", 8.55], ["boing", 6.86]], null, [["music", 71.68], ["synthesizer", 5.28], ["musical instrument", 3.68]], null], "duration": [21.35, 4.51, 4.32, 9.06, 10.79, 23.04, 0.77, 4.17, -0.36]} \ No newline at end of file diff --git a/annotations_1/UsNnkax2wNA_filtered.json b/annotations_1/UsNnkax2wNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20d1d2d10b20dcd145f0c1858eaab58289a02849 --- /dev/null +++ b/annotations_1/UsNnkax2wNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.94], [6.0, 8.82], [9.0, 9.58], [10.0, 10.52], [14.0, 16.95], [22.0, 33.78], [37.0, 37.98], [40.0, 40.17], [42.0, 41.86], [45.0, 45.39], [47.0, 47.17], [52.0, 52.2], [54.0, 55.68], [57.0, 58.87], [59.0, 97.38], [98.0, 98.22], [98.0, 99.13], [100.0, 102.52], [103.0, 110.61], [116.0, 125.12], [126.0, 133.08], [136.0, 147.6], [152.0, 151.9], [153.0, 154.36], [154.0, 154.89], [155.0, 154.92], [155.0, 154.95], [155.0, 154.99], [155.0, 155.02], [155.0, 155.06], [155.0, 159.11], [160.0, 159.95], [160.0, 169.33], [169.0, 173.87], [181.0, 201.29], [206.0, 207.0], [207.0, 212.18], [212.0, 212.21], [214.0, 226.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 91.81, 0.0, 0.0, 34.8, 35.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 31.16, 31.87, 39.67, 32.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.6, 0.0, 37.08, 33.21, 40.24, 0.0, 30.64, 0.0, 40.5], "audiomae_on_audioset": [null, null, null, null, [["livestock, farm animals, working animals", 34.65], ["moo", 32.41], ["cattle, bovinae", 29.14]], [["music", 75.46], ["didgeridoo", 5.52], ["musical instrument", 2.4]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.1], ["speech", 25.26], ["musical instrument", 2.92]], [["speech", 40.8], ["music", 17.41], ["fart", 13.2]], [["music", 59.85], ["speech", 19.18], ["didgeridoo", 7.95]], [["music", 50.07], ["speech", 24.72], ["didgeridoo", 4.04]], null, null, null, null, null, null, null, null, [["music", 27.42], ["fly, housefly", 22.7], ["mosquito", 21.36]], null, [["music", 72.89], ["synthesizer", 4.35], ["theremin", 4.15]], [["music", 74.57], ["theremin", 4.04], ["hum", 3.98]], [["music", 60.5], ["theremin", 7.4], ["musical instrument", 2.12]], null, [["music", 49.77], ["speech", 15.33], ["boing", 4.37]], null, [["music", 56.08], ["theremin", 19.99], ["synthesizer", 3.52]]], "duration": [0.94, 2.82, 0.58, 0.52, 2.95, 11.78, 0.98, 0.17, -0.14, 0.39, 0.17, 0.2, 1.68, 1.87, 38.38, 0.22, 1.13, 2.52, 7.61, 9.12, 7.08, 11.6, -0.1, 1.36, 0.89, -0.08, -0.05, -0.01, 0.02, 0.06, 4.11, -0.05, 9.33, 4.87, 20.29, 1.0, 5.18, 0.21, 12.54]} \ No newline at end of file diff --git a/annotations_1/UsZNj9srzR8_filtered.json b/annotations_1/UsZNj9srzR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02abf417c60ac707c3d6663693bc7a16e691f65f --- /dev/null +++ b/annotations_1/UsZNj9srzR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 50.8], [51.0, 51.39], [58.0, 66.75], [69.0, 81.72], [83.0, 83.51], [84.0, 152.95], [155.0, 156.79], [158.0, 206.47], [207.0, 208.35]], "keep_status": [true, false, false, false, false, false, false, false, false], "silence_prob": [30.54, 0.0, 32.72, 31.12, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 56.18], ["speech", 7.86], ["musical instrument", 4.14]], null, [["ding", 29.69], ["clang", 26.18], ["music", 20.81]], [["music", 64.92], ["throbbing", 9.69], ["hum", 4.13]], null, null, null, null, null], "duration": [23.8, 0.39, 8.75, 12.72, 0.51, 68.95, 1.79, 48.47, 1.35]} \ No newline at end of file diff --git a/annotations_1/UtyiyBw401w_filtered.json b/annotations_1/UtyiyBw401w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c071e9148e3652b74e684b44a30bf2a0fcdf9941 --- /dev/null +++ b/annotations_1/UtyiyBw401w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.64], [9.0, 11.1], [11.0, 13.56], [17.0, 25.03], [26.0, 28.51], [31.0, 33.22], [35.0, 36.22], [40.0, 42.57], [47.0, 48.07], [49.0, 51.14], [54.0, 57.42], [58.0, 58.77], [60.0, 64.79], [67.0, 67.47], [68.0, 75.44], [76.0, 78.31], [79.0, 80.5], [83.0, 97.23], [99.0, 113.51], [116.0, 126.72], [127.0, 139.16], [140.0, 151.66], [153.0, 152.91], [157.0, 158.48], [159.0, 158.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 94.37, 94.95, 92.31, 97.54, 95.37, 0.0, 99.76, 0.0, 99.31, 97.43, 0.0, 77.53, 0.0, 99.44, 99.26, 0.0, 89.36, 57.17, 65.32, 42.35, 44.43, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["telephone", 22.77], ["telephone bell ringing", 19.82], ["fire alarm", 7.52]], [["telephone bell ringing", 91.36], ["telephone", 7.65], ["ringtone", 0.47]], null, null, null], "duration": [0.64, 2.1, 2.56, 8.03, 2.51, 2.22, 1.22, 2.57, 1.07, 2.14, 3.42, 0.77, 4.79, 0.47, 7.44, 2.31, 1.5, 14.23, 14.51, 10.72, 12.16, 11.66, -0.09, 1.48, -0.27]} \ No newline at end of file diff --git a/annotations_1/UvDzmAFiUj8_filtered.json b/annotations_1/UvDzmAFiUj8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b72b41d7262d6953550724b6640e9ff51c9daf55 --- /dev/null +++ b/annotations_1/UvDzmAFiUj8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 76.11], [76.0, 76.15], [76.0, 76.76], [77.0, 76.86], [80.0, 86.76], [89.0, 135.84], [137.0, 144.96], [149.0, 153.42], [156.0, 158.26], [158.0, 158.31]], "keep_status": [true, false, false, false, true, false, true, true, false, false], "silence_prob": [30.87, 0.0, 0.0, 0.0, 34.55, 0.0, 36.05, 32.1, 35.16, 0.0], "audiomae_on_audioset": [[["music", 48.64], ["buzz", 11.26], ["speech", 3.92]], null, null, null, [["speech", 45.96], ["music", 14.04], ["whack, thwack", 7.96]], null, [["frog", 14.57], ["speech", 11.35], ["hum", 9.29]], [["fly, housefly", 33.14], ["speech", 14.14], ["insect", 12.49]], [["speech", 38.17], ["music", 29.28], ["beatboxing", 5.05]], null], "duration": [22.11, 0.15, 0.76, -0.14, 6.76, 46.84, 7.96, 4.42, 2.26, 0.31]} \ No newline at end of file diff --git a/annotations_1/UvRaab90nQ0_filtered.json b/annotations_1/UvRaab90nQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43453e617478f81f5ac65d6d09c1ee288b61aa57 --- /dev/null +++ b/annotations_1/UvRaab90nQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.31], [19.0, 19.28], [20.0, 20.44], [22.0, 22.65], [28.0, 29.03], [30.0, 34.03], [59.0, 61.48], [67.0, 67.04], [70.0, 71.79], [73.0, 72.96], [74.0, 74.63], [79.0, 82.66], [83.0, 84.74], [97.0, 98.58], [102.0, 102.79], [104.0, 103.99], [105.0, 113.09], [117.0, 119.15], [126.0, 126.45], [128.0, 128.31], [136.0, 136.81], [138.0, 139.35], [141.0, 145.93]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true], "silence_prob": [55.46, 0.0, 0.0, 0.0, 0.0, 33.73, 100.0, 0.0, 0.0, 0.0, 0.0, 32.44, 0.0, 0.0, 0.0, 0.0, 31.36, 32.33, 0.0, 0.0, 0.0, 0.0, 34.3], "audiomae_on_audioset": [null, null, null, null, null, [["music", 47.24], ["synthesizer", 12.71], ["musical instrument", 4.72]], null, null, null, null, null, [["speech", 61.91], ["busy signal", 9.61], ["dial tone", 4.73]], null, null, null, null, [["cattle, bovinae", 22.29], ["speech", 17.05], ["moo", 15.44]], [["music", 24.18], ["hum", 11.19], ["speech", 10.03]], null, null, null, null, [["music", 33.23], ["speech", 23.14], ["cattle, bovinae", 5.09]]], "duration": [6.31, 0.28, 0.44, 0.65, 1.03, 4.03, 2.48, 0.04, 1.79, -0.04, 0.63, 3.66, 1.74, 1.58, 0.79, -0.01, 8.09, 2.15, 0.45, 0.31, 0.81, 1.35, 4.93]} \ No newline at end of file diff --git a/annotations_1/UvSGGd3ewFI_filtered.json b/annotations_1/UvSGGd3ewFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15de1d51a8bfcef0ac4f9b026bfa2adc923514b4 --- /dev/null +++ b/annotations_1/UvSGGd3ewFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.57], [8.0, 9.17], [14.0, 14.39], [17.0, 17.74], [19.0, 19.68], [24.0, 24.85], [44.0, 44.63], [65.0, 67.71], [69.0, 98.78], [104.0, 140.32], [143.0, 144.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.57, 30.49, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 55.61], ["speech", 8.1], ["didgeridoo", 7.03]], [["music", 35.13], ["speech", 31.07], ["buzz", 3.83]], null, null], "duration": [1.57, 1.17, 0.39, 0.74, 0.68, 0.85, 0.63, 2.71, 29.78, 36.32, 1.02]} \ No newline at end of file diff --git a/annotations_1/Uvm8N3wQDTo_filtered.json b/annotations_1/Uvm8N3wQDTo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25c2142dde8e05efcdffc6c611b62ccf7e20f258 --- /dev/null +++ b/annotations_1/Uvm8N3wQDTo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.78], [17.0, 17.34], [24.0, 24.02], [26.0, 26.57], [31.0, 32.91], [42.0, 42.85], [87.0, 87.79], [102.0, 102.57], [110.0, 112.18], [127.0, 127.33], [131.0, 130.64], [133.0, 133.62], [143.0, 143.75], [146.0, 147.56], [154.0, 155.06], [156.0, 156.47], [167.0, 169.92], [175.0, 174.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.05, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 42.79], ["music", 25.72], ["whale vocalization", 15.56]], null, null, null, null, null, null, null, [["speech", 40.53], ["whale vocalization", 36.62], ["music", 3.9]], null], "duration": [0.78, 0.34, 0.02, 0.57, 1.91, 0.85, 0.79, 0.57, 2.18, 0.33, -0.36, 0.62, 0.75, 1.56, 1.06, 0.47, 2.92, -0.28]} \ No newline at end of file diff --git a/annotations_1/UwfFWXUEyfQ_filtered.json b/annotations_1/UwfFWXUEyfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f480e3c173c6e97146a5e497b22598d9742eec0e --- /dev/null +++ b/annotations_1/UwfFWXUEyfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.04], [15.0, 15.65], [18.0, 19.2], [20.0, 20.87], [24.0, 25.14], [29.0, 28.9], [37.0, 37.17], [39.0, 39.33], [41.0, 41.0], [49.0, 61.86], [64.0, 69.11], [72.0, 73.21], [76.0, 76.87], [77.0, 83.86], [87.0, 87.69], [89.0, 118.84], [122.0, 123.13]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.64, 33.12, 0.0, 0.0, 39.77, 0.0, 29.05, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 34.36], ["didgeridoo", 24.51], ["whale vocalization", 6.63]], [["animal", 15.22], ["music", 9.91], ["whale vocalization", 7.45]], null, null, [["music", 42.39], ["musical instrument", 11.16], ["effects unit", 6.48]], null, [["music", 11.22], ["grunt", 10.82], ["sound effect", 7.89]], null], "duration": [1.04, 0.65, 1.2, 0.87, 1.14, -0.1, 0.17, 0.33, 0.0, 12.86, 5.11, 1.21, 0.87, 6.86, 0.69, 29.84, 1.13]} \ No newline at end of file diff --git a/annotations_1/UxHXWhEq5lo_filtered.json b/annotations_1/UxHXWhEq5lo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71079419097092aaef25a1646d024439a8d815e4 --- /dev/null +++ b/annotations_1/UxHXWhEq5lo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.71], [28.0, 29.07], [29.0, 37.81], [40.0, 49.42], [51.0, 52.08], [53.0, 52.91], [53.0, 52.96], [53.0, 54.16], [55.0, 91.5], [92.0, 93.19], [98.0, 98.73], [100.0, 140.49], [144.0, 143.94], [148.0, 148.76], [150.0, 150.74], [154.0, 154.77]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.84, 35.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 43.71], ["whack, thwack", 8.83], ["sidetone", 7.93]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.71, 1.07, 8.81, 9.42, 1.08, -0.09, -0.04, 1.16, 36.5, 1.19, 0.73, 40.49, -0.06, 0.76, 0.74, 0.77]} \ No newline at end of file diff --git a/annotations_1/UxjYMYu0F8o_filtered.json b/annotations_1/UxjYMYu0F8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b81c62add9608ac746a29651bf144d26cc72f86 --- /dev/null +++ b/annotations_1/UxjYMYu0F8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.73], [7.0, 11.08], [14.0, 15.42], [16.0, 18.17], [19.0, 20.44], [21.0, 21.78], [30.0, 30.38], [31.0, 31.97], [34.0, 34.91], [35.0, 38.62], [39.0, 39.97], [41.0, 41.91], [43.0, 44.2], [51.0, 57.06], [60.0, 60.49], [61.0, 62.14], [66.0, 68.61], [72.0, 76.0], [76.0, 76.6], [77.0, 79.89], [80.0, 83.1], [84.0, 84.92], [85.0, 90.53], [91.0, 93.14], [99.0, 99.45], [101.0, 102.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 60.51, 0.0, 85.17, 0.0, 0.0, 0.0, 0.0, 0.0, 71.43, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 88.64, 74.13, 0.0, 94.07, 56.55, 0.0, 54.97, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.73, 4.08, 1.42, 2.17, 1.44, 0.78, 0.38, 0.97, 0.91, 3.62, 0.97, 0.91, 1.2, 6.06, 0.49, 1.14, 2.61, 4.0, 0.6, 2.89, 3.1, 0.92, 5.53, 2.14, 0.45, 1.64]} \ No newline at end of file diff --git a/annotations_1/Uy-L94Tio9w_filtered.json b/annotations_1/Uy-L94Tio9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e843c97628ddcaa440700437ca82a02bb85d6cd --- /dev/null +++ b/annotations_1/Uy-L94Tio9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 56.39], [64.0, 75.1], [81.0, 112.83], [117.0, 117.98], [119.0, 119.47], [122.0, 177.94]], "keep_status": [false, false, false, false, false, false], "silence_prob": [28.13, 27.95, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 47.25], ["explosion", 16.57], ["burst, pop", 7.09]], [["speech", 66.91], ["music", 13.41], ["vehicle", 4.1]], null, null, null, null], "duration": [5.39, 11.1, 31.83, 0.98, 0.47, 55.94]} \ No newline at end of file diff --git a/annotations_1/UyKyxHFIT3A_filtered.json b/annotations_1/UyKyxHFIT3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37f0ccb27962a02e33c502dd1168629eebb4ee14 --- /dev/null +++ b/annotations_1/UyKyxHFIT3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.23], [10.0, 10.07], [14.0, 14.93], [16.0, 18.81], [26.0, 26.18], [33.0, 33.83], [35.0, 37.42], [39.0, 44.47], [47.0, 47.83], [57.0, 57.05], [59.0, 60.02], [68.0, 68.62], [70.0, 70.38], [73.0, 78.49], [81.0, 81.45], [86.0, 86.68], [91.0, 99.71], [103.0, 103.47], [108.0, 108.65], [115.0, 115.89], [117.0, 117.61], [118.0, 118.45], [122.0, 122.23], [132.0, 133.03], [135.0, 137.22], [145.0, 146.87], [150.0, 150.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 99.36, 50.81, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.34, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 0.07, 0.93, 2.81, 0.18, 0.83, 2.42, 5.47, 0.83, 0.05, 1.02, 0.62, 0.38, 5.49, 0.45, 0.68, 8.71, 0.47, 0.65, 0.89, 0.61, 0.45, 0.23, 1.03, 2.22, 1.87, 0.65]} \ No newline at end of file diff --git a/annotations_1/Uz8w8WHmWMI_filtered.json b/annotations_1/Uz8w8WHmWMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8cebce55cd0c2fc13ce71431212d7393421a266 --- /dev/null +++ b/annotations_1/Uz8w8WHmWMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.39], [10.0, 26.81], [33.0, 32.8], [43.0, 43.12], [46.0, 47.34], [50.0, 49.94], [53.0, 53.32], [59.0, 59.29], [63.0, 64.44], [65.0, 66.66], [83.0, 83.4], [113.0, 113.49], [116.0, 119.69], [122.0, 127.89], [144.0, 143.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 29.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.84, 29.32, 0.0], "audiomae_on_audioset": [null, [["music", 77.95], ["funk", 1.48], ["boing", 1.45]], null, null, null, null, null, null, null, null, null, null, [["moo", 27.86], ["cattle, bovinae", 21.65], ["livestock, farm animals, working animals", 16.21]], [["speech", 58.22], ["sound effect", 6.28], ["music", 5.49]], null], "duration": [0.39, 16.81, -0.2, 0.12, 1.34, -0.06, 0.32, 0.29, 1.44, 1.66, 0.4, 0.49, 3.69, 5.89, -0.1]} \ No newline at end of file diff --git a/annotations_1/V-9fQTUix6I_filtered.json b/annotations_1/V-9fQTUix6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17455936c32941e3703be368c77a07f6cbd00f30 --- /dev/null +++ b/annotations_1/V-9fQTUix6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.89], [14.0, 16.92], [20.0, 20.88], [25.0, 25.64], [32.0, 41.18], [46.0, 51.6], [58.0, 61.92], [64.0, 66.26], [66.0, 66.43], [69.0, 74.75], [81.0, 88.86], [93.0, 93.8], [98.0, 102.63], [103.0, 103.15], [109.0, 110.08], [111.0, 115.67], [117.0, 133.0], [141.0, 143.06], [144.0, 150.26], [160.0, 165.4], [166.0, 165.94], [166.0, 166.29], [169.0, 170.87], [173.0, 179.68]], "keep_status": [true, false, false, false, true, true, false, false, false, false, true, false, false, false, false, true, true, false, true, true, false, false, false, true], "silence_prob": [30.62, 32.88, 0.0, 0.0, 30.29, 31.59, 31.17, 32.97, 0.0, 32.19, 31.46, 0.0, 36.79, 0.0, 0.0, 34.45, 31.32, 34.12, 32.98, 30.86, 0.0, 0.0, 0.0, 30.5], "audiomae_on_audioset": [[["wild animals", 23.65], ["animal", 18.3], ["speech", 14.35]], [["speech", 35.3], ["music", 31.55], ["groan", 15.24]], null, null, [["speech", 45.46], ["vehicle", 8.56], ["grunt", 6.95]], [["music", 35.0], ["moo", 12.06], ["cattle, bovinae", 10.41]], [["music", 64.46], ["groan", 14.49], ["speech", 3.62]], [["music", 68.96], ["guitar", 5.14], ["plucked string instrument", 4.13]], null, [["music", 63.31], ["speech", 4.78], ["boing", 4.04]], [["music", 37.81], ["motorcycle", 7.06], ["moo", 4.26]], null, [["speech", 25.55], ["sidetone", 23.85], ["music", 22.77]], null, null, [["music", 36.23], ["speech", 24.64], ["sidetone", 5.01]], [["speech", 28.63], ["music", 28.14], ["hum", 9.24]], [["music", 67.71], ["rock music", 2.67], ["musical instrument", 1.93]], [["music", 59.21], ["theremin", 4.66], ["speech", 2.94]], [["music", 31.57], ["explosion", 17.8], ["hum", 13.84]], null, null, null, [["music", 28.22], ["speech", 8.17], ["groan", 5.51]]], "duration": [3.89, 2.92, 0.88, 0.64, 9.18, 5.6, 3.92, 2.26, 0.43, 5.75, 7.86, 0.8, 4.63, 0.15, 1.08, 4.67, 16.0, 2.06, 6.26, 5.4, -0.06, 0.29, 1.87, 6.68]} \ No newline at end of file diff --git a/annotations_1/V-hOCaVISok_filtered.json b/annotations_1/V-hOCaVISok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b80d0558cc28b346afb01b7805f07151f9315401 --- /dev/null +++ b/annotations_1/V-hOCaVISok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 39.75], [47.0, 55.05], [60.0, 85.94], [87.0, 94.56], [96.0, 96.42], [103.0, 104.97], [106.0, 106.2], [109.0, 109.85], [111.0, 111.6], [113.0, 115.72], [118.0, 118.45], [119.0, 123.53], [124.0, 125.83], [127.0, 132.6], [134.0, 133.74], [135.0, 137.24], [138.0, 140.81], [142.0, 141.94], [144.0, 156.57]], "keep_status": [true, false, true, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true], "silence_prob": [28.39, 28.32, 28.25, 40.17, 0.0, 0.0, 0.0, 0.0, 0.0, 47.9, 0.0, 50.81, 0.0, 56.03, 0.0, 41.52, 39.22, 0.0, 37.81], "audiomae_on_audioset": [[["music", 57.14], ["throbbing", 3.39], ["hum", 3.11]], [["speech", 72.36], ["music", 5.06], ["whip", 1.7]], [["speech", 25.18], ["music", 11.47], ["whale vocalization", 8.65]], [["music", 19.05], ["hum", 8.66], ["gasp", 7.58]], null, null, null, null, null, [["speech", 29.14], ["hum", 23.8], ["mains hum", 10.68]], null, null, null, null, null, [["mains hum", 46.82], ["hum", 24.3], ["frog", 3.25]], [["hum", 29.73], ["music", 12.6], ["throbbing", 10.93]], null, [["gasp", 27.97], ["hum", 22.65], ["whimper", 7.68]]], "duration": [15.75, 8.05, 25.94, 7.56, 0.42, 1.97, 0.2, 0.85, 0.6, 2.72, 0.45, 4.53, 1.83, 5.6, -0.26, 2.24, 2.81, -0.06, 12.57]} \ No newline at end of file diff --git a/annotations_1/V-mlZvBRoOQ_filtered.json b/annotations_1/V-mlZvBRoOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9bbe5faddbdb6d740b0767221d99b21e2d62d45 --- /dev/null +++ b/annotations_1/V-mlZvBRoOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 17.41], [21.0, 21.51], [22.0, 24.58], [27.0, 33.83], [35.0, 35.53], [37.0, 37.18], [39.0, 40.0], [41.0, 41.62], [42.0, 41.98], [43.0, 43.01], [43.0, 47.66], [50.0, 50.18], [50.0, 51.24], [53.0, 53.55], [54.0, 55.51], [57.0, 58.31], [63.0, 66.43], [67.0, 67.68], [69.0, 69.5], [71.0, 71.56], [73.0, 74.38], [76.0, 77.19], [78.0, 78.7], [79.0, 80.01], [80.0, 81.28], [82.0, 82.71], [84.0, 84.91], [88.0, 88.57], [91.0, 92.03], [92.0, 92.96], [93.0, 95.98], [97.0, 97.19], [99.0, 98.95], [100.0, 100.3], [101.0, 101.97], [103.0, 104.38], [105.0, 108.35], [109.0, 112.35], [116.0, 117.68], [118.0, 118.93], [119.0, 119.85], [123.0, 125.54], [127.0, 128.26], [130.0, 131.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.57, 0.0, 64.97, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.9, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 91.98, 0.0, 0.0, 0.0, 60.23, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 76.97], ["fart", 4.15], ["horse", 3.52]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.47], ["speech", 15.17], ["marimba, xylophone", 7.82]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.41, 0.51, 2.58, 6.83, 0.53, 0.18, 1.0, 0.62, -0.02, 0.01, 4.66, 0.18, 1.24, 0.55, 1.51, 1.31, 3.43, 0.68, 0.5, 0.56, 1.38, 1.19, 0.7, 1.01, 1.28, 0.71, 0.91, 0.57, 1.03, 0.96, 2.98, 0.19, -0.05, 0.3, 0.97, 1.38, 3.35, 3.35, 1.68, 0.93, 0.85, 2.54, 1.26, 1.7]} \ No newline at end of file diff --git a/annotations_1/V-vgoh3ukPc_filtered.json b/annotations_1/V-vgoh3ukPc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac4f06b81e43b938573dcba3003aeecee0966721 --- /dev/null +++ b/annotations_1/V-vgoh3ukPc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 20.6], [21.0, 25.93], [27.0, 33.15], [35.0, 35.46], [36.0, 43.66], [44.0, 45.23], [46.0, 47.43], [48.0, 52.52], [53.0, 54.06], [55.0, 56.56], [60.0, 61.13], [62.0, 63.17], [69.0, 69.62], [75.0, 84.5], [88.0, 101.41], [109.0, 111.75], [117.0, 134.6], [137.0, 137.67], [143.0, 143.77], [146.0, 146.38], [149.0, 148.86], [152.0, 153.3], [159.0, 161.97]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [34.22, 34.17, 33.29, 0.0, 34.16, 0.0, 0.0, 42.6, 0.0, 0.0, 0.0, 0.0, 0.0, 49.92, 33.3, 30.61, 30.56, 0.0, 0.0, 0.0, 0.0, 0.0, 32.4], "audiomae_on_audioset": [[["music", 58.66], ["drum machine", 13.17], ["synthesizer", 5.39]], [["music", 67.68], ["synthesizer", 11.42], ["musical instrument", 3.99]], [["music", 28.22], ["thunk", 18.31], ["hum", 5.68]], null, [["music", 19.59], ["speech", 18.65], ["hum", 11.37]], null, null, [["music", 56.64], ["speech", 18.35], ["hum", 5.79]], null, null, null, null, null, [["music", 62.94], ["didgeridoo", 7.43], ["speech", 4.01]], [["music", 82.71], ["throbbing", 2.32], ["sampler", 1.0]], [["music", 35.87], ["boing", 8.43], ["whack, thwack", 7.47]], [["music", 77.47], ["fart", 3.05], ["whack, thwack", 1.74]], null, null, null, null, null, [["thunk", 61.3], ["music", 31.03], ["whack, thwack", 2.14]]], "duration": [12.6, 4.93, 6.15, 0.46, 7.66, 1.23, 1.43, 4.52, 1.06, 1.56, 1.13, 1.17, 0.62, 9.5, 13.41, 2.75, 17.6, 0.67, 0.77, 0.38, -0.14, 1.3, 2.97]} \ No newline at end of file diff --git a/annotations_1/V022pMeqRjA_filtered.json b/annotations_1/V022pMeqRjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ceca115e982266f2c539d7681d485e764422f4e --- /dev/null +++ b/annotations_1/V022pMeqRjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 48.02], [49.0, 50.68], [57.0, 57.32], [57.0, 75.0], [76.0, 81.99], [84.0, 90.98], [91.0, 91.03], [92.0, 130.82], [134.0, 134.97], [135.0, 136.21]], "keep_status": [false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.32, 31.85, 36.91, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 46.81], ["hum", 15.63], ["mains hum", 7.18]], [["vehicle", 16.81], ["buzz", 12.17], ["car", 7.27]], [["hum", 38.72], ["mains hum", 38.65], ["music", 3.92]], null, null, null, null], "duration": [0.02, 1.68, 0.32, 18.0, 5.99, 6.98, 0.03, 38.82, 0.97, 1.21]} \ No newline at end of file diff --git a/annotations_1/V11YeYfaxv0_filtered.json b/annotations_1/V11YeYfaxv0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2a4af2671acf3f2d058045a7d942c8d0c20775b --- /dev/null +++ b/annotations_1/V11YeYfaxv0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 75.37], [77.0, 84.13], [87.0, 95.57], [100.0, 107.33], [109.0, 115.82], [118.0, 124.63], [126.0, 141.59], [145.0, 147.99], [149.0, 150.31], [151.0, 154.77], [155.0, 156.64], [157.0, 158.33]], "keep_status": [false, true, false, true, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 30.17, 28.96, 29.33, 29.02, 28.72, 29.38, 47.08, 0.0, 32.43, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 39.59], ["music", 23.88], ["groan", 4.49]], [["music", 62.97], ["throbbing", 8.84], ["cacophony", 4.48]], [["speech", 16.81], ["vehicle", 12.77], ["whale vocalization", 12.58]], [["speech", 17.74], ["music", 10.51], ["vehicle", 10.39]], [["speech", 60.16], ["vehicle", 12.95], ["car", 2.63]], [["music", 22.74], ["throbbing", 22.5], ["hum", 22.32]], [["speech", 55.25], ["music", 3.67], ["fly, housefly", 3.17]], null, [["hum", 49.84], ["music", 17.2], ["throbbing", 12.63]], null, null], "duration": [38.37, 7.13, 8.57, 7.33, 6.82, 6.63, 15.59, 2.99, 1.31, 3.77, 1.64, 1.33]} \ No newline at end of file diff --git a/annotations_1/V15AidhVCSw_filtered.json b/annotations_1/V15AidhVCSw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9085c52861c7b87f74ab28419bc9924e4038d463 --- /dev/null +++ b/annotations_1/V15AidhVCSw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.32], [7.0, 8.26], [9.0, 10.02], [11.0, 12.31], [14.0, 13.93], [15.0, 16.39], [17.0, 18.71], [20.0, 22.52], [26.0, 26.25], [27.0, 36.48], [38.0, 40.88], [44.0, 45.3], [47.0, 48.36], [56.0, 57.43], [61.0, 61.97], [64.0, 64.67], [67.0, 67.63], [85.0, 87.18], [88.0, 88.15], [91.0, 92.79], [93.0, 96.67], [97.0, 97.71], [98.0, 98.59], [99.0, 99.47], [101.0, 101.92], [103.0, 103.4], [104.0, 106.52], [108.0, 109.41], [110.0, 111.67], [116.0, 116.63], [119.0, 120.83], [123.0, 123.77], [126.0, 126.79], [136.0, 136.7], [137.0, 137.59], [139.0, 138.77], [140.0, 140.05], [141.0, 140.97], [142.0, 152.64], [159.0, 159.8], [167.0, 168.02], [169.0, 170.87], [173.0, 173.65], [176.0, 177.72], [180.0, 180.06], [180.0, 180.13], [180.0, 180.27], [183.0, 186.34], [189.0, 190.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 45.46, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.55, 0.0, 0.0, 67.38, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 69.09], ["music", 12.93], ["musical instrument", 3.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.32, 1.26, 1.02, 1.31, -0.07, 1.39, 1.71, 2.52, 0.25, 9.48, 2.88, 1.3, 1.36, 1.43, 0.97, 0.67, 0.63, 2.18, 0.15, 1.79, 3.67, 0.71, 0.59, 0.47, 0.92, 0.4, 2.52, 1.41, 1.67, 0.63, 1.83, 0.77, 0.79, 0.7, 0.59, -0.23, 0.05, -0.03, 10.64, 0.8, 1.02, 1.87, 0.65, 1.72, 0.06, 0.13, 0.27, 3.34, 1.48]} \ No newline at end of file diff --git a/annotations_1/V25QF11MwDU_filtered.json b/annotations_1/V25QF11MwDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cea59718890ff2929ba205fd5eeb08cb5a9e84b --- /dev/null +++ b/annotations_1/V25QF11MwDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[96.0, 98.17], [100.0, 100.53], [103.0, 104.19], [108.0, 108.7], [112.0, 115.55], [116.0, 117.15], [118.0, 122.89], [125.0, 125.86], [127.0, 127.48]], "keep_status": [true, false, false, false, true, false, false, false, false], "silence_prob": [29.22, 0.0, 0.0, 0.0, 28.95, 0.0, 36.28, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 50.72], ["whale vocalization", 9.8], ["music", 4.45]], null, null, null, [["music", 27.39], ["sonar", 22.34], ["hum", 12.83]], null, [["music", 41.27], ["hum", 28.41], ["mains hum", 5.04]], null, null], "duration": [2.17, 0.53, 1.19, 0.7, 3.55, 1.15, 4.89, 0.86, 0.48]} \ No newline at end of file diff --git a/annotations_1/V26hcTgoDLY_filtered.json b/annotations_1/V26hcTgoDLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95b66e61b3a9306d5cecb86bfd511bd3cc7dbbde --- /dev/null +++ b/annotations_1/V26hcTgoDLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.95], [23.0, 23.63], [24.0, 24.14], [27.0, 28.48], [33.0, 33.64], [35.0, 34.97], [36.0, 35.95], [38.0, 38.08], [39.0, 39.11], [41.0, 41.98], [42.0, 43.53], [44.0, 45.2], [46.0, 46.25], [47.0, 47.78], [49.0, 49.03], [50.0, 51.0], [52.0, 53.08], [56.0, 56.88], [57.0, 58.08], [59.0, 59.93], [60.0, 61.55], [63.0, 63.42], [64.0, 64.45], [65.0, 65.35], [67.0, 67.54], [69.0, 68.86], [70.0, 70.5], [75.0, 75.0], [76.0, 76.65], [77.0, 77.43], [79.0, 79.73], [81.0, 81.14], [83.0, 82.78], [84.0, 86.46], [89.0, 88.86], [90.0, 89.75], [97.0, 96.82], [101.0, 101.24], [107.0, 107.4], [112.0, 112.09], [114.0, 114.12], [117.0, 118.77], [122.0, 123.09], [133.0, 133.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["snicker", 26.33], ["chuckle, chortle", 18.49], ["speech", 13.79]], null, null, null, null, null, null, null, null, null, null], "duration": [-0.05, 0.63, 0.14, 1.48, 0.64, -0.03, -0.05, 0.08, 0.11, 0.98, 1.53, 1.2, 0.25, 0.78, 0.03, 1.0, 1.08, 0.88, 1.08, 0.93, 1.55, 0.42, 0.45, 0.35, 0.54, -0.14, 0.5, 0.0, 0.65, 0.43, 0.73, 0.14, -0.22, 2.46, -0.14, -0.25, -0.18, 0.24, 0.4, 0.09, 0.12, 1.77, 1.09, 0.68]} \ No newline at end of file diff --git a/annotations_1/V2RKM83CQ_A_filtered.json b/annotations_1/V2RKM83CQ_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ed21ad17e590c06e90bcbf4e45b4821d30e6226 --- /dev/null +++ b/annotations_1/V2RKM83CQ_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 15.77], [17.0, 18.64], [19.0, 19.94], [23.0, 68.2], [69.0, 69.57], [70.0, 72.1], [75.0, 78.36], [94.0, 118.49], [120.0, 134.59], [137.0, 137.86], [140.0, 140.58], [147.0, 147.87]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.74, 0.0, 0.0, 0.0, 0.0, 99.62, 82.97, 75.88, 73.82, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.41], ["didgeridoo", 13.08], ["speech", 7.8]], null, null, null, null, null, null, null, null, null, null, null], "duration": [10.77, 1.64, 0.94, 45.2, 0.57, 2.1, 3.36, 24.49, 14.59, 0.86, 0.58, 0.87]} \ No newline at end of file diff --git a/annotations_1/V300Gtn8NVs_filtered.json b/annotations_1/V300Gtn8NVs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bde7497971c19d402f6ef7345fa79746c9768c4 --- /dev/null +++ b/annotations_1/V300Gtn8NVs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.09], [13.0, 13.78], [17.0, 27.43], [28.0, 35.11], [35.0, 35.53], [36.0, 65.26], [70.0, 82.92], [85.0, 87.47], [93.0, 109.76], [110.0, 114.32], [116.0, 127.09], [127.0, 128.24], [133.0, 142.15], [143.0, 150.11], [151.0, 152.19], [153.0, 154.35], [156.0, 156.61]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.94, 45.49, 0.0, 34.17, 33.68, 33.21, 39.27, 60.32, 39.75, 0.0, 31.2, 32.34, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 40.26], ["mains hum", 22.87], ["hum", 20.63]], [["hum", 31.57], ["mains hum", 22.67], ["music", 19.79]], null, [["music", 31.33], ["electric shaver, electric razor", 18.9], ["speech", 9.49]], [["music", 37.43], ["hum", 27.05], ["mains hum", 13.07]], [["music", 57.65], ["didgeridoo", 6.97], ["musical instrument", 4.77]], [["music", 52.19], ["hum", 16.26], ["mains hum", 6.29]], null, [["music", 49.96], ["speech", 13.95], ["buzz", 7.02]], null, [["hum", 35.52], ["mains hum", 24.64], ["speech", 18.97]], [["music", 78.48], ["throbbing", 5.65], ["hum", 2.74]], null, null, null], "duration": [0.09, 0.78, 10.43, 7.11, 0.53, 29.26, 12.92, 2.47, 16.76, 4.32, 11.09, 1.24, 9.15, 7.11, 1.19, 1.35, 0.61]} \ No newline at end of file diff --git a/annotations_1/V32SkmBB1KU_filtered.json b/annotations_1/V32SkmBB1KU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..133131d73ed02c0e45645ebabeefcc27f2900e7b --- /dev/null +++ b/annotations_1/V32SkmBB1KU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.3], [8.0, 9.26], [11.0, 12.16], [13.0, 15.45], [19.0, 22.25], [23.0, 26.76], [29.0, 31.8], [35.0, 36.31], [38.0, 38.91], [40.0, 41.71], [42.0, 50.9], [63.0, 64.45], [66.0, 66.06], [67.0, 68.42], [69.0, 79.42], [82.0, 82.95], [84.0, 85.19], [88.0, 98.61], [100.0, 99.93], [101.0, 101.71], [103.0, 103.71], [105.0, 106.56], [107.0, 110.84], [112.0, 112.75], [114.0, 119.28], [121.0, 135.43], [137.0, 139.72], [140.0, 140.49], [142.0, 148.27], [152.0, 153.79], [156.0, 157.59], [160.0, 161.15], [165.0, 168.02], [169.0, 169.64], [173.0, 174.9], [177.0, 178.87], [183.0, 184.98], [186.0, 187.32], [189.0, 204.45], [207.0, 218.34], [221.0, 220.85], [221.0, 221.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [75.07, 0.0, 0.0, 87.92, 98.27, 96.42, 98.51, 0.0, 0.0, 0.0, 39.94, 0.0, 0.0, 0.0, 44.55, 0.0, 0.0, 78.89, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 74.29, 93.91, 96.66, 0.0, 94.22, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 32.75, 35.42, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 67.18], ["bleat", 9.14], ["livestock, farm animals, working animals", 3.76]], null, null, null, [["music", 74.1], ["musical instrument", 2.89], ["cello", 2.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 65.81], ["theremin", 6.21], ["cello", 5.06]], [["music", 76.28], ["theremin", 6.66], ["ambient music", 2.17]], null, null], "duration": [2.3, 1.26, 1.16, 2.45, 3.25, 3.76, 2.8, 1.31, 0.91, 1.71, 8.9, 1.45, 0.06, 1.42, 10.42, 0.95, 1.19, 10.61, -0.07, 0.71, 0.71, 1.56, 3.84, 0.75, 5.28, 14.43, 2.72, 0.49, 6.27, 1.79, 1.59, 1.15, 3.02, 0.64, 1.9, 1.87, 1.98, 1.32, 15.45, 11.34, -0.15, 0.0]} \ No newline at end of file diff --git a/annotations_1/V3Gnq8VFai4_filtered.json b/annotations_1/V3Gnq8VFai4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fcb196bb1d87885c6881eb98260e598ebf792ec --- /dev/null +++ b/annotations_1/V3Gnq8VFai4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.44], [3.0, 11.4], [13.0, 14.08], [24.0, 24.56], [29.0, 29.54], [30.0, 31.48], [35.0, 36.76], [38.0, 40.05], [43.0, 100.09], [102.0, 143.7], [151.0, 151.24], [152.0, 155.76], [157.0, 158.25], [159.0, 160.08], [164.0, 164.35], [168.0, 171.19], [174.0, 176.47], [177.0, 178.48], [182.0, 188.23], [189.0, 204.2], [205.0, 207.27], [210.0, 212.45], [218.0, 231.48], [232.0, 232.9], [234.0, 233.93], [235.0, 235.82], [239.0, 240.11], [243.0, 244.32], [248.0, 250.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.39, 0.0, 0.0, 0.0, 0.0, 0.0, 63.1, 0.0, 0.0, 0.0, 29.03, 0.0, 0.0, 0.0, 31.07, 35.15, 0.0, 28.8, 29.04, 28.78, 28.58, 29.07, 0.0, 0.0, 0.0, 0.0, 0.0, 29.54], "audiomae_on_audioset": [null, [["hum", 50.72], ["throbbing", 32.95], ["mains hum", 3.97]], null, null, null, null, null, null, null, null, null, [["hum", 21.32], ["music", 18.07], ["mains hum", 15.34]], null, null, null, [["hum", 31.45], ["mains hum", 27.16], ["throbbing", 26.67]], [["music", 61.35], ["musical instrument", 6.64], ["synthesizer", 4.07]], null, [["music", 41.92], ["throbbing", 29.95], ["hum", 5.11]], [["speech", 54.5], ["music", 21.55], ["buzz", 8.32]], [["music", 33.16], ["vehicle", 16.5], ["electronic music", 4.94]], [["zipper (clothing)", 21.34], ["music", 17.56], ["boom", 17.11]], [["music", 48.69], ["speech", 28.04], ["explosion", 1.82]], null, null, null, null, null, [["cattle, bovinae", 33.74], ["moo", 26.95], ["speech", 12.27]]], "duration": [0.44, 8.4, 1.08, 0.56, 0.54, 1.48, 1.76, 2.05, 57.09, 41.7, 0.24, 3.76, 1.25, 1.08, 0.35, 3.19, 2.47, 1.48, 6.23, 15.2, 2.27, 2.45, 13.48, 0.9, -0.07, 0.82, 1.11, 1.32, 2.01]} \ No newline at end of file diff --git a/annotations_1/V3Tlo0EutEQ_filtered.json b/annotations_1/V3Tlo0EutEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b887b7e0ba6fb53ea8b52933d5d3f85d52bd8c8 --- /dev/null +++ b/annotations_1/V3Tlo0EutEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.52], [23.0, 32.8], [33.0, 33.59], [38.0, 45.84], [49.0, 55.95], [62.0, 62.24], [64.0, 90.64], [95.0, 95.84], [110.0, 109.85], [114.0, 114.47], [116.0, 116.23], [117.0, 117.96], [127.0, 128.76], [130.0, 130.37]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [34.2, 31.16, 0.0, 30.2, 29.55, 0.0, 30.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 69.06], ["hum", 10.46], ["mains hum", 6.75]], [["music", 76.4], ["speech", 5.99], ["whack, thwack", 3.31]], null, [["music", 44.05], ["speech", 8.85], ["fly, housefly", 8.7]], [["mosquito", 36.3], ["fly, housefly", 34.33], ["insect", 13.04]], null, [["livestock, farm animals, working animals", 26.76], ["cattle, bovinae", 24.15], ["moo", 18.27]], null, null, null, null, null, null, null], "duration": [9.52, 9.8, 0.59, 7.84, 6.95, 0.24, 26.64, 0.84, -0.15, 0.47, 0.23, 0.96, 1.76, 0.37]} \ No newline at end of file diff --git a/annotations_1/V3aM1IFedho_filtered.json b/annotations_1/V3aM1IFedho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..260dc8bc7ed1e590f6de9cec310754091177b5cc --- /dev/null +++ b/annotations_1/V3aM1IFedho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.56], [28.0, 28.31], [58.0, 58.9], [67.0, 71.76], [73.0, 73.4], [76.0, 76.71], [79.0, 80.18], [133.0, 138.06], [139.0, 140.09], [141.0, 141.61], [145.0, 146.64], [151.0, 151.36], [154.0, 154.75], [156.0, 158.55], [160.0, 161.76], [162.0, 163.54], [167.0, 168.4], [170.0, 173.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 83.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 0.31, 0.9, 4.76, 0.4, 0.71, 1.18, 5.06, 1.09, 0.61, 1.64, 0.36, 0.75, 2.55, 1.76, 1.54, 1.4, 3.45]} \ No newline at end of file diff --git a/annotations_1/V4UM9BrSqos_filtered.json b/annotations_1/V4UM9BrSqos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bf0cd1d4ad4e401e5deaaffc69a580fd8075423 --- /dev/null +++ b/annotations_1/V4UM9BrSqos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.85], [10.0, 10.37], [12.0, 12.93], [14.0, 15.18], [21.0, 22.84], [29.0, 29.73], [40.0, 45.15], [47.0, 47.66], [48.0, 49.1], [49.0, 51.78], [55.0, 56.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.8, 0.0, 0.0, 0.0, 0.0, 0.0, 63.64, 0.0, 0.0, 73.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [2.85, 0.37, 0.93, 1.18, 1.84, 0.73, 5.15, 0.66, 1.1, 2.78, 1.19]} \ No newline at end of file diff --git a/annotations_1/V5P-1Vedt5E_filtered.json b/annotations_1/V5P-1Vedt5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e782c6ca667df291dd98616a817a39ee8be7fad --- /dev/null +++ b/annotations_1/V5P-1Vedt5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.23], [16.0, 18.08], [19.0, 24.97], [34.0, 47.04], [49.0, 49.3], [51.0, 51.12], [53.0, 53.55], [60.0, 60.0], [66.0, 68.62], [78.0, 78.11], [83.0, 82.86], [87.0, 91.83], [94.0, 97.95], [102.0, 109.63], [110.0, 111.91], [113.0, 114.22], [116.0, 116.7], [119.0, 120.61], [124.0, 126.45], [128.0, 130.44], [135.0, 138.06], [141.0, 152.54], [154.0, 160.71], [166.0, 166.09], [167.0, 167.75], [170.0, 170.68], [177.0, 184.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 78.89, 57.56, 60.98, 0.0, 0.0, 0.0, 0.0, 56.18, 0.0, 0.0, 61.18, 77.03, 97.11, 0.0, 0.0, 0.0, 0.0, 99.98, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 98.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 2.08, 5.97, 13.04, 0.3, 0.12, 0.55, 0.0, 2.62, 0.11, -0.14, 4.83, 3.95, 7.63, 1.91, 1.22, 0.7, 1.61, 2.45, 2.44, 3.06, 11.54, 6.71, 0.09, 0.75, 0.68, 7.59]} \ No newline at end of file diff --git a/annotations_1/V5hfxgrLuoU_filtered.json b/annotations_1/V5hfxgrLuoU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f9b8f02b94bb460e2435fb1a63236bfe2149549 --- /dev/null +++ b/annotations_1/V5hfxgrLuoU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 22.17], [26.0, 27.08], [32.0, 50.13], [61.0, 67.14]], "keep_status": [false, false, true, false], "silence_prob": [95.23, 0.0, 30.01, 38.03], "audiomae_on_audioset": [null, null, [["hum", 21.1], ["music", 19.14], ["mains hum", 16.84]], [["hum", 48.91], ["speech", 14.51], ["throbbing", 9.59]]], "duration": [6.17, 1.08, 18.13, 6.14]} \ No newline at end of file diff --git a/annotations_1/V6B3elF2pYU_filtered.json b/annotations_1/V6B3elF2pYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e001f6ea9e46e383fdcdc68faf7380b6768cc0f --- /dev/null +++ b/annotations_1/V6B3elF2pYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.2], [7.0, 17.2], [18.0, 22.96], [26.0, 27.58], [30.0, 36.95], [38.0, 39.06], [40.0, 41.88], [43.0, 45.32], [46.0, 47.9], [51.0, 51.58], [54.0, 70.19], [71.0, 71.71], [72.0, 75.74], [79.0, 83.19], [88.0, 91.5], [93.0, 95.55], [96.0, 98.22], [101.0, 102.73], [108.0, 109.04], [111.0, 112.97], [114.0, 115.87], [118.0, 118.18], [120.0, 120.39], [122.0, 130.59], [132.0, 136.11], [139.0, 138.91], [141.0, 143.34], [147.0, 148.12], [149.0, 150.97]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [50.66, 46.5, 95.23, 0.0, 97.73, 0.0, 0.0, 99.36, 0.0, 0.0, 33.31, 0.0, 38.4, 43.87, 39.41, 53.22, 40.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.31, 36.04, 0.0, 51.77, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 51.29], ["guitar", 6.56], ["singing bowl", 6.38]], null, null, null, null, null, null, null, null, [["music", 51.22], ["hum", 22.9], ["throbbing", 10.65]], null, [["music", 42.76], ["synthesizer", 18.4], ["speech", 12.97]], [["music", 64.65], ["theremin", 3.46], ["hum", 3.4]], [["throbbing", 30.63], ["music", 26.77], ["hum", 19.86]], null, [["music", 46.74], ["hum", 6.15], ["ambient music", 5.52]], null, null, null, null, null, null, [["music", 51.06], ["electronic music", 8.99], ["ambient music", 6.9]], [["music", 47.38], ["ambient music", 9.67], ["theremin", 8.78]], null, null, null, null], "duration": [4.2, 10.2, 4.96, 1.58, 6.95, 1.06, 1.88, 2.32, 1.9, 0.58, 16.19, 0.71, 3.74, 4.19, 3.5, 2.55, 2.22, 1.73, 1.04, 1.97, 1.87, 0.18, 0.39, 8.59, 4.11, -0.09, 2.34, 1.12, 1.97]} \ No newline at end of file diff --git a/annotations_1/V6SMgd9L6Z0_filtered.json b/annotations_1/V6SMgd9L6Z0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ccf7cc171712f31b33b25e740c1ab0ce40eca3dc --- /dev/null +++ b/annotations_1/V6SMgd9L6Z0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.0], [19.0, 27.94], [30.0, 30.1], [35.0, 35.16], [35.0, 41.39], [45.0, 46.55], [50.0, 50.23], [50.0, 54.63], [55.0, 57.7], [59.0, 69.5], [70.0, 73.23], [78.0, 79.81], [86.0, 90.39], [94.0, 94.15], [100.0, 101.76], [103.0, 103.84], [104.0, 104.79], [105.0, 107.28], [108.0, 108.84], [112.0, 113.54], [115.0, 115.47], [120.0, 119.94], [126.0, 127.65], [129.0, 129.56], [130.0, 131.63], [133.0, 133.59], [143.0, 143.55], [146.0, 147.02], [151.0, 152.66], [157.0, 157.6], [160.0, 160.51]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.69, 31.48, 0.0, 0.0, 30.19, 0.0, 0.0, 31.24, 29.91, 30.22, 29.98, 0.0, 30.26, 0.0, 0.0, 0.0, 0.0, 30.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 59.66], ["synthesizer", 4.14], ["throbbing", 3.1]], [["music", 59.86], ["musical instrument", 6.61], ["carnatic music", 5.34]], null, null, [["music", 73.06], ["speech", 5.64], ["boing", 4.21]], null, null, [["music", 61.48], ["synthesizer", 5.85], ["speech", 3.47]], [["music", 45.07], ["speech", 19.78], ["didgeridoo", 8.05]], [["music", 75.99], ["fart", 6.93], ["boing", 3.2]], [["music", 54.03], ["singing", 3.04], ["guitar", 2.64]], null, [["music", 55.58], ["boing", 16.82], ["plop", 5.7]], null, null, null, null, [["livestock, farm animals, working animals", 47.56], ["cattle, bovinae", 24.72], ["moo", 10.72]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.0, 8.94, 0.1, 0.16, 6.39, 1.55, 0.23, 4.63, 2.7, 10.5, 3.23, 1.81, 4.39, 0.15, 1.76, 0.84, 0.79, 2.28, 0.84, 1.54, 0.47, -0.06, 1.65, 0.56, 1.63, 0.59, 0.55, 1.02, 1.66, 0.6, 0.51]} \ No newline at end of file diff --git a/annotations_1/V6WWK1gvpjc_filtered.json b/annotations_1/V6WWK1gvpjc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5838e527dfb8e6333ed2d9e282c055af86fd8dc6 --- /dev/null +++ b/annotations_1/V6WWK1gvpjc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.46], [36.0, 36.26], [52.0, 55.76], [64.0, 64.49], [65.0, 66.07], [72.0, 72.44], [75.0, 75.84], [79.0, 79.73], [84.0, 84.3], [85.0, 84.86], [85.0, 85.6], [87.0, 87.66], [89.0, 89.38], [90.0, 90.81], [93.0, 93.78], [97.0, 98.31], [99.0, 100.21], [101.0, 101.44], [107.0, 107.13], [109.0, 109.12], [114.0, 114.89], [115.0, 116.13], [121.0, 120.85], [129.0, 129.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 38.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 74.05], ["video game music", 5.79], ["quack", 3.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 0.26, 3.76, 0.49, 1.07, 0.44, 0.84, 0.73, 0.3, -0.14, 0.6, 0.66, 0.38, 0.81, 0.78, 1.31, 1.21, 0.44, 0.13, 0.12, 0.89, 1.13, -0.15, 0.44]} \ No newline at end of file diff --git a/annotations_1/V6xx32EGypQ_filtered.json b/annotations_1/V6xx32EGypQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53d4192607606e3c2702c3196844be012107f404 --- /dev/null +++ b/annotations_1/V6xx32EGypQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.24], [5.0, 4.56], [5.0, 4.6], [5.0, 5.31], [9.0, 9.24], [14.0, 19.11], [22.0, 22.52], [46.0, 46.01], [83.0, 85.29], [87.0, 87.74], [88.0, 90.95], [91.0, 92.08], [107.0, 109.92], [115.0, 117.1], [129.0, 132.02], [133.0, 133.22], [138.0, 137.89], [139.0, 139.8], [142.0, 142.94], [144.0, 144.53], [145.0, 144.96], [147.0, 148.2], [150.0, 150.52], [151.0, 152.02], [162.0, 162.36], [164.0, 163.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 37.71, 0.0, 0.0, 50.91, 0.0, 33.44, 0.0, 36.92, 32.65, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["fly, housefly", 29.12], ["mosquito", 28.48], ["insect", 14.02]], null, null, null, null, [["speech", 29.55], ["sidetone", 9.85], ["frog", 8.89]], null, [["music", 12.85], ["sidetone", 9.39], ["electric shaver, electric razor", 6.77]], [["cattle, bovinae", 19.36], ["speech", 16.8], ["radio", 15.54]], [["moo", 33.9], ["cattle, bovinae", 31.67], ["livestock, farm animals, working animals", 7.99]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, -0.44, -0.4, 0.31, 0.24, 5.11, 0.52, 0.01, 2.29, 0.74, 2.95, 1.08, 2.92, 2.1, 3.02, 0.22, -0.11, 0.8, 0.94, 0.53, -0.04, 1.2, 0.52, 1.02, 0.36, -0.1]} \ No newline at end of file diff --git a/annotations_1/V8M4lPWWr3o_filtered.json b/annotations_1/V8M4lPWWr3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce36da0f8a88767149cab78f951ad86ae6e4d799 --- /dev/null +++ b/annotations_1/V8M4lPWWr3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.27], [15.0, 44.05], [45.0, 57.13], [59.0, 60.57], [64.0, 64.25], [65.0, 64.81], [66.0, 66.18], [69.0, 70.01], [71.0, 81.23], [85.0, 86.07], [92.0, 93.46], [96.0, 98.79]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 56.03, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 49.22, 0.0, 0.0, 35.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 42.46], ["hum", 9.96], ["sidetone", 7.71]], null, null, [["music", 35.82], ["hum", 14.73], ["sidetone", 10.33]]], "duration": [1.27, 29.05, 12.13, 1.57, 0.25, -0.19, 0.18, 1.01, 10.23, 1.07, 1.46, 2.79]} \ No newline at end of file diff --git a/annotations_1/V99QCtwXKsI_filtered.json b/annotations_1/V99QCtwXKsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..922f9c0d72dbbd3331ffa977af7613e1f7307223 --- /dev/null +++ b/annotations_1/V99QCtwXKsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.66], [9.0, 9.41], [10.0, 10.99], [12.0, 12.38], [14.0, 14.42], [18.0, 18.15], [21.0, 29.81], [31.0, 31.48], [32.0, 51.75], [53.0, 53.18], [54.0, 57.01], [58.0, 59.63], [62.0, 61.86], [65.0, 66.23], [67.0, 71.34], [72.0, 72.57], [74.0, 74.95], [76.0, 79.24], [80.0, 80.6], [82.0, 82.61], [88.0, 89.34], [90.0, 92.62], [95.0, 96.06], [104.0, 104.23], [107.0, 106.93], [109.0, 109.7], [112.0, 112.92], [114.0, 114.37], [116.0, 116.16], [123.0, 126.1], [127.0, 127.75], [128.0, 129.56], [131.0, 136.85], [138.0, 139.19], [140.0, 141.47], [142.0, 144.26], [149.0, 149.08], [154.0, 155.36], [160.0, 159.9], [161.0, 161.35], [163.0, 164.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.43, 0.0, 50.02, 0.0, 95.37, 0.0, 0.0, 0.0, 51.18, 0.0, 0.0, 51.82, 0.0, 0.0, 0.0, 45.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.16, 0.0, 0.0, 95.23, 0.0, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 64.33], ["sidetone", 15.62], ["radio", 12.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 45.1], ["moo", 35.13], ["livestock, farm animals, working animals", 11.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.66, 0.41, 0.99, 0.38, 0.42, 0.15, 8.81, 0.48, 19.75, 0.18, 3.01, 1.63, -0.14, 1.23, 4.34, 0.57, 0.95, 3.24, 0.6, 0.61, 1.34, 2.62, 1.06, 0.23, -0.07, 0.7, 0.92, 0.37, 0.16, 3.1, 0.75, 1.56, 5.85, 1.19, 1.47, 2.26, 0.08, 1.36, -0.1, 0.35, 1.37]} \ No newline at end of file diff --git a/annotations_1/V9E9Nce1dC0_filtered.json b/annotations_1/V9E9Nce1dC0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eebb16008fe6dc5bee5995f1206a09607534a0e8 --- /dev/null +++ b/annotations_1/V9E9Nce1dC0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 47.16], [49.0, 49.05], [49.0, 57.91], [59.0, 59.8], [60.0, 61.4], [62.0, 62.78], [65.0, 67.59], [68.0, 69.87], [70.0, 70.95], [72.0, 72.99], [76.0, 76.69], [77.0, 80.77], [84.0, 84.79], [87.0, 87.13], [90.0, 92.72], [96.0, 97.6], [98.0, 98.17], [101.0, 101.98], [102.0, 102.37], [103.0, 104.63], [107.0, 108.51], [109.0, 126.5], [128.0, 129.63], [130.0, 133.07], [135.0, 135.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 48.91, 0.0, 0.0, 0.0, 54.1, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 62.78, 0.0], "audiomae_on_audioset": [null, null, [["speech", 79.04], ["sidetone", 6.47], ["fart", 2.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.16, 0.05, 8.91, 0.8, 1.4, 0.78, 2.59, 1.87, 0.95, 0.99, 0.69, 3.77, 0.79, 0.13, 2.72, 1.6, 0.17, 0.98, 0.37, 1.63, 1.51, 17.5, 1.63, 3.07, 0.99]} \ No newline at end of file diff --git a/annotations_1/V9GnOAfI4w4_filtered.json b/annotations_1/V9GnOAfI4w4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77d0dd0770eb92b27acae95d0b41f1f38922e9b1 --- /dev/null +++ b/annotations_1/V9GnOAfI4w4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.3], [12.0, 13.42], [18.0, 18.67], [20.0, 20.66], [23.0, 29.39], [33.0, 39.63], [54.0, 56.08], [72.0, 72.84], [75.0, 75.78], [77.0, 79.34], [83.0, 83.08], [90.0, 89.97], [90.0, 91.39], [93.0, 93.24], [102.0, 109.02], [110.0, 110.62], [114.0, 117.34], [120.0, 122.94], [123.0, 129.0], [132.0, 131.99], [135.0, 138.21], [141.0, 143.16]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, true], "silence_prob": [58.98, 0.0, 0.0, 0.0, 56.7, 31.22, 37.24, 0.0, 0.0, 38.93, 0.0, 0.0, 0.0, 0.0, 29.25, 0.0, 29.06, 29.41, 29.46, 0.0, 33.32, 31.3], "audiomae_on_audioset": [null, null, null, null, null, [["fly, housefly", 33.55], ["insect", 21.46], ["bee, wasp, etc.", 12.96]], [["speech", 41.49], ["didgeridoo", 18.13], ["music", 11.11]], null, null, [["fly, housefly", 14.33], ["livestock, farm animals, working animals", 11.2], ["insect", 9.93]], null, null, null, null, [["music", 41.57], ["didgeridoo", 9.63], ["whack, thwack", 5.64]], null, [["cattle, bovinae", 38.34], ["livestock, farm animals, working animals", 27.85], ["moo", 19.91]], [["music", 46.78], ["throbbing", 15.13], ["hum", 10.96]], [["music", 44.68], ["speech", 18.47], ["throbbing", 15.8]], null, [["speech", 46.0], ["music", 7.16], ["hum", 4.12]], [["whale vocalization", 24.02], ["didgeridoo", 21.09], ["music", 15.65]]], "duration": [4.3, 1.42, 0.67, 0.66, 6.39, 6.63, 2.08, 0.84, 0.78, 2.34, 0.08, -0.03, 1.39, 0.24, 7.02, 0.62, 3.34, 2.94, 6.0, -0.01, 3.21, 2.16]} \ No newline at end of file diff --git a/annotations_1/V9JniMBfW18_filtered.json b/annotations_1/V9JniMBfW18_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd2d7c7b21f4ae772e89cb5472922672bc4cff5e --- /dev/null +++ b/annotations_1/V9JniMBfW18_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.07], [11.0, 11.52], [26.0, 26.06], [32.0, 35.16], [37.0, 39.92], [42.0, 43.98], [45.0, 48.98], [50.0, 51.12], [53.0, 53.47], [58.0, 58.43], [60.0, 61.72], [65.0, 66.23], [68.0, 73.3], [77.0, 77.3], [78.0, 78.7], [106.0, 106.78], [108.0, 108.55], [114.0, 113.97], [115.0, 116.14]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.5, 72.16, 0.0, 48.39, 0.0, 0.0, 0.0, 0.0, 0.0, 54.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 23.37], ["throbbing", 10.34], ["fly, housefly", 8.77]], null, null, [["whale vocalization", 26.48], ["music", 10.42], ["hum", 6.4]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.07, 0.52, 0.06, 3.16, 2.92, 1.98, 3.98, 1.12, 0.47, 0.43, 1.72, 1.23, 5.3, 0.3, 0.7, 0.78, 0.55, -0.03, 1.14]} \ No newline at end of file diff --git a/annotations_1/V9mx4UV8DNc_filtered.json b/annotations_1/V9mx4UV8DNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1042995ab98ade40fc49507e2de73d0cb6d36890 --- /dev/null +++ b/annotations_1/V9mx4UV8DNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.6], [25.0, 67.09], [69.0, 68.93], [70.0, 78.26], [80.0, 84.59], [86.0, 90.31], [95.0, 99.13]], "keep_status": [false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 34.59, 31.77, 31.4, 35.0], "audiomae_on_audioset": [null, null, null, [["music", 35.32], ["hum", 29.75], ["throbbing", 10.31]], [["music", 41.95], ["hum", 16.2], ["mains hum", 9.89]], [["music", 48.65], ["scary music", 8.42], ["electronic music", 4.76]], [["music", 45.03], ["throbbing", 7.52], ["electronic music", 6.94]]], "duration": [0.6, 42.09, -0.07, 8.26, 4.59, 4.31, 4.13]} \ No newline at end of file diff --git a/annotations_1/VAaeEoQq6jY_filtered.json b/annotations_1/VAaeEoQq6jY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40256e170869e36096c7bfc6b1dfb284cfc60474 --- /dev/null +++ b/annotations_1/VAaeEoQq6jY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.16], [6.0, 5.93], [11.0, 13.29], [15.0, 17.44], [25.0, 25.68], [33.0, 33.08], [52.0, 53.23], [57.0, 61.06], [63.0, 62.97], [66.0, 66.14], [69.0, 69.62], [70.0, 70.95], [73.0, 72.81], [73.0, 75.3], [76.0, 75.79], [78.0, 79.57], [80.0, 80.79], [84.0, 87.49], [89.0, 89.07], [94.0, 94.42], [96.0, 95.99], [101.0, 101.41], [105.0, 105.33], [117.0, 118.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.21, 55.74, 0.0, 0.0, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 39.91, 0.0, 0.0, 0.0, 50.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 89.99], ["speech synthesizer", 1.89], ["radio", 1.68]], null, null, null, null, null, null, null, null, null, null], "duration": [0.16, -0.07, 2.29, 2.44, 0.68, 0.08, 1.23, 4.06, -0.03, 0.14, 0.62, 0.95, -0.19, 2.3, -0.21, 1.57, 0.79, 3.49, 0.07, 0.42, -0.01, 0.41, 0.33, 1.4]} \ No newline at end of file diff --git a/annotations_1/VAmXYYSt6TM_filtered.json b/annotations_1/VAmXYYSt6TM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9c4007a1ea854b5ad2dc09212b34bf8c97a95ef --- /dev/null +++ b/annotations_1/VAmXYYSt6TM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [8.0, 8.68], [13.0, 14.18], [18.0, 22.11], [24.0, 24.6], [25.0, 51.56], [53.0, 53.45], [55.0, 55.0], [57.0, 57.08], [62.0, 72.13], [73.0, 80.72], [84.0, 95.98], [98.0, 157.98], [162.0, 167.78], [168.0, 169.13], [172.0, 174.93], [176.0, 176.34], [179.0, 180.32], [182.0, 211.23], [214.0, 223.75], [224.0, 223.8], [224.0, 223.91], [225.0, 226.62]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, true, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 84.98, 0.0, 35.45, 0.0, 0.0, 0.0, 31.62, 46.68, 36.69, 0.0, 31.01, 0.0, 29.21, 0.0, 0.0, 29.06, 28.53, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 28.36], ["mains hum", 21.26], ["whale vocalization", 16.61]], null, null, null, [["music", 69.78], ["whale vocalization", 11.5], ["synthesizer", 2.29]], [["whale vocalization", 64.24], ["music", 28.18], ["synthesizer", 1.09]], [["music", 30.61], ["hum", 15.94], ["whale vocalization", 15.9]], null, [["music", 27.2], ["throbbing", 20.11], ["hum", 15.34]], null, [["music", 42.95], ["speech", 10.83], ["throbbing", 6.24]], null, null, [["music", 26.5], ["livestock, farm animals, working animals", 19.92], ["cattle, bovinae", 7.09]], [["music", 33.63], ["speech", 15.26], ["mains hum", 8.84]], null, null, null], "duration": [1.56, 0.68, 1.18, 4.11, 0.6, 26.56, 0.45, 0.0, 0.08, 10.13, 7.72, 11.98, 59.98, 5.78, 1.13, 2.93, 0.34, 1.32, 29.23, 9.75, -0.2, -0.09, 1.62]} \ No newline at end of file diff --git a/annotations_1/VAnkBQ7eWyc_filtered.json b/annotations_1/VAnkBQ7eWyc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f19903d1e7139cfd13fa334e38d0ebd3f012e31c --- /dev/null +++ b/annotations_1/VAnkBQ7eWyc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 54.35], [55.0, 67.88], [71.0, 102.95], [105.0, 108.01], [114.0, 120.72], [131.0, 131.7]], "keep_status": [false, true, false, true, false, false], "silence_prob": [30.37, 29.85, 0.0, 30.41, 29.19, 0.0], "audiomae_on_audioset": [[["music", 75.12], ["musical instrument", 8.32], ["synthesizer", 2.73]], [["music", 32.49], ["brass instrument", 21.48], ["musical instrument", 8.8]], null, [["mains hum", 24.64], ["hum", 22.09], ["didgeridoo", 5.87]], [["music", 27.63], ["theremin", 25.25], ["wind instrument, woodwind instrument", 21.07]], null], "duration": [20.35, 12.88, 31.95, 3.01, 6.72, 0.7]} \ No newline at end of file diff --git a/annotations_1/VBLIuICtHuo_filtered.json b/annotations_1/VBLIuICtHuo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98960acc2aad70c334cb0c54734418ddd2dd7aef --- /dev/null +++ b/annotations_1/VBLIuICtHuo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.48], [11.0, 11.3], [18.0, 18.23], [19.0, 25.83], [30.0, 32.07], [38.0, 39.14], [41.0, 41.98], [43.0, 84.45], [94.0, 96.84], [105.0, 110.78], [125.0, 128.12]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.25, 31.28, 0.0, 0.0, 0.0, 29.52, 31.24, 31.92], "audiomae_on_audioset": [null, null, null, [["music", 47.02], ["boing", 10.07], ["speech", 8.64]], [["music", 64.28], ["trombone", 4.78], ["didgeridoo", 3.69]], null, null, null, [["vehicle", 18.27], ["music", 11.77], ["car", 10.05]], [["livestock, farm animals, working animals", 48.94], ["cattle, bovinae", 22.55], ["moo", 19.25]], [["livestock, farm animals, working animals", 34.58], ["moo", 33.58], ["cattle, bovinae", 30.25]]], "duration": [0.48, 0.3, 0.23, 6.83, 2.07, 1.14, 0.98, 41.45, 2.84, 5.78, 3.12]} \ No newline at end of file diff --git a/annotations_1/VBTrQhEwFqA_filtered.json b/annotations_1/VBTrQhEwFqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b09a7ad86e3c0fb09f2e6c543484a2ed34fae330 --- /dev/null +++ b/annotations_1/VBTrQhEwFqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 28.66], [33.0, 33.4], [33.0, 33.44], [33.0, 33.49], [34.0, 37.45], [38.0, 39.14], [41.0, 42.26], [47.0, 52.12], [61.0, 71.54], [82.0, 95.23], [97.0, 120.99]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [28.81, 0.0, 0.0, 0.0, 66.15, 0.0, 0.0, 59.77, 29.89, 57.17, 31.25], "audiomae_on_audioset": [[["music", 26.06], ["hum", 18.63], ["rumble", 17.28]], null, null, null, null, null, null, null, [["music", 22.45], ["whack, thwack", 16.59], ["sound effect", 4.47]], null, [["music", 57.48], ["breaking", 9.91], ["speech", 5.73]]], "duration": [24.66, 0.4, 0.44, 0.49, 3.45, 1.14, 1.26, 5.12, 10.54, 13.23, 23.99]} \ No newline at end of file diff --git a/annotations_1/VC0PPBrYBco_filtered.json b/annotations_1/VC0PPBrYBco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68a3006cb51d47140fa26b0321b7ce1efc13ebb5 --- /dev/null +++ b/annotations_1/VC0PPBrYBco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.53], [14.0, 28.81], [33.0, 44.68], [46.0, 46.63], [48.0, 49.22], [51.0, 52.89], [54.0, 54.78], [58.0, 58.13], [61.0, 61.43], [62.0, 61.69], [64.0, 66.21], [67.0, 67.76], [71.0, 71.76], [74.0, 75.47], [114.0, 115.59], [117.0, 117.19], [120.0, 120.6], [124.0, 124.93], [126.0, 127.7], [128.0, 129.25], [130.0, 130.47], [131.0, 132.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.29, 33.98, 37.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 72.47], ["singing", 2.85], ["male singing", 1.13]], [["music", 90.44], ["singing", 1.07], ["soul music", 1.04]], [["music", 47.27], ["speech", 43.02], ["noise", 2.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.53, 14.81, 11.68, 0.63, 1.22, 1.89, 0.78, 0.13, 0.43, -0.31, 2.21, 0.76, 0.76, 1.47, 1.59, 0.19, 0.6, 0.93, 1.7, 1.25, 0.47, 1.29]} \ No newline at end of file diff --git a/annotations_1/VCJrgPb3y80_filtered.json b/annotations_1/VCJrgPb3y80_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81c972948a03576a165757d24d35d1ea104b5dde --- /dev/null +++ b/annotations_1/VCJrgPb3y80_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.84], [6.0, 6.39], [9.0, 11.01], [11.0, 12.39], [13.0, 20.06], [22.0, 24.34], [30.0, 31.94], [35.0, 38.62], [43.0, 43.28], [51.0, 51.02], [52.0, 53.67], [55.0, 55.58], [56.0, 58.26], [60.0, 64.17], [66.0, 66.58], [68.0, 69.26], [70.0, 71.58], [73.0, 74.93], [76.0, 77.48], [79.0, 80.23], [81.0, 83.81], [87.0, 93.36], [100.0, 100.41], [109.0, 110.29], [120.0, 128.82], [130.0, 131.48], [135.0, 148.96], [152.0, 153.37], [156.0, 157.57], [160.0, 168.15], [170.0, 174.55], [177.0, 179.95], [183.0, 188.28], [189.0, 194.1], [195.0, 199.76], [200.0, 204.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 79.94, 0.0, 96.42, 85.72, 0.0, 50.36, 0.0, 0.0, 0.0, 0.0, 39.04, 31.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.29, 94.37, 0.0, 0.0, 35.9, 0.0, 40.7, 0.0, 0.0, 100.0, 51.66, 99.1, 99.78, 93.45, 99.16, 62.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 19.27], ["speech", 15.59], ["chirp tone", 14.31]], [["fart", 40.26], ["music", 7.82], ["didgeridoo", 5.67]], null, null, null, null, null, null, null, null, null, null, [["speech", 72.15], ["sidetone", 21.02], ["noise", 0.73]], null, [["fart", 45.72], ["speech", 6.22], ["gasp", 4.29]], null, null, null, null, null, null, null, null, null], "duration": [1.84, 0.39, 2.01, 1.39, 7.06, 2.34, 1.94, 3.62, 0.28, 0.02, 1.67, 0.58, 2.26, 4.17, 0.58, 1.26, 1.58, 1.93, 1.48, 1.23, 2.81, 6.36, 0.41, 1.29, 8.82, 1.48, 13.96, 1.37, 1.57, 8.15, 4.55, 2.95, 5.28, 5.1, 4.76, 4.21]} \ No newline at end of file diff --git a/annotations_1/VCLL9aD-VKw_filtered.json b/annotations_1/VCLL9aD-VKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f1de797f19df875d2ad26ca6d627014291547d2 --- /dev/null +++ b/annotations_1/VCLL9aD-VKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.96], [5.0, 5.36], [9.0, 16.31], [18.0, 30.4], [33.0, 34.48], [35.0, 40.74], [41.0, 49.59], [50.0, 57.11], [58.0, 59.54], [61.0, 68.94], [70.0, 71.42], [72.0, 73.45], [77.0, 80.84], [81.0, 83.76], [85.0, 86.26], [87.0, 94.36], [95.0, 94.93], [95.0, 96.11], [98.0, 98.25], [99.0, 99.4], [101.0, 101.76], [103.0, 103.67], [104.0, 104.57], [106.0, 107.0], [108.0, 107.86], [109.0, 109.46], [109.0, 109.95], [111.0, 110.93], [121.0, 122.79], [124.0, 126.94], [129.0, 131.48], [132.0, 133.98], [134.0, 135.82], [138.0, 140.58], [141.0, 142.84], [144.0, 145.27]], "keep_status": [false, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.76, 28.85, 0.0, 37.39, 33.96, 46.97, 0.0, 48.31, 0.0, 0.0, 94.66, 44.12, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.85, 58.55, 0.0, 0.0, 96.04, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 25.81], ["speech", 13.12], ["foghorn", 12.84]], [["speech", 35.24], ["music", 22.84], ["vehicle", 13.19]], null, [["music", 33.1], ["theremin", 23.8], ["speech", 15.76]], [["music", 43.68], ["theremin", 17.36], ["hum", 8.45]], [["music", 65.39], ["synthesizer", 14.62], ["musical instrument", 4.09]], null, [["music", 54.41], ["synthesizer", 4.43], ["didgeridoo", 4.13]], null, null, null, [["flute", 30.21], ["speech", 27.68], ["wind instrument, woodwind instrument", 21.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 0.36, 7.31, 12.4, 1.48, 5.74, 8.59, 7.11, 1.54, 7.94, 1.42, 1.45, 3.84, 2.76, 1.26, 7.36, -0.07, 1.11, 0.25, 0.4, 0.76, 0.67, 0.57, 1.0, -0.14, 0.46, 0.95, -0.07, 1.79, 2.94, 2.48, 1.98, 1.82, 2.58, 1.84, 1.27]} \ No newline at end of file diff --git a/annotations_1/VCvOWhT1TiA_filtered.json b/annotations_1/VCvOWhT1TiA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8dcd419bedd308f1804a5af1c53ca6dda6eee025 --- /dev/null +++ b/annotations_1/VCvOWhT1TiA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.25], [5.0, 5.91], [7.0, 7.3], [31.0, 31.6], [45.0, 46.08], [47.0, 47.9], [49.0, 52.17], [106.0, 106.84], [114.0, 116.13], [121.0, 125.59]], "keep_status": [false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.48, 0.0, 30.07, 30.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 50.34], ["sidetone", 11.1], ["boing", 6.97]], [["music", 31.07], ["cattle, bovinae", 16.46], ["moo", 12.99]]], "duration": [1.25, 0.91, 0.3, 0.6, 1.08, 0.9, 3.17, 0.84, 2.13, 4.59]} \ No newline at end of file diff --git a/annotations_1/VD8UttNfU60_filtered.json b/annotations_1/VD8UttNfU60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce7140d48feb8fc76566cde5dc046d5794f5f126 --- /dev/null +++ b/annotations_1/VD8UttNfU60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [3.0, 3.92], [8.0, 9.44], [13.0, 14.12], [19.0, 18.71], [21.0, 21.2], [25.0, 25.25], [29.0, 29.22], [30.0, 30.91], [32.0, 33.45], [38.0, 38.4], [39.0, 40.19], [44.0, 45.0], [46.0, 47.02], [55.0, 54.78], [61.0, 62.43], [63.0, 64.64], [65.0, 66.65], [69.0, 68.88], [72.0, 72.27], [75.0, 75.54], [77.0, 77.68], [86.0, 87.17], [89.0, 89.13], [91.0, 92.38], [100.0, 101.41], [102.0, 102.12], [104.0, 106.14], [108.0, 119.16], [120.0, 119.92], [120.0, 121.74], [128.0, 129.79], [130.0, 135.55], [143.0, 144.75], [147.0, 148.0], [152.0, 152.22], [163.0, 164.76], [169.0, 169.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.91, 67.63, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 0.92, 1.44, 1.12, -0.29, 0.2, 0.25, 0.22, 0.91, 1.45, 0.4, 1.19, 1.0, 1.02, -0.22, 1.43, 1.64, 1.65, -0.12, 0.27, 0.54, 0.68, 1.17, 0.13, 1.38, 1.41, 0.12, 2.14, 11.16, -0.08, 1.74, 1.79, 5.55, 1.75, 1.0, 0.22, 1.76, 0.47]} \ No newline at end of file diff --git a/annotations_1/VDCoR_PxceY_filtered.json b/annotations_1/VDCoR_PxceY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..801db277bf383a839dcfcb1874a54a98b36350e0 --- /dev/null +++ b/annotations_1/VDCoR_PxceY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 19.35], [20.0, 45.08], [46.0, 72.91], [75.0, 76.99], [85.0, 109.44]], "keep_status": [false, true, true, false, true], "silence_prob": [41.28, 32.81, 31.24, 0.0, 28.75], "audiomae_on_audioset": [[["hum", 37.01], ["throbbing", 26.11], ["rumble", 8.94]], [["hum", 22.35], ["music", 22.22], ["rumble", 8.98]], [["music", 39.61], ["throbbing", 13.21], ["didgeridoo", 11.67]], null, [["hum", 16.75], ["throbbing", 15.55], ["music", 14.21]]], "duration": [8.35, 25.08, 26.91, 1.99, 24.44]} \ No newline at end of file diff --git a/annotations_1/VDwI61e2_6I_filtered.json b/annotations_1/VDwI61e2_6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbce78b561c31505bbb6e483a2726c7f66033fac --- /dev/null +++ b/annotations_1/VDwI61e2_6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.63], [15.0, 66.01], [72.0, 83.44], [84.0, 84.48], [85.0, 121.88], [122.0, 123.43]], "keep_status": [false, false, false, false, false, false], "silence_prob": [99.8, 0.0, 33.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 51.58], ["animal", 14.53], ["dog", 6.26]], null, null, null], "duration": [2.63, 51.01, 11.44, 0.48, 36.88, 1.43]} \ No newline at end of file diff --git a/annotations_1/VGcOGt-OV7s_filtered.json b/annotations_1/VGcOGt-OV7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b80209cc951fcf78bece281bc685186bc74e6a4 --- /dev/null +++ b/annotations_1/VGcOGt-OV7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.02], [14.0, 16.06], [20.0, 22.47], [23.0, 23.65], [25.0, 27.08], [36.0, 40.05], [58.0, 59.04], [63.0, 67.71], [74.0, 86.53], [91.0, 95.4], [96.0, 98.83]], "keep_status": [false, true, true, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 49.45, 44.69, 0.0, 44.93, 36.13, 0.0, 38.51, 32.02, 36.36, 46.02], "audiomae_on_audioset": [null, [["music", 35.96], ["throbbing", 11.14], ["hum", 9.61]], [["music", 17.24], ["hum", 13.02], ["boing", 8.07]], null, [["music", 51.05], ["synthesizer", 4.3], ["theremin", 3.97]], [["music", 61.05], ["electronic music", 6.07], ["hum", 5.23]], null, [["music", 34.21], ["speech", 32.18], ["hum", 8.18]], [["music", 54.23], ["hum", 8.09], ["throbbing", 7.86]], [["music", 18.98], ["boing", 16.2], ["ding", 13.94]], [["speech", 40.59], ["music", 34.22], ["thunk", 2.0]]], "duration": [1.02, 2.06, 2.47, 0.65, 2.08, 4.05, 1.04, 4.71, 12.53, 4.4, 2.83]} \ No newline at end of file diff --git a/annotations_1/VGhUlUHKv7s_filtered.json b/annotations_1/VGhUlUHKv7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3be30e1940c2d283a67d2e83b202546b4ce4d1e3 --- /dev/null +++ b/annotations_1/VGhUlUHKv7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.36], [15.0, 16.6], [19.0, 20.12], [27.0, 27.55], [28.0, 30.55], [44.0, 44.46], [51.0, 52.03], [58.0, 63.44], [66.0, 79.64], [82.0, 87.13], [89.0, 92.45], [94.0, 108.06], [111.0, 140.16], [148.0, 155.12], [159.0, 160.05], [161.0, 174.55], [177.0, 176.77], [181.0, 181.45]], "keep_status": [false, false, false, false, true, false, false, true, true, true, true, true, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 46.09, 0.0, 0.0, 29.15, 28.48, 28.65, 28.98, 28.41, 28.6, 29.09, 0.0, 29.35, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 39.39], ["speech", 15.09], ["hum", 8.92]], null, null, [["speech", 21.15], ["mosquito", 18.98], ["fly, housefly", 10.45]], [["speech", 21.57], ["music", 20.24], ["groan", 7.78]], [["music", 47.95], ["speech", 9.17], ["boing", 5.76]], [["civil defense siren", 13.23], ["music", 8.35], ["speech", 6.47]], [["speech", 28.2], ["music", 18.67], ["explosion", 6.74]], [["music", 32.18], ["speech", 29.77], ["groan", 10.29]], [["music", 16.02], ["speech", 13.72], ["animal", 7.88]], null, [["music", 28.42], ["speech", 12.54], ["boing", 11.38]], null, null], "duration": [0.36, 1.6, 1.12, 0.55, 2.55, 0.46, 1.03, 5.44, 13.64, 5.13, 3.45, 14.06, 29.16, 7.12, 1.05, 13.55, -0.23, 0.45]} \ No newline at end of file diff --git a/annotations_1/VHj96nAjRn0_filtered.json b/annotations_1/VHj96nAjRn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cff49513b9c4f7f9d28a9f3e3e43aa0b351d16fc --- /dev/null +++ b/annotations_1/VHj96nAjRn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 58.99], [59.0, 61.15], [62.0, 80.23], [81.0, 81.75], [83.0, 85.01], [89.0, 90.04]], "keep_status": [false, true, true, false, false, false], "silence_prob": [0.0, 48.19, 47.23, 0.0, 98.27, 0.0], "audiomae_on_audioset": [null, [["speech", 38.99], ["music", 13.56], ["hum", 6.22]], [["music", 36.87], ["hum", 9.45], ["singing bowl", 7.37]], null, null, null], "duration": [56.99, 2.15, 18.23, 0.75, 2.01, 1.04]} \ No newline at end of file diff --git a/annotations_1/VIA2wUCj36Q_filtered.json b/annotations_1/VIA2wUCj36Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1848945ed547d716c5d3c153ac6f005b8844c29b --- /dev/null +++ b/annotations_1/VIA2wUCj36Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.68], [7.0, 7.97], [10.0, 10.67], [15.0, 16.12], [30.0, 30.69], [35.0, 37.66], [46.0, 46.57], [55.0, 55.8], [61.0, 63.29], [69.0, 72.94], [77.0, 77.97], [80.0, 80.6], [85.0, 86.12], [88.0, 88.33], [91.0, 90.95], [99.0, 100.35], [104.0, 119.69], [142.0, 146.16], [147.0, 147.39], [147.0, 149.17], [152.0, 152.63], [154.0, 154.31], [157.0, 158.25], [172.0, 173.01], [174.0, 178.44], [184.0, 189.92]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.01, 0.0, 0.0, 31.98, 30.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.35, 30.31, 0.0, 31.5, 0.0, 0.0, 0.0, 0.0, 30.72, 30.73], "audiomae_on_audioset": [null, null, null, null, null, [["music", 60.0], ["musical instrument", 5.82], ["guitar", 3.76]], null, null, [["music", 51.05], ["carnatic music", 20.46], ["speech", 6.3]], [["music", 68.51], ["carnatic music", 7.61], ["musical instrument", 5.23]], null, null, null, null, null, null, [["music", 65.72], ["theremin", 13.4], ["musical instrument", 4.04]], [["music", 55.17], ["carnatic music", 8.84], ["theremin", 5.57]], null, [["music", 52.03], ["didgeridoo", 6.15], ["boing", 5.39]], null, null, null, null, [["music", 67.56], ["musical instrument", 5.22], ["carnatic music", 3.17]], [["music", 41.11], ["bleat", 14.61], ["sheep", 13.51]]], "duration": [0.68, 0.97, 0.67, 1.12, 0.69, 2.66, 0.57, 0.8, 2.29, 3.94, 0.97, 0.6, 1.12, 0.33, -0.05, 1.35, 15.69, 4.16, 0.39, 2.17, 0.63, 0.31, 1.25, 1.01, 4.44, 5.92]} \ No newline at end of file diff --git a/annotations_1/VILmrL5jP7s_filtered.json b/annotations_1/VILmrL5jP7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83e6c6eb921aa2a781e7a570cd9aa3b531f1e5a8 --- /dev/null +++ b/annotations_1/VILmrL5jP7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.56], [7.0, 11.65], [14.0, 16.28], [17.0, 20.36], [22.0, 22.0], [23.0, 24.48], [25.0, 28.73], [29.0, 39.36], [40.0, 55.46], [57.0, 60.3], [63.0, 67.63], [71.0, 71.52], [74.0, 87.25]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, true], "silence_prob": [0.0, 59.96, 99.05, 98.36, 0.0, 0.0, 70.58, 37.32, 40.75, 48.39, 35.59, 0.0, 38.08], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 53.51], ["music", 25.39], ["thunk", 4.96]], [["music", 12.2], ["speech", 12.15], ["hum", 11.5]], [["fart", 64.29], ["music", 12.72], ["speech", 3.65]], [["music", 20.75], ["mosquito", 16.45], ["hum", 4.58]], null, [["music", 36.85], ["synthesizer", 17.18], ["scary music", 7.47]]], "duration": [1.56, 4.65, 2.28, 3.36, 0.0, 1.48, 3.73, 10.36, 15.46, 3.3, 4.63, 0.52, 13.25]} \ No newline at end of file diff --git a/annotations_1/VJECUbUadpg_filtered.json b/annotations_1/VJECUbUadpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01e6ff4b6b853a30c89052de87a7a23fd104a87b --- /dev/null +++ b/annotations_1/VJECUbUadpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 39.97], [42.0, 172.03]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.97, 130.03]} \ No newline at end of file diff --git a/annotations_1/VJW2e8_cIfw_filtered.json b/annotations_1/VJW2e8_cIfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c87d2a3d9c3feeeed0f19ed76e32be0b252fdeab --- /dev/null +++ b/annotations_1/VJW2e8_cIfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 20.46], [24.0, 29.35], [30.0, 39.78], [44.0, 56.64], [57.0, 58.23], [60.0, 122.15], [123.0, 145.57], [147.0, 155.17]], "keep_status": [true, false, true, true, false, false, false, false], "silence_prob": [29.36, 29.24, 28.51, 29.17, 0.0, 0.0, 28.81, 32.61], "audiomae_on_audioset": [[["music", 23.72], ["speech", 16.29], ["whack, thwack", 6.78]], [["speech", 73.39], ["music", 12.7], ["hum", 2.62]], [["throbbing", 24.97], ["music", 17.34], ["hum", 15.24]], [["music", 26.41], ["whack, thwack", 14.37], ["speech", 12.06]], null, null, [["music", 65.27], ["buzz", 3.63], ["throbbing", 2.49]], [["mains hum", 44.41], ["hum", 43.58], ["throbbing", 4.01]]], "duration": [17.46, 5.35, 9.78, 12.64, 1.23, 62.15, 22.57, 8.17]} \ No newline at end of file diff --git a/annotations_1/VKl41s51JvE_filtered.json b/annotations_1/VKl41s51JvE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fbb4f07189658444546ee1dc3fc3e53ad2cd5c4 --- /dev/null +++ b/annotations_1/VKl41s51JvE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.75], [53.0, 55.93], [60.0, 66.24], [70.0, 70.63], [73.0, 74.28], [84.0, 84.59], [90.0, 90.78], [91.0, 92.62], [93.0, 94.24], [95.0, 95.49], [96.0, 96.84], [98.0, 107.7], [108.0, 128.43], [130.0, 131.77], [135.0, 151.66], [152.0, 153.45], [155.0, 163.92], [165.0, 167.16], [171.0, 171.48], [173.0, 173.64], [175.0, 175.64], [177.0, 177.57], [179.0, 180.08], [180.0, 182.53], [184.0, 185.19], [191.0, 190.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.46, 47.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.6, 29.99, 0.0, 55.67, 0.0, 63.21, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.15, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 54.36], ["dial tone", 11.86], ["sine wave", 8.74]], null, null, null, null, null, null, null, null, [["speech", 40.22], ["music", 26.71], ["sidetone", 12.82]], [["music", 45.89], ["speech", 17.55], ["sidetone", 13.19]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 2.93, 6.24, 0.63, 1.28, 0.59, 0.78, 1.62, 1.24, 0.49, 0.84, 9.7, 20.43, 1.77, 16.66, 1.45, 8.92, 2.16, 0.48, 0.64, 0.64, 0.57, 1.08, 2.53, 1.19, -0.08]} \ No newline at end of file diff --git a/annotations_1/VLm7BuSsFK8_filtered.json b/annotations_1/VLm7BuSsFK8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72a5a2f0b1ec5cda69150b081c25ffb180a3fc3b --- /dev/null +++ b/annotations_1/VLm7BuSsFK8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [7.0, 15.15], [17.0, 20.83], [23.0, 27.35], [28.0, 30.25], [32.0, 63.0], [65.0, 66.53], [68.0, 124.01], [126.0, 127.97], [130.0, 152.0], [153.0, 153.12]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 35.51, 50.21, 45.43, 39.09, 0.0, 0.0, 0.0, 0.0, 28.61, 0.0], "audiomae_on_audioset": [null, [["music", 49.02], ["throbbing", 19.58], ["hum", 11.8]], null, [["music", 25.12], ["hum", 23.59], ["throbbing", 20.69]], [["music", 39.22], ["hum", 22.3], ["throbbing", 10.96]], null, null, null, null, [["fireworks", 16.52], ["machine gun", 15.19], ["speech", 11.56]], null], "duration": [0.43, 8.15, 3.83, 4.35, 2.25, 31.0, 1.53, 56.01, 1.97, 22.0, 0.12]} \ No newline at end of file diff --git a/annotations_1/VM8ViJw7uNs_filtered.json b/annotations_1/VM8ViJw7uNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cedf83a4abb3771b9a52903ddac852e8e642c363 --- /dev/null +++ b/annotations_1/VM8ViJw7uNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.27], [17.0, 34.57], [35.0, 35.5], [37.0, 37.47], [38.0, 39.31], [43.0, 44.0], [45.0, 49.11], [50.0, 50.36], [60.0, 61.94], [63.0, 66.68], [67.0, 67.88], [70.0, 71.1], [74.0, 74.83], [75.0, 77.04], [79.0, 79.02], [81.0, 81.89], [84.0, 85.11], [91.0, 91.1], [93.0, 95.07], [97.0, 97.39], [100.0, 103.25], [104.0, 106.3], [108.0, 107.92], [109.0, 108.78], [109.0, 109.97], [111.0, 111.13], [114.0, 114.71], [117.0, 122.54], [123.0, 127.33], [130.0, 130.23], [136.0, 137.39], [138.0, 138.3], [139.0, 139.13], [140.0, 140.76], [143.0, 150.35], [151.0, 152.47], [154.0, 158.14], [161.0, 161.57], [175.0, 179.24], [181.0, 182.55], [183.0, 184.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 0.0, 68.8, 0.0, 0.0, 0.0, 65.79, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 92.15, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 76.37, 0.0, 94.07, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 17.57, 0.5, 0.47, 1.31, 1.0, 4.11, 0.36, 1.94, 3.68, 0.88, 1.1, 0.83, 2.04, 0.02, 0.89, 1.11, 0.1, 2.07, 0.39, 3.25, 2.3, -0.08, -0.22, 0.97, 0.13, 0.71, 5.54, 4.33, 0.23, 1.39, 0.3, 0.13, 0.76, 7.35, 1.47, 4.14, 0.57, 4.24, 1.55, 1.33]} \ No newline at end of file diff --git a/annotations_1/VNLN5xyxwAY_filtered.json b/annotations_1/VNLN5xyxwAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c36e6795a2c3b3c6227d47274154ebb56618f5f --- /dev/null +++ b/annotations_1/VNLN5xyxwAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 54.01], [56.0, 58.68], [60.0, 66.8], [70.0, 71.76], [81.0, 89.04], [89.0, 98.73], [99.0, 98.76], [101.0, 101.19], [104.0, 104.65], [106.0, 112.28], [117.0, 118.79], [126.0, 132.44], [133.0, 133.78], [135.0, 134.96], [135.0, 135.58], [138.0, 142.21], [146.0, 145.74], [147.0, 147.04], [147.0, 147.92], [149.0, 149.18], [150.0, 151.31], [151.0, 152.56], [154.0, 154.08], [155.0, 155.58], [157.0, 158.11], [162.0, 162.23], [163.0, 163.43]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.89, 58.47, 45.59, 0.0, 37.0, 35.76, 0.0, 0.0, 0.0, 33.38, 0.0, 32.45, 0.0, 0.0, 0.0, 36.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 66.95], ["theremin", 11.29], ["didgeridoo", 3.16]], null, [["whale vocalization", 75.88], ["noise", 6.89], ["music", 4.76]], [["animal", 19.93], ["sheep", 8.8], ["bleat", 8.61]], null, null, null, [["music", 27.45], ["whale vocalization", 19.7], ["mains hum", 12.95]], null, [["music", 32.43], ["mains hum", 16.72], ["whale vocalization", 10.55]], null, null, null, [["cattle, bovinae", 25.59], ["livestock, farm animals, working animals", 17.98], ["moo", 15.65]], null, null, null, null, null, null, null, null, null, null, null], "duration": [4.01, 2.68, 6.8, 1.76, 8.04, 9.73, -0.24, 0.19, 0.65, 6.28, 1.79, 6.44, 0.78, -0.04, 0.58, 4.21, -0.26, 0.04, 0.92, 0.18, 1.31, 1.56, 0.08, 0.58, 1.11, 0.23, 0.43]} \ No newline at end of file diff --git a/annotations_1/VOk7mIZRPzI_filtered.json b/annotations_1/VOk7mIZRPzI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..857b31ad49dc42d7193256aeca79a3fedc9fe221 --- /dev/null +++ b/annotations_1/VOk7mIZRPzI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 55.78], [58.0, 58.8], [61.0, 60.88], [62.0, 90.48], [93.0, 136.58], [141.0, 142.74], [144.0, 145.05], [147.0, 149.25], [151.0, 160.74], [161.0, 160.81], [161.0, 160.95]], "keep_status": [true, false, false, true, false, false, false, false, true, false, false], "silence_prob": [31.4, 0.0, 0.0, 30.4, 0.0, 0.0, 0.0, 66.51, 39.82, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 28.66], ["music", 19.25], ["throbbing", 17.65]], null, null, [["music", 50.35], ["musical instrument", 9.71], ["synthesizer", 9.38]], null, null, null, null, [["hum", 22.66], ["music", 21.66], ["gong", 10.83]], null, null], "duration": [14.78, 0.8, -0.12, 28.48, 43.58, 1.74, 1.05, 2.25, 9.74, -0.19, -0.05]} \ No newline at end of file diff --git a/annotations_1/VPOd_Y2qFJk_filtered.json b/annotations_1/VPOd_Y2qFJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad895d93eae3d6a8c3e3df1527a6dbc61ba4cf12 --- /dev/null +++ b/annotations_1/VPOd_Y2qFJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.92], [6.0, 8.73], [10.0, 12.92], [15.0, 16.36], [18.0, 19.21], [20.0, 20.88], [22.0, 23.35], [25.0, 26.52], [28.0, 29.78], [30.0, 32.24], [34.0, 35.18], [38.0, 40.32], [44.0, 44.34], [45.0, 47.02], [49.0, 51.29], [60.0, 60.25], [70.0, 69.85], [70.0, 70.83], [72.0, 72.79], [77.0, 78.33], [79.0, 80.08], [84.0, 85.36], [88.0, 99.98], [102.0, 103.71], [105.0, 112.58], [113.0, 116.01], [120.0, 124.92], [129.0, 128.7], [131.0, 131.01]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 44.57, 45.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.83, 0.0, 59.96, 0.0, 40.64, 50.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.4, 0.0, 28.87, 28.89, 29.3, 0.0, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 15.51], ["music", 13.75], ["insect", 12.76]], [["speech", 34.33], ["music", 19.12], ["singing bowl", 18.56]], null, null, null, null, null, null, [["music", 58.21], ["speech", 23.18], ["hum", 2.75]], null, null, null, [["music", 47.04], ["speech", 30.71], ["hum", 1.97]], null, null, null, null, null, null, null, null, [["music", 32.36], ["boing", 13.98], ["speech", 8.59]], null, [["music", 41.31], ["speech", 27.76], ["crowd", 8.56]], [["cattle, bovinae", 25.55], ["speech", 17.54], ["moo", 14.01]], [["crowd", 45.79], ["speech", 13.17], ["cheering", 11.73]], null, null], "duration": [0.92, 2.73, 2.92, 1.36, 1.21, 0.88, 1.35, 1.52, 1.78, 2.24, 1.18, 2.32, 0.34, 2.02, 2.29, 0.25, -0.15, 0.83, 0.79, 1.33, 1.08, 1.36, 11.98, 1.71, 7.58, 3.01, 4.92, -0.3, 0.01]} \ No newline at end of file diff --git a/annotations_1/VPXd9ANX3Bw_filtered.json b/annotations_1/VPXd9ANX3Bw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..415ff0c281c219bd8a0aa621bcef28f91a9c27ca --- /dev/null +++ b/annotations_1/VPXd9ANX3Bw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.45], [8.0, 8.01], [12.0, 17.54], [19.0, 23.4], [25.0, 29.32], [30.0, 53.54], [57.0, 59.95], [62.0, 72.84], [74.0, 76.6], [78.0, 80.47], [82.0, 82.31], [83.0, 83.89], [86.0, 90.0], [91.0, 91.62], [97.0, 97.29], [106.0, 107.25], [112.0, 112.33]], "keep_status": [false, false, true, false, false, false, false, false, true, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 36.72, 31.68, 30.5, 30.49, 31.48, 30.45, 30.85, 33.05, 0.0, 0.0, 31.57, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["noise", 24.38], ["music", 9.3], ["buzzer", 6.05]], [["music", 27.44], ["ding", 24.84], ["clang", 24.16]], [["music", 64.72], ["explosion", 5.33], ["burst, pop", 3.56]], [["music", 49.49], ["whack, thwack", 18.89], ["whip", 4.56]], [["music", 62.49], ["didgeridoo", 5.62], ["musical instrument", 3.37]], [["music", 49.22], ["speech", 19.05], ["boing", 10.61]], [["music", 38.57], ["brass instrument", 5.95], ["trombone", 3.02]], [["music", 27.02], ["musical instrument", 4.18], ["dog", 4.04]], null, null, [["fart", 21.55], ["speech", 20.82], ["wail, moan", 10.66]], null, null, null, null], "duration": [0.45, 0.01, 5.54, 4.4, 4.32, 23.54, 2.95, 10.84, 2.6, 2.47, 0.31, 0.89, 4.0, 0.62, 0.29, 1.25, 0.33]} \ No newline at end of file diff --git a/annotations_1/VPaFRrTJZ4U_filtered.json b/annotations_1/VPaFRrTJZ4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7932284188891071454979c85e1287551bc33b9e --- /dev/null +++ b/annotations_1/VPaFRrTJZ4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.91], [12.0, 12.63], [13.0, 13.19], [14.0, 13.86], [18.0, 22.0], [49.0, 49.28], [49.0, 62.94], [86.0, 87.88], [107.0, 107.49], [121.0, 142.57]], "keep_status": [false, false, false, false, true, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.83, 0.0, 30.0, 0.0, 0.0, 29.95], "audiomae_on_audioset": [null, null, null, null, [["music", 53.99], ["carnatic music", 8.08], ["singing", 6.99]], null, [["music", 57.86], ["moo", 3.04], ["sampler", 2.61]], null, null, [["music", 56.59], ["theremin", 7.44], ["shofar", 4.57]]], "duration": [0.91, 0.63, 0.19, -0.14, 4.0, 0.28, 13.94, 1.88, 0.49, 21.57]} \ No newline at end of file diff --git a/annotations_1/VPeXTe_6uOc_filtered.json b/annotations_1/VPeXTe_6uOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d609d72ce317bbc84312e2e536a0c617e2024d9b --- /dev/null +++ b/annotations_1/VPeXTe_6uOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 79.46], [80.0, 81.85], [83.0, 90.98], [96.0, 96.01], [97.0, 100.25], [101.0, 109.41], [112.0, 113.24], [115.0, 121.27], [124.0, 127.26]], "keep_status": [true, false, true, false, true, false, false, false, false], "silence_prob": [35.16, 0.0, 43.4, 0.0, 44.09, 64.86, 0.0, 78.38, 66.63], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 15.41], ["sound effect", 13.74], ["grunt", 9.6]], null, [["music", 17.84], ["didgeridoo", 7.96], ["reverberation", 7.89]], null, [["didgeridoo", 22.44], ["music", 19.15], ["hum", 17.1]], null, null, null, null], "duration": [4.46, 1.85, 7.98, 0.01, 3.25, 8.41, 1.24, 6.27, 3.26]} \ No newline at end of file diff --git a/annotations_1/VQjjlqVjiII_filtered.json b/annotations_1/VQjjlqVjiII_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7d309dd92a9b4e34076007671f3401736ca1ec9 --- /dev/null +++ b/annotations_1/VQjjlqVjiII_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 32.37], [33.0, 34.23], [35.0, 49.86], [56.0, 66.02], [71.0, 72.33], [74.0, 74.21], [81.0, 80.81], [82.0, 83.32], [97.0, 103.38], [104.0, 105.19], [105.0, 109.85], [125.0, 127.87], [129.0, 129.44]], "keep_status": [true, false, true, true, false, false, false, false, true, false, true, true, false], "silence_prob": [30.47, 0.0, 31.29, 31.78, 0.0, 0.0, 0.0, 0.0, 31.96, 0.0, 38.02, 36.64, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 21.63], ["cowbell", 19.48], ["music", 15.25]], null, [["cattle, bovinae", 16.9], ["livestock, farm animals, working animals", 16.69], ["moo", 13.56]], [["music", 28.78], ["fly, housefly", 18.28], ["mosquito", 16.37]], null, null, null, null, [["speech", 42.17], ["music", 13.86], ["sine wave", 10.91]], null, [["sine wave", 23.84], ["chirp tone", 12.04], ["speech", 10.84]], [["music", 29.18], ["electric shaver, electric razor", 12.96], ["speech", 11.94]], null], "duration": [13.37, 1.23, 14.86, 10.02, 1.33, 0.21, -0.19, 1.32, 6.38, 1.19, 4.85, 2.87, 0.44]} \ No newline at end of file diff --git a/annotations_1/VR0NIF6PbCo_filtered.json b/annotations_1/VR0NIF6PbCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c077e81f5f43a52b931702c60ae8d836d616851 --- /dev/null +++ b/annotations_1/VR0NIF6PbCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [2.0, 2.96], [4.0, 6.03], [9.0, 9.24], [10.0, 10.22], [12.0, 11.77], [12.0, 12.88], [14.0, 14.39], [15.0, 16.24], [23.0, 23.43], [24.0, 24.31], [28.0, 31.45], [33.0, 34.57], [37.0, 37.1], [37.0, 37.89], [39.0, 40.0], [51.0, 51.11], [59.0, 59.64], [61.0, 61.45], [62.0, 62.82], [63.0, 64.62], [66.0, 66.09], [69.0, 68.77], [70.0, 71.14], [74.0, 74.34], [75.0, 75.56], [77.0, 78.06], [79.0, 89.06], [93.0, 93.7], [97.0, 97.7], [98.0, 98.83], [101.0, 102.36], [112.0, 112.62], [113.0, 114.66], [116.0, 116.7], [117.0, 117.75], [123.0, 136.26], [139.0, 140.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 0.96, 2.03, 0.24, 0.22, -0.23, 0.88, 0.39, 1.24, 0.43, 0.31, 3.45, 1.57, 0.1, 0.89, 1.0, 0.11, 0.64, 0.45, 0.82, 1.62, 0.09, -0.23, 1.14, 0.34, 0.56, 1.06, 10.06, 0.7, 0.7, 0.83, 1.36, 0.62, 1.66, 0.7, 0.75, 13.26, 1.19]} \ No newline at end of file diff --git a/annotations_1/VRXkf4--IXw_filtered.json b/annotations_1/VRXkf4--IXw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dba280182df9fa954f6057c27666c36cde48b8c8 --- /dev/null +++ b/annotations_1/VRXkf4--IXw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [4.0, 5.75], [6.0, 8.11], [8.0, 9.58], [10.0, 10.88], [12.0, 13.51], [19.0, 21.66], [23.0, 26.74], [29.0, 30.37], [34.0, 34.87], [35.0, 44.69], [46.0, 48.61], [50.0, 53.87], [56.0, 56.47], [57.0, 57.4], [59.0, 62.48], [64.0, 68.45], [70.0, 71.83], [73.0, 73.95], [77.0, 77.46], [80.0, 80.82], [87.0, 87.35], [89.0, 91.23], [92.0, 92.82], [97.0, 97.66], [98.0, 99.5], [101.0, 103.98], [104.0, 105.36], [109.0, 110.35], [120.0, 120.93], [123.0, 124.44], [128.0, 128.41], [130.0, 131.7], [133.0, 135.19], [137.0, 139.41], [144.0, 144.68], [146.0, 146.96], [147.0, 148.81], [149.0, 150.15], [150.0, 151.48], [152.0, 153.06], [155.0, 155.39], [157.0, 165.11], [168.0, 169.47]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.62, 0.0, 0.0, 0.0, 81.53, 70.3, 0.0, 0.0, 64.52, 87.0, 73.97, 0.0, 0.0, 92.31, 61.27, 0.0, 0.0, 0.0, 0.0, 0.0, 71.43, 0.0, 0.0, 0.0, 35.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.31, 0.0], "audiomae_on_audioset": [null, null, [["music", 22.17], ["drum", 13.69], ["percussion", 13.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 53.15], ["music", 4.47], ["synthesizer", 1.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.18], ["radio", 12.11], ["telephone", 10.96]], null], "duration": [0.98, 1.75, 2.11, 1.58, 0.88, 1.51, 2.66, 3.74, 1.37, 0.87, 9.69, 2.61, 3.87, 0.47, 0.4, 3.48, 4.45, 1.83, 0.95, 0.46, 0.82, 0.35, 2.23, 0.82, 0.66, 1.5, 2.98, 1.36, 1.35, 0.93, 1.44, 0.41, 1.7, 2.19, 2.41, 0.68, 0.96, 1.81, 1.15, 1.48, 1.06, 0.39, 8.11, 1.47]} \ No newline at end of file diff --git a/annotations_1/VRuV5oMqkDg_filtered.json b/annotations_1/VRuV5oMqkDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cb9d0a0ab6a6bd00fe6267268d30745cad48c01 --- /dev/null +++ b/annotations_1/VRuV5oMqkDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 53.86], [54.0, 55.11], [56.0, 56.89], [58.0, 59.24], [60.0, 61.89], [63.0, 64.27], [66.0, 68.49], [70.0, 71.76], [76.0, 80.6], [84.0, 86.31], [88.0, 91.89], [92.0, 95.5], [98.0, 100.68], [103.0, 105.0], [106.0, 108.01]], "keep_status": [false, false, false, false, false, false, true, false, true, false, true, true, true, true, false], "silence_prob": [29.59, 0.0, 0.0, 0.0, 0.0, 0.0, 28.78, 0.0, 30.1, 32.9, 35.71, 36.49, 35.92, 46.02, 50.06], "audiomae_on_audioset": [[["music", 51.04], ["hum", 18.75], ["mains hum", 8.12]], null, null, null, null, null, [["music", 12.81], ["throbbing", 11.81], ["hum", 10.57]], null, [["mains hum", 26.03], ["speech", 24.57], ["hum", 13.44]], [["whale vocalization", 51.76], ["fly, housefly", 19.46], ["bee, wasp, etc.", 4.89]], [["boat, water vehicle", 15.45], ["fly, housefly", 12.54], ["hum", 6.84]], [["speech", 36.69], ["fly, housefly", 17.33], ["insect", 8.38]], [["hum", 23.21], ["mains hum", 13.08], ["throbbing", 12.03]], [["music", 38.83], ["frog", 16.01], ["whale vocalization", 12.09]], null], "duration": [25.86, 1.11, 0.89, 1.24, 1.89, 1.27, 2.49, 1.76, 4.6, 2.31, 3.89, 3.5, 2.68, 2.0, 2.01]} \ No newline at end of file diff --git a/annotations_1/VTTj-7UumYk_filtered.json b/annotations_1/VTTj-7UumYk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d178c32f69ec975045e586fc719c3dabf888c679 --- /dev/null +++ b/annotations_1/VTTj-7UumYk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.92], [10.0, 10.15], [47.0, 47.39], [49.0, 49.25], [68.0, 69.92], [82.0, 82.32], [83.0, 84.48]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.92, 0.15, 0.39, 0.25, 1.92, 0.32, 1.48]} \ No newline at end of file diff --git a/annotations_1/VU3Tu4K4MOo_filtered.json b/annotations_1/VU3Tu4K4MOo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38e825c43e721a140bc8c2bd0abe11b4a2432407 --- /dev/null +++ b/annotations_1/VU3Tu4K4MOo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 28.21], [29.0, 32.46], [33.0, 33.96], [35.0, 35.82], [39.0, 39.61], [44.0, 45.4], [47.0, 46.84], [47.0, 52.96], [54.0, 62.43], [63.0, 63.98], [66.0, 66.7], [68.0, 68.96], [71.0, 72.44], [73.0, 94.31]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [68.41, 53.04, 0.0, 0.0, 0.0, 0.0, 0.0, 46.94, 65.55, 0.0, 0.0, 0.0, 0.0, 56.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 41.63], ["sidetone", 21.37], ["hum", 5.65]], null, null, null, null, null, null], "duration": [15.21, 3.46, 0.96, 0.82, 0.61, 1.4, -0.16, 5.96, 8.43, 0.98, 0.7, 0.96, 1.44, 21.31]} \ No newline at end of file diff --git a/annotations_1/VV26lYf6VyM_filtered.json b/annotations_1/VV26lYf6VyM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60c256f8eecb595604fdb2ffb3772507e2266ae8 --- /dev/null +++ b/annotations_1/VV26lYf6VyM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 17.79], [19.0, 21.17], [23.0, 23.77], [25.0, 25.79], [27.0, 29.03], [39.0, 41.94], [43.0, 43.43], [45.0, 54.53], [56.0, 56.76], [58.0, 58.38], [62.0, 62.06], [70.0, 70.11], [72.0, 72.77], [77.0, 77.87], [79.0, 79.91], [80.0, 82.34], [85.0, 87.39], [97.0, 98.14], [102.0, 132.38], [138.0, 152.68], [155.0, 159.26]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [29.97, 36.37, 0.0, 0.0, 56.4, 65.32, 0.0, 45.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.37, 36.0, 0.0, 0.0, 34.04, 40.68], "audiomae_on_audioset": [[["music", 70.06], ["electronic music", 8.21], ["whale vocalization", 5.17]], [["music", 29.53], ["sine wave", 7.51], ["electronic music", 6.12]], null, null, null, null, null, [["hum", 18.57], ["animal", 12.55], ["throbbing", 10.56]], null, null, null, null, null, null, null, [["music", 64.66], ["didgeridoo", 15.48], ["electronic music", 5.49]], [["hum", 21.3], ["music", 18.63], ["mains hum", 11.97]], null, null, [["music", 51.48], ["hum", 22.82], ["throbbing", 11.73]], [["music", 51.76], ["gong", 19.02], ["electronic music", 10.66]]], "duration": [6.79, 2.17, 0.77, 0.79, 2.03, 2.94, 0.43, 9.53, 0.76, 0.38, 0.06, 0.11, 0.77, 0.87, 0.91, 2.34, 2.39, 1.14, 30.38, 14.68, 4.26]} \ No newline at end of file diff --git a/annotations_1/VV97_cn54bQ_filtered.json b/annotations_1/VV97_cn54bQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0119b46618ff4c6b4a52872aff653d9272d17039 --- /dev/null +++ b/annotations_1/VV97_cn54bQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 19.89], [20.0, 20.7], [25.0, 25.74], [26.0, 26.57], [28.0, 28.21], [29.0, 29.83], [35.0, 47.44], [48.0, 50.4], [53.0, 54.97], [55.0, 56.17], [58.0, 62.14], [66.0, 68.84], [71.0, 73.21], [75.0, 104.04], [107.0, 122.1], [126.0, 148.49], [152.0, 152.76]], "keep_status": [true, false, false, false, false, false, true, true, false, false, false, true, true, true, false, true, false], "silence_prob": [35.3, 0.0, 0.0, 0.0, 0.0, 0.0, 44.78, 43.05, 0.0, 0.0, 32.37, 33.77, 39.09, 28.65, 29.24, 28.5, 0.0], "audiomae_on_audioset": [[["speech", 42.37], ["buzz", 15.39], ["vehicle", 4.49]], null, null, null, null, null, [["whale vocalization", 28.94], ["hum", 26.87], ["mains hum", 10.6]], [["fly, housefly", 34.33], ["insect", 21.06], ["speech", 12.11]], null, null, [["speech", 36.87], ["music", 35.19], ["boing", 7.97]], [["speech", 20.73], ["buzz", 7.72], ["hum", 6.26]], [["civil defense siren", 20.97], ["music", 13.73], ["siren", 12.85]], [["music", 28.03], ["mains hum", 20.57], ["hum", 14.02]], [["hum", 30.52], ["mains hum", 25.49], ["music", 20.36]], [["music", 22.91], ["skidding", 12.54], ["race car, auto racing", 11.04]], null], "duration": [16.89, 0.7, 0.74, 0.57, 0.21, 0.83, 12.44, 2.4, 1.97, 1.17, 4.14, 2.84, 2.21, 29.04, 15.1, 22.49, 0.76]} \ No newline at end of file diff --git a/annotations_1/VVlECM2KyYg_filtered.json b/annotations_1/VVlECM2KyYg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..748e1983624c89d34507409919db54f4e1a2a7e3 --- /dev/null +++ b/annotations_1/VVlECM2KyYg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.97], [15.0, 16.14], [19.0, 18.81], [24.0, 31.18], [49.0, 49.72], [53.0, 53.81], [59.0, 63.46], [64.0, 69.16], [72.0, 72.08]], "keep_status": [false, false, false, true, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 35.49, 0.0, 0.0, 35.43, 31.42, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 23.66], ["sidetone", 19.36], ["speech", 10.5]], null, null, [["music", 29.44], ["speech", 20.91], ["door", 12.09]], [["music", 44.01], ["fly, housefly", 6.54], ["boing", 5.07]], null], "duration": [0.97, 1.14, -0.19, 7.18, 0.72, 0.81, 4.46, 5.16, 0.08]} \ No newline at end of file diff --git a/annotations_1/VVvKuI8oK3c_filtered.json b/annotations_1/VVvKuI8oK3c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9774fa233c58232af52d70f2e891b5bd6b3e5db --- /dev/null +++ b/annotations_1/VVvKuI8oK3c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.62], [5.0, 7.99], [8.0, 8.72], [10.0, 13.26], [16.0, 18.33], [22.0, 22.79], [23.0, 23.46], [24.0, 23.57], [24.0, 25.51], [26.0, 28.86], [30.0, 30.54], [31.0, 32.97], [34.0, 34.3], [35.0, 35.65], [38.0, 38.15], [41.0, 41.52], [43.0, 45.23], [46.0, 59.59], [61.0, 69.25], [71.0, 77.67], [80.0, 79.73], [84.0, 84.55], [86.0, 87.86], [89.0, 90.56], [93.0, 95.18], [96.0, 98.07], [99.0, 100.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 62.78, 0.0, 61.57, 68.67, 0.0, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.57, 99.98, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 2.99, 0.72, 3.26, 2.33, 0.79, 0.46, -0.43, 1.51, 2.86, 0.54, 1.97, 0.3, 0.65, 0.15, 0.52, 2.23, 13.59, 8.25, 6.67, -0.27, 0.55, 1.86, 1.56, 2.18, 2.07, 1.38]} \ No newline at end of file diff --git a/annotations_1/VWMSjhr1BZE_filtered.json b/annotations_1/VWMSjhr1BZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48c626d18adc2aac64cc698a1cafd845dda1ef77 --- /dev/null +++ b/annotations_1/VWMSjhr1BZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 23.43], [25.0, 27.08], [31.0, 31.56], [38.0, 42.87], [46.0, 53.0], [54.0, 59.63], [61.0, 62.26], [64.0, 65.96], [67.0, 69.06], [70.0, 72.35], [74.0, 74.63], [77.0, 78.17], [79.0, 78.88], [86.0, 86.59], [89.0, 89.09], [93.0, 94.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.0, 97.11, 0.0, 91.81, 87.37, 89.54, 0.0, 0.0, 100.0, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.43, 2.08, 0.56, 4.87, 7.0, 5.63, 1.26, 1.96, 2.06, 2.35, 0.63, 1.17, -0.12, 0.59, 0.09, 1.59]} \ No newline at end of file diff --git a/annotations_1/VW_Bmy2Cm2c_filtered.json b/annotations_1/VW_Bmy2Cm2c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9ea214df1aae978f8035574dba6bff234994852 --- /dev/null +++ b/annotations_1/VW_Bmy2Cm2c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.75], [2.0, 7.2], [17.0, 18.15], [24.0, 25.2], [32.0, 33.4], [36.0, 38.25], [43.0, 46.26], [48.0, 56.46], [59.0, 59.36], [60.0, 60.72], [62.0, 64.03], [66.0, 67.1], [69.0, 73.8], [75.0, 75.36], [76.0, 76.84], [78.0, 80.86], [86.0, 85.99], [93.0, 93.09], [98.0, 99.25], [104.0, 109.29], [110.0, 111.33], [113.0, 115.1], [116.0, 118.79], [121.0, 131.3], [132.0, 135.23], [137.0, 138.72], [140.0, 140.71], [142.0, 148.36], [149.0, 155.46], [160.0, 160.3], [163.0, 163.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 77.2, 0.0, 0.0, 0.0, 47.98, 66.03, 54.43, 0.0, 0.0, 93.6, 0.0, 93.76, 0.0, 0.0, 95.37, 0.0, 0.0, 0.0, 46.83, 0.0, 96.66, 97.83, 70.86, 98.8, 0.0, 0.0, 98.66, 91.98, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 51.89], ["sine wave", 9.71], ["busy signal", 9.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.83], ["sidetone", 31.6], ["rumble", 8.82]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 5.2, 1.15, 1.2, 1.4, 2.25, 3.26, 8.46, 0.36, 0.72, 2.03, 1.1, 4.8, 0.36, 0.84, 2.86, -0.01, 0.09, 1.25, 5.29, 1.33, 2.1, 2.79, 10.3, 3.23, 1.72, 0.71, 6.36, 6.46, 0.3, 0.73]} \ No newline at end of file diff --git a/annotations_1/VXPxIwL1e5g_filtered.json b/annotations_1/VXPxIwL1e5g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b66674a4e92870d5ccae93af8d912c48dd57216 --- /dev/null +++ b/annotations_1/VXPxIwL1e5g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.16], [16.0, 16.55], [18.0, 24.36], [32.0, 31.99], [39.0, 39.39], [40.0, 40.27], [41.0, 42.94], [44.0, 45.98], [48.0, 48.36], [50.0, 51.68], [72.0, 72.57], [76.0, 82.16], [84.0, 84.37], [116.0, 116.73], [121.0, 121.73], [131.0, 131.45], [132.0, 133.66], [135.0, 135.5], [139.0, 139.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 59.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.55, 6.36, -0.01, 0.39, 0.27, 1.94, 1.98, 0.36, 1.68, 0.57, 6.16, 0.37, 0.73, 0.73, 0.45, 1.66, 0.5, 0.6]} \ No newline at end of file diff --git a/annotations_1/VXkEBRtERnA_filtered.json b/annotations_1/VXkEBRtERnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08244930626466624324e4d88545b19f1737cef7 --- /dev/null +++ b/annotations_1/VXkEBRtERnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.11], [8.0, 8.53], [10.0, 11.01], [12.0, 13.02], [17.0, 17.78], [19.0, 24.76], [25.0, 30.43], [34.0, 34.53], [35.0, 35.58], [36.0, 37.25], [38.0, 38.38], [40.0, 42.62], [43.0, 43.44], [46.0, 46.53], [47.0, 47.46], [48.0, 48.22], [51.0, 50.82], [54.0, 54.57], [55.0, 55.88], [58.0, 59.19], [59.0, 60.72], [61.0, 63.36], [68.0, 89.99], [91.0, 92.67], [93.0, 93.9], [94.0, 94.47], [98.0, 98.71], [102.0, 102.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [74.92, 0.0, 0.0, 0.0, 0.0, 96.54, 78.72, 0.0, 0.0, 0.0, 0.0, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.53, 38.83, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["moo", 34.23], ["cattle, bovinae", 28.77], ["livestock, farm animals, working animals", 19.89]], [["music", 57.12], ["organ", 10.43], ["keyboard (musical)", 6.17]], null, null, null, null, null], "duration": [5.11, 0.53, 1.01, 1.02, 0.78, 5.76, 5.43, 0.53, 0.58, 1.25, 0.38, 2.62, 0.44, 0.53, 0.46, 0.22, -0.18, 0.57, 0.88, 1.19, 1.72, 2.36, 21.99, 1.67, 0.9, 0.47, 0.71, 0.42]} \ No newline at end of file diff --git a/annotations_1/VXlMfWObFCA_filtered.json b/annotations_1/VXlMfWObFCA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49069650a39b236509d4635f937444478c7a615c --- /dev/null +++ b/annotations_1/VXlMfWObFCA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 2.0], [3.0, 3.79], [10.0, 10.22], [11.0, 10.93], [12.0, 13.34], [14.0, 14.94], [16.0, 17.79], [19.0, 21.37], [24.0, 24.34], [25.0, 27.11], [30.0, 30.57], [32.0, 36.27], [40.0, 41.2], [47.0, 47.95], [49.0, 50.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 0.0, 66.39, 0.0, 73.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.0, 0.79, 0.22, -0.07, 1.34, 0.94, 1.79, 2.37, 0.34, 2.11, 0.57, 4.27, 1.2, 0.95, 1.23]} \ No newline at end of file diff --git a/annotations_1/VXx_DVHO0go_filtered.json b/annotations_1/VXx_DVHO0go_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ba68fe71bcbad58e2dfe5dbaa178cd2915962c1 --- /dev/null +++ b/annotations_1/VXx_DVHO0go_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.84], [13.0, 13.1], [16.0, 16.11], [17.0, 17.14], [21.0, 23.36], [35.0, 35.53], [38.0, 41.32], [43.0, 50.57], [61.0, 63.29], [78.0, 78.8], [79.0, 79.2], [85.0, 85.9], [91.0, 101.07], [102.0, 103.49]], "keep_status": [false, false, false, false, true, false, true, true, false, false, false, false, true, false], "silence_prob": [32.56, 0.0, 0.0, 0.0, 30.02, 0.0, 39.5, 31.79, 32.17, 0.0, 0.0, 0.0, 32.37, 0.0], "audiomae_on_audioset": [[["music", 70.29], ["synthesizer", 4.32], ["musical instrument", 4.17]], null, null, null, [["animal", 17.31], ["speech", 10.34], ["howl", 9.63]], null, [["hum", 24.54], ["throbbing", 19.99], ["mains hum", 7.8]], [["speech", 22.03], ["burst, pop", 10.19], ["explosion", 8.4]], [["hum", 40.02], ["throbbing", 31.12], ["heart sounds, heartbeat", 10.1]], null, null, null, [["music", 23.04], ["hum", 12.19], ["mains hum", 8.61]], null], "duration": [2.84, 0.1, 0.11, 0.14, 2.36, 0.53, 3.32, 7.57, 2.29, 0.8, 0.2, 0.9, 10.07, 1.49]} \ No newline at end of file diff --git a/annotations_1/VZM1S9VcjAM_filtered.json b/annotations_1/VZM1S9VcjAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e68cc454a3c5d7df964cf0ab311fa556a852bbc --- /dev/null +++ b/annotations_1/VZM1S9VcjAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.26], [16.0, 15.89], [17.0, 18.69], [20.0, 20.68], [22.0, 22.64], [24.0, 27.51], [28.0, 31.43], [34.0, 35.9], [37.0, 38.2], [39.0, 40.78], [42.0, 45.03], [47.0, 61.87], [64.0, 66.36], [68.0, 70.73], [72.0, 74.14], [75.0, 80.23], [81.0, 83.93], [85.0, 85.73], [86.0, 87.45], [89.0, 90.34], [92.0, 93.36], [94.0, 94.83], [96.0, 97.6], [101.0, 102.69], [104.0, 104.82], [106.0, 107.92], [111.0, 113.88], [115.0, 116.19], [118.0, 119.99], [122.0, 122.82], [125.0, 125.46], [129.0, 130.37], [131.0, 132.7], [133.0, 135.84], [139.0, 139.6], [141.0, 147.55], [154.0, 155.43], [159.0, 159.21], [162.0, 162.31], [163.0, 163.68], [164.0, 164.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 97.11, 0.0, 0.0, 0.0, 98.44, 83.34, 100.0, 97.11, 99.95, 99.87, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 53.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, -0.11, 1.69, 0.68, 0.64, 3.51, 3.43, 1.9, 1.2, 1.78, 3.03, 14.87, 2.36, 2.73, 2.14, 5.23, 2.93, 0.73, 1.45, 1.34, 1.36, 0.83, 1.6, 1.69, 0.82, 1.92, 2.88, 1.19, 1.99, 0.82, 0.46, 1.37, 1.7, 2.84, 0.6, 6.55, 1.43, 0.21, 0.31, 0.68, 0.88]} \ No newline at end of file diff --git a/annotations_1/V_dtlMkvp2Q_filtered.json b/annotations_1/V_dtlMkvp2Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54d0950d31e01284164188a36bbd2ff4bc3e2312 --- /dev/null +++ b/annotations_1/V_dtlMkvp2Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 34.13], [37.0, 38.5], [40.0, 41.07], [42.0, 43.29], [52.0, 53.69], [55.0, 55.73], [58.0, 58.55], [65.0, 65.92], [69.0, 74.68], [76.0, 81.92], [83.0, 96.23], [98.0, 98.86], [101.0, 113.44], [115.0, 151.46], [153.0, 158.41], [160.0, 166.02], [168.0, 167.71], [168.0, 169.33], [169.0, 169.37]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false, false], "silence_prob": [35.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.81, 31.9, 30.53, 0.0, 28.96, 0.0, 28.58, 32.8, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 37.75], ["music", 26.09], ["throbbing", 12.27]], null, null, null, null, null, null, null, [["burst, pop", 15.75], ["speech", 13.18], ["explosion", 9.1]], [["music", 41.61], ["hum", 19.53], ["electronic music", 13.15]], [["hum", 56.56], ["mains hum", 21.83], ["throbbing", 8.12]], null, [["music", 42.23], ["hum", 8.92], ["speech", 7.33]], null, [["music", 33.34], ["throbbing", 27.47], ["hum", 22.4]], [["music", 42.4], ["speech", 11.25], ["glass", 5.17]], null, null, null], "duration": [4.13, 1.5, 1.07, 1.29, 1.69, 0.73, 0.55, 0.92, 5.68, 5.92, 13.23, 0.86, 12.44, 36.46, 5.41, 6.02, -0.29, 1.33, 0.37]} \ No newline at end of file diff --git a/annotations_1/Vb6cuUI7B3E_filtered.json b/annotations_1/Vb6cuUI7B3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9060de40ad8d0933b84ce6f8b01d607625ac8edb --- /dev/null +++ b/annotations_1/Vb6cuUI7B3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.12], [6.0, 7.92], [19.0, 20.66], [42.0, 42.58], [46.0, 46.35], [53.0, 53.91], [58.0, 61.62], [77.0, 78.61], [81.0, 81.35], [101.0, 101.28], [107.0, 109.54], [111.0, 111.69], [114.0, 114.99], [115.0, 117.31], [118.0, 128.49], [136.0, 140.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 62.89, 74.6, 82.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 1.92, 1.66, 0.58, 0.35, 0.91, 3.62, 1.61, 0.35, 0.28, 2.54, 0.69, 0.99, 2.31, 10.49, 4.51]} \ No newline at end of file diff --git a/annotations_1/VbBi8ZIWbUc_filtered.json b/annotations_1/VbBi8ZIWbUc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ef935c4a56a041f0be0cd707c75cb759e06e26e --- /dev/null +++ b/annotations_1/VbBi8ZIWbUc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.87], [3.0, 4.08], [27.0, 27.58], [31.0, 31.75], [35.0, 35.99], [38.0, 38.37]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [-0.13, 1.08, 0.58, 0.75, 0.99, 0.37]} \ No newline at end of file diff --git a/annotations_1/VbP7jMN_v-w_filtered.json b/annotations_1/VbP7jMN_v-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5ec13bda8a6edb40ec85d2c0dc8c220b0d00196 --- /dev/null +++ b/annotations_1/VbP7jMN_v-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.92], [2.0, 4.35], [5.0, 6.54], [7.0, 18.2], [21.0, 21.78], [32.0, 38.96], [45.0, 46.08], [46.0, 46.74], [47.0, 47.93], [51.0, 52.51], [53.0, 54.53], [82.0, 93.39], [98.0, 98.85], [105.0, 106.1], [111.0, 118.1], [136.0, 136.43], [137.0, 136.65], [140.0, 144.12], [158.0, 160.25], [161.0, 164.86]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 30.91, 0.0, 41.83, 0.0, 40.97, 0.0, 0.0, 0.0, 0.0, 0.0, 33.67, 0.0, 0.0, 31.65, 0.0, 0.0, 32.06, 31.51, 32.45], "audiomae_on_audioset": [null, [["music", 37.19], ["speech", 10.87], ["grunt", 3.88]], null, [["music", 61.22], ["thunk", 10.98], ["quack", 5.97]], null, [["music", 21.49], ["speech", 19.76], ["sheep", 8.35]], null, null, null, null, null, [["music", 51.45], ["throbbing", 19.02], ["hum", 11.69]], null, null, [["cattle, bovinae", 47.6], ["moo", 36.52], ["livestock, farm animals, working animals", 13.91]], null, null, [["mains hum", 43.07], ["music", 18.59], ["hum", 13.87]], [["fly, housefly", 43.62], ["mosquito", 18.17], ["insect", 13.75]], [["music", 30.67], ["fly, housefly", 22.17], ["insect", 11.12]]], "duration": [-0.08, 2.35, 1.54, 11.2, 0.78, 6.96, 1.08, 0.74, 0.93, 1.51, 1.53, 11.39, 0.85, 1.1, 7.1, 0.43, -0.35, 4.12, 2.25, 3.86]} \ No newline at end of file diff --git a/annotations_1/Vchw3dbVeUo_filtered.json b/annotations_1/Vchw3dbVeUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8efd49d7ede5c8c9e218139d77eca260205e8640 --- /dev/null +++ b/annotations_1/Vchw3dbVeUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.78], [9.0, 10.29], [13.0, 20.88], [31.0, 33.34], [40.0, 41.27], [44.0, 44.31], [47.0, 48.25], [49.0, 49.08], [51.0, 52.62], [55.0, 55.68], [60.0, 60.51], [71.0, 77.84], [85.0, 85.58], [89.0, 89.58], [93.0, 94.44], [99.0, 99.55], [107.0, 108.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.1, 30.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.16, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 80.34], ["musical instrument", 1.63], ["throbbing", 1.36]], [["music", 63.15], ["speech", 9.63], ["electronic music", 3.22]], null, null, null, null, null, null, null, [["music", 25.41], ["throbbing", 14.82], ["sidetone", 14.36]], null, null, null, null, null], "duration": [0.78, 1.29, 7.88, 2.34, 1.27, 0.31, 1.25, 0.08, 1.62, 0.68, 0.51, 6.84, 0.58, 0.58, 1.44, 0.55, 1.28]} \ No newline at end of file diff --git a/annotations_1/VcnAtRLJS84_filtered.json b/annotations_1/VcnAtRLJS84_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..201620f20ecc98a93c18958df2337b76874a8dca --- /dev/null +++ b/annotations_1/VcnAtRLJS84_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.79], [38.0, 40.42], [40.0, 40.46]], "keep_status": [false, false, false], "silence_prob": [0.0, 31.93, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 32.2], ["cattle, bovinae", 29.05], ["moo", 28.51]], null], "duration": [0.79, 2.42, 0.46]} \ No newline at end of file diff --git a/annotations_1/VdAC6kNpXeM_filtered.json b/annotations_1/VdAC6kNpXeM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f8b46169cf2e99e6bfbd8f84e778786ff9bcdd8 --- /dev/null +++ b/annotations_1/VdAC6kNpXeM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.49], [6.0, 5.78], [8.0, 8.36], [12.0, 17.9], [20.0, 32.56], [34.0, 58.36]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.28, 30.17, 29.94], "audiomae_on_audioset": [null, null, null, [["music", 40.82], ["throbbing", 17.27], ["hum", 13.12]], [["music", 37.72], ["throbbing", 31.6], ["hum", 14.97]], [["throbbing", 41.75], ["music", 23.09], ["hum", 20.09]]], "duration": [0.49, -0.22, 0.36, 5.9, 12.56, 24.36]} \ No newline at end of file diff --git a/annotations_1/Veh9KV9fm6s_filtered.json b/annotations_1/Veh9KV9fm6s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b362c39597d8bc64e568f5013a4923734b3f585 --- /dev/null +++ b/annotations_1/Veh9KV9fm6s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 123.23]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [88.23]} \ No newline at end of file diff --git a/annotations_1/Vfi1V_SL9H8_filtered.json b/annotations_1/Vfi1V_SL9H8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53bb50a9f8e2054369669413392507ffbc886080 --- /dev/null +++ b/annotations_1/Vfi1V_SL9H8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[141.0, 141.44]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.44]} \ No newline at end of file diff --git a/annotations_1/VflasoWmuoA_filtered.json b/annotations_1/VflasoWmuoA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dffe2b6df4886710ada4fd44935d64fec5641d39 --- /dev/null +++ b/annotations_1/VflasoWmuoA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.7], [13.0, 12.72], [14.0, 45.49], [47.0, 47.95], [53.0, 52.74], [53.0, 54.9], [57.0, 58.73], [60.0, 61.47], [68.0, 70.01], [71.0, 72.84], [76.0, 80.96], [82.0, 83.76], [85.0, 87.62], [89.0, 91.5], [92.0, 93.16], [94.0, 96.47], [97.0, 99.03], [100.0, 102.17], [103.0, 104.38], [106.0, 106.89], [109.0, 110.0], [112.0, 112.53], [117.0, 117.86], [124.0, 124.68], [127.0, 127.14]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [49.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.64, 0.0, 40.7, 0.0, 49.27, 43.43, 0.0, 50.51, 55.89, 40.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 33.45], ["singing bowl", 32.19], ["speech", 11.27]], null, null, null, null, null, null, null, [["music", 35.36], ["speech", 14.41], ["mains hum", 7.8]], null, [["music", 33.77], ["mains hum", 16.65], ["hum", 14.71]], null, [["music", 38.05], ["didgeridoo", 6.59], ["mains hum", 5.03]], [["music", 74.55], ["scary music", 5.12], ["ambient music", 3.13]], null, null, null, [["music", 31.92], ["frog", 8.2], ["croak", 7.94]], null, null, null, null, null, null, null], "duration": [6.7, -0.28, 31.49, 0.95, -0.26, 1.9, 1.73, 1.47, 2.01, 1.84, 4.96, 1.76, 2.62, 2.5, 1.16, 2.47, 2.03, 2.17, 1.38, 0.89, 1.0, 0.53, 0.86, 0.68, 0.14]} \ No newline at end of file diff --git a/annotations_1/VgO0K_0mi1U_filtered.json b/annotations_1/VgO0K_0mi1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1da70830f488b9617015a8a340c2e01117c68829 --- /dev/null +++ b/annotations_1/VgO0K_0mi1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.31], [13.0, 14.44], [15.0, 15.28], [16.0, 18.13], [19.0, 26.94], [31.0, 38.18], [39.0, 39.41], [41.0, 42.03], [50.0, 50.41], [58.0, 66.04], [67.0, 67.68], [68.0, 69.16], [75.0, 93.75], [95.0, 100.99], [102.0, 103.3], [111.0, 124.11], [125.0, 132.48], [134.0, 142.03], [142.0, 142.53], [143.0, 149.23], [150.0, 151.39], [154.0, 154.65], [162.0, 162.58], [163.0, 163.59]], "keep_status": [true, false, false, true, true, true, false, false, false, true, false, false, true, true, false, false, false, true, false, true, false, false, false, false], "silence_prob": [44.55, 0.0, 0.0, 41.52, 33.77, 45.27, 0.0, 0.0, 0.0, 32.96, 0.0, 0.0, 32.7, 34.99, 0.0, 30.3, 29.82, 28.92, 0.0, 29.34, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 25.34], ["didgeridoo", 12.99], ["hum", 5.42]], null, null, [["speech", 26.31], ["mains hum", 9.24], ["music", 8.97]], [["music", 19.5], ["cattle, bovinae", 17.71], ["speech", 12.37]], [["cattle, bovinae", 19.47], ["whale vocalization", 14.83], ["livestock, farm animals, working animals", 14.5]], null, null, null, [["music", 23.11], ["clip-clop", 19.64], ["speech", 13.26]], null, null, [["music", 34.06], ["sheep", 16.83], ["bleat", 12.28]], [["music", 42.25], ["hum", 11.57], ["throbbing", 7.94]], null, [["speech", 58.83], ["music", 19.1], ["outside, rural or natural", 3.89]], [["animal", 67.35], ["speech", 7.74], ["music", 5.01]], [["speech", 47.59], ["hubbub, speech noise, speech babble", 10.18], ["cattle, bovinae", 6.69]], null, [["livestock, farm animals, working animals", 25.6], ["speech", 16.67], ["cowbell", 9.68]], null, null, null, null], "duration": [3.31, 1.44, 0.28, 2.13, 7.94, 7.18, 0.41, 1.03, 0.41, 8.04, 0.68, 1.16, 18.75, 5.99, 1.3, 13.11, 7.48, 8.03, 0.53, 6.23, 1.39, 0.65, 0.58, 0.59]} \ No newline at end of file diff --git a/annotations_1/Vh-olAK5vrs_filtered.json b/annotations_1/Vh-olAK5vrs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c3e8e374255327414734891be89c58227453239 --- /dev/null +++ b/annotations_1/Vh-olAK5vrs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.21], [8.0, 8.99], [11.0, 12.87], [14.0, 13.9], [14.0, 59.27], [60.0, 88.74]], "keep_status": [true, false, false, false, false, false], "silence_prob": [33.67, 0.0, 0.0, 0.0, 0.0, 30.93], "audiomae_on_audioset": [[["music", 49.4], ["hum", 6.34], ["throbbing", 6.14]], null, null, null, null, [["hum", 34.67], ["music", 28.44], ["throbbing", 19.41]]], "duration": [6.21, 0.99, 1.87, -0.1, 45.27, 28.74]} \ No newline at end of file diff --git a/annotations_1/Vh7XH68xWKw_filtered.json b/annotations_1/Vh7XH68xWKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dffefb72af5e4817c53c108fbd5df7a360c33f2 --- /dev/null +++ b/annotations_1/Vh7XH68xWKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.6], [7.0, 8.04], [10.0, 10.3], [24.0, 25.07], [25.0, 30.16], [57.0, 59.36], [60.0, 61.79], [63.0, 63.69], [66.0, 66.43], [67.0, 70.24], [73.0, 76.6], [78.0, 78.8], [81.0, 83.42], [85.0, 98.73]], "keep_status": [false, false, false, false, true, true, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.11, 38.74, 0.0, 0.0, 0.0, 48.52, 31.41, 0.0, 36.33, 42.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 30.93], ["hum", 14.89], ["sidetone", 12.71]], [["hum", 34.71], ["throbbing", 24.93], ["music", 5.86]], null, null, null, [["sine wave", 64.42], ["chirp tone", 17.71], ["speech", 8.71]], [["speech", 64.57], ["music", 3.12], ["fart", 1.95]], null, [["didgeridoo", 27.37], ["music", 19.57], ["speech", 12.22]], [["hum", 56.76], ["mains hum", 22.2], ["throbbing", 11.33]]], "duration": [1.6, 1.04, 0.3, 1.07, 5.16, 2.36, 1.79, 0.69, 0.43, 3.24, 3.6, 0.8, 2.42, 13.73]} \ No newline at end of file diff --git a/annotations_1/VhYxVXimdIw_filtered.json b/annotations_1/VhYxVXimdIw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46cac2c313fdb39c07e7327844e2075530a80cfe --- /dev/null +++ b/annotations_1/VhYxVXimdIw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.45], [7.0, 8.01], [10.0, 18.44], [20.0, 20.97], [22.0, 23.89], [25.0, 38.42], [40.0, 40.95], [44.0, 44.07], [45.0, 51.76], [54.0, 61.06], [62.0, 76.59], [78.0, 83.47], [85.0, 97.98]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 33.17, 0.0, 0.0, 39.34, 0.0, 0.0, 38.8, 54.9, 29.94, 33.78, 32.61], "audiomae_on_audioset": [null, null, [["foghorn", 32.57], ["music", 23.09], ["speech", 11.16]], null, null, [["fly, housefly", 57.94], ["insect", 19.6], ["mosquito", 6.92]], null, null, [["fly, housefly", 49.09], ["mosquito", 19.52], ["insect", 12.9]], null, [["music", 30.66], ["speech", 7.02], ["burst, pop", 5.83]], [["fart", 24.98], ["bee, wasp, etc.", 24.65], ["fly, housefly", 16.91]], [["speech", 38.25], ["fart", 6.38], ["explosion", 4.6]]], "duration": [1.45, 1.01, 8.44, 0.97, 1.89, 13.42, 0.95, 0.07, 6.76, 7.06, 14.59, 5.47, 12.98]} \ No newline at end of file diff --git a/annotations_1/VhzodI8yBUE_filtered.json b/annotations_1/VhzodI8yBUE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b1801b786bcba9a2ee1233a0307628c9d039bdd --- /dev/null +++ b/annotations_1/VhzodI8yBUE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 28.85], [29.0, 33.0], [36.0, 60.78]], "keep_status": [false, true, true], "silence_prob": [33.64, 33.36, 32.29], "audiomae_on_audioset": [[["music", 83.9], ["didgeridoo", 3.22], ["glass", 1.48]], [["throbbing", 29.28], ["music", 28.56], ["hum", 8.21]], [["buzz", 29.15], ["music", 22.0], ["mains hum", 9.65]]], "duration": [18.85, 4.0, 24.78]} \ No newline at end of file diff --git a/annotations_1/ViF6HrzoOj4_filtered.json b/annotations_1/ViF6HrzoOj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d2cb23a1488d982295ab15e101ceefe56b2e814 --- /dev/null +++ b/annotations_1/ViF6HrzoOj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.58], [15.0, 16.06], [19.0, 18.99], [22.0, 22.27], [28.0, 34.5], [35.0, 40.22], [40.0, 42.21], [46.0, 46.53], [47.0, 47.31], [47.0, 47.83], [48.0, 48.79], [49.0, 52.95], [66.0, 69.21], [86.0, 86.29], [95.0, 96.55], [98.0, 99.15], [101.0, 108.94], [110.0, 115.87], [116.0, 116.09], [116.0, 118.45]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [29.47, 0.0, 0.0, 0.0, 29.67, 31.44, 28.38, 0.0, 0.0, 0.0, 0.0, 29.7, 31.9, 0.0, 0.0, 0.0, 38.46, 44.96, 0.0, 50.36], "audiomae_on_audioset": [[["whale vocalization", 23.27], ["speech", 21.21], ["stomach rumble", 15.95]], null, null, null, [["whale vocalization", 72.21], ["speech", 23.52], ["stomach rumble", 1.08]], [["whale vocalization", 91.62], ["speech", 1.73], ["hum", 1.21]], [["music", 42.25], ["whale vocalization", 10.35], ["synthesizer", 5.69]], null, null, null, null, [["whale vocalization", 40.46], ["stomach rumble", 19.33], ["speech", 18.56]], [["speech", 25.96], ["whale vocalization", 10.16], ["cattle, bovinae", 9.26]], null, null, null, [["music", 33.58], ["whale vocalization", 18.62], ["hum", 12.5]], [["music", 33.74], ["stomach rumble", 33.71], ["whale vocalization", 14.77]], null, null], "duration": [9.58, 1.06, -0.01, 0.27, 6.5, 5.22, 2.21, 0.53, 0.31, 0.83, 0.79, 3.95, 3.21, 0.29, 1.55, 1.15, 7.94, 5.87, 0.09, 2.45]} \ No newline at end of file diff --git a/annotations_1/ViQZwRewYl8_filtered.json b/annotations_1/ViQZwRewYl8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a9c98cae22ea3ab89ce22f53614c5cad3a9f167 --- /dev/null +++ b/annotations_1/ViQZwRewYl8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.01], [16.0, 38.21], [39.0, 40.34], [44.0, 56.66], [60.0, 61.2], [62.0, 63.1], [67.0, 71.86], [72.0, 86.48], [87.0, 91.99], [100.0, 103.82], [107.0, 122.23], [123.0, 124.04], [129.0, 141.74], [143.0, 146.25], [149.0, 150.94], [155.0, 157.06], [160.0, 172.86], [174.0, 180.55], [183.0, 183.07], [185.0, 185.18]], "keep_status": [true, false, false, true, false, false, false, true, false, true, false, false, true, false, false, true, true, false, false, false], "silence_prob": [29.46, 29.43, 0.0, 29.9, 0.0, 0.0, 29.99, 29.48, 32.44, 30.99, 29.63, 0.0, 29.51, 31.46, 0.0, 28.71, 28.65, 29.27, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 31.5], ["hum", 27.28], ["throbbing", 11.21]], [["speech", 66.17], ["music", 17.54], ["hum", 2.31]], null, [["cattle, bovinae", 21.61], ["livestock, farm animals, working animals", 19.7], ["moo", 17.69]], null, null, [["speech", 48.29], ["music", 13.63], ["whack, thwack", 9.15]], [["speech", 29.82], ["throbbing", 20.97], ["music", 11.91]], [["speech", 35.51], ["music", 23.24], ["throbbing", 20.11]], [["vehicle", 32.35], ["race car, auto racing", 9.19], ["car", 8.08]], [["music", 36.23], ["speech", 31.6], ["cattle, bovinae", 2.98]], null, [["music", 45.32], ["hum", 9.45], ["throbbing", 9.26]], [["music", 68.84], ["synthesizer", 8.23], ["throbbing", 6.18]], null, [["music", 29.9], ["hum", 22.36], ["electronic music", 6.84]], [["music", 51.28], ["speech", 7.92], ["throbbing", 7.84]], [["music", 75.85], ["electronic music", 6.41], ["throbbing", 4.07]], null, null], "duration": [6.01, 22.21, 1.34, 12.66, 1.2, 1.1, 4.86, 14.48, 4.99, 3.82, 15.23, 1.04, 12.74, 3.25, 1.94, 2.06, 12.86, 6.55, 0.07, 0.18]} \ No newline at end of file diff --git a/annotations_1/VkD1dhWMYts_filtered.json b/annotations_1/VkD1dhWMYts_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4063ec20dda25176a75b1b1c91318d2e00f10122 --- /dev/null +++ b/annotations_1/VkD1dhWMYts_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.55], [11.0, 10.99], [21.0, 21.83], [25.0, 25.83], [27.0, 38.89], [51.0, 95.77], [105.0, 109.81], [112.0, 120.28], [127.0, 136.11], [140.0, 141.47], [146.0, 149.99], [157.0, 158.5]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.61, 0.0, 32.59, 31.96, 31.44, 0.0, 35.44, 0.0], "audiomae_on_audioset": [null, null, null, null, [["boing", 83.01], ["music", 12.57], ["speech", 1.08]], null, [["music", 46.46], ["theremin", 9.93], ["didgeridoo", 7.09]], [["music", 67.28], ["skateboard", 2.16], ["speech", 1.81]], [["speech", 44.81], ["hum", 12.29], ["music", 11.1]], null, [["music", 56.25], ["speech", 20.85], ["electronic music", 3.11]], null], "duration": [1.55, -0.01, 0.83, 0.83, 11.89, 44.77, 4.81, 8.28, 9.11, 1.47, 3.99, 1.5]} \ No newline at end of file diff --git a/annotations_1/VkldXV8Pgi8_filtered.json b/annotations_1/VkldXV8Pgi8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d25fb4dd2a7f9a8ed42a5d4f0bf1fbc5ea576a2f --- /dev/null +++ b/annotations_1/VkldXV8Pgi8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.21], [8.0, 8.73], [10.0, 13.81], [16.0, 17.2], [21.0, 22.71], [23.0, 25.27], [25.0, 25.34], [27.0, 28.32], [36.0, 37.71], [38.0, 40.64], [44.0, 43.92], [50.0, 53.99], [56.0, 56.78], [58.0, 58.29], [63.0, 63.69], [65.0, 66.01], [72.0, 74.39], [75.0, 75.37], [77.0, 79.03], [82.0, 82.85], [84.0, 89.23], [93.0, 93.99], [96.0, 96.75], [97.0, 98.0], [113.0, 113.97], [115.0, 115.23], [119.0, 119.64], [123.0, 123.35], [124.0, 125.02], [127.0, 127.94], [129.0, 129.68], [132.0, 131.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 59.86, 0.0, 0.0, 41.58, 0.0, 0.0, 0.0, 79.41, 0.0, 33.45, 0.0, 0.0, 0.0, 0.0, 39.04, 0.0, 43.66, 0.0, 34.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 31.39], ["speech", 26.64], ["hum", 16.75]], null, null, null, null, null, [["grunt", 38.86], ["music", 29.19], ["groan", 14.0]], null, null, null, null, [["music", 46.2], ["speech", 40.15], ["hum", 1.88]], null, [["music", 49.39], ["speech", 27.36], ["fart", 4.92]], null, [["speech", 47.89], ["music", 36.89], ["boing", 4.9]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.21, 0.73, 3.81, 1.2, 1.71, 2.27, 0.34, 1.32, 1.71, 2.64, -0.08, 3.99, 0.78, 0.29, 0.69, 1.01, 2.39, 0.37, 2.03, 0.85, 5.23, 0.99, 0.75, 1.0, 0.97, 0.23, 0.64, 0.35, 1.02, 0.94, 0.68, -0.16]} \ No newline at end of file diff --git a/annotations_1/Vl3IiVDwgpY_filtered.json b/annotations_1/Vl3IiVDwgpY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96124c8c680e066e94ea7ca7690a5f91b8b95f27 --- /dev/null +++ b/annotations_1/Vl3IiVDwgpY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 90.46], [92.0, 124.06]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [75.46, 32.06]} \ No newline at end of file diff --git a/annotations_1/VlMy5-BAjzo_filtered.json b/annotations_1/VlMy5-BAjzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fde9e24c7b03efa33dc2309b88a9bf5a3b09f664 --- /dev/null +++ b/annotations_1/VlMy5-BAjzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.0], [6.0, 6.1], [7.0, 10.39], [12.0, 12.23], [14.0, 22.92], [27.0, 31.97], [35.0, 38.08], [41.0, 47.14], [53.0, 54.57], [60.0, 62.18], [65.0, 70.29], [71.0, 111.45], [114.0, 116.4], [119.0, 119.99], [121.0, 123.03]], "keep_status": [false, false, false, false, true, false, true, true, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 41.09, 0.0, 49.5, 51.5, 36.25, 33.53, 0.0, 43.77, 36.02, 0.0, 38.37, 0.0, 59.51], "audiomae_on_audioset": [null, null, [["music", 59.71], ["crow", 9.57], ["caw", 5.02]], null, [["music", 41.59], ["speech", 16.99], ["theremin", 6.81]], null, [["music", 33.55], ["speech", 28.01], ["didgeridoo", 4.93]], [["speech", 30.16], ["didgeridoo", 22.71], ["music", 16.83]], null, [["speech", 25.71], ["music", 15.78], ["hum", 5.44]], [["speech", 28.99], ["music", 19.83], ["mains hum", 17.63]], null, [["mains hum", 14.53], ["hum", 13.88], ["speech", 11.84]], null, null], "duration": [0.0, 0.1, 3.39, 0.23, 8.92, 4.97, 3.08, 6.14, 1.57, 2.18, 5.29, 40.45, 2.4, 0.99, 2.03]} \ No newline at end of file diff --git a/annotations_1/VlSkPA60ujQ_filtered.json b/annotations_1/VlSkPA60ujQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..263fd17cd0839800a5b4d160ddebfc9f4cb14780 --- /dev/null +++ b/annotations_1/VlSkPA60ujQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.97], [19.0, 20.58], [30.0, 30.72], [32.0, 32.48], [38.0, 38.4], [45.0, 45.27], [60.0, 60.49], [61.0, 65.11], [68.0, 68.76], [69.0, 69.6], [78.0, 78.22], [78.0, 78.29], [84.0, 85.7], [94.0, 93.9], [103.0, 103.87], [114.0, 114.32], [123.0, 126.47], [127.0, 128.61], [143.0, 143.61], [147.0, 148.93], [153.0, 153.67], [157.0, 158.85]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.74, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 49.46], ["speech", 12.48], ["musical instrument", 7.08]], null, null, null, null, null, null, null, null, [["music", 33.67], ["speech", 23.94], ["foghorn", 16.02]], null, null, null, null, null], "duration": [0.97, 1.58, 0.72, 0.48, 0.4, 0.27, 0.49, 4.11, 0.76, 0.6, 0.22, 0.29, 1.7, -0.1, 0.87, 0.32, 3.47, 1.61, 0.61, 1.93, 0.67, 1.85]} \ No newline at end of file diff --git a/annotations_1/VlfBJLU-8us_filtered.json b/annotations_1/VlfBJLU-8us_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25a800165d063a84ea7eef577854ea897510166e --- /dev/null +++ b/annotations_1/VlfBJLU-8us_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.67], [3.0, 3.99], [4.0, 4.83], [8.0, 8.31], [10.0, 10.27], [12.0, 16.78], [18.0, 18.35], [19.0, 19.65], [20.0, 21.63], [25.0, 25.61], [27.0, 28.59], [29.0, 30.27], [31.0, 32.17], [34.0, 36.54], [37.0, 38.89], [40.0, 40.22], [42.0, 43.9], [44.0, 45.69], [49.0, 49.64], [53.0, 54.03], [57.0, 57.96], [61.0, 63.05], [66.0, 66.66], [69.0, 69.53], [71.0, 72.87], [75.0, 75.84], [76.0, 77.3], [78.0, 78.41], [81.0, 88.57], [91.0, 93.14], [94.0, 96.28], [97.0, 97.82], [101.0, 101.63], [102.0, 102.91], [105.0, 106.17], [110.0, 114.52], [116.0, 119.21], [122.0, 123.36], [124.0, 124.41], [125.0, 126.59], [127.0, 129.79], [131.0, 132.78], [133.0, 134.35], [137.0, 137.74], [139.0, 145.93], [146.0, 147.31], [151.0, 155.17], [157.0, 161.47], [162.0, 163.31], [164.0, 170.04], [172.0, 173.35], [175.0, 198.0], [199.0, 204.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 50.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61, 99.56, 100.0, 0.0, 0.0, 0.0, 0.0, 99.88, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 89.19, 0.0, 98.01, 91.13, 0.0, 61.27, 0.0, 81.35, 45.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.89], ["effects unit", 10.05], ["guitar", 6.81]]], "duration": [1.67, 0.99, 0.83, 0.31, 0.27, 4.78, 0.35, 0.65, 1.63, 0.61, 1.59, 1.27, 1.17, 2.54, 1.89, 0.22, 1.9, 1.69, 0.64, 1.03, 0.96, 2.05, 0.66, 0.53, 1.87, 0.84, 1.3, 0.41, 7.57, 2.14, 2.28, 0.82, 0.63, 0.91, 1.17, 4.52, 3.21, 1.36, 0.41, 1.59, 2.79, 1.78, 1.35, 0.74, 6.93, 1.31, 4.17, 4.47, 1.31, 6.04, 1.35, 23.0, 5.75]} \ No newline at end of file diff --git a/annotations_1/Vln90evTYog_filtered.json b/annotations_1/Vln90evTYog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8db9c4d8fc7367b45e0a881981211faaf354705d --- /dev/null +++ b/annotations_1/Vln90evTYog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.42], [12.0, 12.9], [18.0, 19.5], [21.0, 21.46], [23.0, 72.42], [75.0, 75.79], [77.0, 77.58], [83.0, 83.02], [92.0, 93.61], [95.0, 101.75], [102.0, 103.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 0.9, 1.5, 0.46, 49.42, 0.79, 0.58, 0.02, 1.61, 6.75, 1.37]} \ No newline at end of file diff --git a/annotations_1/VmT0mZH5ivo_filtered.json b/annotations_1/VmT0mZH5ivo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b38450a250477ea27e45b5df4291a30ca2daf43e --- /dev/null +++ b/annotations_1/VmT0mZH5ivo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 20.55], [22.0, 25.02], [26.0, 28.49], [30.0, 37.34], [39.0, 70.66], [75.0, 119.26], [120.0, 123.4], [124.0, 132.48], [133.0, 147.66], [148.0, 148.81], [150.0, 151.31], [152.0, 154.26], [156.0, 164.51], [171.0, 235.72]], "keep_status": [true, true, true, true, false, false, true, true, true, false, false, false, true, false], "silence_prob": [34.41, 42.22, 41.3, 36.87, 0.0, 0.0, 38.49, 29.28, 28.98, 0.0, 0.0, 42.96, 29.67, 0.0], "audiomae_on_audioset": [[["hum", 25.86], ["mains hum", 22.68], ["music", 14.78]], [["music", 22.12], ["speech", 17.9], ["foghorn", 7.48]], [["music", 25.63], ["hum", 5.37], ["throbbing", 4.76]], [["hum", 18.58], ["music", 18.24], ["mains hum", 17.44]], null, null, [["mains hum", 35.93], ["hum", 21.21], ["fly, housefly", 8.83]], [["music", 24.22], ["throbbing", 22.98], ["hum", 12.05]], [["didgeridoo", 37.68], ["throbbing", 11.46], ["music", 10.63]], null, null, [["music", 65.95], ["musical instrument", 5.41], ["theremin", 3.25]], [["music", 31.83], ["didgeridoo", 14.04], ["hum", 10.21]], null], "duration": [3.55, 3.02, 2.49, 7.34, 31.66, 44.26, 3.4, 8.48, 14.66, 0.81, 1.31, 2.26, 8.51, 64.72]} \ No newline at end of file diff --git a/annotations_1/VmZ1ni2IDdo_filtered.json b/annotations_1/VmZ1ni2IDdo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37b6f05b7ec5fac2c58a4355859576a294fc6855 --- /dev/null +++ b/annotations_1/VmZ1ni2IDdo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.82], [9.0, 9.78], [18.0, 18.4], [20.0, 20.53], [22.0, 22.5], [25.0, 24.78], [35.0, 34.89], [39.0, 39.33], [43.0, 44.93], [56.0, 56.03], [60.0, 61.47], [73.0, 73.67], [79.0, 80.08], [93.0, 93.41], [94.0, 95.25], [96.0, 97.21], [99.0, 99.77], [101.0, 101.43], [104.0, 104.13], [106.0, 106.49], [112.0, 114.29], [117.0, 117.0], [120.0, 120.18], [122.0, 123.74], [128.0, 131.18], [132.0, 132.04], [132.0, 144.29], [147.0, 149.98], [150.0, 151.53], [158.0, 160.98], [161.0, 161.03], [161.0, 161.13], [161.0, 162.28], [165.0, 165.35], [167.0, 167.86], [168.0, 169.48], [173.0, 176.89], [178.0, 178.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.96, 0.0, 0.0, 0.0, 52.05, 0.0, 39.47, 47.66, 0.0, 52.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.42], ["boing", 26.79], ["didgeridoo", 12.36]], null, null, null, null, null, [["hum", 39.91], ["mains hum", 32.11], ["throbbing", 16.38]], [["music", 36.39], ["didgeridoo", 11.61], ["buzz", 5.95]], null, null, null, null, null, null, null, null, [["music", 52.01], ["fly, housefly", 6.3], ["didgeridoo", 4.23]], null], "duration": [0.82, 0.78, 0.4, 0.53, 0.5, -0.22, -0.11, 0.33, 1.93, 0.03, 1.47, 0.67, 1.08, 0.41, 1.25, 1.21, 0.77, 0.43, 0.13, 0.49, 2.29, 0.0, 0.18, 1.74, 3.18, 0.04, 12.29, 2.98, 1.53, 2.98, 0.03, 0.13, 1.28, 0.35, 0.86, 1.48, 3.89, 0.5]} \ No newline at end of file diff --git a/annotations_1/Vmo12BffgQc_filtered.json b/annotations_1/Vmo12BffgQc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d6a4c0a4390ae22aa7166d94f335f5026fbccc9 --- /dev/null +++ b/annotations_1/Vmo12BffgQc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.79], [11.0, 11.65], [15.0, 15.03], [16.0, 21.17], [23.0, 23.28], [27.0, 33.39], [47.0, 50.06], [51.0, 53.59], [59.0, 60.29], [62.0, 63.22], [65.0, 78.43], [81.0, 82.32], [84.0, 87.18], [90.0, 90.85], [92.0, 93.45], [94.0, 94.95], [96.0, 96.74], [99.0, 99.33], [103.0, 104.23], [106.0, 106.54], [110.0, 110.74], [120.0, 121.61], [124.0, 125.04], [127.0, 126.91], [128.0, 129.32], [130.0, 131.87], [139.0, 143.38], [147.0, 147.88]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.1, 0.0, 39.44, 99.97, 100.0, 0.0, 0.0, 91.81, 0.0, 78.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.51, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 40.63], ["electric piano", 11.4], ["keyboard (musical)", 8.35]], null, [["music", 33.73], ["cello", 10.52], ["double bass", 5.99]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 0.65, 0.03, 5.17, 0.28, 6.39, 3.06, 2.59, 1.29, 1.22, 13.43, 1.32, 3.18, 0.85, 1.45, 0.95, 0.74, 0.33, 1.23, 0.54, 0.74, 1.61, 1.04, -0.09, 1.32, 1.87, 4.38, 0.88]} \ No newline at end of file diff --git a/annotations_1/Vn5WazNB5sU_filtered.json b/annotations_1/Vn5WazNB5sU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb6ad203dd8924e60f004ba97a3b87ce14b6176e --- /dev/null +++ b/annotations_1/Vn5WazNB5sU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.73], [3.0, 10.77], [11.0, 16.88], [18.0, 31.45], [36.0, 36.61], [41.0, 41.49], [42.0, 60.91], [62.0, 71.95], [74.0, 74.43], [80.0, 87.37], [94.0, 100.35], [104.0, 104.63], [111.0, 118.15], [119.0, 128.48], [130.0, 148.78], [151.0, 161.03], [161.0, 164.91], [167.0, 167.51]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, true, true, false, false, true, false], "silence_prob": [0.0, 30.41, 30.04, 29.29, 0.0, 0.0, 29.92, 31.85, 0.0, 28.69, 30.9, 0.0, 29.42, 29.32, 28.77, 28.19, 31.9, 0.0], "audiomae_on_audioset": [null, [["throbbing", 68.32], ["hum", 21.65], ["speech", 3.72]], [["throbbing", 40.63], ["hum", 38.29], ["music", 7.37]], [["speech", 36.6], ["music", 32.49], ["throbbing", 6.43]], null, null, [["music", 37.26], ["fly, housefly", 18.54], ["didgeridoo", 12.82]], [["hum", 42.55], ["music", 20.7], ["throbbing", 20.61]], null, [["mains hum", 43.24], ["hum", 40.75], ["throbbing", 3.72]], [["music", 28.8], ["speech", 19.28], ["throbbing", 17.16]], null, [["music", 29.96], ["hum", 24.94], ["mains hum", 12.29]], [["music", 34.64], ["hum", 16.17], ["throbbing", 13.74]], [["music", 31.95], ["throbbing", 23.25], ["hum", 22.1]], [["music", 77.86], ["throbbing", 10.42], ["hum", 4.08]], [["hum", 26.47], ["music", 22.77], ["sidetone", 11.1]], null], "duration": [1.73, 7.77, 5.88, 13.45, 0.61, 0.49, 18.91, 9.95, 0.43, 7.37, 6.35, 0.63, 7.15, 9.48, 18.78, 10.03, 3.91, 0.51]} \ No newline at end of file diff --git a/annotations_1/Vnp8CkPERus_filtered.json b/annotations_1/Vnp8CkPERus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de5971da5d5eb8a36791d983c28688affdac38fe --- /dev/null +++ b/annotations_1/Vnp8CkPERus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.14], [4.0, 11.94], [14.0, 53.67], [57.0, 70.16], [71.0, 71.83], [73.0, 73.65], [77.0, 78.97], [82.0, 82.86], [85.0, 92.18], [93.0, 95.77], [97.0, 103.91], [105.0, 106.05], [110.0, 115.38], [117.0, 118.13], [118.0, 120.16], [121.0, 125.41], [126.0, 126.45]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 31.43, 0.0, 39.7, 0.0, 0.0, 0.0, 0.0, 71.57, 64.52, 51.99, 0.0, 58.38, 0.0, 34.54, 33.95, 0.0], "audiomae_on_audioset": [null, [["hum", 50.21], ["mains hum", 28.67], ["music", 11.6]], null, [["music", 37.26], ["throbbing", 12.34], ["animal", 12.24]], null, null, null, null, null, null, null, null, null, null, [["speech", 38.58], ["music", 9.85], ["mains hum", 9.33]], [["mains hum", 23.24], ["hum", 22.27], ["speech", 11.61]], null], "duration": [0.14, 7.94, 39.67, 13.16, 0.83, 0.65, 1.97, 0.86, 7.18, 2.77, 6.91, 1.05, 5.38, 1.13, 2.16, 4.41, 0.45]} \ No newline at end of file diff --git a/annotations_1/VohdBtnMchg_filtered.json b/annotations_1/VohdBtnMchg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ece010daab1638f272b88f959ed38dae8921fe52 --- /dev/null +++ b/annotations_1/VohdBtnMchg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 41.74], [43.0, 43.58], [46.0, 46.36], [48.0, 49.4], [50.0, 53.2], [54.0, 54.31], [55.0, 55.66], [57.0, 58.65], [59.0, 60.25], [61.0, 63.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 45.75, 0.0, 0.0, 0.0, 0.0, 31.5], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 50.87], ["mains hum", 13.1], ["hum", 11.88]], null, null, null, null, [["theremin", 76.95], ["music", 20.15], ["musical instrument", 0.61]]], "duration": [1.74, 0.58, 0.36, 1.4, 3.2, 0.31, 0.66, 1.65, 1.25, 2.44]} \ No newline at end of file diff --git a/annotations_1/VqAqUVcgQdE_filtered.json b/annotations_1/VqAqUVcgQdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75ebde177e262663c0fadfbdd8281c16499e51ed --- /dev/null +++ b/annotations_1/VqAqUVcgQdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.27], [4.0, 17.36], [21.0, 23.68], [26.0, 54.85], [57.0, 70.16], [74.0, 78.24], [79.0, 79.52], [81.0, 87.17], [92.0, 97.33], [98.0, 104.53], [108.0, 117.63], [119.0, 122.22], [134.0, 148.0], [153.0, 164.46], [169.0, 169.38], [172.0, 195.51], [197.0, 198.54], [211.0, 210.95], [212.0, 212.94], [216.0, 216.9], [229.0, 233.22], [235.0, 236.26]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 29.55, 43.9, 29.58, 32.17, 30.67, 0.0, 30.39, 30.66, 30.61, 32.81, 34.86, 30.92, 30.66, 0.0, 29.98, 0.0, 0.0, 0.0, 0.0, 36.01, 0.0], "audiomae_on_audioset": [null, [["music", 55.22], ["whack, thwack", 6.7], ["speech", 4.66]], [["hum", 30.34], ["music", 21.57], ["throbbing", 19.5]], [["music", 74.34], ["electronic music", 5.27], ["throbbing", 3.69]], [["music", 60.17], ["boing", 23.32], ["buzz", 1.63]], [["music", 56.16], ["cacophony", 11.6], ["throbbing", 8.42]], null, [["music", 45.7], ["throbbing", 15.57], ["hum", 8.4]], [["boing", 62.42], ["music", 18.19], ["sound effect", 2.07]], [["music", 69.82], ["boing", 9.78], ["speech", 9.76]], [["music", 47.78], ["speech", 12.31], ["hum", 11.63]], [["music", 68.92], ["sidetone", 3.36], ["musical instrument", 3.33]], [["music", 45.09], ["hum", 15.61], ["throbbing", 10.81]], [["music", 58.19], ["throbbing", 3.36], ["sound effect", 2.38]], null, [["music", 38.62], ["hum", 12.08], ["speech", 10.61]], null, null, null, null, [["music", 34.89], ["noise", 9.5], ["grunt", 7.42]], null], "duration": [1.27, 13.36, 2.68, 28.85, 13.16, 4.24, 0.52, 6.17, 5.33, 6.53, 9.63, 3.22, 14.0, 11.46, 0.38, 23.51, 1.54, -0.05, 0.94, 0.9, 4.22, 1.26]} \ No newline at end of file diff --git a/annotations_1/VqZAfqVCEnk_filtered.json b/annotations_1/VqZAfqVCEnk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e452f84078726df3841689795cd6a5901798773 --- /dev/null +++ b/annotations_1/VqZAfqVCEnk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.72], [15.0, 18.79], [21.0, 25.96], [29.0, 34.69], [38.0, 92.08], [92.0, 94.26], [96.0, 106.71], [109.0, 119.06], [120.0, 122.18]], "keep_status": [true, false, false, true, false, false, true, false, false], "silence_prob": [37.17, 31.25, 31.27, 30.39, 0.0, 56.55, 35.28, 45.02, 42.35], "audiomae_on_audioset": [[["music", 38.56], ["speech", 12.28], ["synthesizer", 11.32]], [["music", 69.84], ["didgeridoo", 3.54], ["throbbing", 3.45]], [["music", 72.57], ["didgeridoo", 6.68], ["throbbing", 2.08]], [["music", 47.29], ["boing", 7.84], ["fart", 6.06]], null, null, [["animal", 36.29], ["bow-wow", 14.33], ["domestic animals, pets", 11.54]], [["music", 33.41], ["hum", 30.83], ["mains hum", 13.58]], [["music", 51.35], ["hum", 14.62], ["throbbing", 6.33]]], "duration": [2.72, 3.79, 4.96, 5.69, 54.08, 2.26, 10.71, 10.06, 2.18]} \ No newline at end of file diff --git a/annotations_1/VrXUYjVCX2o_filtered.json b/annotations_1/VrXUYjVCX2o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b94cf7e10afd578cf5385abc2a89f7ea6f3e3c50 --- /dev/null +++ b/annotations_1/VrXUYjVCX2o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.3], [9.0, 8.92], [16.0, 16.14], [18.0, 18.05], [23.0, 23.95], [28.0, 28.26], [29.0, 29.78], [35.0, 41.57], [44.0, 43.95], [46.0, 51.49], [52.0, 79.54], [80.0, 81.46], [83.0, 83.42], [85.0, 84.74], [85.0, 85.67]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.57, 0.0, 73.97, 46.29, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 23.22], ["sound effect", 12.81], ["whale vocalization", 12.05]], null, null, [["speech", 31.42], ["fly, housefly", 10.83], ["hum", 9.22]], null, null, null, null], "duration": [0.3, -0.08, 0.14, 0.05, 0.95, 0.26, 0.78, 6.57, -0.05, 5.49, 27.54, 1.46, 0.42, -0.26, 0.67]} \ No newline at end of file diff --git a/annotations_1/Vro5qtVA4PE_filtered.json b/annotations_1/Vro5qtVA4PE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0847cedf76ddeefa1d5abdaa620ad0ccee98884f --- /dev/null +++ b/annotations_1/Vro5qtVA4PE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [24.0, 25.07], [25.0, 26.49], [30.0, 55.26], [62.0, 65.38], [67.0, 70.98], [76.0, 78.9], [81.0, 84.48], [85.0, 92.11], [93.0, 100.25], [102.0, 109.61], [112.0, 121.32], [128.0, 140.04], [140.0, 141.07], [146.0, 146.8]], "keep_status": [false, false, false, true, true, true, true, false, true, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.65, 29.99, 37.19, 31.38, 32.32, 32.47, 30.86, 31.58, 31.59, 39.12, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 19.9], ["livestock, farm animals, working animals", 14.23], ["sheep", 12.55]], [["music", 37.97], ["throbbing", 18.25], ["hum", 8.34]], [["music", 29.96], ["hum", 26.26], ["mains hum", 7.88]], [["music", 45.45], ["speech", 15.9], ["theremin", 6.94]], [["mosquito", 43.42], ["fly, housefly", 20.21], ["music", 16.3]], [["music", 39.65], ["moo", 9.93], ["livestock, farm animals, working animals", 7.47]], [["music", 18.49], ["percussion", 13.22], ["drum", 8.95]], [["music", 80.36], ["musical instrument", 2.04], ["didgeridoo", 1.35]], [["music", 28.41], ["cattle, bovinae", 9.71], ["fly, housefly", 9.37]], [["music", 75.25], ["didgeridoo", 4.02], ["musical instrument", 2.58]], null, null], "duration": [0.43, 1.07, 1.49, 25.26, 3.38, 3.98, 2.9, 3.48, 7.11, 7.25, 7.61, 9.32, 12.04, 1.07, 0.8]} \ No newline at end of file diff --git a/annotations_1/Vs0CShp6HFA_filtered.json b/annotations_1/Vs0CShp6HFA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8dc7b165d0034bb4593ccd22c83c5447bd6aa2c6 --- /dev/null +++ b/annotations_1/Vs0CShp6HFA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.78], [3.0, 19.65], [22.0, 28.39], [30.0, 30.67], [34.0, 33.96], [41.0, 41.66], [46.0, 46.55], [51.0, 52.05], [62.0, 64.45], [69.0, 69.52], [70.0, 88.6], [95.0, 97.75], [103.0, 104.35], [117.0, 120.55], [124.0, 124.65], [133.0, 133.05], [134.0, 134.49], [141.0, 143.82], [146.0, 146.55], [149.0, 150.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 34.48, 34.91, 0.0, 0.0, 0.0, 0.0, 0.0, 55.67, 0.0, 34.55, 33.75, 0.0, 31.47, 0.0, 0.0, 0.0, 57.64, 0.0, 0.0], "audiomae_on_audioset": [null, [["sidetone", 47.81], ["music", 24.35], ["speech", 14.1]], [["music", 67.18], ["speech", 8.97], ["throbbing", 2.11]], null, null, null, null, null, null, null, [["music", 47.45], ["speech", 34.46], ["didgeridoo", 5.23]], [["cattle, bovinae", 43.29], ["moo", 40.52], ["livestock, farm animals, working animals", 12.66]], null, [["livestock, farm animals, working animals", 30.32], ["cattle, bovinae", 15.36], ["breaking", 8.99]], null, null, null, null, null, null], "duration": [-0.22, 16.65, 6.39, 0.67, -0.04, 0.66, 0.55, 1.05, 2.45, 0.52, 18.6, 2.75, 1.35, 3.55, 0.65, 0.05, 0.49, 2.82, 0.55, 1.25]} \ No newline at end of file diff --git a/annotations_1/VuUzda9kvJA_filtered.json b/annotations_1/VuUzda9kvJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c629a00e5301029a163183ddf11abe1175f19ca0 --- /dev/null +++ b/annotations_1/VuUzda9kvJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.64], [14.0, 16.16], [16.0, 17.1], [18.0, 20.75], [27.0, 38.5], [41.0, 42.33], [43.0, 45.94], [47.0, 50.21], [51.0, 68.89], [70.0, 132.38], [138.0, 139.28]], "keep_status": [true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [32.8, 97.22, 0.0, 70.16, 31.31, 0.0, 31.29, 30.73, 30.52, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.32], ["sidetone", 14.13], ["electronic music", 6.06]], null, null, null, [["music", 62.16], ["animal", 5.54], ["domestic animals, pets", 3.66]], null, [["speech", 36.25], ["rumble", 7.61], ["vehicle", 6.23]], [["fly, housefly", 21.35], ["insect", 15.5], ["speech", 10.84]], [["music", 44.96], ["throbbing", 14.91], ["hum", 10.37]], null, null], "duration": [2.64, 2.16, 1.1, 2.75, 11.5, 1.33, 2.94, 3.21, 17.89, 62.38, 1.28]} \ No newline at end of file diff --git a/annotations_1/Vv9KJYUnVvA_filtered.json b/annotations_1/Vv9KJYUnVvA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16eea391d422fa42fc3d9a7cfe4b733de6c913fd --- /dev/null +++ b/annotations_1/Vv9KJYUnVvA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 40.22], [42.0, 54.21], [55.0, 56.93], [58.0, 64.47], [65.0, 88.11], [89.0, 91.2], [92.0, 94.1], [95.0, 96.4], [97.0, 98.68], [99.0, 100.62], [102.0, 103.15], [106.0, 112.51], [114.0, 121.78], [123.0, 130.98], [131.0, 145.44], [147.0, 210.98], [212.0, 212.19], [213.0, 225.88], [227.0, 231.79], [236.0, 236.76], [237.0, 283.98], [284.0, 284.01]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [37.1, 31.71, 0.0, 31.63, 52.92, 62.47, 41.38, 0.0, 0.0, 0.0, 0.0, 44.57, 52.98, 30.88, 37.88, 0.0, 0.0, 30.95, 30.17, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 46.92], ["musical instrument", 11.81], ["effects unit", 9.78]], [["speech", 65.59], ["whale vocalization", 8.29], ["sidetone", 3.28]], null, [["music", 49.26], ["stomach rumble", 20.27], ["speech", 5.94]], null, null, [["music", 45.85], ["hum", 6.05], ["throbbing", 5.36]], null, null, null, null, [["music", 62.75], ["fart", 12.1], ["guitar", 2.28]], null, [["music", 40.86], ["mains hum", 11.6], ["hum", 8.53]], [["music", 81.48], ["electronic music", 1.74], ["animal", 1.51]], null, null, [["music", 50.47], ["hum", 7.58], ["mains hum", 5.49]], [["music", 70.51], ["whale vocalization", 4.3], ["theremin", 2.63]], null, null, null], "duration": [3.22, 12.21, 1.93, 6.47, 23.11, 2.2, 2.1, 1.4, 1.68, 1.62, 1.15, 6.51, 7.78, 7.98, 14.44, 63.98, 0.19, 12.88, 4.79, 0.76, 46.98, 0.01]} \ No newline at end of file diff --git a/annotations_1/VvNX7pOAK58_filtered.json b/annotations_1/VvNX7pOAK58_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5965058c62b8ad590d78857335e177abc0fb002a --- /dev/null +++ b/annotations_1/VvNX7pOAK58_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 15.7], [17.0, 17.56], [27.0, 27.87], [30.0, 59.9], [64.0, 70.23], [74.0, 76.45], [103.0, 113.34], [115.0, 120.93], [125.0, 125.41], [126.0, 136.56], [138.0, 139.14], [140.0, 145.77], [149.0, 156.91], [161.0, 163.63], [165.0, 165.64], [167.0, 168.51], [175.0, 185.09], [186.0, 211.96], [213.0, 213.14], [214.0, 219.0], [221.0, 237.0], [238.0, 244.44], [245.0, 246.27], [248.0, 248.24], [251.0, 252.07], [255.0, 256.8], [259.0, 261.18]], "keep_status": [true, false, false, true, true, false, true, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.03, 0.0, 0.0, 29.36, 29.89, 31.44, 29.39, 29.32, 0.0, 29.53, 0.0, 29.87, 29.56, 29.14, 0.0, 0.0, 29.4, 29.7, 0.0, 30.43, 29.6, 29.47, 0.0, 0.0, 0.0, 0.0, 41.48], "audiomae_on_audioset": [[["music", 48.01], ["throbbing", 8.46], ["hum", 6.76]], null, null, [["livestock, farm animals, working animals", 27.35], ["music", 19.85], ["cattle, bovinae", 9.52]], [["speech", 48.14], ["music", 18.05], ["foghorn", 3.62]], [["music", 68.66], ["throbbing", 4.65], ["sonar", 1.73]], [["music", 43.63], ["animal", 8.66], ["groan", 6.3]], [["music", 55.46], ["speech", 6.23], ["throbbing", 3.98]], null, [["music", 27.98], ["speech", 18.08], ["throbbing", 15.42]], null, [["skateboard", 40.16], ["music", 27.85], ["speech", 6.62]], [["music", 50.74], ["speech", 30.22], ["electronic music", 2.96]], [["crowd", 24.89], ["throbbing", 9.38], ["music", 8.57]], null, null, [["speech", 55.81], ["music", 23.53], ["animal", 2.47]], [["music", 51.53], ["explosion", 11.91], ["speech", 9.21]], null, [["throbbing", 41.64], ["music", 32.78], ["hum", 4.86]], [["music", 47.98], ["mains hum", 14.61], ["hum", 10.79]], [["music", 33.01], ["throbbing", 24.33], ["hum", 23.62]], null, null, null, null, [["music", 74.71], ["throbbing", 4.14], ["soundtrack music", 2.25]]], "duration": [12.7, 0.56, 0.87, 29.9, 6.23, 2.45, 10.34, 5.93, 0.41, 10.56, 1.14, 5.77, 7.91, 2.63, 0.64, 1.51, 10.09, 25.96, 0.14, 5.0, 16.0, 6.44, 1.27, 0.24, 1.07, 1.8, 2.18]} \ No newline at end of file diff --git a/annotations_1/VvfIdmaKwfQ_filtered.json b/annotations_1/VvfIdmaKwfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c262a7850985e5a07fb93e75dd4f646308bc56f --- /dev/null +++ b/annotations_1/VvfIdmaKwfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.04], [27.0, 28.49], [29.0, 31.73], [45.0, 47.68], [52.0, 52.12], [56.0, 56.19], [57.0, 70.46], [75.0, 75.36], [82.0, 83.0], [83.0, 84.37], [92.0, 124.88], [126.0, 126.47], [131.0, 131.38], [133.0, 134.96], [146.0, 146.16], [146.0, 146.26], [148.0, 148.05]], "keep_status": [true, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.47, 0.0, 31.78, 39.85, 0.0, 0.0, 31.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.19], ["speech", 22.39], ["musical instrument", 2.99]], null, [["music", 22.88], ["carnatic music", 11.97], ["speech", 10.86]], [["music", 34.49], ["speech", 12.71], ["fly, housefly", 4.7]], null, null, [["music", 51.17], ["hum", 5.3], ["throbbing", 4.27]], null, null, null, null, null, null, null, null, null, null], "duration": [2.04, 1.49, 2.73, 2.68, 0.12, 0.19, 13.46, 0.36, 1.0, 1.37, 32.88, 0.47, 0.38, 1.96, 0.16, 0.26, 0.05]} \ No newline at end of file diff --git a/annotations_1/VwkGKFFk-F4_filtered.json b/annotations_1/VwkGKFFk-F4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0474ddf6e798d0f01b8b21bc740ae7be62025a73 --- /dev/null +++ b/annotations_1/VwkGKFFk-F4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.97], [4.0, 4.43], [5.0, 5.76], [8.0, 9.85], [13.0, 15.09], [15.0, 17.66], [18.0, 19.43], [21.0, 25.46], [27.0, 29.37], [38.0, 42.74], [48.0, 49.1], [53.0, 53.13], [53.0, 54.57], [60.0, 62.7], [64.0, 65.47], [69.0, 71.27], [73.0, 80.5], [83.0, 83.64], [84.0, 86.64], [99.0, 99.96], [110.0, 111.06], [112.0, 112.65], [115.0, 114.84], [116.0, 116.6], [119.0, 119.33], [122.0, 123.67], [124.0, 125.49], [127.0, 128.29], [132.0, 133.61], [134.0, 135.63], [144.0, 161.15], [163.0, 165.11], [167.0, 168.15], [170.0, 172.76], [176.0, 178.58], [181.0, 182.19], [184.0, 184.11], [187.0, 189.45], [193.0, 194.59], [196.0, 197.9], [199.0, 199.64], [200.0, 202.26], [204.0, 205.31], [207.0, 208.52], [210.0, 211.03], [214.0, 214.93], [217.0, 218.29], [219.0, 220.78], [222.0, 223.4], [225.0, 226.81], [227.0, 227.45], [228.0, 231.38], [235.0, 236.49], [237.0, 239.26], [239.0, 245.57], [246.0, 249.79], [250.0, 252.78], [255.0, 256.98], [260.0, 260.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.95, 94.66, 0.0, 99.78, 99.96, 99.76, 0.0, 0.0, 0.0, 98.01, 0.0, 93.76, 66.63, 0.0, 64.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 99.99, 0.0, 95.91, 99.84, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 0.0, 96.42, 99.78, 98.36, 71.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 0.43, 0.76, 1.85, 2.09, 2.66, 1.43, 4.46, 2.37, 4.74, 1.1, 0.13, 1.57, 2.7, 1.47, 2.27, 7.5, 0.64, 2.64, 0.96, 1.06, 0.65, -0.16, 0.6, 0.33, 1.67, 1.49, 1.29, 1.61, 1.63, 17.15, 2.11, 1.15, 2.76, 2.58, 1.19, 0.11, 2.45, 1.59, 1.9, 0.64, 2.26, 1.31, 1.52, 1.03, 0.93, 1.29, 1.78, 1.4, 1.81, 0.45, 3.38, 1.49, 2.26, 6.57, 3.79, 2.78, 1.98, 0.58]} \ No newline at end of file diff --git a/annotations_1/VwlkxIN9tfQ_filtered.json b/annotations_1/VwlkxIN9tfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c96250d0d37a558eaa6f86151f88246ce6c21d9e --- /dev/null +++ b/annotations_1/VwlkxIN9tfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 31.95], [32.0, 32.27], [32.0, 39.82], [41.0, 41.44], [41.0, 65.97], [72.0, 72.25], [75.0, 76.64], [79.0, 83.42], [92.0, 92.45], [94.0, 119.06]], "keep_status": [false, false, true, false, true, false, false, false, false, false], "silence_prob": [30.61, 0.0, 29.98, 0.0, 48.1, 0.0, 0.0, 60.51, 0.0, 65.44], "audiomae_on_audioset": [[["music", 44.93], ["speech", 21.85], ["electronic music", 5.51]], null, [["speech", 52.92], ["explosion", 8.98], ["eruption", 7.0]], null, [["music", 37.27], ["explosion", 11.33], ["hum", 4.6]], null, null, null, null, null], "duration": [27.95, 0.27, 7.82, 0.44, 24.97, 0.25, 1.64, 4.42, 0.45, 25.06]} \ No newline at end of file diff --git a/annotations_1/Vx0MQxIFBW8_filtered.json b/annotations_1/Vx0MQxIFBW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55e5bf2441228d255b202896fc1027f60e1b95ba --- /dev/null +++ b/annotations_1/Vx0MQxIFBW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [12.0, 17.04], [18.0, 19.82], [21.0, 24.02], [29.0, 32.88], [34.0, 35.67], [37.0, 39.53], [43.0, 43.66], [46.0, 46.89], [49.0, 54.75], [60.0, 60.45], [66.0, 68.01], [69.0, 72.87], [76.0, 76.25], [77.0, 82.7], [85.0, 89.14], [92.0, 91.84], [94.0, 95.5], [106.0, 106.62], [107.0, 112.01], [113.0, 113.49], [118.0, 124.75], [129.0, 130.32], [132.0, 132.22], [133.0, 132.56], [133.0, 132.65], [133.0, 132.83], [133.0, 134.94], [139.0, 139.26], [141.0, 141.66], [149.0, 160.51], [163.0, 173.52], [175.0, 184.87], [188.0, 212.01]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 72.01, 0.0, 86.09, 67.51, 0.0, 37.93, 0.0, 0.0, 46.61, 0.0, 71.87, 55.67, 0.0, 47.66, 41.85, 0.0, 0.0, 0.0, 42.86, 0.0, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.43, 29.77, 30.31, 29.68], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 31.18], ["boing", 19.32], ["bow-wow", 5.16]], null, null, [["music", 38.79], ["didgeridoo", 13.78], ["throbbing", 9.48]], null, null, null, null, [["speech", 34.97], ["music", 19.77], ["outside, rural or natural", 5.66]], [["telephone dialing, dtmf", 15.25], ["music", 10.69], ["radio", 10.17]], null, null, null, [["music", 67.66], ["guitar", 8.87], ["musical instrument", 6.56]], null, [["music", 68.08], ["mosquito", 4.44], ["fly, housefly", 2.78]], null, null, null, null, null, null, null, null, [["music", 66.23], ["whack, thwack", 7.01], ["speech", 6.77]], [["music", 62.13], ["speech", 8.1], ["groan", 3.55]], [["music", 74.2], ["boing", 5.72], ["reggae", 4.99]], [["livestock, farm animals, working animals", 30.22], ["cowbell", 15.28], ["cattle, bovinae", 14.86]]], "duration": [0.45, 5.04, 1.82, 3.02, 3.88, 1.67, 2.53, 0.66, 0.89, 5.75, 0.45, 2.01, 3.87, 0.25, 5.7, 4.14, -0.16, 1.5, 0.62, 5.01, 0.49, 6.75, 1.32, 0.22, -0.44, -0.35, -0.17, 1.94, 0.26, 0.66, 11.51, 10.52, 9.87, 24.01]} \ No newline at end of file diff --git a/annotations_1/Vx3I6XjqCho_filtered.json b/annotations_1/Vx3I6XjqCho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/Vx3I6XjqCho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/VxKyoOxyrdU_filtered.json b/annotations_1/VxKyoOxyrdU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7ede030b7a685d4d1f68eb32d3c85e8bdb98b8b --- /dev/null +++ b/annotations_1/VxKyoOxyrdU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.74], [24.0, 32.46], [34.0, 34.89], [35.0, 35.9], [54.0, 55.58], [61.0, 66.36], [68.0, 69.72], [71.0, 82.05], [84.0, 88.42], [90.0, 92.57], [95.0, 98.52]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 38.25, 0.0, 0.0, 0.0, 37.0, 0.0, 47.62, 60.6, 99.05, 83.16], "audiomae_on_audioset": [null, [["music", 61.17], ["throbbing", 16.4], ["hum", 7.55]], null, null, null, [["music", 57.83], ["didgeridoo", 7.06], ["musical instrument", 4.53]], null, [["mains hum", 39.73], ["hum", 28.32], ["sidetone", 12.93]], null, null, null], "duration": [0.74, 8.46, 0.89, 0.9, 1.58, 5.36, 1.72, 11.05, 4.42, 2.57, 3.52]} \ No newline at end of file diff --git a/annotations_1/VzXMcMcBwA8_filtered.json b/annotations_1/VzXMcMcBwA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51bcf15353d108c6600aa8da02880ab826b9cb1d --- /dev/null +++ b/annotations_1/VzXMcMcBwA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.67], [16.0, 21.95], [22.0, 24.14], [30.0, 30.23], [30.0, 31.02], [33.0, 32.9], [34.0, 33.99], [36.0, 36.36], [37.0, 37.29], [46.0, 52.66], [53.0, 62.7], [65.0, 65.72], [71.0, 71.9], [74.0, 74.88], [81.0, 82.54], [83.0, 83.32], [84.0, 84.01], [89.0, 89.43], [91.0, 91.18], [92.0, 92.89], [95.0, 96.6], [99.0, 102.15], [105.0, 128.39], [131.0, 131.6], [132.0, 131.73], [132.0, 149.76], [153.0, 153.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [41.28, 32.01, 35.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.18, 32.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.65, 94.52, 0.0, 0.0, 31.16, 0.0], "audiomae_on_audioset": [[["music", 71.85], ["throbbing", 4.5], ["musical instrument", 4.16]], [["music", 55.95], ["musical instrument", 12.55], ["trombone", 9.56]], [["music", 46.92], ["trombone", 16.67], ["brass instrument", 8.95]], null, null, null, null, null, null, [["speech", 44.67], ["music", 31.43], ["sidetone", 5.65]], [["music", 66.77], ["trombone", 10.92], ["brass instrument", 4.87]], null, null, null, null, null, null, null, null, null, null, [["explosion", 24.0], ["eruption", 17.71], ["noise", 10.59]], null, null, null, [["gong", 19.74], ["music", 11.62], ["electronic music", 6.35]], null], "duration": [4.67, 5.95, 2.14, 0.23, 1.02, -0.1, -0.01, 0.36, 0.29, 6.66, 9.7, 0.72, 0.9, 0.88, 1.54, 0.32, 0.01, 0.43, 0.18, 0.89, 1.6, 3.15, 23.39, 0.6, -0.27, 17.76, 0.57]} \ No newline at end of file diff --git a/annotations_1/W-7hoLpXFXE_filtered.json b/annotations_1/W-7hoLpXFXE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a36162ad55959e9f42c0ff22dab4c1a021a4281 --- /dev/null +++ b/annotations_1/W-7hoLpXFXE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.5], [14.0, 20.83], [32.0, 31.67], [40.0, 41.82], [42.0, 43.19], [45.0, 45.13], [47.0, 49.45], [51.0, 56.56], [60.0, 60.39], [61.0, 67.44], [68.0, 70.34], [72.0, 90.32], [93.0, 107.38], [109.0, 116.58]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 36.41, 0.0, 0.0, 0.0, 0.0, 30.11, 33.39, 0.0, 30.85, 29.58, 30.3, 32.87, 83.16], "audiomae_on_audioset": [null, [["music", 81.04], ["synthesizer", 5.32], ["sidetone", 0.99]], null, null, null, null, [["music", 11.48], ["fixed-wing aircraft, airplane", 10.78], ["jet engine", 9.95]], [["music", 32.63], ["hum", 26.73], ["throbbing", 11.7]], null, [["music", 81.55], ["hum", 1.85], ["didgeridoo", 1.41]], [["music", 41.0], ["hum", 13.87], ["mains hum", 13.19]], [["music", 42.34], ["hum", 19.4], ["mains hum", 10.11]], [["hum", 45.28], ["throbbing", 23.02], ["mains hum", 18.07]], null], "duration": [1.5, 6.83, -0.33, 1.82, 1.19, 0.13, 2.45, 5.56, 0.39, 6.44, 2.34, 18.32, 14.38, 7.58]} \ No newline at end of file diff --git a/annotations_1/W-cZK60yWbY_filtered.json b/annotations_1/W-cZK60yWbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cc03f7a7655bc3a92a60c808a98baa98d062d94 --- /dev/null +++ b/annotations_1/W-cZK60yWbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.38], [8.0, 9.15], [11.0, 11.57], [18.0, 18.42], [22.0, 22.99], [27.0, 27.33], [37.0, 37.96], [40.0, 40.73], [43.0, 43.71], [47.0, 49.86], [59.0, 61.82], [63.0, 63.96], [65.0, 66.36], [72.0, 77.5], [82.0, 82.56], [85.0, 85.72], [87.0, 90.22], [93.0, 94.24], [96.0, 99.72], [101.0, 101.02], [103.0, 103.99], [107.0, 107.67], [113.0, 125.68], [127.0, 127.65], [129.0, 129.39], [131.0, 134.2], [136.0, 178.48], [182.0, 182.82], [185.0, 185.6], [187.0, 187.02]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [33.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.02, 43.87, 0.0, 0.0, 32.1, 0.0, 0.0, 53.59, 0.0, 29.16, 0.0, 0.0, 0.0, 29.53, 0.0, 0.0, 29.59, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 42.59], ["music", 34.91], ["speech", 4.97]], null, null, null, null, null, null, null, null, [["music", 47.77], ["noise", 10.87], ["throbbing", 7.01]], [["throbbing", 42.7], ["hum", 20.73], ["music", 14.95]], null, null, [["music", 42.38], ["gong", 20.84], ["electronic music", 8.93]], null, null, null, null, [["speech", 31.08], ["beatboxing", 17.06], ["whack, thwack", 3.97]], null, null, null, [["speech", 15.1], ["music", 11.39], ["rumble", 7.85]], null, null, [["hum", 33.38], ["mains hum", 24.1], ["music", 22.14]], null, null, null, null], "duration": [4.38, 1.15, 0.57, 0.42, 0.99, 0.33, 0.96, 0.73, 0.71, 2.86, 2.82, 0.96, 1.36, 5.5, 0.56, 0.72, 3.22, 1.24, 3.72, 0.02, 0.99, 0.67, 12.68, 0.65, 0.39, 3.2, 42.48, 0.82, 0.6, 0.02]} \ No newline at end of file diff --git a/annotations_1/W-rC7PEsItw_filtered.json b/annotations_1/W-rC7PEsItw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed869332f96f6db317fdbb8fdb333fe467fdb058 --- /dev/null +++ b/annotations_1/W-rC7PEsItw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 25.42], [27.0, 56.96], [58.0, 60.07], [62.0, 71.17], [72.0, 73.9], [75.0, 76.72], [78.0, 81.65], [82.0, 84.86], [86.0, 94.04], [96.0, 99.15], [100.0, 108.68], [110.0, 112.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.13, 99.48, 100.0, 100.0, 0.0, 0.0, 97.43, 94.95, 98.66, 99.76, 99.98, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [18.42, 29.96, 2.07, 9.17, 1.9, 1.72, 3.65, 2.86, 8.04, 3.15, 8.68, 2.6]} \ No newline at end of file diff --git a/annotations_1/W18J6bcq9YI_filtered.json b/annotations_1/W18J6bcq9YI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26a8341fb51c6a8c33ca11ef4bdfa824ff1b5c26 --- /dev/null +++ b/annotations_1/W18J6bcq9YI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.85], [19.0, 18.81], [35.0, 43.93], [58.0, 59.68], [61.0, 61.16], [65.0, 65.94], [67.0, 67.42], [70.0, 70.06], [70.0, 70.65], [74.0, 75.29], [79.0, 79.24], [80.0, 82.49], [84.0, 84.48], [94.0, 94.58], [102.0, 103.84], [105.0, 105.54], [107.0, 107.32], [112.0, 112.78], [116.0, 115.86], [116.0, 117.71], [119.0, 119.52], [121.0, 121.26], [128.0, 135.87], [138.0, 140.22], [142.0, 142.13], [149.0, 149.45], [151.0, 151.23], [152.0, 155.06], [159.0, 160.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 31.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.38, 65.67, 0.0, 0.0, 0.0, 30.03, 0.0], "audiomae_on_audioset": [null, null, [["music", 60.2], ["speech", 16.81], ["outside, rural or natural", 2.01]], null, null, null, null, null, null, null, null, [["speech", 61.31], ["beatboxing", 17.53], ["boing", 2.31]], null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 67.81], ["insect", 17.73], ["bee, wasp, etc.", 6.72]], null, null, null, null, [["speech", 52.89], ["whack, thwack", 8.88], ["fart", 7.05]], null], "duration": [0.85, -0.19, 8.93, 1.68, 0.16, 0.94, 0.42, 0.06, 0.65, 1.29, 0.24, 2.49, 0.48, 0.58, 1.84, 0.54, 0.32, 0.78, -0.14, 1.71, 0.52, 0.26, 7.87, 2.22, 0.13, 0.45, 0.23, 3.06, 1.74]} \ No newline at end of file diff --git a/annotations_1/W1c-QSe7uU0_filtered.json b/annotations_1/W1c-QSe7uU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb30e7b638867cd4cb3a6a2021e102a6cc5918ba --- /dev/null +++ b/annotations_1/W1c-QSe7uU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [8.0, 8.87], [11.0, 18.89], [20.0, 21.15], [22.0, 23.19], [25.0, 26.16], [29.0, 30.16], [35.0, 36.29], [37.0, 37.77], [40.0, 40.78], [42.0, 43.85], [48.0, 50.38], [57.0, 63.26], [64.0, 65.28], [67.0, 67.51], [69.0, 71.96], [74.0, 87.67], [95.0, 95.55], [98.0, 106.29], [107.0, 108.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.95, 89.19, 0.0, 0.0, 97.83, 84.25, 0.0, 40.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 44.7], ["throbbing", 26.63], ["mains hum", 11.49]], null], "duration": [0.43, 0.87, 7.89, 1.15, 1.19, 1.16, 1.16, 1.29, 0.77, 0.78, 1.85, 2.38, 6.26, 1.28, 0.51, 2.96, 13.67, 0.55, 8.29, 1.78]} \ No newline at end of file diff --git a/annotations_1/W1w1qcvdTi8_filtered.json b/annotations_1/W1w1qcvdTi8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fdb79c1aed09d10a089d43950bb24fab2db3611 --- /dev/null +++ b/annotations_1/W1w1qcvdTi8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 45.79], [50.0, 51.51], [52.0, 56.05], [59.0, 70.98], [72.0, 72.74], [73.0, 74.33], [74.0, 74.49], [77.0, 81.6], [85.0, 88.64], [89.0, 89.18], [90.0, 90.27], [92.0, 109.98]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.07, 29.9, 0.0, 0.0, 0.0, 29.64, 35.8, 0.0, 0.0, 30.52], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 25.65], ["livestock, farm animals, working animals", 23.59], ["moo", 11.23]], [["cattle, bovinae", 30.21], ["livestock, farm animals, working animals", 27.86], ["moo", 15.29]], null, null, null, [["livestock, farm animals, working animals", 40.6], ["cattle, bovinae", 40.02], ["moo", 16.41]], [["hum", 36.79], ["mains hum", 28.32], ["throbbing", 8.53]], null, null, [["speech", 57.05], ["mains hum", 12.83], ["hum", 7.68]]], "duration": [43.79, 1.51, 4.05, 11.98, 0.74, 1.33, 0.49, 4.6, 3.64, 0.18, 0.27, 17.98]} \ No newline at end of file diff --git a/annotations_1/W28kNzz50pw_filtered.json b/annotations_1/W28kNzz50pw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db2204923c6051948b959df43eb59bcfae01fa58 --- /dev/null +++ b/annotations_1/W28kNzz50pw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 91.18], [93.0, 93.85], [97.0, 98.37], [100.0, 109.38], [111.0, 116.06], [119.0, 157.86]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.91, 32.98, 0.0], "audiomae_on_audioset": [null, null, null, [["vehicle", 23.67], ["car", 16.56], ["music", 13.11]], [["music", 85.3], ["throbbing", 3.25], ["electronic music", 1.74]], null], "duration": [42.18, 0.85, 1.37, 9.38, 5.06, 38.86]} \ No newline at end of file diff --git a/annotations_1/W3x0ZxDSF38_filtered.json b/annotations_1/W3x0ZxDSF38_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4be625f2a7ad57fad639489e0112494fef6a8f0b --- /dev/null +++ b/annotations_1/W3x0ZxDSF38_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [10.0, 14.62], [20.0, 23.9], [28.0, 28.9], [34.0, 42.62], [46.0, 46.26], [47.0, 47.82], [48.0, 47.87], [48.0, 48.2], [48.0, 48.42], [48.0, 50.26], [53.0, 53.6], [56.0, 58.21], [58.0, 58.55], [59.0, 60.32], [60.0, 61.16], [62.0, 61.62], [62.0, 63.41], [65.0, 65.43], [66.0, 67.47], [69.0, 91.74], [98.0, 98.04], [100.0, 129.95]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.22, 36.16, 0.0, 31.68, 0.0, 0.0, 0.0, 0.0, 0.0, 38.56, 0.0, 38.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.38, 0.0, 30.38], "audiomae_on_audioset": [null, [["music", 41.82], ["theremin", 19.65], ["synthesizer", 9.1]], [["music", 57.41], ["whale vocalization", 4.49], ["synthesizer", 3.58]], null, [["whack, thwack", 22.58], ["fly, housefly", 21.49], ["mosquito", 8.86]], null, null, null, null, null, [["music", 62.69], ["musical instrument", 10.71], ["theremin", 5.86]], null, [["music", 64.1], ["speech", 6.37], ["musical instrument", 4.14]], null, null, null, null, null, null, null, [["speech", 49.84], ["music", 33.08], ["fart", 9.79]], null, [["speech", 49.57], ["music", 28.06], ["musical instrument", 4.45]]], "duration": [0.45, 4.62, 3.9, 0.9, 8.62, 0.26, 0.82, -0.13, 0.2, 0.42, 2.26, 0.6, 2.21, 0.55, 1.32, 1.16, -0.38, 1.41, 0.43, 1.47, 22.74, 0.04, 29.95]} \ No newline at end of file diff --git a/annotations_1/W4efgyM82kE_filtered.json b/annotations_1/W4efgyM82kE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00dcdeb4950e6e36577d0ec94486fb51ae142fbc --- /dev/null +++ b/annotations_1/W4efgyM82kE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 36.58], [37.0, 47.93], [49.0, 58.28], [59.0, 59.63]], "keep_status": [true, true, false, false], "silence_prob": [37.86, 33.61, 32.52, 0.0], "audiomae_on_audioset": [[["speech", 50.21], ["music", 12.45], ["whack, thwack", 5.56]], [["speech", 38.79], ["music", 18.44], ["basketball bounce", 8.79]], [["speech", 83.92], ["music", 4.22], ["tap", 2.19]], null], "duration": [13.58, 10.93, 9.28, 0.63]} \ No newline at end of file diff --git a/annotations_1/W4kci76gyn0_filtered.json b/annotations_1/W4kci76gyn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad0008959c0c95fc2198f59e31ebe6966cb648a9 --- /dev/null +++ b/annotations_1/W4kci76gyn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.41], [9.0, 9.73], [11.0, 12.21], [14.0, 14.94], [17.0, 17.54], [19.0, 19.3], [20.0, 32.49], [33.0, 34.96], [38.0, 39.31], [39.0, 46.31], [48.0, 48.61], [55.0, 56.1], [59.0, 59.41], [60.0, 60.42], [61.0, 61.2], [63.0, 63.32], [69.0, 69.9], [71.0, 72.35], [76.0, 77.09], [78.0, 78.76], [81.0, 81.97], [85.0, 85.4], [87.0, 87.27], [88.0, 88.7], [91.0, 92.8], [95.0, 96.38], [100.0, 101.44], [102.0, 103.6], [104.0, 105.78], [107.0, 108.13], [112.0, 115.8], [119.0, 119.99], [122.0, 122.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 0.0, 88.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, 0.73, 1.21, 0.94, 0.54, 0.3, 12.49, 1.96, 1.31, 7.31, 0.61, 1.1, 0.41, 0.42, 0.2, 0.32, 0.9, 1.35, 1.09, 0.76, 0.97, 0.4, 0.27, 0.7, 1.8, 1.38, 1.44, 1.6, 1.78, 1.13, 3.8, 0.99, 0.61]} \ No newline at end of file diff --git a/annotations_1/W4vPyEk5UK8_filtered.json b/annotations_1/W4vPyEk5UK8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..702b1557dc9b31cf5e2e5637631c2868b197800f --- /dev/null +++ b/annotations_1/W4vPyEk5UK8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.21], [14.0, 14.18], [14.0, 17.56], [22.0, 25.76], [32.0, 33.42], [39.0, 39.73], [43.0, 51.38], [60.0, 66.46], [66.0, 66.7], [67.0, 69.96], [75.0, 76.64], [88.0, 92.42], [94.0, 94.31], [95.0, 95.69], [101.0, 106.79], [109.0, 115.47], [117.0, 116.55], [117.0, 116.67], [118.0, 119.5], [120.0, 122.96], [124.0, 124.65], [128.0, 130.62], [136.0, 137.57], [138.0, 138.69], [148.0, 149.07], [150.0, 152.47], [155.0, 156.32]], "keep_status": [false, false, true, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [32.39, 0.0, 38.4, 39.41, 0.0, 0.0, 36.02, 34.85, 0.0, 34.72, 0.0, 32.0, 0.0, 0.0, 35.38, 37.16, 0.0, 0.0, 0.0, 39.43, 0.0, 35.21, 0.0, 0.0, 0.0, 34.15, 0.0], "audiomae_on_audioset": [[["music", 55.4], ["synthesizer", 10.1], ["didgeridoo", 8.2]], null, [["music", 57.42], ["theremin", 6.0], ["musical instrument", 4.92]], [["music", 64.38], ["ambient music", 6.73], ["synthesizer", 6.58]], null, null, [["music", 42.25], ["hum", 13.98], ["didgeridoo", 8.87]], [["music", 38.4], ["whale vocalization", 13.09], ["hum", 8.59]], null, [["music", 59.36], ["hum", 7.32], ["didgeridoo", 5.13]], null, [["music", 48.7], ["speech", 13.69], ["electronic music", 4.75]], null, null, [["music", 57.89], ["ambient music", 12.26], ["hum", 4.45]], [["throbbing", 44.11], ["hum", 19.86], ["music", 18.16]], null, null, null, [["music", 34.68], ["throbbing", 13.19], ["hum", 11.29]], null, [["throbbing", 35.43], ["hum", 23.1], ["music", 16.97]], null, null, null, [["music", 49.43], ["hum", 10.83], ["whale vocalization", 6.17]], null], "duration": [11.21, 0.18, 3.56, 3.76, 1.42, 0.73, 8.38, 6.46, 0.7, 2.96, 1.64, 4.42, 0.31, 0.69, 5.79, 6.47, -0.45, -0.33, 1.5, 2.96, 0.65, 2.62, 1.57, 0.69, 1.07, 2.47, 1.32]} \ No newline at end of file diff --git a/annotations_1/W5-oHwzdWos_filtered.json b/annotations_1/W5-oHwzdWos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28e56d2a7e6303db98646d1395c3424c8a61562d --- /dev/null +++ b/annotations_1/W5-oHwzdWos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.74], [16.0, 16.87], [19.0, 25.54], [27.0, 27.94], [32.0, 32.41], [35.0, 37.18], [44.0, 45.6], [52.0, 52.73], [58.0, 58.6], [63.0, 63.69], [74.0, 76.47], [93.0, 94.04], [97.0, 98.54], [110.0, 111.37], [114.0, 116.04]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 36.57, 0.0, 0.0, 58.98, 0.0, 0.0, 0.0, 0.0, 32.15, 0.0, 0.0, 0.0, 34.75], "audiomae_on_audioset": [null, null, [["music", 23.36], ["brass instrument", 18.97], ["french horn", 13.42]], null, null, null, null, null, null, null, [["music", 24.03], ["didgeridoo", 17.61], ["musical instrument", 7.65]], null, null, null, [["music", 36.89], ["speech", 18.81], ["theremin", 6.98]]], "duration": [-0.26, 0.87, 6.54, 0.94, 0.41, 2.18, 1.6, 0.73, 0.6, 0.69, 2.47, 1.04, 1.54, 1.37, 2.04]} \ No newline at end of file diff --git a/annotations_1/W6KRJEKYY7k_filtered.json b/annotations_1/W6KRJEKYY7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4f7fa3207ffaa582426c11d249c8e231eae4602 --- /dev/null +++ b/annotations_1/W6KRJEKYY7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.27], [4.0, 6.81], [8.0, 22.82], [24.0, 24.88], [27.0, 27.84], [30.0, 31.01], [35.0, 40.07], [41.0, 43.34], [45.0, 48.19], [50.0, 52.95], [54.0, 55.31], [57.0, 57.72], [61.0, 61.8], [63.0, 69.35], [70.0, 70.33], [73.0, 73.85], [79.0, 80.6], [82.0, 83.0], [87.0, 91.0], [92.0, 93.12], [93.0, 94.27], [95.0, 96.15], [97.0, 113.66], [114.0, 115.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 87.92, 48.44, 0.0, 0.0, 0.0, 89.54, 99.68, 78.89, 53.1, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 33.24, 0.0], "audiomae_on_audioset": [null, null, [["hum", 73.94], ["mains hum", 14.64], ["throbbing", 2.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["trumpet", 23.54], ["brass instrument", 22.98], ["music", 21.09]], null], "duration": [0.27, 2.81, 14.82, 0.88, 0.84, 1.01, 5.07, 2.34, 3.19, 2.95, 1.31, 0.72, 0.8, 6.35, 0.33, 0.85, 1.6, 1.0, 4.0, 1.12, 1.27, 1.15, 16.66, 1.06]} \ No newline at end of file diff --git a/annotations_1/W7BLikBY5Ak_filtered.json b/annotations_1/W7BLikBY5Ak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11c112e494bf6589a1f294aa8642b4e865be9144 --- /dev/null +++ b/annotations_1/W7BLikBY5Ak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.99], [21.0, 22.32], [26.0, 26.42], [28.0, 28.38], [29.0, 33.02], [34.0, 42.43], [45.0, 45.47], [49.0, 50.84], [51.0, 54.84], [58.0, 58.28], [60.0, 60.67], [62.0, 64.62], [67.0, 67.59], [78.0, 80.01], [82.0, 82.88], [84.0, 84.65], [85.0, 87.61], [89.0, 89.14], [96.0, 96.58], [100.0, 102.69], [114.0, 114.66], [118.0, 119.85], [125.0, 126.15], [126.0, 126.33], [127.0, 128.36], [129.0, 134.06], [137.0, 136.8], [138.0, 140.27], [141.0, 142.45], [143.0, 144.19], [145.0, 144.95], [147.0, 148.69], [151.0, 157.32], [164.0, 169.45], [172.0, 172.2]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 44.04, 37.78, 0.0, 0.0, 43.56, 0.0, 0.0, 39.61, 0.0, 80.46, 0.0, 0.0, 96.04, 0.0, 0.0, 47.5, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 0.0, 69.74, 0.0, 0.0, 0.0, 0.0, 39.5, 39.8, 0.0], "audiomae_on_audioset": [null, null, null, null, [["frog", 50.36], ["whale vocalization", 10.38], ["animal", 9.89]], [["speech", 20.72], ["fart", 20.14], ["cough", 14.99]], null, null, [["sidetone", 53.07], ["sine wave", 11.43], ["speech", 10.23]], null, null, [["hum", 22.53], ["speech", 21.27], ["sidetone", 11.17]], null, null, null, null, null, null, null, [["speech", 20.2], ["sidetone", 14.2], ["hum", 10.64]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.2], ["sidetone", 7.35], ["busy signal", 2.09]], [["speech", 9.14], ["tuning fork", 7.31], ["knock", 6.17]], null], "duration": [0.99, 1.32, 0.42, 0.38, 4.02, 8.43, 0.47, 1.84, 3.84, 0.28, 0.67, 2.62, 0.59, 2.01, 0.88, 0.65, 2.61, 0.14, 0.58, 2.69, 0.66, 1.85, 1.15, 0.33, 1.36, 5.06, -0.2, 2.27, 1.45, 1.19, -0.05, 1.69, 6.32, 5.45, 0.2]} \ No newline at end of file diff --git a/annotations_1/W8EhiYDVPEU_filtered.json b/annotations_1/W8EhiYDVPEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e22bb31352f3551c90f57f283db7fe779809cdd3 --- /dev/null +++ b/annotations_1/W8EhiYDVPEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.22], [15.0, 24.92], [26.0, 29.05], [31.0, 31.83], [34.0, 35.72], [37.0, 38.69], [40.0, 41.37], [43.0, 50.13], [51.0, 55.38], [56.0, 57.28], [59.0, 64.77], [66.0, 72.62], [75.0, 76.05], [77.0, 84.25], [88.0, 90.0], [91.0, 94.37], [95.0, 96.8], [98.0, 100.28], [100.0, 101.36], [102.0, 102.36], [104.0, 105.48], [106.0, 117.37], [118.0, 120.29], [120.0, 121.81], [124.0, 125.85], [127.0, 140.63], [143.0, 146.21], [148.0, 152.19], [156.0, 167.27]], "keep_status": [false, true, true, false, false, false, false, true, true, false, true, true, false, true, true, true, false, true, false, false, false, false, true, false, false, false, false, true, true], "silence_prob": [34.04, 34.53, 47.9, 0.0, 0.0, 0.0, 0.0, 39.37, 30.74, 0.0, 43.08, 38.16, 0.0, 37.19, 47.86, 42.15, 0.0, 38.78, 0.0, 0.0, 0.0, 36.35, 39.0, 0.0, 0.0, 35.6, 40.16, 31.06, 32.44], "audiomae_on_audioset": [[["grunt", 56.0], ["speech", 11.71], ["music", 3.81]], [["music", 48.62], ["throbbing", 9.44], ["hum", 8.83]], [["music", 28.61], ["hum", 13.23], ["mains hum", 11.92]], null, null, null, null, [["music", 19.74], ["fart", 7.87], ["animal", 7.09]], [["livestock, farm animals, working animals", 13.24], ["music", 13.07], ["effects unit", 11.52]], null, [["music", 34.62], ["animal", 11.41], ["effects unit", 6.33]], [["speech", 45.56], ["noise", 7.75], ["music", 5.09]], null, [["grunt", 27.45], ["music", 18.95], ["speech", 5.88]], [["singing bowl", 35.77], ["music", 13.28], ["hum", 4.55]], [["music", 16.23], ["hum", 12.41], ["mains hum", 9.07]], null, [["music", 19.34], ["whale vocalization", 6.21], ["effects unit", 5.61]], null, null, null, [["speech", 53.74], ["music", 11.48], ["noise", 7.24]], [["speech", 38.97], ["music", 15.52], ["singing bowl", 8.73]], null, null, [["speech", 41.3], ["grunt", 32.93], ["music", 17.19]], [["speech", 49.61], ["grunt", 28.95], ["music", 8.96]], [["whale vocalization", 15.54], ["sine wave", 12.32], ["burping, eructation", 11.42]], [["music", 40.35], ["gong", 15.88], ["didgeridoo", 11.54]]], "duration": [4.22, 9.92, 3.05, 0.83, 1.72, 1.69, 1.37, 7.13, 4.38, 1.28, 5.77, 6.62, 1.05, 7.25, 2.0, 3.37, 1.8, 2.28, 1.36, 0.36, 1.48, 11.37, 2.29, 1.81, 1.85, 13.63, 3.21, 4.19, 11.27]} \ No newline at end of file diff --git a/annotations_1/W8fjSVywGGk_filtered.json b/annotations_1/W8fjSVywGGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..657cf8f0c84efa9f803cc83296b44c0ae60be277 --- /dev/null +++ b/annotations_1/W8fjSVywGGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.45], [12.0, 12.87], [15.0, 18.42], [22.0, 22.47], [25.0, 35.7], [36.0, 37.77], [40.0, 47.61], [51.0, 54.33], [54.0, 57.86], [58.0, 59.17], [62.0, 62.01], [64.0, 65.18], [66.0, 66.29], [69.0, 73.7], [80.0, 80.13], [81.0, 81.24], [84.0, 84.57], [85.0, 86.76], [87.0, 86.95], [87.0, 87.35], [87.0, 87.44], [88.0, 88.82], [96.0, 119.31], [120.0, 121.27], [122.0, 122.88], [124.0, 124.31], [129.0, 130.6], [131.0, 131.65], [135.0, 135.62], [137.0, 136.95]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [84.8, 0.0, 91.98, 0.0, 93.91, 0.0, 86.09, 49.92, 67.38, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 43.38], ["theremin", 5.46], ["carnatic music", 3.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.74], ["whack, thwack", 6.14], ["grunt", 6.1]], null, null, null, null, null, null, null], "duration": [5.45, 0.87, 3.42, 0.47, 10.7, 1.77, 7.61, 3.33, 3.86, 1.17, 0.01, 1.18, 0.29, 4.7, 0.13, 0.24, 0.57, 1.76, -0.05, 0.35, 0.44, 0.82, 23.31, 1.27, 0.88, 0.31, 1.6, 0.65, 0.62, -0.05]} \ No newline at end of file diff --git a/annotations_1/W95X207kQxU_filtered.json b/annotations_1/W95X207kQxU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..407e89b70bc20c04edda56af000477b7cc03a51e --- /dev/null +++ b/annotations_1/W95X207kQxU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 31.04], [33.0, 33.4], [69.0, 73.97], [107.0, 109.39], [110.0, 110.81], [117.0, 117.42], [140.0, 140.22], [144.0, 145.57]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 28.92, 76.2, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 80.83], ["throbbing", 3.92], ["drum and bass", 1.69]], null, null, null, null, null], "duration": [1.04, 0.4, 4.97, 2.39, 0.81, 0.42, 0.22, 1.57]} \ No newline at end of file diff --git a/annotations_1/W9Rb6wHuQXU_filtered.json b/annotations_1/W9Rb6wHuQXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e10bf6a13a602970f8d69904fddbc48bc8ceb919 --- /dev/null +++ b/annotations_1/W9Rb6wHuQXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [9.0, 9.41], [25.0, 29.0], [34.0, 35.31], [36.0, 36.64], [40.0, 40.69], [42.0, 42.79], [46.0, 46.14], [47.0, 51.66], [54.0, 58.85], [60.0, 92.01], [94.0, 131.18], [132.0, 138.03], [143.0, 148.26], [150.0, 158.19], [160.0, 166.41], [167.0, 174.02], [174.0, 174.87], [176.0, 196.94]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 37.02, 0.0, 0.0, 0.0, 0.0, 0.0, 36.47, 30.47, 0.0, 0.0, 30.71, 30.73, 30.84, 30.42, 30.06, 0.0, 30.57], "audiomae_on_audioset": [null, null, [["music", 42.42], ["speech", 35.6], ["sidetone", 2.88]], null, null, null, null, null, [["speech", 58.78], ["music", 26.46], ["arrow", 1.22]], [["livestock, farm animals, working animals", 11.43], ["music", 10.76], ["cattle, bovinae", 10.67]], null, null, [["music", 63.03], ["throbbing", 10.97], ["hum", 5.38]], [["music", 46.62], ["throbbing", 9.82], ["hum", 9.11]], [["music", 42.89], ["speech", 18.91], ["hum", 5.17]], [["music", 75.75], ["throbbing", 3.44], ["synthesizer", 3.28]], [["music", 58.56], ["speech", 14.95], ["musical instrument", 5.36]], null, [["music", 47.83], ["synthesizer", 11.39], ["cacophony", 7.85]]], "duration": [0.51, 0.41, 4.0, 1.31, 0.64, 0.69, 0.79, 0.14, 4.66, 4.85, 32.01, 37.18, 6.03, 5.26, 8.19, 6.41, 7.02, 0.87, 20.94]} \ No newline at end of file diff --git a/annotations_1/WAX89Cuk-Yc_filtered.json b/annotations_1/WAX89Cuk-Yc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b74c02bc8df2cc32af8e72c8f4e12f4e198a66b --- /dev/null +++ b/annotations_1/WAX89Cuk-Yc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.41], [8.0, 17.9], [27.0, 27.13], [28.0, 28.09], [28.0, 29.32], [37.0, 37.35], [40.0, 40.93], [43.0, 44.14], [46.0, 47.82], [51.0, 51.98], [55.0, 56.07], [57.0, 58.8], [61.0, 62.4], [69.0, 72.86], [75.0, 76.82], [80.0, 79.96], [83.0, 84.28], [84.0, 84.5], [85.0, 87.76], [90.0, 91.54], [99.0, 99.47], [110.0, 113.71], [117.0, 117.64], [119.0, 119.5], [125.0, 127.06], [127.0, 130.0], [133.0, 133.86], [136.0, 139.14], [142.0, 143.92], [146.0, 146.69], [153.0, 158.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 35.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.94, 0.0, 0.0, 0.0, 0.0, 35.46, 0.0, 0.0, 32.68, 0.0, 0.0, 32.1, 30.18, 0.0, 32.65, 0.0, 0.0, 30.64], "audiomae_on_audioset": [null, [["speech", 59.49], ["noise", 20.6], ["sidetone", 7.13]], null, null, null, null, null, null, null, null, null, null, null, [["music", 89.25], ["theremin", 1.21], ["singing", 1.18]], null, null, null, null, [["music", 46.67], ["mains hum", 8.97], ["hum", 7.47]], null, null, [["music", 21.15], ["vibraphone", 9.78], ["marimba, xylophone", 9.26]], null, null, [["music", 39.97], ["theremin", 9.76], ["cello", 7.77]], [["music", 47.13], ["mantra", 16.23], ["carnatic music", 8.85]], null, [["theremin", 43.34], ["music", 27.15], ["musical instrument", 4.13]], null, null, [["music", 83.0], ["singing", 2.59], ["carnatic music", 1.71]]], "duration": [0.41, 9.9, 0.13, 0.09, 1.32, 0.35, 0.93, 1.14, 1.82, 0.98, 1.07, 1.8, 1.4, 3.86, 1.82, -0.04, 1.28, 0.5, 2.76, 1.54, 0.47, 3.71, 0.64, 0.5, 2.06, 3.0, 0.86, 3.14, 1.92, 0.69, 5.62]} \ No newline at end of file diff --git a/annotations_1/WBY5O2nTvSU_filtered.json b/annotations_1/WBY5O2nTvSU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d08360b5bf0ccbc5e09ef82d13f827b3d80242c --- /dev/null +++ b/annotations_1/WBY5O2nTvSU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 53.23], [56.0, 125.86], [127.0, 152.79], [154.0, 154.3], [156.0, 156.22], [157.0, 158.89], [160.0, 162.23], [164.0, 165.1], [165.0, 167.29]], "keep_status": [false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 29.92, 0.0, 0.0, 0.0, 35.14, 0.0, 34.89], "audiomae_on_audioset": [null, null, [["music", 76.37], ["speech", 3.63], ["theremin", 1.87]], null, null, null, [["moo", 19.56], ["cattle, bovinae", 18.69], ["speech", 16.45]], null, [["livestock, farm animals, working animals", 23.22], ["speech", 13.06], ["civil defense siren", 7.37]]], "duration": [36.23, 69.86, 25.79, 0.3, 0.22, 1.89, 2.23, 1.1, 2.29]} \ No newline at end of file diff --git a/annotations_1/WBreuW9LLSw_filtered.json b/annotations_1/WBreuW9LLSw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1016ec42b8939b4c23b724e5dca0aa0a6c53aa63 --- /dev/null +++ b/annotations_1/WBreuW9LLSw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.5], [5.0, 7.18], [9.0, 12.93], [21.0, 21.98], [29.0, 31.83], [38.0, 38.8], [39.0, 39.61], [43.0, 42.63], [48.0, 60.22], [63.0, 64.05], [66.0, 68.94], [70.0, 94.2], [105.0, 105.78]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [30.04, 31.03, 32.18, 0.0, 31.25, 0.0, 0.0, 0.0, 29.23, 0.0, 29.48, 29.14, 0.0], "audiomae_on_audioset": [[["speech", 63.89], ["foghorn", 6.3], ["music", 5.88]], [["music", 67.12], ["trombone", 8.21], ["musical instrument", 4.98]], [["music", 73.27], ["fly, housefly", 4.06], ["electronic music", 2.35]], null, [["music", 29.38], ["throbbing", 19.15], ["hum", 16.92]], null, null, null, [["music", 77.78], ["didgeridoo", 3.14], ["electronic music", 2.74]], null, [["hum", 30.71], ["music", 22.21], ["speech", 21.16]], [["music", 52.99], ["speech", 37.19], ["throbbing", 1.17]], null], "duration": [2.5, 2.18, 3.93, 0.98, 2.83, 0.8, 0.61, -0.37, 12.22, 1.05, 2.94, 24.2, 0.78]} \ No newline at end of file diff --git a/annotations_1/WC7TpzxGktk_filtered.json b/annotations_1/WC7TpzxGktk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e605f187d0ab856721ac63a3113a1205ad70aa6e --- /dev/null +++ b/annotations_1/WC7TpzxGktk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.53], [12.0, 15.8], [21.0, 50.18], [52.0, 61.8], [65.0, 65.65], [66.0, 92.08], [93.0, 95.2]], "keep_status": [false, true, true, false, false, false, true], "silence_prob": [0.0, 40.54, 41.12, 34.64, 0.0, 51.77, 48.74], "audiomae_on_audioset": [null, [["speech", 28.62], ["hum", 19.7], ["music", 16.01]], [["hum", 29.95], ["speech", 17.97], ["throbbing", 9.03]], [["music", 55.43], ["hum", 14.62], ["throbbing", 9.77]], null, null, [["music", 51.35], ["speech", 6.46], ["hum", 5.2]]], "duration": [1.53, 3.8, 29.18, 9.8, 0.65, 26.08, 2.2]} \ No newline at end of file diff --git a/annotations_1/WCB6zM_9DQU_filtered.json b/annotations_1/WCB6zM_9DQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d04762e0a6625df95acb66566d53a547579aed80 --- /dev/null +++ b/annotations_1/WCB6zM_9DQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.71], [24.0, 25.37], [29.0, 29.81], [32.0, 33.99], [35.0, 45.81], [50.0, 56.57], [59.0, 59.36], [61.0, 64.61], [65.0, 66.39], [68.0, 69.57], [71.0, 71.32], [73.0, 76.71], [79.0, 89.21]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.14, 34.81, 0.0, 33.38, 0.0, 0.0, 0.0, 34.55, 29.98], "audiomae_on_audioset": [null, null, null, null, [["livestock, farm animals, working animals", 44.77], ["animal", 17.16], ["cattle, bovinae", 15.61]], [["speech", 23.69], ["horse", 19.38], ["animal", 12.66]], null, [["cattle, bovinae", 24.64], ["moo", 22.93], ["livestock, farm animals, working animals", 12.45]], null, null, null, [["livestock, farm animals, working animals", 18.57], ["animal", 17.97], ["cattle, bovinae", 12.6]], [["animal", 45.77], ["livestock, farm animals, working animals", 19.15], ["cattle, bovinae", 9.78]]], "duration": [1.71, 1.37, 0.81, 1.99, 10.81, 6.57, 0.36, 3.61, 1.39, 1.57, 0.32, 3.71, 10.21]} \ No newline at end of file diff --git a/annotations_1/WCaRP0aT9CU_filtered.json b/annotations_1/WCaRP0aT9CU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e6993964963ece2d971a3243b0e168f9dd39a26 --- /dev/null +++ b/annotations_1/WCaRP0aT9CU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.83], [12.0, 13.64], [15.0, 16.11], [20.0, 20.7], [26.0, 27.68], [31.0, 31.9], [33.0, 34.48], [38.0, 37.99], [40.0, 40.58], [41.0, 48.51], [49.0, 49.84], [52.0, 52.83]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [28.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.58, 0.0, 0.0], "audiomae_on_audioset": [[["music", 25.12], ["speech", 19.05], ["rumble", 10.87]], null, null, null, null, null, null, null, null, [["music", 44.58], ["hum", 10.61], ["throbbing", 9.88]], null, null], "duration": [2.83, 1.64, 1.11, 0.7, 1.68, 0.9, 1.48, -0.01, 0.58, 7.51, 0.84, 0.83]} \ No newline at end of file diff --git a/annotations_1/WCf36CQxBfY_filtered.json b/annotations_1/WCf36CQxBfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b28ac265ac6dd01652ab3ae6651e9b2c082bbc47 --- /dev/null +++ b/annotations_1/WCf36CQxBfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.49], [17.0, 19.4], [21.0, 25.0], [27.0, 28.22], [32.0, 62.75], [66.0, 118.35], [124.0, 124.31], [125.0, 128.16], [130.0, 129.95]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.01, 29.99, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0], "audiomae_on_audioset": [null, [["music", 50.37], ["mains hum", 16.51], ["hum", 12.15]], [["music", 61.98], ["throbbing", 13.31], ["electronic music", 3.33]], null, null, null, null, null, null], "duration": [0.49, 2.4, 4.0, 1.22, 30.75, 52.35, 0.31, 3.16, -0.05]} \ No newline at end of file diff --git a/annotations_1/WDAlAqy9WUM_filtered.json b/annotations_1/WDAlAqy9WUM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b19bcb41ba1ef9ccc59b2a595b0dd08a260668f --- /dev/null +++ b/annotations_1/WDAlAqy9WUM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.52], [20.0, 28.24], [39.0, 75.25], [83.0, 93.95], [97.0, 103.91], [110.0, 111.2]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 31.23, 0.0, 36.3, 32.49, 0.0], "audiomae_on_audioset": [null, [["music", 85.39], ["drum machine", 2.04], ["synthesizer", 1.6]], null, [["music", 73.03], ["buzz", 4.18], ["hum", 2.16]], [["music", 77.67], ["electronic music", 7.05], ["dubstep", 1.8]], null], "duration": [0.52, 8.24, 36.25, 10.95, 6.91, 1.2]} \ No newline at end of file diff --git a/annotations_1/WDuIl_uPY_s_filtered.json b/annotations_1/WDuIl_uPY_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..396907802aee52fc3f5dbba8f67916f1741ba8fc --- /dev/null +++ b/annotations_1/WDuIl_uPY_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [15.0, 32.21], [33.0, 33.03], [36.0, 56.61], [58.0, 61.72], [78.0, 124.38]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 29.91, 0.0, 29.79, 30.89, 0.0], "audiomae_on_audioset": [null, [["music", 37.47], ["throbbing", 25.47], ["hum", 20.24]], null, [["music", 94.71], ["hip hop music", 0.96], ["electronic music", 0.87]], [["music", 42.02], ["electronic music", 11.19], ["throbbing", 9.67]], null], "duration": [0.64, 17.21, 0.03, 20.61, 3.72, 46.38]} \ No newline at end of file diff --git a/annotations_1/WEfMDGtX3K0_filtered.json b/annotations_1/WEfMDGtX3K0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83d12aa77f389d51d3f97b0b3dd5efe55e974840 --- /dev/null +++ b/annotations_1/WEfMDGtX3K0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.59], [13.0, 15.04], [29.0, 29.83], [33.0, 33.22], [34.0, 36.56], [41.0, 44.12], [45.0, 45.54], [46.0, 46.99], [54.0, 56.96], [58.0, 59.12], [63.0, 64.49], [65.0, 66.02], [68.0, 71.52], [93.0, 95.99], [97.0, 99.59], [101.0, 103.06], [106.0, 106.41], [109.0, 109.17], [112.0, 138.03], [140.0, 166.48]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, true, false, true, false, false, false, true, true], "silence_prob": [0.0, 30.29, 0.0, 0.0, 30.96, 38.64, 0.0, 0.0, 35.24, 0.0, 0.0, 0.0, 30.56, 29.7, 29.57, 30.64, 0.0, 0.0, 29.16, 29.59], "audiomae_on_audioset": [null, [["sheep", 39.07], ["bleat", 19.13], ["music", 15.04]], null, null, [["whale vocalization", 42.02], ["cattle, bovinae", 17.71], ["livestock, farm animals, working animals", 13.47]], [["music", 29.18], ["sidetone", 23.11], ["speech", 16.6]], null, null, [["music", 34.68], ["speech", 27.57], ["livestock, farm animals, working animals", 5.29]], null, null, null, [["speech", 43.09], ["livestock, farm animals, working animals", 9.97], ["music", 9.64]], [["speech", 56.6], ["music", 9.58], ["explosion", 3.9]], [["speech", 39.23], ["whack, thwack", 13.87], ["music", 6.69]], [["music", 70.7], ["speech", 7.59], ["electronic music", 2.8]], null, null, [["speech", 32.01], ["music", 12.27], ["hum", 7.93]], [["music", 49.25], ["hum", 11.35], ["theremin", 7.17]]], "duration": [1.59, 2.04, 0.83, 0.22, 2.56, 3.12, 0.54, 0.99, 2.96, 1.12, 1.49, 1.02, 3.52, 2.99, 2.59, 2.06, 0.41, 0.17, 26.03, 26.48]} \ No newline at end of file diff --git a/annotations_1/WEvTEdLLa2s_filtered.json b/annotations_1/WEvTEdLLa2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3310fbdf07db943de5f2506c2fd14dacfc4ae93c --- /dev/null +++ b/annotations_1/WEvTEdLLa2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.75], [8.0, 8.38], [13.0, 13.88], [25.0, 26.16], [31.0, 31.48], [38.0, 38.45], [39.0, 40.51], [42.0, 43.44], [53.0, 53.62], [55.0, 55.29], [62.0, 62.87], [69.0, 70.78], [79.0, 79.17], [80.0, 82.95], [91.0, 92.1], [96.0, 95.99], [97.0, 100.82], [101.0, 102.17], [103.0, 102.83], [104.0, 108.18], [110.0, 112.63], [113.0, 114.62], [115.0, 116.06], [122.0, 125.61], [130.0, 130.28], [136.0, 137.76], [159.0, 159.53], [165.0, 165.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.55, 0.0, 0.0, 45.46, 0.0, 0.0, 44.75, 64.63, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.57], ["music", 6.79], ["boing", 6.76]], null, null, [["speech", 70.06], ["music", 6.61], ["beatboxing", 3.42]], null, null, [["speech", 70.05], ["music", 7.07], ["sidetone", 3.44]], null, null, null, null, null, null, null, null], "duration": [-0.25, 0.38, 0.88, 1.16, 0.48, 0.45, 1.51, 1.44, 0.62, 0.29, 0.87, 1.78, 0.17, 2.95, 1.1, -0.01, 3.82, 1.17, -0.17, 4.18, 2.63, 1.62, 1.06, 3.61, 0.28, 1.76, 0.53, 0.08]} \ No newline at end of file diff --git a/annotations_1/WEwS34zf8mk_filtered.json b/annotations_1/WEwS34zf8mk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a2d6d04b18480c53ea95db5fed9cd3bc6ded722 --- /dev/null +++ b/annotations_1/WEwS34zf8mk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.16], [6.0, 5.9], [10.0, 10.52], [19.0, 20.71], [22.0, 26.45], [29.0, 31.46], [34.0, 35.83], [49.0, 50.13], [61.0, 61.62], [66.0, 67.07], [67.0, 74.12], [78.0, 81.08], [90.0, 94.2], [98.0, 121.29], [134.0, 133.96], [141.0, 144.58], [146.0, 146.57]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false], "silence_prob": [31.71, 0.0, 0.0, 0.0, 42.17, 37.62, 0.0, 0.0, 0.0, 0.0, 31.96, 31.15, 30.39, 28.78, 0.0, 88.64, 0.0], "audiomae_on_audioset": [[["hum", 29.8], ["music", 17.21], ["speech", 16.72]], null, null, null, [["music", 72.45], ["synthesizer", 2.77], ["theremin", 2.44]], [["music", 72.13], ["didgeridoo", 5.46], ["synthesizer", 4.69]], null, null, null, null, [["music", 81.43], ["groan", 4.56], ["speech", 3.72]], [["music", 50.62], ["hum", 5.28], ["sonar", 4.46]], [["music", 29.07], ["cattle, bovinae", 14.08], ["livestock, farm animals, working animals", 10.4]], [["music", 24.72], ["hum", 11.64], ["speech", 9.58]], null, null, null], "duration": [2.16, -0.1, 0.52, 1.71, 4.45, 2.46, 1.83, 1.13, 0.62, 1.07, 7.12, 3.08, 4.2, 23.29, -0.04, 3.58, 0.57]} \ No newline at end of file diff --git a/annotations_1/WFAu7jYslik_filtered.json b/annotations_1/WFAu7jYslik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..631c77962d23c424ed75fd8e3b1ab8eff7eb3cae --- /dev/null +++ b/annotations_1/WFAu7jYslik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.45], [5.0, 13.12], [15.0, 15.87], [17.0, 92.26]], "keep_status": [false, true, false, false], "silence_prob": [100.0, 49.45, 0.0, 0.0], "audiomae_on_audioset": [null, [["noise", 28.39], ["music", 14.23], ["fly, housefly", 9.01]], null, null], "duration": [3.45, 8.12, 0.87, 75.26]} \ No newline at end of file diff --git a/annotations_1/WFUAl0Nly7Y_filtered.json b/annotations_1/WFUAl0Nly7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9189bbc33f5522b7f1fba951fe8c25cf0e574ffa --- /dev/null +++ b/annotations_1/WFUAl0Nly7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [7.0, 7.69], [9.0, 11.03], [14.0, 14.45], [15.0, 16.5], [18.0, 18.62], [22.0, 23.35], [25.0, 25.44], [27.0, 27.97], [29.0, 31.58], [33.0, 35.11], [36.0, 36.31], [37.0, 39.43], [40.0, 42.09], [43.0, 45.08], [46.0, 46.03], [50.0, 50.87], [52.0, 54.78], [64.0, 64.76], [66.0, 67.27], [69.0, 70.8], [73.0, 73.72], [74.0, 76.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.37, 94.95, 0.0, 90.78, 99.26, 77.03, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 94.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 0.69, 2.03, 0.45, 1.5, 0.62, 1.35, 0.44, 0.97, 2.58, 2.11, 0.31, 2.43, 2.09, 2.08, 0.03, 0.87, 2.78, 0.76, 1.27, 1.8, 0.72, 2.28]} \ No newline at end of file diff --git a/annotations_1/WFdOIU2jKpo_filtered.json b/annotations_1/WFdOIU2jKpo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79b31772857dc957078f92b051673d4e187ba500 --- /dev/null +++ b/annotations_1/WFdOIU2jKpo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.78], [6.0, 7.01], [8.0, 15.75], [19.0, 19.11], [21.0, 39.99], [41.0, 98.59], [99.0, 131.73], [133.0, 138.52], [140.0, 142.99], [144.0, 149.25], [150.0, 151.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 38.58, 0.0, 32.02, 0.0, 0.0, 99.71, 98.1, 41.01, 0.0], "audiomae_on_audioset": [null, null, [["music", 31.29], ["hum", 24.83], ["mains hum", 14.46]], null, [["hum", 43.46], ["mains hum", 25.49], ["music", 9.05]], null, null, null, null, [["speech", 55.97], ["echo", 10.29], ["hum", 5.49]], null], "duration": [0.78, 1.01, 7.75, 0.11, 18.99, 57.59, 32.73, 5.52, 2.99, 5.25, 1.53]} \ No newline at end of file diff --git a/annotations_1/WGRVxwlEoio_filtered.json b/annotations_1/WGRVxwlEoio_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a52abbe38648a1f754467ff2c58b38ace8b12d4b --- /dev/null +++ b/annotations_1/WGRVxwlEoio_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.5], [6.0, 6.22], [8.0, 7.92], [11.0, 11.25], [12.0, 11.67], [12.0, 12.93], [14.0, 16.26], [17.0, 28.68], [34.0, 34.64], [36.0, 36.04], [39.0, 39.61], [42.0, 43.23], [46.0, 46.74], [48.0, 48.09], [49.0, 50.25], [51.0, 51.46], [52.0, 53.33], [54.0, 56.27], [58.0, 58.18], [61.0, 61.37], [62.0, 64.27], [65.0, 66.85], [68.0, 70.48], [71.0, 72.72], [74.0, 75.57], [77.0, 79.68], [80.0, 83.57], [85.0, 86.51], [87.0, 89.5], [91.0, 93.12], [95.0, 95.5], [97.0, 98.63], [100.0, 105.7], [108.0, 111.03], [112.0, 112.58], [115.0, 115.79], [121.0, 159.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 45.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.7, 0.0, 0.0, 74.76, 0.0, 80.11, 0.0, 0.0, 48.82, 42.3, 0.0, 54.23, 51.07, 0.0, 0.0, 44.18, 29.23, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 38.06], ["speech", 38.02], ["quack", 3.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.08], ["speech", 23.28], ["foghorn", 8.59]], [["cattle, bovinae", 30.67], ["moo", 27.07], ["livestock, farm animals, working animals", 14.46]], null, null, null, null, null, [["music", 17.67], ["musical instrument", 12.21], ["didgeridoo", 10.92]], [["theremin", 63.21], ["cattle, bovinae", 4.93], ["livestock, farm animals, working animals", 3.1]], null, null, null], "duration": [0.5, 0.22, -0.08, 0.25, -0.33, 0.93, 2.26, 11.68, 0.64, 0.04, 0.61, 1.23, 0.74, 0.09, 1.25, 0.46, 1.33, 2.27, 0.18, 0.37, 2.27, 1.85, 2.48, 1.72, 1.57, 2.68, 3.57, 1.51, 2.5, 2.12, 0.5, 1.63, 5.7, 3.03, 0.58, 0.79, 38.63]} \ No newline at end of file diff --git a/annotations_1/WG_LG1CfsCE_filtered.json b/annotations_1/WG_LG1CfsCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..716e693b694e32d37477c09c675111e99d13b455 --- /dev/null +++ b/annotations_1/WG_LG1CfsCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.6], [8.0, 8.51], [10.0, 10.02], [10.0, 13.31], [14.0, 15.25], [16.0, 16.65], [22.0, 23.87], [28.0, 28.19], [32.0, 32.59], [35.0, 35.13], [38.0, 37.99], [43.0, 52.35], [58.0, 58.9], [64.0, 64.81], [68.0, 70.5], [74.0, 76.55], [80.0, 91.52], [128.0, 130.82], [141.0, 142.33], [148.0, 149.12], [154.0, 154.53], [163.0, 163.76], [169.0, 169.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.21, 0.0, 0.0, 37.0, 32.99, 29.15, 36.28, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["livestock, farm animals, working animals", 40.02], ["cattle, bovinae", 38.0], ["moo", 16.79]], null, null, null, null, null, null, null, [["music", 56.72], ["synthesizer", 6.42], ["musical instrument", 5.23]], null, null, [["music", 33.16], ["hum", 15.34], ["mains hum", 13.44]], [["music", 54.46], ["speech", 11.08], ["boing", 7.56]], [["music", 31.61], ["hum", 25.05], ["mains hum", 17.82]], [["cattle, bovinae", 14.73], ["livestock, farm animals, working animals", 14.26], ["moo", 11.18]], null, null, null, null, null], "duration": [0.6, 0.51, 0.02, 3.31, 1.25, 0.65, 1.87, 0.19, 0.59, 0.13, -0.01, 9.35, 0.9, 0.81, 2.5, 2.55, 11.52, 2.82, 1.33, 1.12, 0.53, 0.76, 0.01]} \ No newline at end of file diff --git a/annotations_1/WGxfP216OFI_filtered.json b/annotations_1/WGxfP216OFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d835cbf78af8b7214fd60665a814d799b5a31178 --- /dev/null +++ b/annotations_1/WGxfP216OFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.61], [7.0, 9.39], [11.0, 11.84], [14.0, 17.73], [20.0, 21.83], [23.0, 24.95], [25.0, 26.74], [28.0, 34.06], [36.0, 41.17], [44.0, 47.46], [49.0, 51.87], [57.0, 60.61], [63.0, 64.08], [66.0, 73.77], [75.0, 84.99], [86.0, 87.98], [89.0, 89.63], [91.0, 92.75], [94.0, 113.05], [114.0, 115.62], [118.0, 145.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.8, 99.76, 99.98, 100.0, 99.95, 0.0, 100.0, 99.76, 0.0, 0.0, 0.0, 89.9, 0.0, 56.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 2.39, 0.84, 3.73, 1.83, 1.95, 1.74, 6.06, 5.17, 3.46, 2.87, 3.61, 1.08, 7.77, 9.99, 1.98, 0.63, 1.75, 19.05, 1.62, 27.23]} \ No newline at end of file diff --git a/annotations_1/WHcarLLrz9Y_filtered.json b/annotations_1/WHcarLLrz9Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ee47b6eb22324ea5d2a8da79b8e701046d1b4c6 --- /dev/null +++ b/annotations_1/WHcarLLrz9Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.24], [6.0, 6.52], [8.0, 8.34], [20.0, 20.46], [27.0, 26.91], [31.0, 33.72], [34.0, 36.42], [39.0, 39.51], [46.0, 46.62], [47.0, 50.5], [64.0, 65.08], [73.0, 73.13], [76.0, 76.5], [77.0, 77.8], [83.0, 83.42], [84.0, 85.9], [94.0, 94.58], [97.0, 97.04], [105.0, 105.76], [108.0, 108.75], [112.0, 113.36], [117.0, 121.02], [124.0, 123.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 95.37, 67.25, 0.0, 0.0, 69.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.24, 0.52, 0.34, 0.46, -0.09, 2.72, 2.42, 0.51, 0.62, 3.5, 1.08, 0.13, 0.5, 0.8, 0.42, 1.9, 0.58, 0.04, 0.76, 0.75, 1.36, 4.02, -0.21]} \ No newline at end of file diff --git a/annotations_1/WIBrEMlCGSM_filtered.json b/annotations_1/WIBrEMlCGSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f722e1468956d0c14c0be68bdefa17e7733ce99 --- /dev/null +++ b/annotations_1/WIBrEMlCGSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 39.83], [42.0, 43.55], [45.0, 48.05], [50.0, 50.6], [58.0, 58.67], [61.0, 78.73], [81.0, 89.75], [90.0, 115.86], [118.0, 122.1], [123.0, 123.89], [125.0, 129.98], [131.0, 134.97], [136.0, 144.86], [145.0, 147.12], [148.0, 148.74], [152.0, 152.17], [152.0, 153.33], [157.0, 157.52], [159.0, 158.95], [160.0, 159.81], [167.0, 167.14], [168.0, 168.39], [171.0, 172.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.89, 0.0, 80.64, 0.0, 0.0, 79.59, 58.81, 61.77, 79.07, 0.0, 97.83, 95.23, 55.39, 45.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 42.42], ["insect", 27.24], ["bee, wasp, etc.", 14.71]], null, null, null, null, null, null, null, null, null], "duration": [17.83, 1.55, 3.05, 0.6, 0.67, 17.73, 8.75, 25.86, 4.1, 0.89, 4.98, 3.97, 8.86, 2.12, 0.74, 0.17, 1.33, 0.52, -0.05, -0.19, 0.14, 0.39, 1.05]} \ No newline at end of file diff --git a/annotations_1/WIZlfA5kV7Q_filtered.json b/annotations_1/WIZlfA5kV7Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f00d195dc185ed4224a451b717cea68e83680269 --- /dev/null +++ b/annotations_1/WIZlfA5kV7Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.07], [8.0, 7.91], [19.0, 18.87], [19.0, 23.26], [31.0, 39.88], [43.0, 43.8], [44.0, 44.69], [46.0, 46.8], [48.0, 49.18], [51.0, 51.04], [52.0, 52.39], [54.0, 54.7], [57.0, 57.21], [58.0, 58.72], [59.0, 60.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.33, 36.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 61.21], ["electric shaver, electric razor", 6.74], ["buzz", 5.33]], [["speech", 65.85], ["radio", 4.28], ["noise", 3.89]], null, null, null, null, null, null, null, null, null, null], "duration": [0.07, -0.09, -0.13, 4.26, 8.88, 0.8, 0.69, 0.8, 1.18, 0.04, 0.39, 0.7, 0.21, 0.72, 1.96]} \ No newline at end of file diff --git a/annotations_1/WIr_dCgNAjM_filtered.json b/annotations_1/WIr_dCgNAjM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a82fc4cd503c711110594680645f5e3185807ed --- /dev/null +++ b/annotations_1/WIr_dCgNAjM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 58.38], [60.0, 87.57], [89.0, 92.11], [101.0, 100.95], [103.0, 105.21], [107.0, 107.67], [110.0, 110.39], [120.0, 121.02], [124.0, 124.83], [125.0, 148.07]], "keep_status": [true, true, true, false, true, false, false, false, false, false], "silence_prob": [28.87, 29.43, 32.62, 0.0, 47.9, 0.0, 0.0, 0.0, 0.0, 29.58], "audiomae_on_audioset": [[["grunt", 15.32], ["whack, thwack", 14.22], ["sound effect", 13.82]], [["grunt", 34.92], ["music", 23.28], ["livestock, farm animals, working animals", 6.92]], [["music", 24.54], ["hum", 17.74], ["noise", 14.07]], null, [["insect", 9.52], ["fly, housefly", 9.14], ["liquid", 8.02]], null, null, null, null, [["music", 51.81], ["speech", 31.73], ["didgeridoo", 7.95]]], "duration": [18.38, 27.57, 3.11, -0.05, 2.21, 0.67, 0.39, 1.02, 0.83, 23.07]} \ No newline at end of file diff --git a/annotations_1/WJOMiXmwfYE_filtered.json b/annotations_1/WJOMiXmwfYE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9590ff21fb57e6b320032ac0024e725872f8e4bc --- /dev/null +++ b/annotations_1/WJOMiXmwfYE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.48], [13.0, 13.74], [32.0, 32.68], [34.0, 34.87], [37.0, 37.15], [37.0, 38.01], [44.0, 44.17], [46.0, 46.26], [50.0, 49.96], [60.0, 60.02], [63.0, 70.19], [71.0, 71.59], [74.0, 75.68], [82.0, 85.13], [88.0, 97.97], [114.0, 114.39], [120.0, 121.86], [147.0, 147.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.35, 0.0, 0.0, 37.47, 30.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 45.04], ["music", 33.95], ["insect", 3.31]], null, null, [["music", 45.95], ["hum", 6.99], ["electronic music", 6.99]], [["music", 52.87], ["hum", 11.02], ["throbbing", 7.93]], null, null, null], "duration": [0.48, 0.74, 0.68, 0.87, 0.15, 1.01, 0.17, 0.26, -0.04, 0.02, 7.19, 0.59, 1.68, 3.13, 9.97, 0.39, 1.86, 0.78]} \ No newline at end of file diff --git a/annotations_1/WK0fQueuPoI_filtered.json b/annotations_1/WK0fQueuPoI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b353434a6dad068845066d1346bb7da2612996fb --- /dev/null +++ b/annotations_1/WK0fQueuPoI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.87], [18.0, 19.47], [22.0, 22.54], [24.0, 26.74], [34.0, 34.94], [35.0, 35.82], [36.0, 37.57], [40.0, 40.76], [41.0, 42.01], [42.0, 43.04], [44.0, 44.58], [45.0, 46.2], [55.0, 55.71], [56.0, 55.93], [57.0, 59.66], [61.0, 62.4], [63.0, 63.8], [65.0, 68.89], [70.0, 70.83], [71.0, 73.82], [78.0, 78.88], [79.0, 79.91], [81.0, 85.68], [87.0, 88.47], [95.0, 96.11], [97.0, 106.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [60.7, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.28, 0.0, 0.0, 64.63, 0.0, 66.15, 0.0, 0.0, 65.2, 0.0, 0.0, 34.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 22.24], ["cattle, bovinae", 17.79], ["theremin", 12.17]]], "duration": [5.87, 1.47, 0.54, 2.74, 0.94, 0.82, 1.57, 0.76, 1.01, 1.04, 0.58, 1.2, 0.71, -0.07, 2.66, 1.4, 0.8, 3.89, 0.83, 2.82, 0.88, 0.91, 4.68, 1.47, 1.11, 9.46]} \ No newline at end of file diff --git a/annotations_1/WLE2QEOBde4_filtered.json b/annotations_1/WLE2QEOBde4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62376698bdbf351b6ba4a45265e9ad45c1019230 --- /dev/null +++ b/annotations_1/WLE2QEOBde4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 26.82], [28.0, 28.53], [29.0, 30.69], [32.0, 32.19], [35.0, 39.21], [42.0, 43.31], [46.0, 45.91], [47.0, 47.87], [51.0, 82.81], [84.0, 90.27]], "keep_status": [true, false, false, false, true, false, false, false, false, false], "silence_prob": [32.62, 0.0, 0.0, 0.0, 31.72, 0.0, 0.0, 0.0, 0.0, 55.96], "audiomae_on_audioset": [[["explosion", 36.62], ["speech", 17.89], ["eruption", 10.1]], null, null, null, [["fly, housefly", 27.01], ["explosion", 18.25], ["insect", 9.67]], null, null, null, null, null], "duration": [12.82, 0.53, 1.69, 0.19, 4.21, 1.31, -0.09, 0.87, 31.81, 6.27]} \ No newline at end of file diff --git a/annotations_1/WLKpgzXHKLA_filtered.json b/annotations_1/WLKpgzXHKLA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..648cc03adf9a5f698f2c96ef9a49a6030be2b028 --- /dev/null +++ b/annotations_1/WLKpgzXHKLA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 57.82], [59.0, 62.63]], "keep_status": [false, true], "silence_prob": [0.0, 29.95], "audiomae_on_audioset": [null, [["music", 32.01], ["vehicle", 7.79], ["cacophony", 6.95]]], "duration": [38.82, 3.63]} \ No newline at end of file diff --git a/annotations_1/WLq3zSm5SkQ_filtered.json b/annotations_1/WLq3zSm5SkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c11fe263cad482cf37acd3a164170b6c7a9ee31 --- /dev/null +++ b/annotations_1/WLq3zSm5SkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.55], [13.0, 19.82], [22.0, 38.82], [43.0, 42.74], [43.0, 56.91], [58.0, 58.31], [59.0, 60.49], [61.0, 61.11], [70.0, 70.06], [74.0, 75.51], [76.0, 82.04], [93.0, 94.93], [101.0, 102.27], [103.0, 103.84], [108.0, 108.9], [110.0, 122.35], [127.0, 174.55]], "keep_status": [true, false, true, false, true, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [33.99, 34.37, 29.6, 0.0, 39.85, 0.0, 0.0, 0.0, 0.0, 0.0, 32.73, 0.0, 0.0, 0.0, 0.0, 33.53, 0.0], "audiomae_on_audioset": [[["music", 18.06], ["rumble", 11.54], ["hum", 10.13]], [["music", 77.73], ["didgeridoo", 4.59], ["scary music", 4.28]], [["music", 50.52], ["didgeridoo", 7.12], ["hum", 5.18]], null, [["animal", 17.88], ["hum", 11.91], ["grunt", 9.47]], null, null, null, null, null, [["moo", 14.72], ["speech", 13.86], ["cattle, bovinae", 11.17]], null, null, null, null, [["livestock, farm animals, working animals", 14.16], ["speech", 13.82], ["cattle, bovinae", 12.5]], null], "duration": [5.55, 6.82, 16.82, -0.26, 13.91, 0.31, 1.49, 0.11, 0.06, 1.51, 6.04, 1.93, 1.27, 0.84, 0.9, 12.35, 47.55]} \ No newline at end of file diff --git a/annotations_1/WM3TedgbwIc_filtered.json b/annotations_1/WM3TedgbwIc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ef11bbb1a218fedc0446a14fbfca0925c3c7d2b --- /dev/null +++ b/annotations_1/WM3TedgbwIc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.95], [36.0, 36.1], [37.0, 38.84], [39.0, 40.0], [60.0, 60.98], [64.0, 66.97], [72.0, 78.16], [80.0, 81.53], [82.0, 83.93], [84.0, 84.67], [85.0, 89.9], [90.0, 93.26], [97.0, 97.55], [99.0, 113.16], [114.0, 115.13], [117.0, 117.9], [118.0, 151.98], [153.0, 153.77], [154.0, 155.41], [157.0, 160.02], [161.0, 178.09], [180.0, 180.15]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 49.27, 42.74, 0.0, 0.0, 0.0, 51.5, 89.01, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 41.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 47.44], ["sidetone", 9.72], ["dial tone", 6.32]], [["speech", 62.46], ["thunk", 5.09], ["hum", 4.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.59], ["synthesizer", 9.08], ["throbbing", 8.09]], null], "duration": [2.95, 0.1, 1.84, 1.0, 0.98, 2.97, 6.16, 1.53, 1.93, 0.67, 4.9, 3.26, 0.55, 14.16, 1.13, 0.9, 33.98, 0.77, 1.41, 3.02, 17.09, 0.15]} \ No newline at end of file diff --git a/annotations_1/WNAjVd38Q1E_filtered.json b/annotations_1/WNAjVd38Q1E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01db915a19a3e0fefcf0f1f4023446ad843cbc75 --- /dev/null +++ b/annotations_1/WNAjVd38Q1E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.82], [7.0, 7.7], [8.0, 8.88], [11.0, 15.94], [17.0, 17.49], [19.0, 27.04], [28.0, 28.71], [31.0, 31.43], [33.0, 32.9], [34.0, 34.38], [38.0, 39.95], [40.0, 41.54], [43.0, 43.7], [46.0, 47.14], [48.0, 48.93], [49.0, 49.06], [50.0, 52.25], [57.0, 57.59], [69.0, 69.85], [71.0, 74.65], [78.0, 82.22], [84.0, 84.94], [86.0, 87.0], [95.0, 96.01], [98.0, 100.14], [109.0, 109.81], [111.0, 113.8], [120.0, 120.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 79.24, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 0.0, 0.0, 40.02, 48.35, 0.0, 0.0, 0.0, 44.4, 0.0, 48.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 63.89], ["speech", 9.88], ["music", 2.93]], [["speech", 38.92], ["music", 12.39], ["didgeridoo", 9.54]], null, null, null, [["hum", 15.25], ["music", 11.31], ["throbbing", 8.49]], null, [["throbbing", 39.49], ["music", 30.6], ["hum", 10.31]], null], "duration": [1.82, 0.7, 0.88, 4.94, 0.49, 8.04, 0.71, 0.43, -0.1, 0.38, 1.95, 1.54, 0.7, 1.14, 0.93, 0.06, 2.25, 0.59, 0.85, 3.65, 4.22, 0.94, 1.0, 1.01, 2.14, 0.81, 2.8, 0.16]} \ No newline at end of file diff --git a/annotations_1/WNUJIR9y-N4_filtered.json b/annotations_1/WNUJIR9y-N4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b66a7036de8fcf5221a812ec01ec6a7c1a02a988 --- /dev/null +++ b/annotations_1/WNUJIR9y-N4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 30.77], [36.0, 36.37], [37.0, 38.42], [43.0, 62.33], [66.0, 67.47], [68.0, 69.06], [70.0, 71.22], [79.0, 80.62], [81.0, 81.65], [83.0, 83.61], [96.0, 96.13], [102.0, 103.08], [107.0, 107.11], [109.0, 109.54], [118.0, 119.25], [120.0, 120.33], [121.0, 121.78], [127.0, 128.68], [129.0, 130.33], [133.0, 133.68], [136.0, 137.08], [139.0, 139.83], [140.0, 142.65], [145.0, 145.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.87, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 62.85], ["breaking", 7.1], ["whack, thwack", 5.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 27.73], ["bee, wasp, etc.", 25.4], ["insect", 17.79]], null], "duration": [-0.23, 0.37, 1.42, 19.33, 1.47, 1.06, 1.22, 1.62, 0.65, 0.61, 0.13, 1.08, 0.11, 0.54, 1.25, 0.33, 0.78, 1.68, 1.33, 0.68, 1.08, 0.83, 2.65, 0.5]} \ No newline at end of file diff --git a/annotations_1/WO0KS0mbu80_filtered.json b/annotations_1/WO0KS0mbu80_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed13fe565817deb81875db91ffe5e0b1335adadd --- /dev/null +++ b/annotations_1/WO0KS0mbu80_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.12], [12.0, 13.36], [15.0, 17.24], [20.0, 21.9], [23.0, 24.16], [25.0, 25.91], [26.0, 28.65], [33.0, 43.17], [45.0, 44.93], [46.0, 46.85], [49.0, 52.95], [56.0, 55.95], [56.0, 56.08]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [81.17, 0.0, 56.33, 0.0, 0.0, 0.0, 31.43, 30.58, 0.0, 0.0, 28.93, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 36.07], ["whale vocalization", 10.97], ["music", 6.74]], [["music", 80.57], ["speech", 6.2], ["whale vocalization", 1.38]], null, null, [["speech", 38.61], ["music", 25.96], ["mains hum", 6.81]], null, null], "duration": [2.12, 1.36, 2.24, 1.9, 1.16, 0.91, 2.65, 10.17, -0.07, 0.85, 3.95, -0.05, 0.08]} \ No newline at end of file diff --git a/annotations_1/WOBy9Q8Gf9I_filtered.json b/annotations_1/WOBy9Q8Gf9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02ec87849673692da65c8e83e6b97169169abe62 --- /dev/null +++ b/annotations_1/WOBy9Q8Gf9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.3], [13.0, 15.58], [17.0, 18.55], [21.0, 21.88], [25.0, 28.46], [31.0, 32.09]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 99.93, 0.0, 0.0, 99.88, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.3, 2.58, 1.55, 0.88, 3.46, 1.09]} \ No newline at end of file diff --git a/annotations_1/WOnHL_mSXRY_filtered.json b/annotations_1/WOnHL_mSXRY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..912a7f8961f061b64593c29333e40bc3b5edf762 --- /dev/null +++ b/annotations_1/WOnHL_mSXRY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.8], [18.0, 20.29], [23.0, 23.67], [27.0, 28.51], [31.0, 33.98], [42.0, 44.14], [47.0, 48.02], [55.0, 57.15], [60.0, 61.8], [65.0, 66.19], [69.0, 70.61], [83.0, 85.48], [93.0, 95.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 60.6, 0.0, 0.0, 73.06, 80.64, 0.0, 96.66, 0.0, 0.0, 0.0, 74.92, 42.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["mosquito", 27.88], ["fly, housefly", 22.89], ["frog", 19.66]]], "duration": [0.8, 2.29, 0.67, 1.51, 2.98, 2.14, 1.02, 2.15, 1.8, 1.19, 1.61, 2.48, 2.03]} \ No newline at end of file diff --git a/annotations_1/WPggG_9I20E_filtered.json b/annotations_1/WPggG_9I20E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebd50642b4f1223e9f8d8a7a6917b2b4cbdc67eb --- /dev/null +++ b/annotations_1/WPggG_9I20E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.08], [18.0, 18.33], [20.0, 19.87], [36.0, 37.18], [42.0, 42.03], [46.0, 46.06], [51.0, 52.14], [56.0, 56.96], [60.0, 61.72], [65.0, 64.76], [65.0, 66.55], [77.0, 94.51], [97.0, 97.63], [99.0, 100.89], [103.0, 103.77], [116.0, 117.09], [120.0, 120.36], [123.0, 124.24], [127.0, 131.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 76.81], ["drum machine", 5.82], ["electronic music", 4.09]], null, null, null, null, null, null, [["music", 50.18], ["throbbing", 8.79], ["drum and bass", 5.44]]], "duration": [0.08, 0.33, -0.13, 1.18, 0.03, 0.06, 1.14, 0.96, 1.72, -0.24, 1.55, 17.51, 0.63, 1.89, 0.77, 1.09, 0.36, 1.24, 4.58]} \ No newline at end of file diff --git a/annotations_1/WQP_cY7FAyQ_filtered.json b/annotations_1/WQP_cY7FAyQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff5dde1353981ac02494001fa6cc39f3411b5403 --- /dev/null +++ b/annotations_1/WQP_cY7FAyQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 30.06], [31.0, 57.08], [60.0, 125.24], [126.0, 127.33], [128.0, 135.14], [137.0, 138.65], [141.0, 141.2], [150.0, 151.26], [152.0, 156.29], [159.0, 160.0], [162.0, 163.31], [165.0, 164.94], [167.0, 175.74]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [38.64, 33.33, 0.0, 0.0, 31.96, 0.0, 0.0, 0.0, 31.5, 0.0, 0.0, 0.0, 30.81], "audiomae_on_audioset": [[["music", 69.6], ["synthesizer", 5.27], ["electronic music", 4.79]], [["music", 80.89], ["electronic music", 4.63], ["drum machine", 2.21]], null, null, [["hum", 41.0], ["mains hum", 16.42], ["speech", 8.77]], null, null, null, [["music", 64.3], ["electronic music", 15.73], ["throbbing", 4.77]], null, null, null, [["music", 27.9], ["hum", 25.39], ["mains hum", 18.4]]], "duration": [3.06, 26.08, 65.24, 1.33, 7.14, 1.65, 0.2, 1.26, 4.29, 1.0, 1.31, -0.06, 8.74]} \ No newline at end of file diff --git a/annotations_1/WRlIDIu2qpg_filtered.json b/annotations_1/WRlIDIu2qpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..864568786c9db74f0ecc652f5d0f4605b26a3167 --- /dev/null +++ b/annotations_1/WRlIDIu2qpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.15], [10.0, 10.77], [14.0, 14.39], [15.0, 16.85], [21.0, 22.03], [24.0, 24.44], [44.0, 44.31], [55.0, 56.3], [106.0, 105.95], [117.0, 119.79], [172.0, 173.35], [174.0, 177.75], [183.0, 186.41], [189.0, 206.32], [219.0, 219.52], [226.0, 229.0], [233.0, 234.15]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.21, 0.0, 29.61, 28.36, 29.31, 0.0, 30.3, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 41.9], ["static", 10.19], ["throbbing", 9.26]], null, [["music", 71.21], ["bleat", 3.89], ["groan", 3.05]], [["music", 40.35], ["mains hum", 9.5], ["electronic music", 8.94]], [["music", 49.49], ["throbbing", 22.4], ["hum", 8.6]], null, [["music", 71.91], ["electronic music", 3.48], ["throbbing", 2.01]], null], "duration": [1.15, 0.77, 0.39, 1.85, 1.03, 0.44, 0.31, 1.3, -0.05, 2.79, 1.35, 3.75, 3.41, 17.32, 0.52, 3.0, 1.15]} \ No newline at end of file diff --git a/annotations_1/WS8Sc1nCi8U_filtered.json b/annotations_1/WS8Sc1nCi8U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9f1aec30c26453410ba6a4af260ffc0a815ecfb --- /dev/null +++ b/annotations_1/WS8Sc1nCi8U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 44.15], [46.0, 46.25], [46.0, 46.36], [47.0, 74.34], [78.0, 84.05], [86.0, 93.28], [94.0, 100.14], [102.0, 103.0], [106.0, 109.38], [114.0, 120.11]], "keep_status": [false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 30.08, 30.21, 30.63, 29.87, 0.0, 30.04, 30.17], "audiomae_on_audioset": [null, null, null, [["music", 82.03], ["hum", 1.85], ["throbbing", 1.73]], [["speech", 46.02], ["music", 14.6], ["didgeridoo", 7.34]], [["music", 57.38], ["hum", 9.5], ["mains hum", 7.12]], [["music", 64.13], ["throbbing", 21.07], ["hum", 2.24]], null, [["music", 20.0], ["hum", 16.14], ["static", 13.93]], [["music", 26.21], ["whale vocalization", 11.85], ["speech", 10.28]]], "duration": [32.15, 0.25, 0.36, 27.34, 6.05, 7.28, 6.14, 1.0, 3.38, 6.11]} \ No newline at end of file diff --git a/annotations_1/WSYe57h6YUE_filtered.json b/annotations_1/WSYe57h6YUE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f740f9587360a60d70f413c5c5cc621b5b43fe92 --- /dev/null +++ b/annotations_1/WSYe57h6YUE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.08], [15.0, 15.72], [16.0, 16.29], [17.0, 20.66], [23.0, 22.77], [25.0, 26.1], [31.0, 33.22], [35.0, 41.34], [43.0, 55.02], [56.0, 57.84], [58.0, 59.73], [62.0, 72.2], [73.0, 73.36], [83.0, 83.29], [90.0, 93.82], [96.0, 97.16], [110.0, 128.02], [141.0, 141.3], [142.0, 142.57], [146.0, 147.6], [151.0, 156.96], [158.0, 158.5], [160.0, 160.68], [161.0, 162.19], [166.0, 166.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 38.15, 59.15, 50.26, 0.0, 0.0, 42.28, 0.0, 0.0, 35.46, 0.0, 29.79, 0.0, 0.0, 0.0, 30.92, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 43.14], ["music", 23.62], ["musical instrument", 6.05]], null, null, null, null, [["music", 37.22], ["speech", 15.79], ["mains hum", 12.22]], null, null, [["speech", 43.81], ["music", 22.17], ["fart", 4.92]], null, [["music", 31.37], ["speech", 26.53], ["buzz", 5.35]], null, null, null, [["music", 43.96], ["speech", 16.78], ["boing", 7.37]], null, null, null, null], "duration": [0.08, 0.72, 0.29, 3.66, -0.23, 1.1, 2.22, 6.34, 12.02, 1.84, 1.73, 10.2, 0.36, 0.29, 3.82, 1.16, 18.02, 0.3, 0.57, 1.6, 5.96, 0.5, 0.68, 1.19, 0.8]} \ No newline at end of file diff --git a/annotations_1/WShQx7lNPi4_filtered.json b/annotations_1/WShQx7lNPi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77dbfe0f17aa2c80de0f9f37735b303cccb0232f --- /dev/null +++ b/annotations_1/WShQx7lNPi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.84], [14.0, 16.23], [22.0, 23.58], [32.0, 35.13], [37.0, 36.88], [37.0, 37.93], [44.0, 45.01], [45.0, 45.32], [49.0, 50.03], [56.0, 56.62], [58.0, 58.11], [58.0, 59.46], [61.0, 62.46], [69.0, 70.53], [72.0, 72.27], [74.0, 75.88], [79.0, 80.35], [81.0, 106.37], [107.0, 107.99], [108.0, 108.03], [108.0, 114.88], [120.0, 120.02], [125.0, 126.35], [130.0, 133.95], [136.0, 136.85]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 49.09, 0.0, 62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.5, 0.0, 0.0, 28.65, 0.0, 0.0, 38.67, 0.0], "audiomae_on_audioset": [null, [["fart", 15.37], ["dial tone", 12.42], ["speech", 7.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.59], ["didgeridoo", 4.41], ["musical instrument", 3.78]], null, null, [["music", 56.0], ["boing", 19.12], ["sidetone", 9.85]], null, null, [["hum", 17.63], ["dog", 9.99], ["animal", 8.6]], null], "duration": [0.84, 2.23, 1.58, 3.13, -0.12, 0.93, 1.01, 0.32, 1.03, 0.62, 0.11, 1.46, 1.46, 1.53, 0.27, 1.88, 1.35, 25.37, 0.99, 0.03, 6.88, 0.02, 1.35, 3.95, 0.85]} \ No newline at end of file diff --git a/annotations_1/WT6DQ_NO5zw_filtered.json b/annotations_1/WT6DQ_NO5zw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dc9190343993de5ea7de903d6f750c0d625e61b --- /dev/null +++ b/annotations_1/WT6DQ_NO5zw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.07], [3.0, 3.79], [8.0, 7.52], [10.0, 25.95], [30.0, 39.95], [43.0, 75.3], [78.0, 78.68], [79.0, 102.9]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.07, 30.77, 0.0, 0.0, 28.59], "audiomae_on_audioset": [null, null, null, [["speech", 47.23], ["explosion", 10.45], ["music", 9.77]], [["music", 74.13], ["speech", 2.32], ["cattle, bovinae", 1.96]], null, null, [["music", 77.35], ["musical instrument", 3.27], ["animal", 1.86]]], "duration": [0.07, 0.79, -0.48, 15.95, 9.95, 32.3, 0.68, 23.9]} \ No newline at end of file diff --git a/annotations_1/WThmGeHf4hA_filtered.json b/annotations_1/WThmGeHf4hA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f236d49cbf339bcdeeadf36471a78d11031d52e --- /dev/null +++ b/annotations_1/WThmGeHf4hA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.88], [12.0, 12.41], [16.0, 16.01], [21.0, 21.84], [25.0, 26.03], [30.0, 30.59], [31.0, 32.1], [36.0, 37.5], [42.0, 50.21], [52.0, 53.62]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.63, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 23.76], ["speech", 18.04], ["mains hum", 11.5]], null], "duration": [-0.12, 0.41, 0.01, 0.84, 1.03, 0.59, 1.1, 1.5, 8.21, 1.62]} \ No newline at end of file diff --git a/annotations_1/WXne2B_inx8_filtered.json b/annotations_1/WXne2B_inx8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad1648c3ef591e30b02b5bc11206f8c2f939f71d --- /dev/null +++ b/annotations_1/WXne2B_inx8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 45.59], [60.0, 59.91], [66.0, 66.02], [67.0, 67.47], [70.0, 70.58], [74.0, 75.15], [77.0, 78.07], [79.0, 79.71], [84.0, 84.38], [86.0, 87.54], [88.0, 88.94], [98.0, 98.24], [100.0, 100.94], [102.0, 101.92], [104.0, 104.75], [109.0, 110.47], [112.0, 112.89], [113.0, 121.78], [124.0, 125.74], [127.0, 136.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.52, 0.0, 43.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 28.52], ["music", 21.72], ["throbbing", 18.95]], null, [["hum", 43.13], ["throbbing", 16.36], ["speech", 14.09]]], "duration": [1.59, -0.09, 0.02, 0.47, 0.58, 1.15, 1.07, 0.71, 0.38, 1.54, 0.94, 0.24, 0.94, -0.08, 0.75, 1.47, 0.89, 8.78, 1.74, 9.85]} \ No newline at end of file diff --git a/annotations_1/WYi4Bp1hmC0_filtered.json b/annotations_1/WYi4Bp1hmC0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7883ad070dc095facad4578e8ace180a73d98396 --- /dev/null +++ b/annotations_1/WYi4Bp1hmC0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.26], [10.0, 32.05], [33.0, 34.77], [36.0, 37.89], [41.0, 54.16], [58.0, 65.28], [66.0, 73.97], [75.0, 109.22], [110.0, 111.64], [113.0, 113.46], [114.0, 117.83], [120.0, 123.94], [126.0, 127.16], [128.0, 142.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [99.56, 31.73, 0.0, 0.0, 29.2, 29.13, 31.66, 0.0, 0.0, 0.0, 29.81, 32.53, 0.0, 30.11], "audiomae_on_audioset": [null, [["music", 38.88], ["speech", 30.48], ["hum", 11.68]], null, null, [["music", 53.19], ["didgeridoo", 20.23], ["musical instrument", 5.17]], [["music", 68.91], ["mains hum", 4.67], ["electronic music", 3.43]], [["music", 64.02], ["mains hum", 8.28], ["hum", 7.23]], null, null, null, [["music", 43.88], ["hum", 16.27], ["mains hum", 5.16]], [["speech", 22.86], ["mains hum", 22.17], ["music", 15.88]], null, [["livestock, farm animals, working animals", 56.27], ["cattle, bovinae", 12.97], ["moo", 7.96]]], "duration": [5.26, 22.05, 1.77, 1.89, 13.16, 7.28, 7.97, 34.22, 1.64, 0.46, 3.83, 3.94, 1.16, 14.4]} \ No newline at end of file diff --git a/annotations_1/WZ6JK1mPT-A_filtered.json b/annotations_1/WZ6JK1mPT-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdcd8ff0a30841383f51d591412903ee444b2394 --- /dev/null +++ b/annotations_1/WZ6JK1mPT-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.99], [3.0, 3.77], [8.0, 32.14], [34.0, 52.76], [54.0, 96.75], [98.0, 112.06], [114.0, 124.88]], "keep_status": [false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 30.94, 39.6, 0.0, 34.07, 30.26], "audiomae_on_audioset": [null, null, [["music", 62.46], ["boing", 8.01], ["whack, thwack", 2.65]], [["music", 47.4], ["theremin", 17.76], ["glockenspiel", 7.07]], null, [["music", 30.72], ["speech", 17.83], ["fart", 16.38]], [["music", 55.14], ["boing", 6.25], ["speech", 4.66]]], "duration": [-0.01, 0.77, 24.14, 18.76, 42.75, 14.06, 10.88]} \ No newline at end of file diff --git a/annotations_1/WZNe0TD1E-I_filtered.json b/annotations_1/WZNe0TD1E-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d3f6095ce1a24a24defe8924effc0d09093e008 --- /dev/null +++ b/annotations_1/WZNe0TD1E-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.83], [12.0, 12.68], [15.0, 15.82], [20.0, 20.07], [22.0, 23.63], [28.0, 28.32], [30.0, 30.65], [31.0, 32.24], [37.0, 37.2], [40.0, 41.44], [43.0, 44.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.83, 0.68, 0.82, 0.07, 1.63, 0.32, 0.65, 1.24, 0.2, 1.44, 1.2]} \ No newline at end of file diff --git a/annotations_1/W_EYrVGI7LQ_filtered.json b/annotations_1/W_EYrVGI7LQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4b2c2da271662859d046b391207a38c45a6ce25 --- /dev/null +++ b/annotations_1/W_EYrVGI7LQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.01], [11.0, 12.16], [23.0, 23.82], [30.0, 32.59], [33.0, 41.44], [44.0, 48.63], [50.0, 52.93], [54.0, 64.44], [65.0, 107.6], [108.0, 109.17], [114.0, 116.01], [121.0, 125.69], [132.0, 134.99], [147.0, 150.79], [154.0, 162.5]], "keep_status": [false, false, false, true, false, true, true, true, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.79, 31.09, 30.19, 37.98, 29.38, 0.0, 0.0, 35.15, 29.49, 28.87, 28.79, 29.38], "audiomae_on_audioset": [null, null, null, [["speech", 34.01], ["crowd", 8.24], ["music", 4.88]], [["speech", 34.56], ["eruption", 30.3], ["explosion", 12.5]], [["fly, housefly", 21.26], ["insect", 13.37], ["speech", 8.75]], [["music", 48.32], ["hum", 7.68], ["throbbing", 6.07]], [["music", 21.17], ["hum", 12.06], ["mains hum", 8.61]], null, null, [["music", 35.39], ["dubstep", 7.95], ["electronic music", 7.01]], [["music", 32.56], ["speech", 10.15], ["vehicle", 8.12]], [["speech", 55.12], ["music", 14.29], ["sound effect", 3.56]], [["music", 13.63], ["sound effect", 10.98], ["mains hum", 10.81]], [["music", 71.65], ["speech", 5.68], ["electronic music", 3.7]]], "duration": [0.01, 1.16, 0.82, 2.59, 8.44, 4.63, 2.93, 10.44, 42.6, 1.17, 2.01, 4.69, 2.99, 3.79, 8.5]} \ No newline at end of file diff --git a/annotations_1/W_fixpI0BL8_filtered.json b/annotations_1/W_fixpI0BL8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0aeb67cd7b2e8fa92ba31ede8552499334276b4f --- /dev/null +++ b/annotations_1/W_fixpI0BL8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.44], [4.0, 4.72], [7.0, 8.21], [8.0, 8.65], [9.0, 9.91], [17.0, 17.41], [20.0, 31.65], [33.0, 33.4], [34.0, 35.53], [37.0, 38.5], [41.0, 41.18], [41.0, 41.99], [42.0, 43.19], [43.0, 45.76], [56.0, 60.13], [63.0, 63.64], [66.0, 66.36], [68.0, 68.54], [69.0, 70.14], [73.0, 73.67], [75.0, 75.05], [75.0, 86.09], [88.0, 94.36], [98.0, 100.21], [103.0, 103.27], [103.0, 106.22], [118.0, 117.81], [120.0, 122.62], [123.0, 124.07], [125.0, 130.38]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.48, 49.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.23, 47.66, 40.97, 0.0, 38.36, 0.0, 71.29, 0.0, 36.06], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 18.06], ["speech", 8.27], ["heart sounds, heartbeat", 5.7]], null, null, null, null, null, null, [["rowboat, canoe, kayak", 21.94], ["speech", 11.31], ["boat, water vehicle", 10.4]], [["sidetone", 39.3], ["radio", 23.59], ["noise", 13.56]], null, null, null, null, null, null, [["livestock, farm animals, working animals", 29.89], ["cattle, bovinae", 12.71], ["animal", 11.66]], [["fly, housefly", 6.86], ["vehicle", 6.73], ["insect", 4.77]], [["music", 36.17], ["whistling", 11.74], ["radio", 8.2]], null, [["frog", 33.19], ["fly, housefly", 27.56], ["insect", 12.39]], null, null, null, [["fly, housefly", 41.28], ["insect", 38.76], ["mosquito", 10.15]]], "duration": [0.44, 0.72, 1.21, 0.65, 0.91, 0.41, 11.65, 0.4, 1.53, 1.5, 0.18, 0.99, 1.19, 2.76, 4.13, 0.64, 0.36, 0.54, 1.14, 0.67, 0.05, 11.09, 6.36, 2.21, 0.27, 3.22, -0.19, 2.62, 1.07, 5.38]} \ No newline at end of file diff --git a/annotations_1/W_qA7Xt_UPw_filtered.json b/annotations_1/W_qA7Xt_UPw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb153d709c87d732753ee0a4dc35d20667355c55 --- /dev/null +++ b/annotations_1/W_qA7Xt_UPw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 19.84], [20.0, 19.94], [20.0, 32.76], [43.0, 44.14], [45.0, 45.22], [46.0, 46.26], [49.0, 51.95], [54.0, 54.28], [55.0, 56.34], [57.0, 94.9], [103.0, 113.44]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.52, 0.0, 0.0, 0.0, 28.89, 0.0, 0.0, 0.0, 55.31], "audiomae_on_audioset": [null, null, [["frog", 28.05], ["insect", 19.38], ["speech", 13.73]], null, null, null, [["cattle, bovinae", 49.91], ["livestock, farm animals, working animals", 30.24], ["moo", 19.49]], null, null, null, null], "duration": [-0.16, -0.06, 12.76, 1.14, 0.22, 0.26, 2.95, 0.28, 1.34, 37.9, 10.44]} \ No newline at end of file diff --git a/annotations_1/Wa3l6Q7e5aA_filtered.json b/annotations_1/Wa3l6Q7e5aA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d82f9bec5377b785b67f5c2b3d40c026bb8d831 --- /dev/null +++ b/annotations_1/Wa3l6Q7e5aA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.58], [4.0, 5.8], [9.0, 8.88], [10.0, 10.3], [12.0, 12.24], [20.0, 33.61], [35.0, 49.45], [52.0, 59.1], [60.0, 61.55], [62.0, 67.96], [70.0, 71.36], [73.0, 76.94], [78.0, 79.32], [80.0, 83.25], [84.0, 92.45], [95.0, 96.11], [98.0, 102.3], [103.0, 107.7], [135.0, 136.68]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 28.37, 28.76, 28.88, 0.0, 39.17, 0.0, 28.83, 0.0, 32.42, 28.4, 0.0, 28.54, 29.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 44.82], ["throbbing", 10.46], ["hum", 6.24]], [["music", 81.02], ["electronic music", 4.46], ["cacophony", 1.97]], [["music", 88.56], ["electronic music", 3.08], ["dubstep", 1.31]], null, [["speech", 76.72], ["throbbing", 6.12], ["hum", 3.32]], null, [["didgeridoo", 32.91], ["music", 19.26], ["speech", 9.89]], null, [["music", 37.49], ["didgeridoo", 18.2], ["speech", 5.22]], [["music", 34.38], ["buzz", 12.92], ["didgeridoo", 12.16]], null, [["music", 64.02], ["throbbing", 10.71], ["hum", 6.43]], [["music", 43.31], ["throbbing", 17.47], ["hum", 14.61]], null], "duration": [-0.42, 1.8, -0.12, 0.3, 0.24, 13.61, 14.45, 7.1, 1.55, 5.96, 1.36, 3.94, 1.32, 3.25, 8.45, 1.11, 4.3, 4.7, 1.68]} \ No newline at end of file diff --git a/annotations_1/WavZVQM3U00_filtered.json b/annotations_1/WavZVQM3U00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a6d2e9257ed66494f1a7ff8e36977cff7788be1 --- /dev/null +++ b/annotations_1/WavZVQM3U00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.15], [13.0, 27.36], [28.0, 34.77], [38.0, 37.99], [38.0, 38.91], [41.0, 43.19], [45.0, 47.92], [51.0, 72.0], [73.0, 90.53], [97.0, 119.89]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [53.47, 58.13, 35.96, 0.0, 0.0, 67.51, 56.7, 51.44, 37.26, 33.0], "audiomae_on_audioset": [null, null, [["whale vocalization", 64.68], ["speech", 29.4], ["mosquito", 0.57]], null, null, null, null, null, [["music", 50.46], ["speech", 9.5], ["noise", 6.95]], [["fly, housefly", 46.61], ["insect", 23.11], ["mosquito", 10.02]]], "duration": [3.15, 14.36, 6.77, -0.01, 0.91, 2.19, 2.92, 21.0, 17.53, 22.89]} \ No newline at end of file diff --git a/annotations_1/WbFri7eX_YA_filtered.json b/annotations_1/WbFri7eX_YA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c1a0049f640cdb4d7706257a506e59337bf0c2d --- /dev/null +++ b/annotations_1/WbFri7eX_YA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.41], [12.0, 12.41], [15.0, 15.67], [17.0, 16.77], [19.0, 19.67], [21.0, 20.85], [21.0, 21.73], [25.0, 25.35], [28.0, 29.08], [32.0, 33.84], [34.0, 35.4], [38.0, 39.06], [41.0, 41.91], [45.0, 44.61], [45.0, 46.3], [49.0, 49.64], [52.0, 53.23], [56.0, 61.67], [64.0, 65.47], [69.0, 69.75], [71.0, 72.05], [75.0, 75.02], [76.0, 77.35], [79.0, 79.1], [80.0, 80.77], [84.0, 84.55], [88.0, 87.93], [89.0, 89.24], [90.0, 93.97], [97.0, 96.82], [99.0, 100.41], [103.0, 104.01], [105.0, 107.43], [108.0, 108.24], [110.0, 110.93], [113.0, 113.59], [115.0, 115.3], [116.0, 117.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.3, 0.0, 0.0, 0.0, 52.8, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.97], ["theremin", 20.22], ["whale vocalization", 6.27]], null, null, null, null, null, null, null, null, null, null, [["speech", 54.85], ["radio", 9.14], ["music", 6.71]], null, null, null, null, null, null, null, null, null], "duration": [0.41, 0.41, 0.67, -0.23, 0.67, -0.15, 0.73, 0.35, 1.08, 1.84, 1.4, 1.06, 0.91, -0.39, 1.3, 0.64, 1.23, 5.67, 1.47, 0.75, 1.05, 0.02, 1.35, 0.1, 0.77, 0.55, -0.07, 0.24, 3.97, -0.18, 1.41, 1.01, 2.43, 0.24, 0.93, 0.59, 0.3, 1.95]} \ No newline at end of file diff --git a/annotations_1/WbcZ3k4Mr6Q_filtered.json b/annotations_1/WbcZ3k4Mr6Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4c5a10f5beb9f212a2a52573d237321c8544e54 --- /dev/null +++ b/annotations_1/WbcZ3k4Mr6Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.45], [16.0, 16.41], [17.0, 16.68], [18.0, 18.0], [18.0, 18.72], [20.0, 20.06], [28.0, 29.2], [32.0, 34.11], [35.0, 35.48], [38.0, 41.76], [50.0, 50.09], [51.0, 51.92], [56.0, 56.51], [58.0, 57.92], [58.0, 59.07], [61.0, 62.77], [64.0, 65.4], [66.0, 87.07], [88.0, 91.86], [96.0, 96.92], [99.0, 99.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [55.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 37.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.66, 90.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["moo", 41.87], ["cattle, bovinae", 18.57], ["whale vocalization", 13.13]], null, null, null, null, null, null, null, [["speech", 49.41], ["explosion", 10.2], ["horse", 7.81]], null, null, null], "duration": [8.45, 0.41, -0.32, 0.0, 0.72, 0.06, 1.2, 2.11, 0.48, 3.76, 0.09, 0.92, 0.51, -0.08, 1.07, 1.77, 1.4, 21.07, 3.86, 0.92, 0.32]} \ No newline at end of file diff --git a/annotations_1/Wc_pikEIkcQ_filtered.json b/annotations_1/Wc_pikEIkcQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..117d53dc294a6e3d19d337c41106cdc8b5d83ad0 --- /dev/null +++ b/annotations_1/Wc_pikEIkcQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.42], [11.0, 12.41], [13.0, 14.27], [18.0, 46.75], [49.0, 65.2], [68.0, 70.14], [74.0, 74.41], [76.0, 82.17], [85.0, 88.21], [96.0, 97.46], [100.0, 101.46], [102.0, 103.32], [106.0, 106.39], [106.0, 106.91], [112.0, 113.27], [119.0, 121.88], [123.0, 123.33], [127.0, 131.25], [134.0, 134.4], [137.0, 138.81], [139.0, 144.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [71.87, 0.0, 0.0, 52.45, 33.54, 67.25, 0.0, 61.77, 89.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 36.13, 0.0, 0.0, 29.7], "audiomae_on_audioset": [null, null, null, null, [["music", 90.91], ["buzz", 1.71], ["theremin", 1.26]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.03], ["foghorn", 11.53], ["trombone", 10.64]], null, null, [["music", 37.8], ["mains hum", 17.36], ["hum", 12.19]]], "duration": [6.42, 1.41, 1.27, 28.75, 16.2, 2.14, 0.41, 6.17, 3.21, 1.46, 1.46, 1.32, 0.39, 0.91, 1.27, 2.88, 0.33, 4.25, 0.4, 1.81, 5.14]} \ No newline at end of file diff --git a/annotations_1/WcmMx1_lQmA_filtered.json b/annotations_1/WcmMx1_lQmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca165b0b90541a788133a8cfb826ccb1ca560c31 --- /dev/null +++ b/annotations_1/WcmMx1_lQmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [4.0, 3.92], [4.0, 6.13], [11.0, 10.96], [12.0, 13.07], [20.0, 20.22], [21.0, 21.68], [22.0, 24.98], [29.0, 29.37], [31.0, 31.75], [33.0, 33.64], [34.0, 34.28], [36.0, 37.23], [39.0, 47.07], [48.0, 50.9], [52.0, 52.76], [53.0, 54.84], [55.0, 59.56], [62.0, 62.88], [64.0, 66.07], [67.0, 68.17], [70.0, 72.05], [74.0, 74.82], [76.0, 76.79], [83.0, 85.21], [90.0, 90.56]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 42.37, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.51, 61.97, 0.0, 0.0, 30.74, 0.0, 29.36, 0.0, 62.27, 0.0, 0.0, 48.14, 0.0], "audiomae_on_audioset": [null, null, [["mains hum", 25.28], ["hum", 20.62], ["speech", 14.74]], null, null, null, null, [["buzzer", 15.73], ["speech", 11.26], ["ding", 10.41]], null, null, null, null, null, [["hum", 18.3], ["animal", 10.99], ["speech", 10.01]], null, null, null, [["hum", 20.05], ["whoosh, swoosh, swish", 10.27], ["mains hum", 10.08]], null, [["whack, thwack", 12.2], ["breaking", 7.37], ["frog", 6.32]], null, null, null, null, [["fly, housefly", 30.06], ["insect", 21.21], ["bee, wasp, etc.", 13.34]], null], "duration": [0.35, -0.08, 2.13, -0.04, 1.07, 0.22, 0.68, 2.98, 0.37, 0.75, 0.64, 0.28, 1.23, 8.07, 2.9, 0.76, 1.84, 4.56, 0.88, 2.07, 1.17, 2.05, 0.82, 0.79, 2.21, 0.56]} \ No newline at end of file diff --git a/annotations_1/WcsyV7eMrGI_filtered.json b/annotations_1/WcsyV7eMrGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01f00c601e8197f15a6e64b560899aa7e870f24e --- /dev/null +++ b/annotations_1/WcsyV7eMrGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.52], [17.0, 18.03], [25.0, 26.94], [41.0, 41.55]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.52, 1.03, 1.94, 0.55]} \ No newline at end of file diff --git a/annotations_1/Wd5RTjtSSxk_filtered.json b/annotations_1/Wd5RTjtSSxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68fd758f3c7adcc1d3064d2b3af983dfa1f336f1 --- /dev/null +++ b/annotations_1/Wd5RTjtSSxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.74], [15.0, 14.77], [15.0, 18.81], [20.0, 19.94], [38.0, 64.69], [65.0, 76.96], [78.0, 78.06], [79.0, 80.99], [81.0, 84.13], [85.0, 85.5], [88.0, 92.15], [108.0, 109.11], [114.0, 117.0]], "keep_status": [false, false, false, false, true, true, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 30.71, 0.0, 39.01, 37.51, 0.0, 0.0, 38.94, 0.0, 36.7, 0.0, 32.79], "audiomae_on_audioset": [null, null, [["music", 59.21], ["dubstep", 8.4], ["electronic music", 6.24]], null, [["music", 52.39], ["electronic music", 8.48], ["throbbing", 8.4]], [["music", 29.35], ["throbbing", 27.63], ["hum", 13.02]], null, null, [["mains hum", 23.02], ["hum", 16.29], ["speech", 10.71]], null, [["speech", 33.9], ["music", 26.65], ["hum", 6.82]], null, [["music", 41.14], ["speech", 18.15], ["sidetone", 10.84]]], "duration": [-0.26, -0.23, 3.81, -0.06, 26.69, 11.96, 0.06, 1.99, 3.13, 0.5, 4.15, 1.11, 3.0]} \ No newline at end of file diff --git a/annotations_1/WdS4ZMa6tXM_filtered.json b/annotations_1/WdS4ZMa6tXM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fea3ee2f2a1e1dc25b210663ccaf49c5b814531 --- /dev/null +++ b/annotations_1/WdS4ZMa6tXM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.32], [6.0, 6.83], [7.0, 8.83], [10.0, 10.34], [11.0, 11.57], [13.0, 15.4], [16.0, 17.14], [26.0, 26.99], [30.0, 30.75], [41.0, 43.14], [55.0, 58.41], [59.0, 60.18], [60.0, 61.7], [63.0, 68.08], [70.0, 72.3], [75.0, 76.1], [78.0, 88.42], [90.0, 102.37], [105.0, 105.0], [107.0, 110.15], [112.0, 111.72], [121.0, 121.19], [122.0, 122.5], [123.0, 124.65], [126.0, 126.39], [127.0, 127.48], [128.0, 128.51], [129.0, 129.52], [132.0, 132.34], [134.0, 135.82], [138.0, 143.28], [147.0, 148.58], [149.0, 150.57], [156.0, 156.46], [158.0, 161.06], [164.0, 166.16], [168.0, 175.1], [177.0, 181.52], [183.0, 183.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 48.56, 0.0, 0.0, 0.0, 35.98, 54.76, 0.0, 0.0, 38.19, 36.07, 0.0, 33.32, 32.68, 0.0, 67.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.47, 0.0, 0.0, 0.0, 64.75, 62.27, 54.63, 98.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["siren", 72.67], ["civil defense siren", 21.57], ["police car (siren)", 3.5]], null, null, null, [["music", 74.83], ["frog", 3.87], ["synthesizer", 2.29]], null, null, null, [["music", 63.38], ["electronic music", 4.01], ["speech", 3.63]], [["music", 56.73], ["speech", 19.36], ["boing", 4.54]], null, [["music", 49.65], ["speech", 32.48], ["electronic music", 2.66]], [["music", 63.48], ["speech", 17.01], ["musical instrument", 4.07]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 69.37], ["musical instrument", 5.25], ["synthesizer", 4.95]], null, null, null, null, null, null, null, null], "duration": [1.32, 0.83, 1.83, 0.34, 0.57, 2.4, 1.14, 0.99, 0.75, 2.14, 3.41, 1.18, 1.7, 5.08, 2.3, 1.1, 10.42, 12.37, 0.0, 3.15, -0.28, 0.19, 0.5, 1.65, 0.39, 0.48, 0.51, 0.52, 0.34, 1.82, 5.28, 1.58, 1.57, 0.46, 3.06, 2.16, 7.1, 4.52, 0.96]} \ No newline at end of file diff --git a/annotations_1/WdzNa6wmtpw_filtered.json b/annotations_1/WdzNa6wmtpw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8d2562239612d4d95344f681db622d20382ab66 --- /dev/null +++ b/annotations_1/WdzNa6wmtpw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 34.48], [36.0, 50.53], [51.0, 51.36], [52.0, 83.84], [84.0, 85.43], [87.0, 91.69], [97.0, 97.46], [99.0, 100.55], [102.0, 136.59]], "keep_status": [false, true, false, false, false, true, false, false, false], "silence_prob": [31.36, 30.77, 0.0, 0.0, 0.0, 43.82, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 84.37], ["speech", 3.09], ["sheep", 0.98]], [["throbbing", 24.12], ["hum", 20.38], ["speech", 17.99]], null, null, null, [["music", 45.22], ["throbbing", 13.3], ["hum", 7.64]], null, null, null], "duration": [14.48, 14.53, 0.36, 31.84, 1.43, 4.69, 0.46, 1.55, 34.59]} \ No newline at end of file diff --git a/annotations_1/WeSHSxMfC0A_filtered.json b/annotations_1/WeSHSxMfC0A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc22e8ea8ed4a1070a5b9806789ca164eea047f4 --- /dev/null +++ b/annotations_1/WeSHSxMfC0A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 32.58], [34.0, 34.3], [35.0, 39.61], [44.0, 67.29], [68.0, 68.4], [87.0, 92.69], [100.0, 100.23], [107.0, 133.71], [138.0, 138.77], [140.0, 141.2], [145.0, 144.61], [145.0, 146.4]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [66.51, 0.0, 74.76, 45.56, 0.0, 84.25, 0.0, 37.49, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 62.91], ["speech", 3.84], ["singing bowl", 3.23]], null, null, null, [["music", 49.93], ["speech", 18.04], ["thunk", 4.71]], null, null, null, null], "duration": [20.58, 0.3, 4.61, 23.29, 0.4, 5.69, 0.23, 26.71, 0.77, 1.2, -0.39, 1.4]} \ No newline at end of file diff --git a/annotations_1/Wf6feYvdHs4_filtered.json b/annotations_1/Wf6feYvdHs4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e09e887c778b1030b3424c01c3a2fff3e2efbd3 --- /dev/null +++ b/annotations_1/Wf6feYvdHs4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 30.97], [34.0, 43.02], [62.0, 67.02], [77.0, 78.36], [80.0, 82.0], [106.0, 106.32], [109.0, 113.02], [115.0, 129.27], [130.0, 130.32]], "keep_status": [false, true, false, false, true, false, true, true, false], "silence_prob": [0.0, 30.01, 36.28, 0.0, 38.86, 0.0, 38.93, 44.23, 0.0], "audiomae_on_audioset": [null, [["speech", 40.86], ["animal", 10.72], ["frog", 9.0]], [["whistling", 37.28], ["speech", 25.8], ["radio", 8.56]], null, [["hum", 9.59], ["eruption", 6.73], ["mains hum", 6.5]], null, [["theremin", 24.13], ["chirp tone", 19.71], ["whale vocalization", 9.0]], [["hum", 13.37], ["noise", 10.86], ["animal", 8.71]], null], "duration": [-0.03, 9.02, 5.02, 1.36, 2.0, 0.32, 4.02, 14.27, 0.32]} \ No newline at end of file diff --git a/annotations_1/WfAp-jZV5Bo_filtered.json b/annotations_1/WfAp-jZV5Bo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0de466aa04c3f714aca3359e49dc93b0431d719 --- /dev/null +++ b/annotations_1/WfAp-jZV5Bo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.93], [5.0, 6.81], [9.0, 30.42], [34.0, 36.51], [37.0, 37.49], [40.0, 41.18], [42.0, 113.85], [115.0, 136.51]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 32.0, 94.52, 0.0, 0.0, 0.0, 33.29], "audiomae_on_audioset": [null, null, [["breaking", 51.73], ["music", 16.56], ["buzz", 6.74]], null, null, null, null, [["music", 32.74], ["sonar", 12.1], ["hum", 5.54]]], "duration": [0.93, 1.81, 21.42, 2.51, 0.49, 1.18, 71.85, 21.51]} \ No newline at end of file diff --git a/annotations_1/WfCufFRo-hU_filtered.json b/annotations_1/WfCufFRo-hU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..749af98c26d29786fde44aef4f84a5f80fd03214 --- /dev/null +++ b/annotations_1/WfCufFRo-hU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 5.04], [8.0, 9.76], [12.0, 13.51], [16.0, 18.6], [20.0, 21.12], [21.0, 22.52], [23.0, 30.08], [30.0, 30.45], [31.0, 32.51], [33.0, 36.39], [40.0, 41.76], [44.0, 45.4], [47.0, 47.51], [49.0, 50.48], [51.0, 51.92], [54.0, 57.37], [58.0, 60.37], [61.0, 62.4], [63.0, 66.38], [68.0, 69.16], [73.0, 73.68], [74.0, 76.08], [79.0, 80.7], [82.0, 83.59], [85.0, 86.49], [88.0, 88.72], [90.0, 91.67], [93.0, 94.22], [96.0, 97.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.08, 0.0, 0.0, 95.51, 0.0, 0.0, 63.96, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 99.78, 0.0, 79.41, 0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.04, 1.76, 1.51, 2.6, 1.12, 1.52, 7.08, 0.45, 1.51, 3.39, 1.76, 1.4, 0.51, 1.48, 0.92, 3.37, 2.37, 1.4, 3.38, 1.16, 0.68, 2.08, 1.7, 1.59, 1.49, 0.72, 1.67, 1.22, 1.16]} \ No newline at end of file diff --git a/annotations_1/WgMhaDEPGXo_filtered.json b/annotations_1/WgMhaDEPGXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da8a182197997f68b6cacba1de15a5bd2c287824 --- /dev/null +++ b/annotations_1/WgMhaDEPGXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.83], [13.0, 13.53], [14.0, 14.3], [17.0, 17.36], [23.0, 23.16], [24.0, 26.1], [27.0, 28.66], [30.0, 30.96], [31.0, 32.63], [34.0, 35.21], [37.0, 40.14], [46.0, 51.17], [52.0, 53.99], [57.0, 57.65], [58.0, 59.53], [60.0, 65.25], [67.0, 79.52], [80.0, 85.82], [88.0, 90.04], [91.0, 94.85], [96.0, 100.26], [101.0, 100.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 81.0, 62.89, 0.0, 0.0, 0.0, 95.09, 49.5, 41.12, 47.27, 40.09, 35.45, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.54], ["theremin", 13.18], ["musical instrument", 3.7]], [["music", 78.95], ["theremin", 8.16], ["musical instrument", 2.74]], [["speech", 41.76], ["music", 19.83], ["mains hum", 6.95]], [["theremin", 67.11], ["music", 23.66], ["musical instrument", 1.12]], [["music", 41.89], ["theremin", 16.6], ["foghorn", 5.03]], null], "duration": [-0.17, 0.53, 0.3, 0.36, 0.16, 2.1, 1.66, 0.96, 1.63, 1.21, 3.14, 5.17, 1.99, 0.65, 1.53, 5.25, 12.52, 5.82, 2.04, 3.85, 4.26, -0.23]} \ No newline at end of file diff --git a/annotations_1/WgXQnXPb-TA_filtered.json b/annotations_1/WgXQnXPb-TA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d21ad391f43268b8bd83b7ed74566219d397e16b --- /dev/null +++ b/annotations_1/WgXQnXPb-TA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.05], [11.0, 11.2], [15.0, 16.16], [19.0, 18.67], [27.0, 27.16], [30.0, 30.59], [37.0, 40.07], [43.0, 47.02], [48.0, 50.9], [53.0, 55.73], [56.0, 70.07], [75.0, 75.71], [81.0, 80.74], [84.0, 85.97], [87.0, 89.29], [89.0, 89.8], [90.0, 93.43], [97.0, 97.75], [107.0, 110.94], [113.0, 113.16], [119.0, 119.82], [121.0, 122.32]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.6, 43.08, 51.18, 49.68, 36.22, 0.0, 0.0, 0.0, 92.15, 0.0, 59.15, 0.0, 70.58, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 20.85], ["music", 12.4], ["busy signal", 7.34]], [["music", 49.78], ["speech", 25.42], ["musical instrument", 2.48]], null, [["music", 48.38], ["speech", 8.05], ["mains hum", 3.39]], [["music", 37.51], ["singing bowl", 24.67], ["speech", 11.44]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 0.2, 1.16, -0.33, 0.16, 0.59, 3.07, 4.02, 2.9, 2.73, 14.07, 0.71, -0.26, 1.97, 2.29, 0.8, 3.43, 0.75, 3.94, 0.16, 0.82, 1.32]} \ No newline at end of file diff --git a/annotations_1/WhT70B0c7TE_filtered.json b/annotations_1/WhT70B0c7TE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db4065f5e961860ed364ac0ce1f0054311425519 --- /dev/null +++ b/annotations_1/WhT70B0c7TE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.01], [17.0, 17.32], [19.0, 19.58], [20.0, 22.47], [31.0, 31.45], [35.0, 35.19], [38.0, 38.15], [50.0, 51.53], [67.0, 67.64], [69.0, 84.94], [85.0, 86.26], [87.0, 87.76], [88.0, 88.55], [89.0, 88.64], [89.0, 88.72], [89.0, 89.78], [91.0, 92.33], [93.0, 108.67], [113.0, 114.76], [119.0, 119.42]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.04, 0.0, 0.0, 0.0, 0.0, 0.0, 31.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 43.0], ["foghorn", 9.62], ["speech", 9.32]], null, null, null, null, null, null, null, [["music", 66.98], ["synthesizer", 12.56], ["musical instrument", 2.88]], null, null], "duration": [1.01, 0.32, 0.58, 2.47, 0.45, 0.19, 0.15, 1.53, 0.64, 15.94, 1.26, 0.76, 0.55, -0.36, -0.28, 0.78, 1.33, 15.67, 1.76, 0.42]} \ No newline at end of file diff --git a/annotations_1/WhUvsKY-l28_filtered.json b/annotations_1/WhUvsKY-l28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b603d647f56108605ee3df8a753c88bed5b8953 --- /dev/null +++ b/annotations_1/WhUvsKY-l28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.02], [5.0, 6.22], [7.0, 9.14], [12.0, 12.78], [15.0, 15.65], [17.0, 17.91], [19.0, 20.71], [25.0, 26.03], [31.0, 30.74], [31.0, 32.49], [42.0, 42.92], [53.0, 54.03], [61.0, 62.02], [64.0, 64.77], [67.0, 67.88], [89.0, 90.07], [99.0, 100.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [74.44, 0.0, 78.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.02, 1.22, 2.14, 0.78, 0.65, 0.91, 1.71, 1.03, -0.26, 1.49, 0.92, 1.03, 1.02, 0.77, 0.88, 1.07, 1.89]} \ No newline at end of file diff --git a/annotations_1/Wi4OhwrVwP8_filtered.json b/annotations_1/Wi4OhwrVwP8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb20f15eac786c6feb4a1784ed51f3492213ac1c --- /dev/null +++ b/annotations_1/Wi4OhwrVwP8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.74], [9.0, 16.68], [18.0, 18.4], [21.0, 20.61], [21.0, 23.97], [25.0, 26.92], [30.0, 39.04], [40.0, 42.03], [48.0, 73.33], [79.0, 89.77], [94.0, 130.94], [132.0, 137.29], [143.0, 149.03], [150.0, 161.5]], "keep_status": [true, false, false, false, false, false, false, false, true, true, false, false, true, false], "silence_prob": [29.08, 28.86, 0.0, 0.0, 29.54, 0.0, 29.73, 30.44, 28.4, 30.28, 0.0, 61.37, 35.29, 55.18], "audiomae_on_audioset": [[["speech", 29.65], ["hum", 27.59], ["mains hum", 11.11]], [["hum", 43.39], ["throbbing", 26.87], ["music", 13.51]], null, null, [["hum", 54.85], ["throbbing", 19.22], ["mains hum", 9.81]], null, [["music", 52.68], ["throbbing", 21.95], ["hum", 10.79]], [["music", 79.93], ["musical instrument", 3.53], ["synthesizer", 3.17]], [["mains hum", 23.21], ["hum", 21.44], ["speech", 18.71]], [["hum", 27.08], ["rumble", 25.76], ["mains hum", 14.31]], null, null, [["mains hum", 37.43], ["hum", 23.63], ["creak", 7.36]], null], "duration": [5.74, 7.68, 0.4, -0.39, 2.97, 1.92, 9.04, 2.03, 25.33, 10.77, 36.94, 5.29, 6.03, 11.5]} \ No newline at end of file diff --git a/annotations_1/WkEK2NyGq10_filtered.json b/annotations_1/WkEK2NyGq10_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e239fb852b197d628d25884e7f2ac3ff2dc2e4a --- /dev/null +++ b/annotations_1/WkEK2NyGq10_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.88], [8.0, 7.96], [9.0, 8.95], [11.0, 11.91], [14.0, 20.39], [22.0, 30.57], [31.0, 37.57], [41.0, 56.74], [59.0, 61.7], [64.0, 64.88], [67.0, 68.32], [94.0, 111.62], [114.0, 118.03], [125.0, 125.78], [126.0, 127.62], [128.0, 128.22], [129.0, 128.87], [137.0, 137.29]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.33, 46.15, 40.28, 49.92, 35.98, 0.0, 0.0, 31.0, 30.65, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 62.25], ["synthesizer", 5.74], ["ambient music", 3.49]], [["music", 55.57], ["hum", 15.18], ["ambient music", 3.48]], [["music", 29.99], ["hum", 23.64], ["ambient music", 10.55]], [["hum", 31.34], ["music", 30.02], ["mains hum", 6.34]], [["groan", 19.27], ["livestock, farm animals, working animals", 9.99], ["cattle, bovinae", 9.27]], null, null, [["boing", 36.49], ["gong", 12.04], ["music", 10.62]], [["music", 27.22], ["groan", 24.19], ["didgeridoo", 10.84]], null, null, null, null, null], "duration": [1.88, -0.04, -0.05, 0.91, 6.39, 8.57, 6.57, 15.74, 2.7, 0.88, 1.32, 17.62, 4.03, 0.78, 1.62, 0.22, -0.13, 0.29]} \ No newline at end of file diff --git a/annotations_1/WksivsiSF_o_filtered.json b/annotations_1/WksivsiSF_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8ccc66752b3c912a79cd0837becb8eafc43555c --- /dev/null +++ b/annotations_1/WksivsiSF_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.26], [21.0, 21.52], [25.0, 26.08], [27.0, 29.2], [30.0, 38.55], [44.0, 44.41], [45.0, 54.72], [57.0, 97.61], [100.0, 119.94]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [66.63, 0.0, 0.0, 87.19, 49.54, 0.0, 56.78, 0.0, 44.26], "audiomae_on_audioset": [null, null, null, null, [["music", 72.8], ["hum", 9.05], ["mains hum", 7.64]], null, null, null, [["music", 74.3], ["hum", 6.1], ["throbbing", 4.35]]], "duration": [2.26, 0.52, 1.08, 2.2, 8.55, 0.41, 9.72, 40.61, 19.94]} \ No newline at end of file diff --git a/annotations_1/Wl6COOA3V6Y_filtered.json b/annotations_1/Wl6COOA3V6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..584c741638a7872d2b1b9afdfe2e336eb806cc39 --- /dev/null +++ b/annotations_1/Wl6COOA3V6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.9], [14.0, 15.16], [19.0, 21.36], [31.0, 32.58], [34.0, 45.44], [47.0, 47.28], [47.0, 51.51], [55.0, 58.11], [60.0, 60.62], [61.0, 88.75], [95.0, 95.07], [96.0, 97.68]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [63.53, 0.0, 91.81, 0.0, 29.9, 0.0, 28.64, 28.71, 0.0, 30.11, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 70.79], ["whack, thwack", 3.66], ["explosion", 2.93]], null, [["grunt", 22.89], ["sound effect", 18.65], ["speech", 15.87]], [["scratching (performance technique)", 26.55], ["sound effect", 21.74], ["music", 12.12]], null, [["music", 64.57], ["noise", 5.08], ["effects unit", 3.06]], null, null], "duration": [2.9, 1.16, 2.36, 1.58, 11.44, 0.28, 4.51, 3.11, 0.62, 27.75, 0.07, 1.68]} \ No newline at end of file diff --git a/annotations_1/WlvCTpjwaXE_filtered.json b/annotations_1/WlvCTpjwaXE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..792ce8d5f06ad242a99f03ab934d00e49be2848a --- /dev/null +++ b/annotations_1/WlvCTpjwaXE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 20.76], [22.0, 22.65], [24.0, 25.08], [28.0, 28.29], [39.0, 44.95], [47.0, 54.31], [59.0, 59.09], [67.0, 67.24], [69.0, 69.87], [72.0, 76.27], [77.0, 77.43], [79.0, 80.86], [83.0, 84.13], [87.0, 87.12], [88.0, 88.28], [89.0, 93.06], [94.0, 94.31], [99.0, 100.2], [102.0, 107.59], [109.0, 110.35], [110.0, 110.42], [111.0, 110.64], [111.0, 111.65]], "keep_status": [true, false, false, false, true, true, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [32.03, 0.0, 0.0, 0.0, 42.67, 36.97, 0.0, 0.0, 0.0, 36.63, 0.0, 0.0, 0.0, 0.0, 0.0, 39.74, 0.0, 0.0, 74.6, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 25.46], ["music", 24.93], ["mains hum", 12.25]], null, null, null, [["frog", 23.72], ["insect", 13.55], ["grunt", 8.34]], [["fly, housefly", 15.45], ["insect", 15.21], ["speech", 14.97]], null, null, null, [["fly, housefly", 20.21], ["insect", 18.49], ["electric shaver, electric razor", 13.71]], null, null, null, null, null, [["insect", 22.87], ["fly, housefly", 14.02], ["fart", 7.6]], null, null, null, null, null, null, null], "duration": [14.76, 0.65, 1.08, 0.29, 5.95, 7.31, 0.09, 0.24, 0.87, 4.27, 0.43, 1.86, 1.13, 0.12, 0.28, 4.06, 0.31, 1.2, 5.59, 1.35, 0.42, -0.36, 0.65]} \ No newline at end of file diff --git a/annotations_1/WmFiW2CSiO4_filtered.json b/annotations_1/WmFiW2CSiO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0348d2aac5e1448b08b1a0b130b86096f1b86dd --- /dev/null +++ b/annotations_1/WmFiW2CSiO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.52], [3.0, 3.72], [6.0, 8.83], [9.0, 10.49], [29.0, 29.81], [36.0, 38.35], [45.0, 45.22], [49.0, 50.48], [53.0, 56.07], [58.0, 59.05], [60.0, 61.23], [62.0, 62.95], [65.0, 68.42], [70.0, 72.82], [75.0, 78.14], [80.0, 79.93], [83.0, 83.42]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 69.74, 0.0, 0.0, 93.45, 0.0, 0.0, 35.03, 0.0, 0.0, 0.0, 54.3, 78.38, 85.17, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["sneeze", 13.59], ["whack, thwack", 13.4], ["whale vocalization", 10.72]], null, null, null, null, null, null, null, null], "duration": [1.52, 0.72, 2.83, 1.49, 0.81, 2.35, 0.22, 1.48, 3.07, 1.05, 1.23, 0.95, 3.42, 2.82, 3.14, -0.07, 0.42]} \ No newline at end of file diff --git a/annotations_1/Wm_7niZcI1s_filtered.json b/annotations_1/Wm_7niZcI1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a002f84a9a20af7881affa508fbe4b89bca40ca --- /dev/null +++ b/annotations_1/Wm_7niZcI1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.78], [6.0, 8.9], [13.0, 13.44], [15.0, 17.24], [26.0, 28.24], [32.0, 34.47], [38.0, 39.33], [40.0, 40.41], [42.0, 46.84], [51.0, 52.47], [57.0, 57.47], [62.0, 64.54], [70.0, 78.38], [80.0, 82.14], [83.0, 83.88], [84.0, 85.43], [87.0, 90.29], [92.0, 93.43], [95.0, 95.62], [96.0, 97.88], [98.0, 98.91], [100.0, 102.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 66.63, 0.0, 60.6, 96.04, 82.61, 0.0, 0.0, 77.7, 0.0, 0.0, 92.97, 50.41, 100.0, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 90.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.78, 2.9, 0.44, 2.24, 2.24, 2.47, 1.33, 0.41, 4.84, 1.47, 0.47, 2.54, 8.38, 2.14, 0.88, 1.43, 3.29, 1.43, 0.62, 1.88, 0.91, 2.96]} \ No newline at end of file diff --git a/annotations_1/Wmo60ltq-TA_filtered.json b/annotations_1/Wmo60ltq-TA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65e462f61622b0011303374f5a004e09c49c0a9f --- /dev/null +++ b/annotations_1/Wmo60ltq-TA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.91], [12.0, 12.06], [14.0, 15.26], [16.0, 16.95], [19.0, 19.21], [21.0, 22.2], [24.0, 24.54], [27.0, 28.59], [30.0, 31.31], [35.0, 35.34], [36.0, 36.91], [41.0, 41.42], [43.0, 44.46], [46.0, 48.25], [55.0, 55.0], [58.0, 59.43], [63.0, 65.62], [66.0, 65.82], [66.0, 67.58], [72.0, 72.3], [73.0, 74.7], [75.0, 76.6], [80.0, 80.23], [82.0, 82.21], [84.0, 85.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 47.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.44], ["speech", 14.61], ["didgeridoo", 10.47]], null, null, null, null, null, null, null, null], "duration": [-0.09, 0.06, 1.26, 0.95, 0.21, 1.2, 0.54, 1.59, 1.31, 0.34, 0.91, 0.42, 1.46, 2.25, 0.0, 1.43, 2.62, -0.18, 1.58, 0.3, 1.7, 1.6, 0.23, 0.21, 1.36]} \ No newline at end of file diff --git a/annotations_1/WmzictYYVj4_filtered.json b/annotations_1/WmzictYYVj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdbb2b67f0b397162a0adb49d9fc73f277d91d58 --- /dev/null +++ b/annotations_1/WmzictYYVj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.92], [4.0, 5.05], [9.0, 10.56], [11.0, 11.18], [12.0, 12.82], [14.0, 15.72], [16.0, 17.76], [18.0, 22.05], [22.0, 27.51], [28.0, 30.18], [33.0, 33.22], [34.0, 34.13], [36.0, 38.43], [39.0, 39.02], [41.0, 41.72], [44.0, 45.0], [46.0, 47.39], [48.0, 47.73], [55.0, 55.54], [57.0, 58.58], [59.0, 59.85], [60.0, 63.78], [66.0, 67.31], [68.0, 78.54], [81.0, 81.14], [85.0, 85.63], [86.0, 86.21], [88.0, 88.7], [91.0, 90.76], [92.0, 93.48], [94.0, 94.69], [96.0, 100.35], [100.0, 100.94], [104.0, 103.79], [106.0, 106.22], [108.0, 108.09], [109.0, 110.37], [114.0, 116.13], [118.0, 118.49], [119.0, 119.43], [120.0, 121.04], [125.0, 127.8], [128.0, 130.57], [132.0, 132.53], [134.0, 134.2], [136.0, 136.46], [137.0, 138.28], [141.0, 140.83], [141.0, 141.07], [143.0, 145.29], [146.0, 155.87], [157.0, 161.81], [163.0, 163.9], [165.0, 165.52], [180.0, 180.45], [183.0, 183.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 62.37, 89.72, 0.0, 0.0, 60.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 0.0, 99.97, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 82.97, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 1.05, 1.56, 0.18, 0.82, 1.72, 1.76, 4.05, 5.51, 2.18, 0.22, 0.13, 2.43, 0.02, 0.72, 1.0, 1.39, -0.27, 0.54, 1.58, 0.85, 3.78, 1.31, 10.54, 0.14, 0.63, 0.21, 0.7, -0.24, 1.48, 0.69, 4.35, 0.94, -0.21, 0.22, 0.09, 1.37, 2.13, 0.49, 0.43, 1.04, 2.8, 2.57, 0.53, 0.2, 0.46, 1.28, -0.17, 0.07, 2.29, 9.87, 4.81, 0.9, 0.52, 0.45, 0.64]} \ No newline at end of file diff --git a/annotations_1/WnAVeKAUxPY_filtered.json b/annotations_1/WnAVeKAUxPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4789cd74c032ea7a943e6a3f13940724ba1a432 --- /dev/null +++ b/annotations_1/WnAVeKAUxPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.69], [11.0, 11.03], [14.0, 17.47], [28.0, 28.21], [30.0, 30.97], [32.0, 32.44], [37.0, 37.07], [40.0, 40.83], [44.0, 44.9], [46.0, 62.26], [63.0, 66.63], [68.0, 72.96], [76.0, 78.36], [83.0, 83.79], [86.0, 86.36], [88.0, 88.48], [91.0, 91.37], [92.0, 92.67], [94.0, 95.18], [97.0, 97.65], [99.0, 99.06], [102.0, 103.57], [108.0, 108.21], [109.0, 110.27], [112.0, 113.56], [114.0, 115.25], [118.0, 118.52], [120.0, 120.45], [120.0, 120.53], [125.0, 127.11], [129.0, 136.21], [137.0, 137.62], [139.0, 139.41], [139.0, 146.42], [147.0, 156.83], [160.0, 161.42], [162.0, 166.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 35.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.63, 66.51, 67.13, 63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.83, 49.31, 0.0, 0.0, 41.85, 62.58, 0.0, 45.98], "audiomae_on_audioset": [null, null, [["speech", 57.86], ["music", 14.28], ["musical instrument", 5.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 36.61], ["hum", 33.26], ["speech", 13.58]], null, null, [["speech", 59.77], ["thunk", 9.34], ["hum", 4.95]], null, null, [["speech", 46.13], ["cough", 28.83], ["throat clearing", 3.66]]], "duration": [5.69, 0.03, 3.47, 0.21, 0.97, 0.44, 0.07, 0.83, 0.9, 16.26, 3.63, 4.96, 2.36, 0.79, 0.36, 0.48, 0.37, 0.67, 1.18, 0.65, 0.06, 1.57, 0.21, 1.27, 1.56, 1.25, 0.52, 0.45, 0.53, 2.11, 7.21, 0.62, 0.41, 7.42, 9.83, 1.42, 4.97]} \ No newline at end of file diff --git a/annotations_1/WncnbHD-JXI_filtered.json b/annotations_1/WncnbHD-JXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07946daf92f53cab6cf7ea7ab18e252607940154 --- /dev/null +++ b/annotations_1/WncnbHD-JXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.75], [21.0, 22.79], [23.0, 23.5], [25.0, 27.82], [29.0, 31.33], [33.0, 38.53], [42.0, 42.53], [44.0, 49.52], [51.0, 51.7], [53.0, 66.68], [69.0, 71.86], [80.0, 80.22], [82.0, 82.98], [91.0, 91.37]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.28, 36.9, 32.21, 0.0, 33.79, 0.0, 33.56, 51.07, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["livestock, farm animals, working animals", 63.42], ["cowbell", 13.96], ["cattle, bovinae", 8.47]], [["music", 18.64], ["livestock, farm animals, working animals", 13.46], ["cattle, bovinae", 12.63]], [["music", 64.05], ["speech", 14.37], ["whack, thwack", 2.36]], null, [["music", 29.48], ["speech", 25.28], ["sidetone", 21.73]], null, [["music", 49.35], ["boing", 26.46], ["speech", 6.12]], null, null, null, null], "duration": [1.75, 1.79, 0.5, 2.82, 2.33, 5.53, 0.53, 5.52, 0.7, 13.68, 2.86, 0.22, 0.98, 0.37]} \ No newline at end of file diff --git a/annotations_1/Wnocz8UrhQw_filtered.json b/annotations_1/Wnocz8UrhQw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e1864cd3370b1330108238c652a305e41f93e17 --- /dev/null +++ b/annotations_1/Wnocz8UrhQw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[58.0, 59.19], [60.0, 89.45], [91.0, 91.39], [94.0, 118.45]], "keep_status": [false, true, false, true], "silence_prob": [0.0, 30.68, 0.0, 30.37], "audiomae_on_audioset": [null, [["music", 46.69], ["throbbing", 9.97], ["hum", 8.55]], null, [["vehicle", 23.61], ["music", 19.45], ["speech", 14.89]]], "duration": [1.19, 29.45, 0.39, 24.45]} \ No newline at end of file diff --git a/annotations_1/WnrOQRdqiQ4_filtered.json b/annotations_1/WnrOQRdqiQ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18b2c6dcb4dcbb4918c3ba4f7cecf830e357b1d9 --- /dev/null +++ b/annotations_1/WnrOQRdqiQ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.96], [16.0, 18.06], [18.0, 21.19], [23.0, 24.07], [24.0, 26.45], [27.0, 30.33], [33.0, 35.5], [38.0, 42.04], [42.0, 44.31], [46.0, 48.49], [49.0, 51.93], [53.0, 56.08], [58.0, 58.28], [63.0, 64.66], [65.0, 68.34], [72.0, 75.42], [76.0, 77.94], [79.0, 79.93], [81.0, 81.73], [82.0, 85.63], [86.0, 88.33], [90.0, 89.78], [90.0, 93.65], [95.0, 95.93], [98.0, 98.86], [102.0, 102.69], [105.0, 106.61], [112.0, 113.12], [113.0, 114.03], [130.0, 130.5]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.27, 99.98, 100.0, 0.0, 93.13, 99.96, 99.9, 51.23, 78.72, 100.0, 98.19, 99.92, 0.0, 0.0, 99.96, 99.98, 0.0, 0.0, 0.0, 80.64, 63.74, 0.0, 52.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 15.97], ["sound effect", 6.24], ["synthesizer", 5.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.96, 2.06, 3.19, 1.07, 2.45, 3.33, 2.5, 4.04, 2.31, 2.49, 2.93, 3.08, 0.28, 1.66, 3.34, 3.42, 1.94, 0.93, 0.73, 3.63, 2.33, -0.22, 3.65, 0.93, 0.86, 0.69, 1.61, 1.12, 1.03, 0.5]} \ No newline at end of file diff --git a/annotations_1/Wo4U1SqnRpA_filtered.json b/annotations_1/Wo4U1SqnRpA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23f5f4872fcfacd99a0f7e28a2d549264ce6c0f3 --- /dev/null +++ b/annotations_1/Wo4U1SqnRpA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.36], [14.0, 15.08], [16.0, 16.61], [18.0, 19.13], [22.0, 22.6], [27.0, 27.36], [28.0, 29.24], [32.0, 34.15], [44.0, 48.22], [49.0, 50.4], [52.0, 53.01], [56.0, 57.42], [60.0, 59.9], [64.0, 64.44], [65.0, 65.7], [67.0, 71.98], [75.0, 76.0], [80.0, 81.35], [86.0, 87.52], [90.0, 92.77], [93.0, 93.99], [95.0, 96.48], [98.0, 100.06], [105.0, 107.1], [109.0, 110.19], [115.0, 115.37], [117.0, 116.99], [120.0, 121.86], [123.0, 127.01], [128.0, 128.78], [134.0, 135.73], [138.0, 138.86], [141.0, 148.56], [152.0, 154.79], [156.0, 160.3], [165.0, 166.33], [168.0, 169.15], [170.0, 172.12], [174.0, 174.65], [177.0, 177.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 90.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.87, 0.0, 0.0, 0.0, 96.54, 0.0, 0.0, 41.38, 43.38, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 87.55, 82.25, 89.01, 0.0, 0.0, 70.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.55], ["sidetone", 12.38], ["radio", 7.4]], [["speech", 59.28], ["radio", 8.1], ["sidetone", 6.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 1.08, 0.61, 1.13, 0.6, 0.36, 1.24, 2.15, 4.22, 1.4, 1.01, 1.42, -0.1, 0.44, 0.7, 4.98, 1.0, 1.35, 1.52, 2.77, 0.99, 1.48, 2.06, 2.1, 1.19, 0.37, -0.01, 1.86, 4.01, 0.78, 1.73, 0.86, 7.56, 2.79, 4.3, 1.33, 1.15, 2.12, 0.65, 0.23]} \ No newline at end of file diff --git a/annotations_1/WoN5cCs0l2M_filtered.json b/annotations_1/WoN5cCs0l2M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bc5de335d9f85539148c3e8e0d5cbff3130b6eb --- /dev/null +++ b/annotations_1/WoN5cCs0l2M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.73], [9.0, 10.39], [14.0, 14.72], [15.0, 18.27], [19.0, 20.63], [21.0, 21.91], [24.0, 26.11], [28.0, 32.37], [33.0, 33.91], [35.0, 35.29], [40.0, 41.32], [43.0, 43.53], [49.0, 53.16], [54.0, 55.56], [56.0, 63.31], [68.0, 68.52], [84.0, 85.73], [86.0, 90.49], [93.0, 96.55], [97.0, 98.15], [108.0, 108.19], [110.0, 110.93], [112.0, 112.99], [114.0, 115.57], [123.0, 123.77], [132.0, 132.49], [133.0, 132.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 63.64, 89.01, 0.0, 0.0, 0.0, 0.0, 83.16, 0.0, 50.91, 0.0, 0.0, 57.89, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 1.39, 0.72, 3.27, 1.63, 0.91, 2.11, 4.37, 0.91, 0.29, 1.32, 0.53, 4.16, 1.56, 7.31, 0.52, 1.73, 4.49, 3.55, 1.15, 0.19, 0.93, 0.99, 1.57, 0.77, 0.49, -0.37]} \ No newline at end of file diff --git a/annotations_1/Wq8gxNsz9ZQ_filtered.json b/annotations_1/Wq8gxNsz9ZQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cb045d47bc735718e7b35ea5e28b6027cc4d0f5 --- /dev/null +++ b/annotations_1/Wq8gxNsz9ZQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 22.84], [26.0, 27.09], [30.0, 33.44], [35.0, 35.45], [37.0, 40.51], [55.0, 55.36], [58.0, 60.57], [84.0, 84.3], [86.0, 87.59], [94.0, 93.72], [101.0, 100.95]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [33.31, 0.0, 32.17, 0.0, 33.56, 0.0, 48.78, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["boing", 35.02], ["speech", 14.62], ["fly, housefly", 12.16]], null, [["speech", 44.67], ["whale vocalization", 24.64], ["sidetone", 5.11]], null, [["boing", 35.05], ["moo", 6.06], ["livestock, farm animals, working animals", 5.07]], null, [["music", 61.99], ["percussion", 13.02], ["drum", 4.85]], null, null, null, null], "duration": [3.84, 1.09, 3.44, 0.45, 3.51, 0.36, 2.57, 0.3, 1.59, -0.28, -0.05]} \ No newline at end of file diff --git a/annotations_1/WqWefwlmFmI_filtered.json b/annotations_1/WqWefwlmFmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..509d014e0aa2a4d8a5442f9746cf9d1cfa24c95a --- /dev/null +++ b/annotations_1/WqWefwlmFmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.7], [13.0, 12.73], [13.0, 13.71], [14.0, 41.91], [43.0, 48.96], [50.0, 77.23], [84.0, 84.69], [85.0, 88.92], [91.0, 119.5], [120.0, 125.2]], "keep_status": [true, false, false, true, false, true, false, true, false, true], "silence_prob": [43.35, 0.0, 0.0, 46.22, 91.64, 35.5, 0.0, 31.91, 31.95, 41.42], "audiomae_on_audioset": [[["speech", 27.97], ["theremin", 24.96], ["music", 14.58]], null, null, [["music", 46.25], ["hum", 4.0], ["mains hum", 3.36]], null, [["music", 51.67], ["speech", 7.81], ["singing bowl", 4.47]], null, [["music", 28.08], ["boing", 18.48], ["effects unit", 11.26]], [["music", 64.43], ["boing", 6.88], ["cacophony", 4.67]], [["music", 49.12], ["effects unit", 9.23], ["synthesizer", 8.33]]], "duration": [9.7, -0.27, 0.71, 27.91, 5.96, 27.23, 0.69, 3.92, 28.5, 5.2]} \ No newline at end of file diff --git a/annotations_1/WrY9UuucSUs_filtered.json b/annotations_1/WrY9UuucSUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e29f6e9a4c5f2a1672ace696f9926fb0f02f475c --- /dev/null +++ b/annotations_1/WrY9UuucSUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.11], [15.0, 15.85], [28.0, 28.98], [31.0, 32.22], [35.0, 35.46], [36.0, 39.82], [52.0, 63.41], [65.0, 68.25], [68.0, 68.37], [68.0, 71.96], [78.0, 83.61], [84.0, 84.13], [86.0, 86.48], [89.0, 90.22], [93.0, 93.36], [95.0, 129.2]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.21, 34.74, 33.36, 0.0, 32.84, 30.77, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["whack, thwack", 31.68], ["cattle, bovinae", 11.06], ["fly, housefly", 7.14]], [["music", 62.58], ["throbbing", 13.27], ["hum", 4.9]], [["music", 76.64], ["synthesizer", 3.25], ["musical instrument", 2.83]], null, [["music", 49.14], ["speech", 26.1], ["sidetone", 4.98]], [["music", 57.63], ["speech", 9.78], ["synthesizer", 7.89]], null, null, null, null, null], "duration": [0.11, 0.85, 0.98, 1.22, 0.46, 3.82, 11.41, 3.25, 0.37, 3.96, 5.61, 0.13, 0.48, 1.22, 0.36, 34.2]} \ No newline at end of file diff --git a/annotations_1/WrZN5ouSodc_filtered.json b/annotations_1/WrZN5ouSodc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d27c17dfdea0e7ba7b0801366b578210cbcd624d --- /dev/null +++ b/annotations_1/WrZN5ouSodc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [3.0, 4.02], [6.0, 7.86], [12.0, 31.97], [35.0, 53.72], [54.0, 53.76], [54.0, 58.01], [61.0, 61.37], [62.0, 66.68], [67.0, 81.03], [87.0, 91.71], [95.0, 95.98], [99.0, 109.81], [112.0, 118.76], [121.0, 154.9], [155.0, 154.94], [158.0, 165.3]], "keep_status": [false, false, false, true, false, false, true, false, true, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 39.89, 45.02, 0.0, 41.91, 0.0, 34.02, 33.68, 48.31, 0.0, 41.83, 35.35, 0.0, 0.0, 43.53], "audiomae_on_audioset": [null, null, null, [["hum", 27.04], ["mains hum", 12.55], ["music", 11.73]], [["music", 50.65], ["hum", 13.94], ["throbbing", 11.62]], null, [["music", 28.14], ["mains hum", 16.05], ["hum", 12.66]], null, [["music", 38.83], ["breaking", 19.23], ["speech", 7.05]], [["didgeridoo", 33.38], ["music", 29.85], ["speech", 8.61]], [["throbbing", 16.09], ["speech", 14.84], ["hum", 13.62]], null, [["music", 40.39], ["hum", 15.3], ["mains hum", 14.49]], [["throbbing", 30.71], ["hum", 25.43], ["speech", 18.22]], null, null, [["music", 30.82], ["hum", 12.38], ["mains hum", 6.44]]], "duration": [0.81, 1.02, 1.86, 19.97, 18.72, -0.24, 4.01, 0.37, 4.68, 14.03, 4.71, 0.98, 10.81, 6.76, 33.9, -0.06, 7.3]} \ No newline at end of file diff --git a/annotations_1/Wrb8nkLKkxU_filtered.json b/annotations_1/Wrb8nkLKkxU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8880294e4d024615b6a1ce7038fe5da86bcb44d4 --- /dev/null +++ b/annotations_1/Wrb8nkLKkxU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.84], [13.0, 27.3], [36.0, 36.95], [39.0, 39.66]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 47.35, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 33.07], ["mains hum", 13.19], ["throbbing", 10.04]], null, null], "duration": [1.84, 14.3, 0.95, 0.66]} \ No newline at end of file diff --git a/annotations_1/WsHqQAfZvc4_filtered.json b/annotations_1/WsHqQAfZvc4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7f968057e1c98c3532c81ff5ef2373f4d2cfbe4 --- /dev/null +++ b/annotations_1/WsHqQAfZvc4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.84], [17.0, 29.73], [32.0, 47.29], [49.0, 70.77], [72.0, 99.93], [101.0, 102.09], [104.0, 115.28], [123.0, 128.19], [134.0, 153.15]], "keep_status": [false, false, true, true, true, false, true, false, false], "silence_prob": [0.0, 32.27, 31.62, 31.48, 32.17, 0.0, 30.77, 30.82, 31.71], "audiomae_on_audioset": [null, [["music", 60.47], ["speech", 18.19], ["fart", 6.65]], [["music", 25.85], ["speech", 12.65], ["fart", 11.24]], [["livestock, farm animals, working animals", 25.58], ["music", 21.07], ["cattle, bovinae", 13.37]], [["music", 23.18], ["mosquito", 22.39], ["fly, housefly", 16.48]], null, [["music", 35.25], ["throbbing", 16.69], ["livestock, farm animals, working animals", 4.32]], [["music", 51.53], ["speech", 19.97], ["didgeridoo", 2.4]], [["music", 44.3], ["throbbing", 19.17], ["quack", 18.7]]], "duration": [0.84, 12.73, 15.29, 21.77, 27.93, 1.09, 11.28, 5.19, 19.15]} \ No newline at end of file diff --git a/annotations_1/WsaXEsBV6b4_filtered.json b/annotations_1/WsaXEsBV6b4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b5068716d83b1bbc83e64d0c79591af7445a4ac --- /dev/null +++ b/annotations_1/WsaXEsBV6b4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.27], [7.0, 8.13], [11.0, 11.08], [12.0, 12.55], [19.0, 19.14], [23.0, 24.93], [26.0, 27.38], [33.0, 33.67], [35.0, 35.46], [37.0, 37.62], [43.0, 43.82], [48.0, 48.47], [52.0, 52.22], [53.0, 53.62], [55.0, 54.97], [59.0, 59.58], [61.0, 61.13], [63.0, 63.58], [66.0, 66.31], [69.0, 68.89], [72.0, 72.27], [74.0, 74.56], [75.0, 76.25], [79.0, 78.88], [81.0, 81.21], [91.0, 91.86], [98.0, 101.34], [102.0, 102.46], [104.0, 104.13], [106.0, 105.8], [108.0, 108.43], [112.0, 112.35], [125.0, 125.05], [125.0, 125.81], [126.0, 126.76], [127.0, 127.65], [129.0, 131.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 1.13, 0.08, 0.55, 0.14, 1.93, 1.38, 0.67, 0.46, 0.62, 0.82, 0.47, 0.22, 0.62, -0.03, 0.58, 0.13, 0.58, 0.31, -0.11, 0.27, 0.56, 1.25, -0.12, 0.21, 0.86, 3.34, 0.46, 0.13, -0.2, 0.43, 0.35, 0.05, 0.81, 0.76, 0.65, 2.77]} \ No newline at end of file diff --git a/annotations_1/WsffSfKc-mw_filtered.json b/annotations_1/WsffSfKc-mw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c59f4774d75bda80bb9159f161342d5ee2e96aef --- /dev/null +++ b/annotations_1/WsffSfKc-mw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.33], [11.0, 11.8], [13.0, 33.08], [35.0, 41.5], [42.0, 42.8], [51.0, 52.32], [69.0, 69.01], [69.0, 74.09], [85.0, 90.07], [92.0, 92.58], [96.0, 95.91], [96.0, 96.03], [98.0, 98.73], [99.0, 100.74], [102.0, 102.15], [110.0, 115.11], [126.0, 128.75]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 37.86, 29.91, 0.0, 0.0, 0.0, 34.4, 32.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.85, 44.87], "audiomae_on_audioset": [null, null, [["music", 54.74], ["speech", 6.67], ["musical instrument", 3.49]], [["wail, moan", 38.78], ["crying, sobbing", 13.78], ["speech", 10.72]], null, null, null, [["moo", 30.83], ["speech", 29.7], ["cattle, bovinae", 17.33]], [["speech", 43.54], ["music", 19.07], ["thump, thud", 11.91]], null, null, null, null, null, null, [["speech", 27.2], ["fart", 13.25], ["music", 10.84]], [["speech", 44.71], ["hum", 3.83], ["heart sounds, heartbeat", 3.2]]], "duration": [1.33, 0.8, 20.08, 6.5, 0.8, 1.32, 0.01, 5.09, 5.07, 0.58, -0.09, 0.03, 0.73, 1.74, 0.15, 5.11, 2.75]} \ No newline at end of file diff --git a/annotations_1/WsgkiKu7AO8_filtered.json b/annotations_1/WsgkiKu7AO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b9a6b7dc48247288665b0fdda8a4e5f4a524fe6 --- /dev/null +++ b/annotations_1/WsgkiKu7AO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.33], [38.0, 41.47], [44.0, 46.11], [50.0, 49.96], [50.0, 50.58], [51.0, 53.79], [54.0, 55.02], [55.0, 65.04], [73.0, 74.28], [76.0, 76.74], [77.0, 77.57], [78.0, 86.81], [89.0, 96.72], [102.0, 103.25], [104.0, 105.12], [126.0, 127.35], [128.0, 133.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [99.92, 60.6, 100.0, 0.0, 0.0, 90.43, 0.0, 77.7, 0.0, 0.0, 0.0, 65.55, 32.16, 0.0, 0.0, 0.0, 67.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.92], ["didgeridoo", 11.39], ["theremin", 8.25]], null, null, null, null], "duration": [2.33, 3.47, 2.11, -0.04, 0.58, 2.79, 1.02, 10.04, 1.28, 0.74, 0.57, 8.81, 7.72, 1.25, 1.12, 1.35, 5.57]} \ No newline at end of file diff --git a/annotations_1/Wuer3mLqIxc_filtered.json b/annotations_1/Wuer3mLqIxc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32fbfdbf7549cf206fc69edaec509f8d2891c580 --- /dev/null +++ b/annotations_1/Wuer3mLqIxc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 16.01], [17.0, 20.63], [26.0, 26.5], [30.0, 30.33], [33.0, 37.57], [38.0, 38.3], [39.0, 39.9], [40.0, 41.28], [44.0, 45.3], [47.0, 55.88], [57.0, 57.27], [62.0, 62.38], [72.0, 72.4], [93.0, 93.88], [98.0, 99.69], [107.0, 107.6], [115.0, 121.24], [129.0, 129.79], [133.0, 133.17], [141.0, 143.06], [149.0, 151.36], [183.0, 182.98], [185.0, 185.21], [187.0, 193.01], [194.0, 201.53], [216.0, 217.32], [220.0, 221.12]], "keep_status": [true, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false], "silence_prob": [29.11, 29.22, 0.0, 0.0, 30.77, 0.0, 0.0, 0.0, 0.0, 31.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.11, 0.0, 0.0, 30.94, 30.03, 0.0, 0.0, 31.17, 29.7, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.16], ["theremin", 11.72], ["vehicle", 9.01]], [["speech", 25.56], ["foghorn", 22.34], ["vehicle", 13.47]], null, null, [["music", 52.04], ["speech", 10.65], ["quack", 7.13]], null, null, null, null, [["music", 36.82], ["brass instrument", 11.87], ["trombone", 10.54]], null, null, null, null, null, null, [["music", 71.91], ["musical instrument", 9.17], ["trombone", 4.64]], null, null, [["speech", 37.84], ["music", 16.53], ["foghorn", 4.69]], [["music", 33.84], ["trombone", 6.45], ["foghorn", 5.75]], null, null, [["speech", 49.72], ["music", 16.42], ["didgeridoo", 7.46]], [["speech", 35.39], ["cattle, bovinae", 10.59], ["moo", 7.28]], null, null], "duration": [8.01, 3.63, 0.5, 0.33, 4.57, 0.3, 0.9, 1.28, 1.3, 8.88, 0.27, 0.38, 0.4, 0.88, 1.69, 0.6, 6.24, 0.79, 0.17, 2.06, 2.36, -0.02, 0.21, 6.01, 7.53, 1.32, 1.12]} \ No newline at end of file diff --git a/annotations_1/Wurqpe5tNjA_filtered.json b/annotations_1/Wurqpe5tNjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d9e4c19451782b38e5bfd883252a5ec775d3b5a --- /dev/null +++ b/annotations_1/Wurqpe5tNjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.19], [9.0, 12.02], [14.0, 14.4], [15.0, 15.7], [16.0, 16.88], [25.0, 26.72], [30.0, 31.83], [34.0, 34.43], [35.0, 36.53], [40.0, 40.91], [42.0, 43.53], [45.0, 47.98], [49.0, 53.82], [54.0, 55.34], [57.0, 60.22], [61.0, 64.34], [66.0, 74.17], [87.0, 87.47], [90.0, 90.58], [92.0, 93.5], [95.0, 96.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.1, 52.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 54.17, 0.0, 55.6, 85.9, 52.33, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.19, 3.02, 0.4, 0.7, 0.88, 1.72, 1.83, 0.43, 1.53, 0.91, 1.53, 2.98, 4.82, 1.34, 3.22, 3.34, 8.17, 0.47, 0.58, 1.5, 1.5]} \ No newline at end of file diff --git a/annotations_1/Wv07oUFHGRQ_filtered.json b/annotations_1/Wv07oUFHGRQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8d29baf6976e056df3127e5e05081a46a2ca907 --- /dev/null +++ b/annotations_1/Wv07oUFHGRQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [9.0, 14.03], [16.0, 16.83], [24.0, 24.22], [27.0, 27.31], [30.0, 30.75], [34.0, 36.19], [38.0, 38.43], [40.0, 40.47], [44.0, 43.85], [49.0, 49.65], [51.0, 51.09], [60.0, 60.42], [62.0, 66.34], [68.0, 71.0], [71.0, 72.18], [76.0, 80.97], [90.0, 90.91], [93.0, 93.6], [97.0, 97.19], [105.0, 104.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 82.07, 0.0, 91.3, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 5.03, 0.83, 0.22, 0.31, 0.75, 2.19, 0.43, 0.47, -0.15, 0.65, 0.09, 0.42, 4.34, 3.0, 1.18, 4.97, 0.91, 0.6, 0.19, -0.42]} \ No newline at end of file diff --git a/annotations_1/WxIgfDZXS4k_filtered.json b/annotations_1/WxIgfDZXS4k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e9bf59ecd1d842ce463c963ca2aa2cdd5dd4b2e --- /dev/null +++ b/annotations_1/WxIgfDZXS4k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 35.48], [36.0, 45.1], [46.0, 47.82], [49.0, 51.12], [52.0, 53.52], [54.0, 56.51], [57.0, 92.52], [98.0, 149.55], [150.0, 150.13], [152.0, 151.93], [152.0, 153.94], [154.0, 155.29], [156.0, 156.76], [159.0, 159.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 94.22, 0.0, 97.73, 0.0, 88.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.48, 9.1, 1.82, 2.12, 1.52, 2.51, 35.52, 51.55, 0.13, -0.07, 1.94, 1.29, 0.76, 0.71]} \ No newline at end of file diff --git a/annotations_1/Wy4EfdnMZ5g_filtered.json b/annotations_1/Wy4EfdnMZ5g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f07587579f091e0284bbcbde02b276af4cbfe4dd --- /dev/null +++ b/annotations_1/Wy4EfdnMZ5g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.78], [7.0, 9.63], [11.0, 12.02], [13.0, 13.81], [15.0, 15.47], [16.0, 19.9], [21.0, 23.25], [27.0, 29.32], [30.0, 31.4], [35.0, 34.87], [36.0, 37.71], [41.0, 43.12], [45.0, 47.26], [50.0, 51.58], [54.0, 59.53], [61.0, 61.99], [62.0, 63.07], [68.0, 68.99], [70.0, 83.32], [84.0, 88.11], [90.0, 92.45], [94.0, 95.61], [97.0, 99.17], [100.0, 101.56], [102.0, 103.4], [104.0, 105.11], [108.0, 108.99], [109.0, 111.92], [112.0, 114.34], [115.0, 118.13], [118.0, 121.39], [122.0, 124.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [80.46, 85.54, 0.0, 0.0, 0.0, 99.73, 92.48, 99.78, 0.0, 0.0, 0.0, 94.81, 95.64, 0.0, 99.4, 0.0, 0.0, 0.0, 94.81, 99.73, 97.54, 0.0, 94.81, 0.0, 0.0, 0.0, 0.0, 90.6, 58.22, 99.76, 62.58, 99.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.78, 2.63, 1.02, 0.81, 0.47, 3.9, 2.25, 2.32, 1.4, -0.13, 1.71, 2.12, 2.26, 1.58, 5.53, 0.99, 1.07, 0.99, 13.32, 4.11, 2.45, 1.61, 2.17, 1.56, 1.4, 1.11, 0.99, 2.92, 2.34, 3.13, 3.39, 2.26]} \ No newline at end of file diff --git a/annotations_1/WygmbuU_78c_filtered.json b/annotations_1/WygmbuU_78c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f0ce6af7513dec116eca79d92516ae624f0a391 --- /dev/null +++ b/annotations_1/WygmbuU_78c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[79.0, 83.78], [87.0, 112.99], [114.0, 123.11], [125.0, 149.44]], "keep_status": [true, true, false, true], "silence_prob": [28.49, 28.36, 28.08, 28.37], "audiomae_on_audioset": [[["speech", 33.47], ["field recording", 10.74], ["throbbing", 8.22]], [["hum", 22.37], ["music", 18.05], ["speech", 16.66]], [["hum", 52.25], ["throbbing", 16.81], ["mains hum", 12.61]], [["music", 34.12], ["hum", 10.51], ["throbbing", 10.16]]], "duration": [4.78, 25.99, 9.11, 24.44]} \ No newline at end of file diff --git a/annotations_1/WzAHXnFWd5U_filtered.json b/annotations_1/WzAHXnFWd5U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eae190fe40a4bc509fdaa64bc4e905ffcf8d0b99 --- /dev/null +++ b/annotations_1/WzAHXnFWd5U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 12.09], [16.0, 30.0], [35.0, 39.65], [42.0, 74.12], [76.0, 76.59], [78.0, 77.84], [78.0, 79.52], [85.0, 87.56]], "keep_status": [false, true, false, false, false, false, false, true], "silence_prob": [35.12, 37.33, 35.61, 0.0, 0.0, 0.0, 0.0, 32.91], "audiomae_on_audioset": [[["music", 73.23], ["throbbing", 4.0], ["hum", 3.52]], [["music", 28.4], ["speech", 14.27], ["hum", 8.4]], [["music", 82.25], ["speech", 5.95], ["drum machine", 4.25]], null, null, null, null, [["music", 30.75], ["speech", 13.06], ["boing", 8.22]]], "duration": [7.09, 14.0, 4.65, 32.12, 0.59, -0.16, 1.52, 2.56]} \ No newline at end of file diff --git a/annotations_1/X-VYaCvJwxY_filtered.json b/annotations_1/X-VYaCvJwxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef587757b19b1e1033b3b5e1f3ef2c75ab9fec03 --- /dev/null +++ b/annotations_1/X-VYaCvJwxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 50.7], [54.0, 91.25], [99.0, 106.25], [107.0, 107.84], [109.0, 111.28], [114.0, 116.92], [122.0, 122.96], [125.0, 126.06], [128.0, 127.57], [132.0, 133.42], [135.0, 135.21], [136.0, 141.25], [146.0, 146.01], [147.0, 150.82], [153.0, 154.72], [155.0, 161.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [66.76, 0.0, 67.76, 0.0, 99.8, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 98.86, 0.0, 98.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.7, 37.25, 7.25, 0.84, 2.28, 2.92, 0.96, 1.06, -0.43, 1.42, 0.21, 5.25, 0.01, 3.82, 1.72, 6.28]} \ No newline at end of file diff --git a/annotations_1/X0d8qyjQ20M_filtered.json b/annotations_1/X0d8qyjQ20M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8338b423d7d1acb86c8066d080c82325d4fa3003 --- /dev/null +++ b/annotations_1/X0d8qyjQ20M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 35.87], [36.0, 37.03], [38.0, 54.78], [59.0, 59.56], [60.0, 69.26], [73.0, 76.6], [77.0, 77.58], [78.0, 87.03], [91.0, 99.66], [100.0, 100.99], [102.0, 103.08], [104.0, 106.78], [108.0, 110.24], [111.0, 125.17], [126.0, 126.5], [127.0, 127.79], [129.0, 130.05], [133.0, 133.91], [135.0, 136.71], [137.0, 139.55], [141.0, 141.59], [143.0, 143.77]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.26, 0.0, 29.81, 0.0, 36.83, 40.68, 0.0, 39.11, 72.9, 0.0, 0.0, 49.73, 75.39, 59.51, 0.0, 0.0, 0.0, 0.0, 0.0, 35.79, 0.0, 0.0], "audiomae_on_audioset": [[["music", 42.78], ["hum", 26.77], ["throbbing", 14.42]], null, [["throbbing", 24.76], ["hum", 22.47], ["music", 22.38]], null, [["music", 44.61], ["ambient music", 30.1], ["new-age music", 2.53]], [["music", 58.05], ["ambient music", 18.06], ["electronic music", 5.31]], null, [["music", 55.09], ["hum", 16.21], ["ambient music", 12.84]], null, null, null, [["speech", 16.72], ["mains hum", 12.99], ["bee, wasp, etc.", 10.08]], null, null, null, null, null, null, null, [["hum", 38.37], ["throbbing", 34.28], ["mains hum", 10.22]], null, null], "duration": [21.87, 1.03, 16.78, 0.56, 9.26, 3.6, 0.58, 9.03, 8.66, 0.99, 1.08, 2.78, 2.24, 14.17, 0.5, 0.79, 1.05, 0.91, 1.71, 2.55, 0.59, 0.77]} \ No newline at end of file diff --git a/annotations_1/X0uMMVqQgeY_filtered.json b/annotations_1/X0uMMVqQgeY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33908040d92fee1700c69e0966211139019e4df7 --- /dev/null +++ b/annotations_1/X0uMMVqQgeY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.38], [14.0, 26.06], [28.0, 29.37], [37.0, 41.98], [48.0, 55.27], [56.0, 55.93], [59.0, 59.34], [60.0, 79.17], [81.0, 83.56], [85.0, 86.73], [99.0, 99.89], [103.0, 104.53], [106.0, 113.09], [115.0, 121.31], [123.0, 127.16], [130.0, 146.1], [148.0, 150.85], [155.0, 156.74], [159.0, 170.82], [172.0, 198.31], [201.0, 215.81]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [38.72, 32.56, 0.0, 31.46, 32.61, 0.0, 0.0, 32.25, 32.81, 0.0, 0.0, 0.0, 37.72, 35.57, 32.97, 33.5, 32.84, 0.0, 31.92, 30.47, 30.7], "audiomae_on_audioset": [[["music", 27.55], ["synthesizer", 11.16], ["effects unit", 8.86]], [["music", 42.44], ["speech", 17.48], ["fart", 7.98]], null, [["music", 31.75], ["speech", 13.21], ["fly, housefly", 5.28]], [["music", 61.26], ["speech", 14.18], ["boing", 4.64]], null, null, [["speech", 48.55], ["music", 32.94], ["fart", 2.21]], [["music", 32.78], ["speech", 23.28], ["throbbing", 16.6]], null, null, null, [["music", 58.31], ["speech", 25.49], ["boing", 2.91]], [["speech", 43.35], ["music", 17.41], ["hum", 6.55]], [["music", 53.88], ["speech", 13.97], ["synthesizer", 5.98]], [["music", 60.45], ["speech", 10.75], ["timpani", 5.31]], [["music", 27.09], ["throbbing", 15.57], ["pulse", 6.61]], null, [["music", 71.88], ["electronic music", 2.76], ["drum machine", 2.74]], [["music", 83.46], ["speech", 5.29], ["throbbing", 2.57]], [["music", 71.23], ["drum", 3.19], ["percussion", 2.81]]], "duration": [3.38, 12.06, 1.37, 4.98, 7.27, -0.07, 0.34, 19.17, 2.56, 1.73, 0.89, 1.53, 7.09, 6.31, 4.16, 16.1, 2.85, 1.74, 11.82, 26.31, 14.81]} \ No newline at end of file diff --git a/annotations_1/X0vQQA32UAs_filtered.json b/annotations_1/X0vQQA32UAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92323d837cbbfe972b4d485ee28cb00c319569d9 --- /dev/null +++ b/annotations_1/X0vQQA32UAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.95], [9.0, 16.28], [18.0, 19.14], [23.0, 31.94], [33.0, 34.16], [38.0, 50.75], [54.0, 132.66]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 62.27, 0.0, 35.14, 0.0, 29.53, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 59.1], ["sidetone", 15.82], ["hum", 9.18]], null, [["music", 39.0], ["speech", 27.0], ["didgeridoo", 11.23]], null], "duration": [0.95, 7.28, 1.14, 8.94, 1.16, 12.75, 78.66]} \ No newline at end of file diff --git a/annotations_1/X1ByBEw-WxM_filtered.json b/annotations_1/X1ByBEw-WxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6222932d401c1b09deab69644ba8bdb376fe5de --- /dev/null +++ b/annotations_1/X1ByBEw-WxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.54], [23.0, 32.14], [38.0, 39.66], [45.0, 50.16], [62.0, 64.25], [66.0, 68.44], [69.0, 68.84], [76.0, 78.81], [81.0, 83.71], [87.0, 96.5], [105.0, 109.36], [114.0, 125.64], [128.0, 131.08], [134.0, 140.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 64.29, 0.0, 77.53, 43.33, 79.07, 0.0, 82.97, 93.45, 30.91, 41.28, 93.76, 99.88, 50.61], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 69.8], ["sine wave", 8.12], ["speech", 6.77]], null, null, null, null, [["speech", 74.13], ["thunk", 9.48], ["whack, thwack", 3.84]], [["speech", 75.84], ["busy signal", 6.9], ["sidetone", 6.31]], null, null, null], "duration": [1.54, 9.14, 1.66, 5.16, 2.25, 2.44, -0.16, 2.81, 2.71, 9.5, 4.36, 11.64, 3.08, 6.37]} \ No newline at end of file diff --git a/annotations_1/X1SJgm2hIAY_filtered.json b/annotations_1/X1SJgm2hIAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/X1SJgm2hIAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/X2X3DxFAFlQ_filtered.json b/annotations_1/X2X3DxFAFlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..783ff68df3e55d12ad811d57dacc89fb11e1dd94 --- /dev/null +++ b/annotations_1/X2X3DxFAFlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.62], [9.0, 9.27], [10.0, 10.17], [15.0, 16.33], [18.0, 18.67], [20.0, 22.17], [24.0, 26.16], [31.0, 33.51], [34.0, 36.32], [40.0, 40.32], [42.0, 44.51], [47.0, 47.88], [49.0, 49.71], [51.0, 54.92], [56.0, 59.75], [61.0, 62.56], [63.0, 63.54], [65.0, 67.61], [69.0, 70.77], [73.0, 74.61], [76.0, 76.13], [78.0, 79.22], [80.0, 81.85], [84.0, 85.14], [86.0, 87.25], [89.0, 89.33], [95.0, 96.6], [97.0, 98.42], [103.0, 104.73], [106.0, 108.82], [111.0, 111.35], [119.0, 119.64], [121.0, 123.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 70.02, 85.72, 57.89, 82.97, 0.0, 30.3, 0.0, 0.0, 31.18, 31.75, 0.0, 0.0, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.37, 0.0, 0.0, 53.04], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 23.89], ["cattle, bovinae", 13.89], ["livestock, farm animals, working animals", 12.21]], null, null, [["speech", 30.49], ["music", 26.22], ["noise", 6.52]], [["cattle, bovinae", 20.62], ["livestock, farm animals, working animals", 18.82], ["moo", 16.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.27, 0.17, 1.33, 0.67, 2.17, 2.16, 2.51, 2.32, 0.32, 2.51, 0.88, 0.71, 3.92, 3.75, 1.56, 0.54, 2.61, 1.77, 1.61, 0.13, 1.22, 1.85, 1.14, 1.25, 0.33, 1.6, 1.42, 1.73, 2.82, 0.35, 0.64, 2.31]} \ No newline at end of file diff --git a/annotations_1/X2YJECANG6A_filtered.json b/annotations_1/X2YJECANG6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/X2YJECANG6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/X36kqKTClAg_filtered.json b/annotations_1/X36kqKTClAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29b9c385e99ec247055e26acf657ce61980d652f --- /dev/null +++ b/annotations_1/X36kqKTClAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.7], [21.0, 20.73], [24.0, 25.57], [26.0, 26.38], [29.0, 30.15], [33.0, 33.15], [35.0, 35.67], [41.0, 41.82], [43.0, 45.25], [46.0, 48.34], [50.0, 50.55], [51.0, 51.56], [55.0, 56.52], [64.0, 65.4], [66.0, 67.27], [68.0, 67.91], [68.0, 69.89], [70.0, 70.93], [72.0, 72.33], [75.0, 75.68], [76.0, 85.48], [89.0, 89.02], [90.0, 91.5], [92.0, 93.14], [94.0, 95.45], [96.0, 103.27], [104.0, 105.54], [110.0, 110.79], [114.0, 115.18], [117.0, 117.8], [120.0, 121.07], [121.0, 136.41], [139.0, 146.5], [147.0, 148.19], [149.0, 150.2], [152.0, 152.46], [153.0, 154.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.07, 0.0, 0.0, 0.0, 0.0, 40.9, 0.0, 0.0, 0.0, 0.0, 0.0, 35.31, 32.73, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["rumble", 23.65], ["mains hum", 18.6], ["hum", 18.27]], null, null, null, null, [["sine wave", 32.48], ["chirp tone", 13.85], ["speech", 11.12]], null, null, null, null, null, [["speech", 28.89], ["hum", 15.09], ["music", 10.94]], [["music", 49.2], ["hum", 10.48], ["throbbing", 8.55]], null, null, null, null], "duration": [1.7, -0.27, 1.57, 0.38, 1.15, 0.15, 0.67, 0.82, 2.25, 2.34, 0.55, 0.56, 1.52, 1.4, 1.27, -0.09, 1.89, 0.93, 0.33, 0.68, 9.48, 0.02, 1.5, 1.14, 1.45, 7.27, 1.54, 0.79, 1.18, 0.8, 1.07, 15.41, 7.5, 1.19, 1.2, 0.46, 1.33]} \ No newline at end of file diff --git a/annotations_1/X3XwuyPljm4_filtered.json b/annotations_1/X3XwuyPljm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..672c7b1e72d10d7ca5e02090a27020c9c06c81c2 --- /dev/null +++ b/annotations_1/X3XwuyPljm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.78], [6.0, 6.61], [10.0, 11.99], [13.0, 16.12], [19.0, 20.85], [24.0, 24.11], [28.0, 28.24], [31.0, 31.24], [50.0, 51.56], [54.0, 55.66], [63.0, 63.1], [70.0, 76.52], [82.0, 83.02], [84.0, 86.09], [87.0, 87.79], [88.0, 91.54], [98.0, 98.36], [99.0, 99.84], [102.0, 103.2], [109.0, 110.29], [113.0, 112.63], [114.0, 114.69], [119.0, 119.11], [125.0, 125.27], [130.0, 136.27], [137.0, 140.12], [141.0, 141.32], [145.0, 145.1], [146.0, 146.79], [147.0, 148.12], [149.0, 149.84], [151.0, 155.53], [157.0, 160.96], [162.0, 162.99], [167.0, 169.3], [171.0, 172.79], [175.0, 175.09], [177.0, 178.58], [179.0, 182.9], [185.0, 186.14], [187.0, 187.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 67.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.64, 0.0, 80.64, 0.0, 77.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.91, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 44.75, 63.31, 0.0, 42.02, 0.0, 0.0, 0.0, 74.44, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 53.84], ["music", 5.51], ["thunk", 2.81]], null, null, [["beatboxing", 31.55], ["throat clearing", 19.93], ["speech", 9.08]], null, null, null, null, null, null], "duration": [0.78, 0.61, 1.99, 3.12, 1.85, 0.11, 0.24, 0.24, 1.56, 1.66, 0.1, 6.52, 1.02, 2.09, 0.79, 3.54, 0.36, 0.84, 1.2, 1.29, -0.37, 0.69, 0.11, 0.27, 6.27, 3.12, 0.32, 0.1, 0.79, 1.12, 0.84, 4.53, 3.96, 0.99, 2.3, 1.79, 0.09, 1.58, 3.9, 1.14, 0.44]} \ No newline at end of file diff --git a/annotations_1/X4JETt9w9Zw_filtered.json b/annotations_1/X4JETt9w9Zw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b80158b4cae2e3b80f88b9fcb2c417a4176314ba --- /dev/null +++ b/annotations_1/X4JETt9w9Zw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 53.05], [56.0, 57.0], [59.0, 59.9], [63.0, 113.43], [114.0, 114.94], [117.0, 134.3], [136.0, 136.09], [138.0, 138.38], [142.0, 143.83], [150.0, 149.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.96, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["livestock, farm animals, working animals", 44.77], ["cattle, bovinae", 23.84], ["moo", 14.48]], null, null, null, null], "duration": [47.05, 1.0, 0.9, 50.43, 0.94, 17.3, 0.09, 0.38, 1.83, -0.11]} \ No newline at end of file diff --git a/annotations_1/X4jdgckXC9I_filtered.json b/annotations_1/X4jdgckXC9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ce3fb71c967872f0d528cd07a516bc8446914e7 --- /dev/null +++ b/annotations_1/X4jdgckXC9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.77], [13.0, 15.67], [16.0, 21.29], [22.0, 25.68], [27.0, 42.7], [44.0, 45.49], [46.0, 47.21], [48.0, 55.54], [56.0, 56.96], [57.0, 58.5], [59.0, 69.87], [72.0, 72.39], [73.0, 73.95], [75.0, 82.46], [83.0, 84.92], [87.0, 90.27], [92.0, 91.96]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 99.95, 45.56, 98.8, 57.01, 0.0, 0.0, 81.71, 0.0, 0.0, 40.22, 0.0, 0.0, 31.68, 0.0, 51.99, 0.0], "audiomae_on_audioset": [null, null, [["speech", 50.39], ["sneeze", 5.66], ["hum", 4.84]], null, null, null, null, null, null, null, [["music", 36.3], ["speech", 22.02], ["theremin", 5.11]], null, null, [["music", 70.26], ["didgeridoo", 4.24], ["musical instrument", 3.69]], null, null, null], "duration": [1.77, 2.67, 5.29, 3.68, 15.7, 1.49, 1.21, 7.54, 0.96, 1.5, 10.87, 0.39, 0.95, 7.46, 1.92, 3.27, -0.04]} \ No newline at end of file diff --git a/annotations_1/X4lUmgN_ByQ_filtered.json b/annotations_1/X4lUmgN_ByQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..002393844b6ce1260331f772a3f55c7fba577d1c --- /dev/null +++ b/annotations_1/X4lUmgN_ByQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.49], [7.0, 7.13], [8.0, 8.07], [10.0, 10.08], [10.0, 12.18], [16.0, 16.04], [18.0, 23.21], [23.0, 36.63], [37.0, 38.72], [52.0, 55.34], [57.0, 60.22], [66.0, 91.44], [92.0, 97.21], [98.0, 101.43], [103.0, 103.3], [105.0, 109.32], [109.0, 109.54], [111.0, 155.16], [156.0, 156.51], [157.0, 182.06], [182.0, 182.73], [185.0, 185.43], [187.0, 190.38], [193.0, 205.36], [206.0, 206.74], [208.0, 226.93], [228.0, 229.09]], "keep_status": [false, false, false, false, true, false, false, false, false, true, true, false, true, true, false, true, false, false, false, false, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.97, 0.0, 29.24, 29.64, 0.0, 35.26, 30.61, 29.65, 30.02, 31.32, 0.0, 30.07, 0.0, 0.0, 0.0, 30.77, 0.0, 0.0, 30.46, 29.84, 0.0, 29.61, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 52.64], ["whimper", 3.98], ["oink", 2.67]], null, [["speech", 65.22], ["music", 11.59], ["hubbub, speech noise, speech babble", 1.41]], [["livestock, farm animals, working animals", 51.46], ["cattle, bovinae", 28.36], ["moo", 16.83]], null, [["hum", 26.89], ["music", 22.25], ["throbbing", 14.87]], [["music", 38.14], ["speech", 20.81], ["hum", 6.91]], [["music", 44.03], ["speech", 35.56], ["buzz", 2.19]], [["music", 28.95], ["groan", 19.09], ["throbbing", 8.62]], [["music", 31.16], ["speech", 21.58], ["hum", 5.62]], null, [["music", 42.19], ["didgeridoo", 18.84], ["theremin", 7.87]], null, null, null, [["music", 52.61], ["hum", 17.59], ["throbbing", 7.13]], null, null, [["music", 31.98], ["mains hum", 16.85], ["hum", 8.7]], [["hum", 13.97], ["music", 13.39], ["mains hum", 11.53]], null, [["music", 35.55], ["livestock, farm animals, working animals", 7.85], ["hum", 6.78]], null], "duration": [0.49, 0.13, 0.07, 0.08, 2.18, 0.04, 5.21, 13.63, 1.72, 3.34, 3.22, 25.44, 5.21, 3.43, 0.3, 4.32, 0.54, 44.16, 0.51, 25.06, 0.73, 0.43, 3.38, 12.36, 0.74, 18.93, 1.09]} \ No newline at end of file diff --git a/annotations_1/X5_GpmLuea4_filtered.json b/annotations_1/X5_GpmLuea4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1deb9056d9a72b17ff815cb5444044958ca6dd48 --- /dev/null +++ b/annotations_1/X5_GpmLuea4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 34.91], [36.0, 72.81], [75.0, 88.18]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 46.54], "audiomae_on_audioset": [null, null, [["music", 70.44], ["flamenco", 6.98], ["tap", 3.72]]], "duration": [34.91, 36.81, 13.18]} \ No newline at end of file diff --git a/annotations_1/X5dtBoyZ33o_filtered.json b/annotations_1/X5dtBoyZ33o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70fbad470ad759630ae8e6a1406a71d5995bca93 --- /dev/null +++ b/annotations_1/X5dtBoyZ33o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [10.0, 44.95], [45.0, 45.08], [45.0, 45.22], [45.0, 52.29], [55.0, 59.53], [62.0, 62.55], [66.0, 82.83], [84.0, 84.64], [88.0, 93.58], [96.0, 98.71], [101.0, 104.92], [105.0, 104.97], [107.0, 115.32], [116.0, 118.83], [121.0, 123.75], [125.0, 131.55], [138.0, 146.6], [153.0, 164.73]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.79, 31.51, 0.0, 32.26, 0.0, 31.88, 32.84, 31.29, 0.0, 31.86, 35.0, 31.04, 32.5, 31.59, 32.69], "audiomae_on_audioset": [null, null, null, null, [["cattle, bovinae", 43.0], ["livestock, farm animals, working animals", 25.2], ["moo", 23.36]], [["moo", 44.03], ["cattle, bovinae", 27.6], ["livestock, farm animals, working animals", 17.31]], null, [["music", 66.84], ["didgeridoo", 4.99], ["cattle, bovinae", 2.43]], null, [["music", 30.13], ["theremin", 13.36], ["didgeridoo", 4.73]], [["moo", 52.86], ["cattle, bovinae", 27.85], ["livestock, farm animals, working animals", 10.99]], [["cattle, bovinae", 33.7], ["livestock, farm animals, working animals", 28.92], ["moo", 24.34]], null, [["music", 40.66], ["theremin", 16.99], ["speech", 7.2]], [["moo", 41.35], ["cattle, bovinae", 31.0], ["livestock, farm animals, working animals", 15.07]], [["music", 35.0], ["theremin", 26.61], ["boing", 5.34]], [["music", 25.99], ["moo", 10.62], ["cattle, bovinae", 8.97]], [["boing", 46.81], ["music", 28.16], ["whale vocalization", 3.88]], [["music", 27.36], ["speech", 21.0], ["moo", 10.76]]], "duration": [0.35, 34.95, 0.08, 0.22, 7.29, 4.53, 0.55, 16.83, 0.64, 5.58, 2.71, 3.92, -0.03, 8.32, 2.83, 2.75, 6.55, 8.6, 11.73]} \ No newline at end of file diff --git a/annotations_1/X67GWsa_NNM_filtered.json b/annotations_1/X67GWsa_NNM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cd2627c31a61185e0a123d56fcbfeba031fb410 --- /dev/null +++ b/annotations_1/X67GWsa_NNM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.92], [9.0, 10.98], [14.0, 20.58], [24.0, 25.64], [27.0, 28.8], [34.0, 55.68], [58.0, 64.44], [71.0, 74.71], [80.0, 80.7], [81.0, 104.33], [106.0, 111.08], [113.0, 115.1], [119.0, 119.55], [121.0, 123.94]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [36.61, 0.0, 34.08, 0.0, 0.0, 35.68, 33.32, 29.84, 0.0, 33.63, 39.52, 48.02, 0.0, 43.3], "audiomae_on_audioset": [[["music", 21.43], ["synthesizer", 9.89], ["gong", 7.76]], null, [["hum", 57.26], ["music", 12.5], ["mains hum", 11.76]], null, null, [["mains hum", 52.34], ["hum", 38.94], ["throbbing", 2.35]], [["music", 63.91], ["hum", 10.26], ["mains hum", 7.91]], [["music", 34.74], ["didgeridoo", 26.18], ["speech", 23.39]], null, [["throbbing", 14.36], ["hum", 13.76], ["speech", 11.45]], [["didgeridoo", 39.74], ["music", 30.25], ["singing bowl", 15.0]], [["music", 46.66], ["singing bowl", 17.82], ["didgeridoo", 6.56]], null, [["music", 55.75], ["didgeridoo", 10.21], ["musical instrument", 5.82]]], "duration": [2.92, 1.98, 6.58, 1.64, 1.8, 21.68, 6.44, 3.71, 0.7, 23.33, 5.08, 2.1, 0.55, 2.94]} \ No newline at end of file diff --git a/annotations_1/X6keMEfkZok_filtered.json b/annotations_1/X6keMEfkZok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53606e4f0f34e6fffb8041e5c2ba2cf8f5934051 --- /dev/null +++ b/annotations_1/X6keMEfkZok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.51], [5.0, 9.54], [10.0, 10.88], [12.0, 28.27], [29.0, 30.47], [35.0, 46.38], [48.0, 51.63], [52.0, 58.06], [60.0, 60.59], [62.0, 62.99], [63.0, 63.48], [64.0, 65.4], [66.0, 68.91], [73.0, 74.93], [78.0, 84.74], [85.0, 85.95], [88.0, 89.48], [91.0, 90.91], [93.0, 92.96], [93.0, 94.56], [107.0, 108.51], [113.0, 113.93], [116.0, 128.61], [129.0, 129.29], [129.0, 130.08], [136.0, 136.81], [139.0, 162.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 99.82, 0.0, 99.99, 0.0, 100.0, 99.99, 99.99, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.95, 0.0, 0.0, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.51, 4.54, 0.88, 16.27, 1.47, 11.38, 3.63, 6.06, 0.59, 0.99, 0.48, 1.4, 2.91, 1.93, 6.74, 0.95, 1.48, -0.09, -0.04, 1.56, 1.51, 0.93, 12.61, 0.29, 1.08, 0.81, 23.89]} \ No newline at end of file diff --git a/annotations_1/X6zbmAt0YwI_filtered.json b/annotations_1/X6zbmAt0YwI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db771e4e4fd35711633c7618e5b1a99f1a295647 --- /dev/null +++ b/annotations_1/X6zbmAt0YwI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 38.08], [40.0, 47.34], [52.0, 58.31], [60.0, 60.47], [63.0, 65.04], [67.0, 68.18], [71.0, 71.98], [73.0, 74.53], [77.0, 78.63], [87.0, 89.29], [90.0, 91.76], [93.0, 95.81], [97.0, 106.42], [109.0, 109.54]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.21, 34.82, 36.78, 0.0, 75.23, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 92.15, 59.24, 0.0], "audiomae_on_audioset": [[["music", 28.96], ["speech", 23.75], ["radio", 10.15]], [["music", 26.37], ["speech", 22.23], ["clarinet", 15.13]], [["music", 42.02], ["didgeridoo", 23.45], ["speech", 6.12]], null, null, null, null, null, null, null, null, null, null, null], "duration": [5.08, 7.34, 6.31, 0.47, 2.04, 1.18, 0.98, 1.53, 1.63, 2.29, 1.76, 2.81, 9.42, 0.54]} \ No newline at end of file diff --git a/annotations_1/X8qBorenkn8_filtered.json b/annotations_1/X8qBorenkn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e34eda7229d46a8c6a50ad3fb2d0e5fc4257ee5 --- /dev/null +++ b/annotations_1/X8qBorenkn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.02], [11.0, 11.08], [12.0, 23.7], [25.0, 31.5], [32.0, 36.95], [38.0, 39.6], [43.0, 46.11], [47.0, 48.27], [53.0, 54.26], [55.0, 55.51], [56.0, 57.33], [59.0, 69.94]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [37.05, 0.0, 40.7, 69.74, 51.88, 0.0, 40.29, 0.0, 0.0, 0.0, 0.0, 32.83], "audiomae_on_audioset": [[["cattle, bovinae", 53.39], ["moo", 33.6], ["livestock, farm animals, working animals", 6.01]], null, [["animal", 18.54], ["horse", 14.43], ["livestock, farm animals, working animals", 9.92]], null, null, null, [["music", 47.44], ["theremin", 7.77], ["didgeridoo", 4.93]], null, null, null, null, [["music", 50.0], ["didgeridoo", 16.38], ["musical instrument", 6.26]]], "duration": [2.02, 0.08, 11.7, 6.5, 4.95, 1.6, 3.11, 1.27, 1.26, 0.51, 1.33, 10.94]} \ No newline at end of file diff --git a/annotations_1/X8w0J4y5X4g_filtered.json b/annotations_1/X8w0J4y5X4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87c796878456ac628d5d87f9dfa8a9562c32c5e1 --- /dev/null +++ b/annotations_1/X8w0J4y5X4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.09], [15.0, 15.08], [17.0, 19.08], [22.0, 25.41], [28.0, 28.7], [33.0, 32.75], [33.0, 34.47], [42.0, 42.43], [52.0, 57.11], [60.0, 61.62], [75.0, 75.19], [76.0, 82.04], [83.0, 84.25], [85.0, 87.94], [91.0, 92.18], [94.0, 100.3], [101.0, 102.91], [104.0, 104.6], [108.0, 109.41]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false], "silence_prob": [29.05, 0.0, 28.71, 28.6, 0.0, 0.0, 0.0, 0.0, 28.71, 0.0, 0.0, 28.39, 0.0, 29.48, 0.0, 32.23, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 50.66], ["moo", 24.46], ["livestock, farm animals, working animals", 22.9]], null, [["music", 39.5], ["didgeridoo", 7.98], ["speech", 4.67]], [["cattle, bovinae", 61.85], ["moo", 29.23], ["livestock, farm animals, working animals", 5.43]], null, null, null, null, [["speech", 32.25], ["cattle, bovinae", 14.75], ["livestock, farm animals, working animals", 8.61]], null, null, [["speech", 45.36], ["vehicle", 13.4], ["siren", 8.2]], null, [["mains hum", 24.68], ["music", 20.76], ["speech", 12.93]], null, [["hum", 31.95], ["mains hum", 21.64], ["throbbing", 17.47]], null, null, null], "duration": [7.09, 0.08, 2.08, 3.41, 0.7, -0.25, 1.47, 0.43, 5.11, 1.62, 0.19, 6.04, 1.25, 2.94, 1.18, 6.3, 1.91, 0.6, 1.41]} \ No newline at end of file diff --git a/annotations_1/XA0J-wn1Esg_filtered.json b/annotations_1/XA0J-wn1Esg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a225d714e9fb95d374870fa4004d4fbd90175b2 --- /dev/null +++ b/annotations_1/XA0J-wn1Esg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.08], [16.0, 33.02], [34.0, 35.38], [37.0, 38.28], [39.0, 41.35], [42.0, 42.57], [44.0, 46.6], [47.0, 49.82], [50.0, 52.2], [55.0, 56.94], [58.0, 64.91], [65.0, 64.94], [66.0, 70.38], [74.0, 77.18], [78.0, 79.05], [81.0, 83.32], [84.0, 120.88], [121.0, 124.5], [137.0, 141.15], [142.0, 143.87], [146.0, 147.51], [150.0, 158.4], [159.0, 160.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 97.92, 0.0, 0.0, 99.8, 0.0, 97.33, 55.81, 76.04, 0.0, 99.68, 0.0, 99.44, 97.11, 0.0, 96.77, 0.0, 36.14, 35.49, 0.0, 0.0, 29.05, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.22], ["throbbing", 5.59], ["musical instrument", 5.28]], [["theremin", 51.98], ["music", 32.23], ["electronic music", 1.59]], null, null, [["hum", 26.24], ["music", 25.21], ["throbbing", 16.41]], null], "duration": [1.08, 17.02, 1.38, 1.28, 2.35, 0.57, 2.6, 2.82, 2.2, 1.94, 6.91, -0.06, 4.38, 3.18, 1.05, 2.32, 36.88, 3.5, 4.15, 1.87, 1.51, 8.4, 1.74]} \ No newline at end of file diff --git a/annotations_1/XAIeh0YarFs_filtered.json b/annotations_1/XAIeh0YarFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61f26b07399970baabb43961156fbc52da425aed --- /dev/null +++ b/annotations_1/XAIeh0YarFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.89], [19.0, 28.63], [29.0, 30.18], [31.0, 33.42], [34.0, 35.11], [37.0, 38.64], [40.0, 40.41], [42.0, 44.88], [49.0, 58.11], [59.0, 70.48], [77.0, 78.06], [81.0, 81.77], [82.0, 83.15], [85.0, 85.67], [88.0, 90.95], [93.0, 93.38], [96.0, 97.09], [99.0, 99.18], [102.0, 103.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.47, 0.0, 76.86, 0.0, 0.0, 0.0, 50.76, 49.73, 41.32, 0.0, 0.0, 0.0, 0.0, 46.19, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 52.25], ["cattle, bovinae", 21.22], ["moo", 16.12]], null, null, null, null, null, null, [["whale vocalization", 65.68], ["speech", 11.13], ["music", 4.81]], [["whale vocalization", 48.26], ["hum", 15.56], ["speech", 11.27]], null, null, null, null, [["whale vocalization", 46.64], ["music", 20.45], ["boat, water vehicle", 9.19]], null, null, null, null], "duration": [0.89, 9.63, 1.18, 2.42, 1.11, 1.64, 0.41, 2.88, 9.11, 11.48, 1.06, 0.77, 1.15, 0.67, 2.95, 0.38, 1.09, 0.18, 1.03]} \ No newline at end of file diff --git a/annotations_1/XAVgIM5X42w_filtered.json b/annotations_1/XAVgIM5X42w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f600c5dcdc8be9d61d030f943d5738168045ef28 --- /dev/null +++ b/annotations_1/XAVgIM5X42w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.0], [11.0, 12.33], [20.0, 21.47], [23.0, 24.29], [27.0, 28.51], [29.0, 29.37], [32.0, 34.69], [35.0, 36.66], [37.0, 38.53], [41.0, 40.73], [45.0, 45.93], [48.0, 49.37], [54.0, 54.45], [56.0, 57.23], [58.0, 59.09], [64.0, 63.91], [66.0, 66.68], [67.0, 67.9], [68.0, 68.79], [69.0, 70.36], [73.0, 73.79], [75.0, 75.22], [76.0, 78.04], [84.0, 85.29], [87.0, 88.47], [90.0, 90.95], [93.0, 94.05], [96.0, 96.5], [97.0, 98.96], [100.0, 101.76], [108.0, 108.7], [119.0, 120.21]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 45.88], ["sidetone", 11.31], ["music", 8.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 1.33, 1.47, 1.29, 1.51, 0.37, 2.69, 1.66, 1.53, -0.27, 0.93, 1.37, 0.45, 1.23, 1.09, -0.09, 0.68, 0.9, 0.79, 1.36, 0.79, 0.22, 2.04, 1.29, 1.47, 0.95, 1.05, 0.5, 1.96, 1.76, 0.7, 1.21]} \ No newline at end of file diff --git a/annotations_1/XB401RfGMlM_filtered.json b/annotations_1/XB401RfGMlM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec76ebd1766fe348e75b3758e73bd22d4cbbd04a --- /dev/null +++ b/annotations_1/XB401RfGMlM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.44], [33.0, 35.29], [46.0, 46.68], [69.0, 72.64], [80.0, 81.26], [88.0, 89.13], [98.0, 98.19], [98.0, 99.74], [104.0, 104.08], [106.0, 107.43], [110.0, 110.22], [111.0, 111.72], [124.0, 129.56], [137.0, 137.08], [138.0, 137.96], [138.0, 139.04], [140.0, 140.97], [142.0, 143.02], [150.0, 150.11]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.65, 0.0, 31.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["didgeridoo", 64.8], ["music", 26.88], ["speech", 1.04]], null, [["cattle, bovinae", 39.22], ["livestock, farm animals, working animals", 14.19], ["moo", 13.42]], null, null, null, null, null, null, null, null, [["moo", 40.81], ["cattle, bovinae", 37.25], ["livestock, farm animals, working animals", 19.57]], null, null, null, null, null, null], "duration": [1.44, 2.29, 0.68, 3.64, 1.26, 1.13, 0.19, 1.74, 0.08, 1.43, 0.22, 0.72, 5.56, 0.08, -0.04, 1.04, 0.97, 1.02, 0.11]} \ No newline at end of file diff --git a/annotations_1/XBCML9xJI8I_filtered.json b/annotations_1/XBCML9xJI8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f6278a409f022000b4c976bc26a63042f2c9343 --- /dev/null +++ b/annotations_1/XBCML9xJI8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 25.41], [28.0, 35.46], [50.0, 51.88], [60.0, 67.56], [69.0, 78.61], [82.0, 82.81], [87.0, 88.43], [91.0, 99.57], [105.0, 105.24], [106.0, 111.13], [114.0, 130.2], [133.0, 134.03], [139.0, 139.72], [146.0, 146.64], [171.0, 170.61]], "keep_status": [false, true, false, true, true, false, false, true, false, true, false, false, false, false, false], "silence_prob": [31.95, 36.89, 0.0, 34.25, 30.27, 0.0, 0.0, 30.67, 0.0, 35.2, 31.41, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 70.31], ["trance music", 4.21], ["electronic music", 3.68]], [["music", 53.97], ["drum machine", 4.75], ["throbbing", 4.42]], null, [["music", 50.68], ["electronic music", 5.92], ["animal", 5.68]], [["music", 39.91], ["cattle, bovinae", 15.28], ["moo", 13.97]], null, null, [["music", 43.59], ["animal", 6.16], ["electronic music", 5.61]], null, [["music", 31.17], ["sidetone", 19.21], ["moo", 10.96]], [["music", 77.67], ["speech", 6.49], ["electronic music", 4.23]], null, null, null, null], "duration": [5.41, 7.46, 1.88, 7.56, 9.61, 0.81, 1.43, 8.57, 0.24, 5.13, 16.2, 1.03, 0.72, 0.64, -0.39]} \ No newline at end of file diff --git a/annotations_1/XBz2wuGU9Cs_filtered.json b/annotations_1/XBz2wuGU9Cs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80ffb4b09bf90ec9d2af26bc416fc2c7ac93d2a8 --- /dev/null +++ b/annotations_1/XBz2wuGU9Cs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.89], [8.0, 8.51], [18.0, 18.01], [20.0, 20.26], [22.0, 22.17], [28.0, 28.36], [30.0, 30.91], [33.0, 34.47], [37.0, 37.47], [40.0, 41.01], [42.0, 43.09], [44.0, 45.01], [47.0, 47.65], [48.0, 48.81], [52.0, 52.91], [57.0, 57.16], [59.0, 59.64], [65.0, 66.33], [67.0, 67.85], [72.0, 74.02], [78.0, 78.46], [80.0, 80.76], [82.0, 83.62], [85.0, 86.26], [90.0, 91.47], [96.0, 96.67], [107.0, 107.13], [112.0, 112.95], [118.0, 118.88], [123.0, 123.13], [126.0, 126.64], [128.0, 127.82], [129.0, 128.88], [132.0, 131.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.11, 0.51, 0.01, 0.26, 0.17, 0.36, 0.91, 1.47, 0.47, 1.01, 1.09, 1.01, 0.65, 0.81, 0.91, 0.16, 0.64, 1.33, 0.85, 2.02, 0.46, 0.76, 1.62, 1.26, 1.47, 0.67, 0.13, 0.95, 0.88, 0.13, 0.64, -0.18, -0.12, -0.18]} \ No newline at end of file diff --git a/annotations_1/XC0h9nx3Pw4_filtered.json b/annotations_1/XC0h9nx3Pw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ff6c1dfbb461c4239ac43ad31df0037e21f5d08 --- /dev/null +++ b/annotations_1/XC0h9nx3Pw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.75], [7.0, 7.43], [10.0, 10.3], [11.0, 13.61], [15.0, 15.4], [17.0, 17.96], [21.0, 23.67], [25.0, 26.16], [26.0, 28.59], [30.0, 49.99], [58.0, 58.48], [61.0, 61.72], [70.0, 76.3], [77.0, 83.47], [89.0, 89.67], [91.0, 99.0], [100.0, 101.63], [115.0, 115.38], [129.0, 133.86], [135.0, 134.97], [135.0, 139.21], [143.0, 144.63], [147.0, 147.65], [149.0, 168.2], [169.0, 170.13]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 99.92, 0.0, 46.19, 31.69, 0.0, 0.0, 30.56, 31.37, 0.0, 30.03, 0.0, 0.0, 41.87, 0.0, 32.47, 0.0, 0.0, 33.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["sidetone", 30.56], ["hum", 20.42], ["music", 7.52]], [["speech", 84.08], ["music", 3.34], ["inside, small room", 0.88]], null, null, [["speech", 37.54], ["didgeridoo", 9.68], ["music", 9.42]], [["whack, thwack", 35.17], ["speech", 26.66], ["thunk", 15.45]], null, [["speech", 36.8], ["music", 32.09], ["theremin", 4.55]], null, null, [["speech", 37.48], ["mains hum", 12.63], ["hum", 11.86]], null, [["speech", 37.48], ["hum", 18.35], ["mains hum", 9.64]], null, null, [["speech", 61.79], ["music", 5.59], ["creak", 4.03]], null], "duration": [-0.25, 0.43, 0.3, 2.61, 0.4, 0.96, 2.67, 1.16, 2.59, 19.99, 0.48, 0.72, 6.3, 6.47, 0.67, 8.0, 1.63, 0.38, 4.86, -0.03, 4.21, 1.63, 0.65, 19.2, 1.13]} \ No newline at end of file diff --git a/annotations_1/XCJxGxYDjQE_filtered.json b/annotations_1/XCJxGxYDjQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e59c5f221b5bf1c0f415894c41503e748530f60f --- /dev/null +++ b/annotations_1/XCJxGxYDjQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[108.0, 108.53], [109.0, 109.26], [109.0, 109.31], [109.0, 117.26], [119.0, 128.01], [131.0, 160.64], [163.0, 164.66]], "keep_status": [false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.16, 29.54, 29.47, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 41.23], ["hum", 8.98], ["throbbing", 7.8]], [["music", 43.94], ["fly, housefly", 3.76], ["classical music", 3.54]], [["livestock, farm animals, working animals", 17.96], ["hum", 12.05], ["cattle, bovinae", 7.69]], null], "duration": [0.53, 0.26, 0.31, 8.26, 9.01, 29.64, 1.66]} \ No newline at end of file diff --git a/annotations_1/XDO8OYnmkNY_filtered.json b/annotations_1/XDO8OYnmkNY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f42d8c51f436e6edcf9787869e8aa885b8fef9f --- /dev/null +++ b/annotations_1/XDO8OYnmkNY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.35], [13.0, 15.48], [16.0, 17.39], [19.0, 21.0], [22.0, 23.38], [25.0, 26.33], [35.0, 36.46], [38.0, 39.68], [43.0, 44.09], [45.0, 45.15], [48.0, 49.08], [53.0, 53.33], [53.0, 54.7], [57.0, 58.45], [60.0, 60.35], [62.0, 63.29], [64.0, 65.3], [68.0, 71.69], [77.0, 79.1], [81.0, 81.68], [82.0, 83.98], [86.0, 86.83], [89.0, 91.71], [94.0, 100.18], [102.0, 101.93], [103.0, 105.0], [108.0, 109.56], [113.0, 117.71], [121.0, 123.06], [124.0, 126.33], [128.0, 129.17], [133.0, 135.11], [140.0, 140.37], [144.0, 145.81], [147.0, 149.13], [152.0, 151.98], [155.0, 157.94], [159.0, 181.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 100.0, 0.0, 0.0, 0.0, 100.0, 99.05, 0.0, 100.0, 0.0, 100.0, 100.0, 99.91, 0.0, 100.0, 0.0, 0.0, 94.37, 0.0, 100.0, 72.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.35, 2.48, 1.39, 2.0, 1.38, 1.33, 1.46, 1.68, 1.09, 0.15, 1.08, 0.33, 1.7, 1.45, 0.35, 1.29, 1.3, 3.69, 2.1, 0.68, 1.98, 0.83, 2.71, 6.18, -0.07, 2.0, 1.56, 4.71, 2.06, 2.33, 1.17, 2.11, 0.37, 1.81, 2.13, -0.02, 2.94, 22.62]} \ No newline at end of file diff --git a/annotations_1/XDlC8NyBBro_filtered.json b/annotations_1/XDlC8NyBBro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a93666381c3e119d2ad52fd37924e0e6ed9be616 --- /dev/null +++ b/annotations_1/XDlC8NyBBro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.85], [1.0, 1.12], [2.0, 4.26], [5.0, 5.32], [6.0, 6.83], [11.0, 11.06], [12.0, 11.99], [13.0, 20.53], [21.0, 21.66], [22.0, 22.0], [24.0, 25.37], [26.0, 33.78], [36.0, 37.02], [37.0, 38.72], [39.0, 47.58], [54.0, 53.99], [54.0, 54.65], [58.0, 60.15], [61.0, 61.3], [62.0, 64.27], [82.0, 82.54], [84.0, 84.91], [85.0, 85.26], [93.0, 92.65], [95.0, 96.28], [100.0, 100.13], [102.0, 102.69], [110.0, 111.08], [121.0, 121.19], [122.0, 122.17], [124.0, 124.41], [135.0, 136.0], [139.0, 139.99], [142.0, 143.48], [144.0, 145.39], [147.0, 147.14], [150.0, 150.84], [153.0, 153.47], [160.0, 165.7], [181.0, 186.71], [191.0, 194.04], [195.0, 195.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 99.44, 0.0, 0.0, 0.0, 0.0, 61.57, 0.0, 0.0, 0.0, 91.98, 0.0, 0.0, 41.87, 0.0, 0.0, 89.19, 0.0, 49.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 81.17, 38.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.02], ["keyboard (musical)", 7.98], ["musical instrument", 6.62]], null, null, null, null, [["sine wave", 25.43], ["sidetone", 17.68], ["chirp tone", 16.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 20.38], ["speech", 12.89], ["livestock, farm animals, working animals", 12.4]], null], "duration": [-0.15, 0.12, 2.26, 0.32, 0.83, 0.06, -0.01, 7.53, 0.66, 0.0, 1.37, 7.78, 1.02, 1.72, 8.58, -0.01, 0.65, 2.15, 0.3, 2.27, 0.54, 0.91, 0.26, -0.35, 1.28, 0.13, 0.69, 1.08, 0.19, 0.17, 0.41, 1.0, 0.99, 1.48, 1.39, 0.14, 0.84, 0.47, 5.7, 5.71, 3.04, 0.37]} \ No newline at end of file diff --git a/annotations_1/XDnXI6KXoeg_filtered.json b/annotations_1/XDnXI6KXoeg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0100cb3aff71e1804801d779c4cf3633990b51fd --- /dev/null +++ b/annotations_1/XDnXI6KXoeg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.36], [5.0, 6.89], [9.0, 9.44], [11.0, 11.91], [14.0, 16.92], [19.0, 19.9], [24.0, 25.29], [26.0, 34.03], [40.0, 41.88], [44.0, 44.71], [47.0, 54.89], [56.0, 64.27], [65.0, 66.41], [69.0, 70.56], [73.0, 73.08], [75.0, 76.49], [79.0, 82.48], [83.0, 88.62], [90.0, 90.85], [94.0, 97.88], [98.0, 101.17], [101.0, 106.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [91.64, 0.0, 0.0, 0.0, 50.31, 0.0, 0.0, 36.38, 0.0, 0.0, 87.19, 48.74, 0.0, 0.0, 0.0, 0.0, 46.26, 48.31, 0.0, 60.6, 44.9, 46.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 33.89], ["speech", 31.8], ["throbbing", 10.12]], null, null, null, [["speech", 42.38], ["hum", 22.12], ["mains hum", 16.77]], null, null, null, null, [["sidetone", 40.72], ["speech", 21.23], ["music", 11.92]], [["speech", 22.66], ["hum", 13.08], ["mains hum", 12.55]], null, null, [["music", 58.66], ["hum", 10.1], ["sidetone", 5.58]], [["music", 25.87], ["speech", 23.0], ["whale vocalization", 8.33]]], "duration": [2.36, 1.89, 0.44, 0.91, 2.92, 0.9, 1.29, 8.03, 1.88, 0.71, 7.89, 8.27, 1.41, 1.56, 0.08, 1.49, 3.48, 5.62, 0.85, 3.88, 3.17, 5.51]} \ No newline at end of file diff --git a/annotations_1/XEF8mU3Vanc_filtered.json b/annotations_1/XEF8mU3Vanc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5090034be9d22e3be98a33810eb1a625d1da7c74 --- /dev/null +++ b/annotations_1/XEF8mU3Vanc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.91], [13.0, 13.24], [13.0, 13.8], [16.0, 16.56], [26.0, 26.67], [27.0, 27.51], [43.0, 46.11], [52.0, 53.27], [64.0, 64.0], [65.0, 65.5], [66.0, 66.23], [78.0, 86.1], [87.0, 93.56], [96.0, 95.88], [98.0, 98.81], [120.0, 120.39], [121.0, 121.63], [140.0, 140.1], [149.0, 151.39], [161.0, 161.38], [165.0, 166.72], [168.0, 169.45], [171.0, 172.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.86, 0.0, 0.0, 0.0, 0.0, 34.18, 34.62, 0.0, 0.0, 0.0, 0.0, 0.0, 35.47, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 42.49], ["music", 36.18], ["synthesizer", 6.08]], null, null, null, null, [["music", 69.06], ["speech", 11.16], ["hum", 2.26]], [["music", 70.25], ["carnatic music", 5.23], ["sitar", 4.57]], null, null, null, null, null, [["music", 21.45], ["speech", 13.88], ["hum", 10.63]], null, null, null, null], "duration": [1.91, 0.24, 0.8, 0.56, 0.67, 0.51, 3.11, 1.27, 0.0, 0.5, 0.23, 8.1, 6.56, -0.12, 0.81, 0.39, 0.63, 0.1, 2.39, 0.38, 1.72, 1.45, 1.23]} \ No newline at end of file diff --git a/annotations_1/XF33SnFIDAQ_filtered.json b/annotations_1/XF33SnFIDAQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e9c37683678470667cf260db66158f5a2415a50 --- /dev/null +++ b/annotations_1/XF33SnFIDAQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.42], [15.0, 15.38], [17.0, 17.09], [18.0, 19.72], [22.0, 22.44], [24.0, 27.01], [27.0, 28.19], [30.0, 35.16], [37.0, 37.02], [37.0, 41.84], [43.0, 43.77], [49.0, 49.25], [51.0, 52.02], [52.0, 54.84], [55.0, 54.94], [55.0, 55.04], [57.0, 59.83], [62.0, 62.06], [66.0, 66.61], [68.0, 70.93], [71.0, 75.36], [78.0, 80.13], [82.0, 84.62], [88.0, 97.21], [98.0, 102.98], [103.0, 104.03], [105.0, 105.93]], "keep_status": [true, false, false, false, false, true, false, true, false, true, false, false, false, true, false, false, true, false, false, true, true, true, false, false, false, false, false], "silence_prob": [49.82, 0.0, 0.0, 0.0, 0.0, 48.61, 0.0, 43.2, 0.0, 36.43, 0.0, 0.0, 0.0, 33.36, 0.0, 0.0, 38.67, 0.0, 0.0, 37.97, 34.15, 42.79, 57.89, 39.05, 59.33, 0.0, 0.0], "audiomae_on_audioset": [[["music", 52.01], ["throbbing", 9.49], ["speech", 8.06]], null, null, null, null, [["music", 30.49], ["fly, housefly", 10.48], ["insect", 6.99]], null, [["music", 40.08], ["speech", 7.44], ["mosquito", 6.74]], null, [["speech", 14.33], ["cattle, bovinae", 11.11], ["fly, housefly", 9.4]], null, null, null, [["speech", 31.52], ["fart", 12.12], ["frying (food)", 10.85]], null, null, [["fly, housefly", 36.38], ["insect", 12.88], ["speech", 11.91]], null, null, [["music", 48.29], ["speech", 4.18], ["singing", 2.95]], [["speech", 36.75], ["fly, housefly", 9.26], ["insect", 7.3]], [["speech", 23.22], ["music", 14.72], ["hum", 12.28]], null, [["sidetone", 34.41], ["speech", 32.77], ["music", 8.74]], null, null, null], "duration": [8.42, 0.38, 0.09, 1.72, 0.44, 3.01, 1.19, 5.16, 0.02, 4.84, 0.77, 0.25, 1.02, 2.84, -0.06, 0.04, 2.83, 0.06, 0.61, 2.93, 4.36, 2.13, 2.62, 9.21, 4.98, 1.03, 0.93]} \ No newline at end of file diff --git a/annotations_1/XF5omSq8eRQ_filtered.json b/annotations_1/XF5omSq8eRQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c4a3ab44a8c05581be4f84b75ae6baa8955583c --- /dev/null +++ b/annotations_1/XF5omSq8eRQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.7], [10.0, 10.66], [14.0, 15.75], [24.0, 24.07], [32.0, 58.45], [72.0, 73.85], [75.0, 75.95], [78.0, 91.69], [95.0, 95.62], [111.0, 115.08], [120.0, 124.88], [127.0, 144.76], [151.0, 153.18], [162.0, 168.39], [172.0, 172.39], [174.0, 179.56], [180.0, 181.28], [186.0, 186.22], [187.0, 187.84], [189.0, 189.24], [191.0, 191.19], [192.0, 195.1], [197.0, 211.72], [214.0, 223.59], [224.0, 226.94]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.51, 0.0, 0.0, 31.44, 0.0, 29.92, 31.11, 30.37, 31.52, 30.16, 0.0, 31.01, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 31.04, 35.35, 39.18], "audiomae_on_audioset": [null, null, null, null, [["music", 37.41], ["throbbing", 12.88], ["speech", 10.72]], null, null, [["music", 86.81], ["synthesizer", 2.15], ["sound effect", 1.59]], null, [["music", 50.04], ["throbbing", 14.41], ["hum", 8.14]], [["music", 50.1], ["hum", 17.51], ["throbbing", 9.35]], [["music", 64.49], ["cacophony", 6.04], ["theremin", 4.46]], [["music", 60.91], ["speech", 12.05], ["synthesizer", 3.03]], [["music", 35.24], ["speech", 24.95], ["livestock, farm animals, working animals", 13.38]], null, [["speech", 39.03], ["music", 23.27], ["throbbing", 9.78]], null, null, null, null, null, null, [["music", 23.46], ["speech", 15.3], ["sidetone", 14.91]], [["cattle, bovinae", 23.9], ["moo", 14.09], ["livestock, farm animals, working animals", 10.92]], [["music", 43.76], ["boing", 10.15], ["groan", 8.17]]], "duration": [0.7, 0.66, 1.75, 0.07, 26.45, 1.85, 0.95, 13.69, 0.62, 4.08, 4.88, 17.76, 2.18, 6.39, 0.39, 5.56, 1.28, 0.22, 0.84, 0.24, 0.19, 3.1, 14.72, 9.59, 2.94]} \ No newline at end of file diff --git a/annotations_1/XFKhIBH23-Q_filtered.json b/annotations_1/XFKhIBH23-Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9097e2a560ee05c3145dbd4b3f1821e15f1118a9 --- /dev/null +++ b/annotations_1/XFKhIBH23-Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.38], [10.0, 11.37], [12.0, 12.26], [16.0, 15.99], [20.0, 20.88], [23.0, 23.08], [23.0, 23.79], [25.0, 25.57], [32.0, 32.78], [49.0, 49.5], [52.0, 52.41], [54.0, 55.09], [64.0, 65.57], [66.0, 66.8], [67.0, 71.83], [95.0, 95.96], [108.0, 108.89], [109.0, 109.54], [117.0, 117.05], [119.0, 119.38], [120.0, 120.46], [142.0, 142.92], [145.0, 154.5], [156.0, 156.54], [157.0, 157.2], [172.0, 173.62], [176.0, 176.64], [177.0, 178.28], [180.0, 179.9], [182.0, 182.28], [182.0, 182.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 1.37, 0.26, -0.01, 0.88, 0.08, 0.79, 0.57, 0.78, 0.5, 0.41, 1.09, 1.57, 0.8, 4.83, 0.96, 0.89, 0.54, 0.05, 0.38, 0.46, 0.92, 9.5, 0.54, 0.2, 1.62, 0.64, 1.28, -0.1, 0.28, 0.39]} \ No newline at end of file diff --git a/annotations_1/XGoagkYcJ38_filtered.json b/annotations_1/XGoagkYcJ38_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85ae0bc64244c6264a03f9ba5d7a35a9c8d6ff71 --- /dev/null +++ b/annotations_1/XGoagkYcJ38_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.11], [21.0, 59.68]], "keep_status": [false, false], "silence_prob": [32.36, 0.0], "audiomae_on_audioset": [[["music", 46.15], ["didgeridoo", 41.5], ["musical instrument", 3.75]], null], "duration": [2.11, 38.68]} \ No newline at end of file diff --git a/annotations_1/XHuewsIKvP0_filtered.json b/annotations_1/XHuewsIKvP0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7290caf8520546c59666d9ce7e885ad3fb136e6b --- /dev/null +++ b/annotations_1/XHuewsIKvP0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 49.27], [51.0, 56.81], [58.0, 59.76], [63.0, 64.15], [69.0, 69.23], [77.0, 78.09], [80.0, 79.98], [82.0, 85.72], [87.0, 91.44], [92.0, 105.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.05, 50.11, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 52.05, 73.82], "audiomae_on_audioset": [[["music", 83.37], ["ice cream truck, ice cream van", 6.69], ["speech", 1.66]], null, null, null, null, null, null, null, null, null], "duration": [13.27, 5.81, 1.76, 1.15, 0.23, 1.09, -0.02, 3.72, 4.44, 13.9]} \ No newline at end of file diff --git a/annotations_1/XHuo5etrwvY_filtered.json b/annotations_1/XHuo5etrwvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7831ffed46d6e12fca7818d95d48c9539243303 --- /dev/null +++ b/annotations_1/XHuo5etrwvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 77.4], [80.0, 108.01], [118.0, 123.84], [127.0, 149.91], [152.0, 153.62], [154.0, 155.36]], "keep_status": [false, false, true, true, false, false], "silence_prob": [0.0, 61.87, 28.48, 29.96, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 16.24], ["rumble", 11.14], ["music", 9.36]], [["speech", 17.11], ["music", 12.1], ["groan", 9.58]], null, null], "duration": [76.4, 28.01, 5.84, 22.91, 1.62, 1.36]} \ No newline at end of file diff --git a/annotations_1/XIJ-TpmNlI0_filtered.json b/annotations_1/XIJ-TpmNlI0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d0b0a43b62bc1d9e2ec315d9b37f2db1563b6c7 --- /dev/null +++ b/annotations_1/XIJ-TpmNlI0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.45], [13.0, 19.84], [20.0, 22.65], [24.0, 31.87], [39.0, 39.53], [40.0, 41.55], [44.0, 49.55], [53.0, 54.01], [54.0, 55.61], [57.0, 58.43], [61.0, 63.05], [65.0, 66.46], [67.0, 67.54], [69.0, 69.33], [70.0, 99.57], [101.0, 102.15]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [33.06, 30.61, 29.06, 29.04, 0.0, 0.0, 31.42, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 28.48, 0.0], "audiomae_on_audioset": [[["speech", 44.6], ["fart", 18.3], ["sheep", 5.22]], [["music", 27.98], ["sidetone", 24.1], ["hum", 11.77]], [["music", 55.37], ["speech", 23.4], ["electronic music", 2.41]], [["music", 21.12], ["livestock, farm animals, working animals", 15.11], ["cattle, bovinae", 9.7]], null, null, [["speech", 42.1], ["music", 22.56], ["boing", 5.76]], null, null, null, null, null, null, null, [["speech", 17.3], ["music", 10.87], ["crowd", 10.83]], null], "duration": [3.45, 6.84, 2.65, 7.87, 0.53, 1.55, 5.55, 1.01, 1.61, 1.43, 2.05, 1.46, 0.54, 0.33, 29.57, 1.15]} \ No newline at end of file diff --git a/annotations_1/XIPjMKd3-1U_filtered.json b/annotations_1/XIPjMKd3-1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6e82c117ed4890f561a566c4561e1beb901f53e --- /dev/null +++ b/annotations_1/XIPjMKd3-1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.91], [4.0, 4.16], [15.0, 17.25], [23.0, 23.87], [25.0, 30.21], [33.0, 35.99], [38.0, 38.42], [42.0, 42.67], [48.0, 48.34], [54.0, 59.39], [63.0, 63.1], [79.0, 79.19], [88.0, 90.09], [92.0, 93.12], [96.0, 97.33], [108.0, 108.31], [121.0, 127.99], [132.0, 135.89], [144.0, 154.53], [156.0, 156.02], [158.0, 171.27]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 64.52, 0.0, 99.16, 97.92, 0.0, 0.0, 0.0, 41.74, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 31.17, 30.64, 30.24, 0.0, 30.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 15.9], ["moo", 14.38], ["sine wave", 11.84]], null, null, null, null, null, null, [["music", 57.39], ["effects unit", 10.21], ["distortion", 4.61]], [["music", 30.4], ["moo", 14.0], ["speech", 12.22]], [["music", 72.27], ["speech", 6.91], ["musical instrument", 1.99]], null, [["music", 52.77], ["speech", 7.93], ["animal", 3.1]]], "duration": [-0.09, 0.16, 2.25, 0.87, 5.21, 2.99, 0.42, 0.67, 0.34, 5.39, 0.1, 0.19, 2.09, 1.12, 1.33, 0.31, 6.99, 3.89, 10.53, 0.02, 13.27]} \ No newline at end of file diff --git a/annotations_1/XJsuAUwGz0M_filtered.json b/annotations_1/XJsuAUwGz0M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3b5487ad86b13f3f5567e4a7450724abe95e864 --- /dev/null +++ b/annotations_1/XJsuAUwGz0M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.91], [13.0, 17.46], [21.0, 35.67], [36.0, 50.45]], "keep_status": [true, true, false, false], "silence_prob": [29.58, 39.46, 30.43, 33.72], "audiomae_on_audioset": [[["music", 47.41], ["musical instrument", 5.06], ["explosion", 4.41]], [["music", 20.1], ["mosquito", 16.53], ["throbbing", 10.14]], [["music", 59.7], ["speech", 6.24], ["cacophony", 5.18]], [["music", 68.88], ["throbbing", 10.54], ["hum", 5.07]]], "duration": [4.91, 4.46, 14.67, 14.45]} \ No newline at end of file diff --git a/annotations_1/XKNZy6gahyc_filtered.json b/annotations_1/XKNZy6gahyc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e8dc7323ec0b5864cf974a28a0db73ff0f82f29 --- /dev/null +++ b/annotations_1/XKNZy6gahyc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [5.0, 6.44], [7.0, 10.0], [12.0, 13.04], [15.0, 16.09], [17.0, 17.49], [20.0, 27.51], [34.0, 46.5], [48.0, 71.76], [75.0, 79.25], [83.0, 92.16], [93.0, 95.54], [98.0, 98.52], [100.0, 104.73], [108.0, 116.04]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 33.26, 0.0, 0.0, 0.0, 29.89, 30.14, 30.3, 30.14, 30.49, 30.58, 0.0, 30.62, 29.78], "audiomae_on_audioset": [null, null, [["fly, housefly", 30.3], ["mosquito", 18.26], ["music", 14.31]], null, null, null, [["music", 45.81], ["fly, housefly", 19.04], ["mosquito", 6.67]], [["cattle, bovinae", 40.54], ["moo", 31.22], ["livestock, farm animals, working animals", 12.85]], [["music", 69.34], ["speech", 8.12], ["didgeridoo", 6.28]], [["speech", 51.53], ["music", 14.35], ["vehicle", 4.64]], [["music", 38.04], ["hum", 21.17], ["speech", 13.19]], [["music", 31.36], ["hum", 20.73], ["throbbing", 12.88]], null, [["music", 66.89], ["fly, housefly", 3.53], ["speech", 2.57]], [["music", 71.6], ["carnatic music", 2.28], ["noise", 1.89]]], "duration": [1.13, 1.44, 3.0, 1.04, 1.09, 0.49, 7.51, 12.5, 23.76, 4.25, 9.16, 2.54, 0.52, 4.73, 8.04]} \ No newline at end of file diff --git a/annotations_1/XLAGTl0Nnws_filtered.json b/annotations_1/XLAGTl0Nnws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66c3e7a99b98de6b5f309f7674ecce966055ad94 --- /dev/null +++ b/annotations_1/XLAGTl0Nnws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 42.52], [44.0, 44.36], [45.0, 47.48], [67.0, 68.71], [81.0, 81.01], [86.0, 88.18], [92.0, 93.09], [101.0, 103.06], [103.0, 103.62], [110.0, 116.63]], "keep_status": [true, false, true, false, false, false, false, false, false, true], "silence_prob": [42.35, 0.0, 48.65, 0.0, 0.0, 53.72, 0.0, 64.52, 0.0, 44.99], "audiomae_on_audioset": [[["speech", 38.12], ["hum", 10.17], ["mains hum", 9.87]], null, [["speech", 26.28], ["siren", 14.58], ["emergency vehicle", 12.76]], null, null, null, null, null, null, [["animal", 23.95], ["dog", 14.21], ["speech", 13.88]]], "duration": [7.52, 0.36, 2.48, 1.71, 0.01, 2.18, 1.09, 2.06, 0.62, 6.63]} \ No newline at end of file diff --git a/annotations_1/XLMDSjCzEx8_filtered.json b/annotations_1/XLMDSjCzEx8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11b2e74213bfecd9ae6fe2acf523f7d73b861d30 --- /dev/null +++ b/annotations_1/XLMDSjCzEx8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.61], [11.0, 14.99], [18.0, 18.5], [20.0, 23.38], [34.0, 34.65], [70.0, 70.8], [75.0, 75.17], [78.0, 78.61], [80.0, 80.2], [86.0, 87.1], [97.0, 98.09], [100.0, 100.31], [102.0, 102.51], [105.0, 106.32], [108.0, 110.39], [114.0, 114.74]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 67.13, 0.0, 40.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.29, 0.0], "audiomae_on_audioset": [null, null, null, [["noise", 29.11], ["crushing", 15.88], ["thunk", 6.97]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 3.99, 0.5, 3.38, 0.65, 0.8, 0.17, 0.61, 0.2, 1.1, 1.09, 0.31, 0.51, 1.32, 2.39, 0.74]} \ No newline at end of file diff --git a/annotations_1/XM3MRt89zy4_filtered.json b/annotations_1/XM3MRt89zy4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da65eb33625f7d7480374a0159821bb6b76f14d9 --- /dev/null +++ b/annotations_1/XM3MRt89zy4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.77], [36.0, 37.52], [39.0, 39.5], [42.0, 43.56], [44.0, 45.06], [50.0, 51.22], [52.0, 53.55], [56.0, 58.13], [62.0, 62.78], [65.0, 65.45], [68.0, 70.87], [73.0, 74.36], [91.0, 94.26], [95.0, 95.4], [97.0, 97.36], [99.0, 100.72], [105.0, 104.82], [109.0, 112.92], [115.0, 116.28], [123.0, 123.84], [127.0, 127.5], [129.0, 129.54], [136.0, 136.46], [138.0, 138.5], [143.0, 143.46], [144.0, 144.41]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.85, 0.0, 0.0, 48.52, 0.0, 42.51, 0.0, 0.0, 0.0, 0.0, 69.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["whale vocalization", 34.45], ["livestock, farm animals, working animals", 18.84], ["animal", 10.02]], null, null, [["cattle, bovinae", 22.6], ["moo", 22.52], ["music", 10.82]], null, [["singing bowl", 23.28], ["music", 18.85], ["hum", 9.8]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.77, 1.52, 0.5, 1.56, 1.06, 1.22, 1.55, 2.13, 0.78, 0.45, 2.87, 1.36, 3.26, 0.4, 0.36, 1.72, -0.18, 3.92, 1.28, 0.84, 0.5, 0.54, 0.46, 0.5, 0.46, 0.41]} \ No newline at end of file diff --git a/annotations_1/XMGoOSCbul0_filtered.json b/annotations_1/XMGoOSCbul0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d557b590bc510cd0c1e855d69c335b16312fa9c --- /dev/null +++ b/annotations_1/XMGoOSCbul0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 17.98], [20.0, 24.34], [25.0, 25.73], [26.0, 30.1], [31.0, 32.29], [33.0, 43.34], [46.0, 48.07], [52.0, 52.74], [54.0, 56.51], [60.0, 62.94], [64.0, 72.0], [76.0, 81.75], [83.0, 83.71], [93.0, 94.8], [99.0, 100.16], [105.0, 115.45], [120.0, 120.73]], "keep_status": [true, true, false, false, false, false, true, false, true, true, false, true, false, false, false, false, false], "silence_prob": [31.98, 42.19, 0.0, 30.24, 0.0, 29.2, 29.89, 0.0, 30.14, 30.46, 29.79, 30.1, 0.0, 0.0, 0.0, 29.71, 0.0], "audiomae_on_audioset": [[["speech", 35.15], ["music", 16.97], ["sidetone", 13.23]], [["speech", 27.61], ["glass", 12.49], ["music", 9.74]], null, [["cattle, bovinae", 38.77], ["moo", 30.76], ["livestock, farm animals, working animals", 27.24]], null, [["music", 84.35], ["throbbing", 2.0], ["beatboxing", 1.33]], [["music", 52.72], ["synthesizer", 5.1], ["theremin", 4.67]], null, [["music", 23.96], ["didgeridoo", 12.37], ["mains hum", 11.57]], [["music", 37.31], ["hum", 15.3], ["throbbing", 14.43]], [["music", 76.17], ["boing", 12.87], ["hip hop music", 0.79]], [["music", 39.11], ["static", 7.77], ["singing", 6.54]], null, null, null, [["music", 45.3], ["throbbing", 27.48], ["hum", 7.44]], null], "duration": [5.98, 4.34, 0.73, 4.1, 1.29, 10.34, 2.07, 0.74, 2.51, 2.94, 8.0, 5.75, 0.71, 1.8, 1.16, 10.45, 0.73]} \ No newline at end of file diff --git a/annotations_1/XMKKYshEbzM_filtered.json b/annotations_1/XMKKYshEbzM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32c354db7df2d7cee519e3452f7b743f57706da2 --- /dev/null +++ b/annotations_1/XMKKYshEbzM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 38.4], [41.0, 44.09], [46.0, 46.16], [46.0, 46.2], [46.0, 47.65], [48.0, 48.83], [50.0, 53.79], [58.0, 58.92], [66.0, 66.63], [67.0, 68.89], [69.0, 79.3], [80.0, 80.28], [83.0, 159.31]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.58, 0.0, 0.0, 0.0, 0.0, 31.63, 0.0, 0.0, 0.0, 28.64, 0.0, 0.0], "audiomae_on_audioset": [null, [["whale vocalization", 22.11], ["rumble", 13.2], ["music", 11.43]], null, null, null, null, [["music", 74.04], ["throbbing", 7.93], ["hum", 3.61]], null, null, null, [["hum", 31.58], ["speech", 24.62], ["mains hum", 17.49]], null, null], "duration": [0.4, 3.09, 0.16, 0.2, 1.65, 0.83, 3.79, 0.92, 0.63, 1.89, 10.3, 0.28, 76.31]} \ No newline at end of file diff --git a/annotations_1/XMPTy7Iaw9s_filtered.json b/annotations_1/XMPTy7Iaw9s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2859cd898f1d0bea05470853bc53a99fd478cddb --- /dev/null +++ b/annotations_1/XMPTy7Iaw9s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.32], [16.0, 22.08], [26.0, 31.89], [34.0, 34.38], [36.0, 45.77], [51.0, 59.21], [63.0, 98.41], [101.0, 104.8], [106.0, 118.67], [123.0, 132.51], [141.0, 142.15], [143.0, 145.34], [147.0, 148.56], [152.0, 155.29]], "keep_status": [true, false, false, false, true, true, false, true, true, false, false, true, false, false], "silence_prob": [28.97, 29.46, 28.76, 0.0, 28.91, 29.06, 0.0, 28.75, 29.11, 29.17, 0.0, 29.3, 0.0, 29.28], "audiomae_on_audioset": [[["music", 43.18], ["hum", 10.15], ["throbbing", 6.15]], [["throbbing", 35.94], ["hum", 27.68], ["music", 21.55]], [["speech", 39.37], ["vehicle", 24.27], ["car", 11.01]], null, [["music", 50.55], ["throbbing", 10.16], ["hum", 6.27]], [["mains hum", 33.85], ["hum", 15.2], ["vehicle", 9.7]], null, [["mains hum", 14.91], ["music", 10.86], ["hum", 10.49]], [["buzz", 14.34], ["fly, housefly", 12.85], ["music", 12.67]], [["music", 80.24], ["speech", 4.25], ["throbbing", 3.29]], null, [["music", 48.6], ["musical instrument", 8.1], ["synthesizer", 6.36]], null, [["speech", 55.07], ["vehicle", 11.9], ["music", 6.44]]], "duration": [2.32, 6.08, 5.89, 0.38, 9.77, 8.21, 35.41, 3.8, 12.67, 9.51, 1.15, 2.34, 1.56, 3.29]} \ No newline at end of file diff --git a/annotations_1/XMt98-MEWmw_filtered.json b/annotations_1/XMt98-MEWmw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc82d2892141b3a7fe85bd3820d52e3a4a2cffce --- /dev/null +++ b/annotations_1/XMt98-MEWmw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.57], [10.0, 10.79], [12.0, 13.0], [15.0, 14.72], [16.0, 16.26], [22.0, 22.89], [24.0, 24.21], [26.0, 26.16], [27.0, 27.03], [29.0, 29.37], [31.0, 30.6], [32.0, 32.46], [35.0, 36.36], [38.0, 39.46], [40.0, 41.01], [55.0, 56.91], [65.0, 64.62], [67.0, 67.93], [69.0, 68.94], [71.0, 71.76], [74.0, 74.53], [75.0, 75.69], [78.0, 79.3], [82.0, 82.24], [91.0, 92.1], [92.0, 94.14], [96.0, 96.55], [99.0, 100.92], [102.0, 102.91], [104.0, 105.58], [108.0, 109.32], [111.0, 110.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 0.79, 1.0, -0.28, 0.26, 0.89, 0.21, 0.16, 0.03, 0.37, -0.4, 0.46, 1.36, 1.46, 1.01, 1.91, -0.38, 0.93, -0.06, 0.76, 0.53, 0.69, 1.3, 0.24, 1.1, 2.14, 0.55, 1.92, 0.91, 1.58, 1.32, -0.19]} \ No newline at end of file diff --git a/annotations_1/XNUers0BuD4_filtered.json b/annotations_1/XNUers0BuD4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..131ffd75cfcf20cde19b06e065bc6e38ee6af1e9 --- /dev/null +++ b/annotations_1/XNUers0BuD4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.47], [8.0, 9.41], [10.0, 10.47], [11.0, 12.01], [13.0, 15.62], [21.0, 23.53], [25.0, 25.03], [26.0, 26.25], [26.0, 29.81], [30.0, 31.95], [35.0, 37.62], [38.0, 38.5], [40.0, 40.71], [43.0, 42.7], [44.0, 51.73], [54.0, 56.51], [60.0, 62.04], [63.0, 63.44], [75.0, 75.49], [86.0, 87.76], [89.0, 91.37], [93.0, 92.91], [94.0, 94.22], [98.0, 99.77], [101.0, 102.91], [103.0, 104.68], [106.0, 108.03], [109.0, 111.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.93, 90.6, 0.0, 0.0, 98.8, 0.0, 100.0, 0.0, 0.0, 0.0, 99.65, 75.39, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 97.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.47, 1.41, 0.47, 1.01, 2.62, 2.53, 0.03, 0.25, 3.81, 1.95, 2.62, 0.5, 0.71, -0.3, 7.73, 2.51, 2.04, 0.44, 0.49, 1.76, 2.37, -0.09, 0.22, 1.77, 1.91, 1.68, 2.03, 2.86]} \ No newline at end of file diff --git a/annotations_1/XNZRK35VNrk_filtered.json b/annotations_1/XNZRK35VNrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d698a378e5dba9c5583867422187a5041628926b --- /dev/null +++ b/annotations_1/XNZRK35VNrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[84.0, 86.9]], "keep_status": [false], "silence_prob": [38.64], "audiomae_on_audioset": [[["mains hum", 30.05], ["hum", 26.35], ["music", 18.74]]], "duration": [2.9]} \ No newline at end of file diff --git a/annotations_1/XNwDyM81lSE_filtered.json b/annotations_1/XNwDyM81lSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c02dc819092634f72270f5ffde31e89860632304 --- /dev/null +++ b/annotations_1/XNwDyM81lSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.23], [11.0, 12.87], [14.0, 16.21], [18.0, 20.6], [22.0, 23.57], [25.0, 26.23], [28.0, 30.1], [31.0, 32.75], [33.0, 34.99], [36.0, 40.39], [42.0, 47.21], [48.0, 52.34], [53.0, 65.6], [69.0, 69.42], [70.0, 86.21], [86.0, 86.27], [88.0, 88.42], [89.0, 99.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [89.72, 0.0, 67.89, 69.07, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 41.18, 61.57, 29.25, 0.0, 29.9, 0.0, 0.0, 30.12], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 40.45], ["foghorn", 15.95], ["hum", 7.29]], null, [["music", 40.22], ["didgeridoo", 11.73], ["speech", 7.21]], null, [["music", 46.19], ["brass instrument", 23.83], ["trombone", 16.94]], null, null, [["music", 54.65], ["brass instrument", 14.04], ["trombone", 11.84]]], "duration": [5.23, 1.87, 2.21, 2.6, 1.57, 1.23, 2.1, 1.75, 1.99, 4.39, 5.21, 4.34, 12.6, 0.42, 16.21, 0.27, 0.42, 10.18]} \ No newline at end of file diff --git a/annotations_1/XO4HxR3dPsI_filtered.json b/annotations_1/XO4HxR3dPsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87d4f07ab1bb714e838c0c127132be36f8b46673 --- /dev/null +++ b/annotations_1/XO4HxR3dPsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.33], [10.0, 14.01], [20.0, 21.1], [26.0, 26.08], [27.0, 27.73], [29.0, 29.17], [31.0, 30.99], [43.0, 43.87], [53.0, 53.33], [62.0, 63.04], [68.0, 68.54], [80.0, 80.94], [81.0, 83.67], [84.0, 86.56], [94.0, 94.49], [97.0, 98.73], [109.0, 109.22], [114.0, 114.94], [116.0, 117.14], [123.0, 123.89], [138.0, 138.96], [141.0, 141.86], [145.0, 145.72], [151.0, 152.58], [155.0, 156.83], [158.0, 159.21], [164.0, 165.77], [167.0, 169.48]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.75, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82], "audiomae_on_audioset": [null, [["chainsaw", 22.34], ["civil defense siren", 11.09], ["speech", 7.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 4.01, 1.1, 0.08, 0.73, 0.17, -0.01, 0.87, 0.33, 1.04, 0.54, 0.94, 2.67, 2.56, 0.49, 1.73, 0.22, 0.94, 1.14, 0.89, 0.96, 0.86, 0.72, 1.58, 1.83, 1.21, 1.77, 2.48]} \ No newline at end of file diff --git a/annotations_1/XOfjQQT9O08_filtered.json b/annotations_1/XOfjQQT9O08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1db5cb92790611a54cd57ce15bfcca52742daa91 --- /dev/null +++ b/annotations_1/XOfjQQT9O08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.19], [8.0, 8.58], [16.0, 17.58], [22.0, 27.36], [34.0, 38.04], [44.0, 47.8], [55.0, 60.83], [63.0, 70.73], [72.0, 72.45], [73.0, 72.94], [73.0, 73.89], [77.0, 93.09], [100.0, 100.82], [102.0, 104.16], [105.0, 104.97], [113.0, 114.4], [121.0, 123.47], [127.0, 128.41], [130.0, 131.73]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.17, 32.07, 30.3, 30.17, 35.49, 0.0, 0.0, 0.0, 30.94, 0.0, 29.27, 0.0, 0.0, 32.28, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 72.54], ["drum machine", 4.36], ["boing", 3.31]], [["music", 64.36], ["speech", 5.45], ["cattle, bovinae", 3.87]], [["speech", 60.86], ["music", 11.81], ["whack, thwack", 5.68]], [["hum", 19.7], ["speech", 19.27], ["music", 14.3]], [["hum", 37.07], ["throbbing", 26.05], ["music", 20.58]], null, null, null, [["music", 52.52], ["speech", 12.57], ["electronic music", 5.78]], null, [["music", 30.98], ["speech", 12.92], ["electronic music", 4.13]], null, null, [["music", 51.14], ["hum", 12.15], ["speech", 5.91]], null, null], "duration": [0.19, 0.58, 1.58, 5.36, 4.04, 3.8, 5.83, 7.73, 0.45, -0.06, 0.89, 16.09, 0.82, 2.16, -0.03, 1.4, 2.47, 1.41, 1.73]} \ No newline at end of file diff --git a/annotations_1/XP0SZTwlmMk_filtered.json b/annotations_1/XP0SZTwlmMk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cb61f75ad6b70aae9e69dc93f8d05a3d0c25347 --- /dev/null +++ b/annotations_1/XP0SZTwlmMk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [8.0, 11.77], [13.0, 14.1], [15.0, 16.5], [21.0, 21.9], [27.0, 26.94], [31.0, 32.14], [36.0, 39.97], [40.0, 41.25], [45.0, 51.73], [55.0, 55.81], [60.0, 65.62], [71.0, 75.93], [77.0, 84.47], [86.0, 89.88]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, true, false, true], "silence_prob": [0.0, 34.76, 0.0, 0.0, 0.0, 0.0, 0.0, 37.01, 0.0, 39.4, 0.0, 50.86, 49.54, 45.43, 43.51], "audiomae_on_audioset": [null, [["speech", 77.48], ["chop", 3.35], ["ping", 2.09]], null, null, null, null, null, [["speech", 35.03], ["didgeridoo", 11.3], ["sidetone", 10.03]], null, [["speech", 13.22], ["noise", 9.37], ["sidetone", 5.86]], null, null, [["speech", 33.04], ["beatboxing", 22.06], ["music", 8.62]], [["speech", 61.58], ["hum", 11.81], ["sidetone", 8.42]], [["speech", 23.97], ["sidetone", 16.47], ["fly, housefly", 14.39]]], "duration": [0.42, 3.77, 1.1, 1.5, 0.9, -0.06, 1.14, 3.97, 1.25, 6.73, 0.81, 5.62, 4.93, 7.47, 3.88]} \ No newline at end of file diff --git a/annotations_1/XPKzmSSQ2xk_filtered.json b/annotations_1/XPKzmSSQ2xk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6740e32134551e091ce6c305db8d57121723afea --- /dev/null +++ b/annotations_1/XPKzmSSQ2xk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.09], [16.0, 24.83], [26.0, 31.77], [33.0, 34.06], [35.0, 36.05], [38.0, 39.11], [41.0, 42.3], [44.0, 45.42], [47.0, 47.14], [48.0, 49.32], [51.0, 53.37], [54.0, 56.56], [57.0, 58.58], [60.0, 62.92], [65.0, 65.74], [67.0, 68.07], [70.0, 70.38], [72.0, 73.21], [76.0, 77.45], [81.0, 81.84], [84.0, 86.61], [90.0, 92.37], [95.0, 101.09], [104.0, 109.98], [112.0, 114.69]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.38, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 77.2, 0.0, 91.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 93.29, 99.95, 99.9, 99.99], "audiomae_on_audioset": [null, [["speech", 50.52], ["frog", 8.98], ["radio", 7.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.09, 8.83, 5.77, 1.06, 1.05, 1.11, 1.3, 1.42, 0.14, 1.32, 2.37, 2.56, 1.58, 2.92, 0.74, 1.07, 0.38, 1.21, 1.45, 0.84, 2.61, 2.37, 6.09, 5.98, 2.69]} \ No newline at end of file diff --git a/annotations_1/XPsDyk5bJdE_filtered.json b/annotations_1/XPsDyk5bJdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01efda7119c3412f99fd3042dbd511309c945c12 --- /dev/null +++ b/annotations_1/XPsDyk5bJdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.8], [12.0, 12.48], [13.0, 14.15], [16.0, 16.87], [30.0, 30.79], [32.0, 33.62], [37.0, 39.41], [40.0, 42.84], [63.0, 63.22], [69.0, 69.99], [77.0, 77.99], [81.0, 82.02], [85.0, 85.33], [86.0, 86.68], [95.0, 96.11], [97.0, 97.97], [100.0, 101.22], [107.0, 107.32], [108.0, 109.51], [110.0, 115.23], [116.0, 116.67], [122.0, 123.85], [129.0, 132.26], [135.0, 135.5], [137.0, 137.89], [141.0, 141.42], [143.0, 144.15], [145.0, 145.39], [147.0, 147.51], [152.0, 152.59], [155.0, 155.33], [158.0, 157.84], [164.0, 164.67], [167.0, 167.24], [168.0, 168.57]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.05, 0.0, 0.0, 0.0, 0.0, 0.0, 88.28, 40.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.14, 0.0, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["thunk", 18.43], ["gong", 13.15], ["music", 11.74]], null, null, null, null, null, null, [["music", 43.72], ["mantra", 14.06], ["chant", 9.93]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.83], ["mains hum", 10.34], ["hum", 4.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.8, 0.48, 1.15, 0.87, 0.79, 1.62, 2.41, 2.84, 0.22, 0.99, 0.99, 1.02, 0.33, 0.68, 1.11, 0.97, 1.22, 0.32, 1.51, 5.23, 0.67, 1.85, 3.26, 0.5, 0.89, 0.42, 1.15, 0.39, 0.51, 0.59, 0.33, -0.16, 0.67, 0.24, 0.57]} \ No newline at end of file diff --git a/annotations_1/XPsddyf2EcY_filtered.json b/annotations_1/XPsddyf2EcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..383336bd1d53a0eb21856df4060d62601a8322b9 --- /dev/null +++ b/annotations_1/XPsddyf2EcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [1.0, 1.85], [2.0, 2.78], [7.0, 8.06], [9.0, 10.02], [11.0, 12.43], [12.0, 12.48], [13.0, 14.2], [14.0, 14.77], [16.0, 16.16], [22.0, 22.06], [24.0, 26.01], [27.0, 27.6], [29.0, 30.72], [40.0, 43.44], [44.0, 45.42], [49.0, 48.93], [49.0, 65.03], [72.0, 76.99], [79.0, 83.78], [86.0, 86.78], [88.0, 88.62], [91.0, 93.18], [105.0, 105.12], [107.0, 112.87], [114.0, 113.64], [120.0, 122.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.88, 0.0, 0.0, 35.31, 0.0, 0.0, 30.63, 31.22, 35.01, 0.0, 0.0, 32.51, 0.0, 33.53, 0.0, 29.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 54.51], ["grunt", 11.21], ["groan", 6.56]], null, null, [["music", 35.1], ["speech", 31.15], ["quack", 3.56]], null, null, [["music", 51.64], ["speech", 27.87], ["synthesizer", 4.54]], [["music", 68.16], ["speech", 18.63], ["synthesizer", 4.02]], [["music", 72.1], ["boing", 8.51], ["sidetone", 4.32]], null, null, [["music", 47.34], ["speech", 17.17], ["sidetone", 14.84]], null, [["music", 62.76], ["speech", 11.42], ["musical instrument", 7.79]], null, [["boing", 26.48], ["music", 15.6], ["whack, thwack", 12.27]]], "duration": [0.5, 0.85, 0.78, 1.06, 1.02, 1.43, 0.48, 1.2, 0.77, 0.16, 0.06, 2.01, 0.6, 1.72, 3.44, 1.42, -0.07, 16.03, 4.99, 4.78, 0.78, 0.62, 2.18, 0.12, 5.87, -0.36, 2.72]} \ No newline at end of file diff --git a/annotations_1/XQEr5FlhFDc_filtered.json b/annotations_1/XQEr5FlhFDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86ada645a4720d7fe09f616fd23f3b66ec4101e6 --- /dev/null +++ b/annotations_1/XQEr5FlhFDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.69], [11.0, 17.1], [19.0, 21.25], [23.0, 25.15], [28.0, 47.78], [50.0, 60.72], [63.0, 67.37], [70.0, 72.62], [75.0, 76.76], [80.0, 88.47], [90.0, 93.83], [95.0, 95.42], [97.0, 99.42], [100.0, 101.12], [102.0, 110.83], [116.0, 138.4], [147.0, 148.63], [152.0, 151.88]], "keep_status": [false, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [58.22, 46.86, 66.63, 57.01, 63.64, 47.43, 57.17, 44.32, 0.0, 52.68, 40.86, 0.0, 57.56, 0.0, 61.87, 40.17, 0.0, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 18.66], ["speech", 14.98], ["hum", 11.75]], null, null, null, [["hum", 40.42], ["speech", 30.53], ["mains hum", 5.8]], null, [["speech", 29.73], ["aircraft", 11.65], ["fixed-wing aircraft, airplane", 11.07]], null, null, [["noise", 15.86], ["music", 15.25], ["mains hum", 13.11]], null, null, null, null, [["music", 69.36], ["hum", 5.96], ["throbbing", 4.54]], null, null], "duration": [3.69, 6.1, 2.25, 2.15, 19.78, 10.72, 4.37, 2.62, 1.76, 8.47, 3.83, 0.42, 2.42, 1.12, 8.83, 22.4, 1.63, -0.12]} \ No newline at end of file diff --git a/annotations_1/XR7br4b3gsg_filtered.json b/annotations_1/XR7br4b3gsg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d60744d4fdd7f44e9db50ef87a7d9dd5a64c60fa --- /dev/null +++ b/annotations_1/XR7br4b3gsg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.25], [27.0, 28.21], [29.0, 29.71], [30.0, 35.4], [37.0, 37.44], [39.0, 45.77], [48.0, 50.26], [51.0, 51.76], [53.0, 53.57], [56.0, 56.4], [63.0, 64.15], [67.0, 122.22], [125.0, 124.61], [127.0, 127.68], [131.0, 131.82], [137.0, 137.64], [141.0, 141.86], [142.0, 144.95], [146.0, 150.33], [154.0, 157.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.14, 0.0, 30.05, 45.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 50.06, 34.44], "audiomae_on_audioset": [null, null, null, [["hum", 54.36], ["throbbing", 18.38], ["music", 8.79]], null, [["speech", 27.26], ["gunshot, gunfire", 26.96], ["artillery fire", 20.71]], [["hum", 41.12], ["mains hum", 30.95], ["music", 9.02]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.77], ["drum machine", 15.41], ["synthesizer", 6.23]]], "duration": [0.25, 1.21, 0.71, 5.4, 0.44, 6.77, 2.26, 0.76, 0.57, 0.4, 1.15, 55.22, -0.39, 0.68, 0.82, 0.64, 0.86, 2.95, 4.33, 3.81]} \ No newline at end of file diff --git a/annotations_1/XRtuUFYTctA_filtered.json b/annotations_1/XRtuUFYTctA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08c211fe793dd4bb97425cd90957a7a1b5683734 --- /dev/null +++ b/annotations_1/XRtuUFYTctA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.06], [6.0, 18.76], [21.0, 21.81], [23.0, 24.16], [25.0, 39.66], [42.0, 41.86], [45.0, 44.98], [47.0, 46.85], [49.0, 49.05], [50.0, 59.39], [60.0, 61.08], [65.0, 66.46], [68.0, 68.15], [70.0, 72.89]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 32.2, 0.0, 0.0, 30.02, 0.0, 0.0, 0.0, 0.0, 40.38, 0.0, 0.0, 0.0, 68.54], "audiomae_on_audioset": [null, [["speech", 52.48], ["radio", 9.03], ["sidetone", 7.98]], null, null, [["fart", 34.92], ["speech", 31.82], ["walk, footsteps", 4.58]], null, null, null, null, [["radio", 27.0], ["noise", 19.05], ["speech", 12.9]], null, null, null, null], "duration": [1.06, 12.76, 0.81, 1.16, 14.66, -0.14, -0.02, -0.15, 0.05, 9.39, 1.08, 1.46, 0.15, 2.89]} \ No newline at end of file diff --git a/annotations_1/XT2IS2dn8gM_filtered.json b/annotations_1/XT2IS2dn8gM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..373db5d646d46309f94f70b3bcfcc852ce5008c9 --- /dev/null +++ b/annotations_1/XT2IS2dn8gM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 35.01], [38.0, 47.98], [52.0, 63.61], [66.0, 66.07], [68.0, 91.3], [96.0, 100.08], [106.0, 106.79], [108.0, 109.34], [114.0, 114.34], [115.0, 115.96], [117.0, 117.8], [119.0, 119.58], [120.0, 120.73], [121.0, 122.57], [125.0, 127.36], [130.0, 130.13]], "keep_status": [true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.86, 39.07, 34.53, 0.0, 33.78, 90.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0], "audiomae_on_audioset": [[["throbbing", 29.75], ["music", 27.06], ["bow-wow", 10.93]], [["throbbing", 61.25], ["music", 14.88], ["hum", 11.29]], [["music", 50.91], ["throbbing", 7.61], ["bow-wow", 4.73]], null, [["music", 51.76], ["animal", 6.63], ["throbbing", 6.32]], null, null, null, null, null, null, null, null, null, null, null], "duration": [13.01, 9.98, 11.61, 0.07, 23.3, 4.08, 0.79, 1.34, 0.34, 0.96, 0.8, 0.58, 0.73, 1.57, 2.36, 0.13]} \ No newline at end of file diff --git a/annotations_1/XTCEl_MFfHA_filtered.json b/annotations_1/XTCEl_MFfHA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41e2d21af0adbc48c1957000b72474d11bf2399a --- /dev/null +++ b/annotations_1/XTCEl_MFfHA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 41.49], [42.0, 53.67], [54.0, 56.22]], "keep_status": [false, true, true], "silence_prob": [66.15, 45.56, 42.39], "audiomae_on_audioset": [null, [["music", 58.33], ["gong", 5.22], ["hum", 5.09]], [["music", 41.28], ["gong", 7.05], ["theremin", 6.68]]], "duration": [3.49, 11.67, 2.22]} \ No newline at end of file diff --git a/annotations_1/XTjTXskLQO0_filtered.json b/annotations_1/XTjTXskLQO0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12fcc12b3ddab98448a952ed67a8a04640879cff --- /dev/null +++ b/annotations_1/XTjTXskLQO0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.17], [18.0, 20.12], [35.0, 35.63], [36.0, 37.25], [40.0, 40.66], [41.0, 43.39], [44.0, 49.35], [50.0, 50.41], [51.0, 52.88], [53.0, 54.3], [55.0, 61.38], [69.0, 69.04], [72.0, 72.69], [74.0, 75.05], [77.0, 79.03], [85.0, 86.63], [88.0, 103.92], [113.0, 112.72], [113.0, 114.61], [118.0, 118.79], [119.0, 122.62], [129.0, 135.09], [139.0, 139.95], [142.0, 142.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.87, 0.0, 0.0, 0.0, 55.25, 73.21, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 0.0, 36.02, 0.0, 34.16, 0.0, 0.0, 0.0, 52.62, 38.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 51.4], ["thunk", 12.27], ["crushing", 5.45]], null, null, null, [["speech", 25.97], ["thunk", 19.44], ["boing", 16.76]], null, [["music", 79.22], ["boing", 8.3], ["thunk", 2.2]], null, null, null, null, [["music", 69.36], ["singing", 3.14], ["musical instrument", 3.12]], null, null], "duration": [1.17, 2.12, 0.63, 1.25, 0.66, 2.39, 5.35, 0.41, 1.88, 1.3, 6.38, 0.04, 0.69, 1.05, 2.03, 1.63, 15.92, -0.28, 1.61, 0.79, 3.62, 6.09, 0.95, 0.92]} \ No newline at end of file diff --git a/annotations_1/XUSzvNtSsFE_filtered.json b/annotations_1/XUSzvNtSsFE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b2fc273a117fb6cbd0bbc30a932362f6c33c07c --- /dev/null +++ b/annotations_1/XUSzvNtSsFE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 33.25], [34.0, 62.78], [63.0, 66.02], [71.0, 72.12], [76.0, 76.49], [83.0, 100.92], [104.0, 104.97], [105.0, 108.18], [110.0, 110.74], [111.0, 133.02], [136.0, 143.72], [145.0, 147.77], [151.0, 171.22], [172.0, 183.36], [187.0, 191.17], [192.0, 194.8]], "keep_status": [true, false, true, false, false, true, false, true, false, true, true, false, false, true, true, false], "silence_prob": [32.13, 31.23, 34.74, 0.0, 0.0, 29.87, 0.0, 38.6, 0.0, 30.47, 32.38, 28.24, 29.21, 28.75, 42.91, 68.41], "audiomae_on_audioset": [[["whale vocalization", 50.36], ["buzz", 11.06], ["music", 5.78]], [["hum", 43.47], ["mains hum", 19.57], ["rumble", 12.51]], [["sidetone", 26.76], ["speech", 24.59], ["music", 12.19]], null, null, [["music", 15.46], ["fly, housefly", 13.51], ["insect", 9.45]], null, [["music", 38.28], ["throbbing", 14.49], ["hum", 9.72]], null, [["speech", 45.38], ["breaking", 15.7], ["music", 7.92]], [["music", 46.17], ["electronic music", 7.25], ["sidetone", 5.91]], [["livestock, farm animals, working animals", 44.0], ["cattle, bovinae", 20.46], ["moo", 18.99]], [["speech", 46.4], ["music", 19.09], ["rumble", 4.91]], [["fly, housefly", 11.32], ["insect", 8.83], ["music", 7.87]], [["music", 52.37], ["noise", 8.29], ["throbbing", 7.0]], null], "duration": [17.25, 28.78, 3.02, 1.12, 0.49, 17.92, 0.97, 3.18, 0.74, 22.02, 7.72, 2.77, 20.22, 11.36, 4.17, 2.8]} \ No newline at end of file diff --git a/annotations_1/XUcN9bf_jP0_filtered.json b/annotations_1/XUcN9bf_jP0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43b48cceb1a9305c450715bfea0585b61732f96a --- /dev/null +++ b/annotations_1/XUcN9bf_jP0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.33], [17.0, 17.37], [19.0, 20.7], [22.0, 29.74], [30.0, 30.79], [31.0, 36.42], [40.0, 40.91], [44.0, 47.68], [54.0, 54.7], [56.0, 57.38], [57.0, 57.64], [59.0, 69.13], [72.0, 74.36], [76.0, 77.4], [82.0, 121.49], [125.0, 125.37], [126.0, 126.69], [134.0, 134.18]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.88, 0.0, 33.77, 0.0, 31.63, 0.0, 0.0, 0.0, 29.7, 34.89, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 15.74], ["livestock, farm animals, working animals", 8.35], ["moo", 7.97]], null, [["speech", 22.94], ["music", 22.75], ["sidetone", 9.32]], null, [["music", 36.16], ["thunk", 32.91], ["speech", 6.61]], null, null, null, [["music", 68.67], ["speech", 4.14], ["livestock, farm animals, working animals", 3.6]], [["boing", 11.32], ["grunt", 7.57], ["noise", 5.71]], null, null, null, null, null], "duration": [0.33, 0.37, 1.7, 7.74, 0.79, 5.42, 0.91, 3.68, 0.7, 1.38, 0.64, 10.13, 2.36, 1.4, 39.49, 0.37, 0.69, 0.18]} \ No newline at end of file diff --git a/annotations_1/XUdBdsMc5EQ_filtered.json b/annotations_1/XUdBdsMc5EQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc88850d3f03c72378c04a359311aa2f4d0a0c4b --- /dev/null +++ b/annotations_1/XUdBdsMc5EQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.7], [9.0, 9.96], [11.0, 11.35], [16.0, 16.65], [28.0, 28.12], [31.0, 31.77], [33.0, 33.89], [36.0, 36.39], [38.0, 37.62], [38.0, 38.23], [40.0, 41.49], [47.0, 46.95], [51.0, 51.12], [51.0, 51.63], [52.0, 52.51], [53.0, 54.18], [55.0, 55.44], [62.0, 62.36], [71.0, 70.71], [77.0, 77.41], [88.0, 88.06], [88.0, 89.48], [90.0, 91.13], [93.0, 93.53], [117.0, 127.95], [131.0, 131.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.1, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.7, 0.96, 0.35, 0.65, 0.12, 0.77, 0.89, 0.39, -0.38, 0.23, 1.49, -0.05, 0.12, 0.63, 0.51, 1.18, 0.44, 0.36, -0.29, 0.41, 0.06, 1.48, 1.13, 0.53, 10.95, 0.68]} \ No newline at end of file diff --git a/annotations_1/XUyFzVAKCm4_filtered.json b/annotations_1/XUyFzVAKCm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75a92ae3c06071929b4a1cb2505fecbd11c2c5c2 --- /dev/null +++ b/annotations_1/XUyFzVAKCm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 20.63], [23.0, 30.32], [36.0, 43.85], [50.0, 51.11], [53.0, 54.04], [55.0, 55.68], [58.0, 60.64], [62.0, 62.75], [65.0, 65.16], [67.0, 68.25], [73.0, 75.36], [80.0, 80.49], [87.0, 92.72], [94.0, 98.56], [102.0, 103.15], [103.0, 103.42], [104.0, 104.94], [105.0, 110.05], [115.0, 121.81], [126.0, 142.28], [148.0, 158.36]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [38.51, 36.73, 88.64, 0.0, 0.0, 0.0, 63.31, 0.0, 0.0, 0.0, 42.06, 0.0, 33.03, 30.68, 0.0, 0.0, 0.0, 30.63, 30.42, 31.01, 30.62], "audiomae_on_audioset": [[["music", 65.54], ["funny music", 3.97], ["yodeling", 2.19]], [["music", 52.14], ["speech", 12.41], ["synthesizer", 3.06]], null, null, null, null, null, null, null, null, [["didgeridoo", 21.93], ["frog", 17.29], ["music", 11.78]], null, [["music", 40.8], ["didgeridoo", 14.65], ["speech", 11.74]], [["music", 81.7], ["musical instrument", 3.27], ["sampler", 1.6]], null, null, null, [["music", 72.48], ["sampler", 3.11], ["rock and roll", 1.95]], [["music", 79.03], ["electronic music", 4.68], ["sampler", 1.39]], [["music", 88.34], ["reggae", 1.13], ["electronic music", 0.98]], [["music", 69.77], ["crowd", 3.93], ["applause", 2.93]]], "duration": [7.63, 7.32, 7.85, 1.11, 1.04, 0.68, 2.64, 0.75, 0.16, 1.25, 2.36, 0.49, 5.72, 4.56, 1.15, 0.42, 0.94, 5.05, 6.81, 16.28, 10.36]} \ No newline at end of file diff --git a/annotations_1/XWAuh7S1zjk_filtered.json b/annotations_1/XWAuh7S1zjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3b4ef302e03a6405c88d945d0ecaabfdb1c0c99 --- /dev/null +++ b/annotations_1/XWAuh7S1zjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.45], [5.0, 6.81], [8.0, 10.13], [11.0, 12.28], [14.0, 15.89], [16.0, 17.63], [19.0, 23.57], [26.0, 26.69], [30.0, 31.97], [37.0, 38.69], [39.0, 41.49], [45.0, 49.42], [50.0, 51.63], [52.0, 54.67], [59.0, 61.11], [61.0, 63.1], [64.0, 66.21], [69.0, 70.07], [71.0, 71.69], [72.0, 83.47], [88.0, 94.85], [97.0, 98.71], [101.0, 100.84], [104.0, 104.57], [106.0, 108.3], [109.0, 112.11]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 49.97, 0.0, 0.0, 0.0, 61.37, 0.0, 0.0, 0.0, 61.77, 56.7, 0.0, 81.0, 52.98, 52.98, 60.42, 0.0, 0.0, 31.14, 43.51, 0.0, 0.0, 0.0, 72.75, 40.11], "audiomae_on_audioset": [null, null, [["music", 36.15], ["didgeridoo", 11.62], ["noise", 4.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 50.46], ["music", 26.34], ["breaking", 5.27]], [["mains hum", 29.13], ["hum", 19.57], ["fly, housefly", 15.16]], null, null, null, null, [["music", 19.18], ["speech", 17.33], ["hum", 4.48]]], "duration": [1.45, 1.81, 2.13, 1.28, 1.89, 1.63, 4.57, 0.69, 1.97, 1.69, 2.49, 4.42, 1.63, 2.67, 2.11, 2.1, 2.21, 1.07, 0.69, 11.47, 6.85, 1.71, -0.16, 0.57, 2.3, 3.11]} \ No newline at end of file diff --git a/annotations_1/XWgSKXw8ZwI_filtered.json b/annotations_1/XWgSKXw8ZwI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96308f7dbb96dfbe481bd9dd6d0e629290fab240 --- /dev/null +++ b/annotations_1/XWgSKXw8ZwI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.84], [24.0, 25.81], [28.0, 40.69], [41.0, 41.05], [41.0, 52.78], [53.0, 58.53], [62.0, 100.87], [102.0, 139.77]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.15, 0.0, 32.14, 33.13, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 40.82], ["explosion", 16.62], ["eruption", 8.72]], null, [["music", 41.65], ["hum", 28.24], ["mains hum", 11.73]], [["speech", 29.01], ["hum", 25.63], ["music", 19.11]], null, null], "duration": [0.84, 1.81, 12.69, 0.05, 11.78, 5.53, 38.87, 37.77]} \ No newline at end of file diff --git a/annotations_1/XYc1XujRb1w_filtered.json b/annotations_1/XYc1XujRb1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5954042d817bb49cf99746fb1796f50ccd7b8d96 --- /dev/null +++ b/annotations_1/XYc1XujRb1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.83], [3.0, 4.35], [5.0, 6.24], [20.0, 20.31], [21.0, 20.71], [43.0, 43.17], [57.0, 58.24], [68.0, 69.25], [81.0, 80.69], [86.0, 87.69], [95.0, 95.77], [97.0, 98.61], [100.0, 101.95], [104.0, 105.07], [107.0, 108.75], [110.0, 117.75], [118.0, 119.37], [120.0, 121.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 1.35, 1.24, 0.31, -0.29, 0.17, 1.24, 1.25, -0.31, 1.69, 0.77, 1.61, 1.95, 1.07, 1.75, 7.75, 1.37, 1.44]} \ No newline at end of file diff --git a/annotations_1/X_4WgfjyOyg_filtered.json b/annotations_1/X_4WgfjyOyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13c092e9a93a7442e5962c8fc66a9ca30dfae414 --- /dev/null +++ b/annotations_1/X_4WgfjyOyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 34.86], [36.0, 66.77], [69.0, 71.51], [74.0, 85.21], [90.0, 115.53], [116.0, 119.94], [124.0, 123.99], [125.0, 127.11], [128.0, 133.22], [134.0, 134.54], [138.0, 169.18]], "keep_status": [true, false, false, false, false, false, false, true, true, false, false], "silence_prob": [29.24, 0.0, 60.51, 34.43, 28.94, 59.51, 0.0, 43.56, 36.9, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.46], ["breaking", 15.15], ["sound effect", 4.01]], null, null, [["speech", 63.04], ["music", 7.2], ["hum", 7.1]], [["music", 80.14], ["bell", 2.18], ["musical instrument", 1.61]], null, null, [["music", 41.23], ["whale vocalization", 9.11], ["hum", 6.96]], [["music", 54.27], ["hum", 6.41], ["speech", 5.61]], null, null], "duration": [14.86, 30.77, 2.51, 11.21, 25.53, 3.94, -0.01, 2.11, 5.22, 0.54, 31.18]} \ No newline at end of file diff --git a/annotations_1/Xa0JBPt2cGU_filtered.json b/annotations_1/Xa0JBPt2cGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1314503d7aa236b5e0b4219fed0726fca5e378fd --- /dev/null +++ b/annotations_1/Xa0JBPt2cGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.42], [23.0, 24.51], [30.0, 30.67], [44.0, 44.86], [47.0, 47.01], [49.0, 49.0], [68.0, 68.52], [74.0, 74.75], [81.0, 81.4], [82.0, 84.21], [104.0, 104.5]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.28, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 39.41], ["speech", 8.24], ["livestock, farm animals, working animals", 5.14]], null], "duration": [1.42, 1.51, 0.67, 0.86, 0.01, 0.0, 0.52, 0.75, 0.4, 2.21, 0.5]} \ No newline at end of file diff --git a/annotations_1/XaI13YBdi_M_filtered.json b/annotations_1/XaI13YBdi_M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8eb34281d994e23992d23aec6d17d1eeacce10cd --- /dev/null +++ b/annotations_1/XaI13YBdi_M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.45], [7.0, 10.17], [11.0, 27.87], [29.0, 34.55], [36.0, 36.63], [39.0, 43.66], [45.0, 94.86], [98.0, 145.89]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [69.74, 62.37, 60.05, 48.56, 0.0, 43.53, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 48.16], ["electronic music", 6.27], ["singing bowl", 6.23]], null, [["music", 60.07], ["didgeridoo", 12.14], ["synthesizer", 3.14]], null, null], "duration": [2.45, 3.17, 16.87, 5.55, 0.63, 4.66, 49.86, 47.89]} \ No newline at end of file diff --git a/annotations_1/Xaj3Ohn7YrE_filtered.json b/annotations_1/Xaj3Ohn7YrE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aafbb8741ef372adc76c8d7f522ade72be2ed12a --- /dev/null +++ b/annotations_1/Xaj3Ohn7YrE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 26.55], [31.0, 36.09], [42.0, 42.28], [44.0, 45.17], [47.0, 47.29], [48.0, 54.35], [55.0, 55.21], [58.0, 58.06], [61.0, 61.18], [62.0, 62.51], [64.0, 65.1], [66.0, 85.95], [86.0, 114.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [72.9, 96.54, 0.0, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 89.9, 71.14], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.55, 5.09, 0.28, 1.17, 0.29, 6.35, 0.21, 0.06, 0.18, 0.51, 1.1, 19.95, 28.22]} \ No newline at end of file diff --git a/annotations_1/XarGS1AeEcE_filtered.json b/annotations_1/XarGS1AeEcE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..061f299f8bd830468f88d6a0ac787cc3bb5b7af5 --- /dev/null +++ b/annotations_1/XarGS1AeEcE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 42.2], [47.0, 52.22], [52.0, 52.25], [52.0, 131.33]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 64.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [38.2, 5.22, 0.25, 79.33]} \ No newline at end of file diff --git a/annotations_1/Xc3bqi1G5xk_filtered.json b/annotations_1/Xc3bqi1G5xk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37acbbe95fbe6a0503c276e461a41afd02f61614 --- /dev/null +++ b/annotations_1/Xc3bqi1G5xk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.87], [20.0, 20.85], [33.0, 32.8], [40.0, 42.72], [44.0, 44.25], [48.0, 54.11], [56.0, 57.05], [61.0, 61.7], [65.0, 65.75], [67.0, 67.41], [90.0, 92.35], [99.0, 106.07], [108.0, 109.44], [111.0, 111.77], [114.0, 115.37], [117.0, 120.16], [121.0, 120.99], [127.0, 127.4], [130.0, 132.46], [136.0, 137.0], [149.0, 149.23], [154.0, 155.68], [159.0, 159.7], [163.0, 164.22], [169.0, 169.87], [176.0, 176.05], [180.0, 179.88], [181.0, 182.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 79.94, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 39.28, 99.65, 0.0, 0.0, 0.0, 47.82, 0.0, 0.0, 43.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 91.68], ["boing", 2.47], ["inside, small room", 0.72]], null, null, null, null, [["speech", 59.41], ["sidetone", 28.51], ["dial tone", 3.33]], null, null, [["music", 53.1], ["telephone", 10.62], ["telephone dialing, dtmf", 4.44]], null, null, null, null, null, null, null, null, null], "duration": [1.87, 0.85, -0.2, 2.72, 0.25, 6.11, 1.05, 0.7, 0.75, 0.41, 2.35, 7.07, 1.44, 0.77, 1.37, 3.16, -0.01, 0.4, 2.46, 1.0, 0.23, 1.68, 0.7, 1.22, 0.87, 0.05, -0.12, 1.06]} \ No newline at end of file diff --git a/annotations_1/XcDzb6AeAI0_filtered.json b/annotations_1/XcDzb6AeAI0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f0cd61fdcfefecdbdb8aa50ef8548673c423601 --- /dev/null +++ b/annotations_1/XcDzb6AeAI0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.48], [8.0, 10.61], [13.0, 13.53], [16.0, 18.79], [19.0, 27.06], [29.0, 29.71], [35.0, 35.34], [37.0, 37.4], [39.0, 78.17], [79.0, 79.68], [81.0, 81.68], [84.0, 86.0], [87.0, 87.34], [92.0, 94.83], [98.0, 98.39], [103.0, 103.81], [105.0, 105.73], [109.0, 115.08], [118.0, 118.98], [121.0, 124.6], [126.0, 126.87], [129.0, 128.97], [135.0, 138.43], [141.0, 142.5], [146.0, 148.68], [149.0, 148.8], [154.0, 155.6], [158.0, 169.1], [170.0, 170.46], [171.0, 173.87], [176.0, 177.25], [178.0, 184.57]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 35.84, 0.0, 32.94, 30.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.72, 0.0, 77.03, 0.0, 0.0, 0.0, 61.27, 0.0, 99.93, 0.0, 0.0, 90.6, 0.0, 36.68, 0.0, 0.0, 49.59, 0.0, 87.92, 0.0, 32.93], "audiomae_on_audioset": [null, [["fly, housefly", 16.78], ["insect", 16.57], ["busy signal", 14.91]], null, [["speech", 25.04], ["snicker", 9.79], ["chuckle, chortle", 7.12]], [["speech", 67.79], ["music", 12.66], ["thunk", 6.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.22], ["music", 29.68], ["theremin", 6.78]], null, null, [["speech", 46.25], ["frog", 14.39], ["animal", 4.11]], null, null, null, [["fart", 63.91], ["mosquito", 7.64], ["whale vocalization", 5.74]]], "duration": [0.48, 2.61, 0.53, 2.79, 8.06, 0.71, 0.34, 0.4, 39.17, 0.68, 0.68, 2.0, 0.34, 2.83, 0.39, 0.81, 0.73, 6.08, 0.98, 3.6, 0.87, -0.03, 3.43, 1.5, 2.68, -0.2, 1.6, 11.1, 0.46, 2.87, 1.25, 6.57]} \ No newline at end of file diff --git a/annotations_1/XcgNkFuPBV8_filtered.json b/annotations_1/XcgNkFuPBV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2417286b14cd54b0ea66041bed7c7a73aed3886 --- /dev/null +++ b/annotations_1/XcgNkFuPBV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 29.89], [30.0, 32.44], [34.0, 33.86], [38.0, 54.51], [55.0, 55.53], [59.0, 64.59], [67.0, 69.18], [81.0, 99.76], [105.0, 106.03], [118.0, 118.25], [124.0, 150.58], [151.0, 150.79], [151.0, 150.94], [151.0, 151.16], [151.0, 151.43], [152.0, 151.95], [152.0, 152.15], [153.0, 156.14]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 95.64, 0.0, 35.62, 0.0, 31.98, 30.94, 31.0, 0.0, 0.0, 31.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.36], "audiomae_on_audioset": [null, null, null, [["music", 54.52], ["speech", 21.83], ["didgeridoo", 9.91]], null, [["speech", 51.08], ["music", 33.47], ["cacophony", 0.97]], [["moo", 30.61], ["cattle, bovinae", 24.9], ["livestock, farm animals, working animals", 19.18]], [["music", 31.7], ["speech", 30.79], ["vehicle", 2.79]], null, null, [["speech", 53.49], ["music", 22.68], ["hum", 2.26]], null, null, null, null, null, null, [["music", 50.51], ["whale vocalization", 9.89], ["hum", 5.6]]], "duration": [1.89, 2.44, -0.14, 16.51, 0.53, 5.59, 2.18, 18.76, 1.03, 0.25, 26.58, -0.21, -0.06, 0.16, 0.43, -0.05, 0.15, 3.14]} \ No newline at end of file diff --git a/annotations_1/Xd5ESRqpz3E_filtered.json b/annotations_1/Xd5ESRqpz3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a3faa7cb5ff530cb97f2373bb7f973833e9dc7f --- /dev/null +++ b/annotations_1/Xd5ESRqpz3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 15.55], [17.0, 45.15], [49.0, 49.76], [56.0, 59.75], [61.0, 76.65], [81.0, 86.36], [96.0, 101.01], [104.0, 107.22], [109.0, 111.11], [114.0, 121.0], [123.0, 123.21], [124.0, 155.51], [156.0, 159.33], [164.0, 165.54]], "keep_status": [true, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [28.96, 28.61, 0.0, 28.94, 29.53, 28.86, 29.01, 28.57, 29.24, 28.89, 0.0, 0.0, 29.37, 0.0], "audiomae_on_audioset": [[["speech", 41.31], ["music", 10.47], ["rumble", 6.48]], [["music", 77.08], ["theremin", 2.66], ["buzz", 2.3]], null, [["livestock, farm animals, working animals", 51.09], ["cattle, bovinae", 30.11], ["moo", 18.77]], [["music", 45.93], ["wild animals", 7.96], ["didgeridoo", 7.89]], [["music", 31.54], ["hum", 31.42], ["mains hum", 22.47]], [["hum", 45.31], ["mains hum", 15.35], ["throbbing", 12.06]], [["mains hum", 25.76], ["music", 19.07], ["hum", 18.49]], [["music", 50.18], ["throbbing", 13.09], ["hum", 7.86]], [["music", 46.21], ["throbbing", 36.65], ["hum", 4.83]], null, null, [["music", 74.85], ["electronic music", 4.9], ["dubstep", 1.77]], null], "duration": [11.55, 28.15, 0.76, 3.75, 15.65, 5.36, 5.01, 3.22, 2.11, 7.0, 0.21, 31.51, 3.33, 1.54]} \ No newline at end of file diff --git a/annotations_1/XdtbL0dP0X0_filtered.json b/annotations_1/XdtbL0dP0X0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18f8e322bc0dc2feded1062734a186a88faf33d6 --- /dev/null +++ b/annotations_1/XdtbL0dP0X0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.9], [19.0, 20.71], [21.0, 21.46], [22.0, 23.16], [24.0, 25.57], [30.0, 30.27], [32.0, 32.39], [38.0, 38.28], [41.0, 41.57], [48.0, 48.71], [65.0, 69.87], [71.0, 71.86], [75.0, 76.49], [78.0, 88.67], [89.0, 90.49], [94.0, 94.53], [96.0, 96.7], [107.0, 108.57], [111.0, 120.24], [133.0, 133.69], [134.0, 134.64], [137.0, 138.13], [142.0, 142.38], [143.0, 143.01], [144.0, 145.54], [148.0, 149.82], [154.0, 153.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.02, 0.0, 0.0, 40.38, 0.0, 0.0, 0.0, 0.0, 66.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 66.36], ["electric shaver, electric razor", 7.76], ["mains hum", 4.29]], null, null, [["music", 37.53], ["throbbing", 14.88], ["speech", 12.47]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.9, 1.71, 0.46, 1.16, 1.57, 0.27, 0.39, 0.28, 0.57, 0.71, 4.87, 0.86, 1.49, 10.67, 1.49, 0.53, 0.7, 1.57, 9.24, 0.69, 0.64, 1.13, 0.38, 0.01, 1.54, 1.82, -0.18]} \ No newline at end of file diff --git a/annotations_1/Xdzv5V4MVus_filtered.json b/annotations_1/Xdzv5V4MVus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cfe18c8b41218aa32eb96995f4f2c90c8edc83b --- /dev/null +++ b/annotations_1/Xdzv5V4MVus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 26.69], [28.0, 28.59], [31.0, 59.41], [62.0, 63.75], [66.0, 66.82], [68.0, 69.26], [73.0, 90.98], [92.0, 107.94], [112.0, 112.82], [116.0, 123.52], [126.0, 139.87], [145.0, 154.09], [158.0, 164.62], [168.0, 177.04], [177.0, 177.8], [182.0, 183.66], [184.0, 184.44], [185.0, 185.36]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [28.33, 0.0, 28.47, 0.0, 0.0, 0.0, 28.58, 28.34, 0.0, 28.47, 28.37, 28.86, 28.81, 28.46, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.1], ["smash, crash", 16.55], ["whack, thwack", 10.08]], null, [["music", 37.86], ["speech", 32.54], ["whack, thwack", 2.91]], null, null, null, [["music", 51.64], ["speech", 18.3], ["vehicle", 4.69]], [["music", 62.39], ["mains hum", 9.89], ["hum", 7.14]], null, [["music", 57.74], ["speech", 12.15], ["smash, crash", 6.78]], [["throbbing", 33.47], ["music", 32.85], ["hum", 8.95]], [["music", 39.61], ["speech", 28.41], ["whack, thwack", 7.07]], [["speech", 55.29], ["music", 16.3], ["electric shaver, electric razor", 4.08]], [["music", 59.84], ["whack, thwack", 5.85], ["sound effect", 4.14]], null, null, null, null], "duration": [14.69, 0.59, 28.41, 1.75, 0.82, 1.26, 17.98, 15.94, 0.82, 7.52, 13.87, 9.09, 6.62, 9.04, 0.8, 1.66, 0.44, 0.36]} \ No newline at end of file diff --git a/annotations_1/XeGGNf_-nYM_filtered.json b/annotations_1/XeGGNf_-nYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f720394c4a8e55f3d9afa93ffe95ac1fd4c14b8f --- /dev/null +++ b/annotations_1/XeGGNf_-nYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.6], [10.0, 11.15], [13.0, 15.43], [16.0, 17.68], [18.0, 18.2], [28.0, 27.87], [30.0, 31.58], [32.0, 39.66], [44.0, 46.87], [49.0, 50.68], [75.0, 85.08], [97.0, 97.61], [100.0, 101.76], [106.0, 105.88], [110.0, 115.23], [118.0, 119.58], [127.0, 127.38], [137.0, 137.84], [139.0, 139.02], [141.0, 142.75], [151.0, 151.11], [157.0, 157.84]], "keep_status": [false, false, true, false, false, false, false, true, false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.77, 0.0, 0.0, 0.0, 0.0, 32.29, 30.48, 0.0, 29.01, 0.0, 0.0, 0.0, 29.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 27.35], ["wind instrument, woodwind instrument", 9.83], ["trombone", 8.26]], null, null, null, null, [["music", 35.17], ["brass instrument", 10.15], ["trombone", 9.86]], [["whack, thwack", 74.96], ["music", 3.84], ["whip", 3.77]], null, [["buzz", 26.83], ["music", 20.99], ["rumble", 5.95]], null, null, null, [["groan", 21.89], ["sound effect", 13.34], ["reverberation", 8.26]], null, null, null, null, null, null, null], "duration": [1.6, 1.15, 2.43, 1.68, 0.2, -0.13, 1.58, 7.66, 2.87, 1.68, 10.08, 0.61, 1.76, -0.12, 5.23, 1.58, 0.38, 0.84, 0.02, 1.75, 0.11, 0.84]} \ No newline at end of file diff --git a/annotations_1/XeasXb98akc_filtered.json b/annotations_1/XeasXb98akc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d292b032eb76feffe3ed050be6f18fff141911b --- /dev/null +++ b/annotations_1/XeasXb98akc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.85], [7.0, 7.65], [15.0, 16.09], [17.0, 18.0], [22.0, 22.91], [24.0, 23.58], [26.0, 28.22], [29.0, 36.58], [40.0, 40.66], [42.0, 42.06], [59.0, 59.07], [62.0, 62.36], [64.0, 64.39], [67.0, 68.1], [69.0, 69.42], [72.0, 71.86], [74.0, 74.14], [81.0, 82.09], [84.0, 83.67], [87.0, 87.72], [93.0, 93.01], [101.0, 101.71], [108.0, 108.01], [109.0, 109.26], [110.0, 113.56], [116.0, 116.38], [117.0, 117.27], [117.0, 117.46], [117.0, 131.31], [133.0, 142.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89, 98.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 0.0, 0.0, 34.16, 33.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.24], ["speech", 25.95], ["didgeridoo", 9.57]], [["music", 21.21], ["whack, thwack", 19.61], ["speech", 19.07]]], "duration": [0.85, 0.65, 1.09, 1.0, 0.91, -0.42, 2.22, 7.58, 0.66, 0.06, 0.07, 0.36, 0.39, 1.1, 0.42, -0.14, 0.14, 1.09, -0.33, 0.72, 0.01, 0.71, 0.01, 0.26, 3.56, 0.38, 0.27, 0.46, 14.31, 9.2]} \ No newline at end of file diff --git a/annotations_1/XemAlj9_qKE_filtered.json b/annotations_1/XemAlj9_qKE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c99c91deae6b1c8d261669f228f23d807362e80b --- /dev/null +++ b/annotations_1/XemAlj9_qKE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.52], [7.0, 7.67], [9.0, 11.48], [13.0, 14.08], [15.0, 16.31], [17.0, 17.24], [18.0, 21.15], [27.0, 28.19], [33.0, 34.96], [36.0, 36.68], [37.0, 38.25], [40.0, 56.89], [58.0, 61.59], [68.0, 72.03], [74.0, 83.54], [86.0, 89.48], [90.0, 91.07], [92.0, 94.59], [99.0, 113.85], [117.0, 117.32], [118.0, 118.22], [119.0, 121.81], [123.0, 123.94], [124.0, 125.25], [126.0, 126.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 76.04, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0, 75.72, 63.53, 73.82, 78.38, 86.09, 0.0, 99.78, 40.52, 0.0, 0.0, 45.43, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 16.16], ["tap", 9.49], ["knock", 8.38]], null, null, [["speech", 32.26], ["hum", 12.21], ["mains hum", 10.92]], null, null, null], "duration": [0.52, 0.67, 2.48, 1.08, 1.31, 0.24, 3.15, 1.19, 1.96, 0.68, 1.25, 16.89, 3.59, 4.03, 9.54, 3.48, 1.07, 2.59, 14.85, 0.32, 0.22, 2.81, 0.94, 1.25, 0.76]} \ No newline at end of file diff --git a/annotations_1/XgGyrrzTBz4_filtered.json b/annotations_1/XgGyrrzTBz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..274ed086b321379638d1824a02eed24b03bea577 --- /dev/null +++ b/annotations_1/XgGyrrzTBz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.57], [24.0, 30.4], [33.0, 36.63], [39.0, 39.6], [40.0, 43.56], [44.0, 43.61], [44.0, 44.81], [46.0, 46.04], [59.0, 98.17], [98.0, 98.91], [102.0, 106.59], [107.0, 111.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 31.56, 34.87, 0.0, 41.5, 0.0, 0.0, 0.0, 0.0, 0.0, 44.07, 32.12], "audiomae_on_audioset": [null, [["speech", 82.21], ["music", 4.86], ["hum", 1.78]], [["hum", 48.36], ["throbbing", 19.56], ["music", 10.8]], null, [["hum", 30.88], ["throbbing", 28.63], ["music", 16.74]], null, null, null, null, null, [["speech", 20.82], ["hum", 5.24], ["whimper", 5.02]], [["speech", 36.52], ["explosion", 31.01], ["burst, pop", 9.68]]], "duration": [0.57, 6.4, 3.63, 0.6, 3.56, -0.39, 0.81, 0.04, 39.17, 0.91, 4.59, 4.33]} \ No newline at end of file diff --git a/annotations_1/Xi3P8vUveVQ_filtered.json b/annotations_1/Xi3P8vUveVQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e5db2ce9616c8b632383af4189b217cc884c771 --- /dev/null +++ b/annotations_1/Xi3P8vUveVQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.44], [28.0, 35.21], [39.0, 47.28], [48.0, 62.78], [67.0, 104.08], [104.0, 107.18], [107.0, 111.72], [112.0, 125.42], [125.0, 125.49], [126.0, 137.15], [141.0, 144.42], [145.0, 150.79], [152.0, 154.31], [157.0, 158.19], [161.0, 167.95]], "keep_status": [false, true, false, false, false, true, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 28.6, 32.08, 33.23, 0.0, 39.63, 39.67, 94.95, 0.0, 59.96, 46.26, 52.1, 88.46, 0.0, 37.5], "audiomae_on_audioset": [null, [["whack, thwack", 31.27], ["music", 18.87], ["thump, thud", 9.1]], [["music", 69.55], ["sonar", 7.68], ["electronic music", 6.37]], [["music", 71.26], ["hum", 3.94], ["electronic music", 3.5]], null, [["speech", 38.26], ["boing", 6.5], ["sidetone", 4.12]], [["whale vocalization", 32.76], ["hum", 17.73], ["animal", 10.41]], null, null, null, [["speech", 32.34], ["music", 16.54], ["hum", 14.03]], null, null, null, [["music", 53.37], ["ambient music", 18.66], ["electronic music", 4.42]]], "duration": [0.44, 7.21, 8.28, 14.78, 37.08, 3.18, 4.72, 13.42, 0.49, 11.15, 3.42, 5.79, 2.31, 1.19, 6.95]} \ No newline at end of file diff --git a/annotations_1/XiXa1C9FECU_filtered.json b/annotations_1/XiXa1C9FECU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fd56bcc48f471e2ad80c572eb968b36f853a837 --- /dev/null +++ b/annotations_1/XiXa1C9FECU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.88], [3.0, 3.97], [8.0, 9.02], [18.0, 18.32], [19.0, 20.51], [21.0, 23.5], [48.0, 48.76], [51.0, 51.95], [53.0, 54.19], [58.0, 58.92], [63.0, 63.26], [66.0, 67.37], [70.0, 76.87], [78.0, 79.59], [86.0, 86.85], [89.0, 89.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.12, 0.97, 1.02, 0.32, 1.51, 2.5, 0.76, 0.95, 1.19, 0.92, 0.26, 1.37, 6.87, 1.59, 0.85, 0.95]} \ No newline at end of file diff --git a/annotations_1/Xjp16xSdsp0_filtered.json b/annotations_1/Xjp16xSdsp0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a431d0c694986f6632c5da6affbc368cf31b7af9 --- /dev/null +++ b/annotations_1/Xjp16xSdsp0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.45], [29.0, 29.71], [32.0, 33.29], [35.0, 35.92], [37.0, 58.43], [59.0, 80.03], [81.0, 82.22], [83.0, 83.84], [86.0, 86.21], [87.0, 102.52], [104.0, 130.17]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.92, 39.41, 0.0, 0.0, 0.0, 41.07, 33.52], "audiomae_on_audioset": [null, null, null, null, [["speech", 20.69], ["hum", 13.42], ["livestock, farm animals, working animals", 12.16]], [["music", 64.83], ["hum", 7.38], ["mains hum", 5.93]], null, null, null, [["music", 31.83], ["whale vocalization", 21.52], ["hum", 6.37]], [["music", 68.29], ["ambient music", 10.19], ["scary music", 8.18]]], "duration": [0.45, 0.71, 1.29, 0.92, 21.43, 21.03, 1.22, 0.84, 0.21, 15.52, 26.17]} \ No newline at end of file diff --git a/annotations_1/XkNQZg7yTvw_filtered.json b/annotations_1/XkNQZg7yTvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bad367fb6f3cf90af6cf889b292fe120e86b911 --- /dev/null +++ b/annotations_1/XkNQZg7yTvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.52], [4.0, 4.53], [5.0, 5.32], [10.0, 12.07], [24.0, 24.71], [30.0, 30.75], [32.0, 36.37], [41.0, 40.86], [49.0, 50.06], [52.0, 52.61], [59.0, 60.25], [67.0, 67.02], [81.0, 82.46], [94.0, 94.98], [101.0, 102.03], [115.0, 118.18], [121.0, 125.73], [127.0, 133.54], [139.0, 140.0], [140.0, 140.37], [145.0, 147.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 86.09, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.88, 34.15, 31.18, 0.0, 0.0, 30.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 66.39], ["didgeridoo", 6.69], ["musical instrument", 2.6]], [["music", 49.04], ["didgeridoo", 10.8], ["speech", 6.02]], [["music", 48.87], ["speech", 10.21], ["outside, rural or natural", 7.0]], null, null, [["music", 50.44], ["speech", 19.51], ["boing", 4.04]]], "duration": [1.52, 0.53, 0.32, 2.07, 0.71, 0.75, 4.37, -0.14, 1.06, 0.61, 1.25, 0.02, 1.46, 0.98, 1.03, 3.18, 4.73, 6.54, 1.0, 0.37, 2.65]} \ No newline at end of file diff --git a/annotations_1/XlEkeUg2z8I_filtered.json b/annotations_1/XlEkeUg2z8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4905b66e7c1ffe6292ce186cc7cef57f2ea67246 --- /dev/null +++ b/annotations_1/XlEkeUg2z8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.04], [30.0, 29.94], [30.0, 31.36], [38.0, 38.69], [40.0, 40.53], [43.0, 44.24], [46.0, 46.36], [48.0, 48.36], [55.0, 56.47], [58.0, 58.38], [59.0, 60.2], [61.0, 63.32], [64.0, 65.13], [69.0, 69.67], [79.0, 79.49], [86.0, 86.14], [91.0, 92.6], [95.0, 101.65], [105.0, 106.0], [107.0, 112.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 55.04], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, -0.06, 1.36, 0.69, 0.53, 1.24, 0.36, 0.36, 1.47, 0.38, 1.2, 2.32, 1.13, 0.67, 0.49, 0.14, 1.6, 6.65, 1.0, 5.38]} \ No newline at end of file diff --git a/annotations_1/XlJpElakwP4_filtered.json b/annotations_1/XlJpElakwP4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82f543989c459f94bbf394f678d65d0537e3b095 --- /dev/null +++ b/annotations_1/XlJpElakwP4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.49], [12.0, 79.24], [80.0, 87.39], [94.0, 96.96], [102.0, 110.1], [111.0, 113.26], [115.0, 134.01], [136.0, 141.27], [143.0, 145.56]], "keep_status": [false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 29.96, 32.23, 33.24, 33.42, 28.98, 29.99, 29.88], "audiomae_on_audioset": [null, null, [["music", 52.72], ["cattle, bovinae", 4.8], ["moo", 4.76]], [["cattle, bovinae", 45.32], ["moo", 35.34], ["livestock, farm animals, working animals", 14.9]], [["music", 53.54], ["sidetone", 11.36], ["didgeridoo", 6.35]], [["music", 20.2], ["sidetone", 19.0], ["speech", 15.91]], [["music", 72.31], ["didgeridoo", 4.5], ["electronic music", 2.79]], [["music", 63.68], ["speech", 8.29], ["carnatic music", 3.19]], [["music", 79.74], ["speech", 4.53], ["singing", 1.26]]], "duration": [0.49, 67.24, 7.39, 2.96, 8.1, 2.26, 19.01, 5.27, 2.56]} \ No newline at end of file diff --git a/annotations_1/XlOaSZy_S50_filtered.json b/annotations_1/XlOaSZy_S50_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5475b01d41c9ccd1e2887525ddd11632fe8f291b --- /dev/null +++ b/annotations_1/XlOaSZy_S50_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.14], [18.0, 26.03], [29.0, 29.1], [30.0, 31.18], [32.0, 33.02], [35.0, 36.04], [37.0, 37.35], [40.0, 41.05], [42.0, 42.28], [48.0, 48.37], [50.0, 51.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 77.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.14, 8.03, 0.1, 1.18, 1.02, 1.04, 0.35, 1.05, 0.28, 0.37, 1.21]} \ No newline at end of file diff --git a/annotations_1/XnfiKz-Zk7Y_filtered.json b/annotations_1/XnfiKz-Zk7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc50ac54e875a1eacea42c5aad9fadb9f61a5902 --- /dev/null +++ b/annotations_1/XnfiKz-Zk7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.89], [17.0, 17.69], [18.0, 18.57], [20.0, 20.31], [23.0, 24.02], [25.0, 25.44], [27.0, 28.78], [33.0, 33.35], [34.0, 44.0], [62.0, 64.02], [65.0, 67.32], [74.0, 74.39], [77.0, 77.65], [79.0, 79.81], [81.0, 81.53], [87.0, 87.2], [88.0, 88.08], [92.0, 95.61], [100.0, 102.81], [103.0, 105.53], [107.0, 109.76], [110.0, 111.11], [112.0, 113.07], [126.0, 127.48], [128.0, 129.71], [131.0, 146.79], [150.0, 153.66], [154.0, 156.42], [166.0, 166.01], [167.0, 168.74], [170.0, 170.4], [190.0, 190.29], [193.0, 193.08], [199.0, 199.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.06, 81.53, 89.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.8, 54.83, 45.33, 48.61, 0.0, 0.0, 0.0, 0.0, 41.78, 83.88, 44.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 39.03], ["speech", 21.91], ["knock", 13.03]], null, [["speech", 52.91], ["coin (dropping)", 7.6], ["noise", 7.3]], [["music", 53.93], ["synthesizer", 6.64], ["musical instrument", 3.6]], null, null, null, null, [["music", 61.63], ["synthesizer", 5.95], ["ambient music", 5.62]], null, [["music", 35.85], ["guitar", 11.49], ["effects unit", 8.92]], null, null, null, null, null, null], "duration": [-0.11, 0.69, 0.57, 0.31, 1.02, 0.44, 1.78, 0.35, 10.0, 2.02, 2.32, 0.39, 0.65, 0.81, 0.53, 0.2, 0.08, 3.61, 2.81, 2.53, 2.76, 1.11, 1.07, 1.48, 1.71, 15.79, 3.66, 2.42, 0.01, 1.74, 0.4, 0.29, 0.08, 0.61]} \ No newline at end of file diff --git a/annotations_1/Xq4HZGi38qo_filtered.json b/annotations_1/Xq4HZGi38qo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1ef5760214ccbabf878d23db7a57bc96ba7cb82 --- /dev/null +++ b/annotations_1/Xq4HZGi38qo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.97], [13.0, 13.64], [14.0, 15.16], [28.0, 29.39], [33.0, 34.06], [41.0, 41.39], [66.0, 66.23], [70.0, 71.27], [76.0, 79.89], [82.0, 82.93], [89.0, 92.1], [93.0, 99.39], [101.0, 101.31], [104.0, 104.3], [105.0, 105.17], [106.0, 109.71], [113.0, 121.02], [123.0, 124.5], [126.0, 131.04], [135.0, 136.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.86, 0.0, 52.39, 46.9, 0.0, 0.0, 0.0, 80.64, 33.3, 0.0, 32.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 21.52], ["music", 14.9], ["throbbing", 13.86]], null, null, null, null, [["speech", 29.86], ["music", 25.35], ["hum", 12.3]], null, [["throbbing", 35.24], ["music", 32.05], ["hum", 16.36]], null], "duration": [-0.03, 0.64, 1.16, 1.39, 1.06, 0.39, 0.23, 1.27, 3.89, 0.93, 3.1, 6.39, 0.31, 0.3, 0.17, 3.71, 8.02, 1.5, 5.04, 1.95]} \ No newline at end of file diff --git a/annotations_1/Xq5eXYCKUF8_filtered.json b/annotations_1/Xq5eXYCKUF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f898c59430870dcdc57bd02843e5fae75801380 --- /dev/null +++ b/annotations_1/Xq5eXYCKUF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 13.47], [21.0, 25.14], [27.0, 34.86], [35.0, 34.91], [36.0, 36.85], [37.0, 39.61], [41.0, 70.29], [71.0, 75.57], [76.0, 77.16], [78.0, 82.86], [86.0, 92.79], [94.0, 94.59], [96.0, 98.66], [102.0, 102.27], [104.0, 105.21], [106.0, 107.37], [109.0, 110.88], [117.0, 122.76], [124.0, 127.82], [129.0, 131.38], [135.0, 135.19], [137.0, 139.13], [140.0, 141.45], [143.0, 143.11], [144.0, 154.03]], "keep_status": [true, true, true, false, false, true, true, true, false, false, true, false, true, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [49.31, 43.48, 38.28, 0.0, 0.0, 38.58, 31.44, 31.26, 0.0, 31.79, 42.86, 0.0, 30.72, 0.0, 0.0, 0.0, 0.0, 31.18, 46.05, 46.05, 0.0, 46.26, 0.0, 0.0, 29.39], "audiomae_on_audioset": [[["speech", 38.37], ["fart", 9.34], ["crunch", 6.11]], [["music", 27.4], ["singing bowl", 10.56], ["hum", 8.32]], [["speech", 25.39], ["whale vocalization", 11.86], ["hum", 11.65]], null, null, [["music", 14.94], ["livestock, farm animals, working animals", 7.62], ["cattle, bovinae", 7.06]], [["singing bowl", 39.68], ["music", 16.19], ["hum", 7.88]], [["music", 19.58], ["hum", 17.38], ["throbbing", 17.33]], null, [["music", 53.36], ["throbbing", 10.58], ["sidetone", 9.95]], [["thunk", 58.54], ["music", 5.77], ["whack, thwack", 4.29]], null, [["fart", 61.46], ["speech", 4.62], ["dog", 3.84]], null, null, null, null, [["thunk", 31.44], ["music", 29.27], ["whack, thwack", 12.68]], [["mains hum", 34.93], ["hum", 28.06], ["music", 8.09]], [["speech", 31.76], ["hum", 17.41], ["singing bowl", 12.12]], null, [["speech", 50.48], ["gong", 21.25], ["music", 7.53]], null, null, [["speech", 40.94], ["breaking", 11.52], ["whack, thwack", 8.15]]], "duration": [10.47, 4.14, 7.86, -0.09, 0.85, 2.61, 29.29, 4.57, 1.16, 4.86, 6.79, 0.59, 2.66, 0.27, 1.21, 1.37, 1.88, 5.76, 3.82, 2.38, 0.19, 2.13, 1.45, 0.11, 10.03]} \ No newline at end of file diff --git a/annotations_1/XqqckmSFUwo_filtered.json b/annotations_1/XqqckmSFUwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be8eea34cef3ef5341071c7a8d7e2031884981e8 --- /dev/null +++ b/annotations_1/XqqckmSFUwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 45.15], [51.0, 63.66], [64.0, 64.88], [66.0, 70.65], [71.0, 101.49], [102.0, 117.93], [119.0, 119.45], [120.0, 121.83]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 61.67, 0.0, 71.72, 0.0, 41.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 61.16], ["synthesizer", 6.98], ["keyboard (musical)", 5.88]], null, null], "duration": [1.15, 12.66, 0.88, 4.65, 30.49, 15.93, 0.45, 1.83]} \ No newline at end of file diff --git a/annotations_1/XqwQlCAM3P0_filtered.json b/annotations_1/XqwQlCAM3P0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..874065a25d72edae11e02a9325cb023a4e6a39ec --- /dev/null +++ b/annotations_1/XqwQlCAM3P0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.01], [11.0, 17.76], [21.0, 22.67], [24.0, 24.43], [25.0, 26.43], [28.0, 28.59], [29.0, 29.0], [30.0, 31.63], [33.0, 46.25], [48.0, 48.41], [50.0, 51.09], [56.0, 57.6], [58.0, 61.28], [67.0, 68.47], [70.0, 73.45], [76.0, 76.81], [93.0, 95.15], [97.0, 98.19], [99.0, 99.64], [100.0, 102.1], [104.0, 106.41], [107.0, 110.73]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [87.55, 68.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.21, 0.0, 0.0, 0.0, 48.31, 0.0, 86.09, 0.0, 99.8, 0.0, 0.0, 99.87, 90.43, 99.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 40.41], ["hum", 18.64], ["throbbing", 8.87]], null, null, null, [["music", 31.58], ["speech", 26.38], ["moo", 3.36]], null, null, null, null, null, null, null, null, null], "duration": [2.01, 6.76, 1.67, 0.43, 1.43, 0.59, 0.0, 1.63, 13.25, 0.41, 1.09, 1.6, 3.28, 1.47, 3.45, 0.81, 2.15, 1.19, 0.64, 2.1, 2.41, 3.73]} \ No newline at end of file diff --git a/annotations_1/Xr9GABUefT8_filtered.json b/annotations_1/Xr9GABUefT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac309ec34ef806331188fa52adab5a13bac4eab0 --- /dev/null +++ b/annotations_1/Xr9GABUefT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.32], [10.0, 12.09], [14.0, 18.91], [20.0, 20.53], [21.0, 22.37], [27.0, 27.82], [30.0, 30.69], [40.0, 44.81], [50.0, 51.44], [52.0, 51.87], [53.0, 54.68], [58.0, 58.6], [63.0, 64.27], [64.0, 66.85], [71.0, 71.19], [72.0, 81.03], [86.0, 87.39], [89.0, 89.56], [90.0, 95.15], [98.0, 101.97], [105.0, 105.51], [109.0, 112.28], [112.0, 116.02], [117.0, 123.58], [130.0, 130.79], [137.0, 138.11], [143.0, 143.8]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 61.77, 49.18, 0.0, 0.0, 0.0, 0.0, 44.63, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 38.28, 0.0, 0.0, 54.43, 46.12, 0.0, 43.77, 60.05, 74.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 31.84], ["beatboxing", 11.09], ["music", 9.44]], null, null, null, null, [["music", 47.48], ["speech", 7.87], ["fly, housefly", 5.44]], null, null, null, null, null, null, null, [["speech", 37.43], ["music", 33.78], ["whack, thwack", 3.35]], null, null, null, [["music", 52.23], ["speech", 6.11], ["hum", 3.45]], null, [["music", 28.3], ["speech", 18.22], ["hum", 7.48]], null, null, null, null, null], "duration": [0.32, 2.09, 4.91, 0.53, 1.37, 0.82, 0.69, 4.81, 1.44, -0.13, 1.68, 0.6, 1.27, 2.85, 0.19, 9.03, 1.39, 0.56, 5.15, 3.97, 0.51, 3.28, 4.02, 6.58, 0.79, 1.11, 0.8]} \ No newline at end of file diff --git a/annotations_1/XrujkDtd0iY_filtered.json b/annotations_1/XrujkDtd0iY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65a53a6ee0f70315cdaea18d6858724930f880ac --- /dev/null +++ b/annotations_1/XrujkDtd0iY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.53], [12.0, 13.27], [21.0, 21.12], [45.0, 46.58], [48.0, 49.2], [50.0, 51.49], [53.0, 53.64], [57.0, 59.66], [61.0, 65.08], [66.0, 66.6], [71.0, 71.25], [74.0, 75.76], [78.0, 79.0], [85.0, 87.54], [97.0, 98.61], [100.0, 114.98], [115.0, 115.28], [115.0, 115.45]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, false], "silence_prob": [35.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.57, 30.39, 0.0, 0.0, 0.0, 0.0, 30.5, 0.0, 30.95, 0.0, 0.0], "audiomae_on_audioset": [[["music", 56.8], ["speech", 11.3], ["throbbing", 5.44]], null, null, null, null, null, null, [["music", 66.58], ["foghorn", 4.72], ["theremin", 4.14]], [["music", 50.69], ["foghorn", 11.21], ["throbbing", 6.98]], null, null, null, null, [["cattle, bovinae", 24.47], ["moo", 21.26], ["livestock, farm animals, working animals", 13.64]], null, [["music", 46.84], ["speech", 10.39], ["buzz", 4.08]], null, null], "duration": [6.53, 1.27, 0.12, 1.58, 1.2, 1.49, 0.64, 2.66, 4.08, 0.6, 0.25, 1.76, 1.0, 2.54, 1.61, 14.98, 0.28, 0.45]} \ No newline at end of file diff --git a/annotations_1/XssDZqS6WzE_filtered.json b/annotations_1/XssDZqS6WzE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f38e2e1af3c02d3772abb31d87d27b33156d7852 --- /dev/null +++ b/annotations_1/XssDZqS6WzE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.48], [12.0, 14.89], [24.0, 34.97], [35.0, 36.44], [46.0, 56.24], [58.0, 58.5], [62.0, 61.7], [66.0, 68.0], [68.0, 69.3], [70.0, 74.61], [87.0, 91.44], [93.0, 93.63], [94.0, 99.13], [100.0, 100.63], [102.0, 103.35], [106.0, 114.2]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 73.06, 35.12, 0.0, 36.61, 0.0, 0.0, 75.72, 0.0, 91.13, 84.07, 0.0, 83.7, 0.0, 0.0, 75.55], "audiomae_on_audioset": [null, null, [["speech", 30.74], ["cattle, bovinae", 10.9], ["moo", 9.9]], null, [["speech", 72.44], ["boat, water vehicle", 4.0], ["hubbub, speech noise, speech babble", 3.49]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 2.89, 10.97, 1.44, 10.24, 0.5, -0.3, 2.0, 1.3, 4.61, 4.44, 0.63, 5.13, 0.63, 1.35, 8.2]} \ No newline at end of file diff --git a/annotations_1/Xstux7DlrgU_filtered.json b/annotations_1/Xstux7DlrgU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47cc091ef1720d99e224a61d406a9345a5201e41 --- /dev/null +++ b/annotations_1/Xstux7DlrgU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.22], [8.0, 9.98], [13.0, 13.54], [17.0, 18.13], [20.0, 20.26], [25.0, 25.56], [27.0, 27.77], [28.0, 28.68], [31.0, 31.62], [37.0, 37.49], [38.0, 42.16], [43.0, 43.71], [45.0, 45.23], [46.0, 46.63], [50.0, 50.11], [81.0, 82.09], [87.0, 88.79], [95.0, 95.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 57.95], ["musical instrument", 6.89], ["speech", 6.87]], null, null, null, null, null, null, null], "duration": [2.22, 1.98, 0.54, 1.13, 0.26, 0.56, 0.77, 0.68, 0.62, 0.49, 4.16, 0.71, 0.23, 0.63, 0.11, 1.09, 1.79, 0.76]} \ No newline at end of file diff --git a/annotations_1/XtL5tGpGIN8_filtered.json b/annotations_1/XtL5tGpGIN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74150a2d79b9de4d1ca9698db82663dadc8de088 --- /dev/null +++ b/annotations_1/XtL5tGpGIN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.35], [7.0, 13.1], [14.0, 14.08], [15.0, 22.18], [23.0, 23.06], [25.0, 63.85], [64.0, 65.37], [66.0, 145.05], [146.0, 146.64]], "keep_status": [true, false, false, true, false, false, false, false, false], "silence_prob": [46.4, 40.33, 0.0, 44.55, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 26.56], ["hum", 20.92], ["noise", 12.12]], [["speech", 51.64], ["bee, wasp, etc.", 13.13], ["insect", 7.56]], null, [["frog", 30.17], ["speech", 20.97], ["electric shaver, electric razor", 6.55]], null, null, null, null, null], "duration": [3.35, 6.1, 0.08, 7.18, 0.06, 38.85, 1.37, 79.05, 0.64]} \ No newline at end of file diff --git a/annotations_1/XtduKM28ohU_filtered.json b/annotations_1/XtduKM28ohU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..046e26b44466fa7b6d93d16e50a9a77b1d931832 --- /dev/null +++ b/annotations_1/XtduKM28ohU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.25], [6.0, 9.07], [14.0, 15.21], [16.0, 17.95], [22.0, 24.26], [29.0, 33.22], [34.0, 34.25], [34.0, 36.9], [39.0, 40.59], [41.0, 41.76], [47.0, 51.34], [52.0, 55.61], [57.0, 69.74], [73.0, 81.63], [83.0, 84.25], [97.0, 106.1], [111.0, 114.74], [123.0, 126.49], [128.0, 133.39], [136.0, 138.45], [140.0, 142.42], [146.0, 148.42], [151.0, 151.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 68.8, 0.0, 0.0, 72.31, 78.21, 0.0, 71.72, 0.0, 0.0, 71.57, 64.41, 65.91, 69.34, 0.0, 31.18, 71.0, 42.19, 62.17, 53.22, 58.72, 67.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 57.98], ["musical instrument", 5.07], ["effects unit", 2.55]], null, [["music", 42.36], ["plucked string instrument", 5.58], ["hum", 4.57]], null, null, null, null, null], "duration": [0.25, 3.07, 1.21, 1.95, 2.26, 4.22, 0.25, 2.9, 1.59, 0.76, 4.34, 3.61, 12.74, 8.63, 1.25, 9.1, 3.74, 3.49, 5.39, 2.45, 2.42, 2.42, 0.43]} \ No newline at end of file diff --git a/annotations_1/Xu0QBBxHZWs_filtered.json b/annotations_1/Xu0QBBxHZWs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e56fa84cf6643459593d1392587ceb12cd7749db --- /dev/null +++ b/annotations_1/Xu0QBBxHZWs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.67], [13.0, 34.64], [37.0, 49.76], [51.0, 55.78], [56.0, 58.83], [60.0, 60.45], [63.0, 67.91], [68.0, 70.73], [72.0, 73.53], [74.0, 75.0], [76.0, 77.36], [78.0, 79.07], [80.0, 121.98], [133.0, 133.73]], "keep_status": [true, false, false, true, false, false, true, true, false, false, false, false, false, false], "silence_prob": [43.48, 29.62, 33.43, 32.19, 30.95, 0.0, 41.14, 41.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 38.9], ["hum", 14.23], ["throbbing", 7.73]], [["music", 36.33], ["hum", 26.77], ["mains hum", 20.71]], [["hum", 53.79], ["mains hum", 38.26], ["throbbing", 2.21]], [["music", 40.89], ["hum", 10.33], ["speech", 7.24]], [["hum", 39.25], ["mains hum", 27.67], ["music", 12.27]], null, [["burping, eructation", 24.55], ["music", 10.64], ["hiccup", 9.82]], [["noise", 29.1], ["music", 15.07], ["fly, housefly", 6.93]], null, null, null, null, null, null], "duration": [2.67, 21.64, 12.76, 4.78, 2.83, 0.45, 4.91, 2.73, 1.53, 1.0, 1.36, 1.07, 41.98, 0.73]} \ No newline at end of file diff --git a/annotations_1/XuNDB-xL6uc_filtered.json b/annotations_1/XuNDB-xL6uc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5972631c0b2fad44ed8c7e7c1d821eda1985c72f --- /dev/null +++ b/annotations_1/XuNDB-xL6uc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 35.75], [39.0, 39.73], [46.0, 46.13], [52.0, 52.34], [54.0, 54.97], [57.0, 57.32], [63.0, 63.53], [68.0, 67.9], [69.0, 69.75], [73.0, 73.74], [77.0, 76.87], [85.0, 87.74], [89.0, 89.29], [93.0, 93.7], [95.0, 95.37], [97.0, 97.26], [98.0, 98.81], [99.0, 99.86], [101.0, 101.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [20.75, 0.73, 0.13, 0.34, 0.97, 0.32, 0.53, -0.1, 0.75, 0.74, -0.13, 2.74, 0.29, 0.7, 0.37, 0.26, 0.81, 0.86, 0.34]} \ No newline at end of file diff --git a/annotations_1/Xurw2Ar9NNk_filtered.json b/annotations_1/Xurw2Ar9NNk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25ec8d04e88173080b294289af2a60e00dbd9572 --- /dev/null +++ b/annotations_1/Xurw2Ar9NNk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.38], [5.0, 6.18], [8.0, 8.63], [10.0, 10.25], [11.0, 16.55], [19.0, 21.93], [26.0, 26.45], [28.0, 29.25], [30.0, 31.73], [33.0, 33.76], [37.0, 38.28], [40.0, 40.88], [44.0, 45.84], [47.0, 47.87], [49.0, 49.72], [55.0, 55.76], [57.0, 57.18], [59.0, 61.3], [62.0, 62.34], [68.0, 70.77], [73.0, 73.14], [76.0, 76.44], [80.0, 80.64], [84.0, 84.0], [90.0, 92.89], [94.0, 95.67], [98.0, 98.85], [103.0, 105.93], [108.0, 109.36], [112.0, 113.07], [115.0, 115.96]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 71.72, 49.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 45.82, 0.0, 0.0, 57.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 27.65], ["hum", 19.73], ["mains hum", 10.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 21.09], ["moo", 17.88], ["music", 16.9]], null, null, null, null, null, null], "duration": [0.38, 1.18, 0.63, 0.25, 5.55, 2.93, 0.45, 1.25, 1.73, 0.76, 1.28, 0.88, 1.84, 0.87, 0.72, 0.76, 0.18, 2.3, 0.34, 2.77, 0.14, 0.44, 0.64, 0.0, 2.89, 1.67, 0.85, 2.93, 1.36, 1.07, 0.96]} \ No newline at end of file diff --git a/annotations_1/Xv9ME0TfQjk_filtered.json b/annotations_1/Xv9ME0TfQjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d28b636859bca39ac43273725cada991e1240cd --- /dev/null +++ b/annotations_1/Xv9ME0TfQjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.68], [11.0, 31.95], [33.0, 32.95], [33.0, 92.82], [95.0, 95.32], [98.0, 102.14], [103.0, 109.95]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [29.98, 30.38, 0.0, 0.0, 0.0, 29.6, 29.5], "audiomae_on_audioset": [[["music", 34.92], ["cacophony", 30.95], ["hum", 5.17]], [["music", 31.72], ["hum", 27.67], ["throbbing", 12.17]], null, null, null, [["music", 53.21], ["speech", 5.81], ["pulse", 5.58]], [["hum", 34.72], ["throbbing", 27.8], ["mains hum", 18.98]]], "duration": [6.68, 20.95, -0.05, 59.82, 0.32, 4.14, 6.95]} \ No newline at end of file diff --git a/annotations_1/XvOKgNVwLes_filtered.json b/annotations_1/XvOKgNVwLes_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77f7c9f443af02bfed0263a488d4365ba9e898df --- /dev/null +++ b/annotations_1/XvOKgNVwLes_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.62], [8.0, 11.1], [16.0, 16.87], [20.0, 20.01], [21.0, 25.1], [29.0, 30.57], [35.0, 35.63], [40.0, 41.35], [45.0, 46.06], [70.0, 71.07], [72.0, 75.03], [76.0, 77.04], [82.0, 83.27], [109.0, 110.2], [124.0, 125.79], [127.0, 127.62], [131.0, 136.22], [142.0, 143.02], [144.0, 146.87], [160.0, 163.85]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [46.5, 55.81, 0.0, 0.0, 48.52, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 0.0, 0.0, 0.0, 0.0, 64.41, 0.0, 82.43, 39.11], "audiomae_on_audioset": [[["music", 39.38], ["speech", 24.77], ["musical instrument", 3.75]], null, null, null, [["music", 34.35], ["didgeridoo", 16.36], ["hum", 8.03]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 22.65], ["moo", 20.2], ["cattle, bovinae", 11.71]]], "duration": [2.62, 3.1, 0.87, 0.01, 4.1, 1.57, 0.63, 1.35, 1.06, 1.07, 3.03, 1.04, 1.27, 1.2, 1.79, 0.62, 5.22, 1.02, 2.87, 3.85]} \ No newline at end of file diff --git a/annotations_1/XvnWjkHgWEw_filtered.json b/annotations_1/XvnWjkHgWEw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..beb96c0658eff72162777085e75e46630aba5632 --- /dev/null +++ b/annotations_1/XvnWjkHgWEw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.26], [15.0, 23.6], [25.0, 25.89], [32.0, 32.21], [34.0, 35.23], [37.0, 37.12], [38.0, 40.02], [41.0, 41.98], [43.0, 43.41], [48.0, 48.88], [51.0, 51.66], [53.0, 53.72], [55.0, 56.03], [57.0, 57.15], [64.0, 64.86], [68.0, 68.93], [74.0, 76.44], [78.0, 78.95], [81.0, 80.84], [83.0, 83.62], [85.0, 87.15], [88.0, 90.53], [93.0, 92.57], [93.0, 92.69], [93.0, 93.83], [95.0, 94.78], [95.0, 95.47]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [31.12, 39.69, 0.0, 0.0, 0.0, 0.0, 34.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 91.64, 29.77, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 66.87], ["noise", 4.99], ["music", 2.81]], [["animal", 14.7], ["horse", 13.77], ["speech", 13.13]], null, null, null, null, [["didgeridoo", 19.36], ["boing", 17.27], ["echo", 6.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 12.23], ["animal", 7.66], ["roar", 7.4]], null, null, null, null, null], "duration": [4.26, 8.6, 0.89, 0.21, 1.23, 0.12, 2.02, 0.98, 0.41, 0.88, 0.66, 0.72, 1.03, 0.15, 0.86, 0.93, 2.44, 0.95, -0.16, 0.62, 2.15, 2.53, -0.43, -0.31, 0.83, -0.22, 0.47]} \ No newline at end of file diff --git a/annotations_1/Xvyf7ml1ndo_filtered.json b/annotations_1/Xvyf7ml1ndo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6adc824890f729254bab1871cdd1a02e77062b32 --- /dev/null +++ b/annotations_1/Xvyf7ml1ndo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.9], [15.0, 16.44], [19.0, 20.53], [25.0, 30.82], [33.0, 33.74], [37.0, 39.51], [43.0, 51.92], [54.0, 55.58], [60.0, 61.28], [70.0, 78.11], [79.0, 79.68], [84.0, 85.56], [86.0, 87.88], [88.0, 89.02], [97.0, 97.55], [102.0, 106.37], [109.0, 111.33], [117.0, 122.01], [126.0, 127.23], [129.0, 129.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 67.0, 0.0, 50.56, 49.64, 0.0, 0.0, 88.28, 0.0, 0.0, 0.0, 0.0, 0.0, 48.56, 100.0, 96.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["didgeridoo", 53.62], ["music", 20.69], ["speech", 5.82]], null, null, null, null, null, null, null, null, [["speech", 39.06], ["whimper", 6.65], ["baby cry, infant cry", 5.93]], null, null, null, null], "duration": [0.9, 1.44, 1.53, 5.82, 0.74, 2.51, 8.92, 1.58, 1.28, 8.11, 0.68, 1.56, 1.88, 1.02, 0.55, 4.37, 2.33, 5.01, 1.23, 0.96]} \ No newline at end of file diff --git a/annotations_1/XwFR9NZfhUI_filtered.json b/annotations_1/XwFR9NZfhUI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d9c7c003b1743c314800ca1339cc14e7cbf0842 --- /dev/null +++ b/annotations_1/XwFR9NZfhUI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.89], [5.0, 5.04], [6.0, 7.03], [7.0, 20.76], [23.0, 25.2], [28.0, 27.94], [35.0, 55.38], [59.0, 59.61], [60.0, 62.82], [73.0, 74.02], [78.0, 80.67], [81.0, 87.1], [88.0, 109.48], [112.0, 119.77], [124.0, 124.85], [129.0, 129.79], [134.0, 134.13], [136.0, 139.9], [141.0, 156.95], [159.0, 167.97], [170.0, 178.9], [180.0, 181.14], [184.0, 186.02], [191.0, 195.35]], "keep_status": [false, false, false, false, false, false, true, false, true, false, true, false, true, true, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 37.53, 44.99, 0.0, 32.05, 0.0, 33.21, 0.0, 32.27, 36.02, 32.52, 41.03, 0.0, 0.0, 0.0, 36.64, 29.76, 30.2, 29.31, 0.0, 32.51, 30.25], "audiomae_on_audioset": [null, null, null, [["speech", 31.99], ["crushing", 25.72], ["noise", 14.91]], [["mains hum", 47.62], ["hum", 30.0], ["noise", 3.2]], null, [["noise", 15.33], ["hum", 11.8], ["explosion", 10.63]], null, [["fart", 14.2], ["bee, wasp, etc.", 11.62], ["speech", 10.74]], null, [["speech", 9.1], ["vehicle", 8.94], ["hum", 8.45]], [["speech", 46.91], ["sidetone", 38.01], ["boing", 4.92]], [["speech", 27.69], ["cattle, bovinae", 14.47], ["moo", 11.16]], [["speech", 28.35], ["explosion", 10.66], ["sidetone", 5.57]], null, null, null, [["speech", 45.71], ["fart", 32.75], ["sidetone", 2.05]], [["speech", 49.56], ["explosion", 5.9], ["vehicle", 5.02]], [["music", 70.61], ["didgeridoo", 5.42], ["buzz", 2.56]], [["cattle, bovinae", 44.7], ["livestock, farm animals, working animals", 26.08], ["moo", 21.92]], null, [["music", 34.19], ["sidetone", 14.51], ["hum", 10.83]], [["livestock, farm animals, working animals", 56.19], ["cattle, bovinae", 24.37], ["moo", 10.74]]], "duration": [1.89, 0.04, 1.03, 13.76, 2.2, -0.06, 20.38, 0.61, 2.82, 1.02, 2.67, 6.1, 21.48, 7.77, 0.85, 0.79, 0.13, 3.9, 15.95, 8.97, 8.9, 1.14, 2.02, 4.35]} \ No newline at end of file diff --git a/annotations_1/XyEHIOZf5yE_filtered.json b/annotations_1/XyEHIOZf5yE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8cf3f17df800a78c655b14c127f09069ebb6f238 --- /dev/null +++ b/annotations_1/XyEHIOZf5yE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.66], [16.0, 17.71], [21.0, 28.44], [31.0, 33.0], [37.0, 42.03], [43.0, 66.31], [67.0, 74.36], [77.0, 79.22], [81.0, 80.92], [81.0, 88.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.1, 99.1, 69.47, 87.92, 95.78, 99.94, 0.0, 88.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [-0.34, 1.71, 7.44, 2.0, 5.03, 23.31, 7.36, 2.22, -0.08, 7.86]} \ No newline at end of file diff --git a/annotations_1/Xz-BR8gyPhg_filtered.json b/annotations_1/Xz-BR8gyPhg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40638faf8cf9b1e0448c34d913b808cbb344c7a4 --- /dev/null +++ b/annotations_1/Xz-BR8gyPhg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.35], [7.0, 7.82], [13.0, 13.66], [17.0, 17.42], [31.0, 31.19], [32.0, 32.56], [36.0, 37.61], [41.0, 41.89], [43.0, 42.97], [44.0, 44.74], [45.0, 45.93], [46.0, 46.99], [49.0, 50.4], [58.0, 58.65], [63.0, 63.48], [66.0, 67.1], [68.0, 79.84], [83.0, 83.84], [87.0, 88.64], [90.0, 91.5], [93.0, 94.34], [101.0, 101.11], [104.0, 105.07], [107.0, 107.13], [110.0, 109.86], [115.0, 120.6], [121.0, 123.31], [124.0, 124.93], [133.0, 133.51], [136.0, 136.85], [139.0, 138.79], [140.0, 140.86], [141.0, 142.92], [148.0, 149.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.66, 49.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.48], ["theremin", 25.88], ["musical instrument", 2.68]], null, null, null, null, null, null, null, null, null, [["speech", 31.58], ["hum", 16.67], ["sidetone", 14.91]], null, null, null, null, null, null, null], "duration": [0.35, 0.82, 0.66, 0.42, 0.19, 0.56, 1.61, 0.89, -0.03, 0.74, 0.93, 0.99, 1.4, 0.65, 0.48, 1.1, 11.84, 0.84, 1.64, 1.5, 1.34, 0.11, 1.07, 0.13, -0.14, 5.6, 2.31, 0.93, 0.51, 0.85, -0.21, 0.86, 1.92, 1.05]} \ No newline at end of file diff --git a/annotations_1/Y--v_LdWlQA_filtered.json b/annotations_1/Y--v_LdWlQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebf7a7d064ca5f6028a8f6fb2e57952daf29f323 --- /dev/null +++ b/annotations_1/Y--v_LdWlQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.1], [11.0, 11.03], [12.0, 12.12], [13.0, 13.64], [15.0, 24.12], [26.0, 33.74], [42.0, 42.13], [52.0, 51.83], [56.0, 56.67], [57.0, 57.79], [59.0, 59.68], [63.0, 64.17], [72.0, 71.9], [77.0, 82.58], [85.0, 95.66], [112.0, 114.66], [116.0, 117.21], [118.0, 118.77], [121.0, 121.78], [131.0, 131.21], [133.0, 133.12], [135.0, 136.05], [137.0, 138.94], [142.0, 143.45], [145.0, 149.22], [150.0, 150.65], [152.0, 152.41], [153.0, 154.01], [162.0, 164.25]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [35.82, 0.0, 0.0, 0.0, 32.45, 34.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.95, 62.78, 45.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.03, 0.0, 0.0, 0.0, 50.81], "audiomae_on_audioset": [[["speech", 44.19], ["music", 24.82], ["radio", 3.78]], null, null, null, [["speech", 48.77], ["radio", 10.58], ["horse", 6.6]], [["speech", 54.27], ["fly, housefly", 10.16], ["music", 6.9]], null, null, null, null, null, null, null, [["fly, housefly", 17.31], ["bee, wasp, etc.", 16.47], ["cattle, bovinae", 12.42]], null, [["music", 52.26], ["radio", 10.58], ["musical instrument", 3.64]], null, null, null, null, null, null, null, null, [["speech", 57.57], ["clip-clop", 3.97], ["eruption", 3.88]], null, null, null, null], "duration": [4.1, 0.03, 0.12, 0.64, 9.12, 7.74, 0.13, -0.17, 0.67, 0.79, 0.68, 1.17, -0.1, 5.58, 10.66, 2.66, 1.21, 0.77, 0.78, 0.21, 0.12, 1.05, 1.94, 1.45, 4.22, 0.65, 0.41, 1.01, 2.25]} \ No newline at end of file diff --git a/annotations_1/Y-cCAY2hGPs_filtered.json b/annotations_1/Y-cCAY2hGPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66a2d36aa93d667f0442485b137b6b1811c6b614 --- /dev/null +++ b/annotations_1/Y-cCAY2hGPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.53], [6.0, 7.87], [10.0, 12.87], [18.0, 19.09], [20.0, 21.79], [23.0, 45.6], [56.0, 57.1], [67.0, 67.88], [72.0, 73.25], [79.0, 81.97], [86.0, 86.8], [94.0, 100.25], [109.0, 113.21]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 29.73, 0.0, 0.0, 29.76, 0.0, 0.0, 0.0, 32.28, 0.0, 32.02, 59.15], "audiomae_on_audioset": [null, null, [["chuckle, chortle", 14.57], ["laughter", 13.07], ["snicker", 9.78]], null, null, [["music", 66.73], ["siren", 4.03], ["electronic music", 3.24]], null, null, null, [["chirp tone", 32.49], ["sine wave", 7.24], ["dial tone", 6.26]], null, [["hum", 27.53], ["music", 14.79], ["mains hum", 12.43]], null], "duration": [0.53, 1.87, 2.87, 1.09, 1.79, 22.6, 1.1, 0.88, 1.25, 2.97, 0.8, 6.25, 4.21]} \ No newline at end of file diff --git a/annotations_1/Y-rxY2LxPI8_filtered.json b/annotations_1/Y-rxY2LxPI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12b69f57f328d5317ae05a73bc0f10c722a805b7 --- /dev/null +++ b/annotations_1/Y-rxY2LxPI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.93], [18.0, 20.73], [32.0, 134.74], [136.0, 136.7], [146.0, 151.53], [153.0, 162.63], [164.0, 164.96], [176.0, 177.03], [182.0, 182.82], [184.0, 184.67], [187.0, 187.76], [188.0, 189.65], [191.0, 201.46], [203.0, 204.47], [223.0, 223.84], [226.0, 226.98]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.47, 35.45, 0.0, 0.0, 81.89, 66.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.28, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.59], ["hum", 9.69], ["whimper", 7.33]], [["humming", 64.2], ["music", 11.5], ["vocal music", 2.89]], null, null, null, null, null, null, null, null, null, null, [["music", 82.93], ["scary music", 6.09], ["ambient music", 1.74]], null, null, null], "duration": [4.93, 2.73, 102.74, 0.7, 5.53, 9.63, 0.96, 1.03, 0.82, 0.67, 0.76, 1.65, 10.46, 1.47, 0.84, 0.98]} \ No newline at end of file diff --git a/annotations_1/Y0IXtktHTgk_filtered.json b/annotations_1/Y0IXtktHTgk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..126cea5eadf13dee16e5e877a2d074d33f419227 --- /dev/null +++ b/annotations_1/Y0IXtktHTgk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.08], [26.0, 30.72], [32.0, 38.3], [42.0, 42.53], [61.0, 62.46]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 68.54, 69.74, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.08, 4.72, 6.3, 0.53, 1.46]} \ No newline at end of file diff --git a/annotations_1/Y0uLpcThaeU_filtered.json b/annotations_1/Y0uLpcThaeU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f7682ecb6bafc2f6132d9adc11cd7d7886545be --- /dev/null +++ b/annotations_1/Y0uLpcThaeU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.61], [3.0, 3.82], [4.0, 4.95], [6.0, 6.37], [12.0, 12.9], [17.0, 17.64], [19.0, 19.6], [21.0, 23.19], [24.0, 25.73], [29.0, 31.97], [32.0, 36.91], [39.0, 41.94], [43.0, 45.77], [53.0, 55.75], [72.0, 72.42], [74.0, 73.65], [74.0, 73.68], [74.0, 73.72], [78.0, 80.7], [81.0, 84.92], [87.0, 87.15], [88.0, 89.21], [95.0, 95.2], [96.0, 97.61], [100.0, 101.44], [102.0, 106.54], [107.0, 114.57], [120.0, 119.74], [120.0, 130.79], [132.0, 133.17], [136.0, 136.95], [138.0, 138.45], [142.0, 147.04], [148.0, 149.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.51, 0.0, 99.85, 62.47, 57.17, 97.54, 98.44, 0.0, 0.0, 0.0, 0.0, 95.51, 76.37, 0.0, 0.0, 0.0, 0.0, 0.0, 90.08, 94.81, 0.0, 86.27, 0.0, 0.0, 0.0, 83.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 0.82, 0.95, 0.37, 0.9, 0.64, 0.6, 2.19, 1.73, 2.97, 4.91, 2.94, 2.77, 2.75, 0.42, -0.35, -0.32, -0.28, 2.7, 3.92, 0.15, 1.21, 0.2, 1.61, 1.44, 4.54, 7.57, -0.26, 10.79, 1.17, 0.95, 0.45, 5.04, 1.18]} \ No newline at end of file diff --git a/annotations_1/Y15QXiFUV8U_filtered.json b/annotations_1/Y15QXiFUV8U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9a4751a965d09f734f46c20313a83947bc072a1 --- /dev/null +++ b/annotations_1/Y15QXiFUV8U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.07], [6.0, 9.22], [10.0, 10.69], [13.0, 13.39], [15.0, 15.11], [17.0, 16.87], [45.0, 49.92], [57.0, 57.42], [58.0, 58.18], [59.0, 60.02], [61.0, 61.11], [71.0, 71.17], [72.0, 73.28], [74.0, 78.83], [93.0, 94.26], [94.0, 95.54], [96.0, 97.87], [103.0, 103.64], [105.0, 108.53], [109.0, 109.71], [111.0, 111.23], [116.0, 116.99], [120.0, 120.56], [121.0, 122.2], [141.0, 142.18], [142.0, 143.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 39.98, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 52.21], ["speech", 10.16], ["synthesizer", 8.35]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.07, 3.22, 0.69, 0.39, 0.11, -0.13, 4.92, 0.42, 0.18, 1.02, 0.11, 0.17, 1.28, 4.83, 1.26, 1.54, 1.87, 0.64, 3.53, 0.71, 0.23, 0.99, 0.56, 1.2, 1.18, 1.83]} \ No newline at end of file diff --git a/annotations_1/Y2ZU8ZjyzoA_filtered.json b/annotations_1/Y2ZU8ZjyzoA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d22120f93c8f62473c64464ab754bb4aedf51ba --- /dev/null +++ b/annotations_1/Y2ZU8ZjyzoA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 17.83], [18.0, 19.75], [22.0, 23.73], [25.0, 29.32], [31.0, 33.03], [34.0, 34.72], [36.0, 39.43], [42.0, 44.04], [47.0, 48.71], [50.0, 51.95], [53.0, 54.67], [56.0, 57.43], [59.0, 62.02], [65.0, 67.32], [71.0, 73.36], [74.0, 78.12], [79.0, 80.65], [81.0, 81.35], [82.0, 88.94], [92.0, 94.07], [96.0, 98.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.43, 0.0, 0.0, 98.27, 94.52, 0.0, 95.78, 94.07, 0.0, 0.0, 0.0, 0.0, 82.07, 38.97, 96.04, 93.45, 0.0, 0.0, 95.64, 90.43, 72.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 35.39], ["mains hum", 25.29], ["speech", 14.36]], null, null, null, null, null, null, null], "duration": [7.83, 1.75, 1.73, 4.32, 2.03, 0.72, 3.43, 2.04, 1.71, 1.95, 1.67, 1.43, 3.02, 2.32, 2.36, 4.12, 1.65, 0.35, 6.94, 2.07, 2.63]} \ No newline at end of file diff --git a/annotations_1/Y4SSkX4sRMQ_filtered.json b/annotations_1/Y4SSkX4sRMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a0eae7d886976cbf9e1c347064d15a8ecd8e45d --- /dev/null +++ b/annotations_1/Y4SSkX4sRMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 41.17], [45.0, 45.77], [47.0, 47.04], [47.0, 51.39]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 77.7], "audiomae_on_audioset": [null, null, null, null], "duration": [32.17, 0.77, 0.04, 4.39]} \ No newline at end of file diff --git a/annotations_1/Y4XiKFvQ1rM_filtered.json b/annotations_1/Y4XiKFvQ1rM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..825e56a1c768bf6e5b56ef2d38bedc91ac4b11aa --- /dev/null +++ b/annotations_1/Y4XiKFvQ1rM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [9.0, 10.1], [11.0, 12.5], [14.0, 14.62], [16.0, 16.88], [21.0, 25.03], [29.0, 33.71], [35.0, 36.26], [37.0, 40.27], [43.0, 43.02], [47.0, 47.68], [49.0, 51.92], [58.0, 58.18], [60.0, 62.72], [64.0, 73.79], [75.0, 78.22], [79.0, 82.78], [84.0, 87.61], [89.0, 88.75], [90.0, 91.07], [93.0, 93.41], [94.0, 99.49], [100.0, 102.17], [105.0, 105.61], [106.0, 106.68], [108.0, 108.33], [109.0, 109.46], [114.0, 118.45], [122.0, 129.39], [137.0, 138.13], [141.0, 142.89], [145.0, 146.57], [148.0, 148.31], [150.0, 152.25], [154.0, 155.22], [157.0, 158.35], [165.0, 166.78], [168.0, 168.51], [171.0, 170.83], [173.0, 173.16], [174.0, 176.25], [177.0, 178.34], [179.0, 180.01], [180.0, 181.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 47.9, 0.0, 76.7, 0.0, 0.0, 100.0, 0.0, 88.64, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 99.85, 99.05, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.07, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 33.39], ["sine wave", 31.86], ["dial tone", 15.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 1.1, 1.5, 0.62, 0.88, 4.03, 4.71, 1.26, 3.27, 0.02, 0.68, 2.92, 0.18, 2.72, 9.79, 3.22, 3.78, 3.61, -0.25, 1.07, 0.41, 5.49, 2.17, 0.61, 0.68, 0.33, 0.46, 4.45, 7.39, 1.13, 1.89, 1.57, 0.31, 2.25, 1.22, 1.35, 1.78, 0.51, -0.17, 0.16, 2.25, 1.34, 1.01, 1.18]} \ No newline at end of file diff --git a/annotations_1/Y5EkcuhBwiU_filtered.json b/annotations_1/Y5EkcuhBwiU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f06aeedf30fe48bcc3ae3789219443ee44e7f243 --- /dev/null +++ b/annotations_1/Y5EkcuhBwiU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.16], [10.0, 10.42], [14.0, 14.77], [15.0, 19.01], [26.0, 31.23], [38.0, 38.2], [54.0, 53.87], [71.0, 72.37], [83.0, 83.19], [104.0, 104.67], [146.0, 148.27], [152.0, 153.0], [154.0, 155.44], [158.0, 161.13], [167.0, 178.66], [181.0, 192.79]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.25, 30.14, 0.0, 0.0, 0.0, 0.0, 0.0, 36.83, 0.0, 0.0, 34.49, 33.39, 31.98], "audiomae_on_audioset": [null, null, null, [["music", 61.79], ["synthesizer", 5.35], ["singing", 2.34]], [["music", 63.96], ["crowd", 6.55], ["speech", 4.46]], null, null, null, null, null, [["music", 39.66], ["trombone", 32.58], ["brass instrument", 9.57]], null, null, [["music", 34.34], ["fly, housefly", 10.36], ["mosquito", 10.07]], [["music", 83.03], ["swing music", 2.12], ["musical instrument", 1.83]], [["music", 75.16], ["boing", 7.59], ["speech", 3.26]]], "duration": [1.16, 0.42, 0.77, 4.01, 5.23, 0.2, -0.13, 1.37, 0.19, 0.67, 2.27, 1.0, 1.44, 3.13, 11.66, 11.79]} \ No newline at end of file diff --git a/annotations_1/Y5Y0SYRZRtM_filtered.json b/annotations_1/Y5Y0SYRZRtM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a5eea562e3177e9b08a6bd5de6194d4c4ef1838 --- /dev/null +++ b/annotations_1/Y5Y0SYRZRtM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 66.28], [69.0, 69.58], [73.0, 75.27], [82.0, 82.31], [82.0, 84.57], [85.0, 89.45], [89.0, 89.5], [90.0, 89.8], [90.0, 89.83], [90.0, 94.46], [97.0, 97.06], [99.0, 100.21], [107.0, 111.5], [112.0, 113.36], [117.0, 117.88], [118.0, 118.93]], "keep_status": [false, false, true, false, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.18, 0.0, 33.02, 30.22, 0.0, 0.0, 0.0, 29.83, 0.0, 0.0, 29.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["didgeridoo", 28.28], ["music", 26.17], ["speech", 5.41]], null, [["speech", 72.5], ["radio", 7.93], ["sidetone", 5.82]], [["music", 40.62], ["speech", 15.74], ["hum", 6.7]], null, null, null, [["speech", 27.99], ["music", 20.83], ["breaking", 11.0]], null, null, [["whale vocalization", 45.33], ["mains hum", 15.77], ["hum", 15.18]], null, null, null], "duration": [0.28, 0.58, 2.27, 0.31, 2.57, 4.45, 0.5, -0.2, -0.17, 4.46, 0.06, 1.21, 4.5, 1.36, 0.88, 0.93]} \ No newline at end of file diff --git a/annotations_1/Y69UrBaCUAs_filtered.json b/annotations_1/Y69UrBaCUAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e88958f66ccefd9f11393cb0a30f937f27ed39d0 --- /dev/null +++ b/annotations_1/Y69UrBaCUAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.11], [1.0, 1.26], [1.0, 22.71], [30.0, 29.64], [30.0, 40.56], [51.0, 51.19], [52.0, 52.42], [53.0, 53.82], [56.0, 57.84], [58.0, 58.9], [59.0, 59.44], [63.0, 63.48], [67.0, 68.74], [75.0, 75.52], [81.0, 81.51], [85.0, 85.5], [88.0, 96.48], [99.0, 109.44], [114.0, 124.85], [130.0, 130.35], [131.0, 131.36]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.09, 0.0, 37.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.02, 30.54, 29.31, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 39.76], ["hum", 29.27], ["music", 18.87]], null, [["music", 60.18], ["musical instrument", 2.5], ["speech", 1.43]], null, null, null, null, null, null, null, null, null, null, null, [["music", 50.03], ["speech", 23.01], ["sidetone", 3.63]], [["speech", 59.86], ["music", 26.09], ["groan", 3.22]], [["speech", 64.82], ["music", 13.84], ["sidetone", 5.63]], null, null], "duration": [0.11, 0.26, 21.71, -0.36, 10.56, 0.19, 0.42, 0.82, 1.84, 0.9, 0.44, 0.48, 1.74, 0.52, 0.51, 0.5, 8.48, 10.44, 10.85, 0.35, 0.36]} \ No newline at end of file diff --git a/annotations_1/Y6CLpg06kFE_filtered.json b/annotations_1/Y6CLpg06kFE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf21372d60a419ba895ee312208dcbf3e3c7c254 --- /dev/null +++ b/annotations_1/Y6CLpg06kFE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 24.66], [26.0, 26.54], [27.0, 64.32], [69.0, 68.96], [73.0, 73.84]], "keep_status": [true, false, false, false, false], "silence_prob": [37.72, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["noise", 28.53], ["music", 14.46], ["hum", 7.59]], null, null, null, null], "duration": [18.66, 0.54, 37.32, -0.04, 0.84]} \ No newline at end of file diff --git a/annotations_1/Y6jBV4wDoO4_filtered.json b/annotations_1/Y6jBV4wDoO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b67a50433e0cee4ae50fb3d72b2d6cdf060cdf73 --- /dev/null +++ b/annotations_1/Y6jBV4wDoO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.45], [6.0, 6.3], [7.0, 6.94], [9.0, 9.48], [20.0, 22.54], [25.0, 25.27], [28.0, 28.9], [43.0, 46.04], [48.0, 48.44], [49.0, 49.6], [56.0, 62.21], [63.0, 64.83], [75.0, 75.25], [76.0, 83.15], [84.0, 84.52], [85.0, 89.63], [90.0, 102.44], [105.0, 136.09], [141.0, 147.06], [155.0, 157.2], [158.0, 160.56], [165.0, 177.55], [183.0, 184.38], [189.0, 190.05], [190.0, 190.78], [193.0, 193.55], [194.0, 194.49], [195.0, 195.44], [199.0, 202.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.8, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 99.31, 0.0, 0.0, 46.72, 0.0, 0.0, 83.16, 0.0, 49.92, 35.32, 0.0, 35.43, 34.47, 36.82, 37.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 77.67], ["sidetone", 6.47], ["hum", 3.04]], null, null, null, null, [["speech", 43.56], ["music", 21.8], ["fart", 5.67]], [["fart", 23.51], ["livestock, farm animals, working animals", 16.96], ["moo", 15.5]], null, [["speech", 73.83], ["outside, urban or manmade", 2.54], ["horse", 2.17]], [["cattle, bovinae", 44.34], ["moo", 36.59], ["livestock, farm animals, working animals", 3.86]], [["speech", 51.85], ["radio", 13.88], ["crowd", 5.66]], [["livestock, farm animals, working animals", 41.71], ["moo", 26.69], ["cattle, bovinae", 21.65]], null, null, null, null, null, null, null], "duration": [2.45, 0.3, -0.06, 0.48, 2.54, 0.27, 0.9, 3.04, 0.44, 0.6, 6.21, 1.83, 0.25, 7.15, 0.52, 4.63, 12.44, 31.09, 6.06, 2.2, 2.56, 12.55, 1.38, 1.05, 0.78, 0.55, 0.49, 0.44, 3.02]} \ No newline at end of file diff --git a/annotations_1/Y8eSWYGZXe0_filtered.json b/annotations_1/Y8eSWYGZXe0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..976c41697784091be697b2d9318f28285f9e6e92 --- /dev/null +++ b/annotations_1/Y8eSWYGZXe0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.04], [15.0, 25.37], [26.0, 27.41], [29.0, 31.41], [32.0, 34.48], [35.0, 37.1], [41.0, 44.27], [47.0, 127.36], [127.0, 128.6], [130.0, 153.69], [154.0, 156.2], [160.0, 164.59], [166.0, 194.14], [195.0, 197.14]], "keep_status": [false, false, false, false, true, false, false, false, false, true, true, true, false, true], "silence_prob": [86.45, 83.16, 0.0, 99.73, 43.23, 50.11, 60.6, 0.0, 0.0, 32.81, 38.52, 38.78, 34.8, 37.04], "audiomae_on_audioset": [null, null, null, null, [["speech", 16.3], ["fly, housefly", 15.37], ["insect", 12.89]], null, null, null, null, [["music", 54.68], ["throbbing", 8.77], ["hum", 6.49]], [["music", 27.16], ["boing", 10.87], ["bleat", 4.31]], [["music", 43.36], ["speech", 19.85], ["sidetone", 6.07]], [["sidetone", 36.56], ["music", 34.11], ["speech", 15.35]], [["music", 36.54], ["speech", 22.47], ["musical instrument", 8.22]]], "duration": [7.04, 10.37, 1.41, 2.41, 2.48, 2.1, 3.27, 80.36, 1.6, 23.69, 2.2, 4.59, 28.14, 2.14]} \ No newline at end of file diff --git a/annotations_1/Y9HqtZTcTJk_filtered.json b/annotations_1/Y9HqtZTcTJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a276de3b893057213f38d2ce6b06e1c5ddcd88fc --- /dev/null +++ b/annotations_1/Y9HqtZTcTJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.34], [10.0, 10.44], [12.0, 13.44], [17.0, 17.02], [19.0, 20.44], [22.0, 21.91], [25.0, 26.69], [28.0, 31.23], [34.0, 35.51], [36.0, 39.61], [41.0, 45.44], [47.0, 47.46], [50.0, 52.0], [58.0, 58.73], [80.0, 82.81], [86.0, 87.64], [90.0, 92.06], [97.0, 107.67], [112.0, 115.8], [118.0, 118.03], [124.0, 134.76], [135.0, 135.55], [137.0, 139.06], [140.0, 139.94], [140.0, 140.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, true, false, false], "silence_prob": [70.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 0.0, 67.89, 42.58, 0.0, 40.07, 0.0, 48.19, 0.0, 48.1, 35.4, 29.43, 0.0, 31.66, 0.0, 33.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 83.6], ["narration, monologue", 2.34], ["speech synthesizer", 2.28]], null, [["speech", 60.57], ["music", 14.46], ["didgeridoo", 5.51]], null, [["whale vocalization", 72.3], ["speech", 18.69], ["echo", 3.07]], null, [["speech", 26.39], ["music", 17.53], ["didgeridoo", 12.17]], [["echo", 55.07], ["music", 6.08], ["speech", 3.72]], [["explosion", 41.18], ["speech", 18.81], ["burst, pop", 15.37]], null, [["music", 29.76], ["speech", 28.82], ["hum", 11.22]], null, [["music", 39.66], ["speech", 19.18], ["didgeridoo", 5.0]], null, null], "duration": [2.34, 0.44, 1.44, 0.02, 1.44, -0.09, 1.69, 3.23, 1.51, 3.61, 4.44, 0.46, 2.0, 0.73, 2.81, 1.64, 2.06, 10.67, 3.8, 0.03, 10.76, 0.55, 2.06, -0.06, 0.85]} \ No newline at end of file diff --git a/annotations_1/Y9Nt3hlMUUI_filtered.json b/annotations_1/Y9Nt3hlMUUI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dda2320c0e7c0db081ae079ebc5d1c16d28dd912 --- /dev/null +++ b/annotations_1/Y9Nt3hlMUUI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 46.92], [48.0, 55.86], [56.0, 57.38], [58.0, 58.87], [59.0, 61.67], [62.0, 68.22], [70.0, 69.87], [70.0, 75.22], [77.0, 87.79], [90.0, 92.55], [97.0, 99.2], [100.0, 101.36], [102.0, 105.11], [107.0, 107.62], [108.0, 114.05], [118.0, 130.77], [135.0, 160.74], [168.0, 169.87]], "keep_status": [false, true, false, false, false, false, false, true, true, true, true, false, false, false, true, false, false, false], "silence_prob": [54.7, 34.37, 0.0, 0.0, 42.55, 50.16, 0.0, 43.66, 35.5, 33.0, 45.85, 0.0, 58.89, 0.0, 45.05, 44.26, 42.02, 0.0], "audiomae_on_audioset": [null, [["hum", 39.96], ["mains hum", 13.46], ["music", 11.61]], null, null, [["speech", 55.74], ["music", 14.57], ["sine wave", 2.41]], null, null, [["music", 43.23], ["synthesizer", 9.89], ["speech", 5.96]], [["music", 26.64], ["buzz", 12.48], ["fly, housefly", 8.92]], [["clang", 30.33], ["music", 9.12], ["synthesizer", 8.82]], [["music", 33.1], ["gong", 29.03], ["ambient music", 3.78]], null, null, null, [["music", 50.47], ["speech", 9.82], ["effects unit", 5.06]], [["music", 52.34], ["theremin", 17.87], ["hum", 5.58]], [["theremin", 42.33], ["music", 26.01], ["ambient music", 3.97]], null], "duration": [6.92, 7.86, 1.38, 0.87, 2.67, 6.22, -0.13, 5.22, 10.79, 2.55, 2.2, 1.36, 3.11, 0.62, 6.05, 12.77, 25.74, 1.87]} \ No newline at end of file diff --git a/annotations_1/Y9OrRbeB-rU_filtered.json b/annotations_1/Y9OrRbeB-rU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b1fb1d254dd3f8e93041a98fc1a532430d7239b --- /dev/null +++ b/annotations_1/Y9OrRbeB-rU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.58], [8.0, 9.44], [15.0, 26.89], [28.0, 33.27], [35.0, 38.42], [39.0, 41.27], [42.0, 42.79], [44.0, 45.12], [49.0, 51.53], [53.0, 54.4], [57.0, 59.95], [62.0, 62.14], [63.0, 63.75], [68.0, 68.39], [69.0, 70.23], [71.0, 110.34], [115.0, 124.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 70.44, 91.3, 80.64, 96.66, 0.0, 0.0, 99.94, 0.0, 87.92, 0.0, 0.0, 0.0, 0.0, 0.0, 84.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.58, 1.44, 11.89, 5.27, 3.42, 2.27, 0.79, 1.12, 2.53, 1.4, 2.95, 0.14, 0.75, 0.39, 1.23, 39.34, 9.93]} \ No newline at end of file diff --git a/annotations_1/Y9b8tw9TR2k_filtered.json b/annotations_1/Y9b8tw9TR2k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fcddc4b12c60cc658de1919da2e319812b535346 --- /dev/null +++ b/annotations_1/Y9b8tw9TR2k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.3], [11.0, 11.33], [18.0, 24.61], [26.0, 32.31], [42.0, 45.15], [54.0, 54.67], [62.0, 68.62], [78.0, 82.32], [83.0, 84.87], [86.0, 87.0], [90.0, 90.93], [92.0, 93.43], [99.0, 99.4], [103.0, 103.23], [115.0, 122.84], [123.0, 124.31], [127.0, 127.28], [136.0, 137.61], [140.0, 140.78], [143.0, 144.26], [146.0, 145.79], [146.0, 147.77], [150.0, 152.17], [158.0, 157.98], [159.0, 159.7], [163.0, 164.05], [165.0, 165.55], [166.0, 168.18], [169.0, 171.1], [175.0, 186.81], [188.0, 189.5], [190.0, 192.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [31.34, 0.0, 30.96, 32.84, 32.21, 0.0, 33.53, 31.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.9, 0.0, 0.0, 0.0, 0.0, 57.01, 56.4, 31.6, 0.0, 42.37], "audiomae_on_audioset": [[["music", 73.36], ["speech", 9.45], ["throbbing", 3.63]], null, [["music", 78.11], ["electronic music", 3.05], ["throbbing", 2.88]], [["music", 66.18], ["guitar", 5.81], ["musical instrument", 3.56]], [["music", 84.82], ["electronic music", 1.28], ["didgeridoo", 0.95]], null, [["music", 72.69], ["hum", 2.47], ["singing", 1.61]], [["music", 64.64], ["speech", 8.19], ["didgeridoo", 4.38]], null, null, null, null, null, null, [["music", 53.16], ["guitar", 5.41], ["musical instrument", 4.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.94], ["guitar", 6.54], ["musical instrument", 6.13]], null, [["music", 48.4], ["foghorn", 5.34], ["double bass", 5.14]]], "duration": [8.3, 0.33, 6.61, 6.31, 3.15, 0.67, 6.62, 4.32, 1.87, 1.0, 0.93, 1.43, 0.4, 0.23, 7.84, 1.31, 0.28, 1.61, 0.78, 1.26, -0.21, 1.77, 2.17, -0.02, 0.7, 1.05, 0.55, 2.18, 2.1, 11.81, 1.5, 2.16]} \ No newline at end of file diff --git a/annotations_1/YAmnMBHMPso_filtered.json b/annotations_1/YAmnMBHMPso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d45081228d1935e83028d815983b261b7ae3b318 --- /dev/null +++ b/annotations_1/YAmnMBHMPso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.79], [15.0, 16.61], [18.0, 19.36], [20.0, 24.39], [26.0, 26.37], [34.0, 35.16], [35.0, 36.86], [38.0, 39.43], [40.0, 66.75], [70.0, 71.14], [76.0, 83.61], [85.0, 85.89], [89.0, 90.04], [90.0, 90.54], [92.0, 93.02], [94.0, 94.2], [99.0, 102.34], [104.0, 104.21], [104.0, 107.52]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [52.45, 0.0, 0.0, 38.66, 0.0, 0.0, 0.0, 0.0, 39.57, 0.0, 37.47, 0.0, 0.0, 0.0, 0.0, 0.0, 55.96, 0.0, 44.81], "audiomae_on_audioset": [null, null, null, [["music", 32.5], ["fly, housefly", 11.04], ["hum", 5.6]], null, null, null, null, [["speech", 42.36], ["music", 22.89], ["hum", 9.45]], null, [["music", 69.6], ["synthesizer", 6.66], ["ambient music", 2.75]], null, null, null, null, null, null, null, [["music", 28.84], ["hum", 23.12], ["mains hum", 9.69]]], "duration": [2.79, 1.61, 1.36, 4.39, 0.37, 1.16, 1.86, 1.43, 26.75, 1.14, 7.61, 0.89, 1.04, 0.54, 1.02, 0.2, 3.34, 0.21, 3.52]} \ No newline at end of file diff --git a/annotations_1/YCiimJ7d2Cs_filtered.json b/annotations_1/YCiimJ7d2Cs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea234485c1f5f24db6eb7172f81e05c1ac105a2b --- /dev/null +++ b/annotations_1/YCiimJ7d2Cs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.83], [16.0, 16.17], [19.0, 19.77], [21.0, 21.34], [28.0, 37.81], [39.0, 39.8], [45.0, 46.6], [56.0, 56.61]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.39, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 19.45], ["musical instrument", 18.55], ["brass instrument", 18.07]], null, null, null], "duration": [0.83, 0.17, 0.77, 0.34, 9.81, 0.8, 1.6, 0.61]} \ No newline at end of file diff --git a/annotations_1/YDeGYXbeQV8_filtered.json b/annotations_1/YDeGYXbeQV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0b5783d9c565ab9a70ac8590712ae86d3a6c950 --- /dev/null +++ b/annotations_1/YDeGYXbeQV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.17], [7.0, 7.15], [16.0, 16.11], [22.0, 23.14], [33.0, 34.23], [39.0, 43.24], [44.0, 45.72], [48.0, 59.12], [60.0, 80.82], [85.0, 85.6], [86.0, 86.41], [90.0, 91.52], [96.0, 97.8], [101.0, 101.22], [135.0, 135.19], [155.0, 155.41], [158.0, 158.77], [159.0, 161.32], [162.0, 162.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 98.51, 43.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 66.95], ["throbbing", 11.89], ["speech", 4.39]], null, null, null, null, null, null, null, null, null, null], "duration": [0.17, 0.15, 0.11, 1.14, 1.23, 4.24, 1.72, 11.12, 20.82, 0.6, 0.41, 1.52, 1.8, 0.22, 0.19, 0.41, 0.77, 2.32, 0.82]} \ No newline at end of file diff --git a/annotations_1/YDkE97uXjRo_filtered.json b/annotations_1/YDkE97uXjRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af2446d48161e6f7d17452fdf56571461f9d1331 --- /dev/null +++ b/annotations_1/YDkE97uXjRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 21.73], [23.0, 42.3], [43.0, 45.6], [47.0, 47.49], [49.0, 50.57], [54.0, 60.74], [62.0, 125.64], [127.0, 130.76]], "keep_status": [false, false, true, false, false, false, false, true], "silence_prob": [58.72, 58.3, 47.58, 0.0, 0.0, 30.41, 0.0, 41.07], "audiomae_on_audioset": [null, null, [["mains hum", 30.16], ["hum", 17.63], ["music", 13.76]], null, null, [["music", 48.19], ["speech", 19.93], ["hum", 7.32]], null, [["fly, housefly", 33.77], ["insect", 13.86], ["mains hum", 11.46]]], "duration": [15.73, 19.3, 2.6, 0.49, 1.57, 6.74, 63.64, 3.76]} \ No newline at end of file diff --git a/annotations_1/YEdNAX9h_vI_filtered.json b/annotations_1/YEdNAX9h_vI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61750dfcaf0b31303a9927170aedbf6074958ecd --- /dev/null +++ b/annotations_1/YEdNAX9h_vI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.35], [5.0, 8.4], [14.0, 18.96], [20.0, 19.6], [20.0, 29.81], [31.0, 32.49], [37.0, 37.83], [39.0, 45.99], [47.0, 59.58], [63.0, 65.37], [69.0, 68.72], [73.0, 74.21], [79.0, 78.97], [82.0, 82.98], [84.0, 85.68], [87.0, 88.72], [102.0, 102.32], [103.0, 106.14], [108.0, 108.4], [110.0, 110.96], [114.0, 125.79], [126.0, 128.88], [129.0, 129.44], [129.0, 129.66], [130.0, 141.44], [144.0, 144.32]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 43.64, 31.24, 0.0, 30.33, 0.0, 0.0, 31.83, 40.43, 52.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 38.72, 30.27, 0.0, 0.0, 29.65, 0.0], "audiomae_on_audioset": [null, [["music", 49.17], ["theremin", 26.62], ["musical instrument", 4.74]], [["wind instrument, woodwind instrument", 27.16], ["music", 18.23], ["shofar", 15.03]], null, [["music", 39.26], ["whack, thwack", 18.98], ["speech", 16.84]], null, null, [["throbbing", 27.56], ["music", 20.78], ["hum", 18.56]], [["music", 70.04], ["theremin", 5.56], ["thunk", 3.54]], null, null, null, null, null, null, null, null, [["music", 36.82], ["theremin", 22.99], ["thunk", 12.72]], null, null, [["music", 69.17], ["musical instrument", 5.53], ["wind instrument, woodwind instrument", 2.12]], [["foghorn", 72.16], ["speech", 12.82], ["music", 5.7]], null, null, [["speech", 20.86], ["fly, housefly", 17.99], ["music", 7.93]], null], "duration": [0.35, 3.4, 4.96, -0.4, 9.81, 1.49, 0.83, 6.99, 12.58, 2.37, -0.28, 1.21, -0.03, 0.98, 1.68, 1.72, 0.32, 3.14, 0.4, 0.96, 11.79, 2.88, 0.44, 0.66, 11.44, 0.32]} \ No newline at end of file diff --git a/annotations_1/YEv7cVW8hBA_filtered.json b/annotations_1/YEv7cVW8hBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..147b530ea82f05e95e28fb3867b47cce3f44dc73 --- /dev/null +++ b/annotations_1/YEv7cVW8hBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.01], [13.0, 13.78], [14.0, 15.55], [17.0, 17.24], [22.0, 23.09], [24.0, 23.79], [24.0, 25.2], [26.0, 26.57], [28.0, 28.0], [29.0, 30.15], [33.0, 33.3], [36.0, 36.98], [45.0, 45.52], [46.0, 46.53], [48.0, 49.37], [51.0, 51.95], [55.0, 56.27], [58.0, 58.77], [60.0, 60.25], [62.0, 63.31], [64.0, 67.49], [68.0, 68.82], [70.0, 70.56], [72.0, 72.22], [73.0, 73.04], [73.0, 73.45], [76.0, 76.59], [77.0, 79.71], [81.0, 81.94], [90.0, 90.68], [95.0, 95.15], [97.0, 98.86], [100.0, 101.43], [102.0, 102.0], [103.0, 102.79], [103.0, 103.98], [108.0, 108.41], [119.0, 119.58], [127.0, 128.07], [129.0, 133.19], [140.0, 140.75]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [48.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.85, 0.0], "audiomae_on_audioset": [[["speech", 13.72], ["whale vocalization", 11.76], ["radio", 6.52]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 73.45], ["fly, housefly", 2.52], ["insect", 2.37]], null, null, null, null, null, null, null, null, null, null, null, [["insect", 31.15], ["fly, housefly", 22.19], ["speech", 11.32]], null], "duration": [2.01, 0.78, 1.55, 0.24, 1.09, -0.21, 1.2, 0.57, 0.0, 1.15, 0.3, 0.98, 0.52, 0.53, 1.37, 0.95, 1.27, 0.77, 0.25, 1.31, 3.49, 0.82, 0.56, 0.22, 0.04, 0.45, 0.59, 2.71, 0.94, 0.68, 0.15, 1.86, 1.43, 0.0, -0.21, 0.98, 0.41, 0.58, 1.07, 4.19, 0.75]} \ No newline at end of file diff --git a/annotations_1/YFIIcUg_C4I_filtered.json b/annotations_1/YFIIcUg_C4I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad0f6bfcad592b8ee5e01ebb59a9f890dcd4f300 --- /dev/null +++ b/annotations_1/YFIIcUg_C4I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 32.9], [35.0, 38.33], [43.0, 49.74], [52.0, 52.88], [54.0, 54.84], [56.0, 56.69], [62.0, 66.19], [66.0, 71.05], [75.0, 79.69], [80.0, 86.14], [87.0, 88.4], [91.0, 91.86], [93.0, 93.83], [95.0, 95.0], [96.0, 96.67], [104.0, 105.51], [108.0, 109.73], [117.0, 118.4], [125.0, 124.7], [132.0, 132.07], [134.0, 136.86], [140.0, 141.05], [147.0, 147.46]], "keep_status": [false, true, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [58.55, 45.65, 40.21, 0.0, 0.0, 0.0, 29.72, 31.16, 29.66, 33.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.89, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 42.33], ["hum", 13.75], ["throbbing", 10.15]], [["music", 42.3], ["moo", 5.57], ["cattle, bovinae", 5.41]], null, null, null, [["speech", 55.57], ["music", 19.48], ["sidetone", 7.79]], [["music", 38.39], ["speech", 18.9], ["sidetone", 9.39]], [["music", 45.93], ["hum", 13.04], ["mains hum", 9.54]], [["music", 39.48], ["speech", 23.36], ["throbbing", 13.33]], null, null, null, null, null, null, null, null, null, null, [["music", 25.37], ["synthesizer", 10.08], ["inside, small room", 7.38]], null, null], "duration": [15.9, 3.33, 6.74, 0.88, 0.84, 0.69, 4.19, 5.05, 4.69, 6.14, 1.4, 0.86, 0.83, 0.0, 0.67, 1.51, 1.73, 1.4, -0.3, 0.07, 2.86, 1.05, 0.46]} \ No newline at end of file diff --git a/annotations_1/YG-plVmM7O4_filtered.json b/annotations_1/YG-plVmM7O4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c46e8ada80fac4e6fa9cb7f91a3c56772d884bbd --- /dev/null +++ b/annotations_1/YG-plVmM7O4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.46], [6.0, 6.1], [9.0, 10.29], [12.0, 12.43], [14.0, 17.59], [18.0, 19.63], [21.0, 24.54], [27.0, 36.04], [39.0, 54.94], [56.0, 59.8], [60.0, 61.62], [62.0, 65.01], [67.0, 71.17], [74.0, 73.82], [78.0, 77.85], [79.0, 87.03], [89.0, 90.09], [91.0, 90.93], [92.0, 94.19], [95.0, 97.39], [98.0, 98.52], [99.0, 104.36], [109.0, 109.65], [111.0, 111.64], [122.0, 121.95], [138.0, 138.06]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, true, false, false, false, true, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.06, 0.0, 56.18, 59.24, 37.82, 41.68, 0.0, 36.28, 30.65, 0.0, 0.0, 30.51, 0.0, 0.0, 32.34, 32.2, 0.0, 31.86, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 38.41], ["cattle, bovinae", 6.71], ["livestock, farm animals, working animals", 6.47]], null, null, null, [["music", 44.76], ["didgeridoo", 24.34], ["speech", 20.34]], [["speech", 20.44], ["music", 14.78], ["hum", 13.42]], null, [["music", 30.98], ["hum", 14.74], ["speech", 10.35]], [["music", 47.77], ["speech", 24.28], ["hum", 3.51]], null, null, [["speech", 27.32], ["music", 24.93], ["foghorn", 14.64]], null, null, [["music", 34.06], ["speech", 22.28], ["hum", 10.88]], [["music", 50.7], ["speech", 20.25], ["musical instrument", 2.67]], null, [["speech", 43.38], ["music", 18.7], ["hum", 6.61]], null, null, null, null], "duration": [0.46, 0.1, 1.29, 0.43, 3.59, 1.63, 3.54, 9.04, 15.94, 3.8, 1.62, 3.01, 4.17, -0.18, -0.15, 8.03, 1.09, -0.07, 2.19, 2.39, 0.52, 5.36, 0.65, 0.64, -0.05, 0.06]} \ No newline at end of file diff --git a/annotations_1/YG0VNVGxyYs_filtered.json b/annotations_1/YG0VNVGxyYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28dbd4524b4de9862fbd6f3c93507c3b0e904da3 --- /dev/null +++ b/annotations_1/YG0VNVGxyYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.96], [22.0, 22.45], [26.0, 26.01], [37.0, 37.79], [41.0, 40.86], [43.0, 43.83], [63.0, 63.66], [64.0, 68.88], [70.0, 69.9]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.96, 0.45, 0.01, 0.79, -0.14, 0.83, 0.66, 4.88, -0.1]} \ No newline at end of file diff --git a/annotations_1/YGwPTU-SvbI_filtered.json b/annotations_1/YGwPTU-SvbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5887175229d4ddb9d49885128a3eabb567a189b9 --- /dev/null +++ b/annotations_1/YGwPTU-SvbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.96], [14.0, 13.76], [17.0, 17.09], [27.0, 28.63], [30.0, 31.67], [32.0, 33.47], [35.0, 35.4], [38.0, 38.37], [39.0, 39.53], [41.0, 42.16], [48.0, 53.15], [54.0, 54.78], [56.0, 65.38], [70.0, 103.47], [105.0, 107.16], [108.0, 136.22], [137.0, 136.97], [137.0, 137.03], [139.0, 141.57], [142.0, 151.85], [155.0, 154.94], [156.0, 158.55], [159.0, 160.15], [165.0, 166.14], [169.0, 169.53], [170.0, 170.95], [172.0, 172.25], [174.0, 174.09], [175.0, 177.53], [179.0, 179.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.99, 0.0, 32.21, 0.0, 97.92, 30.1, 0.0, 0.0, 41.7, 48.1, 0.0, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 24.84], ["throbbing", 21.82], ["hum", 18.89]], null, [["music", 27.41], ["speech", 27.17], ["whack, thwack", 9.0]], null, null, [["music", 56.25], ["speech", 27.81], ["hum", 4.23]], null, null, [["music", 23.25], ["speech", 6.15], ["fly, housefly", 5.98]], [["hum", 16.57], ["creak", 10.27], ["whack, thwack", 9.52]], null, null, null, null, null, null, null, null, null, null], "duration": [0.96, -0.24, 0.09, 1.63, 1.67, 1.47, 0.4, 0.37, 0.53, 1.16, 5.15, 0.78, 9.38, 33.47, 2.16, 28.22, -0.03, 0.03, 2.57, 9.85, -0.06, 2.55, 1.15, 1.14, 0.53, 0.95, 0.25, 0.09, 2.53, 0.25]} \ No newline at end of file diff --git a/annotations_1/YH_vICd0WQ0_filtered.json b/annotations_1/YH_vICd0WQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13252ef83357daf3bc1109c3def9bb3d4e50fd66 --- /dev/null +++ b/annotations_1/YH_vICd0WQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.0], [17.0, 17.61], [21.0, 21.39], [22.0, 26.54], [28.0, 30.43], [33.0, 33.72], [37.0, 36.73], [37.0, 38.3], [39.0, 38.84], [41.0, 42.08], [44.0, 44.49], [48.0, 48.49], [57.0, 57.57], [63.0, 63.71], [65.0, 65.94], [67.0, 66.93], [70.0, 70.21], [71.0, 73.01], [74.0, 74.58], [75.0, 76.49], [82.0, 82.9], [98.0, 100.87], [102.0, 104.01], [110.0, 110.62], [112.0, 112.01], [114.0, 115.03], [122.0, 123.23], [126.0, 126.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 61.97, 56.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.29, 0.0, 0.0, 0.0, 72.6, 53.1, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.26], ["music", 9.24], ["sidetone", 7.21]], null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 0.61, 0.39, 4.54, 2.43, 0.72, -0.27, 1.3, -0.16, 1.08, 0.49, 0.49, 0.57, 0.71, 0.94, -0.07, 0.21, 2.01, 0.58, 1.49, 0.9, 2.87, 2.01, 0.62, 0.01, 1.03, 1.23, 0.89]} \ No newline at end of file diff --git a/annotations_1/YHirkSmJcEU_filtered.json b/annotations_1/YHirkSmJcEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..963468da6fccc205d0fb84e6c302a767832b217f --- /dev/null +++ b/annotations_1/YHirkSmJcEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.57], [17.0, 24.61], [25.0, 24.95], [26.0, 48.91], [50.0, 58.94], [62.0, 67.73], [70.0, 77.43], [91.0, 91.2], [95.0, 96.43], [97.0, 103.22], [104.0, 104.48], [111.0, 111.01], [112.0, 112.65], [114.0, 114.39], [118.0, 118.57], [121.0, 122.28], [123.0, 122.84], [128.0, 129.52], [131.0, 132.51], [138.0, 139.7], [140.0, 140.26], [141.0, 141.52], [143.0, 143.73], [145.0, 145.66], [148.0, 158.04]], "keep_status": [false, true, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.54, 0.0, 31.32, 32.13, 30.59, 33.24, 0.0, 0.0, 38.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.63], "audiomae_on_audioset": [null, [["music", 46.15], ["speech", 11.4], ["musical instrument", 4.25]], null, [["speech", 25.02], ["buzz", 18.01], ["fly, housefly", 10.22]], [["music", 71.53], ["musical instrument", 2.41], ["speech", 2.06]], [["music", 30.78], ["sidetone", 17.84], ["speech", 16.35]], [["speech", 36.09], ["hum", 9.88], ["sidetone", 8.58]], null, null, [["speech", 74.17], ["fly, housefly", 3.99], ["insect", 2.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 7.61, -0.05, 22.91, 8.94, 5.73, 7.43, 0.2, 1.43, 6.22, 0.48, 0.01, 0.65, 0.39, 0.57, 1.28, -0.16, 1.52, 1.51, 1.7, 0.26, 0.52, 0.73, 0.66, 10.04]} \ No newline at end of file diff --git a/annotations_1/YI8DWdXhg5Q_filtered.json b/annotations_1/YI8DWdXhg5Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8b1c47b075159311b8bf69f70e9ef1dbee022c3 --- /dev/null +++ b/annotations_1/YI8DWdXhg5Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.19], [21.0, 22.49], [28.0, 29.61], [30.0, 30.67], [31.0, 31.7], [33.0, 35.65], [39.0, 41.2], [47.0, 47.56], [51.0, 55.59], [58.0, 61.65], [80.0, 86.49], [96.0, 96.3], [101.0, 102.98], [104.0, 114.1], [115.0, 127.75]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 56.4, 30.72, 0.0, 33.02, 41.42, 33.08, 0.0, 0.0, 34.64, 29.97], "audiomae_on_audioset": [null, null, null, null, null, null, [["fart", 38.9], ["speech", 36.54], ["music", 6.88]], null, [["speech", 58.26], ["music", 12.5], ["sidetone", 4.36]], [["speech", 31.07], ["fart", 11.94], ["sidetone", 8.4]], [["music", 16.87], ["animal", 9.63], ["speech", 8.44]], null, null, [["music", 36.03], ["mains hum", 8.12], ["speech", 6.03]], [["cattle, bovinae", 31.18], ["livestock, farm animals, working animals", 24.06], ["moo", 21.68]]], "duration": [0.19, 1.49, 1.61, 0.67, 0.7, 2.65, 2.2, 0.56, 4.59, 3.65, 6.49, 0.3, 1.98, 10.1, 12.75]} \ No newline at end of file diff --git a/annotations_1/YIg4Pcmy8ww_filtered.json b/annotations_1/YIg4Pcmy8ww_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c795dd5d1f45c6393033f20ee0d59007f6a590b --- /dev/null +++ b/annotations_1/YIg4Pcmy8ww_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.15], [17.0, 17.81], [33.0, 33.88], [38.0, 45.05], [50.0, 50.68], [56.0, 63.31], [68.0, 68.66], [95.0, 95.01], [98.0, 101.63]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [49.36, 0.0, 0.0, 47.86, 0.0, 41.91, 0.0, 0.0, 32.85], "audiomae_on_audioset": [[["music", 87.22], ["drip", 2.82], ["synthesizer", 1.18]], null, null, [["whale vocalization", 80.41], ["music", 12.25], ["noise", 2.02]], null, [["music", 47.71], ["synthesizer", 7.62], ["buzz", 6.53]], null, null, [["music", 71.25], ["speech", 11.68], ["throbbing", 1.88]]], "duration": [2.15, 0.81, 0.88, 7.05, 0.68, 7.31, 0.66, 0.01, 3.63]} \ No newline at end of file diff --git a/annotations_1/YIhMJMRdGGY_filtered.json b/annotations_1/YIhMJMRdGGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/YIhMJMRdGGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/YJV5WB1wxdk_filtered.json b/annotations_1/YJV5WB1wxdk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1e882dc45d35aae0e8e54c3d4e6da9f69d6bc8a --- /dev/null +++ b/annotations_1/YJV5WB1wxdk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 22.4], [24.0, 24.26], [25.0, 28.46], [32.0, 32.7], [34.0, 34.64], [47.0, 62.41], [68.0, 68.91], [72.0, 73.3], [85.0, 86.07], [87.0, 89.65], [91.0, 93.7], [95.0, 95.44], [101.0, 103.33], [107.0, 109.54], [113.0, 114.0], [117.0, 117.51], [119.0, 119.03], [120.0, 120.23], [126.0, 129.25], [131.0, 131.38], [132.0, 132.26]], "keep_status": [true, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [28.75, 0.0, 28.78, 0.0, 0.0, 28.78, 0.0, 0.0, 0.0, 99.56, 42.53, 0.0, 50.26, 54.76, 0.0, 0.0, 0.0, 0.0, 29.02, 0.0, 0.0], "audiomae_on_audioset": [[["music", 24.44], ["throbbing", 16.57], ["boing", 15.66]], null, [["music", 27.68], ["didgeridoo", 22.7], ["speech", 11.91]], null, null, [["speech", 63.85], ["hum", 9.72], ["throbbing", 4.74]], null, null, null, null, [["music", 24.38], ["crushing", 12.21], ["synthesizer", 9.78]], null, null, null, null, null, null, null, [["speech", 35.66], ["music", 18.5], ["musical instrument", 8.16]], null, null], "duration": [19.4, 0.26, 3.46, 0.7, 0.64, 15.41, 0.91, 1.3, 1.07, 2.65, 2.7, 0.44, 2.33, 2.54, 1.0, 0.51, 0.03, 0.23, 3.25, 0.38, 0.26]} \ No newline at end of file diff --git a/annotations_1/YKZRedzkeU8_filtered.json b/annotations_1/YKZRedzkeU8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41f4f73e922b2e3bde099e153b1199ed8f24dfaf --- /dev/null +++ b/annotations_1/YKZRedzkeU8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.43], [12.0, 11.52], [12.0, 25.81], [26.0, 27.38], [28.0, 33.54], [36.0, 36.39], [38.0, 38.23], [45.0, 45.66], [51.0, 51.56], [52.0, 52.78], [55.0, 56.1], [69.0, 69.25], [116.0, 116.99], [118.0, 119.4], [121.0, 122.94], [132.0, 132.48], [134.0, 134.97], [135.0, 136.11], [137.0, 138.72], [140.0, 140.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.29, 0.0, 28.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 37.77], ["hum", 25.49], ["music", 13.98]], null, [["music", 43.98], ["groan", 30.48], ["whimper", 6.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.43, -0.48, 13.81, 1.38, 5.54, 0.39, 0.23, 0.66, 0.56, 0.78, 1.1, 0.25, 0.99, 1.4, 1.94, 0.48, 0.97, 1.11, 1.72, 0.88]} \ No newline at end of file diff --git a/annotations_1/YKvG96jMVWE_filtered.json b/annotations_1/YKvG96jMVWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4735e81b47a7bbec665db1b80dce50809c504101 --- /dev/null +++ b/annotations_1/YKvG96jMVWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 22.76], [23.0, 29.03], [30.0, 96.82], [99.0, 109.14], [114.0, 117.27], [124.0, 129.36], [132.0, 136.07], [138.0, 139.92], [142.0, 143.82], [145.0, 145.56], [147.0, 161.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [78.89, 83.16, 0.0, 74.6, 84.07, 79.24, 54.63, 0.0, 0.0, 0.0, 40.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 51.99], ["theremin", 5.37], ["gong", 3.6]]], "duration": [9.76, 6.03, 66.82, 10.14, 3.27, 5.36, 4.07, 1.92, 1.82, 0.56, 14.77]} \ No newline at end of file diff --git a/annotations_1/YLjwEodCmT4_filtered.json b/annotations_1/YLjwEodCmT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8027ce53ceb2be1a3b3ce6ae0598f94edfc6870 --- /dev/null +++ b/annotations_1/YLjwEodCmT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.32], [7.0, 12.23], [19.0, 23.82], [37.0, 38.28], [43.0, 50.75], [54.0, 54.31], [56.0, 56.76], [84.0, 86.41], [89.0, 89.99], [92.0, 92.62], [94.0, 94.07], [102.0, 102.19], [103.0, 118.13], [119.0, 120.01], [120.0, 134.45], [136.0, 136.24]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 48.56, 38.21, 0.0, 34.1, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 99.52, 0.0], "audiomae_on_audioset": [null, [["hum", 40.0], ["music", 19.77], ["mains hum", 16.6]], [["music", 13.8], ["didgeridoo", 6.67], ["boing", 5.8]], null, [["music", 26.07], ["sidetone", 22.22], ["speech", 11.99]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 5.23, 4.82, 1.28, 7.75, 0.31, 0.76, 2.41, 0.99, 0.62, 0.07, 0.19, 15.13, 1.01, 14.45, 0.24]} \ No newline at end of file diff --git a/annotations_1/YNAv6w5RDIs_filtered.json b/annotations_1/YNAv6w5RDIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b65252b145d4e29523518c44715b9c931445479 --- /dev/null +++ b/annotations_1/YNAv6w5RDIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.02], [9.0, 10.84], [12.0, 12.68], [14.0, 19.41], [21.0, 55.93], [56.0, 60.51], [63.0, 64.49], [65.0, 66.78], [68.0, 69.21], [70.0, 71.36], [73.0, 76.15], [77.0, 84.82], [95.0, 108.75], [111.0, 112.4], [117.0, 126.82], [130.0, 136.73], [142.0, 142.79], [154.0, 154.53], [155.0, 158.19], [163.0, 174.53], [179.0, 181.13], [184.0, 185.35], [186.0, 188.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [75.72, 0.0, 0.0, 64.41, 0.0, 58.47, 0.0, 0.0, 0.0, 0.0, 61.18, 73.67, 32.79, 0.0, 31.24, 31.31, 0.0, 0.0, 32.09, 31.21, 32.58, 0.0, 32.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.88], ["throbbing", 15.62], ["hum", 10.25]], null, [["music", 67.85], ["speech", 4.86], ["throbbing", 4.84]], [["throbbing", 29.58], ["music", 28.85], ["hum", 12.12]], null, null, [["music", 59.54], ["synthesizer", 4.15], ["musical instrument", 2.96]], [["throbbing", 47.54], ["hum", 29.26], ["music", 14.82]], [["music", 58.99], ["theremin", 7.46], ["singing", 3.72]], null, [["music", 60.21], ["throbbing", 4.85], ["synthesizer", 2.8]]], "duration": [5.02, 1.84, 0.68, 5.41, 34.93, 4.51, 1.49, 1.78, 1.21, 1.36, 3.15, 7.82, 13.75, 1.4, 9.82, 6.73, 0.79, 0.53, 3.19, 11.53, 2.13, 1.35, 2.82]} \ No newline at end of file diff --git a/annotations_1/YNZmZ4ARr38_filtered.json b/annotations_1/YNZmZ4ARr38_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9baa79114dac3e4a951ef0a5360de0c3982f3265 --- /dev/null +++ b/annotations_1/YNZmZ4ARr38_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.83], [5.0, 5.61], [7.0, 10.98], [21.0, 20.93], [25.0, 26.28], [32.0, 33.22], [35.0, 35.4], [45.0, 51.17], [52.0, 52.76], [57.0, 59.27], [67.0, 72.67], [74.0, 76.71], [79.0, 78.71], [82.0, 88.23], [94.0, 99.94], [105.0, 106.29], [107.0, 108.04], [109.0, 111.67], [116.0, 120.82], [129.0, 136.21], [137.0, 137.49], [139.0, 154.92]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 47.78, 0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 33.84, 38.52, 59.07, 0.0, 45.43, 37.43, 0.0, 0.0, 39.8, 33.56, 35.08, 0.0, 31.91], "audiomae_on_audioset": [null, null, [["music", 53.65], ["burping, eructation", 21.66], ["musical instrument", 2.18]], null, null, null, null, [["fart", 63.56], ["music", 25.53], ["speech", 2.61]], null, [["music", 37.16], ["throbbing", 25.33], ["didgeridoo", 6.03]], [["music", 36.5], ["guitar", 19.44], ["plucked string instrument", 10.26]], null, null, [["music", 23.66], ["guitar", 7.66], ["cattle, bovinae", 6.27]], [["music", 52.33], ["speech", 19.56], ["burping, eructation", 15.93]], null, null, [["music", 32.46], ["speech", 30.58], ["boing", 5.26]], [["music", 30.14], ["breaking", 17.63], ["speech", 12.17]], [["speech", 46.45], ["music", 27.12], ["fart", 7.13]], null, [["music", 25.89], ["speech", 24.02], ["whack, thwack", 15.97]]], "duration": [0.83, 0.61, 3.98, -0.07, 1.28, 1.22, 0.4, 6.17, 0.76, 2.27, 5.67, 2.71, -0.29, 6.23, 5.94, 1.29, 1.04, 2.67, 4.82, 7.21, 0.49, 15.92]} \ No newline at end of file diff --git a/annotations_1/YOCEHKSgwlQ_filtered.json b/annotations_1/YOCEHKSgwlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..463185e28e100674d58987ab52da7090c287898b --- /dev/null +++ b/annotations_1/YOCEHKSgwlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.17], [14.0, 15.72], [17.0, 33.57], [34.0, 36.17], [37.0, 47.97], [49.0, 57.96], [65.0, 76.81], [77.0, 115.52], [124.0, 131.94]], "keep_status": [false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 30.5, 31.81, 34.14, 42.37, 31.54, 0.0, 50.71], "audiomae_on_audioset": [null, null, [["speech", 60.06], ["music", 6.83], ["eruption", 4.37]], [["speech", 8.63], ["animal", 5.5], ["cacophony", 4.93]], [["speech", 66.48], ["hum", 10.65], ["throbbing", 3.48]], [["splash, splatter", 24.67], ["speech", 14.68], ["frog", 14.07]], [["explosion", 38.42], ["hum", 15.34], ["throbbing", 6.35]], null, null], "duration": [1.17, 1.72, 16.57, 2.17, 10.97, 8.96, 11.81, 38.52, 7.94]} \ No newline at end of file diff --git a/annotations_1/YOUt-qq-snc_filtered.json b/annotations_1/YOUt-qq-snc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6758aae9004ed55a8298419c44578e14e5546a18 --- /dev/null +++ b/annotations_1/YOUt-qq-snc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 97.19]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [93.19]} \ No newline at end of file diff --git a/annotations_1/YPIfHEdHjHI_filtered.json b/annotations_1/YPIfHEdHjHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac6a2d026fad1057be18a1a2590e04f50278d8b0 --- /dev/null +++ b/annotations_1/YPIfHEdHjHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.05], [18.0, 19.68], [21.0, 21.52], [23.0, 24.0], [25.0, 26.2], [27.0, 28.75], [32.0, 33.25], [35.0, 36.37], [37.0, 38.65], [41.0, 41.81], [45.0, 46.74], [51.0, 52.32], [53.0, 54.35], [56.0, 57.11], [60.0, 61.37], [63.0, 65.8], [68.0, 68.62], [71.0, 72.81], [75.0, 76.37], [78.0, 81.35], [83.0, 83.86], [84.0, 88.79], [91.0, 95.72], [96.0, 97.26], [99.0, 99.47], [100.0, 100.45], [102.0, 107.0], [109.0, 109.66], [113.0, 121.66], [122.0, 126.32], [128.0, 130.08], [131.0, 134.5], [135.0, 136.29], [139.0, 141.93], [144.0, 147.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 99.99, 0.0, 98.01, 99.8, 0.0, 0.0, 0.0, 88.46, 0.0, 96.42, 84.07, 62.27, 100.0, 0.0, 100.0, 31.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.66], ["effects unit", 17.06], ["distortion", 8.06]]], "duration": [1.05, 1.68, 0.52, 1.0, 1.2, 1.75, 1.25, 1.37, 1.65, 0.81, 1.74, 1.32, 1.35, 1.11, 1.37, 2.8, 0.62, 1.81, 1.37, 3.35, 0.86, 4.79, 4.72, 1.26, 0.47, 0.45, 5.0, 0.66, 8.66, 4.32, 2.08, 3.5, 1.29, 2.93, 3.97]} \ No newline at end of file diff --git a/annotations_1/YPXkzktz5oA_filtered.json b/annotations_1/YPXkzktz5oA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20c85e115b0c5a546fd55a6a6f7ca3a5382c5e97 --- /dev/null +++ b/annotations_1/YPXkzktz5oA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.59], [15.0, 22.37], [24.0, 29.34], [31.0, 31.99], [38.0, 50.06], [51.0, 56.3], [57.0, 73.82], [80.0, 80.87], [86.0, 87.88], [89.0, 90.48], [93.0, 92.79]], "keep_status": [true, true, true, false, false, true, true, false, false, false, false], "silence_prob": [43.08, 33.72, 38.38, 0.0, 38.37, 32.67, 29.75, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 26.85], ["hum", 7.02], ["ping", 6.44]], [["music", 53.85], ["speech", 5.12], ["buzz", 3.08]], [["buzz", 21.44], ["hum", 9.92], ["music", 8.92]], null, [["music", 64.64], ["synthesizer", 5.87], ["musical instrument", 4.15]], [["music", 33.04], ["hum", 18.38], ["throbbing", 9.71]], [["speech", 22.41], ["music", 19.27], ["bleat", 11.51]], null, null, null, null], "duration": [3.59, 7.37, 5.34, 0.99, 12.06, 5.3, 16.82, 0.87, 1.88, 1.48, -0.21]} \ No newline at end of file diff --git a/annotations_1/YR4qgOi7VQ0_filtered.json b/annotations_1/YR4qgOi7VQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..338b60aae24185880d3751d6cdfc02e9cb5600c6 --- /dev/null +++ b/annotations_1/YR4qgOi7VQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.45], [9.0, 9.9], [10.0, 11.53], [18.0, 19.16], [20.0, 20.39], [21.0, 22.28], [25.0, 25.49], [26.0, 26.6], [28.0, 28.97], [30.0, 34.4], [35.0, 36.93], [39.0, 40.69], [41.0, 41.72], [42.0, 42.38], [48.0, 48.47], [52.0, 52.02], [58.0, 57.87], [70.0, 70.31], [73.0, 73.87], [76.0, 79.88], [82.0, 82.48], [85.0, 86.48], [89.0, 89.58], [91.0, 91.96], [93.0, 93.82], [94.0, 95.72], [96.0, 97.8], [105.0, 104.67], [105.0, 106.41], [115.0, 115.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.45, 0.9, 1.53, 1.16, 0.39, 1.28, 0.49, 0.6, 0.97, 4.4, 1.93, 1.69, 0.72, 0.38, 0.47, 0.02, -0.13, 0.31, 0.87, 3.88, 0.48, 1.48, 0.58, 0.96, 0.82, 1.72, 1.8, -0.33, 1.41, 0.52]} \ No newline at end of file diff --git a/annotations_1/YRCIuvKg4tc_filtered.json b/annotations_1/YRCIuvKg4tc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40cf484fec20d682c7044d45f935ba76e00c367e --- /dev/null +++ b/annotations_1/YRCIuvKg4tc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.63], [31.0, 36.36], [37.0, 38.3], [62.0, 63.29], [66.0, 67.34], [90.0, 102.9], [104.0, 105.34], [106.0, 105.92], [106.0, 111.69], [116.0, 121.47], [123.0, 130.98], [135.0, 142.48], [150.0, 153.08], [153.0, 154.08], [158.0, 165.65]], "keep_status": [false, true, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 36.59, 0.0, 0.0, 0.0, 28.79, 0.0, 0.0, 28.65, 28.46, 28.65, 28.6, 29.28, 0.0, 29.56], "audiomae_on_audioset": [null, [["moo", 24.6], ["music", 21.86], ["cattle, bovinae", 15.68]], null, null, null, [["cattle, bovinae", 36.62], ["moo", 36.6], ["livestock, farm animals, working animals", 19.32]], null, null, [["music", 40.18], ["speech", 11.71], ["electronic music", 3.63]], [["breaking", 49.13], ["speech", 16.5], ["music", 7.59]], [["whack, thwack", 24.61], ["music", 18.14], ["speech", 6.76]], [["breaking", 60.79], ["music", 14.45], ["smash, crash", 8.49]], [["speech", 53.31], ["music", 10.99], ["cattle, bovinae", 8.46]], null, [["music", 61.42], ["throbbing", 16.05], ["electronic music", 7.23]]], "duration": [1.63, 5.36, 1.3, 1.29, 1.34, 12.9, 1.34, -0.08, 5.69, 5.47, 7.98, 7.48, 3.08, 1.08, 7.65]} \ No newline at end of file diff --git a/annotations_1/YRdXmtGnwCI_filtered.json b/annotations_1/YRdXmtGnwCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d52ccc63eb52715c13f3e57afc18b3d68c685173 --- /dev/null +++ b/annotations_1/YRdXmtGnwCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.44], [8.0, 60.59], [61.0, 61.48], [62.0, 65.84], [66.0, 67.22], [69.0, 74.88], [79.0, 100.57], [102.0, 103.05], [104.0, 104.89], [109.0, 109.41], [110.0, 112.99]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.59, 0.0, 32.36, 41.78, 0.0, 0.0, 0.0, 62.89], "audiomae_on_audioset": [null, null, null, [["music", 39.78], ["mains hum", 15.14], ["speech", 13.58]], null, [["whale vocalization", 55.69], ["burping, eructation", 21.14], ["music", 3.68]], [["music", 25.17], ["rumble", 12.83], ["hum", 9.11]], null, null, null, null], "duration": [1.44, 52.59, 0.48, 3.84, 1.22, 5.88, 21.57, 1.05, 0.89, 0.41, 2.99]} \ No newline at end of file diff --git a/annotations_1/YRpgfi7L9Rs_filtered.json b/annotations_1/YRpgfi7L9Rs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa3e3225288c70f3126958bf844038e490efd4d2 --- /dev/null +++ b/annotations_1/YRpgfi7L9Rs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.9], [8.0, 8.14], [11.0, 11.62], [16.0, 19.2], [20.0, 22.22], [25.0, 24.9], [31.0, 31.72], [38.0, 38.2], [42.0, 43.09], [45.0, 46.21], [67.0, 69.67], [70.0, 93.99], [98.0, 99.18]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.46, 57.25, 0.0, 0.0, 0.0, 0.0, 0.0, 34.7, 30.23, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 44.35], ["crack", 3.82], ["mechanisms", 3.13]], null, null, null, null, null, null, [["music", 35.92], ["sound effect", 9.37], ["theremin", 7.27]], [["music", 66.17], ["didgeridoo", 4.42], ["theremin", 3.54]], null], "duration": [0.9, 0.14, 0.62, 3.2, 2.22, -0.1, 0.72, 0.2, 1.09, 1.21, 2.67, 23.99, 1.18]} \ No newline at end of file diff --git a/annotations_1/YRruOzr9_w0_filtered.json b/annotations_1/YRruOzr9_w0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0bcd787062e36f3625a005c3ba67ccf0ca57e71 --- /dev/null +++ b/annotations_1/YRruOzr9_w0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.05], [11.0, 12.51], [16.0, 15.74], [19.0, 19.06], [20.0, 20.65], [25.0, 25.3], [33.0, 33.17], [39.0, 39.56], [41.0, 41.18], [43.0, 42.72], [45.0, 45.08], [59.0, 58.77], [60.0, 60.1], [63.0, 66.02], [71.0, 71.78], [73.0, 72.77], [74.0, 74.36], [79.0, 81.65], [95.0, 95.23], [100.0, 100.25], [102.0, 102.71], [120.0, 120.55], [121.0, 121.36], [123.0, 124.56], [126.0, 126.49], [139.0, 140.32], [144.0, 144.54], [147.0, 147.6], [154.0, 157.67], [160.0, 161.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [72.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.58, 0.0, 0.0, 0.0, 33.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 19.92], ["cattle, bovinae", 14.81], ["whack, thwack", 14.06]], null, null, null, [["laughter", 23.45], ["snicker", 21.41], ["baby laughter", 15.84]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.05, 1.51, -0.26, 0.06, 0.65, 0.3, 0.17, 0.56, 0.18, -0.28, 0.08, -0.23, 0.1, 3.02, 0.78, -0.23, 0.36, 2.65, 0.23, 0.25, 0.71, 0.55, 0.36, 1.56, 0.49, 1.32, 0.54, 0.6, 3.67, 1.74]} \ No newline at end of file diff --git a/annotations_1/YSN08rz66zE_filtered.json b/annotations_1/YSN08rz66zE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db81c10a07be47c48669a8a614e5173c4625e7d7 --- /dev/null +++ b/annotations_1/YSN08rz66zE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.4], [31.0, 39.92], [42.0, 50.65], [53.0, 53.16], [54.0, 55.32], [58.0, 57.96], [60.0, 61.28], [62.0, 62.43], [63.0, 64.0], [65.0, 65.69], [67.0, 67.56], [69.0, 68.94], [70.0, 71.17], [72.0, 72.13], [73.0, 74.8], [76.0, 78.68], [80.0, 84.6], [90.0, 90.71], [96.0, 96.67], [111.0, 111.2], [111.0, 112.43], [115.0, 115.62], [118.0, 120.11], [121.0, 124.26], [129.0, 130.17], [131.0, 130.98], [137.0, 150.58], [155.0, 155.95], [157.0, 159.34], [159.0, 159.43], [161.0, 161.97], [167.0, 167.9], [177.0, 177.65], [183.0, 195.81], [201.0, 202.39], [203.0, 205.5], [208.0, 208.63], [223.0, 224.13], [229.0, 233.52], [241.0, 246.18], [250.0, 251.6]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.58, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.93, 31.89, 0.0, 0.0, 0.0, 0.0, 0.0, 31.18, 29.84, 0.0, 0.0, 30.57, 0.0, 30.31, 0.0, 0.0, 0.0, 0.0, 30.89, 0.0, 30.42, 0.0, 0.0, 30.47, 30.64, 0.0], "audiomae_on_audioset": [null, [["whale vocalization", 54.97], ["car", 5.33], ["music", 3.84]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.72], ["cattle, bovinae", 12.47], ["moo", 10.09]], null, null, null, null, null, [["music", 68.84], ["reggae", 4.99], ["electronic music", 1.83]], [["music", 62.27], ["funny music", 8.11], ["boing", 3.34]], null, null, [["music", 70.3], ["didgeridoo", 3.26], ["reggae", 1.88]], null, [["music", 75.0], ["funny music", 5.22], ["quack", 3.1]], null, null, null, null, [["music", 83.83], ["singing", 2.15], ["reggae", 1.57]], null, [["music", 75.72], ["reggae", 2.81], ["rock and roll", 1.6]], null, null, [["music", 70.9], ["middle eastern music", 4.63], ["carnatic music", 3.3]], [["music", 70.42], ["singing", 2.79], ["reggae", 2.28]], null], "duration": [0.4, 8.92, 8.65, 0.16, 1.32, -0.04, 1.28, 0.43, 1.0, 0.69, 0.56, -0.06, 1.17, 0.13, 1.8, 2.68, 4.6, 0.71, 0.67, 0.2, 1.43, 0.62, 2.11, 3.26, 1.17, -0.02, 13.58, 0.95, 2.34, 0.43, 0.97, 0.9, 0.65, 12.81, 1.39, 2.5, 0.63, 1.13, 4.52, 5.18, 1.6]} \ No newline at end of file diff --git a/annotations_1/YSOUTJUdTgs_filtered.json b/annotations_1/YSOUTJUdTgs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6420528e4bd194445b70f22082e4f1f7bd846183 --- /dev/null +++ b/annotations_1/YSOUTJUdTgs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 16.58], [22.0, 34.92], [38.0, 51.9], [68.0, 72.87], [82.0, 82.81], [87.0, 92.31], [93.0, 93.34], [95.0, 95.47], [99.0, 99.42], [101.0, 104.03], [104.0, 120.9], [121.0, 120.97], [123.0, 126.5], [129.0, 129.03], [143.0, 144.15], [149.0, 149.2], [156.0, 156.52], [159.0, 160.27], [168.0, 168.69], [173.0, 176.28], [177.0, 178.98], [190.0, 190.36], [201.0, 200.94], [201.0, 201.9], [210.0, 211.81], [214.0, 220.08], [222.0, 222.62], [226.0, 250.28], [252.0, 254.55], [257.0, 257.23], [258.0, 261.13]], "keep_status": [false, false, false, true, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false], "silence_prob": [32.07, 28.64, 29.73, 29.38, 0.0, 36.28, 0.0, 0.0, 0.0, 29.05, 29.34, 0.0, 39.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 34.93, 0.0, 29.37, 40.28, 0.0, 98.86], "audiomae_on_audioset": [[["music", 64.32], ["throbbing", 7.82], ["hum", 4.37]], [["music", 46.28], ["speech", 33.22], ["throbbing", 5.81]], [["music", 77.94], ["throbbing", 8.74], ["electronic music", 3.06]], [["groan", 37.39], ["roaring cats (lions, tigers)", 4.15], ["crying, sobbing", 3.85]], null, [["music", 31.95], ["theremin", 19.72], ["hum", 7.06]], null, null, null, [["speech", 32.5], ["sonar", 21.73], ["music", 14.8]], [["throbbing", 54.95], ["music", 18.16], ["hum", 10.34]], null, [["music", 18.66], ["speech", 13.84], ["hum", 6.79]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 29.92], ["explosion", 27.89], ["burst, pop", 5.66]], null, [["explosion", 27.79], ["burst, pop", 7.51], ["eruption", 7.12]], [["livestock, farm animals, working animals", 23.3], ["sheep", 11.48], ["moo", 10.2]], null, null], "duration": [14.58, 12.92, 13.9, 4.87, 0.81, 5.31, 0.34, 0.47, 0.42, 3.03, 16.9, -0.03, 3.5, 0.03, 1.15, 0.2, 0.52, 1.27, 0.69, 3.28, 1.98, 0.36, -0.06, 0.9, 1.81, 6.08, 0.62, 24.28, 2.55, 0.23, 3.13]} \ No newline at end of file diff --git a/annotations_1/YSfBTZfswSg_filtered.json b/annotations_1/YSfBTZfswSg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1e83fbe04187e93c07379ad423728c54510e4d4 --- /dev/null +++ b/annotations_1/YSfBTZfswSg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.07], [21.0, 45.67], [47.0, 47.39], [48.0, 48.66], [49.0, 49.45], [53.0, 61.37]], "keep_status": [false, true, false, false, false, true], "silence_prob": [0.0, 29.88, 0.0, 0.0, 0.0, 29.06], "audiomae_on_audioset": [null, [["speech", 40.07], ["music", 17.15], ["explosion", 8.68]], null, null, null, [["hum", 22.05], ["mains hum", 18.51], ["music", 12.57]]], "duration": [0.07, 24.67, 0.39, 0.66, 0.45, 8.37]} \ No newline at end of file diff --git a/annotations_1/YSrOLez2GbE_filtered.json b/annotations_1/YSrOLez2GbE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e78fd514a1494939587a59d2e5938394a26f313c --- /dev/null +++ b/annotations_1/YSrOLez2GbE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.08], [6.0, 7.45], [9.0, 16.8], [24.0, 25.12], [27.0, 32.46], [33.0, 35.34], [36.0, 39.8], [45.0, 46.13], [50.0, 52.42], [55.0, 56.74], [58.0, 59.1], [60.0, 61.82], [66.0, 67.68], [74.0, 77.14], [81.0, 82.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 0.0, 99.97, 0.0, 99.96, 81.71, 99.98, 0.0, 50.16, 0.0, 0.0, 0.0, 0.0, 89.01, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.08, 1.45, 7.8, 1.12, 5.46, 2.34, 3.8, 1.13, 2.42, 1.74, 1.1, 1.82, 1.68, 3.14, 1.24]} \ No newline at end of file diff --git a/annotations_1/YTdTD0TbEp4_filtered.json b/annotations_1/YTdTD0TbEp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a95545c1c26a44b278693184935c1dc029d242ed --- /dev/null +++ b/annotations_1/YTdTD0TbEp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 69.48], [70.0, 72.35], [73.0, 117.34], [118.0, 118.45]], "keep_status": [false, false, false, false], "silence_prob": [32.43, 31.47, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 65.79], ["music", 11.1], ["noise", 3.69]], [["boing", 49.75], ["music", 18.23], ["speech", 4.73]], null, null], "duration": [12.48, 2.35, 44.34, 0.45]} \ No newline at end of file diff --git a/annotations_1/YV-vi9NuyTw_filtered.json b/annotations_1/YV-vi9NuyTw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6abf7b2baaacd220006c9a1a280e7464ec4b2efc --- /dev/null +++ b/annotations_1/YV-vi9NuyTw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.75], [15.0, 16.17], [17.0, 18.1], [20.0, 23.43], [26.0, 26.45], [32.0, 48.69], [50.0, 54.43], [61.0, 95.17], [96.0, 96.36], [99.0, 103.87], [108.0, 125.85], [126.0, 125.95]], "keep_status": [false, false, false, true, false, true, true, false, false, false, false, false], "silence_prob": [30.38, 0.0, 0.0, 39.02, 0.0, 28.96, 35.53, 0.0, 0.0, 88.83, 41.12, 0.0], "audiomae_on_audioset": [[["speech", 49.15], ["music", 28.85], ["hum", 10.53]], null, null, [["music", 59.81], ["hum", 5.5], ["shuffling cards", 3.98]], null, [["music", 49.22], ["buzz", 11.23], ["mains hum", 5.1]], [["mains hum", 19.67], ["speech", 19.47], ["music", 18.96]], null, null, null, [["mains hum", 44.04], ["hum", 41.03], ["music", 5.79]], null], "duration": [6.75, 1.17, 1.1, 3.43, 0.45, 16.69, 4.43, 34.17, 0.36, 4.87, 17.85, -0.05]} \ No newline at end of file diff --git a/annotations_1/YWJMmQUGP00_filtered.json b/annotations_1/YWJMmQUGP00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..03f4c9fd80579697919654c9ea4e5863e29277d6 --- /dev/null +++ b/annotations_1/YWJMmQUGP00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.0], [7.0, 8.34], [12.0, 12.88], [17.0, 18.12], [21.0, 20.76], [23.0, 23.55], [26.0, 26.03], [27.0, 27.67], [28.0, 28.44], [29.0, 29.42], [30.0, 30.21], [33.0, 33.15], [39.0, 40.32], [57.0, 59.76], [65.0, 65.47], [66.0, 69.31], [70.0, 71.42], [72.0, 73.97], [75.0, 79.1], [81.0, 81.09], [87.0, 88.1], [89.0, 88.92], [90.0, 90.0], [92.0, 92.4], [93.0, 92.92], [98.0, 101.44], [110.0, 110.32], [111.0, 111.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 86.27, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 1.34, 0.88, 1.12, -0.24, 0.55, 0.03, 0.67, 0.44, 0.42, 0.21, 0.15, 1.32, 2.76, 0.47, 3.31, 1.42, 1.97, 4.1, 0.09, 1.1, -0.08, 0.0, 0.4, -0.08, 3.44, 0.32, 0.74]} \ No newline at end of file diff --git a/annotations_1/YYPpg3_Y4XY_filtered.json b/annotations_1/YYPpg3_Y4XY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef8dfcd2914938535050351a276922dbe6bafd1a --- /dev/null +++ b/annotations_1/YYPpg3_Y4XY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 30.43], [31.0, 31.56], [32.0, 32.32], [36.0, 53.82], [57.0, 57.77], [58.0, 59.09], [64.0, 64.93], [71.0, 72.15], [80.0, 103.77], [104.0, 122.45], [123.0, 126.32], [128.0, 133.73], [134.0, 134.37]], "keep_status": [true, false, false, true, false, false, false, false, true, true, true, true, false], "silence_prob": [28.85, 0.0, 0.0, 28.42, 0.0, 0.0, 0.0, 0.0, 28.72, 28.99, 29.03, 28.63, 0.0], "audiomae_on_audioset": [[["speech", 20.91], ["thump, thud", 6.87], ["music", 5.73]], null, null, [["speech", 27.44], ["music", 20.73], ["thump, thud", 9.55]], null, null, null, null, [["music", 27.97], ["noise", 9.41], ["buzz", 8.12]], [["throbbing", 16.46], ["hum", 15.84], ["music", 14.3]], [["speech", 35.75], ["music", 22.58], ["hum", 9.45]], [["speech", 12.72], ["thump, thud", 9.47], ["music", 8.99]], null], "duration": [8.43, 0.56, 0.32, 17.82, 0.77, 1.09, 0.93, 1.15, 23.77, 18.45, 3.32, 5.73, 0.37]} \ No newline at end of file diff --git a/annotations_1/YYZSg-BBAmw_filtered.json b/annotations_1/YYZSg-BBAmw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a62e06c446d436a7490e1b079d3d3344253a584f --- /dev/null +++ b/annotations_1/YYZSg-BBAmw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.08], [12.0, 13.56], [15.0, 17.14], [19.0, 19.2], [21.0, 21.12], [23.0, 24.33], [38.0, 39.66], [43.0, 44.91], [45.0, 46.45], [47.0, 67.14]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.33], "audiomae_on_audioset": [null, null, [["music", 23.2], ["hum", 10.68], ["speech", 10.34]], null, null, null, null, null, null, [["speech", 40.41], ["hum", 24.33], ["mains hum", 15.11]]], "duration": [1.08, 1.56, 2.14, 0.2, 0.12, 1.33, 1.66, 1.91, 1.45, 20.14]} \ No newline at end of file diff --git a/annotations_1/YYo5jJy61T8_filtered.json b/annotations_1/YYo5jJy61T8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22c214b6ce80da0fbbe4448a8f3d18610b79bdc9 --- /dev/null +++ b/annotations_1/YYo5jJy61T8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.41], [3.0, 3.28], [9.0, 8.7], [14.0, 14.57], [16.0, 16.78], [23.0, 24.75], [27.0, 28.98], [30.0, 31.26], [32.0, 35.88], [37.0, 40.22], [41.0, 42.36], [46.0, 46.52], [47.0, 48.05], [49.0, 53.52], [55.0, 56.56], [58.0, 70.33], [72.0, 72.84], [73.0, 75.15], [76.0, 76.49], [78.0, 78.27], [79.0, 79.73], [81.0, 81.19], [85.0, 85.46], [90.0, 91.44], [94.0, 94.81], [97.0, 98.83], [103.0, 103.05], [104.0, 104.31], [105.0, 106.57], [110.0, 110.27], [112.0, 113.12], [116.0, 117.63], [118.0, 129.63], [131.0, 133.44], [134.0, 136.86], [138.0, 144.05], [145.0, 146.75], [147.0, 149.49], [150.0, 151.24], [152.0, 159.34], [161.0, 175.09], [177.0, 178.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 88.46, 0.0, 0.0, 0.0, 98.19, 0.0, 99.93, 0.0, 76.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.9, 100.0, 90.43, 100.0, 0.0, 59.86, 0.0, 99.73, 84.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, 0.28, -0.3, 0.57, 0.78, 1.75, 1.98, 1.26, 3.88, 3.22, 1.36, 0.52, 1.05, 4.52, 1.56, 12.33, 0.84, 2.15, 0.49, 0.27, 0.73, 0.19, 0.46, 1.44, 0.81, 1.83, 0.05, 0.31, 1.57, 0.27, 1.12, 1.63, 11.63, 2.44, 2.86, 6.05, 1.75, 2.49, 1.24, 7.34, 14.09, 1.93]} \ No newline at end of file diff --git a/annotations_1/YYsdcBacV2U_filtered.json b/annotations_1/YYsdcBacV2U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f2e416ae484a4ab7d05b0008f032aa6948e0940 --- /dev/null +++ b/annotations_1/YYsdcBacV2U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.95], [16.0, 17.34], [25.0, 25.57], [36.0, 40.32], [57.0, 57.57], [62.0, 71.07], [76.0, 77.19], [86.0, 87.96], [90.0, 91.18], [91.0, 95.93], [98.0, 108.33], [110.0, 113.27], [126.0, 137.3], [140.0, 154.77], [168.0, 167.95]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.44, 0.0, 40.64, 0.0, 0.0, 0.0, 49.27, 35.28, 31.71, 31.29, 31.38, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 39.72], ["speech", 25.55], ["crowd", 3.73]], null, [["speech", 45.39], ["music", 36.37], ["shatter", 9.01]], null, null, null, [["music", 55.08], ["ambient music", 9.52], ["foghorn", 3.88]], [["music", 58.26], ["hum", 13.44], ["throbbing", 8.17]], [["speech", 36.01], ["music", 29.83], ["hum", 3.09]], [["buzz", 33.75], ["music", 23.65], ["throbbing", 13.81]], [["hum", 27.55], ["throbbing", 26.4], ["music", 19.24]], null], "duration": [0.95, 1.34, 0.57, 4.32, 0.57, 9.07, 1.19, 1.96, 1.18, 4.93, 10.33, 3.27, 11.3, 14.77, -0.05]} \ No newline at end of file diff --git a/annotations_1/YZ5Y_GhXMKw_filtered.json b/annotations_1/YZ5Y_GhXMKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6ee10fe00518050fff4c0dc9d47439bf6cb309a --- /dev/null +++ b/annotations_1/YZ5Y_GhXMKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.1], [9.0, 10.1], [11.0, 11.48], [20.0, 20.73], [21.0, 21.98], [36.0, 44.12], [57.0, 62.5], [64.0, 64.57], [66.0, 71.02], [73.0, 84.55], [85.0, 102.91]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.6, 50.06, 0.0, 99.59, 87.55, 96.89], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 24.76], ["hum", 20.63], ["throbbing", 15.95]], null, null, null, null, null], "duration": [0.1, 1.1, 0.48, 0.73, 0.98, 8.12, 5.5, 0.57, 5.02, 11.55, 17.91]} \ No newline at end of file diff --git a/annotations_1/YZGetnQQU48_filtered.json b/annotations_1/YZGetnQQU48_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..daa8c8ec36d86222f51d4033e1a4aef1c80019ad --- /dev/null +++ b/annotations_1/YZGetnQQU48_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [2.0, 2.59], [5.0, 5.8], [10.0, 10.42], [11.0, 11.92], [13.0, 15.31], [19.0, 31.6], [33.0, 34.05], [36.0, 40.41], [41.0, 42.77], [44.0, 46.18], [47.0, 50.92], [52.0, 52.46], [54.0, 68.07], [70.0, 70.29], [73.0, 78.38], [81.0, 99.6], [102.0, 102.76], [104.0, 105.93], [107.0, 108.18], [111.0, 112.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 95.78, 0.0, 43.82, 0.0, 100.0, 99.68, 0.0, 37.81, 0.0, 42.81, 71.43, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["sidetone", 43.74], ["speech", 21.91], ["music", 5.49]], null, null, null, null, [["music", 34.1], ["speech", 20.02], ["fart", 17.31]], null, [["sonar", 21.58], ["music", 20.89], ["thunk", 20.88]], null, null, null, null, null], "duration": [0.35, 0.59, 0.8, 0.42, 0.92, 2.31, 12.6, 1.05, 4.41, 1.77, 2.18, 3.92, 0.46, 14.07, 0.29, 5.38, 18.6, 0.76, 1.93, 1.18, 1.24]} \ No newline at end of file diff --git a/annotations_1/YZrVYAXYyws_filtered.json b/annotations_1/YZrVYAXYyws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..782d216c173ffd93cc0ed611c2ea0f5be00453f1 --- /dev/null +++ b/annotations_1/YZrVYAXYyws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.45], [13.0, 13.9], [15.0, 15.53], [20.0, 20.53], [23.0, 24.88], [25.0, 26.65], [27.0, 34.64], [37.0, 38.03], [41.0, 45.05], [46.0, 47.97], [50.0, 53.06], [54.0, 56.03], [57.0, 58.16], [60.0, 63.1], [64.0, 79.98], [80.0, 82.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 49.73, 0.0, 85.9, 0.0, 59.77, 73.21, 0.0, 87.37, 36.91, 46.29], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 53.04], ["mains hum", 36.95], ["throbbing", 3.68]], null, null, null, null, null, null, null, [["music", 58.6], ["wild animals", 8.34], ["animal", 7.35]], [["music", 69.68], ["singing bowl", 2.94], ["musical instrument", 2.94]]], "duration": [4.45, 0.9, 0.53, 0.53, 1.88, 1.65, 7.64, 1.03, 4.05, 1.97, 3.06, 2.03, 1.16, 3.1, 15.98, 2.83]} \ No newline at end of file diff --git a/annotations_1/Y_U49qqwDGI_filtered.json b/annotations_1/Y_U49qqwDGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..438eb0c406af23e5c5e9ea034a7cc31ed1592149 --- /dev/null +++ b/annotations_1/Y_U49qqwDGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [3.0, 3.18], [17.0, 18.74], [21.0, 30.47], [37.0, 42.53], [43.0, 45.59], [47.0, 50.25], [52.0, 61.64], [67.0, 72.54], [81.0, 80.81], [83.0, 86.66], [91.0, 91.67], [93.0, 95.64], [102.0, 102.91], [108.0, 118.69], [120.0, 120.82], [122.0, 122.32], [125.0, 131.52], [132.0, 132.44], [132.0, 132.83], [134.0, 138.72], [141.0, 150.06], [154.0, 175.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.83, 28.8, 28.94, 28.75, 28.61, 29.7, 0.0, 28.63, 0.0, 37.35, 0.0, 28.71, 0.0, 0.0, 28.79, 0.0, 0.0, 28.18, 28.46, 30.68], "audiomae_on_audioset": [null, null, null, [["music", 85.11], ["electronic music", 4.39], ["throbbing", 2.22]], [["music", 84.83], ["electronic music", 5.18], ["dubstep", 2.42]], [["music", 75.02], ["electronic music", 6.38], ["dubstep", 3.78]], [["music", 76.61], ["speech", 7.66], ["electronic music", 1.76]], [["music", 76.87], ["throbbing", 6.47], ["cacophony", 4.19]], [["throbbing", 64.69], ["music", 16.45], ["hum", 9.91]], null, [["music", 31.19], ["hum", 14.56], ["zipper (clothing)", 10.48]], null, [["music", 62.86], ["dubstep", 11.78], ["electronic music", 4.42]], null, [["music", 67.37], ["throbbing", 7.66], ["hum", 5.33]], null, null, [["music", 54.01], ["buzz", 9.25], ["fly, housefly", 4.39]], null, null, [["music", 66.86], ["throbbing", 5.18], ["cacophony", 4.67]], [["hum", 42.57], ["mains hum", 35.01], ["throbbing", 4.91]], [["music", 54.26], ["hum", 10.58], ["mains hum", 7.97]]], "duration": [0.5, 0.18, 1.74, 9.47, 5.53, 2.59, 3.25, 9.64, 5.54, -0.19, 3.66, 0.67, 2.64, 0.91, 10.69, 0.82, 0.32, 6.52, 0.44, 0.83, 4.72, 9.06, 21.19]} \ No newline at end of file diff --git a/annotations_1/YaUe_zBgQ9I_filtered.json b/annotations_1/YaUe_zBgQ9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48717ca83712f10658f6963fb8c18b5b5d25d3d9 --- /dev/null +++ b/annotations_1/YaUe_zBgQ9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[110.0, 111.23], [113.0, 124.44], [127.0, 126.66]], "keep_status": [false, true, false], "silence_prob": [0.0, 32.79, 0.0], "audiomae_on_audioset": [null, [["throbbing", 37.83], ["music", 16.31], ["hum", 14.8]], null], "duration": [1.23, 11.44, -0.34]} \ No newline at end of file diff --git a/annotations_1/YauDSh8CfwI_filtered.json b/annotations_1/YauDSh8CfwI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eec8344a15273758381c7dea1c2ff201994cf909 --- /dev/null +++ b/annotations_1/YauDSh8CfwI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.48], [2.0, 2.3], [3.0, 3.2], [4.0, 5.16], [6.0, 7.15], [8.0, 8.56], [9.0, 20.22], [26.0, 26.52], [28.0, 28.71], [30.0, 30.82], [32.0, 33.0], [34.0, 34.89], [36.0, 36.0], [38.0, 38.52], [40.0, 40.86], [45.0, 44.98], [48.0, 48.61], [51.0, 51.41], [54.0, 54.24], [55.0, 55.81], [57.0, 57.15], [59.0, 60.02], [60.0, 61.35], [62.0, 63.41], [65.0, 65.16], [67.0, 67.44], [69.0, 69.28], [70.0, 70.82], [74.0, 75.25], [76.0, 77.75], [79.0, 80.28], [82.0, 82.49], [83.0, 83.83], [86.0, 86.68], [92.0, 94.64], [96.0, 96.62], [99.0, 100.23], [102.0, 102.22], [103.0, 103.92], [105.0, 106.83], [109.0, 110.51], [112.0, 112.48], [114.0, 114.72], [118.0, 118.44], [120.0, 121.37], [123.0, 123.89], [130.0, 131.23], [134.0, 134.32], [137.0, 137.27], [139.0, 139.78], [141.0, 145.35], [146.0, 149.98], [151.0, 161.69], [166.0, 168.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 74.76, 88.28, 90.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.3, 0.2, 1.16, 1.15, 0.56, 11.22, 0.52, 0.71, 0.82, 1.0, 0.89, 0.0, 0.52, 0.86, -0.02, 0.61, 0.41, 0.24, 0.81, 0.15, 1.02, 1.35, 1.41, 0.16, 0.44, 0.28, 0.82, 1.25, 1.75, 1.28, 0.49, 0.83, 0.68, 2.64, 0.62, 1.23, 0.22, 0.92, 1.83, 1.51, 0.48, 0.72, 0.44, 1.37, 0.89, 1.23, 0.32, 0.27, 0.78, 4.35, 3.98, 10.69, 2.89]} \ No newline at end of file diff --git a/annotations_1/Yb4Lrplxq_A_filtered.json b/annotations_1/Yb4Lrplxq_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b2648054eabb89576cc17b131f1132550b30c7e --- /dev/null +++ b/annotations_1/Yb4Lrplxq_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.34], [12.0, 14.66], [16.0, 16.82]], "keep_status": [false, false, false], "silence_prob": [29.82, 31.89, 0.0], "audiomae_on_audioset": [[["music", 39.96], ["hum", 23.37], ["mains hum", 10.05]], [["sidetone", 51.06], ["hum", 19.88], ["throbbing", 7.63]], null], "duration": [7.34, 2.66, 0.82]} \ No newline at end of file diff --git a/annotations_1/YdcWFWm4n6g_filtered.json b/annotations_1/YdcWFWm4n6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0f6e8f330bbd20d911354368711bd4afda27413 --- /dev/null +++ b/annotations_1/YdcWFWm4n6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.28], [16.0, 25.03], [26.0, 45.67], [46.0, 50.48], [50.0, 50.52]], "keep_status": [true, true, true, false, false], "silence_prob": [37.49, 38.63, 36.7, 36.38, 0.0], "audiomae_on_audioset": [[["electric shaver, electric razor", 27.73], ["speech", 22.31], ["music", 12.71]], [["music", 40.97], ["whack, thwack", 16.07], ["grunt", 8.43]], [["music", 38.76], ["hum", 6.37], ["ambient music", 3.13]], [["fly, housefly", 35.21], ["insect", 24.66], ["mosquito", 12.5]], null], "duration": [5.28, 9.03, 19.67, 4.48, 0.52]} \ No newline at end of file diff --git a/annotations_1/YdowX3H-hGo_filtered.json b/annotations_1/YdowX3H-hGo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c79b5af41cc91cd9748b125dd88868ac53f42f6 --- /dev/null +++ b/annotations_1/YdowX3H-hGo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.54], [15.0, 17.79], [18.0, 20.48], [24.0, 24.19], [28.0, 28.22], [34.0, 34.64], [58.0, 58.58], [69.0, 69.84], [72.0, 71.86], [94.0, 95.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.64, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 2.79, 2.48, 0.19, 0.22, 0.64, 0.58, 0.84, -0.14, 1.37]} \ No newline at end of file diff --git a/annotations_1/YduLKKYfgSk_filtered.json b/annotations_1/YduLKKYfgSk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/YduLKKYfgSk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/YeDjVvr-6Zc_filtered.json b/annotations_1/YeDjVvr-6Zc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea5cacfbd699e75c7520901d7638868b9c118250 --- /dev/null +++ b/annotations_1/YeDjVvr-6Zc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 14.91], [19.0, 21.57], [22.0, 22.38], [23.0, 25.71], [32.0, 32.53], [33.0, 36.8], [39.0, 39.04], [49.0, 49.05], [50.0, 65.64], [66.0, 93.5], [94.0, 93.53], [94.0, 93.75], [95.0, 95.52], [98.0, 101.14], [101.0, 102.09], [105.0, 114.22], [115.0, 117.0], [125.0, 125.31], [127.0, 143.04], [150.0, 155.04], [159.0, 160.07], [162.0, 164.49], [167.0, 168.1], [170.0, 173.84], [179.0, 201.9], [202.0, 204.23], [205.0, 205.83], [209.0, 209.17], [210.0, 212.13]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [31.24, 96.66, 0.0, 41.87, 0.0, 34.77, 0.0, 0.0, 30.26, 30.28, 0.0, 0.0, 0.0, 39.27, 0.0, 33.42, 55.46, 0.0, 34.19, 67.13, 0.0, 81.17, 0.0, 33.27, 30.08, 36.44, 0.0, 0.0, 70.16], "audiomae_on_audioset": [[["music", 57.36], ["synthesizer", 7.56], ["theremin", 6.01]], null, null, [["speech", 88.26], ["grunt", 3.68], ["speech synthesizer", 2.11]], null, [["grunt", 33.1], ["music", 11.22], ["noise", 6.63]], null, null, [["music", 82.41], ["synthesizer", 2.28], ["hum", 1.78]], [["music", 40.42], ["speech", 30.64], ["whack, thwack", 4.23]], null, null, null, [["music", 43.55], ["speech", 28.21], ["didgeridoo", 10.45]], null, [["music", 47.4], ["whack, thwack", 13.42], ["throbbing", 5.02]], null, null, [["music", 40.83], ["hum", 8.99], ["synthesizer", 4.71]], null, null, null, null, [["music", 39.45], ["speech", 8.87], ["ding", 4.63]], [["music", 78.69], ["didgeridoo", 3.21], ["theremin", 2.64]], [["music", 83.51], ["didgeridoo", 2.89], ["throbbing", 2.62]], null, null, null], "duration": [8.91, 2.57, 0.38, 2.71, 0.53, 3.8, 0.04, 0.05, 15.64, 27.5, -0.47, -0.25, 0.52, 3.14, 1.09, 9.22, 2.0, 0.31, 16.04, 5.04, 1.07, 2.49, 1.1, 3.84, 22.9, 2.23, 0.83, 0.17, 2.13]} \ No newline at end of file diff --git a/annotations_1/YejzV_nWN1M_filtered.json b/annotations_1/YejzV_nWN1M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e0bf92c8648fab920ab48bbb62f13626d1c216f --- /dev/null +++ b/annotations_1/YejzV_nWN1M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.84], [12.0, 12.55], [14.0, 15.7], [16.0, 18.12], [20.0, 23.53], [25.0, 28.86], [32.0, 31.77], [36.0, 36.49], [39.0, 39.04], [40.0, 41.49], [43.0, 44.31], [45.0, 45.52], [47.0, 48.2], [49.0, 51.27], [52.0, 53.94], [55.0, 55.86], [59.0, 59.56], [60.0, 60.17], [60.0, 61.42], [62.0, 62.63], [65.0, 64.88], [66.0, 72.42], [74.0, 73.87], [81.0, 81.03], [81.0, 81.65], [89.0, 95.69], [98.0, 127.97], [130.0, 132.68], [133.0, 149.74], [151.0, 159.26], [160.0, 160.95]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [58.55, 0.0, 0.0, 41.74, 60.89, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.21, 0.0, 0.0, 0.0, 30.44, 28.72, 30.85, 28.7, 32.25, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 37.32], ["sonar", 6.43], ["speech", 4.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.4], ["speech", 29.5], ["boom", 9.01]], null, null, null, [["throbbing", 48.81], ["music", 20.79], ["hum", 19.34]], [["music", 31.05], ["cacophony", 17.31], ["machine gun", 13.19]], [["music", 70.02], ["speech", 10.43], ["hum", 4.85]], [["speech", 43.73], ["music", 22.01], ["boom", 3.53]], [["music", 64.07], ["throbbing", 13.95], ["hum", 7.13]], null], "duration": [3.84, 0.55, 1.7, 2.12, 3.53, 3.86, -0.23, 0.49, 0.04, 1.49, 1.31, 0.52, 1.2, 2.27, 1.94, 0.86, 0.56, 0.17, 1.42, 0.63, -0.12, 6.42, -0.13, 0.03, 0.65, 6.69, 29.97, 2.68, 16.74, 8.26, 0.95]} \ No newline at end of file diff --git a/annotations_1/YeqQ-Iae_VI_filtered.json b/annotations_1/YeqQ-Iae_VI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23199ca965d3355f7f61845739b4286daacf3d35 --- /dev/null +++ b/annotations_1/YeqQ-Iae_VI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 16.7], [18.0, 19.36], [21.0, 22.2], [24.0, 24.51], [28.0, 28.93], [30.0, 31.36], [32.0, 32.88], [35.0, 36.58], [38.0, 38.47], [39.0, 40.37], [41.0, 41.64], [48.0, 49.1], [52.0, 52.88], [54.0, 54.45], [57.0, 57.69], [58.0, 60.34], [61.0, 63.56], [65.0, 68.28], [71.0, 74.49], [81.0, 81.73], [83.0, 84.79], [86.0, 89.31], [92.0, 93.31], [95.0, 95.4], [97.0, 100.4], [103.0, 108.41], [111.0, 113.76], [116.0, 120.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 92.48, 97.54, 100.0, 0.0, 0.0, 98.44, 0.0, 0.0, 62.68, 62.27, 85.35, 99.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [14.7, 1.36, 1.2, 0.51, 0.93, 1.36, 0.88, 1.58, 0.47, 1.37, 0.64, 1.1, 0.88, 0.45, 0.69, 2.34, 2.56, 3.28, 3.49, 0.73, 1.79, 3.31, 1.31, 0.4, 3.4, 5.41, 2.76, 4.61]} \ No newline at end of file diff --git a/annotations_1/YfKjUgN_RcY_filtered.json b/annotations_1/YfKjUgN_RcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b36773ad1c986fa72b9ca7acb15e1a25c33ef005 --- /dev/null +++ b/annotations_1/YfKjUgN_RcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 19.3], [22.0, 21.83], [22.0, 22.79], [24.0, 93.55], [99.0, 99.98], [105.0, 108.92], [116.0, 116.94], [117.0, 124.36], [125.0, 129.73], [130.0, 130.72], [132.0, 132.71], [135.0, 135.3], [140.0, 141.84], [143.0, 145.32], [147.0, 148.26], [153.0, 153.17], [156.0, 157.64], [158.0, 158.84], [160.0, 162.01], [162.0, 164.69], [167.0, 171.29]], "keep_status": [true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [44.26, 0.0, 0.0, 0.0, 0.0, 43.61, 0.0, 32.53, 37.74, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 32.76, 34.15, 47.01], "audiomae_on_audioset": [[["music", 18.34], ["synthesizer", 9.91], ["didgeridoo", 9.89]], null, null, null, null, [["music", 41.07], ["speech", 16.1], ["didgeridoo", 13.18]], null, [["speech", 24.91], ["music", 22.99], ["didgeridoo", 5.36]], [["music", 18.15], ["speech", 15.99], ["moo", 12.77]], null, null, null, null, null, null, null, null, null, [["speech", 18.84], ["music", 13.91], ["didgeridoo", 11.14]], [["music", 31.68], ["speech", 16.92], ["hum", 11.54]], [["music", 21.27], ["dog", 11.03], ["animal", 8.02]]], "duration": [6.3, -0.17, 0.79, 69.55, 0.98, 3.92, 0.94, 7.36, 4.73, 0.72, 0.71, 0.3, 1.84, 2.32, 1.26, 0.17, 1.64, 0.84, 2.01, 2.69, 4.29]} \ No newline at end of file diff --git a/annotations_1/YfdRr7MWax4_filtered.json b/annotations_1/YfdRr7MWax4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebb8c36185d73ae4a35d8cf151b11d3c8a6c46d --- /dev/null +++ b/annotations_1/YfdRr7MWax4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.94], [7.0, 7.53], [13.0, 13.37], [21.0, 20.8], [22.0, 22.99], [27.0, 29.24], [30.0, 33.03], [35.0, 36.1], [37.0, 39.12], [40.0, 40.19], [42.0, 45.0], [48.0, 48.22], [50.0, 52.57], [53.0, 55.07], [56.0, 75.9], [81.0, 82.34], [85.0, 85.16], [88.0, 89.99], [92.0, 93.34], [96.0, 97.01], [99.0, 100.01], [102.0, 102.17], [104.0, 111.2], [113.0, 114.52], [117.0, 118.74], [120.0, 120.92], [124.0, 126.23], [129.0, 129.05], [132.0, 133.42], [136.0, 136.46], [140.0, 142.35], [150.0, 151.24], [153.0, 153.3], [157.0, 158.82], [160.0, 159.92], [161.0, 162.31], [166.0, 166.58], [169.0, 170.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 59.96, 0.0, 68.41, 46.05, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 0.0, 55.39, 0.0, 0.0, 0.0, 51.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.61], ["sidetone", 9.03], ["chirp tone", 8.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.06, 0.53, 0.37, -0.2, 0.99, 2.24, 3.03, 1.1, 2.12, 0.19, 3.0, 0.22, 2.57, 2.07, 19.9, 1.34, 0.16, 1.99, 1.34, 1.01, 1.01, 0.17, 7.2, 1.52, 1.74, 0.92, 2.23, 0.05, 1.42, 0.46, 2.35, 1.24, 0.3, 1.82, -0.08, 1.31, 0.58, 1.85]} \ No newline at end of file diff --git a/annotations_1/Yfqg-PxRCD8_filtered.json b/annotations_1/Yfqg-PxRCD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4202f2f847a5820c90f3642b1131d22754efec03 --- /dev/null +++ b/annotations_1/Yfqg-PxRCD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.1], [19.0, 19.45], [20.0, 20.66], [35.0, 35.51], [67.0, 67.1], [116.0, 116.26], [129.0, 132.71], [135.0, 135.75], [136.0, 140.44], [144.0, 144.17], [146.0, 146.42], [169.0, 169.87], [171.0, 172.25], [173.0, 173.79]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.24, 0.0, 37.8, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 58.91], ["musical instrument", 9.75], ["carnatic music", 9.35]], null, [["music", 54.54], ["theremin", 8.59], ["glockenspiel", 3.25]], null, null, null, null, null], "duration": [0.1, 0.45, 0.66, 0.51, 0.1, 0.26, 3.71, 0.75, 4.44, 0.17, 0.42, 0.87, 1.25, 0.79]} \ No newline at end of file diff --git a/annotations_1/Yg1qC5VGoLw_filtered.json b/annotations_1/Yg1qC5VGoLw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..582bb2a2f37d6e5597958431f841a018d078aba3 --- /dev/null +++ b/annotations_1/Yg1qC5VGoLw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.39], [8.0, 8.23], [10.0, 16.09], [18.0, 18.45], [27.0, 27.6], [32.0, 32.02], [32.0, 35.41], [36.0, 36.98], [38.0, 39.02], [40.0, 40.98], [42.0, 43.9], [60.0, 60.42], [63.0, 64.18], [65.0, 66.36], [68.0, 69.38], [74.0, 74.39], [78.0, 78.95], [81.0, 81.4], [84.0, 84.75], [88.0, 99.47], [103.0, 107.42], [110.0, 110.32]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 32.28, 0.0, 0.0, 0.0, 35.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.37, 33.52, 0.0], "audiomae_on_audioset": [null, null, [["speech", 71.04], ["electric shaver, electric razor", 9.38], ["music", 4.42]], null, null, null, [["speech", 39.07], ["sidetone", 7.75], ["inside, small room", 5.6]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 15.77], ["moo", 13.01], ["livestock, farm animals, working animals", 12.35]], [["sheep", 71.32], ["bleat", 11.4], ["animal", 4.87]], null], "duration": [0.39, 0.23, 6.09, 0.45, 0.6, 0.02, 3.41, 0.98, 1.02, 0.98, 1.9, 0.42, 1.18, 1.36, 1.38, 0.39, 0.95, 0.4, 0.75, 11.47, 4.42, 0.32]} \ No newline at end of file diff --git a/annotations_1/Yg53M7TYpuo_filtered.json b/annotations_1/Yg53M7TYpuo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e33f0a025abb62dfaee9acf9aae8a80c954bd1c --- /dev/null +++ b/annotations_1/Yg53M7TYpuo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.97], [6.0, 36.75], [48.0, 64.83], [68.0, 78.51], [81.0, 142.74]], "keep_status": [true, false, true, true, false], "silence_prob": [31.5, 0.0, 30.48, 29.41, 0.0], "audiomae_on_audioset": [[["music", 22.86], ["noise", 13.38], ["didgeridoo", 10.99]], null, [["music", 36.65], ["smash, crash", 14.37], ["breaking", 11.92]], [["music", 57.56], ["cacophony", 4.79], ["musical instrument", 4.05]], null], "duration": [4.97, 30.75, 16.83, 10.51, 61.74]} \ No newline at end of file diff --git a/annotations_1/Yg6sZ2htZfc_filtered.json b/annotations_1/Yg6sZ2htZfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95eb8290264487c5997ad5c156d2d0ec36429f96 --- /dev/null +++ b/annotations_1/Yg6sZ2htZfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.02], [6.0, 7.06], [10.0, 13.96], [14.0, 15.69], [21.0, 39.55], [40.0, 40.63], [45.0, 45.86], [49.0, 53.42], [55.0, 54.89], [56.0, 56.44], [61.0, 60.91], [62.0, 62.43], [65.0, 73.55], [79.0, 79.27], [82.0, 83.4], [84.0, 87.0], [89.0, 100.36], [101.0, 101.85], [104.0, 111.5], [112.0, 112.4], [114.0, 122.15], [127.0, 127.82], [129.0, 135.08], [136.0, 136.43], [139.0, 145.62], [149.0, 223.05], [225.0, 228.11], [230.0, 232.01]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.4, 0.0, 82.61, 0.0, 66.27, 0.0, 0.0, 57.48, 0.0, 0.0, 0.0, 0.0, 59.77, 0.0, 0.0, 62.58, 59.51, 0.0, 54.63, 0.0, 58.38, 0.0, 65.32, 0.0, 60.51, 0.0, 72.01, 79.07], "audiomae_on_audioset": [[["music", 55.76], ["noise", 4.56], ["didgeridoo", 3.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.02, 1.06, 3.96, 1.69, 18.55, 0.63, 0.86, 4.42, -0.11, 0.44, -0.09, 0.43, 8.55, 0.27, 1.4, 3.0, 11.36, 0.85, 7.5, 0.4, 8.15, 0.82, 6.08, 0.43, 6.62, 74.05, 3.11, 2.01]} \ No newline at end of file diff --git a/annotations_1/YgnhijYmavY_filtered.json b/annotations_1/YgnhijYmavY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5902524479bcdd9d1febe5eaadde36fc10b90a73 --- /dev/null +++ b/annotations_1/YgnhijYmavY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.43], [14.0, 25.17], [27.0, 27.7], [31.0, 31.97], [34.0, 33.91], [36.0, 36.27], [38.0, 38.58], [46.0, 48.51], [51.0, 51.75], [53.0, 59.19], [62.0, 65.99], [67.0, 73.38], [76.0, 78.49], [95.0, 96.75], [97.0, 98.56], [100.0, 101.9], [103.0, 103.64], [109.0, 110.02], [111.0, 112.13], [113.0, 113.76]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.92, 0.0, 0.0, 0.0, 0.0, 0.0, 58.13, 0.0, 30.84, 48.06, 52.05, 36.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["whale vocalization", 10.83], ["music", 10.7], ["speech", 8.31]], [["speech", 52.72], ["noise", 4.12], ["wild animals", 3.75]], null, [["speech", 12.62], ["moo", 10.64], ["music", 10.06]], null, null, null, null, null, null, null], "duration": [1.43, 11.17, 0.7, 0.97, -0.09, 0.27, 0.58, 2.51, 0.75, 6.19, 3.99, 6.38, 2.49, 1.75, 1.56, 1.9, 0.64, 1.02, 1.13, 0.76]} \ No newline at end of file diff --git a/annotations_1/Yh03Vnp8pCk_filtered.json b/annotations_1/Yh03Vnp8pCk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d339e885cf34821e8bba40bf16032f7eb0c4f8dc --- /dev/null +++ b/annotations_1/Yh03Vnp8pCk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 31.31], [33.0, 33.15], [34.0, 35.07], [36.0, 36.96], [38.0, 38.82], [40.0, 40.78], [42.0, 42.65], [44.0, 44.42], [46.0, 89.06], [89.0, 90.0], [91.0, 91.88], [92.0, 112.5], [114.0, 114.47], [115.0, 116.6]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.01, 0.0, 0.0], "audiomae_on_audioset": [[["music", 46.3], ["musical instrument", 9.19], ["effects unit", 8.15]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.31, 0.15, 1.07, 0.96, 0.82, 0.78, 0.65, 0.42, 43.06, 1.0, 0.88, 20.5, 0.47, 1.6]} \ No newline at end of file diff --git a/annotations_1/YiCzTGRqCQ4_filtered.json b/annotations_1/YiCzTGRqCQ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..559143d1dc3922286a7be1baff4d9566a739319b --- /dev/null +++ b/annotations_1/YiCzTGRqCQ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.75], [3.0, 10.76], [11.0, 11.5], [14.0, 15.2], [16.0, 20.26], [20.0, 21.37], [23.0, 48.96], [51.0, 57.21], [58.0, 80.81], [81.0, 85.65], [89.0, 92.97], [94.0, 122.25], [124.0, 124.24]], "keep_status": [false, true, false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [0.0, 36.16, 0.0, 0.0, 33.45, 0.0, 35.36, 31.13, 35.61, 33.45, 41.52, 33.92, 0.0], "audiomae_on_audioset": [null, [["music", 20.07], ["screaming", 17.52], ["speech", 13.67]], null, null, [["music", 64.16], ["didgeridoo", 8.05], ["musical instrument", 5.56]], null, [["music", 59.94], ["speech", 13.21], ["whack, thwack", 4.98]], [["music", 72.51], ["musical instrument", 3.44], ["whale vocalization", 2.37]], [["noise", 34.98], ["music", 22.13], ["theremin", 7.51]], [["music", 38.46], ["hum", 19.09], ["whale vocalization", 5.07]], [["music", 51.81], ["didgeridoo", 6.34], ["mains hum", 6.19]], [["cattle, bovinae", 43.3], ["moo", 31.6], ["livestock, farm animals, working animals", 13.24]], null], "duration": [0.75, 7.76, 0.5, 1.2, 4.26, 1.37, 25.96, 6.21, 22.81, 4.65, 3.97, 28.25, 0.24]} \ No newline at end of file diff --git a/annotations_1/YihADAPOCWU_filtered.json b/annotations_1/YihADAPOCWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7120d0febec20c70741e16a5c884ab5ec91e19ac --- /dev/null +++ b/annotations_1/YihADAPOCWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 19.92], [21.0, 22.03], [23.0, 23.67], [27.0, 27.4], [32.0, 32.78], [34.0, 35.26], [43.0, 43.04], [58.0, 58.9], [61.0, 64.45]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [65.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [8.92, 1.03, 0.67, 0.4, 0.78, 1.26, 0.04, 0.9, 3.45]} \ No newline at end of file diff --git a/annotations_1/YjJ2tMg4tTA_filtered.json b/annotations_1/YjJ2tMg4tTA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52f0f8bfa79c306f241d2d486c773d6b4e38f9b5 --- /dev/null +++ b/annotations_1/YjJ2tMg4tTA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.95], [42.0, 52.76], [55.0, 56.05], [58.0, 59.39], [63.0, 62.9], [66.0, 67.51], [72.0, 74.21], [76.0, 76.33], [78.0, 79.51], [81.0, 81.85], [86.0, 86.78], [92.0, 93.77], [95.0, 95.99], [98.0, 98.39], [100.0, 137.66], [144.0, 145.52], [146.0, 145.67], [151.0, 151.51], [156.0, 155.9], [159.0, 159.17], [160.0, 162.84], [165.0, 166.55], [169.0, 169.52], [173.0, 172.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.77, 98.1, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 71.88], ["vehicle", 2.64], ["outside, rural or natural", 1.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.95, 10.76, 1.05, 1.39, -0.1, 1.51, 2.21, 0.33, 1.51, 0.85, 0.78, 1.77, 0.99, 0.39, 37.66, 1.52, -0.33, 0.51, -0.1, 0.17, 2.84, 1.55, 0.52, -0.06]} \ No newline at end of file diff --git a/annotations_1/YjbYhnnEDRo_filtered.json b/annotations_1/YjbYhnnEDRo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..548ac4f8ee9ea3efb2bf01be42a26a0e3f4360c3 --- /dev/null +++ b/annotations_1/YjbYhnnEDRo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.63], [7.0, 8.51], [17.0, 23.41], [25.0, 24.9], [27.0, 30.27], [32.0, 33.67], [36.0, 38.69], [40.0, 42.42], [43.0, 43.24], [44.0, 46.01], [47.0, 48.15], [52.0, 68.55], [70.0, 70.7], [72.0, 71.58], [78.0, 78.38], [79.0, 78.83], [80.0, 80.18], [81.0, 81.55], [82.0, 83.13], [85.0, 89.34], [90.0, 91.32], [99.0, 104.85], [105.0, 107.45], [108.0, 113.49], [115.0, 121.12], [121.0, 125.14], [125.0, 125.2], [127.0, 132.6], [133.0, 139.56], [142.0, 149.32], [151.0, 151.73], [155.0, 162.03], [163.0, 162.94], [167.0, 167.48], [173.0, 172.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.42, 0.0, 97.0, 0.0, 97.83, 0.0, 99.59, 99.16, 0.0, 99.88, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 100.0, 94.81, 100.0, 93.76, 99.4, 0.0, 85.35, 89.72, 59.15, 0.0, 54.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.63, 1.51, 6.41, -0.1, 3.27, 1.67, 2.69, 2.42, 0.24, 2.01, 1.15, 16.55, 0.7, -0.42, 0.38, -0.17, 0.18, 0.55, 1.13, 4.34, 1.32, 5.85, 2.45, 5.49, 6.12, 4.14, 0.2, 5.6, 6.56, 7.32, 0.73, 7.03, -0.06, 0.48, -0.29]} \ No newline at end of file diff --git a/annotations_1/YjewWZ3JWiE_filtered.json b/annotations_1/YjewWZ3JWiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..178b20daf97133c04b993a9128578e6b00acd886 --- /dev/null +++ b/annotations_1/YjewWZ3JWiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.86], [11.0, 13.47], [14.0, 14.4], [22.0, 22.44], [28.0, 30.35], [32.0, 31.94], [38.0, 38.97], [52.0, 53.06], [63.0, 66.06], [78.0, 79.41], [81.0, 82.95], [84.0, 85.13], [89.0, 92.43], [94.0, 97.87], [99.0, 99.05], [102.0, 106.0], [109.0, 109.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 85.72, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 34.71, 0.0, 0.0, 0.0, 49.18, 41.34, 0.0, 35.42, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 82.01], ["breaking", 3.14], ["groan", 1.6]], null, null, null, [["music", 65.18], ["synthesizer", 5.73], ["boing", 3.05]], [["music", 71.98], ["boing", 7.51], ["electronic music", 2.74]], null, [["speech", 38.44], ["music", 33.94], ["foghorn", 3.84]], null], "duration": [-0.14, 2.47, 0.4, 0.44, 2.35, -0.06, 0.97, 1.06, 3.06, 1.41, 1.95, 1.13, 3.43, 3.87, 0.05, 4.0, 0.09]} \ No newline at end of file diff --git a/annotations_1/YjfLp0bll5U_filtered.json b/annotations_1/YjfLp0bll5U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84f1a9b2fabfcab7fc8de6b2dcbbdf8a69821276 --- /dev/null +++ b/annotations_1/YjfLp0bll5U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.35], [20.0, 20.29], [21.0, 21.29], [22.0, 23.45], [24.0, 25.19], [26.0, 30.91], [32.0, 37.42], [40.0, 46.18], [47.0, 60.03], [64.0, 64.22], [65.0, 65.43], [71.0, 77.09], [78.0, 107.74], [110.0, 111.96], [113.0, 113.32], [114.0, 114.88], [122.0, 125.71], [126.0, 126.0], [126.0, 129.15], [130.0, 130.13], [132.0, 132.29]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [57.01, 0.0, 0.0, 0.0, 0.0, 34.31, 28.13, 28.19, 28.45, 0.0, 0.0, 30.81, 29.17, 0.0, 0.0, 0.0, 29.36, 0.0, 33.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 59.64], ["thunk", 4.59], ["whack, thwack", 3.33]], [["speech", 44.18], ["music", 18.15], ["explosion", 7.8]], [["music", 32.54], ["breaking", 10.19], ["whack, thwack", 8.0]], [["music", 56.17], ["speech", 29.56], ["whack, thwack", 2.06]], null, null, [["music", 60.01], ["throbbing", 19.12], ["electronic music", 5.02]], [["music", 67.6], ["speech", 13.62], ["electric shaver, electric razor", 1.58]], null, null, null, [["music", 20.13], ["speech", 20.11], ["whack, thwack", 12.96]], null, [["speech", 36.86], ["breaking", 14.09], ["smash, crash", 14.0]], null, null], "duration": [2.35, 0.29, 0.29, 1.45, 1.19, 4.91, 5.42, 6.18, 13.03, 0.22, 0.43, 6.09, 29.74, 1.96, 0.32, 0.88, 3.71, 0.0, 3.15, 0.13, 0.29]} \ No newline at end of file diff --git a/annotations_1/YkfEc-PYJ8A_filtered.json b/annotations_1/YkfEc-PYJ8A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42c64f9a95ab40473f2f49af2449662b65553cce --- /dev/null +++ b/annotations_1/YkfEc-PYJ8A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.27], [11.0, 13.02], [16.0, 16.17], [16.0, 20.06], [23.0, 25.05], [29.0, 30.06], [41.0, 42.72], [47.0, 74.68], [76.0, 76.18], [78.0, 81.45], [82.0, 82.66], [84.0, 85.51], [88.0, 107.18], [108.0, 111.91], [113.0, 120.87], [121.0, 123.08], [125.0, 125.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 70.3, 0.0, 41.6, 57.01, 0.0, 0.0, 59.07, 0.0, 45.11, 0.0, 0.0, 37.06, 33.27, 31.15, 30.92, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 37.73], ["sidetone", 26.06], ["music", 8.76]], null, null, null, null, null, [["speech", 53.12], ["music", 19.69], ["synthesizer", 4.09]], null, null, [["music", 84.42], ["ambient music", 3.23], ["synthesizer", 2.08]], [["music", 34.33], ["throbbing", 10.2], ["hum", 7.7]], [["music", 29.29], ["grunt", 8.25], ["hum", 7.96]], [["speech", 42.63], ["music", 12.93], ["hum", 9.93]], null], "duration": [1.27, 2.02, 0.17, 4.06, 2.05, 1.06, 1.72, 27.68, 0.18, 3.45, 0.66, 1.51, 19.18, 3.91, 7.87, 2.08, 0.59]} \ No newline at end of file diff --git a/annotations_1/YlbjPR7t1IU_filtered.json b/annotations_1/YlbjPR7t1IU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d5da50984576aefcf0e298c7a7a5b58747120d6 --- /dev/null +++ b/annotations_1/YlbjPR7t1IU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.16], [0.0, 1.38], [12.0, 12.18], [27.0, 27.4], [28.0, 28.46], [30.0, 30.47], [33.0, 34.13], [45.0, 46.11], [50.0, 50.57], [84.0, 85.55], [100.0, 100.2], [101.0, 100.85], [101.0, 103.45], [105.0, 105.78], [111.0, 111.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.91, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["grunt", 70.35], ["speech", 15.7], ["groan", 3.28]], null, null], "duration": [0.16, 1.38, 0.18, 0.4, 0.46, 0.47, 1.13, 1.11, 0.57, 1.55, 0.2, -0.15, 2.45, 0.78, 0.94]} \ No newline at end of file diff --git a/annotations_1/YmC-BayMaDg_filtered.json b/annotations_1/YmC-BayMaDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aff5f54cef37e651b7aa6f7c7fd532a19a44673 --- /dev/null +++ b/annotations_1/YmC-BayMaDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.98], [2.0, 2.37], [3.0, 11.55], [14.0, 16.41], [21.0, 22.89], [24.0, 25.37], [32.0, 38.52], [40.0, 41.12], [44.0, 49.92], [62.0, 65.67], [68.0, 70.06], [72.0, 74.7], [79.0, 79.24], [82.0, 92.64], [93.0, 97.19], [99.0, 112.5], [114.0, 128.85], [130.0, 130.59]], "keep_status": [false, false, false, false, false, false, true, false, true, true, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 34.57, 61.97, 0.0, 0.0, 31.66, 0.0, 33.6, 31.67, 29.65, 32.66, 0.0, 30.1, 30.91, 32.15, 52.98, 0.0], "audiomae_on_audioset": [null, null, [["speech", 72.47], ["music", 8.97], ["whack, thwack", 3.67]], null, null, null, [["music", 16.54], ["speech", 16.28], ["whack, thwack", 14.52]], null, [["music", 35.92], ["throbbing", 11.99], ["hum", 10.28]], [["music", 15.67], ["vehicle", 15.14], ["car passing by", 11.76]], [["cattle, bovinae", 42.52], ["livestock, farm animals, working animals", 31.18], ["moo", 18.65]], [["music", 29.72], ["fly, housefly", 18.92], ["mosquito", 14.17]], null, [["speech", 45.66], ["music", 22.63], ["theremin", 3.56]], [["music", 21.27], ["roar", 19.48], ["mosquito", 6.81]], [["livestock, farm animals, working animals", 51.89], ["cattle, bovinae", 24.15], ["moo", 14.41]], null, null], "duration": [-0.02, 0.37, 8.55, 2.41, 1.89, 1.37, 6.52, 1.12, 5.92, 3.67, 2.06, 2.7, 0.24, 10.64, 4.19, 13.5, 14.85, 0.59]} \ No newline at end of file diff --git a/annotations_1/YmGBAiHnK0U_filtered.json b/annotations_1/YmGBAiHnK0U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bec4a6d504735ecf24288dc70f6e409dd0fad334 --- /dev/null +++ b/annotations_1/YmGBAiHnK0U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.53], [3.0, 3.54], [4.0, 6.2], [7.0, 8.99], [10.0, 13.04], [14.0, 23.65], [24.0, 25.2], [25.0, 66.51], [70.0, 70.66], [72.0, 72.71], [74.0, 76.01], [77.0, 77.94], [78.0, 81.63], [83.0, 83.51], [84.0, 84.79], [85.0, 86.54], [93.0, 94.56], [99.0, 99.44], [101.0, 105.7], [109.0, 110.25], [112.0, 122.61], [125.0, 131.43], [138.0, 140.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.51, 0.0, 81.0, 46.72, 0.0, 0.0, 0.0, 0.0, 38.31, 0.0, 47.86, 0.0, 0.0, 0.0, 0.0, 0.0, 50.26, 0.0, 39.89, 33.89, 73.67], "audiomae_on_audioset": [null, null, null, null, null, [["music", 46.36], ["speech", 26.76], ["didgeridoo", 11.24]], null, null, null, null, [["music", 67.73], ["musical instrument", 3.68], ["drum", 2.56]], null, [["music", 44.77], ["speech", 30.18], ["hum", 2.45]], null, null, null, null, null, null, null, [["music", 70.32], ["throbbing", 5.75], ["speech", 3.4]], [["music", 44.8], ["throbbing", 24.45], ["speech", 5.42]], null], "duration": [-0.47, 0.54, 2.2, 1.99, 3.04, 9.65, 1.2, 41.51, 0.66, 0.71, 2.01, 0.94, 3.63, 0.51, 0.79, 1.54, 1.56, 0.44, 4.7, 1.25, 10.61, 6.43, 2.95]} \ No newline at end of file diff --git a/annotations_1/YmRuVv2V5Go_filtered.json b/annotations_1/YmRuVv2V5Go_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..021e04e9eacfa034037c4c9f550bf31f8b9d2456 --- /dev/null +++ b/annotations_1/YmRuVv2V5Go_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.38], [8.0, 9.85], [10.0, 11.33], [12.0, 12.14], [13.0, 24.56], [25.0, 25.57], [27.0, 27.24], [29.0, 42.85], [44.0, 44.96], [46.0, 47.41], [48.0, 48.76], [50.0, 50.01], [51.0, 51.92], [52.0, 52.83], [56.0, 56.69], [60.0, 60.42], [61.0, 61.47], [66.0, 67.14]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.92, 0.0, 0.0, 47.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["stomach rumble", 35.3], ["crow", 14.49], ["speech", 10.4]], null, null, null, null, null, null, null, null, null, null], "duration": [1.38, 1.85, 1.33, 0.14, 11.56, 0.57, 0.24, 13.85, 0.96, 1.41, 0.76, 0.01, 0.92, 0.83, 0.69, 0.42, 0.47, 1.14]} \ No newline at end of file diff --git a/annotations_1/Yn8Or4O6_9U_filtered.json b/annotations_1/Yn8Or4O6_9U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f55f3aeaef48559c28b289afc40cb9de2506718 --- /dev/null +++ b/annotations_1/Yn8Or4O6_9U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.38], [11.0, 11.65], [21.0, 20.85], [24.0, 25.71], [27.0, 27.28], [31.0, 31.26], [47.0, 53.45], [55.0, 57.54], [62.0, 64.54], [69.0, 69.47], [73.0, 73.75], [90.0, 91.13], [94.0, 97.71], [100.0, 100.63], [115.0, 116.26], [126.0, 129.17], [131.0, 139.92], [149.0, 149.69]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.85, 35.05, 34.96, 0.0, 0.0, 0.0, 64.86, 0.0, 0.0, 36.12, 33.58, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 66.98], ["synthesizer", 3.39], ["noise", 3.05]], [["music", 29.88], ["static", 15.8], ["mains hum", 8.28]], [["music", 60.27], ["hum", 9.42], ["mains hum", 8.44]], null, null, null, null, null, null, [["music", 25.82], ["speech", 15.53], ["bow-wow", 13.86]], [["music", 57.0], ["speech", 10.4], ["throbbing", 10.11]], null], "duration": [0.38, 0.65, -0.15, 1.71, 0.28, 0.26, 6.45, 2.54, 2.54, 0.47, 0.75, 1.13, 3.71, 0.63, 1.26, 3.17, 8.92, 0.69]} \ No newline at end of file diff --git a/annotations_1/YnnxVknsLk0_filtered.json b/annotations_1/YnnxVknsLk0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb97bcb7d4b60aeab4a668b6317be58865d54cb5 --- /dev/null +++ b/annotations_1/YnnxVknsLk0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.16], [10.0, 11.42], [12.0, 12.02], [14.0, 16.09], [21.0, 40.02], [42.0, 42.21], [44.0, 48.88], [54.0, 54.14], [64.0, 63.91], [69.0, 79.74], [82.0, 84.05], [85.0, 85.35], [91.0, 92.03], [96.0, 109.17], [111.0, 111.23], [112.0, 114.83], [125.0, 125.39], [135.0, 135.41], [136.0, 136.86], [138.0, 138.35], [140.0, 143.4]], "keep_status": [true, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [46.75, 0.0, 0.0, 56.1, 30.55, 0.0, 54.63, 0.0, 0.0, 31.11, 32.89, 0.0, 0.0, 28.61, 0.0, 65.2, 0.0, 0.0, 0.0, 0.0, 78.72], "audiomae_on_audioset": [[["speech", 32.85], ["music", 14.95], ["hum", 3.89]], null, null, null, [["music", 40.41], ["throbbing", 10.89], ["electronic music", 9.4]], null, null, null, null, [["music", 40.22], ["hum", 24.55], ["mains hum", 12.42]], [["music", 25.33], ["whale vocalization", 12.04], ["hum", 8.27]], null, null, [["speech", 54.85], ["music", 8.62], ["explosion", 8.03]], null, null, null, null, null, null, null], "duration": [3.16, 1.42, 0.02, 2.09, 19.02, 0.21, 4.88, 0.14, -0.09, 10.74, 2.05, 0.35, 1.03, 13.17, 0.23, 2.83, 0.39, 0.41, 0.86, 0.35, 3.4]} \ No newline at end of file diff --git a/annotations_1/Yo3rEGWrlws_filtered.json b/annotations_1/Yo3rEGWrlws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e239268ae3070e6579cc9b1954fb986a6ada27ad --- /dev/null +++ b/annotations_1/Yo3rEGWrlws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 20.65], [23.0, 27.94], [28.0, 28.34], [31.0, 41.45], [43.0, 42.69], [44.0, 46.9], [56.0, 57.84], [60.0, 101.48], [104.0, 118.3], [120.0, 124.43], [125.0, 125.68], [126.0, 128.93], [132.0, 140.73], [141.0, 142.48], [158.0, 162.26], [163.0, 165.54], [169.0, 171.46], [177.0, 184.0], [186.0, 189.06], [190.0, 191.78], [194.0, 196.06]], "keep_status": [false, true, false, true, false, true, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [31.34, 30.35, 0.0, 30.25, 0.0, 32.7, 0.0, 0.0, 30.93, 30.61, 0.0, 30.92, 31.27, 0.0, 87.74, 100.0, 100.0, 100.0, 100.0, 0.0, 99.95], "audiomae_on_audioset": [[["music", 32.91], ["speech", 32.89], ["didgeridoo", 14.8]], [["speech", 28.18], ["whack, thwack", 14.25], ["thunk", 9.5]], null, [["speech", 46.44], ["groan", 10.58], ["fart", 4.81]], null, [["speech", 23.25], ["frog", 14.87], ["noise", 8.81]], null, null, [["music", 28.11], ["fart", 6.84], ["speech", 6.56]], [["music", 65.69], ["boing", 7.94], ["speech", 5.95]], null, [["music", 36.31], ["grunt", 8.37], ["frog", 4.39]], [["fly, housefly", 21.26], ["mosquito", 20.76], ["insect", 10.38]], null, null, null, null, null, null, null, null], "duration": [15.65, 4.94, 0.34, 10.45, -0.31, 2.9, 1.84, 41.48, 14.3, 4.43, 0.68, 2.93, 8.73, 1.48, 4.26, 2.54, 2.46, 7.0, 3.06, 1.78, 2.06]} \ No newline at end of file diff --git a/annotations_1/YoIcmX40-_s_filtered.json b/annotations_1/YoIcmX40-_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..feb6dd82ccc8d6703c40cf2e1e0f6ac075d9ed26 --- /dev/null +++ b/annotations_1/YoIcmX40-_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.72], [5.0, 6.88], [14.0, 16.26], [22.0, 23.14], [29.0, 30.91], [34.0, 42.57], [45.0, 49.28], [51.0, 52.25], [55.0, 56.67], [58.0, 59.07], [62.0, 62.63], [76.0, 76.94], [78.0, 96.87], [99.0, 114.32], [116.0, 117.68], [121.0, 124.17], [126.0, 134.25], [135.0, 140.21], [144.0, 147.31], [148.0, 149.01], [150.0, 152.66], [170.0, 170.01], [171.0, 173.03], [175.0, 175.74], [176.0, 188.62]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 95.64, 0.0, 0.0, 36.65, 38.6, 0.0, 0.0, 0.0, 0.0, 0.0, 34.44, 34.34, 0.0, 37.62, 39.72, 39.07, 37.96, 0.0, 42.33, 0.0, 76.53, 0.0, 45.52], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 52.92], ["hum", 7.49], ["fart", 5.14]], [["sidetone", 42.33], ["speech", 20.23], ["fart", 5.37]], null, null, null, null, null, [["speech", 58.64], ["whack, thwack", 14.26], ["groan", 3.5]], [["speech", 52.38], ["music", 35.39], ["bleat", 1.44]], null, [["music", 37.82], ["speech", 21.37], ["radio", 7.65]], [["music", 59.37], ["speech", 8.31], ["boing", 4.37]], [["music", 62.54], ["hum", 4.87], ["speech", 4.13]], [["cattle, bovinae", 39.69], ["moo", 20.94], ["music", 17.21]], null, [["music", 64.51], ["didgeridoo", 3.94], ["hum", 2.18]], null, null, null, [["music", 72.15], ["hum", 6.66], ["soundtrack music", 3.83]]], "duration": [0.72, 1.88, 2.26, 1.14, 1.91, 8.57, 4.28, 1.25, 1.67, 1.07, 0.63, 0.94, 18.87, 15.32, 1.68, 3.17, 8.25, 5.21, 3.31, 1.01, 2.66, 0.01, 2.03, 0.74, 12.62]} \ No newline at end of file diff --git a/annotations_1/YpDpOphD1zo_filtered.json b/annotations_1/YpDpOphD1zo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..baee971de3e25853d562fa0fad3fc174255284f1 --- /dev/null +++ b/annotations_1/YpDpOphD1zo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 41.71], [43.0, 44.19], [50.0, 50.67], [51.0, 52.02], [53.0, 55.83], [57.0, 57.67], [59.0, 58.9], [60.0, 61.1], [63.0, 62.9], [68.0, 69.25], [72.0, 73.75], [79.0, 79.62], [80.0, 80.54], [85.0, 88.69], [90.0, 91.34], [99.0, 99.81], [106.0, 107.59], [109.0, 110.34], [113.0, 115.11], [116.0, 117.73], [120.0, 120.06], [121.0, 124.02], [127.0, 128.09], [129.0, 129.07], [132.0, 137.34], [144.0, 145.03], [146.0, 147.26], [155.0, 156.39], [160.0, 161.08], [163.0, 166.09], [170.0, 172.18], [178.0, 178.9], [181.0, 181.63], [183.0, 184.94], [186.0, 186.68], [190.0, 192.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.82, 0.0, 0.0, 0.0, 0.0, 87.19, 0.0, 0.0, 97.73, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 99.56, 99.71, 0.0, 0.0, 0.0, 0.0, 89.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["cough", 33.5], ["speech", 23.49], ["throat clearing", 5.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [32.71, 1.19, 0.67, 1.02, 2.83, 0.67, -0.1, 1.1, -0.1, 1.25, 1.75, 0.62, 0.54, 3.69, 1.34, 0.81, 1.59, 1.34, 2.11, 1.73, 0.06, 3.02, 1.09, 0.07, 5.34, 1.03, 1.26, 1.39, 1.08, 3.09, 2.18, 0.9, 0.63, 1.94, 0.68, 2.69]} \ No newline at end of file diff --git a/annotations_1/YpFmmzisOy0_filtered.json b/annotations_1/YpFmmzisOy0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a025f117fcd6c42fd1d0bc28f8efe6bdf7ad4ef6 --- /dev/null +++ b/annotations_1/YpFmmzisOy0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.66], [14.0, 15.23], [17.0, 18.49], [23.0, 23.03], [27.0, 26.86], [29.0, 33.39], [34.0, 36.39], [38.0, 39.07], [41.0, 41.39], [42.0, 42.3], [44.0, 45.55], [47.0, 54.19], [56.0, 58.33], [59.0, 60.91], [62.0, 63.76], [65.0, 69.31], [70.0, 71.86], [72.0, 74.36], [79.0, 79.64], [80.0, 81.41], [83.0, 84.91], [86.0, 88.28], [89.0, 90.15], [91.0, 92.7], [95.0, 96.55], [101.0, 104.65], [110.0, 110.35], [112.0, 113.43], [115.0, 116.29], [118.0, 119.55], [121.0, 122.13], [123.0, 123.77], [125.0, 128.11], [129.0, 132.81], [133.0, 134.38], [136.0, 136.63], [137.0, 137.17], [138.0, 137.93], [140.0, 140.78], [144.0, 146.25], [148.0, 147.8], [148.0, 149.45], [151.0, 156.09], [157.0, 158.99], [160.0, 162.13], [163.0, 164.89], [166.0, 167.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 91.81, 0.0, 0.0, 0.0, 0.0, 96.04, 97.54, 0.0, 0.0, 94.95, 0.0, 59.24, 0.0, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 0.0, 0.0, 90.25, 0.0, 85.17, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.66, 1.23, 1.49, 0.03, -0.14, 4.39, 2.39, 1.07, 0.39, 0.3, 1.55, 7.19, 2.33, 1.91, 1.76, 4.31, 1.86, 2.36, 0.64, 1.41, 1.91, 2.28, 1.15, 1.7, 1.55, 3.65, 0.35, 1.43, 1.29, 1.55, 1.13, 0.77, 3.11, 3.81, 1.38, 0.63, 0.17, -0.07, 0.78, 2.25, -0.2, 1.45, 5.09, 1.99, 2.13, 1.89, 1.71]} \ No newline at end of file diff --git a/annotations_1/Ypa0nma0aSs_filtered.json b/annotations_1/Ypa0nma0aSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4b58be54d7e353c52194149f08979c1619180ba --- /dev/null +++ b/annotations_1/Ypa0nma0aSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.86], [15.0, 15.9], [21.0, 21.71], [23.0, 23.28], [24.0, 28.75], [32.0, 32.86], [47.0, 47.14], [50.0, 50.48], [53.0, 54.57], [59.0, 59.1], [59.0, 63.98], [64.0, 80.27], [84.0, 83.93], [85.0, 85.62], [86.0, 86.32], [100.0, 100.57], [101.0, 101.43], [102.0, 102.07], [102.0, 102.57], [103.0, 104.19], [106.0, 106.57], [107.0, 108.16], [114.0, 116.19], [118.0, 118.42], [119.0, 118.93], [119.0, 122.39], [123.0, 123.25], [124.0, 124.61], [125.0, 128.07], [129.0, 129.74], [131.0, 132.24], [137.0, 140.81], [141.0, 141.84], [143.0, 144.58], [145.0, 145.96], [148.0, 148.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 54.76, 63.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 47.78, 0.0, 0.0, 84.8, 0.0, 0.0, 85.17, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["frog", 45.57], ["speech", 21.46], ["croak", 19.32]], null, null, null, null, null, null, null, null, null, null], "duration": [-0.14, 0.9, 0.71, 0.28, 4.75, 0.86, 0.14, 0.48, 1.57, 0.1, 4.98, 16.27, -0.07, 0.62, 0.32, 0.57, 0.43, 0.07, 0.57, 1.19, 0.57, 1.16, 2.19, 0.42, -0.07, 3.39, 0.25, 0.61, 3.07, 0.74, 1.24, 3.81, 0.84, 1.58, 0.96, 0.78]} \ No newline at end of file diff --git a/annotations_1/YprQvoOj6wM_filtered.json b/annotations_1/YprQvoOj6wM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b44d4ef9025ae5749748875efa1b9c24779cda7 --- /dev/null +++ b/annotations_1/YprQvoOj6wM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.64], [43.0, 43.04], [55.0, 55.73], [66.0, 66.31], [78.0, 78.54], [83.0, 83.76], [94.0, 94.51], [100.0, 101.83], [124.0, 124.01], [131.0, 131.73], [146.0, 146.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.04, 0.73, 0.31, 0.54, 0.76, 0.51, 1.83, 0.01, 0.73, 0.72]} \ No newline at end of file diff --git a/annotations_1/YptUTTJjUVs_filtered.json b/annotations_1/YptUTTJjUVs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d97af845b63bb209b5fafc5929154a4d7aed1cb --- /dev/null +++ b/annotations_1/YptUTTJjUVs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.81], [8.0, 10.83], [12.0, 14.54], [18.0, 23.6], [25.0, 39.92], [40.0, 73.7], [74.0, 75.66], [77.0, 82.16], [83.0, 86.17], [89.0, 93.77], [94.0, 101.24], [102.0, 103.82], [104.0, 114.32], [115.0, 120.39], [121.0, 125.32]], "keep_status": [false, true, true, false, false, false, false, false, true, false, true, false, true, false, true], "silence_prob": [0.0, 37.4, 36.76, 70.02, 82.25, 0.0, 0.0, 32.44, 34.8, 32.46, 39.69, 0.0, 31.09, 29.49, 31.27], "audiomae_on_audioset": [null, [["music", 37.56], ["synthesizer", 12.55], ["percussion", 6.19]], [["music", 35.0], ["synthesizer", 16.66], ["hum", 5.82]], null, null, null, null, [["sonar", 43.13], ["music", 20.59], ["beep, bleep", 6.76]], [["music", 35.54], ["sine wave", 11.07], ["synthesizer", 5.42]], [["chirp tone", 58.12], ["sine wave", 10.36], ["music", 5.96]], [["music", 17.38], ["speech", 17.37], ["noise", 16.8]], null, [["speech", 50.76], ["sine wave", 8.58], ["singing bowl", 8.38]], [["speech", 58.77], ["music", 16.47], ["synthesizer", 4.69]], [["frog", 26.13], ["whale vocalization", 8.14], ["buzz", 5.66]]], "duration": [-0.19, 2.83, 2.54, 5.6, 14.92, 33.7, 1.66, 5.16, 3.17, 4.77, 7.24, 1.82, 10.32, 5.39, 4.32]} \ No newline at end of file diff --git a/annotations_1/Yq9fKm8q0iY_filtered.json b/annotations_1/Yq9fKm8q0iY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52a822880fcf755e6e187d6db0e450d1caa5b907 --- /dev/null +++ b/annotations_1/Yq9fKm8q0iY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.81], [13.0, 14.54], [20.0, 20.55], [21.0, 25.64], [26.0, 27.7], [28.0, 30.65], [31.0, 32.98], [37.0, 40.27], [42.0, 43.75], [45.0, 48.27], [58.0, 59.39], [65.0, 66.82], [74.0, 75.36], [76.0, 80.05], [82.0, 83.4], [85.0, 86.1], [88.0, 89.7], [98.0, 99.45], [103.0, 105.0], [105.0, 107.06], [114.0, 117.96], [123.0, 124.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 99.85, 0.0, 98.93, 0.0, 99.68, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 99.71, 73.06, 95.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 1.54, 0.55, 4.64, 1.7, 2.65, 1.98, 3.27, 1.75, 3.27, 1.39, 1.82, 1.36, 4.05, 1.4, 1.1, 1.7, 1.45, 2.0, 2.06, 3.96, 1.88]} \ No newline at end of file diff --git a/annotations_1/YqNktpnzIf8_filtered.json b/annotations_1/YqNktpnzIf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d9ae381aa43b318735ed8242cb52af2ba03c498 --- /dev/null +++ b/annotations_1/YqNktpnzIf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.11], [25.0, 25.29], [27.0, 27.33]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.11, 0.29, 0.33]} \ No newline at end of file diff --git a/annotations_1/YqkDor9GqqE_filtered.json b/annotations_1/YqkDor9GqqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..443fda3031702c9fa46f9330f07a4a1bae8b5869 --- /dev/null +++ b/annotations_1/YqkDor9GqqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.51], [4.0, 6.78], [7.0, 9.51], [10.0, 11.38], [13.0, 13.27], [17.0, 18.64], [19.0, 24.51], [26.0, 26.0], [30.0, 33.4], [34.0, 36.27], [37.0, 40.04], [40.0, 41.4], [43.0, 44.95], [46.0, 51.93], [57.0, 57.4], [58.0, 58.78], [63.0, 63.1], [64.0, 64.42], [65.0, 65.75], [70.0, 71.07], [74.0, 76.11], [79.0, 79.59], [83.0, 83.69], [95.0, 95.82], [98.0, 99.2], [99.0, 99.74], [104.0, 104.38], [107.0, 107.42], [111.0, 111.99], [113.0, 113.64], [116.0, 116.07], [117.0, 117.46], [119.0, 119.82], [121.0, 121.51], [123.0, 123.31], [126.0, 126.62], [129.0, 132.44], [134.0, 135.11], [138.0, 137.93], [139.0, 142.8], [146.0, 146.89], [149.0, 153.98], [155.0, 159.07], [162.0, 174.65], [176.0, 175.98], [177.0, 177.99], [180.0, 180.54], [182.0, 183.63], [184.0, 185.36], [187.0, 187.49], [190.0, 191.05], [194.0, 194.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 58.72, 80.82, 0.0, 0.0, 0.0, 46.02, 0.0, 100.0, 100.0, 81.0, 0.0, 0.0, 38.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 91.98, 50.71, 29.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 72.3], ["sidetone", 12.46], ["radio", 12.31]], null, null, null, null, null, null, [["speech", 74.1], ["thunk", 16.88], ["whack, thwack", 1.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.01], ["screaming", 21.46], ["inside, small room", 6.78]], null, null, null, null, null, null, null, null], "duration": [1.51, 2.78, 2.51, 1.38, 0.27, 1.64, 5.51, 0.0, 3.4, 2.27, 3.04, 1.4, 1.95, 5.93, 0.4, 0.78, 0.1, 0.42, 0.75, 1.07, 2.11, 0.59, 0.69, 0.82, 1.2, 0.74, 0.38, 0.42, 0.99, 0.64, 0.07, 0.46, 0.82, 0.51, 0.31, 0.62, 3.44, 1.11, -0.07, 3.8, 0.89, 4.98, 4.07, 12.65, -0.02, 0.99, 0.54, 1.63, 1.36, 0.49, 1.05, 0.66]} \ No newline at end of file diff --git a/annotations_1/Yr1quUpD0Y0_filtered.json b/annotations_1/Yr1quUpD0Y0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d980b14d8651f192641c42bfd84f40b3db32aae5 --- /dev/null +++ b/annotations_1/Yr1quUpD0Y0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.09], [17.0, 17.05], [19.0, 31.21], [32.0, 45.59], [47.0, 52.68], [53.0, 69.69], [71.0, 81.13], [82.0, 116.28], [117.0, 119.94], [123.0, 129.78], [130.0, 131.01]], "keep_status": [false, false, true, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 29.41, 29.57, 28.96, 29.22, 29.1, 0.0, 32.46, 29.39, 0.0], "audiomae_on_audioset": [null, null, [["mains hum", 26.01], ["hum", 19.66], ["music", 16.35]], [["mains hum", 50.87], ["hum", 41.17], ["speech", 1.57]], [["music", 16.87], ["hum", 10.9], ["mains hum", 8.86]], [["mains hum", 35.61], ["hum", 33.18], ["music", 13.05]], [["music", 29.04], ["hum", 11.14], ["speech", 6.13]], null, [["music", 58.1], ["musical instrument", 6.68], ["synthesizer", 5.59]], [["mains hum", 35.78], ["hum", 21.22], ["music", 7.72]], null], "duration": [0.09, 0.05, 12.21, 13.59, 5.68, 16.69, 10.13, 34.28, 2.94, 6.78, 1.01]} \ No newline at end of file diff --git a/annotations_1/YsCeolAfbLw_filtered.json b/annotations_1/YsCeolAfbLw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0b1a73e1982e6d73e72b52126d179a487e03b93 --- /dev/null +++ b/annotations_1/YsCeolAfbLw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.09], [22.0, 22.11], [26.0, 26.47], [28.0, 27.75], [30.0, 30.74], [51.0, 51.85], [70.0, 70.12], [76.0, 77.41], [79.0, 86.24], [90.0, 89.83]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 36.56], ["hum", 18.07], ["throbbing", 12.36]], null], "duration": [0.09, 0.11, 0.47, -0.25, 0.74, 0.85, 0.12, 1.41, 7.24, -0.17]} \ No newline at end of file diff --git a/annotations_1/Ys_zYL7K3KQ_filtered.json b/annotations_1/Ys_zYL7K3KQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9042c7986c0f12b382926ef3587d7cf444ff982e --- /dev/null +++ b/annotations_1/Ys_zYL7K3KQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.51], [11.0, 11.11], [14.0, 15.03], [20.0, 21.03], [25.0, 26.3], [30.0, 31.56], [32.0, 33.93], [34.0, 35.02], [35.0, 36.26], [38.0, 41.3], [42.0, 42.6], [43.0, 44.09], [46.0, 48.02], [48.0, 49.45], [50.0, 50.72], [52.0, 52.57], [53.0, 54.78], [57.0, 58.18], [60.0, 60.39], [61.0, 67.74], [68.0, 69.87], [71.0, 71.46], [72.0, 74.78], [76.0, 77.87], [79.0, 83.07], [83.0, 85.18], [87.0, 88.53], [90.0, 91.83], [92.0, 93.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 59.59, 0.0, 63.21, 70.02, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 0.11, 1.03, 1.03, 1.3, 1.56, 1.93, 1.02, 1.26, 3.3, 0.6, 1.09, 2.02, 1.45, 0.72, 0.57, 1.78, 1.18, 0.39, 6.74, 1.87, 0.46, 2.78, 1.87, 4.07, 2.18, 1.53, 1.83, 1.38]} \ No newline at end of file diff --git a/annotations_1/YtWJKXNMmhI_filtered.json b/annotations_1/YtWJKXNMmhI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddeb3f1abb843ecd8cc45b527b6e9cf57409ef5e --- /dev/null +++ b/annotations_1/YtWJKXNMmhI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.86], [12.0, 12.78], [16.0, 16.46], [19.0, 21.51], [26.0, 26.38], [27.0, 28.49], [37.0, 38.15], [40.0, 39.8], [42.0, 42.94], [46.0, 47.07], [58.0, 58.51], [60.0, 66.5], [67.0, 67.61], [75.0, 75.36], [76.0, 76.55], [81.0, 81.06], [82.0, 82.48], [83.0, 83.73], [84.0, 85.55], [87.0, 87.84], [107.0, 108.63], [117.0, 118.61], [120.0, 121.42], [123.0, 124.24], [126.0, 126.47], [131.0, 132.0], [137.0, 138.43], [144.0, 144.15], [152.0, 173.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.25, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.86, 0.78, 0.46, 2.51, 0.38, 1.49, 1.15, -0.2, 0.94, 1.07, 0.51, 6.5, 0.61, 0.36, 0.55, 0.06, 0.48, 0.73, 1.55, 0.84, 1.63, 1.61, 1.42, 1.24, 0.47, 1.0, 1.43, 0.15, 21.13]} \ No newline at end of file diff --git a/annotations_1/YtktNetGOKU_filtered.json b/annotations_1/YtktNetGOKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f06b8680e4c12a711ba726f4213d7dc5a471aadd --- /dev/null +++ b/annotations_1/YtktNetGOKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 29.0], [30.0, 30.54], [32.0, 32.21], [35.0, 36.46], [37.0, 41.45], [43.0, 45.66], [50.0, 51.93], [54.0, 56.1], [59.0, 59.93], [62.0, 64.62], [70.0, 80.7], [86.0, 86.49], [87.0, 88.91], [91.0, 93.26], [95.0, 98.17], [99.0, 100.04], [103.0, 103.2], [105.0, 106.81], [109.0, 116.13], [118.0, 119.55], [121.0, 131.77]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, true, false, true], "silence_prob": [40.14, 0.0, 0.0, 0.0, 63.42, 63.53, 0.0, 61.37, 0.0, 58.3, 35.62, 0.0, 0.0, 56.25, 36.35, 0.0, 0.0, 0.0, 39.04, 0.0, 30.69], "audiomae_on_audioset": [[["music", 53.02], ["hum", 6.57], ["fly, housefly", 5.34]], null, null, null, null, null, null, null, null, null, [["hum", 24.52], ["noise", 19.42], ["glass", 17.15]], null, null, null, [["music", 30.95], ["throbbing", 13.42], ["musical instrument", 10.06]], null, null, null, [["rumble", 26.47], ["breaking", 14.41], ["noise", 13.37]], null, [["buzz", 41.35], ["insect", 7.75], ["fly, housefly", 5.26]]], "duration": [11.0, 0.54, 0.21, 1.46, 4.45, 2.66, 1.93, 2.1, 0.93, 2.62, 10.7, 0.49, 1.91, 2.26, 3.17, 1.04, 0.2, 1.81, 7.13, 1.55, 10.77]} \ No newline at end of file diff --git a/annotations_1/YtqU_6Imito_filtered.json b/annotations_1/YtqU_6Imito_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..311a114193b532b214aa5b649d3da53e79937508 --- /dev/null +++ b/annotations_1/YtqU_6Imito_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.62], [6.0, 8.67], [9.0, 17.96], [19.0, 19.77], [21.0, 21.39], [23.0, 37.91], [47.0, 53.08], [63.0, 90.07], [96.0, 113.76]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 31.34, 30.55, 0.0, 0.0, 29.19, 29.4, 30.41, 29.36], "audiomae_on_audioset": [null, [["speech", 38.79], ["music", 36.61], ["mains hum", 2.98]], [["music", 52.26], ["speech", 12.36], ["hum", 5.41]], null, null, [["music", 50.35], ["speech", 26.47], ["vehicle", 2.42]], [["speech", 44.09], ["explosion", 10.32], ["eruption", 7.08]], [["speech", 67.8], ["music", 15.23], ["sidetone", 3.07]], [["music", 85.66], ["explosion", 1.12], ["burst, pop", 1.1]]], "duration": [1.62, 2.67, 8.96, 0.77, 0.39, 14.91, 6.08, 27.07, 17.76]} \ No newline at end of file diff --git a/annotations_1/YvL_-Awg2gg_filtered.json b/annotations_1/YvL_-Awg2gg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd454486ff93764d9527b96e42ad3ffb914fbe31 --- /dev/null +++ b/annotations_1/YvL_-Awg2gg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.8], [22.0, 21.84], [23.0, 33.79], [36.0, 36.58], [39.0, 41.17], [48.0, 61.6], [64.0, 73.62], [75.0, 75.64], [77.0, 77.19], [78.0, 78.43], [79.0, 90.54], [91.0, 96.25], [101.0, 114.39], [115.0, 116.65], [127.0, 128.14], [128.0, 132.02]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 34.95, 0.0, 50.31, 39.5, 40.9, 0.0, 0.0, 0.0, 35.89, 47.66, 37.46, 0.0, 0.0, 36.9], "audiomae_on_audioset": [null, null, [["music", 64.57], ["thunk", 15.15], ["bleat", 1.42]], null, null, [["music", 64.73], ["ding", 8.28], ["speech", 5.33]], [["music", 36.25], ["thunk", 16.87], ["hum", 9.2]], null, null, null, [["music", 53.63], ["throbbing", 21.83], ["hum", 6.42]], [["music", 52.61], ["theremin", 9.26], ["synthesizer", 4.27]], [["hum", 17.2], ["mains hum", 17.13], ["music", 17.13]], null, null, [["music", 31.63], ["speech", 8.62], ["gong", 7.39]]], "duration": [0.8, -0.16, 10.79, 0.58, 2.17, 13.6, 9.62, 0.64, 0.19, 0.43, 11.54, 5.25, 13.39, 1.65, 1.14, 4.02]} \ No newline at end of file diff --git a/annotations_1/YvNjJgJM728_filtered.json b/annotations_1/YvNjJgJM728_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4c942a7f5da6078c50d69c0a8694d05920ac34c --- /dev/null +++ b/annotations_1/YvNjJgJM728_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.49], [11.0, 10.74], [11.0, 23.3], [26.0, 32.8], [34.0, 33.86], [34.0, 44.27], [45.0, 48.86], [50.0, 52.74], [54.0, 57.32]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [53.59, 0.0, 58.05, 81.89, 0.0, 70.16, 87.55, 80.82, 79.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [3.49, -0.26, 12.3, 6.8, -0.14, 10.27, 3.86, 2.74, 3.32]} \ No newline at end of file diff --git a/annotations_1/YvT0GTWPw0M_filtered.json b/annotations_1/YvT0GTWPw0M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae8107e3bb4f4f788d3bed5c197e4ecf561b1c9f --- /dev/null +++ b/annotations_1/YvT0GTWPw0M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 29.52], [30.0, 30.67], [32.0, 45.37], [51.0, 57.21], [59.0, 79.96], [84.0, 84.57], [85.0, 90.0], [92.0, 95.79]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [55.11, 0.0, 50.86, 92.15, 60.98, 0.0, 87.74, 60.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [18.52, 0.67, 13.37, 6.21, 20.96, 0.57, 5.0, 3.79]} \ No newline at end of file diff --git a/annotations_1/YwnX8My7428_filtered.json b/annotations_1/YwnX8My7428_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7f731c5d8d8c23bec6d25dea7c48ca93fdd4932 --- /dev/null +++ b/annotations_1/YwnX8My7428_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 15.42], [16.0, 18.55], [20.0, 21.69], [23.0, 24.58], [25.0, 25.25], [26.0, 28.24], [31.0, 33.13], [34.0, 37.1], [38.0, 42.55], [44.0, 45.77], [47.0, 49.72], [51.0, 52.49], [54.0, 55.76], [57.0, 61.26], [64.0, 69.84], [71.0, 74.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [70.16, 68.41, 0.0, 0.0, 0.0, 72.6, 78.04, 70.44, 82.25, 0.0, 78.21, 0.0, 0.0, 74.13, 51.07, 60.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.42, 2.55, 1.69, 1.58, 0.25, 2.24, 2.13, 3.1, 4.55, 1.77, 2.72, 1.49, 1.76, 4.26, 5.84, 3.43]} \ No newline at end of file diff --git a/annotations_1/YxQJTlFyebM_filtered.json b/annotations_1/YxQJTlFyebM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e2117f1a0cb0beab1302a8474233863ef7d51ce --- /dev/null +++ b/annotations_1/YxQJTlFyebM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.59], [16.0, 19.14], [22.0, 22.72], [26.0, 42.52], [43.0, 43.66], [60.0, 60.74], [66.0, 75.56], [76.0, 76.98], [92.0, 96.16], [99.0, 104.7], [129.0, 130.27], [139.0, 139.68]], "keep_status": [false, true, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 41.72, 0.0, 43.53, 0.0, 0.0, 47.62, 0.0, 38.32, 38.67, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 31.36], ["speech", 23.83], ["percussion", 4.52]], null, [["speech", 49.38], ["music", 23.51], ["musical instrument", 2.96]], null, null, [["speech", 41.63], ["electric shaver, electric razor", 12.72], ["music", 10.22]], null, [["music", 42.77], ["speech", 14.84], ["musical instrument", 3.55]], [["music", 68.56], ["speech", 13.29], ["musical instrument", 2.21]], null, null], "duration": [0.59, 3.14, 0.72, 16.52, 0.66, 0.74, 9.56, 0.98, 4.16, 5.7, 1.27, 0.68]} \ No newline at end of file diff --git a/annotations_1/YzCruCXU8Xc_filtered.json b/annotations_1/YzCruCXU8Xc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86dad8910668cd6297454fef9821614d5be531ba --- /dev/null +++ b/annotations_1/YzCruCXU8Xc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.35], [9.0, 9.02], [10.0, 16.93], [18.0, 19.8], [21.0, 21.27], [24.0, 24.9], [26.0, 26.92], [29.0, 29.54], [30.0, 31.5], [32.0, 33.69], [35.0, 35.72], [37.0, 37.59], [41.0, 42.47], [44.0, 45.79], [47.0, 48.57], [54.0, 54.87], [60.0, 60.17], [62.0, 62.56], [66.0, 66.38], [72.0, 75.2], [76.0, 84.08], [87.0, 87.22], [88.0, 90.31], [92.0, 92.03], [93.0, 94.22], [96.0, 100.26], [101.0, 103.45], [108.0, 108.55], [113.0, 113.75], [114.0, 114.88], [117.0, 116.67], [119.0, 120.55], [121.0, 122.07], [123.0, 123.25], [125.0, 127.94], [129.0, 131.46], [133.0, 133.52], [134.0, 136.22], [139.0, 139.9], [141.0, 141.67], [144.0, 145.2], [151.0, 151.56], [152.0, 153.57], [155.0, 156.49], [158.0, 160.69], [161.0, 162.72], [164.0, 164.51], [165.0, 168.17], [172.0, 174.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 90.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.92, 87.19, 0.0, 99.26, 0.0, 0.0, 98.51, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.21, 91.64, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.62, 0.0, 0.0, 66.03, 73.06], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.35, 0.02, 6.93, 1.8, 0.27, 0.9, 0.92, 0.54, 1.5, 1.69, 0.72, 0.59, 1.47, 1.79, 1.57, 0.87, 0.17, 0.56, 0.38, 3.2, 8.08, 0.22, 2.31, 0.03, 1.22, 4.26, 2.45, 0.55, 0.75, 0.88, -0.33, 1.55, 1.07, 0.25, 2.94, 2.46, 0.52, 2.22, 0.9, 0.67, 1.2, 0.56, 1.57, 1.49, 2.69, 1.72, 0.51, 3.17, 2.97]} \ No newline at end of file diff --git a/annotations_1/YzIWoPLLktE_filtered.json b/annotations_1/YzIWoPLLktE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13b97bc4444522d8af9f54c330726b5461c19231 --- /dev/null +++ b/annotations_1/YzIWoPLLktE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.75], [13.0, 14.49], [16.0, 15.94], [18.0, 42.82], [43.0, 77.79], [79.0, 79.32], [80.0, 81.01], [83.0, 84.23], [87.0, 94.31], [95.0, 95.34], [100.0, 99.77], [105.0, 105.0]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [34.34, 0.0, 0.0, 31.08, 0.0, 0.0, 0.0, 0.0, 37.83, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["animal", 58.88], ["livestock, farm animals, working animals", 7.19], ["speech", 7.18]], null, null, [["speech", 66.98], ["eruption", 19.05], ["explosion", 5.67]], null, null, null, null, [["speech", 43.72], ["hum", 11.01], ["radio", 9.25]], null, null, null], "duration": [2.75, 1.49, -0.06, 24.82, 34.79, 0.32, 1.01, 1.23, 7.31, 0.34, -0.23, 0.0]} \ No newline at end of file diff --git a/annotations_1/Z-WSedqa5zA_filtered.json b/annotations_1/Z-WSedqa5zA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..850dfb9676e348da0ce7364ee25172e2c7ba73fd --- /dev/null +++ b/annotations_1/Z-WSedqa5zA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.3], [8.0, 13.22], [16.0, 60.25], [61.0, 74.83]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 28.31, 0.0, 28.22], "audiomae_on_audioset": [null, [["hum", 43.67], ["mains hum", 17.85], ["music", 8.86]], null, [["vehicle", 50.75], ["speech", 21.96], ["car", 13.58]]], "duration": [1.3, 5.22, 44.25, 13.83]} \ No newline at end of file diff --git a/annotations_1/Z-l7wGkNyko_filtered.json b/annotations_1/Z-l7wGkNyko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48b4630af43c36875a90b3711123042beb6ecedd --- /dev/null +++ b/annotations_1/Z-l7wGkNyko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.5], [5.0, 6.32], [15.0, 16.85], [18.0, 19.16], [21.0, 21.39], [22.0, 25.44], [32.0, 34.13], [37.0, 40.24], [42.0, 46.01], [47.0, 48.57], [49.0, 50.68], [52.0, 52.96], [55.0, 57.16], [58.0, 58.94], [60.0, 62.13], [63.0, 63.95], [65.0, 69.09], [70.0, 72.42], [74.0, 83.35], [84.0, 89.36], [90.0, 90.29], [91.0, 120.12], [121.0, 135.46], [138.0, 139.45], [142.0, 151.98], [160.0, 161.55]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [36.89, 0.0, 0.0, 0.0, 0.0, 55.11, 48.14, 58.05, 50.02, 0.0, 0.0, 0.0, 53.84, 0.0, 58.3, 0.0, 60.89, 47.86, 53.1, 49.87, 0.0, 30.6, 30.0, 0.0, 29.7, 0.0], "audiomae_on_audioset": [[["speech", 18.38], ["music", 11.29], ["synthesizer", 5.66]], null, null, null, null, null, [["sidetone", 26.88], ["music", 21.1], ["hum", 13.95]], null, null, null, null, null, null, null, null, null, null, [["music", 31.27], ["synthesizer", 16.93], ["didgeridoo", 6.03]], null, [["hum", 41.08], ["mains hum", 23.29], ["speech", 15.75]], null, [["music", 35.73], ["hum", 25.97], ["throbbing", 25.62]], [["music", 84.61], ["angry music", 1.59], ["guitar", 1.39]], null, [["music", 75.51], ["hum", 3.1], ["electronic music", 1.79]], null], "duration": [2.5, 1.32, 1.85, 1.16, 0.39, 3.44, 2.13, 3.24, 4.01, 1.57, 1.68, 0.96, 2.16, 0.94, 2.13, 0.95, 4.09, 2.42, 9.35, 5.36, 0.29, 29.12, 14.46, 1.45, 9.98, 1.55]} \ No newline at end of file diff --git a/annotations_1/Z0AxmKelYrE_filtered.json b/annotations_1/Z0AxmKelYrE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5373bd4ca9482bcab712a2679e64af0035832465 --- /dev/null +++ b/annotations_1/Z0AxmKelYrE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.06], [5.0, 5.41], [5.0, 6.12], [6.0, 7.84], [11.0, 16.66], [33.0, 32.86], [33.0, 34.16], [40.0, 57.45], [58.0, 61.48], [62.0, 62.61], [74.0, 74.44], [96.0, 97.68], [99.0, 99.99], [106.0, 106.91], [114.0, 115.57], [118.0, 117.69], [118.0, 119.8], [121.0, 124.88], [125.0, 139.7]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.87, 0.0, 0.0, 44.34, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.98, 41.72], "audiomae_on_audioset": [null, null, null, null, [["music", 77.69], ["musical instrument", 5.82], ["theremin", 4.49]], null, null, [["music", 42.32], ["dog", 8.04], ["hum", 7.64]], null, null, null, null, null, null, null, null, null, [["speech", 21.5], ["whack, thwack", 16.2], ["music", 15.76]], [["music", 46.12], ["speech", 40.0], ["thunk", 8.04]]], "duration": [0.06, 0.41, 1.12, 1.84, 5.66, -0.14, 1.16, 17.45, 3.48, 0.61, 0.44, 1.68, 0.99, 0.91, 1.57, -0.31, 1.8, 3.88, 14.7]} \ No newline at end of file diff --git a/annotations_1/Z0FKMJQR9RU_filtered.json b/annotations_1/Z0FKMJQR9RU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72f866a03bb68d9056c60845e5ef7da5761cd510 --- /dev/null +++ b/annotations_1/Z0FKMJQR9RU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.62], [1.0, 19.4], [23.0, 23.08], [23.0, 27.9], [28.0, 68.44], [68.0, 73.06], [77.0, 81.97], [83.0, 83.2], [84.0, 84.86], [86.0, 85.85], [87.0, 87.98], [89.0, 89.63], [96.0, 96.45], [97.0, 99.35], [107.0, 111.47], [121.0, 122.27], [128.0, 130.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 32.48, 0.0, 82.79, 0.0, 44.57, 79.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.96, 70.02, 0.0, 48.44], "audiomae_on_audioset": [null, [["hum", 30.29], ["music", 27.68], ["mains hum", 20.27]], null, null, null, [["mains hum", 39.05], ["hum", 27.65], ["music", 8.49]], null, null, null, null, null, null, null, null, null, null, [["speech", 29.05], ["music", 17.99], ["cattle, bovinae", 8.55]]], "duration": [0.62, 18.4, 0.08, 4.9, 40.44, 5.06, 4.97, 0.2, 0.86, -0.15, 0.98, 0.63, 0.45, 2.35, 4.47, 1.27, 2.44]} \ No newline at end of file diff --git a/annotations_1/Z0Fm3Ym-aJM_filtered.json b/annotations_1/Z0Fm3Ym-aJM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58f902742f0e14d3c94c6f6cc6b101a4c92b8952 --- /dev/null +++ b/annotations_1/Z0Fm3Ym-aJM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.06], [6.0, 6.35], [11.0, 12.34], [13.0, 13.98], [16.0, 16.75], [20.0, 20.63], [23.0, 35.04], [40.0, 40.74], [43.0, 43.66], [48.0, 51.9], [62.0, 62.87], [64.0, 65.25], [79.0, 80.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.18, 0.0, 0.0, 83.88, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.06, 0.35, 1.34, 0.98, 0.75, 0.63, 12.04, 0.74, 0.66, 3.9, 0.87, 1.25, 1.01]} \ No newline at end of file diff --git a/annotations_1/Z0sFhnkRCsQ_filtered.json b/annotations_1/Z0sFhnkRCsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e025e515a8f6a31d579afca5220abf68eb7cb767 --- /dev/null +++ b/annotations_1/Z0sFhnkRCsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.13], [8.0, 8.5], [10.0, 10.83], [13.0, 13.36], [16.0, 16.11], [18.0, 18.12], [21.0, 21.59], [26.0, 27.11], [28.0, 29.39], [30.0, 31.08], [33.0, 35.72], [40.0, 40.19], [41.0, 41.17], [42.0, 42.5], [46.0, 45.98], [49.0, 49.76], [59.0, 58.63], [60.0, 60.35], [74.0, 75.09], [78.0, 79.02], [85.0, 86.81], [89.0, 90.66], [96.0, 97.63], [98.0, 99.0], [100.0, 100.4], [103.0, 105.54], [108.0, 112.13], [116.0, 117.29], [118.0, 118.89], [125.0, 125.34], [126.0, 126.35], [127.0, 128.61], [129.0, 131.26], [132.0, 133.42], [134.0, 135.78], [138.0, 139.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.53, 45.65, 0.0, 0.0, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.19], ["inside, small room", 7.9], ["hum", 6.97]], null, null, null, null, null, null, null, null, null], "duration": [0.13, 0.5, 0.83, 0.36, 0.11, 0.12, 0.59, 1.11, 1.39, 1.08, 2.72, 0.19, 0.17, 0.5, -0.02, 0.76, -0.37, 0.35, 1.09, 1.02, 1.81, 1.66, 1.63, 1.0, 0.4, 2.54, 4.13, 1.29, 0.89, 0.34, 0.35, 1.61, 2.26, 1.42, 1.78, 1.56]} \ No newline at end of file diff --git a/annotations_1/Z1DO7_hHqbw_filtered.json b/annotations_1/Z1DO7_hHqbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c2521fbec1feaef5d30a057544a338573126e6a --- /dev/null +++ b/annotations_1/Z1DO7_hHqbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.87], [5.0, 6.84], [12.0, 12.31], [14.0, 14.25], [26.0, 26.57], [28.0, 28.93], [31.0, 31.02], [31.0, 33.27], [36.0, 36.88], [38.0, 44.98], [46.0, 46.47], [57.0, 59.83], [60.0, 61.11], [69.0, 71.29], [76.0, 77.25], [82.0, 83.83], [101.0, 102.02], [105.0, 105.49], [114.0, 113.7], [117.0, 117.37], [148.0, 150.01], [153.0, 154.04], [158.0, 159.04], [161.0, 161.87], [162.0, 163.16], [166.0, 195.02], [198.0, 198.69]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.1, 0.0, 29.51, 0.0, 35.03, 0.0, 29.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.28, 0.0, 0.0, 0.0, 0.0, 32.28, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 22.08], ["hum", 19.97], ["music", 16.8]], null, [["music", 36.32], ["speech", 34.27], ["mains hum", 7.64]], null, [["hum", 27.02], ["music", 19.7], ["mains hum", 14.29]], null, [["music", 50.71], ["didgeridoo", 7.33], ["electronic music", 4.69]], null, null, null, null, null, null, [["speech", 49.25], ["music", 14.94], ["explosion", 5.52]], null, null, null, null, [["hum", 43.45], ["mains hum", 31.0], ["music", 6.27]], null], "duration": [1.87, 1.84, 0.31, 0.25, 0.57, 0.93, 0.02, 2.27, 0.88, 6.98, 0.47, 2.83, 1.11, 2.29, 1.25, 1.83, 1.02, 0.49, -0.3, 0.37, 2.01, 1.04, 1.04, 0.87, 1.16, 29.02, 0.69]} \ No newline at end of file diff --git a/annotations_1/Z2-9fWRAwMo_filtered.json b/annotations_1/Z2-9fWRAwMo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3aa254cb23f1481cc77a98ac59841411995928bd --- /dev/null +++ b/annotations_1/Z2-9fWRAwMo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.24], [7.0, 7.75], [9.0, 9.41], [11.0, 11.2], [15.0, 15.74], [16.0, 22.74], [23.0, 22.77], [25.0, 43.7], [47.0, 74.85], [76.0, 76.77], [78.0, 81.38], [83.0, 83.0], [87.0, 87.71], [89.0, 97.31], [98.0, 114.69], [116.0, 120.45], [125.0, 133.12], [136.0, 140.36], [142.0, 142.53], [144.0, 144.59], [147.0, 152.24], [154.0, 156.93], [159.0, 161.94], [163.0, 164.07]], "keep_status": [false, false, false, false, false, true, false, true, true, false, false, false, false, true, true, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.07, 0.0, 31.0, 30.13, 0.0, 32.92, 0.0, 0.0, 37.51, 29.66, 31.95, 38.42, 37.84, 0.0, 0.0, 81.89, 91.81, 90.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 38.96], ["hum", 7.24], ["mains hum", 6.14]], null, [["music", 59.99], ["throbbing", 4.28], ["hum", 4.07]], [["music", 30.59], ["livestock, farm animals, working animals", 12.55], ["cowbell", 9.5]], null, [["music", 58.47], ["livestock, farm animals, working animals", 9.29], ["animal", 6.19]], null, null, [["music", 39.61], ["fly, housefly", 8.09], ["insect", 7.04]], [["music", 39.34], ["throbbing", 11.69], ["hum", 10.09]], [["music", 37.88], ["hum", 15.0], ["mains hum", 10.07]], [["music", 31.44], ["hum", 28.39], ["throbbing", 12.81]], [["hum", 37.06], ["music", 12.96], ["throbbing", 12.28]], null, null, null, null, null, null], "duration": [1.24, 0.75, 0.41, 0.2, 0.74, 6.74, -0.23, 18.7, 27.85, 0.77, 3.38, 0.0, 0.71, 8.31, 16.69, 4.45, 8.12, 4.36, 0.53, 0.59, 5.24, 2.93, 2.94, 1.07]} \ No newline at end of file diff --git a/annotations_1/Z2-qppnyM3s_filtered.json b/annotations_1/Z2-qppnyM3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4416e23a19ea9432169c54f93a0541e310b5ef8a --- /dev/null +++ b/annotations_1/Z2-qppnyM3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.14], [37.0, 78.83], [81.0, 114.62], [115.0, 115.91], [120.0, 127.72]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.06], "audiomae_on_audioset": [null, null, null, null, [["eruption", 28.29], ["music", 20.06], ["whale vocalization", 8.2]]], "duration": [0.14, 41.83, 33.62, 0.91, 7.72]} \ No newline at end of file diff --git a/annotations_1/Z2eTW8qZBtk_filtered.json b/annotations_1/Z2eTW8qZBtk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40382805a93b0f6154f94bffdac3d63ebdbedc37 --- /dev/null +++ b/annotations_1/Z2eTW8qZBtk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.04], [17.0, 18.87], [21.0, 21.42], [22.0, 25.27], [31.0, 32.41], [37.0, 38.42], [40.0, 48.66], [51.0, 60.54], [66.0, 66.5], [72.0, 73.26], [79.0, 79.57], [88.0, 89.38], [90.0, 90.64], [91.0, 92.64], [94.0, 96.35], [97.0, 108.51], [110.0, 110.47], [112.0, 115.6], [116.0, 116.67], [120.0, 120.83], [126.0, 127.01], [133.0, 155.38], [160.0, 161.64], [167.0, 167.95], [173.0, 174.26], [180.0, 184.25], [184.0, 192.69], [194.0, 209.65], [214.0, 215.5], [227.0, 228.24], [236.0, 237.91], [240.0, 241.08], [243.0, 254.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.29, 0.0, 0.0, 30.9, 0.0, 0.0, 31.48, 31.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.69, 30.49, 0.0, 31.8, 0.0, 0.0, 0.0, 30.46, 0.0, 0.0, 0.0, 29.51, 30.19, 30.73, 0.0, 0.0, 0.0, 0.0, 29.67], "audiomae_on_audioset": [[["music", 57.78], ["bass guitar", 12.04], ["guitar", 10.79]], null, null, [["music", 80.24], ["singing", 2.5], ["musical instrument", 1.76]], null, null, [["music", 83.98], ["reggae", 1.58], ["singing", 1.13]], [["music", 75.45], ["reggae", 9.39], ["funk", 0.89]], null, null, null, null, null, null, [["music", 48.06], ["reggae", 14.34], ["singing", 4.11]], [["music", 76.51], ["moo", 3.17], ["cattle, bovinae", 2.76]], null, [["music", 77.51], ["reggae", 3.12], ["bass guitar", 2.37]], null, null, null, [["music", 84.93], ["singing", 1.58], ["reggae", 1.06]], null, null, null, [["music", 72.7], ["didgeridoo", 6.51], ["musical instrument", 2.6]], [["music", 85.9], ["singing", 1.78], ["reggae", 1.0]], [["music", 68.37], ["reggae", 7.38], ["bass guitar", 2.87]], null, null, null, null, [["music", 77.35], ["didgeridoo", 2.89], ["bleat", 2.64]]], "duration": [2.04, 1.87, 0.42, 3.27, 1.41, 1.42, 8.66, 9.54, 0.5, 1.26, 0.57, 1.38, 0.64, 1.64, 2.35, 11.51, 0.47, 3.6, 0.67, 0.83, 1.01, 22.38, 1.64, 0.95, 1.26, 4.25, 8.69, 15.65, 1.5, 1.24, 1.91, 1.08, 11.16]} \ No newline at end of file diff --git a/annotations_1/Z2xooz6844k_filtered.json b/annotations_1/Z2xooz6844k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36f17e7aa3953f58e88ed9ae7a285178b5f8d73f --- /dev/null +++ b/annotations_1/Z2xooz6844k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 25.39], [27.0, 70.95], [75.0, 82.46], [95.0, 102.36], [104.0, 127.28], [133.0, 143.9], [146.0, 146.06]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [33.89, 0.0, 33.43, 33.36, 31.58, 33.84, 0.0], "audiomae_on_audioset": [[["music", 72.52], ["reggae", 4.95], ["electronic music", 3.51]], null, [["music", 87.54], ["didgeridoo", 3.14], ["musical instrument", 0.85]], [["music", 76.18], ["electronic music", 5.11], ["throbbing", 4.12]], [["music", 91.09], ["electronic music", 3.39], ["throbbing", 0.67]], [["music", 30.02], ["speech", 29.46], ["foghorn", 3.25]], null], "duration": [9.39, 43.95, 7.46, 7.36, 23.28, 10.9, 0.06]} \ No newline at end of file diff --git a/annotations_1/Z4G5St8apOQ_filtered.json b/annotations_1/Z4G5St8apOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f731d3f111453e3a522edb43a51d79eee15fd18c --- /dev/null +++ b/annotations_1/Z4G5St8apOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.03], [10.0, 10.47], [14.0, 14.42], [22.0, 59.75], [61.0, 129.34], [130.0, 131.04], [132.0, 133.35], [134.0, 134.92], [137.0, 137.81], [141.0, 141.25], [142.0, 142.74], [143.0, 144.85], [145.0, 150.08], [151.0, 151.17], [154.0, 156.0], [157.0, 158.87], [162.0, 164.64], [166.0, 166.67], [167.0, 167.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.77, 0.0, 35.32, 0.0, 38.19, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.83], ["hum", 13.28], ["throbbing", 9.66]], null, [["music", 36.92], ["speech", 8.29], ["musical instrument", 5.88]], null, [["music", 38.26], ["hum", 13.97], ["mains hum", 9.43]], null, null], "duration": [0.03, 0.47, 0.42, 37.75, 68.34, 1.04, 1.35, 0.92, 0.81, 0.25, 0.74, 1.85, 5.08, 0.17, 2.0, 1.87, 2.64, 0.67, 0.98]} \ No newline at end of file diff --git a/annotations_1/Z4ScRG9SDSI_filtered.json b/annotations_1/Z4ScRG9SDSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb7134de11a30ec9f1a2cd24c99df22f57975a6f --- /dev/null +++ b/annotations_1/Z4ScRG9SDSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.12], [6.0, 6.54], [9.0, 10.96], [13.0, 12.72], [16.0, 16.46], [17.0, 18.69], [26.0, 27.09], [29.0, 30.18], [35.0, 46.09], [53.0, 54.28], [56.0, 57.54], [61.0, 61.8], [65.0, 64.69], [70.0, 70.75], [71.0, 73.7], [82.0, 82.14], [91.0, 94.15], [94.0, 94.59], [95.0, 96.65], [99.0, 100.04], [102.0, 103.76], [106.0, 105.6], [107.0, 112.26], [114.0, 114.78], [118.0, 120.29], [121.0, 121.22], [122.0, 123.06], [126.0, 125.86], [126.0, 126.39], [129.0, 131.11], [133.0, 132.87], [135.0, 135.38], [137.0, 142.92], [144.0, 145.79], [150.0, 152.15], [157.0, 156.63], [160.0, 160.29], [170.0, 171.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.26, 0.0, 0.0, 0.0, 0.0, 0.0, 88.64, 0.0, 35.96, 0.0, 0.0, 0.0, 0.0, 0.0, 60.23, 0.0, 86.64, 0.0, 0.0, 0.0, 0.0, 47.46, 0.0, 0.0, 73.51, 0.0, 31.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 72.83], ["musical instrument", 2.63], ["groan", 2.17]], null, null, null, null, null, null, null, [["dog", 20.85], ["music", 19.57], ["animal", 16.57]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.91], ["music", 22.14], ["electronic music", 3.74]], null, null, null, null, [["speech", 44.13], ["fly, housefly", 10.07], ["insect", 7.95]], null, null, null], "duration": [1.12, 0.54, 1.96, -0.28, 0.46, 1.69, 1.09, 1.18, 11.09, 1.28, 1.54, 0.8, -0.31, 0.75, 2.7, 0.14, 3.15, 0.59, 1.65, 1.04, 1.76, -0.4, 5.26, 0.78, 2.29, 0.22, 1.06, -0.14, 0.39, 2.11, -0.13, 0.38, 5.92, 1.79, 2.15, -0.37, 0.29, 1.53]} \ No newline at end of file diff --git a/annotations_1/Z4kBo6FO8bc_filtered.json b/annotations_1/Z4kBo6FO8bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e9f95b85d5276cd80dcbb31edb02fe67f4af9ae --- /dev/null +++ b/annotations_1/Z4kBo6FO8bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.31], [8.0, 13.73], [17.0, 18.18], [19.0, 21.86], [23.0, 27.8], [33.0, 33.4], [38.0, 41.54], [46.0, 46.28], [51.0, 51.33], [56.0, 56.34], [65.0, 85.83], [96.0, 96.55], [99.0, 99.89], [113.0, 113.78]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.23, 0.0, 42.98, 49.18, 0.0, 35.1, 0.0, 0.0, 0.0, 30.14, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 60.23], ["throbbing", 9.52], ["hum", 8.34]], null, [["music", 73.18], ["drum machine", 4.49], ["musical instrument", 2.39]], [["music", 70.96], ["bass guitar", 5.02], ["guitar", 1.88]], null, [["music", 21.53], ["whack, thwack", 12.7], ["fly, housefly", 8.08]], null, null, null, [["music", 71.42], ["speech", 7.5], ["boing", 4.09]], null, null, null], "duration": [0.31, 5.73, 1.18, 2.86, 4.8, 0.4, 3.54, 0.28, 0.33, 0.34, 20.83, 0.55, 0.89, 0.78]} \ No newline at end of file diff --git a/annotations_1/Z6SklaeTne8_filtered.json b/annotations_1/Z6SklaeTne8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a49b316f4e830a960c0cacc22ca4eca1b0ace26 --- /dev/null +++ b/annotations_1/Z6SklaeTne8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 68.5], [73.0, 79.14], [80.0, 81.08], [87.0, 118.84], [119.0, 138.15], [139.0, 148.24], [149.0, 149.55], [151.0, 166.51], [167.0, 183.41], [184.0, 186.43], [186.0, 189.41], [190.0, 191.15], [192.0, 192.62], [195.0, 197.04], [199.0, 199.2], [201.0, 200.87], [203.0, 205.21], [206.0, 212.82]], "keep_status": [false, true, false, false, false, true, false, true, true, true, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 30.09, 0.0, 0.0, 28.99, 32.56, 0.0, 29.57, 29.62, 32.7, 33.76, 0.0, 0.0, 45.98, 0.0, 0.0, 93.29, 42.44], "audiomae_on_audioset": [null, [["music", 32.54], ["throbbing", 9.18], ["speech", 7.16]], null, null, [["speech", 66.72], ["music", 7.45], ["vehicle", 5.18]], [["music", 54.06], ["smash, crash", 6.77], ["hum", 5.61]], null, [["music", 51.82], ["hum", 7.06], ["buzz", 4.15]], [["music", 26.83], ["mains hum", 14.91], ["hum", 13.27]], [["speech", 40.3], ["hum", 11.33], ["throbbing", 6.93]], [["speech", 33.26], ["throbbing", 9.95], ["music", 6.73]], null, null, [["music", 74.55], ["guitar", 4.29], ["musical instrument", 4.14]], null, null, null, [["music", 23.22], ["hum", 13.79], ["throbbing", 6.99]]], "duration": [33.5, 6.14, 1.08, 31.84, 19.15, 9.24, 0.55, 15.51, 16.41, 2.43, 3.41, 1.15, 0.62, 2.04, 0.2, -0.13, 2.21, 6.82]} \ No newline at end of file diff --git a/annotations_1/Z6cDbMLcxQI_filtered.json b/annotations_1/Z6cDbMLcxQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc8488b86a3d13f36e279d3a2ea2ead8ff1fc126 --- /dev/null +++ b/annotations_1/Z6cDbMLcxQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.34], [11.0, 11.65], [12.0, 12.41], [14.0, 14.55], [19.0, 19.43], [28.0, 28.34], [41.0, 43.36], [46.0, 51.8], [64.0, 68.08], [69.0, 74.12], [78.0, 81.6], [85.0, 103.2], [106.0, 129.34], [131.0, 136.44], [138.0, 144.39], [145.0, 145.74], [147.0, 151.41], [153.0, 157.77]], "keep_status": [false, false, false, false, false, false, true, true, true, true, true, false, true, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.1, 30.75, 30.85, 30.91, 30.35, 32.18, 32.1, 33.04, 31.35, 0.0, 60.23, 44.6], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 41.13], ["speech", 13.82], ["musical instrument", 6.01]], [["speech", 16.93], ["music", 13.61], ["livestock, farm animals, working animals", 13.04]], [["speech", 38.28], ["music", 16.17], ["reverberation", 5.38]], [["cowbell", 15.92], ["didgeridoo", 15.39], ["livestock, farm animals, working animals", 10.22]], [["music", 14.81], ["livestock, farm animals, working animals", 12.82], ["speech", 11.41]], [["cattle, bovinae", 29.76], ["moo", 28.09], ["livestock, farm animals, working animals", 26.41]], [["music", 40.97], ["fly, housefly", 10.14], ["livestock, farm animals, working animals", 8.73]], [["music", 32.58], ["buzz", 13.91], ["vehicle", 12.77]], [["buzz", 20.33], ["music", 18.59], ["fly, housefly", 13.26]], null, null, [["music", 52.58], ["theremin", 12.78], ["synthesizer", 7.77]]], "duration": [0.34, 0.65, 0.41, 0.55, 0.43, 0.34, 2.36, 5.8, 4.08, 5.12, 3.6, 18.2, 23.34, 5.44, 6.39, 0.74, 4.41, 4.77]} \ No newline at end of file diff --git a/annotations_1/Z8JHamH3gW4_filtered.json b/annotations_1/Z8JHamH3gW4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95de74ff7933a81b23f160b53225435d9eb4d417 --- /dev/null +++ b/annotations_1/Z8JHamH3gW4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 48.84], [56.0, 57.23], [58.0, 59.46], [61.0, 62.51], [65.0, 66.04], [66.0, 67.29], [68.0, 86.43], [93.0, 94.66], [96.0, 98.66]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.68, 0.0, 53.16], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 59.37], ["explosion", 8.99], ["burst, pop", 3.7]], null, null], "duration": [0.84, 1.23, 1.46, 1.51, 1.04, 1.29, 18.43, 1.66, 2.66]} \ No newline at end of file diff --git a/annotations_1/Z9h-ht1mVkw_filtered.json b/annotations_1/Z9h-ht1mVkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8842e3aa67c1aeb28fe2cd5fe83036179279b530 --- /dev/null +++ b/annotations_1/Z9h-ht1mVkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 35.48], [38.0, 64.2], [65.0, 176.93]], "keep_status": [false, false, false], "silence_prob": [0.0, 34.36, 0.0], "audiomae_on_audioset": [null, [["music", 44.72], ["speech", 34.91], ["didgeridoo", 4.98]], null], "duration": [0.48, 26.2, 111.93]} \ No newline at end of file diff --git a/annotations_1/Z9kPRWAjSNo_filtered.json b/annotations_1/Z9kPRWAjSNo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb9b50762d9dc9c079233e1de59e7c6ae1215d70 --- /dev/null +++ b/annotations_1/Z9kPRWAjSNo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 13.53], [16.0, 31.23], [32.0, 32.27], [33.0, 51.78], [53.0, 57.33], [61.0, 69.08], [70.0, 139.87]], "keep_status": [false, false, false, false, true, true, false], "silence_prob": [29.82, 30.26, 0.0, 29.87, 30.18, 29.89, 0.0], "audiomae_on_audioset": [[["music", 72.15], ["electronic music", 4.4], ["trance music", 2.35]], [["music", 72.14], ["throbbing", 5.73], ["hum", 3.19]], null, [["music", 59.84], ["throbbing", 18.59], ["hum", 13.28]], [["speech", 47.82], ["vehicle", 12.28], ["music", 9.28]], [["music", 41.78], ["cacophony", 11.57], ["hum", 9.83]], null], "duration": [10.53, 15.23, 0.27, 18.78, 4.33, 8.08, 69.87]} \ No newline at end of file diff --git a/annotations_1/Z9vRmexWHUo_filtered.json b/annotations_1/Z9vRmexWHUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2fce7b59895edd710b34702f3c60b4992103ebb --- /dev/null +++ b/annotations_1/Z9vRmexWHUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [2.0, 3.43], [5.0, 17.52], [28.0, 36.51], [41.0, 46.04], [51.0, 53.33], [55.0, 56.59], [59.0, 59.37], [60.0, 61.6], [76.0, 77.82], [80.0, 81.75], [85.0, 85.16], [90.0, 91.99], [99.0, 100.03], [104.0, 108.18], [115.0, 115.15]], "keep_status": [false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.13, 35.3, 37.84, 36.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.01, 0.0], "audiomae_on_audioset": [null, null, [["music", 47.17], ["hum", 13.06], ["didgeridoo", 9.15]], [["music", 57.27], ["ambient music", 11.15], ["electronic music", 3.94]], [["music", 40.45], ["gong", 10.06], ["didgeridoo", 5.53]], [["music", 41.35], ["moo", 11.35], ["cattle, bovinae", 10.8]], null, null, null, null, null, null, null, null, [["music", 44.48], ["hum", 15.36], ["throbbing", 11.21]], null], "duration": [0.38, 1.43, 12.52, 8.51, 5.04, 2.33, 1.59, 0.37, 1.6, 1.82, 1.75, 0.16, 1.99, 1.03, 4.18, 0.15]} \ No newline at end of file diff --git a/annotations_1/Z9zrMe8Gn1E_filtered.json b/annotations_1/Z9zrMe8Gn1E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5e6994a61827c631c9a24a79a1d79ebedc53424 --- /dev/null +++ b/annotations_1/Z9zrMe8Gn1E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 18.03], [22.0, 63.58], [65.0, 65.3], [66.0, 65.84], [66.0, 65.87], [66.0, 65.94], [66.0, 66.09], [66.0, 88.91]], "keep_status": [true, false, false, false, false, false, false, false], "silence_prob": [36.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.39], "audiomae_on_audioset": [[["music", 44.03], ["clarinet", 10.74], ["musical instrument", 6.32]], null, null, null, null, null, null, [["music", 62.34], ["musical instrument", 7.07], ["trombone", 4.99]]], "duration": [12.03, 41.58, 0.3, -0.16, -0.13, -0.06, 0.09, 22.91]} \ No newline at end of file diff --git a/annotations_1/ZBqZpBkiLiI_filtered.json b/annotations_1/ZBqZpBkiLiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b722cb0893434fefe3879667dd70453604446a9 --- /dev/null +++ b/annotations_1/ZBqZpBkiLiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.06], [11.0, 11.4], [16.0, 18.62], [22.0, 25.39], [27.0, 28.0], [34.0, 36.14], [37.0, 38.1], [39.0, 40.68], [48.0, 48.37], [61.0, 61.21], [63.0, 64.44], [68.0, 68.17], [84.0, 85.04], [86.0, 86.91], [99.0, 99.52], [102.0, 102.07], [103.0, 102.91], [103.0, 103.86], [105.0, 105.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 65.09, 84.98, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.06, 0.4, 2.62, 3.39, 1.0, 2.14, 1.1, 1.68, 0.37, 0.21, 1.44, 0.17, 1.04, 0.91, 0.52, 0.07, -0.09, 0.86, 0.81]} \ No newline at end of file diff --git a/annotations_1/ZBvJyUTIU0k_filtered.json b/annotations_1/ZBvJyUTIU0k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..266b08261d8fee651753bc5a7d7c7e328a7eb9f2 --- /dev/null +++ b/annotations_1/ZBvJyUTIU0k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 17.9], [20.0, 20.01], [20.0, 20.39], [24.0, 23.95], [24.0, 118.72], [120.0, 120.45], [121.0, 131.3], [132.0, 141.05], [143.0, 147.65], [150.0, 171.27], [173.0, 175.51], [176.0, 177.65]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [30.33, 0.0, 0.0, 0.0, 0.0, 0.0, 52.74, 76.7, 59.24, 31.67, 40.29, 0.0], "audiomae_on_audioset": [[["speech", 26.55], ["music", 12.87], ["insect", 9.57]], null, null, null, null, null, null, null, null, [["music", 68.95], ["hum", 6.74], ["electronic music", 3.2]], [["whale vocalization", 29.29], ["music", 27.29], ["speech", 8.76]], null], "duration": [7.9, 0.01, 0.39, -0.05, 94.72, 0.45, 10.3, 9.05, 4.65, 21.27, 2.51, 1.65]} \ No newline at end of file diff --git a/annotations_1/ZCTqZhZRYl0_filtered.json b/annotations_1/ZCTqZhZRYl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..572adda2952a7d46ba0bed4829a2056858911136 --- /dev/null +++ b/annotations_1/ZCTqZhZRYl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.5], [8.0, 11.65], [13.0, 16.46], [21.0, 24.26], [26.0, 29.42], [30.0, 35.38], [36.0, 37.34], [38.0, 39.21], [41.0, 44.52], [47.0, 63.42], [66.0, 70.29], [72.0, 76.87], [83.0, 86.86], [89.0, 91.12], [92.0, 102.07], [102.0, 102.44], [102.0, 104.06], [104.0, 120.68], [122.0, 122.81], [125.0, 126.67], [129.0, 129.22], [130.0, 132.39], [135.0, 135.7], [138.0, 138.6], [143.0, 143.61], [145.0, 145.61], [146.0, 147.83], [149.0, 149.62], [152.0, 153.2], [155.0, 162.21], [163.0, 164.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [63.53, 95.37, 71.14, 97.22, 99.99, 82.97, 0.0, 0.0, 99.93, 98.8, 98.19, 99.16, 99.95, 75.72, 94.37, 0.0, 60.14, 45.88, 0.0, 0.0, 0.0, 79.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.65], ["theremin", 13.58], ["didgeridoo", 9.02]], null, null, null, null, null, null, null, null, null, null, null, [["music", 48.74], ["theremin", 16.77], ["musical instrument", 3.43]], null], "duration": [3.5, 3.65, 3.46, 3.26, 3.42, 5.38, 1.34, 1.21, 3.52, 16.42, 4.29, 4.87, 3.86, 2.12, 10.07, 0.44, 2.06, 16.68, 0.81, 1.67, 0.22, 2.39, 0.7, 0.6, 0.61, 0.61, 1.83, 0.62, 1.2, 7.21, 1.44]} \ No newline at end of file diff --git a/annotations_1/ZCZyxZYgKIg_filtered.json b/annotations_1/ZCZyxZYgKIg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a113b94c92b40ec8e0f5d58db05b3a1c38d29bb --- /dev/null +++ b/annotations_1/ZCZyxZYgKIg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.32], [20.0, 22.91], [24.0, 30.4], [31.0, 34.77], [36.0, 36.24], [38.0, 38.4], [42.0, 42.52], [44.0, 44.32], [48.0, 49.6], [51.0, 53.2], [54.0, 55.92], [57.0, 57.67], [62.0, 63.51], [66.0, 68.08], [70.0, 75.09], [76.0, 76.62], [78.0, 79.25], [83.0, 87.54], [89.0, 94.66], [100.0, 102.02], [105.0, 104.95], [106.0, 110.37], [114.0, 114.25], [115.0, 114.99], [115.0, 115.33], [115.0, 116.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [98.86, 99.95, 79.07, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 96.04, 97.92, 0.0, 0.0, 90.95, 49.04, 35.98, 0.0, 40.77, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 21.74], ["whack, thwack", 7.77], ["animal", 4.36]], [["music", 32.44], ["guitar", 8.95], ["speech", 6.81]], null, [["speech", 77.76], ["sidetone", 3.17], ["boing", 2.59]], null, null, null, null], "duration": [2.32, 2.91, 6.4, 3.77, 0.24, 0.4, 0.52, 0.32, 1.6, 2.2, 1.92, 0.67, 1.51, 2.08, 5.09, 0.62, 1.25, 4.54, 5.66, 2.02, -0.05, 4.37, 0.25, -0.01, 0.33, 1.99]} \ No newline at end of file diff --git a/annotations_1/ZCdhsYpdRck_filtered.json b/annotations_1/ZCdhsYpdRck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5b21841e218866747ba0032f9a9491671a4a3e4 --- /dev/null +++ b/annotations_1/ZCdhsYpdRck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.73], [6.0, 9.05], [10.0, 12.95], [14.0, 16.56], [17.0, 20.29], [22.0, 25.22], [26.0, 31.43], [33.0, 34.97], [36.0, 38.04], [40.0, 46.33], [48.0, 53.76], [55.0, 57.32], [59.0, 62.45], [64.0, 66.45], [69.0, 70.11], [71.0, 71.78], [73.0, 90.36], [92.0, 94.8], [97.0, 97.61], [99.0, 101.21], [104.0, 106.51], [108.0, 110.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [82.43, 88.46, 67.76, 99.95, 84.07, 93.76, 75.39, 0.0, 97.92, 71.87, 86.45, 99.71, 95.09, 78.89, 0.0, 0.0, 45.46, 98.36, 0.0, 80.29, 77.03, 95.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 13.47], ["hum", 10.95], ["chirp tone", 5.55]], null, null, null, null, null], "duration": [3.73, 3.05, 2.95, 2.56, 3.29, 3.22, 5.43, 1.97, 2.04, 6.33, 5.76, 2.32, 3.45, 2.45, 1.11, 0.78, 17.36, 2.8, 0.61, 2.21, 2.51, 2.71]} \ No newline at end of file diff --git a/annotations_1/ZD9DyYVR3BI_filtered.json b/annotations_1/ZD9DyYVR3BI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a8e543dc578d5ddb2a3e721ec05e9a77cb5f1e5 --- /dev/null +++ b/annotations_1/ZD9DyYVR3BI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.14], [20.0, 20.17], [22.0, 25.66], [27.0, 27.94], [30.0, 33.91], [35.0, 36.26], [38.0, 38.89], [40.0, 40.58], [41.0, 41.82], [45.0, 46.2], [47.0, 46.8], [48.0, 49.69], [50.0, 52.0], [53.0, 54.18], [55.0, 56.47], [57.0, 61.86], [64.0, 80.22], [86.0, 89.01], [90.0, 99.91], [101.0, 101.53], [112.0, 112.38], [114.0, 114.05], [124.0, 126.49], [128.0, 127.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.1, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.86, 0.0, 0.0, 50.11, 29.92, 34.04, 31.36, 0.0, 0.0, 0.0, 54.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 16.13], ["music", 15.18], ["throbbing", 9.78]], null, null, null, [["speech", 61.58], ["music", 7.08], ["machine gun", 6.3]], [["speech", 27.45], ["music", 21.64], ["fly, housefly", 6.94]], [["music", 37.17], ["synthesizer", 8.99], ["speech", 7.54]], null, null, null, null, null], "duration": [1.14, 0.17, 3.66, 0.94, 3.91, 1.26, 0.89, 0.58, 0.82, 1.2, -0.2, 1.69, 2.0, 1.18, 1.47, 4.86, 16.22, 3.01, 9.91, 0.53, 0.38, 0.05, 2.49, -0.23]} \ No newline at end of file diff --git a/annotations_1/ZDyEERuK31Y_filtered.json b/annotations_1/ZDyEERuK31Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e4a1d741111f27e6740664c98f24bcc567b5916 --- /dev/null +++ b/annotations_1/ZDyEERuK31Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 32.7], [38.0, 46.77], [47.0, 53.42], [54.0, 65.8], [69.0, 75.12], [78.0, 79.03], [81.0, 92.04]], "keep_status": [true, true, false, true, true, false, false], "silence_prob": [30.18, 29.64, 29.64, 29.53, 29.1, 0.0, 29.94], "audiomae_on_audioset": [[["music", 51.38], ["hum", 9.0], ["mains hum", 6.26]], [["speech", 32.36], ["music", 26.75], ["foghorn", 6.59]], [["theremin", 67.33], ["music", 22.91], ["foghorn", 1.1]], [["music", 31.02], ["speech", 13.16], ["vehicle", 8.03]], [["cattle, bovinae", 28.28], ["moo", 23.74], ["livestock, farm animals, working animals", 16.93]], null, [["speech", 43.85], ["livestock, farm animals, working animals", 22.51], ["animal", 13.37]]], "duration": [17.7, 8.77, 6.42, 11.8, 6.12, 1.03, 11.04]} \ No newline at end of file diff --git a/annotations_1/ZFMSluy-4gE_filtered.json b/annotations_1/ZFMSluy-4gE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a053d991562d4363a761a4684cf911d7a93e2a92 --- /dev/null +++ b/annotations_1/ZFMSluy-4gE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.48], [8.0, 9.96], [11.0, 13.0], [14.0, 16.26], [18.0, 19.18], [20.0, 21.66], [24.0, 25.19], [27.0, 27.26], [29.0, 29.29], [32.0, 32.46], [35.0, 36.85], [39.0, 41.0], [51.0, 51.71], [60.0, 65.37], [66.0, 67.36], [69.0, 69.75], [72.0, 73.23], [94.0, 93.95], [96.0, 95.69], [103.0, 103.06], [109.0, 110.0], [111.0, 112.01], [132.0, 133.42], [143.0, 144.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 68.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 0.0, 45.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.84], ["hiccup", 14.88], ["whale vocalization", 6.82]], null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 1.96, 2.0, 2.26, 1.18, 1.66, 1.19, 0.26, 0.29, 0.46, 1.85, 2.0, 0.71, 5.37, 1.36, 0.75, 1.23, -0.05, -0.31, 0.06, 1.0, 1.01, 1.42, 1.86]} \ No newline at end of file diff --git a/annotations_1/ZFXOR2yoWCg_filtered.json b/annotations_1/ZFXOR2yoWCg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a94e3f7d0aca97e134c10c6c4be01c8e36d4c95 --- /dev/null +++ b/annotations_1/ZFXOR2yoWCg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.37], [4.0, 3.87], [4.0, 4.92], [6.0, 13.63], [14.0, 13.83], [14.0, 15.69], [16.0, 16.53], [18.0, 19.09], [21.0, 20.75], [21.0, 22.44], [27.0, 27.4], [66.0, 66.51], [70.0, 70.98], [73.0, 73.85], [78.0, 78.8], [80.0, 114.0], [118.0, 119.3], [148.0, 160.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 39.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.74], "audiomae_on_audioset": [null, null, null, [["speech", 81.52], ["music", 5.27], ["inside, large room or hall", 2.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.91], ["mains hum", 10.91], ["hum", 7.95]]], "duration": [1.37, -0.13, 0.92, 7.63, -0.17, 1.69, 0.53, 1.09, -0.25, 1.44, 0.4, 0.51, 0.98, 0.85, 0.8, 34.0, 1.3, 12.12]} \ No newline at end of file diff --git a/annotations_1/ZFrDw6oQai4_filtered.json b/annotations_1/ZFrDw6oQai4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ddbbe5ffe690b3cf3acc1b2449cf9669f07f227 --- /dev/null +++ b/annotations_1/ZFrDw6oQai4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 69.79], [71.0, 73.72], [75.0, 79.54], [80.0, 82.14], [83.0, 84.64], [86.0, 87.22], [88.0, 89.13], [90.0, 92.7], [93.0, 119.35], [120.0, 122.23], [123.0, 124.93], [127.0, 126.86], [128.0, 127.94], [129.0, 130.28], [131.0, 132.29], [137.0, 138.23], [140.0, 140.36], [145.0, 146.52], [148.0, 148.34], [151.0, 153.72], [154.0, 155.19], [156.0, 157.18], [159.0, 160.07], [162.0, 161.65], [162.0, 163.63], [170.0, 170.16], [171.0, 171.46], [177.0, 178.51], [179.0, 180.67], [182.0, 183.9], [185.0, 185.65], [186.0, 187.46], [191.0, 191.64], [192.0, 192.2], [193.0, 195.15], [195.0, 196.82]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [48.61, 73.51, 74.6, 42.58, 0.0, 0.0, 0.0, 72.6, 34.3, 48.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.33, 0.0], "audiomae_on_audioset": [[["creak", 18.93], ["speech", 14.78], ["hum", 13.34]], null, null, [["cattle, bovinae", 37.97], ["speech", 27.5], ["moo", 22.47]], null, null, null, null, [["hum", 53.54], ["mains hum", 20.66], ["throbbing", 16.46]], [["hum", 29.93], ["speech", 22.92], ["mains hum", 13.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 25.23], ["hum", 8.25], ["mains hum", 5.92]], null], "duration": [3.79, 2.72, 4.54, 2.14, 1.64, 1.22, 1.13, 2.7, 26.35, 2.23, 1.93, -0.14, -0.06, 1.28, 1.29, 1.23, 0.36, 1.52, 0.34, 2.72, 1.19, 1.18, 1.07, -0.35, 1.63, 0.16, 0.46, 1.51, 1.67, 1.9, 0.65, 1.46, 0.64, 0.2, 2.15, 1.82]} \ No newline at end of file diff --git a/annotations_1/ZH81ElJu-Jw_filtered.json b/annotations_1/ZH81ElJu-Jw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b639004807ede0cbe144842f59975ef4e670cef6 --- /dev/null +++ b/annotations_1/ZH81ElJu-Jw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.49], [4.0, 6.13], [7.0, 7.99], [9.0, 9.8], [12.0, 13.15], [20.0, 20.63], [22.0, 22.59], [23.0, 24.68], [29.0, 29.32], [35.0, 34.99], [36.0, 37.35], [39.0, 40.0], [41.0, 41.62], [43.0, 44.61], [51.0, 51.19], [51.0, 52.19], [53.0, 54.58], [56.0, 56.98], [66.0, 67.78], [73.0, 73.9], [75.0, 76.76], [80.0, 80.76], [83.0, 84.38], [86.0, 87.2], [92.0, 92.52], [94.0, 94.56], [97.0, 97.53], [99.0, 99.81], [103.0, 104.18], [106.0, 106.14], [107.0, 107.94], [109.0, 110.96], [114.0, 113.66], [116.0, 116.6], [125.0, 125.56], [127.0, 128.43], [130.0, 130.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.49, 2.13, 0.99, 0.8, 1.15, 0.63, 0.59, 1.68, 0.32, -0.01, 1.35, 1.0, 0.62, 1.61, 0.19, 1.19, 1.58, 0.98, 1.78, 0.9, 1.76, 0.76, 1.38, 1.2, 0.52, 0.56, 0.53, 0.81, 1.18, 0.14, 0.94, 1.96, -0.34, 0.6, 0.56, 1.43, 0.72]} \ No newline at end of file diff --git a/annotations_1/ZIHWAugnBWI_filtered.json b/annotations_1/ZIHWAugnBWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1009cbe7c4b82baf537e8469d43179d34aaece3 --- /dev/null +++ b/annotations_1/ZIHWAugnBWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.18], [5.0, 6.88], [12.0, 11.99], [16.0, 17.25], [19.0, 20.34], [31.0, 31.87], [35.0, 37.23], [44.0, 45.28], [47.0, 50.04], [60.0, 60.15], [61.0, 65.53], [69.0, 68.74], [70.0, 82.58], [84.0, 85.16], [86.0, 100.5], [101.0, 114.49], [115.0, 116.38], [117.0, 137.03], [138.0, 139.08], [141.0, 141.18], [145.0, 144.96], [146.0, 147.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.17, 0.0, 47.94, 0.0, 37.43, 0.0, 43.79, 0.0, 33.96, 58.64, 0.0, 33.61, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 61.09], ["hum", 7.34], ["throbbing", 6.48]], null, [["music", 64.5], ["drum machine", 10.74], ["synthesizer", 6.89]], null, [["music", 63.96], ["throbbing", 11.96], ["drum machine", 5.16]], null, [["speech", 72.16], ["thunk", 11.14], ["whack, thwack", 6.78]], null, null, [["whack, thwack", 72.64], ["speech", 5.82], ["thump, thud", 1.91]], null, null, null, null], "duration": [1.18, 1.88, -0.01, 1.25, 1.34, 0.87, 2.23, 1.28, 3.04, 0.15, 4.53, -0.26, 12.58, 1.16, 14.5, 13.49, 1.38, 20.03, 1.08, 0.18, -0.04, 1.12]} \ No newline at end of file diff --git a/annotations_1/ZIdKsGWToLo_filtered.json b/annotations_1/ZIdKsGWToLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..821e9661c230b688fac803b72d60e46e618469e1 --- /dev/null +++ b/annotations_1/ZIdKsGWToLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.61], [7.0, 7.62], [19.0, 20.14], [21.0, 22.86], [26.0, 27.94], [29.0, 30.64], [33.0, 34.89], [36.0, 35.99], [37.0, 38.94], [40.0, 41.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 0.62, 1.14, 1.86, 1.94, 1.64, 1.89, -0.01, 1.94, 1.08]} \ No newline at end of file diff --git a/annotations_1/ZJF_1LQbKiM_filtered.json b/annotations_1/ZJF_1LQbKiM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6b85667ce0e00f037a71203be33c9ba59b93f41 --- /dev/null +++ b/annotations_1/ZJF_1LQbKiM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.1], [11.0, 11.97], [13.0, 16.95], [20.0, 43.28], [49.0, 58.65], [62.0, 71.68], [72.0, 72.89], [74.0, 76.11], [77.0, 102.42], [107.0, 141.61], [145.0, 158.52]], "keep_status": [false, false, true, true, true, true, false, true, true, false, false], "silence_prob": [43.08, 0.0, 41.01, 31.34, 29.77, 30.65, 0.0, 33.5, 30.13, 0.0, 61.67], "audiomae_on_audioset": [[["music", 63.22], ["hum", 10.03], ["throbbing", 3.96]], null, [["speech", 54.45], ["music", 5.49], ["whale vocalization", 4.41]], [["music", 54.59], ["speech", 6.99], ["theremin", 5.91]], [["music", 31.17], ["cacophony", 19.61], ["hum", 6.06]], [["speech", 55.65], ["vehicle", 9.01], ["hum", 5.0]], null, [["vehicle", 29.5], ["aircraft", 27.17], ["fixed-wing aircraft, airplane", 9.89]], [["speech", 30.51], ["vehicle", 24.18], ["car", 12.69]], null, null], "duration": [6.1, 0.97, 3.95, 23.28, 9.65, 9.68, 0.89, 2.11, 25.42, 34.61, 13.52]} \ No newline at end of file diff --git a/annotations_1/ZKfVrsrm_ac_filtered.json b/annotations_1/ZKfVrsrm_ac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c105f02c66403b479b34f6c6eebf8e3fd4a4013 --- /dev/null +++ b/annotations_1/ZKfVrsrm_ac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [12.0, 12.18], [12.0, 12.68], [14.0, 14.64], [18.0, 18.39], [42.0, 42.3], [43.0, 42.6], [59.0, 60.93], [64.0, 64.1], [71.0, 72.33], [74.0, 74.43], [81.0, 81.75], [85.0, 87.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 0.18, 0.68, 0.64, 0.39, 0.3, -0.4, 1.93, 0.1, 1.33, 0.43, 0.75, 2.24]} \ No newline at end of file diff --git a/annotations_1/ZKgJtlJDPcc_filtered.json b/annotations_1/ZKgJtlJDPcc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ea808ca2521a7234ca0759893dce50c8e89f1e5 --- /dev/null +++ b/annotations_1/ZKgJtlJDPcc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 11.5], [13.0, 13.47], [18.0, 22.11], [24.0, 25.34], [29.0, 29.86], [31.0, 37.17], [38.0, 38.35], [39.0, 42.74], [45.0, 49.27], [50.0, 52.24], [54.0, 70.16], [71.0, 74.58], [76.0, 81.7], [82.0, 83.27], [84.0, 87.59], [89.0, 90.24], [91.0, 91.96], [93.0, 97.7], [99.0, 106.78], [112.0, 127.68], [128.0, 129.47]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false], "silence_prob": [33.36, 0.0, 39.33, 0.0, 0.0, 34.96, 0.0, 57.17, 62.89, 51.99, 63.96, 63.42, 78.38, 0.0, 85.35, 0.0, 0.0, 36.87, 39.54, 42.0, 0.0], "audiomae_on_audioset": [[["hum", 19.55], ["music", 14.29], ["throbbing", 10.75]], null, [["speech", 67.99], ["music", 5.24], ["throbbing", 3.34]], null, null, [["groan", 21.45], ["speech", 12.62], ["whack, thwack", 12.28]], null, null, null, null, null, null, null, null, null, null, null, [["music", 18.35], ["thunk", 17.55], ["speech", 17.22]], [["fart", 46.59], ["speech", 14.53], ["mosquito", 7.03]], [["music", 29.38], ["throbbing", 27.1], ["hum", 5.73]], null], "duration": [10.5, 0.47, 4.11, 1.34, 0.86, 6.17, 0.35, 3.74, 4.27, 2.24, 16.16, 3.58, 5.7, 1.27, 3.59, 1.24, 0.96, 4.7, 7.78, 15.68, 1.47]} \ No newline at end of file diff --git a/annotations_1/ZKuscOD0LOM_filtered.json b/annotations_1/ZKuscOD0LOM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..150b0a7081606f0dc7f24315e09b649ad6725b4b --- /dev/null +++ b/annotations_1/ZKuscOD0LOM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.07], [9.0, 14.22], [19.0, 21.0], [22.0, 26.11], [27.0, 39.8], [45.0, 45.08], [46.0, 46.95], [49.0, 51.48], [59.0, 62.78], [64.0, 70.36], [71.0, 71.34], [71.0, 95.61], [98.0, 98.36], [102.0, 105.93], [108.0, 122.82]], "keep_status": [false, false, false, false, true, false, false, false, true, true, false, false, false, true, false], "silence_prob": [73.67, 53.1, 86.45, 52.05, 40.36, 0.0, 0.0, 82.43, 43.08, 49.27, 0.0, 34.1, 0.0, 34.98, 33.19], "audiomae_on_audioset": [null, null, null, null, [["music", 45.26], ["synthesizer", 8.98], ["speech", 5.68]], null, null, null, [["music", 26.21], ["whack, thwack", 17.66], ["didgeridoo", 9.36]], [["music", 30.75], ["speech", 20.13], ["whack, thwack", 12.29]], null, [["music", 56.1], ["speech", 17.74], ["didgeridoo", 8.54]], null, [["music", 37.44], ["hum", 16.84], ["throbbing", 15.43]], [["music", 62.71], ["didgeridoo", 18.31], ["speech", 7.18]]], "duration": [2.07, 5.22, 2.0, 4.11, 12.8, 0.08, 0.95, 2.48, 3.78, 6.36, 0.34, 24.61, 0.36, 3.93, 14.82]} \ No newline at end of file diff --git a/annotations_1/ZLhyjNnrb6s_filtered.json b/annotations_1/ZLhyjNnrb6s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..630cd1f4e4e3ca98839bef1405a0ab8a6ee006ef --- /dev/null +++ b/annotations_1/ZLhyjNnrb6s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.87], [5.0, 10.5], [17.0, 18.99], [21.0, 21.83], [29.0, 36.68], [43.0, 44.02], [49.0, 48.86], [51.0, 51.17], [53.0, 53.67], [55.0, 55.78], [61.0, 61.72], [64.0, 65.79], [69.0, 71.36], [74.0, 94.74], [96.0, 97.11], [98.0, 98.78], [100.0, 101.21], [105.0, 106.89], [108.0, 120.07], [121.0, 121.0], [121.0, 122.44], [126.0, 128.11], [129.0, 129.86], [131.0, 131.58], [133.0, 167.95], [169.0, 171.61], [174.0, 176.07], [179.0, 180.47], [187.0, 191.69], [192.0, 193.6], [194.0, 193.7], [195.0, 197.83], [200.0, 200.55], [204.0, 227.97]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.69, 0.0, 0.0, 30.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.01, 31.43, 0.0, 0.0, 0.0, 0.0, 35.24, 0.0, 0.0, 43.08, 0.0, 0.0, 0.0, 42.84, 51.07, 0.0, 52.92, 0.0, 0.0, 62.47, 0.0, 30.12], "audiomae_on_audioset": [null, [["speech", 42.91], ["music", 17.08], ["echo", 4.93]], null, null, [["music", 53.64], ["speech", 8.4], ["fart", 6.6]], null, null, null, null, null, null, null, [["hum", 28.71], ["mains hum", 15.31], ["speech", 14.58]], [["music", 50.76], ["speech", 9.78], ["boing", 4.06]], null, null, null, null, [["hum", 28.53], ["music", 22.82], ["mains hum", 15.2]], null, null, [["whale vocalization", 34.54], ["music", 17.02], ["rumble", 6.38]], null, null, null, [["music", 66.2], ["hum", 2.8], ["musical instrument", 2.73]], null, null, null, null, null, null, null, [["music", 68.7], ["cacophony", 7.96], ["speech", 3.16]]], "duration": [1.87, 5.5, 1.99, 0.83, 7.68, 1.02, -0.14, 0.17, 0.67, 0.78, 0.72, 1.79, 2.36, 20.74, 1.11, 0.78, 1.21, 1.89, 12.07, 0.0, 1.44, 2.11, 0.86, 0.58, 34.95, 2.61, 2.07, 1.47, 4.69, 1.6, -0.3, 2.83, 0.55, 23.97]} \ No newline at end of file diff --git a/annotations_1/ZLjp7ahdbWc_filtered.json b/annotations_1/ZLjp7ahdbWc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae8294f11ee926eb1ad367bf13ed16bc3988d3cb --- /dev/null +++ b/annotations_1/ZLjp7ahdbWc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.65], [12.0, 13.53], [22.0, 87.4], [89.0, 92.06], [94.0, 96.25], [98.0, 99.5], [104.0, 107.99], [109.0, 110.93], [114.0, 114.84], [116.0, 117.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 73.06, 51.07, 0.0, 60.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.65, 1.53, 65.4, 3.06, 2.25, 1.5, 3.99, 1.93, 0.84, 1.83]} \ No newline at end of file diff --git a/annotations_1/ZLmRWzBjbtU_filtered.json b/annotations_1/ZLmRWzBjbtU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31463ac02d7123247d615ff0908d5dc15c4bbdb9 --- /dev/null +++ b/annotations_1/ZLmRWzBjbtU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.41], [10.0, 12.88], [14.0, 16.61], [18.0, 18.15], [19.0, 23.8], [24.0, 26.06], [28.0, 41.03], [60.0, 60.03], [75.0, 75.68], [77.0, 77.21], [78.0, 78.92], [104.0, 106.37], [111.0, 111.23], [114.0, 114.83], [119.0, 119.33], [137.0, 138.4], [154.0, 153.96], [160.0, 161.05], [162.0, 161.91]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.92, 99.4, 29.51, 0.0, 75.07, 41.4, 36.31, 0.0, 0.0, 0.0, 0.0, 79.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 48.0], ["explosion", 21.02], ["burst, pop", 10.58]], null, null, [["cattle, bovinae", 21.35], ["moo", 14.5], ["wail, moan", 11.46]], [["speech", 61.47], ["hum", 6.15], ["sonar", 5.41]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.41, 2.88, 2.61, 0.15, 4.8, 2.06, 13.03, 0.03, 0.68, 0.21, 0.92, 2.37, 0.23, 0.83, 0.33, 1.4, -0.04, 1.05, -0.09]} \ No newline at end of file diff --git a/annotations_1/ZMlGZcr95To_filtered.json b/annotations_1/ZMlGZcr95To_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a3dc723aee8e0e5fce64a174694b47c97aed5a5 --- /dev/null +++ b/annotations_1/ZMlGZcr95To_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[87.0, 87.49], [89.0, 118.81], [122.0, 127.21], [132.0, 133.24], [137.0, 139.08], [141.0, 141.94], [144.0, 146.31]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 31.6, 30.14, 0.0, 53.84, 0.0, 58.55], "audiomae_on_audioset": [null, [["throbbing", 44.24], ["music", 24.15], ["hum", 16.39]], [["hum", 53.11], ["throbbing", 32.63], ["mains hum", 6.41]], null, null, null, null], "duration": [0.49, 29.81, 5.21, 1.24, 2.08, 0.94, 2.31]} \ No newline at end of file diff --git a/annotations_1/ZMplRnotp8M_filtered.json b/annotations_1/ZMplRnotp8M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5109c6153702e4d02550c015f05eaec3824e27f3 --- /dev/null +++ b/annotations_1/ZMplRnotp8M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.85], [4.0, 4.21], [6.0, 6.51], [13.0, 14.01], [20.0, 22.33], [30.0, 30.81], [34.0, 34.86], [38.0, 41.57], [44.0, 46.2], [48.0, 49.11], [52.0, 53.42], [54.0, 54.9], [59.0, 59.14], [73.0, 72.81], [74.0, 74.93], [80.0, 80.72], [82.0, 81.97], [98.0, 100.04], [101.0, 102.57], [104.0, 105.31], [108.0, 108.94], [110.0, 110.86], [112.0, 113.32], [117.0, 120.28], [121.0, 123.08], [123.0, 125.27], [127.0, 128.14], [131.0, 131.28], [135.0, 145.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 0.0, 70.44, 59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 63.42, 69.61, 0.0, 0.0, 96.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.15, 0.21, 0.51, 1.01, 2.33, 0.81, 0.86, 3.57, 2.2, 1.11, 1.42, 0.9, 0.14, -0.19, 0.93, 0.72, -0.03, 2.04, 1.57, 1.31, 0.94, 0.86, 1.32, 3.28, 2.08, 2.27, 1.14, 0.28, 10.99]} \ No newline at end of file diff --git a/annotations_1/ZOfisAF09AA_filtered.json b/annotations_1/ZOfisAF09AA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72664cc8119de691a5f26174896ce82333d07848 --- /dev/null +++ b/annotations_1/ZOfisAF09AA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 41.23], [44.0, 46.68], [50.0, 56.94], [90.0, 105.68], [108.0, 109.32], [115.0, 116.11], [116.0, 122.42], [126.0, 126.66], [128.0, 139.95], [141.0, 143.01]], "keep_status": [false, true, false, true, false, false, true, false, false, true], "silence_prob": [31.6, 32.79, 32.34, 32.17, 0.0, 0.0, 32.52, 0.0, 33.7, 43.93], "audiomae_on_audioset": [[["music", 68.81], ["hum", 2.79], ["musical instrument", 1.83]], [["music", 58.63], ["sampler", 4.89], ["electronic music", 2.73]], [["music", 59.25], ["hum", 10.44], ["throbbing", 8.26]], [["music", 29.67], ["cattle, bovinae", 18.89], ["moo", 17.86]], null, null, [["music", 38.59], ["livestock, farm animals, working animals", 7.79], ["insect", 7.62]], null, [["music", 70.6], ["psychedelic rock", 5.57], ["musical instrument", 2.56]], [["music", 34.95], ["grunt", 11.49], ["livestock, farm animals, working animals", 7.24]]], "duration": [3.23, 2.68, 6.94, 15.68, 1.32, 1.11, 6.42, 0.66, 11.95, 2.01]} \ No newline at end of file diff --git a/annotations_1/ZP73cUcxidQ_filtered.json b/annotations_1/ZP73cUcxidQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..982e4c6de81a2e6f5a57297c23297f210f5ac333 --- /dev/null +++ b/annotations_1/ZP73cUcxidQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.25], [7.0, 7.42], [10.0, 13.51], [16.0, 17.1], [18.0, 17.98], [18.0, 42.79], [44.0, 77.7], [79.0, 79.25], [79.0, 79.73], [89.0, 95.64], [96.0, 96.35], [97.0, 97.68], [98.0, 98.59], [99.0, 99.72], [100.0, 100.8], [101.0, 102.14], [106.0, 106.61], [116.0, 117.69], [126.0, 149.88], [150.0, 154.58], [156.0, 183.57], [185.0, 185.03], [186.0, 185.97]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 40.55, 0.0, 0.0, 72.75, 0.0, 0.0, 0.0, 38.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.94, 33.83, 42.11, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["fart", 19.78], ["noise", 11.25], ["music", 8.93]], null, null, null, null, null, null, [["speech", 47.75], ["hum", 9.21], ["sidetone", 8.71]], null, null, null, null, null, null, null, null, [["music", 33.98], ["speech", 26.19], ["musical instrument", 8.19]], [["mains hum", 33.81], ["music", 23.77], ["hum", 21.64]], [["music", 40.77], ["hum", 25.23], ["rumble", 9.71]], null, null], "duration": [0.25, 0.42, 3.51, 1.1, -0.02, 24.79, 33.7, 0.25, 0.73, 6.64, 0.35, 0.68, 0.59, 0.72, 0.8, 1.14, 0.61, 1.69, 23.88, 4.58, 27.57, 0.03, -0.03]} \ No newline at end of file diff --git a/annotations_1/ZPCSC8NM87k_filtered.json b/annotations_1/ZPCSC8NM87k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d2136da5d24e151901e2ca3de14138c8a072126 --- /dev/null +++ b/annotations_1/ZPCSC8NM87k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.94], [14.0, 15.48], [17.0, 20.49], [22.0, 23.52], [27.0, 27.94], [28.0, 28.98], [35.0, 41.57], [43.0, 47.16], [48.0, 55.73], [60.0, 108.46], [110.0, 138.6], [142.0, 160.62], [163.0, 180.86], [182.0, 196.7], [199.0, 214.74], [215.0, 216.11]], "keep_status": [true, false, true, false, false, false, false, true, false, false, true, true, false, false, false, false], "silence_prob": [31.2, 0.0, 49.78, 0.0, 0.0, 0.0, 28.83, 28.65, 28.55, 0.0, 29.28, 28.72, 28.87, 29.66, 28.98, 0.0], "audiomae_on_audioset": [[["speech", 21.84], ["music", 13.91], ["throbbing", 12.84]], null, [["music", 30.84], ["theremin", 12.64], ["musical instrument", 5.17]], null, null, null, [["music", 61.35], ["didgeridoo", 10.41], ["noise", 6.69]], [["music", 39.99], ["sound effect", 4.91], ["grunt", 4.31]], [["mains hum", 42.12], ["hum", 39.48], ["throbbing", 4.78]], null, [["music", 48.17], ["hum", 9.23], ["didgeridoo", 7.21]], [["music", 63.32], ["throbbing", 3.33], ["hum", 2.41]], [["music", 68.93], ["throbbing", 4.35], ["speech", 3.76]], [["music", 34.71], ["speech", 26.73], ["cowbell", 12.03]], [["music", 67.16], ["speech", 5.47], ["musical instrument", 2.83]], null], "duration": [5.94, 1.48, 3.49, 1.52, 0.94, 0.98, 6.57, 4.16, 7.73, 48.46, 28.6, 18.62, 17.86, 14.7, 15.74, 1.11]} \ No newline at end of file diff --git a/annotations_1/ZPDbP3gms30_filtered.json b/annotations_1/ZPDbP3gms30_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e152c1c9809c6a90d375a071f9615a0387aaa023 --- /dev/null +++ b/annotations_1/ZPDbP3gms30_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.5], [19.0, 23.84], [24.0, 24.8], [26.0, 31.43], [32.0, 32.36], [33.0, 33.88], [35.0, 35.29], [36.0, 35.77], [36.0, 36.68]], "keep_status": [true, false, false, false, false, false, false, false, false], "silence_prob": [30.11, 30.52, 0.0, 34.64, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 27.04], ["music", 16.17], ["cattle, bovinae", 2.96]], [["livestock, farm animals, working animals", 41.39], ["cattle, bovinae", 28.82], ["moo", 19.38]], null, [["speech", 58.79], ["music", 7.66], ["sidetone", 5.25]], null, null, null, null, null], "duration": [3.5, 4.84, 0.8, 5.43, 0.36, 0.88, 0.29, -0.23, 0.68]} \ No newline at end of file diff --git a/annotations_1/ZPMDA9N1itk_filtered.json b/annotations_1/ZPMDA9N1itk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04037543bf30048da6fde47eb12f5f682cbb7c92 --- /dev/null +++ b/annotations_1/ZPMDA9N1itk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.46], [6.0, 6.61], [8.0, 8.6], [10.0, 10.27], [11.0, 12.28], [19.0, 20.31], [22.0, 29.66], [31.0, 31.16], [32.0, 32.61], [34.0, 34.84], [36.0, 37.3], [39.0, 39.39], [42.0, 42.69], [45.0, 45.91], [46.0, 46.8], [48.0, 53.59], [55.0, 54.94], [55.0, 60.4], [64.0, 64.76], [68.0, 69.28], [70.0, 72.42], [75.0, 75.56], [76.0, 76.72], [81.0, 81.45], [83.0, 83.86], [84.0, 86.07], [86.0, 89.21], [90.0, 90.58], [94.0, 95.54], [97.0, 97.38], [98.0, 99.22], [106.0, 106.03], [115.0, 115.2], [117.0, 118.72], [122.0, 122.69], [124.0, 131.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [86.45, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 78.89, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 82.97, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.53], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.46, 0.61, 0.6, 0.27, 1.28, 1.31, 7.66, 0.16, 0.61, 0.84, 1.3, 0.39, 0.69, 0.91, 0.8, 5.59, -0.06, 5.4, 0.76, 1.28, 2.42, 0.56, 0.72, 0.45, 0.86, 2.07, 3.21, 0.58, 1.54, 0.38, 1.22, 0.03, 0.2, 1.72, 0.69, 7.04]} \ No newline at end of file diff --git a/annotations_1/ZPjREKxiNsQ_filtered.json b/annotations_1/ZPjREKxiNsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09671bc4d13f78a63f073498f094f55c6a369636 --- /dev/null +++ b/annotations_1/ZPjREKxiNsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 62.82], [64.0, 67.93], [70.0, 80.43], [81.0, 85.9], [87.0, 87.45], [88.0, 90.36], [91.0, 92.6], [93.0, 96.04], [98.0, 100.06], [102.0, 122.98], [126.0, 128.14], [129.0, 130.71], [132.0, 134.52], [137.0, 142.01], [143.0, 150.16], [156.0, 160.79], [162.0, 164.52], [166.0, 169.38], [170.0, 171.44]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.73, 29.72, 99.99, 98.99, 0.0, 73.21, 0.0, 100.0, 100.0, 99.9, 100.0, 0.0, 100.0, 100.0, 99.92, 99.76, 100.0, 100.0, 0.0], "audiomae_on_audioset": [[["music", 31.81], ["mains hum", 17.76], ["hum", 16.56]], [["groan", 14.13], ["animal", 12.27], ["speech", 11.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [18.82, 3.93, 10.43, 4.9, 0.45, 2.36, 1.6, 3.04, 2.06, 20.98, 2.14, 1.71, 2.52, 5.01, 7.16, 4.79, 2.52, 3.38, 1.44]} \ No newline at end of file diff --git a/annotations_1/ZQ0JJpvMq-g_filtered.json b/annotations_1/ZQ0JJpvMq-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..daeb1021d529eccab9c227bd6dd6d329b540416f --- /dev/null +++ b/annotations_1/ZQ0JJpvMq-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.53], [6.0, 20.76], [40.0, 42.62], [44.0, 46.57], [49.0, 49.0], [55.0, 56.3], [57.0, 63.95], [68.0, 68.47], [69.0, 71.1], [88.0, 88.6], [92.0, 91.98], [97.0, 96.92], [107.0, 109.17], [113.0, 112.92], [113.0, 114.76], [149.0, 150.94], [151.0, 152.17], [152.0, 152.95]], "keep_status": [true, true, true, true, false, false, true, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [45.75, 35.83, 44.99, 42.26, 0.0, 0.0, 37.71, 0.0, 34.08, 0.0, 0.0, 0.0, 32.06, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["didgeridoo", 21.05], ["speech", 19.02], ["hum", 9.87]], [["music", 29.94], ["vehicle", 19.69], ["car", 8.27]], [["music", 46.44], ["speech", 10.93], ["vehicle", 3.24]], [["ice cream truck, ice cream van", 27.88], ["speech", 24.09], ["music", 17.83]], null, null, [["speech", 28.48], ["reversing beeps", 25.81], ["cattle, bovinae", 11.53]], null, [["speech", 30.44], ["animal", 18.44], ["cattle, bovinae", 5.44]], null, null, null, [["speech", 47.17], ["outside, urban or manmade", 8.38], ["crowd", 6.64]], null, null, null, null, null], "duration": [3.53, 14.76, 2.62, 2.57, 0.0, 1.3, 6.95, 0.47, 2.1, 0.6, -0.02, -0.08, 2.17, -0.08, 1.76, 1.94, 1.17, 0.95]} \ No newline at end of file diff --git a/annotations_1/ZQHhiZUNM3Q_filtered.json b/annotations_1/ZQHhiZUNM3Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a76711b19e6fcc1a5174e64616094ebf27a6a4ba --- /dev/null +++ b/annotations_1/ZQHhiZUNM3Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [4.0, 9.48], [10.0, 10.62], [11.0, 10.74], [13.0, 13.42], [19.0, 19.75], [20.0, 24.97], [35.0, 34.96], [37.0, 37.37], [40.0, 39.92], [41.0, 48.02], [53.0, 55.39], [61.0, 62.36], [63.0, 63.02], [64.0, 64.05], [68.0, 67.98], [72.0, 75.07], [75.0, 77.3], [80.0, 80.69], [81.0, 82.92], [89.0, 90.26], [91.0, 96.94], [98.0, 99.49], [102.0, 105.04], [106.0, 107.32], [108.0, 109.31], [110.0, 113.44], [115.0, 116.31], [118.0, 120.58], [122.0, 125.88], [129.0, 131.99], [133.0, 165.01], [167.0, 166.8], [170.0, 175.8], [180.0, 188.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 70.86, 0.0, 0.0, 0.0, 0.0, 52.86, 0.0, 0.0, 0.0, 60.42, 94.07, 0.0, 0.0, 0.0, 0.0, 99.88, 96.89, 0.0, 0.0, 0.0, 99.59, 0.0, 99.44, 0.0, 0.0, 93.29, 0.0, 90.78, 57.25, 53.34, 0.0, 0.0, 95.09, 75.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 5.48, 0.62, -0.26, 0.42, 0.75, 4.97, -0.04, 0.37, -0.08, 7.02, 2.39, 1.36, 0.02, 0.05, -0.02, 3.07, 2.3, 0.69, 1.92, 1.26, 5.94, 1.49, 3.04, 1.32, 1.31, 3.44, 1.31, 2.58, 3.88, 2.99, 32.01, -0.2, 5.8, 8.77]} \ No newline at end of file diff --git a/annotations_1/ZSQBKh64SJA_filtered.json b/annotations_1/ZSQBKh64SJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30d58bdf042cd072a8e7928528010f500242b971 --- /dev/null +++ b/annotations_1/ZSQBKh64SJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 21.91], [26.0, 33.1], [39.0, 39.63], [42.0, 45.81], [46.0, 54.24], [55.0, 55.38], [56.0, 60.84], [61.0, 61.6], [62.0, 63.9], [66.0, 94.42], [95.0, 99.27]], "keep_status": [false, true, false, false, false, false, true, false, false, true, false], "silence_prob": [29.23, 29.8, 0.0, 32.85, 30.42, 0.0, 35.59, 0.0, 0.0, 29.56, 29.29], "audiomae_on_audioset": [[["cattle, bovinae", 53.86], ["livestock, farm animals, working animals", 25.28], ["moo", 14.42]], [["speech", 43.14], ["buzz", 17.81], ["music", 5.9]], null, [["music", 81.99], ["musical instrument", 2.09], ["synthesizer", 2.08]], [["speech", 65.67], ["music", 6.98], ["mains hum", 6.36]], null, [["music", 40.66], ["hum", 15.88], ["speech", 7.66]], null, null, [["music", 35.8], ["hum", 21.87], ["speech", 11.06]], [["speech", 45.01], ["music", 30.54], ["explosion", 6.06]]], "duration": [19.91, 7.1, 0.63, 3.81, 8.24, 0.38, 4.84, 0.6, 1.9, 28.42, 4.27]} \ No newline at end of file diff --git a/annotations_1/ZT0-DtdC93w_filtered.json b/annotations_1/ZT0-DtdC93w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92008b93144e6537744ba29d940d8cbb1b4ff405 --- /dev/null +++ b/annotations_1/ZT0-DtdC93w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.21], [1.0, 1.51], [4.0, 10.62], [11.0, 20.8], [21.0, 21.24], [23.0, 24.76], [26.0, 27.84], [29.0, 29.69], [30.0, 31.16], [32.0, 33.93], [39.0, 39.5], [49.0, 49.18], [50.0, 51.27], [53.0, 57.18], [58.0, 58.85], [59.0, 63.73], [64.0, 67.68], [69.0, 72.22], [75.0, 77.21], [78.0, 81.77], [88.0, 88.48], [96.0, 96.94], [102.0, 107.13], [108.0, 109.31], [111.0, 112.45], [113.0, 114.47], [115.0, 118.25], [121.0, 121.93], [125.0, 125.46], [126.0, 127.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 36.72, 36.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 90.78, 93.91, 56.86, 99.44, 77.53, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 45.85, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 63.69], ["didgeridoo", 12.94], ["speech", 9.3]], [["speech", 36.8], ["music", 33.91], ["fly, housefly", 3.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.07], ["didgeridoo", 30.34], ["musical instrument", 6.53]], null, null, null], "duration": [0.21, 0.51, 6.62, 9.8, 0.24, 1.76, 1.84, 0.69, 1.16, 1.93, 0.5, 0.18, 1.27, 4.18, 0.85, 4.73, 3.68, 3.22, 2.21, 3.77, 0.48, 0.94, 5.13, 1.31, 1.45, 1.47, 3.25, 0.93, 0.46, 1.3]} \ No newline at end of file diff --git a/annotations_1/ZTsUO_9AT20_filtered.json b/annotations_1/ZTsUO_9AT20_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dce4491754cd48f498cdceff2a8c0241046f3166 --- /dev/null +++ b/annotations_1/ZTsUO_9AT20_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 21.81], [23.0, 61.79], [63.0, 71.17], [72.0, 84.25], [85.0, 106.15]], "keep_status": [false, false, true, false, true], "silence_prob": [34.63, 0.0, 35.02, 31.16, 30.39], "audiomae_on_audioset": [[["hum", 36.31], ["mains hum", 23.18], ["music", 15.05]], null, [["speech", 26.08], ["hum", 17.91], ["mains hum", 13.91]], [["music", 76.24], ["echo", 4.65], ["trombone", 1.77]], [["hum", 21.05], ["noise", 15.09], ["mains hum", 14.84]]], "duration": [21.81, 38.79, 8.17, 12.25, 21.15]} \ No newline at end of file diff --git a/annotations_1/ZUchY9Hw48A_filtered.json b/annotations_1/ZUchY9Hw48A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c57b4ee81924cda2f9edfe973bafe51eebf2051b --- /dev/null +++ b/annotations_1/ZUchY9Hw48A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 166.4], [170.0, 169.91]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [156.4, -0.09]} \ No newline at end of file diff --git a/annotations_1/ZUmTlIUmbmE_filtered.json b/annotations_1/ZUmTlIUmbmE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbe63de27847eadb7acb637cd98428064d7d79c1 --- /dev/null +++ b/annotations_1/ZUmTlIUmbmE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.06], [13.0, 19.3], [20.0, 21.9], [23.0, 59.39], [64.0, 65.03], [68.0, 68.49], [70.0, 70.26], [71.0, 87.05], [88.0, 101.9], [104.0, 106.73], [114.0, 114.49], [115.0, 116.55], [120.0, 121.9], [126.0, 141.81], [143.0, 172.67], [173.0, 172.72], [173.0, 172.94]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 72.9, 0.0, 0.0, 0.0, 0.0, 0.0, 39.55, 38.12, 54.23, 0.0, 0.0, 0.0, 34.32, 33.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["electric shaver, electric razor", 63.64], ["speech", 13.61], ["noise", 4.02]], [["hum", 28.25], ["buzz", 9.99], ["mains hum", 7.46]], null, null, null, null, [["music", 29.18], ["noise", 20.92], ["effects unit", 6.59]], [["whack, thwack", 26.62], ["speech", 17.36], ["thunk", 16.05]], null, null], "duration": [1.06, 6.3, 1.9, 36.39, 1.03, 0.49, 0.26, 16.05, 13.9, 2.73, 0.49, 1.55, 1.9, 15.81, 29.67, -0.28, -0.06]} \ No newline at end of file diff --git a/annotations_1/ZVlfttyv5js_filtered.json b/annotations_1/ZVlfttyv5js_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4691308c312bca7c0f4335aab47cf2e5e80a38c1 --- /dev/null +++ b/annotations_1/ZVlfttyv5js_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.21], [10.0, 32.21], [33.0, 45.99], [50.0, 62.28], [63.0, 64.69], [72.0, 80.6], [84.0, 134.35]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [0.0, 45.75, 44.26, 44.43, 0.0, 44.15, 0.0], "audiomae_on_audioset": [null, [["music", 36.64], ["hum", 16.93], ["throbbing", 15.85]], [["music", 51.36], ["theremin", 17.05], ["electronic music", 4.47]], [["music", 59.62], ["synthesizer", 5.92], ["throbbing", 5.2]], null, [["music", 68.14], ["speech", 5.29], ["hum", 2.83]], null], "duration": [0.21, 22.21, 12.99, 12.28, 1.69, 8.6, 50.35]} \ No newline at end of file diff --git a/annotations_1/ZW-xfRn8vFY_filtered.json b/annotations_1/ZW-xfRn8vFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc81350e92f6178f699ac9beba6bdf438fc8f4be --- /dev/null +++ b/annotations_1/ZW-xfRn8vFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.42], [4.0, 5.97], [7.0, 8.31], [10.0, 11.82], [13.0, 16.24], [18.0, 19.06], [23.0, 26.27], [27.0, 29.51], [30.0, 29.91], [31.0, 32.19], [35.0, 36.53], [37.0, 39.99], [41.0, 90.9], [93.0, 118.62], [120.0, 120.09], [122.0, 141.2], [142.0, 158.46], [161.0, 161.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [71.72, 0.0, 0.0, 0.0, 90.43, 0.0, 84.62, 79.07, 0.0, 0.0, 0.0, 73.06, 0.0, 33.24, 0.0, 42.13, 35.7, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.5], ["hum", 23.87], ["throbbing", 5.34]], null, [["music", 48.7], ["whale vocalization", 10.69], ["musical instrument", 7.31]], [["speech", 79.28], ["hum", 4.47], ["music", 2.93]], null], "duration": [2.42, 1.97, 1.31, 1.82, 3.24, 1.06, 3.27, 2.51, -0.09, 1.19, 1.53, 2.99, 49.9, 25.62, 0.09, 19.2, 16.46, 0.27]} \ No newline at end of file diff --git a/annotations_1/ZWe2pwIiWsk_filtered.json b/annotations_1/ZWe2pwIiWsk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c02f9ca0406cd94667792fcf10d54afe4e3cfd94 --- /dev/null +++ b/annotations_1/ZWe2pwIiWsk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.25], [12.0, 38.31], [41.0, 42.08], [44.0, 46.94], [49.0, 55.21], [58.0, 66.6], [67.0, 70.36], [71.0, 71.85], [73.0, 74.49], [76.0, 76.71], [78.0, 79.69], [91.0, 92.25], [93.0, 94.1], [98.0, 99.01], [103.0, 103.22], [104.0, 105.09], [106.0, 107.97], [109.0, 112.45], [113.0, 125.04], [130.0, 134.92], [139.0, 146.16], [148.0, 166.06]], "keep_status": [false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true], "silence_prob": [54.63, 29.42, 0.0, 29.1, 31.22, 36.13, 31.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.06, 29.23, 34.59, 30.97, 28.42], "audiomae_on_audioset": [null, [["music", 61.27], ["theremin", 14.05], ["hum", 3.12]], null, [["speech", 14.55], ["whip", 8.06], ["vehicle", 5.99]], [["mains hum", 26.65], ["hum", 18.58], ["buzz", 18.25]], [["hum", 43.64], ["mains hum", 27.08], ["music", 5.43]], [["music", 36.03], ["buzzer", 9.43], ["fire alarm", 5.08]], null, null, null, null, null, null, null, null, null, null, [["music", 29.74], ["echo", 7.73], ["boing", 7.0]], [["speech", 39.93], ["vehicle", 17.64], ["car", 13.98]], [["music", 29.55], ["gong", 25.27], ["throbbing", 4.46]], [["music", 38.06], ["didgeridoo", 9.21], ["theremin", 4.11]], [["music", 25.63], ["vehicle", 14.85], ["foghorn", 9.94]]], "duration": [3.25, 26.31, 1.08, 2.94, 6.21, 8.6, 3.36, 0.85, 1.49, 0.71, 1.69, 1.25, 1.1, 1.01, 0.22, 1.09, 1.97, 3.45, 12.04, 4.92, 7.16, 18.06]} \ No newline at end of file diff --git a/annotations_1/ZWszIB0z50k_filtered.json b/annotations_1/ZWszIB0z50k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1efae3a30ea47b23c5483056dd051c89d34c2b24 --- /dev/null +++ b/annotations_1/ZWszIB0z50k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.73], [12.0, 14.08], [15.0, 15.7], [17.0, 17.76], [22.0, 23.67], [26.0, 27.55], [32.0, 32.02], [34.0, 34.33], [35.0, 36.19], [45.0, 47.48], [48.0, 53.62], [58.0, 59.09], [60.0, 64.03], [66.0, 68.93], [71.0, 75.14], [76.0, 75.96], [86.0, 89.83], [96.0, 96.08], [99.0, 99.47], [100.0, 100.87], [105.0, 105.36], [107.0, 107.28], [116.0, 118.96], [121.0, 121.09], [122.0, 123.2], [124.0, 126.57], [129.0, 130.67], [131.0, 133.19], [134.0, 135.9], [139.0, 156.34], [157.0, 159.46]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.16, 48.56, 0.0, 60.6, 85.35, 69.07, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 0.0, 0.0, 78.55, 0.0, 66.51, 0.0, 35.83, 31.57], "audiomae_on_audioset": [null, [["speech", 26.59], ["hum", 13.83], ["sidetone", 9.77]], null, null, null, null, null, null, null, null, [["speech", 27.61], ["fly, housefly", 19.39], ["insect", 7.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 73.42], ["throbbing", 9.22], ["hum", 6.09]], [["moo", 47.31], ["cattle, bovinae", 30.02], ["livestock, farm animals, working animals", 11.38]]], "duration": [1.73, 2.08, 0.7, 0.76, 1.67, 1.55, 0.02, 0.33, 1.19, 2.48, 5.62, 1.09, 4.03, 2.93, 4.14, -0.04, 3.83, 0.08, 0.47, 0.87, 0.36, 0.28, 2.96, 0.09, 1.2, 2.57, 1.67, 2.19, 1.9, 17.34, 2.46]} \ No newline at end of file diff --git a/annotations_1/ZXkKHnmKWoI_filtered.json b/annotations_1/ZXkKHnmKWoI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f46eaa64352905ed1adf90bc7d1111b3920d4d5b --- /dev/null +++ b/annotations_1/ZXkKHnmKWoI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.75], [19.0, 35.87], [40.0, 45.05], [49.0, 73.89], [75.0, 105.17], [108.0, 108.21], [113.0, 134.2]], "keep_status": [false, false, true, true, false, false, false], "silence_prob": [0.0, 56.1, 40.48, 36.12, 0.0, 0.0, 30.44], "audiomae_on_audioset": [null, null, [["music", 22.75], ["hum", 12.22], ["gong", 8.11]], [["music", 40.87], ["grunt", 8.1], ["whale vocalization", 7.02]], null, null, [["speech", 48.09], ["music", 30.86], ["theremin", 3.9]]], "duration": [1.75, 16.87, 5.05, 24.89, 30.17, 0.21, 21.2]} \ No newline at end of file diff --git a/annotations_1/ZXyLYqWUffA_filtered.json b/annotations_1/ZXyLYqWUffA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d67c7961de1940abf33f571160374a6e43573e58 --- /dev/null +++ b/annotations_1/ZXyLYqWUffA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.24], [14.0, 16.38], [25.0, 25.34], [32.0, 32.02], [33.0, 33.4], [35.0, 35.56], [44.0, 44.05], [47.0, 46.85], [47.0, 48.49], [66.0, 66.75], [71.0, 71.0], [71.0, 74.87], [78.0, 80.94], [84.0, 84.77], [99.0, 99.18], [100.0, 100.21], [101.0, 101.82], [107.0, 107.87], [109.0, 111.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.97, 36.54, 0.0, 0.0, 0.0, 0.0, 0.0, 95.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 26.9], ["music", 12.56], ["chirp tone", 6.73]], [["speech", 39.13], ["whack, thwack", 21.41], ["thunk", 17.45]], null, null, null, null, null, null], "duration": [1.24, 2.38, 0.34, 0.02, 0.4, 0.56, 0.05, -0.15, 1.49, 0.75, 0.0, 3.87, 2.94, 0.77, 0.18, 0.21, 0.82, 0.87, 2.75]} \ No newline at end of file diff --git a/annotations_1/Z_WhAyucr_E_filtered.json b/annotations_1/Z_WhAyucr_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0709be5e2f8a82943f75d3356fb3163c3142af90 --- /dev/null +++ b/annotations_1/Z_WhAyucr_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.87], [33.0, 36.21], [37.0, 39.73], [41.0, 44.32], [49.0, 49.77], [55.0, 55.34], [75.0, 74.68], [77.0, 83.71], [88.0, 89.6], [92.0, 94.47], [97.0, 97.19], [101.0, 102.52], [104.0, 103.99], [105.0, 105.21], [110.0, 115.3], [116.0, 118.47], [119.0, 120.9], [124.0, 126.72], [127.0, 128.75], [130.0, 131.77], [134.0, 135.72], [137.0, 138.0], [140.0, 141.03], [145.0, 145.72], [148.0, 148.81], [151.0, 156.44], [158.0, 159.6], [160.0, 161.15], [162.0, 162.68], [165.0, 165.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.87, 69.2, 42.51, 50.21, 0.0, 0.0, 0.0, 49.0, 0.0, 57.64, 0.0, 0.0, 0.0, 0.0, 90.6, 78.72, 0.0, 37.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.5, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 67.6], ["crowd", 12.74], ["applause", 6.78]], null, [["radio", 35.75], ["sidetone", 30.69], ["speech", 20.04]], null, null, null, null, [["speech", 67.85], ["hum", 13.97], ["throbbing", 3.91]], null, null, null, null, null, null, null, null, null, [["music", 36.75], ["speech", 11.0], ["singing bowl", 8.23]], null, null, null, null, null, null, null, [["speech", 46.36], ["music", 22.97], ["hum", 7.8]], null, null, null, null], "duration": [4.87, 3.21, 2.73, 3.32, 0.77, 0.34, -0.32, 6.71, 1.6, 2.47, 0.19, 1.52, -0.01, 0.21, 5.3, 2.47, 1.9, 2.72, 1.75, 1.77, 1.72, 1.0, 1.03, 0.72, 0.81, 5.44, 1.6, 1.15, 0.68, 0.43]} \ No newline at end of file diff --git a/annotations_1/Zauzaj2bpvM_filtered.json b/annotations_1/Zauzaj2bpvM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92967e63be7a97717a63ba072bd0b7a0fdbdcf83 --- /dev/null +++ b/annotations_1/Zauzaj2bpvM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.43], [32.0, 32.53], [37.0, 37.67], [42.0, 42.77], [43.0, 44.19], [45.0, 44.9], [46.0, 45.77], [46.0, 46.35], [46.0, 46.57], [48.0, 48.79], [50.0, 50.35], [50.0, 50.41], [50.0, 52.3], [54.0, 53.87], [54.0, 54.31], [55.0, 56.22], [57.0, 56.69], [64.0, 65.43], [66.0, 66.87], [73.0, 76.98], [97.0, 97.85], [98.0, 100.58], [102.0, 103.35], [106.0, 106.22], [107.0, 109.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.99, 0.0, 36.15, 0.0, 0.0, 75.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.03], ["musical instrument", 11.69], ["cello", 4.12]], null, null, null, null, null, null, [["music", 57.43], ["musical instrument", 12.48], ["bowed string instrument", 8.42]], null, [["speech", 73.02], ["tuning fork", 17.81], ["music", 1.25]], null, null, null], "duration": [0.43, 0.53, 0.67, 0.77, 1.19, -0.1, -0.23, 0.35, 0.57, 0.79, 0.35, 0.41, 2.3, -0.13, 0.31, 1.22, -0.31, 1.43, 0.87, 3.98, 0.85, 2.58, 1.35, 0.22, 2.24]} \ No newline at end of file diff --git a/annotations_1/ZawJ9EBOLVk_filtered.json b/annotations_1/ZawJ9EBOLVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..920869b09ff559f19dfa1b6f89c6eff722406c29 --- /dev/null +++ b/annotations_1/ZawJ9EBOLVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.62], [25.0, 25.69], [26.0, 47.87], [50.0, 61.45], [64.0, 77.21]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 29.94, 29.12, 31.97], "audiomae_on_audioset": [null, null, [["music", 26.32], ["speech", 17.68], ["whack, thwack", 15.73]], [["speech", 58.61], ["music", 12.58], ["animal", 6.91]], [["music", 67.31], ["speech", 10.36], ["didgeridoo", 6.65]]], "duration": [1.62, 0.69, 21.87, 11.45, 13.21]} \ No newline at end of file diff --git a/annotations_1/ZbL_db16k0w_filtered.json b/annotations_1/ZbL_db16k0w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30c3d772f0edcc4e346f84b97e4b87727f9df72d --- /dev/null +++ b/annotations_1/ZbL_db16k0w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 34.65], [35.0, 34.7], [35.0, 35.09], [35.0, 46.5], [47.0, 58.19], [60.0, 61.91], [62.0, 74.04], [74.0, 77.77], [79.0, 81.13], [82.0, 83.84]], "keep_status": [false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 48.82, 83.16, 0.0, 73.97, 38.98, 56.33, 0.0], "audiomae_on_audioset": [null, null, null, [["sidetone", 20.48], ["music", 14.57], ["speech", 8.63]], null, null, null, [["cattle, bovinae", 31.32], ["moo", 26.45], ["livestock, farm animals, working animals", 21.58]], null, null], "duration": [-0.35, -0.3, 0.09, 11.5, 11.19, 1.91, 12.04, 3.77, 2.13, 1.84]} \ No newline at end of file diff --git a/annotations_1/Zbi-MbMsnIM_filtered.json b/annotations_1/Zbi-MbMsnIM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a6b98bdf065bd5b6d796d44c0daf575fa85c7760 --- /dev/null +++ b/annotations_1/Zbi-MbMsnIM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 26.4], [28.0, 66.48], [70.0, 93.45], [99.0, 99.4], [104.0, 108.65], [112.0, 114.12], [118.0, 120.95], [123.0, 123.79], [125.0, 124.82], [129.0, 129.9], [139.0, 142.5], [144.0, 144.61], [146.0, 150.21]], "keep_status": [true, false, true, false, true, true, true, false, false, false, false, false, false], "silence_prob": [28.34, 0.0, 30.89, 0.0, 30.35, 28.32, 30.06, 0.0, 0.0, 0.0, 32.73, 0.0, 32.44], "audiomae_on_audioset": [[["music", 29.11], ["vehicle", 13.46], ["speech", 12.39]], null, [["speech", 24.72], ["hum", 11.05], ["rumble", 9.28]], null, [["whack, thwack", 25.01], ["music", 19.89], ["hum", 7.82]], [["vehicle", 33.54], ["car", 16.16], ["music", 8.25]], [["speech", 22.19], ["arrow", 19.53], ["explosion", 9.04]], null, null, null, [["speech", 33.52], ["rumble", 20.14], ["hum", 16.85]], null, [["rumble", 34.79], ["speech", 22.35], ["hum", 13.88]]], "duration": [16.4, 38.48, 23.45, 0.4, 4.65, 2.12, 2.95, 0.79, -0.18, 0.9, 3.5, 0.61, 4.21]} \ No newline at end of file diff --git a/annotations_1/Zbmc8C3GaC8_filtered.json b/annotations_1/Zbmc8C3GaC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b10c891349e533a91ff945e9ab8c06f115d251d --- /dev/null +++ b/annotations_1/Zbmc8C3GaC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.75], [7.0, 8.6], [9.0, 12.45], [23.0, 24.53], [25.0, 26.72], [28.0, 29.52], [34.0, 45.81], [47.0, 48.78], [52.0, 53.81], [55.0, 57.79], [58.0, 67.53], [69.0, 73.52], [76.0, 84.01], [88.0, 99.22], [100.0, 105.16], [106.0, 111.03], [114.0, 120.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [93.76, 0.0, 64.86, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 97.11, 81.71, 94.37, 98.27, 95.78, 46.36, 51.71, 97.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 59.32], ["heart sounds, heartbeat", 3.65], ["hum", 3.25]], null, null], "duration": [2.75, 1.6, 3.45, 1.53, 1.72, 1.52, 11.81, 1.78, 1.81, 2.79, 9.53, 4.52, 8.01, 11.22, 5.16, 5.03, 6.23]} \ No newline at end of file diff --git a/annotations_1/Zd27SaRdxiE_filtered.json b/annotations_1/Zd27SaRdxiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef13863de947e3b48a1caa555204882e18794d4e --- /dev/null +++ b/annotations_1/Zd27SaRdxiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.22], [17.0, 17.54], [20.0, 20.63], [22.0, 22.62], [25.0, 27.23], [28.0, 28.76], [32.0, 32.71], [37.0, 37.98], [41.0, 42.06], [44.0, 44.41], [45.0, 47.24], [49.0, 55.32], [56.0, 62.26], [63.0, 65.35], [67.0, 67.49], [69.0, 79.12], [81.0, 81.28], [83.0, 87.69], [92.0, 93.9], [95.0, 97.33], [98.0, 97.93], [100.0, 100.84], [102.0, 104.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.2, 0.0, 0.0, 0.0, 0.0, 0.0, 49.54, 92.15, 85.9, 55.53, 0.0, 59.15, 0.0, 51.6, 0.0, 47.46, 0.0, 0.0, 37.43], "audiomae_on_audioset": [null, null, null, null, [["music", 68.71], ["musical instrument", 7.96], ["speech", 3.96]], null, null, null, null, null, [["music", 39.57], ["speech", 18.27], ["mantra", 4.65]], null, null, null, null, null, null, null, null, [["foghorn", 36.16], ["music", 35.35], ["musical instrument", 4.87]], null, null, [["music", 37.13], ["speech", 7.95], ["hum", 7.39]]], "duration": [1.22, 0.54, 0.63, 0.62, 2.23, 0.76, 0.71, 0.98, 1.06, 0.41, 2.24, 6.32, 6.26, 2.35, 0.49, 10.12, 0.28, 4.69, 1.9, 2.33, -0.07, 0.84, 2.36]} \ No newline at end of file diff --git a/annotations_1/ZdhLQ1toP9s_filtered.json b/annotations_1/ZdhLQ1toP9s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5dbbd3c5a8994d6e0b97b14fab9af75e19060bb --- /dev/null +++ b/annotations_1/ZdhLQ1toP9s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.3], [12.0, 13.04], [14.0, 20.17], [21.0, 30.5], [32.0, 34.47], [39.0, 40.04], [42.0, 44.98], [45.0, 54.19], [57.0, 59.78], [62.0, 62.9], [64.0, 65.48], [71.0, 71.58], [72.0, 75.0], [76.0, 89.18], [92.0, 99.66], [101.0, 101.71], [103.0, 103.32], [106.0, 109.21], [110.0, 112.23], [114.0, 115.92], [118.0, 118.89], [120.0, 121.44], [127.0, 127.43], [129.0, 130.74], [131.0, 148.05], [149.0, 149.42], [150.0, 150.2], [151.0, 154.85], [155.0, 174.16]], "keep_status": [true, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [49.54, 0.0, 52.68, 45.82, 51.66, 0.0, 30.41, 50.66, 95.51, 0.0, 0.0, 0.0, 72.6, 31.38, 44.81, 0.0, 0.0, 34.19, 98.73, 0.0, 0.0, 0.0, 0.0, 0.0, 36.44, 0.0, 0.0, 50.06, 43.71], "audiomae_on_audioset": [[["speech", 51.42], ["sidetone", 13.12], ["music", 5.05]], null, null, [["speech", 29.57], ["music", 27.03], ["sonar", 10.85]], null, null, [["thunk", 22.36], ["speech", 16.71], ["music", 12.24]], null, null, null, null, null, null, [["music", 47.28], ["speech", 18.5], ["throbbing", 8.32]], [["music", 51.86], ["speech", 19.0], ["throbbing", 11.13]], null, null, [["music", 37.87], ["electronic music", 5.68], ["synthesizer", 4.08]], null, null, null, null, null, null, [["hum", 31.74], ["music", 27.63], ["mains hum", 9.32]], null, null, null, [["speech", 24.98], ["music", 20.3], ["coin (dropping)", 13.73]]], "duration": [2.3, 1.04, 6.17, 9.5, 2.47, 1.04, 2.98, 9.19, 2.78, 0.9, 1.48, 0.58, 3.0, 13.18, 7.66, 0.71, 0.32, 3.21, 2.23, 1.92, 0.89, 1.44, 0.43, 1.74, 17.05, 0.42, 0.2, 3.85, 19.16]} \ No newline at end of file diff --git a/annotations_1/ZdhqVdIsBSE_filtered.json b/annotations_1/ZdhqVdIsBSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae918c5c83541d33723710309578ca3d97cc5298 --- /dev/null +++ b/annotations_1/ZdhqVdIsBSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.5], [10.0, 16.83], [26.0, 33.08], [38.0, 41.2], [44.0, 58.5], [61.0, 61.92], [70.0, 75.22], [77.0, 76.92], [81.0, 101.04], [107.0, 107.49], [108.0, 111.81], [115.0, 116.72], [118.0, 129.39], [131.0, 136.11], [138.0, 140.71], [152.0, 152.56], [154.0, 155.7], [157.0, 162.28], [164.0, 166.53]], "keep_status": [false, true, true, true, false, false, false, false, false, false, true, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 30.0, 35.08, 39.41, 29.5, 0.0, 65.32, 0.0, 30.8, 0.0, 31.55, 0.0, 30.46, 33.72, 32.1, 0.0, 0.0, 30.69, 34.16], "audiomae_on_audioset": [null, [["music", 37.36], ["speech", 27.0], ["sidetone", 4.88]], [["mosquito", 21.6], ["fly, housefly", 18.86], ["mains hum", 17.93]], [["music", 24.84], ["chirp tone", 9.37], ["singing bowl", 6.99]], [["cacophony", 59.76], ["music", 22.46], ["buzz", 2.24]], null, null, null, [["music", 74.84], ["electronic music", 7.3], ["didgeridoo", 1.64]], null, [["music", 44.14], ["speech", 19.79], ["didgeridoo", 4.56]], null, [["hum", 32.84], ["mains hum", 21.85], ["music", 20.23]], [["music", 30.91], ["hum", 18.8], ["mains hum", 13.07]], [["music", 38.86], ["mains hum", 17.5], ["hum", 17.24]], null, null, [["speech", 32.54], ["mosquito", 18.37], ["fly, housefly", 10.51]], [["music", 49.86], ["electronic music", 6.5], ["theremin", 6.3]]], "duration": [1.5, 6.83, 7.08, 3.2, 14.5, 0.92, 5.22, -0.08, 20.04, 0.49, 3.81, 1.72, 11.39, 5.11, 2.71, 0.56, 1.7, 5.28, 2.53]} \ No newline at end of file diff --git a/annotations_1/Zdv1_Iimmgg_filtered.json b/annotations_1/Zdv1_Iimmgg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5292fe20ed2058e35126b0d6f48bd65525df9689 --- /dev/null +++ b/annotations_1/Zdv1_Iimmgg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 35.04], [36.0, 39.41], [40.0, 50.99], [53.0, 53.59], [55.0, 57.5], [58.0, 59.7], [61.0, 82.86], [85.0, 117.49], [118.0, 118.67], [121.0, 128.75]], "keep_status": [true, false, false, false, true, false, true, false, false, true], "silence_prob": [32.32, 72.75, 28.96, 0.0, 32.77, 0.0, 31.09, 0.0, 0.0, 30.99], "audiomae_on_audioset": [[["hum", 24.1], ["door", 9.86], ["mains hum", 8.54]], null, [["hum", 32.54], ["rumble", 25.35], ["mains hum", 20.88]], null, [["hum", 22.08], ["music", 16.24], ["buzz", 10.98]], null, [["hum", 31.24], ["mains hum", 24.42], ["music", 8.37]], null, null, [["hum", 14.11], ["music", 14.05], ["throbbing", 8.58]]], "duration": [5.04, 3.41, 10.99, 0.59, 2.5, 1.7, 21.86, 32.49, 0.67, 7.75]} \ No newline at end of file diff --git a/annotations_1/Zeg6dl4L60M_filtered.json b/annotations_1/Zeg6dl4L60M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01d9a584bcbd5a2fef764081fe77174b0d97ded0 --- /dev/null +++ b/annotations_1/Zeg6dl4L60M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.57], [10.0, 25.1], [25.0, 29.62], [30.0, 44.24], [46.0, 45.84], [46.0, 58.95], [61.0, 87.29], [88.0, 104.92], [105.0, 109.27], [110.0, 111.62], [112.0, 120.24], [121.0, 147.58], [148.0, 149.1], [151.0, 152.68], [155.0, 156.17]], "keep_status": [false, true, true, true, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [29.35, 30.1, 28.95, 29.05, 0.0, 28.63, 34.86, 29.75, 32.76, 0.0, 29.63, 28.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 25.52], ["music", 24.76], ["throbbing", 20.68]], [["music", 26.6], ["speech", 25.27], ["hum", 5.48]], [["speech", 31.9], ["whack, thwack", 16.95], ["music", 7.51]], [["speech", 35.83], ["whack, thwack", 17.71], ["music", 7.67]], null, [["music", 32.9], ["hum", 14.67], ["speech", 8.52]], [["hum", 55.64], ["mains hum", 15.41], ["music", 12.72]], [["music", 38.32], ["didgeridoo", 15.47], ["hum", 6.44]], [["livestock, farm animals, working animals", 53.3], ["cattle, bovinae", 18.62], ["moo", 12.69]], null, [["speech", 51.24], ["music", 30.53], ["didgeridoo", 3.24]], [["music", 37.02], ["speech", 36.02], ["burst, pop", 4.67]], null, null, null], "duration": [5.57, 15.1, 4.62, 14.24, -0.16, 12.95, 26.29, 16.92, 4.27, 1.62, 8.24, 26.58, 1.1, 1.68, 1.17]} \ No newline at end of file diff --git a/annotations_1/ZekXmBuhS5c_filtered.json b/annotations_1/ZekXmBuhS5c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a9eca0e22baeb37ad3259c80ecbe80b9f1dc6ac --- /dev/null +++ b/annotations_1/ZekXmBuhS5c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.1], [13.0, 18.39], [26.0, 26.77], [28.0, 31.48], [32.0, 40.44], [43.0, 43.68], [50.0, 51.76], [72.0, 73.33], [74.0, 77.23], [80.0, 81.77], [84.0, 88.38], [90.0, 91.39], [99.0, 120.33], [122.0, 122.66]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 28.61, 0.0, 61.47, 29.08, 0.0, 0.0, 0.0, 42.91, 0.0, 51.94, 0.0, 29.09, 0.0], "audiomae_on_audioset": [null, [["vehicle", 18.76], ["whale vocalization", 8.52], ["clatter", 6.21]], null, null, [["speech", 30.8], ["music", 17.55], ["crowd", 6.61]], null, null, null, [["hum", 28.53], ["music", 27.95], ["mains hum", 16.77]], null, null, null, [["music", 42.09], ["theremin", 9.86], ["crowd", 8.25]], null], "duration": [1.1, 5.39, 0.77, 3.48, 8.44, 0.68, 1.76, 1.33, 3.23, 1.77, 4.38, 1.39, 21.33, 0.66]} \ No newline at end of file diff --git a/annotations_1/ZfyjpKP8zDk_filtered.json b/annotations_1/ZfyjpKP8zDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02d4da068049d778382abeb749e72cab8ad7ff1e --- /dev/null +++ b/annotations_1/ZfyjpKP8zDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.53], [6.0, 16.46], [19.0, 19.48], [23.0, 22.89], [27.0, 27.48], [28.0, 29.47], [30.0, 31.43], [32.0, 32.91], [33.0, 34.72], [37.0, 37.39], [39.0, 39.68], [45.0, 47.19], [48.0, 49.03], [50.0, 52.39], [53.0, 54.19], [54.0, 54.99], [62.0, 64.12], [65.0, 66.21], [67.0, 68.5], [69.0, 70.38], [80.0, 80.13], [85.0, 85.85], [87.0, 88.05], [89.0, 90.58], [91.0, 91.56], [92.0, 93.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 0.0, 91.81, 0.0, 0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.53, 10.46, 0.48, -0.11, 0.48, 1.47, 1.43, 0.91, 1.72, 0.39, 0.68, 2.19, 1.03, 2.39, 1.19, 0.99, 2.12, 1.21, 1.5, 1.38, 0.13, 0.85, 1.05, 1.58, 0.56, 1.09]} \ No newline at end of file diff --git a/annotations_1/ZgAf9AuNc6Q_filtered.json b/annotations_1/ZgAf9AuNc6Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..162853f4d0629a159056254539aa95a552a287dd --- /dev/null +++ b/annotations_1/ZgAf9AuNc6Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.03], [21.0, 24.11], [35.0, 34.86], [56.0, 56.51], [57.0, 57.48], [87.0, 87.34], [89.0, 90.15], [94.0, 94.44], [103.0, 105.17], [130.0, 130.89], [133.0, 133.68], [135.0, 135.77], [137.0, 137.15], [139.0, 138.91], [144.0, 146.38], [148.0, 149.37], [155.0, 155.51], [160.0, 165.13], [168.0, 168.34], [170.0, 172.42], [180.0, 180.87]], "keep_status": [true, true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, true, false], "silence_prob": [28.73, 28.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.88, 0.0, 0.0, 0.0, 0.0, 0.0, 29.29, 0.0, 0.0, 36.25, 0.0, 29.5, 0.0], "audiomae_on_audioset": [[["vehicle", 18.63], ["speech", 11.51], ["race car, auto racing", 9.62]], [["speech", 33.14], ["music", 12.45], ["roar", 7.45]], null, null, null, null, null, null, [["speech", 21.28], ["music", 15.53], ["musical instrument", 6.85]], null, null, null, null, null, [["cattle, bovinae", 10.42], ["moo", 10.09], ["whale vocalization", 8.2]], null, null, [["music", 45.12], ["brass instrument", 5.15], ["throbbing", 4.42]], null, [["music", 48.51], ["hum", 5.98], ["cacophony", 5.33]], null], "duration": [2.03, 3.11, -0.14, 0.51, 0.48, 0.34, 1.15, 0.44, 2.17, 0.89, 0.68, 0.77, 0.15, -0.09, 2.38, 1.37, 0.51, 5.13, 0.34, 2.42, 0.87]} \ No newline at end of file diff --git a/annotations_1/ZgeAaV-OFvs_filtered.json b/annotations_1/ZgeAaV-OFvs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..682c04bdd7d6a4eac9ab0aac77d8771d85a42509 --- /dev/null +++ b/annotations_1/ZgeAaV-OFvs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.55], [14.0, 13.93], [15.0, 15.03], [16.0, 17.34], [23.0, 23.33], [26.0, 28.05], [30.0, 30.23], [30.0, 30.35], [30.0, 30.62], [35.0, 35.43], [44.0, 44.83], [48.0, 47.93], [51.0, 50.95], [53.0, 55.04], [59.0, 60.08], [66.0, 68.82], [72.0, 75.39], [82.0, 82.02], [82.0, 90.0], [94.0, 93.88], [95.0, 96.04], [96.0, 99.93], [101.0, 102.1], [114.0, 114.78], [116.0, 123.35], [139.0, 139.14]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false], "silence_prob": [39.44, 0.0, 0.0, 0.0, 0.0, 41.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.05, 0.0, 29.69, 31.8, 0.0, 29.07, 0.0, 0.0, 49.31, 0.0, 0.0, 30.1, 0.0], "audiomae_on_audioset": [[["music", 48.33], ["musical instrument", 5.79], ["guitar", 5.51]], null, null, null, null, [["music", 67.72], ["synthesizer", 7.55], ["musical instrument", 4.25]], null, null, null, null, null, null, null, [["theremin", 44.19], ["music", 31.48], ["didgeridoo", 9.1]], null, [["music", 14.59], ["vehicle", 11.65], ["car", 10.84]], [["music", 43.52], ["fly, housefly", 6.38], ["insect", 4.91]], null, [["music", 76.52], ["electronic music", 7.75], ["house music", 4.31]], null, null, [["music", 44.49], ["speech", 41.13], ["boing", 5.95]], null, null, [["music", 41.36], ["theremin", 10.89], ["synthesizer", 10.72]], null], "duration": [2.55, -0.07, 0.03, 1.34, 0.33, 2.05, 0.23, 0.35, 0.62, 0.43, 0.83, -0.07, -0.05, 2.04, 1.08, 2.82, 3.39, 0.02, 8.0, -0.12, 1.04, 3.93, 1.1, 0.78, 7.35, 0.14]} \ No newline at end of file diff --git a/annotations_1/ZhGme4W06Kk_filtered.json b/annotations_1/ZhGme4W06Kk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/ZhGme4W06Kk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/ZhqHIrO4ePo_filtered.json b/annotations_1/ZhqHIrO4ePo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef34a99bd455469fd16ef170f564a9b8aa852bd8 --- /dev/null +++ b/annotations_1/ZhqHIrO4ePo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 24.39], [31.0, 30.89], [32.0, 34.21], [48.0, 48.76], [53.0, 61.55], [66.0, 66.92], [68.0, 70.77], [74.0, 79.24], [82.0, 83.13], [85.0, 85.35], [88.0, 89.7], [97.0, 96.96], [99.0, 100.95], [102.0, 102.66], [110.0, 119.13], [122.0, 122.82], [125.0, 132.98], [133.0, 134.23], [136.0, 141.08]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [40.24, 0.0, 50.21, 0.0, 29.61, 0.0, 31.26, 31.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.69, 0.0, 30.48, 0.0, 38.02], "audiomae_on_audioset": [[["stomach rumble", 44.87], ["whale vocalization", 14.1], ["music", 8.85]], null, null, null, [["music", 24.9], ["speech", 24.29], ["aircraft", 5.27]], null, [["sidetone", 28.06], ["music", 21.04], ["hum", 14.36]], [["music", 52.66], ["speech", 18.5], ["sidetone", 6.74]], null, null, null, null, null, null, [["cattle, bovinae", 21.95], ["moo", 20.29], ["whale vocalization", 19.49]], null, [["speech", 68.2], ["breaking", 11.28], ["smash, crash", 5.21]], null, [["sidetone", 11.75], ["noise", 9.77], ["hum", 9.59]]], "duration": [3.39, -0.11, 2.21, 0.76, 8.55, 0.92, 2.77, 5.24, 1.13, 0.35, 1.7, -0.04, 1.95, 0.66, 9.13, 0.82, 7.98, 1.23, 5.08]} \ No newline at end of file diff --git a/annotations_1/ZjEnS3hA1B4_filtered.json b/annotations_1/ZjEnS3hA1B4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bf433d6ed5068bed7b34b9534ca0d86f44478c0 --- /dev/null +++ b/annotations_1/ZjEnS3hA1B4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[76.0, 76.45], [76.0, 80.94], [82.0, 113.05], [115.0, 118.08], [119.0, 130.59], [132.0, 134.77], [135.0, 138.1], [139.0, 141.64], [142.0, 143.92], [146.0, 148.63], [151.0, 153.27], [154.0, 161.15], [162.0, 163.0], [164.0, 166.06]], "keep_status": [false, false, false, false, true, false, false, true, false, false, true, true, false, false], "silence_prob": [0.0, 32.51, 0.0, 36.22, 28.86, 50.97, 50.11, 45.08, 0.0, 43.48, 45.82, 42.86, 0.0, 73.21], "audiomae_on_audioset": [null, [["speech", 58.57], ["vehicle", 14.88], ["aircraft", 4.01]], null, [["hum", 39.47], ["music", 25.48], ["mains hum", 16.26]], [["speech", 25.05], ["music", 18.4], ["whack, thwack", 7.58]], null, null, [["theremin", 33.06], ["music", 14.19], ["hum", 13.01]], null, [["music", 60.96], ["electronic music", 11.48], ["hum", 5.78]], [["music", 24.61], ["hum", 18.16], ["mains hum", 17.62]], [["music", 29.17], ["hum", 23.61], ["mains hum", 7.23]], null, null], "duration": [0.45, 4.94, 31.05, 3.08, 11.59, 2.77, 3.1, 2.64, 1.92, 2.63, 2.27, 7.15, 1.0, 2.06]} \ No newline at end of file diff --git a/annotations_1/ZjPPfwVPTDE_filtered.json b/annotations_1/ZjPPfwVPTDE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc7bd218200bc5245e9b178569d6f24cba209fb3 --- /dev/null +++ b/annotations_1/ZjPPfwVPTDE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.36], [25.0, 26.03], [28.0, 28.71], [29.0, 30.25], [31.0, 31.56], [34.0, 34.82], [36.0, 36.59], [37.0, 37.64], [40.0, 40.54], [44.0, 44.93], [46.0, 46.57], [51.0, 51.87], [52.0, 59.07], [61.0, 62.23], [63.0, 64.57], [65.0, 65.82], [68.0, 68.62], [70.0, 94.85], [96.0, 98.81], [104.0, 104.73], [106.0, 106.73], [110.0, 111.48], [113.0, 113.91], [119.0, 119.62], [121.0, 123.57], [126.0, 126.17], [135.0, 135.82], [136.0, 136.86], [138.0, 140.49], [142.0, 142.4], [143.0, 143.7], [146.0, 148.32], [149.0, 149.82], [150.0, 151.04], [151.0, 152.46], [154.0, 156.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 49.22, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 0.0, 92.8, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.28], ["effects unit", 11.68], ["guitar", 9.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.36, 1.03, 0.71, 1.25, 0.56, 0.82, 0.59, 0.64, 0.54, 0.93, 0.57, 0.87, 7.07, 1.23, 1.57, 0.82, 0.62, 24.85, 2.81, 0.73, 0.73, 1.48, 0.91, 0.62, 2.57, 0.17, 0.82, 0.86, 2.49, 0.4, 0.7, 2.32, 0.82, 1.04, 1.46, 2.74]} \ No newline at end of file diff --git a/annotations_1/Zle2EnAj0Ms_filtered.json b/annotations_1/Zle2EnAj0Ms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d627850c85f6cfcfa2339cc3afa6ca9d83534aa --- /dev/null +++ b/annotations_1/Zle2EnAj0Ms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [9.0, 28.59], [30.0, 30.33], [34.0, 34.69], [44.0, 46.11], [51.0, 51.6], [52.0, 53.13], [66.0, 66.31], [72.0, 73.45], [74.0, 74.93], [78.0, 78.14], [82.0, 81.94], [86.0, 87.02]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.44, 0.0, 0.0, 34.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["rumble", 28.74], ["vehicle", 19.43], ["aircraft", 8.02]], null, null, [["music", 38.25], ["speech", 16.46], ["boing", 7.77]], null, null, null, null, null, null, null, null], "duration": [0.45, 19.59, 0.33, 0.69, 2.11, 0.6, 1.13, 0.31, 1.45, 0.93, 0.14, -0.06, 1.02]} \ No newline at end of file diff --git a/annotations_1/Zlqovh9U5v0_filtered.json b/annotations_1/Zlqovh9U5v0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4730b0b8a2f7e74d99aada01273da28ba38274ef --- /dev/null +++ b/annotations_1/Zlqovh9U5v0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.85], [5.0, 14.07], [17.0, 18.15], [22.0, 23.04], [23.0, 24.09], [27.0, 27.13], [29.0, 29.2], [29.0, 29.44], [32.0, 34.23], [43.0, 43.66], [47.0, 48.02], [49.0, 50.72], [62.0, 62.61], [67.0, 67.26], [78.0, 81.01], [83.0, 82.97], [86.0, 87.42], [90.0, 95.12], [97.0, 97.63], [102.0, 102.66], [121.0, 121.44], [125.0, 124.65], [125.0, 125.15], [126.0, 125.61], [126.0, 126.89], [128.0, 129.14], [133.0, 137.27], [140.0, 143.34], [146.0, 147.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.63, 0.0, 0.0, 0.0, 0.0, 0.0, 78.89, 0.0, 0.0, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 84.62, 0.0], "audiomae_on_audioset": [null, [["speech", 44.13], ["music", 22.07], ["didgeridoo", 4.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.85, 9.07, 1.15, 1.04, 1.09, 0.13, 0.2, 0.44, 2.23, 0.66, 1.02, 1.72, 0.61, 0.26, 3.01, -0.03, 1.42, 5.12, 0.63, 0.66, 0.44, -0.35, 0.15, -0.39, 0.89, 1.14, 4.27, 3.34, 1.12]} \ No newline at end of file diff --git a/annotations_1/ZlzhOaHLFBM_filtered.json b/annotations_1/ZlzhOaHLFBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b725aebcd963bdf54423f4535a037672f7e71ee --- /dev/null +++ b/annotations_1/ZlzhOaHLFBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.78], [15.0, 27.28], [28.0, 37.76], [38.0, 64.42], [65.0, 91.69], [92.0, 107.87], [109.0, 113.88], [114.0, 116.55], [118.0, 122.25], [123.0, 125.54], [127.0, 128.73], [130.0, 131.26], [133.0, 150.92], [152.0, 153.69], [159.0, 159.95]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 72.16, 90.78, 38.38, 52.56, 51.23, 49.82, 56.7, 79.41, 84.43, 0.0, 0.0, 63.42, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 29.97], ["crushing", 8.58], ["arrow", 6.34]], null, null, [["music", 31.89], ["hum", 11.32], ["mains hum", 9.94]], null, null, null, null, null, null, null, null], "duration": [0.78, 12.28, 9.76, 26.42, 26.69, 15.87, 4.88, 2.55, 4.25, 2.54, 1.73, 1.26, 17.92, 1.69, 0.95]} \ No newline at end of file diff --git a/annotations_1/ZmKECCbMc88_filtered.json b/annotations_1/ZmKECCbMc88_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ca4becc9ca471edf666a31481884d8420a47f69 --- /dev/null +++ b/annotations_1/ZmKECCbMc88_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.07], [9.0, 10.69], [11.0, 11.96], [12.0, 26.76], [29.0, 30.1], [31.0, 31.9], [33.0, 33.51], [45.0, 45.74], [48.0, 48.36], [49.0, 51.88], [52.0, 52.69], [53.0, 53.47], [54.0, 54.65], [58.0, 58.56], [60.0, 61.11], [70.0, 70.46], [74.0, 76.47], [77.0, 77.87], [78.0, 80.91], [82.0, 82.43], [83.0, 84.06], [87.0, 93.21], [98.0, 99.82], [117.0, 117.73], [119.0, 131.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 72.31, 0.0, 0.0, 0.0, 0.0, 0.0, 56.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.72, 0.0, 42.26, 0.0, 0.0, 87.37, 0.0, 0.0, 33.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.23], ["sidetone", 35.59], ["dial tone", 5.79]], null, [["speech", 32.95], ["sidetone", 17.89], ["busy signal", 8.78]], null, null, null, null, null, [["speech", 42.47], ["cattle, bovinae", 14.06], ["moo", 11.63]]], "duration": [1.07, 1.69, 0.96, 14.76, 1.1, 0.9, 0.51, 0.74, 0.36, 2.88, 0.69, 0.47, 0.65, 0.56, 1.11, 0.46, 2.47, 0.87, 2.91, 0.43, 1.06, 6.21, 1.82, 0.73, 12.72]} \ No newline at end of file diff --git a/annotations_1/Zo0d4xk3BXw_filtered.json b/annotations_1/Zo0d4xk3BXw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd1c778537b370268d54de8d2a327fc8f4fe02d2 --- /dev/null +++ b/annotations_1/Zo0d4xk3BXw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.02], [5.0, 5.81], [7.0, 7.37], [8.0, 10.18], [11.0, 11.8], [13.0, 13.46], [16.0, 17.19], [18.0, 18.49], [25.0, 25.07], [34.0, 34.79], [40.0, 41.0], [42.0, 45.84], [59.0, 60.08], [61.0, 62.11], [76.0, 79.24], [86.0, 88.59], [92.0, 96.35], [105.0, 107.45], [109.0, 109.68], [111.0, 115.8], [118.0, 118.62], [122.0, 122.08], [124.0, 125.14], [126.0, 126.57], [128.0, 128.24], [129.0, 130.92], [135.0, 135.92], [136.0, 137.81], [139.0, 140.59], [144.0, 144.75], [153.0, 161.18], [174.0, 174.51], [180.0, 181.94], [185.0, 186.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.73, 0.0, 0.0, 32.05, 31.49, 31.42, 31.36, 0.0, 31.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.8, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 67.08], ["boing", 16.32], ["speech", 4.46]], null, null, [["music", 60.96], ["guitar", 5.04], ["musical instrument", 4.67]], [["music", 56.14], ["musical instrument", 2.92], ["singing", 2.56]], [["music", 67.53], ["quack", 3.68], ["reggae", 2.89]], [["music", 61.86], ["musical instrument", 2.03], ["video game music", 1.49]], null, [["boing", 35.94], ["music", 35.47], ["theremin", 2.32]], null, null, null, null, null, null, null, null, null, null, [["music", 73.74], ["didgeridoo", 5.41], ["electronic music", 2.77]], null, null, null], "duration": [0.02, 0.81, 0.37, 2.18, 0.8, 0.46, 1.19, 0.49, 0.07, 0.79, 1.0, 3.84, 1.08, 1.11, 3.24, 2.59, 4.35, 2.45, 0.68, 4.8, 0.62, 0.08, 1.14, 0.57, 0.24, 1.92, 0.92, 1.81, 1.59, 0.75, 8.18, 0.51, 1.94, 1.43]} \ No newline at end of file diff --git a/annotations_1/ZoL1epfoq-g_filtered.json b/annotations_1/ZoL1epfoq-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88503a424731bb3a9930f65cc2463974084dd8ac --- /dev/null +++ b/annotations_1/ZoL1epfoq-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.28], [16.0, 20.56], [22.0, 37.35], [43.0, 42.63], [49.0, 49.65], [53.0, 54.16], [56.0, 59.68], [62.0, 61.91], [64.0, 64.23], [69.0, 70.6], [72.0, 73.55], [87.0, 87.99], [91.0, 90.81], [93.0, 95.57], [100.0, 100.67], [129.0, 132.85], [133.0, 133.93]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [38.22, 32.67, 31.17, 0.0, 0.0, 0.0, 43.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.2, 0.0, 34.43, 0.0], "audiomae_on_audioset": [[["fart", 28.76], ["speech", 17.68], ["domestic animals, pets", 4.01]], [["music", 76.9], ["guitar", 2.55], ["fart", 2.44]], [["music", 67.65], ["synthesizer", 5.42], ["musical instrument", 3.42]], null, null, null, [["insect", 33.38], ["fly, housefly", 28.23], ["bee, wasp, etc.", 12.49]], null, null, null, null, null, null, [["music", 41.91], ["speech", 21.24], ["musical instrument", 6.65]], null, [["music", 35.38], ["speech", 16.58], ["musical instrument", 8.75]], null], "duration": [2.28, 4.56, 15.35, -0.37, 0.65, 1.16, 3.68, -0.09, 0.23, 1.6, 1.55, 0.99, -0.19, 2.57, 0.67, 3.85, 0.93]} \ No newline at end of file diff --git a/annotations_1/ZpmCdIS3TKc_filtered.json b/annotations_1/ZpmCdIS3TKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9662f04a22295357193831bd854798c88b0f9ea8 --- /dev/null +++ b/annotations_1/ZpmCdIS3TKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.53], [19.0, 20.17], [23.0, 22.71], [25.0, 26.87], [29.0, 36.46], [38.0, 38.6], [40.0, 40.02], [41.0, 43.28], [45.0, 45.44], [47.0, 48.17], [50.0, 50.46], [52.0, 52.79], [56.0, 57.11], [58.0, 59.16], [61.0, 63.07], [64.0, 68.47], [71.0, 71.32], [72.0, 73.09], [75.0, 75.2], [77.0, 78.39], [79.0, 79.35], [83.0, 97.92], [99.0, 100.99], [104.0, 104.45], [106.0, 122.32], [123.0, 126.05], [129.0, 130.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 54.3, 0.0, 0.0, 63.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 54.97, 0.0, 0.0, 0.0, 0.0, 0.0, 58.98, 0.0, 0.0, 68.54, 50.02, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 1.17, -0.29, 1.87, 7.46, 0.6, 0.02, 2.28, 0.44, 1.17, 0.46, 0.79, 1.11, 1.16, 2.07, 4.47, 0.32, 1.09, 0.2, 1.39, 0.35, 14.92, 1.99, 0.45, 16.32, 3.05, 1.74]} \ No newline at end of file diff --git a/annotations_1/ZrDL3HQCwE8_filtered.json b/annotations_1/ZrDL3HQCwE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5df0486cf9bc7d4c3399a737f44fede034977539 --- /dev/null +++ b/annotations_1/ZrDL3HQCwE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [3.0, 5.66], [10.0, 10.74], [11.0, 21.66], [23.0, 24.34], [26.0, 27.67], [29.0, 28.97], [29.0, 35.02], [40.0, 42.53], [45.0, 45.66], [46.0, 55.12], [57.0, 57.64], [58.0, 58.9], [59.0, 59.95], [60.0, 61.96], [62.0, 63.12], [66.0, 66.16], [68.0, 68.39], [69.0, 69.63], [70.0, 80.86], [81.0, 81.09], [81.0, 81.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.67, 0.0, 52.16, 0.0, 0.0, 0.0, 51.07, 46.61, 0.0, 40.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.5, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 67.5], ["inside, small room", 4.71], ["music", 4.11]], null, [["hum", 20.61], ["mains hum", 16.51], ["music", 8.93]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.35, 2.66, 0.74, 10.66, 1.34, 1.67, -0.03, 6.02, 2.53, 0.66, 9.12, 0.64, 0.9, 0.95, 1.96, 1.12, 0.16, 0.39, 0.63, 10.86, 0.09, 0.24]} \ No newline at end of file diff --git a/annotations_1/ZrPvUd7E9HU_filtered.json b/annotations_1/ZrPvUd7E9HU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b096ced0b5f9658f992961c15ba2af668b9a682a --- /dev/null +++ b/annotations_1/ZrPvUd7E9HU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.08], [16.0, 15.94], [22.0, 22.81], [23.0, 23.8], [25.0, 27.57], [30.0, 32.21], [33.0, 35.02], [36.0, 37.83], [43.0, 43.65], [45.0, 44.83], [46.0, 46.68], [48.0, 48.95], [50.0, 51.49], [52.0, 53.33], [57.0, 58.53], [60.0, 62.45], [69.0, 69.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.68, 0.0, 0.0, 0.0, 93.45, 99.59, 92.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.08, -0.06, 0.81, 0.8, 2.57, 2.21, 2.02, 1.83, 0.65, -0.17, 0.68, 0.95, 1.49, 1.33, 1.53, 2.45, 0.48]} \ No newline at end of file diff --git a/annotations_1/ZreZzV7y18Y_filtered.json b/annotations_1/ZreZzV7y18Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c74b82f5c0df8f2168cbfc408888be3ae473aad --- /dev/null +++ b/annotations_1/ZreZzV7y18Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.96], [8.0, 9.27], [11.0, 11.72], [12.0, 13.31], [15.0, 15.21], [20.0, 20.9], [26.0, 31.82], [35.0, 40.05], [43.0, 43.46], [49.0, 53.01], [68.0, 68.37], [71.0, 73.48], [78.0, 79.17], [80.0, 83.12], [84.0, 86.51], [88.0, 91.02], [93.0, 111.57], [112.0, 126.39], [129.0, 129.56], [132.0, 132.71], [135.0, 135.72], [137.0, 137.89], [139.0, 139.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.5, 31.05, 0.0, 51.12, 0.0, 39.49, 0.0, 100.0, 100.0, 100.0, 68.93, 38.59, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 77.87], ["carnatic music", 6.05], ["singing", 2.69]], [["music", 67.91], ["carnatic music", 13.14], ["clarinet", 4.24]], null, null, null, [["speech", 49.41], ["music", 19.59], ["hum", 6.17]], null, null, null, null, null, [["speech", 72.08], ["whale vocalization", 8.44], ["sidetone", 6.47]], null, null, null, null, null], "duration": [-0.04, 1.27, 0.72, 1.31, 0.21, 0.9, 5.82, 5.05, 0.46, 4.01, 0.37, 2.48, 1.17, 3.12, 2.51, 3.02, 18.57, 14.39, 0.56, 0.71, 0.72, 0.89, 0.33]} \ No newline at end of file diff --git a/annotations_1/ZsDOHhqqLCQ_filtered.json b/annotations_1/ZsDOHhqqLCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5285f2facb27d4a049443b59ee9ad1b27b7fad5d --- /dev/null +++ b/annotations_1/ZsDOHhqqLCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.3], [4.0, 6.29], [7.0, 15.35], [16.0, 16.78], [18.0, 33.59], [35.0, 40.83], [42.0, 51.41], [55.0, 58.46], [61.0, 62.51], [64.0, 72.6], [74.0, 76.84], [82.0, 85.09], [92.0, 99.25], [100.0, 117.36], [117.0, 117.49], [118.0, 122.3], [124.0, 127.13], [129.0, 133.73], [138.0, 138.38], [143.0, 146.26], [147.0, 147.66], [148.0, 158.52]], "keep_status": [false, true, false, false, false, true, true, false, false, false, false, true, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 41.62, 40.38, 0.0, 43.79, 39.0, 31.85, 36.02, 0.0, 60.79, 68.41, 41.91, 46.5, 41.22, 0.0, 52.05, 54.23, 50.56, 0.0, 48.82, 0.0, 45.52], "audiomae_on_audioset": [null, [["music", 53.56], ["ambient music", 4.63], ["electronic music", 4.06]], [["speech", 34.49], ["music", 34.34], ["hum", 5.87]], null, [["music", 68.86], ["speech", 9.08], ["hum", 6.26]], [["music", 42.78], ["hum", 12.47], ["sonar", 8.27]], [["speech", 44.56], ["music", 9.12], ["hum", 7.84]], [["music", 56.54], ["didgeridoo", 10.13], ["throbbing", 3.56]], null, null, null, [["music", 47.39], ["rumble", 9.51], ["hum", 6.54]], [["hum", 34.25], ["music", 29.63], ["electronic music", 7.9]], [["breaking", 25.32], ["music", 17.02], ["coin (dropping)", 15.42]], null, null, null, null, null, [["music", 46.7], ["gong", 7.9], ["electronic music", 6.31]], null, [["music", 38.83], ["speech", 26.17], ["hum", 7.18]]], "duration": [0.3, 2.29, 8.35, 0.78, 15.59, 5.83, 9.41, 3.46, 1.51, 8.6, 2.84, 3.09, 7.25, 17.36, 0.49, 4.3, 3.13, 4.73, 0.38, 3.26, 0.66, 10.52]} \ No newline at end of file diff --git a/annotations_1/ZsqkTaYITKQ_filtered.json b/annotations_1/ZsqkTaYITKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c06e63fff3e57b028b03999c7abb81c46754252d --- /dev/null +++ b/annotations_1/ZsqkTaYITKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.65], [1.0, 0.94], [2.0, 2.39], [3.0, 3.57], [5.0, 6.84], [17.0, 18.6], [19.0, 20.83], [24.0, 25.66], [26.0, 28.58], [29.0, 30.47], [32.0, 34.92], [38.0, 38.31], [42.0, 42.63], [52.0, 55.11], [56.0, 58.51], [60.0, 63.04], [65.0, 65.82], [68.0, 70.04], [70.0, 74.65], [79.0, 81.21], [82.0, 83.29], [85.0, 85.53], [90.0, 90.44], [92.0, 92.67], [98.0, 99.69], [101.0, 102.0], [106.0, 108.43], [113.0, 122.3], [128.0, 129.91], [135.0, 136.34], [139.0, 140.98], [143.0, 145.32], [146.0, 148.66], [150.0, 151.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 99.99, 0.0, 99.91, 99.84, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 97.43, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.35, -0.06, 0.39, 0.57, 1.84, 1.6, 1.83, 1.66, 2.58, 1.47, 2.92, 0.31, 0.63, 3.11, 2.51, 3.04, 0.82, 2.04, 4.65, 2.21, 1.29, 0.53, 0.44, 0.67, 1.69, 1.0, 2.43, 9.3, 1.91, 1.34, 1.98, 2.32, 2.66, 1.29]} \ No newline at end of file diff --git a/annotations_1/ZtHl67Oeb5I_filtered.json b/annotations_1/ZtHl67Oeb5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c00d5171e8076a35f95979434b095c1990e77b6b --- /dev/null +++ b/annotations_1/ZtHl67Oeb5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 35.75], [37.0, 37.47], [46.0, 46.3], [56.0, 56.79], [58.0, 59.07], [61.0, 61.45], [65.0, 64.86], [71.0, 71.78], [78.0, 78.87], [96.0, 97.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 0.47, 0.3, 0.79, 1.07, 0.45, -0.14, 0.78, 0.87, 1.21]} \ No newline at end of file diff --git a/annotations_1/Zti44ptZTrc_filtered.json b/annotations_1/Zti44ptZTrc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..528ff3795fe59c4dbfc1bf1d72a528007680ca30 --- /dev/null +++ b/annotations_1/Zti44ptZTrc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.92], [6.0, 7.28], [8.0, 9.85], [11.0, 12.45], [13.0, 14.98], [19.0, 21.61], [23.0, 28.24], [31.0, 31.67], [32.0, 34.6], [36.0, 37.96], [44.0, 46.6], [48.0, 52.91], [56.0, 56.57], [59.0, 61.18], [62.0, 63.39], [65.0, 68.66], [72.0, 71.66], [74.0, 75.12], [80.0, 82.59], [87.0, 88.74], [97.0, 100.4], [105.0, 105.41], [108.0, 110.2], [111.0, 112.85], [115.0, 124.28], [126.0, 138.97], [145.0, 147.58], [149.0, 150.48], [156.0, 157.89], [160.0, 161.96], [163.0, 164.34], [166.0, 172.23], [173.0, 176.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.64, 0.0, 0.0, 0.0, 0.0, 91.81, 92.15, 0.0, 83.16, 0.0, 97.64, 92.48, 0.0, 69.47, 0.0, 96.42, 0.0, 0.0, 94.52, 0.0, 94.81, 0.0, 94.52, 0.0, 76.86, 54.5, 96.77, 0.0, 0.0, 0.0, 0.0, 73.82, 79.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.92, 1.28, 1.85, 1.45, 1.98, 2.61, 5.24, 0.67, 2.6, 1.96, 2.6, 4.91, 0.57, 2.18, 1.39, 3.66, -0.34, 1.12, 2.59, 1.74, 3.4, 0.41, 2.2, 1.85, 9.28, 12.97, 2.58, 1.48, 1.89, 1.96, 1.34, 6.23, 3.44]} \ No newline at end of file diff --git a/annotations_1/Zufljc_8uLk_filtered.json b/annotations_1/Zufljc_8uLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/Zufljc_8uLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/Zw7lsVV14Yo_filtered.json b/annotations_1/Zw7lsVV14Yo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8f304152c9d6d50475bd9fd77063dee1d3b57f3 --- /dev/null +++ b/annotations_1/Zw7lsVV14Yo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[79.0, 84.43]], "keep_status": [true], "silence_prob": [31.04], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 20.3], ["cattle, bovinae", 16.74], ["moo", 12.94]]], "duration": [5.43]} \ No newline at end of file diff --git a/annotations_1/Zxlo0xmD51Y_filtered.json b/annotations_1/Zxlo0xmD51Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd3654ecdc719588d9f7cb8b0278ba01e42b3270 --- /dev/null +++ b/annotations_1/Zxlo0xmD51Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.01], [15.0, 15.57], [17.0, 24.38], [26.0, 27.28], [29.0, 47.26], [49.0, 51.39], [52.0, 53.45], [55.0, 55.07], [57.0, 64.18], [67.0, 68.89], [74.0, 75.36], [76.0, 77.3], [79.0, 82.07], [82.0, 85.09], [91.0, 96.35], [98.0, 97.8], [98.0, 101.26]], "keep_status": [false, false, false, false, true, true, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [52.16, 0.0, 32.04, 0.0, 29.86, 30.93, 0.0, 0.0, 29.71, 0.0, 0.0, 0.0, 67.25, 46.79, 41.5, 0.0, 42.86], "audiomae_on_audioset": [null, null, [["hum", 49.78], ["throbbing", 19.36], ["mains hum", 6.56]], null, [["speech", 30.98], ["hum", 19.54], ["throbbing", 17.74]], [["mains hum", 29.7], ["hum", 29.32], ["throbbing", 10.98]], null, null, [["throbbing", 28.96], ["hum", 22.17], ["music", 15.84]], null, null, null, null, [["music", 20.47], ["hum", 11.93], ["speech", 11.15]], [["music", 39.85], ["speech", 28.39], ["fly, housefly", 4.84]], null, [["fly, housefly", 52.96], ["insect", 10.58], ["bee, wasp, etc.", 7.63]]], "duration": [5.01, 0.57, 7.38, 1.28, 18.26, 2.39, 1.45, 0.07, 7.18, 1.89, 1.36, 1.3, 3.07, 3.09, 5.35, -0.2, 3.26]} \ No newline at end of file diff --git a/annotations_1/ZyHoPZAsm60_filtered.json b/annotations_1/ZyHoPZAsm60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d18200a28037a2756ec7e856e9325a00eb5c2e78 --- /dev/null +++ b/annotations_1/ZyHoPZAsm60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.5], [16.0, 19.03], [20.0, 20.49], [21.0, 22.42], [23.0, 25.03], [27.0, 26.82], [28.0, 28.83], [32.0, 31.94], [33.0, 34.43], [41.0, 41.52], [45.0, 45.18], [60.0, 60.42], [63.0, 65.3], [70.0, 69.87], [73.0, 73.38], [79.0, 80.52], [81.0, 95.2], [96.0, 97.71], [99.0, 99.27], [100.0, 123.11], [140.0, 140.46], [142.0, 145.4], [146.0, 148.95], [151.0, 152.9], [153.0, 159.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 86.64, 0.0, 0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 47.5, 0.0, 0.0, 36.52, 0.0, 72.01, 74.76, 0.0, 67.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 61.96], ["didgeridoo", 5.07], ["hum", 3.15]], null, null, [["music", 67.59], ["throbbing", 4.98], ["hum", 4.1]], null, null, null, null, null], "duration": [1.5, 3.03, 0.49, 1.42, 2.03, -0.18, 0.83, -0.06, 1.43, 0.52, 0.18, 0.42, 2.3, -0.13, 0.38, 1.52, 14.2, 1.71, 0.27, 23.11, 0.46, 3.4, 2.95, 1.9, 6.17]} \ No newline at end of file diff --git a/annotations_1/ZyMP_jN2Veg_filtered.json b/annotations_1/ZyMP_jN2Veg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb26c04fd62eb49ad01c1ee856a80f58c1a04148 --- /dev/null +++ b/annotations_1/ZyMP_jN2Veg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.63], [8.0, 8.4], [12.0, 12.7], [14.0, 14.55], [15.0, 17.64], [21.0, 24.83], [31.0, 32.48], [33.0, 34.89], [38.0, 40.85], [44.0, 44.98], [46.0, 46.74], [48.0, 47.68], [49.0, 49.57], [50.0, 50.77], [52.0, 52.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 51.44, 51.5, 0.0, 0.0, 30.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 47.9], ["mains hum", 28.11], ["throbbing", 20.09]], null, null, null, null, null, null], "duration": [0.63, 0.4, 0.7, 0.55, 2.64, 3.83, 1.48, 1.89, 2.85, 0.98, 0.74, -0.32, 0.57, 0.77, 0.44]} \ No newline at end of file diff --git a/annotations_1/ZyirxKE2aFs_filtered.json b/annotations_1/ZyirxKE2aFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b8f98e3f697f3e14c07952f10dd4f91d6795d3a --- /dev/null +++ b/annotations_1/ZyirxKE2aFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.93], [12.0, 17.25], [19.0, 23.09], [26.0, 69.43], [72.0, 93.93], [98.0, 113.12], [117.0, 119.8]], "keep_status": [true, false, true, false, false, false, true], "silence_prob": [29.96, 30.19, 30.2, 0.0, 30.93, 29.93, 29.95], "audiomae_on_audioset": [[["music", 56.22], ["synthesizer", 7.77], ["musical instrument", 3.12]], [["music", 63.58], ["synthesizer", 19.52], ["musical instrument", 4.86]], [["music", 25.27], ["noise", 11.71], ["cacophony", 5.22]], null, [["music", 64.18], ["speech", 12.32], ["didgeridoo", 4.97]], [["music", 60.33], ["theremin", 5.64], ["electronic music", 4.71]], [["music", 47.78], ["speech", 10.22], ["beatboxing", 5.79]]], "duration": [2.93, 5.25, 4.09, 43.43, 21.93, 15.12, 2.8]} \ No newline at end of file diff --git a/annotations_1/_-4Xy6CjAbw_filtered.json b/annotations_1/_-4Xy6CjAbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3712c28ab263353b2791cbd6548b5365a39a7a64 --- /dev/null +++ b/annotations_1/_-4Xy6CjAbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 99.71], [100.0, 112.24], [115.0, 120.97], [123.0, 123.52]], "keep_status": [false, true, true, false], "silence_prob": [0.0, 42.37, 39.98, 0.0], "audiomae_on_audioset": [null, [["music", 25.17], ["speech", 23.34], ["whack, thwack", 9.33]], [["music", 24.06], ["speech", 15.87], ["throbbing", 9.29]], null], "duration": [73.71, 12.24, 5.97, 0.52]} \ No newline at end of file diff --git a/annotations_1/_-9wCERdcog_filtered.json b/annotations_1/_-9wCERdcog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c50eab1ddea021c406fc09ace269ac1566d3984f --- /dev/null +++ b/annotations_1/_-9wCERdcog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.86], [4.0, 4.4], [8.0, 8.75], [10.0, 11.33], [13.0, 13.76], [16.0, 16.09], [18.0, 19.94], [27.0, 27.87], [28.0, 28.17], [39.0, 40.88], [42.0, 42.57], [44.0, 45.15], [49.0, 49.82], [50.0, 51.12], [52.0, 53.16], [57.0, 59.31], [60.0, 61.94], [62.0, 62.78], [64.0, 64.47], [67.0, 67.56], [69.0, 75.64], [76.0, 76.15], [77.0, 78.43], [79.0, 79.64], [80.0, 81.23], [82.0, 82.75], [85.0, 87.42], [93.0, 93.41], [95.0, 94.95], [96.0, 96.55], [97.0, 97.55], [98.0, 98.76], [100.0, 107.38], [108.0, 108.21], [112.0, 126.4], [128.0, 128.34], [133.0, 133.47], [133.0, 141.44], [142.0, 145.64], [148.0, 149.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 33.83, 0.0, 0.0, 32.09, 65.32, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 52.94], ["synthesizer", 5.73], ["effects unit", 5.61]], null, null, [["speech", 66.67], ["thunk", 10.4], ["music", 10.29]], null, null], "duration": [0.86, 0.4, 0.75, 1.33, 0.76, 0.09, 1.94, 0.87, 0.17, 1.88, 0.57, 1.15, 0.82, 1.12, 1.16, 2.31, 1.94, 0.78, 0.47, 0.56, 6.64, 0.15, 1.43, 0.64, 1.23, 0.75, 2.42, 0.41, -0.05, 0.55, 0.55, 0.76, 7.38, 0.21, 14.4, 0.34, 0.47, 8.44, 3.64, 1.22]} \ No newline at end of file diff --git a/annotations_1/_0FLP8sxv2E_filtered.json b/annotations_1/_0FLP8sxv2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94e384bff13db6e7d7d344c858f7e95e7bfc5add --- /dev/null +++ b/annotations_1/_0FLP8sxv2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 20.17], [23.0, 70.24], [72.0, 72.55], [76.0, 78.88], [80.0, 84.15], [86.0, 99.37], [103.0, 129.03], [130.0, 130.89], [134.0, 141.0]], "keep_status": [true, false, false, false, true, false, false, false, false], "silence_prob": [29.17, 0.0, 0.0, 30.0, 30.67, 32.6, 31.84, 0.0, 30.32], "audiomae_on_audioset": [[["music", 37.89], ["whale vocalization", 25.26], ["hum", 3.13]], null, null, [["throbbing", 31.66], ["music", 29.0], ["hum", 20.38]], [["music", 63.01], ["speech", 4.02], ["grunt", 2.48]], [["music", 80.93], ["hum", 1.57], ["throbbing", 1.49]], [["music", 76.48], ["ambient music", 4.55], ["theremin", 4.1]], null, [["music", 29.59], ["hum", 23.61], ["throbbing", 19.84]]], "duration": [15.17, 47.24, 0.55, 2.88, 4.15, 13.37, 26.03, 0.89, 7.0]} \ No newline at end of file diff --git a/annotations_1/_0X1jPgLo-A_filtered.json b/annotations_1/_0X1jPgLo-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8c818b7b428a02228e835e19f1e8159e5afd10 --- /dev/null +++ b/annotations_1/_0X1jPgLo-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.45], [14.0, 15.53], [16.0, 18.49], [20.0, 20.71], [22.0, 24.43], [26.0, 26.62], [27.0, 28.76], [30.0, 30.3], [31.0, 31.99], [34.0, 36.88], [40.0, 41.2], [43.0, 44.17], [45.0, 45.82], [46.0, 46.97], [49.0, 49.71], [51.0, 52.29], [53.0, 54.19], [55.0, 55.63], [60.0, 84.82], [88.0, 89.9], [91.0, 92.75], [94.0, 95.82], [96.0, 97.17], [98.0, 135.67], [136.0, 138.65], [139.0, 140.22], [141.0, 143.58], [146.0, 148.0], [149.0, 149.86]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 43.61, 0.0, 64.18, 0.0, 0.0, 0.0, 0.0, 56.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.19, 0.0, 0.0, 0.0, 0.0, 0.0, 45.78, 0.0, 98.44, 99.71, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 43.36], ["speech", 18.21], ["insect", 5.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 18.61], ["animal", 14.54], ["music", 7.5]], null, null, null, null, null, [["animal", 34.39], ["insect", 7.75], ["wild animals", 7.17]], null, null, null, null], "duration": [0.45, 1.53, 2.49, 0.71, 2.43, 0.62, 1.76, 0.3, 0.99, 2.88, 1.2, 1.17, 0.82, 0.97, 0.71, 1.29, 1.19, 0.63, 24.82, 1.9, 1.75, 1.82, 1.17, 37.67, 2.65, 1.22, 2.58, 2.0, 0.86]} \ No newline at end of file diff --git a/annotations_1/_0gn0zQx4_s_filtered.json b/annotations_1/_0gn0zQx4_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87db74b0c7842f875a40b355aaab9126cac3a11a --- /dev/null +++ b/annotations_1/_0gn0zQx4_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [5.0, 5.83], [12.0, 12.23], [13.0, 13.68], [18.0, 23.52], [27.0, 27.7], [28.0, 31.38], [31.0, 31.45], [34.0, 68.49], [76.0, 85.26], [88.0, 88.52], [95.0, 100.85], [103.0, 103.82], [105.0, 107.45], [108.0, 111.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 28.54, 0.0, 30.21, 0.0, 0.0, 30.05, 0.0, 30.34, 0.0, 29.67, 30.87], "audiomae_on_audioset": [null, null, null, null, [["music", 37.01], ["speech", 23.46], ["dubstep", 16.05]], null, [["music", 47.23], ["speech", 21.85], ["sidetone", 11.3]], null, null, [["speech", 50.56], ["music", 24.51], ["electronic music", 5.71]], null, [["speech", 53.92], ["vehicle", 4.36], ["car", 3.24]], null, [["speech", 32.46], ["music", 22.22], ["grunt", 3.01]], [["music", 59.41], ["electronica", 3.49], ["techno", 3.42]]], "duration": [1.17, 0.83, 0.23, 0.68, 5.52, 0.7, 3.38, 0.45, 34.49, 9.26, 0.52, 5.85, 0.82, 2.45, 3.08]} \ No newline at end of file diff --git a/annotations_1/_0vYFxJJcB4_filtered.json b/annotations_1/_0vYFxJJcB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec6cc8b218b7fcdb9f715c920cb3a9032954fc9f --- /dev/null +++ b/annotations_1/_0vYFxJJcB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 20.7], [29.0, 29.89]], "keep_status": [false, false], "silence_prob": [78.55, 0.0], "audiomae_on_audioset": [null, null], "duration": [6.7, 0.89]} \ No newline at end of file diff --git a/annotations_1/_1fHeesAez0_filtered.json b/annotations_1/_1fHeesAez0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10613bf325d0eed7c163dd162e9b463941962d8a --- /dev/null +++ b/annotations_1/_1fHeesAez0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.35], [8.0, 10.61], [11.0, 13.14], [15.0, 19.01], [20.0, 21.32], [22.0, 30.87], [33.0, 36.41], [38.0, 41.98], [44.0, 45.13], [46.0, 53.7], [56.0, 60.72], [62.0, 63.66], [66.0, 67.85], [69.0, 69.09], [70.0, 72.66], [74.0, 74.17], [76.0, 77.14], [80.0, 80.94], [83.0, 84.03], [85.0, 85.63], [87.0, 87.24], [89.0, 90.93], [91.0, 92.94], [94.0, 96.89], [98.0, 101.76], [103.0, 105.61], [107.0, 108.41], [110.0, 111.86], [114.0, 116.88], [120.0, 121.58], [122.0, 127.67], [134.0, 135.48], [136.0, 136.63], [137.0, 138.45], [140.0, 140.02], [142.0, 157.49], [161.0, 168.52], [169.0, 172.57], [174.0, 175.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 91.64, 90.78, 100.0, 0.0, 100.0, 100.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 98.51, 100.0, 0.0, 0.0, 100.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 99.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.35, 2.61, 2.14, 4.01, 1.32, 8.87, 3.41, 3.98, 1.13, 7.7, 4.72, 1.66, 1.85, 0.09, 2.66, 0.17, 1.14, 0.94, 1.03, 0.63, 0.24, 1.93, 1.94, 2.89, 3.76, 2.61, 1.41, 1.86, 2.88, 1.58, 5.67, 1.48, 0.63, 1.45, 0.02, 15.49, 7.52, 3.57, 1.22]} \ No newline at end of file diff --git a/annotations_1/_1rqGyHtE4Q_filtered.json b/annotations_1/_1rqGyHtE4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21284ce78b744c90f5cd9a2c01481579b755d60d --- /dev/null +++ b/annotations_1/_1rqGyHtE4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 29.76], [60.0, 59.95], [60.0, 59.98], [61.0, 68.44], [71.0, 75.42]], "keep_status": [false, false, false, false, true], "silence_prob": [31.1, 0.0, 0.0, 29.7, 29.23], "audiomae_on_audioset": [[["music", 83.13], ["didgeridoo", 2.75], ["electronic music", 2.01]], null, null, [["music", 68.05], ["throbbing", 5.24], ["crowd", 3.73]], [["music", 42.23], ["vehicle", 12.55], ["motorcycle", 4.61]]], "duration": [12.76, -0.05, -0.02, 7.44, 4.42]} \ No newline at end of file diff --git a/annotations_1/_2gI4vpq9fo_filtered.json b/annotations_1/_2gI4vpq9fo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..067a71eeb2bc76ee5873f125a06cb5866d9ef2d0 --- /dev/null +++ b/annotations_1/_2gI4vpq9fo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 75.54]], "keep_status": [true], "silence_prob": [48.19], "audiomae_on_audioset": [[["music", 29.07], ["hum", 17.53], ["mains hum", 15.55]]], "duration": [28.54]} \ No newline at end of file diff --git a/annotations_1/_2vMtzWb6q0_filtered.json b/annotations_1/_2vMtzWb6q0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9738d16ead0e2e487c242c60b244e31664b4d313 --- /dev/null +++ b/annotations_1/_2vMtzWb6q0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 15.18], [18.0, 23.3], [28.0, 58.85], [63.0, 66.46], [67.0, 111.32], [114.0, 120.12]], "keep_status": [true, true, false, false, false, false], "silence_prob": [28.17, 35.01, 0.0, 36.08, 0.0, 29.57], "audiomae_on_audioset": [[["mains hum", 24.0], ["hum", 21.41], ["speech", 19.17]], [["hum", 25.46], ["speech", 20.78], ["music", 14.92]], null, [["music", 64.99], ["hum", 5.6], ["mains hum", 4.88]], null, [["music", 89.74], ["electronic music", 2.32], ["throbbing", 0.69]]], "duration": [10.18, 5.3, 30.85, 3.46, 44.32, 6.12]} \ No newline at end of file diff --git a/annotations_1/_41AKvC_uGk_filtered.json b/annotations_1/_41AKvC_uGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a538f4b3dc9faebb8d76e1f0d932dcf8c35f790c --- /dev/null +++ b/annotations_1/_41AKvC_uGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.86], [4.0, 10.61], [12.0, 13.32], [14.0, 18.22], [19.0, 20.75], [22.0, 24.17], [25.0, 26.2], [29.0, 29.44], [30.0, 29.94], [30.0, 30.0], [31.0, 36.8], [38.0, 39.41], [42.0, 42.65], [44.0, 48.0], [49.0, 50.09], [51.0, 52.86], [53.0, 68.42], [69.0, 70.14], [73.0, 75.36], [79.0, 95.17], [106.0, 106.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false], "silence_prob": [0.0, 49.87, 0.0, 65.55, 0.0, 73.36, 0.0, 0.0, 0.0, 0.0, 66.63, 0.0, 0.0, 65.2, 0.0, 0.0, 45.52, 0.0, 46.47, 35.24, 0.0], "audiomae_on_audioset": [null, [["hum", 36.67], ["music", 19.66], ["throbbing", 15.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["rumble", 25.96], ["hum", 22.38], ["music", 16.21]], null, [["hum", 38.2], ["mains hum", 20.42], ["throbbing", 3.94]], [["music", 53.87], ["animal", 8.58], ["wild animals", 4.78]], null], "duration": [1.86, 6.61, 1.32, 4.22, 1.75, 2.17, 1.2, 0.44, -0.06, 0.0, 5.8, 1.41, 0.65, 4.0, 1.09, 1.86, 15.42, 1.14, 2.36, 16.17, 0.46]} \ No newline at end of file diff --git a/annotations_1/_4DRXSdPuCo_filtered.json b/annotations_1/_4DRXSdPuCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29af8086c84dee03dc822871ef202b64eee1e773 --- /dev/null +++ b/annotations_1/_4DRXSdPuCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.51], [6.0, 7.05], [9.0, 10.1], [14.0, 15.26], [18.0, 19.63], [22.0, 25.27], [26.0, 28.26], [29.0, 31.33], [36.0, 37.35], [39.0, 40.58], [43.0, 43.78], [47.0, 47.34], [65.0, 65.92], [67.0, 67.19], [76.0, 77.21], [86.0, 86.83], [88.0, 88.42], [90.0, 90.41], [92.0, 92.18], [95.0, 96.26], [97.0, 98.29], [102.0, 103.01], [106.0, 109.19], [110.0, 112.65], [114.0, 114.3], [119.0, 120.01], [122.0, 123.26], [125.0, 126.32], [127.0, 130.25], [148.0, 149.49], [156.0, 159.87], [161.0, 161.96], [163.0, 163.17], [163.0, 163.26], [163.0, 170.24], [171.0, 171.19], [173.0, 173.89], [174.0, 177.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 84.98, 50.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 99.95, 0.0, 0.0, 0.0, 0.0, 64.63, 0.0, 54.04, 0.0, 0.0, 0.0, 36.64, 0.0, 0.0, 49.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.17], ["hum", 6.98], ["noise", 4.93]], null, null, [["hum", 31.34], ["mains hum", 30.95], ["speech", 16.48]]], "duration": [1.51, 1.05, 1.1, 1.26, 1.63, 3.27, 2.26, 2.33, 1.35, 1.58, 0.78, 0.34, 0.92, 0.19, 1.21, 0.83, 0.42, 0.41, 0.18, 1.26, 1.29, 1.01, 3.19, 2.65, 0.3, 1.01, 1.26, 1.32, 3.25, 1.49, 3.87, 0.96, 0.17, 0.26, 7.24, 0.19, 0.89, 3.97]} \ No newline at end of file diff --git a/annotations_1/_4EkJkuiwIg_filtered.json b/annotations_1/_4EkJkuiwIg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3597b85eb0f62c763ea1996d88b21e84d9e2c70 --- /dev/null +++ b/annotations_1/_4EkJkuiwIg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.05], [15.0, 15.25], [59.0, 60.24], [79.0, 79.37], [95.0, 95.18], [103.0, 103.62]], "keep_status": [false, false, false, false, false, false], "silence_prob": [99.96, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [3.05, 0.25, 1.24, 0.37, 0.18, 0.62]} \ No newline at end of file diff --git a/annotations_1/_4juqo20ABE_filtered.json b/annotations_1/_4juqo20ABE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..858e9bab8fdb526c208735513745fd63c84097c9 --- /dev/null +++ b/annotations_1/_4juqo20ABE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.3], [9.0, 9.48], [12.0, 12.31], [13.0, 13.95], [14.0, 14.55], [15.0, 15.13], [15.0, 16.55], [17.0, 17.29], [17.0, 28.0], [29.0, 31.55], [33.0, 38.96], [39.0, 54.3], [58.0, 64.02], [65.0, 65.72], [67.0, 67.34], [71.0, 70.85], [73.0, 74.07], [75.0, 75.96], [77.0, 77.25], [81.0, 81.38], [88.0, 88.52], [91.0, 91.52], [92.0, 92.64], [100.0, 100.8], [103.0, 103.74], [105.0, 112.67], [115.0, 115.94], [117.0, 120.12], [121.0, 124.88], [127.0, 127.94], [129.0, 129.88], [132.0, 133.07], [139.0, 139.99], [144.0, 145.0], [147.0, 154.65], [155.0, 156.81], [157.0, 158.13], [160.0, 159.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.52, 60.32, 37.8, 37.76, 52.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.16, 0.0, 97.54, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 52.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 32.47], ["sidetone", 20.76], ["radio", 17.56]], [["hum", 16.35], ["mains hum", 11.35], ["music", 6.49]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 0.48, 0.31, 0.95, 0.55, 0.13, 1.55, 0.29, 11.0, 2.55, 5.96, 15.3, 6.02, 0.72, 0.34, -0.15, 1.07, 0.96, 0.25, 0.38, 0.52, 0.52, 0.64, 0.8, 0.74, 7.67, 0.94, 3.12, 3.88, 0.94, 0.88, 1.07, 0.99, 1.0, 7.65, 1.81, 1.13, -0.3]} \ No newline at end of file diff --git a/annotations_1/_4otc_6WtmQ_filtered.json b/annotations_1/_4otc_6WtmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95bbd09ab0e66aed3e5064197b10bd4b2ead2d88 --- /dev/null +++ b/annotations_1/_4otc_6WtmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.11], [14.0, 14.25], [15.0, 16.48], [17.0, 17.69], [21.0, 22.1], [24.0, 25.02], [31.0, 33.02], [44.0, 45.47], [55.0, 55.56], [56.0, 56.39], [58.0, 59.12], [63.0, 63.12], [63.0, 63.15], [64.0, 64.32], [65.0, 65.04], [65.0, 65.2], [65.0, 65.23], [66.0, 66.33], [72.0, 72.64], [89.0, 90.29], [91.0, 93.41], [95.0, 95.18], [96.0, 101.21], [102.0, 102.46], [103.0, 109.43], [113.0, 112.95], [114.0, 115.2], [118.0, 120.23], [123.0, 124.78], [128.0, 128.19], [129.0, 129.46], [136.0, 138.55], [141.0, 142.15], [146.0, 146.03], [163.0, 164.19], [166.0, 167.16], [168.0, 167.81], [169.0, 169.35]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.22, 0.0, 0.0, 0.0, 0.0, 0.0, 45.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 32.94, 0.0, 32.18, 0.0, 0.0, 86.64, 0.0, 0.0, 0.0, 54.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["animal", 28.51], ["domestic animals, pets", 21.73], ["speech", 17.04]], null, null, null, null, null, [["speech", 49.43], ["sidetone", 14.77], ["music", 5.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 88.58], ["inside, small room", 4.87], ["noise", 1.79]], null, [["speech", 40.59], ["bow-wow", 14.19], ["dog", 12.57]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.11, 0.25, 1.48, 0.69, 1.1, 1.02, 2.02, 1.47, 0.56, 0.39, 1.12, 0.12, 0.15, 0.32, 0.04, 0.2, 0.23, 0.33, 0.64, 1.29, 2.41, 0.18, 5.21, 0.46, 6.43, -0.05, 1.2, 2.23, 1.78, 0.19, 0.46, 2.55, 1.15, 0.03, 1.19, 1.16, -0.19, 0.35]} \ No newline at end of file diff --git a/annotations_1/_525BmUkPmI_filtered.json b/annotations_1/_525BmUkPmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f3d8790780ae8e736a1e11e9c93b19f8a5e1478 --- /dev/null +++ b/annotations_1/_525BmUkPmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 26.74], [28.0, 42.74], [47.0, 57.37], [58.0, 66.73], [70.0, 70.28], [74.0, 74.44], [77.0, 80.05], [83.0, 83.12], [86.0, 86.12], [87.0, 87.59], [94.0, 94.51], [97.0, 97.61], [100.0, 100.63], [102.0, 102.64], [104.0, 104.84], [116.0, 117.56], [122.0, 123.6], [125.0, 125.02], [126.0, 130.54], [131.0, 133.32], [136.0, 138.72], [142.0, 143.77], [144.0, 145.98], [147.0, 147.75], [150.0, 150.75], [152.0, 152.78], [154.0, 154.04], [155.0, 155.97], [156.0, 156.86], [158.0, 160.68], [161.0, 161.76], [162.0, 163.0], [163.0, 163.65], [165.0, 165.55], [166.0, 167.58], [173.0, 173.23], [174.0, 174.85], [177.0, 188.42], [191.0, 191.47], [198.0, 197.82]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.91, 33.98, 33.38, 34.46, 0.0, 0.0, 40.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.14, 86.09, 76.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.21, 0.0, 0.0], "audiomae_on_audioset": [[["music", 72.12], ["sampler", 2.27], ["electronic music", 1.99]], [["music", 73.16], ["house music", 1.4], ["hum", 1.07]], [["music", 29.89], ["electric shaver, electric razor", 9.98], ["moo", 7.76]], [["music", 63.64], ["sampler", 3.28], ["electric shaver, electric razor", 1.76]], null, null, [["music", 75.44], ["electronic music", 1.73], ["house music", 1.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.74, 14.74, 10.37, 8.73, 0.28, 0.44, 3.05, 0.12, 0.12, 0.59, 0.51, 0.61, 0.63, 0.64, 0.84, 1.56, 1.6, 0.02, 4.54, 2.32, 2.72, 1.77, 1.98, 0.75, 0.75, 0.78, 0.04, 0.97, 0.86, 2.68, 0.76, 1.0, 0.65, 0.55, 1.58, 0.23, 0.85, 11.42, 0.47, -0.18]} \ No newline at end of file diff --git a/annotations_1/_5IVdeFrhv4_filtered.json b/annotations_1/_5IVdeFrhv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..149a1d91bed76109daa947a5c9bdfcca5dc44817 --- /dev/null +++ b/annotations_1/_5IVdeFrhv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [3.0, 3.2], [4.0, 5.91], [7.0, 7.55], [8.0, 9.22], [10.0, 10.96], [12.0, 12.87], [19.0, 21.32], [23.0, 24.48], [26.0, 29.13], [30.0, 31.8], [33.0, 35.34], [36.0, 40.05], [41.0, 41.79], [43.0, 43.98], [45.0, 46.79], [48.0, 49.86], [52.0, 52.56], [53.0, 54.3], [57.0, 59.75], [61.0, 77.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 95.09, 0.0, 97.64, 98.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.73, 38.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["tuning fork", 32.62], ["busy signal", 19.1], ["chirp tone", 8.32]]], "duration": [0.29, 0.2, 1.91, 0.55, 1.22, 0.96, 0.87, 2.32, 1.48, 3.13, 1.8, 2.34, 4.05, 0.79, 0.98, 1.79, 1.86, 0.56, 1.3, 2.75, 16.85]} \ No newline at end of file diff --git a/annotations_1/_5uHK-fVMcY_filtered.json b/annotations_1/_5uHK-fVMcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a4fd6783ea1a314a88f7fc566cc5321e46982c0 --- /dev/null +++ b/annotations_1/_5uHK-fVMcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 55.43], [56.0, 59.53], [68.0, 69.28], [70.0, 72.06], [74.0, 75.1], [79.0, 80.4], [82.0, 84.5], [89.0, 90.39], [94.0, 95.42], [97.0, 99.25], [102.0, 102.73], [104.0, 106.49], [107.0, 108.62], [112.0, 113.22], [123.0, 124.34], [131.0, 134.32], [136.0, 137.84], [139.0, 141.51], [146.0, 147.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 99.62, 0.0, 0.0, 100.0, 0.0, 0.0, 97.11, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [45.43, 3.53, 1.28, 2.06, 1.1, 1.4, 2.5, 1.39, 1.42, 2.25, 0.73, 2.49, 1.62, 1.22, 1.34, 3.32, 1.84, 2.51, 1.45]} \ No newline at end of file diff --git a/annotations_1/_6RI-8Ia4do_filtered.json b/annotations_1/_6RI-8Ia4do_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe2e5e0bd8c20c62894bf79f7cc487e01b0a2b77 --- /dev/null +++ b/annotations_1/_6RI-8Ia4do_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.11], [18.0, 20.22], [24.0, 27.4], [28.0, 65.06], [72.0, 72.55], [73.0, 99.94], [101.0, 117.69]], "keep_status": [false, false, true, false, false, true, true], "silence_prob": [0.0, 94.07, 47.16, 0.0, 0.0, 28.27, 28.29], "audiomae_on_audioset": [null, null, [["whale vocalization", 30.97], ["hum", 16.56], ["mains hum", 4.66]], null, null, [["buzz", 19.54], ["music", 15.09], ["speech", 12.78]], [["whack, thwack", 17.18], ["explosion", 14.05], ["music", 9.95]]], "duration": [0.11, 2.22, 3.4, 37.06, 0.55, 26.94, 16.69]} \ No newline at end of file diff --git a/annotations_1/_7DVsN761n0_filtered.json b/annotations_1/_7DVsN761n0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d4ac0750ccd2a0dc6ee657219a57d44a7e3eb84 --- /dev/null +++ b/annotations_1/_7DVsN761n0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.14], [21.0, 22.22], [24.0, 25.02], [26.0, 33.3], [42.0, 45.01], [47.0, 48.02], [49.0, 50.11], [51.0, 51.63], [58.0, 57.84], [58.0, 59.7], [61.0, 61.48], [62.0, 62.55], [65.0, 65.57], [69.0, 68.72], [74.0, 74.21], [75.0, 75.29], [76.0, 76.44], [82.0, 86.9], [89.0, 91.35], [94.0, 94.98], [96.0, 97.21], [100.0, 100.85], [102.0, 103.15], [104.0, 104.85], [107.0, 113.53], [123.0, 125.31], [132.0, 134.5], [136.0, 150.33], [154.0, 162.68], [163.0, 165.91], [168.0, 172.5], [190.0, 192.27], [194.0, 194.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 46.61, 98.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.81, 84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 39.05, 29.3, 38.62, 31.41, 37.91, 95.91, 89.54, 40.59, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 53.25], ["wail, moan", 16.18], ["groan", 11.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.87], ["mains hum", 5.23], ["hum", 4.52]], null, null, null, null, null, null, [["speech", 36.62], ["music", 28.98], ["theremin", 4.28]], [["music", 53.45], ["boom", 9.51], ["hum", 6.64]], [["music", 60.04], ["speech", 7.74], ["synthesizer", 3.61]], [["music", 62.75], ["hum", 10.92], ["mains hum", 5.31]], [["whack, thwack", 43.51], ["music", 15.96], ["thunk", 14.43]], null, null, [["breaking", 52.7], ["thunk", 12.08], ["busy signal", 7.0]], null], "duration": [1.14, 1.22, 1.02, 7.3, 3.01, 1.02, 1.11, 0.63, -0.16, 1.7, 0.48, 0.55, 0.57, -0.28, 0.21, 0.29, 0.44, 4.9, 2.35, 0.98, 1.21, 0.85, 1.15, 0.85, 6.53, 2.31, 2.5, 14.33, 8.68, 2.91, 4.5, 2.27, 0.53]} \ No newline at end of file diff --git a/annotations_1/_8hB8umrGlo_filtered.json b/annotations_1/_8hB8umrGlo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfab35d373ed4ccf0f8afe1da8b517d7db2a1d97 --- /dev/null +++ b/annotations_1/_8hB8umrGlo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[90.0, 90.46], [92.0, 93.93], [96.0, 97.21], [99.0, 143.72]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.46, 1.93, 1.21, 44.72]} \ No newline at end of file diff --git a/annotations_1/_8w9rOpV3gc_filtered.json b/annotations_1/_8w9rOpV3gc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58283d87c7ad9a5f6f98d3473814eb80e77fd672 --- /dev/null +++ b/annotations_1/_8w9rOpV3gc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.46], [7.0, 8.55], [9.0, 11.48], [13.0, 15.48], [18.0, 18.52], [19.0, 20.34], [25.0, 25.68], [27.0, 27.5], [29.0, 29.64], [41.0, 41.91], [46.0, 48.71], [56.0, 55.66], [61.0, 62.09], [74.0, 74.26], [75.0, 76.18], [89.0, 94.61], [98.0, 201.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 63.1, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.38, 0.0, 0.0, 0.0, 0.0, 35.8, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 58.95], ["foghorn", 8.52], ["trombone", 7.41]], null, null, null, null, [["music", 73.61], ["synthesizer", 2.3], ["musical instrument", 1.91]], null], "duration": [0.46, 1.55, 2.48, 2.48, 0.52, 1.34, 0.68, 0.5, 0.64, 0.91, 2.71, -0.34, 1.09, 0.26, 1.18, 5.61, 103.33]} \ No newline at end of file diff --git a/annotations_1/_92v2IFT7WE_filtered.json b/annotations_1/_92v2IFT7WE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6a6143b9db7ffd99850bfa98b1733de8924ac58 --- /dev/null +++ b/annotations_1/_92v2IFT7WE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[74.0, 132.66]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [58.66]} \ No newline at end of file diff --git a/annotations_1/_9qsxe5kHdo_filtered.json b/annotations_1/_9qsxe5kHdo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..437707bc0a6135ac14efa359f17805fb286f64e0 --- /dev/null +++ b/annotations_1/_9qsxe5kHdo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.0], [24.0, 27.04], [29.0, 51.95], [53.0, 55.16], [60.0, 61.33], [67.0, 68.13], [69.0, 69.74], [71.0, 90.85], [92.0, 97.43], [99.0, 101.92], [103.0, 105.04], [107.0, 116.13], [117.0, 117.41], [118.0, 119.55], [121.0, 122.67], [123.0, 123.6], [125.0, 127.3], [129.0, 130.67], [132.0, 140.71], [142.0, 143.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 99.98, 0.0, 0.0, 0.0, 99.99, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 3.04, 22.95, 2.16, 1.33, 1.13, 0.74, 19.85, 5.43, 2.92, 2.04, 9.13, 0.41, 1.55, 1.67, 0.6, 2.3, 1.67, 8.71, 1.28]} \ No newline at end of file diff --git a/annotations_1/_AElcgYtxpA_filtered.json b/annotations_1/_AElcgYtxpA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78dfc32ac26d1966cb082da53053226cce255359 --- /dev/null +++ b/annotations_1/_AElcgYtxpA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.63], [18.0, 63.78], [66.0, 73.36], [76.0, 76.84], [77.0, 87.67], [91.0, 94.19]], "keep_status": [false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 28.91, 0.0, 28.41, 28.4], "audiomae_on_audioset": [null, null, [["music", 17.24], ["hum", 16.71], ["throbbing", 15.38]], null, [["speech", 69.24], ["music", 20.68], ["throbbing", 1.16]], [["music", 31.34], ["speech", 19.27], ["zipper (clothing)", 10.5]]], "duration": [0.63, 45.78, 7.36, 0.84, 10.67, 3.19]} \ No newline at end of file diff --git a/annotations_1/_B6AZdgQbeU_filtered.json b/annotations_1/_B6AZdgQbeU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45cdbfb8e70717c7748680a8d50b821504588870 --- /dev/null +++ b/annotations_1/_B6AZdgQbeU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.88], [7.0, 7.77], [10.0, 11.11], [14.0, 30.16], [31.0, 31.56], [37.0, 38.38], [52.0, 53.52], [59.0, 59.97], [61.0, 62.34], [64.0, 65.99], [67.0, 67.49], [69.0, 74.8], [76.0, 77.85], [79.0, 79.71], [80.0, 81.01], [83.0, 84.2], [85.0, 86.91], [88.0, 89.78], [90.0, 91.98], [93.0, 96.96], [98.0, 99.23], [101.0, 102.73], [105.0, 106.91], [107.0, 109.07], [111.0, 112.4], [113.0, 113.83], [114.0, 115.94], [117.0, 120.48]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 40.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.86, 0.0, 0.0, 0.0, 38.19, 0.0, 0.0, 0.0, 46.97], "audiomae_on_audioset": [null, null, null, [["vehicle", 12.3], ["fixed-wing aircraft, airplane", 11.77], ["aircraft", 9.43]], null, null, null, null, null, null, null, [["music", 29.08], ["sonar", 12.41], ["electronic music", 11.12]], null, null, null, null, null, null, null, [["music", 15.48], ["hum", 13.11], ["rumble", 10.83]], null, null, null, [["speech", 53.47], ["bee, wasp, etc.", 4.66], ["outside, rural or natural", 4.39]], null, null, null, [["hum", 42.81], ["throbbing", 8.71], ["music", 5.64]]], "duration": [1.88, 0.77, 1.11, 16.16, 0.56, 1.38, 1.52, 0.97, 1.34, 1.99, 0.49, 5.8, 1.85, 0.71, 1.01, 1.2, 1.91, 1.78, 1.98, 3.96, 1.23, 1.73, 1.91, 2.07, 1.4, 0.83, 1.94, 3.48]} \ No newline at end of file diff --git a/annotations_1/_BjawJWZIxo_filtered.json b/annotations_1/_BjawJWZIxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2536354bbdffc277a9a85c577a9f7af41f21d004 --- /dev/null +++ b/annotations_1/_BjawJWZIxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [9.0, 67.22], [70.0, 70.78], [73.0, 101.26], [108.0, 109.27], [111.0, 112.35], [113.0, 113.86], [119.0, 125.76], [129.0, 132.22], [136.0, 170.41]], "keep_status": [false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.45, 0.0, 0.0, 0.0, 32.01, 52.8, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 26.21], ["music", 18.33], ["whack, thwack", 16.12]], null, null, null, [["music", 56.87], ["electronic music", 6.75], ["gong", 4.03]], null, null], "duration": [0.43, 58.22, 0.78, 28.26, 1.27, 1.35, 0.86, 6.76, 3.22, 34.41]} \ No newline at end of file diff --git a/annotations_1/_CuE3lto5XA_filtered.json b/annotations_1/_CuE3lto5XA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72ea90fe07fe72f06532c68fe4df220ac21b4340 --- /dev/null +++ b/annotations_1/_CuE3lto5XA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 20.12], [23.0, 34.47], [36.0, 39.29], [43.0, 44.02], [45.0, 44.88], [45.0, 49.76], [57.0, 79.66], [81.0, 106.42], [114.0, 160.96], [163.0, 163.8], [166.0, 166.7], [169.0, 170.13], [176.0, 177.42], [181.0, 181.77], [183.0, 183.25]], "keep_status": [true, true, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [28.34, 28.4, 29.2, 0.0, 0.0, 29.18, 29.43, 30.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 26.91], ["music", 18.89], ["mains hum", 16.63]], [["music", 31.78], ["speech", 30.2], ["buzz", 5.87]], [["music", 19.74], ["hum", 15.17], ["boom", 13.38]], null, null, [["explosion", 54.45], ["speech", 21.45], ["burst, pop", 11.2]], [["music", 23.47], ["speech", 22.44], ["hum", 16.55]], [["music", 52.92], ["throbbing", 20.32], ["hum", 10.56]], null, null, null, null, null, null, null], "duration": [4.12, 11.47, 3.29, 1.02, -0.12, 4.76, 22.66, 25.42, 46.96, 0.8, 0.7, 1.13, 1.42, 0.77, 0.25]} \ No newline at end of file diff --git a/annotations_1/_CuZqXrhEZI_filtered.json b/annotations_1/_CuZqXrhEZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..519eb90ef78697cc2a53b837b993b01337510f3e --- /dev/null +++ b/annotations_1/_CuZqXrhEZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 25.12], [28.0, 28.29], [29.0, 30.97], [32.0, 32.76], [34.0, 35.13], [37.0, 38.97], [41.0, 42.48], [43.0, 44.04], [46.0, 46.9], [48.0, 49.06], [51.0, 50.65], [52.0, 52.27], [61.0, 61.7], [66.0, 65.96], [69.0, 68.98], [73.0, 74.26], [77.0, 88.37], [89.0, 104.65], [105.0, 107.42], [109.0, 112.5], [115.0, 115.13], [118.0, 119.53], [126.0, 126.71], [131.0, 133.2], [136.0, 137.76], [140.0, 143.33], [145.0, 146.67], [148.0, 153.08], [154.0, 158.3], [160.0, 170.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 99.96, 99.98, 100.0, 0.0, 0.0, 0.0, 99.36, 0.0, 100.0, 0.0, 100.0, 99.85, 99.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.12, 0.29, 1.97, 0.76, 1.13, 1.97, 1.48, 1.04, 0.9, 1.06, -0.35, 0.27, 0.7, -0.04, -0.02, 1.26, 11.37, 15.65, 2.42, 3.5, 0.13, 1.53, 0.71, 2.2, 1.76, 3.33, 1.67, 5.08, 4.3, 10.72]} \ No newline at end of file diff --git a/annotations_1/_DtsWj_e2vI_filtered.json b/annotations_1/_DtsWj_e2vI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2caf1ae913c3aa2edbea084e4df63c1e9a58a788 --- /dev/null +++ b/annotations_1/_DtsWj_e2vI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.9], [2.0, 3.03], [4.0, 6.74], [16.0, 16.75], [17.0, 18.01], [21.0, 23.45], [26.0, 27.18], [28.0, 28.66], [30.0, 30.25], [35.0, 36.27], [48.0, 48.44], [52.0, 53.47], [55.0, 55.76], [56.0, 56.46], [57.0, 58.16], [59.0, 62.72], [63.0, 63.96], [65.0, 65.16], [67.0, 66.77], [72.0, 75.25], [79.0, 79.27], [79.0, 79.57], [80.0, 81.16], [86.0, 87.2], [88.0, 92.87], [96.0, 98.07], [99.0, 108.26], [111.0, 112.87], [117.0, 117.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.26, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 0.0, 0.0, 0.0, 98.59, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.9, 1.03, 2.74, 0.75, 1.01, 2.45, 1.18, 0.66, 0.25, 1.27, 0.44, 1.47, 0.76, 0.46, 1.16, 3.72, 0.96, 0.16, -0.23, 3.25, 0.27, 0.57, 1.16, 1.2, 4.87, 2.07, 9.26, 1.87, 0.54]} \ No newline at end of file diff --git a/annotations_1/_Du0A1y4Wh4_filtered.json b/annotations_1/_Du0A1y4Wh4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63b428258dc251f7cf3a27ec4cc2228dd7da2287 --- /dev/null +++ b/annotations_1/_Du0A1y4Wh4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.3], [6.0, 7.03], [8.0, 9.76], [10.0, 11.28], [12.0, 12.75], [14.0, 13.86], [15.0, 16.12], [19.0, 20.34], [22.0, 24.6], [26.0, 28.95], [32.0, 33.57], [35.0, 38.06], [39.0, 40.95], [42.0, 44.95], [47.0, 48.19], [50.0, 51.16], [54.0, 56.49], [58.0, 58.65], [60.0, 63.26], [65.0, 65.65], [66.0, 80.92], [81.0, 81.09], [81.0, 89.13], [92.0, 92.79], [94.0, 94.29], [95.0, 95.42], [98.0, 99.32], [100.0, 101.41], [102.0, 103.76], [105.0, 107.76], [109.0, 110.46], [112.0, 112.65], [113.0, 114.64], [115.0, 117.12], [119.0, 119.91], [121.0, 126.54], [128.0, 127.99], [128.0, 128.63], [129.0, 129.64], [131.0, 131.85], [133.0, 137.4], [139.0, 145.57], [146.0, 147.72], [148.0, 150.89], [151.0, 161.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 66.76, 0.0, 66.03, 0.0, 45.05, 0.0, 0.0, 77.53, 0.0, 54.7, 0.0, 52.98, 0.0, 57.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 0.0, 0.0, 0.0, 64.29, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 73.67, 32.51, 0.0, 74.44, 31.57], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 15.3], ["music", 13.16], ["animal", 8.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 32.86], ["mains hum", 17.15], ["hum", 15.33]], null, null, [["speech", 45.7], ["vehicle", 8.65], ["hum", 8.16]]], "duration": [0.3, 1.03, 1.76, 1.28, 0.75, -0.14, 1.12, 1.34, 2.6, 2.95, 1.57, 3.06, 1.95, 2.95, 1.19, 1.16, 2.49, 0.65, 3.26, 0.65, 14.92, 0.09, 8.13, 0.79, 0.29, 0.42, 1.32, 1.41, 1.76, 2.76, 1.46, 0.65, 1.64, 2.12, 0.91, 5.54, -0.01, 0.63, 0.64, 0.85, 4.4, 6.57, 1.72, 2.89, 10.28]} \ No newline at end of file diff --git a/annotations_1/_EjWpjky5lU_filtered.json b/annotations_1/_EjWpjky5lU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77187a5f086f63243f15593c0f95f119eaeeedb4 --- /dev/null +++ b/annotations_1/_EjWpjky5lU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.28], [21.0, 25.32], [29.0, 31.41], [35.0, 39.06], [40.0, 40.34], [42.0, 46.16], [47.0, 47.39], [53.0, 54.92], [58.0, 61.28], [66.0, 66.14], [68.0, 70.7], [72.0, 74.65], [86.0, 91.4], [92.0, 96.89], [102.0, 105.95], [106.0, 122.81]], "keep_status": [false, false, true, false, false, true, false, false, true, false, true, true, false, true, false, false], "silence_prob": [35.36, 32.12, 29.82, 29.23, 0.0, 29.99, 0.0, 0.0, 30.36, 0.0, 28.92, 28.77, 29.34, 30.35, 30.97, 30.13], "audiomae_on_audioset": [[["music", 51.05], ["throbbing", 11.29], ["theremin", 9.06]], [["foghorn", 40.54], ["music", 24.17], ["mechanisms", 5.7]], [["hum", 29.31], ["throbbing", 20.94], ["mains hum", 13.08]], [["music", 79.46], ["electronic music", 6.59], ["sound effect", 1.37]], null, [["music", 51.02], ["noise", 6.73], ["musical instrument", 6.15]], null, null, [["music", 29.49], ["hum", 18.32], ["mains hum", 12.48]], null, [["speech", 47.76], ["music", 9.2], ["electric shaver, electric razor", 7.44]], [["music", 46.66], ["reverberation", 7.58], ["cacophony", 4.48]], [["music", 52.6], ["throbbing", 12.12], ["hum", 10.02]], [["music", 26.51], ["throbbing", 20.54], ["hum", 13.65]], [["speech", 40.58], ["music", 34.25], ["didgeridoo", 5.29]], [["speech", 50.02], ["music", 24.85], ["hum", 3.51]]], "duration": [2.28, 4.32, 2.41, 4.06, 0.34, 4.16, 0.39, 1.92, 3.28, 0.14, 2.7, 2.65, 5.4, 4.89, 3.95, 16.81]} \ No newline at end of file diff --git a/annotations_1/_EpizUY_las_filtered.json b/annotations_1/_EpizUY_las_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a00ec7801ba1572cf13fb016d3fb7c286c0eb0d --- /dev/null +++ b/annotations_1/_EpizUY_las_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.89], [8.0, 12.04], [13.0, 40.37], [43.0, 50.87], [53.0, 55.19], [56.0, 58.6], [61.0, 62.55], [64.0, 65.57], [66.0, 67.86], [68.0, 70.06], [71.0, 71.71], [72.0, 77.11], [78.0, 79.81], [81.0, 83.71], [84.0, 90.17], [92.0, 93.92], [95.0, 103.08], [105.0, 108.43], [111.0, 112.11], [113.0, 120.14], [121.0, 123.87], [126.0, 128.43], [130.0, 130.13], [131.0, 134.0], [135.0, 135.92], [137.0, 139.82], [141.0, 142.26], [143.0, 144.63], [146.0, 154.25], [154.0, 154.28], [154.0, 154.48], [155.0, 156.49], [158.0, 159.8], [160.0, 160.69], [161.0, 161.99], [162.0, 163.76], [164.0, 165.92], [169.0, 170.45]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.19, 56.33, 35.7, 45.11, 90.6, 86.45, 0.0, 0.0, 0.0, 54.9, 0.0, 94.22, 0.0, 99.31, 98.27, 0.0, 39.98, 63.64, 0.0, 43.2, 76.37, 73.51, 0.0, 99.85, 0.0, 90.95, 0.0, 0.0, 46.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 61.47], ["mains hum", 21.88], ["throbbing", 2.45]], [["hum", 23.26], ["music", 21.91], ["mains hum", 19.57]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 63.48], ["hum", 9.08], ["radio", 6.85]], null, null, [["speech", 61.96], ["radio", 6.21], ["mechanisms", 5.29]], null, null, null, null, null, null, null, null, [["speech", 80.27], ["telephone", 4.86], ["radio", 4.19]], null, null, null, null, null, null, null, null, null], "duration": [2.89, 4.04, 27.37, 7.87, 2.19, 2.6, 1.55, 1.57, 1.86, 2.06, 0.71, 5.11, 1.81, 2.71, 6.17, 1.92, 8.08, 3.43, 1.11, 7.14, 2.87, 2.43, 0.13, 3.0, 0.92, 2.82, 1.26, 1.63, 8.25, 0.28, 0.48, 1.49, 1.8, 0.69, 0.99, 1.76, 1.92, 1.45]} \ No newline at end of file diff --git a/annotations_1/_GAA_LvDQMQ_filtered.json b/annotations_1/_GAA_LvDQMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..097725ed7bd6893b6be106c0ed1a0c79e69f6d59 --- /dev/null +++ b/annotations_1/_GAA_LvDQMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.24], [11.0, 13.49], [14.0, 15.36], [18.0, 18.79], [20.0, 26.45], [27.0, 31.7], [33.0, 33.18], [38.0, 40.47], [42.0, 43.43], [45.0, 46.8], [48.0, 50.4], [51.0, 54.23], [55.0, 62.65], [64.0, 64.49], [65.0, 65.8], [68.0, 69.75], [73.0, 73.94], [75.0, 75.68], [77.0, 78.24], [80.0, 80.79], [82.0, 84.03], [85.0, 86.29], [88.0, 89.21], [91.0, 97.43], [99.0, 101.31], [103.0, 109.27], [111.0, 112.33], [115.0, 132.73], [135.0, 143.97], [145.0, 151.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [99.65, 71.72, 0.0, 0.0, 81.0, 60.05, 0.0, 84.98, 0.0, 0.0, 69.47, 50.36, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.64, 0.0, 0.0, 57.09, 96.77, 69.34, 0.0, 38.91, 29.16, 37.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 58.19], ["synthesizer", 5.62], ["speech", 3.44]], [["music", 72.27], ["cacophony", 1.97], ["boom", 1.56]], [["hum", 53.15], ["mains hum", 16.2], ["music", 10.93]]], "duration": [2.24, 2.49, 1.36, 0.79, 6.45, 4.7, 0.18, 2.47, 1.43, 1.8, 2.4, 3.23, 7.65, 0.49, 0.8, 1.75, 0.94, 0.68, 1.24, 0.79, 2.03, 1.29, 1.21, 6.43, 2.31, 6.27, 1.33, 17.73, 8.97, 6.6]} \ No newline at end of file diff --git a/annotations_1/_GJG2JDvCes_filtered.json b/annotations_1/_GJG2JDvCes_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/_GJG2JDvCes_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/_HgOQNBkVvY_filtered.json b/annotations_1/_HgOQNBkVvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9274754dddf6274ff80eb0de7684296af6baa12b --- /dev/null +++ b/annotations_1/_HgOQNBkVvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.17], [4.0, 10.27], [11.0, 11.99], [14.0, 14.25], [17.0, 18.45], [21.0, 22.57], [25.0, 25.74], [31.0, 32.24], [35.0, 36.64], [39.0, 43.38], [49.0, 49.47], [55.0, 55.11], [61.0, 61.72], [63.0, 63.9], [66.0, 66.14], [68.0, 75.74], [76.0, 80.52], [82.0, 81.99], [83.0, 86.0], [90.0, 89.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 44.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 73.97, 0.0, 45.46, 0.0], "audiomae_on_audioset": [null, [["theremin", 65.39], ["music", 29.86], ["synthesizer", 0.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.18], ["music", 20.6], ["didgeridoo", 8.98]], null], "duration": [0.17, 6.27, 0.99, 0.25, 1.45, 1.57, 0.74, 1.24, 1.64, 4.38, 0.47, 0.11, 0.72, 0.9, 0.14, 7.74, 4.52, -0.01, 3.0, -0.12]} \ No newline at end of file diff --git a/annotations_1/_HoKFu0orAs_filtered.json b/annotations_1/_HoKFu0orAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aa9c02d90001e1cb28330c5393f4db4a2ac25b6 --- /dev/null +++ b/annotations_1/_HoKFu0orAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.34], [12.0, 14.76], [23.0, 30.27], [32.0, 40.69], [41.0, 42.84], [44.0, 45.69], [49.0, 49.55], [52.0, 52.34], [53.0, 54.55], [57.0, 57.47], [58.0, 58.14], [60.0, 60.86], [64.0, 67.44], [68.0, 68.5], [71.0, 71.15], [71.0, 72.12], [77.0, 78.34], [81.0, 82.88], [85.0, 85.58], [86.0, 87.0], [88.0, 88.32], [89.0, 89.58], [93.0, 93.53], [95.0, 98.63], [99.0, 103.57], [104.0, 108.55], [110.0, 110.05], [111.0, 111.94], [113.0, 113.54], [122.0, 123.03], [124.0, 125.1], [130.0, 131.45], [134.0, 136.98], [140.0, 140.76], [143.0, 143.33], [145.0, 145.76], [150.0, 152.49]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.11, 92.15, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 75.39, 69.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0, 99.44], "audiomae_on_audioset": [null, [["music", 25.99], ["hum", 18.11], ["mains hum", 13.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 2.76, 7.27, 8.69, 1.84, 1.69, 0.55, 0.34, 1.55, 0.47, 0.14, 0.86, 3.44, 0.5, 0.15, 1.12, 1.34, 1.88, 0.58, 1.0, 0.32, 0.58, 0.53, 3.63, 4.57, 4.55, 0.05, 0.94, 0.54, 1.03, 1.1, 1.45, 2.98, 0.76, 0.33, 0.76, 2.49]} \ No newline at end of file diff --git a/annotations_1/_Hxk9-WNdGQ_filtered.json b/annotations_1/_Hxk9-WNdGQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cce6ccf51c67bc35ae67072f2601991cf2b8e82 --- /dev/null +++ b/annotations_1/_Hxk9-WNdGQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 33.71], [37.0, 48.09], [51.0, 60.44], [62.0, 99.45], [100.0, 118.27], [118.0, 118.34], [119.0, 126.81]], "keep_status": [true, false, true, false, true, false, false], "silence_prob": [27.81, 29.08, 29.03, 0.0, 28.93, 0.0, 28.36], "audiomae_on_audioset": [[["speech", 44.49], ["vehicle", 14.11], ["accelerating, revving, vroom", 5.43]], [["hum", 37.89], ["throbbing", 32.33], ["music", 12.84]], [["music", 35.4], ["vehicle", 16.67], ["motorcycle", 15.09]], null, [["music", 37.2], ["speech", 15.47], ["foghorn", 10.56]], null, [["music", 45.52], ["throbbing", 24.77], ["hum", 7.94]]], "duration": [5.71, 11.09, 9.44, 37.45, 18.27, 0.34, 7.81]} \ No newline at end of file diff --git a/annotations_1/_I_F4a-oUyA_filtered.json b/annotations_1/_I_F4a-oUyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02f14e3ceec04b4de18a40a5731e8e941644905c --- /dev/null +++ b/annotations_1/_I_F4a-oUyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 27.85], [31.0, 42.03], [43.0, 89.26], [92.0, 101.07], [107.0, 147.16]], "keep_status": [true, false, false, true, false], "silence_prob": [33.69, 33.83, 0.0, 42.11, 0.0], "audiomae_on_audioset": [[["buzz", 49.3], ["hum", 12.1], ["mains hum", 6.11]], [["hum", 50.42], ["mains hum", 20.47], ["buzz", 9.42]], null, [["speech", 41.42], ["music", 13.94], ["buzz", 5.86]], null], "duration": [4.85, 11.03, 46.26, 9.07, 40.16]} \ No newline at end of file diff --git a/annotations_1/_IwNoboTiHU_filtered.json b/annotations_1/_IwNoboTiHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a922584c01495d6cbaff2692d5cead71149b97ec --- /dev/null +++ b/annotations_1/_IwNoboTiHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 41.77], [45.0, 48.19], [50.0, 71.37], [72.0, 72.74], [76.0, 89.95], [91.0, 92.16], [92.0, 114.39], [115.0, 117.19], [119.0, 123.47], [125.0, 126.66]], "keep_status": [false, false, true, false, true, false, false, true, true, false], "silence_prob": [0.0, 31.69, 30.38, 0.0, 30.46, 0.0, 31.69, 36.76, 35.08, 0.0], "audiomae_on_audioset": [null, [["throbbing", 47.25], ["hum", 34.17], ["mains hum", 5.6]], [["music", 34.36], ["hum", 4.54], ["whack, thwack", 4.2]], null, [["hum", 30.44], ["throbbing", 15.75], ["music", 13.75]], null, [["speech", 33.91], ["music", 33.11], ["hum", 8.76]], [["music", 24.37], ["hum", 24.33], ["throbbing", 19.16]], [["speech", 26.76], ["music", 21.91], ["sonar", 11.66]], null], "duration": [38.77, 3.19, 21.37, 0.74, 13.95, 1.16, 22.39, 2.19, 4.47, 1.66]} \ No newline at end of file diff --git a/annotations_1/_JcFaIDdphE_filtered.json b/annotations_1/_JcFaIDdphE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dee2e78f8092c4b45fdd65c9dd62cc8c5f8d633 --- /dev/null +++ b/annotations_1/_JcFaIDdphE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 46.72], [50.0, 50.89], [52.0, 55.32], [57.0, 59.8], [61.0, 96.87], [99.0, 99.93], [102.0, 125.27]], "keep_status": [true, false, true, true, false, false, true], "silence_prob": [29.0, 0.0, 29.27, 29.66, 0.0, 0.0, 29.61], "audiomae_on_audioset": [[["music", 21.6], ["explosion", 6.53], ["vehicle", 4.85]], null, [["mains hum", 24.42], ["hum", 16.39], ["music", 14.53]], [["cattle, bovinae", 31.61], ["moo", 22.18], ["music", 7.94]], null, null, [["music", 36.06], ["car", 7.99], ["vehicle", 5.9]]], "duration": [2.72, 0.89, 3.32, 2.8, 35.87, 0.93, 23.27]} \ No newline at end of file diff --git a/annotations_1/_JoP_xhSETM_filtered.json b/annotations_1/_JoP_xhSETM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..acc80d79ac89d399ea1984bfdf7433e0c800bc46 --- /dev/null +++ b/annotations_1/_JoP_xhSETM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 32.02], [35.0, 36.09], [37.0, 38.7], [39.0, 51.22], [54.0, 141.3], [144.0, 156.51], [157.0, 156.64], [157.0, 157.18], [160.0, 165.16], [169.0, 192.94], [197.0, 207.05]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [50.51, 0.0, 0.0, 29.79, 0.0, 32.53, 0.0, 0.0, 39.38, 30.53, 35.11], "audiomae_on_audioset": [null, null, null, [["hum", 18.42], ["mains hum", 11.71], ["fly, housefly", 8.75]], null, [["speech", 42.66], ["music", 14.96], ["coin (dropping)", 8.73]], null, null, [["speech", 86.85], ["music", 3.12], ["fart", 1.13]], [["music", 37.95], ["speech", 29.97], ["animal", 3.04]], [["music", 51.85], ["didgeridoo", 18.84], ["ambient music", 4.03]]], "duration": [19.02, 1.09, 1.7, 12.22, 87.3, 12.51, -0.36, 0.18, 5.16, 23.94, 10.05]} \ No newline at end of file diff --git a/annotations_1/_KzpueROmto_filtered.json b/annotations_1/_KzpueROmto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38e4afadacecef816698513909058cef5da3d210 --- /dev/null +++ b/annotations_1/_KzpueROmto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.08], [4.0, 5.61], [8.0, 10.03], [10.0, 10.07], [16.0, 18.42], [19.0, 22.11], [23.0, 54.43], [55.0, 170.95], [172.0, 179.79], [181.0, 181.6], [183.0, 188.15], [192.0, 192.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 88.83, 0.0, 92.97, 90.6, 0.0, 0.0, 58.81, 0.0, 41.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 41.68], ["speech", 26.05], ["hum", 8.15]], null], "duration": [0.08, 1.61, 2.03, 0.07, 2.42, 3.11, 31.43, 115.95, 7.79, 0.6, 5.15, 0.18]} \ No newline at end of file diff --git a/annotations_1/_LzgxVd1wF8_filtered.json b/annotations_1/_LzgxVd1wF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08ee0192bfcbf2c88b5ce89a5691c83f25fed987 --- /dev/null +++ b/annotations_1/_LzgxVd1wF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.61], [15.0, 17.32], [18.0, 19.63], [22.0, 22.38], [24.0, 25.49], [28.0, 31.62], [32.0, 33.35], [37.0, 38.69], [40.0, 41.23], [46.0, 46.48], [51.0, 52.17], [53.0, 54.92], [62.0, 63.34], [64.0, 67.27], [69.0, 69.77], [73.0, 73.89], [76.0, 77.38], [82.0, 82.83], [87.0, 88.65], [96.0, 102.88], [107.0, 110.42], [112.0, 112.75], [119.0, 119.58], [122.0, 125.81], [128.0, 128.61], [135.0, 136.29], [139.0, 139.92], [147.0, 146.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.22, 0.0, 0.0, 0.0, 48.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.53, 0.0, 0.0, 0.0, 0.0, 0.0, 34.1, 49.59, 0.0, 0.0, 43.25, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["mains hum", 38.84], ["hum", 34.98], ["music", 7.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.28], ["theremin", 7.84], ["musical instrument", 4.14]], [["music", 75.24], ["speech", 3.03], ["musical instrument", 1.94]], null, null, [["music", 57.0], ["carnatic music", 13.38], ["middle eastern music", 5.05]], null, null, null, null], "duration": [0.61, 2.32, 1.63, 0.38, 1.49, 3.62, 1.35, 1.69, 1.23, 0.48, 1.17, 1.92, 1.34, 3.27, 0.77, 0.89, 1.38, 0.83, 1.65, 6.88, 3.42, 0.75, 0.58, 3.81, 0.61, 1.29, 0.92, -0.03]} \ No newline at end of file diff --git a/annotations_1/_Mr6MQB8vRg_filtered.json b/annotations_1/_Mr6MQB8vRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5c77064d85523ab1d7f4ca821dafc8ddfd4e28b --- /dev/null +++ b/annotations_1/_Mr6MQB8vRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 21.32], [23.0, 30.43], [31.0, 36.14], [39.0, 42.16], [43.0, 46.95], [49.0, 51.83], [53.0, 53.69], [54.0, 56.13], [58.0, 61.15], [69.0, 77.68], [80.0, 85.26], [86.0, 88.97], [91.0, 92.21], [92.0, 92.26], [94.0, 96.13], [98.0, 104.11], [105.0, 106.76], [109.0, 110.2], [111.0, 112.18], [116.0, 116.5], [117.0, 116.82], [117.0, 118.59], [120.0, 124.5], [125.0, 125.59], [127.0, 127.97], [130.0, 134.4], [137.0, 137.25], [144.0, 145.42], [147.0, 157.06], [158.0, 168.72], [173.0, 177.35], [180.0, 179.96]], "keep_status": [true, false, true, true, false, false, false, true, true, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [30.4, 35.71, 35.0, 36.87, 40.24, 52.68, 0.0, 29.77, 28.34, 28.26, 28.77, 29.62, 0.0, 0.0, 31.65, 47.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 0.0, 0.0, 40.57, 0.0, 0.0, 29.12, 29.31, 41.1, 0.0], "audiomae_on_audioset": [[["speech", 35.6], ["music", 15.49], ["sound effect", 4.56]], [["music", 42.2], ["speech", 34.92], ["hum", 2.66]], [["music", 34.03], ["hum", 17.23], ["throbbing", 9.81]], [["music", 32.75], ["speech", 12.68], ["brass instrument", 3.19]], [["music", 40.34], ["throbbing", 16.31], ["hum", 15.65]], null, null, [["hum", 25.07], ["music", 20.22], ["throbbing", 14.2]], [["music", 16.75], ["vehicle", 8.9], ["rumble", 7.71]], [["music", 54.53], ["hum", 12.68], ["mains hum", 6.97]], [["mains hum", 32.03], ["hum", 19.42], ["music", 17.38]], [["music", 64.13], ["speech", 8.92], ["electronic music", 3.16]], null, null, [["music", 42.42], ["whack, thwack", 11.58], ["breaking", 4.5]], [["music", 40.59], ["didgeridoo", 12.41], ["theremin", 4.74]], null, null, null, null, null, null, null, null, null, [["mains hum", 19.85], ["hum", 17.32], ["music", 12.77]], null, null, [["music", 77.63], ["throbbing", 3.68], ["theremin", 1.38]], [["music", 53.68], ["speech", 21.51], ["didgeridoo", 4.5]], [["music", 57.09], ["musical instrument", 8.83], ["percussion", 4.68]], null], "duration": [14.32, 7.43, 5.14, 3.16, 3.95, 2.83, 0.69, 2.13, 3.15, 8.68, 5.26, 2.97, 1.21, 0.26, 2.13, 6.11, 1.76, 1.2, 1.18, 0.5, -0.18, 1.59, 4.5, 0.59, 0.97, 4.4, 0.25, 1.42, 10.06, 10.72, 4.35, -0.04]} \ No newline at end of file diff --git a/annotations_1/_O8yGbcFmc4_filtered.json b/annotations_1/_O8yGbcFmc4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c23d7a8f4c9a53083a46408bb9f039b17e32313 --- /dev/null +++ b/annotations_1/_O8yGbcFmc4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.41], [22.0, 25.46], [27.0, 27.8], [28.0, 28.7], [32.0, 35.38], [41.0, 47.7], [74.0, 74.34], [84.0, 90.44], [92.0, 92.01], [95.0, 101.28], [101.0, 103.84], [105.0, 106.51], [108.0, 108.24], [111.0, 111.62]], "keep_status": [false, true, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 47.16, 0.0, 0.0, 82.61, 60.79, 0.0, 29.76, 0.0, 29.25, 32.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 35.47], ["music", 25.56], ["musical instrument", 3.09]], null, null, null, null, null, [["speech", 85.73], ["breaking", 4.95], ["sidetone", 1.44]], null, [["speech", 26.23], ["livestock, farm animals, working animals", 13.57], ["music", 8.97]], [["whale vocalization", 32.18], ["speech", 20.08], ["chirp tone", 6.45]], null, null, null], "duration": [1.41, 3.46, 0.8, 0.7, 3.38, 6.7, 0.34, 6.44, 0.01, 6.28, 2.84, 1.51, 0.24, 0.62]} \ No newline at end of file diff --git a/annotations_1/_O9lT22rCj8_filtered.json b/annotations_1/_O9lT22rCj8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1beef38f21a78598144c80a8d8270acb6e8f22f --- /dev/null +++ b/annotations_1/_O9lT22rCj8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.2], [8.0, 10.35], [11.0, 11.03], [20.0, 20.61], [25.0, 26.1], [33.0, 33.89], [34.0, 38.97], [40.0, 42.87], [44.0, 48.05], [50.0, 53.42], [55.0, 56.1], [57.0, 57.6], [61.0, 63.09], [67.0, 67.46], [71.0, 88.21], [91.0, 97.23], [98.0, 99.06], [100.0, 100.26], [100.0, 100.35], [101.0, 100.55], [101.0, 105.36], [107.0, 110.37], [113.0, 113.98], [115.0, 116.34]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 51.77, 0.0, 0.0, 0.0, 0.0, 37.97, 88.46, 99.44, 31.18, 0.0, 0.0, 100.0, 0.0, 31.65, 34.7, 0.0, 0.0, 0.0, 0.0, 43.98, 99.98, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 28.2], ["livestock, farm animals, working animals", 18.07], ["cattle, bovinae", 13.91]], null, null, [["groan", 21.78], ["wail, moan", 19.04], ["speech", 18.8]], null, null, null, null, [["music", 32.84], ["whack, thwack", 25.08], ["smash, crash", 17.54]], [["music", 46.21], ["speech", 15.08], ["didgeridoo", 7.94]], null, null, null, null, [["speech", 35.55], ["music", 26.28], ["throbbing", 9.06]], null, null, null], "duration": [1.2, 2.35, 0.03, 0.61, 1.1, 0.89, 4.97, 2.87, 4.05, 3.42, 1.1, 0.6, 2.09, 0.46, 17.21, 6.23, 1.06, 0.26, 0.35, -0.45, 4.36, 3.37, 0.98, 1.34]} \ No newline at end of file diff --git a/annotations_1/_OZS09-GVTg_filtered.json b/annotations_1/_OZS09-GVTg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7141b03cad9875b7ce8119cdefbf4c6a207a92da --- /dev/null +++ b/annotations_1/_OZS09-GVTg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 29.22], [32.0, 33.79], [35.0, 40.37], [42.0, 42.2], [45.0, 49.94], [55.0, 54.85], [58.0, 57.81], [62.0, 68.03], [71.0, 92.4], [94.0, 96.4], [103.0, 103.05], [104.0, 104.6], [106.0, 107.89], [108.0, 108.85], [109.0, 113.05], [117.0, 117.34], [120.0, 124.28], [126.0, 128.29], [131.0, 130.6], [132.0, 136.65], [139.0, 139.26], [141.0, 140.93], [141.0, 143.33], [146.0, 146.57], [154.0, 162.09], [165.0, 165.69], [166.0, 174.73]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, true, false, true, true, false, false, false, false, true, false, false, false, true], "silence_prob": [29.93, 0.0, 36.49, 0.0, 29.36, 0.0, 0.0, 29.33, 30.0, 36.29, 0.0, 0.0, 0.0, 0.0, 41.18, 0.0, 29.23, 29.94, 0.0, 30.44, 0.0, 0.0, 29.14, 0.0, 30.89, 0.0, 30.8], "audiomae_on_audioset": [[["throbbing", 31.36], ["music", 23.08], ["speech", 18.54]], null, [["throbbing", 28.62], ["hum", 27.18], ["music", 19.36]], null, [["music", 34.47], ["throbbing", 14.66], ["hum", 9.96]], null, null, [["music", 68.18], ["throbbing", 9.84], ["speech", 7.41]], [["music", 65.16], ["throbbing", 11.7], ["hum", 6.93]], [["music", 49.63], ["speech", 9.55], ["didgeridoo", 4.36]], null, null, null, null, [["hum", 15.19], ["mains hum", 15.15], ["music", 15.13]], null, [["music", 38.63], ["siren", 10.86], ["speech", 3.38]], [["music", 17.76], ["mosquito", 14.33], ["speech", 13.47]], null, [["music", 43.7], ["speech", 23.1], ["didgeridoo", 8.25]], null, null, [["speech", 44.33], ["music", 18.27], ["noise", 4.32]], null, [["music", 65.24], ["speech", 5.54], ["musical instrument", 3.22]], null, [["speech", 31.52], ["hum", 18.65], ["mains hum", 10.96]]], "duration": [23.22, 1.79, 5.37, 0.2, 4.94, -0.15, -0.19, 6.03, 21.4, 2.4, 0.05, 0.6, 1.89, 0.85, 4.05, 0.34, 4.28, 2.29, -0.4, 4.65, 0.26, -0.07, 2.33, 0.57, 8.09, 0.69, 8.73]} \ No newline at end of file diff --git a/annotations_1/_OaOalM_tcY_filtered.json b/annotations_1/_OaOalM_tcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d202eb7b4cc6e1812e5e43223f49b7feb532fffe --- /dev/null +++ b/annotations_1/_OaOalM_tcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.31], [21.0, 22.3], [23.0, 23.94], [27.0, 27.5], [33.0, 32.81], [55.0, 56.03], [69.0, 70.12], [73.0, 74.07], [76.0, 76.01]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.31, 1.3, 0.94, 0.5, -0.19, 1.03, 1.12, 1.07, 0.01]} \ No newline at end of file diff --git a/annotations_1/_OrEOa0TYTY_filtered.json b/annotations_1/_OrEOa0TYTY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..722cd1cd7c7272341a147042a97c9e99410ab5d2 --- /dev/null +++ b/annotations_1/_OrEOa0TYTY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.26], [4.0, 5.17], [6.0, 6.83], [10.0, 10.72], [12.0, 13.2], [13.0, 17.0], [23.0, 23.94], [26.0, 27.43], [34.0, 35.13], [36.0, 36.78], [40.0, 40.0], [42.0, 42.57], [49.0, 49.76], [53.0, 54.3], [70.0, 70.44], [71.0, 72.37], [75.0, 75.57], [93.0, 94.12], [96.0, 96.4], [103.0, 103.28], [105.0, 106.3], [115.0, 115.01], [128.0, 129.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 52.87], ["music", 26.79], ["didgeridoo", 3.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 1.17, 0.83, 0.72, 1.2, 4.0, 0.94, 1.43, 1.13, 0.78, 0.0, 0.57, 0.76, 1.3, 0.44, 1.37, 0.57, 1.12, 0.4, 0.28, 1.3, 0.01, 1.36]} \ No newline at end of file diff --git a/annotations_1/_PSEaTZSZEE_filtered.json b/annotations_1/_PSEaTZSZEE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23189da58b70070b3ca9f6095c29da68bb865c28 --- /dev/null +++ b/annotations_1/_PSEaTZSZEE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.91], [7.0, 6.98], [10.0, 10.13], [13.0, 14.3], [24.0, 26.45], [28.0, 28.93], [30.0, 30.82], [31.0, 32.86], [34.0, 34.94], [37.0, 37.05], [41.0, 41.57], [48.0, 48.14], [60.0, 60.35], [62.0, 62.02], [63.0, 63.54], [66.0, 66.97], [79.0, 79.78], [81.0, 82.39], [87.0, 87.67], [96.0, 95.96], [97.0, 96.99], [97.0, 99.98], [125.0, 125.52], [129.0, 129.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 94.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.91, -0.02, 0.13, 1.3, 2.45, 0.93, 0.82, 1.86, 0.94, 0.05, 0.57, 0.14, 0.35, 0.02, 0.54, 0.97, 0.78, 1.39, 0.67, -0.04, -0.01, 2.98, 0.52, 0.96]} \ No newline at end of file diff --git a/annotations_1/_PSZEvsYD6o_filtered.json b/annotations_1/_PSZEvsYD6o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5aa9705906ec72bcd6b81cac27e367f7e372ff03 --- /dev/null +++ b/annotations_1/_PSZEvsYD6o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 48.73], [53.0, 60.02]], "keep_status": [true, true], "silence_prob": [30.36, 31.6], "audiomae_on_audioset": [[["hum", 15.33], ["noise", 12.14], ["music", 10.53]], [["white noise", 31.18], ["noise", 24.27], ["sine wave", 11.8]]], "duration": [14.73, 7.02]} \ No newline at end of file diff --git a/annotations_1/_QKwR14HKf8_filtered.json b/annotations_1/_QKwR14HKf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e4741475b2c8dcf8ee0aab1bf0dcde8932ec50a --- /dev/null +++ b/annotations_1/_QKwR14HKf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.86], [8.0, 8.83], [11.0, 11.21], [13.0, 16.09], [17.0, 19.33], [20.0, 21.71], [26.0, 27.63], [29.0, 29.4], [30.0, 32.24], [33.0, 34.01], [35.0, 37.99], [39.0, 40.71], [42.0, 45.25], [46.0, 46.75], [48.0, 48.81], [49.0, 87.32], [89.0, 104.16], [105.0, 122.39], [123.0, 131.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 95.23, 100.0, 0.0, 0.0, 0.0, 93.13, 0.0, 100.0, 0.0, 94.95, 0.0, 0.0, 0.0, 61.67, 91.81, 99.21], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.83, 0.21, 3.09, 2.33, 1.71, 1.63, 0.4, 2.24, 1.01, 2.99, 1.71, 3.25, 0.75, 0.81, 38.32, 15.16, 17.39, 8.85]} \ No newline at end of file diff --git a/annotations_1/_RG8hoGMxKw_filtered.json b/annotations_1/_RG8hoGMxKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..462e73dc90ff1f9d1ebfac3166a32007735d2f3c --- /dev/null +++ b/annotations_1/_RG8hoGMxKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 20.73], [23.0, 28.49], [32.0, 40.85], [41.0, 40.88], [41.0, 40.91], [44.0, 45.2], [46.0, 52.64], [54.0, 57.25], [60.0, 60.07], [63.0, 64.61], [67.0, 67.46], [78.0, 78.16], [87.0, 87.17], [88.0, 88.15], [90.0, 93.43], [93.0, 93.5], [94.0, 93.56], [94.0, 93.97], [99.0, 100.82], [110.0, 116.28], [122.0, 125.34], [127.0, 141.88], [144.0, 145.71]], "keep_status": [true, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [31.66, 31.98, 31.8, 0.0, 0.0, 0.0, 57.72, 46.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.59, 0.0, 0.0, 0.0, 0.0, 31.78, 31.59, 31.29, 0.0], "audiomae_on_audioset": [[["music", 30.11], ["buzz", 13.26], ["speech", 6.76]], [["music", 45.34], ["speech", 11.02], ["throbbing", 6.3]], [["music", 23.98], ["fly, housefly", 22.28], ["mosquito", 11.87]], null, null, null, null, [["music", 39.54], ["musical instrument", 5.96], ["wind instrument, woodwind instrument", 4.55]], null, null, null, null, null, null, [["music", 41.32], ["speech", 31.71], ["didgeridoo", 4.03]], null, null, null, null, [["music", 48.97], ["didgeridoo", 14.67], ["livestock, farm animals, working animals", 5.82]], [["music", 51.6], ["chant", 5.06], ["speech", 3.5]], [["music", 75.36], ["didgeridoo", 13.53], ["musical instrument", 1.57]], null], "duration": [9.73, 5.49, 8.85, -0.12, -0.09, 1.2, 6.64, 3.25, 0.07, 1.61, 0.46, 0.16, 0.17, 0.15, 3.43, 0.5, -0.44, -0.03, 1.82, 6.28, 3.34, 14.88, 1.71]} \ No newline at end of file diff --git a/annotations_1/_RHrQlqoTTA_filtered.json b/annotations_1/_RHrQlqoTTA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f5d514f7a7835c85a3b4f430a9b9b2db70ced18 --- /dev/null +++ b/annotations_1/_RHrQlqoTTA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [5.0, 8.5], [9.0, 11.53], [12.0, 12.46], [13.0, 13.78], [15.0, 17.88], [18.0, 24.11], [25.0, 27.35], [28.0, 28.7], [29.0, 29.37], [30.0, 30.13], [30.0, 37.66], [38.0, 40.73], [41.0, 40.76], [43.0, 43.65], [44.0, 46.01], [47.0, 48.24], [49.0, 55.12], [56.0, 63.73], [64.0, 70.46], [71.0, 71.47], [72.0, 72.72], [74.0, 78.71], [79.0, 85.94], [86.0, 92.18], [93.0, 94.68], [96.0, 96.58], [97.0, 99.76], [101.0, 101.56], [103.0, 104.01], [106.0, 107.82], [109.0, 110.27], [113.0, 113.56], [115.0, 114.76], [117.0, 118.08], [121.0, 122.79], [125.0, 124.8], [126.0, 128.83], [129.0, 131.85], [134.0, 135.35], [136.0, 136.68], [138.0, 138.81], [142.0, 143.04], [144.0, 145.99], [147.0, 148.0], [149.0, 149.74], [151.0, 152.9], [154.0, 158.68], [160.0, 164.51], [165.0, 165.52], [167.0, 167.37], [170.0, 170.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 71.57, 100.0, 0.0, 0.0, 82.61, 49.13, 100.0, 0.0, 0.0, 0.0, 42.76, 46.22, 0.0, 0.0, 64.86, 0.0, 67.25, 99.9, 96.89, 0.0, 0.0, 51.12, 91.47, 52.68, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 43.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.15, 99.88, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 65.02], ["radio", 14.46], ["sidetone", 10.59]], null, null, null, null, [["speech", 29.22], ["laughter", 10.09], ["crying, sobbing", 8.15]], [["chuckle, chortle", 29.74], ["snicker", 20.26], ["baby laughter", 10.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 50.32], ["sidetone", 19.95], ["radio", 9.14]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 3.5, 2.53, 0.46, 0.78, 2.88, 6.11, 2.35, 0.7, 0.37, 0.13, 7.66, 2.73, -0.24, 0.65, 2.01, 1.24, 6.12, 7.73, 6.46, 0.47, 0.72, 4.71, 6.94, 6.18, 1.68, 0.58, 2.76, 0.56, 1.01, 1.82, 1.27, 0.56, -0.24, 1.08, 1.79, -0.2, 2.83, 2.85, 1.35, 0.68, 0.81, 1.04, 1.99, 1.0, 0.74, 1.9, 4.68, 4.51, 0.52, 0.37, 0.95]} \ No newline at end of file diff --git a/annotations_1/_RWkRZDPnao_filtered.json b/annotations_1/_RWkRZDPnao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a541d58e8515e1caa275036952e401197a5c6a31 --- /dev/null +++ b/annotations_1/_RWkRZDPnao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.72], [14.0, 14.82], [17.0, 17.93], [21.0, 20.92], [26.0, 25.98], [28.0, 28.39], [35.0, 49.67], [51.0, 51.98], [54.0, 54.82], [56.0, 55.98], [57.0, 61.21], [63.0, 64.2], [71.0, 72.4], [74.0, 74.44], [79.0, 80.43], [81.0, 82.12], [85.0, 89.24], [90.0, 91.52], [94.0, 95.98], [97.0, 98.73], [101.0, 103.18], [104.0, 105.58], [108.0, 109.38], [111.0, 111.96], [113.0, 113.22], [118.0, 118.64], [122.0, 122.23], [124.0, 124.43], [127.0, 127.92], [132.0, 132.22], [133.0, 134.2], [136.0, 136.98], [139.0, 139.16], [142.0, 143.04], [146.0, 147.24], [149.0, 149.54], [150.0, 151.53], [152.0, 152.68], [154.0, 154.41], [155.0, 157.28], [160.0, 160.93], [162.0, 162.3], [166.0, 166.46], [169.0, 169.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.78, 0.0, 0.0, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 87.91], ["sidetone", 4.76], ["radio", 2.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.72, 0.82, 0.93, -0.08, -0.02, 0.39, 14.67, 0.98, 0.82, -0.02, 4.21, 1.2, 1.4, 0.44, 1.43, 1.12, 4.24, 1.52, 1.98, 1.73, 2.18, 1.58, 1.38, 0.96, 0.22, 0.64, 0.23, 0.43, 0.92, 0.22, 1.2, 0.98, 0.16, 1.04, 1.24, 0.54, 1.53, 0.68, 0.41, 2.28, 0.93, 0.3, 0.46, 0.69]} \ No newline at end of file diff --git a/annotations_1/_S6GYF1B8Yk_filtered.json b/annotations_1/_S6GYF1B8Yk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5207879a22297d5a6f875a2ca730d1f59affbb3 --- /dev/null +++ b/annotations_1/_S6GYF1B8Yk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.59], [17.0, 19.03], [21.0, 22.23], [25.0, 26.22], [28.0, 30.1], [72.0, 75.0], [75.0, 75.95], [78.0, 79.12], [80.0, 81.62], [82.0, 83.07], [84.0, 95.37], [100.0, 111.32], [123.0, 124.21], [126.0, 126.47], [128.0, 130.59], [133.0, 133.29], [135.0, 134.55]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 47.16, 0.0, 0.0, 32.82, 32.05, 0.0, 0.0, 0.0, 0.0, 32.28, 29.81, 0.0, 0.0, 33.31, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 55.07], ["whale vocalization", 8.0], ["theremin", 3.66]], null, null, [["foghorn", 57.13], ["music", 23.32], ["trombone", 4.07]], [["trombone", 31.15], ["foghorn", 22.0], ["music", 20.47]], null, null, null, null, [["cattle, bovinae", 42.55], ["moo", 19.81], ["livestock, farm animals, working animals", 15.14]], [["music", 25.66], ["vehicle", 14.73], ["car", 8.95]], null, null, [["foghorn", 87.8], ["music", 2.53], ["trombone", 2.31]], null, null], "duration": [0.59, 2.03, 1.23, 1.22, 2.1, 3.0, 0.95, 1.12, 1.62, 1.07, 11.37, 11.32, 1.21, 0.47, 2.59, 0.29, -0.45]} \ No newline at end of file diff --git a/annotations_1/_SdYxgbXnHs_filtered.json b/annotations_1/_SdYxgbXnHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bf69fcedeaffb96c2623dfeeb43c01970de651e --- /dev/null +++ b/annotations_1/_SdYxgbXnHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.09], [17.0, 18.3], [20.0, 30.69], [31.0, 32.46], [33.0, 37.02]], "keep_status": [false, false, true, false, false], "silence_prob": [51.94, 0.0, 43.58, 0.0, 55.46], "audiomae_on_audioset": [null, null, [["music", 33.73], ["speech", 7.74], ["ambient music", 6.13]], null, null], "duration": [2.09, 1.3, 10.69, 1.46, 4.02]} \ No newline at end of file diff --git a/annotations_1/_TmztVM7Z4s_filtered.json b/annotations_1/_TmztVM7Z4s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b14ef5db7a73a74a94d779d232c6a5bd305f00be --- /dev/null +++ b/annotations_1/_TmztVM7Z4s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.44], [1.0, 1.49], [2.0, 1.65], [2.0, 1.9], [7.0, 8.82], [10.0, 10.99], [11.0, 11.45], [11.0, 12.04], [15.0, 17.76], [20.0, 23.26], [27.0, 39.28], [42.0, 44.15], [46.0, 46.35], [52.0, 77.09], [83.0, 84.91], [86.0, 87.72], [89.0, 89.26], [91.0, 91.44], [92.0, 93.34], [95.0, 96.23], [97.0, 97.07], [104.0, 105.06], [110.0, 110.74], [115.0, 125.56], [130.0, 132.36]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.26, 51.88, 33.28, 39.61, 0.0, 28.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.59, 34.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 35.14], ["didgeridoo", 16.68], ["speech", 11.77]], null, [["music", 42.04], ["sidetone", 16.41], ["hum", 9.4]], [["music", 23.11], ["didgeridoo", 15.69], ["speech", 7.55]], null, [["music", 28.25], ["speech", 11.92], ["livestock, farm animals, working animals", 8.03]], null, null, null, null, null, null, null, null, null, [["music", 66.47], ["didgeridoo", 12.79], ["foghorn", 2.98]], [["music", 34.49], ["mains hum", 15.95], ["hum", 10.14]]], "duration": [0.44, 0.49, -0.35, -0.1, 1.82, 0.99, 0.45, 1.04, 2.76, 3.26, 12.28, 2.15, 0.35, 25.09, 1.91, 1.72, 0.26, 0.44, 1.34, 1.23, 0.07, 1.06, 0.74, 10.56, 2.36]} \ No newline at end of file diff --git a/annotations_1/_UvKhc0wVU8_filtered.json b/annotations_1/_UvKhc0wVU8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ac77ad020750d7ded37ec24b6221df3c43bd4e7 --- /dev/null +++ b/annotations_1/_UvKhc0wVU8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.7], [19.0, 24.33], [26.0, 27.21], [35.0, 35.33], [40.0, 41.25], [45.0, 45.44], [52.0, 92.3], [95.0, 95.71], [98.0, 98.29]], "keep_status": [true, true, false, false, false, false, false, false, false], "silence_prob": [31.07, 31.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 39.43], ["brass instrument", 17.02], ["trombone", 10.71]], [["music", 19.0], ["throbbing", 15.46], ["hum", 11.38]], null, null, null, null, null, null, null], "duration": [8.7, 5.33, 1.21, 0.33, 1.25, 0.44, 40.3, 0.71, 0.29]} \ No newline at end of file diff --git a/annotations_1/_VEDJMixt3c_filtered.json b/annotations_1/_VEDJMixt3c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7415c0d5d2d76a1bfd74c2ad5dfa2541260958e6 --- /dev/null +++ b/annotations_1/_VEDJMixt3c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.94], [9.0, 9.39], [14.0, 16.38], [17.0, 34.11], [36.0, 38.37], [40.0, 40.64], [42.0, 42.45], [45.0, 45.42], [51.0, 51.09], [52.0, 52.71], [55.0, 55.61], [63.0, 64.15], [72.0, 72.72], [73.0, 73.68], [75.0, 75.69], [85.0, 86.04], [88.0, 91.57], [92.0, 93.83], [98.0, 99.69], [105.0, 106.17], [108.0, 108.73], [115.0, 115.97], [117.0, 144.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.41, 49.73, 96.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 0.0, 0.0, 0.0, 88.83], "audiomae_on_audioset": [null, null, null, [["hum", 37.16], ["music", 29.28], ["mains hum", 15.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 0.39, 2.38, 17.11, 2.37, 0.64, 0.45, 0.42, 0.09, 0.71, 0.61, 1.15, 0.72, 0.68, 0.69, 1.04, 3.57, 1.83, 1.69, 1.17, 0.73, 0.97, 27.37]} \ No newline at end of file diff --git a/annotations_1/_Vyg1SVaZu4_filtered.json b/annotations_1/_Vyg1SVaZu4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42c66cf9ce259ef707fd4ebec69ecb4bc5873b2f --- /dev/null +++ b/annotations_1/_Vyg1SVaZu4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.88], [6.0, 5.76], [32.0, 32.58], [35.0, 35.73], [36.0, 36.34], [39.0, 39.75], [43.0, 43.29], [45.0, 45.3], [64.0, 64.0], [65.0, 65.42], [85.0, 84.55], [86.0, 86.61], [89.0, 89.24], [92.0, 92.18], [101.0, 100.84], [150.0, 150.28], [153.0, 153.64], [155.0, 155.07], [158.0, 158.75], [162.0, 161.87], [166.0, 166.28], [169.0, 169.18], [170.0, 175.36], [176.0, 177.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.12, -0.24, 0.58, 0.73, 0.34, 0.75, 0.29, 0.3, 0.0, 0.42, -0.45, 0.61, 0.24, 0.18, -0.16, 0.28, 0.64, 0.07, 0.75, -0.13, 0.28, 0.18, 5.36, 1.13]} \ No newline at end of file diff --git a/annotations_1/_WUyZXhLHMk_filtered.json b/annotations_1/_WUyZXhLHMk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81b82c61db5a80d9d4a4b2d858df9be7ec658654 --- /dev/null +++ b/annotations_1/_WUyZXhLHMk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.89], [7.0, 50.68], [54.0, 54.62], [57.0, 58.77], [62.0, 63.66], [65.0, 65.77], [68.0, 72.32], [75.0, 75.63], [76.0, 77.04], [78.0, 85.33], [88.0, 88.89], [91.0, 92.2], [96.0, 96.31], [101.0, 101.6], [103.0, 105.16], [105.0, 105.87], [107.0, 107.6], [109.0, 117.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [61.08, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 68.02, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.89, 43.68, 0.62, 1.77, 1.66, 0.77, 4.32, 0.63, 1.04, 7.33, 0.89, 1.2, 0.31, 0.6, 2.16, 0.87, 0.6, 8.73]} \ No newline at end of file diff --git a/annotations_1/_X6dHrTceEE_filtered.json b/annotations_1/_X6dHrTceEE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cb3179335a88276a070c3ae37f0a56800967bd1 --- /dev/null +++ b/annotations_1/_X6dHrTceEE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.0], [16.0, 17.49], [20.0, 22.82], [26.0, 27.55], [38.0, 39.85], [41.0, 42.06], [43.0, 46.06], [48.0, 49.82], [52.0, 53.05], [54.0, 56.88], [58.0, 60.52], [63.0, 67.04], [68.0, 68.62], [75.0, 93.82], [94.0, 112.82]], "keep_status": [false, false, false, false, false, false, true, false, false, true, true, false, false, true, true], "silence_prob": [51.77, 0.0, 52.22, 0.0, 0.0, 0.0, 39.24, 0.0, 0.0, 43.85, 33.43, 29.89, 0.0, 30.56, 32.08], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 36.97], ["music", 15.95], ["dog", 10.29]], null, null, [["hum", 24.93], ["throbbing", 21.25], ["music", 16.12]], [["music", 35.28], ["throbbing", 19.01], ["hum", 9.0]], [["hum", 59.15], ["throbbing", 17.73], ["mains hum", 12.26]], null, [["music", 32.14], ["hum", 19.61], ["electronic music", 11.63]], [["music", 48.32], ["musical instrument", 11.39], ["violin, fiddle", 8.79]]], "duration": [7.0, 1.49, 2.82, 1.55, 1.85, 1.06, 3.06, 1.82, 1.05, 2.88, 2.52, 4.04, 0.62, 18.82, 18.82]} \ No newline at end of file diff --git a/annotations_1/_X8bBE1M994_filtered.json b/annotations_1/_X8bBE1M994_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/_X8bBE1M994_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/_XSFVQhMC5k_filtered.json b/annotations_1/_XSFVQhMC5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3b0ccb0521e358edc14be395dff5b790776a59b --- /dev/null +++ b/annotations_1/_XSFVQhMC5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.96], [5.0, 4.72], [7.0, 8.26], [9.0, 10.2], [12.0, 13.19], [14.0, 14.93], [22.0, 22.71], [25.0, 25.96], [31.0, 32.66], [38.0, 39.23], [40.0, 40.81], [42.0, 44.79], [48.0, 49.05], [53.0, 53.3], [57.0, 57.32], [66.0, 67.66], [71.0, 71.68], [72.0, 75.51], [76.0, 76.81], [77.0, 78.95], [80.0, 81.92], [82.0, 83.34], [85.0, 90.02], [100.0, 100.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.86, 0.0, 0.0, 0.0, 0.0, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 62.58, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.04, -0.28, 1.26, 1.2, 1.19, 0.93, 0.71, 0.96, 1.66, 1.23, 0.81, 2.79, 1.05, 0.3, 0.32, 1.66, 0.68, 3.51, 0.81, 1.95, 1.92, 1.34, 5.02, 0.58]} \ No newline at end of file diff --git a/annotations_1/_XST7hft6k8_filtered.json b/annotations_1/_XST7hft6k8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34706a3147a78f101c57957f5fb001b0612ec7dd --- /dev/null +++ b/annotations_1/_XST7hft6k8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.54], [10.0, 10.13], [12.0, 14.96], [17.0, 17.29], [20.0, 20.39], [23.0, 22.87], [26.0, 27.11], [33.0, 33.0], [35.0, 37.17], [37.0, 38.31], [40.0, 44.56], [48.0, 57.86], [58.0, 59.66], [63.0, 64.12], [72.0, 72.37], [73.0, 73.33], [75.0, 75.46], [93.0, 93.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.81, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11, 0.0, 69.47, 38.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 66.75], ["musical instrument", 5.89], ["theremin", 3.84]], null, null, null, null, null, null], "duration": [0.54, 0.13, 2.96, 0.29, 0.39, -0.13, 1.11, 0.0, 2.17, 1.31, 4.56, 9.86, 1.66, 1.12, 0.37, 0.33, 0.46, 0.63]} \ No newline at end of file diff --git a/annotations_1/_XuDmoP5scY_filtered.json b/annotations_1/_XuDmoP5scY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/_XuDmoP5scY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/_YMLnL33X78_filtered.json b/annotations_1/_YMLnL33X78_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b4e7664b2d33d65aa6cf44a2796e29ddd3462eb --- /dev/null +++ b/annotations_1/_YMLnL33X78_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.73], [8.0, 8.19], [9.0, 10.23], [15.0, 15.94], [17.0, 17.22], [23.0, 24.71], [30.0, 30.87], [32.0, 32.76], [35.0, 35.4], [36.0, 36.76], [39.0, 39.56], [42.0, 42.08], [45.0, 45.69], [48.0, 49.92], [53.0, 53.79], [56.0, 56.35], [58.0, 58.72], [60.0, 60.62], [70.0, 70.7], [74.0, 76.01], [79.0, 80.06], [85.0, 85.4], [87.0, 87.05], [93.0, 94.69], [98.0, 100.67], [108.0, 109.04], [113.0, 113.04], [116.0, 116.77], [118.0, 118.71], [125.0, 125.73], [129.0, 130.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.35, 0.0, 0.0, 0.0, 0.0, 36.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 70.52], ["musical instrument", 5.0], ["theremin", 4.61]], null, null, null, null, [["music", 41.92], ["speech", 13.46], ["musical instrument", 2.37]], null, null, null, null, null, null], "duration": [0.73, 0.19, 1.23, 0.94, 0.22, 1.71, 0.87, 0.76, 0.4, 0.76, 0.56, 0.08, 0.69, 1.92, 0.79, 0.35, 0.72, 0.62, 0.7, 2.01, 1.06, 0.4, 0.05, 1.69, 2.67, 1.04, 0.04, 0.77, 0.71, 0.73, 1.06]} \ No newline at end of file diff --git a/annotations_1/_ZA8FE-nu3E_filtered.json b/annotations_1/_ZA8FE-nu3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7f2dc3bae051329b73dd6d904f2c3718dcfcdf7 --- /dev/null +++ b/annotations_1/_ZA8FE-nu3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.32], [10.0, 10.91], [12.0, 14.08], [16.0, 20.14], [22.0, 22.62], [24.0, 24.87], [27.0, 28.19], [29.0, 32.16], [33.0, 34.96], [37.0, 37.72], [39.0, 43.43], [45.0, 45.37], [47.0, 66.12], [66.0, 67.39]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.67, 99.05, 0.0, 0.0, 0.0, 93.29, 0.0, 0.0, 87.19, 0.0, 81.53, 0.0], "audiomae_on_audioset": [null, null, [["music", 19.63], ["whale vocalization", 18.18], ["squeak", 10.48]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 0.91, 2.08, 4.14, 0.62, 0.87, 1.19, 3.16, 1.96, 0.72, 4.43, 0.37, 19.12, 1.39]} \ No newline at end of file diff --git a/annotations_1/_Z_n2Ray64o_filtered.json b/annotations_1/_Z_n2Ray64o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba3c483b26845bf4035ed60fda65a5b5235dae1e --- /dev/null +++ b/annotations_1/_Z_n2Ray64o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.13], [18.0, 18.2], [21.0, 33.79], [41.0, 62.48], [65.0, 65.57], [67.0, 76.5], [79.0, 82.7], [85.0, 85.38], [86.0, 86.58], [90.0, 96.21], [99.0, 110.56], [112.0, 122.47], [130.0, 137.13], [142.0, 143.97], [146.0, 146.35], [147.0, 147.5], [148.0, 147.53], [148.0, 147.56], [148.0, 147.6], [152.0, 156.66], [160.0, 167.48], [170.0, 170.23]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [34.88, 0.0, 29.67, 29.24, 0.0, 28.85, 29.38, 0.0, 0.0, 28.69, 29.01, 29.76, 28.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.4, 28.27, 0.0], "audiomae_on_audioset": [[["music", 33.76], ["speech", 27.49], ["throbbing", 9.29]], null, [["music", 61.91], ["hum", 3.93], ["cacophony", 3.12]], [["music", 72.63], ["sound effect", 2.07], ["buzz", 1.68]], null, [["music", 62.64], ["speech", 18.96], ["cacophony", 2.36]], [["music", 73.09], ["buzz", 2.67], ["outside, rural or natural", 2.37]], null, null, [["speech", 35.02], ["hum", 13.29], ["music", 11.74]], [["music", 73.22], ["cacophony", 7.97], ["sound effect", 2.2]], [["music", 71.88], ["hum", 4.33], ["cacophony", 2.8]], [["music", 77.0], ["soundtrack music", 1.85], ["eruption", 1.78]], null, null, null, null, null, null, [["cacophony", 22.26], ["music", 21.26], ["buzz", 4.76]], [["music", 32.45], ["speech", 26.06], ["noise", 8.72]], null], "duration": [2.13, 0.2, 12.79, 21.48, 0.57, 9.5, 3.7, 0.38, 0.58, 6.21, 11.56, 10.47, 7.13, 1.97, 0.35, 0.5, -0.47, -0.44, -0.4, 4.66, 7.48, 0.23]} \ No newline at end of file diff --git a/annotations_1/_ZwkQIBp4TA_filtered.json b/annotations_1/_ZwkQIBp4TA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2db2dfbcc7d789b7e99504c3c4a9b933ce9a130f --- /dev/null +++ b/annotations_1/_ZwkQIBp4TA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.27], [4.0, 5.95], [7.0, 8.23], [11.0, 12.38], [14.0, 14.99], [16.0, 17.17], [19.0, 26.23], [29.0, 29.35], [30.0, 31.06], [32.0, 32.46], [33.0, 34.01], [35.0, 40.74], [46.0, 46.5], [51.0, 55.36], [58.0, 58.28], [70.0, 70.29], [71.0, 71.79], [73.0, 76.52], [81.0, 83.19], [85.0, 85.23], [86.0, 87.94], [89.0, 89.19], [109.0, 111.72], [128.0, 129.66]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [85.9, 0.0, 0.0, 0.0, 0.0, 0.0, 49.97, 0.0, 0.0, 0.0, 0.0, 38.31, 0.0, 78.38, 0.0, 0.0, 0.0, 39.3, 60.23, 0.0, 0.0, 0.0, 31.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 22.59], ["music", 16.11], ["effects unit", 9.36]], null, null, null, null, [["animal", 30.13], ["music", 18.97], ["wild animals", 6.83]], null, null, null, null, null, [["cowbell", 38.56], ["livestock, farm animals, working animals", 26.27], ["cattle, bovinae", 14.66]], null, null, null, null, [["speech", 30.61], ["vehicle", 12.02], ["fly, housefly", 5.06]], null], "duration": [2.27, 1.95, 1.23, 1.38, 0.99, 1.17, 7.23, 0.35, 1.06, 0.46, 1.01, 5.74, 0.5, 4.36, 0.28, 0.29, 0.79, 3.52, 2.19, 0.23, 1.94, 0.19, 2.72, 1.66]} \ No newline at end of file diff --git a/annotations_1/_ZzKJflnVHU_filtered.json b/annotations_1/_ZzKJflnVHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6993d4f365fefe8bfb23f4e7fcab46166d3530e3 --- /dev/null +++ b/annotations_1/_ZzKJflnVHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[150.0, 151.07], [152.0, 153.03], [154.0, 165.2], [166.0, 166.97], [169.0, 169.25], [172.0, 172.49], [175.0, 180.32], [181.0, 182.04], [196.0, 196.79], [201.0, 202.37], [205.0, 205.39], [207.0, 206.71]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.21, 0.0, 0.0, 0.0, 40.62, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 55.73], ["insect", 7.21], ["fly, housefly", 5.29]], null, null, null, [["hum", 26.71], ["speech", 21.08], ["throbbing", 16.03]], null, null, null, null, null], "duration": [1.07, 1.03, 11.2, 0.97, 0.25, 0.49, 5.32, 1.04, 0.79, 1.37, 0.39, -0.29]} \ No newline at end of file diff --git a/annotations_1/__bdFiweOJY_filtered.json b/annotations_1/__bdFiweOJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4fb43ff34a41417c3f53a87beab5372dd8ce6df --- /dev/null +++ b/annotations_1/__bdFiweOJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 18.72], [19.0, 20.97], [23.0, 23.94], [26.0, 39.29], [40.0, 41.1]], "keep_status": [true, false, false, true, false], "silence_prob": [31.36, 0.0, 0.0, 32.2, 0.0], "audiomae_on_audioset": [[["hum", 41.08], ["music", 15.77], ["mains hum", 10.98]], null, null, [["music", 40.84], ["speech", 13.39], ["electronic music", 4.95]], null], "duration": [8.72, 1.97, 0.94, 13.29, 1.1]} \ No newline at end of file diff --git a/annotations_1/__f2KtcXAxI_filtered.json b/annotations_1/__f2KtcXAxI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2a438fb1bca2aa0f96a2a60af86d2425f37c93e --- /dev/null +++ b/annotations_1/__f2KtcXAxI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.7], [9.0, 9.42], [10.0, 10.4], [11.0, 11.38], [13.0, 13.32], [22.0, 22.3], [26.0, 26.01], [26.0, 26.65], [28.0, 28.36], [29.0, 29.54], [30.0, 31.08], [39.0, 40.05], [44.0, 43.87], [57.0, 58.19], [59.0, 62.9], [63.0, 65.64], [67.0, 67.42], [71.0, 71.31], [73.0, 74.31], [75.0, 74.83], [76.0, 76.05], [77.0, 80.06], [82.0, 82.81], [86.0, 87.34], [88.0, 89.13], [90.0, 91.81], [94.0, 94.8], [96.0, 96.5], [98.0, 98.54], [100.0, 99.99], [100.0, 101.51], [102.0, 103.3], [106.0, 107.25], [110.0, 110.76], [112.0, 113.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 63.1, 0.0, 0.0, 0.0, 0.0, 0.0, 51.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.7, 0.42, 0.4, 0.38, 0.32, 0.3, 0.01, 0.65, 0.36, 0.54, 1.08, 1.05, -0.13, 1.19, 3.9, 2.64, 0.42, 0.31, 1.31, -0.17, 0.05, 3.06, 0.81, 1.34, 1.13, 1.81, 0.8, 0.5, 0.54, -0.01, 1.51, 1.3, 1.25, 0.76, 1.31]} \ No newline at end of file diff --git a/annotations_1/_bJYiiCvPW4_filtered.json b/annotations_1/_bJYiiCvPW4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6c350ef5a8a13f83cd422009409f125d6c45823 --- /dev/null +++ b/annotations_1/_bJYiiCvPW4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.66], [4.0, 4.62], [6.0, 10.72], [15.0, 15.42], [16.0, 16.36], [19.0, 22.62], [23.0, 22.94], [26.0, 26.64], [27.0, 43.53], [47.0, 49.42], [62.0, 62.48], [64.0, 64.77], [70.0, 71.15], [78.0, 95.62], [96.0, 101.33], [102.0, 104.14], [113.0, 115.21], [116.0, 124.44]], "keep_status": [false, false, true, false, false, true, false, false, true, true, false, false, false, true, true, true, true, true], "silence_prob": [0.0, 0.0, 37.49, 0.0, 0.0, 30.95, 0.0, 0.0, 29.0, 30.02, 0.0, 0.0, 0.0, 30.49, 29.99, 30.2, 29.89, 29.04], "audiomae_on_audioset": [null, null, [["music", 21.43], ["speech", 16.6], ["whale vocalization", 14.4]], null, null, [["electric shaver, electric razor", 29.48], ["speech", 24.82], ["moo", 4.96]], null, null, [["explosion", 20.53], ["speech", 13.12], ["eruption", 10.99]], [["speech", 24.96], ["explosion", 10.94], ["music", 10.15]], null, null, null, [["speech", 35.37], ["explosion", 11.29], ["fireworks", 9.16]], [["speech", 22.73], ["moo", 11.7], ["cattle, bovinae", 11.32]], [["civil defense siren", 23.57], ["speech", 17.83], ["explosion", 10.72]], [["eruption", 13.91], ["rumble", 11.81], ["whack, thwack", 8.68]], [["buzz", 34.94], ["music", 20.37], ["insect", 12.34]]], "duration": [0.66, 0.62, 4.72, 0.42, 0.36, 3.62, -0.06, 0.64, 16.53, 2.42, 0.48, 0.77, 1.15, 17.62, 5.33, 2.14, 2.21, 8.44]} \ No newline at end of file diff --git a/annotations_1/_dEEXgs7T1k_filtered.json b/annotations_1/_dEEXgs7T1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1f26467562c880ca9324bb2290f3af9a99c0854 --- /dev/null +++ b/annotations_1/_dEEXgs7T1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 18.69], [19.0, 36.93], [41.0, 41.57], [43.0, 43.51], [45.0, 45.44], [46.0, 46.4], [48.0, 86.44], [87.0, 86.56], [87.0, 140.58], [142.0, 151.98], [153.0, 153.39], [153.0, 153.44], [154.0, 154.35], [155.0, 158.58], [160.0, 211.72]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 35.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.26, 0.0, 0.0, 0.0, 29.47, 0.0], "audiomae_on_audioset": [null, [["music", 36.04], ["hum", 14.88], ["throbbing", 14.14]], null, null, null, null, null, null, null, [["speech", 34.14], ["fly, housefly", 20.39], ["music", 8.92]], null, null, null, [["music", 60.34], ["boing", 6.05], ["electric shaver, electric razor", 5.68]], null], "duration": [-0.31, 17.93, 0.57, 0.51, 0.44, 0.4, 38.44, -0.44, 53.58, 9.98, 0.39, 0.44, 0.35, 3.58, 51.72]} \ No newline at end of file diff --git a/annotations_1/_eHwoQ4VQ1o_filtered.json b/annotations_1/_eHwoQ4VQ1o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..201649486d2625908683ace54a996361df52765c --- /dev/null +++ b/annotations_1/_eHwoQ4VQ1o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.87], [19.0, 24.48], [27.0, 28.07], [29.0, 29.15], [30.0, 32.05], [34.0, 35.95], [38.0, 39.07], [44.0, 46.57], [48.0, 56.32], [62.0, 63.44], [70.0, 72.1], [74.0, 76.25], [78.0, 78.81], [81.0, 81.89], [88.0, 103.03], [104.0, 104.33], [108.0, 115.13], [117.0, 117.95], [119.0, 125.22]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [35.67, 31.83, 0.0, 0.0, 31.02, 0.0, 0.0, 34.98, 29.46, 0.0, 30.33, 31.28, 0.0, 0.0, 28.94, 0.0, 28.51, 0.0, 28.53], "audiomae_on_audioset": [[["music", 60.93], ["musical instrument", 7.86], ["bass guitar", 7.32]], [["music", 63.85], ["guitar", 8.62], ["bass guitar", 6.57]], null, null, [["music", 59.5], ["musical instrument", 6.66], ["guitar", 4.38]], null, null, [["music", 29.51], ["bass guitar", 15.44], ["effects unit", 13.62]], [["music", 73.84], ["musical instrument", 6.1], ["bass guitar", 4.68]], null, [["music", 42.19], ["didgeridoo", 16.39], ["guitar", 7.55]], [["speech", 32.07], ["music", 30.24], ["sidetone", 10.44]], null, null, [["music", 75.73], ["effects unit", 3.49], ["musical instrument", 2.95]], null, [["music", 41.95], ["speech", 25.72], ["guitar", 4.83]], null, [["music", 30.06], ["throbbing", 18.85], ["electronic music", 5.86]]], "duration": [9.87, 5.48, 1.07, 0.15, 2.05, 1.95, 1.07, 2.57, 8.32, 1.44, 2.1, 2.25, 0.81, 0.89, 15.03, 0.33, 7.13, 0.95, 6.22]} \ No newline at end of file diff --git a/annotations_1/_emU23tTUAw_filtered.json b/annotations_1/_emU23tTUAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81c57e5dffc85e74f7f3edc57820544b7aca6336 --- /dev/null +++ b/annotations_1/_emU23tTUAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.29], [18.0, 19.03], [21.0, 21.71], [22.0, 22.99], [25.0, 25.71], [36.0, 35.77], [39.0, 40.73], [44.0, 45.84], [58.0, 59.05], [65.0, 65.45], [69.0, 68.99], [71.0, 73.97], [78.0, 78.7], [80.0, 80.69], [81.0, 81.31], [82.0, 83.05], [84.0, 84.6], [91.0, 94.56], [111.0, 111.28], [112.0, 112.5], [113.0, 113.29], [113.0, 113.56], [114.0, 113.59], [114.0, 113.73], [114.0, 113.76], [114.0, 113.8], [114.0, 113.83], [114.0, 113.93], [114.0, 116.13]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.86, 0.0, 0.0, 0.0, 0.0, 0.0, 29.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.71], "audiomae_on_audioset": [[["music", 32.65], ["hum", 12.2], ["throbbing", 10.97]], null, null, null, null, null, null, null, null, null, null, [["hum", 25.33], ["mains hum", 9.72], ["speech", 8.68]], null, null, null, null, null, [["music", 49.21], ["boing", 11.89], ["hum", 9.52]], null, null, null, null, null, null, null, null, null, null, [["speech", 43.02], ["music", 35.36], ["didgeridoo", 5.47]]], "duration": [2.29, 1.03, 0.71, 0.99, 0.71, -0.23, 1.73, 1.84, 1.05, 0.45, -0.01, 2.97, 0.7, 0.69, 0.31, 1.05, 0.6, 3.56, 0.28, 0.5, 0.29, 0.56, -0.41, -0.27, -0.24, -0.2, -0.17, -0.07, 2.13]} \ No newline at end of file diff --git a/annotations_1/_eyLdmCxtPo_filtered.json b/annotations_1/_eyLdmCxtPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4118baa02fefeb7336f8a969e5382c5a5188b5a6 --- /dev/null +++ b/annotations_1/_eyLdmCxtPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.32], [7.0, 8.68], [10.0, 11.03], [12.0, 20.65], [23.0, 26.1], [26.0, 28.9], [30.0, 30.13], [31.0, 31.41], [37.0, 37.02], [39.0, 39.66], [40.0, 40.9], [41.0, 41.77], [42.0, 42.65], [43.0, 44.31], [46.0, 47.9], [50.0, 53.11], [58.0, 61.62], [65.0, 65.6], [69.0, 69.25], [71.0, 71.81], [72.0, 73.04], [74.0, 74.36], [80.0, 80.47], [81.0, 82.26], [92.0, 93.28], [96.0, 96.31], [109.0, 109.44], [124.0, 124.51], [127.0, 128.17], [130.0, 130.86], [148.0, 150.43], [154.0, 154.13], [161.0, 161.13], [161.0, 161.28], [166.0, 166.6], [169.0, 169.37], [172.0, 174.9]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 38.9, 36.9, 36.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.31, 71.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.97, 0.0, 0.0, 0.0, 0.0, 0.0, 34.52], "audiomae_on_audioset": [null, null, null, [["speech", 62.42], ["electric shaver, electric razor", 6.43], ["hum", 5.89]], [["livestock, farm animals, working animals", 36.67], ["cattle, bovinae", 22.18], ["moo", 13.03]], [["speech", 52.39], ["hum", 11.34], ["mains hum", 3.22]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.63], ["mains hum", 18.0], ["speech", 10.17]], null, null, null, null, null, [["speech", 41.05], ["music", 14.13], ["sidetone", 6.56]]], "duration": [1.32, 1.68, 1.03, 8.65, 3.1, 2.9, 0.13, 0.41, 0.02, 0.66, 0.9, 0.77, 0.65, 1.31, 1.9, 3.11, 3.62, 0.6, 0.25, 0.81, 1.04, 0.36, 0.47, 1.26, 1.28, 0.31, 0.44, 0.51, 1.17, 0.86, 2.43, 0.13, 0.13, 0.28, 0.6, 0.37, 2.9]} \ No newline at end of file diff --git a/annotations_1/_f7p28YFgvc_filtered.json b/annotations_1/_f7p28YFgvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1299ff281a5473d21c98efbef67a3cd05ef84d55 --- /dev/null +++ b/annotations_1/_f7p28YFgvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 43.28]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.28]} \ No newline at end of file diff --git a/annotations_1/_g-f7cZGqJ0_filtered.json b/annotations_1/_g-f7cZGqJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..986b6cc0132cb0e39622c93d3ee940243475c48b --- /dev/null +++ b/annotations_1/_g-f7cZGqJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.47], [21.0, 22.92], [26.0, 26.11], [28.0, 29.79], [31.0, 32.63], [34.0, 33.79], [36.0, 38.8], [46.0, 47.31], [49.0, 57.82], [59.0, 61.57], [67.0, 68.55], [71.0, 71.41], [77.0, 77.18], [79.0, 79.74], [81.0, 81.6], [83.0, 84.32], [85.0, 86.76], [88.0, 91.37], [92.0, 92.31], [94.0, 101.36], [102.0, 102.0], [107.0, 108.11], [109.0, 108.85], [109.0, 108.99], [110.0, 110.35], [111.0, 111.62], [113.0, 113.64], [115.0, 115.99], [117.0, 116.87], [118.0, 119.67], [122.0, 123.8], [128.0, 127.75], [128.0, 128.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.57, 0.0, 38.94, 69.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.24, 0.0, 34.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 79.4], ["sidetone", 2.71], ["hum", 2.25]], null, [["speech", 49.15], ["music", 40.99], ["effects unit", 1.06]], null, null, null, null, null, null, null, null, [["frog", 52.81], ["croak", 22.46], ["noise", 2.74]], null, [["speech", 42.24], ["radio", 33.86], ["telephone dialing, dtmf", 7.14]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 1.92, 0.11, 1.79, 1.63, -0.21, 2.8, 1.31, 8.82, 2.57, 1.55, 0.41, 0.18, 0.74, 0.6, 1.32, 1.76, 3.37, 0.31, 7.36, 0.0, 1.11, -0.15, -0.01, 0.35, 0.62, 0.64, 0.99, -0.13, 1.67, 1.8, -0.25, 0.11]} \ No newline at end of file diff --git a/annotations_1/_gVrJIUmCqU_filtered.json b/annotations_1/_gVrJIUmCqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..647802a12d3f838ac9bf830e3c47fce5c413b52b --- /dev/null +++ b/annotations_1/_gVrJIUmCqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.29], [4.0, 6.84], [8.0, 8.34], [10.0, 10.96], [12.0, 21.81], [24.0, 24.49], [26.0, 26.74], [29.0, 30.4], [33.0, 34.25], [35.0, 35.61], [36.0, 36.53], [38.0, 38.8], [40.0, 42.08], [43.0, 45.39], [49.0, 50.53], [51.0, 52.05], [53.0, 53.6], [58.0, 58.63], [60.0, 62.34], [64.0, 64.86], [66.0, 67.44], [69.0, 70.73], [72.0, 74.06], [75.0, 78.07], [79.0, 84.72], [88.0, 90.22], [91.0, 93.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 88.46, 0.0, 0.0, 81.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.24, 99.9, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 100.0, 66.15, 78.38, 44.69, 50.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 18.28], ["speech", 17.61], ["knock", 17.05]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.78], ["chirp tone", 9.6], ["sine wave", 8.95]], null], "duration": [1.29, 2.84, 0.34, 0.96, 9.81, 0.49, 0.74, 1.4, 1.25, 0.61, 0.53, 0.8, 2.08, 2.39, 1.53, 1.05, 0.6, 0.63, 2.34, 0.86, 1.44, 1.73, 2.06, 3.07, 5.72, 2.22, 2.02]} \ No newline at end of file diff --git a/annotations_1/_i97zAZclkI_filtered.json b/annotations_1/_i97zAZclkI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c702c3efc136d2fc01a9b22cc5bccd8b23c6ef5f --- /dev/null +++ b/annotations_1/_i97zAZclkI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [12.0, 12.72], [36.0, 38.35], [43.0, 43.44], [45.0, 47.9], [61.0, 61.2], [63.0, 64.12], [65.0, 65.72], [69.0, 71.34]], "keep_status": [false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 35.96, 0.0, 56.48, 0.0, 0.0, 0.0, 41.54], "audiomae_on_audioset": [null, null, [["speech", 36.71], ["music", 24.17], ["didgeridoo", 6.09]], null, null, null, null, null, [["music", 34.8], ["sheep", 9.93], ["bleat", 7.09]]], "duration": [0.5, 0.72, 2.35, 0.44, 2.9, 0.2, 1.12, 0.72, 2.34]} \ No newline at end of file diff --git a/annotations_1/_iUWKODwAN8_filtered.json b/annotations_1/_iUWKODwAN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6db3362da3540b16fe1c586f494b0f461ae0464f --- /dev/null +++ b/annotations_1/_iUWKODwAN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [13.0, 12.78], [15.0, 15.55], [20.0, 20.48], [22.0, 22.87], [24.0, 26.65], [28.0, 31.33], [34.0, 34.5], [36.0, 36.27], [40.0, 41.32], [47.0, 49.72], [50.0, 54.14], [55.0, 57.45], [63.0, 64.59], [69.0, 70.01], [71.0, 72.23], [76.0, 77.55], [81.0, 81.46], [83.0, 84.67], [91.0, 100.6], [104.0, 105.09], [107.0, 107.11], [109.0, 109.36], [115.0, 115.5], [118.0, 118.76], [119.0, 120.19], [125.0, 125.59], [127.0, 127.33], [128.0, 128.22], [130.0, 132.49], [133.0, 134.89], [135.0, 137.86], [139.0, 139.72], [141.0, 142.43], [148.0, 147.95], [151.0, 152.73], [154.0, 154.6], [157.0, 157.62], [164.0, 164.98], [166.0, 166.9], [174.0, 174.58], [176.0, 177.92], [180.0, 180.72], [184.0, 185.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 99.4, 0.0, 0.0, 0.0, 99.92, 89.19, 98.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, -0.22, 0.55, 0.48, 0.87, 2.65, 3.33, 0.5, 0.27, 1.32, 2.72, 4.14, 2.45, 1.59, 1.01, 1.23, 1.55, 0.46, 1.67, 9.6, 1.09, 0.11, 0.36, 0.5, 0.76, 1.19, 0.59, 0.33, 0.22, 2.49, 1.89, 2.86, 0.72, 1.43, -0.05, 1.73, 0.6, 0.62, 0.98, 0.9, 0.58, 1.92, 0.72, 1.03]} \ No newline at end of file diff --git a/annotations_1/_kGt7Vv2Pyw_filtered.json b/annotations_1/_kGt7Vv2Pyw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b0c64feac6d95e031081bbede29603f347f6193 --- /dev/null +++ b/annotations_1/_kGt7Vv2Pyw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.05], [20.0, 23.58], [27.0, 27.82], [31.0, 31.8], [32.0, 32.88], [40.0, 40.44], [41.0, 41.3], [42.0, 42.16], [42.0, 42.33], [42.0, 42.4], [43.0, 42.58], [54.0, 54.75], [60.0, 61.69], [62.0, 64.39], [65.0, 65.82], [77.0, 78.97], [86.0, 86.56], [91.0, 90.88], [96.0, 97.02], [113.0, 114.45], [115.0, 115.6], [132.0, 131.94], [133.0, 133.37], [134.0, 136.95], [138.0, 138.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 3.58, 0.82, 0.8, 0.88, 0.44, 0.3, 0.16, 0.33, 0.4, -0.42, 0.75, 1.69, 2.39, 0.82, 1.97, 0.56, -0.12, 1.02, 1.45, 0.6, -0.06, 0.37, 2.95, 0.97]} \ No newline at end of file diff --git a/annotations_1/_mPOfQw2fmY_filtered.json b/annotations_1/_mPOfQw2fmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..926af9f82875316002b4827d51be5c119e367676 --- /dev/null +++ b/annotations_1/_mPOfQw2fmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.79], [5.0, 5.0], [21.0, 21.09], [23.0, 23.38], [28.0, 28.63], [31.0, 34.18], [37.0, 39.33], [40.0, 41.05], [43.0, 53.08], [54.0, 58.33], [59.0, 61.43], [65.0, 69.97], [71.0, 73.7], [76.0, 76.03], [83.0, 83.98], [84.0, 84.54], [85.0, 85.33], [89.0, 91.05], [92.0, 93.97], [104.0, 105.02], [110.0, 110.4], [112.0, 113.68], [120.0, 120.01], [122.0, 122.07], [129.0, 129.73], [130.0, 132.65], [135.0, 135.16], [140.0, 145.25], [146.0, 149.12], [150.0, 151.82], [153.0, 155.29], [158.0, 160.73], [161.0, 172.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 90.08, 0.0, 99.96, 99.88, 100.0, 100.0, 98.93, 0.0, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 100.0, 99.98, 0.0, 99.31, 99.8, 46.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.54], ["speech", 21.87], ["singing bowl", 7.3]]], "duration": [1.79, 0.0, 0.09, 0.38, 0.63, 3.18, 2.33, 1.05, 10.08, 4.33, 2.43, 4.97, 2.7, 0.03, 0.98, 0.54, 0.33, 2.05, 1.97, 1.02, 0.4, 1.68, 0.01, 0.07, 0.73, 2.65, 0.16, 5.25, 3.12, 1.82, 2.29, 2.73, 11.62]} \ No newline at end of file diff --git a/annotations_1/_myZeGUaveU_filtered.json b/annotations_1/_myZeGUaveU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7991fe5d5722775d90b0d3e4a42a08b0e0c00d6e --- /dev/null +++ b/annotations_1/_myZeGUaveU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.1], [28.0, 30.45], [37.0, 38.42], [62.0, 62.63], [67.0, 70.24], [75.0, 77.87], [84.0, 95.99], [97.0, 97.92], [114.0, 142.37], [143.0, 143.18]], "keep_status": [false, false, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 31.42, 0.0, 0.0, 33.03, 34.39, 32.78, 0.0, 31.58, 0.0], "audiomae_on_audioset": [null, [["music", 52.36], ["speech", 23.1], ["boing", 8.69]], null, null, [["music", 53.33], ["speech", 6.71], ["boing", 5.98]], [["music", 34.74], ["speech", 7.14], ["synthesizer", 5.97]], [["music", 59.18], ["boing", 6.65], ["sheep", 6.01]], null, [["music", 29.51], ["boing", 20.95], ["livestock, farm animals, working animals", 5.37]], null], "duration": [1.1, 2.45, 1.42, 0.63, 3.24, 2.87, 11.99, 0.92, 28.37, 0.18]} \ No newline at end of file diff --git a/annotations_1/_nSQhWq7etg_filtered.json b/annotations_1/_nSQhWq7etg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6da9bc1eb2bb269c0dcbb9dbfca55e0ae1d3d3f4 --- /dev/null +++ b/annotations_1/_nSQhWq7etg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.58], [28.0, 32.63], [33.0, 52.95], [55.0, 68.08], [70.0, 71.17], [73.0, 76.1], [81.0, 82.56], [83.0, 85.16], [99.0, 99.91], [102.0, 102.05], [102.0, 103.2], [104.0, 135.24], [137.0, 145.15], [148.0, 186.0], [192.0, 206.85]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 28.76, 29.06, 30.81, 0.0, 81.71, 0.0, 46.33, 0.0, 0.0, 0.0, 0.0, 29.33, 0.0, 28.51], "audiomae_on_audioset": [null, [["whack, thwack", 15.48], ["sound effect", 13.31], ["fly, housefly", 10.64]], [["livestock, farm animals, working animals", 24.08], ["speech", 20.8], ["cattle, bovinae", 15.19]], [["music", 67.2], ["electronic music", 8.99], ["ambient music", 6.7]], null, null, null, [["speech", 16.33], ["whale vocalization", 7.77], ["hum", 5.99]], null, null, null, null, [["cattle, bovinae", 42.94], ["livestock, farm animals, working animals", 30.6], ["moo", 25.79]], null, [["speech", 27.82], ["music", 18.94], ["throbbing", 6.82]]], "duration": [1.58, 4.63, 19.95, 13.08, 1.17, 3.1, 1.56, 2.16, 0.91, 0.05, 1.2, 31.24, 8.15, 38.0, 14.85]} \ No newline at end of file diff --git a/annotations_1/_nnGxztgrQk_filtered.json b/annotations_1/_nnGxztgrQk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2e2c61bed9b2ce8b816302fa986c0740f289c9c --- /dev/null +++ b/annotations_1/_nnGxztgrQk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.23], [22.0, 22.54], [31.0, 36.51], [52.0, 53.5], [75.0, 75.57], [89.0, 89.16], [113.0, 117.15], [136.0, 139.99], [151.0, 152.14], [153.0, 152.81], [157.0, 158.16], [194.0, 194.97], [197.0, 197.75], [206.0, 232.21], [234.0, 235.6], [241.0, 242.38]], "keep_status": [false, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.01, 0.0, 0.0, 0.0, 35.01, 38.45, 0.0, 0.0, 0.0, 0.0, 0.0, 28.85, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 41.62], ["speech", 12.27], ["ding", 4.75]], null, null, null, [["music", 49.0], ["synthesizer", 9.8], ["ding", 6.8]], [["thunk", 22.63], ["music", 12.55], ["speech", 12.37]], null, null, null, null, null, [["speech", 57.15], ["buzz", 8.67], ["music", 7.3]], null, null], "duration": [0.23, 0.54, 5.51, 1.5, 0.57, 0.16, 4.15, 3.99, 1.14, -0.19, 1.16, 0.97, 0.75, 26.21, 1.6, 1.38]} \ No newline at end of file diff --git a/annotations_1/_oEolYMce4c_filtered.json b/annotations_1/_oEolYMce4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce69f68ad9f5633a766005f8086aae9866ddd012 --- /dev/null +++ b/annotations_1/_oEolYMce4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.61], [7.0, 8.45], [9.0, 9.66], [11.0, 11.6], [13.0, 14.71], [16.0, 17.22], [18.0, 19.3], [20.0, 21.49], [22.0, 22.57], [23.0, 30.27], [35.0, 48.76], [49.0, 72.2], [75.0, 76.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 31.01, 31.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["buzz", 24.51], ["insect", 7.98], ["fly, housefly", 7.81]], [["music", 35.54], ["fly, housefly", 11.99], ["insect", 8.06]], null], "duration": [4.61, 1.45, 0.66, 0.6, 1.71, 1.22, 1.3, 1.49, 0.57, 7.27, 13.76, 23.2, 1.65]} \ No newline at end of file diff --git a/annotations_1/_oLBVF_VYRM_filtered.json b/annotations_1/_oLBVF_VYRM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82d2d4d21db2d424bdfb982eba08818e3d4bcbf1 --- /dev/null +++ b/annotations_1/_oLBVF_VYRM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 35.6], [36.0, 43.38], [45.0, 47.34], [55.0, 55.19], [57.0, 103.86], [104.0, 118.4], [121.0, 148.0]], "keep_status": [false, false, true, false, false, true, false], "silence_prob": [28.45, 28.61, 28.19, 0.0, 0.0, 28.67, 28.92], "audiomae_on_audioset": [[["music", 76.33], ["electronic music", 2.46], ["cacophony", 2.24]], [["music", 71.84], ["didgeridoo", 7.64], ["musical instrument", 4.78]], [["music", 36.24], ["didgeridoo", 11.95], ["beatboxing", 4.65]], null, null, [["music", 61.66], ["electronic music", 3.75], ["vehicle", 3.09]], [["music", 79.34], ["electronic music", 2.52], ["throbbing", 2.32]]], "duration": [10.6, 7.38, 2.34, 0.19, 46.86, 14.4, 27.0]} \ No newline at end of file diff --git a/annotations_1/_oOULG_nhEc_filtered.json b/annotations_1/_oOULG_nhEc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57900200d74000e551d86b32ca7f1f9167388c97 --- /dev/null +++ b/annotations_1/_oOULG_nhEc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 86.05], [88.0, 103.99], [104.0, 104.33], [104.0, 104.4], [104.0, 104.46], [104.0, 104.6], [105.0, 104.63], [105.0, 104.67], [105.0, 104.7], [105.0, 104.77], [106.0, 115.03], [116.0, 154.95], [157.0, 158.8], [159.0, 160.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.28, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 90.02], ["didgeridoo", 1.33], ["electronic music", 1.25]], null, null, null, null, null, null, null, null, [["music", 78.05], ["speech", 2.84], ["electronic music", 2.82]], null, null, null], "duration": [32.05, 15.99, 0.33, 0.4, 0.46, 0.6, -0.37, -0.33, -0.3, -0.23, 9.03, 38.95, 1.8, 1.57]} \ No newline at end of file diff --git a/annotations_1/_pH9HcBNO2I_filtered.json b/annotations_1/_pH9HcBNO2I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47a444dda9c5afa87afc199b1871204997584c33 --- /dev/null +++ b/annotations_1/_pH9HcBNO2I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.28], [19.0, 22.54], [23.0, 24.24], [25.0, 29.66], [30.0, 30.96], [32.0, 48.1], [49.0, 49.38], [50.0, 65.42], [66.0, 66.87], [68.0, 68.22], [78.0, 80.94], [83.0, 83.12], [85.0, 85.6], [86.0, 87.29], [91.0, 92.45], [99.0, 104.65], [106.0, 108.13]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.36, 0.0, 66.76, 0.0, 75.39, 0.0, 49.59, 0.0, 0.0, 62.47, 0.0, 0.0, 0.0, 0.0, 49.0, 45.85], "audiomae_on_audioset": [null, [["music", 50.4], ["hum", 11.72], ["throbbing", 7.88]], null, null, null, null, null, [["music", 30.67], ["throbbing", 9.94], ["hum", 9.92]], null, null, null, null, null, null, null, [["music", 64.09], ["glass", 4.38], ["rumble", 3.81]], [["music", 31.9], ["throbbing", 23.6], ["hum", 19.31]]], "duration": [1.28, 3.54, 1.24, 4.66, 0.96, 16.1, 0.38, 15.42, 0.87, 0.22, 2.94, 0.12, 0.6, 1.29, 1.45, 5.65, 2.13]} \ No newline at end of file diff --git a/annotations_1/_pin0H9Udho_filtered.json b/annotations_1/_pin0H9Udho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e591205976525c7f4991057c944bb5c8cad1c914 --- /dev/null +++ b/annotations_1/_pin0H9Udho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 36.39], [41.0, 42.57], [49.0, 49.62], [51.0, 58.92], [60.0, 61.47], [64.0, 65.26], [66.0, 67.15], [68.0, 70.6], [71.0, 76.4], [82.0, 82.53], [84.0, 84.13], [87.0, 87.44], [88.0, 91.08], [93.0, 96.65], [98.0, 98.42], [104.0, 104.79], [107.0, 109.81], [142.0, 142.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 95.37, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 1.57, 0.62, 7.92, 1.47, 1.26, 1.15, 2.6, 5.4, 0.53, 0.13, 0.44, 3.08, 3.65, 0.42, 0.79, 2.81, 0.18]} \ No newline at end of file diff --git a/annotations_1/_pzN5x6Pepw_filtered.json b/annotations_1/_pzN5x6Pepw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f0eba81ef012b4d61599fe07e48e44941252a39 --- /dev/null +++ b/annotations_1/_pzN5x6Pepw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.96], [5.0, 5.17], [6.0, 5.95], [9.0, 9.76], [11.0, 11.03], [11.0, 13.46], [14.0, 14.89], [16.0, 16.33], [19.0, 23.35], [24.0, 25.07], [26.0, 26.42], [36.0, 37.49], [40.0, 39.65], [44.0, 44.32], [47.0, 47.09], [63.0, 63.07], [72.0, 72.08], [96.0, 100.57], [101.0, 103.06], [103.0, 111.65], [113.0, 114.69], [116.0, 121.17], [124.0, 134.2], [135.0, 138.94], [141.0, 142.16], [147.0, 151.68], [159.0, 160.44], [164.0, 167.63], [169.0, 171.56], [172.0, 172.32], [176.0, 183.76], [185.0, 185.52], [186.0, 190.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 67.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.89, 85.9, 46.64, 0.0, 92.15, 76.04, 34.08, 0.0, 37.74, 0.0, 42.84, 84.8, 0.0, 71.57, 0.0, 66.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 28.63], ["music", 22.42], ["throbbing", 6.48]], null, [["mains hum", 31.46], ["hum", 24.34], ["speech", 18.88]], null, null, null, [["speech", 49.83], ["whale vocalization", 6.28], ["hum", 4.97]], null, [["sidetone", 36.63], ["mains hum", 19.13], ["hum", 13.94]], null, [["music", 31.37], ["speech", 18.25], ["hum", 13.16]], null, null, null, null, null], "duration": [-0.04, 0.17, -0.05, 0.76, 0.03, 2.46, 0.89, 0.33, 4.35, 1.07, 0.42, 1.49, -0.35, 0.32, 0.09, 0.07, 0.08, 4.57, 2.06, 8.65, 1.69, 5.17, 10.2, 3.94, 1.16, 4.68, 1.44, 3.63, 2.56, 0.32, 7.76, 0.52, 4.88]} \ No newline at end of file diff --git a/annotations_1/_qbp2nGRp1Q_filtered.json b/annotations_1/_qbp2nGRp1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7eac1b3bb38e026531d70cbce39fa046b6d6c7e7 --- /dev/null +++ b/annotations_1/_qbp2nGRp1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 42.67], [48.0, 49.1], [53.0, 52.88], [53.0, 53.0], [53.0, 54.72], [59.0, 59.64], [61.0, 109.39], [111.0, 111.57], [112.0, 113.26], [115.0, 125.61]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["electric shaver, electric razor", 24.43], ["music", 21.77], ["mains hum", 13.08]]], "duration": [35.67, 1.1, -0.12, 0.0, 1.72, 0.64, 48.39, 0.57, 1.26, 10.61]} \ No newline at end of file diff --git a/annotations_1/_qh-4JFLd-s_filtered.json b/annotations_1/_qh-4JFLd-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b249ab57ea0c58b4505bd93c37984d46657f9e81 --- /dev/null +++ b/annotations_1/_qh-4JFLd-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.89], [4.0, 5.88], [7.0, 7.57], [10.0, 11.37], [13.0, 14.17], [16.0, 20.9], [21.0, 23.95], [26.0, 26.72], [31.0, 32.26], [35.0, 48.1], [49.0, 50.19], [53.0, 54.65], [59.0, 59.71], [60.0, 61.37], [66.0, 66.21], [76.0, 76.03], [79.0, 82.43], [86.0, 85.99], [90.0, 92.55], [93.0, 94.17], [95.0, 105.8], [107.0, 111.28], [113.0, 113.31], [115.0, 121.58], [123.0, 127.58], [130.0, 132.22], [133.0, 134.22], [135.0, 137.93]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 44.43, 0.0, 0.0, 52.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.61, 0.0, 72.9, 0.0, 46.54, 67.63, 0.0, 37.11, 57.56, 85.35, 0.0, 35.49], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 36.36], ["speech", 23.65], ["hum", 9.94]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.28], ["music", 39.0], ["whale vocalization", 5.4]], null, null, [["whale vocalization", 18.78], ["fly, housefly", 13.56], ["speech", 13.29]], null, null, null, [["speech", 69.88], ["chirp tone", 8.82], ["sine wave", 5.53]]], "duration": [1.89, 1.88, 0.57, 1.37, 1.17, 4.9, 2.95, 0.72, 1.26, 13.1, 1.19, 1.65, 0.71, 1.37, 0.21, 0.03, 3.43, -0.01, 2.55, 1.17, 10.8, 4.28, 0.31, 6.58, 4.58, 2.22, 1.22, 2.93]} \ No newline at end of file diff --git a/annotations_1/_qxAcodjpCo_filtered.json b/annotations_1/_qxAcodjpCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..983d532f6c15d71b499756b8af64dc4a87c0b22c --- /dev/null +++ b/annotations_1/_qxAcodjpCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.37], [15.0, 40.36], [40.0, 40.42], [42.0, 46.75]], "keep_status": [true, true, false, false], "silence_prob": [34.51, 30.55, 0.0, 32.25], "audiomae_on_audioset": [[["hum", 31.13], ["music", 18.65], ["throbbing", 10.49]], [["music", 18.45], ["speech", 17.03], ["explosion", 8.34]], null, [["hum", 44.52], ["mains hum", 13.49], ["rumble", 12.76]]], "duration": [10.37, 25.36, 0.42, 4.75]} \ No newline at end of file diff --git a/annotations_1/_r6i8Ae0cvo_filtered.json b/annotations_1/_r6i8Ae0cvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04988d2485d09f0fd0820f66d915ad75e12f9070 --- /dev/null +++ b/annotations_1/_r6i8Ae0cvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.92], [5.0, 8.33], [9.0, 26.13], [27.0, 28.61], [29.0, 31.35], [32.0, 33.67], [34.0, 45.81], [46.0, 48.61], [50.0, 54.99], [56.0, 66.92], [67.0, 68.72], [74.0, 76.5], [77.0, 81.09], [84.0, 84.52], [89.0, 90.71], [93.0, 102.46], [103.0, 109.07], [109.0, 110.78], [111.0, 113.63], [114.0, 116.11], [119.0, 126.82], [127.0, 147.11], [148.0, 164.49], [169.0, 170.51], [171.0, 173.03], [174.0, 175.1], [177.0, 178.41], [185.0, 186.78], [188.0, 190.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.81, 99.36, 0.0, 98.73, 0.0, 98.01, 96.66, 97.33, 99.26, 0.0, 62.47, 99.8, 0.0, 0.0, 97.64, 99.65, 0.0, 94.37, 98.51, 99.56, 94.66, 97.0, 0.0, 99.85, 0.0, 0.0, 0.0, 99.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 3.33, 17.13, 1.61, 2.35, 1.67, 11.81, 2.61, 4.99, 10.92, 1.72, 2.5, 4.09, 0.52, 1.71, 9.46, 6.07, 1.78, 2.63, 2.11, 7.82, 20.11, 16.49, 1.51, 2.03, 1.1, 1.41, 1.78, 2.81]} \ No newline at end of file diff --git a/annotations_1/_sHXbqFJCr0_filtered.json b/annotations_1/_sHXbqFJCr0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8768d5760ad3a4bafa2ab211c2aa8f985290ea8b --- /dev/null +++ b/annotations_1/_sHXbqFJCr0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 40.66], [41.0, 42.13], [43.0, 44.76], [48.0, 48.51], [49.0, 49.23], [50.0, 51.06], [53.0, 55.54], [57.0, 58.92], [64.0, 64.99], [66.0, 66.85], [71.0, 71.24], [72.0, 71.93], [72.0, 77.03], [77.0, 79.35], [80.0, 80.32], [83.0, 82.81], [86.0, 85.99], [90.0, 90.36], [96.0, 96.82], [97.0, 98.81], [100.0, 100.45], [105.0, 105.56], [109.0, 110.89], [112.0, 113.39], [115.0, 115.42], [117.0, 117.48], [119.0, 120.04], [121.0, 121.69], [125.0, 137.46], [139.0, 141.99], [145.0, 146.28], [148.0, 148.71], [150.0, 158.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.97, 0.0, 0.0, 0.0, 0.0, 0.0, 40.68, 53.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.08, 29.58, 0.0, 0.0, 28.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 34.1], ["arrow", 18.9], ["tuning fork", 9.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.81], ["throbbing", 6.84], ["hum", 4.76]], [["music", 46.43], ["zipper (clothing)", 19.56], ["sound effect", 6.13]], null, null, [["speech", 64.46], ["explosion", 4.17], ["vehicle", 3.97]]], "duration": [1.66, 1.13, 1.76, 0.51, 0.23, 1.06, 2.54, 1.92, 0.99, 0.85, 0.24, -0.07, 5.03, 2.35, 0.32, -0.19, -0.01, 0.36, 0.82, 1.81, 0.45, 0.56, 1.89, 1.39, 0.42, 0.48, 1.04, 0.69, 12.46, 2.99, 1.28, 0.71, 8.77]} \ No newline at end of file diff --git a/annotations_1/_sZ4U5aOee0_filtered.json b/annotations_1/_sZ4U5aOee0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6a44f28e88eba0fa05e74d6161b5de0e5c907f7 --- /dev/null +++ b/annotations_1/_sZ4U5aOee0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.64], [13.0, 15.36], [17.0, 18.37], [20.0, 25.56], [27.0, 48.78], [50.0, 59.24], [62.0, 70.78], [72.0, 84.65]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [68.41, 88.28, 0.0, 68.67, 79.59, 40.41, 34.63, 35.52], "audiomae_on_audioset": [null, null, null, null, null, [["music", 58.49], ["theremin", 14.05], ["shofar", 5.91]], [["music", 70.35], ["scary music", 10.59], ["theremin", 7.94]], [["music", 34.82], ["mains hum", 15.49], ["hum", 12.18]]], "duration": [2.64, 2.36, 1.37, 5.56, 21.78, 9.24, 8.78, 12.65]} \ No newline at end of file diff --git a/annotations_1/_t1yxHW97xE_filtered.json b/annotations_1/_t1yxHW97xE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bce0e014d213fcce9e5c9d554d7e8ed10fbdabb --- /dev/null +++ b/annotations_1/_t1yxHW97xE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.61], [21.0, 22.86], [25.0, 25.71], [28.0, 28.75], [40.0, 40.44], [44.0, 50.77], [53.0, 53.45], [54.0, 58.09], [61.0, 62.83], [63.0, 63.26], [83.0, 83.52], [102.0, 110.13], [110.0, 111.2], [116.0, 134.43], [135.0, 135.62], [137.0, 138.72]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.7, 0.0, 33.02, 0.0, 0.0, 0.0, 35.78, 0.0, 34.88, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 15.31], ["groan", 10.99], ["grunt", 5.3]], null, [["music", 57.6], ["vocal music", 6.54], ["beatboxing", 3.77]], null, null, null, [["music", 64.67], ["singing", 6.58], ["carnatic music", 6.58]], null, [["music", 58.82], ["beatboxing", 8.37], ["singing", 3.84]], null, null], "duration": [0.61, 1.86, 0.71, 0.75, 0.44, 6.77, 0.45, 4.09, 1.83, 0.26, 0.52, 8.13, 1.2, 18.43, 0.62, 1.72]} \ No newline at end of file diff --git a/annotations_1/_t38ENQ9jlY_filtered.json b/annotations_1/_t38ENQ9jlY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1d030fbcbd0bf8be059d12da86857c157a54b71 --- /dev/null +++ b/annotations_1/_t38ENQ9jlY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.14], [12.0, 12.41], [12.0, 12.95], [15.0, 17.98], [25.0, 25.89], [35.0, 55.78], [59.0, 61.82], [64.0, 66.45], [67.0, 68.28], [74.0, 78.19], [87.0, 93.56], [96.0, 98.91], [103.0, 113.61], [114.0, 116.21], [121.0, 128.17], [131.0, 131.43]], "keep_status": [false, false, false, false, false, false, true, true, false, true, false, false, true, false, true, false], "silence_prob": [40.95, 0.0, 0.0, 30.67, 0.0, 29.84, 30.63, 29.07, 0.0, 29.89, 29.59, 30.28, 29.4, 32.06, 30.22, 0.0], "audiomae_on_audioset": [[["music", 56.42], ["grunt", 13.43], ["noise", 4.62]], null, null, [["livestock, farm animals, working animals", 34.63], ["moo", 29.83], ["cattle, bovinae", 25.17]], null, [["music", 36.7], ["speech", 36.42], ["bleat", 3.86]], [["music", 47.63], ["thunk", 6.04], ["whack, thwack", 4.73]], [["moo", 10.11], ["cattle, bovinae", 9.52], ["speech", 6.17]], null, [["speech", 30.55], ["music", 24.91], ["crowd", 3.16]], [["music", 66.45], ["boing", 15.86], ["speech", 5.14]], [["speech", 38.91], ["music", 29.77], ["vehicle", 5.03]], [["music", 38.02], ["animal", 5.99], ["sheep", 5.91]], [["music", 63.24], ["speech", 8.16], ["boing", 6.65]], [["speech", 37.43], ["music", 20.69], ["outside, rural or natural", 6.64]], null], "duration": [9.14, 0.41, 0.95, 2.98, 0.89, 20.78, 2.82, 2.45, 1.28, 4.19, 6.56, 2.91, 10.61, 2.21, 7.17, 0.43]} \ No newline at end of file diff --git a/annotations_1/_t4L-ZdoEr8_filtered.json b/annotations_1/_t4L-ZdoEr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5736755a05f4b7fc7ee414788669c431dcaaba1 --- /dev/null +++ b/annotations_1/_t4L-ZdoEr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.86], [14.0, 15.16], [18.0, 18.89], [21.0, 23.16], [25.0, 25.0], [25.0, 56.94], [65.0, 64.71], [67.0, 70.93], [72.0, 72.01], [73.0, 74.46], [77.0, 77.18], [86.0, 97.09], [98.0, 98.19], [117.0, 118.71], [123.0, 127.92], [129.0, 129.24], [131.0, 131.28], [134.0, 134.2], [135.0, 135.28], [137.0, 137.78], [140.0, 144.29], [150.0, 152.98], [153.0, 153.01], [153.0, 153.05], [153.0, 153.08], [153.0, 153.12], [153.0, 153.18], [153.0, 153.22], [153.0, 153.25], [153.0, 153.32], [153.0, 153.35], [153.0, 153.49], [155.0, 174.34], [175.0, 176.44], [177.0, 179.05], [184.0, 191.08]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 42.53, 0.0, 0.0, 0.0, 40.88, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 45.02, 33.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.62, 0.0, 30.72, 31.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 58.75], ["synthesizer", 4.5], ["musical instrument", 2.32]], null, null, null, [["music", 37.73], ["speech", 32.36], ["quack", 10.09]], null, null, null, null, null, null, null, null, [["thunk", 59.52], ["music", 10.45], ["knock", 5.33]], [["music", 32.23], ["trombone", 13.71], ["brass instrument", 9.68]], null, null, null, null, null, null, null, null, null, null, [["music", 73.92], ["fly, housefly", 3.48], ["speech", 2.98]], null, [["music", 72.82], ["musical instrument", 2.74], ["hum", 2.09]], [["music", 33.43], ["speech", 31.88], ["hum", 4.26]]], "duration": [-0.14, 1.16, 0.89, 2.16, 0.0, 31.94, -0.29, 3.93, 0.01, 1.46, 0.18, 11.09, 0.19, 1.71, 4.92, 0.24, 0.28, 0.2, 0.28, 0.78, 4.29, 2.98, 0.01, 0.05, 0.08, 0.12, 0.18, 0.22, 0.25, 0.32, 0.35, 0.49, 19.34, 1.44, 2.05, 7.08]} \ No newline at end of file diff --git a/annotations_1/_uXfbxevYyg_filtered.json b/annotations_1/_uXfbxevYyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d103e7c88ddc086d327ca1a3b19c9d3bdaa30a8 --- /dev/null +++ b/annotations_1/_uXfbxevYyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.69], [6.0, 7.91], [9.0, 10.56], [13.0, 15.94], [19.0, 19.45], [20.0, 20.21], [21.0, 24.24], [25.0, 29.64], [30.0, 32.46], [34.0, 35.48], [38.0, 39.18], [40.0, 41.44], [44.0, 44.42], [46.0, 45.87], [46.0, 47.17], [50.0, 51.43], [53.0, 53.69], [57.0, 58.56], [61.0, 62.04], [63.0, 63.27], [65.0, 64.93], [65.0, 65.82], [66.0, 67.26], [69.0, 69.96], [73.0, 73.92], [79.0, 79.14], [80.0, 84.7], [88.0, 89.53], [91.0, 91.86], [93.0, 93.45], [95.0, 95.79], [96.0, 97.44], [98.0, 135.14], [135.0, 159.75], [160.0, 164.61], [165.0, 165.38], [166.0, 182.16], [182.0, 182.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, true, false], "silence_prob": [93.76, 0.0, 0.0, 96.29, 0.0, 0.0, 99.31, 54.83, 48.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.21, 40.68, 0.0, 40.07, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 84.53], ["radio", 3.02], ["telephone", 1.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 22.49], ["music", 6.82], ["moo", 6.08]], null, null, null, null, null, null, [["hum", 34.24], ["fart", 12.33], ["mains hum", 11.19]], [["fart", 14.2], ["hum", 11.73], ["throbbing", 7.91]], null, [["noise", 27.05], ["whack, thwack", 10.23], ["hum", 8.27]], null], "duration": [2.69, 1.91, 1.56, 2.94, 0.45, 0.21, 3.24, 4.64, 2.46, 1.48, 1.18, 1.44, 0.42, -0.13, 1.17, 1.43, 0.69, 1.56, 1.04, 0.27, -0.07, 0.82, 1.26, 0.96, 0.92, 0.14, 4.7, 1.53, 0.86, 0.45, 0.79, 1.44, 37.14, 24.75, 4.61, 0.38, 16.16, 0.21]} \ No newline at end of file diff --git a/annotations_1/_uwVIMdk7hc_filtered.json b/annotations_1/_uwVIMdk7hc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d376c9040d0e863c325b3b6facd5a9399133543 --- /dev/null +++ b/annotations_1/_uwVIMdk7hc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.76], [5.0, 5.24], [6.0, 7.33], [8.0, 9.04], [16.0, 16.48], [38.0, 38.82], [41.0, 41.69], [45.0, 45.22], [54.0, 54.77], [58.0, 58.72], [63.0, 64.42], [66.0, 66.78], [68.0, 68.57], [76.0, 76.59], [81.0, 81.48], [85.0, 85.55], [95.0, 95.67], [97.0, 100.33], [101.0, 101.98], [115.0, 119.58], [122.0, 122.72], [123.0, 124.58], [125.0, 126.59], [144.0, 145.72], [151.0, 151.92], [152.0, 151.97], [153.0, 153.89], [157.0, 157.38], [160.0, 160.69], [165.0, 166.48], [169.0, 170.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.53, 0.0, 41.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 76.73], ["ambient music", 4.29], ["electronic music", 2.98]], null, [["speech", 73.8], ["music", 8.35], ["sidetone", 3.78]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.76, 0.24, 1.33, 1.04, 0.48, 0.82, 0.69, 0.22, 0.77, 0.72, 1.42, 0.78, 0.57, 0.59, 0.48, 0.55, 0.67, 3.33, 0.98, 4.58, 0.72, 1.58, 1.59, 1.72, 0.92, -0.03, 0.89, 0.38, 0.69, 1.48, 1.55]} \ No newline at end of file diff --git a/annotations_1/_vwllSx_Ew8_filtered.json b/annotations_1/_vwllSx_Ew8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1d58b1e423af5b0f1fd891e69ea306b1493fa66 --- /dev/null +++ b/annotations_1/_vwllSx_Ew8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 102.93], [110.0, 132.83]], "keep_status": [false, false], "silence_prob": [0.0, 32.64], "audiomae_on_audioset": [null, [["music", 64.65], ["speech", 5.03], ["bell", 4.96]]], "duration": [31.93, 22.83]} \ No newline at end of file diff --git a/annotations_1/_wkTjOjTafw_filtered.json b/annotations_1/_wkTjOjTafw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9cdc9f66c7c71ea57b5a98cfb56e18e53c262fac --- /dev/null +++ b/annotations_1/_wkTjOjTafw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.25], [12.0, 19.7], [20.0, 21.9], [23.0, 23.73], [24.0, 29.83], [30.0, 33.0], [33.0, 34.87], [38.0, 38.1], [40.0, 41.64], [44.0, 46.45], [47.0, 48.3], [51.0, 52.03]], "keep_status": [true, true, false, false, true, true, false, false, false, false, false, false], "silence_prob": [35.3, 34.03, 0.0, 0.0, 48.95, 43.96, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0], "audiomae_on_audioset": [[["fart", 40.44], ["noise", 5.19], ["cacophony", 4.06]], [["animal", 47.48], ["livestock, farm animals, working animals", 9.14], ["neigh, whinny", 6.27]], null, null, [["speech", 40.47], ["animal", 21.58], ["hum", 3.74]], [["hum", 31.33], ["throbbing", 18.94], ["speech", 16.22]], null, null, null, null, null, null], "duration": [3.25, 7.7, 1.9, 0.73, 5.83, 3.0, 1.87, 0.1, 1.64, 2.45, 1.3, 1.03]} \ No newline at end of file diff --git a/annotations_1/_x3KSXMXzwM_filtered.json b/annotations_1/_x3KSXMXzwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a5e8ef27555eff62ff221700837aaa667daf586 --- /dev/null +++ b/annotations_1/_x3KSXMXzwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 21.14], [22.0, 22.72], [23.0, 29.71], [31.0, 31.35], [36.0, 36.86], [38.0, 41.07], [65.0, 67.69], [73.0, 74.21], [77.0, 77.45], [85.0, 84.97], [89.0, 89.16], [94.0, 93.73], [94.0, 98.95], [108.0, 108.45], [110.0, 110.62], [112.0, 116.6], [119.0, 124.75]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, true, false], "silence_prob": [32.19, 0.0, 31.56, 0.0, 0.0, 31.03, 31.69, 0.0, 0.0, 0.0, 0.0, 0.0, 31.0, 0.0, 0.0, 31.25, 31.26], "audiomae_on_audioset": [[["speech", 83.35], ["fart", 2.32], ["horse", 2.29]], null, [["speech", 33.9], ["music", 12.8], ["sidetone", 11.64]], null, null, [["music", 77.96], ["boing", 2.69], ["rattle (instrument)", 1.46]], [["speech", 44.12], ["fart", 20.38], ["music", 5.2]], null, null, null, null, null, [["cowbell", 26.36], ["livestock, farm animals, working animals", 21.21], ["music", 16.95]], null, null, [["livestock, farm animals, working animals", 25.02], ["moo", 17.3], ["cattle, bovinae", 15.18]], [["speech", 89.97], ["applause", 3.75], ["crowd", 1.66]]], "duration": [7.14, 0.72, 6.71, 0.35, 0.86, 3.07, 2.69, 1.21, 0.45, -0.03, 0.16, -0.27, 4.95, 0.45, 0.62, 4.6, 5.75]} \ No newline at end of file diff --git a/annotations_1/_y_We1FV_RQ_filtered.json b/annotations_1/_y_We1FV_RQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34bea4330abf398eac49b8cb0e04f4cb01682b6a --- /dev/null +++ b/annotations_1/_y_We1FV_RQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 20.21], [22.0, 36.29], [37.0, 39.19], [40.0, 96.79], [100.0, 100.55], [102.0, 103.99], [107.0, 131.41], [132.0, 133.1]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [68.41, 40.22, 84.98, 0.0, 0.0, 0.0, 29.23, 0.0], "audiomae_on_audioset": [null, [["throbbing", 37.88], ["hum", 30.4], ["music", 15.92]], null, null, null, null, [["hum", 31.97], ["music", 25.58], ["mains hum", 20.8]], null], "duration": [3.21, 14.29, 2.19, 56.79, 0.55, 1.99, 24.41, 1.1]} \ No newline at end of file diff --git a/annotations_1/_yxKJaVk4kI_filtered.json b/annotations_1/_yxKJaVk4kI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8f9526dc8092ba3d6ff289514b053435d0a1307 --- /dev/null +++ b/annotations_1/_yxKJaVk4kI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.86], [9.0, 9.58], [11.0, 11.97], [14.0, 15.6], [18.0, 18.82], [19.0, 20.58], [29.0, 30.77], [31.0, 31.53], [33.0, 33.57], [35.0, 35.95], [38.0, 38.87], [40.0, 41.35], [43.0, 42.77], [43.0, 43.82], [44.0, 46.57], [49.0, 49.82], [51.0, 51.63], [52.0, 55.29], [58.0, 58.85], [60.0, 60.45], [63.0, 63.27], [68.0, 77.82], [79.0, 79.62], [81.0, 81.68], [85.0, 86.27], [88.0, 89.11], [90.0, 93.07], [95.0, 97.68], [98.0, 98.93], [101.0, 101.48], [117.0, 117.8], [120.0, 121.36], [122.0, 122.84], [124.0, 124.93], [126.0, 128.95], [129.0, 134.43], [135.0, 139.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.25, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 0.0, 0.0, 99.21, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.72, 69.47, 72.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.58, 0.97, 1.6, 0.82, 1.58, 1.77, 0.53, 0.57, 0.95, 0.87, 1.35, -0.23, 0.82, 2.57, 0.82, 0.63, 3.29, 0.85, 0.45, 0.27, 9.82, 0.62, 0.68, 1.27, 1.11, 3.07, 2.68, 0.93, 0.48, 0.8, 1.36, 0.84, 0.93, 2.95, 5.43, 4.87]} \ No newline at end of file diff --git a/annotations_1/_zHhry-Ot0Y_filtered.json b/annotations_1/_zHhry-Ot0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d639bd1638eb596fd3d416e50f3e8b523456234a --- /dev/null +++ b/annotations_1/_zHhry-Ot0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.22], [14.0, 14.42], [14.0, 14.45], [15.0, 18.33], [19.0, 21.1], [23.0, 23.46], [25.0, 25.54], [29.0, 29.24], [31.0, 31.78], [49.0, 52.98], [54.0, 54.11], [55.0, 56.15], [57.0, 58.02], [59.0, 62.36], [67.0, 74.58], [84.0, 89.06], [92.0, 105.38], [126.0, 126.69], [128.0, 128.38], [140.0, 141.32], [143.0, 143.75], [144.0, 168.93], [170.0, 171.69], [173.0, 175.02]], "keep_status": [true, false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, true, false, false, false, false, true, false, false], "silence_prob": [29.34, 0.0, 0.0, 31.11, 33.32, 0.0, 0.0, 0.0, 0.0, 29.77, 0.0, 0.0, 0.0, 28.91, 28.78, 28.86, 28.59, 0.0, 0.0, 0.0, 0.0, 36.34, 0.0, 70.16], "audiomae_on_audioset": [[["didgeridoo", 18.19], ["music", 16.11], ["whale vocalization", 7.55]], null, null, [["grunt", 87.89], ["music", 3.04], ["groan", 2.29]], [["speech", 20.13], ["music", 10.59], ["throat clearing", 7.49]], null, null, null, null, [["music", 12.76], ["vehicle", 4.76], ["buzz", 4.74]], null, null, null, [["cattle, bovinae", 21.9], ["moo", 19.69], ["livestock, farm animals, working animals", 10.27]], [["music", 54.59], ["breaking", 21.8], ["shatter", 3.8]], [["speech", 37.3], ["music", 27.44], ["mains hum", 9.19]], [["buzz", 19.98], ["music", 11.21], ["noise", 7.82]], null, null, null, null, [["animal", 45.56], ["domestic animals, pets", 7.26], ["dog", 5.39]], null, null], "duration": [5.22, 0.42, 0.45, 3.33, 2.1, 0.46, 0.54, 0.24, 0.78, 3.98, 0.11, 1.15, 1.02, 3.36, 7.58, 5.06, 13.38, 0.69, 0.38, 1.32, 0.75, 24.93, 1.69, 2.02]} \ No newline at end of file diff --git a/annotations_1/_zPImuBvnOA_filtered.json b/annotations_1/_zPImuBvnOA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a74a30c6c4eb5637b52f1a0491ef5edf7002fa1 --- /dev/null +++ b/annotations_1/_zPImuBvnOA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.87], [1.0, 1.21], [3.0, 3.3], [15.0, 14.89], [38.0, 40.71], [48.0, 50.85], [51.0, 52.35], [57.0, 58.04], [61.0, 62.38], [66.0, 66.26], [69.0, 70.19], [73.0, 76.05], [77.0, 79.29], [80.0, 82.05], [86.0, 87.98], [89.0, 90.12], [91.0, 91.52], [93.0, 92.74], [93.0, 95.44], [102.0, 103.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 90.78, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 50.11, 34.29, 44.99, 0.0, 0.0, 0.0, 0.0, 51.5, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["gong", 29.98], ["music", 22.47], ["singing bowl", 13.34]], [["music", 68.97], ["speech", 4.7], ["hum", 4.0]], null, null, null, null, null, null], "duration": [-0.13, 0.21, 0.3, -0.11, 2.71, 2.85, 1.35, 1.04, 1.38, 0.26, 1.19, 3.05, 2.29, 2.05, 1.98, 1.12, 0.52, -0.26, 2.44, 1.49]} \ No newline at end of file diff --git a/annotations_1/a-CS6CjnEw8_filtered.json b/annotations_1/a-CS6CjnEw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2fab5d544b4f14b8b5ef74ef7bc6c40d95d43ed0 --- /dev/null +++ b/annotations_1/a-CS6CjnEw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.62], [23.0, 23.8], [25.0, 26.2], [27.0, 30.47], [35.0, 36.68], [38.0, 38.57], [40.0, 40.19], [41.0, 42.09], [43.0, 49.52], [51.0, 51.53], [52.0, 52.71], [53.0, 56.1], [58.0, 58.29], [59.0, 76.6], [78.0, 80.28], [82.0, 84.13], [87.0, 89.06], [98.0, 99.23], [101.0, 108.38], [109.0, 115.26], [116.0, 131.16], [132.0, 133.62], [135.0, 137.0], [142.0, 142.65], [143.0, 146.42]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 48.74, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 49.54, 0.0, 72.01, 96.54, 100.0, 94.81, 0.0, 100.0, 96.89, 99.93, 0.0, 97.54, 0.0, 88.28], "audiomae_on_audioset": [null, null, null, [["music", 25.28], ["didgeridoo", 11.68], ["guitar", 7.89]], null, null, null, null, null, null, null, [["sidetone", 50.03], ["busy signal", 18.45], ["speech", 16.24]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.62, 0.8, 1.2, 3.47, 1.68, 0.57, 0.19, 1.09, 6.52, 0.53, 0.71, 3.1, 0.29, 17.6, 2.28, 2.13, 2.06, 1.23, 7.38, 6.26, 15.16, 1.62, 2.0, 0.65, 3.42]} \ No newline at end of file diff --git a/annotations_1/a2ZdXUZt3iw_filtered.json b/annotations_1/a2ZdXUZt3iw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df29d7f48b70aeb32f211d1ddcc3e4c015939f30 --- /dev/null +++ b/annotations_1/a2ZdXUZt3iw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 39.45], [40.0, 43.63], [45.0, 47.29], [49.0, 52.35], [53.0, 54.14], [56.0, 56.29], [58.0, 58.26], [59.0, 60.34], [63.0, 64.5], [65.0, 67.56], [68.0, 67.61], [68.0, 96.58], [99.0, 105.02], [107.0, 107.49], [109.0, 111.32], [114.0, 115.69]], "keep_status": [true, true, true, true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [33.27, 45.92, 36.01, 41.42, 0.0, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0, 28.85, 34.88, 0.0, 76.7, 0.0], "audiomae_on_audioset": [[["speech", 47.4], ["explosion", 10.71], ["music", 7.53]], [["music", 27.49], ["didgeridoo", 20.73], ["speech", 14.26]], [["didgeridoo", 18.3], ["speech", 16.09], ["mains hum", 14.86]], [["fart", 28.8], ["speech", 11.53], ["dog", 10.47]], null, null, null, null, null, null, null, [["speech", 57.29], ["music", 17.27], ["hum", 5.81]], [["music", 33.04], ["hum", 23.44], ["mains hum", 9.14]], null, null, null], "duration": [21.45, 3.63, 2.29, 3.35, 1.14, 0.29, 0.26, 1.34, 1.5, 2.56, -0.39, 28.58, 6.02, 0.49, 2.32, 1.69]} \ No newline at end of file diff --git a/annotations_1/a2qE4hG9XCk_filtered.json b/annotations_1/a2qE4hG9XCk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72ba4c7dc702e0957e0e8673a725365a84854f41 --- /dev/null +++ b/annotations_1/a2qE4hG9XCk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [7.0, 16.28], [17.0, 44.27], [44.0, 48.25], [49.0, 49.55], [51.0, 62.7], [66.0, 68.79], [75.0, 78.66], [82.0, 87.18], [93.0, 93.24], [95.0, 98.24], [99.0, 101.66], [103.0, 103.11], [109.0, 109.53], [113.0, 121.42], [125.0, 140.16]], "keep_status": [false, true, true, true, false, false, true, true, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 34.06, 31.04, 31.35, 0.0, 35.1, 37.56, 30.82, 30.25, 0.0, 32.35, 30.67, 0.0, 0.0, 30.43, 30.69], "audiomae_on_audioset": [null, [["hum", 23.84], ["music", 23.15], ["speech", 15.4]], [["music", 43.75], ["speech", 17.57], ["motorcycle", 6.65]], [["music", 46.49], ["throbbing", 9.02], ["hum", 6.22]], null, [["music", 42.89], ["whale vocalization", 15.88], ["speech", 15.0]], [["whale vocalization", 24.0], ["speech", 18.08], ["noise", 10.59]], [["music", 31.6], ["throbbing", 17.26], ["hum", 10.33]], [["music", 61.56], ["throbbing", 4.44], ["hum", 4.18]], null, [["music", 54.62], ["throbbing", 15.17], ["hum", 7.45]], [["music", 46.12], ["hum", 9.91], ["mains hum", 8.59]], null, null, [["speech", 23.11], ["buzz", 19.19], ["fly, housefly", 11.27]], [["music", 52.58], ["speech", 15.87], ["throbbing", 2.57]]], "duration": [0.51, 9.28, 27.27, 4.25, 0.55, 11.7, 2.79, 3.66, 5.18, 0.24, 3.24, 2.66, 0.11, 0.53, 8.42, 15.16]} \ No newline at end of file diff --git a/annotations_1/a3HOCIXroqQ_filtered.json b/annotations_1/a3HOCIXroqQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..661201bf13c906ef187c42f34134443229ca4f0c --- /dev/null +++ b/annotations_1/a3HOCIXroqQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.08], [13.0, 14.2], [19.0, 23.7], [27.0, 27.04], [34.0, 34.69], [37.0, 39.28], [40.0, 63.29], [65.0, 64.94], [65.0, 65.52], [67.0, 126.54]], "keep_status": [false, false, true, false, false, true, true, false, false, false], "silence_prob": [32.05, 0.0, 34.24, 0.0, 0.0, 29.76, 29.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 29.22], ["music", 21.11], ["hum", 19.91]], null, [["music", 20.85], ["speech", 18.62], ["throbbing", 17.01]], null, null, [["noise", 20.23], ["hum", 16.92], ["mains hum", 11.09]], [["vehicle", 21.13], ["music", 11.74], ["buzz", 11.25]], null, null, null], "duration": [2.08, 1.2, 4.7, 0.04, 0.69, 2.28, 23.29, -0.06, 0.52, 59.54]} \ No newline at end of file diff --git a/annotations_1/a3Xm0KpUYj4_filtered.json b/annotations_1/a3Xm0KpUYj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2ba4bce93bb3554e2903cf3de5feb1837cdae00 --- /dev/null +++ b/annotations_1/a3Xm0KpUYj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.4], [11.0, 11.6], [14.0, 29.15], [31.0, 33.18], [36.0, 38.64], [40.0, 45.66], [47.0, 47.02], [48.0, 49.33], [50.0, 52.83]], "keep_status": [false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 28.51, 33.06, 32.56, 39.5, 0.0, 0.0, 36.1], "audiomae_on_audioset": [null, null, [["music", 35.34], ["hum", 24.56], ["throbbing", 24.16]], [["music", 29.16], ["synthesizer", 10.57], ["hum", 7.12]], [["music", 48.31], ["hum", 11.81], ["mains hum", 5.86]], [["speech", 55.42], ["hum", 20.14], ["mains hum", 7.45]], null, null, [["music", 65.82], ["bass guitar", 3.45], ["didgeridoo", 3.32]]], "duration": [0.4, 0.6, 15.15, 2.18, 2.64, 5.66, 0.02, 1.33, 2.83]} \ No newline at end of file diff --git a/annotations_1/a3bI7kbVBwM_filtered.json b/annotations_1/a3bI7kbVBwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6090461df8b196d9ffa5d39d6573147470d6febd --- /dev/null +++ b/annotations_1/a3bI7kbVBwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.06], [14.0, 15.2], [17.0, 17.78], [18.0, 22.47], [24.0, 29.62], [30.0, 31.94], [33.0, 35.24], [37.0, 44.58], [46.0, 47.34], [50.0, 64.47], [65.0, 70.48], [74.0, 75.56], [82.0, 94.19], [97.0, 100.57], [101.0, 118.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [30.36, 0.0, 0.0, 30.17, 29.78, 0.0, 29.83, 30.65, 0.0, 30.3, 31.21, 0.0, 29.97, 29.93, 30.22], "audiomae_on_audioset": [[["music", 64.4], ["throbbing", 7.64], ["electronic music", 4.49]], null, null, [["music", 79.91], ["throbbing", 4.67], ["electronic music", 3.1]], [["music", 77.63], ["electronic music", 3.75], ["techno", 2.7]], null, [["music", 73.6], ["sampler", 2.59], ["electronic music", 2.54]], [["music", 64.57], ["hum", 5.2], ["drum and bass", 3.68]], null, [["music", 92.31], ["funny music", 1.14], ["throbbing", 0.69]], [["music", 37.47], ["didgeridoo", 7.61], ["musical instrument", 4.85]], null, [["music", 85.85], ["roll", 2.42], ["rock and roll", 2.05]], [["music", 78.76], ["buzz", 1.91], ["electronic music", 1.58]], [["music", 94.63], ["psychedelic rock", 0.83], ["rock music", 0.67]]], "duration": [4.06, 1.2, 0.78, 4.47, 5.62, 1.94, 2.24, 7.58, 1.34, 14.47, 5.48, 1.56, 12.19, 3.57, 17.32]} \ No newline at end of file diff --git a/annotations_1/a46m8g3grB8_filtered.json b/annotations_1/a46m8g3grB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d55aef3e825b7a6a6a0e39697849ab77f2edc94d --- /dev/null +++ b/annotations_1/a46m8g3grB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 46.68], [51.0, 64.29], [65.0, 65.45], [66.0, 66.9], [79.0, 79.08], [80.0, 80.35], [81.0, 84.5], [85.0, 85.94], [86.0, 88.89], [93.0, 93.01], [95.0, 95.49], [100.0, 100.21], [102.0, 103.0], [105.0, 105.81], [106.0, 107.16], [108.0, 109.11], [114.0, 115.15], [116.0, 116.41], [117.0, 118.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.45, 52.74, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.83], ["fly, housefly", 3.57], ["livestock, farm animals, working animals", 3.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [21.68, 13.29, 0.45, 0.9, 0.08, 0.35, 3.5, 0.94, 2.89, 0.01, 0.49, 0.21, 1.0, 0.81, 1.16, 1.11, 1.15, 0.41, 1.98]} \ No newline at end of file diff --git a/annotations_1/a4OWkIrQUJw_filtered.json b/annotations_1/a4OWkIrQUJw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77ae13e5f453f75b646d5ef6eefd16b630314ece --- /dev/null +++ b/annotations_1/a4OWkIrQUJw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.21], [7.0, 8.19], [9.0, 10.81], [13.0, 13.39], [14.0, 18.33], [25.0, 25.59], [33.0, 36.09], [40.0, 39.77], [40.0, 42.6], [44.0, 50.67], [52.0, 55.78], [57.0, 59.39], [63.0, 64.02], [64.0, 64.1], [64.0, 64.13], [65.0, 65.25], [66.0, 67.24], [68.0, 83.54], [85.0, 85.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.51, 0.0, 0.0, 0.0, 99.44, 0.0, 98.59, 0.0, 72.31, 91.81, 99.31, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.25, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.21, 1.19, 1.81, 0.39, 4.33, 0.59, 3.09, -0.23, 2.6, 6.67, 3.78, 2.39, 1.02, 0.1, 0.13, 0.25, 1.24, 15.54, 0.04]} \ No newline at end of file diff --git a/annotations_1/a6--cEjo3bY_filtered.json b/annotations_1/a6--cEjo3bY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9345711c347854aed3d1c0fb74433820141da379 --- /dev/null +++ b/annotations_1/a6--cEjo3bY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.78], [9.0, 8.77], [13.0, 15.97], [19.0, 20.11], [21.0, 21.59], [32.0, 32.14], [36.0, 36.42], [37.0, 37.96], [41.0, 44.52], [48.0, 48.9], [58.0, 63.95], [66.0, 67.51], [69.0, 71.05], [73.0, 73.26], [73.0, 74.24], [76.0, 76.91], [77.0, 80.38], [82.0, 83.54], [85.0, 87.17], [88.0, 89.13], [90.0, 92.23], [95.0, 96.92], [102.0, 111.75], [115.0, 115.4], [116.0, 117.19], [118.0, 123.5], [124.0, 123.57], [124.0, 124.78], [130.0, 132.22], [135.0, 147.31], [147.0, 173.84], [174.0, 175.58], [176.0, 177.69]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 42.44, 0.0, 0.0, 0.0, 0.0, 0.0, 53.16, 0.0, 88.28, 0.0, 73.06, 0.0, 0.0, 0.0, 42.28, 0.0, 48.1, 0.0, 91.13, 0.0, 38.12, 0.0, 0.0, 36.09, 0.0, 0.0, 98.19, 35.94, 31.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 26.2], ["livestock, farm animals, working animals", 18.55], ["moo", 13.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["creak", 31.23], ["noise", 11.59], ["mosquito", 7.08]], null, [["speech", 36.9], ["insect", 8.79], ["fly, housefly", 8.46]], null, null, null, [["throbbing", 16.94], ["noise", 16.05], ["whack, thwack", 10.06]], null, null, [["speech", 57.84], ["noise", 3.97], ["hum", 3.65]], null, null, null, [["speech", 47.81], ["sidetone", 7.89], ["fart", 7.02]], [["speech", 38.55], ["whack, thwack", 9.09], ["animal", 6.55]], null, null], "duration": [1.78, -0.23, 2.97, 1.11, 0.59, 0.14, 0.42, 0.96, 3.52, 0.9, 5.95, 1.51, 2.05, 0.26, 1.24, 0.91, 3.38, 1.54, 2.17, 1.13, 2.23, 1.92, 9.75, 0.4, 1.19, 5.5, -0.43, 0.78, 2.22, 12.31, 26.84, 1.58, 1.69]} \ No newline at end of file diff --git a/annotations_1/a66f39DMwtY_filtered.json b/annotations_1/a66f39DMwtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4b4fa425e22d46c7fb214228a5732602aef983a --- /dev/null +++ b/annotations_1/a66f39DMwtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 30.94], [39.0, 43.6], [46.0, 46.23], [47.0, 47.85], [51.0, 51.19], [54.0, 54.7], [63.0, 73.25], [75.0, 75.63], [81.0, 81.21]], "keep_status": [false, true, false, false, false, false, true, false, false], "silence_prob": [38.04, 46.47, 0.0, 0.0, 0.0, 0.0, 40.92, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 43.9], ["music", 25.11], ["theremin", 3.47]], [["speech", 51.46], ["music", 10.16], ["sidetone", 7.42]], null, null, null, null, [["hum", 20.51], ["speech", 20.33], ["mains hum", 13.79]], null, null], "duration": [3.94, 4.6, 0.23, 0.85, 0.19, 0.7, 10.25, 0.63, 0.21]} \ No newline at end of file diff --git a/annotations_1/a6XtVMtUZI8_filtered.json b/annotations_1/a6XtVMtUZI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea2fb8b7e03b57e20b816efb036d4a15b0837274 --- /dev/null +++ b/annotations_1/a6XtVMtUZI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 46.57], [47.0, 47.43], [51.0, 51.9], [53.0, 53.77], [55.0, 59.09], [61.0, 62.43], [63.0, 66.53], [67.0, 74.46], [75.0, 77.92], [79.0, 80.57], [81.0, 83.24], [86.0, 111.27], [112.0, 118.86], [120.0, 120.53], [122.0, 127.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 65.09, 86.09, 0.0, 96.04, 99.48, 100.0, 0.0, 97.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.57, 0.43, 0.9, 0.77, 4.09, 1.43, 3.53, 7.46, 2.92, 1.57, 2.24, 25.27, 6.86, 0.53, 5.16]} \ No newline at end of file diff --git a/annotations_1/a6cUudbbHl0_filtered.json b/annotations_1/a6cUudbbHl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..832503368c5969dd02f8ed6a334343c4a28bd833 --- /dev/null +++ b/annotations_1/a6cUudbbHl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.43], [6.0, 8.16], [10.0, 13.42], [14.0, 18.96], [20.0, 21.91], [24.0, 26.52], [32.0, 35.9], [40.0, 40.49], [42.0, 42.77], [44.0, 49.82], [54.0, 57.21], [59.0, 60.22], [61.0, 62.61], [65.0, 68.84], [69.0, 69.45], [69.0, 69.5], [70.0, 70.7], [76.0, 76.25], [79.0, 81.67], [84.0, 85.08], [94.0, 94.95], [97.0, 97.75], [99.0, 100.33], [103.0, 107.72], [108.0, 114.07], [115.0, 117.91], [119.0, 120.95], [123.0, 124.09], [125.0, 127.62], [130.0, 131.46], [132.0, 134.47], [136.0, 137.69], [140.0, 140.83], [142.0, 143.43], [148.0, 150.13], [151.0, 153.54], [157.0, 158.13], [159.0, 160.1], [161.0, 162.23], [165.0, 165.67], [167.0, 168.1]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.22, 44.07, 60.32, 42.58, 0.0, 52.33, 54.63, 0.0, 0.0, 55.46, 36.52, 0.0, 0.0, 31.99, 0.0, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 0.0, 0.0, 61.57, 40.7, 31.77, 0.0, 0.0, 36.44, 0.0, 38.95, 0.0, 0.0, 0.0, 43.4, 46.54, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.35], ["electronic music", 9.73], ["synthesizer", 7.52]], [["music", 53.53], ["singing bowl", 26.36], ["ambient music", 5.01]], null, [["singing bowl", 28.24], ["music", 27.15], ["speech", 21.3]], null, null, null, null, null, null, [["sine wave", 39.03], ["chirp tone", 13.69], ["fire", 4.75]], null, null, [["music", 18.64], ["hum", 14.18], ["speech", 14.15]], null, null, null, null, null, null, null, null, null, null, [["music", 36.79], ["singing bowl", 33.59], ["speech", 6.61]], [["speech", 22.16], ["music", 10.02], ["thump, thud", 6.55]], null, null, [["music", 70.79], ["hum", 5.79], ["electronic music", 3.78]], null, [["music", 27.48], ["sine wave", 23.14], ["gong", 15.43]], null, null, null, [["music", 47.25], ["singing bowl", 21.38], ["ambient music", 4.26]], [["music", 62.75], ["musical instrument", 7.93], ["synthesizer", 4.96]], null, null, null, null, null], "duration": [2.43, 2.16, 3.42, 4.96, 1.91, 2.52, 3.9, 0.49, 0.77, 5.82, 3.21, 1.22, 1.61, 3.84, 0.45, 0.5, 0.7, 0.25, 2.67, 1.08, 0.95, 0.75, 1.33, 4.72, 6.07, 2.91, 1.95, 1.09, 2.62, 1.46, 2.47, 1.69, 0.83, 1.43, 2.13, 2.54, 1.13, 1.1, 1.23, 0.67, 1.1]} \ No newline at end of file diff --git a/annotations_1/a7XZaIy4a9k_filtered.json b/annotations_1/a7XZaIy4a9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..959a773ef3b2caa4ec9c776e0fcf51d292faf1e2 --- /dev/null +++ b/annotations_1/a7XZaIy4a9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.23], [7.0, 8.18], [12.0, 12.66], [15.0, 16.58], [18.0, 18.15], [18.0, 27.19], [28.0, 29.71], [31.0, 31.65], [33.0, 35.41], [38.0, 39.07], [40.0, 40.34], [41.0, 42.04], [43.0, 44.15], [48.0, 48.69], [50.0, 50.79], [51.0, 55.97], [57.0, 58.18], [59.0, 61.25], [62.0, 63.12], [66.0, 68.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 83.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.97, 0.0, 66.76, 0.0, 74.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 1.18, 0.66, 1.58, 0.15, 9.19, 1.71, 0.65, 2.41, 1.07, 0.34, 1.04, 1.15, 0.69, 0.79, 4.97, 1.18, 2.25, 1.12, 2.69]} \ No newline at end of file diff --git a/annotations_1/a7gZgEpgKiY_filtered.json b/annotations_1/a7gZgEpgKiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d4d3b063238b140bc2add85aad99894bcc8e290 --- /dev/null +++ b/annotations_1/a7gZgEpgKiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.88], [4.0, 4.78], [8.0, 8.78], [12.0, 23.6], [25.0, 26.11], [26.0, 28.24], [30.0, 29.79], [31.0, 35.06], [36.0, 62.5], [64.0, 67.8], [69.0, 73.23], [75.0, 79.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.54, 0.0, 65.32, 0.0, 96.66, 69.47, 92.48, 94.52, 53.4], "audiomae_on_audioset": [null, null, null, [["music", 54.8], ["speech", 10.19], ["fart", 6.48]], null, null, null, null, null, null, null, null], "duration": [-0.12, 0.78, 0.78, 11.6, 1.11, 2.24, -0.21, 4.06, 26.5, 3.8, 4.23, 4.14]} \ No newline at end of file diff --git a/annotations_1/a7vAR-7YBWE_filtered.json b/annotations_1/a7vAR-7YBWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bee2d3cbebfc3f6b79df7e1ae2fe052b8df9cec7 --- /dev/null +++ b/annotations_1/a7vAR-7YBWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.67], [21.0, 22.3], [23.0, 23.62], [25.0, 25.79], [27.0, 29.39], [32.0, 35.19], [36.0, 35.85], [36.0, 40.36], [49.0, 49.57], [57.0, 57.77], [59.0, 63.15], [67.0, 67.83], [71.0, 72.74], [75.0, 81.87], [93.0, 93.06], [95.0, 96.38], [98.0, 104.58], [115.0, 115.87], [128.0, 129.05]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 64.86, 83.34, 0.0, 44.29, 0.0, 0.0, 55.18, 0.0, 0.0, 40.62, 0.0, 0.0, 36.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 27.72], ["music", 13.7], ["fly, housefly", 6.73]], null, null, null, null, null, [["music", 32.41], ["singing bowl", 11.96], ["synthesizer", 7.81]], null, null, [["speech", 31.39], ["mains hum", 14.2], ["music", 10.77]], null, null], "duration": [0.67, 1.3, 0.62, 0.79, 2.39, 3.19, -0.15, 4.36, 0.57, 0.77, 4.15, 0.83, 1.74, 6.87, 0.06, 1.38, 6.58, 0.87, 1.05]} \ No newline at end of file diff --git a/annotations_1/a81pNygdAXw_filtered.json b/annotations_1/a81pNygdAXw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f7ac28193cf21b48cde6dfab51f17bf4f3d1328 --- /dev/null +++ b/annotations_1/a81pNygdAXw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.95], [13.0, 14.17], [15.0, 18.67], [20.0, 20.43], [23.0, 23.65], [27.0, 27.89], [29.0, 30.08], [32.0, 32.1], [33.0, 37.05], [40.0, 41.82], [44.0, 45.62], [48.0, 48.63], [52.0, 52.89], [56.0, 57.25], [62.0, 63.68], [65.0, 73.41], [75.0, 75.86], [77.0, 79.02], [82.0, 82.78], [84.0, 85.23], [86.0, 88.08], [91.0, 93.28], [95.0, 97.23], [99.0, 101.73], [103.0, 103.67], [105.0, 106.08], [109.0, 112.58]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.6, 0.0, 47.23, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 99.8, 79.07, 95.91, 99.68, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, [["cat", 7.72], ["hum", 6.7], ["inside, small room", 6.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.95, 1.17, 3.67, 0.43, 0.65, 0.89, 1.08, 0.1, 4.05, 1.82, 1.62, 0.63, 0.89, 1.25, 1.68, 8.41, 0.86, 2.02, 0.78, 1.23, 2.08, 2.28, 2.23, 2.73, 0.67, 1.08, 3.58]} \ No newline at end of file diff --git a/annotations_1/a87b-bsz1Mg_filtered.json b/annotations_1/a87b-bsz1Mg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a000bf8c1a2dcfcc92ab82b380216f210d23ad3b --- /dev/null +++ b/annotations_1/a87b-bsz1Mg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.64], [14.0, 15.08], [16.0, 17.61], [20.0, 39.55], [42.0, 44.68], [48.0, 53.11], [54.0, 63.76], [66.0, 66.12], [67.0, 68.64], [70.0, 71.73], [74.0, 76.72], [80.0, 79.95], [86.0, 86.48], [90.0, 95.08], [102.0, 107.32], [108.0, 111.97], [113.0, 120.29], [123.0, 130.2], [133.0, 134.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [68.67, 0.0, 0.0, 79.59, 91.81, 92.97, 80.64, 0.0, 0.0, 0.0, 67.63, 0.0, 0.0, 94.22, 87.19, 56.4, 71.29, 92.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.64, 1.08, 1.61, 19.55, 2.68, 5.11, 9.76, 0.12, 1.64, 1.73, 2.72, -0.05, 0.48, 5.08, 5.32, 3.97, 7.29, 7.2, 1.13]} \ No newline at end of file diff --git a/annotations_1/a8EeFNXk1TE_filtered.json b/annotations_1/a8EeFNXk1TE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f05a214a8a3b7c1f44d2c4eed3346908a4e7b28 --- /dev/null +++ b/annotations_1/a8EeFNXk1TE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.72], [11.0, 12.38], [12.0, 12.41], [12.0, 12.45], [15.0, 15.38], [21.0, 21.9], [24.0, 25.42], [32.0, 38.74], [42.0, 46.26], [51.0, 51.48], [56.0, 58.38], [60.0, 60.29], [61.0, 62.36], [63.0, 64.34], [65.0, 67.46]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.18, 38.02, 0.0, 51.66, 0.0, 0.0, 0.0, 95.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 17.08], ["speech", 10.56], ["hum", 6.7]], [["speech", 53.59], ["noise", 5.6], ["sine wave", 3.77]], null, null, null, null, null, null], "duration": [-0.28, 1.38, 0.41, 0.45, 0.38, 0.9, 1.42, 6.74, 4.26, 0.48, 2.38, 0.29, 1.36, 1.34, 2.46]} \ No newline at end of file diff --git a/annotations_1/a8mImo0aNDo_filtered.json b/annotations_1/a8mImo0aNDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cec14281d1387111363fd02374ed1b6e0d74146 --- /dev/null +++ b/annotations_1/a8mImo0aNDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.85], [8.0, 8.41], [12.0, 16.26], [18.0, 18.76], [23.0, 55.38], [57.0, 57.06], [61.0, 61.92], [62.0, 62.78], [65.0, 66.75], [69.0, 75.68], [82.0, 82.9], [87.0, 87.71], [90.0, 90.31], [92.0, 92.87], [95.0, 110.64], [113.0, 123.52], [125.0, 130.2], [130.0, 131.67], [133.0, 134.72], [136.0, 137.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 50.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.57, 0.0, 0.0, 0.0, 0.0, 29.79, 29.76, 28.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 68.61], ["throbbing", 12.75], ["hum", 2.82]], null, null, null, null, [["throbbing", 37.22], ["hum", 35.04], ["music", 14.72]], [["music", 53.99], ["hum", 7.72], ["mains hum", 7.44]], [["music", 46.43], ["speech", 18.79], ["throbbing", 3.54]], null, null, null], "duration": [0.85, 0.41, 4.26, 0.76, 32.38, 0.06, 0.92, 0.78, 1.75, 6.68, 0.9, 0.71, 0.31, 0.87, 15.64, 10.52, 5.2, 1.67, 1.72, 1.08]} \ No newline at end of file diff --git a/annotations_1/aB0ABzNHvAE_filtered.json b/annotations_1/aB0ABzNHvAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9911472e4d172ffad9125296004e3f1b8f71ce1b --- /dev/null +++ b/annotations_1/aB0ABzNHvAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.09], [7.0, 7.65], [10.0, 17.07], [20.0, 22.94], [25.0, 25.71], [28.0, 30.48], [33.0, 35.6], [37.0, 44.0], [47.0, 48.84], [54.0, 55.09], [57.0, 70.5], [72.0, 72.4], [74.0, 77.55], [79.0, 81.46], [82.0, 82.8], [87.0, 88.42], [92.0, 94.2], [97.0, 103.33], [105.0, 107.92], [114.0, 115.59], [117.0, 117.91], [119.0, 123.08], [124.0, 125.0], [126.0, 129.57], [132.0, 150.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 65.91, 62.47, 0.0, 63.31, 63.53, 51.71, 0.0, 0.0, 59.77, 0.0, 89.19, 94.37, 0.0, 0.0, 94.66, 95.78, 95.37, 0.0, 0.0, 77.53, 0.0, 61.67, 72.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.09, 0.65, 7.07, 2.94, 0.71, 2.48, 2.6, 7.0, 1.84, 1.09, 13.5, 0.4, 3.55, 2.46, 0.8, 1.42, 2.2, 6.33, 2.92, 1.59, 0.91, 4.08, 1.0, 3.57, 18.94]} \ No newline at end of file diff --git a/annotations_1/aBxlJkcHDSM_filtered.json b/annotations_1/aBxlJkcHDSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57ec44f7b43b8e43f3bcf0cc5ebafb3f667651e4 --- /dev/null +++ b/annotations_1/aBxlJkcHDSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.61], [4.0, 5.44], [7.0, 8.68], [12.0, 13.29], [15.0, 96.09], [97.0, 98.52], [101.0, 101.14], [103.0, 139.97], [141.0, 141.59], [143.0, 155.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 57.15], ["didgeridoo", 21.86], ["grunt", 14.46]]], "duration": [0.61, 1.44, 1.68, 1.29, 81.09, 1.52, 0.14, 36.97, 0.59, 12.9]} \ No newline at end of file diff --git a/annotations_1/aD4ZPXHAVCA_filtered.json b/annotations_1/aD4ZPXHAVCA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7d837ddb7218560cd2c7b219f4bcbfaa6e2ce20 --- /dev/null +++ b/annotations_1/aD4ZPXHAVCA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.83], [8.0, 8.01], [8.0, 10.62], [14.0, 14.71], [16.0, 17.04], [18.0, 19.48], [22.0, 28.31], [29.0, 30.89], [33.0, 34.26], [35.0, 35.48], [37.0, 37.4], [45.0, 45.6], [49.0, 50.18], [54.0, 54.04], [56.0, 56.0], [57.0, 64.49], [71.0, 88.2], [93.0, 98.78], [101.0, 107.3], [114.0, 114.69], [116.0, 116.34], [118.0, 118.02], [122.0, 122.82], [125.0, 126.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 57.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.35, 29.69, 29.2, 29.62, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 28.63], ["frog", 15.2], ["croak", 14.39]], [["music", 53.96], ["saxophone", 11.21], ["singing", 7.08]], [["music", 87.59], ["music of latin america", 3.27], ["clarinet", 1.44]], [["livestock, farm animals, working animals", 38.08], ["moo", 25.42], ["cattle, bovinae", 21.81]], null, null, null, null, null], "duration": [0.83, 0.01, 2.62, 0.71, 1.04, 1.48, 6.31, 1.89, 1.26, 0.48, 0.4, 0.6, 1.18, 0.04, 0.0, 7.49, 17.2, 5.78, 6.3, 0.69, 0.34, 0.02, 0.82, 1.89]} \ No newline at end of file diff --git a/annotations_1/aDJgv1iARPg_filtered.json b/annotations_1/aDJgv1iARPg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c0c19aba39d56c0114062dec44b8360fa5bbd42 --- /dev/null +++ b/annotations_1/aDJgv1iARPg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.44], [23.0, 22.84], [29.0, 29.71], [31.0, 31.02], [42.0, 43.78], [46.0, 47.07], [67.0, 67.29], [84.0, 84.96], [109.0, 112.89], [114.0, 116.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 59.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.44, -0.16, 0.71, 0.02, 1.78, 1.07, 0.29, 0.96, 3.89, 2.16]} \ No newline at end of file diff --git a/annotations_1/aDU5CcINqyI_filtered.json b/annotations_1/aDU5CcINqyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ed9c3f7f22048b7221f80fb14fbed1f5edc925e --- /dev/null +++ b/annotations_1/aDU5CcINqyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 31.21], [32.0, 36.85], [62.0, 61.89], [64.0, 66.77], [67.0, 77.63], [80.0, 102.96], [105.0, 105.14], [107.0, 107.96], [112.0, 113.32], [114.0, 139.65], [146.0, 151.71], [154.0, 154.77], [156.0, 156.29], [159.0, 164.15], [165.0, 166.06], [169.0, 173.47], [175.0, 175.1]], "keep_status": [false, false, false, true, true, true, false, false, false, true, true, false, false, true, false, true, false], "silence_prob": [31.47, 32.39, 0.0, 36.74, 35.37, 35.34, 0.0, 0.0, 0.0, 29.8, 29.9, 0.0, 0.0, 38.23, 0.0, 40.38, 0.0], "audiomae_on_audioset": [[["music", 57.49], ["hum", 8.86], ["mains hum", 7.33]], [["music", 69.99], ["synthesizer", 4.79], ["musical instrument", 4.61]], null, [["speech", 39.56], ["fly, housefly", 8.49], ["didgeridoo", 5.01]], [["didgeridoo", 29.83], ["music", 24.9], ["throbbing", 13.43]], [["music", 36.62], ["throbbing", 24.9], ["synthesizer", 6.93]], null, null, null, [["music", 29.68], ["whack, thwack", 19.23], ["smash, crash", 15.18]], [["speech", 57.73], ["music", 6.98], ["buzz", 4.26]], null, null, [["speech", 27.67], ["music", 12.09], ["animal", 8.88]], null, [["speech", 22.4], ["music", 18.05], ["didgeridoo", 4.71]], null], "duration": [27.21, 4.85, -0.11, 2.77, 10.63, 22.96, 0.14, 0.96, 1.32, 25.65, 5.71, 0.77, 0.29, 5.15, 1.06, 4.47, 0.1]} \ No newline at end of file diff --git a/annotations_1/aDZSH05DM_c_filtered.json b/annotations_1/aDZSH05DM_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..780603d026bbec3e8e096e8d39761063be5e2f1a --- /dev/null +++ b/annotations_1/aDZSH05DM_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.96], [7.0, 8.53], [9.0, 47.53], [48.0, 48.63], [49.0, 50.43], [51.0, 53.11], [54.0, 56.94], [58.0, 76.45], [78.0, 78.04], [78.0, 81.21], [84.0, 85.04], [86.0, 92.87], [93.0, 98.88], [101.0, 101.14], [101.0, 101.87], [102.0, 102.95], [105.0, 105.58], [108.0, 111.06], [113.0, 113.64], [114.0, 115.18], [116.0, 116.83], [118.0, 121.12], [123.0, 123.65], [124.0, 126.06], [127.0, 153.23], [155.0, 160.08], [161.0, 161.81], [164.0, 173.67], [176.0, 175.95]], "keep_status": [false, false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [83.16, 0.0, 0.0, 0.0, 0.0, 35.94, 34.28, 45.62, 0.0, 38.79, 0.0, 38.78, 34.98, 0.0, 0.0, 0.0, 0.0, 37.61, 0.0, 0.0, 0.0, 39.28, 0.0, 37.89, 34.3, 40.02, 0.0, 29.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 44.18], ["rumble", 6.09], ["mains hum", 5.96]], [["music", 54.8], ["electronic music", 13.87], ["ambient music", 5.67]], [["rumble", 19.61], ["music", 19.1], ["hum", 17.1]], null, [["throbbing", 23.92], ["cattle, bovinae", 18.13], ["livestock, farm animals, working animals", 9.88]], null, [["hum", 37.82], ["throbbing", 22.21], ["speech", 14.95]], [["music", 52.72], ["hum", 17.82], ["throbbing", 13.14]], null, null, null, null, [["music", 53.08], ["throbbing", 8.26], ["hum", 7.44]], null, null, null, [["music", 53.16], ["hum", 16.65], ["throbbing", 14.57]], null, [["music", 58.93], ["hum", 12.37], ["throbbing", 10.59]], [["hum", 40.82], ["throbbing", 28.27], ["music", 13.53]], [["music", 26.72], ["sine wave", 20.37], ["sonar", 13.07]], null, [["hum", 43.63], ["throbbing", 24.97], ["mains hum", 19.35]], null], "duration": [2.96, 1.53, 38.53, 0.63, 1.43, 2.11, 2.94, 18.45, 0.04, 3.21, 1.04, 6.87, 5.88, 0.14, 0.87, 0.95, 0.58, 3.06, 0.64, 1.18, 0.83, 3.12, 0.65, 2.06, 26.23, 5.08, 0.81, 9.67, -0.05]} \ No newline at end of file diff --git a/annotations_1/aDcfm_9GTyU_filtered.json b/annotations_1/aDcfm_9GTyU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..104ecc079ddd3aba39b726305090fe5397b2a161 --- /dev/null +++ b/annotations_1/aDcfm_9GTyU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.42], [21.0, 24.14], [29.0, 29.69], [30.0, 34.94], [36.0, 37.45], [38.0, 46.87]], "keep_status": [true, false, false, true, false, true], "silence_prob": [42.79, 33.6, 0.0, 33.41, 0.0, 31.73], "audiomae_on_audioset": [[["speech", 24.08], ["music", 12.77], ["wind instrument, woodwind instrument", 5.12]], [["theremin", 50.07], ["music", 33.2], ["musical instrument", 2.4]], null, [["music", 47.94], ["theremin", 7.41], ["trombone", 6.53]], null, [["whack, thwack", 39.31], ["speech", 8.2], ["breaking", 4.87]]], "duration": [2.42, 3.14, 0.69, 4.94, 1.45, 8.87]} \ No newline at end of file diff --git a/annotations_1/aDq_JsN2Y6c_filtered.json b/annotations_1/aDq_JsN2Y6c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c743836398ce014ec5947ab899f8d039869fa15 --- /dev/null +++ b/annotations_1/aDq_JsN2Y6c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.78], [10.0, 10.23], [13.0, 12.85], [13.0, 14.08], [14.0, 15.28], [17.0, 17.95], [21.0, 21.39], [25.0, 26.11], [27.0, 28.49], [33.0, 34.97], [37.0, 36.91], [38.0, 38.89], [42.0, 43.78], [48.0, 54.45], [56.0, 61.4], [64.0, 65.38], [66.0, 67.46], [70.0, 69.94], [71.0, 78.31], [80.0, 80.97], [81.0, 85.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.98, 58.89, 0.0, 0.0, 0.0, 58.05, 0.0, 47.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.55], ["speech", 20.71], ["sidetone", 12.46]], null, null, null, null, null, null, [["speech", 46.79], ["music", 14.78], ["hum", 4.11]]], "duration": [0.78, 0.23, -0.15, 1.08, 1.28, 0.95, 0.39, 1.11, 1.49, 1.97, -0.09, 0.89, 1.78, 6.45, 5.4, 1.38, 1.46, -0.06, 7.31, 0.97, 4.41]} \ No newline at end of file diff --git a/annotations_1/aDvjCbdyEHw_filtered.json b/annotations_1/aDvjCbdyEHw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca2b909f8972676f7e158ba126b75bd240fcb33d --- /dev/null +++ b/annotations_1/aDvjCbdyEHw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.28], [14.0, 14.55], [15.0, 16.29], [19.0, 19.06], [20.0, 21.52], [23.0, 22.91], [24.0, 24.21], [30.0, 30.2], [66.0, 66.46], [72.0, 72.84], [96.0, 96.43], [102.0, 101.97], [105.0, 106.08], [119.0, 118.77], [137.0, 143.67], [146.0, 149.99], [151.0, 159.16], [164.0, 171.34], [174.0, 179.04], [179.0, 181.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.56, 33.19, 30.37, 30.23, 30.29, 32.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 69.65], ["sidetone", 5.69], ["synthesizer", 4.67]], [["music", 86.91], ["drum machine", 3.28], ["sampler", 2.11]], [["music", 79.89], ["fly, housefly", 4.88], ["insect", 1.52]], [["music", 85.53], ["electronic music", 3.55], ["throbbing", 2.7]], [["music", 78.23], ["electronic music", 5.27], ["drum machine", 3.9]], [["music", 61.26], ["boing", 5.14], ["electronic music", 4.95]]], "duration": [0.28, 0.55, 1.29, 0.06, 1.52, -0.09, 0.21, 0.2, 0.46, 0.84, 0.43, -0.03, 1.08, -0.23, 6.67, 3.99, 8.16, 7.34, 5.04, 2.18]} \ No newline at end of file diff --git a/annotations_1/aEG9dwOsAAg_filtered.json b/annotations_1/aEG9dwOsAAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e22013af76387e1d9070c3831049d492d8820cfa --- /dev/null +++ b/annotations_1/aEG9dwOsAAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.38], [9.0, 10.54], [12.0, 12.97], [14.0, 14.74], [16.0, 17.51], [25.0, 26.15], [28.0, 30.33], [37.0, 39.85], [47.0, 47.63], [50.0, 50.53], [64.0, 63.86], [98.0, 103.17], [104.0, 109.86], [116.0, 115.96], [118.0, 118.62], [119.0, 120.04], [121.0, 128.46], [129.0, 129.12], [130.0, 130.0], [132.0, 134.74], [135.0, 135.97], [137.0, 139.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 92.64, 0.0, 0.0, 0.0, 32.68, 29.69, 0.0, 0.0, 0.0, 32.46, 0.0, 0.0, 43.1, 0.0, 59.77], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 40.91], ["speech", 24.01], ["sidetone", 15.84]], [["music", 41.37], ["speech", 13.66], ["explosion", 7.83]], null, null, null, [["speech", 34.54], ["music", 19.07], ["sidetone", 11.57]], null, null, [["speech", 23.07], ["music", 15.53], ["sidetone", 8.72]], null, null], "duration": [2.38, 1.54, 0.97, 0.74, 1.51, 1.15, 2.33, 2.85, 0.63, 0.53, -0.14, 5.17, 5.86, -0.04, 0.62, 1.04, 7.46, 0.12, 0.0, 2.74, 0.97, 2.45]} \ No newline at end of file diff --git a/annotations_1/aEIaR1nlEoo_filtered.json b/annotations_1/aEIaR1nlEoo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbbbfd3e2bc2df5fd4e3766fdb5bd1901d59c2c7 --- /dev/null +++ b/annotations_1/aEIaR1nlEoo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.45], [15.0, 20.09], [25.0, 25.76], [28.0, 31.29], [33.0, 33.86], [41.0, 42.74], [44.0, 45.13], [45.0, 45.87], [48.0, 48.03], [49.0, 49.92], [51.0, 59.83], [63.0, 64.35], [69.0, 69.13], [72.0, 72.57], [77.0, 77.67]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 32.49, 0.0, 58.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.16, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 25.18], ["mains hum", 17.45], ["car", 8.78]], null, null, null, null, null, null, null, null, [["speech", 27.75], ["hum", 14.53], ["mains hum", 5.45]], null, null, null, null], "duration": [1.45, 5.09, 0.76, 3.29, 0.86, 1.74, 1.13, 0.87, 0.03, 0.92, 8.83, 1.35, 0.13, 0.57, 0.67]} \ No newline at end of file diff --git a/annotations_1/aEfAFo99jEs_filtered.json b/annotations_1/aEfAFo99jEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a316b2d9bb4c6a0819ec5ba828b6e61621d2350 --- /dev/null +++ b/annotations_1/aEfAFo99jEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.31], [7.0, 12.16], [13.0, 21.78], [23.0, 25.25], [26.0, 34.35], [36.0, 56.81], [58.0, 65.64], [67.0, 70.77], [72.0, 73.45], [75.0, 78.46], [81.0, 94.22], [96.0, 97.56], [104.0, 104.63], [105.0, 106.66], [108.0, 110.13], [114.0, 120.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.95, 61.97, 90.43, 61.97, 84.62, 90.43, 95.64, 0.0, 81.89, 79.59, 0.0, 0.0, 0.0, 97.43, 87.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.31, 5.16, 8.78, 2.25, 8.35, 20.81, 7.64, 3.77, 1.45, 3.46, 13.22, 1.56, 0.63, 1.66, 2.13, 6.72]} \ No newline at end of file diff --git a/annotations_1/aFnS18LM8Ws_filtered.json b/annotations_1/aFnS18LM8Ws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8496630361b1e4f799153d6acb135bc6d489cc90 --- /dev/null +++ b/annotations_1/aFnS18LM8Ws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 35.19], [37.0, 46.28], [46.0, 50.41], [53.0, 53.87], [57.0, 59.04], [61.0, 61.77], [63.0, 64.84], [73.0, 75.05], [76.0, 147.48], [149.0, 151.63], [159.0, 160.1], [161.0, 161.82], [162.0, 173.1], [176.0, 175.98], [177.0, 177.74], [178.0, 184.57]], "keep_status": [true, true, true, false, true, false, false, true, false, false, false, false, true, false, false, true], "silence_prob": [34.65, 30.72, 33.69, 0.0, 36.22, 0.0, 0.0, 29.15, 0.0, 30.0, 0.0, 0.0, 29.67, 0.0, 0.0, 31.5], "audiomae_on_audioset": [[["speech", 24.97], ["music", 24.48], ["fart", 8.96]], [["speech", 35.3], ["music", 16.81], ["buzz", 8.21]], [["speech", 49.76], ["music", 12.95], ["whale vocalization", 6.78]], null, [["music", 36.95], ["hum", 7.79], ["throbbing", 4.71]], null, null, [["zipper (clothing)", 14.07], ["smash, crash", 11.9], ["whack, thwack", 11.68]], null, [["cattle, bovinae", 45.47], ["livestock, farm animals, working animals", 29.54], ["moo", 24.19]], null, null, [["speech", 19.61], ["music", 11.99], ["sidetone", 7.4]], null, null, [["music", 30.93], ["buzz", 11.51], ["didgeridoo", 8.24]]], "duration": [3.19, 9.28, 4.41, 0.87, 2.04, 0.77, 1.84, 2.05, 71.48, 2.63, 1.1, 0.82, 11.1, -0.02, 0.74, 6.57]} \ No newline at end of file diff --git a/annotations_1/aG3Oc5TNd-Y_filtered.json b/annotations_1/aG3Oc5TNd-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..329bf8b8e7a5cca918ce33ad353861dc899883c7 --- /dev/null +++ b/annotations_1/aG3Oc5TNd-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.17], [2.0, 2.24], [2.0, 2.27], [2.0, 10.47], [17.0, 29.66], [33.0, 36.32], [46.0, 47.55], [51.0, 51.14], [52.0, 58.45], [77.0, 77.79], [79.0, 93.46], [95.0, 96.47], [96.0, 96.5], [98.0, 97.88], [98.0, 107.03], [112.0, 112.35], [113.0, 113.1], [114.0, 113.75], [115.0, 140.44]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 28.29, 29.49, 45.08, 0.0, 0.0, 30.3, 0.0, 59.07, 0.0, 0.0, 0.0, 29.26, 0.0, 0.0, 0.0, 36.11], "audiomae_on_audioset": [null, null, null, [["music", 60.43], ["musical instrument", 11.1], ["didgeridoo", 5.28]], [["music", 80.59], ["synthetic singing", 2.78], ["singing", 2.19]], [["boing", 56.1], ["echo", 14.74], ["synthesizer", 5.32]], null, null, [["music", 28.3], ["crowd", 17.34], ["speech", 14.99]], null, null, null, null, null, [["cattle, bovinae", 41.66], ["moo", 27.56], ["livestock, farm animals, working animals", 19.74]], null, null, null, [["music", 26.17], ["speech", 19.46], ["hum", 7.26]]], "duration": [0.17, 0.24, 0.27, 8.47, 12.66, 3.32, 1.55, 0.14, 6.45, 0.79, 14.46, 1.47, 0.5, -0.12, 9.03, 0.35, 0.1, -0.25, 25.44]} \ No newline at end of file diff --git a/annotations_1/aG8bSNpEGoE_filtered.json b/annotations_1/aG8bSNpEGoE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83f9b1d1f536e697fb607771ae60ba79a0167414 --- /dev/null +++ b/annotations_1/aG8bSNpEGoE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.69], [19.0, 19.03], [25.0, 25.83], [31.0, 34.08], [56.0, 56.93], [73.0, 77.99], [80.0, 80.5], [83.0, 86.14], [95.0, 95.69], [101.0, 104.57], [110.0, 111.57], [115.0, 115.2], [126.0, 126.49], [140.0, 147.19]], "keep_status": [false, false, false, true, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.9, 0.0, 32.6, 0.0, 35.25, 0.0, 32.96, 0.0, 0.0, 0.0, 30.95], "audiomae_on_audioset": [null, null, null, [["music", 61.27], ["musical instrument", 4.43], ["synthesizer", 3.63]], null, [["music", 66.0], ["boing", 3.39], ["musical instrument", 1.79]], null, [["music", 52.05], ["hum", 5.92], ["throbbing", 3.96]], null, [["music", 56.88], ["singing", 6.96], ["bass guitar", 2.67]], null, null, null, [["music", 77.17], ["musical instrument", 5.31], ["guitar", 2.64]]], "duration": [1.69, 0.03, 0.83, 3.08, 0.93, 4.99, 0.5, 3.14, 0.69, 3.57, 1.57, 0.2, 0.49, 7.19]} \ No newline at end of file diff --git a/annotations_1/aGMiaQISzq0_filtered.json b/annotations_1/aGMiaQISzq0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79c722ce40a0ca0f2a3cc037cbf220d2d82fa889 --- /dev/null +++ b/annotations_1/aGMiaQISzq0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.97], [10.0, 10.98], [11.0, 40.07], [41.0, 42.23], [43.0, 44.22], [45.0, 47.33], [49.0, 50.65], [52.0, 52.79], [55.0, 56.78], [58.0, 59.04]], "keep_status": [false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 28.19, 0.0, 0.0, 47.05, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 17.37], ["hum", 16.04], ["speech", 14.25]], null, null, [["music", 22.64], ["speech", 14.81], ["foghorn", 13.32]], null, null, null, null], "duration": [0.97, 0.98, 29.07, 1.23, 1.22, 2.33, 1.65, 0.79, 1.78, 1.04]} \ No newline at end of file diff --git a/annotations_1/aHI-JX6Q3Xk_filtered.json b/annotations_1/aHI-JX6Q3Xk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/aHI-JX6Q3Xk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/aHQQs4D3krU_filtered.json b/annotations_1/aHQQs4D3krU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..184ab8e54cfd75e2edb5fd449a8465c5ca0fcffe --- /dev/null +++ b/annotations_1/aHQQs4D3krU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.97], [28.0, 29.66], [31.0, 32.05], [34.0, 35.19], [38.0, 39.11], [40.0, 41.1], [42.0, 44.32], [46.0, 54.14], [56.0, 56.62], [63.0, 64.39], [73.0, 73.94], [78.0, 80.47], [84.0, 84.03], [94.0, 94.63], [96.0, 96.5], [99.0, 100.77], [101.0, 103.37], [105.0, 105.44], [106.0, 106.69], [108.0, 117.27], [124.0, 124.73], [129.0, 131.5], [132.0, 132.58]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.15, 29.75, 0.0, 0.0, 0.0, 29.25, 0.0, 0.0, 0.0, 0.0, 36.81, 0.0, 0.0, 34.94, 0.0, 31.63, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["livestock, farm animals, working animals", 50.24], ["cattle, bovinae", 22.97], ["moo", 20.48]], [["music", 28.65], ["hum", 22.87], ["throbbing", 17.03]], null, null, null, [["music", 28.6], ["speech", 13.44], ["moo", 7.92]], null, null, null, null, [["music", 39.1], ["throbbing", 10.76], ["speech", 9.52]], null, null, [["music", 78.33], ["speech", 6.7], ["electronic music", 1.73]], null, [["music", 75.65], ["yodeling", 3.29], ["middle eastern music", 1.02]], null], "duration": [0.97, 1.66, 1.05, 1.19, 1.11, 1.1, 2.32, 8.14, 0.62, 1.39, 0.94, 2.47, 0.03, 0.63, 0.5, 1.77, 2.37, 0.44, 0.69, 9.27, 0.73, 2.5, 0.58]} \ No newline at end of file diff --git a/annotations_1/aJZL2uoPRZg_filtered.json b/annotations_1/aJZL2uoPRZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61a009632d6ae4aa17d776562dcdd3bd44cbe57f --- /dev/null +++ b/annotations_1/aJZL2uoPRZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.05], [6.0, 6.51], [11.0, 11.89], [14.0, 14.18], [15.0, 15.4], [18.0, 19.23], [22.0, 22.84], [24.0, 24.73], [25.0, 26.25], [27.0, 27.67], [32.0, 32.59], [35.0, 38.5], [39.0, 41.71], [45.0, 47.73], [50.0, 51.54], [52.0, 55.02], [57.0, 59.98], [61.0, 64.32], [65.0, 65.97], [69.0, 70.43], [72.0, 78.83], [82.0, 90.21], [92.0, 92.43], [92.0, 92.48], [95.0, 96.11], [97.0, 97.7], [101.0, 101.97], [106.0, 106.76], [108.0, 108.18], [110.0, 111.4], [112.0, 114.05], [119.0, 134.7], [140.0, 140.8], [143.0, 146.64], [152.0, 156.86], [159.0, 159.85], [160.0, 164.42], [165.0, 166.97], [167.0, 167.91], [169.0, 173.1], [175.0, 176.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 80.11, 97.22, 0.0, 62.78, 97.83, 63.42, 0.0, 0.0, 30.81, 30.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.77, 30.43, 0.0, 53.28, 84.43, 0.0, 59.07, 0.0, 0.0, 88.1, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 77.46], ["throbbing", 9.39], ["electronic music", 3.75]], [["music", 72.91], ["electronic music", 6.42], ["throbbing", 6.11]], null, null, null, null, null, null, null, null, [["music", 55.74], ["throbbing", 6.77], ["electronic music", 6.75]], [["music", 52.87], ["throbbing", 12.14], ["electronic music", 6.06]], null, null, null, null, null, null, null, null, null], "duration": [1.05, 0.51, 0.89, 0.18, 0.4, 1.23, 0.84, 0.73, 1.25, 0.67, 0.59, 3.5, 2.71, 2.73, 1.54, 3.02, 2.98, 3.32, 0.97, 1.43, 6.83, 8.21, 0.43, 0.48, 1.11, 0.7, 0.97, 0.76, 0.18, 1.4, 2.05, 15.7, 0.8, 3.64, 4.86, 0.85, 4.42, 1.97, 0.91, 4.1, 1.15]} \ No newline at end of file diff --git a/annotations_1/aJgS31WWIG8_filtered.json b/annotations_1/aJgS31WWIG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c03921ecc74d00c7f416d49d805074a288f1c464 --- /dev/null +++ b/annotations_1/aJgS31WWIG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.35], [21.0, 77.5], [78.0, 80.0], [82.0, 83.35]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 43.28, 0.0], "audiomae_on_audioset": [null, null, [["chirp tone", 14.2], ["music", 12.79], ["synthesizer", 7.37]], null], "duration": [0.35, 56.5, 2.0, 1.35]} \ No newline at end of file diff --git a/annotations_1/aKE0S2gCOfc_filtered.json b/annotations_1/aKE0S2gCOfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70a2f479883eb642036ae82ef802ad80f7e379e0 --- /dev/null +++ b/annotations_1/aKE0S2gCOfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.15], [10.0, 52.76], [55.0, 54.94], [57.0, 56.71], [60.0, 64.0], [68.0, 95.0], [96.0, 95.94], [99.0, 114.08], [115.0, 121.05], [124.0, 131.43], [132.0, 133.24], [137.0, 136.98], [137.0, 143.16], [147.0, 172.2], [173.0, 173.85], [174.0, 173.89]], "keep_status": [false, false, false, false, false, false, false, true, true, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.41, 30.75, 0.0, 31.05, 34.11, 31.35, 0.0, 0.0, 31.86, 32.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 62.53], ["throbbing", 11.21], ["hum", 8.22]], [["music", 40.8], ["hum", 24.21], ["mains hum", 16.66]], null, [["hum", 19.45], ["speech", 17.58], ["throbbing", 11.47]], [["speech", 26.3], ["hum", 14.69], ["mains hum", 13.73]], [["hum", 24.23], ["mains hum", 19.37], ["speech", 13.41]], null, null, [["speech", 53.16], ["music", 13.72], ["hum", 5.04]], [["hum", 35.58], ["throbbing", 17.01], ["music", 14.35]], null, null], "duration": [1.15, 42.76, -0.06, -0.29, 4.0, 27.0, -0.06, 15.08, 6.05, 7.43, 1.24, -0.02, 6.16, 25.2, 0.85, -0.11]} \ No newline at end of file diff --git a/annotations_1/aKtrjeCFCAg_filtered.json b/annotations_1/aKtrjeCFCAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2b91bfb215aa4d97228cf474e3e6001df6a88fb --- /dev/null +++ b/annotations_1/aKtrjeCFCAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.39], [10.0, 10.74], [23.0, 29.03], [31.0, 32.27], [33.0, 52.39], [59.0, 59.53], [62.0, 63.09], [70.0, 73.41], [78.0, 78.31], [86.0, 86.86], [89.0, 89.21], [89.0, 89.4], [89.0, 91.52], [96.0, 95.94], [103.0, 103.57], [107.0, 108.36], [117.0, 118.2], [120.0, 119.99], [121.0, 122.23], [131.0, 132.22], [135.0, 136.59], [138.0, 138.4], [139.0, 139.77], [142.0, 143.67], [159.0, 159.12], [165.0, 171.14], [172.0, 172.99], [174.0, 174.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.63, 0.0, 34.0, 0.0, 0.0, 53.4, 0.0, 0.0, 0.0, 0.0, 34.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 71.48], ["speech", 15.43], ["hum", 1.77]], null, null, null, null, null, null, null, [["whale vocalization", 26.28], ["roaring cats (lions, tigers)", 9.41], ["speech", 8.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, 0.74, 6.03, 1.27, 19.39, 0.53, 1.09, 3.41, 0.31, 0.86, 0.21, 0.4, 2.52, -0.06, 0.57, 1.36, 1.2, -0.01, 1.23, 1.22, 1.59, 0.4, 0.77, 1.67, 0.12, 6.14, 0.99, 0.83]} \ No newline at end of file diff --git a/annotations_1/aL4dQo8iBLo_filtered.json b/annotations_1/aL4dQo8iBLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c3c642e5e440b9e6454aab99ecd41f7a906fe80 --- /dev/null +++ b/annotations_1/aL4dQo8iBLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.01], [15.0, 15.3], [16.0, 49.96], [79.0, 81.57], [82.0, 83.52], [89.0, 89.72], [95.0, 96.92], [101.0, 106.19], [109.0, 118.71], [120.0, 120.38]], "keep_status": [false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.31, 0.0, 0.0, 0.0, 28.98, 29.72, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 33.5], ["hum", 12.59], ["mains hum", 7.78]], null, null, null, [["music", 30.14], ["throbbing", 25.92], ["speech", 13.64]], [["mains hum", 60.81], ["hum", 35.71], ["throbbing", 2.97]], null], "duration": [1.01, 0.3, 33.96, 2.57, 1.52, 0.72, 1.92, 5.19, 9.71, 0.38]} \ No newline at end of file diff --git a/annotations_1/aL_6-dQCzwg_filtered.json b/annotations_1/aL_6-dQCzwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..825210b6dba41e5bb7baaba93b3b99d5e1167491 --- /dev/null +++ b/annotations_1/aL_6-dQCzwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 42.77], [44.0, 64.15], [64.0, 73.2], [78.0, 80.59], [82.0, 83.1], [84.0, 110.54], [113.0, 114.08], [115.0, 124.28], [127.0, 127.43]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 53.59, 53.53, 41.78, 0.0, 34.49, 0.0, 36.89, 0.0], "audiomae_on_audioset": [null, null, null, [["singing bowl", 47.0], ["music", 14.82], ["speech", 9.61]], null, [["music", 57.06], ["wind instrument, woodwind instrument", 7.11], ["clarinet", 5.61]], null, [["music", 73.27], ["clarinet", 3.86], ["saxophone", 2.76]], null], "duration": [31.77, 20.15, 9.2, 2.59, 1.1, 26.54, 1.08, 9.28, 0.43]} \ No newline at end of file diff --git a/annotations_1/aNDj-H1jxV0_filtered.json b/annotations_1/aNDj-H1jxV0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0684ca8b1b556551f9e670652cb3a270ba74161 --- /dev/null +++ b/annotations_1/aNDj-H1jxV0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.42], [23.0, 26.82], [29.0, 30.05], [31.0, 32.49], [37.0, 38.92], [47.0, 52.41], [53.0, 54.21], [68.0, 68.23], [78.0, 78.43], [81.0, 80.77], [82.0, 83.73], [85.0, 89.33], [90.0, 91.57], [102.0, 103.4], [105.0, 105.61], [107.0, 108.5], [111.0, 111.25], [115.0, 115.82], [121.0, 122.23], [130.0, 130.08], [135.0, 135.85], [136.0, 136.43], [139.0, 140.73], [144.0, 144.36], [147.0, 148.05], [151.0, 151.51], [154.0, 154.99], [160.0, 159.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 91.64, 0.0, 0.0, 0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 3.82, 1.05, 1.49, 1.92, 5.41, 1.21, 0.23, 0.43, -0.23, 1.73, 4.33, 1.57, 1.4, 0.61, 1.5, 0.25, 0.82, 1.23, 0.08, 0.85, 0.43, 1.73, 0.36, 1.05, 0.51, 0.99, -0.07]} \ No newline at end of file diff --git a/annotations_1/aNbtnYXp9-k_filtered.json b/annotations_1/aNbtnYXp9-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2311a2050fb21a5f89a5a0f2faf437316ea22944 --- /dev/null +++ b/annotations_1/aNbtnYXp9-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.97], [6.0, 6.84], [9.0, 9.9], [12.0, 15.18], [23.0, 23.06], [25.0, 25.25], [38.0, 38.5], [39.0, 38.64], [51.0, 55.39], [56.0, 64.15], [70.0, 72.0], [74.0, 77.75], [80.0, 81.85], [98.0, 98.34], [105.0, 104.79], [109.0, 112.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [86.09, 0.0, 0.0, 67.63, 0.0, 0.0, 0.0, 0.0, 33.13, 32.48, 35.14, 32.18, 0.0, 0.0, 0.0, 35.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 58.42], ["speech", 8.64], ["electronic music", 7.48]], [["music", 42.57], ["throbbing", 24.67], ["speech", 11.44]], [["music", 60.06], ["synthesizer", 8.88], ["musical instrument", 6.24]], [["music", 68.28], ["speech", 9.11], ["electronic music", 6.26]], null, null, null, [["music", 67.63], ["sidetone", 12.73], ["drum machine", 2.45]]], "duration": [2.97, 0.84, 0.9, 3.18, 0.06, 0.25, 0.5, -0.36, 4.39, 8.15, 2.0, 3.75, 1.85, 0.34, -0.21, 3.7]} \ No newline at end of file diff --git a/annotations_1/aOX72bZr_LA_filtered.json b/annotations_1/aOX72bZr_LA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe70b89c45eac42df523f74fc79a369a5a9fca3c --- /dev/null +++ b/annotations_1/aOX72bZr_LA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.61], [9.0, 10.71], [14.0, 14.84], [19.0, 20.04], [26.0, 26.43], [36.0, 36.29], [37.0, 38.38], [40.0, 41.2], [42.0, 44.66], [47.0, 47.88], [67.0, 72.42], [73.0, 74.38], [78.0, 78.95], [91.0, 91.23], [92.0, 94.32], [98.0, 98.49], [101.0, 102.88], [105.0, 111.84], [113.0, 116.95], [120.0, 121.02], [123.0, 123.57], [125.0, 126.79], [128.0, 130.08], [133.0, 135.01], [135.0, 136.76], [137.0, 138.27], [139.0, 144.09], [145.0, 146.35], [148.0, 149.82], [152.0, 195.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 71.57, 0.0, 0.0, 0.0, 79.94, 0.0, 0.0, 67.63, 64.63, 0.0, 0.0, 0.0, 54.97, 54.5, 0.0, 0.0, 52.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 1.71, 0.84, 1.04, 0.43, 0.29, 1.38, 1.2, 2.66, 0.88, 5.42, 1.38, 0.95, 0.23, 2.32, 0.49, 1.88, 6.84, 3.95, 1.02, 0.57, 1.79, 2.08, 2.01, 1.76, 1.27, 5.09, 1.35, 1.82, 43.02]} \ No newline at end of file diff --git a/annotations_1/aP7GTu8tbvQ_filtered.json b/annotations_1/aP7GTu8tbvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb71893cd1b4b49aad16f7bb0c294a0f0d485937 --- /dev/null +++ b/annotations_1/aP7GTu8tbvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.44], [8.0, 9.15], [15.0, 16.14], [19.0, 19.38], [21.0, 22.76], [26.0, 26.15], [28.0, 28.7], [31.0, 31.83], [40.0, 43.07], [45.0, 46.62], [47.0, 48.37], [51.0, 52.3], [55.0, 58.89], [60.0, 64.39], [66.0, 66.51], [67.0, 68.15], [68.0, 68.82], [70.0, 70.34], [75.0, 75.63], [78.0, 80.54], [88.0, 88.33], [91.0, 90.85], [93.0, 93.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [36.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.56, 0.0, 0.0, 0.0, 48.56, 38.49, 0.0, 0.0, 0.0, 0.0, 0.0, 36.38, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["snicker", 42.1], ["chuckle, chortle", 24.18], ["laughter", 10.02]], null, null, null, null, null, null, null, null, null, null, null, [["music", 79.4], ["musical instrument", 3.56], ["brass instrument", 2.76]], [["music", 42.5], ["synthesizer", 15.44], ["didgeridoo", 10.01]], null, null, null, null, null, [["laughter", 18.7], ["baby laughter", 16.47], ["snicker", 12.45]], null, null, null], "duration": [2.44, 1.15, 1.14, 0.38, 1.76, 0.15, 0.7, 0.83, 3.07, 1.62, 1.37, 1.3, 3.89, 4.39, 0.51, 1.15, 0.82, 0.34, 0.63, 2.54, 0.33, -0.15, 0.95]} \ No newline at end of file diff --git a/annotations_1/aPFbf954LJ0_filtered.json b/annotations_1/aPFbf954LJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a906a67d4aaf7402c41f466ac7d8a4f2740d450 --- /dev/null +++ b/annotations_1/aPFbf954LJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 35.95], [59.0, 58.97], [72.0, 72.49], [78.0, 78.36], [82.0, 82.34], [103.0, 103.57], [105.0, 106.1], [125.0, 125.73], [133.0, 133.62]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [-0.05, -0.03, 0.49, 0.36, 0.34, 0.57, 1.1, 0.73, 0.62]} \ No newline at end of file diff --git a/annotations_1/aPUaHUwJJk8_filtered.json b/annotations_1/aPUaHUwJJk8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90551e3901056b20cb4750d14ade1faab5003028 --- /dev/null +++ b/annotations_1/aPUaHUwJJk8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 72.23], [74.0, 96.87], [98.0, 99.01], [100.0, 105.24], [108.0, 109.41], [112.0, 113.31], [114.0, 113.85], [114.0, 114.32], [117.0, 117.37], [119.0, 119.4], [124.0, 145.27]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.44, 0.0, 32.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.69], "audiomae_on_audioset": [null, [["music", 55.09], ["hum", 12.1], ["throbbing", 10.45]], null, [["speech", 30.07], ["music", 23.7], ["gunshot, gunfire", 9.03]], null, null, null, null, null, null, [["hum", 37.68], ["mains hum", 21.17], ["throbbing", 14.7]]], "duration": [48.23, 22.87, 1.01, 5.24, 1.41, 1.31, -0.15, 0.32, 0.37, 0.4, 21.27]} \ No newline at end of file diff --git a/annotations_1/aPdLYN69cfE_filtered.json b/annotations_1/aPdLYN69cfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffee9e0e1f6fbc91e829115dc4948dbbd089223e --- /dev/null +++ b/annotations_1/aPdLYN69cfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.96], [4.0, 5.16], [6.0, 6.51], [7.0, 11.23], [12.0, 13.15], [23.0, 23.28], [24.0, 37.72], [43.0, 46.52], [47.0, 95.89], [97.0, 105.63], [106.0, 129.95], [131.0, 169.94]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [44.26, 0.0, 0.0, 31.11, 0.0, 0.0, 35.62, 36.2, 0.0, 47.27, 28.78, 0.0], "audiomae_on_audioset": [[["hum", 20.14], ["mains hum", 18.81], ["music", 17.3]], null, null, [["speech", 80.25], ["music", 3.65], ["whale vocalization", 3.32]], null, null, [["music", 60.66], ["sonar", 10.43], ["electronic music", 5.52]], [["music", 74.16], ["musical instrument", 5.42], ["synthesizer", 3.02]], null, [["music", 57.63], ["electronic music", 7.72], ["synthesizer", 7.11]], [["speech", 41.52], ["music", 20.43], ["mains hum", 6.68]], null], "duration": [2.96, 1.16, 0.51, 4.23, 1.15, 0.28, 13.72, 3.52, 48.89, 8.63, 23.95, 38.94]} \ No newline at end of file diff --git a/annotations_1/aPdxMGV1Y28_filtered.json b/annotations_1/aPdxMGV1Y28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71ec11589db79c1753e32bbd7edf29a1b9a4f8a5 --- /dev/null +++ b/annotations_1/aPdxMGV1Y28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.67], [29.0, 31.04], [33.0, 34.75], [36.0, 38.45], [40.0, 46.04], [47.0, 49.74], [51.0, 52.89], [54.0, 56.12], [58.0, 58.77], [60.0, 64.1], [65.0, 66.16], [67.0, 70.29], [71.0, 77.16], [78.0, 88.06], [94.0, 120.01], [121.0, 120.95], [122.0, 122.79], [125.0, 127.09], [128.0, 136.44], [137.0, 137.19], [137.0, 140.53], [144.0, 161.74]], "keep_status": [false, true, false, true, true, true, false, true, false, false, false, true, true, true, true, false, false, true, true, false, false, true], "silence_prob": [0.0, 37.74, 0.0, 41.85, 43.18, 40.41, 0.0, 37.69, 0.0, 37.31, 0.0, 33.94, 34.85, 33.87, 29.43, 0.0, 0.0, 29.56, 31.44, 0.0, 28.45, 28.21], "audiomae_on_audioset": [null, [["gong", 22.83], ["music", 17.86], ["ambient music", 13.36]], null, [["music", 48.18], ["sonar", 9.31], ["ambient music", 7.76]], [["music", 45.62], ["crow", 5.26], ["caw", 4.68]], [["quack", 14.71], ["frog", 14.35], ["gong", 7.53]], null, [["music", 44.52], ["gong", 7.37], ["electronic music", 6.53]], null, [["music", 39.21], ["gong", 27.89], ["electronic music", 10.2]], null, [["caw", 23.13], ["music", 15.49], ["crow", 14.59]], [["speech", 33.39], ["caw", 13.13], ["crow", 5.93]], [["music", 34.13], ["caw", 17.17], ["crow", 11.18]], [["hum", 21.27], ["mains hum", 19.81], ["music", 18.5]], null, null, [["music", 33.18], ["theremin", 21.75], ["civil defense siren", 6.99]], [["music", 25.47], ["whack, thwack", 14.32], ["hum", 6.85]], null, [["groan", 64.43], ["music", 14.2], ["grunt", 9.72]], [["music", 38.78], ["buzz", 6.77], ["outside, rural or natural", 3.89]]], "duration": [1.67, 2.04, 1.75, 2.45, 6.04, 2.74, 1.89, 2.12, 0.77, 4.1, 1.16, 3.29, 6.16, 10.06, 26.01, -0.05, 0.79, 2.09, 8.44, 0.19, 3.53, 17.74]} \ No newline at end of file diff --git a/annotations_1/aQqAUXKn7t4_filtered.json b/annotations_1/aQqAUXKn7t4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..392faab964b2b5d358ba70ecef62430ca8cb325a --- /dev/null +++ b/annotations_1/aQqAUXKn7t4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.69], [10.0, 10.27], [14.0, 14.45], [16.0, 21.15], [23.0, 28.51], [32.0, 32.21], [36.0, 37.15], [39.0, 38.74], [39.0, 39.61], [41.0, 41.0], [51.0, 54.19], [57.0, 59.37], [60.0, 60.42], [61.0, 63.41], [64.0, 137.37], [143.0, 149.01], [150.0, 150.89], [151.0, 152.51], [153.0, 154.85], [161.0, 161.94], [179.0, 179.63], [180.0, 181.25], [187.0, 187.96], [196.0, 200.06]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.68, 32.85, 0.0, 0.0, 0.0, 0.0, 0.0, 40.75, 40.88, 0.0, 38.66, 0.0, 39.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, [["hum", 25.61], ["mains hum", 25.19], ["music", 17.3]], [["fly, housefly", 45.56], ["insect", 21.52], ["bee, wasp, etc.", 9.31]], null, null, null, null, null, [["cattle, bovinae", 33.28], ["livestock, farm animals, working animals", 25.41], ["moo", 21.42]], [["fly, housefly", 37.91], ["insect", 22.83], ["mosquito", 15.14]], null, [["moo", 45.39], ["cattle, bovinae", 30.6], ["livestock, farm animals, working animals", 16.78]], null, [["fly, housefly", 27.8], ["insect", 14.23], ["speech", 8.29]], null, null, null, null, null, null, null, null], "duration": [0.69, 0.27, 0.45, 5.15, 5.51, 0.21, 1.15, -0.26, 0.61, 0.0, 3.19, 2.37, 0.42, 2.41, 73.37, 6.01, 0.89, 1.51, 1.85, 0.94, 0.63, 1.25, 0.96, 4.06]} \ No newline at end of file diff --git a/annotations_1/aRPInpAD3_o_filtered.json b/annotations_1/aRPInpAD3_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed1f5f5c475e4b1224492859bdca1011bd223957 --- /dev/null +++ b/annotations_1/aRPInpAD3_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.36], [2.0, 2.96], [3.0, 4.23], [31.0, 33.34], [53.0, 69.77], [71.0, 84.79], [90.0, 89.68], [109.0, 109.49], [116.0, 116.31], [117.0, 116.72], [121.0, 126.15], [130.0, 129.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.99, 33.15, 30.43, 0.0, 0.0, 0.0, 0.0, 36.59, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 76.53], ["electronic music", 5.17], ["throbbing", 3.5]], [["music", 38.35], ["speech", 25.9], ["didgeridoo", 10.25]], null, null, null, null, [["music", 77.4], ["fart", 2.55], ["boing", 1.79]], null], "duration": [0.36, 0.96, 1.23, 2.34, 16.77, 13.79, -0.32, 0.49, 0.31, -0.28, 5.15, -0.04]} \ No newline at end of file diff --git a/annotations_1/aRav_8OWESA_filtered.json b/annotations_1/aRav_8OWESA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6d2905eff05e22a14479e7f8f5ad4cb439be193 --- /dev/null +++ b/annotations_1/aRav_8OWESA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.75], [5.0, 6.69], [9.0, 9.63], [17.0, 18.82], [29.0, 33.15], [34.0, 34.28], [38.0, 39.18], [48.0, 51.29], [57.0, 57.99], [60.0, 71.1], [79.0, 80.57], [93.0, 93.38], [95.0, 95.18], [96.0, 97.38], [100.0, 102.24], [106.0, 107.38], [115.0, 115.96], [121.0, 124.06], [124.0, 124.8], [126.0, 127.45], [129.0, 130.99], [134.0, 135.19], [138.0, 138.48], [139.0, 141.37], [146.0, 146.65]], "keep_status": [true, false, false, false, true, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [32.56, 0.0, 0.0, 0.0, 31.66, 0.0, 0.0, 32.11, 0.0, 31.64, 0.0, 0.0, 0.0, 0.0, 36.32, 0.0, 0.0, 32.38, 0.0, 0.0, 0.0, 0.0, 0.0, 36.38, 0.0], "audiomae_on_audioset": [[["mosquito", 26.43], ["fly, housefly", 13.68], ["insect", 11.59]], null, null, null, [["music", 44.53], ["speech", 14.13], ["boing", 6.44]], null, null, [["music", 28.03], ["speech", 24.75], ["theremin", 6.97]], null, [["fly, housefly", 27.13], ["insect", 15.42], ["moo", 11.24]], null, null, null, null, [["music", 30.06], ["echo", 10.08], ["reverberation", 8.47]], null, null, [["moo", 36.13], ["cattle, bovinae", 25.46], ["livestock, farm animals, working animals", 12.56]], null, null, null, null, null, [["music", 55.22], ["guitar", 6.88], ["musical instrument", 6.07]], null], "duration": [2.75, 1.69, 0.63, 1.82, 4.15, 0.28, 1.18, 3.29, 0.99, 11.1, 1.57, 0.38, 0.18, 1.38, 2.24, 1.38, 0.96, 3.06, 0.8, 1.45, 1.99, 1.19, 0.48, 2.37, 0.65]} \ No newline at end of file diff --git a/annotations_1/aSajnx9QK-0_filtered.json b/annotations_1/aSajnx9QK-0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a62e4b024215da840ca0b009efa83a8d1f696716 --- /dev/null +++ b/annotations_1/aSajnx9QK-0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 15.3], [16.0, 16.92], [19.0, 20.14], [22.0, 23.13], [24.0, 27.62], [29.0, 29.57], [32.0, 32.76], [34.0, 35.16], [43.0, 44.05], [46.0, 46.14], [48.0, 50.53], [51.0, 51.7], [53.0, 56.25], [58.0, 58.95], [60.0, 64.0], [67.0, 75.22], [76.0, 89.95], [91.0, 91.54], [113.0, 114.67], [115.0, 115.84], [117.0, 117.73], [120.0, 120.7], [124.0, 125.78], [127.0, 128.87], [131.0, 131.06], [132.0, 135.97], [138.0, 138.84], [142.0, 144.51], [145.0, 147.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.81, 0.0, 0.0, 0.0, 57.89, 0.0, 0.0, 0.0, 0.0, 0.0, 50.76, 0.0, 39.22, 0.0, 36.79, 33.69, 33.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.51, 0.0, 71.0, 70.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 19.16], ["speech", 12.72], ["music", 11.68]], null, [["speech", 36.2], ["buzz", 14.19], ["sidetone", 10.06]], [["speech", 79.59], ["cattle, bovinae", 3.07], ["livestock, farm animals, working animals", 2.22]], [["hum", 27.01], ["mains hum", 26.91], ["speech", 19.55]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.3, 0.92, 1.14, 1.13, 3.62, 0.57, 0.76, 1.16, 1.05, 0.14, 2.53, 0.7, 3.25, 0.95, 4.0, 8.22, 13.95, 0.54, 1.67, 0.84, 0.73, 0.7, 1.78, 1.87, 0.06, 3.97, 0.84, 2.51, 2.36]} \ No newline at end of file diff --git a/annotations_1/aSsFjcw8R3Y_filtered.json b/annotations_1/aSsFjcw8R3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc2f447d145260181f589257627cb77234a4b38f --- /dev/null +++ b/annotations_1/aSsFjcw8R3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 16.93], [19.0, 26.23], [29.0, 29.71], [32.0, 32.49], [34.0, 34.23], [35.0, 36.41], [38.0, 39.77], [42.0, 64.27], [65.0, 64.91], [70.0, 69.89], [71.0, 73.48], [74.0, 76.86], [78.0, 78.22], [81.0, 81.35], [84.0, 84.47], [88.0, 88.53], [91.0, 91.76], [93.0, 93.97], [95.0, 96.01], [111.0, 111.28], [114.0, 114.05], [122.0, 122.03], [122.0, 122.08], [122.0, 122.47], [123.0, 122.57], [123.0, 123.2], [125.0, 125.91], [129.0, 128.76]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.05, 30.16, 0.0, 0.0, 0.0, 0.0, 0.0, 31.59, 0.0, 0.0, 98.73, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.22], ["speech", 17.04], ["throbbing", 6.09]], [["throbbing", 40.04], ["hum", 28.65], ["music", 21.99]], null, null, null, null, null, [["music", 52.81], ["throbbing", 7.24], ["speech", 5.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [15.93, 7.23, 0.71, 0.49, 0.23, 1.41, 1.77, 22.27, -0.09, -0.11, 2.48, 2.86, 0.22, 0.35, 0.47, 0.53, 0.76, 0.97, 1.01, 0.28, 0.05, 0.03, 0.08, 0.47, -0.43, 0.2, 0.91, -0.24]} \ No newline at end of file diff --git a/annotations_1/aSwH4lpuKE8_filtered.json b/annotations_1/aSwH4lpuKE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d5ac4b1f1b60431d040ec93cfacf7707dcaa8fe --- /dev/null +++ b/annotations_1/aSwH4lpuKE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [11.0, 12.66], [25.0, 26.03], [28.0, 28.21], [37.0, 38.65], [53.0, 54.19], [56.0, 56.3], [63.0, 65.53], [66.0, 67.69]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.63, 1.66, 1.03, 0.21, 1.65, 1.19, 0.3, 2.53, 1.69]} \ No newline at end of file diff --git a/annotations_1/aSwi8mzc1gA_filtered.json b/annotations_1/aSwi8mzc1gA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c214bd1c7a42199f94d1c2049ec06efdc75c05a --- /dev/null +++ b/annotations_1/aSwi8mzc1gA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.02], [3.0, 14.4], [15.0, 15.85], [17.0, 17.27], [18.0, 18.79], [20.0, 21.05], [22.0, 22.23], [27.0, 29.84], [32.0, 33.0], [36.0, 36.56], [37.0, 39.83], [40.0, 41.77], [46.0, 46.16], [48.0, 47.9], [50.0, 51.76], [53.0, 53.38], [55.0, 57.57], [59.0, 58.89], [59.0, 59.75], [63.0, 76.99], [79.0, 81.08], [85.0, 85.78], [86.0, 87.42], [93.0, 93.53], [94.0, 94.05], [94.0, 95.59], [97.0, 97.92], [99.0, 99.2], [99.0, 99.67], [103.0, 102.9], [106.0, 105.71], [109.0, 109.54], [110.0, 111.28], [112.0, 115.86], [121.0, 122.44], [124.0, 131.08], [134.0, 133.62], [135.0, 148.61], [150.0, 150.47], [153.0, 155.01], [157.0, 156.84], [159.0, 159.66], [165.0, 165.64], [166.0, 166.58], [169.0, 170.31], [173.0, 173.7], [176.0, 178.61], [179.0, 180.32], [181.0, 181.52], [182.0, 182.26], [183.0, 183.36], [187.0, 189.23], [193.0, 196.74], [197.0, 198.32], [199.0, 203.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 92.64, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.59, 0.0, 85.9, 0.0, 50.66, 0.0, 39.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 0.0, 0.0, 0.0, 68.41, 75.23, 0.0, 60.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 19.05], ["chirp tone", 17.56], ["sine wave", 16.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 11.4, 0.85, 0.27, 0.79, 1.05, 0.23, 2.84, 1.0, 0.56, 2.83, 1.77, 0.16, -0.1, 1.76, 0.38, 2.57, -0.11, 0.75, 13.99, 2.08, 0.78, 1.42, 0.53, 0.05, 1.59, 0.92, 0.2, 0.67, -0.1, -0.29, 0.54, 1.28, 3.86, 1.44, 7.08, -0.38, 13.61, 0.47, 2.01, -0.16, 0.66, 0.64, 0.58, 1.31, 0.7, 2.61, 1.32, 0.52, 0.26, 0.36, 2.23, 3.74, 1.32, 4.96]} \ No newline at end of file diff --git a/annotations_1/aTSa6E4_Zgs_filtered.json b/annotations_1/aTSa6E4_Zgs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5eae597a09e2f6165e08de4640f7934dca5ba07 --- /dev/null +++ b/annotations_1/aTSa6E4_Zgs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 39.93], [41.0, 43.23], [44.0, 46.5], [47.0, 48.36], [50.0, 53.15], [54.0, 55.46], [57.0, 58.89], [59.0, 67.83], [69.0, 72.79], [81.0, 81.31], [85.0, 86.76], [88.0, 89.04], [89.0, 93.39], [94.0, 110.96], [113.0, 113.07], [116.0, 116.38]], "keep_status": [false, true, true, false, true, false, false, true, true, false, false, false, true, true, false, false], "silence_prob": [31.46, 33.75, 33.01, 0.0, 31.17, 0.0, 0.0, 32.51, 31.58, 0.0, 0.0, 0.0, 30.81, 29.95, 0.0, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 34.89], ["moo", 20.95], ["livestock, farm animals, working animals", 19.99]], [["speech", 24.73], ["music", 12.01], ["mains hum", 6.82]], [["speech", 26.27], ["vehicle", 24.13], ["car", 6.2]], null, [["music", 11.94], ["vehicle", 10.3], ["car", 7.9]], null, null, [["music", 37.05], ["theremin", 6.13], ["synthesizer", 4.42]], [["music", 50.65], ["mains hum", 6.57], ["electronic music", 6.11]], null, null, null, [["music", 31.14], ["speech", 12.86], ["synthesizer", 6.16]], [["livestock, farm animals, working animals", 30.77], ["cattle, bovinae", 6.72], ["hum", 6.38]], null, null], "duration": [7.93, 2.23, 2.5, 1.36, 3.15, 1.46, 1.89, 8.83, 3.79, 0.31, 1.76, 1.04, 4.39, 16.96, 0.07, 0.38]} \ No newline at end of file diff --git a/annotations_1/aTc9vNCS8vo_filtered.json b/annotations_1/aTc9vNCS8vo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46c90e90d64b7866fc8edf0ea50b2f42da63cc36 --- /dev/null +++ b/annotations_1/aTc9vNCS8vo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.43], [8.0, 9.56], [12.0, 12.87], [15.0, 14.96], [28.0, 33.44], [33.0, 33.51], [34.0, 34.33], [46.0, 51.93], [53.0, 56.24], [62.0, 80.86], [82.0, 84.13], [85.0, 86.37], [87.0, 86.75], [88.0, 88.69], [90.0, 91.1], [94.0, 94.69], [97.0, 101.01], [108.0, 109.07], [109.0, 110.71], [111.0, 119.97], [121.0, 129.25], [130.0, 131.73], [134.0, 134.01], [136.0, 137.13], [137.0, 137.42], [140.0, 140.19], [141.0, 142.99], [146.0, 145.76], [149.0, 153.15], [153.0, 155.9], [156.0, 157.98], [159.0, 159.48], [160.0, 160.84], [163.0, 163.56], [165.0, 165.62], [170.0, 171.8], [174.0, 176.39], [179.0, 179.83], [181.0, 181.03], [182.0, 182.53], [183.0, 183.88], [185.0, 185.62]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [93.45, 0.0, 0.0, 0.0, 34.35, 0.0, 0.0, 46.19, 34.0, 39.28, 80.82, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 0.0, 99.71, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.83, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 87.01], ["radio", 5.9], ["sidetone", 3.03]], null, null, [["speech", 67.64], ["music", 5.34], ["animal", 1.76]], [["speech", 61.69], ["dog", 4.51], ["animal", 3.51]], [["speech", 55.21], ["telephone", 20.57], ["dial tone", 7.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 15.01], ["livestock, farm animals, working animals", 12.77], ["wild animals", 10.08]], null, null, null, null, null], "duration": [2.43, 1.56, 0.87, -0.04, 5.44, 0.51, 0.33, 5.93, 3.24, 18.86, 2.13, 1.37, -0.25, 0.69, 1.1, 0.69, 4.01, 1.07, 1.71, 8.97, 8.25, 1.73, 0.01, 1.13, 0.42, 0.19, 1.99, -0.24, 4.15, 2.9, 1.98, 0.48, 0.84, 0.56, 0.62, 1.8, 2.39, 0.83, 0.03, 0.53, 0.88, 0.62]} \ No newline at end of file diff --git a/annotations_1/aTxu-zthTgs_filtered.json b/annotations_1/aTxu-zthTgs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d66192ae7bb17ee9176d1a4378df83d6d790b178 --- /dev/null +++ b/annotations_1/aTxu-zthTgs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.95], [16.0, 27.97], [31.0, 42.16], [42.0, 69.25], [71.0, 83.44]], "keep_status": [true, false, true, true, false], "silence_prob": [31.3, 31.48, 32.33, 32.89, 34.45], "audiomae_on_audioset": [[["motorcycle", 14.65], ["vehicle", 11.89], ["fly, housefly", 10.91]], [["music", 40.4], ["throbbing", 20.49], ["hum", 14.15]], [["music", 19.5], ["hum", 18.48], ["vehicle", 12.51]], [["music", 27.25], ["vehicle", 18.3], ["speech", 9.19]], [["music", 79.5], ["speech", 3.93], ["brass instrument", 1.76]]], "duration": [5.95, 11.97, 11.16, 27.25, 12.44]} \ No newline at end of file diff --git a/annotations_1/aU9RYKxkRJk_filtered.json b/annotations_1/aU9RYKxkRJk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b509256f7ff304a3e1eb35a443e833b751645e50 --- /dev/null +++ b/annotations_1/aU9RYKxkRJk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.16], [9.0, 9.49], [11.0, 11.89], [13.0, 13.91], [16.0, 16.83], [19.0, 20.73], [21.0, 21.3], [24.0, 26.35], [30.0, 31.08], [31.0, 33.59], [36.0, 36.68], [38.0, 39.7], [41.0, 42.7], [47.0, 48.17], [50.0, 51.07], [52.0, 52.89], [55.0, 55.27], [57.0, 57.21], [58.0, 58.5], [60.0, 61.79], [65.0, 67.61], [69.0, 69.77], [70.0, 72.17], [73.0, 75.79], [77.0, 78.7], [80.0, 81.38], [83.0, 83.67], [85.0, 85.65], [87.0, 89.02], [92.0, 98.58], [99.0, 101.71], [103.0, 103.1], [107.0, 110.19], [112.0, 112.43], [115.0, 115.06], [117.0, 117.29], [119.0, 119.82], [121.0, 122.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 97.92, 99.31, 0.0, 0.0, 0.0, 0.0, 90.95, 82.97, 81.35, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.49, 0.89, 0.91, 0.83, 1.73, 0.3, 2.35, 1.08, 2.59, 0.68, 1.7, 1.7, 1.17, 1.07, 0.89, 0.27, 0.21, 0.5, 1.79, 2.61, 0.77, 2.17, 2.79, 1.7, 1.38, 0.67, 0.65, 2.02, 6.58, 2.71, 0.1, 3.19, 0.43, 0.06, 0.29, 0.82, 1.17]} \ No newline at end of file diff --git a/annotations_1/aUAVPdrvwoA_filtered.json b/annotations_1/aUAVPdrvwoA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df0908d69943f7c6063c5f62deda72afa8657b74 --- /dev/null +++ b/annotations_1/aUAVPdrvwoA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.18], [7.0, 8.16], [9.0, 9.73], [11.0, 14.07], [14.0, 15.16], [16.0, 18.71], [21.0, 21.59], [25.0, 25.93], [27.0, 27.31], [29.0, 37.4], [40.0, 40.8], [42.0, 43.58], [44.0, 46.16], [47.0, 47.49], [52.0, 53.57], [59.0, 59.46], [62.0, 65.79], [66.0, 66.18], [81.0, 85.9], [90.0, 92.26], [96.0, 97.6], [100.0, 100.74]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.62, 0.0, 40.29, 0.0, 0.0, 0.0, 46.83, 0.0, 0.0, 34.04, 0.0, 0.0, 0.0, 30.98, 0.0, 31.72, 47.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 24.05], ["speech", 19.61], ["hum", 10.24]], null, [["gong", 35.21], ["music", 25.62], ["singing bowl", 11.46]], null, null, null, [["music", 48.22], ["gong", 16.39], ["singing bowl", 11.27]], null, null, [["music", 35.85], ["speech", 21.82], ["whale vocalization", 5.54]], null, null, null, [["music", 25.54], ["mains hum", 23.02], ["hum", 16.88]], null, [["music", 43.06], ["didgeridoo", 9.96], ["buzz", 8.68]], [["animal", 26.42], ["music", 11.48], ["livestock, farm animals, working animals", 5.25]], null, null], "duration": [0.18, 1.16, 0.73, 3.07, 1.16, 2.71, 0.59, 0.93, 0.31, 8.4, 0.8, 1.58, 2.16, 0.49, 1.57, 0.46, 3.79, 0.18, 4.9, 2.26, 1.6, 0.74]} \ No newline at end of file diff --git a/annotations_1/aVHgGXnna94_filtered.json b/annotations_1/aVHgGXnna94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f9b7a1b200628116928bef5708b5c6bfc62408c --- /dev/null +++ b/annotations_1/aVHgGXnna94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.25], [24.0, 24.8], [26.0, 26.6], [31.0, 36.21], [38.0, 38.64], [39.0, 39.63], [40.0, 40.74], [42.0, 46.38], [50.0, 53.42], [56.0, 58.14], [60.0, 61.11], [65.0, 72.39], [73.0, 74.76], [77.0, 89.51], [93.0, 105.93], [112.0, 112.4], [115.0, 130.98], [133.0, 151.16], [152.0, 155.29], [159.0, 159.21], [160.0, 161.35], [162.0, 164.93], [166.0, 167.78], [169.0, 170.23], [171.0, 176.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.16, 0.0, 0.0, 0.0, 73.21, 74.92, 56.63, 0.0, 31.9, 0.0, 31.09, 31.17, 0.0, 31.75, 30.43, 100.0, 0.0, 0.0, 39.78, 0.0, 0.0, 74.44], "audiomae_on_audioset": [null, null, null, [["music", 47.85], ["musical instrument", 15.49], ["synthesizer", 8.54]], null, null, null, null, null, null, null, [["mains hum", 31.07], ["hum", 27.78], ["music", 10.02]], null, [["music", 67.1], ["hum", 6.6], ["throbbing", 4.32]], [["music", 86.88], ["musical instrument", 2.6], ["scary music", 1.57]], null, [["music", 79.9], ["musical instrument", 4.12], ["didgeridoo", 2.76]], [["music", 69.67], ["theremin", 3.21], ["brass instrument", 3.01]], null, null, null, [["speech", 68.82], ["sidetone", 5.06], ["hum", 3.68]], null, null, null], "duration": [0.25, 0.8, 0.6, 5.21, 0.64, 0.63, 0.74, 4.38, 3.42, 2.14, 1.11, 7.39, 1.76, 12.51, 12.93, 0.4, 15.98, 18.16, 3.29, 0.21, 1.35, 2.93, 1.78, 1.23, 5.44]} \ No newline at end of file diff --git a/annotations_1/aW3-E3My-kc_filtered.json b/annotations_1/aW3-E3My-kc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7617753746995143795f422e67960333cdcbcaa --- /dev/null +++ b/annotations_1/aW3-E3My-kc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.68], [28.0, 32.95], [34.0, 34.96], [37.0, 37.05], [38.0, 37.99], [38.0, 38.04], [38.0, 40.22], [45.0, 46.31], [51.0, 51.8], [53.0, 57.94], [59.0, 59.8], [64.0, 82.27], [91.0, 93.23], [97.0, 99.66], [102.0, 104.72], [120.0, 120.11], [123.0, 122.99], [125.0, 126.74], [128.0, 133.79], [141.0, 141.93], [142.0, 142.67], [143.0, 143.13], [152.0, 154.53], [159.0, 161.5], [169.0, 171.32], [177.0, 177.67], [178.0, 177.72], [178.0, 179.39]], "keep_status": [true, true, false, false, false, false, true, false, false, true, false, true, true, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [28.78, 28.88, 0.0, 0.0, 0.0, 0.0, 29.41, 0.0, 0.0, 29.34, 0.0, 28.79, 29.85, 29.53, 29.56, 0.0, 0.0, 0.0, 29.08, 0.0, 0.0, 0.0, 29.29, 28.47, 28.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["creak", 21.97], ["throbbing", 19.36], ["music", 13.03]], [["hum", 25.95], ["throbbing", 25.17], ["music", 11.46]], null, null, null, null, [["music", 24.4], ["speech", 20.83], ["didgeridoo", 3.92]], null, null, [["music", 55.51], ["throbbing", 7.76], ["didgeridoo", 3.47]], null, [["speech", 28.06], ["music", 21.21], ["whack, thwack", 16.31]], [["throbbing", 19.33], ["music", 18.76], ["beatboxing", 7.25]], [["didgeridoo", 71.14], ["music", 14.71], ["musical instrument", 2.34]], [["music", 48.17], ["beatboxing", 17.26], ["didgeridoo", 12.36]], null, null, null, [["speech", 46.1], ["music", 19.35], ["throbbing", 3.51]], null, null, null, [["cattle, bovinae", 21.38], ["music", 9.92], ["throbbing", 9.26]], [["music", 55.03], ["speech", 14.92], ["electronic music", 6.59]], [["speech", 37.66], ["music", 31.67], ["explosion", 5.51]], null, null, null], "duration": [2.68, 4.95, 0.96, 0.05, -0.01, 0.04, 2.22, 1.31, 0.8, 4.94, 0.8, 18.27, 2.23, 2.66, 2.72, 0.11, -0.01, 1.74, 5.79, 0.93, 0.67, 0.13, 2.53, 2.5, 2.32, 0.67, -0.28, 1.39]} \ No newline at end of file diff --git a/annotations_1/aWIcfkvKj9Q_filtered.json b/annotations_1/aWIcfkvKj9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f8fb51ec74fa2ca843ba5022e04a6837b2ea849 --- /dev/null +++ b/annotations_1/aWIcfkvKj9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.23], [5.0, 10.45], [11.0, 12.45], [13.0, 15.01], [16.0, 21.24], [22.0, 22.92], [24.0, 24.39], [25.0, 29.25], [31.0, 33.96], [35.0, 36.44], [37.0, 38.04], [40.0, 41.49], [43.0, 52.2], [53.0, 53.45], [55.0, 55.83], [56.0, 57.03], [60.0, 60.72], [61.0, 63.21], [64.0, 66.85], [68.0, 70.04], [70.0, 78.02], [78.0, 80.74], [82.0, 85.83], [87.0, 87.45], [88.0, 88.4], [89.0, 90.32], [91.0, 100.79], [102.0, 102.17], [110.0, 110.29], [111.0, 114.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.33, 100.0, 0.0, 93.76, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 99.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.23, 5.45, 1.45, 2.01, 5.24, 0.92, 0.39, 4.25, 2.96, 1.44, 1.04, 1.49, 9.2, 0.45, 0.83, 1.03, 0.72, 2.21, 2.85, 2.04, 8.02, 2.74, 3.83, 0.45, 0.4, 1.32, 9.79, 0.17, 0.29, 3.62]} \ No newline at end of file diff --git a/annotations_1/aWjBDI02kSE_filtered.json b/annotations_1/aWjBDI02kSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dda3f6ee0c55b8ce4f3117f6a8babf0d9cfdc2ce --- /dev/null +++ b/annotations_1/aWjBDI02kSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[94.0, 126.5], [129.0, 136.63], [138.0, 163.44], [164.0, 164.51], [169.0, 172.66], [175.0, 174.9], [180.0, 180.6], [188.0, 189.6], [192.0, 192.27]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 29.91, 29.36, 0.0, 34.47, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 35.08], ["throbbing", 22.95], ["hum", 13.93]], [["music", 61.81], ["cacophony", 5.93], ["musical instrument", 2.81]], null, [["thunk", 44.64], ["speech", 16.6], ["music", 7.59]], null, null, null, null], "duration": [32.5, 7.63, 25.44, 0.51, 3.66, -0.1, 0.6, 1.6, 0.27]} \ No newline at end of file diff --git a/annotations_1/aX9m-xzauMw_filtered.json b/annotations_1/aX9m-xzauMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2431dbd2e502cb492cb425e3e9812cbc058a4316 --- /dev/null +++ b/annotations_1/aX9m-xzauMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.51], [7.0, 29.76], [31.0, 33.42], [51.0, 52.29], [61.0, 61.13], [67.0, 67.53], [78.0, 80.55], [88.0, 88.79], [90.0, 91.0], [97.0, 98.2], [99.0, 99.37], [105.0, 105.7], [108.0, 108.36], [109.0, 112.58], [114.0, 114.67]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [31.48, 29.83, 32.56, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.01, 0.0], "audiomae_on_audioset": [[["music", 65.47], ["theremin", 5.26], ["musical instrument", 3.88]], [["music", 46.23], ["speech", 18.14], ["fly, housefly", 4.52]], [["music", 40.33], ["speech", 24.53], ["thunk", 5.69]], null, null, null, null, null, null, null, null, null, null, [["speech", 12.99], ["animal", 10.86], ["fart", 9.73]], null], "duration": [2.51, 22.76, 2.42, 1.29, 0.13, 0.53, 2.55, 0.79, 1.0, 1.2, 0.37, 0.7, 0.36, 3.58, 0.67]} \ No newline at end of file diff --git a/annotations_1/aYSdnLgl-FQ_filtered.json b/annotations_1/aYSdnLgl-FQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57a6841d3d53c1fecafd7a17e2e8a4cb3a0c334c --- /dev/null +++ b/annotations_1/aYSdnLgl-FQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.08], [4.0, 6.47], [8.0, 10.22], [13.0, 13.9], [18.0, 18.98], [26.0, 26.0], [28.0, 31.24], [35.0, 38.6], [39.0, 41.81], [46.0, 47.14], [48.0, 49.92], [52.0, 56.12], [59.0, 59.98], [64.0, 66.28], [68.0, 68.12], [69.0, 79.19], [80.0, 81.68], [87.0, 119.7], [121.0, 123.72], [126.0, 152.19], [155.0, 156.56], [158.0, 159.53], [161.0, 165.65], [166.0, 165.69], [171.0, 171.37], [174.0, 174.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 32.92, 53.34, 0.0, 0.0, 0.0, 80.11, 82.07, 57.97, 0.0, 0.0, 50.26, 0.0, 35.8, 0.0, 29.7, 0.0, 0.0, 32.24, 28.93, 0.0, 0.0, 38.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 39.4], ["music", 25.71], ["musical instrument", 5.48]], null, null, null, null, null, null, null, null, null, null, null, [["music", 12.56], ["guitar", 12.11], ["clang", 10.13]], null, [["thunk", 38.04], ["speech", 33.1], ["whack, thwack", 8.53]], null, null, [["music", 26.94], ["didgeridoo", 7.52], ["throat clearing", 5.98]], [["breaking", 27.99], ["music", 25.3], ["whack, thwack", 15.48]], null, null, [["speech", 40.66], ["music", 23.02], ["sonar", 8.77]], null, null, null], "duration": [0.08, 2.47, 2.22, 0.9, 0.98, 0.0, 3.24, 3.6, 2.81, 1.14, 1.92, 4.12, 0.98, 2.28, 0.12, 10.19, 1.68, 32.7, 2.72, 26.19, 1.56, 1.53, 4.65, -0.31, 0.37, 0.29]} \ No newline at end of file diff --git a/annotations_1/aZJG26fSy94_filtered.json b/annotations_1/aZJG26fSy94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4662b14ff23655d5c000b6b6781ae71a02d3470 --- /dev/null +++ b/annotations_1/aZJG26fSy94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.76], [12.0, 12.9], [17.0, 18.1], [24.0, 23.9], [24.0, 27.9], [28.0, 32.39], [38.0, 37.86], [61.0, 66.51], [87.0, 92.23], [104.0, 104.19], [109.0, 114.76]], "keep_status": [false, false, false, false, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.73, 38.03, 0.0, 30.42, 31.45, 0.0, 32.91], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 26.27], ["livestock, farm animals, working animals", 20.47], ["moo", 14.31]], [["drip", 9.13], ["whale vocalization", 8.05], ["music", 8.03]], null, [["rumble", 18.34], ["explosion", 10.26], ["speech", 7.66]], [["music", 22.71], ["hum", 8.77], ["explosion", 7.72]], null, [["sheep", 66.97], ["bleat", 11.9], ["animal", 5.96]]], "duration": [1.76, 0.9, 1.1, -0.1, 3.9, 4.39, -0.14, 5.51, 5.23, 0.19, 5.76]} \ No newline at end of file diff --git a/annotations_1/aZbGlkGWiZc_filtered.json b/annotations_1/aZbGlkGWiZc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cbe64509533afc70f775ce89ac66e9ce08bbd6b --- /dev/null +++ b/annotations_1/aZbGlkGWiZc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.68], [7.0, 7.84], [9.0, 9.29], [17.0, 18.27], [19.0, 21.05], [21.0, 32.85], [34.0, 35.14], [36.0, 36.22], [37.0, 40.41], [42.0, 44.36], [47.0, 69.92], [72.0, 101.88], [104.0, 104.92], [109.0, 110.52], [113.0, 123.84]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.47, 29.59, 0.0, 0.0, 44.69, 38.83, 29.77, 29.38, 0.0, 0.0, 32.15], "audiomae_on_audioset": [null, null, null, null, [["music", 39.73], ["speech", 12.02], ["house music", 7.49]], [["music", 44.43], ["throbbing", 13.38], ["hum", 6.68]], null, null, [["music", 82.6], ["synthesizer", 3.57], ["musical instrument", 1.76]], [["music", 80.08], ["synthesizer", 7.28], ["musical instrument", 5.65]], [["music", 70.45], ["house music", 6.22], ["electronic dance music", 5.63]], [["music", 40.48], ["speech", 7.79], ["electronic music", 6.53]], null, null, [["sidetone", 31.79], ["music", 25.18], ["speech", 9.28]]], "duration": [0.68, 0.84, 0.29, 1.27, 2.05, 11.85, 1.14, 0.22, 3.41, 2.36, 22.92, 29.88, 0.92, 1.52, 10.84]} \ No newline at end of file diff --git a/annotations_1/a_9dO9k2TPQ_filtered.json b/annotations_1/a_9dO9k2TPQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/a_9dO9k2TPQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/a_DO8nd7FeA_filtered.json b/annotations_1/a_DO8nd7FeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2967988ee3ba931d891ece6a83a5e310248072db --- /dev/null +++ b/annotations_1/a_DO8nd7FeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 38.31], [45.0, 51.36], [53.0, 54.46], [56.0, 66.99], [68.0, 73.52], [78.0, 93.61], [96.0, 102.39], [108.0, 110.74], [112.0, 123.45], [124.0, 124.44]], "keep_status": [false, true, false, true, true, false, false, false, true, false], "silence_prob": [0.0, 35.71, 0.0, 32.69, 33.53, 38.84, 58.64, 86.45, 45.82, 0.0], "audiomae_on_audioset": [null, [["music", 26.47], ["throbbing", 21.53], ["speech", 16.53]], null, [["speech", 29.1], ["music", 25.92], ["foghorn", 6.71]], [["music", 45.01], ["speech", 21.14], ["hum", 3.83]], [["livestock, farm animals, working animals", 62.77], ["cattle, bovinae", 20.18], ["moo", 16.42]], null, null, [["electric shaver, electric razor", 23.74], ["buzz", 17.1], ["hum", 8.32]], null], "duration": [36.31, 6.36, 1.46, 10.99, 5.52, 15.61, 6.39, 2.74, 11.45, 0.44]} \ No newline at end of file diff --git a/annotations_1/a_DkEkfAO4s_filtered.json b/annotations_1/a_DkEkfAO4s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67b2bdc3e9ab36cd6a834c247340a4a2bd4cbf16 --- /dev/null +++ b/annotations_1/a_DkEkfAO4s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 19.52], [23.0, 24.02], [25.0, 25.71], [28.0, 27.82], [29.0, 30.03], [31.0, 31.19], [32.0, 39.95], [42.0, 48.47], [55.0, 56.86], [59.0, 59.05], [64.0, 66.09], [75.0, 80.06], [86.0, 86.97], [89.0, 89.85], [94.0, 94.63], [98.0, 104.26], [108.0, 109.29], [123.0, 122.91], [127.0, 127.9], [134.0, 134.28], [136.0, 138.48], [145.0, 145.05], [152.0, 151.73], [159.0, 159.53], [161.0, 162.11], [174.0, 174.02], [176.0, 175.69], [178.0, 180.0], [186.0, 187.68], [199.0, 198.75], [199.0, 201.07], [206.0, 206.46], [213.0, 213.7], [227.0, 228.01], [233.0, 233.58]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.44, 0.0, 0.0, 0.0, 0.0, 0.0, 29.99, 35.01, 0.0, 0.0, 62.17, 31.54, 0.0, 0.0, 0.0, 52.27, 0.0, 0.0, 0.0, 0.0, 35.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 32.83], ["smash, crash", 28.59], ["breaking", 21.74]], null, null, null, null, null, [["sidetone", 23.93], ["buzz", 16.45], ["hum", 8.65]], [["explosion", 18.79], ["speech", 16.59], ["hum", 8.63]], null, null, null, [["music", 19.4], ["roar", 13.37], ["animal", 5.28]], null, null, null, null, null, null, null, null, [["moo", 27.98], ["cattle, bovinae", 25.55], ["livestock, farm animals, working animals", 24.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.52, 1.02, 0.71, -0.18, 1.03, 0.19, 7.95, 6.47, 1.86, 0.05, 2.09, 5.06, 0.97, 0.85, 0.63, 6.26, 1.29, -0.09, 0.9, 0.28, 2.48, 0.05, -0.27, 0.53, 1.11, 0.02, -0.31, 2.0, 1.68, -0.25, 2.07, 0.46, 0.7, 1.01, 0.58]} \ No newline at end of file diff --git a/annotations_1/a_VIjZa76jI_filtered.json b/annotations_1/a_VIjZa76jI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78330095a29ba96be26b1d8db5c6db96de3533bd --- /dev/null +++ b/annotations_1/a_VIjZa76jI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 31.31], [36.0, 36.9], [41.0, 41.67], [46.0, 46.53], [48.0, 53.77], [56.0, 56.66], [57.0, 71.07], [72.0, 73.82]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.33, 0.0, 30.39, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 43.03], ["speech", 24.2], ["crowd", 5.67]], null, [["music", 35.71], ["speech", 27.93], ["throbbing", 5.01]], null], "duration": [0.31, 0.9, 0.67, 0.53, 5.77, 0.66, 14.07, 1.82]} \ No newline at end of file diff --git a/annotations_1/a_hsjTExzbw_filtered.json b/annotations_1/a_hsjTExzbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a15b41f6fcc7cb88fc7f5e4f98f43f680b2253b --- /dev/null +++ b/annotations_1/a_hsjTExzbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.53], [26.0, 26.65], [32.0, 32.64], [36.0, 35.92], [38.0, 47.49], [51.0, 51.17], [61.0, 65.13], [67.0, 86.7], [90.0, 117.85]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.85, 0.0, 33.84, 31.26, 30.51], "audiomae_on_audioset": [null, null, null, null, [["music", 53.29], ["hum", 8.59], ["mains hum", 5.07]], null, [["music", 49.46], ["hum", 22.76], ["throbbing", 16.54]], [["music", 60.21], ["speech", 6.51], ["hum", 3.76]], [["music", 72.24], ["speech", 3.8], ["electronic music", 1.9]]], "duration": [0.53, 0.65, 0.64, -0.08, 9.49, 0.17, 4.13, 19.7, 27.85]} \ No newline at end of file diff --git a/annotations_1/a_iEYXLXbjY_filtered.json b/annotations_1/a_iEYXLXbjY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e564551477ea60276bbdc4654c3ec0a17450112f --- /dev/null +++ b/annotations_1/a_iEYXLXbjY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.32], [4.0, 4.9], [10.0, 12.45], [16.0, 16.23], [19.0, 19.72], [20.0, 20.87], [22.0, 22.71], [23.0, 24.9], [27.0, 27.5], [30.0, 30.84], [36.0, 38.35], [40.0, 50.57], [52.0, 53.23], [54.0, 56.88], [61.0, 61.94], [73.0, 79.29], [81.0, 86.9], [88.0, 88.26], [93.0, 93.93], [94.0, 96.63], [100.0, 101.21], [102.0, 103.94], [107.0, 134.45], [136.0, 136.95], [145.0, 146.06], [147.0, 147.29], [150.0, 150.48], [154.0, 154.28]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.4, 31.65, 0.0, 56.03, 0.0, 99.99, 46.33, 0.0, 0.0, 44.26, 0.0, 0.0, 30.36, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["moo", 29.82], ["cattle, bovinae", 18.95], ["livestock, farm animals, working animals", 5.51]], null, null, null, null, null, null, null, [["music", 10.19], ["moo", 6.83], ["speech", 6.06]], [["whack, thwack", 35.76], ["speech", 21.1], ["fly, housefly", 6.6]], null, null, null, null, [["music", 54.21], ["thunk", 16.41], ["hum", 2.83]], null, null, [["speech", 28.19], ["music", 19.66], ["gong", 12.71]], null, null, [["music", 79.43], ["psychedelic rock", 3.76], ["punk rock", 1.9]], null, null, null, null, null], "duration": [0.32, 0.9, 2.45, 0.23, 0.72, 0.87, 0.71, 1.9, 0.5, 0.84, 2.35, 10.57, 1.23, 2.88, 0.94, 6.29, 5.9, 0.26, 0.93, 2.63, 1.21, 1.94, 27.45, 0.95, 1.06, 0.29, 0.48, 0.28]} \ No newline at end of file diff --git a/annotations_1/aa0NlkF7Rug_filtered.json b/annotations_1/aa0NlkF7Rug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97eae174bd75a070cf43fbdf7bdc903afcfa09e6 --- /dev/null +++ b/annotations_1/aa0NlkF7Rug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.94], [1.0, 1.07], [1.0, 17.71], [20.0, 28.93], [29.0, 29.94], [30.0, 50.06], [54.0, 66.82], [68.0, 92.4], [96.0, 98.47]], "keep_status": [false, false, true, true, false, true, true, true, true], "silence_prob": [0.0, 0.0, 35.41, 33.53, 0.0, 30.0, 29.58, 30.73, 29.67], "audiomae_on_audioset": [null, null, [["electric shaver, electric razor", 35.41], ["noise", 13.26], ["speech", 9.92]], [["livestock, farm animals, working animals", 22.35], ["whale vocalization", 13.21], ["cattle, bovinae", 11.57]], null, [["music", 17.58], ["speech", 16.68], ["didgeridoo", 14.11]], [["speech", 40.88], ["knock", 10.72], ["music", 10.49]], [["speech", 46.44], ["music", 9.06], ["animal", 7.33]], [["fly, housefly", 30.73], ["insect", 17.58], ["bee, wasp, etc.", 11.53]]], "duration": [-0.06, 0.07, 16.71, 8.93, 0.94, 20.06, 12.82, 24.4, 2.47]} \ No newline at end of file diff --git a/annotations_1/aak6BqNR150_filtered.json b/annotations_1/aak6BqNR150_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc8fd7791554715f004b570d7ca72a475b6fe3b --- /dev/null +++ b/annotations_1/aak6BqNR150_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.66], [18.0, 18.49], [19.0, 20.68], [22.0, 22.81], [31.0, 32.71], [44.0, 44.69], [47.0, 48.66], [52.0, 52.56], [62.0, 62.77], [72.0, 72.49], [82.0, 86.1], [93.0, 94.34], [100.0, 117.59], [126.0, 126.2], [135.0, 140.73], [141.0, 141.13], [153.0, 153.96], [163.0, 163.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.99, 0.0, 31.53, 0.0, 30.55, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["thunk", 41.42], ["music", 26.83], ["fly, housefly", 4.54]], null, [["music", 65.1], ["synthesizer", 7.41], ["musical instrument", 4.9]], null, [["moo", 26.67], ["cattle, bovinae", 21.96], ["groan", 9.72]], null, null, null], "duration": [1.66, 0.49, 1.68, 0.81, 1.71, 0.69, 1.66, 0.56, 0.77, 0.49, 4.1, 1.34, 17.59, 0.2, 5.73, 0.13, 0.96, 0.36]} \ No newline at end of file diff --git a/annotations_1/aazXc06Oycs_filtered.json b/annotations_1/aazXc06Oycs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c698cac7e4df8e2582eebb8f9564b342afcb1b35 --- /dev/null +++ b/annotations_1/aazXc06Oycs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.08], [3.0, 5.59], [24.0, 24.85], [34.0, 33.57], [42.0, 43.28], [46.0, 47.58], [49.0, 50.18], [60.0, 62.18], [74.0, 76.96], [78.0, 79.68], [83.0, 83.49], [102.0, 105.07], [107.0, 108.41], [122.0, 122.77], [123.0, 123.72], [128.0, 128.44], [132.0, 133.74], [135.0, 143.26], [149.0, 151.38], [153.0, 152.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.33, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 93.29, 0.0, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 96.89, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.08, 2.59, 0.85, -0.43, 1.28, 1.58, 1.18, 2.18, 2.96, 1.68, 0.49, 3.07, 1.41, 0.77, 0.72, 0.44, 1.74, 8.26, 2.38, -0.05]} \ No newline at end of file diff --git a/annotations_1/ab4MM9cHidM_filtered.json b/annotations_1/ab4MM9cHidM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e202f25e1c77b71d6aebbe355ad3d812634f8d4d --- /dev/null +++ b/annotations_1/ab4MM9cHidM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.07], [3.0, 3.59], [4.0, 7.64], [10.0, 11.55], [13.0, 14.72], [15.0, 16.65], [18.0, 25.61], [30.0, 32.95], [34.0, 38.15], [38.0, 38.72], [39.0, 38.96], [39.0, 39.31], [44.0, 43.85], [47.0, 47.83], [51.0, 51.58], [53.0, 54.57], [66.0, 68.12], [70.0, 71.1], [75.0, 75.09], [79.0, 81.57], [85.0, 86.31], [87.0, 88.6], [89.0, 90.85], [94.0, 97.19], [100.0, 128.97], [131.0, 133.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.05, 0.0, 0.0, 0.0, 67.63, 60.05, 33.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.51, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 74.76, 79.41, 64.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 58.08], ["sidetone", 16.77], ["radio", 11.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.07, 0.59, 3.64, 1.55, 1.72, 1.65, 7.61, 2.95, 4.15, 0.72, -0.04, 0.31, -0.15, 0.83, 0.58, 1.57, 2.12, 1.1, 0.09, 2.57, 1.31, 1.6, 1.85, 3.19, 28.97, 2.64]} \ No newline at end of file diff --git a/annotations_1/abTZPgqiEto_filtered.json b/annotations_1/abTZPgqiEto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1206f041d85bf9eee083a7744cff8126d021defe --- /dev/null +++ b/annotations_1/abTZPgqiEto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[85.0, 133.25]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [48.25]} \ No newline at end of file diff --git a/annotations_1/abXL2HrEjyE_filtered.json b/annotations_1/abXL2HrEjyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..601c4cc270155fdb30db78da6fd9359ae33889a5 --- /dev/null +++ b/annotations_1/abXL2HrEjyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.73], [23.0, 23.26], [25.0, 51.26], [53.0, 74.95], [79.0, 126.45]], "keep_status": [false, false, true, true, false], "silence_prob": [0.0, 0.0, 34.75, 29.95, 0.0], "audiomae_on_audioset": [null, null, [["hum", 13.45], ["eruption", 8.12], ["animal", 7.03]], [["animal", 37.85], ["horse", 6.6], ["music", 5.31]], null], "duration": [1.73, 0.26, 26.26, 21.95, 47.45]} \ No newline at end of file diff --git a/annotations_1/abgTPYfdbOE_filtered.json b/annotations_1/abgTPYfdbOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec048553218ca79e829b6168ef6d4e2b814b7a96 --- /dev/null +++ b/annotations_1/abgTPYfdbOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.7], [13.0, 21.47], [24.0, 25.78], [26.0, 28.61], [30.0, 30.52], [33.0, 34.01], [37.0, 37.57], [38.0, 39.61], [40.0, 45.05], [55.0, 55.7], [59.0, 59.7], [61.0, 64.18], [66.0, 67.66], [69.0, 70.17], [71.0, 72.42], [74.0, 76.0], [77.0, 91.32], [95.0, 99.86], [100.0, 111.87], [112.0, 113.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 99.21, 0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.7, 8.47, 1.78, 2.61, 0.52, 1.01, 0.57, 1.61, 5.05, 0.7, 0.7, 3.18, 1.66, 1.17, 1.42, 2.0, 14.32, 4.86, 11.87, 1.83]} \ No newline at end of file diff --git a/annotations_1/acZDS8WDtHs_filtered.json b/annotations_1/acZDS8WDtHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb22d128a04ee709f1c265f76b0d6c213ba95584 --- /dev/null +++ b/annotations_1/acZDS8WDtHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[68.0, 68.28], [72.0, 81.31], [83.0, 86.95], [88.0, 88.57], [89.0, 92.3], [94.0, 99.17], [101.0, 107.13], [109.0, 117.95], [118.0, 118.08]], "keep_status": [false, true, false, false, true, true, true, true, false], "silence_prob": [0.0, 40.31, 38.9, 0.0, 34.66, 29.37, 29.65, 29.3, 0.0], "audiomae_on_audioset": [null, [["hum", 22.44], ["speech", 19.08], ["mains hum", 8.79]], [["hum", 51.65], ["mains hum", 9.63], ["throbbing", 8.91]], null, [["speech", 32.87], ["mains hum", 11.21], ["music", 10.81]], [["music", 44.68], ["speech", 9.43], ["musical instrument", 3.51]], [["music", 25.83], ["frog", 10.92], ["electric shaver, electric razor", 5.93]], [["music", 37.94], ["speech", 9.15], ["groan", 7.94]], null], "duration": [0.28, 9.31, 3.95, 0.57, 3.3, 5.17, 6.13, 8.95, 0.08]} \ No newline at end of file diff --git a/annotations_1/adatkf9XY44_filtered.json b/annotations_1/adatkf9XY44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80680f9213b3e76199bdeab8c65f33e3b6e74776 --- /dev/null +++ b/annotations_1/adatkf9XY44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.47], [9.0, 10.94], [24.0, 24.92], [27.0, 26.62], [27.0, 28.19], [35.0, 36.0], [39.0, 40.54], [44.0, 44.15], [48.0, 58.31], [59.0, 61.05], [62.0, 67.93], [69.0, 95.27], [102.0, 107.67], [108.0, 110.13], [112.0, 113.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 99.93, 52.68, 28.83, 35.78, 39.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.42], ["whack, thwack", 12.98], ["artillery fire", 11.29]], [["fly, housefly", 67.84], ["insect", 10.35], ["mosquito", 5.99]], [["speech", 37.39], ["sidetone", 26.62], ["telephone", 15.76]], null], "duration": [0.47, 1.94, 0.92, -0.38, 1.19, 1.0, 1.54, 0.15, 10.31, 2.05, 5.93, 26.27, 5.67, 2.13, 1.86]} \ No newline at end of file diff --git a/annotations_1/adjuOPzkpw4_filtered.json b/annotations_1/adjuOPzkpw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92b71aa54383e1c0193c78c6661b17774be76e1d --- /dev/null +++ b/annotations_1/adjuOPzkpw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.55], [28.0, 29.67], [30.0, 31.43], [34.0, 34.2], [37.0, 40.74], [42.0, 43.95], [45.0, 66.39], [72.0, 78.04], [87.0, 89.23], [91.0, 92.18], [95.0, 96.5], [106.0, 108.46], [110.0, 111.47], [113.0, 114.37], [123.0, 123.7], [127.0, 128.46], [132.0, 134.0], [135.0, 139.72], [145.0, 151.38], [152.0, 152.61], [153.0, 159.07], [173.0, 174.34], [176.0, 177.55], [181.0, 182.51], [188.0, 191.62]], "keep_status": [false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.91, 0.0, 32.85, 34.67, 40.47, 0.0, 0.0, 34.57, 0.0, 0.0, 0.0, 0.0, 36.01, 41.85, 38.56, 0.0, 37.01, 0.0, 0.0, 0.0, 95.51], "audiomae_on_audioset": [null, null, null, null, [["music", 38.16], ["hum", 13.07], ["throbbing", 8.35]], null, [["speech", 28.36], ["music", 23.21], ["hum", 8.74]], [["music", 48.8], ["moo", 10.86], ["cattle, bovinae", 10.4]], [["music", 37.83], ["throbbing", 11.93], ["hum", 10.73]], null, null, [["music", 69.85], ["speech", 5.88], ["boom", 1.73]], null, null, null, null, [["explosion", 19.77], ["hum", 13.79], ["eruption", 10.46]], [["speech", 67.22], ["rowboat, canoe, kayak", 8.0], ["boat, water vehicle", 4.42]], [["speech", 48.49], ["vehicle", 5.1], ["hum", 5.02]], null, [["speech", 30.34], ["animal", 5.76], ["honk", 4.74]], null, null, null, null], "duration": [1.55, 1.67, 1.43, 0.2, 3.74, 1.95, 21.39, 6.04, 2.23, 1.18, 1.5, 2.46, 1.47, 1.37, 0.7, 1.46, 2.0, 4.72, 6.38, 0.61, 6.07, 1.34, 1.55, 1.51, 3.62]} \ No newline at end of file diff --git a/annotations_1/adxwpSdHj90_filtered.json b/annotations_1/adxwpSdHj90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..810ae234695a3217947e88507e4c86c434bbb0ac --- /dev/null +++ b/annotations_1/adxwpSdHj90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.97], [4.0, 4.6], [6.0, 6.74], [12.0, 13.47], [14.0, 17.09], [20.0, 20.7], [30.0, 31.09], [38.0, 38.04], [43.0, 42.97], [44.0, 44.15], [45.0, 46.53], [52.0, 53.15], [55.0, 56.46], [57.0, 61.37], [63.0, 62.94], [78.0, 80.23], [86.0, 88.59], [89.0, 89.19], [90.0, 90.81], [94.0, 94.58], [95.0, 99.76], [115.0, 114.59], [133.0, 134.03], [139.0, 139.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.48, 0.0, 72.6, 36.69, 0.0, 0.0, 0.0, 31.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.41], ["neigh, whinny", 26.89], ["horse", 9.34]], null, null, null, [["speech", 89.93], ["music", 2.74], ["synthesizer", 0.72]], null, null, null], "duration": [0.97, 0.6, 0.74, 1.47, 3.09, 0.7, 1.09, 0.04, -0.03, 0.15, 1.53, 1.15, 1.46, 4.37, -0.06, 2.23, 2.59, 0.19, 0.81, 0.58, 4.76, -0.41, 1.03, 0.5]} \ No newline at end of file diff --git a/annotations_1/aecYY1vUiDU_filtered.json b/annotations_1/aecYY1vUiDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1301bd2b39dbebfbfcf91fd212c4728c14903b1d --- /dev/null +++ b/annotations_1/aecYY1vUiDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [6.0, 10.15], [18.0, 18.5], [47.0, 48.83], [57.0, 57.28], [66.0, 67.39], [68.0, 68.27], [86.0, 87.56], [88.0, 95.25], [103.0, 104.01], [115.0, 115.23], [133.0, 132.9], [136.0, 136.66], [149.0, 150.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 58.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.15, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 4.15, 0.5, 1.83, 0.28, 1.39, 0.27, 1.56, 7.25, 1.01, 0.23, -0.1, 0.66, 1.92]} \ No newline at end of file diff --git a/annotations_1/af1gSplQfPU_filtered.json b/annotations_1/af1gSplQfPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eff0eb76fd4d3dc214ffd6222250191bad78eab0 --- /dev/null +++ b/annotations_1/af1gSplQfPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 32.97], [36.0, 40.04], [43.0, 55.09], [57.0, 63.1], [64.0, 73.4], [75.0, 78.48], [79.0, 79.34], [81.0, 83.98], [86.0, 89.31], [90.0, 90.46], [91.0, 91.71], [93.0, 92.85]], "keep_status": [false, true, true, false, true, false, false, true, false, false, false, false], "silence_prob": [29.57, 29.05, 29.12, 29.44, 30.71, 42.84, 0.0, 31.04, 52.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 71.15], ["boing", 7.66], ["burst, pop", 1.58]], [["music", 55.11], ["boing", 6.13], ["speech", 3.37]], [["groan", 34.9], ["music", 18.99], ["cattle, bovinae", 5.12]], [["music", 44.84], ["boing", 22.49], ["speech", 3.55]], [["throbbing", 20.69], ["music", 8.72], ["hum", 8.26]], [["speech", 67.16], ["sidetone", 7.05], ["radio", 4.27]], null, [["speech", 27.48], ["animal", 16.57], ["cattle, bovinae", 12.1]], null, null, null, null], "duration": [10.97, 4.04, 12.09, 6.1, 9.4, 3.48, 0.34, 2.98, 3.31, 0.46, 0.71, -0.15]} \ No newline at end of file diff --git a/annotations_1/afBwkWnwlD0_filtered.json b/annotations_1/afBwkWnwlD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55ee9d1106b088fb247b5929ec01de30ebd133aa --- /dev/null +++ b/annotations_1/afBwkWnwlD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.29], [7.0, 8.06], [10.0, 10.61], [12.0, 12.82], [14.0, 15.01], [18.0, 17.9], [19.0, 20.82], [23.0, 24.95], [27.0, 28.0], [29.0, 30.91], [35.0, 35.58], [36.0, 37.4], [40.0, 40.54], [45.0, 46.16], [47.0, 48.64], [53.0, 53.97], [58.0, 58.04], [60.0, 60.88], [62.0, 62.97], [66.0, 65.91], [68.0, 68.54], [71.0, 73.97], [76.0, 77.82], [80.0, 81.45], [83.0, 84.21], [90.0, 91.91], [96.0, 97.31], [102.0, 108.92], [110.0, 111.57], [113.0, 113.73], [115.0, 115.67], [116.0, 117.9], [121.0, 124.29], [126.0, 128.26], [132.0, 135.23], [138.0, 139.56], [140.0, 141.35], [142.0, 143.43], [146.0, 146.82], [153.0, 154.55], [156.0, 156.3], [162.0, 165.62], [166.0, 168.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 70.86, 63.64, 58.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 45.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 66.68], ["music", 8.9], ["singing bowl", 3.17]]], "duration": [0.29, 1.06, 0.61, 0.82, 1.01, -0.1, 1.82, 1.95, 1.0, 1.91, 0.58, 1.4, 0.54, 1.16, 1.64, 0.97, 0.04, 0.88, 0.97, -0.09, 0.54, 2.97, 1.82, 1.45, 1.21, 1.91, 1.31, 6.92, 1.57, 0.73, 0.67, 1.9, 3.29, 2.26, 3.23, 1.56, 1.35, 1.43, 0.82, 1.55, 0.3, 3.62, 2.32]} \ No newline at end of file diff --git a/annotations_1/ag2wbvh5VDs_filtered.json b/annotations_1/ag2wbvh5VDs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6dac6caedc300ff9814d4db7102c419c48af821 --- /dev/null +++ b/annotations_1/ag2wbvh5VDs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.12], [6.0, 9.21], [11.0, 28.29], [35.0, 66.16], [72.0, 72.01], [77.0, 90.07], [91.0, 104.14], [105.0, 106.12], [110.0, 115.03], [116.0, 119.65], [121.0, 122.17], [132.0, 132.26], [139.0, 139.5]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.56, 35.34, 30.66, 0.0, 0.0, 29.03, 28.48, 0.0, 36.7, 38.11, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.2], ["whale vocalization", 11.01], ["theremin", 7.37]], [["music", 52.49], ["musical instrument", 5.59], ["throbbing", 4.16]], [["music", 42.82], ["synthesizer", 13.48], ["cacophony", 6.42]], null, null, [["music", 73.12], ["hum", 7.95], ["throbbing", 3.79]], [["music", 51.98], ["speech", 14.78], ["throbbing", 7.59]], null, [["music", 51.07], ["hum", 15.12], ["throbbing", 12.77]], [["music", 67.45], ["throbbing", 4.42], ["electronic music", 4.38]], null, null, null], "duration": [3.12, 3.21, 17.29, 31.16, 0.01, 13.07, 13.14, 1.12, 5.03, 3.65, 1.17, 0.26, 0.5]} \ No newline at end of file diff --git a/annotations_1/agrpQQWiX48_filtered.json b/annotations_1/agrpQQWiX48_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47aa3fed46c9498f368c92502ac933f08859087b --- /dev/null +++ b/annotations_1/agrpQQWiX48_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.34], [10.0, 10.27], [19.0, 23.99], [24.0, 47.85], [48.0, 48.36], [49.0, 54.58], [56.0, 59.85], [62.0, 65.7], [66.0, 68.23], [71.0, 71.78], [73.0, 73.84], [79.0, 80.11], [82.0, 82.19], [83.0, 89.36], [91.0, 93.33], [97.0, 97.7], [101.0, 101.58], [122.0, 121.96], [123.0, 124.5], [129.0, 129.74], [131.0, 130.72], [135.0, 135.63], [141.0, 140.58], [144.0, 144.66], [151.0, 152.09], [153.0, 160.78], [164.0, 165.99], [167.0, 168.69], [169.0, 169.87]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 73.97, 80.11, 0.0, 48.23, 69.47, 89.72, 99.76, 0.0, 0.0, 0.0, 0.0, 84.8, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 58.68], ["theremin", 3.36], ["musical instrument", 3.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.47], ["speech", 12.24], ["fart", 11.49]], null, null, null], "duration": [1.34, 0.27, 4.99, 23.85, 0.36, 5.58, 3.85, 3.7, 2.23, 0.78, 0.84, 1.11, 0.19, 6.36, 2.33, 0.7, 0.58, -0.04, 1.5, 0.74, -0.28, 0.63, -0.42, 0.66, 1.09, 7.78, 1.99, 1.69, 0.87]} \ No newline at end of file diff --git a/annotations_1/ahCOQjOPTZw_filtered.json b/annotations_1/ahCOQjOPTZw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8b6eb25e002efa1281cd62a701c8833ac2618100 --- /dev/null +++ b/annotations_1/ahCOQjOPTZw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.0], [5.0, 6.29], [7.0, 9.36], [10.0, 32.02], [35.0, 46.79], [48.0, 54.08], [55.0, 69.94], [71.0, 74.48], [75.0, 85.89], [87.0, 138.48], [141.0, 142.13], [143.0, 151.46], [152.0, 152.85], [153.0, 153.93], [155.0, 163.49], [166.0, 170.95]], "keep_status": [false, false, false, false, false, true, true, true, true, false, false, false, false, false, true, true], "silence_prob": [64.97, 0.0, 79.59, 30.23, 30.49, 29.91, 28.58, 36.48, 34.19, 0.0, 0.0, 34.14, 0.0, 0.0, 34.85, 37.19], "audiomae_on_audioset": [null, null, null, [["didgeridoo", 42.19], ["music", 31.17], ["speech", 4.04]], [["music", 53.75], ["speech", 28.93], ["electronic music", 3.39]], [["music", 34.44], ["didgeridoo", 24.76], ["hum", 5.79]], [["music", 33.95], ["throbbing", 14.01], ["hum", 13.72]], [["music", 47.84], ["theremin", 6.98], ["whack, thwack", 5.36]], [["music", 26.75], ["speech", 13.86], ["dog", 5.0]], null, null, [["music", 50.55], ["didgeridoo", 19.02], ["musical instrument", 7.41]], null, null, [["music", 36.96], ["didgeridoo", 10.51], ["singing bowl", 9.74]], [["music", 49.94], ["synthesizer", 9.18], ["hum", 6.12]]], "duration": [2.0, 1.29, 2.36, 22.02, 11.79, 6.08, 14.94, 3.48, 10.89, 51.48, 1.13, 8.46, 0.85, 0.93, 8.49, 4.95]} \ No newline at end of file diff --git a/annotations_1/ahCg__rBh1Q_filtered.json b/annotations_1/ahCg__rBh1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..867f971b73b147a15be19548658410d749c485b9 --- /dev/null +++ b/annotations_1/ahCg__rBh1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 27.04], [29.0, 40.39], [43.0, 66.63], [70.0, 83.98], [88.0, 88.48], [93.0, 93.88], [97.0, 98.0], [100.0, 105.34], [108.0, 155.01], [156.0, 156.0]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [30.48, 30.44, 29.87, 36.02, 0.0, 0.0, 0.0, 31.6, 0.0, 0.0], "audiomae_on_audioset": [[["music", 74.07], ["didgeridoo", 2.83], ["musical instrument", 2.72]], [["music", 39.39], ["throbbing", 24.17], ["hum", 8.94]], [["music", 63.28], ["speech", 5.86], ["throbbing", 4.64]], [["hum", 46.5], ["music", 18.04], ["mains hum", 17.01]], null, null, null, [["music", 31.04], ["throbbing", 16.76], ["speech", 15.52]], null, null], "duration": [18.04, 11.39, 23.63, 13.98, 0.48, 0.88, 1.0, 5.34, 47.01, 0.0]} \ No newline at end of file diff --git a/annotations_1/ah_Egywb780_filtered.json b/annotations_1/ah_Egywb780_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..500b2109aeb4aef41779e029e03f2264aca09883 --- /dev/null +++ b/annotations_1/ah_Egywb780_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 22.32], [25.0, 30.28], [31.0, 57.35], [58.0, 60.27], [66.0, 68.37], [69.0, 72.57], [74.0, 75.71], [77.0, 78.33], [79.0, 80.45], [82.0, 88.06], [89.0, 96.55], [100.0, 101.61], [103.0, 105.17], [106.0, 108.46], [110.0, 112.92], [114.0, 121.24], [122.0, 127.23], [128.0, 130.22], [131.0, 134.11], [137.0, 139.89], [141.0, 146.13], [147.0, 147.97], [150.0, 161.35], [162.0, 164.1], [166.0, 166.36], [167.0, 168.84], [171.0, 173.37], [175.0, 177.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [71.29, 99.36, 61.37, 99.94, 99.87, 92.15, 0.0, 0.0, 0.0, 98.44, 99.87, 0.0, 99.94, 99.98, 95.51, 93.91, 99.56, 100.0, 90.95, 96.66, 98.36, 0.0, 87.0, 92.48, 0.0, 0.0, 55.74, 95.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.32, 5.28, 26.35, 2.27, 2.37, 3.57, 1.71, 1.33, 1.45, 6.06, 7.55, 1.61, 2.17, 2.46, 2.92, 7.24, 5.23, 2.22, 3.11, 2.89, 5.13, 0.97, 11.35, 2.1, 0.36, 1.84, 2.37, 2.38]} \ No newline at end of file diff --git a/annotations_1/ahxDiseuAak_filtered.json b/annotations_1/ahxDiseuAak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ec49e992384edd844a95b7a2fffdc0632dcc10a --- /dev/null +++ b/annotations_1/ahxDiseuAak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.25], [48.0, 49.55], [91.0, 103.06], [104.0, 105.38], [107.0, 112.77]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 59.68, 0.0, 69.34], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.25, 1.55, 12.06, 1.38, 5.77]} \ No newline at end of file diff --git a/annotations_1/aiJtAU0V_60_filtered.json b/annotations_1/aiJtAU0V_60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1cfd10e6b60a9394d09a9a313e7c6d1e3f0036f --- /dev/null +++ b/annotations_1/aiJtAU0V_60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.46], [9.0, 12.88], [16.0, 17.71], [19.0, 19.72], [22.0, 23.5], [32.0, 32.49], [36.0, 37.29], [40.0, 41.64], [43.0, 44.52], [52.0, 53.94], [67.0, 68.42], [77.0, 80.08], [82.0, 93.78], [95.0, 96.45], [104.0, 105.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.46, 3.88, 1.71, 0.72, 1.5, 0.49, 1.29, 1.64, 1.52, 1.94, 1.42, 3.08, 11.78, 1.45, 1.76]} \ No newline at end of file diff --git a/annotations_1/aiiJ0fBFjCQ_filtered.json b/annotations_1/aiiJ0fBFjCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b28fbfc8e4ab238c3fe980678ae8b4f69ffe934d --- /dev/null +++ b/annotations_1/aiiJ0fBFjCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.75], [3.0, 3.23], [7.0, 12.82], [15.0, 17.58], [18.0, 18.76], [22.0, 31.95], [34.0, 45.17], [46.0, 50.03], [51.0, 52.54], [54.0, 57.59], [59.0, 61.08], [62.0, 63.31], [64.0, 65.08], [67.0, 67.56], [69.0, 69.08], [72.0, 73.63], [75.0, 78.7], [80.0, 80.96], [83.0, 84.74], [86.0, 89.19], [90.0, 90.12], [92.0, 100.94], [102.0, 103.1], [105.0, 105.95], [113.0, 116.33], [120.0, 125.9], [129.0, 130.87], [132.0, 134.25], [135.0, 137.02], [138.0, 140.02], [143.0, 144.39]], "keep_status": [false, false, true, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.0, 40.48, 0.0, 32.79, 63.1, 46.68, 0.0, 99.16, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 75.23, 0.0, 44.9, 0.0, 0.0, 44.84, 45.11, 0.0, 98.51, 57.17, 91.47, 0.0], "audiomae_on_audioset": [null, null, [["music", 33.58], ["harp", 14.17], ["harmonic", 6.09]], [["music", 49.91], ["rowboat, canoe, kayak", 8.14], ["boat, water vehicle", 5.32]], null, [["livestock, farm animals, working animals", 41.3], ["sheep", 14.7], ["bleat", 6.98]], null, [["whale vocalization", 25.65], ["speech", 14.22], ["hum", 5.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["splash, splatter", 20.91], ["gurgling", 14.26], ["fly, housefly", 10.6]], null, null, [["liquid", 33.65], ["water", 10.79], ["trickle, dribble", 6.6]], [["whale vocalization", 43.57], ["speech", 17.94], ["music", 8.64]], null, null, null, null, null], "duration": [0.75, 0.23, 5.82, 2.58, 0.76, 9.95, 11.17, 4.03, 1.54, 3.59, 2.08, 1.31, 1.08, 0.56, 0.08, 1.63, 3.7, 0.96, 1.74, 3.19, 0.12, 8.94, 1.1, 0.95, 3.33, 5.9, 1.87, 2.25, 2.02, 2.02, 1.39]} \ No newline at end of file diff --git a/annotations_1/ajm_632U-Ac_filtered.json b/annotations_1/ajm_632U-Ac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db26d1b97d31f7fb664994274f8a2615c7c2b874 --- /dev/null +++ b/annotations_1/ajm_632U-Ac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.94], [11.0, 11.03], [11.0, 11.87], [13.0, 16.97], [32.0, 32.49], [35.0, 38.58], [42.0, 42.58], [46.0, 49.45], [50.0, 51.04], [62.0, 62.41], [63.0, 67.12], [76.0, 76.54], [96.0, 97.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 64.07, 0.0, 87.0, 0.0, 37.21, 0.0, 0.0, 40.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["mosquito", 37.81], ["insect", 23.24], ["fly, housefly", 20.08]], null, null, [["speech", 19.81], ["music", 18.85], ["boing", 6.87]], null, null], "duration": [-0.06, 0.03, 0.87, 3.97, 0.49, 3.58, 0.58, 3.45, 1.04, 0.41, 4.12, 0.54, 1.19]} \ No newline at end of file diff --git a/annotations_1/akSjCFfKAMo_filtered.json b/annotations_1/akSjCFfKAMo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1883b9c755c6797ceab38704e6ff4c3e295c0078 --- /dev/null +++ b/annotations_1/akSjCFfKAMo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.41], [24.0, 28.7], [29.0, 29.69], [30.0, 44.69]], "keep_status": [false, false, false, false], "silence_prob": [100.0, 98.8, 0.0, 50.56], "audiomae_on_audioset": [null, null, null, null], "duration": [2.41, 4.7, 0.69, 14.69]} \ No newline at end of file diff --git a/annotations_1/alE17GLFoQE_filtered.json b/annotations_1/alE17GLFoQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac4599fc26fd264c8f612c4f3ee4f575ecbd9cb5 --- /dev/null +++ b/annotations_1/alE17GLFoQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.74], [9.0, 10.54], [12.0, 14.44], [17.0, 17.9], [19.0, 19.85], [21.0, 21.34], [24.0, 24.24], [26.0, 27.14], [35.0, 36.29], [41.0, 42.94], [45.0, 44.9], [53.0, 55.53], [63.0, 63.68], [67.0, 69.01], [70.0, 71.56], [72.0, 72.81], [79.0, 79.41], [80.0, 83.96], [86.0, 87.51], [89.0, 95.55], [100.0, 106.19], [115.0, 115.42], [122.0, 123.47], [124.0, 129.12], [132.0, 145.27], [149.0, 156.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, true, true], "silence_prob": [0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.68, 0.0, 68.02, 0.0, 0.0, 0.0, 77.03, 0.0, 41.98, 39.12, 0.0, 0.0, 32.66, 34.19, 36.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 51.95], ["timpani", 4.41], ["shofar", 3.8]], null, null, null, null, null, null, null, [["cattle, bovinae", 39.74], ["moo", 34.87], ["livestock, farm animals, working animals", 22.54]], [["buzz", 21.92], ["mosquito", 14.21], ["electric shaver, electric razor", 13.78]], null, null, [["speech", 48.39], ["crying, sobbing", 7.29], ["electric shaver, electric razor", 6.71]], [["speech", 41.57], ["music", 15.11], ["fly, housefly", 3.54]], [["speech", 37.13], ["electric shaver, electric razor", 14.99], ["hum", 8.6]]], "duration": [0.74, 1.54, 2.44, 0.9, 0.85, 0.34, 0.24, 1.14, 1.29, 1.94, -0.1, 2.53, 0.68, 2.01, 1.56, 0.81, 0.41, 3.96, 1.51, 6.55, 6.19, 0.42, 1.47, 5.12, 13.27, 7.64]} \ No newline at end of file diff --git a/annotations_1/alYZ8jQ5L3A_filtered.json b/annotations_1/alYZ8jQ5L3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac463b8114720d2c64c66b96aaec3f1338d79855 --- /dev/null +++ b/annotations_1/alYZ8jQ5L3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.34], [13.0, 13.81], [23.0, 23.58], [28.0, 29.07], [30.0, 43.7], [46.0, 58.7], [61.0, 70.33], [71.0, 71.25], [71.0, 73.47], [74.0, 76.74], [78.0, 78.19], [79.0, 79.12], [83.0, 93.07], [96.0, 96.74], [99.0, 99.77], [102.0, 103.4], [105.0, 104.84], [109.0, 109.02], [109.0, 113.04], [116.0, 116.83], [118.0, 118.52], [119.0, 123.21]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.52, 40.79, 30.99, 0.0, 30.57, 46.75, 0.0, 0.0, 32.68, 0.0, 0.0, 0.0, 0.0, 0.0, 31.48, 0.0, 0.0, 33.37], "audiomae_on_audioset": [null, null, null, null, [["music", 63.61], ["theremin", 8.14], ["didgeridoo", 5.42]], [["music", 70.11], ["throbbing", 4.94], ["hum", 3.85]], [["speech", 16.25], ["music", 6.86], ["beatboxing", 6.52]], null, [["speech", 77.36], ["boing", 2.12], ["inside, small room", 1.92]], [["speech", 36.14], ["mains hum", 24.51], ["hum", 19.09]], null, null, [["didgeridoo", 23.86], ["electric shaver, electric razor", 23.15], ["speech", 20.74]], null, null, null, null, null, [["fly, housefly", 26.95], ["insect", 19.32], ["speech", 16.14]], null, null, [["speech", 30.59], ["wail, moan", 20.38], ["whimper", 12.79]]], "duration": [0.34, 0.81, 0.58, 1.07, 13.7, 12.7, 9.33, 0.25, 2.47, 2.74, 0.19, 0.12, 10.07, 0.74, 0.77, 1.4, -0.16, 0.02, 4.04, 0.83, 0.52, 4.21]} \ No newline at end of file diff --git a/annotations_1/alhVUKh36_Q_filtered.json b/annotations_1/alhVUKh36_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43b4210b3e8963f17e24fd8fdb87473e28e07ef7 --- /dev/null +++ b/annotations_1/alhVUKh36_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 33.64], [37.0, 42.28], [45.0, 44.58], [45.0, 79.22], [81.0, 81.18], [87.0, 87.78], [101.0, 128.01], [136.0, 136.29], [137.0, 145.89], [151.0, 174.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.15, 28.67, 0.0, 0.0, 0.0, 0.0, 29.07, 0.0, 29.06, 28.83], "audiomae_on_audioset": [[["music", 83.19], ["house music", 1.87], ["sampler", 1.51]], [["music", 81.23], ["electronic music", 2.22], ["house music", 2.04]], null, null, null, null, [["music", 84.82], ["funk", 2.03], ["singing", 0.85]], null, [["music", 73.69], ["didgeridoo", 3.22], ["musical instrument", 2.47]], [["music", 89.1], ["swing music", 0.96], ["funk", 0.82]]], "duration": [9.64, 5.28, -0.42, 34.22, 0.18, 0.78, 27.01, 0.29, 8.89, 23.38]} \ No newline at end of file diff --git a/annotations_1/an8Z9J29zWo_filtered.json b/annotations_1/an8Z9J29zWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d6726e61a0701118e63b138900c8789a9b1940d --- /dev/null +++ b/annotations_1/an8Z9J29zWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.96], [5.0, 7.08], [7.0, 7.25], [8.0, 9.29], [13.0, 13.29], [18.0, 18.79], [21.0, 22.98], [25.0, 25.62], [28.0, 28.63], [31.0, 34.64], [40.0, 41.47], [42.0, 42.9], [44.0, 46.35], [52.0, 52.05], [58.0, 58.55], [59.0, 59.63], [61.0, 61.38], [62.0, 62.41], [65.0, 65.43], [68.0, 68.18], [71.0, 74.46], [75.0, 77.03], [78.0, 79.22], [80.0, 82.41], [83.0, 87.17], [87.0, 90.17], [94.0, 95.25], [96.0, 96.15], [98.0, 99.01], [101.0, 102.17], [104.0, 104.82], [111.0, 112.01], [118.0, 118.83], [126.0, 128.9], [130.0, 130.79], [134.0, 133.71], [136.0, 137.22], [139.0, 141.51], [142.0, 143.51], [145.0, 149.22], [153.0, 153.52]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 41.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 96.77, 55.67, 72.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 80.11, 0.0, 44.32, 0.0], "audiomae_on_audioset": [null, [["speech", 42.07], ["music", 14.91], ["animal", 3.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 9.89], ["burping, eructation", 6.92], ["moo", 5.97]], null], "duration": [1.96, 2.08, 0.25, 1.29, 0.29, 0.79, 1.98, 0.62, 0.63, 3.64, 1.47, 0.9, 2.35, 0.05, 0.55, 0.63, 0.38, 0.41, 0.43, 0.18, 3.46, 2.03, 1.22, 2.41, 4.17, 3.17, 1.25, 0.15, 1.01, 1.17, 0.82, 1.01, 0.83, 2.9, 0.79, -0.29, 1.22, 2.51, 1.51, 4.22, 0.52]} \ No newline at end of file diff --git a/annotations_1/an9Zfn3IZCY_filtered.json b/annotations_1/an9Zfn3IZCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17b138828e62dc8eaf64d83a678f21c9ec703920 --- /dev/null +++ b/annotations_1/an9Zfn3IZCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[94.0, 110.4], [112.0, 112.35], [114.0, 138.91], [139.0, 145.98], [147.0, 152.93], [155.0, 192.84], [193.0, 192.94]], "keep_status": [true, false, false, true, false, false, false], "silence_prob": [46.26, 0.0, 50.02, 44.9, 51.6, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 22.1], ["hum", 20.02], ["throbbing", 11.74]], null, null, [["whale vocalization", 33.31], ["animal", 12.88], ["music", 10.94]], null, null, null], "duration": [16.4, 0.35, 24.91, 6.98, 5.93, 37.84, -0.06]} \ No newline at end of file diff --git a/annotations_1/aoBeDwBxv04_filtered.json b/annotations_1/aoBeDwBxv04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1952cd69c1fe21c1aea637fddd65593313444886 --- /dev/null +++ b/annotations_1/aoBeDwBxv04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.61], [3.0, 8.48], [12.0, 12.31], [13.0, 15.28], [17.0, 16.98], [27.0, 27.08], [29.0, 33.0], [37.0, 37.02], [38.0, 38.18], [43.0, 43.28], [45.0, 59.21], [60.0, 61.16], [63.0, 63.73], [67.0, 71.27], [73.0, 74.04], [79.0, 82.38], [84.0, 86.8], [89.0, 90.61], [92.0, 92.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.43, 0.0, 72.75, 0.0, 0.0, 33.18, 0.0, 0.0, 0.0, 59.07, 0.0, 0.0, 100.0, 0.0, 34.83, 95.51, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 62.87], ["fart", 11.96], ["crying, sobbing", 5.12]], null, null, null, null, null, null, null, null, [["moo", 40.51], ["cattle, bovinae", 34.17], ["livestock, farm animals, working animals", 24.97]], null, null, null], "duration": [0.61, 5.48, 0.31, 2.28, -0.02, 0.08, 4.0, 0.02, 0.18, 0.28, 14.21, 1.16, 0.73, 4.27, 1.04, 3.38, 2.8, 1.61, 0.79]} \ No newline at end of file diff --git a/annotations_1/aoc1wqaK8cc_filtered.json b/annotations_1/aoc1wqaK8cc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cd0c86889b63975bee721f5985b8735ccb2f91c --- /dev/null +++ b/annotations_1/aoc1wqaK8cc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.92], [4.0, 3.99], [11.0, 10.94], [13.0, 12.97], [14.0, 14.57], [15.0, 21.59], [23.0, 26.2], [28.0, 29.1], [32.0, 32.29], [35.0, 35.5], [40.0, 41.07], [44.0, 45.99], [59.0, 59.71], [79.0, 86.22], [87.0, 87.32], [89.0, 89.11], [104.0, 104.92], [120.0, 126.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 50.46, 42.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.86, 0.0, 0.0, 0.0, 29.61], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 53.57], ["guitar", 13.38], ["effects unit", 7.66]], null, null, null, null, null, null, [["music", 76.59], ["synthetic singing", 2.15], ["sidetone", 2.04]], null, null, null, [["music", 77.07], ["synthetic singing", 3.98], ["trombone", 1.84]]], "duration": [-0.08, -0.01, -0.06, -0.03, 0.57, 6.59, 3.2, 1.1, 0.29, 0.5, 1.07, 1.99, 0.71, 7.22, 0.32, 0.11, 0.92, 6.62]} \ No newline at end of file diff --git a/annotations_1/apasYYh6nEA_filtered.json b/annotations_1/apasYYh6nEA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3348c95219d62b89ade2a87ffc2a8ea97db6f64d --- /dev/null +++ b/annotations_1/apasYYh6nEA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 24.7], [25.0, 24.8], [25.0, 25.46], [25.0, 36.78], [39.0, 38.84], [39.0, 46.77], [58.0, 60.74], [62.0, 63.49], [65.0, 65.84], [69.0, 73.89], [79.0, 79.25], [79.0, 79.61], [80.0, 80.81], [85.0, 85.36], [93.0, 93.18], [98.0, 98.05], [99.0, 99.17], [100.0, 100.25], [101.0, 101.46], [106.0, 106.3], [107.0, 107.7], [109.0, 109.49], [110.0, 118.2], [125.0, 127.18], [130.0, 132.76], [136.0, 140.78], [143.0, 143.55], [146.0, 151.6]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 38.43, 0.0, 36.46, 46.54, 0.0, 0.0, 30.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.88, 39.58, 33.49, 38.12, 0.0, 36.84], "audiomae_on_audioset": [null, null, null, [["speech", 82.47], ["whack, thwack", 6.59], ["hammer", 3.21]], null, [["speech", 84.48], ["firecracker", 3.76], ["explosion", 3.57]], [["speech", 27.46], ["fly, housefly", 17.17], ["insect", 8.19]], null, null, [["fart", 66.72], ["speech", 19.08], ["groan", 1.27]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 12.38], ["police car (siren)", 11.07], ["groan", 10.63]], [["cowbell", 26.14], ["speech", 14.66], ["music", 5.07]], [["speech", 43.31], ["music", 4.96], ["fart", 3.85]], [["speech", 61.44], ["fart", 3.95], ["eruption", 2.15]], null, [["speech", 25.96], ["livestock, farm animals, working animals", 11.02], ["cowbell", 10.34]]], "duration": [-0.3, -0.2, 0.46, 11.78, -0.16, 7.77, 2.74, 1.49, 0.84, 4.89, 0.25, 0.61, 0.81, 0.36, 0.18, 0.05, 0.17, 0.25, 0.46, 0.3, 0.7, 0.49, 8.2, 2.18, 2.76, 4.78, 0.55, 5.6]} \ No newline at end of file diff --git a/annotations_1/ar_o_qS68oA_filtered.json b/annotations_1/ar_o_qS68oA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e4e3dca489d28892fe80d8f43e12bd26af54d00 --- /dev/null +++ b/annotations_1/ar_o_qS68oA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.7], [11.0, 11.91], [14.0, 15.18], [15.0, 16.29], [17.0, 50.23], [52.0, 52.02], [53.0, 53.64], [54.0, 55.19], [57.0, 59.02], [60.0, 60.13], [63.0, 64.18], [67.0, 68.07], [70.0, 70.04], [80.0, 82.05], [84.0, 85.8], [87.0, 108.23], [109.0, 110.17], [113.0, 112.95], [116.0, 115.72], [117.0, 118.15], [119.0, 119.37], [119.0, 119.4], [119.0, 119.43], [119.0, 119.47], [119.0, 119.5], [121.0, 122.64], [125.0, 127.7], [134.0, 142.52], [144.0, 147.43], [149.0, 150.03], [150.0, 152.41], [156.0, 156.24], [158.0, 159.6]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [41.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.02, 0.0, 0.0, 0.0, 0.0, 48.14, 0.0, 29.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.8, 43.9, 30.2, 0.0, 37.73, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 17.62], ["speech", 11.91], ["hum", 11.43]], null, null, null, null, null, null, null, [["speech", 25.95], ["sidetone", 24.98], ["radio", 16.7]], null, null, null, null, [["music", 28.69], ["hum", 17.11], ["radio", 10.88]], null, [["didgeridoo", 32.08], ["music", 18.57], ["mains hum", 14.89]], null, null, null, null, null, null, null, null, null, null, [["speech", 29.42], ["cattle, bovinae", 28.61], ["moo", 17.25]], [["mains hum", 73.94], ["hum", 17.21], ["buzz", 2.13]], [["music", 10.09], ["didgeridoo", 9.29], ["reverberation", 8.44]], null, [["mains hum", 35.42], ["hum", 29.7], ["speech", 12.82]], null, null], "duration": [2.7, 0.91, 1.18, 1.29, 33.23, 0.02, 0.64, 1.19, 2.02, 0.13, 1.18, 1.07, 0.04, 2.05, 1.8, 21.23, 1.17, -0.05, -0.28, 1.15, 0.37, 0.4, 0.43, 0.47, 0.5, 1.64, 2.7, 8.52, 3.43, 1.03, 2.41, 0.24, 1.6]} \ No newline at end of file diff --git a/annotations_1/arzwnRoAQP0_filtered.json b/annotations_1/arzwnRoAQP0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4ec7d03da5cf881cd77bfced05bb820999b8994 --- /dev/null +++ b/annotations_1/arzwnRoAQP0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.74], [8.0, 8.95], [14.0, 16.68], [17.0, 17.85], [26.0, 27.58], [40.0, 40.12], [41.0, 41.15], [42.0, 43.5], [52.0, 52.78], [53.0, 54.09], [55.0, 59.7], [61.0, 61.62], [63.0, 64.86], [96.0, 103.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 62.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 0.0, 32.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.08], ["hum", 2.7], ["speech", 2.59]]], "duration": [0.74, 0.95, 2.68, 0.85, 1.58, 0.12, 0.15, 1.5, 0.78, 1.09, 4.7, 0.62, 1.86, 7.62]} \ No newline at end of file diff --git a/annotations_1/atBUgwJAD0U_filtered.json b/annotations_1/atBUgwJAD0U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d073aaebaf8decb6a5484f34a0f1e935e5f2f42 --- /dev/null +++ b/annotations_1/atBUgwJAD0U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.88], [8.0, 9.21], [13.0, 14.72], [17.0, 23.87], [26.0, 123.8], [127.0, 126.98], [128.0, 131.75], [132.0, 165.27], [166.0, 175.69], [181.0, 182.19]], "keep_status": [false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.76, 0.0, 0.0, 35.97, 0.0, 37.54, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 24.43], ["music", 24.12], ["throbbing", 15.97]], null, null, [["throbbing", 25.54], ["music", 23.49], ["hum", 18.69]], null, [["music", 40.54], ["hum", 16.88], ["throbbing", 14.54]], null], "duration": [0.88, 1.21, 1.72, 6.87, 97.8, -0.02, 3.75, 33.27, 9.69, 1.19]} \ No newline at end of file diff --git a/annotations_1/atQYOl5KL-o_filtered.json b/annotations_1/atQYOl5KL-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0dff3df03b1f8ed90e117a1cca5bb15f0d181d82 --- /dev/null +++ b/annotations_1/atQYOl5KL-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 39.61], [40.0, 41.0], [41.0, 45.52], [46.0, 53.52], [54.0, 60.86], [69.0, 69.92]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.64, 63.42, 98.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [35.61, 1.0, 4.52, 7.52, 6.86, 0.92]} \ No newline at end of file diff --git a/annotations_1/auNkHDpPil4_filtered.json b/annotations_1/auNkHDpPil4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f48deeaf61038691386684d0ada0fe2b8a211945 --- /dev/null +++ b/annotations_1/auNkHDpPil4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 26.77], [36.0, 37.89], [38.0, 43.02], [44.0, 44.63], [48.0, 48.39], [50.0, 52.15], [59.0, 63.63], [72.0, 76.81], [82.0, 82.02], [82.0, 82.26], [83.0, 86.41], [87.0, 89.28], [90.0, 91.71], [95.0, 104.26], [106.0, 108.18], [110.0, 117.58], [121.0, 121.83], [124.0, 124.5], [125.0, 127.35], [130.0, 131.09], [138.0, 138.57], [139.0, 140.9], [143.0, 148.49], [152.0, 154.82], [157.0, 159.27], [160.0, 162.3], [163.0, 164.86], [166.0, 167.34], [169.0, 170.07], [171.0, 174.66]], "keep_status": [false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [30.58, 0.0, 30.7, 0.0, 0.0, 31.28, 29.11, 62.17, 0.0, 0.0, 55.11, 56.1, 0.0, 52.45, 56.86, 43.93, 0.0, 0.0, 45.05, 0.0, 0.0, 0.0, 39.75, 61.18, 45.36, 53.1, 0.0, 0.0, 0.0, 56.55], "audiomae_on_audioset": [[["music", 55.64], ["didgeridoo", 15.11], ["musical instrument", 3.2]], null, [["music", 38.21], ["moo", 14.15], ["boing", 10.63]], null, null, [["speech", 33.9], ["livestock, farm animals, working animals", 11.9], ["moo", 8.37]], [["speech", 43.59], ["applause", 7.73], ["fart", 6.18]], null, null, null, null, null, null, null, null, [["music", 42.4], ["speech", 7.95], ["hum", 6.96]], null, null, [["music", 18.33], ["speech", 12.33], ["hum", 8.56]], null, null, null, [["frog", 20.31], ["whale vocalization", 12.89], ["speech", 9.71]], null, [["speech", 43.17], ["music", 6.1], ["fly, housefly", 3.89]], null, null, null, null, null], "duration": [21.77, 1.89, 5.02, 0.63, 0.39, 2.15, 4.63, 4.81, 0.02, 0.26, 3.41, 2.28, 1.71, 9.26, 2.18, 7.58, 0.83, 0.5, 2.35, 1.09, 0.57, 1.9, 5.49, 2.82, 2.27, 2.3, 1.86, 1.34, 1.07, 3.66]} \ No newline at end of file diff --git a/annotations_1/aucs5KRFzhE_filtered.json b/annotations_1/aucs5KRFzhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b72fa63a0307119beff3c521d5593a9a840f405 --- /dev/null +++ b/annotations_1/aucs5KRFzhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.02], [16.0, 16.7], [20.0, 20.93], [43.0, 51.61], [55.0, 55.68], [56.0, 57.57], [61.0, 62.06], [65.0, 66.28], [68.0, 72.64], [77.0, 79.95], [80.0, 89.92], [94.0, 100.13], [105.0, 108.6], [109.0, 109.81], [111.0, 131.11], [132.0, 133.79], [135.0, 155.55], [159.0, 167.95], [169.0, 171.39], [171.0, 177.62], [180.0, 201.31]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, false, true, false, true, false, false, false, true], "silence_prob": [40.62, 0.0, 0.0, 28.8, 0.0, 0.0, 0.0, 0.0, 28.29, 28.42, 28.26, 28.37, 28.78, 0.0, 28.62, 0.0, 28.64, 28.97, 28.9, 28.67, 28.29], "audiomae_on_audioset": [[["music", 46.43], ["fart", 31.28], ["zipper (clothing)", 12.49]], null, null, [["mains hum", 44.99], ["hum", 29.79], ["throbbing", 13.19]], null, null, null, null, [["speech", 46.62], ["music", 18.22], ["explosion", 7.18]], [["music", 46.18], ["buzz", 5.55], ["mains hum", 5.0]], [["music", 18.81], ["car", 5.58], ["mains hum", 5.41]], [["music", 59.66], ["speech", 12.87], ["electronic music", 7.13]], [["speech", 28.65], ["music", 19.15], ["vehicle", 5.36]], null, [["music", 55.25], ["cacophony", 6.05], ["synthesizer", 3.72]], null, [["music", 29.86], ["speech", 25.01], ["machine gun", 11.04]], [["music", 62.73], ["didgeridoo", 6.26], ["musical instrument", 4.17]], [["speech", 43.93], ["music", 29.81], ["boing", 4.34]], [["music", 67.33], ["speech", 12.19], ["throbbing", 2.46]], [["hum", 24.27], ["music", 22.65], ["mains hum", 14.2]]], "duration": [2.02, 0.7, 0.93, 8.61, 0.68, 1.57, 1.06, 1.28, 4.64, 2.95, 9.92, 6.13, 3.6, 0.81, 20.11, 1.79, 20.55, 8.95, 2.39, 6.62, 21.31]} \ No newline at end of file diff --git a/annotations_1/avjdKTqiVvQ_filtered.json b/annotations_1/avjdKTqiVvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d95ab994506e30459d716fd0e9cb7b434c036a6 --- /dev/null +++ b/annotations_1/avjdKTqiVvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[79.0, 89.56], [93.0, 117.04], [118.0, 117.95], [124.0, 124.17], [128.0, 133.96], [138.0, 138.82]], "keep_status": [false, false, false, false, false, false], "silence_prob": [86.82, 47.62, 0.0, 0.0, 83.7, 0.0], "audiomae_on_audioset": [null, [["music", 66.82], ["theremin", 20.3], ["ambient music", 4.36]], null, null, null, null], "duration": [10.56, 24.04, -0.05, 0.17, 5.96, 0.82]} \ No newline at end of file diff --git a/annotations_1/awuqJuO5WOc_filtered.json b/annotations_1/awuqJuO5WOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a52fc4138e83f5298f1534a1cfa844c62d051ec --- /dev/null +++ b/annotations_1/awuqJuO5WOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 20.46], [21.0, 56.08], [57.0, 58.53], [59.0, 60.94], [61.0, 62.19], [64.0, 65.52], [68.0, 74.93], [78.0, 78.34], [80.0, 80.03], [82.0, 102.83], [106.0, 115.13], [116.0, 119.97], [123.0, 124.73], [131.0, 137.29], [139.0, 140.24], [141.0, 142.01], [143.0, 144.44], [145.0, 146.94], [148.0, 148.22], [149.0, 155.24]], "keep_status": [true, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false, false, false, false, true], "silence_prob": [30.56, 0.0, 0.0, 0.0, 0.0, 0.0, 30.75, 0.0, 0.0, 30.6, 34.29, 55.6, 0.0, 46.72, 0.0, 0.0, 0.0, 0.0, 0.0, 44.49], "audiomae_on_audioset": [[["music", 48.94], ["synthesizer", 6.77], ["sound effect", 3.85]], null, null, null, null, null, [["music", 10.69], ["breaking", 10.37], ["whale vocalization", 8.25]], null, null, [["music", 79.26], ["musical instrument", 4.2], ["synthesizer", 2.09]], [["hum", 30.61], ["noise", 14.58], ["whale vocalization", 10.48]], null, null, [["hum", 24.39], ["speech", 22.09], ["music", 13.23]], null, null, null, null, null, [["hum", 36.53], ["whale vocalization", 23.21], ["throbbing", 6.34]]], "duration": [10.46, 35.08, 1.53, 1.94, 1.19, 1.52, 6.93, 0.34, 0.03, 20.83, 9.13, 3.97, 1.73, 6.29, 1.24, 1.01, 1.44, 1.94, 0.22, 6.24]} \ No newline at end of file diff --git a/annotations_1/axWtCnuctw0_filtered.json b/annotations_1/axWtCnuctw0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86880854117d11d7eebe66feeebdbea89d0d1ec7 --- /dev/null +++ b/annotations_1/axWtCnuctw0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 45.01], [47.0, 47.01], [47.0, 47.28], [52.0, 80.0], [84.0, 90.91]], "keep_status": [true, false, false, true, true], "silence_prob": [32.76, 0.0, 0.0, 28.55, 31.1], "audiomae_on_audioset": [[["music", 18.11], ["whale vocalization", 16.83], ["noise", 7.83]], null, null, [["whale vocalization", 18.4], ["music", 14.47], ["echo", 10.28]], [["gong", 33.69], ["music", 23.0], ["synthesizer", 6.07]]], "duration": [8.01, 0.01, 0.28, 28.0, 6.91]} \ No newline at end of file diff --git a/annotations_1/axhUtepWokA_filtered.json b/annotations_1/axhUtepWokA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfba58030d1b8414f59c30682f2b6c2b3f146e6a --- /dev/null +++ b/annotations_1/axhUtepWokA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.56], [10.0, 11.42], [13.0, 12.7], [13.0, 15.23], [16.0, 28.19], [30.0, 32.9], [42.0, 57.01], [61.0, 73.09], [74.0, 80.57], [82.0, 83.03], [84.0, 84.27], [85.0, 85.6], [92.0, 98.51], [101.0, 100.97], [102.0, 102.95], [107.0, 109.09], [109.0, 126.59], [128.0, 128.92], [131.0, 133.08], [133.0, 133.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 50.41, 29.89, 29.76, 30.84, 34.81, 40.81, 0.0, 0.0, 0.0, 30.09, 0.0, 0.0, 32.1, 32.32, 0.0, 35.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 59.29], ["throbbing", 22.18], ["electronic music", 3.14]], [["music", 79.96], ["dubstep", 6.62], ["electronic music", 3.85]], [["music", 81.95], ["electronic music", 4.82], ["throbbing", 2.45]], [["music", 48.55], ["throbbing", 26.92], ["hum", 11.54]], [["throbbing", 33.9], ["music", 20.75], ["hum", 20.24]], null, null, null, [["music", 43.96], ["electronic music", 9.66], ["moo", 8.65]], null, null, [["speech", 26.94], ["music", 13.46], ["crowd", 13.03]], [["music", 52.76], ["didgeridoo", 8.1], ["throbbing", 4.49]], null, [["music", 40.26], ["throbbing", 11.71], ["cattle, bovinae", 5.84]], null], "duration": [0.56, 1.42, -0.3, 2.23, 12.19, 2.9, 15.01, 12.09, 6.57, 1.03, 0.27, 0.6, 6.51, -0.03, 0.95, 2.09, 17.59, 0.92, 2.08, 0.56]} \ No newline at end of file diff --git a/annotations_1/ay1hpFWZQnI_filtered.json b/annotations_1/ay1hpFWZQnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b1f13b204a55ec6ee8c1966d8dee28141819587 --- /dev/null +++ b/annotations_1/ay1hpFWZQnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [28.0, 28.02], [30.0, 29.62], [30.0, 31.43], [34.0, 34.53], [48.0, 48.66], [50.0, 50.45], [51.0, 57.0], [60.0, 60.13], [61.0, 63.02], [64.0, 64.59], [88.0, 89.48]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.19, 0.0, 45.4, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 29.67], ["music", 22.04], ["electronic music", 5.65]], null, null], "duration": [0.64, 0.02, -0.38, 1.43, 0.53, 0.66, 0.45, 6.0, 0.13, 2.02, 0.59, 1.48]} \ No newline at end of file diff --git a/annotations_1/b-w1bY8qhnc_filtered.json b/annotations_1/b-w1bY8qhnc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17ee709dded09c65f8d4d1e7153d8b9c4e1ca08f --- /dev/null +++ b/annotations_1/b-w1bY8qhnc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 28.49], [29.0, 28.54], [32.0, 33.79], [35.0, 37.3], [40.0, 42.57], [44.0, 45.32], [47.0, 50.06], [54.0, 56.08], [58.0, 57.67], [58.0, 60.93], [62.0, 64.15], [66.0, 69.67], [71.0, 71.09], [71.0, 71.79], [79.0, 80.27], [81.0, 82.44], [84.0, 84.69], [85.0, 87.24], [87.0, 87.27], [88.0, 89.77], [90.0, 90.56], [99.0, 98.63], [100.0, 100.48], [106.0, 112.01], [114.0, 114.15], [125.0, 129.78], [138.0, 141.4], [141.0, 149.82], [151.0, 157.05], [158.0, 159.9], [161.0, 162.35], [162.0, 167.86], [168.0, 170.24], [171.0, 173.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, true, true, false], "silence_prob": [55.04, 0.0, 0.0, 91.47, 82.07, 0.0, 88.64, 84.8, 0.0, 52.74, 44.69, 53.22, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67, 0.0, 0.0, 0.0, 0.0, 0.0, 32.46, 0.0, 33.19, 46.9, 39.5, 36.11, 0.0, 0.0, 42.44, 41.5, 58.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 41.12], ["speech", 12.58], ["hum", 7.46]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.63], ["music", 31.33], ["synthetic singing", 1.27]], null, [["speech", 42.12], ["music", 21.83], ["sidetone", 5.78]], [["music", 17.62], ["speech", 8.85], ["animal", 4.75]], [["music", 30.68], ["singing bowl", 10.17], ["synthesizer", 8.13]], [["speech", 58.06], ["music", 22.48], ["synthesizer", 3.44]], null, null, [["music", 36.11], ["speech", 22.14], ["mains hum", 4.69]], [["speech", 40.2], ["music", 23.74], ["musical instrument", 5.86]], null], "duration": [13.49, -0.46, 1.79, 2.3, 2.57, 1.32, 3.06, 2.08, -0.33, 2.93, 2.15, 3.67, 0.09, 0.79, 1.27, 1.44, 0.69, 2.24, 0.27, 1.77, 0.56, -0.37, 0.48, 6.01, 0.15, 4.78, 3.4, 8.82, 6.05, 1.9, 1.35, 5.86, 2.24, 2.33]} \ No newline at end of file diff --git a/annotations_1/b0KSEziycmw_filtered.json b/annotations_1/b0KSEziycmw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e213df6382e65dbfdfc31d9ae902dfbf6a2bf986 --- /dev/null +++ b/annotations_1/b0KSEziycmw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.1], [10.0, 10.59], [18.0, 18.87], [22.0, 23.43], [27.0, 27.18], [28.0, 28.34], [35.0, 36.56], [38.0, 38.38], [40.0, 40.56], [42.0, 42.94], [49.0, 49.81], [51.0, 52.08], [53.0, 53.87], [55.0, 55.73], [57.0, 58.18], [59.0, 59.8], [67.0, 67.71], [69.0, 70.7], [71.0, 71.98], [74.0, 75.24], [76.0, 77.31], [78.0, 78.31], [80.0, 80.27], [82.0, 82.76], [84.0, 84.45], [86.0, 86.17], [87.0, 87.32], [92.0, 93.26], [95.0, 101.76], [102.0, 104.45], [112.0, 113.27], [116.0, 117.98], [122.0, 123.84], [126.0, 128.36], [129.0, 131.55], [134.0, 135.55], [139.0, 140.71], [142.0, 144.46], [145.0, 152.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.32, 42.96, 0.0, 0.0, 0.0, 38.02, 41.2, 0.0, 0.0, 55.53, 29.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 22.54], ["speech", 18.4], ["fart", 14.78]], [["speech", 36.55], ["music", 28.91], ["echo", 3.09]], null, null, null, [["sine wave", 43.99], ["speech", 12.33], ["chirp tone", 9.39]], [["insect", 20.62], ["fly, housefly", 19.44], ["speech", 10.63]], null, null, null, [["music", 61.0], ["speech", 22.54], ["explosion", 2.26]]], "duration": [1.1, 0.59, 0.87, 1.43, 0.18, 0.34, 1.56, 0.38, 0.56, 0.94, 0.81, 1.08, 0.87, 0.73, 1.18, 0.8, 0.71, 1.7, 0.98, 1.24, 1.31, 0.31, 0.27, 0.76, 0.45, 0.17, 0.32, 1.26, 6.76, 2.45, 1.27, 1.98, 1.84, 2.36, 2.55, 1.55, 1.71, 2.46, 7.59]} \ No newline at end of file diff --git a/annotations_1/b0p7_jQ8HiE_filtered.json b/annotations_1/b0p7_jQ8HiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9680985cdf9cd1d8a62e04efb4ff888367c122e --- /dev/null +++ b/annotations_1/b0p7_jQ8HiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.89], [17.0, 19.16], [24.0, 24.39], [27.0, 29.66], [38.0, 38.97], [43.0, 44.25], [49.0, 49.35], [52.0, 61.84], [63.0, 64.34], [67.0, 68.03], [70.0, 71.66], [74.0, 75.73], [79.0, 84.45], [85.0, 90.36]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [43.18, 41.1, 0.0, 35.82, 0.0, 0.0, 0.0, 32.84, 0.0, 0.0, 0.0, 0.0, 37.01, 33.97], "audiomae_on_audioset": [[["music", 46.53], ["musical instrument", 7.08], ["echo", 4.34]], [["gong", 16.8], ["music", 16.11], ["singing bowl", 11.65]], null, [["music", 46.7], ["didgeridoo", 7.44], ["mantra", 6.44]], null, null, null, [["music", 60.66], ["theremin", 8.51], ["synthesizer", 7.73]], null, null, null, null, [["music", 59.51], ["effects unit", 6.27], ["didgeridoo", 4.15]], [["music", 63.54], ["didgeridoo", 12.0], ["musical instrument", 3.78]]], "duration": [5.89, 2.16, 0.39, 2.66, 0.97, 1.25, 0.35, 9.84, 1.34, 1.03, 1.66, 1.73, 5.45, 5.36]} \ No newline at end of file diff --git a/annotations_1/b1MxW8nf_lU_filtered.json b/annotations_1/b1MxW8nf_lU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4f27426bd63416ead985666fc81b220c22bd495 --- /dev/null +++ b/annotations_1/b1MxW8nf_lU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 41.5], [42.0, 50.4], [55.0, 73.16], [76.0, 76.92], [78.0, 78.97], [84.0, 84.48]], "keep_status": [true, true, true, false, false, false], "silence_prob": [32.28, 32.08, 33.73, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 60.41], ["crowd", 4.75], ["throbbing", 4.61]], [["music", 47.17], ["throbbing", 10.45], ["speech", 4.94]], [["speech", 35.09], ["livestock, farm animals, working animals", 13.32], ["cattle, bovinae", 10.74]], null, null, null], "duration": [17.5, 8.4, 18.16, 0.92, 0.97, 0.48]} \ No newline at end of file diff --git a/annotations_1/b2MEP246DxY_filtered.json b/annotations_1/b2MEP246DxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1c971b680aaa32be9bdfad52b34d60585b0c8cd --- /dev/null +++ b/annotations_1/b2MEP246DxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 24.16], [27.0, 70.68], [79.0, 79.07], [80.0, 94.64], [98.0, 113.95]], "keep_status": [false, false, false, false, false], "silence_prob": [28.63, 0.0, 0.0, 30.4, 29.34], "audiomae_on_audioset": [[["speech", 44.9], ["music", 26.54], ["outside, rural or natural", 4.2]], null, null, [["speech", 48.08], ["brass instrument", 13.46], ["trombone", 11.75]], [["music", 45.46], ["speech", 20.87], ["electronic music", 7.7]]], "duration": [10.16, 43.68, 0.07, 14.64, 15.95]} \ No newline at end of file diff --git a/annotations_1/b2P-oU216V4_filtered.json b/annotations_1/b2P-oU216V4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f3410f2d9f627d4d1d3601b69b8cdb3f6f52e42 --- /dev/null +++ b/annotations_1/b2P-oU216V4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.79], [16.0, 26.43], [27.0, 29.71], [35.0, 42.36], [45.0, 45.33], [47.0, 55.53], [65.0, 67.96], [73.0, 78.12], [81.0, 88.72], [110.0, 111.72]], "keep_status": [false, true, false, false, false, false, true, false, false, false], "silence_prob": [32.09, 34.04, 54.83, 33.39, 0.0, 32.77, 34.57, 31.79, 32.01, 0.0], "audiomae_on_audioset": [[["speech", 43.85], ["music", 25.81], ["sidetone", 2.33]], [["music", 52.1], ["speech", 11.51], ["whack, thwack", 5.09]], null, [["music", 44.01], ["speech", 22.52], ["throbbing", 5.12]], null, [["cattle, bovinae", 37.54], ["livestock, farm animals, working animals", 35.4], ["moo", 23.38]], [["music", 43.32], ["speech", 18.38], ["moo", 6.35]], [["music", 82.11], ["theremin", 4.17], ["synthesizer", 3.43]], [["music", 72.52], ["throbbing", 4.7], ["musical instrument", 3.23]], null], "duration": [3.79, 10.43, 2.71, 7.36, 0.33, 8.53, 2.96, 5.12, 7.72, 1.72]} \ No newline at end of file diff --git a/annotations_1/b2hhdMiOTOE_filtered.json b/annotations_1/b2hhdMiOTOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46d8205f3a9e000ef6ec075c2bd9d7121043dc91 --- /dev/null +++ b/annotations_1/b2hhdMiOTOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[59.0, 58.6], [59.0, 96.97], [100.0, 126.98], [128.0, 138.67]], "keep_status": [false, false, true, true], "silence_prob": [0.0, 0.0, 31.65, 34.72], "audiomae_on_audioset": [null, null, [["music", 18.87], ["hum", 6.79], ["noise", 6.63]], [["music", 38.42], ["effects unit", 14.55], ["guitar", 7.35]]], "duration": [-0.4, 37.97, 26.98, 10.67]} \ No newline at end of file diff --git a/annotations_1/b3OlGLDk4pY_filtered.json b/annotations_1/b3OlGLDk4pY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e2233310c6f808c25888d1fedcfdbeaf8f2d921 --- /dev/null +++ b/annotations_1/b3OlGLDk4pY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 57.25], [60.0, 76.69], [79.0, 85.46], [87.0, 104.58], [107.0, 115.26], [119.0, 128.36], [131.0, 131.23], [133.0, 150.36], [154.0, 158.19], [159.0, 167.24], [172.0, 173.15], [175.0, 175.86], [177.0, 234.86]], "keep_status": [false, true, true, true, true, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 29.7, 29.0, 28.73, 29.4, 29.54, 0.0, 28.7, 29.4, 28.83, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 22.08], ["hum", 10.79], ["mains hum", 10.28]], [["music", 26.03], ["static", 6.54], ["hum", 5.97]], [["music", 23.84], ["speech", 8.63], ["vehicle", 8.05]], [["music", 17.62], ["fly, housefly", 13.73], ["mosquito", 12.18]], [["music", 59.03], ["sound effect", 5.28], ["buzz", 3.97]], null, [["livestock, farm animals, working animals", 25.77], ["cattle, bovinae", 21.67], ["moo", 12.71]], [["music", 26.81], ["hum", 13.23], ["explosion", 12.48]], [["hum", 29.1], ["music", 25.12], ["mains hum", 16.37]], null, null, null], "duration": [52.25, 16.69, 6.46, 17.58, 8.26, 9.36, 0.23, 17.36, 4.19, 8.24, 1.15, 0.86, 57.86]} \ No newline at end of file diff --git a/annotations_1/b3lOpSXhT0c_filtered.json b/annotations_1/b3lOpSXhT0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00186de47ca921c422c09616e5d5d01562eb9522 --- /dev/null +++ b/annotations_1/b3lOpSXhT0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 103.67], [104.0, 104.14], [105.0, 108.63], [109.0, 111.2], [112.0, 113.29], [114.0, 137.71], [138.0, 138.38]], "keep_status": [false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 41.2, 40.92, 0.0, 31.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 30.38], ["hum", 10.08], ["throbbing", 5.84]], [["hum", 36.11], ["throbbing", 19.8], ["mains hum", 13.37]], null, [["whack, thwack", 19.5], ["music", 11.83], ["smash, crash", 9.09]], null], "duration": [33.67, 0.14, 3.63, 2.2, 1.29, 23.71, 0.38]} \ No newline at end of file diff --git a/annotations_1/b4kRHpvisxE_filtered.json b/annotations_1/b4kRHpvisxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9928d1b7c0c3d2b183e9276cebfc679a9ebd3a4a --- /dev/null +++ b/annotations_1/b4kRHpvisxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.89], [10.0, 11.72], [13.0, 14.28], [18.0, 18.0], [18.0, 20.31], [25.0, 26.64], [31.0, 34.47], [35.0, 37.39], [39.0, 41.57], [43.0, 45.81], [50.0, 52.47], [54.0, 57.32], [60.0, 62.94], [64.0, 66.82], [69.0, 72.5], [75.0, 76.27], [79.0, 81.11], [84.0, 86.12], [88.0, 90.54], [92.0, 95.01], [96.0, 97.78], [101.0, 101.51], [103.0, 104.21], [107.0, 107.08], [112.0, 113.0], [117.0, 122.0], [129.0, 130.28], [131.0, 135.89], [137.0, 140.34], [143.0, 145.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.44, 0.0, 99.92, 56.86, 100.0, 100.0, 100.0, 73.97, 99.98, 99.1, 98.86, 0.0, 100.0, 98.99, 99.05, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 60.32, 0.0, 71.29, 82.25, 76.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.11, 1.72, 1.28, 0.0, 2.31, 1.64, 3.47, 2.39, 2.57, 2.81, 2.47, 3.32, 2.94, 2.82, 3.5, 1.27, 2.11, 2.12, 2.54, 3.01, 1.78, 0.51, 1.21, 0.08, 1.0, 5.0, 1.28, 4.89, 3.34, 2.27]} \ No newline at end of file diff --git a/annotations_1/b4vpGhO2LwA_filtered.json b/annotations_1/b4vpGhO2LwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a09b4f793ce7b4480e14dcbe6e4cc18074e0ed17 --- /dev/null +++ b/annotations_1/b4vpGhO2LwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.38], [18.0, 18.18], [19.0, 19.62], [41.0, 41.35], [47.0, 47.82], [50.0, 51.02], [52.0, 54.04], [55.0, 56.54], [61.0, 61.11], [67.0, 67.1], [73.0, 72.82], [73.0, 76.0], [77.0, 77.48], [84.0, 84.08], [85.0, 86.07], [96.0, 96.9]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.58, 0.0, 0.0, 0.0, 0.0, 34.56, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 12.97], ["honk", 11.75], ["goose", 10.95]], null, null, null, null, [["speech", 35.66], ["hum", 9.83], ["sidetone", 6.71]], null, null, null, null], "duration": [0.38, 0.18, 0.62, 0.35, 0.82, 1.02, 2.04, 1.54, 0.11, 0.1, -0.18, 3.0, 0.48, 0.08, 1.07, 0.9]} \ No newline at end of file diff --git a/annotations_1/b5Q6A_1YyHg_filtered.json b/annotations_1/b5Q6A_1YyHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52dd70b365704288feac7098c9c0d1aeb6f54cc0 --- /dev/null +++ b/annotations_1/b5Q6A_1YyHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 27.01], [28.0, 32.68], [36.0, 40.76], [48.0, 68.15], [71.0, 80.57], [91.0, 102.69], [103.0, 103.79], [106.0, 106.89], [117.0, 124.38]], "keep_status": [false, false, false, false, false, true, false, false, true], "silence_prob": [31.13, 29.7, 30.1, 29.47, 29.78, 29.92, 0.0, 0.0, 32.68], "audiomae_on_audioset": [[["speech", 41.65], ["music", 33.4], ["theremin", 3.25]], [["music", 82.12], ["mosquito", 2.19], ["theremin", 2.05]], [["speech", 50.87], ["music", 33.41], ["boing", 2.7]], [["music", 57.71], ["speech", 10.03], ["fart", 3.61]], [["music", 54.8], ["speech", 27.43], ["electronic music", 1.92]], [["whack, thwack", 37.8], ["speech", 12.4], ["fart", 11.62]], null, null, [["speech", 45.09], ["whack, thwack", 16.11], ["thunk", 8.59]]], "duration": [5.01, 4.68, 4.76, 20.15, 9.57, 11.69, 0.79, 0.89, 7.38]} \ No newline at end of file diff --git a/annotations_1/b60DLSEemEY_filtered.json b/annotations_1/b60DLSEemEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..398143e0973652773a7d74824d2c282744768aa0 --- /dev/null +++ b/annotations_1/b60DLSEemEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.53], [6.0, 12.38], [13.0, 13.22], [14.0, 18.71], [19.0, 23.41], [24.0, 24.34], [25.0, 27.08], [27.0, 50.84], [52.0, 54.01], [54.0, 55.43], [60.0, 60.13], [62.0, 64.07], [66.0, 65.97], [66.0, 68.23], [69.0, 70.02], [79.0, 79.42], [83.0, 83.34], [85.0, 84.94], [92.0, 92.91], [98.0, 98.17], [103.0, 104.75], [106.0, 119.11], [125.0, 129.98], [130.0, 131.38]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [41.72, 63.1, 0.0, 53.84, 37.34, 0.0, 30.69, 30.7, 32.14, 0.0, 0.0, 43.69, 0.0, 40.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.52, 96.89, 0.0], "audiomae_on_audioset": [[["hum", 17.11], ["mains hum", 16.89], ["music", 12.81]], null, null, null, [["sidetone", 62.83], ["hum", 12.77], ["speech", 9.22]], null, [["hum", 17.6], ["throbbing", 16.32], ["mains hum", 13.33]], [["music", 46.06], ["hum", 17.2], ["throbbing", 11.46]], [["speech", 34.67], ["music", 11.77], ["hum", 6.01]], null, null, [["speech", 75.45], ["sidetone", 6.15], ["music", 2.94]], null, [["music", 26.08], ["speech", 18.32], ["mains hum", 7.25]], null, null, null, null, null, null, null, [["crow", 40.8], ["caw", 20.29], ["hum", 7.68]], null, null], "duration": [3.53, 6.38, 0.22, 4.71, 4.41, 0.34, 2.08, 23.84, 2.01, 1.43, 0.13, 2.07, -0.03, 2.23, 1.02, 0.42, 0.34, -0.06, 0.91, 0.17, 1.75, 13.11, 4.98, 1.38]} \ No newline at end of file diff --git a/annotations_1/b65C_muXajk_filtered.json b/annotations_1/b65C_muXajk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22f6adb319647e32deb720a4f8296bf94a3ad4cc --- /dev/null +++ b/annotations_1/b65C_muXajk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.25], [28.0, 28.26], [29.0, 29.57], [38.0, 38.64], [41.0, 41.2], [42.0, 48.39], [51.0, 50.94], [52.0, 52.32], [53.0, 53.65], [55.0, 56.98], [85.0, 85.33], [86.0, 87.84], [92.0, 94.54], [97.0, 98.49], [100.0, 100.52], [102.0, 102.46], [110.0, 110.54], [114.0, 114.76], [118.0, 122.01], [123.0, 125.9], [126.0, 126.74], [128.0, 130.76], [132.0, 135.4], [136.0, 137.98], [143.0, 144.58], [146.0, 147.26], [149.0, 151.24], [152.0, 153.94], [155.0, 157.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 99.92, 0.0, 0.0, 0.0, 35.46, 0.0, 31.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.33], ["sound effect", 6.28], ["cacophony", 6.08]], null, [["hum", 24.13], ["mains hum", 24.11], ["boat, water vehicle", 5.58]]], "duration": [0.25, 0.26, 0.57, 0.64, 0.2, 6.39, -0.06, 0.32, 0.65, 1.98, 0.33, 1.84, 2.54, 1.49, 0.52, 0.46, 0.54, 0.76, 4.01, 2.9, 0.74, 2.76, 3.4, 1.98, 1.58, 1.26, 2.24, 1.94, 2.67]} \ No newline at end of file diff --git a/annotations_1/b6vOp7_rI6Q_filtered.json b/annotations_1/b6vOp7_rI6Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d352b2ad069e2da3660c9009dac04f2c8efdcc6 --- /dev/null +++ b/annotations_1/b6vOp7_rI6Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 23.87], [24.0, 27.84], [28.0, 31.43], [32.0, 34.05], [38.0, 40.98], [42.0, 44.93], [45.0, 50.7], [52.0, 60.93], [63.0, 64.57], [66.0, 66.73], [73.0, 76.17], [77.0, 77.38], [78.0, 81.13], [104.0, 104.53], [112.0, 112.75], [118.0, 119.03], [127.0, 128.28], [131.0, 132.51], [135.0, 135.85], [138.0, 138.0], [142.0, 142.91], [144.0, 145.0], [147.0, 147.31], [152.0, 153.59], [156.0, 156.32], [162.0, 162.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.83, 93.13, 80.64, 99.48, 100.0, 100.0, 83.7, 99.99, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.87, 3.84, 3.43, 2.05, 2.98, 2.93, 5.7, 8.93, 1.57, 0.73, 3.17, 0.38, 3.13, 0.53, 0.75, 1.03, 1.28, 1.51, 0.85, 0.0, 0.91, 1.0, 0.31, 1.59, 0.32, 0.87]} \ No newline at end of file diff --git a/annotations_1/b74611maYgQ_filtered.json b/annotations_1/b74611maYgQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24a45da85759cfdf102186810d3328a3d6dca39a --- /dev/null +++ b/annotations_1/b74611maYgQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.58], [25.0, 28.58], [31.0, 39.23], [42.0, 50.16], [52.0, 55.05], [55.0, 55.14], [60.0, 60.78], [63.0, 69.77], [70.0, 70.88], [74.0, 74.56], [77.0, 87.86], [93.0, 96.03], [97.0, 103.33]], "keep_status": [false, true, true, true, true, false, false, false, false, false, false, false, true], "silence_prob": [31.54, 39.74, 40.28, 29.36, 32.42, 0.0, 0.0, 33.27, 0.0, 0.0, 32.87, 31.06, 30.4], "audiomae_on_audioset": [[["speech", 55.79], ["music", 14.47], ["explosion", 4.99]], [["speech", 23.46], ["hum", 20.26], ["mains hum", 10.18]], [["speech", 43.18], ["music", 12.54], ["mains hum", 6.29]], [["electric shaver, electric razor", 15.19], ["buzz", 13.88], ["speech", 13.19]], [["music", 37.65], ["hum", 13.47], ["throbbing", 8.88]], null, null, [["music", 59.23], ["speech", 21.2], ["electronic music", 2.7]], null, null, [["music", 43.08], ["speech", 23.8], ["hum", 14.51]], [["whale vocalization", 55.31], ["speech", 7.79], ["wild animals", 7.25]], [["whale vocalization", 28.49], ["music", 12.85], ["buzz", 10.51]]], "duration": [2.58, 3.58, 8.23, 8.16, 3.05, 0.14, 0.78, 6.77, 0.88, 0.56, 10.86, 3.03, 6.33]} \ No newline at end of file diff --git a/annotations_1/b7AjNXAF-7Y_filtered.json b/annotations_1/b7AjNXAF-7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/b7AjNXAF-7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/b8Dv782UIb4_filtered.json b/annotations_1/b8Dv782UIb4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89f3d256de567514377801c0fca86b047acfab18 --- /dev/null +++ b/annotations_1/b8Dv782UIb4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [6.0, 9.78], [10.0, 10.69], [13.0, 15.25], [16.0, 17.1], [19.0, 19.77], [22.0, 22.62], [24.0, 25.93], [27.0, 27.13], [30.0, 30.42], [31.0, 37.34], [39.0, 41.86], [43.0, 44.24], [45.0, 46.63], [47.0, 58.26], [68.0, 69.79], [72.0, 72.84], [74.0, 76.71], [78.0, 78.85], [81.0, 82.68], [85.0, 85.99], [95.0, 95.05], [96.0, 96.7], [98.0, 99.93], [101.0, 103.08], [105.0, 106.19], [108.0, 108.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.48, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 52.33, 0.0, 0.0, 29.41, 0.0, 0.0, 40.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["animal", 29.09], ["grunt", 15.37], ["roaring cats (lions, tigers)", 13.47]], null, null, [["cattle, bovinae", 20.15], ["livestock, farm animals, working animals", 15.91], ["speech", 14.13]], null, null, null, null, null, null, null, null, null], "duration": [1.14, 3.78, 0.69, 2.25, 1.1, 0.77, 0.62, 1.93, 0.13, 0.42, 6.34, 2.86, 1.24, 1.63, 11.26, 1.79, 0.84, 2.71, 0.85, 1.68, 0.99, 0.05, 0.7, 1.93, 2.08, 1.19, 0.9]} \ No newline at end of file diff --git a/annotations_1/b8t5kX7k0vQ_filtered.json b/annotations_1/b8t5kX7k0vQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b4605401fba692878e7b18bad852a7e5141f070 --- /dev/null +++ b/annotations_1/b8t5kX7k0vQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.16], [5.0, 5.8]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.16, 0.8]} \ No newline at end of file diff --git a/annotations_1/b9pr0K7SuYk_filtered.json b/annotations_1/b9pr0K7SuYk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6e9fd562c558a77348be8df048df64ed0c68334 --- /dev/null +++ b/annotations_1/b9pr0K7SuYk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.12], [6.0, 6.96], [8.0, 10.49], [11.0, 12.26], [13.0, 30.0], [33.0, 39.93], [42.0, 43.8], [46.0, 47.07], [56.0, 56.02], [57.0, 57.81], [58.0, 58.92], [67.0, 67.04], [68.0, 69.25], [70.0, 70.34], [71.0, 71.93], [85.0, 84.92], [86.0, 87.0], [88.0, 88.4], [90.0, 90.32], [94.0, 101.01], [101.0, 102.39], [104.0, 104.33], [106.0, 107.47], [108.0, 108.89], [110.0, 112.08], [115.0, 138.27]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [32.25, 0.0, 64.07, 0.0, 31.85, 32.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.83, 0.0, 0.0, 0.0, 0.0, 34.7, 34.03], "audiomae_on_audioset": [[["music", 38.02], ["throbbing", 21.61], ["hum", 8.07]], null, null, null, [["music", 73.63], ["electronic music", 5.35], ["hum", 2.91]], [["music", 54.31], ["speech", 7.15], ["electronic music", 6.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 65.36], ["hum", 8.48], ["throbbing", 3.73]], null, null, null, null, [["music", 31.02], ["didgeridoo", 10.38], ["boing", 7.6]], [["music", 25.71], ["whack, thwack", 23.99], ["groan", 11.07]]], "duration": [3.12, 0.96, 2.49, 1.26, 17.0, 6.93, 1.8, 1.07, 0.02, 0.81, 0.92, 0.04, 1.25, 0.34, 0.93, -0.08, 1.0, 0.4, 0.32, 7.01, 1.39, 0.33, 1.47, 0.89, 2.08, 23.27]} \ No newline at end of file diff --git a/annotations_1/bBHFfXCAPLc_filtered.json b/annotations_1/bBHFfXCAPLc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d00dd9ba90441d7a1ff5514ea8166970767ad551 --- /dev/null +++ b/annotations_1/bBHFfXCAPLc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.87], [6.0, 16.55], [22.0, 38.1], [40.0, 43.36], [44.0, 43.82], [44.0, 44.15], [44.0, 54.77], [58.0, 61.74], [65.0, 65.2], [75.0, 75.68], [77.0, 77.5], [81.0, 82.02], [84.0, 84.18], [85.0, 85.8], [92.0, 94.9], [96.0, 100.67], [103.0, 103.42], [124.0, 124.75], [126.0, 127.79], [131.0, 131.7]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.97, 33.96, 45.78, 0.0, 0.0, 45.59, 35.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 33.63, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 53.21], ["throbbing", 21.63], ["mains hum", 16.77]], [["music", 80.53], ["cacophony", 6.08], ["vehicle", 1.24]], [["hum", 35.62], ["throbbing", 30.44], ["mains hum", 5.65]], null, null, [["sidetone", 29.65], ["speech", 24.86], ["music", 14.04]], [["hum", 18.51], ["speech", 14.58], ["music", 11.48]], null, null, null, null, null, null, null, [["music", 57.79], ["hum", 9.31], ["mains hum", 4.39]], null, null, null, null], "duration": [0.87, 10.55, 16.1, 3.36, -0.18, 0.15, 10.77, 3.74, 0.2, 0.68, 0.5, 1.02, 0.18, 0.8, 2.9, 4.67, 0.42, 0.75, 1.79, 0.7]} \ No newline at end of file diff --git a/annotations_1/bBjLUZgx4WA_filtered.json b/annotations_1/bBjLUZgx4WA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ebf28905ff90b0739fda7677d16d1cd86dafbb0 --- /dev/null +++ b/annotations_1/bBjLUZgx4WA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [6.0, 8.31], [10.0, 10.98], [13.0, 13.04], [18.0, 19.31], [20.0, 20.43], [21.0, 21.93], [24.0, 29.86], [32.0, 33.74], [35.0, 36.48], [37.0, 38.38], [41.0, 41.03], [43.0, 42.85], [45.0, 45.01], [47.0, 47.28], [50.0, 50.06], [55.0, 55.71], [57.0, 58.18], [60.0, 63.49], [70.0, 70.7], [74.0, 74.48], [75.0, 75.0], [76.0, 77.13], [78.0, 79.42], [81.0, 86.43], [90.0, 90.85], [94.0, 94.95], [98.0, 100.41], [102.0, 108.5], [111.0, 117.53], [119.0, 124.11], [125.0, 130.55], [132.0, 134.77], [139.0, 140.76], [142.0, 143.04], [144.0, 149.13], [150.0, 152.12], [154.0, 157.1], [158.0, 161.38], [164.0, 166.41], [167.0, 168.56]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 41.24, 0.0, 0.0, 0.0, 0.0, 0.0, 45.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.02, 0.0, 0.0, 0.0, 0.0, 0.0, 45.3, 0.0, 0.0, 46.9, 46.79, 45.75, 47.74, 43.98, 44.49, 0.0, 0.0, 44.43, 47.82, 45.65, 45.02, 45.21, 0.0], "audiomae_on_audioset": [null, [["speech", 48.42], ["singing bowl", 13.36], ["music", 6.48]], null, null, null, null, null, [["singing bowl", 35.16], ["music", 32.75], ["ambient music", 7.45]], null, null, null, null, null, null, null, null, null, null, [["music", 75.32], ["ambient music", 4.09], ["scary music", 1.95]], null, null, null, null, null, [["music", 47.26], ["hum", 14.24], ["electronic music", 5.01]], null, null, [["music", 38.21], ["gong", 22.28], ["electronic music", 7.89]], [["music", 54.66], ["singing bowl", 7.55], ["hiccup", 4.31]], [["music", 46.28], ["ambient music", 12.67], ["singing bowl", 8.01]], [["music", 68.59], ["scary music", 4.02], ["foghorn", 2.74]], [["music", 56.49], ["ambient music", 20.03], ["scary music", 10.82]], [["music", 70.13], ["ambient music", 13.39], ["electronic music", 3.57]], null, null, [["music", 61.37], ["ambient music", 18.28], ["synthesizer", 3.26]], [["music", 33.88], ["ambient music", 23.76], ["electronic music", 12.75]], [["music", 50.49], ["singing bowl", 14.5], ["ambient music", 5.85]], [["music", 23.33], ["speech", 18.57], ["singing bowl", 17.09]], [["music", 60.36], ["ambient music", 10.57], ["singing bowl", 6.89]], null], "duration": [0.43, 2.31, 0.98, 0.04, 1.31, 0.43, 0.93, 5.86, 1.74, 1.48, 1.38, 0.03, -0.15, 0.01, 0.28, 0.06, 0.71, 1.18, 3.49, 0.7, 0.48, 0.0, 1.13, 1.42, 5.43, 0.85, 0.95, 2.41, 6.5, 6.53, 5.11, 5.55, 2.77, 1.76, 1.04, 5.13, 2.12, 3.1, 3.38, 2.41, 1.56]} \ No newline at end of file diff --git a/annotations_1/bC0vGFJbMjo_filtered.json b/annotations_1/bC0vGFJbMjo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a456da7edb215ea88628f9d841b19b4e23efb68e --- /dev/null +++ b/annotations_1/bC0vGFJbMjo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.14], [37.0, 38.23], [44.0, 44.76], [65.0, 68.01], [75.0, 87.99], [93.0, 99.81], [103.0, 103.33], [104.0, 111.1], [117.0, 129.74], [132.0, 144.0], [145.0, 145.47], [149.0, 149.52], [150.0, 150.21], [151.0, 184.62], [185.0, 185.26]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 84.43, 30.1, 30.26, 0.0, 30.17, 30.14, 75.39, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 56.57], ["hum", 7.87], ["throbbing", 4.03]], [["music", 68.49], ["smash, crash", 8.39], ["boom", 2.67]], null, [["music", 69.74], ["electronic music", 2.51], ["throbbing", 1.44]], [["music", 72.41], ["electronic music", 4.15], ["throbbing", 3.52]], null, null, null, null, null, null], "duration": [0.14, 1.23, 0.76, 3.01, 12.99, 6.81, 0.33, 7.1, 12.74, 12.0, 0.47, 0.52, 0.21, 33.62, 0.26]} \ No newline at end of file diff --git a/annotations_1/bCLTAaa3qMM_filtered.json b/annotations_1/bCLTAaa3qMM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0756a68c0bfa0ad800bb41b011d857803715d449 --- /dev/null +++ b/annotations_1/bCLTAaa3qMM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.83], [13.0, 21.03], [21.0, 23.77], [27.0, 27.3], [28.0, 28.24], [31.0, 31.9], [34.0, 34.48], [43.0, 45.23], [47.0, 47.01], [48.0, 47.97], [49.0, 94.51], [95.0, 115.5], [118.0, 122.55], [125.0, 127.62], [129.0, 142.59], [146.0, 152.07], [160.0, 174.11], [177.0, 179.0], [180.0, 180.94]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, true, true, false, false], "silence_prob": [0.0, 38.56, 50.16, 0.0, 0.0, 0.0, 0.0, 61.47, 0.0, 0.0, 0.0, 30.48, 30.33, 30.36, 32.26, 29.3, 29.59, 37.38, 0.0], "audiomae_on_audioset": [null, [["music", 50.9], ["hum", 10.71], ["mains hum", 5.17]], null, null, null, null, null, null, null, null, null, [["music", 51.92], ["theremin", 11.6], ["synthesizer", 3.89]], [["music", 28.24], ["speech", 28.17], ["throbbing", 5.72]], [["music", 39.65], ["speech", 29.96], ["didgeridoo", 3.05]], [["music", 34.65], ["speech", 26.44], ["hum", 8.94]], [["music", 54.49], ["breaking", 6.69], ["whack, thwack", 5.84]], [["music", 33.04], ["fly, housefly", 15.0], ["hum", 7.55]], [["theremin", 60.15], ["music", 8.42], ["civil defense siren", 4.11]], null], "duration": [1.83, 8.03, 2.77, 0.3, 0.24, 0.9, 0.48, 2.23, 0.01, -0.03, 45.51, 20.5, 4.55, 2.62, 13.59, 6.07, 14.11, 2.0, 0.94]} \ No newline at end of file diff --git a/annotations_1/bCOc7VCSox4_filtered.json b/annotations_1/bCOc7VCSox4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3fb56b1aa8ca5330794a2e94631e28f49b21fa5 --- /dev/null +++ b/annotations_1/bCOc7VCSox4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.29], [5.0, 5.27], [7.0, 7.21], [8.0, 13.41], [21.0, 26.55], [34.0, 39.73], [41.0, 41.79], [45.0, 45.44], [47.0, 47.38], [49.0, 50.3], [52.0, 55.97], [57.0, 59.81], [67.0, 85.83], [87.0, 98.22], [108.0, 111.32], [123.0, 128.76], [134.0, 136.53], [137.0, 143.94], [145.0, 145.22], [146.0, 146.53], [149.0, 149.89], [153.0, 153.84]], "keep_status": [true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false], "silence_prob": [45.11, 0.0, 0.0, 41.48, 35.57, 43.08, 0.0, 0.0, 0.0, 0.0, 33.17, 31.82, 32.32, 89.9, 85.54, 39.91, 43.66, 45.62, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 27.24], ["music", 14.07], ["whale vocalization", 9.76]], null, null, [["music", 53.84], ["theremin", 8.07], ["thunk", 7.25]], [["music", 67.36], ["theremin", 10.95], ["carnatic music", 4.05]], [["music", 69.63], ["carnatic music", 6.34], ["theremin", 4.57]], null, null, null, null, [["music", 50.9], ["boing", 21.64], ["theremin", 7.72]], [["music", 60.65], ["theremin", 14.13], ["foghorn", 8.21]], [["music", 83.11], ["didgeridoo", 3.94], ["musical instrument", 2.13]], null, null, [["whimper", 22.97], ["groan", 14.83], ["male singing", 12.84]], [["a capella", 23.22], ["male singing", 15.1], ["music", 8.88]], [["humming", 32.11], ["howl", 9.48], ["frog", 7.58]], null, null, null, null], "duration": [2.29, 0.27, 0.21, 5.41, 5.55, 5.73, 0.79, 0.44, 0.38, 1.3, 3.97, 2.81, 18.83, 11.22, 3.32, 5.76, 2.53, 6.94, 0.22, 0.53, 0.89, 0.84]} \ No newline at end of file diff --git a/annotations_1/bCYs8v0Xji4_filtered.json b/annotations_1/bCYs8v0Xji4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..376cf794380600852c702b0b0e78c1febac98246 --- /dev/null +++ b/annotations_1/bCYs8v0Xji4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [6.0, 6.86], [9.0, 11.1], [15.0, 19.23], [20.0, 21.17], [26.0, 26.42], [27.0, 31.83], [34.0, 33.91], [35.0, 35.83], [40.0, 40.95], [44.0, 46.03], [52.0, 52.44], [56.0, 56.84], [59.0, 58.99], [60.0, 60.76], [62.0, 62.95], [64.0, 64.47], [65.0, 65.38], [69.0, 72.54], [75.0, 75.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 94.95, 70.44, 0.0, 0.0, 51.77, 0.0, 0.0, 0.0, 39.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["sine wave", 49.94], ["speech", 25.88], ["chirp tone", 6.31]], null, null, null, null, null, null, null, [["whack, thwack", 16.44], ["speech", 12.67], ["tuning fork", 9.3]], null], "duration": [0.75, 0.86, 2.1, 4.23, 1.17, 0.42, 4.83, -0.09, 0.83, 0.95, 2.03, 0.44, 0.84, -0.01, 0.76, 0.95, 0.47, 0.38, 3.54, 0.14]} \ No newline at end of file diff --git a/annotations_1/bCZRAcsuRgY_filtered.json b/annotations_1/bCZRAcsuRgY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7102a6478a2e60fbb7b3c6ecd7c205852c6bc795 --- /dev/null +++ b/annotations_1/bCZRAcsuRgY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.01], [22.0, 23.84], [35.0, 34.75], [35.0, 38.45], [42.0, 51.14], [54.0, 58.92], [66.0, 70.04], [80.0, 82.27], [91.0, 95.39], [106.0, 106.34], [109.0, 109.53], [113.0, 113.97], [122.0, 125.61], [129.0, 129.95], [132.0, 131.65], [132.0, 131.68], [132.0, 138.5], [145.0, 149.25], [155.0, 154.87], [157.0, 159.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.85, 34.83, 33.8, 37.3, 38.45, 33.78, 0.0, 0.0, 0.0, 37.83, 0.0, 0.0, 0.0, 33.88, 36.14, 0.0, 36.01], "audiomae_on_audioset": [null, null, null, [["music", 65.3], ["reggae", 7.19], ["yodeling", 1.99]], [["music", 84.2], ["reggae", 2.38], ["singing", 0.99]], [["music", 74.52], ["reggae", 8.97], ["singing", 1.74]], [["music", 74.59], ["synthesizer", 3.97], ["electronic music", 3.55]], [["music", 55.23], ["throbbing", 18.07], ["synthesizer", 5.45]], [["music", 73.28], ["song", 1.53], ["singing", 1.42]], null, null, null, [["music", 72.41], ["throbbing", 4.0], ["electronic music", 2.38]], null, null, null, [["music", 77.71], ["reggae", 6.99], ["singing", 1.31]], [["music", 54.17], ["musical instrument", 3.16], ["cello", 2.79]], null, [["music", 69.07], ["didgeridoo", 3.55], ["musical instrument", 2.81]]], "duration": [0.01, 1.84, -0.25, 3.45, 9.14, 4.92, 4.04, 2.27, 4.39, 0.34, 0.53, 0.97, 3.61, 0.95, -0.35, -0.32, 6.5, 4.25, -0.13, 2.63]} \ No newline at end of file diff --git a/annotations_1/bD8bl3omDIU_filtered.json b/annotations_1/bD8bl3omDIU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cff21cf33898854bac77a00139f318039e89183 --- /dev/null +++ b/annotations_1/bD8bl3omDIU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 49.47], [53.0, 54.82], [58.0, 60.62], [65.0, 66.85], [70.0, 73.11], [77.0, 79.15], [85.0, 85.56], [91.0, 91.84], [97.0, 97.87], [103.0, 104.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 74.6, 0.0, 42.0, 30.58, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 71.63], ["theremin", 7.81], ["humming", 1.83]], [["music", 82.4], ["carnatic music", 3.55], ["musical instrument", 2.17]], null, null, null, null], "duration": [47.47, 1.82, 2.62, 1.85, 3.11, 2.15, 0.56, 0.84, 0.87, 1.72]} \ No newline at end of file diff --git a/annotations_1/bD8jQGwyuBU_filtered.json b/annotations_1/bD8jQGwyuBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d9a4f235017ab46dcf2bfcc67d4d509f632ad7f --- /dev/null +++ b/annotations_1/bD8jQGwyuBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [8.0, 8.88], [9.0, 12.66], [15.0, 15.42], [17.0, 18.13], [20.0, 20.41], [24.0, 28.31], [33.0, 39.92], [42.0, 43.02], [44.0, 47.21], [50.0, 52.15], [81.0, 83.93], [87.0, 88.6], [90.0, 93.29], [96.0, 96.94], [98.0, 99.12], [101.0, 102.29], [103.0, 108.45], [112.0, 115.1], [116.0, 135.48], [139.0, 143.07], [145.0, 147.33], [152.0, 154.41], [156.0, 156.57], [158.0, 158.65], [161.0, 161.22], [167.0, 167.59], [169.0, 168.76]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, true, false, true, false, false, false, false, true, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.53, 0.0, 0.0, 0.0, 32.49, 31.2, 0.0, 48.27, 93.29, 49.87, 0.0, 36.78, 0.0, 0.0, 0.0, 36.7, 45.72, 34.48, 35.52, 43.05, 52.1, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["laughter", 18.1], ["snicker", 14.39], ["speech", 13.05]], [["boing", 46.9], ["speech", 11.06], ["echo", 8.17]], null, [["throbbing", 43.7], ["music", 21.81], ["hum", 5.39]], null, [["hum", 32.7], ["throbbing", 17.84], ["knock", 10.18]], null, [["music", 27.55], ["throbbing", 11.12], ["hum", 6.07]], null, null, null, [["speech", 45.43], ["sidetone", 35.83], ["radio", 2.94]], [["speech", 14.02], ["animal", 4.63], ["dog", 4.01]], [["music", 41.27], ["effects unit", 6.38], ["musical instrument", 5.51]], [["speech", 13.63], ["cattle, bovinae", 12.36], ["moo", 10.25]], [["cattle, bovinae", 41.69], ["moo", 39.65], ["livestock, farm animals, working animals", 12.25]], null, null, null, null, null, null], "duration": [0.13, 0.88, 3.66, 0.42, 1.13, 0.41, 4.31, 6.92, 1.02, 3.21, 2.15, 2.93, 1.6, 3.29, 0.94, 1.12, 1.29, 5.45, 3.1, 19.48, 4.07, 2.33, 2.41, 0.57, 0.65, 0.22, 0.59, -0.24]} \ No newline at end of file diff --git a/annotations_1/bDW3OVitFE8_filtered.json b/annotations_1/bDW3OVitFE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9e54f99d9c49aca7229816299c1799ac1316113 --- /dev/null +++ b/annotations_1/bDW3OVitFE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.94], [5.0, 5.53], [6.0, 7.33], [18.0, 18.42], [19.0, 19.75], [22.0, 21.69], [23.0, 24.06], [26.0, 26.65], [29.0, 29.64], [31.0, 32.22], [33.0, 34.08], [35.0, 35.09], [42.0, 42.42], [46.0, 46.45], [47.0, 48.05], [49.0, 49.67], [52.0, 53.08], [55.0, 55.41], [56.0, 58.58], [62.0, 62.67], [67.0, 67.98], [68.0, 74.41], [75.0, 76.03], [78.0, 78.31], [80.0, 82.86], [83.0, 83.96], [85.0, 88.13], [89.0, 92.92], [94.0, 94.54], [97.0, 105.65], [106.0, 111.96], [115.0, 124.5], [125.0, 129.47], [130.0, 132.49], [133.0, 133.64], [134.0, 135.4], [136.0, 139.46], [142.0, 142.47], [146.0, 147.46], [149.0, 149.13], [150.0, 151.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.68, 0.0, 0.0, 63.53, 0.0, 0.0, 54.3, 0.0, 100.0, 99.8, 0.0, 99.21, 68.41, 73.97, 83.88, 99.26, 0.0, 0.0, 87.92, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.94, 0.53, 1.33, 0.42, 0.75, -0.31, 1.06, 0.65, 0.64, 1.22, 1.08, 0.09, 0.42, 0.45, 1.05, 0.67, 1.08, 0.41, 2.58, 0.67, 0.98, 6.41, 1.03, 0.31, 2.86, 0.96, 3.13, 3.92, 0.54, 8.65, 5.96, 9.5, 4.47, 2.49, 0.64, 1.4, 3.46, 0.47, 1.46, 0.13, 1.55]} \ No newline at end of file diff --git a/annotations_1/bDcFILIfHU4_filtered.json b/annotations_1/bDcFILIfHU4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6dcc594e5db269a6686915a8fdb90df78663195c --- /dev/null +++ b/annotations_1/bDcFILIfHU4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 19.38], [24.0, 24.48], [25.0, 26.4], [36.0, 36.73], [37.0, 38.65], [43.0, 45.17], [45.0, 46.33], [49.0, 48.91], [49.0, 49.65], [55.0, 55.98], [61.0, 61.21], [62.0, 64.34], [65.0, 67.85], [78.0, 79.39], [80.0, 80.74], [82.0, 82.48], [86.0, 88.84], [90.0, 90.41], [91.0, 91.17], [96.0, 96.65], [97.0, 99.03], [100.0, 100.9], [104.0, 106.49], [107.0, 110.19], [111.0, 118.93], [119.0, 122.55], [123.0, 124.92], [128.0, 129.66], [131.0, 133.34], [134.0, 136.09], [137.0, 139.19], [140.0, 141.4], [149.0, 149.57], [156.0, 159.75], [160.0, 160.47], [161.0, 163.07], [164.0, 168.03]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [45.14, 0.0, 0.0, 0.0, 0.0, 52.62, 0.0, 0.0, 0.0, 0.0, 0.0, 36.01, 89.54, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 0.0, 44.15, 0.0, 85.17, 68.41, 80.46, 57.89, 0.0, 0.0, 54.76, 72.46, 59.86, 0.0, 0.0, 37.5, 0.0, 64.41, 60.89], "audiomae_on_audioset": [[["speech", 32.14], ["music", 12.75], ["livestock, farm animals, working animals", 11.07]], null, null, null, null, null, null, null, null, null, null, [["speech", 45.62], ["sine wave", 16.63], ["busy signal", 12.34]], null, null, null, null, null, null, null, null, [["music", 28.45], ["speech", 16.27], ["sonar", 11.58]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.03], ["fly, housefly", 12.58], ["insect", 9.96]], null, null, null], "duration": [5.38, 0.48, 1.4, 0.73, 1.65, 2.17, 1.33, -0.09, 0.65, 0.98, 0.21, 2.34, 2.85, 1.39, 0.74, 0.48, 2.84, 0.41, 0.17, 0.65, 2.03, 0.9, 2.49, 3.19, 7.93, 3.55, 1.92, 1.66, 2.34, 2.09, 2.19, 1.4, 0.57, 3.75, 0.47, 2.07, 4.03]} \ No newline at end of file diff --git a/annotations_1/bEBQWhgGM1g_filtered.json b/annotations_1/bEBQWhgGM1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3066291316a614474469bf3a2a8bc2931c642b64 --- /dev/null +++ b/annotations_1/bEBQWhgGM1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[88.0, 97.88], [98.0, 97.97], [98.0, 117.27]], "keep_status": [false, false, true], "silence_prob": [95.78, 0.0, 49.64], "audiomae_on_audioset": [null, null, [["hum", 21.26], ["whale vocalization", 16.98], ["rumble", 14.6]]], "duration": [9.88, -0.03, 19.27]} \ No newline at end of file diff --git a/annotations_1/bEpL6Mt_jrk_filtered.json b/annotations_1/bEpL6Mt_jrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0cbbbc2ee9e71e60d3bc8c737237d1053c49881 --- /dev/null +++ b/annotations_1/bEpL6Mt_jrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.6], [5.0, 4.92], [14.0, 14.74], [20.0, 32.0], [35.0, 38.03], [39.0, 40.71], [44.0, 44.83], [47.0, 47.44], [48.0, 49.74], [56.0, 58.35], [60.0, 61.97], [65.0, 65.26], [69.0, 69.55], [76.0, 77.67], [80.0, 81.87], [94.0, 95.27], [96.0, 98.02], [100.0, 108.89], [110.0, 116.87], [118.0, 118.89], [120.0, 127.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.95, 99.95, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 97.54, 99.84, 0.0, 99.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.6, -0.08, 0.74, 12.0, 3.03, 1.71, 0.83, 0.44, 1.74, 2.35, 1.97, 0.26, 0.55, 1.67, 1.87, 1.27, 2.02, 8.89, 6.87, 0.89, 7.72]} \ No newline at end of file diff --git a/annotations_1/bFfnDQ3bDfA_filtered.json b/annotations_1/bFfnDQ3bDfA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea6c5a6da264a42949f257af065cfa9afc393935 --- /dev/null +++ b/annotations_1/bFfnDQ3bDfA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.48], [7.0, 7.32], [9.0, 9.76], [10.0, 11.6], [13.0, 12.6], [13.0, 13.93], [18.0, 18.49], [25.0, 26.42], [31.0, 31.21], [37.0, 38.47], [42.0, 42.2], [45.0, 45.49], [48.0, 47.7], [49.0, 49.52], [52.0, 53.35], [56.0, 56.57], [59.0, 60.0], [60.0, 61.43], [63.0, 63.26], [64.0, 64.88], [72.0, 71.78], [76.0, 76.2], [85.0, 85.02], [87.0, 87.86], [91.0, 91.64], [97.0, 97.92], [98.0, 99.3], [105.0, 104.77], [105.0, 105.58], [109.0, 109.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.32, 0.76, 1.6, -0.4, 0.93, 0.49, 1.42, 0.21, 1.47, 0.2, 0.49, -0.3, 0.52, 1.35, 0.57, 1.0, 1.43, 0.26, 0.88, -0.22, 0.2, 0.02, 0.86, 0.64, 0.92, 1.3, -0.23, 0.58, 0.51]} \ No newline at end of file diff --git a/annotations_1/bGXeYGkiQDo_filtered.json b/annotations_1/bGXeYGkiQDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c239cb13234d0e820eba8d48858b07d78fb85d9 --- /dev/null +++ b/annotations_1/bGXeYGkiQDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.25], [21.0, 23.13], [24.0, 25.27], [26.0, 30.67], [31.0, 31.87], [32.0, 33.86], [36.0, 38.74], [40.0, 40.54], [42.0, 41.99], [43.0, 43.9], [46.0, 46.6], [47.0, 48.07], [50.0, 50.35], [51.0, 51.63], [61.0, 61.42], [67.0, 68.2], [73.0, 73.35], [75.0, 75.2], [76.0, 77.79], [79.0, 79.79], [86.0, 85.97], [89.0, 89.33], [94.0, 94.61], [95.0, 95.91], [99.0, 99.27], [102.0, 102.39], [106.0, 106.14], [108.0, 108.09], [110.0, 110.37], [113.0, 115.38], [117.0, 117.51], [122.0, 121.98], [124.0, 125.85], [127.0, 127.38], [129.0, 129.46], [131.0, 131.21], [133.0, 133.3], [137.0, 137.25], [142.0, 142.06], [154.0, 154.75], [160.0, 161.4], [162.0, 161.91], [164.0, 163.97], [174.0, 173.97]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.9, 0.0, 88.28, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 49.07], ["hum", 10.39], ["sine wave", 7.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 42.11], ["sidetone", 13.16], ["throbbing", 10.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 2.13, 1.27, 4.67, 0.87, 1.86, 2.74, 0.54, -0.01, 0.9, 0.6, 1.07, 0.35, 0.63, 0.42, 1.2, 0.35, 0.2, 1.79, 0.79, -0.03, 0.33, 0.61, 0.91, 0.27, 0.39, 0.14, 0.09, 0.37, 2.38, 0.51, -0.02, 1.85, 0.38, 0.46, 0.21, 0.3, 0.25, 0.06, 0.75, 1.4, -0.09, -0.03, -0.03]} \ No newline at end of file diff --git a/annotations_1/bHW5h5O-e5I_filtered.json b/annotations_1/bHW5h5O-e5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fbabd1f0b6e36808a8911a2493ef234bca41e90 --- /dev/null +++ b/annotations_1/bHW5h5O-e5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.88], [8.0, 8.26], [9.0, 9.09], [12.0, 15.18], [19.0, 19.16], [21.0, 22.05], [28.0, 28.65], [30.0, 30.37], [31.0, 31.38], [36.0, 37.94], [39.0, 39.73], [41.0, 42.47], [44.0, 46.62], [49.0, 49.84], [54.0, 57.6], [60.0, 60.51], [64.0, 66.21], [69.0, 69.75], [71.0, 71.71], [72.0, 72.99], [76.0, 76.28], [78.0, 78.61], [82.0, 82.46], [88.0, 88.33], [89.0, 89.9], [94.0, 94.44], [103.0, 102.96], [104.0, 103.99], [105.0, 105.34], [107.0, 107.15], [108.0, 110.67], [114.0, 114.22], [116.0, 116.06], [121.0, 121.8], [122.0, 122.66], [125.0, 124.97], [127.0, 127.2], [128.0, 129.74], [134.0, 134.96], [140.0, 140.53], [142.0, 145.69], [147.0, 148.69], [150.0, 151.85], [156.0, 156.57], [157.0, 157.35], [159.0, 159.19], [162.0, 161.97], [164.0, 164.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 99.98, 0.0, 76.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.26, 0.09, 3.18, 0.16, 1.05, 0.65, 0.37, 0.38, 1.94, 0.73, 1.47, 2.62, 0.84, 3.6, 0.51, 2.21, 0.75, 0.71, 0.99, 0.28, 0.61, 0.46, 0.33, 0.9, 0.44, -0.04, -0.01, 0.34, 0.15, 2.67, 0.22, 0.06, 0.8, 0.66, -0.03, 0.2, 1.74, 0.96, 0.53, 3.69, 1.69, 1.85, 0.57, 0.35, 0.19, -0.03, 0.78]} \ No newline at end of file diff --git a/annotations_1/bICHpdNbsmU_filtered.json b/annotations_1/bICHpdNbsmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ac589aab51791a83cd611c662e2080b25ddb49e --- /dev/null +++ b/annotations_1/bICHpdNbsmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.28], [9.0, 11.08], [15.0, 18.66], [20.0, 38.37], [40.0, 40.61], [43.0, 49.0], [52.0, 64.81], [66.0, 66.83]], "keep_status": [false, false, false, false, false, true, true, false], "silence_prob": [0.0, 92.97, 99.73, 92.8, 0.0, 32.79, 31.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 23.21], ["music", 19.57], ["coin (dropping)", 9.18]], [["music", 28.32], ["clang", 10.04], ["throbbing", 7.84]], null], "duration": [1.28, 2.08, 3.66, 18.37, 0.61, 6.0, 12.81, 0.83]} \ No newline at end of file diff --git a/annotations_1/bIfMAhK7Boo_filtered.json b/annotations_1/bIfMAhK7Boo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de63469bdafd97215c86c35652e0e4bc76435086 --- /dev/null +++ b/annotations_1/bIfMAhK7Boo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.7], [15.0, 19.43], [22.0, 24.53], [25.0, 26.18], [28.0, 29.24], [35.0, 36.21], [40.0, 41.52], [43.0, 44.47], [47.0, 48.61], [51.0, 56.49], [58.0, 58.55], [60.0, 61.52], [63.0, 64.2], [67.0, 73.89], [76.0, 78.6], [81.0, 86.78], [92.0, 95.94], [97.0, 111.03], [114.0, 115.55], [117.0, 117.76], [120.0, 120.99], [122.0, 127.18], [128.0, 139.06], [140.0, 170.31], [173.0, 173.23], [180.0, 180.32], [183.0, 186.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 63.42, 64.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 0.0, 62.78, 48.61, 31.78, 31.11, 33.04, 0.0, 0.0, 0.0, 38.31, 71.57, 0.0, 0.0, 0.0, 74.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.49], ["music", 8.85], ["hum", 6.44]], [["fly, housefly", 40.37], ["mosquito", 25.05], ["insect", 24.55]], [["fly, housefly", 36.61], ["mosquito", 29.16], ["insect", 20.48]], [["music", 39.61], ["speech", 35.28], ["breaking", 4.56]], null, null, null, [["breaking", 50.63], ["music", 21.42], ["speech", 10.16]], null, null, null, null, null], "duration": [0.7, 4.43, 2.53, 1.18, 1.24, 1.21, 1.52, 1.47, 1.61, 5.49, 0.55, 1.52, 1.2, 6.89, 2.6, 5.78, 3.94, 14.03, 1.55, 0.76, 0.99, 5.18, 11.06, 30.31, 0.23, 0.32, 3.63]} \ No newline at end of file diff --git a/annotations_1/bIpQoVucszI_filtered.json b/annotations_1/bIpQoVucszI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2d69c5bc808bc7ddd60b89688d7b1fdd830abf5 --- /dev/null +++ b/annotations_1/bIpQoVucszI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.0], [3.0, 3.18], [5.0, 5.29], [11.0, 11.91], [14.0, 14.94], [16.0, 16.55], [17.0, 22.32], [24.0, 28.26], [35.0, 36.04], [37.0, 37.76], [40.0, 40.59], [42.0, 41.82], [43.0, 44.39], [47.0, 46.94], [47.0, 47.34], [47.0, 47.46], [48.0, 48.41], [51.0, 57.28], [60.0, 61.38], [62.0, 70.46], [71.0, 79.25], [86.0, 86.7], [88.0, 88.45], [91.0, 95.0], [103.0, 104.5], [106.0, 106.78], [107.0, 112.5], [117.0, 116.7], [118.0, 118.3], [119.0, 120.56], [123.0, 123.38], [124.0, 129.57], [131.0, 131.73], [136.0, 143.95], [146.0, 146.42], [148.0, 152.05], [154.0, 154.89], [155.0, 157.35]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, true, false, false, false, false, false, false, false, true, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.14, 32.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.21, 0.0, 38.43, 34.92, 0.0, 0.0, 39.25, 0.0, 0.0, 30.37, 0.0, 0.0, 0.0, 0.0, 33.08, 0.0, 35.09, 0.0, 31.56, 0.0, 33.16], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 20.95], ["moo", 18.16], ["music", 17.06]], [["fly, housefly", 26.07], ["mosquito", 21.59], ["insect", 16.15]], null, null, null, null, null, null, null, null, null, [["music", 28.66], ["speech", 15.1], ["throbbing", 13.97]], null, [["music", 16.27], ["moo", 10.23], ["speech", 10.03]], [["music", 16.18], ["speech", 15.22], ["livestock, farm animals, working animals", 14.52]], null, null, [["speech", 17.94], ["music", 10.23], ["fly, housefly", 8.58]], null, null, [["speech", 35.84], ["music", 28.9], ["sheep", 6.61]], null, null, null, null, [["cattle, bovinae", 22.46], ["moo", 17.92], ["livestock, farm animals, working animals", 16.0]], null, [["music", 58.62], ["speech", 5.03], ["throbbing", 5.0]], null, [["music", 29.55], ["speech", 27.85], ["crowd", 2.51]], null, [["music", 28.5], ["didgeridoo", 15.26], ["speech", 11.37]]], "duration": [1.0, 0.18, 0.29, 0.91, 0.94, 0.55, 5.32, 4.26, 1.04, 0.76, 0.59, -0.18, 1.39, -0.06, 0.34, 0.46, 0.41, 6.28, 1.38, 8.46, 8.25, 0.7, 0.45, 4.0, 1.5, 0.78, 5.5, -0.3, 0.3, 1.56, 0.38, 5.57, 0.73, 7.95, 0.42, 4.05, 0.89, 2.35]} \ No newline at end of file diff --git a/annotations_1/bJSDrRcwwKQ_filtered.json b/annotations_1/bJSDrRcwwKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98985787402640b1f76950182bc0643dcb16abbd --- /dev/null +++ b/annotations_1/bJSDrRcwwKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 27.6], [29.0, 29.91], [33.0, 34.21], [35.0, 37.72], [45.0, 47.34], [51.0, 53.2], [55.0, 57.2], [59.0, 62.55], [64.0, 64.84], [77.0, 82.66], [83.0, 88.47], [93.0, 94.44], [102.0, 107.72], [110.0, 110.44], [111.0, 111.86], [113.0, 123.53], [124.0, 126.03], [127.0, 129.86], [136.0, 136.97], [137.0, 138.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false, false], "silence_prob": [55.6, 0.0, 0.0, 53.84, 87.92, 48.02, 78.04, 81.17, 0.0, 88.28, 51.28, 0.0, 35.12, 0.0, 0.0, 36.55, 39.46, 45.18, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 30.41], ["music", 28.14], ["singing bowl", 19.12]], null, null, null, null, null, null, [["breaking", 40.87], ["music", 12.86], ["glass", 11.46]], null, null, [["music", 21.42], ["livestock, farm animals, working animals", 13.73], ["insect", 13.35]], [["frog", 57.51], ["croak", 11.63], ["whale vocalization", 10.43]], [["music", 36.71], ["speech", 14.57], ["singing bowl", 8.65]], null, null], "duration": [2.6, 0.91, 1.21, 2.72, 2.34, 2.2, 2.2, 3.55, 0.84, 5.66, 5.47, 1.44, 5.72, 0.44, 0.86, 10.53, 2.03, 2.86, 0.97, 1.21]} \ No newline at end of file diff --git a/annotations_1/bKbZTFrWing_filtered.json b/annotations_1/bKbZTFrWing_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..280c9c3f2effccc5cfa70de13a7534ca07576f1b --- /dev/null +++ b/annotations_1/bKbZTFrWing_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.04], [7.0, 8.63], [9.0, 10.99], [11.0, 12.88], [14.0, 18.89], [21.0, 23.23], [24.0, 26.23], [29.0, 29.47], [31.0, 32.24], [34.0, 34.91], [36.0, 41.94], [44.0, 45.27], [47.0, 48.63], [49.0, 50.43], [51.0, 51.88], [53.0, 52.91], [53.0, 54.58], [55.0, 56.1], [57.0, 57.74], [59.0, 60.71], [66.0, 67.1], [70.0, 71.17], [72.0, 72.49], [74.0, 74.6], [80.0, 81.01], [90.0, 101.33], [102.0, 103.45], [104.0, 105.29], [106.0, 109.76], [115.0, 125.24], [126.0, 126.42], [127.0, 128.14], [129.0, 130.15], [131.0, 133.44], [136.0, 143.72], [146.0, 151.36], [153.0, 162.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [99.98, 0.0, 0.0, 0.0, 92.8, 95.78, 99.76, 0.0, 0.0, 0.0, 88.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.26, 0.0, 0.0, 95.09, 92.8, 0.0, 0.0, 0.0, 90.25, 39.01, 40.06, 35.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.29], ["theremin", 4.5], ["vehicle", 2.25]], null, null, null, null, null, null, null, null, [["heart sounds, heartbeat", 19.62], ["speech", 18.1], ["sneeze", 13.04]], [["music", 52.97], ["speech", 6.72], ["grunt", 4.34]], [["speech", 22.78], ["music", 21.39], ["fly, housefly", 4.96]]], "duration": [3.04, 1.63, 1.99, 1.88, 4.89, 2.23, 2.23, 0.47, 1.24, 0.91, 5.94, 1.27, 1.63, 1.43, 0.88, -0.09, 1.58, 1.1, 0.74, 1.71, 1.1, 1.17, 0.49, 0.6, 1.01, 11.33, 1.45, 1.29, 3.76, 10.24, 0.42, 1.14, 1.15, 2.44, 7.72, 5.36, 9.51]} \ No newline at end of file diff --git a/annotations_1/bLX_zt_MhW0_filtered.json b/annotations_1/bLX_zt_MhW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17034cb9cf0f1a79fa066fc381464b57815b69c2 --- /dev/null +++ b/annotations_1/bLX_zt_MhW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 42.52], [45.0, 70.44], [71.0, 130.82], [134.0, 139.82], [143.0, 142.55], [143.0, 143.63], [144.0, 148.39], [151.0, 152.95], [157.0, 180.99], [185.0, 185.33]], "keep_status": [true, true, false, false, false, false, false, false, false, false], "silence_prob": [44.99, 36.7, 0.0, 40.9, 0.0, 0.0, 53.72, 0.0, 39.72, 0.0], "audiomae_on_audioset": [[["music", 31.53], ["whale vocalization", 21.33], ["livestock, farm animals, working animals", 6.22]], [["music", 27.46], ["whale vocalization", 17.08], ["buzz", 10.69]], null, [["radio", 39.89], ["speech", 27.73], ["noise", 17.33]], null, null, null, null, [["speech", 64.83], ["music", 13.78], ["radio", 10.02]], null], "duration": [21.52, 25.44, 59.82, 5.82, -0.45, 0.63, 4.39, 1.95, 23.99, 0.33]} \ No newline at end of file diff --git a/annotations_1/bLqJo78X3OI_filtered.json b/annotations_1/bLqJo78X3OI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ec81f03f64fb6722d8f6819bdc0e0e232fadcc2 --- /dev/null +++ b/annotations_1/bLqJo78X3OI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 85.65], [88.0, 90.81], [92.0, 140.97], [143.0, 151.82]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 32.97, 0.0, 30.95], "audiomae_on_audioset": [null, [["music", 42.97], ["trombone", 14.5], ["brass instrument", 11.24]], null, [["music", 34.88], ["whip", 31.41], ["foghorn", 10.0]]], "duration": [77.65, 2.81, 48.97, 8.82]} \ No newline at end of file diff --git a/annotations_1/bMjYOV8VnYk_filtered.json b/annotations_1/bMjYOV8VnYk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41534e460d29ecd41939aa34a9c35ad7d2def605 --- /dev/null +++ b/annotations_1/bMjYOV8VnYk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 26.23], [28.0, 104.67], [111.0, 124.61], [125.0, 125.96], [128.0, 128.6]], "keep_status": [true, false, true, false, false], "silence_prob": [30.09, 0.0, 30.21, 0.0, 0.0], "audiomae_on_audioset": [[["didgeridoo", 27.31], ["music", 20.13], ["speech", 16.34]], null, [["music", 27.87], ["hum", 14.72], ["throbbing", 13.37]], null, null], "duration": [2.23, 76.67, 13.61, 0.96, 0.6]} \ No newline at end of file diff --git a/annotations_1/bN1E4vf9FlM_filtered.json b/annotations_1/bN1E4vf9FlM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9469f5c2d3fd7bd0ee28911cbbf2c2f6dae360d9 --- /dev/null +++ b/annotations_1/bN1E4vf9FlM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 155.51]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [146.51]} \ No newline at end of file diff --git a/annotations_1/bNFWITNVAKU_filtered.json b/annotations_1/bNFWITNVAKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bca93a8b0822ab4cda56c754f0c30102094fda44 --- /dev/null +++ b/annotations_1/bNFWITNVAKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.03], [11.0, 28.32], [28.0, 31.19], [32.0, 106.88], [109.0, 110.17], [113.0, 128.02]], "keep_status": [false, false, true, false, false, true], "silence_prob": [0.0, 31.15, 31.88, 0.0, 0.0, 31.25], "audiomae_on_audioset": [null, [["music", 36.98], ["hum", 36.43], ["mains hum", 6.64]], [["whale vocalization", 33.72], ["insect", 9.11], ["fly, housefly", 5.31]], null, null, [["speech", 25.39], ["music", 18.0], ["hum", 15.07]]], "duration": [1.03, 17.32, 3.19, 74.88, 1.17, 15.02]} \ No newline at end of file diff --git a/annotations_1/bNiztacMAJ0_filtered.json b/annotations_1/bNiztacMAJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4156c3be1c70197970d59bb77d33a85ef0e97c11 --- /dev/null +++ b/annotations_1/bNiztacMAJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 28.19], [31.0, 31.67], [32.0, 32.98], [37.0, 38.8], [40.0, 41.45], [43.0, 43.04], [48.0, 51.0], [59.0, 59.76], [61.0, 61.48], [62.0, 64.13], [68.0, 74.16], [75.0, 79.34], [84.0, 95.57], [97.0, 98.71], [101.0, 104.87], [105.0, 107.87], [110.0, 110.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0, 0.0, 85.72, 96.17, 99.91, 99.73, 0.0, 93.13, 65.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.19, 0.67, 0.98, 1.8, 1.45, 0.04, 3.0, 0.76, 0.48, 2.13, 6.16, 4.34, 11.57, 1.71, 3.87, 2.87, 0.35]} \ No newline at end of file diff --git a/annotations_1/bOP-THNe4m8_filtered.json b/annotations_1/bOP-THNe4m8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ac06c36e8aa7088e88e8ec2293e711fc56e50e3 --- /dev/null +++ b/annotations_1/bOP-THNe4m8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.87], [10.0, 9.85], [10.0, 36.56], [39.0, 73.53], [76.0, 78.49], [79.0, 81.92], [83.0, 86.12], [87.0, 88.2], [90.0, 160.34]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 29.64, 0.0, 33.0, 30.99, 31.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 45.38], ["mains hum", 20.71], ["buzz", 9.53]], null, [["hum", 31.54], ["mains hum", 29.11], ["throbbing", 18.14]], [["mains hum", 22.51], ["hum", 20.76], ["music", 14.06]], [["mains hum", 46.2], ["hum", 18.75], ["music", 8.67]], null, null], "duration": [-0.13, -0.15, 26.56, 34.53, 2.49, 2.92, 3.12, 1.2, 70.34]} \ No newline at end of file diff --git a/annotations_1/bPH152eXEfU_filtered.json b/annotations_1/bPH152eXEfU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0b0d430ebfd9628de60defbc020f341d211083c --- /dev/null +++ b/annotations_1/bPH152eXEfU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.85], [7.0, 15.94], [18.0, 18.5], [19.0, 21.63], [24.0, 27.01], [28.0, 29.78], [35.0, 39.26], [41.0, 41.81], [43.0, 45.15], [46.0, 47.8], [50.0, 53.25], [55.0, 56.42], [60.0, 61.03], [64.0, 66.01], [66.0, 67.42], [70.0, 70.34], [76.0, 77.53], [79.0, 81.67], [84.0, 90.34], [91.0, 94.24], [95.0, 95.96], [96.0, 96.5], [97.0, 97.82], [98.0, 105.21], [107.0, 108.62], [111.0, 111.72], [113.0, 113.27], [113.0, 113.44], [114.0, 122.13], [124.0, 125.86], [127.0, 128.19], [129.0, 130.62], [132.0, 137.59], [138.0, 142.38]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [62.47, 94.52, 0.0, 99.68, 66.27, 0.0, 90.95, 0.0, 46.47, 0.0, 75.23, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 99.98, 85.72, 79.07, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0, 0.0, 64.86, 96.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["busy signal", 20.85], ["frog", 11.79], ["sine wave", 7.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.85, 8.94, 0.5, 2.63, 3.01, 1.78, 4.26, 0.81, 2.15, 1.8, 3.25, 1.42, 1.03, 2.01, 1.42, 0.34, 1.53, 2.67, 6.34, 3.24, 0.96, 0.5, 0.82, 7.21, 1.62, 0.72, 0.27, 0.44, 8.13, 1.86, 1.19, 1.62, 5.59, 4.38]} \ No newline at end of file diff --git a/annotations_1/bPiv1wP8q7g_filtered.json b/annotations_1/bPiv1wP8q7g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e234ceb4634532565bb8fd92aeddbeb7319af182 --- /dev/null +++ b/annotations_1/bPiv1wP8q7g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [4.0, 4.89], [7.0, 7.75], [10.0, 10.57], [13.0, 20.8], [23.0, 23.41], [24.0, 25.34], [28.0, 31.35], [32.0, 32.85], [34.0, 39.53], [41.0, 40.95], [42.0, 47.78], [48.0, 57.87], [59.0, 63.51], [64.0, 66.56], [68.0, 68.84], [72.0, 72.13], [75.0, 75.68], [76.0, 76.91], [77.0, 78.12], [80.0, 81.73], [83.0, 86.16], [87.0, 91.32], [92.0, 92.45], [92.0, 92.84], [94.0, 99.94], [102.0, 101.93], [104.0, 114.27], [132.0, 164.67]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.63, 0.0, 0.0, 36.68, 0.0, 38.37, 0.0, 36.72, 37.45, 41.24, 39.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.96, 44.18, 0.0, 0.0, 38.28, 0.0, 38.67, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 12.31], ["whack, thwack", 12.3], ["breaking", 11.57]], null, null, [["breaking", 63.61], ["music", 6.1], ["glass", 4.73]], null, [["rumble", 43.95], ["mains hum", 13.04], ["hum", 7.13]], null, [["breaking", 69.33], ["music", 10.8], ["glass", 6.63]], [["hum", 40.5], ["mains hum", 25.37], ["speech", 15.5]], [["rumble", 65.77], ["hum", 7.32], ["noise", 4.45]], [["sidetone", 62.04], ["speech", 17.04], ["rumble", 4.38]], null, null, null, null, null, null, [["hum", 29.28], ["mains hum", 17.0], ["rumble", 15.33]], [["hum", 38.97], ["throbbing", 34.13], ["heart sounds, heartbeat", 9.14]], null, null, [["speech", 43.77], ["whale vocalization", 10.66], ["rumble", 10.53]], null, [["mains hum", 36.63], ["hum", 32.8], ["rumble", 15.15]], null], "duration": [1.0, 0.89, 0.75, 0.57, 7.8, 0.41, 1.34, 3.35, 0.85, 5.53, -0.05, 5.78, 9.87, 4.51, 2.56, 0.84, 0.13, 0.68, 0.91, 1.12, 1.73, 3.16, 4.32, 0.45, 0.84, 5.94, -0.07, 10.27, 32.67]} \ No newline at end of file diff --git a/annotations_1/bQObeZ5R0mc_filtered.json b/annotations_1/bQObeZ5R0mc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31a7255223a7e48c246aabe46bcde648e2374e42 --- /dev/null +++ b/annotations_1/bQObeZ5R0mc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.31], [5.0, 13.86], [15.0, 17.66], [18.0, 17.86], [18.0, 18.93], [21.0, 26.11], [31.0, 33.88], [45.0, 46.53], [48.0, 48.32], [51.0, 50.72], [57.0, 62.61], [63.0, 73.13], [74.0, 79.73], [81.0, 82.09]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 67.51, 100.0, 0.0, 0.0, 32.61, 76.37, 0.0, 0.0, 0.0, 40.68, 49.54, 49.18, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["livestock, farm animals, working animals", 25.41], ["cattle, bovinae", 19.9], ["moo", 18.24]], null, null, null, null, [["livestock, farm animals, working animals", 15.14], ["animal", 14.22], ["cattle, bovinae", 9.07]], [["fly, housefly", 28.77], ["insect", 16.87], ["frog", 14.18]], [["fly, housefly", 58.23], ["insect", 21.75], ["mosquito", 9.75]], null], "duration": [0.31, 8.86, 2.66, -0.14, 0.93, 5.11, 2.88, 1.53, 0.32, -0.28, 5.61, 10.13, 5.73, 1.09]} \ No newline at end of file diff --git a/annotations_1/bRehxlYZ_CE_filtered.json b/annotations_1/bRehxlYZ_CE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95a395255e5dfa5d3eda1ddb7a786908c47a8e01 --- /dev/null +++ b/annotations_1/bRehxlYZ_CE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 65.4], [66.0, 68.25]], "keep_status": [false, true], "silence_prob": [0.0, 30.64], "audiomae_on_audioset": [null, [["cattle, bovinae", 13.56], ["moo", 13.15], ["livestock, farm animals, working animals", 10.94]]], "duration": [50.4, 2.25]} \ No newline at end of file diff --git a/annotations_1/bSm3d9ftiJA_filtered.json b/annotations_1/bSm3d9ftiJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a0f021fb652408e719cfeaa9b29b70a4ec4adaa --- /dev/null +++ b/annotations_1/bSm3d9ftiJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.04], [10.0, 11.31], [13.0, 12.95], [14.0, 14.88], [17.0, 17.58], [18.0, 18.86], [23.0, 23.72], [30.0, 29.84], [30.0, 31.04], [33.0, 33.96], [35.0, 35.29], [40.0, 41.07], [41.0, 43.43], [49.0, 48.95], [50.0, 51.7], [55.0, 55.65], [57.0, 57.91], [65.0, 66.43], [75.0, 75.76], [80.0, 80.54], [84.0, 84.67], [86.0, 87.32], [88.0, 90.61], [92.0, 93.21], [101.0, 101.34], [103.0, 102.78], [107.0, 106.76], [110.0, 110.39], [112.0, 115.16], [119.0, 139.19], [139.0, 139.35], [139.0, 140.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [67.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.41, 0.0, 0.0, 0.0, 0.0, 0.0, 46.75, 30.36, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 11.63], ["boing", 8.75], ["hum", 8.33]], [["music", 59.96], ["moo", 3.99], ["livestock, farm animals, working animals", 3.95]], null, null], "duration": [2.04, 1.31, -0.05, 0.88, 0.58, 0.86, 0.72, -0.16, 1.04, 0.96, 0.29, 1.07, 2.43, -0.05, 1.7, 0.65, 0.91, 1.43, 0.76, 0.54, 0.67, 1.32, 2.61, 1.21, 0.34, -0.22, -0.24, 0.39, 3.16, 20.19, 0.35, 1.34]} \ No newline at end of file diff --git a/annotations_1/bTJAIONGv0Y_filtered.json b/annotations_1/bTJAIONGv0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35217b743117215697740f6cd76528494c3f8c94 --- /dev/null +++ b/annotations_1/bTJAIONGv0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.95], [10.0, 11.5], [17.0, 18.17], [20.0, 21.1], [23.0, 23.73], [34.0, 37.49], [38.0, 39.31], [44.0, 44.49], [46.0, 48.81], [63.0, 65.16], [72.0, 74.65], [80.0, 81.43], [93.0, 95.12], [99.0, 100.36], [111.0, 111.48], [114.0, 114.61], [115.0, 117.1], [118.0, 119.47], [123.0, 122.99], [123.0, 123.55], [126.0, 126.54], [128.0, 129.15], [138.0, 137.94], [138.0, 139.4], [141.0, 142.55], [151.0, 153.71], [156.0, 157.94], [161.0, 163.48], [169.0, 171.85], [174.0, 180.0], [181.0, 185.25], [186.0, 189.41], [190.0, 194.02], [195.0, 196.03]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.2, 0.0, 0.0, 29.46, 29.78, 30.59, 0.0, 29.93, 0.0, 0.0, 0.0, 30.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 0.0, 46.15, 62.07, 49.59, 63.21, 53.78, 61.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["insect", 49.65], ["fly, housefly", 39.51], ["bee, wasp, etc.", 8.25]], null, null, [["livestock, farm animals, working animals", 33.98], ["cattle, bovinae", 27.08], ["moo", 22.56]], [["livestock, farm animals, working animals", 23.3], ["cattle, bovinae", 15.92], ["insect", 11.84]], [["speech", 22.69], ["music", 18.91], ["didgeridoo", 10.32]], null, [["crackle", 13.93], ["roar", 8.06], ["sidetone", 7.54]], null, null, null, [["insect", 43.66], ["fly, housefly", 38.11], ["bee, wasp, etc.", 9.93]], null, null, null, null, null, null, null, null, null, null, [["speech", 31.75], ["radio", 15.41], ["frying (food)", 5.54]], null, [["mains hum", 26.21], ["hum", 24.69], ["fly, housefly", 5.84]], null, null, null, null], "duration": [-0.05, 1.5, 1.17, 1.1, 0.73, 3.49, 1.31, 0.49, 2.81, 2.16, 2.65, 1.43, 2.12, 1.36, 0.48, 0.61, 2.1, 1.47, -0.01, 0.55, 0.54, 1.15, -0.06, 1.4, 1.55, 2.71, 1.94, 2.48, 2.85, 6.0, 4.25, 3.41, 4.02, 1.03]} \ No newline at end of file diff --git a/annotations_1/bTPrlCglvFo_filtered.json b/annotations_1/bTPrlCglvFo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d7f1331f2002258241df96f0eec947ca9dd1c0f --- /dev/null +++ b/annotations_1/bTPrlCglvFo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.19], [28.0, 28.43], [33.0, 34.21], [35.0, 34.77], [36.0, 40.93], [42.0, 43.06], [52.0, 52.64], [55.0, 58.38], [63.0, 63.61], [79.0, 79.25], [82.0, 82.43], [88.0, 88.45], [92.0, 91.74], [93.0, 93.5], [94.0, 95.55], [116.0, 116.56], [119.0, 124.21], [135.0, 135.73], [144.0, 144.83], [150.0, 150.03], [152.0, 152.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.84, 0.0, 0.0, 39.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.88, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 46.0], ["speech", 20.11], ["stomach rumble", 6.02]], null, null, [["music", 51.74], ["boing", 28.28], ["speech", 6.16]], null, null, null, null, null, null, null, null, [["music", 82.5], ["boing", 3.32], ["speech", 2.86]], null, null, null, null], "duration": [1.19, 0.43, 1.21, -0.23, 4.93, 1.06, 0.64, 3.38, 0.61, 0.25, 0.43, 0.45, -0.26, 0.5, 1.55, 0.56, 5.21, 0.73, 0.83, 0.03, 0.49]} \ No newline at end of file diff --git a/annotations_1/bWQ1ekGzhwU_filtered.json b/annotations_1/bWQ1ekGzhwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb7fd7fd3f0c5832add7e99727151cef41f0a38d --- /dev/null +++ b/annotations_1/bWQ1ekGzhwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 20.41], [24.0, 25.34], [28.0, 28.54], [29.0, 38.2], [39.0, 53.76], [57.0, 61.26], [62.0, 74.22], [75.0, 75.98], [79.0, 106.76], [110.0, 110.76]], "keep_status": [true, false, false, false, true, false, true, false, true, false], "silence_prob": [29.32, 0.0, 0.0, 29.56, 28.64, 30.99, 28.5, 0.0, 28.38, 0.0], "audiomae_on_audioset": [[["music", 36.74], ["musical instrument", 10.0], ["didgeridoo", 8.18]], null, null, [["speech", 45.89], ["vehicle", 32.93], ["car", 3.6]], [["speech", 40.83], ["vehicle", 11.64], ["civil defense siren", 5.89]], [["speech", 64.78], ["vehicle", 14.57], ["aircraft", 3.4]], [["music", 53.59], ["hum", 4.23], ["cacophony", 3.09]], null, [["speech", 26.04], ["music", 16.97], ["vehicle", 14.3]], null], "duration": [9.41, 1.34, 0.54, 9.2, 14.76, 4.26, 12.22, 0.98, 27.76, 0.76]} \ No newline at end of file diff --git a/annotations_1/bWo3nlFcH5k_filtered.json b/annotations_1/bWo3nlFcH5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8cae889245a729228224d4ab9f33d59410a3118 --- /dev/null +++ b/annotations_1/bWo3nlFcH5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.21], [8.0, 8.45], [9.0, 10.15], [16.0, 18.42], [19.0, 20.38], [22.0, 23.09], [26.0, 26.2], [27.0, 26.86], [30.0, 30.62], [31.0, 33.49], [39.0, 39.85], [44.0, 44.96], [46.0, 46.31], [48.0, 49.64], [53.0, 52.95], [54.0, 54.45], [58.0, 58.33], [60.0, 60.49], [61.0, 61.69], [63.0, 63.51], [67.0, 68.82], [72.0, 73.82], [74.0, 80.77], [83.0, 83.32], [84.0, 85.21], [86.0, 87.37], [92.0, 93.02], [96.0, 96.62], [97.0, 97.19], [98.0, 98.61], [99.0, 99.37], [100.0, 100.48], [101.0, 106.74], [108.0, 109.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 0.45, 1.15, 2.42, 1.38, 1.09, 0.2, -0.14, 0.62, 2.49, 0.85, 0.96, 0.31, 1.64, -0.05, 0.45, 0.33, 0.49, 0.69, 0.51, 1.82, 1.82, 6.77, 0.32, 1.21, 1.37, 1.02, 0.62, 0.19, 0.61, 0.37, 0.48, 5.74, 1.75]} \ No newline at end of file diff --git a/annotations_1/bY-jTccddQo_filtered.json b/annotations_1/bY-jTccddQo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..521ed3a25d9068d6f4da269d19c721f942bfa4ba --- /dev/null +++ b/annotations_1/bY-jTccddQo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.52], [5.0, 13.91], [15.0, 18.05], [19.0, 19.6], [26.0, 30.21], [41.0, 41.54], [46.0, 47.04], [48.0, 54.14], [58.0, 63.19], [66.0, 66.65], [73.0, 77.04], [79.0, 80.84], [94.0, 95.42]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 29.33, 28.67, 0.0, 28.71, 0.0, 0.0, 28.17, 36.14, 0.0, 50.26, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 33.54], ["speech", 27.53], ["electric shaver, electric razor", 5.26]], [["music", 25.0], ["throbbing", 10.21], ["hum", 8.52]], null, [["speech", 85.74], ["music", 3.67], ["sound effect", 0.95]], null, null, [["livestock, farm animals, working animals", 35.21], ["cattle, bovinae", 20.76], ["speech", 10.04]], [["hum", 38.21], ["mains hum", 22.91], ["throbbing", 11.81]], null, null, null, null], "duration": [0.52, 8.91, 3.05, 0.6, 4.21, 0.54, 1.04, 6.14, 5.19, 0.65, 4.04, 1.84, 1.42]} \ No newline at end of file diff --git a/annotations_1/bY6jLt3owBQ_filtered.json b/annotations_1/bY6jLt3owBQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45fdde5c2c2909e09907360a60475143461a2b9c --- /dev/null +++ b/annotations_1/bY6jLt3owBQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.34], [8.0, 8.77], [23.0, 23.31], [27.0, 27.4], [29.0, 37.07], [48.0, 48.41], [53.0, 101.02], [106.0, 124.43]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 43.69, 0.0, 0.0, 31.62], "audiomae_on_audioset": [null, null, null, null, [["music", 61.21], ["synthesizer", 9.79], ["electronic music", 2.81]], null, null, [["music", 79.77], ["electronic music", 1.25], ["musical instrument", 1.16]]], "duration": [1.34, 0.77, 0.31, 0.4, 8.07, 0.41, 48.02, 18.43]} \ No newline at end of file diff --git a/annotations_1/bYO_AhZaG24_filtered.json b/annotations_1/bYO_AhZaG24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eff6993b7ecabc56ad16a378b550dae922803203 --- /dev/null +++ b/annotations_1/bYO_AhZaG24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.28], [22.0, 22.57], [24.0, 27.28], [30.0, 31.08], [33.0, 35.36], [39.0, 60.39], [63.0, 87.49], [94.0, 102.74], [106.0, 113.63], [115.0, 119.28], [124.0, 136.04]], "keep_status": [false, false, false, false, true, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 32.08, 0.0, 31.32, 30.47, 31.22, 32.75, 31.33, 32.06, 33.56], "audiomae_on_audioset": [null, null, [["speech", 51.74], ["music", 16.84], ["musical instrument", 3.63]], null, [["whoosh, swoosh, swish", 12.17], ["fly, housefly", 11.62], ["whip", 10.87]], [["music", 62.78], ["speech", 13.09], ["boing", 6.44]], [["music", 58.28], ["throbbing", 8.47], ["electronic music", 6.75]], [["music", 34.66], ["sidetone", 28.68], ["speech", 15.71]], [["music", 56.65], ["buzz", 6.33], ["boing", 5.59]], [["music", 23.7], ["explosion", 16.08], ["speech", 11.56]], [["music", 60.99], ["theremin", 3.61], ["synthesizer", 3.53]]], "duration": [1.28, 0.57, 3.28, 1.08, 2.36, 21.39, 24.49, 8.74, 7.63, 4.28, 12.04]} \ No newline at end of file diff --git a/annotations_1/bYt5SAF0M3I_filtered.json b/annotations_1/bYt5SAF0M3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06e421d8867b8c9d5fff774f212322b039eef086 --- /dev/null +++ b/annotations_1/bYt5SAF0M3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.48], [11.0, 12.82], [15.0, 15.74], [17.0, 18.86], [20.0, 20.14], [21.0, 24.43], [26.0, 29.49], [30.0, 31.7], [33.0, 36.17], [37.0, 38.15], [39.0, 41.1], [43.0, 48.64], [50.0, 52.22], [54.0, 54.6], [56.0, 57.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 47.86, 44.23, 0.0, 41.74, 0.0, 52.56, 95.09, 66.88, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 72.38], ["radio", 7.54], ["sidetone", 4.19]], [["speech", 32.24], ["stomach rumble", 20.87], ["radio", 17.77]], null, [["speech", 42.45], ["radio", 41.6], ["sidetone", 9.95]], null, null, null, null, null, null], "duration": [1.48, 1.82, 0.74, 1.86, 0.14, 3.43, 3.49, 1.7, 3.17, 1.15, 2.1, 5.64, 2.22, 0.6, 1.54]} \ No newline at end of file diff --git a/annotations_1/bZhBhpm6m_A_filtered.json b/annotations_1/bZhBhpm6m_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f2a6648fc590a22eea0fbdf1f4b81afdc5835c0 --- /dev/null +++ b/annotations_1/bZhBhpm6m_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.29], [14.0, 14.4], [15.0, 15.87], [18.0, 18.18], [26.0, 27.51], [28.0, 29.27], [36.0, 37.86], [38.0, 41.35], [46.0, 45.81], [49.0, 50.04], [52.0, 53.4], [56.0, 56.46], [64.0, 64.62], [67.0, 67.41], [68.0, 70.68], [71.0, 81.38], [82.0, 83.66], [84.0, 84.92], [86.0, 86.24], [89.0, 89.31], [90.0, 91.02], [93.0, 93.92], [101.0, 101.63], [104.0, 105.19], [107.0, 107.55], [111.0, 112.78], [113.0, 115.13], [118.0, 120.16], [123.0, 122.99], [128.0, 129.83], [131.0, 131.53], [132.0, 135.9], [137.0, 164.17], [169.0, 170.18], [170.0, 171.26], [172.0, 172.64], [174.0, 173.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.86, 30.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.54, 99.94, 0.0, 0.0, 0.0, 45.65, 30.86, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 57.31], ["gunshot, gunfire", 7.89], ["explosion", 7.04]], null, null, null, null, null, null, null, [["speech", 46.58], ["explosion", 23.09], ["gunshot, gunfire", 9.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.85], ["hum", 29.83], ["mains hum", 12.99]], [["music", 25.6], ["hum", 11.11], ["crushing", 6.33]], null, null, null, null], "duration": [0.29, 0.4, 0.87, 0.18, 1.51, 1.27, 1.86, 3.35, -0.19, 1.04, 1.4, 0.46, 0.62, 0.41, 2.68, 10.38, 1.66, 0.92, 0.24, 0.31, 1.02, 0.92, 0.63, 1.19, 0.55, 1.78, 2.13, 2.16, -0.01, 1.83, 0.53, 3.9, 27.17, 1.18, 1.26, 0.64, -0.06]} \ No newline at end of file diff --git a/annotations_1/b_aJy2SE60E_filtered.json b/annotations_1/b_aJy2SE60E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f68b82da1e71fdaeb22bbbf50881af64cced368d --- /dev/null +++ b/annotations_1/b_aJy2SE60E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.48], [18.0, 18.98], [30.0, 30.42], [32.0, 31.92], [53.0, 53.6], [71.0, 71.46], [97.0, 98.1], [103.0, 103.17], [106.0, 105.7], [128.0, 129.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.48, 0.98, 0.42, -0.08, 0.6, 0.46, 1.1, 0.17, -0.3, 1.03]} \ No newline at end of file diff --git a/annotations_1/baNc64S4DHY_filtered.json b/annotations_1/baNc64S4DHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cba8ae9719fc0d100daf16d6b0f26a1de696954a --- /dev/null +++ b/annotations_1/baNc64S4DHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.9], [22.0, 23.95], [27.0, 27.65], [29.0, 30.65], [37.0, 38.06], [39.0, 39.66], [49.0, 49.22], [53.0, 53.84], [60.0, 61.05], [63.0, 63.9], [75.0, 76.79], [78.0, 78.66], [80.0, 80.16], [83.0, 83.78], [86.0, 88.37], [89.0, 89.34], [91.0, 91.64], [96.0, 96.47], [99.0, 100.25], [105.0, 105.46], [106.0, 108.65], [114.0, 115.21], [120.0, 121.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.9, 1.95, 0.65, 1.65, 1.06, 0.66, 0.22, 0.84, 1.05, 0.9, 1.79, 0.66, 0.16, 0.78, 2.37, 0.34, 0.64, 0.47, 1.25, 0.46, 2.65, 1.21, 1.54]} \ No newline at end of file diff --git a/annotations_1/bbX5KM0tFVk_filtered.json b/annotations_1/bbX5KM0tFVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43afaa0eded760ba8f95f84e13af6e9d92041dc0 --- /dev/null +++ b/annotations_1/bbX5KM0tFVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.96], [7.0, 10.32], [13.0, 17.51], [18.0, 19.85], [21.0, 24.71], [27.0, 29.27], [31.0, 35.94], [38.0, 40.05], [42.0, 45.01], [46.0, 57.43], [58.0, 59.97], [62.0, 132.66], [135.0, 139.7], [142.0, 144.98], [148.0, 156.1]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 90.95, 100.0, 0.0, 99.31, 47.46, 39.3, 100.0, 90.25, 50.26, 0.0, 0.0, 72.01, 64.63, 47.66], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 77.03], ["sidetone", 8.28], ["dial tone", 3.83]], [["hum", 14.74], ["mains hum", 12.77], ["fly, housefly", 10.1]], null, null, null, null, null, null, null, [["noise", 24.95], ["stomach rumble", 16.14], ["effects unit", 8.99]]], "duration": [0.96, 3.32, 4.51, 1.85, 3.71, 2.27, 4.94, 2.05, 3.01, 11.43, 1.97, 70.66, 4.7, 2.98, 8.1]} \ No newline at end of file diff --git a/annotations_1/bbnkw5RyiCI_filtered.json b/annotations_1/bbnkw5RyiCI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b7a4ab330a45435388726fdd73dd690668c9a4f --- /dev/null +++ b/annotations_1/bbnkw5RyiCI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.38], [25.0, 28.61], [29.0, 29.86], [30.0, 33.22], [37.0, 39.29], [54.0, 57.27], [77.0, 76.99], [81.0, 84.18], [103.0, 104.06], [106.0, 107.33], [114.0, 113.7], [114.0, 113.73], [114.0, 115.4], [117.0, 116.78], [118.0, 122.98], [124.0, 124.48], [125.0, 136.24], [138.0, 141.57], [144.0, 144.61], [146.0, 154.45], [157.0, 157.33]], "keep_status": [false, true, false, false, true, false, false, true, false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [66.51, 42.74, 0.0, 63.85, 49.59, 34.36, 0.0, 33.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.56, 0.0, 69.74, 84.43, 0.0, 31.9, 0.0], "audiomae_on_audioset": [null, [["speech", 44.37], ["frog", 12.49], ["croak", 10.33]], null, null, [["speech", 39.4], ["cattle, bovinae", 7.27], ["music", 5.33]], [["livestock, farm animals, working animals", 41.73], ["moo", 27.84], ["cattle, bovinae", 19.13]], null, [["fly, housefly", 27.48], ["insect", 21.31], ["livestock, farm animals, working animals", 20.37]], null, null, null, null, null, null, [["speech", 31.07], ["sidetone", 23.53], ["noise", 12.82]], null, null, null, null, [["music", 37.48], ["speech", 16.22], ["buzz", 6.5]], null], "duration": [2.38, 3.61, 0.86, 3.22, 2.29, 3.27, -0.01, 3.18, 1.06, 1.33, -0.3, -0.27, 1.4, -0.22, 4.98, 0.48, 11.24, 3.57, 0.61, 8.45, 0.33]} \ No newline at end of file diff --git a/annotations_1/bd0IiiCDDGI_filtered.json b/annotations_1/bd0IiiCDDGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8815d9894606b069f3400eb6f727eb85e3c8475 --- /dev/null +++ b/annotations_1/bd0IiiCDDGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.18], [7.0, 7.28], [8.0, 9.24], [11.0, 10.77], [11.0, 11.5], [12.0, 12.5], [14.0, 16.16], [20.0, 24.29], [25.0, 26.08], [28.0, 28.16], [28.0, 28.98], [34.0, 42.3], [44.0, 44.04], [45.0, 45.03], [47.0, 47.17], [52.0, 53.1], [54.0, 64.62], [65.0, 71.78], [73.0, 75.0], [78.0, 121.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 78.04, 0.0, 0.0, 0.0, 84.98, 0.0, 0.0, 0.0, 0.0, 48.31, 47.35, 53.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.99], ["speech", 34.07], ["scary music", 1.2]], [["music", 63.4], ["carnatic music", 12.25], ["theremin", 4.73]], null, null], "duration": [0.18, 0.28, 1.24, -0.23, 0.5, 0.5, 2.16, 4.29, 1.08, 0.16, 0.98, 8.3, 0.04, 0.03, 0.17, 1.1, 10.62, 6.78, 2.0, 43.36]} \ No newline at end of file diff --git a/annotations_1/bdFo-WtjOmA_filtered.json b/annotations_1/bdFo-WtjOmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cf2412325ba0f843d0d3f9a290a4992ec9b2021 --- /dev/null +++ b/annotations_1/bdFo-WtjOmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 60.74], [62.0, 82.09], [83.0, 87.44], [88.0, 89.18], [90.0, 92.53], [96.0, 97.58], [102.0, 109.07], [112.0, 114.12], [116.0, 116.28], [118.0, 121.34], [124.0, 126.18]], "keep_status": [true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [48.14, 31.89, 34.87, 0.0, 33.36, 0.0, 31.3, 35.95, 0.0, 34.78, 30.83], "audiomae_on_audioset": [[["cough", 40.69], ["music", 17.73], ["throat clearing", 8.2]], [["hum", 33.52], ["mains hum", 33.49], ["music", 10.97]], [["hum", 34.23], ["mains hum", 29.35], ["music", 10.89]], null, [["whale vocalization", 82.03], ["music", 9.04], ["hum", 1.75]], null, [["music", 52.29], ["theremin", 21.8], ["noise", 1.87]], [["gong", 38.65], ["music", 19.78], ["didgeridoo", 10.65]], null, [["hum", 45.56], ["mains hum", 38.49], ["music", 4.76]], [["hum", 21.68], ["mains hum", 21.44], ["vehicle", 5.48]]], "duration": [4.74, 20.09, 4.44, 1.18, 2.53, 1.58, 7.07, 2.12, 0.28, 3.34, 2.18]} \ No newline at end of file diff --git a/annotations_1/bdJPnMKhsnY_filtered.json b/annotations_1/bdJPnMKhsnY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9d5ce27a11f4f18c8b6b61e27e5991f15e84880 --- /dev/null +++ b/annotations_1/bdJPnMKhsnY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.86], [32.0, 32.31], [56.0, 56.25], [59.0, 60.2], [62.0, 62.6], [64.0, 64.88], [69.0, 72.59]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.82], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 77.37], ["hum", 3.71], ["electronic music", 1.97]]], "duration": [-0.14, 0.31, 0.25, 1.2, 0.6, 0.88, 3.59]} \ No newline at end of file diff --git a/annotations_1/bdJcCwoJ4KQ_filtered.json b/annotations_1/bdJcCwoJ4KQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..066b91ddb1f7cb886545a67e1fdbe47586bd0bbb --- /dev/null +++ b/annotations_1/bdJcCwoJ4KQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [4.0, 6.37], [16.0, 21.39], [23.0, 23.7], [26.0, 26.03], [29.0, 28.95], [31.0, 31.72], [35.0, 36.32], [38.0, 49.03], [55.0, 64.13], [65.0, 66.66], [70.0, 80.05], [81.0, 81.08], [84.0, 86.91], [89.0, 92.16], [93.0, 96.74], [97.0, 99.05], [100.0, 100.92], [102.0, 104.68], [109.0, 117.49], [120.0, 140.16], [144.0, 146.79], [147.0, 157.71], [160.0, 175.27]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 93.13, 36.18, 0.0, 0.0, 0.0, 0.0, 0.0, 46.83, 29.04, 0.0, 49.04, 0.0, 80.82, 75.72, 73.21, 51.12, 0.0, 39.5, 39.47, 42.3, 39.02, 50.91, 43.48], "audiomae_on_audioset": [null, null, [["chirp tone", 22.74], ["tuning fork", 15.5], ["hum", 12.78]], null, null, null, null, null, [["music", 24.36], ["hum", 9.75], ["electric shaver, electric razor", 8.75]], [["quack", 37.27], ["duck", 24.82], ["music", 9.21]], null, [["music", 69.15], ["sonar", 8.18], ["buzz", 5.93]], null, null, null, null, null, null, [["music", 49.93], ["coin (dropping)", 13.37], ["throbbing", 8.9]], [["didgeridoo", 38.78], ["music", 32.69], ["musical instrument", 2.99]], [["music", 68.06], ["hum", 11.85], ["throbbing", 5.24]], [["hum", 46.43], ["throbbing", 14.63], ["mains hum", 12.83]], null, [["ding", 27.16], ["music", 24.59], ["speech", 10.5]]], "duration": [0.89, 2.37, 5.39, 0.7, 0.03, -0.05, 0.72, 1.32, 11.03, 9.13, 1.66, 10.05, 0.08, 2.91, 3.16, 3.74, 2.05, 0.92, 2.68, 8.49, 20.16, 2.79, 10.71, 15.27]} \ No newline at end of file diff --git a/annotations_1/be9FJeol_aQ_filtered.json b/annotations_1/be9FJeol_aQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aafdb4af0ce764f96bf70de37e51645d3f1ba2d4 --- /dev/null +++ b/annotations_1/be9FJeol_aQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 97.8], [101.0, 124.55]], "keep_status": [false, true], "silence_prob": [0.0, 31.25], "audiomae_on_audioset": [null, [["music", 44.97], ["livestock, farm animals, working animals", 12.63], ["moo", 8.59]]], "duration": [93.8, 23.55]} \ No newline at end of file diff --git a/annotations_1/bfKu5Jc8TjA_filtered.json b/annotations_1/bfKu5Jc8TjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b251b5c00589f6529dc550b5722f26b01c0cc3e --- /dev/null +++ b/annotations_1/bfKu5Jc8TjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.58], [15.0, 27.62], [31.0, 35.5], [39.0, 40.46], [44.0, 52.61], [54.0, 56.03], [56.0, 59.0], [64.0, 64.72], [72.0, 109.44], [112.0, 114.29], [116.0, 118.22], [118.0, 118.66], [121.0, 123.04], [126.0, 129.66], [130.0, 135.11], [135.0, 135.68], [136.0, 137.27], [138.0, 143.63]], "keep_status": [false, true, false, false, true, true, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.57, 32.77, 0.0, 33.07, 33.76, 32.91, 0.0, 0.0, 34.8, 93.6, 0.0, 97.54, 77.7, 93.29, 0.0, 0.0, 49.5], "audiomae_on_audioset": [null, [["music", 38.92], ["sidetone", 12.8], ["speech", 10.62]], [["music", 50.07], ["boing", 17.49], ["didgeridoo", 7.1]], null, [["fart", 25.55], ["fly, housefly", 10.51], ["vehicle", 8.69]], [["music", 32.75], ["hum", 10.38], ["mains hum", 6.97]], [["speech", 43.47], ["music", 19.45], ["radio", 5.03]], null, null, [["music", 34.73], ["throbbing", 26.13], ["hum", 6.37]], null, null, null, null, null, null, null, [["music", 73.88], ["didgeridoo", 7.9], ["musical instrument", 4.5]]], "duration": [0.58, 12.62, 4.5, 1.46, 8.61, 2.03, 3.0, 0.72, 37.44, 2.29, 2.22, 0.66, 2.04, 3.66, 5.11, 0.68, 1.27, 5.63]} \ No newline at end of file diff --git a/annotations_1/bgS0GPQhzHg_filtered.json b/annotations_1/bgS0GPQhzHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d1c8dc45f731258472ebd42d81191a2f1d6eb6e --- /dev/null +++ b/annotations_1/bgS0GPQhzHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.02], [10.0, 11.38], [12.0, 39.9], [41.0, 40.78], [45.0, 48.3], [49.0, 72.05]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 28.91, 0.0, 29.82, 28.7], "audiomae_on_audioset": [null, null, [["music", 56.12], ["throbbing", 9.19], ["synthesizer", 8.08]], null, [["music", 50.85], ["throbbing", 8.08], ["ambient music", 5.27]], [["music", 83.81], ["ambient music", 3.72], ["synthesizer", 2.2]]], "duration": [1.02, 1.38, 27.9, -0.22, 3.3, 23.05]} \ No newline at end of file diff --git a/annotations_1/bgZWbi1o8bY_filtered.json b/annotations_1/bgZWbi1o8bY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7363af14b5fd809faf8a97c0ecf00cea3aff1b3 --- /dev/null +++ b/annotations_1/bgZWbi1o8bY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.0], [11.0, 23.18], [49.0, 48.84], [81.0, 86.48], [97.0, 97.66], [107.0, 107.49], [110.0, 111.35], [112.0, 112.11], [113.0, 113.04], [114.0, 114.67], [116.0, 117.68], [121.0, 121.76], [122.0, 142.18], [152.0, 152.2], [155.0, 163.44], [172.0, 172.52]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 30.0, 0.0, 29.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.6, 0.0, 29.75, 0.0], "audiomae_on_audioset": [null, [["music", 34.42], ["speech", 31.63], ["electric shaver, electric razor", 10.98]], null, [["speech", 20.03], ["cattle, bovinae", 16.32], ["livestock, farm animals, working animals", 14.87]], null, null, null, null, null, null, null, null, [["music", 50.07], ["speech", 29.77], ["cattle, bovinae", 4.2]], null, [["music", 29.21], ["whip", 8.97], ["groan", 8.94]], null], "duration": [0.0, 12.18, -0.16, 5.48, 0.66, 0.49, 1.35, 0.11, 0.04, 0.67, 1.68, 0.76, 20.18, 0.2, 8.44, 0.52]} \ No newline at end of file diff --git a/annotations_1/bhtJNsUfHIM_filtered.json b/annotations_1/bhtJNsUfHIM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..985cef5348713349bd081f33085b81214eef080b --- /dev/null +++ b/annotations_1/bhtJNsUfHIM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.41], [7.0, 7.28], [13.0, 13.96], [15.0, 17.39], [19.0, 22.25], [23.0, 25.98], [27.0, 27.3], [29.0, 29.29], [29.0, 30.47], [33.0, 34.8], [36.0, 36.0], [38.0, 39.51], [45.0, 45.39], [48.0, 47.97], [54.0, 54.58], [56.0, 56.47], [60.0, 61.13], [64.0, 63.66], [66.0, 66.16], [67.0, 67.34], [70.0, 72.17], [74.0, 74.07], [76.0, 77.6], [81.0, 81.8], [83.0, 84.6], [94.0, 94.34], [98.0, 99.5], [101.0, 101.82], [102.0, 104.63], [107.0, 107.25], [109.0, 110.07], [111.0, 111.62], [121.0, 121.88], [123.0, 123.52], [127.0, 128.17], [130.0, 130.38], [134.0, 136.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 86.64, 99.62, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.45], ["throbbing", 19.41], ["hum", 13.63]]], "duration": [1.41, 0.28, 0.96, 2.39, 3.25, 2.98, 0.3, 0.29, 1.47, 1.8, 0.0, 1.51, 0.39, -0.03, 0.58, 0.47, 1.13, -0.34, 0.16, 0.34, 2.17, 0.07, 1.6, 0.8, 1.6, 0.34, 1.5, 0.82, 2.63, 0.25, 1.07, 0.62, 0.88, 0.52, 1.17, 0.38, 2.66]} \ No newline at end of file diff --git a/annotations_1/bkhUe1txLoc_filtered.json b/annotations_1/bkhUe1txLoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..135af6e52794f0bc2b20c51d7278bca5d8374e9d --- /dev/null +++ b/annotations_1/bkhUe1txLoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.52], [6.0, 6.61], [8.0, 8.24], [9.0, 9.91], [10.0, 10.25], [10.0, 10.3], [10.0, 10.34], [10.0, 10.83], [11.0, 12.46], [13.0, 14.23], [15.0, 18.1], [19.0, 21.69], [24.0, 24.9], [31.0, 31.43], [36.0, 37.29], [41.0, 42.38], [42.0, 43.33], [51.0, 51.31], [55.0, 55.54], [62.0, 61.7], [68.0, 68.71], [76.0, 78.36], [79.0, 80.22], [83.0, 84.05], [91.0, 91.56], [105.0, 105.39], [118.0, 119.28], [123.0, 123.87], [126.0, 126.84], [128.0, 131.26], [131.0, 133.83], [142.0, 143.16], [146.0, 146.91], [150.0, 150.38], [151.0, 152.05], [153.0, 154.67], [157.0, 158.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 60.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.14, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.52, 0.61, 0.24, 0.91, 0.25, 0.3, 0.34, 0.83, 1.46, 1.23, 3.1, 2.69, 0.9, 0.43, 1.29, 1.38, 1.33, 0.31, 0.54, -0.3, 0.71, 2.36, 1.22, 1.05, 0.56, 0.39, 1.28, 0.87, 0.84, 3.26, 2.83, 1.16, 0.91, 0.38, 1.05, 1.67, 1.65]} \ No newline at end of file diff --git a/annotations_1/blQ8Wi0VAn0_filtered.json b/annotations_1/blQ8Wi0VAn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3cdbffb233ec404be08d37d1c8de6ef1af4c28f --- /dev/null +++ b/annotations_1/blQ8Wi0VAn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 42.03], [54.0, 64.29], [64.0, 64.44], [65.0, 67.53], [69.0, 69.48], [70.0, 72.79], [74.0, 77.45], [81.0, 80.87], [92.0, 93.28], [96.0, 96.77], [101.0, 103.94], [108.0, 115.87], [120.0, 120.5], [122.0, 122.52], [125.0, 126.6], [129.0, 130.28], [132.0, 132.36]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.46, 93.29, 0.0, 87.92, 0.0, 94.22, 75.55, 0.0, 0.0, 0.0, 98.73, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 20.01], ["fart", 20.01], ["musical instrument", 8.23]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.03, 10.29, 0.44, 2.53, 0.48, 2.79, 3.45, -0.13, 1.28, 0.77, 2.94, 7.87, 0.5, 0.52, 1.6, 1.28, 0.36]} \ No newline at end of file diff --git a/annotations_1/bmBh8DSdcnU_filtered.json b/annotations_1/bmBh8DSdcnU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..001a548147b11a1e5caed444525dcf0c37cd0c76 --- /dev/null +++ b/annotations_1/bmBh8DSdcnU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[96.0, 140.12], [140.0, 145.22], [145.0, 159.75]], "keep_status": [false, true, true], "silence_prob": [0.0, 29.41, 33.96], "audiomae_on_audioset": [null, [["speech", 31.59], ["explosion", 9.38], ["groan", 6.83]], [["speech", 28.81], ["groan", 17.32], ["outside, rural or natural", 5.86]]], "duration": [44.12, 5.22, 14.75]} \ No newline at end of file diff --git a/annotations_1/bnLhMGzgfSM_filtered.json b/annotations_1/bnLhMGzgfSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cc5a4904a074f515969577d888334fd88d2b6e8 --- /dev/null +++ b/annotations_1/bnLhMGzgfSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [5.0, 6.29], [7.0, 20.58], [22.0, 25.57], [26.0, 29.46], [47.0, 50.46], [58.0, 68.76], [70.0, 71.07], [73.0, 73.23], [74.0, 74.78], [78.0, 83.22], [88.0, 94.1], [101.0, 103.2], [104.0, 105.0], [108.0, 109.98], [111.0, 112.08], [125.0, 126.4], [127.0, 128.39], [129.0, 131.65], [136.0, 137.15], [138.0, 139.4], [140.0, 145.32], [146.0, 148.54], [152.0, 153.55], [155.0, 155.63], [158.0, 163.63], [165.0, 168.57]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 88.46, 95.64, 78.72, 99.56, 42.79, 0.0, 0.0, 0.0, 100.0, 98.99, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.99, 100.0, 0.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["fly, housefly", 40.4], ["insect", 16.01], ["frog", 8.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, 1.29, 13.58, 3.57, 3.46, 3.46, 10.76, 1.07, 0.23, 0.78, 5.22, 6.1, 2.2, 1.0, 1.98, 1.08, 1.4, 1.39, 2.65, 1.15, 1.4, 5.32, 2.54, 1.55, 0.63, 5.63, 3.57]} \ No newline at end of file diff --git a/annotations_1/bn_Df5UNy3s_filtered.json b/annotations_1/bn_Df5UNy3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40ad8b04ae5025a405beacda02a36d37148c429b --- /dev/null +++ b/annotations_1/bn_Df5UNy3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 95.74], [96.0, 122.12]], "keep_status": [false, true], "silence_prob": [0.0, 29.41], "audiomae_on_audioset": [null, [["music", 30.13], ["cattle, bovinae", 10.11], ["moo", 9.72]]], "duration": [69.74, 26.12]} \ No newline at end of file diff --git a/annotations_1/boGgXcQIe-8_filtered.json b/annotations_1/boGgXcQIe-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be56f0e5d1d7880cc4eccad73ce317c687288059 --- /dev/null +++ b/annotations_1/boGgXcQIe-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.4], [5.0, 9.32], [11.0, 14.52], [16.0, 16.95], [20.0, 20.6], [21.0, 21.63], [22.0, 22.98], [24.0, 24.75], [29.0, 29.27], [32.0, 38.31], [40.0, 43.48], [47.0, 50.41], [51.0, 54.82], [57.0, 102.22], [109.0, 109.56], [112.0, 111.99], [113.0, 113.91], [121.0, 121.2]], "keep_status": [false, true, true, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 30.93, 46.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.83, 40.61, 39.52, 40.24, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 24.61], ["music", 22.82], ["hum", 13.68]], [["hum", 27.71], ["music", 11.0], ["vehicle", 8.49]], null, null, null, null, null, null, [["speech", 14.4], ["music", 9.41], ["singing bowl", 6.8]], [["speech", 25.51], ["rumble", 21.17], ["whale vocalization", 21.07]], [["rumble", 29.51], ["whale vocalization", 25.7], ["speech", 14.94]], [["whale vocalization", 25.17], ["rumble", 20.52], ["hum", 8.81]], null, null, null, null, null], "duration": [1.4, 4.32, 3.52, 0.95, 0.6, 0.63, 0.98, 0.75, 0.27, 6.31, 3.48, 3.41, 3.82, 45.22, 0.56, -0.01, 0.91, 0.2]} \ No newline at end of file diff --git a/annotations_1/bp5HRI2hEW0_filtered.json b/annotations_1/bp5HRI2hEW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fad258bdaa770845b3e2c6c08e1b0123fa3a111 --- /dev/null +++ b/annotations_1/bp5HRI2hEW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 85.4]], "keep_status": [false], "silence_prob": [65.67], "audiomae_on_audioset": [null], "duration": [4.4]} \ No newline at end of file diff --git a/annotations_1/bpNxVXA5dcQ_filtered.json b/annotations_1/bpNxVXA5dcQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..523497a2d713c03d9447d68a11d4e427b39049da --- /dev/null +++ b/annotations_1/bpNxVXA5dcQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.24], [9.0, 9.9], [10.0, 30.23], [35.0, 36.21], [37.0, 37.71], [38.0, 43.14], [52.0, 52.98], [54.0, 54.38], [55.0, 57.69], [58.0, 61.16], [62.0, 64.74], [66.0, 117.88], [121.0, 127.53]], "keep_status": [false, false, true, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 32.05, 0.0, 0.0, 33.64, 0.0, 0.0, 47.98, 42.15, 44.29, 0.0, 99.98], "audiomae_on_audioset": [null, null, [["music", 47.77], ["didgeridoo", 8.37], ["hum", 4.23]], null, null, [["music", 39.66], ["speech", 27.48], ["hum", 6.36]], null, null, [["music", 25.4], ["speech", 15.15], ["effects unit", 11.74]], [["music", 49.66], ["speech", 12.33], ["musical instrument", 11.29]], [["music", 51.92], ["bass guitar", 5.63], ["plucked string instrument", 5.48]], null, null], "duration": [1.24, 0.9, 20.23, 1.21, 0.71, 5.14, 0.98, 0.38, 2.69, 3.16, 2.74, 51.88, 6.53]} \ No newline at end of file diff --git a/annotations_1/bp_GxHYCq90_filtered.json b/annotations_1/bp_GxHYCq90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d02476d694366b3f76ca12206e1c112e158bfb29 --- /dev/null +++ b/annotations_1/bp_GxHYCq90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.26], [6.0, 7.05], [10.0, 10.37], [12.0, 13.37], [24.0, 29.96], [38.0, 40.71], [43.0, 43.55], [46.0, 51.27], [52.0, 52.27], [53.0, 63.14], [65.0, 77.04], [78.0, 78.85], [80.0, 92.58], [95.0, 99.13], [105.0, 107.15], [111.0, 112.68], [116.0, 119.55], [123.0, 124.53], [127.0, 130.03]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, true, true, true, false, true, false, true], "silence_prob": [29.28, 0.0, 0.0, 0.0, 29.11, 28.76, 0.0, 28.82, 0.0, 28.74, 29.69, 0.0, 28.44, 28.5, 29.16, 0.0, 28.29, 0.0, 28.11], "audiomae_on_audioset": [[["fart", 26.26], ["speech", 8.88], ["boing", 7.44]], null, null, null, [["music", 32.02], ["speech", 19.27], ["throbbing", 4.96]], [["speech", 72.76], ["music", 5.13], ["machine gun", 4.78]], null, [["music", 67.3], ["speech", 17.8], ["gunshot, gunfire", 1.93]], null, [["music", 46.45], ["speech", 27.14], ["whack, thwack", 4.12]], [["music", 33.99], ["speech", 27.36], ["throbbing", 20.34]], null, [["music", 30.96], ["hum", 21.71], ["mains hum", 10.4]], [["music", 52.9], ["throbbing", 10.6], ["musical instrument", 4.46]], [["mains hum", 30.11], ["hum", 25.63], ["speech", 7.28]], null, [["hum", 29.28], ["speech", 18.97], ["mains hum", 17.33]], null, [["music", 26.66], ["hum", 11.15], ["mains hum", 8.67]]], "duration": [4.26, 1.05, 0.37, 1.37, 5.96, 2.71, 0.55, 5.27, 0.27, 10.14, 12.04, 0.85, 12.58, 4.13, 2.15, 1.68, 3.55, 1.53, 3.03]} \ No newline at end of file diff --git a/annotations_1/bqvMCDQ3HEU_filtered.json b/annotations_1/bqvMCDQ3HEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6e99468cbcf003ad6cd2cb379837878813e73e8 --- /dev/null +++ b/annotations_1/bqvMCDQ3HEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.32], [10.0, 13.12], [14.0, 16.65], [35.0, 36.12], [38.0, 46.2], [50.0, 55.26], [55.0, 118.76], [119.0, 119.82], [122.0, 122.91], [126.0, 137.24], [138.0, 140.1], [144.0, 145.1], [146.0, 147.73], [152.0, 153.44]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.68, 60.14, 0.0, 53.97, 39.07, 0.0, 0.0, 0.0, 42.88, 54.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 38.4], ["music", 22.22], ["didgeridoo", 6.41]], null, null, null, [["animal", 17.2], ["music", 10.43], ["clip-clop", 7.73]], null, null, null, [["speech", 65.42], ["electric shaver, electric razor", 7.79], ["buzz", 6.91]], null, null, null, null], "duration": [0.32, 3.12, 2.65, 1.12, 8.2, 5.26, 63.76, 0.82, 0.91, 11.24, 2.1, 1.1, 1.73, 1.44]} \ No newline at end of file diff --git a/annotations_1/bqwH3cQUlNA_filtered.json b/annotations_1/bqwH3cQUlNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a313e4ff942ae011d623be8b4311c4cc41c4ee3d --- /dev/null +++ b/annotations_1/bqwH3cQUlNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 35.43], [36.0, 36.21], [39.0, 38.89], [43.0, 43.61], [44.0, 45.47], [46.0, 48.02], [49.0, 50.33], [51.0, 52.68], [54.0, 55.88], [66.0, 71.46], [72.0, 73.13], [75.0, 77.33], [92.0, 92.08], [97.0, 98.59], [101.0, 100.92], [102.0, 103.01], [107.0, 135.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [30.77, 0.0, 0.0, 0.0, 0.0, 90.43, 0.0, 0.0, 0.0, 90.08, 0.0, 32.8, 0.0, 0.0, 0.0, 0.0, 30.75], "audiomae_on_audioset": [[["music", 54.43], ["throbbing", 10.0], ["hum", 6.01]], null, null, null, null, null, null, null, null, null, null, [["music", 55.59], ["singing bowl", 7.56], ["musical instrument", 3.36]], null, null, null, null, [["music", 38.25], ["speech", 23.45], ["hum", 6.0]]], "duration": [13.43, 0.21, -0.11, 0.61, 1.47, 2.02, 1.33, 1.68, 1.88, 5.46, 1.13, 2.33, 0.08, 1.59, -0.08, 1.01, 28.9]} \ No newline at end of file diff --git a/annotations_1/bqwS3qz3GhE_filtered.json b/annotations_1/bqwS3qz3GhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d4afe153376a7af4f9588e533d51312b8f7cd9c --- /dev/null +++ b/annotations_1/bqwS3qz3GhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 48.69], [50.0, 51.44], [55.0, 55.8], [59.0, 60.22], [61.0, 61.38], [62.0, 149.35], [150.0, 153.69], [156.0, 156.47], [165.0, 167.51]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [72.31, 0.0, 0.0, 0.0, 0.0, 0.0, 45.72, 0.0, 82.61], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 30.73], ["fire", 13.45], ["mains hum", 9.79]], null, null], "duration": [2.69, 1.44, 0.8, 1.22, 0.38, 87.35, 3.69, 0.47, 2.51]} \ No newline at end of file diff --git a/annotations_1/br2rj_3KW1A_filtered.json b/annotations_1/br2rj_3KW1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ab79f635adc687793a69bfc55a998621129e90e --- /dev/null +++ b/annotations_1/br2rj_3KW1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.71], [26.0, 26.49], [30.0, 30.48], [35.0, 35.75], [38.0, 38.69], [39.0, 39.18], [44.0, 45.87], [55.0, 55.7], [56.0, 57.45], [62.0, 65.82], [66.0, 68.84], [70.0, 91.86], [92.0, 103.32], [105.0, 107.59], [112.0, 114.3]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.0, 31.4, 29.16, 28.76, 30.16, 30.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 33.44], ["hum", 17.19], ["mains hum", 10.01]], [["music", 23.79], ["didgeridoo", 18.14], ["mains hum", 8.55]], [["music", 55.89], ["throbbing", 20.47], ["hum", 6.53]], [["music", 53.6], ["hum", 9.3], ["throbbing", 5.62]], [["music", 18.13], ["explosion", 7.92], ["groan", 7.25]], [["music", 34.33], ["speech", 28.46], ["boing", 11.52]]], "duration": [0.71, 0.49, 0.48, 0.75, 0.69, 0.18, 1.87, 0.7, 1.45, 3.82, 2.84, 21.86, 11.32, 2.59, 2.3]} \ No newline at end of file diff --git a/annotations_1/btMisVovQKk_filtered.json b/annotations_1/btMisVovQKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..088b21fb54c54f0a56713ea109d96ed996d809da --- /dev/null +++ b/annotations_1/btMisVovQKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.87], [9.0, 8.68], [15.0, 14.82], [19.0, 19.41], [25.0, 25.25], [27.0, 27.6], [36.0, 37.08], [38.0, 38.26], [44.0, 44.44], [45.0, 46.75], [60.0, 60.24], [65.0, 65.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.13, -0.32, -0.18, 0.41, 0.25, 0.6, 1.08, 0.26, 0.44, 1.75, 0.24, 0.64]} \ No newline at end of file diff --git a/annotations_1/btVoaFC1Aqk_filtered.json b/annotations_1/btVoaFC1Aqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c80f3a2eb803981b2c6a5d98a1f4fc60b613405 --- /dev/null +++ b/annotations_1/btVoaFC1Aqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 38.03], [39.0, 40.78], [43.0, 49.84], [53.0, 55.76], [58.0, 62.21], [63.0, 75.71], [77.0, 76.94], [80.0, 88.6], [90.0, 92.08], [94.0, 94.37]], "keep_status": [false, false, false, true, false, false, false, true, true, false], "silence_prob": [30.24, 0.0, 29.51, 29.41, 30.88, 29.5, 0.0, 30.89, 30.02, 0.0], "audiomae_on_audioset": [[["music", 76.44], ["electronic music", 4.01], ["synthesizer", 3.06]], null, [["throbbing", 36.63], ["hum", 29.41], ["music", 7.2]], [["music", 44.3], ["speech", 17.48], ["breaking", 7.27]], [["hum", 37.69], ["music", 17.51], ["throbbing", 16.34]], [["music", 51.07], ["hum", 21.16], ["throbbing", 14.08]], null, [["speech", 39.19], ["bee, wasp, etc.", 14.43], ["fly, housefly", 11.64]], [["music", 20.44], ["didgeridoo", 17.86], ["speech", 8.56]], null], "duration": [23.03, 1.78, 6.84, 2.76, 4.21, 12.71, -0.06, 8.6, 2.08, 0.37]} \ No newline at end of file diff --git a/annotations_1/btfIH4Q2BQA_filtered.json b/annotations_1/btfIH4Q2BQA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..868faf3a54cea19e9c9504cf04edbf58ea1329da --- /dev/null +++ b/annotations_1/btfIH4Q2BQA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.72], [7.0, 8.13], [9.0, 12.18], [14.0, 17.74], [19.0, 20.12], [21.0, 23.16], [23.0, 27.03], [27.0, 27.53], [32.0, 32.05], [33.0, 33.89], [35.0, 35.92], [38.0, 38.52], [41.0, 41.96], [43.0, 44.12], [46.0, 45.77], [46.0, 48.73], [49.0, 50.55], [51.0, 51.51], [52.0, 52.74], [54.0, 55.17], [57.0, 57.54], [62.0, 63.14], [65.0, 66.6], [68.0, 68.93], [70.0, 70.88], [74.0, 74.09], [76.0, 78.26], [80.0, 80.1], [83.0, 91.22], [95.0, 95.2], [100.0, 104.35], [106.0, 106.78], [109.0, 112.16], [115.0, 116.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 45.95, 86.27, 0.0, 84.98, 31.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37, 0.0, 58.81, 0.0, 48.82, 0.0, 57.25, 0.0], "audiomae_on_audioset": [null, null, [["speech", 65.33], ["hum", 4.18], ["inside, small room", 3.42]], null, null, null, [["breaking", 47.09], ["speech", 43.34], ["glass", 3.49]], null, null, null, null, null, null, null, null, [["music", 42.47], ["speech", 17.09], ["sidetone", 10.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 35.64], ["mains hum", 19.04], ["speech", 6.94]], null, null, null], "duration": [1.72, 1.13, 3.18, 3.74, 1.12, 2.16, 4.03, 0.53, 0.05, 0.89, 0.92, 0.52, 0.96, 1.12, -0.23, 2.73, 1.55, 0.51, 0.74, 1.17, 0.54, 1.14, 1.6, 0.93, 0.88, 0.09, 2.26, 0.1, 8.22, 0.2, 4.35, 0.78, 3.16, 1.51]} \ No newline at end of file diff --git a/annotations_1/btk4Wp0RssY_filtered.json b/annotations_1/btk4Wp0RssY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..501588b6822a9bc45785b0f8d0ccde3d49aff0be --- /dev/null +++ b/annotations_1/btk4Wp0RssY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.24], [5.0, 6.44], [8.0, 10.35], [12.0, 12.61], [16.0, 17.83], [20.0, 21.71], [25.0, 26.45], [29.0, 30.23], [33.0, 35.28], [36.0, 38.62], [40.0, 45.89], [48.0, 49.4], [51.0, 52.29], [54.0, 55.98], [58.0, 59.49], [60.0, 60.3], [63.0, 64.1], [66.0, 67.41], [69.0, 71.02], [73.0, 74.53], [79.0, 81.18], [88.0, 88.28], [90.0, 90.88], [92.0, 98.51], [100.0, 99.81], [106.0, 112.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [62.78, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 99.84, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 43.69, 0.0, 0.0, 49.54, 0.0, 39.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["chirp tone", 51.7], ["speech", 7.81], ["sine wave", 7.49]], null, null, [["speech", 20.0], ["mains hum", 15.61], ["hum", 13.31]], null, [["music", 41.29], ["door", 8.81], ["speech", 7.76]]], "duration": [2.24, 1.44, 2.35, 0.61, 1.83, 1.71, 1.45, 1.23, 2.28, 2.62, 5.89, 1.4, 1.29, 1.98, 1.49, 0.3, 1.1, 1.41, 2.02, 1.53, 2.18, 0.28, 0.88, 6.51, -0.19, 6.62]} \ No newline at end of file diff --git a/annotations_1/bu5m4sr6e6I_filtered.json b/annotations_1/bu5m4sr6e6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec297489155df0fa8dccf5f0df4bb548633c3b1d --- /dev/null +++ b/annotations_1/bu5m4sr6e6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 27.35], [30.0, 42.4], [48.0, 54.4], [56.0, 56.69], [58.0, 58.83], [63.0, 68.98], [81.0, 86.83], [100.0, 100.14], [108.0, 123.65]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [29.67, 29.81, 29.8, 0.0, 0.0, 29.94, 30.26, 0.0, 29.79], "audiomae_on_audioset": [[["music", 48.89], ["cacophony", 29.79], ["throbbing", 2.98]], [["music", 77.54], ["throbbing", 6.29], ["electronic music", 2.17]], [["music", 55.15], ["didgeridoo", 18.85], ["throbbing", 6.05]], null, null, [["music", 32.58], ["throbbing", 23.24], ["hum", 13.27]], [["music", 70.79], ["cacophony", 9.18], ["synthesizer", 2.79]], null, [["music", 40.44], ["throbbing", 20.4], ["synthesizer", 12.95]]], "duration": [19.35, 12.4, 6.4, 0.69, 0.83, 5.98, 5.83, 0.14, 15.65]} \ No newline at end of file diff --git a/annotations_1/bu9YxTb6gf8_filtered.json b/annotations_1/bu9YxTb6gf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe43c86110e931023e356fa439d3f2d62ec3a9a5 --- /dev/null +++ b/annotations_1/bu9YxTb6gf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.4], [10.0, 10.57], [23.0, 24.29], [27.0, 27.48], [32.0, 33.59], [38.0, 39.58], [42.0, 43.56], [46.0, 47.53], [53.0, 55.44], [60.0, 63.19], [68.0, 70.04], [71.0, 71.83], [75.0, 78.31], [79.0, 79.66], [82.0, 86.44], [92.0, 92.26], [97.0, 98.1], [105.0, 105.81], [111.0, 113.49], [118.0, 121.88], [125.0, 128.16], [133.0, 135.84]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.91, 30.38, 30.37, 0.0, 29.96, 0.0, 30.31, 0.0, 0.0, 0.0, 32.26, 30.08, 29.96, 30.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 51.79], ["throbbing", 7.45], ["cacophony", 4.64]], [["music", 73.92], ["sampler", 2.54], ["musical instrument", 2.18]], [["music", 84.15], ["guitar", 3.18], ["musical instrument", 2.93]], null, [["music", 58.51], ["throbbing", 8.3], ["hum", 7.57]], null, [["music", 66.3], ["guitar", 4.19], ["plucked string instrument", 3.73]], null, null, null, [["music", 57.27], ["musical instrument", 7.64], ["electronic music", 2.86]], [["music", 36.99], ["didgeridoo", 34.81], ["boing", 3.67]], [["music", 57.31], ["speech", 4.75], ["boing", 4.26]], [["music", 50.43], ["sampler", 5.04], ["synthesizer", 3.44]]], "duration": [0.4, 0.57, 1.29, 0.48, 1.59, 1.58, 1.56, 1.53, 2.44, 3.19, 2.04, 0.83, 3.31, 0.66, 4.44, 0.26, 1.1, 0.81, 2.49, 3.88, 3.16, 2.84]} \ No newline at end of file diff --git a/annotations_1/buIXWAgTUIU_filtered.json b/annotations_1/buIXWAgTUIU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ead5aeb3dc2c43b7d3b00cc77b178ecdc11213d1 --- /dev/null +++ b/annotations_1/buIXWAgTUIU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 57.99], [59.0, 60.4], [63.0, 65.3], [68.0, 84.57], [85.0, 89.11], [90.0, 93.16], [94.0, 95.01], [96.0, 99.4], [101.0, 105.0], [106.0, 106.62], [108.0, 108.21], [109.0, 109.75], [111.0, 111.91], [113.0, 113.53], [115.0, 114.94], [117.0, 117.76]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.45, 0.0, 30.22, 30.6, 41.32, 40.21, 0.0, 56.33, 56.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 40.6], ["didgeridoo", 37.22], ["throbbing", 2.88]], null, [["music", 72.72], ["didgeridoo", 5.09], ["screaming", 2.22]], [["music", 54.76], ["didgeridoo", 11.37], ["speech", 5.69]], [["music", 29.1], ["throbbing", 22.62], ["didgeridoo", 9.42]], [["music", 63.36], ["didgeridoo", 18.93], ["musical instrument", 4.41]], null, null, null, null, null, null, null, null, null, null], "duration": [21.99, 1.4, 2.3, 16.57, 4.11, 3.16, 1.01, 3.4, 4.0, 0.62, 0.21, 0.75, 0.91, 0.53, -0.06, 0.76]} \ No newline at end of file diff --git a/annotations_1/bvEJjjYbgtk_filtered.json b/annotations_1/bvEJjjYbgtk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ed900c0d874c2788c6fc3980315e391095429c3 --- /dev/null +++ b/annotations_1/bvEJjjYbgtk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[52.0, 52.74], [55.0, 58.26], [69.0, 96.79]], "keep_status": [false, false, false], "silence_prob": [0.0, 37.01, 47.16], "audiomae_on_audioset": [null, [["speech", 38.64], ["music", 23.38], ["rumble", 10.65]], [["music", 60.77], ["hum", 13.36], ["buzz", 4.49]]], "duration": [0.74, 3.26, 27.79]} \ No newline at end of file diff --git a/annotations_1/bvITByUy5fA_filtered.json b/annotations_1/bvITByUy5fA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1036a1315cfb3213224eff453bd1c84142cb08b0 --- /dev/null +++ b/annotations_1/bvITByUy5fA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [43.0, 43.23], [44.0, 44.24], [56.0, 59.21], [65.0, 65.3], [71.0, 72.52], [74.0, 74.65], [76.0, 76.86], [78.0, 78.19], [93.0, 96.06], [97.0, 106.64], [108.0, 108.08], [109.0, 110.22], [113.0, 118.56], [126.0, 129.98], [131.0, 131.19], [143.0, 143.88], [145.0, 147.07], [150.0, 150.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 50.71, 0.0, 0.0, 92.15, 99.98, 0.0, 0.0, 91.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 0.23, 0.24, 3.21, 0.3, 1.52, 0.65, 0.86, 0.19, 3.06, 9.64, 0.08, 1.22, 5.56, 3.98, 0.19, 0.88, 2.07, 0.52]} \ No newline at end of file diff --git a/annotations_1/bvl-DxX9N8g_filtered.json b/annotations_1/bvl-DxX9N8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9403c74bd8e4ca0deac7830538633f0a88970aea --- /dev/null +++ b/annotations_1/bvl-DxX9N8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.36], [6.0, 6.32], [7.0, 7.77], [8.0, 11.91], [13.0, 13.44], [16.0, 16.5], [19.0, 19.7], [22.0, 22.08], [25.0, 26.23], [27.0, 28.49], [29.0, 30.3], [33.0, 34.25], [36.0, 36.48], [39.0, 39.93], [46.0, 46.95], [57.0, 58.09], [65.0, 74.22], [75.0, 79.73], [80.0, 83.05], [85.0, 85.99], [87.0, 89.29], [93.0, 94.71], [98.0, 104.58], [105.0, 120.48], [122.0, 123.09], [126.0, 127.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 97.33, 0.0, 87.92, 0.0, 61.57, 85.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 63.22], ["sidetone", 8.48], ["radio", 3.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.32, 0.77, 3.91, 0.44, 0.5, 0.7, 0.08, 1.23, 1.49, 1.3, 1.25, 0.48, 0.93, 0.95, 1.09, 9.22, 4.73, 3.05, 0.99, 2.29, 1.71, 6.58, 15.48, 1.09, 1.26]} \ No newline at end of file diff --git a/annotations_1/bvnOqxRHjuc_filtered.json b/annotations_1/bvnOqxRHjuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8eb47eb89949f9b3e357f0ce59b29e7ee536b5b2 --- /dev/null +++ b/annotations_1/bvnOqxRHjuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[64.0, 107.11], [108.0, 108.67], [114.0, 115.01]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [43.11, 0.67, 1.01]} \ No newline at end of file diff --git a/annotations_1/bwKwR3hV0zA_filtered.json b/annotations_1/bwKwR3hV0zA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21bb9f194a5dc198e48be58a91fe1febea7d8a93 --- /dev/null +++ b/annotations_1/bwKwR3hV0zA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.93], [24.0, 34.28], [35.0, 37.2], [39.0, 46.2], [50.0, 66.06], [68.0, 76.99], [78.0, 85.62], [86.0, 95.69], [97.0, 134.15], [136.0, 137.05], [139.0, 140.7], [143.0, 144.8], [146.0, 145.93], [146.0, 158.94], [160.0, 160.88], [161.0, 162.87], [166.0, 166.62], [172.0, 172.88], [177.0, 177.57], [183.0, 183.24], [183.0, 183.9], [185.0, 196.43], [199.0, 199.64], [200.0, 201.21], [203.0, 203.0], [211.0, 211.45], [213.0, 213.83], [216.0, 218.86], [219.0, 219.67]], "keep_status": [false, true, true, false, true, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 31.11, 37.14, 28.97, 29.77, 44.6, 32.2, 29.95, 0.0, 0.0, 0.0, 0.0, 0.0, 29.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.18, 0.0, 0.0, 0.0, 0.0, 0.0, 34.87, 0.0], "audiomae_on_audioset": [null, [["music", 47.56], ["speech", 16.5], ["didgeridoo", 3.52]], [["music", 47.16], ["throbbing", 7.21], ["musical instrument", 5.65]], [["music", 38.91], ["speech", 16.49], ["throbbing", 14.69]], [["music", 43.29], ["hum", 14.45], ["theremin", 7.09]], [["cattle, bovinae", 22.12], ["animal", 17.04], ["moo", 9.66]], [["music", 31.2], ["noise", 10.08], ["speech", 9.17]], [["music", 53.26], ["throbbing", 13.4], ["hum", 8.44]], null, null, null, null, null, [["speech", 48.1], ["music", 10.61], ["breaking", 5.96]], null, null, null, null, null, null, null, [["speech", 65.14], ["fart", 18.94], ["music", 5.91]], null, null, null, null, null, [["music", 44.45], ["theremin", 13.26], ["grunt", 9.55]], null], "duration": [1.93, 10.28, 2.2, 7.2, 16.06, 8.99, 7.62, 9.69, 37.15, 1.05, 1.7, 1.8, -0.07, 12.94, 0.88, 1.87, 0.62, 0.88, 0.57, 0.24, 0.9, 11.43, 0.64, 1.21, 0.0, 0.45, 0.83, 2.86, 0.67]} \ No newline at end of file diff --git a/annotations_1/bx50ueZJgns_filtered.json b/annotations_1/bx50ueZJgns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90bdb9fa4ba225109db838cbbc333de6cbfd66de --- /dev/null +++ b/annotations_1/bx50ueZJgns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.37], [23.0, 26.4], [27.0, 32.19], [33.0, 33.4], [34.0, 39.68], [41.0, 43.28], [44.0, 69.89], [70.0, 77.13], [77.0, 77.16], [80.0, 80.35], [81.0, 100.47], [104.0, 110.78], [116.0, 138.08], [142.0, 170.21], [171.0, 190.49]], "keep_status": [false, true, false, false, true, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 30.24, 30.76, 0.0, 29.53, 33.46, 32.17, 30.05, 0.0, 0.0, 31.32, 30.3, 29.91, 30.2, 30.57], "audiomae_on_audioset": [null, [["whack, thwack", 20.9], ["mosquito", 16.53], ["fly, housefly", 13.94]], [["speech", 74.28], ["music", 13.56], ["throbbing", 1.04]], null, [["speech", 15.27], ["creak", 13.9], ["music", 13.69]], [["throbbing", 35.08], ["music", 34.07], ["hum", 17.66]], [["throbbing", 43.25], ["hum", 32.1], ["speech", 14.78]], [["music", 30.15], ["speech", 13.21], ["hum", 10.34]], null, null, [["hum", 36.6], ["throbbing", 29.29], ["mains hum", 16.63]], [["speech", 48.24], ["fart", 11.25], ["thump, thud", 8.4]], [["speech", 49.03], ["music", 17.72], ["breaking", 10.47]], [["speech", 37.05], ["music", 25.35], ["whack, thwack", 17.43]], [["music", 40.45], ["speech", 23.89], ["fart", 6.0]]], "duration": [1.37, 3.4, 5.19, 0.4, 5.68, 2.28, 25.89, 7.13, 0.16, 0.35, 19.47, 6.78, 22.08, 28.21, 19.49]} \ No newline at end of file diff --git a/annotations_1/bxEqg39v9Ec_filtered.json b/annotations_1/bxEqg39v9Ec_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..264ea9dad80a0598369f93f7ad45936001ca925f --- /dev/null +++ b/annotations_1/bxEqg39v9Ec_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [3.0, 3.52], [4.0, 4.51], [5.0, 5.68], [6.0, 8.55], [9.0, 10.93], [12.0, 12.9], [14.0, 16.23], [17.0, 18.86], [20.0, 22.33], [24.0, 23.94], [25.0, 26.72], [27.0, 26.96], [28.0, 28.93], [30.0, 30.11], [31.0, 32.73], [33.0, 34.08], [36.0, 36.37], [37.0, 37.81], [40.0, 40.37], [41.0, 42.6], [44.0, 44.25], [45.0, 46.41], [48.0, 48.29], [49.0, 51.58], [53.0, 53.64], [54.0, 56.2], [58.0, 58.56], [60.0, 69.2], [70.0, 76.84], [80.0, 81.4], [85.0, 85.14], [89.0, 89.18], [94.0, 95.23], [96.0, 96.31], [99.0, 99.1], [102.0, 102.32], [104.0, 104.99], [107.0, 107.87], [109.0, 109.39], [111.0, 111.64], [116.0, 116.24], [120.0, 120.01], [121.0, 121.41], [122.0, 122.61], [125.0, 126.06], [127.0, 127.82], [129.0, 129.47], [130.0, 130.03], [130.0, 131.36], [133.0, 135.26], [136.0, 136.14], [137.0, 138.4], [139.0, 139.97], [140.0, 141.27], [142.0, 146.25], [148.0, 148.71], [151.0, 151.43], [154.0, 154.16], [157.0, 157.17], [158.0, 161.4], [163.0, 165.06], [167.0, 169.72], [170.0, 171.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 77.2, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 99.1, 0.0, 99.85, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 92.97, 97.73, 94.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 0.52, 0.51, 0.68, 2.55, 1.93, 0.9, 2.23, 1.86, 2.33, -0.06, 1.72, -0.04, 0.93, 0.11, 1.73, 1.08, 0.37, 0.81, 0.37, 1.6, 0.25, 1.41, 0.29, 2.58, 0.64, 2.2, 0.56, 9.2, 6.84, 1.4, 0.14, 0.18, 1.23, 0.31, 0.1, 0.32, 0.99, 0.87, 0.39, 0.64, 0.24, 0.01, 0.41, 0.61, 1.06, 0.82, 0.47, 0.03, 1.36, 2.26, 0.14, 1.4, 0.97, 1.27, 4.25, 0.71, 0.43, 0.16, 0.17, 3.4, 2.06, 2.72, 1.02]} \ No newline at end of file diff --git a/annotations_1/bx_rua3EXFc_filtered.json b/annotations_1/bx_rua3EXFc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..313bf9a16676015ae287ac50ce313941de7b7e17 --- /dev/null +++ b/annotations_1/bx_rua3EXFc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.26], [14.0, 14.59], [18.0, 19.04], [22.0, 23.33], [30.0, 30.32], [31.0, 32.17], [34.0, 33.93], [34.0, 34.97], [39.0, 44.85], [47.0, 50.14], [54.0, 86.66], [88.0, 92.58], [93.0, 98.46], [99.0, 101.95], [102.0, 103.57], [106.0, 108.43], [109.0, 172.15], [175.0, 177.2], [178.0, 178.51], [185.0, 185.26], [187.0, 188.89], [190.0, 190.16], [206.0, 206.0]], "keep_status": [true, false, false, false, false, false, false, false, true, true, false, true, true, true, false, true, false, true, false, false, false, false, false], "silence_prob": [28.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.78, 28.44, 0.0, 30.0, 31.08, 30.42, 0.0, 38.49, 0.0, 29.49, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["rumble", 14.19], ["speech", 11.4], ["music", 8.99]], null, null, null, null, null, null, null, [["music", 51.8], ["speech", 12.66], ["whack, thwack", 5.03]], [["music", 36.87], ["theremin", 9.22], ["vehicle", 4.23]], null, [["whack, thwack", 36.7], ["speech", 25.13], ["boing", 6.49]], [["music", 27.09], ["mains hum", 17.36], ["hum", 16.54]], [["music", 36.61], ["speech", 12.3], ["moo", 8.56]], null, [["music", 35.54], ["musical instrument", 7.98], ["theremin", 4.83]], null, [["music", 51.58], ["speech", 11.37], ["musical instrument", 3.9]], null, null, null, null, null], "duration": [3.26, 0.59, 1.04, 1.33, 0.32, 1.17, -0.07, 0.97, 5.85, 3.14, 32.66, 4.58, 5.46, 2.95, 1.57, 2.43, 63.15, 2.2, 0.51, 0.26, 1.89, 0.16, 0.0]} \ No newline at end of file diff --git a/annotations_1/bxs77K1DkD0_filtered.json b/annotations_1/bxs77K1DkD0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c1881b40b79dd3182eba0e9d42d297ba238bd19 --- /dev/null +++ b/annotations_1/bxs77K1DkD0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.12], [17.0, 17.88], [18.0, 28.41], [29.0, 30.72], [33.0, 32.95], [34.0, 34.57], [35.0, 35.58], [39.0, 39.77], [40.0, 42.43], [44.0, 46.89], [48.0, 49.28], [52.0, 54.58], [55.0, 57.01], [58.0, 60.91], [71.0, 133.86], [134.0, 135.41], [136.0, 140.53], [142.0, 145.32], [146.0, 146.92], [150.0, 150.16], [151.0, 150.69], [152.0, 152.36], [158.0, 158.21], [159.0, 160.17], [161.0, 162.58], [164.0, 168.02], [170.0, 175.05], [177.0, 178.8], [179.0, 179.04], [179.0, 179.07], [179.0, 179.1], [180.0, 181.99], [182.0, 182.55], [183.0, 184.08], [184.0, 184.35], [185.0, 193.38]], "keep_status": [true, false, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [34.03, 0.0, 39.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.55, 39.19, 0.0, 37.83, 51.23, 65.09, 0.0, 0.0, 56.4, 48.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.92, 38.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.96], "audiomae_on_audioset": [[["throbbing", 25.65], ["hum", 25.63], ["music", 14.28]], null, [["hum", 38.02], ["speech", 15.23], ["throbbing", 15.14]], null, null, null, null, null, [["sine wave", 46.35], ["chirp tone", 12.69], ["singing bowl", 6.12]], [["sine wave", 16.59], ["chirp tone", 6.7], ["dog", 6.23]], null, [["chirp tone", 40.01], ["sine wave", 23.13], ["music", 9.52]], null, null, null, null, null, [["gong", 25.01], ["music", 14.44], ["hum", 9.25]], null, null, null, null, null, null, null, [["hum", 22.12], ["mains hum", 17.65], ["speech", 15.92]], [["sine wave", 22.17], ["gong", 20.77], ["singing bowl", 12.38]], null, null, null, null, null, null, null, null, [["music", 51.58], ["speech", 13.05], ["didgeridoo", 5.92]]], "duration": [2.12, 0.88, 10.41, 1.72, -0.05, 0.57, 0.58, 0.77, 2.43, 2.89, 1.28, 2.58, 2.01, 2.91, 62.86, 1.41, 4.53, 3.32, 0.92, 0.16, -0.31, 0.36, 0.21, 1.17, 1.58, 4.02, 5.05, 1.8, 0.04, 0.07, 0.1, 1.99, 0.55, 1.08, 0.35, 8.38]} \ No newline at end of file diff --git a/annotations_1/bxxHPYFtbE4_filtered.json b/annotations_1/bxxHPYFtbE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..093faee997b1f6584bc69b25e698e47ffc8d07a2 --- /dev/null +++ b/annotations_1/bxxHPYFtbE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.88], [12.0, 12.01], [21.0, 20.82], [26.0, 26.33], [33.0, 34.03], [34.0, 38.38], [40.0, 42.28], [44.0, 45.57], [47.0, 47.51], [48.0, 50.19], [52.0, 51.76], [52.0, 53.81], [55.0, 55.86], [59.0, 59.29], [63.0, 63.58], [65.0, 65.6], [75.0, 74.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 98.19, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.88, 0.01, -0.18, 0.33, 1.03, 4.38, 2.28, 1.57, 0.51, 2.19, -0.24, 1.81, 0.86, 0.29, 0.58, 0.6, -0.08]} \ No newline at end of file diff --git a/annotations_1/bzSIHZcXwvQ_filtered.json b/annotations_1/bzSIHZcXwvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..604d6d33085d65b9278754cdf02dc86a11abc641 --- /dev/null +++ b/annotations_1/bzSIHZcXwvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.96], [4.0, 4.4], [5.0, 14.28], [15.0, 16.43], [17.0, 18.54], [19.0, 19.47], [20.0, 20.49], [21.0, 24.95], [29.0, 30.2], [31.0, 35.23], [36.0, 38.6], [40.0, 43.28], [45.0, 46.26], [48.0, 48.25], [48.0, 49.84], [51.0, 51.9], [53.0, 52.84], [53.0, 54.95], [56.0, 57.62], [58.0, 57.77], [59.0, 60.78], [61.0, 70.24], [71.0, 72.13], [75.0, 75.59], [77.0, 77.94], [79.0, 81.33], [83.0, 83.44], [84.0, 85.41], [86.0, 88.26], [91.0, 96.09], [97.0, 98.22], [99.0, 101.01], [102.0, 102.66], [104.0, 105.14], [106.0, 108.8], [110.0, 110.81], [111.0, 113.7], [114.0, 114.24], [115.0, 121.78], [123.0, 127.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 98.66, 98.51, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.63, 0.0, 0.0, 0.0, 51.39, 0.0, 0.0, 53.47, 95.64, 0.0, 80.29, 0.0, 0.0, 61.18, 0.0, 54.9, 0.0, 91.81, 95.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["echo", 23.17], ["laughter", 8.51], ["snicker", 6.71]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.04, 0.4, 9.28, 1.43, 1.54, 0.47, 0.49, 3.95, 1.2, 4.23, 2.6, 3.28, 1.26, 0.25, 1.84, 0.9, -0.16, 1.95, 1.62, -0.23, 1.78, 9.24, 1.13, 0.59, 0.94, 2.33, 0.44, 1.41, 2.26, 5.09, 1.22, 2.01, 0.66, 1.14, 2.8, 0.81, 2.7, 0.24, 6.78, 4.35]} \ No newline at end of file diff --git a/annotations_1/c-ej3IOxBno_filtered.json b/annotations_1/c-ej3IOxBno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c89b8bad5a83574d17b28b6460faa5d0e76ce318 --- /dev/null +++ b/annotations_1/c-ej3IOxBno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.4], [3.0, 4.48], [8.0, 8.43], [10.0, 11.2], [12.0, 14.22], [15.0, 16.92], [19.0, 20.61], [22.0, 29.84], [32.0, 32.86]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.4, 1.48, 0.43, 1.2, 2.22, 1.92, 1.61, 7.84, 0.86]} \ No newline at end of file diff --git a/annotations_1/c0N60xOU9yk_filtered.json b/annotations_1/c0N60xOU9yk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..336254599be683c96f79e6d42643d8aa5b430f8b --- /dev/null +++ b/annotations_1/c0N60xOU9yk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.82], [19.0, 21.14], [26.0, 26.4], [29.0, 29.54], [32.0, 31.7], [38.0, 38.15], [40.0, 41.18], [44.0, 45.37], [51.0, 52.27], [53.0, 54.19], [58.0, 58.04], [59.0, 59.02], [61.0, 61.43], [63.0, 62.78], [68.0, 68.88], [72.0, 72.81], [85.0, 84.69], [88.0, 88.59], [106.0, 106.07], [111.0, 113.14], [114.0, 114.76], [121.0, 120.66], [124.0, 127.13], [129.0, 129.3], [133.0, 133.22], [134.0, 134.32], [139.0, 139.68], [141.0, 141.74], [160.0, 160.3], [163.0, 168.47], [169.0, 172.64], [174.0, 176.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 59.96, 72.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.82, 2.14, 0.4, 0.54, -0.3, 0.15, 1.18, 1.37, 1.27, 1.19, 0.04, 0.02, 0.43, -0.22, 0.88, 0.81, -0.31, 0.59, 0.07, 2.14, 0.76, -0.34, 3.13, 0.3, 0.22, 0.32, 0.68, 0.74, 0.3, 5.47, 3.64, 2.32]} \ No newline at end of file diff --git a/annotations_1/c0XTkj3PIWg_filtered.json b/annotations_1/c0XTkj3PIWg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddd6c1b677ba3e1ae3ce44d065e95fe300463fd1 --- /dev/null +++ b/annotations_1/c0XTkj3PIWg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.22], [22.0, 27.99], [29.0, 29.96], [34.0, 34.87], [36.0, 37.4], [38.0, 39.87], [41.0, 43.34], [45.0, 45.81], [50.0, 53.7], [55.0, 55.73], [56.0, 61.94], [65.0, 64.66], [65.0, 66.61], [67.0, 68.17], [80.0, 80.62], [81.0, 81.48], [83.0, 84.48], [88.0, 87.81], [99.0, 101.78], [103.0, 116.92], [117.0, 126.32], [127.0, 126.71], [129.0, 129.22], [131.0, 131.77], [133.0, 133.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 53.72, 0.0, 0.0, 0.0, 0.0, 57.01, 0.0, 64.07, 0.0, 57.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.14, 42.6, 48.1, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.73], ["thunk", 7.88], ["boing", 7.15]], [["music", 61.73], ["hum", 10.22], ["synthesizer", 4.69]], [["music", 35.0], ["speech", 11.13], ["fly, housefly", 7.93]], null, null, null, null], "duration": [0.22, 5.99, 0.96, 0.87, 1.4, 1.87, 2.34, 0.81, 3.7, 0.73, 5.94, -0.34, 1.61, 1.17, 0.62, 0.48, 1.48, -0.19, 2.78, 13.92, 9.32, -0.29, 0.22, 0.77, 0.08]} \ No newline at end of file diff --git a/annotations_1/c2ecZiVEs70_filtered.json b/annotations_1/c2ecZiVEs70_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd1d73503fcb92f6f2e298daeb3e0266cf4b8910 --- /dev/null +++ b/annotations_1/c2ecZiVEs70_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.62], [19.0, 21.44], [23.0, 25.71], [26.0, 100.21], [106.0, 105.97], [113.0, 113.21], [116.0, 125.54], [126.0, 131.73], [132.0, 133.08], [134.0, 134.96], [136.0, 136.65], [138.0, 138.03], [139.0, 140.59], [143.0, 143.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 72.01, 89.36, 0.0, 0.0, 0.0, 48.82, 36.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["telephone bell ringing", 41.71], ["music", 31.33], ["telephone", 7.55]], [["speech", 32.98], ["fart", 12.01], ["hum", 7.26]], null, null, null, null, null, null], "duration": [0.62, 2.44, 2.71, 74.21, -0.03, 0.21, 9.54, 5.73, 1.08, 0.96, 0.65, 0.03, 1.59, 0.94]} \ No newline at end of file diff --git a/annotations_1/c2k_kuU84ro_filtered.json b/annotations_1/c2k_kuU84ro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c9b1bb4c67daddf763a30d3b0b7226615915249 --- /dev/null +++ b/annotations_1/c2k_kuU84ro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 139.94], [143.0, 147.99], [149.0, 152.39], [154.0, 172.56], [174.0, 182.28]], "keep_status": [false, true, false, false, true], "silence_prob": [0.0, 29.79, 28.88, 29.07, 28.61], "audiomae_on_audioset": [null, [["music", 21.98], ["rumble", 6.88], ["speech", 6.03]], [["speech", 35.31], ["music", 21.58], ["whip", 14.29]], [["speech", 45.54], ["music", 24.83], ["clang", 5.23]], [["music", 49.74], ["speech", 7.62], ["burst, pop", 2.76]]], "duration": [68.94, 4.99, 3.39, 18.56, 8.28]} \ No newline at end of file diff --git a/annotations_1/c3vmsUcknhY_filtered.json b/annotations_1/c3vmsUcknhY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32b32cc0fc1f98d91dca3466c426a7726b1469f4 --- /dev/null +++ b/annotations_1/c3vmsUcknhY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.25], [20.0, 20.43], [22.0, 22.72], [23.0, 31.31], [32.0, 37.44], [38.0, 39.36], [40.0, 40.19], [42.0, 44.88], [48.0, 66.78], [67.0, 66.95], [67.0, 87.51], [88.0, 107.45], [109.0, 108.99], [109.0, 118.54], [121.0, 122.91], [124.0, 125.27]], "keep_status": [true, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [33.3, 0.0, 0.0, 29.0, 28.93, 0.0, 0.0, 28.91, 31.42, 0.0, 29.01, 28.44, 0.0, 28.48, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 25.33], ["didgeridoo", 22.78], ["music", 15.84]], null, null, [["music", 48.23], ["speech", 8.63], ["buzz", 4.19]], [["music", 54.86], ["throbbing", 9.21], ["hum", 7.22]], null, null, [["music", 50.5], ["throbbing", 12.26], ["hum", 4.28]], [["music", 51.75], ["didgeridoo", 10.53], ["musical instrument", 7.95]], null, [["music", 45.51], ["throbbing", 25.0], ["didgeridoo", 6.0]], [["music", 38.42], ["speech", 25.6], ["hum", 6.28]], null, [["music", 31.53], ["speech", 15.19], ["buzz", 9.57]], null, null], "duration": [5.25, 0.43, 0.72, 8.31, 5.44, 1.36, 0.19, 2.88, 18.78, -0.05, 20.51, 19.45, -0.01, 9.54, 1.91, 1.27]} \ No newline at end of file diff --git a/annotations_1/c4X58OjlVPo_filtered.json b/annotations_1/c4X58OjlVPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d7dac749355dba8947bec1610b61e809fbb5221 --- /dev/null +++ b/annotations_1/c4X58OjlVPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [6.0, 6.13], [11.0, 10.89], [24.0, 24.78], [30.0, 29.88], [31.0, 32.09], [33.0, 33.44], [35.0, 34.75], [41.0, 40.78], [43.0, 43.58], [45.0, 45.22], [47.0, 51.66], [56.0, 57.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.14, 0.13, -0.11, 0.78, -0.12, 1.09, 0.44, -0.25, -0.22, 0.58, 0.22, 4.66, 1.55]} \ No newline at end of file diff --git a/annotations_1/c4ibjfBu1IY_filtered.json b/annotations_1/c4ibjfBu1IY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70e82b13f3e91b1e744f72aca9733fa64752f9e2 --- /dev/null +++ b/annotations_1/c4ibjfBu1IY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.93], [4.0, 3.84], [4.0, 7.01], [9.0, 9.58], [10.0, 12.46], [13.0, 15.58], [17.0, 31.99], [35.0, 44.02], [45.0, 45.37], [53.0, 54.73], [55.0, 61.82], [67.0, 68.67], [69.0, 76.54], [79.0, 79.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.58, 0.0, 53.78, 73.21, 71.87, 50.86, 0.0, 0.0, 28.22, 0.0, 29.53, 0.0], "audiomae_on_audioset": [null, null, [["music", 42.69], ["speech", 25.37], ["electric shaver, electric razor", 8.05]], null, null, null, null, null, null, null, [["speech", 45.99], ["music", 18.47], ["vehicle", 14.47]], null, [["speech", 50.68], ["music", 23.46], ["mains hum", 7.97]], null], "duration": [-0.07, -0.16, 3.01, 0.58, 2.46, 2.58, 14.99, 9.02, 0.37, 1.73, 6.82, 1.67, 7.54, 0.91]} \ No newline at end of file diff --git a/annotations_1/c4w-IE-Hsqc_filtered.json b/annotations_1/c4w-IE-Hsqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93feea8c3d6f8c523ef0858f2462cbba93be700f --- /dev/null +++ b/annotations_1/c4w-IE-Hsqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.3], [35.0, 35.45], [39.0, 39.85], [51.0, 53.01], [56.0, 55.97], [63.0, 71.68], [72.0, 72.5], [74.0, 74.07], [79.0, 82.44], [83.0, 83.2], [84.0, 84.69], [92.0, 93.07], [94.0, 95.4], [100.0, 100.04], [112.0, 112.68], [114.0, 114.98], [116.0, 116.92], [120.0, 121.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.44, 0.0, 65.2, 0.0, 0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 0.45, 0.85, 2.01, -0.03, 8.68, 0.5, 0.07, 3.44, 0.2, 0.69, 1.07, 1.4, 0.04, 0.68, 0.98, 0.92, 1.46]} \ No newline at end of file diff --git a/annotations_1/c5mAaBl_qqk_filtered.json b/annotations_1/c5mAaBl_qqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77b893f44ee980a3af4f6e8848469889ddd56065 --- /dev/null +++ b/annotations_1/c5mAaBl_qqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.52], [5.0, 12.48], [13.0, 13.74], [14.0, 15.13], [16.0, 16.93], [18.0, 20.53], [22.0, 62.19], [63.0, 63.54], [64.0, 86.48], [87.0, 95.44], [97.0, 130.86], [134.0, 134.49], [135.0, 136.92], [138.0, 139.16], [142.0, 144.49], [148.0, 151.17], [152.0, 152.74]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.78, 0.0, 0.0, 0.0, 46.26, 0.0, 0.0, 46.72, 46.15, 0.0, 0.0, 0.0, 0.0, 71.57, 52.45, 0.0], "audiomae_on_audioset": [null, [["music", 57.93], ["hum", 10.57], ["electronic music", 6.1]], null, null, null, [["hum", 31.19], ["mains hum", 16.52], ["music", 9.82]], null, null, [["speech", 53.35], ["music", 24.4], ["hum", 6.97]], [["hum", 36.72], ["throbbing", 35.2], ["music", 8.61]], null, null, null, null, null, null, null], "duration": [1.52, 7.48, 0.74, 1.13, 0.93, 2.53, 40.19, 0.54, 22.48, 8.44, 33.86, 0.49, 1.92, 1.16, 2.49, 3.17, 0.74]} \ No newline at end of file diff --git a/annotations_1/c6mLa5_GvCQ_filtered.json b/annotations_1/c6mLa5_GvCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..532d0bbd83848374c55253097108fa2f2070a5f0 --- /dev/null +++ b/annotations_1/c6mLa5_GvCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.07], [12.0, 14.39], [28.0, 39.63], [45.0, 44.71], [49.0, 49.84], [54.0, 54.35], [63.0, 64.3], [65.0, 65.82], [71.0, 71.27], [76.0, 76.76], [80.0, 79.84], [80.0, 80.0], [80.0, 80.05], [102.0, 104.72], [112.0, 116.56], [126.0, 125.95], [126.0, 126.99], [129.0, 129.37], [130.0, 131.14], [135.0, 135.7], [146.0, 146.53], [156.0, 156.61], [165.0, 168.02], [169.0, 170.29], [172.0, 172.13], [178.0, 179.1]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.95, 44.2, 30.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.51, 38.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.37], ["mains hum", 15.96], ["hum", 15.43]], [["music", 52.07], ["throbbing", 4.37], ["hum", 4.32]], [["music", 63.91], ["animal", 6.16], ["hum", 4.94]], null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 53.23], ["moo", 20.08], ["cattle, bovinae", 16.98]], [["speech", 44.66], ["music", 9.55], ["noise", 5.69]], null, null, null, null, null, null, null, [["mains hum", 31.62], ["hum", 28.64], ["speech", 16.24]], null, null, null], "duration": [7.07, 2.39, 11.63, -0.29, 0.84, 0.35, 1.3, 0.82, 0.27, 0.76, -0.16, 0.0, 0.05, 2.72, 4.56, -0.05, 0.99, 0.37, 1.14, 0.7, 0.53, 0.61, 3.02, 1.29, 0.13, 1.1]} \ No newline at end of file diff --git a/annotations_1/c7-u-fyUSkM_filtered.json b/annotations_1/c7-u-fyUSkM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3fc7e683ace785c03a80322ea82f9b45a86818b --- /dev/null +++ b/annotations_1/c7-u-fyUSkM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.62], [5.0, 8.92], [10.0, 10.91], [12.0, 12.65], [15.0, 15.4], [17.0, 47.02], [48.0, 51.0], [51.0, 52.15], [54.0, 54.38], [55.0, 59.66], [60.0, 70.04], [71.0, 73.38], [77.0, 81.36], [82.0, 82.97], [85.0, 91.34], [92.0, 95.49], [97.0, 98.05]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.4, 0.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 60.89, 46.94, 79.07, 65.67, 0.0, 56.18, 56.63, 0.0], "audiomae_on_audioset": [null, [["speech", 32.27], ["hum", 16.64], ["rumble", 13.98]], null, null, null, null, [["wail, moan", 28.6], ["animal", 18.24], ["speech", 16.21]], null, null, null, [["speech", 72.24], ["beatboxing", 1.96], ["fart", 1.52]], null, null, null, null, null, null], "duration": [1.62, 3.92, 0.91, 0.65, 0.4, 30.02, 3.0, 1.15, 0.38, 4.66, 10.04, 2.38, 4.36, 0.97, 6.34, 3.49, 1.05]} \ No newline at end of file diff --git a/annotations_1/c82FD6lh2LQ_filtered.json b/annotations_1/c82FD6lh2LQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13c79f764a3e095f4f647a19aee45298000278cf --- /dev/null +++ b/annotations_1/c82FD6lh2LQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.68], [7.0, 8.38], [9.0, 15.38], [16.0, 47.44], [49.0, 72.72], [73.0, 77.45], [79.0, 89.58], [91.0, 90.98], [92.0, 92.47], [93.0, 99.33], [100.0, 105.29]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [87.19, 0.0, 98.1, 0.0, 53.91, 50.41, 31.56, 0.0, 0.0, 35.04, 40.64], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 27.94], ["music", 23.9], ["livestock, farm animals, working animals", 13.24]], null, null, [["speech", 38.98], ["music", 24.97], ["hum", 9.45]], [["speech", 24.73], ["music", 20.7], ["theremin", 13.69]]], "duration": [2.68, 1.38, 6.38, 31.44, 23.72, 4.45, 10.58, -0.02, 0.47, 6.33, 5.29]} \ No newline at end of file diff --git a/annotations_1/c95YKkIbTGg_filtered.json b/annotations_1/c95YKkIbTGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aaf3521933ce7a9f805c412dfa1b842ab115690 --- /dev/null +++ b/annotations_1/c95YKkIbTGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 21.69], [24.0, 24.38], [33.0, 52.96], [54.0, 59.53], [60.0, 61.72], [62.0, 62.75], [65.0, 68.05], [69.0, 69.72], [71.0, 85.92], [87.0, 103.67], [105.0, 163.97], [166.0, 166.6]], "keep_status": [false, false, true, true, false, false, true, false, false, false, false, false], "silence_prob": [64.63, 0.0, 32.48, 39.86, 0.0, 0.0, 34.78, 0.0, 32.09, 34.79, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 47.92], ["buzz", 13.43], ["noise", 5.75]], [["music", 35.16], ["didgeridoo", 15.9], ["effects unit", 9.13]], null, null, [["music", 40.09], ["hum", 12.56], ["speech", 11.47]], null, [["music", 66.25], ["hum", 6.25], ["mains hum", 3.65]], [["music", 44.22], ["didgeridoo", 18.74], ["hum", 8.89]], null, null], "duration": [12.69, 0.38, 19.96, 5.53, 1.72, 0.75, 3.05, 0.72, 14.92, 16.67, 58.97, 0.6]} \ No newline at end of file diff --git a/annotations_1/c9YJ-KJZKyY_filtered.json b/annotations_1/c9YJ-KJZKyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e985b91b1b6ac541e6d14eabe3b88eb6d4d9970 --- /dev/null +++ b/annotations_1/c9YJ-KJZKyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.9], [13.0, 13.37], [14.0, 16.75], [19.0, 19.52], [20.0, 21.69], [42.0, 42.15], [46.0, 46.53], [70.0, 70.98], [74.0, 74.43], [85.0, 85.19], [86.0, 86.61], [88.0, 97.48], [105.0, 118.35], [120.0, 120.8], [142.0, 151.26], [164.0, 165.79], [175.0, 176.0], [181.0, 181.4], [182.0, 183.1], [185.0, 200.3], [205.0, 213.51], [216.0, 225.81]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [37.59, 0.0, 38.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.79, 42.33, 0.0, 45.59, 0.0, 0.0, 0.0, 0.0, 35.85, 32.25, 41.12], "audiomae_on_audioset": [[["music", 32.89], ["livestock, farm animals, working animals", 5.48], ["animal", 4.47]], null, [["speech", 31.37], ["music", 24.22], ["boing", 6.14]], null, null, null, null, null, null, null, null, [["music", 71.85], ["musical instrument", 2.27], ["speech", 1.65]], [["music", 45.39], ["speech", 31.46], ["outside, rural or natural", 2.91]], null, [["noise", 38.36], ["speech", 25.91], ["music", 17.49]], null, null, null, null, [["music", 70.19], ["synthesizer", 4.65], ["hum", 4.06]], [["speech", 44.29], ["music", 14.36], ["vehicle", 6.53]], [["speech", 28.5], ["music", 19.78], ["whimper", 6.36]]], "duration": [2.9, 0.37, 2.75, 0.52, 1.69, 0.15, 0.53, 0.98, 0.43, 0.19, 0.61, 9.48, 13.35, 0.8, 9.26, 1.79, 1.0, 0.4, 1.1, 15.3, 8.51, 9.81]} \ No newline at end of file diff --git a/annotations_1/c9oE47YW6YM_filtered.json b/annotations_1/c9oE47YW6YM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f1be0ea48893b24803465c5106436a631857b88 --- /dev/null +++ b/annotations_1/c9oE47YW6YM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.46], [14.0, 14.55], [15.0, 20.43], [21.0, 37.74], [38.0, 39.58], [41.0, 41.49], [43.0, 44.49], [49.0, 51.33], [52.0, 52.42], [53.0, 53.54], [54.0, 54.97], [56.0, 55.8], [56.0, 57.32], [59.0, 59.59], [62.0, 62.16], [63.0, 64.29], [68.0, 70.9], [79.0, 106.98], [108.0, 109.85], [112.0, 113.21], [115.0, 119.4], [123.0, 125.44], [127.0, 129.3]], "keep_status": [false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [40.09, 0.0, 39.37, 36.88, 0.0, 0.0, 0.0, 46.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.85, 42.51, 0.0, 0.0, 43.58, 57.01, 57.72], "audiomae_on_audioset": [[["music", 61.08], ["speech", 8.07], ["electronic music", 3.53]], null, [["music", 30.65], ["speech", 26.71], ["singing bowl", 4.88]], [["music", 33.31], ["ambient music", 12.89], ["hum", 10.16]], null, null, null, [["sidetone", 17.43], ["music", 16.19], ["speech", 15.9]], null, null, null, null, null, null, null, null, [["speech", 33.25], ["aircraft", 17.78], ["fixed-wing aircraft, airplane", 7.87]], [["hum", 57.92], ["mains hum", 20.7], ["throbbing", 17.3]], null, null, [["music", 23.99], ["hum", 23.43], ["throbbing", 11.73]], null, null], "duration": [2.46, 0.55, 5.43, 16.74, 1.58, 0.49, 1.49, 2.33, 0.42, 0.54, 0.97, -0.2, 1.32, 0.59, 0.16, 1.29, 2.9, 27.98, 1.85, 1.21, 4.4, 2.44, 2.3]} \ No newline at end of file diff --git a/annotations_1/cBFrfA6TrB0_filtered.json b/annotations_1/cBFrfA6TrB0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e250164d7ca1012459964e93bb533e341bec2ea --- /dev/null +++ b/annotations_1/cBFrfA6TrB0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [6.0, 7.77], [12.0, 12.87], [14.0, 13.95], [15.0, 15.01], [17.0, 19.77], [22.0, 23.3], [24.0, 26.5], [29.0, 31.43], [33.0, 33.66], [34.0, 34.35], [35.0, 38.75], [42.0, 42.28], [48.0, 49.57], [51.0, 51.16], [52.0, 51.56], [52.0, 51.93], [52.0, 54.04], [57.0, 60.45], [62.0, 65.48], [68.0, 68.79], [73.0, 73.6], [76.0, 80.84], [82.0, 86.02], [87.0, 88.84], [89.0, 94.83], [97.0, 99.05], [101.0, 104.01], [106.0, 136.19], [137.0, 138.79], [139.0, 142.03], [144.0, 162.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 95.09, 0.0, 80.46, 76.86, 0.0, 0.0, 87.19, 0.0, 0.0, 0.0, 0.0, 0.0, 62.78, 70.44, 48.61, 0.0, 0.0, 35.32, 45.49, 0.0, 77.2, 99.1, 43.53, 0.0, 0.0, 64.52, 65.32], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 46.0], ["throbbing", 11.7], ["stomach rumble", 11.04]], null, null, [["music", 46.9], ["animal", 6.97], ["livestock, farm animals, working animals", 6.64]], [["music", 50.8], ["eruption", 4.51], ["speech", 4.0]], null, null, null, [["music", 21.34], ["bleat", 18.74], ["sheep", 17.9]], null, null, null, null], "duration": [0.64, 1.77, 0.87, -0.05, 0.01, 2.77, 1.3, 2.5, 2.43, 0.66, 0.35, 3.75, 0.28, 1.57, 0.16, -0.44, -0.07, 2.04, 3.45, 3.48, 0.79, 0.6, 4.84, 4.02, 1.84, 5.83, 2.05, 3.01, 30.19, 1.79, 3.03, 18.43]} \ No newline at end of file diff --git a/annotations_1/cCwn-ROhwyo_filtered.json b/annotations_1/cCwn-ROhwyo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..501b15422302bd66d75b632a0e459dffb241ad18 --- /dev/null +++ b/annotations_1/cCwn-ROhwyo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.76], [28.0, 204.3], [205.0, 208.63], [210.0, 211.25], [211.0, 211.4], [211.0, 211.89], [214.0, 243.18]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 67.76, 0.0, 0.0, 0.0, 36.15], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 24.31], ["rumble", 14.59], ["singing bowl", 14.51]]], "duration": [0.76, 176.3, 3.63, 1.25, 0.4, 0.89, 29.18]} \ No newline at end of file diff --git a/annotations_1/cE2bc0vU9pg_filtered.json b/annotations_1/cE2bc0vU9pg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e36ae347cfb7b9765f81da86be7185c81c2bd3fd --- /dev/null +++ b/annotations_1/cE2bc0vU9pg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.35], [13.0, 16.34], [20.0, 20.63], [21.0, 22.64], [28.0, 28.95], [31.0, 36.68], [41.0, 42.99], [44.0, 45.06], [47.0, 47.78], [50.0, 50.55], [51.0, 52.41], [58.0, 60.42], [66.0, 66.19], [71.0, 71.47], [77.0, 78.43], [86.0, 88.52], [89.0, 89.58], [91.0, 92.06], [96.0, 97.38], [99.0, 99.25], [110.0, 111.87], [114.0, 114.86], [116.0, 117.76], [119.0, 120.04], [122.0, 123.38], [124.0, 125.61], [129.0, 130.6], [132.0, 132.76], [134.0, 135.43], [140.0, 141.35], [143.0, 145.18], [152.0, 153.47], [155.0, 156.34], [158.0, 159.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.62, 71.57, 0.0, 0.0, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 0.0, 57.89, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.35, 3.34, 0.63, 1.64, 0.95, 5.68, 1.99, 1.06, 0.78, 0.55, 1.41, 2.42, 0.19, 0.47, 1.43, 2.52, 0.58, 1.06, 1.38, 0.25, 1.87, 0.86, 1.76, 1.04, 1.38, 1.61, 1.6, 0.76, 1.43, 1.35, 2.18, 1.47, 1.34, 1.6]} \ No newline at end of file diff --git a/annotations_1/cE5l32W6Oxc_filtered.json b/annotations_1/cE5l32W6Oxc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2b702b90fc6769276a5f0f325cd72a1fab8c13c --- /dev/null +++ b/annotations_1/cE5l32W6Oxc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.23], [5.0, 5.76], [6.0, 6.94], [7.0, 9.31], [11.0, 22.05], [23.0, 25.54], [26.0, 27.23], [28.0, 28.56], [31.0, 33.39], [36.0, 42.23], [46.0, 51.31], [53.0, 53.86], [56.0, 64.81], [65.0, 69.42], [71.0, 73.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.16, 94.95, 90.6, 0.0, 0.0, 99.4, 96.66, 96.42, 0.0, 92.48, 73.36, 96.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 0.76, 0.94, 2.31, 11.05, 2.54, 1.23, 0.56, 2.39, 6.23, 5.31, 0.86, 8.81, 4.42, 2.99]} \ No newline at end of file diff --git a/annotations_1/cEezHIqQrEw_filtered.json b/annotations_1/cEezHIqQrEw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..357ecfa23c0ff1625efca29f0790bb4d21b16475 --- /dev/null +++ b/annotations_1/cEezHIqQrEw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.44], [7.0, 8.33], [12.0, 12.48], [18.0, 20.36], [23.0, 25.57], [31.0, 31.13], [34.0, 34.77], [39.0, 40.93], [42.0, 42.55], [43.0, 47.66], [49.0, 49.91], [55.0, 75.78], [81.0, 85.51], [86.0, 87.32], [88.0, 96.74], [102.0, 113.61], [115.0, 115.32]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 84.62, 82.25, 0.0, 0.0, 0.0, 0.0, 41.36, 0.0, 32.61, 34.43, 0.0, 33.8, 34.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 38.7], ["fly, housefly", 17.32], ["insect", 13.45]], null, [["noise", 13.41], ["radio", 11.85], ["music", 11.28]], [["vehicle", 16.58], ["car", 9.29], ["race car, auto racing", 7.21]], null, [["speech", 44.44], ["noise", 11.24], ["vehicle", 9.11]], [["music", 12.98], ["cacophony", 9.19], ["vehicle", 7.11]], null], "duration": [1.44, 1.33, 0.48, 2.36, 2.57, 0.13, 0.77, 1.93, 0.55, 4.66, 0.91, 20.78, 4.51, 1.32, 8.74, 11.61, 0.32]} \ No newline at end of file diff --git a/annotations_1/cGDwEP-RWHo_filtered.json b/annotations_1/cGDwEP-RWHo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..204950bfb8db841b14ee77ae852552e095c4c98e --- /dev/null +++ b/annotations_1/cGDwEP-RWHo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.24], [5.0, 5.49], [8.0, 11.03], [12.0, 17.37], [19.0, 23.11], [24.0, 26.99], [28.0, 29.61], [31.0, 33.32], [34.0, 38.01], [39.0, 45.33], [47.0, 50.9], [52.0, 55.31], [57.0, 74.68], [77.0, 80.0], [81.0, 83.51], [87.0, 93.77], [95.0, 97.9], [99.0, 100.75], [101.0, 102.71], [105.0, 106.81], [111.0, 115.32], [117.0, 122.74], [124.0, 173.72], [174.0, 175.68], [176.0, 178.14]], "keep_status": [false, false, true, true, true, true, false, true, true, true, true, false, true, false, false, false, true, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 36.52, 31.17, 34.1, 37.08, 0.0, 33.99, 34.72, 29.68, 33.14, 37.8, 46.72, 50.56, 46.43, 30.36, 38.93, 0.0, 0.0, 0.0, 38.41, 32.84, 0.0, 0.0, 37.66], "audiomae_on_audioset": [null, null, [["hum", 16.73], ["music", 15.82], ["chirp tone", 10.9]], [["creak", 28.1], ["speech", 9.43], ["mechanisms", 8.27]], [["hum", 29.89], ["music", 8.9], ["chirp tone", 6.75]], [["music", 21.16], ["hum", 20.4], ["sine wave", 7.14]], null, [["hum", 30.15], ["mains hum", 20.68], ["music", 9.61]], [["speech", 46.07], ["hum", 9.52], ["rumble", 8.56]], [["speech", 21.7], ["sine wave", 19.1], ["chirp tone", 6.4]], [["rumble", 50.68], ["hum", 5.46], ["music", 5.26]], [["hum", 40.5], ["throbbing", 33.09], ["mains hum", 13.85]], [["coin (dropping)", 16.53], ["music", 6.33], ["speech", 5.9]], null, [["hum", 43.79], ["throbbing", 28.44], ["mains hum", 11.35]], [["hum", 38.71], ["throbbing", 21.42], ["mains hum", 15.03]], [["music", 19.81], ["gong", 17.68], ["hum", 17.62]], null, null, null, [["hum", 47.99], ["mains hum", 12.96], ["music", 6.14]], [["music", 28.39], ["hum", 25.52], ["mains hum", 5.22]], null, null, [["rumble", 31.7], ["hum", 11.97], ["eruption", 9.58]]], "duration": [0.24, 0.49, 3.03, 5.37, 4.11, 2.99, 1.61, 2.32, 4.01, 6.33, 3.9, 3.31, 17.68, 3.0, 2.51, 6.77, 2.9, 1.75, 1.71, 1.81, 4.32, 5.74, 49.72, 1.68, 2.14]} \ No newline at end of file diff --git a/annotations_1/cGd2BBjzb0Y_filtered.json b/annotations_1/cGd2BBjzb0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4af7efe957e4a9292d1a90fdc436a71cf65aa69d --- /dev/null +++ b/annotations_1/cGd2BBjzb0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [5.0, 11.84], [12.0, 14.5], [15.0, 16.12], [17.0, 18.94], [22.0, 22.67], [28.0, 32.14], [37.0, 38.57], [39.0, 38.75], [42.0, 42.52], [44.0, 44.76], [47.0, 48.52]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 42.67, 39.58, 0.0, 0.0, 0.0, 35.87, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["bee, wasp, etc.", 37.64], ["fly, housefly", 23.44], ["insect", 11.21]], [["fly, housefly", 56.63], ["bee, wasp, etc.", 19.92], ["insect", 17.13]], null, null, null, [["speech", 33.37], ["sidetone", 12.49], ["fly, housefly", 4.77]], null, null, null, null, null], "duration": [0.6, 6.84, 2.5, 1.12, 1.94, 0.67, 4.14, 1.57, -0.25, 0.52, 0.76, 1.52]} \ No newline at end of file diff --git a/annotations_1/cIEPiYHzTto_filtered.json b/annotations_1/cIEPiYHzTto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60d455a54a2f9fac92dcaee12c37f7f11a0175eb --- /dev/null +++ b/annotations_1/cIEPiYHzTto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 34.89], [42.0, 42.62], [52.0, 52.66], [62.0, 68.23], [68.0, 68.35], [87.0, 99.62], [103.0, 105.09]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [29.8, 0.0, 0.0, 29.85, 0.0, 29.37, 29.8], "audiomae_on_audioset": [[["music", 60.85], ["drum machine", 12.11], ["synthesizer", 5.8]], null, null, [["music", 88.8], ["hip hop music", 1.75], ["scratching (performance technique)", 1.21]], null, [["music", 65.0], ["hum", 6.69], ["electronic music", 3.62]], [["music", 46.23], ["speech", 15.46], ["electronic music", 2.51]]], "duration": [23.89, 0.62, 0.66, 6.23, 0.35, 12.62, 2.09]} \ No newline at end of file diff --git a/annotations_1/cINFeXqwbDo_filtered.json b/annotations_1/cINFeXqwbDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e18f60cd3fb402a54ac923ff9e5ec09400dd87e --- /dev/null +++ b/annotations_1/cINFeXqwbDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 26.28], [28.0, 27.94], [28.0, 28.75], [31.0, 78.73], [82.0, 90.32], [91.0, 94.64], [96.0, 95.94], [99.0, 105.43], [107.0, 118.29], [119.0, 119.84], [121.0, 152.86], [155.0, 155.33], [158.0, 158.26], [160.0, 175.51]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [60.79, 0.0, 0.0, 0.0, 48.95, 45.27, 0.0, 48.35, 40.71, 0.0, 0.0, 0.0, 0.0, 41.46], "audiomae_on_audioset": [null, null, null, null, [["fly, housefly", 32.41], ["electric shaver, electric razor", 15.75], ["noise", 11.27]], [["cattle, bovinae", 33.01], ["livestock, farm animals, working animals", 30.26], ["moo", 21.47]], null, [["electric shaver, electric razor", 52.82], ["radio", 16.65], ["music", 4.62]], [["speech", 34.16], ["frog", 18.48], ["radio", 9.41]], null, null, null, null, [["music", 59.31], ["speech", 20.01], ["electric shaver, electric razor", 4.19]]], "duration": [9.28, -0.06, 0.75, 47.73, 8.32, 3.64, -0.06, 6.43, 11.29, 0.84, 31.86, 0.33, 0.26, 15.51]} \ No newline at end of file diff --git a/annotations_1/cIscGgQD4uE_filtered.json b/annotations_1/cIscGgQD4uE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fad7cc545cad756f5695a8f1c8a0189ddb39af1 --- /dev/null +++ b/annotations_1/cIscGgQD4uE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.75], [16.0, 16.88], [20.0, 19.82], [31.0, 37.44], [41.0, 41.91], [46.0, 46.38], [48.0, 48.69], [56.0, 57.15], [59.0, 61.03], [61.0, 62.18], [76.0, 80.42], [84.0, 85.94], [89.0, 90.02], [95.0, 95.99], [99.0, 110.91], [111.0, 113.97], [114.0, 115.53], [119.0, 119.04], [122.0, 123.36], [124.0, 124.8], [127.0, 128.26], [128.0, 129.79]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.27, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 35.19, 0.0, 0.0, 0.0, 32.79, 43.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["cattle, bovinae", 22.32], ["livestock, farm animals, working animals", 21.71], ["moo", 20.69]], null, null, null, null, null, null, [["music", 74.71], ["musical instrument", 7.88], ["singing", 2.44]], null, null, null, [["music", 78.48], ["speech", 3.2], ["electronic music", 2.13]], [["speech", 45.54], ["music", 16.12], ["moo", 6.57]], null, null, null, null, null, null], "duration": [1.75, 0.88, -0.18, 6.44, 0.91, 0.38, 0.69, 1.15, 2.03, 1.18, 4.42, 1.94, 1.02, 0.99, 11.91, 2.97, 1.53, 0.04, 1.36, 0.8, 1.26, 1.79]} \ No newline at end of file diff --git a/annotations_1/cJyhEAxnQ-U_filtered.json b/annotations_1/cJyhEAxnQ-U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72c5d0af370939dac5fe1c0e3f8c13f2e97d43af --- /dev/null +++ b/annotations_1/cJyhEAxnQ-U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [7.0, 8.72], [11.0, 12.53], [16.0, 16.51], [18.0, 20.01], [23.0, 24.53], [27.0, 27.51], [29.0, 32.95], [38.0, 38.7], [40.0, 41.74], [44.0, 47.49], [49.0, 49.59], [52.0, 52.56], [54.0, 53.99], [57.0, 57.4], [59.0, 59.97], [62.0, 62.58], [66.0, 67.68], [71.0, 72.76], [74.0, 78.06], [80.0, 81.31], [84.0, 85.92], [88.0, 88.62], [91.0, 92.77], [93.0, 94.64], [96.0, 98.31], [100.0, 102.88], [105.0, 108.8], [110.0, 111.91], [113.0, 115.18], [116.0, 117.8], [119.0, 119.43], [121.0, 121.86], [123.0, 125.22]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.7, 0.0, 0.0, 43.28, 0.0, 0.0, 40.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 0.0, 0.0, 0.0, 0.0, 47.9, 40.34, 55.04, 0.0, 48.23, 0.0, 0.0, 0.0, 65.67], "audiomae_on_audioset": [null, null, null, null, [["music", 24.72], ["speech", 22.71], ["sidetone", 14.64]], null, null, [["music", 35.67], ["singing bowl", 12.75], ["hum", 10.82]], null, null, [["music", 66.45], ["gong", 12.22], ["hum", 3.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 36.12], ["sidetone", 26.86], ["music", 12.49]], [["sidetone", 73.73], ["music", 13.99], ["mains hum", 4.46]], null, null, [["music", 28.1], ["speech", 14.85], ["sidetone", 9.51]], null, null, null, null], "duration": [0.75, 1.72, 1.53, 0.51, 2.01, 1.53, 0.51, 3.95, 0.7, 1.74, 3.49, 0.59, 0.56, -0.01, 0.4, 0.97, 0.58, 1.68, 1.76, 4.06, 1.31, 1.92, 0.62, 1.77, 1.64, 2.31, 2.88, 3.8, 1.91, 2.18, 1.8, 0.43, 0.86, 2.22]} \ No newline at end of file diff --git a/annotations_1/cLomnZIvoFs_filtered.json b/annotations_1/cLomnZIvoFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6ad466d954dcec70ba40773b210babb054e70f6 --- /dev/null +++ b/annotations_1/cLomnZIvoFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 19.53], [20.0, 20.65], [22.0, 24.9], [28.0, 29.71], [32.0, 31.7], [34.0, 34.52], [36.0, 49.5], [53.0, 61.01], [63.0, 66.88], [68.0, 67.8], [80.0, 79.79], [80.0, 79.93], [80.0, 80.0], [92.0, 93.61], [98.0, 99.28], [103.0, 104.18], [109.0, 110.19], [114.0, 115.4], [116.0, 118.34], [122.0, 125.83], [135.0, 136.68], [160.0, 164.29], [203.0, 203.27], [204.0, 207.01], [214.0, 214.79]], "keep_status": [true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [38.62, 0.0, 68.54, 0.0, 0.0, 0.0, 41.2, 37.12, 38.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 35.13, 0.0, 31.5, 0.0, 32.42, 0.0], "audiomae_on_audioset": [[["music", 34.24], ["hum", 15.42], ["speech", 14.49]], null, null, null, null, null, [["hum", 44.57], ["mains hum", 40.88], ["throbbing", 3.41]], [["hum", 46.05], ["music", 10.21], ["throbbing", 9.64]], [["music", 32.62], ["throbbing", 19.51], ["hum", 17.42]], null, null, null, null, null, null, null, null, null, null, [["music", 27.99], ["speech", 23.79], ["synthesizer", 7.63]], null, [["music", 61.99], ["hum", 5.1], ["mains hum", 5.05]], null, [["music", 51.64], ["speech", 11.06], ["sidetone", 2.8]], null], "duration": [15.53, 0.65, 2.9, 1.71, -0.3, 0.52, 13.5, 8.01, 3.88, -0.2, -0.21, -0.07, 0.0, 1.61, 1.28, 1.18, 1.19, 1.4, 2.34, 3.83, 1.68, 4.29, 0.27, 3.01, 0.79]} \ No newline at end of file diff --git a/annotations_1/cMFosgxgPAs_filtered.json b/annotations_1/cMFosgxgPAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b35dd34ab6f79898d56e3b83f0e6fa54924f0ef5 --- /dev/null +++ b/annotations_1/cMFosgxgPAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.2], [19.0, 19.47], [25.0, 25.17], [27.0, 28.85], [31.0, 35.68], [38.0, 38.97], [44.0, 44.93], [52.0, 57.18], [64.0, 65.82], [68.0, 115.74], [117.0, 122.4], [125.0, 131.25], [132.0, 132.07], [134.0, 134.97], [136.0, 137.32], [140.0, 139.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [44.29, 0.0, 0.0, 0.0, 63.96, 0.0, 0.0, 38.41, 0.0, 0.0, 31.14, 30.51, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 38.9], ["throbbing", 26.65], ["music", 13.23]], null, null, null, null, null, null, [["speech", 40.1], ["music", 36.09], ["drum machine", 6.81]], null, null, [["music", 78.09], ["musical instrument", 4.52], ["bass guitar", 3.45]], [["music", 31.42], ["door", 8.28], ["hum", 6.56]], null, null, null, null], "duration": [2.2, 0.47, 0.17, 1.85, 4.68, 0.97, 0.93, 5.18, 1.82, 47.74, 5.4, 6.25, 0.07, 0.97, 1.32, -0.37]} \ No newline at end of file diff --git a/annotations_1/cMPXArN7f9k_filtered.json b/annotations_1/cMPXArN7f9k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..353ea2b2b770f7d0f1655c6ac7f24352d0bf9c96 --- /dev/null +++ b/annotations_1/cMPXArN7f9k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.25], [15.0, 16.06], [22.0, 23.04], [23.0, 30.05], [31.0, 37.05], [39.0, 45.67], [48.0, 48.02], [48.0, 50.13], [53.0, 53.28], [65.0, 71.34], [72.0, 73.16], [74.0, 75.39], [77.0, 92.67], [95.0, 96.94], [98.0, 111.1], [111.0, 113.04], [115.0, 115.15], [116.0, 115.87], [116.0, 119.65], [120.0, 119.74], [120.0, 121.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [59.59, 0.0, 0.0, 66.03, 94.52, 78.21, 0.0, 51.6, 0.0, 80.64, 0.0, 0.0, 99.97, 0.0, 95.09, 91.47, 0.0, 0.0, 59.77, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.25, 1.06, 1.04, 7.05, 6.05, 6.67, 0.02, 2.13, 0.28, 6.34, 1.16, 1.39, 15.67, 1.94, 13.1, 2.04, 0.15, -0.13, 3.65, -0.26, 1.47]} \ No newline at end of file diff --git a/annotations_1/cMmi5sRe8wc_filtered.json b/annotations_1/cMmi5sRe8wc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2ad2f4741363a21b13cd179e1e8bf7b5af32c31 --- /dev/null +++ b/annotations_1/cMmi5sRe8wc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.07], [13.0, 13.29], [15.0, 14.94], [17.0, 17.17], [30.0, 30.77], [37.0, 37.0], [43.0, 43.83], [47.0, 47.82], [50.0, 50.52], [52.0, 56.91], [57.0, 69.26], [72.0, 72.2], [75.0, 79.42], [81.0, 113.44], [114.0, 128.44], [132.0, 132.29], [134.0, 150.55], [155.0, 168.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.66, 30.47, 0.0, 31.6, 0.0, 37.78, 0.0, 38.94, 35.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 50.86], ["mains hum", 15.56], ["speech", 8.61]], [["hum", 14.49], ["music", 7.68], ["speech", 7.28]], null, [["music", 26.62], ["buzz", 13.62], ["sound effect", 7.99]], null, [["music", 81.45], ["scary music", 2.29], ["soundtrack music", 1.77]], null, [["music", 64.15], ["hum", 6.81], ["gong", 5.72]], [["music", 81.79], ["ambient music", 4.82], ["electronic music", 2.67]]], "duration": [1.07, 0.29, -0.06, 0.17, 0.77, 0.0, 0.83, 0.82, 0.52, 4.91, 12.26, 0.2, 4.42, 32.44, 14.44, 0.29, 16.55, 13.84]} \ No newline at end of file diff --git a/annotations_1/cMwOJoesx8M_filtered.json b/annotations_1/cMwOJoesx8M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afcc141680a926b75cd5b63aac0913790272d7a8 --- /dev/null +++ b/annotations_1/cMwOJoesx8M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [9.0, 9.51], [12.0, 12.95], [14.0, 14.25], [19.0, 19.65], [21.0, 21.29], [23.0, 25.62], [30.0, 30.23], [38.0, 38.37], [41.0, 41.74], [62.0, 63.73], [66.0, 67.17], [70.0, 70.77], [72.0, 72.59], [75.0, 76.94], [79.0, 79.2], [83.0, 83.19], [86.0, 88.1], [92.0, 93.06], [103.0, 103.1], [105.0, 106.64], [108.0, 108.62], [110.0, 112.94], [115.0, 123.87], [125.0, 126.23], [129.0, 130.76], [131.0, 132.19], [133.0, 133.96], [135.0, 137.3], [138.0, 138.86], [141.0, 143.5], [146.0, 147.61], [151.0, 151.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 0.0, 0.0, 0.0, 94.95, 72.16, 0.0, 0.0, 0.0, 0.0, 62.47, 0.0, 68.41, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.63, 0.51, 0.95, 0.25, 0.65, 0.29, 2.62, 0.23, 0.37, 0.74, 1.73, 1.17, 0.77, 0.59, 1.94, 0.2, 0.19, 2.1, 1.06, 0.1, 1.64, 0.62, 2.94, 8.87, 1.23, 1.76, 1.19, 0.96, 2.3, 0.86, 2.5, 1.61, 0.55]} \ No newline at end of file diff --git a/annotations_1/cOXVnmVPdtQ_filtered.json b/annotations_1/cOXVnmVPdtQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..353f86007e19b7ef7c45740d47b9cd0bbf18f1b3 --- /dev/null +++ b/annotations_1/cOXVnmVPdtQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.98], [5.0, 5.85], [8.0, 8.21], [9.0, 10.86], [13.0, 15.01], [16.0, 18.3], [21.0, 22.76], [26.0, 30.82], [34.0, 43.83], [45.0, 46.06], [48.0, 48.41], [49.0, 50.25], [54.0, 56.32], [59.0, 60.83], [62.0, 62.33], [64.0, 68.22], [69.0, 70.83], [72.0, 73.13], [74.0, 75.56], [77.0, 99.13], [100.0, 102.17], [103.0, 103.76], [106.0, 106.96], [107.0, 108.65], [109.0, 111.7], [112.0, 114.32], [115.0, 115.75], [117.0, 123.09], [123.0, 126.44], [127.0, 129.91], [130.0, 141.89], [142.0, 143.63], [145.0, 146.62], [150.0, 152.47]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.84, 35.93, 0.0, 31.74, 32.86, 0.0, 0.0, 0.0, 62.89, 0.0, 0.0, 48.19, 0.0, 0.0, 0.0, 95.64, 100.0, 0.0, 0.0, 0.0, 97.73, 99.93, 0.0, 98.99, 86.82, 97.54, 82.79, 0.0, 0.0, 92.97], "audiomae_on_audioset": [null, null, null, null, [["music", 68.77], ["guitar", 5.16], ["musical instrument", 4.97]], [["music", 47.69], ["speech", 13.17], ["musical instrument", 7.25]], null, [["music", 76.96], ["theremin", 5.9], ["synthesizer", 2.44]], [["music", 65.6], ["animal", 9.74], ["dog", 5.86]], null, null, null, null, null, null, [["music", 34.04], ["speech", 8.29], ["musical instrument", 7.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.02, 0.85, 0.21, 1.86, 2.01, 2.3, 1.76, 4.82, 9.83, 1.06, 0.41, 1.25, 2.32, 1.83, 0.33, 4.22, 1.83, 1.13, 1.56, 22.13, 2.17, 0.76, 0.96, 1.65, 2.7, 2.32, 0.75, 6.09, 3.44, 2.91, 11.89, 1.63, 1.62, 2.47]} \ No newline at end of file diff --git a/annotations_1/cP63R4QwDFI_filtered.json b/annotations_1/cP63R4QwDFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c88e7e67d34e603efe0b6ad9aa38ccc79c459a10 --- /dev/null +++ b/annotations_1/cP63R4QwDFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.75], [6.0, 8.5], [10.0, 13.22], [15.0, 18.01], [21.0, 24.83], [29.0, 37.34], [40.0, 43.9], [46.0, 50.75], [52.0, 55.49]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.97, 91.81, 78.89, 66.63, 56.55, 38.94, 38.0, 59.86], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 62.71], ["timpani", 4.36], ["percussion", 4.21]], [["music", 39.4], ["rumble", 20.71], ["gong", 11.48]], null], "duration": [1.75, 2.5, 3.22, 3.01, 3.83, 8.34, 3.9, 4.75, 3.49]} \ No newline at end of file diff --git a/annotations_1/cPVM14Bnf5I_filtered.json b/annotations_1/cPVM14Bnf5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bcc8444a315fae40c02b637ae575d10c2088285 --- /dev/null +++ b/annotations_1/cPVM14Bnf5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.27], [12.0, 13.88], [17.0, 17.25], [21.0, 20.98], [23.0, 23.82], [26.0, 26.79], [33.0, 42.26], [46.0, 48.41], [55.0, 63.63], [67.0, 68.13], [68.0, 71.05], [79.0, 82.81], [85.0, 86.02], [87.0, 87.88], [90.0, 106.17], [107.0, 121.95], [122.0, 122.71], [124.0, 124.51], [138.0, 157.08], [161.0, 161.64]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.52, 34.14, 33.46, 0.0, 33.23, 30.71, 0.0, 0.0, 30.68, 30.73, 0.0, 0.0, 31.18, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 31.93], ["music", 8.28], ["explosion", 7.97]], [["music", 42.17], ["throbbing", 5.59], ["speech", 3.25]], [["speech", 54.65], ["music", 15.16], ["hum", 8.17]], null, [["music", 67.81], ["musical instrument", 3.11], ["didgeridoo", 3.08]], [["music", 44.89], ["speech", 7.31], ["musical instrument", 3.74]], null, null, [["cattle, bovinae", 39.41], ["moo", 32.64], ["music", 10.07]], [["music", 56.01], ["electronic music", 11.31], ["techno", 5.62]], null, null, [["music", 78.01], ["musical instrument", 2.45], ["theremin", 1.35]], null], "duration": [0.27, 1.88, 0.25, -0.02, 0.82, 0.79, 9.26, 2.41, 8.63, 1.13, 3.05, 3.81, 1.02, 0.88, 16.17, 14.95, 0.71, 0.51, 19.08, 0.64]} \ No newline at end of file diff --git a/annotations_1/cPfMxQLlirI_filtered.json b/annotations_1/cPfMxQLlirI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..614ffca2ff2f5acb7813840aabae8dfd0d68056a --- /dev/null +++ b/annotations_1/cPfMxQLlirI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.16], [25.0, 26.33], [30.0, 39.09], [41.0, 42.08], [43.0, 63.49], [69.0, 70.06], [71.0, 74.68], [76.0, 89.99], [93.0, 98.86], [100.0, 104.16], [105.0, 105.38], [107.0, 109.02], [112.0, 114.51], [119.0, 121.85], [123.0, 123.52], [126.0, 130.1], [132.0, 131.68]], "keep_status": [false, false, true, false, true, false, true, false, false, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 32.51, 0.0, 32.1, 0.0, 29.07, 29.83, 29.45, 29.17, 0.0, 41.62, 56.63, 38.64, 0.0, 56.33, 0.0], "audiomae_on_audioset": [null, null, [["hum", 23.49], ["mains hum", 20.91], ["music", 15.01]], null, [["music", 29.55], ["noise", 12.15], ["boing", 11.28]], null, [["hum", 34.72], ["mains hum", 14.81], ["music", 13.7]], [["music", 74.16], ["theremin", 4.84], ["hum", 3.38]], [["music", 54.88], ["hum", 8.43], ["mains hum", 7.02]], [["music", 41.69], ["explosion", 6.7], ["boom", 5.18]], null, [["speech", 33.34], ["hum", 16.45], ["music", 9.98]], null, [["thunk", 39.42], ["whack, thwack", 18.91], ["music", 6.76]], null, null, null], "duration": [1.16, 1.33, 9.09, 1.08, 20.49, 1.06, 3.68, 13.99, 5.86, 4.16, 0.38, 2.02, 2.51, 2.85, 0.52, 4.1, -0.32]} \ No newline at end of file diff --git a/annotations_1/cRZ7bc3nqwA_filtered.json b/annotations_1/cRZ7bc3nqwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56265cb3018d1f2a53ca4a47c9a75b25f9147d53 --- /dev/null +++ b/annotations_1/cRZ7bc3nqwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 42.79], [50.0, 50.26], [51.0, 52.32], [54.0, 56.57], [60.0, 61.11], [66.0, 68.64], [69.0, 71.49], [72.0, 81.99], [85.0, 112.5], [121.0, 122.98], [125.0, 125.39], [135.0, 138.92], [139.0, 140.85], [147.0, 152.19], [165.0, 164.66], [167.0, 169.28], [170.0, 180.45], [181.0, 183.19]], "keep_status": [false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.13, 0.0, 33.0, 64.75, 31.15, 33.61, 0.0, 0.0, 52.39, 0.0, 57.64, 0.0, 83.88, 37.15, 50.02], "audiomae_on_audioset": [null, null, null, [["hum", 29.24], ["music", 25.0], ["mains hum", 13.97]], null, [["speech", 69.37], ["hum", 8.07], ["music", 3.92]], null, [["music", 34.49], ["hum", 19.83], ["mains hum", 7.6]], [["music", 34.38], ["hum", 8.29], ["speech", 7.92]], null, null, null, null, null, null, null, [["music", 71.89], ["scary music", 7.09], ["ambient music", 3.94]], null], "duration": [1.79, 0.26, 1.32, 2.57, 1.11, 2.64, 2.49, 9.99, 27.5, 1.98, 0.39, 3.92, 1.85, 5.19, -0.34, 2.28, 10.45, 2.19]} \ No newline at end of file diff --git a/annotations_1/cRpMdH1D55o_filtered.json b/annotations_1/cRpMdH1D55o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b901190dd83cd1d81433d87da4b87d07cbac3b7c --- /dev/null +++ b/annotations_1/cRpMdH1D55o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.64], [5.0, 6.66], [8.0, 33.56], [34.0, 35.33], [36.0, 37.05], [39.0, 38.91], [40.0, 40.93], [42.0, 42.74], [43.0, 44.31], [45.0, 50.45], [53.0, 52.86], [54.0, 58.02], [58.0, 58.24], [58.0, 60.93], [62.0, 65.91], [69.0, 73.09], [76.0, 79.27], [82.0, 96.94], [97.0, 99.57], [100.0, 102.47], [103.0, 113.07], [118.0, 120.53], [122.0, 128.65], [133.0, 137.98], [138.0, 150.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.44, 0.0, 28.56, 0.0, 28.64, 28.66, 28.24, 29.42, 29.06, 42.53, 42.93, 39.7, 37.68, 90.6, 57.48, 94.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 58.8], ["theremin", 11.55], ["ambient music", 3.96]], null, [["foghorn", 47.94], ["music", 23.86], ["gong", 8.35]], null, [["noise", 13.77], ["electric shaver, electric razor", 10.79], ["music", 7.16]], [["music", 26.62], ["foghorn", 7.11], ["hum", 3.96]], [["foghorn", 24.48], ["music", 22.73], ["trombone", 16.63]], [["theremin", 38.67], ["foghorn", 28.93], ["music", 10.83]], [["theremin", 58.48], ["music", 25.22], ["buzz", 5.43]], [["tabla", 33.63], ["music", 17.24], ["musical instrument", 7.81]], [["mains hum", 30.83], ["hum", 25.09], ["music", 18.1]], [["music", 27.25], ["mains hum", 23.89], ["hum", 22.45]], [["speech", 37.07], ["gong", 21.65], ["music", 8.37]], null, null, null], "duration": [1.64, 1.66, 25.56, 1.33, 1.05, -0.09, 0.93, 0.74, 1.31, 5.45, -0.14, 4.02, 0.24, 2.93, 3.91, 4.09, 3.27, 14.94, 2.57, 2.47, 10.07, 2.53, 6.65, 4.98, 12.28]} \ No newline at end of file diff --git a/annotations_1/cRuYB2gXpM8_filtered.json b/annotations_1/cRuYB2gXpM8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b210b65d989f447b83efd6c1aadb8e6afffc8957 --- /dev/null +++ b/annotations_1/cRuYB2gXpM8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.72], [8.0, 11.67], [12.0, 12.97], [15.0, 14.84], [15.0, 15.77], [17.0, 42.5], [44.0, 73.94], [76.0, 91.34], [93.0, 106.22], [111.0, 111.25], [112.0, 122.89], [124.0, 130.54], [131.0, 173.16], [174.0, 174.07]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.82, 0.0, 0.0, 0.0, 31.91, 33.53, 41.98, 46.26, 0.0, 41.22, 59.59, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 30.3], ["hum", 13.57], ["music", 10.12]], null, null, null, [["throbbing", 46.12], ["music", 34.84], ["hum", 13.09]], [["hum", 16.11], ["throbbing", 13.37], ["music", 9.37]], [["mains hum", 34.2], ["hum", 31.87], ["music", 14.35]], [["music", 39.24], ["hum", 18.36], ["mains hum", 15.59]], null, [["hum", 56.41], ["music", 15.29], ["mains hum", 12.6]], null, null, null], "duration": [0.72, 3.67, 0.97, -0.16, 0.77, 25.5, 29.94, 15.34, 13.22, 0.25, 10.89, 6.54, 42.16, 0.07]} \ No newline at end of file diff --git a/annotations_1/cSO2u-StPbY_filtered.json b/annotations_1/cSO2u-StPbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30a9a63a5ecf773e526f8e0b9073d334d575b1a9 --- /dev/null +++ b/annotations_1/cSO2u-StPbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 44.81], [70.0, 70.85], [75.0, 86.19]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 29.39], "audiomae_on_audioset": [null, null, [["hum", 30.18], ["music", 22.53], ["mains hum", 17.62]]], "duration": [-0.19, 0.85, 11.19]} \ No newline at end of file diff --git a/annotations_1/cSSYFjtc4SY_filtered.json b/annotations_1/cSSYFjtc4SY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ce2abf7987ad030441f46da459f63936bb87cf6 --- /dev/null +++ b/annotations_1/cSSYFjtc4SY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 18.59], [20.0, 20.78], [22.0, 22.45], [23.0, 23.28], [24.0, 35.23], [38.0, 43.28], [44.0, 103.01], [104.0, 104.82], [105.0, 105.46], [107.0, 107.27], [108.0, 108.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.34, 0.0, 0.0, 0.0, 85.72, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [13.59, 0.78, 0.45, 0.28, 11.23, 5.28, 59.01, 0.82, 0.46, 0.27, 0.82]} \ No newline at end of file diff --git a/annotations_1/cSWMU_rISfw_filtered.json b/annotations_1/cSWMU_rISfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92c906df72c1b2c91ca1ab461a69e57f22c88db1 --- /dev/null +++ b/annotations_1/cSWMU_rISfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 100.45], [101.0, 101.85], [102.0, 106.14]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 32.02], "audiomae_on_audioset": [null, null, [["fart", 42.83], ["fly, housefly", 13.73], ["mosquito", 13.67]]], "duration": [76.45, 0.85, 4.14]} \ No newline at end of file diff --git a/annotations_1/cT1iUwGGUAg_filtered.json b/annotations_1/cT1iUwGGUAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52ce3858c3fc88a731294350d18d2414de9151a7 --- /dev/null +++ b/annotations_1/cT1iUwGGUAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.11], [17.0, 17.19], [19.0, 19.25], [21.0, 21.05], [23.0, 23.38], [24.0, 24.78], [26.0, 27.24], [32.0, 32.48], [54.0, 54.58], [56.0, 57.75], [60.0, 60.02], [61.0, 61.18], [66.0, 66.83], [68.0, 68.22], [80.0, 80.91], [82.0, 82.39], [85.0, 85.02], [89.0, 89.53], [91.0, 91.37], [93.0, 93.41], [95.0, 95.4], [96.0, 97.07], [100.0, 100.57], [101.0, 101.43], [103.0, 103.55], [104.0, 104.33], [107.0, 107.01], [111.0, 111.74], [114.0, 116.73], [127.0, 128.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.11, 0.19, 0.25, 0.05, 0.38, 0.78, 1.24, 0.48, 0.58, 1.75, 0.02, 0.18, 0.83, 0.22, 0.91, 0.39, 0.02, 0.53, 0.37, 0.41, 0.4, 1.07, 0.57, 0.43, 0.55, 0.33, 0.01, 0.74, 2.73, 1.19]} \ No newline at end of file diff --git a/annotations_1/cTQRH6MPV3A_filtered.json b/annotations_1/cTQRH6MPV3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23a0e232eb2dfbe8cbb00d47e05226abcd20d1ed --- /dev/null +++ b/annotations_1/cTQRH6MPV3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.71], [9.0, 8.87], [9.0, 9.64], [17.0, 17.56], [19.0, 20.07], [20.0, 21.42], [26.0, 26.22], [28.0, 30.01], [34.0, 38.75], [46.0, 46.16], [47.0, 46.99], [51.0, 51.29], [53.0, 57.47], [73.0, 76.74], [80.0, 83.25], [86.0, 86.9], [107.0, 106.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 81.71, 0.0, 0.0, 0.0, 99.98, 96.89, 99.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.71, -0.13, 0.64, 0.56, 1.07, 1.42, 0.22, 2.01, 4.75, 0.16, -0.01, 0.29, 4.47, 3.74, 3.25, 0.9, -0.04]} \ No newline at end of file diff --git a/annotations_1/cTR9Hnxfk7A_filtered.json b/annotations_1/cTR9Hnxfk7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d8463d6fe304ad9a03c7bda6ebef068a1f75e96 --- /dev/null +++ b/annotations_1/cTR9Hnxfk7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.43], [9.0, 9.85], [12.0, 13.12], [15.0, 15.21], [18.0, 18.96], [20.0, 20.83], [22.0, 23.21], [26.0, 27.75], [29.0, 29.74], [34.0, 34.94], [36.0, 36.63], [42.0, 45.5], [46.0, 49.67], [53.0, 53.67], [55.0, 58.13], [59.0, 62.65], [65.0, 65.16], [66.0, 67.34], [68.0, 68.74], [72.0, 71.98], [73.0, 73.7], [75.0, 75.74], [78.0, 78.09], [79.0, 80.13], [92.0, 93.65], [95.0, 95.79], [101.0, 101.9], [104.0, 107.25], [111.0, 112.53], [113.0, 114.39], [119.0, 121.09], [122.0, 122.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.27, 45.3, 0.0, 43.85, 44.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 99.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 50.9], ["sidetone", 22.27], ["busy signal", 7.36]], [["fart", 32.77], ["hum", 9.97], ["speech", 7.89]], null, [["stomach rumble", 69.63], ["speech", 14.41], ["fart", 1.67]], [["hum", 47.94], ["throbbing", 11.45], ["mains hum", 8.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.43, 0.85, 1.12, 0.21, 0.96, 0.83, 1.21, 1.75, 0.74, 0.94, 0.63, 3.5, 3.67, 0.67, 3.13, 3.65, 0.16, 1.34, 0.74, -0.02, 0.7, 0.74, 0.09, 1.13, 1.65, 0.79, 0.9, 3.25, 1.53, 1.39, 2.09, 0.89]} \ No newline at end of file diff --git a/annotations_1/cUT0WQ9cTrg_filtered.json b/annotations_1/cUT0WQ9cTrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ab1b808bb3910f4f92894c60ba8b4f8ff33bd03 --- /dev/null +++ b/annotations_1/cUT0WQ9cTrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.79], [3.0, 10.07], [17.0, 25.76], [30.0, 31.95], [42.0, 44.74], [48.0, 48.36], [49.0, 51.07], [57.0, 56.89], [62.0, 63.14], [79.0, 79.02], [85.0, 86.16], [89.0, 94.44], [100.0, 103.64], [104.0, 105.22], [106.0, 108.16]], "keep_status": [false, true, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.28, 31.12, 0.0, 32.75, 0.0, 33.83, 0.0, 0.0, 0.0, 0.0, 34.01, 74.44, 0.0, 91.47], "audiomae_on_audioset": [null, [["cattle, bovinae", 24.87], ["moo", 23.05], ["music", 11.62]], [["music", 35.02], ["hum", 24.34], ["throbbing", 12.26]], null, [["music", 40.82], ["speech", 8.96], ["sidetone", 6.11]], null, [["music", 39.19], ["electronic music", 10.38], ["dubstep", 5.06]], null, null, null, null, [["mosquito", 48.37], ["crushing", 13.7], ["music", 8.46]], null, null, null], "duration": [0.79, 7.07, 8.76, 1.95, 2.74, 0.36, 2.07, -0.11, 1.14, 0.02, 1.16, 5.44, 3.64, 1.22, 2.16]} \ No newline at end of file diff --git a/annotations_1/cV9dlsOzyVc_filtered.json b/annotations_1/cV9dlsOzyVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ccde0266eb4da7a3559250514554a086330b0d0 --- /dev/null +++ b/annotations_1/cV9dlsOzyVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.17], [14.0, 20.38], [25.0, 25.69], [27.0, 29.27], [31.0, 31.53], [33.0, 34.75], [38.0, 38.48], [50.0, 51.19], [52.0, 52.84], [61.0, 60.99], [62.0, 62.6], [64.0, 63.69], [67.0, 70.19], [74.0, 83.07], [83.0, 84.84], [85.0, 87.94], [89.0, 89.41], [91.0, 91.56], [92.0, 95.64], [97.0, 97.63], [100.0, 101.43], [104.0, 104.18], [107.0, 107.1], [111.0, 113.05], [119.0, 119.8], [130.0, 134.28], [136.0, 136.34], [139.0, 141.02], [145.0, 144.8], [149.0, 150.6], [151.0, 151.23], [152.0, 153.81], [155.0, 162.14]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [38.79, 32.76, 0.0, 34.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.66, 31.31, 0.0, 48.61, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 99.68, 0.0, 37.75, 0.0, 0.0, 0.0, 0.0, 33.63], "audiomae_on_audioset": [[["music", 80.22], ["synthesizer", 3.98], ["musical instrument", 2.08]], [["music", 43.48], ["throbbing", 16.96], ["synthesizer", 11.44]], null, [["speech", 25.66], ["whale vocalization", 16.88], ["water", 12.91]], null, null, null, null, null, null, null, null, [["music", 40.75], ["speech", 16.15], ["scratching (performance technique)", 6.62]], [["music", 77.84], ["electronic music", 4.02], ["didgeridoo", 2.83]], null, [["speech", 27.01], ["sidetone", 14.98], ["music", 6.84]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.4], ["music", 30.22], ["inside, small room", 3.16]], null, null, null, null, [["music", 48.31], ["guitar", 11.15], ["effects unit", 10.23]]], "duration": [3.17, 6.38, 0.69, 2.27, 0.53, 1.75, 0.48, 1.19, 0.84, -0.01, 0.6, -0.31, 3.19, 9.07, 1.84, 2.94, 0.41, 0.56, 3.64, 0.63, 1.43, 0.18, 0.1, 2.05, 0.8, 4.28, 0.34, 2.02, -0.2, 1.6, 0.23, 1.81, 7.14]} \ No newline at end of file diff --git a/annotations_1/cW7AkQihsa8_filtered.json b/annotations_1/cW7AkQihsa8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..314267814bd01d59661c247723bcdb4655fb22a4 --- /dev/null +++ b/annotations_1/cW7AkQihsa8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.32], [8.0, 8.41], [10.0, 11.45], [15.0, 16.04], [19.0, 25.44], [27.0, 27.82], [30.0, 30.55], [31.0, 49.17], [50.0, 50.9], [54.0, 54.31], [56.0, 57.03], [58.0, 58.83], [64.0, 64.15], [64.0, 64.96], [67.0, 67.24], [67.0, 68.15], [69.0, 70.73], [73.0, 73.3], [74.0, 75.03], [87.0, 87.72], [95.0, 96.25], [104.0, 104.97], [108.0, 108.23], [111.0, 110.94], [116.0, 116.28], [119.0, 119.87], [127.0, 127.58], [134.0, 133.62], [154.0, 154.5], [184.0, 183.79]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.57, 0.0, 0.0, 49.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 70.57], ["radio", 6.92], ["music", 5.66]], null, null, [["creak", 34.6], ["fart", 24.85], ["glass", 7.23]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 0.41, 1.45, 1.04, 6.44, 0.82, 0.55, 18.17, 0.9, 0.31, 1.03, 0.83, 0.15, 0.96, 0.24, 1.15, 1.73, 0.3, 1.03, 0.72, 1.25, 0.97, 0.23, -0.06, 0.28, 0.87, 0.58, -0.38, 0.5, -0.21]} \ No newline at end of file diff --git a/annotations_1/cWiljyh4NR4_filtered.json b/annotations_1/cWiljyh4NR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c59e033d3e8581923e08d06e19030c96dabd142c --- /dev/null +++ b/annotations_1/cWiljyh4NR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.27], [3.0, 3.35], [4.0, 4.04], [4.0, 4.7], [5.0, 5.97], [6.0, 7.62], [8.0, 8.75], [9.0, 12.14], [14.0, 14.17], [15.0, 15.89], [17.0, 17.05], [18.0, 19.8], [21.0, 21.83], [23.0, 105.31], [106.0, 107.45], [108.0, 111.43], [113.0, 113.44], [114.0, 116.78], [120.0, 120.58], [122.0, 122.89], [124.0, 126.74], [128.0, 128.51], [129.0, 130.52], [132.0, 132.31], [134.0, 134.86], [136.0, 136.83], [139.0, 139.04], [140.0, 148.14], [152.0, 157.05], [159.0, 166.56], [168.0, 173.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 0.0, 55.11, 0.0, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.22, 68.02, 69.88, 66.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 0.35, 0.04, 0.7, 0.97, 1.62, 0.75, 3.14, 0.17, 0.89, 0.05, 1.8, 0.83, 82.31, 1.45, 3.43, 0.44, 2.78, 0.58, 0.89, 2.74, 0.51, 1.52, 0.31, 0.86, 0.83, 0.04, 8.14, 5.05, 7.56, 5.52]} \ No newline at end of file diff --git a/annotations_1/cWj-sdxFiY4_filtered.json b/annotations_1/cWj-sdxFiY4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57ca7ab3c421af14502b6d43e69c3693d558cc7f --- /dev/null +++ b/annotations_1/cWj-sdxFiY4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.02], [9.0, 9.05], [9.0, 9.09], [9.0, 9.12], [9.0, 9.19], [9.0, 83.61], [86.0, 91.57], [92.0, 95.49], [100.0, 106.61], [111.0, 122.54]], "keep_status": [false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.61, 29.74, 29.6, 29.56], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 31.1], ["vehicle", 29.16], ["car", 19.02]], [["music", 39.05], ["throbbing", 15.75], ["hum", 11.26]], [["vehicle", 38.08], ["speech", 34.98], ["car", 11.61]], [["vehicle", 23.32], ["car", 17.74], ["race car, auto racing", 10.13]]], "duration": [0.02, 0.05, 0.09, 0.12, 0.19, 74.61, 5.57, 3.49, 6.61, 11.54]} \ No newline at end of file diff --git a/annotations_1/cXlRo6pJ9ig_filtered.json b/annotations_1/cXlRo6pJ9ig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf3539815930ea86ea22f218bd30495cdd3813ac --- /dev/null +++ b/annotations_1/cXlRo6pJ9ig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 24.87], [26.0, 26.45], [26.0, 39.41], [46.0, 47.44], [48.0, 48.24], [49.0, 50.52], [52.0, 53.65], [66.0, 66.8], [68.0, 68.77], [73.0, 76.15], [77.0, 78.29], [80.0, 82.73], [84.0, 85.95], [86.0, 88.03], [89.0, 88.6], [89.0, 90.34], [91.0, 93.16], [96.0, 95.59], [96.0, 96.7], [97.0, 98.71], [99.0, 128.01], [130.0, 131.33], [134.0, 136.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [50.21, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 97.11, 0.0, 93.45, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 31.0, 0.0, 40.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.94], ["speech", 21.87], ["gunshot, gunfire", 4.38]], null, [["music", 30.02], ["gong", 10.22], ["ambient music", 9.77]]], "duration": [5.87, 0.45, 13.41, 1.44, 0.24, 1.52, 1.65, 0.8, 0.77, 3.15, 1.29, 2.73, 1.95, 2.03, -0.4, 1.34, 2.16, -0.41, 0.7, 1.71, 29.01, 1.33, 2.9]} \ No newline at end of file diff --git a/annotations_1/cXm_h4Zdwpc_filtered.json b/annotations_1/cXm_h4Zdwpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..184f584d2d16f988ae7ee557429bd8caea9b06f4 --- /dev/null +++ b/annotations_1/cXm_h4Zdwpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.13], [15.0, 16.9], [19.0, 19.85], [21.0, 21.3], [22.0, 23.28], [24.0, 25.74], [27.0, 33.07], [34.0, 35.18], [36.0, 36.56], [37.0, 42.38], [46.0, 46.95], [48.0, 49.77], [50.0, 51.98], [53.0, 53.38], [55.0, 56.03], [57.0, 58.18], [60.0, 63.04], [64.0, 67.41], [79.0, 80.25], [84.0, 90.64], [98.0, 98.9], [101.0, 101.02], [102.0, 104.08], [106.0, 108.21], [111.0, 120.01], [121.0, 121.85], [125.0, 126.33], [129.0, 129.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 46.9, 0.0, 0.0, 77.53, 46.26, 43.08, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.48], ["theremin", 9.79], ["musical instrument", 4.32]], null, null, null, [["foghorn", 36.94], ["music", 35.29], ["theremin", 3.26]], [["music", 51.68], ["synthesizer", 9.16], ["musical instrument", 6.86]], null, null, null], "duration": [2.13, 1.9, 0.85, 0.3, 1.28, 1.74, 6.07, 1.18, 0.56, 5.38, 0.95, 1.77, 1.98, 0.38, 1.03, 1.18, 3.04, 3.41, 1.25, 6.64, 0.9, 0.02, 2.08, 2.21, 9.01, 0.85, 1.33, 0.86]} \ No newline at end of file diff --git a/annotations_1/cY8yXitzluU_filtered.json b/annotations_1/cY8yXitzluU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8650d25509de7b3958d108fcba2f2806956b1442 --- /dev/null +++ b/annotations_1/cY8yXitzluU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.26], [5.0, 12.12], [17.0, 46.62], [48.0, 48.63], [49.0, 51.09], [53.0, 53.6], [55.0, 56.57], [57.0, 58.55], [60.0, 61.47], [63.0, 82.66], [83.0, 86.41], [88.0, 89.01], [90.0, 92.06], [93.0, 93.8], [97.0, 97.17], [103.0, 104.77], [106.0, 109.66], [111.0, 111.79], [114.0, 117.98], [122.0, 122.69], [125.0, 125.36], [126.0, 127.01], [128.0, 165.32], [166.0, 171.91], [172.0, 179.71], [180.0, 184.76]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 37.28, 42.13, 0.0, 51.18, 0.0, 0.0, 0.0, 0.0, 45.21, 62.37, 0.0, 89.54, 0.0, 0.0, 0.0, 69.07, 0.0, 52.05, 0.0, 0.0, 0.0, 0.0, 33.94, 39.6, 60.7], "audiomae_on_audioset": [null, [["music", 23.85], ["breaking", 19.13], ["speech", 15.24]], [["music", 69.5], ["didgeridoo", 5.72], ["throbbing", 4.94]], null, null, null, null, null, null, [["coin (dropping)", 20.01], ["music", 16.33], ["noise", 6.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.7], ["moo", 5.25], ["effects unit", 4.2]], [["speech", 22.65], ["music", 21.48], ["hum", 13.58]], null], "duration": [0.26, 7.12, 29.62, 0.63, 2.09, 0.6, 1.57, 1.55, 1.47, 19.66, 3.41, 1.01, 2.06, 0.8, 0.17, 1.77, 3.66, 0.79, 3.98, 0.69, 0.36, 1.01, 37.32, 5.91, 7.71, 4.76]} \ No newline at end of file diff --git a/annotations_1/cZy7qSG8RHQ_filtered.json b/annotations_1/cZy7qSG8RHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d80275d55eda7bfc6a1c5e4bb9374534fbfad3d --- /dev/null +++ b/annotations_1/cZy7qSG8RHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.97], [22.0, 22.25], [27.0, 27.9], [29.0, 29.96], [32.0, 31.82], [32.0, 33.0], [33.0, 34.11], [36.0, 42.21], [49.0, 50.48], [69.0, 69.7], [73.0, 73.85], [74.0, 75.46], [78.0, 78.54], [86.0, 86.98], [90.0, 95.59], [104.0, 104.79], [106.0, 106.66], [119.0, 119.52], [129.0, 128.75], [131.0, 132.07]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.77, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["moo", 18.64], ["speech", 18.6], ["cattle, bovinae", 18.07]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 0.25, 0.9, 0.96, -0.18, 1.0, 1.11, 6.21, 1.48, 0.7, 0.85, 1.46, 0.54, 0.98, 5.59, 0.79, 0.66, 0.52, -0.25, 1.07]} \ No newline at end of file diff --git a/annotations_1/c_6SIVs_M5Q_filtered.json b/annotations_1/c_6SIVs_M5Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a6d3f8f9887adf004eb968a8ab6ed18e08d3604 --- /dev/null +++ b/annotations_1/c_6SIVs_M5Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.08], [12.0, 11.87], [13.0, 15.04], [16.0, 16.04], [27.0, 27.31], [30.0, 30.81], [31.0, 31.14], [33.0, 33.47], [34.0, 35.95], [36.0, 55.34], [65.0, 69.04], [74.0, 76.94], [84.0, 89.06], [90.0, 98.71], [100.0, 148.44], [150.0, 157.71]], "keep_status": [true, false, true, false, false, false, false, false, false, true, true, true, false, true, false, true], "silence_prob": [32.06, 0.0, 32.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.66, 46.19, 39.52, 32.57, 29.44, 0.0, 33.0], "audiomae_on_audioset": [[["hum", 26.82], ["throbbing", 23.36], ["speech", 14.86]], null, [["music", 47.67], ["foghorn", 4.97], ["musical instrument", 4.69]], null, null, null, null, null, null, [["music", 48.61], ["rumble", 14.7], ["hum", 5.74]], [["speech", 27.51], ["music", 25.33], ["sidetone", 12.75]], [["music", 57.45], ["throbbing", 4.67], ["timpani", 3.14]], [["music", 54.36], ["speech", 16.59], ["throbbing", 6.79]], [["music", 29.69], ["mains hum", 15.01], ["hum", 9.83]], null, [["speech", 18.36], ["buzz", 12.08], ["cattle, bovinae", 7.56]]], "duration": [2.08, -0.13, 2.04, 0.04, 0.31, 0.81, 0.14, 0.47, 1.95, 19.34, 4.04, 2.94, 5.06, 8.71, 48.44, 7.71]} \ No newline at end of file diff --git a/annotations_1/c_SJMeRltkA_filtered.json b/annotations_1/c_SJMeRltkA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..084c3c8902445fce1459e9dc422347ab9e866427 --- /dev/null +++ b/annotations_1/c_SJMeRltkA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[69.0, 88.06]], "keep_status": [false], "silence_prob": [29.38], "audiomae_on_audioset": [[["speech", 67.53], ["whack, thwack", 3.32], ["fart", 2.51]]], "duration": [19.06]} \ No newline at end of file diff --git a/annotations_1/c_u4oXd_Lfo_filtered.json b/annotations_1/c_u4oXd_Lfo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87302d030e820917c9867396d4b2b7d19d252733 --- /dev/null +++ b/annotations_1/c_u4oXd_Lfo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 115.3], [118.0, 121.73], [123.0, 136.93], [138.0, 155.63], [156.0, 176.86]], "keep_status": [false, true, false, true, true], "silence_prob": [0.0, 36.18, 34.88, 33.04, 33.34], "audiomae_on_audioset": [null, [["speech", 37.31], ["music", 19.27], ["boat, water vehicle", 7.17]], [["music", 35.65], ["speech", 30.31], ["boat, water vehicle", 6.0]], [["hum", 39.17], ["music", 15.34], ["mains hum", 14.36]], [["vehicle", 28.4], ["speech", 16.22], ["car", 10.95]]], "duration": [90.3, 3.73, 13.93, 17.63, 20.86]} \ No newline at end of file diff --git a/annotations_1/cbEbCrrgWiA_filtered.json b/annotations_1/cbEbCrrgWiA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27d95ae216563d723cb2d63795cd5f79e0db183a --- /dev/null +++ b/annotations_1/cbEbCrrgWiA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.99], [12.0, 13.64], [15.0, 15.9], [17.0, 18.77], [24.0, 24.7], [39.0, 38.87], [47.0, 47.97], [54.0, 53.94], [54.0, 55.61], [58.0, 62.36], [63.0, 64.02], [69.0, 75.41], [78.0, 78.56], [79.0, 81.77], [85.0, 96.45], [100.0, 100.14], [101.0, 101.22], [102.0, 102.42], [111.0, 111.69], [112.0, 113.09], [114.0, 116.63], [123.0, 124.51], [125.0, 125.19], [127.0, 126.74], [127.0, 126.96], [128.0, 128.24], [131.0, 131.33], [132.0, 132.27], [135.0, 138.67], [139.0, 140.12], [144.0, 145.3], [151.0, 150.96], [155.0, 166.53], [168.0, 172.03], [173.0, 173.87], [175.0, 176.0], [177.0, 180.81], [181.0, 183.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 0.0, 36.86, 0.0, 42.86, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 0.0, 0.0, 0.0, 37.31, 84.62, 0.0, 0.0, 68.54, 46.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 26.23], ["mains hum", 16.28], ["speech", 16.15]], null, [["music", 28.69], ["hum", 14.43], ["didgeridoo", 10.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 62.13], ["didgeridoo", 9.28], ["musical instrument", 3.84]], null, null, null, null, [["speech", 32.79], ["busy signal", 26.07], ["sine wave", 5.9]]], "duration": [0.99, 1.64, 0.9, 1.77, 0.7, -0.13, 0.97, -0.06, 1.61, 4.36, 1.02, 6.41, 0.56, 2.77, 11.45, 0.14, 0.22, 0.42, 0.69, 1.09, 2.63, 1.51, 0.19, -0.26, -0.04, 0.24, 0.33, 0.27, 3.67, 1.12, 1.3, -0.04, 11.53, 4.03, 0.87, 1.0, 3.81, 2.05]} \ No newline at end of file diff --git a/annotations_1/cbH10o2VTXI_filtered.json b/annotations_1/cbH10o2VTXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3ff32dc6b72acfc962b2ecba07909f70246a5d9 --- /dev/null +++ b/annotations_1/cbH10o2VTXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.68], [6.0, 7.52], [9.0, 11.53], [29.0, 31.6], [36.0, 35.94], [39.0, 39.02], [42.0, 42.94], [48.0, 52.66], [64.0, 63.76], [66.0, 65.82], [66.0, 74.31], [78.0, 78.12], [80.0, 90.26], [92.0, 95.12], [117.0, 118.18], [121.0, 121.54], [129.0, 129.14], [140.0, 140.98], [143.0, 145.05], [146.0, 147.23], [150.0, 149.96], [154.0, 157.22], [161.0, 173.53]], "keep_status": [false, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.58, 38.08, 0.0, 0.0, 0.0, 33.2, 0.0, 0.0, 41.58, 0.0, 40.93, 40.95, 0.0, 0.0, 0.0, 0.0, 46.02, 0.0, 0.0, 50.71, 33.64], "audiomae_on_audioset": [null, null, [["music", 45.54], ["hum", 14.1], ["throbbing", 8.02]], [["speech", 30.87], ["music", 19.75], ["mains hum", 12.68]], null, null, null, [["livestock, farm animals, working animals", 39.89], ["moo", 25.82], ["cattle, bovinae", 25.6]], null, null, [["music", 49.25], ["synthesizer", 7.95], ["theremin", 3.14]], null, [["speech", 38.34], ["music", 33.58], ["grunt", 8.21]], [["music", 71.97], ["speech", 7.01], ["electronic music", 1.54]], null, null, null, null, [["music", 68.72], ["ambient music", 7.23], ["hum", 4.23]], null, null, null, [["music", 65.77], ["theremin", 5.85], ["throbbing", 2.85]]], "duration": [1.68, 1.52, 2.53, 2.6, -0.06, 0.02, 0.94, 4.66, -0.24, -0.18, 8.31, 0.12, 10.26, 3.12, 1.18, 0.54, 0.14, 0.98, 2.05, 1.23, -0.04, 3.22, 12.53]} \ No newline at end of file diff --git a/annotations_1/cbN7TQSGYlI_filtered.json b/annotations_1/cbN7TQSGYlI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff8492802812db3ea1c2a5a17542c791c183b98d --- /dev/null +++ b/annotations_1/cbN7TQSGYlI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.12], [16.0, 16.31], [19.0, 19.6], [22.0, 23.06], [31.0, 33.67], [35.0, 37.84], [61.0, 85.56], [87.0, 124.11], [127.0, 132.63], [133.0, 133.56], [137.0, 137.05], [139.0, 144.49], [146.0, 146.99], [148.0, 152.41], [153.0, 154.5], [155.0, 158.21], [158.0, 162.19], [165.0, 166.21], [168.0, 169.48], [170.0, 170.28], [183.0, 183.74]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.76, 34.07, 32.61, 0.0, 43.69, 0.0, 0.0, 39.75, 0.0, 56.33, 0.0, 87.55, 72.9, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 34.0], ["boing", 8.67], ["whale vocalization", 6.32]], [["music", 69.93], ["boing", 16.41], ["throbbing", 1.28]], null, [["music", 83.8], ["electronic music", 1.89], ["musical instrument", 1.54]], null, null, [["music", 48.95], ["pour", 6.78], ["speech", 4.77]], null, null, null, null, null, null, null, null, null], "duration": [1.12, 0.31, 0.6, 1.06, 2.67, 2.84, 24.56, 37.11, 5.63, 0.56, 0.05, 5.49, 0.99, 4.41, 1.5, 3.21, 4.19, 1.21, 1.48, 0.28, 0.74]} \ No newline at end of file diff --git a/annotations_1/ccH057kbWTg_filtered.json b/annotations_1/ccH057kbWTg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01513aa5ef606d0b0e72d407f9c05e194c436120 --- /dev/null +++ b/annotations_1/ccH057kbWTg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.88], [9.0, 9.69], [11.0, 12.73], [15.0, 15.5], [19.0, 22.22], [32.0, 33.61], [40.0, 42.45], [46.0, 45.99], [46.0, 47.26], [50.0, 52.37], [57.0, 57.18], [57.0, 62.34], [66.0, 67.12], [69.0, 72.86], [78.0, 80.18], [81.0, 92.47], [94.0, 96.89], [99.0, 116.77], [117.0, 116.97], [117.0, 118.45], [120.0, 131.45], [133.0, 142.03], [143.0, 144.29], [148.0, 148.24], [151.0, 152.52], [154.0, 155.8], [163.0, 164.08], [167.0, 167.66], [173.0, 173.25], [174.0, 178.12], [180.0, 180.08], [183.0, 199.42], [202.0, 203.07]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.39, 0.0, 31.61, 0.0, 0.0, 33.47, 0.0, 32.48, 0.0, 31.75, 38.9, 38.79, 44.57, 43.87, 0.0, 0.0, 30.06, 40.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.61, 0.0, 30.87, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 61.16], ["ambient music", 5.53], ["singing", 3.23]], null, [["music", 74.43], ["singing", 2.37], ["carnatic music", 2.14]], null, null, [["music", 44.46], ["double bass", 6.56], ["humming", 5.82]], null, [["music", 67.21], ["singing", 6.7], ["electronic tuner", 2.63]], null, [["music", 66.85], ["singing", 4.67], ["musical instrument", 2.7]], [["music", 42.93], ["carnatic music", 27.26], ["musical instrument", 3.34]], [["music", 56.46], ["flute", 12.95], ["theremin", 6.13]], [["music", 30.34], ["speech", 14.59], ["singing bowl", 13.34]], [["music", 64.51], ["synthesizer", 6.78], ["musical instrument", 3.63]], null, null, [["music", 45.72], ["cello", 5.69], ["theremin", 3.54]], [["music", 30.64], ["singing bowl", 16.57], ["theremin", 6.15]], null, null, null, null, null, null, null, [["music", 44.99], ["speech", 19.14], ["hum", 7.25]], null, [["music", 40.46], ["speech", 16.37], ["fly, housefly", 5.74]], null], "duration": [0.88, 0.69, 1.73, 0.5, 3.22, 1.61, 2.45, -0.01, 1.26, 2.37, 0.18, 5.34, 1.12, 3.86, 2.18, 11.47, 2.89, 17.77, -0.03, 1.45, 11.45, 9.03, 1.29, 0.24, 1.52, 1.8, 1.08, 0.66, 0.25, 4.12, 0.08, 16.42, 1.07]} \ No newline at end of file diff --git a/annotations_1/ccr0gfJ5q0I_filtered.json b/annotations_1/ccr0gfJ5q0I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f96600fbd0151dc867315dba717f71eca7f9e4a5 --- /dev/null +++ b/annotations_1/ccr0gfJ5q0I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 82.16], [83.0, 83.54], [90.0, 94.9], [97.0, 98.96], [100.0, 100.74], [101.0, 102.52], [104.0, 104.77], [106.0, 106.07], [112.0, 113.48], [114.0, 114.71], [115.0, 115.84], [122.0, 125.52], [127.0, 127.79], [129.0, 129.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.54, 4.9, 1.96, 0.74, 1.52, 0.77, 0.07, 1.48, 0.71, 0.84, 3.52, 0.79, 0.69]} \ No newline at end of file diff --git a/annotations_1/ce5cnb_5dVk_filtered.json b/annotations_1/ce5cnb_5dVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48ba0ac3e0e9d482ca9bdb93512cc72488443fee --- /dev/null +++ b/annotations_1/ce5cnb_5dVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.09], [18.0, 22.33], [24.0, 40.76], [42.0, 45.0], [49.0, 50.16], [51.0, 54.4], [56.0, 58.19], [61.0, 61.18], [62.0, 62.43], [63.0, 63.68], [68.0, 68.59], [70.0, 71.29], [72.0, 79.86], [80.0, 80.42], [80.0, 80.45], [80.0, 80.49], [81.0, 80.52], [82.0, 81.82], [82.0, 86.7], [90.0, 90.69], [91.0, 95.22], [97.0, 99.08], [100.0, 100.72], [104.0, 104.63], [108.0, 108.63], [120.0, 120.72], [121.0, 127.3], [128.0, 131.03], [135.0, 135.84], [136.0, 138.05], [138.0, 141.52], [142.0, 142.05], [142.0, 142.1], [143.0, 146.37], [149.0, 149.42], [153.0, 155.16]], "keep_status": [true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [49.45, 78.55, 43.05, 46.05, 0.0, 34.82, 50.71, 0.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.67, 0.0, 64.75, 77.36, 0.0, 0.0, 0.0, 0.0, 44.2, 33.81, 0.0, 34.47, 33.22, 0.0, 0.0, 35.57, 0.0, 58.72], "audiomae_on_audioset": [[["music", 14.74], ["livestock, farm animals, working animals", 10.18], ["sidetone", 9.64]], null, [["music", 44.97], ["radio", 5.39], ["hum", 3.94]], [["hum", 36.74], ["mains hum", 32.66], ["buzz", 7.0]], null, [["music", 23.31], ["hum", 20.51], ["pulse", 8.63]], null, null, null, null, null, null, [["music", 33.24], ["hum", 25.84], ["mains hum", 13.38]], null, null, null, null, null, [["music", 32.14], ["hum", 23.77], ["throbbing", 14.73]], null, null, null, null, null, null, null, [["music", 46.75], ["didgeridoo", 35.98], ["theremin", 2.7]], [["music", 43.09], ["carnatic music", 10.0], ["musical instrument", 4.23]], null, [["music", 33.88], ["speech", 21.22], ["theremin", 11.76]], [["speech", 34.1], ["theremin", 26.89], ["music", 16.63]], null, null, [["music", 41.57], ["speech", 30.83], ["musical instrument", 3.34]], null, null], "duration": [9.09, 4.33, 16.76, 3.0, 1.16, 3.4, 2.19, 0.18, 0.43, 0.68, 0.59, 1.29, 7.86, 0.42, 0.45, 0.49, -0.48, -0.18, 4.7, 0.69, 4.22, 2.08, 0.72, 0.63, 0.63, 0.72, 6.3, 3.03, 0.84, 2.05, 3.52, 0.05, 0.1, 3.37, 0.42, 2.16]} \ No newline at end of file diff --git a/annotations_1/ceWNY5eNSWY_filtered.json b/annotations_1/ceWNY5eNSWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10469844e7e03983aaf538fb42cc3f338b396103 --- /dev/null +++ b/annotations_1/ceWNY5eNSWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.61], [11.0, 11.13], [20.0, 20.22], [22.0, 22.37], [24.0, 25.34], [28.0, 29.59], [30.0, 32.37], [40.0, 41.13], [42.0, 42.03], [50.0, 52.32], [53.0, 53.23], [55.0, 56.47], [58.0, 60.93], [64.0, 65.28], [71.0, 71.32], [73.0, 72.82], [76.0, 77.67], [96.0, 98.24], [100.0, 102.95], [105.0, 106.71], [107.0, 107.92], [112.0, 112.13], [113.0, 114.03], [117.0, 119.64], [122.0, 130.23], [131.0, 132.02], [132.0, 133.61]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 44.84, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 0.0, 37.75, 99.78, 0.0, 0.0, 0.0, 0.0, 71.29, 67.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 29.22], ["sine wave", 27.82], ["chirp tone", 11.34]], null, null, null, null, null, null, null, [["speech", 20.08], ["sine wave", 19.86], ["chirp tone", 11.81]], null, null, null, null, null, null, null, null, null], "duration": [1.61, 0.13, 0.22, 0.37, 1.34, 1.59, 2.37, 1.13, 0.03, 2.32, 0.23, 1.47, 2.93, 1.28, 0.32, -0.18, 1.67, 2.24, 2.95, 1.71, 0.92, 0.13, 1.03, 2.64, 8.23, 1.02, 1.61]} \ No newline at end of file diff --git a/annotations_1/cfB1QaweRKU_filtered.json b/annotations_1/cfB1QaweRKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9c7959228ee2e1345934965b8bf5fdf2bf18ff1 --- /dev/null +++ b/annotations_1/cfB1QaweRKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [2.0, 1.8], [2.0, 2.0], [2.0, 3.64], [5.0, 6.72], [8.0, 9.86], [12.0, 13.2], [17.0, 19.84], [21.0, 23.36], [24.0, 64.13], [64.0, 64.96], [68.0, 75.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 64.75, 0.0, 0.0, 34.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 60.16], ["throbbing", 16.5], ["mains hum", 5.22]]], "duration": [0.53, -0.2, 0.0, 1.64, 1.72, 1.86, 1.2, 2.84, 2.36, 40.13, 0.96, 7.91]} \ No newline at end of file diff --git a/annotations_1/cfB9siDjpLk_filtered.json b/annotations_1/cfB9siDjpLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f01db1437c2e37883330a40090ce18d08bd2685 --- /dev/null +++ b/annotations_1/cfB9siDjpLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.64], [4.0, 5.05], [12.0, 12.8], [14.0, 14.72], [16.0, 16.68], [18.0, 18.5], [34.0, 33.78], [34.0, 33.81], [34.0, 33.84], [34.0, 34.21], [35.0, 35.01], [40.0, 40.05], [41.0, 41.54], [43.0, 43.73], [45.0, 45.59], [47.0, 47.68], [57.0, 59.9], [64.0, 64.34], [93.0, 98.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.26, 0.0, 30.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.22], ["grunt", 7.67], ["animal", 7.21]], null, [["breaking", 20.0], ["whack, thwack", 17.33], ["clang", 11.48]]], "duration": [1.64, 1.05, 0.8, 0.72, 0.68, 0.5, -0.22, -0.19, -0.16, 0.21, 0.01, 0.05, 0.54, 0.73, 0.59, 0.68, 2.9, 0.34, 5.73]} \ No newline at end of file diff --git a/annotations_1/cfnBcA2ckeQ_filtered.json b/annotations_1/cfnBcA2ckeQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1453ce3e4c869e453fe6db860e84ab6056df80fc --- /dev/null +++ b/annotations_1/cfnBcA2ckeQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 117.32], [123.0, 123.67], [126.0, 125.96]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [106.32, 0.67, -0.04]} \ No newline at end of file diff --git a/annotations_1/cg49Y3jpZsQ_filtered.json b/annotations_1/cg49Y3jpZsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2b6b0d519c05ebf829472cfd51fbc00efae5f2b --- /dev/null +++ b/annotations_1/cg49Y3jpZsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.44], [10.0, 10.15], [13.0, 13.2], [18.0, 19.85], [28.0, 28.93], [31.0, 31.92], [35.0, 35.58], [37.0, 53.6], [55.0, 57.38], [58.0, 60.12], [62.0, 64.25], [71.0, 75.81], [76.0, 77.23], [78.0, 78.14], [87.0, 87.35], [90.0, 108.45], [112.0, 121.68]], "keep_status": [true, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false, true], "silence_prob": [38.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.45, 31.16, 30.75, 30.0, 30.12, 0.0, 0.0, 0.0, 29.36, 37.36], "audiomae_on_audioset": [[["speech", 26.97], ["music", 21.0], ["outside, rural or natural", 4.22]], null, null, null, null, null, null, [["hum", 33.14], ["throbbing", 18.08], ["mains hum", 15.64]], [["music", 63.06], ["speech", 18.42], ["scary music", 4.1]], [["music", 31.48], ["speech", 16.01], ["moo", 6.4]], [["hum", 34.94], ["mains hum", 32.7], ["music", 12.62]], [["vehicle", 40.18], ["car", 12.17], ["race car, auto racing", 5.74]], null, null, null, [["buzz", 59.74], ["music", 23.83], ["speech", 1.99]], [["hum", 21.93], ["boing", 12.59], ["music", 10.07]]], "duration": [3.44, 0.15, 0.2, 1.85, 0.93, 0.92, 0.58, 16.6, 2.38, 2.12, 2.25, 4.81, 1.23, 0.14, 0.35, 18.45, 9.68]} \ No newline at end of file diff --git a/annotations_1/cgLMSMIU124_filtered.json b/annotations_1/cgLMSMIU124_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a3b4ec029badd09a079aff800a700f04ca90cf8 --- /dev/null +++ b/annotations_1/cgLMSMIU124_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 88.57], [89.0, 90.42], [91.0, 92.5], [93.0, 96.8], [103.0, 103.44], [115.0, 114.89], [123.0, 123.94], [129.0, 129.61]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.01, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["breaking", 36.4], ["whack, thwack", 24.95], ["speech", 11.0]], null, null, null, null], "duration": [64.57, 1.42, 1.5, 3.8, 0.44, -0.11, 0.94, 0.61]} \ No newline at end of file diff --git a/annotations_1/cglsMVVevx8_filtered.json b/annotations_1/cglsMVVevx8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f1a2c8c1b7f4e11e44b4a9889d33446d3c9c6a3 --- /dev/null +++ b/annotations_1/cglsMVVevx8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.38], [6.0, 9.19], [10.0, 10.0], [10.0, 11.75], [13.0, 13.0], [15.0, 14.88], [17.0, 17.42], [32.0, 32.73], [35.0, 35.24], [41.0, 42.21], [46.0, 53.05], [54.0, 67.66], [70.0, 71.73], [74.0, 75.69], [78.0, 78.54], [82.0, 84.35], [87.0, 148.22], [152.0, 154.47], [157.0, 177.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true], "silence_prob": [0.0, 72.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.07, 39.58, 0.0, 0.0, 0.0, 34.78, 0.0, 34.12, 34.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.68], ["whack, thwack", 13.09], ["echo", 5.28]], null, null, null, [["music", 38.52], ["didgeridoo", 15.2], ["speech", 11.82]], null, [["trombone", 49.48], ["music", 15.02], ["brass instrument", 12.12]], [["music", 25.22], ["brass instrument", 13.64], ["trombone", 10.51]]], "duration": [0.38, 3.19, 0.0, 1.75, 0.0, -0.12, 0.42, 0.73, 0.24, 1.21, 7.05, 13.66, 1.73, 1.69, 0.54, 2.35, 61.22, 2.47, 20.06]} \ No newline at end of file diff --git a/annotations_1/cgoMJXAmLdc_filtered.json b/annotations_1/cgoMJXAmLdc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96855a8343c74b7d4c7785f72d6e971b23ae8f4f --- /dev/null +++ b/annotations_1/cgoMJXAmLdc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.82], [10.0, 10.52], [11.0, 11.77], [12.0, 25.83], [26.0, 27.13], [31.0, 33.62], [36.0, 36.31], [39.0, 39.83], [44.0, 45.18]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [69.2, 0.0, 0.0, 81.89, 0.0, 75.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [2.82, 0.52, 0.77, 13.83, 1.13, 2.62, 0.31, 0.83, 1.18]} \ No newline at end of file diff --git a/annotations_1/ch_JeDyNaFM_filtered.json b/annotations_1/ch_JeDyNaFM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9ccd4a7ecca2b4560cd47dafa263a68a59b1e1d --- /dev/null +++ b/annotations_1/ch_JeDyNaFM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 21.59], [23.0, 38.06], [39.0, 176.57], [177.0, 178.41], [180.0, 184.6], [185.0, 191.71], [193.0, 196.01], [197.0, 198.93], [202.0, 202.53], [206.0, 227.37], [230.0, 233.58], [235.0, 235.38], [237.0, 237.52], [242.0, 243.4]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true, false, false, false], "silence_prob": [29.58, 29.64, 0.0, 0.0, 40.07, 39.07, 53.28, 0.0, 0.0, 30.31, 38.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 47.54], ["throbbing", 34.45], ["mains hum", 8.52]], [["hum", 45.1], ["speech", 19.74], ["mains hum", 10.4]], null, null, [["hum", 35.0], ["throbbing", 18.06], ["mains hum", 17.11]], [["speech", 28.21], ["livestock, farm animals, working animals", 22.33], ["rumble", 8.05]], null, null, null, [["hum", 18.13], ["mains hum", 17.85], ["scary music", 16.32]], [["grunt", 20.06], ["music", 10.28], ["groan", 10.14]], null, null, null], "duration": [19.59, 15.06, 137.57, 1.41, 4.6, 6.71, 3.01, 1.93, 0.53, 21.37, 3.58, 0.38, 0.52, 1.4]} \ No newline at end of file diff --git a/annotations_1/chvjkV0jRh8_filtered.json b/annotations_1/chvjkV0jRh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d159e311fc1b6335f3ce17cba084a6676cf363cc --- /dev/null +++ b/annotations_1/chvjkV0jRh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.21], [13.0, 21.02], [23.0, 28.24], [29.0, 31.16], [33.0, 47.01], [48.0, 68.35], [70.0, 69.9], [70.0, 70.97], [72.0, 72.28], [75.0, 75.42], [76.0, 78.9], [80.0, 81.65], [84.0, 83.94], [87.0, 88.01], [92.0, 94.83], [95.0, 97.46], [98.0, 98.58], [100.0, 99.81], [101.0, 100.99], [101.0, 105.39], [106.0, 112.55], [114.0, 114.32], [115.0, 117.58], [120.0, 123.33], [124.0, 125.27], [127.0, 127.08], [128.0, 129.36], [130.0, 131.38], [132.0, 143.99], [145.0, 146.31], [147.0, 148.39], [149.0, 150.42], [153.0, 171.48]], "keep_status": [true, true, false, true, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [33.01, 35.77, 38.45, 37.16, 33.71, 48.61, 0.0, 0.0, 0.0, 0.0, 45.65, 0.0, 0.0, 0.0, 35.57, 32.18, 0.0, 0.0, 0.0, 33.54, 31.84, 0.0, 31.59, 29.47, 0.0, 0.0, 0.0, 0.0, 32.84, 0.0, 0.0, 0.0, 30.98], "audiomae_on_audioset": [[["music", 46.29], ["theremin", 17.0], ["double bass", 6.44]], [["music", 45.33], ["double bass", 9.05], ["musical instrument", 7.2]], [["music", 61.69], ["theremin", 9.15], ["guitar", 4.02]], [["music", 50.01], ["foghorn", 10.19], ["ambient music", 3.74]], [["music", 83.31], ["musical instrument", 2.97], ["theremin", 2.81]], [["music", 45.03], ["double bass", 10.93], ["cello", 8.92]], null, null, null, null, [["music", 47.78], ["didgeridoo", 8.99], ["musical instrument", 7.88]], null, null, null, [["music", 50.77], ["theremin", 9.6], ["synthesizer", 5.18]], [["double bass", 28.89], ["music", 25.71], ["cello", 17.05]], null, null, null, [["music", 51.2], ["cello", 8.52], ["double bass", 8.22]], [["music", 38.13], ["cello", 25.3], ["double bass", 12.31]], null, [["cello", 33.88], ["music", 26.16], ["double bass", 12.63]], [["music", 46.98], ["musical instrument", 12.14], ["bowed string instrument", 10.4]], null, null, null, null, [["music", 58.56], ["musical instrument", 6.18], ["violin, fiddle", 5.83]], null, null, null, [["music", 64.28], ["throbbing", 5.87], ["hum", 5.13]]], "duration": [8.21, 8.02, 5.24, 2.16, 14.01, 20.35, -0.1, 0.97, 0.28, 0.42, 2.9, 1.65, -0.06, 1.01, 2.83, 2.46, 0.58, -0.19, -0.01, 4.39, 6.55, 0.32, 2.58, 3.33, 1.27, 0.08, 1.36, 1.38, 11.99, 1.31, 1.39, 1.42, 18.48]} \ No newline at end of file diff --git a/annotations_1/cibZY1GwVQg_filtered.json b/annotations_1/cibZY1GwVQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba5e9254cb788e8ece7fe313a8eea6e6704bad3a --- /dev/null +++ b/annotations_1/cibZY1GwVQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.99], [6.0, 6.51], [9.0, 8.9], [14.0, 14.64], [19.0, 19.26], [25.0, 26.05], [27.0, 28.38], [30.0, 36.09], [38.0, 38.96], [43.0, 44.64], [51.0, 51.12], [53.0, 53.03], [53.0, 54.38], [55.0, 58.13], [59.0, 60.81], [61.0, 62.88], [63.0, 63.02], [63.0, 63.36], [64.0, 64.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.01, 0.51, -0.1, 0.64, 0.26, 1.05, 1.38, 6.09, 0.96, 1.64, 0.12, 0.03, 1.38, 3.13, 1.81, 1.88, 0.02, 0.36, 0.57]} \ No newline at end of file diff --git a/annotations_1/cil6HFXlccw_filtered.json b/annotations_1/cil6HFXlccw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..204b4007982dd2cc4ef30ed6b729e1b952173c26 --- /dev/null +++ b/annotations_1/cil6HFXlccw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 41.39]], "keep_status": [true], "silence_prob": [32.94], "audiomae_on_audioset": [[["music", 34.72], ["speech", 12.69], ["vehicle", 10.06]]], "duration": [20.39]} \ No newline at end of file diff --git a/annotations_1/cio6rIbCs-I_filtered.json b/annotations_1/cio6rIbCs-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba4a15b5fce4223112f50ad5a693afa52d330a5d --- /dev/null +++ b/annotations_1/cio6rIbCs-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.32], [10.0, 10.61], [11.0, 12.41], [15.0, 15.69], [17.0, 22.64], [23.0, 24.38], [25.0, 27.08], [29.0, 29.56], [31.0, 31.58], [33.0, 33.47], [35.0, 36.26], [37.0, 37.61], [39.0, 39.41], [40.0, 45.74], [47.0, 47.53], [48.0, 49.06], [50.0, 50.5], [51.0, 53.47], [54.0, 54.4], [55.0, 55.95], [57.0, 64.52], [69.0, 69.42], [71.0, 72.17], [73.0, 75.36], [76.0, 81.6], [87.0, 87.47], [91.0, 95.54], [96.0, 108.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false], "silence_prob": [50.36, 0.0, 0.0, 0.0, 49.5, 0.0, 42.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.18, 0.0, 0.0, 0.0, 84.43, 0.0, 0.0, 45.05, 0.0, 0.0, 35.94, 46.79, 0.0, 58.13, 98.01], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 66.63], ["hum", 16.37], ["clang", 1.12]], null, [["sidetone", 67.92], ["speech", 17.44], ["dial tone", 2.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.48], ["didgeridoo", 23.61], ["noise", 4.98]], null, null, [["speech", 34.53], ["sidetone", 19.53], ["music", 12.33]], [["sidetone", 24.85], ["noise", 21.9], ["mains hum", 11.23]], null, null, null], "duration": [2.32, 0.61, 1.41, 0.69, 5.64, 1.38, 2.08, 0.56, 0.58, 0.47, 1.26, 0.61, 0.41, 5.74, 0.53, 1.06, 0.5, 2.47, 0.4, 0.95, 7.52, 0.42, 1.17, 2.36, 5.6, 0.47, 4.54, 12.94]} \ No newline at end of file diff --git a/annotations_1/cj5Mp68u2tY_filtered.json b/annotations_1/cj5Mp68u2tY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f2804ae57f68028ac4becb48832afac311f2bb2 --- /dev/null +++ b/annotations_1/cj5Mp68u2tY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[109.0, 108.94], [110.0, 110.61], [111.0, 125.31]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 30.55], "audiomae_on_audioset": [null, null, [["music", 52.73], ["livestock, farm animals, working animals", 9.23], ["cattle, bovinae", 5.87]]], "duration": [-0.06, 0.61, 14.31]} \ No newline at end of file diff --git a/annotations_1/cjy-8dXBljk_filtered.json b/annotations_1/cjy-8dXBljk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0dc239f8981bba2ae5eed6949420c3df986adef --- /dev/null +++ b/annotations_1/cjy-8dXBljk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[108.0, 118.13], [120.0, 123.3], [126.0, 126.98], [129.0, 132.16], [133.0, 133.95], [136.0, 143.46], [144.0, 146.3], [147.0, 147.6], [149.0, 149.84]], "keep_status": [true, true, false, true, false, true, true, false, false], "silence_prob": [29.26, 30.66, 0.0, 29.09, 0.0, 29.54, 33.85, 0.0, 0.0], "audiomae_on_audioset": [[["music", 11.76], ["vehicle", 11.51], ["air horn, truck horn", 9.85]], [["mains hum", 30.28], ["hum", 19.42], ["throbbing", 18.45]], null, [["mains hum", 20.0], ["speech", 17.53], ["buzz", 10.84]], null, [["fly, housefly", 9.89], ["music", 6.55], ["electric shaver, electric razor", 6.46]], [["speech", 41.68], ["music", 8.78], ["vehicle", 6.68]], null, null], "duration": [10.13, 3.3, 0.98, 3.16, 0.95, 7.46, 2.3, 0.6, 0.84]} \ No newline at end of file diff --git a/annotations_1/clDZPzwANeE_filtered.json b/annotations_1/clDZPzwANeE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..687d557bcb88540b969fa05884c7474c21cfd4a9 --- /dev/null +++ b/annotations_1/clDZPzwANeE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.91], [11.0, 10.88], [11.0, 19.63], [22.0, 28.92], [33.0, 33.45], [34.0, 36.41], [36.0, 38.33], [41.0, 46.99], [48.0, 50.25], [52.0, 55.32], [57.0, 59.31], [60.0, 61.37], [68.0, 68.67], [71.0, 71.69], [73.0, 78.07], [81.0, 82.38], [84.0, 86.44], [89.0, 93.46], [96.0, 98.76], [111.0, 118.35]], "keep_status": [false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 46.5, 74.13, 0.0, 45.85, 43.45, 47.31, 62.68, 94.52, 70.44, 0.0, 0.0, 0.0, 39.28, 0.0, 76.2, 83.16, 97.54, 37.69], "audiomae_on_audioset": [null, null, [["speech", 77.13], ["hum", 3.05], ["whale vocalization", 1.87]], null, null, [["music", 25.88], ["hum", 16.26], ["throbbing", 11.31]], [["speech", 57.13], ["music", 5.12], ["inside, small room", 3.65]], [["sidetone", 26.77], ["speech", 23.75], ["dishes, pots, and pans", 6.38]], null, null, null, null, null, null, [["speech", 69.31], ["synthesizer", 6.61], ["music", 5.06]], null, null, null, null, [["thunk", 35.81], ["crushing", 14.65], ["hum", 5.17]]], "duration": [0.91, -0.12, 8.63, 6.92, 0.45, 2.41, 2.33, 5.99, 2.25, 3.32, 2.31, 1.37, 0.67, 0.69, 5.07, 1.38, 2.44, 4.46, 2.76, 7.35]} \ No newline at end of file diff --git a/annotations_1/cm1NBLlRxy0_filtered.json b/annotations_1/cm1NBLlRxy0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..062e3cf24b90a569a4bc6c64b90ecaae24b77bd4 --- /dev/null +++ b/annotations_1/cm1NBLlRxy0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.71], [24.0, 27.16], [27.0, 27.24], [27.0, 30.0], [42.0, 42.53], [45.0, 45.28], [46.0, 46.79], [68.0, 68.37], [72.0, 72.39], [77.0, 87.89], [96.0, 96.3], [97.0, 104.45], [105.0, 105.46], [120.0, 120.33], [121.0, 122.1], [122.0, 151.97], [167.0, 167.21], [171.0, 180.77], [193.0, 194.51], [195.0, 197.9], [206.0, 207.17], [208.0, 213.66], [217.0, 217.17], [219.0, 226.4]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.16, 30.33, 0.0, 30.5, 0.0, 0.0, 0.0, 0.0, 0.0, 33.98, 0.0, 30.88, 0.0, 0.0, 0.0, 29.52, 0.0, 29.55, 0.0, 30.09, 0.0, 30.4, 0.0, 30.76], "audiomae_on_audioset": [[["music", 43.12], ["speech", 19.45], ["didgeridoo", 5.13]], [["moo", 23.47], ["cattle, bovinae", 22.23], ["music", 17.13]], null, [["music", 63.54], ["speech", 6.33], ["didgeridoo", 5.39]], null, null, null, null, null, [["music", 70.66], ["didgeridoo", 7.98], ["speech", 5.99]], null, [["music", 36.34], ["speech", 25.7], ["cattle, bovinae", 3.82]], null, null, null, [["cattle, bovinae", 31.2], ["moo", 28.85], ["livestock, farm animals, working animals", 14.51]], null, [["cattle, bovinae", 30.2], ["moo", 27.6], ["music", 15.16]], null, [["didgeridoo", 43.92], ["music", 26.04], ["musical instrument", 4.6]], null, [["music", 61.19], ["musical instrument", 4.88], ["didgeridoo", 4.49]], null, [["music", 55.89], ["didgeridoo", 12.62], ["synthesizer", 5.62]]], "duration": [4.71, 3.16, 0.24, 3.0, 0.53, 0.28, 0.79, 0.37, 0.39, 10.89, 0.3, 7.45, 0.46, 0.33, 1.1, 29.97, 0.21, 9.77, 1.51, 2.9, 1.17, 5.66, 0.17, 7.4]} \ No newline at end of file diff --git a/annotations_1/cmgeSY8YdO4_filtered.json b/annotations_1/cmgeSY8YdO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c812e170d18137ddb1634f77761dc29b4b76bc7d --- /dev/null +++ b/annotations_1/cmgeSY8YdO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.25], [16.0, 16.36], [21.0, 22.03], [25.0, 25.76], [35.0, 34.82], [37.0, 40.15], [46.0, 48.15], [49.0, 50.23], [52.0, 52.73], [59.0, 59.98], [62.0, 62.78], [64.0, 63.9], [79.0, 78.87], [80.0, 81.24], [83.0, 84.18], [85.0, 86.31], [87.0, 87.1], [88.0, 90.09], [104.0, 107.42], [108.0, 108.38], [112.0, 112.62], [113.0, 113.7], [115.0, 116.13], [117.0, 119.64], [123.0, 137.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.09, 90.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.56, 38.49, 0.0, 0.0, 0.0, 0.0, 97.92, 50.61], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 60.43], ["dishes, pots, and pans", 8.02], ["sidetone", 5.77]], null, null, null, null, null, null, null, null, null, null, null, [["music", 33.15], ["speech", 27.88], ["guitar", 2.38]], [["speech", 17.02], ["fart", 14.88], ["fireworks", 6.54]], null, null, null, null, null, null], "duration": [1.25, 0.36, 1.03, 0.76, -0.18, 3.15, 2.15, 1.23, 0.73, 0.98, 0.78, -0.1, -0.13, 1.24, 1.18, 1.31, 0.1, 2.09, 3.42, 0.38, 0.62, 0.7, 1.13, 2.64, 14.46]} \ No newline at end of file diff --git a/annotations_1/cmkZeTX5fq0_filtered.json b/annotations_1/cmkZeTX5fq0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15d1b7f01fd5e913adcd902d3a5cf91ec6fd6bf8 --- /dev/null +++ b/annotations_1/cmkZeTX5fq0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.5], [21.0, 22.62], [31.0, 35.58], [40.0, 41.84], [62.0, 170.61], [174.0, 174.12], [177.0, 179.39], [185.0, 188.52], [190.0, 190.49], [191.0, 191.57], [192.0, 192.64], [195.0, 197.68], [198.0, 199.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.8, 0.0, 0.0, 0.0, 99.96, 89.72, 0.0, 0.0, 0.0, 98.8, 0.0], "audiomae_on_audioset": [null, null, [["music", 63.97], ["didgeridoo", 13.24], ["electronic music", 1.79]], null, null, null, null, null, null, null, null, null, null], "duration": [1.5, 1.62, 4.58, 1.84, 108.61, 0.12, 2.39, 3.52, 0.49, 0.57, 0.64, 2.68, 1.84]} \ No newline at end of file diff --git a/annotations_1/cmlELkvVPeQ_filtered.json b/annotations_1/cmlELkvVPeQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de697dafdebe46f643f4c4dcfe94b700b29769bd --- /dev/null +++ b/annotations_1/cmlELkvVPeQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.13], [5.0, 5.14], [9.0, 9.39], [11.0, 11.94], [33.0, 33.05], [39.0, 39.82], [49.0, 48.64], [49.0, 51.14], [51.0, 53.43], [54.0, 55.71], [66.0, 66.55], [68.0, 67.85], [72.0, 74.71], [75.0, 75.68], [80.0, 81.11], [86.0, 87.08], [89.0, 88.74], [94.0, 94.44], [100.0, 99.91], [122.0, 123.35], [127.0, 127.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.77, 89.72, 0.0, 0.0, 0.0, 51.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.13, 0.14, 0.39, 0.94, 0.05, 0.82, -0.36, 2.14, 2.43, 1.71, 0.55, -0.15, 2.71, 0.68, 1.11, 1.08, -0.26, 0.44, -0.09, 1.35, 0.58]} \ No newline at end of file diff --git a/annotations_1/cn35LhT9zBg_filtered.json b/annotations_1/cn35LhT9zBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..337ebe0c0ccf71547bb07143e20f525a1352afcc --- /dev/null +++ b/annotations_1/cn35LhT9zBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 31.6], [32.0, 59.16], [60.0, 61.1], [65.0, 78.65], [82.0, 82.44], [83.0, 83.51], [84.0, 91.25], [94.0, 95.1], [97.0, 98.71], [102.0, 105.81], [109.0, 111.18], [114.0, 117.04]], "keep_status": [true, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [35.31, 29.49, 0.0, 30.4, 0.0, 0.0, 33.08, 0.0, 0.0, 39.5, 99.99, 30.02], "audiomae_on_audioset": [[["music", 31.28], ["electric shaver, electric razor", 11.27], ["livestock, farm animals, working animals", 5.55]], [["speech", 34.45], ["music", 21.04], ["gong", 3.54]], null, [["hum", 37.88], ["throbbing", 28.06], ["music", 15.15]], null, null, [["speech", 39.61], ["music", 6.74], ["theremin", 6.54]], null, null, [["speech", 52.81], ["beatboxing", 16.77], ["music", 2.37]], null, [["explosion", 44.99], ["burst, pop", 22.74], ["breaking", 4.75]]], "duration": [14.6, 27.16, 1.1, 13.65, 0.44, 0.51, 7.25, 1.1, 1.71, 3.81, 2.18, 3.04]} \ No newline at end of file diff --git a/annotations_1/cnM9pdjp5o4_filtered.json b/annotations_1/cnM9pdjp5o4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ceba763c3ba280bab7f5c2cfcb4ddd4f481b0d1 --- /dev/null +++ b/annotations_1/cnM9pdjp5o4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [4.0, 5.76], [6.0, 6.59], [14.0, 21.1], [30.0, 37.25], [45.0, 52.89], [54.0, 61.08], [62.0, 65.4], [69.0, 76.86], [79.0, 79.32], [86.0, 85.9], [90.0, 91.1]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.45, 31.55, 36.11, 33.11, 32.23, 37.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["ding", 55.17], ["music", 15.44], ["speech", 15.02]], [["music", 81.36], ["boing", 1.52], ["funny music", 1.1]], [["music", 80.27], ["funk", 2.14], ["singing", 1.08]], [["music", 75.09], ["firecracker", 4.18], ["speech", 2.57]], [["music", 26.43], ["mosquito", 22.62], ["cattle, bovinae", 8.23]], [["music", 80.94], ["speech", 7.24], ["boing", 1.83]], null, null, null], "duration": [0.22, 1.76, 0.59, 7.1, 7.25, 7.89, 7.08, 3.4, 7.86, 0.32, -0.1, 1.1]} \ No newline at end of file diff --git a/annotations_1/cnwddNSgakk_filtered.json b/annotations_1/cnwddNSgakk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1631a2ffab3b25ce518046fcba444b3c9926d880 --- /dev/null +++ b/annotations_1/cnwddNSgakk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.85], [21.0, 21.69], [25.0, 26.03], [28.0, 36.1], [38.0, 37.96], [50.0, 52.54], [56.0, 72.13], [74.0, 74.55], [75.0, 76.0], [81.0, 81.62], [89.0, 89.26], [91.0, 94.8], [104.0, 104.53], [115.0, 115.8], [130.0, 141.4], [143.0, 143.43], [144.0, 145.49], [149.0, 157.82], [161.0, 166.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.3, 0.0, 45.43, 30.07, 0.0, 0.0, 0.0, 0.0, 30.65, 0.0, 0.0, 30.27, 0.0, 0.0, 33.08, 31.21], "audiomae_on_audioset": [null, null, null, [["music", 62.36], ["synthesizer", 9.93], ["musical instrument", 4.73]], null, [["music", 52.67], ["synthesizer", 19.51], ["musical instrument", 10.73]], [["music", 55.38], ["synthesizer", 15.71], ["theremin", 13.32]], null, null, null, null, [["sidetone", 19.04], ["music", 12.08], ["speech", 11.06]], null, null, [["music", 49.04], ["hum", 12.63], ["theremin", 6.2]], null, null, [["music", 76.7], ["synthesizer", 5.44], ["sampler", 3.25]], [["music", 69.01], ["synthesizer", 8.99], ["musical instrument", 8.38]]], "duration": [1.85, 0.69, 1.03, 8.1, -0.04, 2.54, 16.13, 0.55, 1.0, 0.62, 0.26, 3.8, 0.53, 0.8, 11.4, 0.43, 1.49, 8.82, 5.09]} \ No newline at end of file diff --git a/annotations_1/corlGzKJqAc_filtered.json b/annotations_1/corlGzKJqAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..662a133168a969b982296bc6fd18e58a5fc0c3cb --- /dev/null +++ b/annotations_1/corlGzKJqAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.7], [12.0, 13.41], [15.0, 15.43], [20.0, 20.61], [24.0, 24.66], [27.0, 28.04], [30.0, 30.77], [37.0, 37.77], [40.0, 40.81], [43.0, 43.78], [45.0, 46.38], [48.0, 48.54], [53.0, 53.84], [59.0, 59.37], [67.0, 68.62], [71.0, 71.49], [75.0, 76.38], [87.0, 86.88], [90.0, 90.53], [95.0, 95.82], [97.0, 98.05], [101.0, 101.17], [105.0, 105.63], [109.0, 110.22], [113.0, 112.97], [115.0, 117.53], [119.0, 119.2], [121.0, 121.73], [137.0, 138.0], [150.0, 152.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 38.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.97], ["thunk", 11.39], ["wind instrument, woodwind instrument", 8.2]]], "duration": [0.7, 1.41, 0.43, 0.61, 0.66, 1.04, 0.77, 0.77, 0.81, 0.78, 1.38, 0.54, 0.84, 0.37, 1.62, 0.49, 1.38, -0.12, 0.53, 0.82, 1.05, 0.17, 0.63, 1.22, -0.03, 2.53, 0.2, 0.73, 1.0, 2.95]} \ No newline at end of file diff --git a/annotations_1/cpZIiyp8juU_filtered.json b/annotations_1/cpZIiyp8juU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c1bfc646a708f24c5383df5c4001b95513d8dfd --- /dev/null +++ b/annotations_1/cpZIiyp8juU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.19], [7.0, 18.89], [21.0, 26.28], [27.0, 27.09], [33.0, 139.19], [145.0, 153.86], [155.0, 162.06], [162.0, 170.58], [172.0, 171.98], [173.0, 174.75], [178.0, 190.24], [192.0, 205.63]], "keep_status": [false, true, true, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 33.28, 30.3, 0.0, 0.0, 30.35, 29.74, 29.94, 0.0, 0.0, 30.0, 30.63], "audiomae_on_audioset": [null, [["hum", 22.29], ["music", 19.68], ["didgeridoo", 19.06]], [["speech", 52.53], ["didgeridoo", 8.49], ["hum", 7.17]], null, null, [["moo", 39.07], ["cattle, bovinae", 24.98], ["livestock, farm animals, working animals", 18.14]], [["music", 46.7], ["didgeridoo", 19.03], ["speech", 11.47]], [["music", 65.47], ["didgeridoo", 12.23], ["speech", 7.81]], null, null, [["mains hum", 28.93], ["hum", 22.97], ["music", 17.3]], [["speech", 21.5], ["cattle, bovinae", 10.83], ["music", 9.82]]], "duration": [0.19, 11.89, 5.28, 0.09, 106.19, 8.86, 7.06, 8.58, -0.02, 1.75, 12.24, 13.63]} \ No newline at end of file diff --git a/annotations_1/cqHKducp4MY_filtered.json b/annotations_1/cqHKducp4MY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f6c8c2ee5ec0b85d3cbbc0d45f7cc11a9c532c9 --- /dev/null +++ b/annotations_1/cqHKducp4MY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.01]], "keep_status": [false], "silence_prob": [32.98], "audiomae_on_audioset": [[["throbbing", 46.47], ["hum", 32.59], ["music", 10.29]]], "duration": [3.01]} \ No newline at end of file diff --git a/annotations_1/crI67brUX84_filtered.json b/annotations_1/crI67brUX84_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f2d975f311da7e68e19a93fff189adb9079b725 --- /dev/null +++ b/annotations_1/crI67brUX84_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.02], [17.0, 16.65], [19.0, 19.99], [21.0, 22.62], [23.0, 24.07], [26.0, 30.81], [32.0, 38.37], [39.0, 39.85], [41.0, 42.28], [43.0, 44.39], [49.0, 49.22], [51.0, 54.16], [60.0, 61.65], [63.0, 63.44], [69.0, 72.03], [78.0, 78.88], [83.0, 84.86], [86.0, 86.7], [92.0, 93.24], [94.0, 95.37], [99.0, 99.47], [112.0, 122.52], [124.0, 124.95], [127.0, 127.57], [129.0, 130.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.96, 0.0, 0.0, 0.0, 0.0, 82.25, 99.95, 0.0, 0.0, 0.0, 0.0, 89.36, 0.0, 0.0, 38.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 47.1], ["speech", 22.9], ["sine wave", 4.84]], null, null, null, null, null, null, null, null, null, null], "duration": [2.02, -0.35, 0.99, 1.62, 1.07, 4.81, 6.37, 0.85, 1.28, 1.39, 0.22, 3.16, 1.65, 0.44, 3.03, 0.88, 1.86, 0.7, 1.24, 1.37, 0.47, 10.52, 0.95, 0.57, 1.74]} \ No newline at end of file diff --git a/annotations_1/crIlIvBYMoc_filtered.json b/annotations_1/crIlIvBYMoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8df0f910252e8794b410d773e987a9a80ad1d0a --- /dev/null +++ b/annotations_1/crIlIvBYMoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 41.15], [42.0, 50.67], [58.0, 60.71], [62.0, 65.23], [68.0, 71.83], [75.0, 77.09], [80.0, 81.65], [82.0, 87.62], [89.0, 102.32], [104.0, 107.82], [110.0, 111.84], [113.0, 114.34], [115.0, 116.51], [118.0, 119.99], [126.0, 128.34]], "keep_status": [false, false, true, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 66.76, 38.16, 32.94, 28.37, 49.5, 0.0, 76.04, 98.93, 98.86, 0.0, 0.0, 0.0, 0.0, 97.33], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 40.89], ["moo", 17.98], ["speech", 11.03]], [["whale vocalization", 58.56], ["cattle, bovinae", 13.55], ["livestock, farm animals, working animals", 13.14]], [["music", 9.23], ["boom", 8.84], ["whack, thwack", 8.07]], [["speech", 21.14], ["animal", 6.05], ["smash, crash", 5.76]], null, null, null, null, null, null, null, null, null], "duration": [31.15, 8.67, 2.71, 3.23, 3.83, 2.09, 1.65, 5.62, 13.32, 3.82, 1.84, 1.34, 1.51, 1.99, 2.34]} \ No newline at end of file diff --git a/annotations_1/crKAy2dGX_8_filtered.json b/annotations_1/crKAy2dGX_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..131346fac4cbc596382542a86e2d64c2b02e03ee --- /dev/null +++ b/annotations_1/crKAy2dGX_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.82]], "keep_status": [false], "silence_prob": [56.33], "audiomae_on_audioset": [null], "duration": [3.82]} \ No newline at end of file diff --git a/annotations_1/cslI2draO_E_filtered.json b/annotations_1/cslI2draO_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac34ced775d104c71f794e3351032d4a0862d9f7 --- /dev/null +++ b/annotations_1/cslI2draO_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.79], [18.0, 22.15], [26.0, 26.13], [30.0, 30.81], [38.0, 38.57], [43.0, 44.83], [46.0, 46.8], [48.0, 53.49], [54.0, 55.78], [57.0, 58.16], [61.0, 61.77], [62.0, 63.69], [66.0, 71.04], [73.0, 74.09], [77.0, 79.03], [80.0, 81.14], [82.0, 83.25], [84.0, 85.29], [89.0, 90.24], [91.0, 92.58], [98.0, 103.13], [105.0, 110.22], [118.0, 120.11], [126.0, 141.76]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 31.4, 0.0, 0.0, 0.0, 0.0, 0.0, 43.13, 0.0, 0.0, 0.0, 0.0, 49.59, 0.0, 46.29, 0.0, 0.0, 0.0, 0.0, 0.0, 31.8, 29.58, 35.81, 29.3], "audiomae_on_audioset": [null, [["noise", 27.71], ["music", 24.07], ["whale vocalization", 6.68]], null, null, null, null, null, [["hum", 24.71], ["speech", 21.12], ["music", 9.45]], null, null, null, null, [["music", 56.48], ["hum", 8.21], ["whale vocalization", 4.9]], null, [["hoot", 37.59], ["owl", 36.17], ["music", 8.97]], null, null, null, null, null, [["hum", 25.67], ["music", 15.11], ["throbbing", 7.79]], [["groan", 17.17], ["music", 15.6], ["livestock, farm animals, working animals", 11.41]], [["sidetone", 70.65], ["music", 10.63], ["speech", 3.29]], [["music", 33.1], ["explosion", 7.32], ["speech", 7.28]]], "duration": [1.79, 4.15, 0.13, 0.81, 0.57, 1.83, 0.8, 5.49, 1.78, 1.16, 0.77, 1.69, 5.04, 1.09, 2.03, 1.14, 1.25, 1.29, 1.24, 1.58, 5.13, 5.22, 2.11, 15.76]} \ No newline at end of file diff --git a/annotations_1/ctd3NPx1pdM_filtered.json b/annotations_1/ctd3NPx1pdM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40c20cede90a8862f71d43c49a3aa7c805311d3c --- /dev/null +++ b/annotations_1/ctd3NPx1pdM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.3], [4.0, 4.41], [5.0, 7.26], [9.0, 17.07], [19.0, 18.81], [20.0, 20.44], [21.0, 21.22], [21.0, 29.08], [30.0, 30.4], [32.0, 34.55], [35.0, 36.9], [38.0, 39.33], [40.0, 41.35], [42.0, 45.91], [50.0, 50.77], [53.0, 56.25], [59.0, 59.48], [61.0, 62.5], [65.0, 66.38], [67.0, 69.75], [74.0, 74.56], [77.0, 77.41], [79.0, 78.81], [82.0, 82.58], [84.0, 84.96], [89.0, 89.43], [92.0, 92.15], [93.0, 97.53], [98.0, 99.47], [101.0, 102.37], [113.0, 113.02], [114.0, 117.98], [120.0, 120.41], [123.0, 123.9], [126.0, 126.72], [136.0, 137.64], [139.0, 139.92], [143.0, 144.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 84.98, 58.38, 0.0, 0.0, 0.0, 62.89, 0.0, 91.98, 0.0, 0.0, 0.0, 67.51, 0.0, 99.88, 0.0, 0.0, 0.0, 34.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.44, 0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.72], ["telephone", 17.84], ["busy signal", 6.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.3, 0.41, 2.26, 8.07, -0.19, 0.44, 0.22, 8.08, 0.4, 2.55, 1.9, 1.33, 1.35, 3.91, 0.77, 3.25, 0.48, 1.5, 1.38, 2.75, 0.56, 0.41, -0.19, 0.58, 0.96, 0.43, 0.15, 4.53, 1.47, 1.37, 0.02, 3.98, 0.41, 0.9, 0.72, 1.64, 0.92, 1.58]} \ No newline at end of file diff --git a/annotations_1/ctjucF9fiFw_filtered.json b/annotations_1/ctjucF9fiFw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d69b2e51d9e865911c4470c579c78a98b23f931d --- /dev/null +++ b/annotations_1/ctjucF9fiFw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 25.35], [26.0, 26.64], [27.0, 27.94], [36.0, 37.42], [39.0, 41.28], [46.0, 50.53], [59.0, 62.34], [67.0, 72.08], [75.0, 77.79], [80.0, 83.15], [84.0, 84.97], [85.0, 86.61], [94.0, 93.9], [96.0, 100.92]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false, false, true], "silence_prob": [36.24, 0.0, 0.0, 0.0, 41.34, 29.62, 36.76, 70.3, 33.7, 41.6, 0.0, 0.0, 0.0, 30.62], "audiomae_on_audioset": [[["music", 40.59], ["hum", 19.49], ["throbbing", 5.56]], null, null, null, [["music", 65.69], ["speech", 16.8], ["electronic music", 2.27]], [["music", 32.2], ["hum", 23.85], ["mains hum", 15.43]], [["throbbing", 39.22], ["hum", 22.28], ["music", 8.47]], null, [["music", 37.96], ["glass", 16.01], ["breaking", 11.16]], [["music", 63.97], ["musical instrument", 6.53], ["didgeridoo", 5.51]], null, null, null, [["music", 53.29], ["boing", 7.55], ["sound effect", 5.08]]], "duration": [10.35, 0.64, 0.94, 1.42, 2.28, 4.53, 3.34, 5.08, 2.79, 3.15, 0.97, 1.61, -0.1, 4.92]} \ No newline at end of file diff --git a/annotations_1/cv8yjJQg4Nc_filtered.json b/annotations_1/cv8yjJQg4Nc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3af38033af164bf371d0687a15eccb20c45d3de --- /dev/null +++ b/annotations_1/cv8yjJQg4Nc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [4.0, 3.55], [7.0, 8.19], [12.0, 13.05], [14.0, 14.99], [17.0, 17.24], [20.0, 20.88], [23.0, 24.48], [26.0, 28.11], [49.0, 49.1], [53.0, 53.74], [55.0, 55.43], [61.0, 61.45], [76.0, 78.11]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.91, 0.0, 0.0, 0.0, 0.0, 58.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["echo", 49.91], ["effects unit", 9.28], ["reverberation", 7.12]], null, null, null, null, null], "duration": [0.04, -0.45, 1.19, 1.05, 0.99, 0.24, 0.88, 1.48, 2.11, 0.1, 0.74, 0.43, 0.45, 2.11]} \ No newline at end of file diff --git a/annotations_1/cvNjYmDiV0Y_filtered.json b/annotations_1/cvNjYmDiV0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92f0d30165524eb512a523afffa08b213e2a3242 --- /dev/null +++ b/annotations_1/cvNjYmDiV0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.08], [10.0, 12.83], [15.0, 15.58], [17.0, 19.38], [21.0, 23.36], [28.0, 28.41], [32.0, 32.58], [35.0, 36.51], [38.0, 39.5], [40.0, 80.35], [81.0, 84.6], [85.0, 107.05], [107.0, 115.53], [116.0, 115.62], [116.0, 116.01], [121.0, 124.16], [125.0, 139.63], [146.0, 147.19], [148.0, 149.03], [150.0, 150.18], [150.0, 150.85], [160.0, 160.62], [165.0, 166.68], [167.0, 168.15], [170.0, 170.92], [173.0, 175.17], [176.0, 179.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 56.03, 0.0, 67.63, 50.56, 0.0, 0.0, 0.0, 0.0, 0.0, 36.23, 40.12, 31.11, 0.0, 0.0, 32.26, 31.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 75.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["thunk", 46.54], ["music", 30.27], ["knock", 5.25]], [["music", 37.25], ["fly, housefly", 10.98], ["effects unit", 7.18]], [["whack, thwack", 21.6], ["gong", 11.37], ["breaking", 10.31]], null, null, [["cattle, bovinae", 33.31], ["moo", 26.76], ["livestock, farm animals, working animals", 16.6]], [["animal", 20.66], ["cattle, bovinae", 17.34], ["moo", 9.14]], null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 2.83, 0.58, 2.38, 2.36, 0.41, 0.58, 1.51, 1.5, 40.35, 3.6, 22.05, 8.53, -0.38, 0.01, 3.16, 14.63, 1.19, 1.03, 0.18, 0.85, 0.62, 1.68, 1.15, 0.92, 2.17, 3.19]} \ No newline at end of file diff --git a/annotations_1/cvPIBkkwvD4_filtered.json b/annotations_1/cvPIBkkwvD4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eac1c6fd437b5e1139b1345fa1f72959c449831c --- /dev/null +++ b/annotations_1/cvPIBkkwvD4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.47], [12.0, 13.07], [18.0, 20.04], [21.0, 21.74], [22.0, 22.71], [23.0, 30.74], [33.0, 33.3], [39.0, 41.55], [43.0, 52.54], [53.0, 54.19], [63.0, 70.85], [74.0, 81.45]], "keep_status": [false, false, true, false, false, true, false, false, true, false, false, false], "silence_prob": [29.83, 0.0, 38.16, 0.0, 0.0, 38.51, 0.0, 63.53, 38.14, 0.0, 35.84, 34.73], "audiomae_on_audioset": [[["explosion", 38.59], ["speech", 26.31], ["music", 10.14]], null, [["music", 22.76], ["speech", 14.56], ["sheep", 7.12]], null, null, [["whale vocalization", 30.33], ["buzz", 11.84], ["hum", 11.35]], null, null, [["music", 21.05], ["whale vocalization", 9.46], ["explosion", 5.63]], null, [["speech", 61.55], ["whale vocalization", 15.92], ["music", 10.94]], [["music", 67.07], ["speech", 19.91], ["musical instrument", 3.62]]], "duration": [3.47, 1.07, 2.04, 0.74, 0.71, 7.74, 0.3, 2.55, 9.54, 1.19, 7.85, 7.45]} \ No newline at end of file diff --git a/annotations_1/cwOh20xN82E_filtered.json b/annotations_1/cwOh20xN82E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e3e201d29b0cb2e5803c9d82f1d81acd64b572a --- /dev/null +++ b/annotations_1/cwOh20xN82E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.35], [12.0, 12.28], [15.0, 15.31], [17.0, 17.07], [18.0, 18.59], [20.0, 21.41], [23.0, 25.14], [26.0, 28.76], [31.0, 31.11], [35.0, 37.79], [39.0, 39.88], [41.0, 42.33], [45.0, 46.57], [48.0, 51.54], [52.0, 54.13], [55.0, 59.14], [70.0, 71.17], [75.0, 75.41], [77.0, 78.07], [89.0, 89.99], [94.0, 95.94], [98.0, 100.74], [102.0, 105.39], [107.0, 108.01], [112.0, 117.69], [119.0, 122.47], [123.0, 127.13], [129.0, 133.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, true], "silence_prob": [99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 99.48, 0.0, 93.91, 0.0, 0.0, 0.0, 95.64, 56.48, 48.06, 0.0, 0.0, 0.0, 0.0, 0.0, 35.14, 33.71, 0.0, 34.17, 36.02, 35.24, 34.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.01], ["guitar", 22.42], ["musical instrument", 10.67]], null, null, null, null, null, [["music", 49.46], ["guitar", 13.03], ["musical instrument", 12.0]], [["music", 44.95], ["zither", 12.19], ["singing", 5.06]], null, [["music", 27.67], ["double bass", 21.7], ["cello", 9.52]], [["music", 32.34], ["double bass", 9.33], ["cello", 8.94]], [["music", 53.14], ["guitar", 5.76], ["double bass", 4.47]], [["music", 43.07], ["guitar", 6.69], ["musical instrument", 5.11]]], "duration": [2.35, 0.28, 0.31, 0.07, 0.59, 1.41, 2.14, 2.76, 0.11, 2.79, 0.88, 1.33, 1.57, 3.54, 2.13, 4.14, 1.17, 0.41, 1.07, 0.99, 1.94, 2.74, 3.39, 1.01, 5.69, 3.47, 4.13, 4.1]} \ No newline at end of file diff --git a/annotations_1/cwgaR1xDiyE_filtered.json b/annotations_1/cwgaR1xDiyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02d224142c759d2e6956d58472d8984b46f20511 --- /dev/null +++ b/annotations_1/cwgaR1xDiyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.46], [14.0, 16.85], [18.0, 21.1], [24.0, 38.94], [43.0, 44.98], [47.0, 47.17], [48.0, 90.8], [92.0, 92.77], [93.0, 105.48], [110.0, 111.42], [112.0, 115.13], [119.0, 126.42]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [62.99, 52.16, 52.1, 41.74, 0.0, 0.0, 0.0, 0.0, 31.25, 0.0, 41.5, 29.55], "audiomae_on_audioset": [null, null, null, [["hum", 47.1], ["mains hum", 17.22], ["throbbing", 10.8]], null, null, null, null, [["music", 59.91], ["hum", 5.0], ["throbbing", 4.14]], null, [["music", 51.01], ["didgeridoo", 6.94], ["livestock, farm animals, working animals", 6.83]], [["speech", 34.02], ["hum", 10.64], ["music", 8.07]]], "duration": [2.46, 2.85, 3.1, 14.94, 1.98, 0.17, 42.8, 0.77, 12.48, 1.42, 3.13, 7.42]} \ No newline at end of file diff --git a/annotations_1/cyUf4tLI53o_filtered.json b/annotations_1/cyUf4tLI53o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c60a96a9c0d8ce650bf89a752ddf87a03786a5b --- /dev/null +++ b/annotations_1/cyUf4tLI53o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.22], [10.0, 11.37], [12.0, 13.54], [16.0, 15.65], [17.0, 17.15], [21.0, 22.3], [29.0, 29.46], [34.0, 34.35], [35.0, 36.75], [37.0, 38.65], [39.0, 40.04], [42.0, 43.87], [45.0, 45.2], [47.0, 48.52], [49.0, 49.76], [52.0, 53.77], [54.0, 55.27], [58.0, 68.98], [69.0, 71.36], [74.0, 75.17], [76.0, 77.14], [80.0, 81.24], [86.0, 85.75], [87.0, 87.93], [89.0, 89.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.3, 32.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.11], ["theremin", 9.87], ["musical instrument", 5.69]], [["foghorn", 75.53], ["trombone", 8.8], ["music", 7.48]], null, null, null, null, null, null], "duration": [0.22, 1.37, 1.54, -0.35, 0.15, 1.3, 0.46, 0.35, 1.75, 1.65, 1.04, 1.87, 0.2, 1.52, 0.76, 1.77, 1.27, 10.98, 2.36, 1.17, 1.14, 1.24, -0.25, 0.93, 0.48]} \ No newline at end of file diff --git a/annotations_1/cycPu9OddzU_filtered.json b/annotations_1/cycPu9OddzU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..225d9105f66c4394ba9ed1a17a7b79422c01efbd --- /dev/null +++ b/annotations_1/cycPu9OddzU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.45], [5.0, 6.29], [7.0, 7.64], [9.0, 9.56], [10.0, 10.64], [15.0, 20.63], [27.0, 27.04], [28.0, 28.63], [31.0, 31.26], [33.0, 34.5], [36.0, 38.15], [40.0, 40.37], [42.0, 41.96], [44.0, 45.72], [48.0, 48.68], [50.0, 73.23], [74.0, 74.76], [76.0, 77.21], [80.0, 81.89], [83.0, 83.84], [85.0, 85.51], [88.0, 95.49], [96.0, 97.85], [99.0, 106.62], [107.0, 108.65], [109.0, 110.61], [111.0, 112.35], [113.0, 114.2], [115.0, 120.88], [126.0, 126.96], [129.0, 129.15], [130.0, 131.16], [133.0, 133.56], [135.0, 135.48], [136.0, 139.46], [141.0, 142.11], [143.0, 143.6], [146.0, 146.52], [149.0, 150.8], [153.0, 155.46], [157.0, 158.94], [164.0, 165.27], [166.0, 170.14], [171.0, 173.69], [174.0, 177.74], [179.0, 183.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.74, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 51.39, 0.0, 0.0, 0.0, 0.0, 64.63, 0.0, 0.0, 0.0, 0.0, 0.0, 40.48, 0.0, 41.87, 0.0, 0.0, 0.0, 0.0, 38.32, 0.0, 0.0, 0.0, 0.0, 0.0, 59.51, 0.0, 0.0, 0.0, 0.0, 55.31, 0.0, 0.0, 70.86, 56.4, 47.7, 37.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 28.19], ["music", 15.14], ["sonar", 14.1]], null, [["gong", 32.46], ["music", 21.7], ["hum", 12.1]], null, null, null, null, [["music", 32.1], ["rumble", 10.52], ["hum", 10.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 42.4], ["speech", 24.08], ["music", 14.72]], [["speech", 68.4], ["hum", 4.27], ["rumble", 4.1]]], "duration": [2.45, 1.29, 0.64, 0.56, 0.64, 5.63, 0.04, 0.63, 0.26, 1.5, 2.15, 0.37, -0.04, 1.72, 0.68, 23.23, 0.76, 1.21, 1.89, 0.84, 0.51, 7.49, 1.85, 7.62, 1.65, 1.61, 1.35, 1.2, 5.88, 0.96, 0.15, 1.16, 0.56, 0.48, 3.46, 1.11, 0.6, 0.52, 1.8, 2.46, 1.94, 1.27, 4.14, 2.69, 3.74, 4.03]} \ No newline at end of file diff --git a/annotations_1/czJL-TPz-5M_filtered.json b/annotations_1/czJL-TPz-5M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f768e6c85dd5f9832b9a9283505d9c8fbf50ae26 --- /dev/null +++ b/annotations_1/czJL-TPz-5M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 18.82], [19.0, 25.2], [26.0, 39.51], [40.0, 64.12], [64.0, 64.17], [67.0, 67.66], [72.0, 72.22], [73.0, 75.2], [86.0, 90.1], [92.0, 93.21], [94.0, 94.54], [95.0, 95.23], [95.0, 95.3], [95.0, 95.34], [95.0, 95.49], [96.0, 96.65], [99.0, 115.28], [115.0, 115.32], [115.0, 115.35], [115.0, 115.38], [115.0, 115.42], [115.0, 115.45], [115.0, 121.44], [123.0, 124.34], [126.0, 127.08], [129.0, 129.63], [131.0, 131.53], [134.0, 135.57], [138.0, 138.96], [140.0, 145.34], [146.0, 146.42], [147.0, 152.1], [156.0, 165.97], [166.0, 166.33], [170.0, 170.4], [174.0, 175.17]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.53, 62.78, 82.97, 71.43, 0.0, 0.0, 0.0, 38.94, 40.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.15, 0.0, 0.0, 0.0, 0.0, 0.0, 51.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 0.0, 85.54, 83.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 31.09], ["music", 17.19], ["grunt", 5.34]], [["music", 22.82], ["speech", 5.52], ["electric shaver, electric razor", 4.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [17.82, 6.2, 13.51, 24.12, 0.17, 0.66, 0.22, 2.2, 4.1, 1.21, 0.54, 0.23, 0.3, 0.34, 0.49, 0.65, 16.28, 0.32, 0.35, 0.38, 0.42, 0.45, 6.44, 1.34, 1.08, 0.63, 0.53, 1.57, 0.96, 5.34, 0.42, 5.1, 9.97, 0.33, 0.4, 1.17]} \ No newline at end of file diff --git a/annotations_1/czOgJJqehv0_filtered.json b/annotations_1/czOgJJqehv0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..820fcfd2fadba0466fc47bdaa03643800f8be288 --- /dev/null +++ b/annotations_1/czOgJJqehv0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.36], [21.0, 21.14], [24.0, 25.0], [33.0, 33.88], [34.0, 34.62], [36.0, 35.99], [44.0, 45.03], [47.0, 48.12]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.36, 0.14, 1.0, 0.88, 0.62, -0.01, 1.03, 1.12]} \ No newline at end of file diff --git a/annotations_1/d0ZOz1i5-PE_filtered.json b/annotations_1/d0ZOz1i5-PE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cf28bd6763eee9c1ac7a938c2bb1878d3e7c6b8 --- /dev/null +++ b/annotations_1/d0ZOz1i5-PE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.53], [23.0, 24.8], [26.0, 26.22], [28.0, 29.3], [31.0, 36.14], [37.0, 37.23], [40.0, 40.46], [44.0, 46.06], [46.0, 46.6], [49.0, 49.11], [54.0, 54.43], [59.0, 59.48], [63.0, 68.88], [69.0, 70.17], [72.0, 72.15], [84.0, 86.59], [90.0, 91.18], [93.0, 96.3], [103.0, 103.89], [107.0, 109.21], [117.0, 118.34], [122.0, 125.56]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 43.15, 0.0, 0.0, 34.96, 0.0, 0.0, 0.0, 0.0, 33.86, 0.0, 0.0, 36.11, 0.0, 31.57, 0.0, 36.76, 0.0, 39.55], "audiomae_on_audioset": [null, null, null, null, [["speech", 39.08], ["fly, housefly", 17.56], ["insect", 13.84]], null, null, [["music", 32.73], ["speech", 19.45], ["timpani", 8.0]], null, null, null, null, [["music", 47.04], ["speech", 22.91], ["boing", 11.62]], null, null, [["speech", 26.29], ["boing", 17.4], ["music", 15.57]], null, [["music", 14.96], ["speech", 14.4], ["moo", 13.19]], null, [["music", 39.33], ["speech", 9.48], ["didgeridoo", 5.21]], null, [["music", 49.65], ["boing", 3.43], ["sampler", 2.9]]], "duration": [1.53, 1.8, 0.22, 1.3, 5.14, 0.23, 0.46, 2.06, 0.6, 0.11, 0.43, 0.48, 5.88, 1.17, 0.15, 2.59, 1.18, 3.3, 0.89, 2.21, 1.34, 3.56]} \ No newline at end of file diff --git a/annotations_1/d0c6KWKMAF8_filtered.json b/annotations_1/d0c6KWKMAF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..731c01f8d96a24d937cfce3fef7b0fb7bb71b100 --- /dev/null +++ b/annotations_1/d0c6KWKMAF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.35], [7.0, 7.69], [9.0, 11.2], [12.0, 20.8], [22.0, 47.97], [49.0, 50.6], [52.0, 53.18], [55.0, 56.15], [57.0, 62.46], [64.0, 65.57], [66.0, 67.26], [68.0, 68.39], [80.0, 93.93], [96.0, 103.32], [106.0, 106.86], [109.0, 114.91], [116.0, 117.22]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [38.15, 0.0, 84.25, 44.55, 36.2, 0.0, 0.0, 0.0, 36.47, 0.0, 0.0, 0.0, 31.59, 53.1, 0.0, 90.43, 0.0], "audiomae_on_audioset": [[["speech", 56.49], ["music", 8.86], ["synthesizer", 2.92]], null, null, [["hum", 46.55], ["throbbing", 30.95], ["mains hum", 16.7]], [["hum", 41.44], ["throbbing", 40.18], ["mains hum", 7.96]], null, null, null, [["throbbing", 27.99], ["music", 26.95], ["hum", 19.67]], null, null, null, [["hum", 33.15], ["speech", 15.04], ["throbbing", 14.93]], null, null, null, null], "duration": [3.35, 0.69, 2.2, 8.8, 25.97, 1.6, 1.18, 1.15, 5.46, 1.57, 1.26, 0.39, 13.93, 7.32, 0.86, 5.91, 1.22]} \ No newline at end of file diff --git a/annotations_1/d0hM2Ekkk-8_filtered.json b/annotations_1/d0hM2Ekkk-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb78b671029d6789fb1405872c581adaf7580e1b --- /dev/null +++ b/annotations_1/d0hM2Ekkk-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.28], [24.0, 24.33], [33.0, 49.08], [77.0, 76.79], [101.0, 101.39], [135.0, 135.82]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.52, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.28, 0.33, 16.08, -0.21, 0.39, 0.82]} \ No newline at end of file diff --git a/annotations_1/d1ZUnCbVoZQ_filtered.json b/annotations_1/d1ZUnCbVoZQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57e8e0441de433fe7052eae36f6d52438774c402 --- /dev/null +++ b/annotations_1/d1ZUnCbVoZQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.58], [6.0, 9.66], [11.0, 14.17], [15.0, 15.7], [16.0, 16.09], [17.0, 17.37], [19.0, 21.57], [22.0, 23.36], [25.0, 25.78], [27.0, 29.49], [30.0, 39.73], [43.0, 42.79], [43.0, 45.35], [51.0, 51.54], [57.0, 57.33], [58.0, 58.48], [59.0, 60.35], [63.0, 63.36], [65.0, 71.52], [76.0, 76.1], [76.0, 78.24], [79.0, 80.01], [82.0, 82.58], [85.0, 86.83], [87.0, 88.32], [89.0, 90.14], [94.0, 95.77], [101.0, 102.63], [104.0, 105.48], [107.0, 107.7], [109.0, 109.75], [112.0, 112.8], [114.0, 114.44], [117.0, 117.37], [122.0, 123.63], [125.0, 126.15], [128.0, 128.97], [134.0, 133.88], [154.0, 154.09], [159.0, 161.06], [163.0, 164.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.07, 99.05, 93.29, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 57.4, 96.42, 0.0, 51.55, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 79.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.58, 3.66, 3.17, 0.7, 0.09, 0.37, 2.57, 1.36, 0.78, 2.49, 9.73, -0.21, 2.35, 0.54, 0.33, 0.48, 1.35, 0.36, 6.52, 0.1, 2.24, 1.01, 0.58, 1.83, 1.32, 1.14, 1.77, 1.63, 1.48, 0.7, 0.75, 0.8, 0.44, 0.37, 1.63, 1.15, 0.97, -0.12, 0.09, 2.06, 1.46]} \ No newline at end of file diff --git a/annotations_1/d2uvpiz5up0_filtered.json b/annotations_1/d2uvpiz5up0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46ce078010198df4e2b3af6db53c3373725ae8a0 --- /dev/null +++ b/annotations_1/d2uvpiz5up0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.16], [17.0, 30.81], [34.0, 68.66], [70.0, 103.82], [107.0, 118.37]], "keep_status": [true, false, false, false, true], "silence_prob": [32.14, 31.49, 0.0, 0.0, 30.63], "audiomae_on_audioset": [[["hum", 27.24], ["speech", 25.41], ["mains hum", 15.35]], [["speech", 68.8], ["vehicle", 9.05], ["helicopter", 3.48]], null, null, [["hum", 36.31], ["music", 19.79], ["mains hum", 8.46]]], "duration": [9.16, 13.81, 34.66, 33.82, 11.37]} \ No newline at end of file diff --git a/annotations_1/d35M7d-E_PY_filtered.json b/annotations_1/d35M7d-E_PY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b995c834871dfd270a13f7beb4a22a2ac4e4c35c --- /dev/null +++ b/annotations_1/d35M7d-E_PY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.24], [7.0, 7.65], [9.0, 9.69], [10.0, 11.23], [18.0, 18.32], [30.0, 30.67], [33.0, 33.17], [38.0, 39.5], [43.0, 43.04], [44.0, 44.59], [48.0, 49.59], [51.0, 51.11], [53.0, 53.82], [54.0, 55.53], [59.0, 59.81], [65.0, 65.42], [70.0, 70.55], [74.0, 74.36], [87.0, 87.54], [94.0, 95.01], [99.0, 99.72], [102.0, 102.54], [107.0, 107.62], [109.0, 109.26], [117.0, 118.5], [121.0, 121.86], [125.0, 125.58], [128.0, 129.03], [131.0, 131.68], [132.0, 132.34], [132.0, 133.68], [135.0, 136.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.24, 0.65, 0.69, 1.23, 0.32, 0.67, 0.17, 1.5, 0.04, 0.59, 1.59, 0.11, 0.82, 1.53, 0.81, 0.42, 0.55, 0.36, 0.54, 1.01, 0.72, 0.54, 0.62, 0.26, 1.5, 0.86, 0.58, 1.03, 0.68, 0.34, 1.68, 1.19]} \ No newline at end of file diff --git a/annotations_1/d3HAOZbAj1Q_filtered.json b/annotations_1/d3HAOZbAj1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..160d21a3eb64e839e2d0bfcccefc6d29ec9a8bc8 --- /dev/null +++ b/annotations_1/d3HAOZbAj1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.94], [25.0, 25.46], [30.0, 36.85], [45.0, 45.69], [53.0, 53.45], [53.0, 69.4]], "keep_status": [true, false, true, false, false, true], "silence_prob": [29.84, 0.0, 30.51, 0.0, 0.0, 29.74], "audiomae_on_audioset": [[["music", 28.79], ["hum", 14.97], ["mains hum", 14.13]], null, [["rumble", 22.82], ["speech", 16.18], ["hum", 13.03]], null, null, [["music", 51.69], ["hum", 11.58], ["grunt", 6.59]]], "duration": [3.94, 0.46, 6.85, 0.69, 0.45, 16.4]} \ No newline at end of file diff --git a/annotations_1/d46cDtFv_Rw_filtered.json b/annotations_1/d46cDtFv_Rw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27e94b11ffa738dfff01a742d70d214a852f138b --- /dev/null +++ b/annotations_1/d46cDtFv_Rw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.55], [6.0, 6.45], [8.0, 9.04], [9.0, 10.37], [11.0, 12.83], [19.0, 21.81], [22.0, 23.65], [28.0, 31.46], [38.0, 40.29], [43.0, 43.95], [46.0, 50.99], [52.0, 54.3], [55.0, 57.11], [59.0, 60.57], [62.0, 65.26], [66.0, 67.24], [69.0, 73.84], [76.0, 79.29], [81.0, 82.81], [85.0, 95.61], [99.0, 108.31], [110.0, 111.45], [113.0, 112.78], [115.0, 116.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 97.43, 72.16, 0.0, 77.36, 65.55, 49.13, 0.0, 99.16, 0.0, 76.2, 65.67, 0.0, 72.31, 71.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.8], ["insect", 3.49], ["hum", 3.27]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 0.45, 1.04, 1.37, 1.83, 2.81, 1.65, 3.46, 2.29, 0.95, 4.99, 2.3, 2.11, 1.57, 3.26, 1.24, 4.84, 3.29, 1.81, 10.61, 9.31, 1.45, -0.22, 1.9]} \ No newline at end of file diff --git a/annotations_1/d5Pc-tNsvT4_filtered.json b/annotations_1/d5Pc-tNsvT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4561cfa53942a6ef1b7706a8dd66dd9d6da0071d --- /dev/null +++ b/annotations_1/d5Pc-tNsvT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.23], [5.0, 5.54], [7.0, 7.21], [16.0, 17.22], [19.0, 19.77], [22.0, 23.95], [33.0, 33.15], [38.0, 38.64], [49.0, 49.47], [53.0, 54.08], [59.0, 59.54], [70.0, 70.02], [73.0, 72.91], [75.0, 75.19], [79.0, 79.88], [82.0, 82.53], [101.0, 107.59], [110.0, 110.96], [115.0, 115.05], [117.0, 116.95], [121.0, 121.58], [129.0, 128.82], [139.0, 145.15], [151.0, 156.63], [159.0, 160.32], [162.0, 165.87]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [40.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 29.29, 42.44, 0.0, 45.75], "audiomae_on_audioset": [[["music", 27.05], ["hum", 20.14], ["speech", 10.98]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.64], ["trombone", 10.17], ["brass instrument", 5.23]], [["hum", 40.68], ["mains hum", 14.25], ["rumble", 14.17]], null, [["music", 24.48], ["whale vocalization", 11.18], ["sidetone", 8.62]]], "duration": [2.23, 0.54, 0.21, 1.22, 0.77, 1.95, 0.15, 0.64, 0.47, 1.08, 0.54, 0.02, -0.09, 0.19, 0.88, 0.53, 6.59, 0.96, 0.05, -0.05, 0.58, -0.18, 6.15, 5.63, 1.32, 3.87]} \ No newline at end of file diff --git a/annotations_1/d5gSQLPcya0_filtered.json b/annotations_1/d5gSQLPcya0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..245b6dc04837831af18ac439e7fbc9c9fca1fb8b --- /dev/null +++ b/annotations_1/d5gSQLPcya0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.37], [15.0, 17.12], [18.0, 33.78], [37.0, 57.6], [60.0, 82.29], [84.0, 96.85], [98.0, 104.19], [106.0, 107.28], [111.0, 112.5], [123.0, 127.99], [131.0, 134.45], [138.0, 141.32], [143.0, 165.67]], "keep_status": [false, true, false, true, true, true, true, false, false, true, false, true, false], "silence_prob": [30.27, 46.94, 78.21, 30.87, 35.64, 31.96, 36.21, 0.0, 0.0, 31.29, 30.82, 30.15, 50.51], "audiomae_on_audioset": [[["music", 29.9], ["hum", 23.69], ["throbbing", 19.61]], [["speech", 20.15], ["sonar", 10.51], ["music", 9.41]], null, [["speech", 30.81], ["buzz", 13.54], ["livestock, farm animals, working animals", 7.68]], [["music", 36.4], ["hum", 17.42], ["throbbing", 6.06]], [["speech", 34.02], ["music", 14.55], ["hum", 9.58]], [["speech", 45.62], ["music", 9.59], ["sidetone", 6.24]], null, null, [["speech", 41.25], ["vehicle", 10.17], ["mains hum", 5.22]], [["speech", 48.47], ["music", 13.0], ["vehicle", 9.08]], [["speech", 21.31], ["music", 16.95], ["noise", 5.82]], null], "duration": [9.37, 2.12, 15.78, 20.6, 22.29, 12.85, 6.19, 1.28, 1.5, 4.99, 3.45, 3.32, 22.67]} \ No newline at end of file diff --git a/annotations_1/d6263F3UkWo_filtered.json b/annotations_1/d6263F3UkWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b660f419e9e06bb36debcd14623aa221a5d0262 --- /dev/null +++ b/annotations_1/d6263F3UkWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 29.73], [30.0, 29.89], [31.0, 33.79], [36.0, 36.04], [37.0, 39.09], [40.0, 43.56], [44.0, 43.6], [44.0, 49.23], [50.0, 88.11], [89.0, 91.93], [94.0, 104.46], [105.0, 109.22], [112.0, 122.59], [124.0, 131.11], [133.0, 135.21], [138.0, 146.23], [147.0, 169.5], [171.0, 178.56], [184.0, 185.53], [186.0, 186.39]], "keep_status": [false, false, false, false, false, false, false, true, false, true, true, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 29.31, 0.0, 30.17, 31.18, 0.0, 30.84, 0.0, 29.99, 31.1, 29.49, 31.59, 49.36, 82.61, 79.24, 50.81, 46.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["boing", 66.53], ["music", 20.82], ["didgeridoo", 1.16]], null, [["music", 58.91], ["livestock, farm animals, working animals", 7.1], ["cattle, bovinae", 4.92]], [["music", 61.79], ["speech", 9.67], ["throbbing", 5.51]], null, [["music", 36.66], ["livestock, farm animals, working animals", 16.91], ["cattle, bovinae", 13.36]], null, [["whip", 38.3], ["music", 6.15], ["whack, thwack", 5.92]], [["music", 36.43], ["speech", 27.97], ["synthesizer", 3.52]], [["music", 15.84], ["buzz", 10.95], ["speech", 10.69]], [["music", 69.09], ["speech", 3.45], ["musical instrument", 2.64]], [["speech", 46.91], ["music", 25.64], ["foghorn", 15.04]], null, null, null, [["insect", 23.03], ["music", 21.98], ["fly, housefly", 16.5]], null, null], "duration": [-0.27, -0.11, 2.79, 0.04, 2.09, 3.56, -0.4, 5.23, 38.11, 2.93, 10.46, 4.22, 10.59, 7.11, 2.21, 8.23, 22.5, 7.56, 1.53, 0.39]} \ No newline at end of file diff --git a/annotations_1/d7-pWfZgFKU_filtered.json b/annotations_1/d7-pWfZgFKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a68559ba78998c6293573ba2b450958f14fe8167 --- /dev/null +++ b/annotations_1/d7-pWfZgFKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.05], [7.0, 8.88], [9.0, 13.04], [13.0, 23.33], [25.0, 38.57], [39.0, 41.91], [43.0, 47.01], [48.0, 49.05], [51.0, 90.37], [91.0, 94.66], [96.0, 96.06], [102.0, 103.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 99.16, 57.09, 64.63, 94.07, 99.1, 0.0, 0.0, 82.61, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.05, 1.88, 4.04, 10.33, 13.57, 2.91, 4.01, 1.05, 39.37, 3.66, 0.06, 1.65]} \ No newline at end of file diff --git a/annotations_1/d7Aot4Wr-Yo_filtered.json b/annotations_1/d7Aot4Wr-Yo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de758445de65ce47c6d889b9e12cef090b00ca05 --- /dev/null +++ b/annotations_1/d7Aot4Wr-Yo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 34.69], [35.0, 120.01], [121.0, 132.43], [135.0, 135.62], [136.0, 158.75], [159.0, 162.4], [167.0, 169.67], [170.0, 169.84], [170.0, 171.27], [173.0, 173.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.71, 0.0, 99.88, 0.0, 78.04, 99.31, 50.21, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [25.69, 85.01, 11.43, 0.62, 22.75, 3.4, 2.67, -0.16, 1.27, 0.23]} \ No newline at end of file diff --git a/annotations_1/d7WraA-roN8_filtered.json b/annotations_1/d7WraA-roN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd3b2cdfafeaa65acc1af12c0986c32794d2e4bd --- /dev/null +++ b/annotations_1/d7WraA-roN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.56], [7.0, 7.4], [8.0, 11.11], [12.0, 12.97], [14.0, 15.77], [16.0, 18.52], [23.0, 25.07], [34.0, 39.24], [41.0, 52.05], [54.0, 58.04], [61.0, 61.7], [65.0, 65.87], [67.0, 96.72], [98.0, 102.47], [105.0, 105.7], [107.0, 110.15], [111.0, 111.55], [112.0, 117.09]], "keep_status": [false, false, true, false, false, true, false, true, true, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.02, 0.0, 0.0, 45.95, 39.21, 41.62, 28.82, 28.38, 0.0, 0.0, 32.85, 36.44, 0.0, 32.09, 0.0, 34.53], "audiomae_on_audioset": [null, null, [["hum", 19.0], ["sidetone", 17.9], ["speech", 15.49]], null, null, [["speech", 32.69], ["music", 11.39], ["mains hum", 8.17]], [["didgeridoo", 36.6], ["music", 24.77], ["trombone", 9.79]], [["speech", 38.5], ["hum", 17.19], ["throbbing", 7.34]], [["speech", 43.3], ["music", 10.99], ["whack, thwack", 7.03]], [["livestock, farm animals, working animals", 22.19], ["breaking", 16.03], ["cowbell", 8.28]], null, null, [["fly, housefly", 17.86], ["hum", 13.51], ["mosquito", 8.34]], [["music", 73.21], ["guitar", 3.82], ["effects unit", 3.57]], null, [["music", 64.51], ["speech", 9.64], ["guitar", 4.0]], null, [["music", 66.85], ["guitar", 7.46], ["musical instrument", 5.54]]], "duration": [1.56, 0.4, 3.11, 0.97, 1.77, 2.52, 2.07, 5.24, 11.05, 4.04, 0.7, 0.87, 29.72, 4.47, 0.7, 3.15, 0.55, 5.09]} \ No newline at end of file diff --git a/annotations_1/d9TdwetEIQ8_filtered.json b/annotations_1/d9TdwetEIQ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6450de9936000eb4608c78acfab6449c07da5005 --- /dev/null +++ b/annotations_1/d9TdwetEIQ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.84], [23.0, 37.62], [39.0, 39.95], [41.0, 70.98], [74.0, 77.95], [80.0, 134.18], [140.0, 145.32], [147.0, 163.31], [165.0, 166.02], [170.0, 172.91]], "keep_status": [false, false, false, true, false, false, true, true, false, true], "silence_prob": [47.2, 30.3, 0.0, 28.27, 28.28, 0.0, 28.48, 34.57, 0.0, 33.45], "audiomae_on_audioset": [[["sidetone", 47.49], ["music", 21.59], ["hum", 4.17]], [["mains hum", 56.67], ["hum", 29.11], ["music", 4.36]], null, [["music", 46.84], ["hum", 12.13], ["mains hum", 9.13]], [["music", 61.91], ["electronic music", 7.96], ["throbbing", 6.08]], null, [["rumble", 31.98], ["eruption", 11.74], ["hum", 8.1]], [["hum", 25.09], ["music", 21.86], ["rumble", 12.13]], null, [["music", 39.44], ["speech", 10.16], ["didgeridoo", 10.03]]], "duration": [2.84, 14.62, 0.95, 29.98, 3.95, 54.18, 5.32, 16.31, 1.02, 2.91]} \ No newline at end of file diff --git a/annotations_1/dAlYuokC9R0_filtered.json b/annotations_1/dAlYuokC9R0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1054ca21ea8509130aaec9aade21548584129b25 --- /dev/null +++ b/annotations_1/dAlYuokC9R0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.87], [10.0, 11.21], [17.0, 17.02], [18.0, 17.93], [18.0, 18.81], [24.0, 24.06], [33.0, 33.24], [35.0, 35.73], [47.0, 50.67], [51.0, 54.84], [56.0, 62.24], [64.0, 64.98], [67.0, 67.26], [70.0, 72.45], [77.0, 77.3], [79.0, 81.3], [86.0, 89.48], [91.0, 91.93], [93.0, 99.45], [101.0, 101.51], [103.0, 109.38], [114.0, 118.96], [120.0, 121.0], [125.0, 133.25], [134.0, 134.54], [137.0, 137.64]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.72, 63.53, 97.64, 0.0, 0.0, 85.35, 0.0, 93.91, 97.11, 0.0, 99.36, 0.0, 98.19, 76.7, 0.0, 97.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 56.14], ["guitar", 6.83], ["plucked string instrument", 5.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 1.21, 0.02, -0.07, 0.81, 0.06, 0.24, 0.73, 3.67, 3.84, 6.24, 0.98, 0.26, 2.45, 0.3, 2.3, 3.48, 0.93, 6.45, 0.51, 6.38, 4.96, 1.0, 8.25, 0.54, 0.64]} \ No newline at end of file diff --git a/annotations_1/dAoRRTPPIys_filtered.json b/annotations_1/dAoRRTPPIys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..737cd0f35c286f018dc518c0749d772c36adac24 --- /dev/null +++ b/annotations_1/dAoRRTPPIys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.83], [7.0, 7.21], [15.0, 15.58], [16.0, 17.47], [35.0, 37.18], [40.0, 40.96], [42.0, 46.95], [48.0, 50.48], [60.0, 61.18], [64.0, 65.38], [67.0, 67.46], [69.0, 69.35], [71.0, 81.46], [97.0, 107.33], [112.0, 112.55], [126.0, 127.16], [131.0, 131.62], [136.0, 140.59], [143.0, 149.15], [150.0, 151.65], [154.0, 154.38], [156.0, 160.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 99.56, 91.81, 0.0, 0.0, 0.0, 0.0, 42.93, 45.62, 0.0, 0.0, 0.0, 99.98, 78.72, 0.0, 0.0, 99.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 17.57], ["fly, housefly", 16.19], ["mosquito", 11.89]], [["noise", 58.93], ["hum", 7.08], ["radio", 4.47]], null, null, null, null, null, null, null, null], "duration": [0.83, 0.21, 0.58, 1.47, 2.18, 0.96, 4.95, 2.48, 1.18, 1.38, 0.46, 0.35, 10.46, 10.33, 0.55, 1.16, 0.62, 4.59, 6.15, 1.65, 0.38, 4.79]} \ No newline at end of file diff --git a/annotations_1/dCyrhdW9e8M_filtered.json b/annotations_1/dCyrhdW9e8M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b3a54397dcad0f3c289395ba595e8949e200d47 --- /dev/null +++ b/annotations_1/dCyrhdW9e8M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 25.69], [26.0, 25.73], [26.0, 25.76], [28.0, 27.87], [29.0, 79.88], [82.0, 84.37], [86.0, 93.85], [98.0, 107.94], [109.0, 113.91], [117.0, 121.53], [123.0, 153.32]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 28.5, 34.04, 35.81, 36.69, 37.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 13.41], ["whoosh, swoosh, swish", 9.81], ["music", 7.99]], [["hum", 45.36], ["music", 20.45], ["throbbing", 14.68]], [["music", 55.28], ["hum", 12.3], ["ambient music", 10.44]], [["music", 57.73], ["ambient music", 10.56], ["whale vocalization", 5.48]], [["music", 45.91], ["hum", 10.71], ["electronic music", 8.63]], null], "duration": [-0.31, -0.27, -0.24, -0.13, 50.88, 2.37, 7.85, 9.94, 4.91, 4.53, 30.32]} \ No newline at end of file diff --git a/annotations_1/dDGMTl1Ya78_filtered.json b/annotations_1/dDGMTl1Ya78_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdf95e0d5ebcc7fe65300a0cae2ede2ea687b987 --- /dev/null +++ b/annotations_1/dDGMTl1Ya78_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [5.0, 6.25], [10.0, 11.26], [13.0, 18.82], [20.0, 20.55], [24.0, 42.9], [57.0, 58.92], [60.0, 63.58], [66.0, 69.04], [69.0, 70.66], [76.0, 83.66], [85.0, 91.42], [99.0, 105.49], [110.0, 126.4], [128.0, 131.7], [132.0, 137.93]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, true, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 29.26, 0.0, 29.5, 0.0, 30.33, 30.4, 0.0, 30.45, 30.99, 28.67, 29.73, 28.01, 28.24], "audiomae_on_audioset": [null, null, null, [["mains hum", 55.06], ["hum", 14.83], ["noise", 9.45]], null, [["music", 70.65], ["theremin", 11.04], ["speech", 3.02]], null, [["hum", 39.33], ["mains hum", 29.88], ["buzz", 4.18]], [["hum", 21.86], ["mains hum", 10.09], ["rumble", 9.1]], null, [["hum", 17.4], ["music", 16.74], ["rumble", 13.21]], [["vehicle", 21.39], ["aircraft", 18.27], ["fixed-wing aircraft, airplane", 13.27]], [["mains hum", 32.46], ["hum", 14.22], ["music", 11.02]], [["hum", 25.94], ["mains hum", 23.57], ["music", 9.93]], [["music", 23.51], ["cattle, bovinae", 21.3], ["livestock, farm animals, working animals", 9.68]], [["vehicle", 31.55], ["car", 12.04], ["race car, auto racing", 8.26]]], "duration": [0.42, 1.25, 1.26, 5.82, 0.55, 18.9, 1.92, 3.58, 3.04, 1.66, 7.66, 6.42, 6.49, 16.4, 3.7, 5.93]} \ No newline at end of file diff --git a/annotations_1/dEqrnOk8P1Q_filtered.json b/annotations_1/dEqrnOk8P1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a09fa340b2b640012add868178bebca5acb6292b --- /dev/null +++ b/annotations_1/dEqrnOk8P1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.16], [19.0, 20.73], [26.0, 30.42], [32.0, 33.45], [37.0, 38.72], [40.0, 40.26], [42.0, 43.24], [47.0, 47.95], [50.0, 50.38], [57.0, 57.77], [59.0, 59.39], [60.0, 60.66], [62.0, 65.1], [66.0, 66.18], [68.0, 69.43], [70.0, 71.39], [78.0, 78.43], [79.0, 79.93], [82.0, 87.2], [89.0, 89.33], [92.0, 95.81], [96.0, 98.0], [99.0, 99.55], [101.0, 101.66], [108.0, 108.65], [110.0, 110.29], [114.0, 114.27], [115.0, 115.6], [120.0, 120.66], [122.0, 122.57], [124.0, 124.77], [126.0, 128.46], [129.0, 130.44], [132.0, 133.19], [134.0, 134.35], [140.0, 141.25], [146.0, 146.62], [149.0, 149.45], [152.0, 152.96], [158.0, 163.83], [166.0, 167.1], [170.0, 170.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.71, 0.0, 72.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.86, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 0.0, 100.0, 98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.16, 1.73, 4.42, 1.45, 1.72, 0.26, 1.24, 0.95, 0.38, 0.77, 0.39, 0.66, 3.1, 0.18, 1.43, 1.39, 0.43, 0.93, 5.2, 0.33, 3.81, 2.0, 0.55, 0.66, 0.65, 0.29, 0.27, 0.6, 0.66, 0.57, 0.77, 2.46, 1.44, 1.19, 0.35, 1.25, 0.62, 0.45, 0.96, 5.83, 1.1, 0.65]} \ No newline at end of file diff --git a/annotations_1/dH3dqXHH0yU_filtered.json b/annotations_1/dH3dqXHH0yU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..360ed9a34378e14a33e28639d7482ee365837716 --- /dev/null +++ b/annotations_1/dH3dqXHH0yU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.68], [5.0, 8.75], [9.0, 12.83], [14.0, 17.32], [32.0, 57.57], [60.0, 80.2], [85.0, 85.62], [96.0, 96.28], [100.0, 101.92], [104.0, 104.48], [106.0, 107.1], [140.0, 140.7], [150.0, 151.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.22, 71.72, 39.94, 48.82, 97.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 66.8], ["speech", 13.77], ["groan", 1.78]], [["music", 49.24], ["theremin", 23.15], ["didgeridoo", 6.88]], null, null, null, null, null, null, null, null], "duration": [1.68, 3.75, 3.83, 3.32, 25.57, 20.2, 0.62, 0.28, 1.92, 0.48, 1.1, 0.7, 1.46]} \ No newline at end of file diff --git a/annotations_1/dHXVvD4FFas_filtered.json b/annotations_1/dHXVvD4FFas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac7542b878c2bd8b322ee8499059e134f11e11ba --- /dev/null +++ b/annotations_1/dHXVvD4FFas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.1], [12.0, 13.81], [19.0, 19.95], [26.0, 27.55], [33.0, 34.69], [37.0, 39.28], [41.0, 64.12], [65.0, 73.3], [74.0, 90.32], [91.0, 92.23], [105.0, 105.29], [105.0, 108.73], [109.0, 110.27], [113.0, 113.51], [118.0, 120.18], [121.0, 125.12], [126.0, 132.76], [134.0, 144.49], [151.0, 152.22], [153.0, 174.95], [178.0, 180.27], [189.0, 190.22], [193.0, 201.24], [206.0, 207.01], [208.0, 208.52], [210.0, 211.55]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [75.07, 0.0, 0.0, 0.0, 0.0, 34.94, 33.68, 46.33, 31.52, 0.0, 0.0, 32.22, 0.0, 0.0, 56.25, 70.86, 44.49, 31.15, 0.0, 30.34, 34.5, 0.0, 31.74, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 30.25], ["speech", 24.54], ["foghorn", 9.73]], [["music", 67.49], ["theremin", 13.23], ["ambient music", 4.56]], [["music", 77.48], ["hum", 4.94], ["theremin", 2.19]], [["music", 51.12], ["speech", 16.09], ["throbbing", 10.88]], null, null, [["music", 35.62], ["speech", 30.4], ["throbbing", 6.09]], null, null, null, null, [["music", 40.29], ["speech", 14.26], ["hum", 11.43]], [["music", 48.83], ["throbbing", 22.12], ["hum", 16.14]], null, [["music", 46.32], ["hum", 19.32], ["throbbing", 10.35]], [["music", 30.34], ["brass instrument", 4.67], ["speech", 4.31]], null, [["music", 64.38], ["throbbing", 6.37], ["hum", 4.71]], null, null, null], "duration": [3.1, 1.81, 0.95, 1.55, 1.69, 2.28, 23.12, 8.3, 16.32, 1.23, 0.29, 3.73, 1.27, 0.51, 2.18, 4.12, 6.76, 10.49, 1.22, 21.95, 2.27, 1.22, 8.24, 1.01, 0.52, 1.55]} \ No newline at end of file diff --git a/annotations_1/dIy6QpVNPuo_filtered.json b/annotations_1/dIy6QpVNPuo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17916554023e32969eeb7d24cff240e904ef3c8a --- /dev/null +++ b/annotations_1/dIy6QpVNPuo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.16], [5.0, 10.37], [22.0, 22.72], [23.0, 27.16], [31.0, 36.22], [45.0, 49.86], [52.0, 62.07], [64.0, 73.04], [76.0, 77.9], [79.0, 92.85], [96.0, 114.66]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 30.91, 0.0, 30.27, 32.44, 30.18, 30.74, 31.46, 0.0, 30.68, 30.72], "audiomae_on_audioset": [null, [["speech", 57.03], ["vehicle", 14.38], ["rumble", 8.23]], null, [["music", 34.88], ["animal", 10.24], ["roaring cats (lions, tigers)", 9.3]], [["music", 72.83], ["hum", 4.03], ["musical instrument", 2.52]], [["music", 88.8], ["speech", 2.9], ["synthesizer", 0.72]], [["music", 68.06], ["throbbing", 5.3], ["hum", 2.65]], [["music", 34.16], ["skidding", 23.88], ["vehicle", 15.19]], null, [["music", 41.44], ["speech", 27.78], ["vehicle", 4.53]], [["vehicle", 22.55], ["music", 21.94], ["car", 17.28]]], "duration": [0.16, 5.37, 0.72, 4.16, 5.22, 4.86, 10.07, 9.04, 1.9, 13.85, 18.66]} \ No newline at end of file diff --git a/annotations_1/dJBnRYy3mFI_filtered.json b/annotations_1/dJBnRYy3mFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eafe086d72b4176db591b6324fff3f0e287eda30 --- /dev/null +++ b/annotations_1/dJBnRYy3mFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.04], [8.0, 8.33], [14.0, 17.02], [18.0, 19.31], [22.0, 24.95], [30.0, 30.91], [32.0, 32.1], [43.0, 44.31], [45.0, 48.44]], "keep_status": [false, false, true, false, false, false, false, false, true], "silence_prob": [30.88, 0.0, 38.3, 0.0, 32.22, 0.0, 0.0, 0.0, 33.98], "audiomae_on_audioset": [[["music", 82.73], ["speech", 6.37], ["sidetone", 1.72]], null, [["music", 42.47], ["speech", 13.54], ["throbbing", 6.39]], null, [["music", 67.88], ["speech", 13.34], ["gunshot, gunfire", 5.19]], null, null, null, [["music", 58.15], ["speech", 4.82], ["electronic music", 4.52]]], "duration": [3.04, 0.33, 3.02, 1.31, 2.95, 0.91, 0.1, 1.31, 3.44]} \ No newline at end of file diff --git a/annotations_1/dJsuwhIpSDQ_filtered.json b/annotations_1/dJsuwhIpSDQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/dJsuwhIpSDQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/dK2oGZK490w_filtered.json b/annotations_1/dK2oGZK490w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bf795c7d1db48fd7fda0f2fdf6b70d82d1ba4e6 --- /dev/null +++ b/annotations_1/dK2oGZK490w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.33], [8.0, 9.37], [12.0, 12.78], [14.0, 21.36], [27.0, 28.02], [30.0, 35.78], [39.0, 39.01], [40.0, 41.54], [43.0, 48.32], [51.0, 53.94], [58.0, 60.17], [61.0, 61.92], [64.0, 64.49], [66.0, 66.7], [68.0, 67.83], [70.0, 70.23], [73.0, 87.91], [92.0, 92.35], [97.0, 106.0], [110.0, 112.46], [113.0, 115.25], [120.0, 120.51], [123.0, 123.74], [129.0, 130.2], [131.0, 134.52], [136.0, 137.88], [140.0, 142.48], [144.0, 144.76], [146.0, 146.65], [150.0, 153.49]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.81, 0.0, 41.7, 0.0, 0.0, 65.44, 47.31, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.29, 0.0, 77.87, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 98.44], "audiomae_on_audioset": [null, null, null, [["music", 66.35], ["yodeling", 10.2], ["singing", 2.77]], null, [["music", 54.44], ["brass instrument", 10.9], ["trombone", 6.56]], null, null, null, [["speech", 26.23], ["animal", 11.7], ["music", 6.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 1.37, 0.78, 7.36, 1.02, 5.78, 0.01, 1.54, 5.32, 2.94, 2.17, 0.92, 0.49, 0.7, -0.17, 0.23, 14.91, 0.35, 9.0, 2.46, 2.25, 0.51, 0.74, 1.2, 3.52, 1.88, 2.48, 0.76, 0.65, 3.49]} \ No newline at end of file diff --git a/annotations_1/dN1RMOrtK7A_filtered.json b/annotations_1/dN1RMOrtK7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2911ffbf5f48a40691d7968194e0b0d0e1bfd244 --- /dev/null +++ b/annotations_1/dN1RMOrtK7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.0], [14.0, 20.65], [25.0, 36.49], [43.0, 45.25], [50.0, 53.11], [58.0, 59.09], [67.0, 70.09], [71.0, 71.1], [73.0, 74.02], [75.0, 77.33], [79.0, 79.79], [84.0, 84.7], [87.0, 87.39], [103.0, 103.71], [105.0, 105.6], [114.0, 119.8], [123.0, 122.81], [123.0, 123.65], [125.0, 125.15], [126.0, 125.86], [126.0, 125.98], [138.0, 138.27], [147.0, 147.88], [149.0, 150.21], [155.0, 154.89], [172.0, 175.34], [177.0, 182.38], [184.0, 187.49], [188.0, 196.94], [197.0, 197.61]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [38.16, 36.95, 45.82, 48.78, 36.42, 0.0, 55.11, 0.0, 0.0, 39.17, 0.0, 0.0, 0.0, 0.0, 0.0, 29.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.3, 29.0, 28.56, 86.09, 0.0], "audiomae_on_audioset": [[["speech", 66.66], ["noise", 5.2], ["groan", 2.83]], [["speech", 61.64], ["hum", 11.94], ["music", 10.2]], [["hum", 29.34], ["whale vocalization", 17.54], ["music", 15.81]], [["speech", 30.9], ["sidetone", 30.49], ["music", 13.86]], [["sidetone", 53.17], ["speech", 23.75], ["sine wave", 3.62]], null, null, null, null, [["speech", 32.9], ["music", 17.41], ["hum", 9.26]], null, null, null, null, null, [["music", 26.54], ["hum", 19.85], ["mains hum", 12.72]], null, null, null, null, null, null, null, null, null, [["speech", 75.86], ["animal", 16.54], ["roaring cats (lions, tigers)", 2.64]], [["music", 55.41], ["speech", 11.64], ["electronic music", 2.32]], [["whale vocalization", 32.26], ["sound effect", 5.39], ["music", 5.11]], null, null], "duration": [5.0, 6.65, 11.49, 2.25, 3.11, 1.09, 3.09, 0.1, 1.02, 2.33, 0.79, 0.7, 0.39, 0.71, 0.6, 5.8, -0.19, 0.65, 0.15, -0.14, -0.02, 0.27, 0.88, 1.21, -0.11, 3.34, 5.38, 3.49, 8.94, 0.61]} \ No newline at end of file diff --git a/annotations_1/dOZndhz24OA_filtered.json b/annotations_1/dOZndhz24OA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c27a9471014defc16a1444c33934c7412be2439 --- /dev/null +++ b/annotations_1/dOZndhz24OA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.08], [4.0, 7.94], [10.0, 14.64], [16.0, 23.31], [25.0, 25.68], [38.0, 60.15], [60.0, 61.77], [67.0, 77.28], [78.0, 80.16], [81.0, 81.38], [81.0, 82.53], [87.0, 92.18], [99.0, 99.12], [99.0, 101.44], [104.0, 105.48], [106.0, 108.94], [110.0, 112.13], [115.0, 116.09], [118.0, 118.54], [126.0, 129.22], [130.0, 135.11], [139.0, 139.73], [141.0, 144.39], [162.0, 171.86]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, true, false], "silence_prob": [0.0, 80.29, 78.89, 31.15, 0.0, 29.95, 0.0, 38.4, 57.64, 0.0, 0.0, 29.84, 0.0, 29.43, 0.0, 29.39, 32.39, 0.0, 0.0, 50.31, 33.46, 0.0, 29.36, 29.68], "audiomae_on_audioset": [null, null, null, [["speech", 26.53], ["sidetone", 20.27], ["whack, thwack", 13.94]], null, [["sidetone", 47.51], ["speech", 12.4], ["music", 7.37]], null, [["music", 73.6], ["whale vocalization", 10.14], ["buzz", 1.92]], null, null, null, [["speech", 86.2], ["grunt", 1.99], ["beatboxing", 1.74]], null, [["speech", 78.11], ["boing", 3.72], ["grunt", 3.5]], null, [["speech", 51.87], ["music", 8.17], ["beatboxing", 7.49]], [["hum", 31.39], ["mains hum", 13.77], ["music", 12.99]], null, null, null, [["speech", 28.11], ["sidetone", 20.74], ["music", 10.44]], null, [["speech", 30.83], ["music", 15.12], ["grunt", 11.13]], [["speech", 51.41], ["grunt", 32.44], ["music", 5.24]]], "duration": [0.08, 3.94, 4.64, 7.31, 0.68, 22.15, 1.77, 10.28, 2.16, 0.38, 1.53, 5.18, 0.12, 2.44, 1.48, 2.94, 2.13, 1.09, 0.54, 3.22, 5.11, 0.73, 3.39, 9.86]} \ No newline at end of file diff --git a/annotations_1/dQNrOoc3NTA_filtered.json b/annotations_1/dQNrOoc3NTA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96eef079bb1de7851ac0d0c894892d3b72f54921 --- /dev/null +++ b/annotations_1/dQNrOoc3NTA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 25.35], [26.0, 27.09], [28.0, 28.85], [30.0, 32.36], [33.0, 33.93], [35.0, 37.05], [37.0, 38.8], [42.0, 44.22], [45.0, 46.52], [48.0, 58.29], [59.0, 63.8], [71.0, 109.0], [112.0, 132.98], [135.0, 135.28], [136.0, 137.71], [139.0, 139.28], [141.0, 141.44], [144.0, 144.69], [146.0, 147.61], [148.0, 148.59]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.49, 0.0, 41.05, 0.0, 42.51, 0.0, 66.39, 78.89, 0.0, 43.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 54.68], ["music", 12.52], ["livestock, farm animals, working animals", 2.98]], null, [["music", 32.69], ["speech", 17.17], ["hum", 10.36]], null, [["mains hum", 39.7], ["music", 19.27], ["hum", 18.42]], null, null, null, null, [["music", 65.44], ["whale vocalization", 10.63], ["didgeridoo", 2.97]], null, null, null, null, null, null, null], "duration": [0.35, 1.09, 0.85, 2.36, 0.93, 2.05, 1.8, 2.22, 1.52, 10.29, 4.8, 38.0, 20.98, 0.28, 1.71, 0.28, 0.44, 0.69, 1.61, 0.59]} \ No newline at end of file diff --git a/annotations_1/dR0_tMYKwXE_filtered.json b/annotations_1/dR0_tMYKwXE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e2f595c758b22db8c6117529a940bef8ee70bdc --- /dev/null +++ b/annotations_1/dR0_tMYKwXE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.63], [6.0, 9.46], [10.0, 14.3], [15.0, 16.48], [32.0, 32.78], [37.0, 38.16], [54.0, 54.51], [71.0, 71.0], [73.0, 73.67], [80.0, 79.88], [109.0, 109.59], [112.0, 112.36], [116.0, 116.33], [119.0, 118.99], [121.0, 122.0], [127.0, 127.57], [132.0, 132.61], [134.0, 133.98], [142.0, 142.91], [144.0, 145.74], [146.0, 149.93], [150.0, 159.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.26, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 99.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.63, 3.46, 4.3, 1.48, 0.78, 1.16, 0.51, 0.0, 0.67, -0.12, 0.59, 0.36, 0.33, -0.01, 1.0, 0.57, 0.61, -0.02, 0.91, 1.74, 3.93, 9.41]} \ No newline at end of file diff --git a/annotations_1/dR3cjXncoSk_filtered.json b/annotations_1/dR3cjXncoSk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb72b0a56673a9d3770fd7005c9e6983f434215b --- /dev/null +++ b/annotations_1/dR3cjXncoSk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.43], [12.0, 12.66], [17.0, 17.29], [18.0, 18.47], [27.0, 30.13], [34.0, 42.2], [42.0, 55.98], [63.0, 76.96], [79.0, 84.5], [85.0, 85.43], [86.0, 88.33], [89.0, 89.48], [91.0, 95.57], [97.0, 119.75], [120.0, 120.72], [122.0, 130.23], [132.0, 136.8], [139.0, 139.24], [145.0, 145.13], [149.0, 155.09], [164.0, 170.92], [173.0, 176.01], [183.0, 183.56], [185.0, 186.56], [188.0, 188.65], [189.0, 194.14], [195.0, 198.83]], "keep_status": [true, false, false, false, true, true, true, false, false, false, false, false, true, false, false, true, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [41.24, 0.0, 0.0, 0.0, 36.91, 45.52, 30.58, 29.67, 31.5, 0.0, 31.26, 0.0, 29.66, 28.89, 0.0, 28.7, 29.29, 0.0, 0.0, 31.77, 29.37, 32.42, 0.0, 0.0, 0.0, 32.77, 69.2], "audiomae_on_audioset": [[["hum", 23.32], ["noise", 15.92], ["throbbing", 10.42]], null, null, null, [["speech", 26.39], ["sidetone", 24.52], ["hum", 11.47]], [["frog", 17.13], ["hum", 16.34], ["music", 15.79]], [["music", 32.42], ["throbbing", 16.42], ["cacophony", 5.56]], [["speech", 54.33], ["music", 30.88], ["explosion", 1.79]], [["music", 49.2], ["speech", 16.72], ["electronic music", 5.47]], null, [["speech", 66.05], ["music", 21.63], ["helicopter", 2.51]], null, [["speech", 36.16], ["music", 15.17], ["hum", 11.75]], [["music", 39.68], ["speech", 34.04], ["buzz", 2.8]], null, [["music", 22.7], ["speech", 17.56], ["electric shaver, electric razor", 7.37]], [["livestock, farm animals, working animals", 43.6], ["cattle, bovinae", 27.42], ["moo", 21.45]], null, null, [["music", 34.1], ["speech", 22.32], ["fart", 10.19]], [["music", 33.68], ["speech", 14.72], ["hum", 9.68]], [["music", 49.18], ["speech", 13.24], ["explosion", 4.04]], null, null, null, [["clang", 43.54], ["ding", 40.26], ["fly, housefly", 1.62]], null], "duration": [7.43, 0.66, 0.29, 0.47, 3.13, 8.2, 13.98, 13.96, 5.5, 0.43, 2.33, 0.48, 4.57, 22.75, 0.72, 8.23, 4.8, 0.24, 0.13, 6.09, 6.92, 3.01, 0.56, 1.56, 0.65, 5.14, 3.83]} \ No newline at end of file diff --git a/annotations_1/dRVq4Um7E5Q_filtered.json b/annotations_1/dRVq4Um7E5Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2bdd6ea629ead4615199007a0d176ced633c895 --- /dev/null +++ b/annotations_1/dRVq4Um7E5Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.01], [17.0, 31.8], [32.0, 34.48], [35.0, 65.74], [67.0, 72.03], [74.0, 82.09], [85.0, 85.43], [88.0, 88.38], [91.0, 93.01], [95.0, 94.69], [99.0, 99.13], [100.0, 132.61], [135.0, 139.14], [143.0, 145.29], [146.0, 152.39], [154.0, 161.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.88, 35.91, 77.03, 0.0, 63.42, 96.54, 0.0, 0.0, 62.78, 0.0, 0.0, 0.0, 50.11, 99.9, 97.83, 89.9], "audiomae_on_audioset": [null, [["music", 39.96], ["neigh, whinny", 21.15], ["horse", 21.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.01, 14.8, 2.48, 30.74, 5.03, 8.09, 0.43, 0.38, 2.01, -0.31, 0.13, 32.61, 4.14, 2.29, 6.39, 7.59]} \ No newline at end of file diff --git a/annotations_1/dSdY41CWixQ_filtered.json b/annotations_1/dSdY41CWixQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd5c0221286b62b97dd062b960a5e9e17f06cf8d --- /dev/null +++ b/annotations_1/dSdY41CWixQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.37], [15.0, 16.71], [23.0, 23.33], [38.0, 39.18], [40.0, 41.72], [49.0, 49.18], [55.0, 55.58], [59.0, 59.54], [60.0, 61.91], [64.0, 68.18], [71.0, 71.93], [73.0, 81.16], [82.0, 88.87], [93.0, 98.61], [101.0, 103.52], [114.0, 118.52], [119.0, 122.5], [129.0, 129.74], [131.0, 132.39], [135.0, 144.66], [145.0, 145.83], [154.0, 169.32], [171.0, 173.53], [177.0, 177.53], [179.0, 178.87], [180.0, 180.05], [180.0, 180.86], [186.0, 189.31], [199.0, 200.13], [202.0, 203.12], [204.0, 206.04], [215.0, 216.55]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.74, 0.0, 28.9, 29.35, 84.62, 65.91, 52.86, 49.68, 0.0, 0.0, 31.92, 0.0, 30.31, 31.39, 0.0, 0.0, 0.0, 0.0, 32.44, 0.0, 0.0, 51.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 32.01], ["music", 19.01], ["foghorn", 5.19]], null, [["moo", 17.47], ["cattle, bovinae", 16.16], ["buzz", 14.03]], [["thunk", 70.77], ["whack, thwack", 13.6], ["speech", 5.89]], null, null, null, [["hoot", 34.42], ["owl", 15.95], ["music", 14.12]], null, null, [["music", 83.72], ["speech", 4.47], ["groan", 1.85]], null, [["music", 37.3], ["speech", 21.88], ["hum", 7.85]], [["moo", 34.93], ["livestock, farm animals, working animals", 32.13], ["cattle, bovinae", 28.67]], null, null, null, null, [["fart", 41.16], ["speech", 15.68], ["fly, housefly", 10.75]], null, null, null, null], "duration": [1.37, 1.71, 0.33, 1.18, 1.72, 0.18, 0.58, 0.54, 1.91, 4.18, 0.93, 8.16, 6.87, 5.61, 2.52, 4.52, 3.5, 0.74, 1.39, 9.66, 0.83, 15.32, 2.53, 0.53, -0.13, 0.05, 0.86, 3.31, 1.13, 1.12, 2.04, 1.55]} \ No newline at end of file diff --git a/annotations_1/dTVEd7WtyAw_filtered.json b/annotations_1/dTVEd7WtyAw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59d1406d706d36de1de094b7abdedc6bff46c587 --- /dev/null +++ b/annotations_1/dTVEd7WtyAw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [6.0, 8.02], [9.0, 10.25], [10.0, 11.23], [12.0, 13.58], [14.0, 33.56], [34.0, 40.37], [41.0, 45.2], [48.0, 50.04], [52.0, 54.82], [56.0, 55.63], [56.0, 55.66], [56.0, 55.7], [56.0, 67.95], [68.0, 74.34], [76.0, 78.22], [80.0, 93.5], [96.0, 98.46], [99.0, 100.41], [101.0, 102.25], [115.0, 116.13], [118.0, 154.14], [156.0, 158.84], [170.0, 170.72], [173.0, 176.52], [177.0, 185.52], [189.0, 189.75], [191.0, 191.84]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 76.7, 0.0, 0.0, 0.0, 39.91, 36.25, 37.26, 38.37, 41.09, 0.0, 0.0, 0.0, 36.11, 39.33, 68.02, 36.89, 35.52, 0.0, 0.0, 0.0, 0.0, 35.43, 0.0, 37.0, 39.31, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 59.96], ["speech", 9.57], ["hum", 5.89]], [["music", 70.75], ["musical instrument", 3.92], ["guitar", 2.72]], [["music", 77.1], ["chorus effect", 2.78], ["singing", 2.55]], [["throbbing", 23.51], ["music", 18.46], ["moo", 9.11]], [["music", 64.96], ["synthesizer", 7.75], ["sampler", 3.7]], null, null, null, [["music", 73.57], ["singing", 4.91], ["male singing", 1.85]], [["music", 47.57], ["effects unit", 11.17], ["guitar", 10.55]], null, [["music", 77.07], ["speech", 2.0], ["synthesizer", 1.87]], [["music", 73.97], ["electronic music", 3.0], ["synthesizer", 2.86]], null, null, null, null, [["music", 30.96], ["moo", 14.86], ["cattle, bovinae", 6.85]], null, [["music", 16.26], ["fly, housefly", 16.17], ["grunt", 8.52]], [["music", 41.72], ["speech", 32.76], ["sidetone", 14.26]], null, null], "duration": [1.08, 2.02, 1.25, 1.23, 1.58, 19.56, 6.37, 4.2, 2.04, 2.82, -0.37, -0.34, -0.3, 11.95, 6.34, 2.22, 13.5, 2.46, 1.41, 1.25, 1.13, 36.14, 2.84, 0.72, 3.52, 8.52, 0.75, 0.84]} \ No newline at end of file diff --git a/annotations_1/dUMW1YRsWcY_filtered.json b/annotations_1/dUMW1YRsWcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92942b83de28f58f3bce3137ae73356d1df261d8 --- /dev/null +++ b/annotations_1/dUMW1YRsWcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 14.91], [16.0, 47.12], [58.0, 58.99], [61.0, 68.08], [69.0, 70.87], [73.0, 74.02], [77.0, 81.55], [83.0, 87.07], [89.0, 91.37], [92.0, 96.87], [97.0, 99.84], [101.0, 105.17], [106.0, 109.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [44.32, 0.0, 0.0, 90.08, 0.0, 0.0, 89.54, 87.92, 84.07, 89.19, 36.37, 84.62, 84.8], "audiomae_on_audioset": [[["hum", 33.54], ["music", 25.6], ["mains hum", 15.14]], null, null, null, null, null, null, null, null, null, [["speech", 40.98], ["whale vocalization", 10.71], ["hum", 6.62]], null, null], "duration": [8.91, 31.12, 0.99, 7.08, 1.87, 1.02, 4.55, 4.07, 2.37, 4.87, 2.84, 4.17, 3.21]} \ No newline at end of file diff --git a/annotations_1/dUbNFv_h6Kc_filtered.json b/annotations_1/dUbNFv_h6Kc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4fba173ccfcfcbccf39552ad25c9917e77f3e23 --- /dev/null +++ b/annotations_1/dUbNFv_h6Kc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.62], [14.0, 58.56], [59.0, 59.56], [64.0, 69.87], [72.0, 73.21], [74.0, 75.25], [79.0, 79.34], [81.0, 81.55], [97.0, 98.86], [100.0, 100.2], [102.0, 102.49], [107.0, 107.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.31, 0.0, 0.0, 37.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 88.49], ["musical instrument", 1.14], ["tick-tock", 1.07]], null, null, [["theremin", 40.7], ["music", 31.87], ["musical instrument", 7.06]], null, null, null, null, null, null, null, null], "duration": [6.62, 44.56, 0.56, 5.87, 1.21, 1.25, 0.34, 0.55, 1.86, 0.2, 0.49, 0.91]} \ No newline at end of file diff --git a/annotations_1/dVFDYCPO19A_filtered.json b/annotations_1/dVFDYCPO19A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e38c3c425cb0dc44be5c6ac72487a5c3804d119f --- /dev/null +++ b/annotations_1/dVFDYCPO19A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.91], [25.0, 28.81], [31.0, 31.33], [33.0, 32.98], [37.0, 37.66], [46.0, 46.67], [48.0, 56.17], [58.0, 58.6], [59.0, 59.83], [67.0, 67.58], [71.0, 76.01], [77.0, 89.06], [90.0, 90.69], [92.0, 92.57], [96.0, 96.65], [97.0, 98.31], [99.0, 99.54], [100.0, 100.79], [103.0, 103.84], [104.0, 104.77], [107.0, 108.94]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.52, 77.87, 0.0, 0.0, 0.0, 0.0, 33.03, 0.0, 0.0, 0.0, 40.04, 35.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 49.7], ["speech", 7.96], ["musical instrument", 2.76]], null, null, null, null, null, [["slap, smack", 47.99], ["whack, thwack", 26.36], ["whip", 5.9]], null, null, null, [["burping, eructation", 50.85], ["thunk", 8.85], ["knock", 5.66]], [["speech", 59.07], ["fart", 28.33], ["animal", 3.51]], null, null, null, null, null, null, null, null, null], "duration": [2.91, 3.81, 0.33, -0.02, 0.66, 0.67, 8.17, 0.6, 0.83, 0.58, 5.01, 12.06, 0.69, 0.57, 0.65, 1.31, 0.54, 0.79, 0.84, 0.77, 1.94]} \ No newline at end of file diff --git a/annotations_1/dVLMfoIop9M_filtered.json b/annotations_1/dVLMfoIop9M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cb52715f1684e3c60bfd338cb214396262fbd40 --- /dev/null +++ b/annotations_1/dVLMfoIop9M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [6.0, 7.62], [9.0, 9.58], [11.0, 11.99], [13.0, 14.35], [18.0, 19.94], [21.0, 20.97], [21.0, 25.47], [27.0, 30.5], [33.0, 33.96], [37.0, 37.94], [41.0, 41.39], [44.0, 45.39], [49.0, 49.28], [59.0, 59.88], [72.0, 74.31], [84.0, 86.12], [91.0, 97.46], [110.0, 111.77], [123.0, 124.73], [133.0, 133.74], [149.0, 148.91], [149.0, 149.47], [151.0, 151.75], [153.0, 153.77], [168.0, 170.41], [180.0, 183.32], [191.0, 195.08]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.07, 33.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.33, 48.31, 30.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.53, 56.78, 29.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 39.16], ["speech", 9.94], ["wind instrument, woodwind instrument", 9.76]], [["music", 40.34], ["wind instrument, woodwind instrument", 19.16], ["shofar", 8.55]], null, null, null, null, null, null, [["music", 51.99], ["musical instrument", 2.8], ["piano", 2.31]], [["speech", 33.24], ["busy signal", 18.78], ["sidetone", 7.44]], [["music", 69.55], ["funny music", 2.71], ["musical instrument", 2.52]], null, null, null, null, null, null, null, [["music", 61.27], ["marimba, xylophone", 5.76], ["glockenspiel", 4.38]], null, [["music", 46.55], ["synthetic singing", 6.86], ["theremin", 4.05]]], "duration": [1.17, 1.62, 0.58, 0.99, 1.35, 1.94, -0.03, 4.47, 3.5, 0.96, 0.94, 0.39, 1.39, 0.28, 0.88, 2.31, 2.12, 6.46, 1.77, 1.73, 0.74, -0.09, 0.47, 0.75, 0.77, 2.41, 3.32, 4.08]} \ No newline at end of file diff --git a/annotations_1/dVzFy-4c-AY_filtered.json b/annotations_1/dVzFy-4c-AY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30c05f6f970d9e25d1efb7585d8b872f9e1c2bcf --- /dev/null +++ b/annotations_1/dVzFy-4c-AY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[76.0, 93.93], [97.0, 99.2], [100.0, 102.37], [103.0, 104.57], [109.0, 109.61], [111.0, 112.35], [114.0, 118.29], [119.0, 122.88], [124.0, 131.31], [132.0, 134.37], [139.0, 147.26], [150.0, 150.52], [151.0, 152.49], [154.0, 155.76], [157.0, 157.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.2, 66.51, 62.68, 0.0, 0.0, 0.0, 47.31, 98.8, 54.36, 89.72, 50.51, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 37.54], ["music", 31.31], ["hum", 14.85]], null, null, null, null, null, [["music", 55.0], ["sonar", 17.37], ["electronic music", 4.36]], null, null, null, null, null, null, null, null], "duration": [17.93, 2.2, 2.37, 1.57, 0.61, 1.35, 4.29, 3.88, 7.31, 2.37, 8.26, 0.52, 1.49, 1.76, 0.54]} \ No newline at end of file diff --git a/annotations_1/dX0dcSJE7ek_filtered.json b/annotations_1/dX0dcSJE7ek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb3a5714f7bb72e7ec956b7b0548fd8c843e17fe --- /dev/null +++ b/annotations_1/dX0dcSJE7ek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.24], [13.0, 13.42], [16.0, 16.24], [17.0, 18.72], [21.0, 21.36], [23.0, 24.61], [26.0, 27.92], [46.0, 46.92], [62.0, 62.09], [63.0, 63.14], [65.0, 70.98], [88.0, 88.43], [89.0, 90.68], [93.0, 93.58], [99.0, 100.95], [101.0, 102.46], [107.0, 107.77], [114.0, 114.34], [117.0, 120.38], [131.0, 131.55], [132.0, 131.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["mosquito", 55.56], ["fly, housefly", 23.4], ["insect", 5.86]], null, null, null, null, null, null, null, [["explosion", 16.82], ["mosquito", 11.14], ["music", 9.13]], null, null], "duration": [0.24, 0.42, 0.24, 1.72, 0.36, 1.61, 1.92, 0.92, 0.09, 0.14, 5.98, 0.43, 1.68, 0.58, 1.95, 1.46, 0.77, 0.34, 3.38, 0.55, -0.37]} \ No newline at end of file diff --git a/annotations_1/dXNmLJXEgQU_filtered.json b/annotations_1/dXNmLJXEgQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6baaf7cf50e104e592851ebff23fb54cbe2bc693 --- /dev/null +++ b/annotations_1/dXNmLJXEgQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.09], [12.0, 11.74], [13.0, 14.86], [15.0, 15.99], [32.0, 36.66], [37.0, 47.02], [52.0, 52.05], [55.0, 56.98], [63.0, 64.05], [66.0, 66.95], [68.0, 70.02], [71.0, 75.69], [82.0, 85.29], [87.0, 96.42], [108.0, 108.58], [110.0, 110.71], [114.0, 114.51], [117.0, 117.46], [121.0, 121.51], [122.0, 123.63], [126.0, 128.04], [133.0, 132.75], [134.0, 134.99], [137.0, 141.79], [142.0, 143.34], [144.0, 144.66]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [61.27, 0.0, 0.0, 0.0, 74.13, 33.5, 0.0, 0.0, 0.0, 0.0, 89.54, 66.51, 84.07, 35.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.97, 0.0, 0.0, 42.81, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["emergency vehicle", 22.52], ["siren", 21.36], ["speech", 15.47]], null, null, null, null, null, null, null, [["music", 48.13], ["whale vocalization", 8.64], ["throbbing", 7.68]], null, null, null, null, null, null, [["fly, housefly", 31.94], ["mosquito", 18.38], ["insect", 16.5]], null, null, [["music", 62.25], ["musical instrument", 6.05], ["trombone", 5.68]], null, null], "duration": [2.09, -0.26, 1.86, 0.99, 4.66, 10.02, 0.05, 1.98, 1.05, 0.95, 2.02, 4.69, 3.29, 9.42, 0.58, 0.71, 0.51, 0.46, 0.51, 1.63, 2.04, -0.25, 0.99, 4.79, 1.34, 0.66]} \ No newline at end of file diff --git a/annotations_1/dXNu5a3KmMg_filtered.json b/annotations_1/dXNu5a3KmMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f5ce4d17207c53a4e2de84c5ed5daabcf02c7c1 --- /dev/null +++ b/annotations_1/dXNu5a3KmMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.33], [17.0, 23.03], [26.0, 26.67], [27.0, 27.65], [28.0, 28.51], [29.0, 29.37], [30.0, 29.88], [34.0, 33.89], [37.0, 37.79], [39.0, 38.91], [48.0, 49.2], [50.0, 54.78], [66.0, 66.29], [78.0, 78.9], [81.0, 82.36], [85.0, 85.89], [87.0, 87.25], [97.0, 97.38], [102.0, 102.86], [105.0, 105.11], [110.0, 109.88], [113.0, 114.02], [115.0, 114.98], [139.0, 139.53], [144.0, 145.72], [151.0, 152.1], [155.0, 156.19], [157.0, 158.13], [160.0, 161.69]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 45.56], ["frog", 6.46], ["whale vocalization", 4.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 6.03, 0.67, 0.65, 0.51, 0.37, -0.12, -0.11, 0.79, -0.09, 1.2, 4.78, 0.29, 0.9, 1.36, 0.89, 0.25, 0.38, 0.86, 0.11, -0.12, 1.02, -0.02, 0.53, 1.72, 1.1, 1.19, 1.13, 1.69]} \ No newline at end of file diff --git a/annotations_1/dXk2wGeBUHE_filtered.json b/annotations_1/dXk2wGeBUHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a2505e8dcb6bf2f73d01d11b0ee00fe5b720ea5 --- /dev/null +++ b/annotations_1/dXk2wGeBUHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [3.0, 3.87], [5.0, 5.7], [7.0, 7.53], [9.0, 10.66], [12.0, 23.3], [24.0, 24.26], [25.0, 26.28], [30.0, 30.84], [31.0, 31.95], [33.0, 33.81], [35.0, 36.14], [43.0, 44.71], [45.0, 49.67], [53.0, 54.41], [55.0, 56.39], [57.0, 57.33], [59.0, 78.58], [87.0, 87.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 46.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.02, 0.0, 0.0, 0.0, 31.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 81.43], ["telephone", 4.85], ["hum", 2.92]], null, null, null, null, null, null, null, [["music", 40.89], ["speech", 24.56], ["theremin", 9.58]], null, null, null, [["throbbing", 37.87], ["hum", 20.96], ["music", 20.45]], null], "duration": [1.1, 0.87, 0.7, 0.53, 1.66, 11.3, 0.26, 1.28, 0.84, 0.95, 0.81, 1.14, 1.71, 4.67, 1.41, 1.39, 0.33, 19.58, 0.88]} \ No newline at end of file diff --git a/annotations_1/dYafG2EuZjs_filtered.json b/annotations_1/dYafG2EuZjs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c91a60df7c8d8c54e5faa66596e8f9968d6e6ee3 --- /dev/null +++ b/annotations_1/dYafG2EuZjs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.56], [8.0, 9.91], [10.0, 11.35], [14.0, 14.67], [23.0, 23.73], [27.0, 27.82], [29.0, 30.38], [34.0, 36.85], [38.0, 38.03], [39.0, 39.04], [40.0, 40.15], [43.0, 44.9], [46.0, 46.43], [47.0, 56.56], [57.0, 58.08], [59.0, 60.13], [61.0, 61.43], [63.0, 63.14], [66.0, 66.92], [77.0, 80.7], [85.0, 103.87], [104.0, 127.52], [133.0, 133.03], [134.0, 135.62], [136.0, 137.71], [138.0, 138.48], [139.0, 140.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 37.72, 53.4, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.96], ["hum", 8.78], ["thunk", 5.16]], null, null, null, null, null, null, null], "duration": [2.56, 1.91, 1.35, 0.67, 0.73, 0.82, 1.38, 2.85, 0.03, 0.04, 0.15, 1.9, 0.43, 9.56, 1.08, 1.13, 0.43, 0.14, 0.92, 3.7, 18.87, 23.52, 0.03, 1.62, 1.71, 0.48, 1.56]} \ No newline at end of file diff --git a/annotations_1/dZb8CGMC1zA_filtered.json b/annotations_1/dZb8CGMC1zA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8ab6b793ae6569c17b0716db507741428868e97 --- /dev/null +++ b/annotations_1/dZb8CGMC1zA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.82], [8.0, 7.94], [8.0, 8.06], [17.0, 29.84], [30.0, 31.46], [31.0, 31.5], [32.0, 32.63], [33.0, 33.61], [34.0, 35.56], [36.0, 41.4], [42.0, 43.85], [45.0, 46.85], [49.0, 49.23], [54.0, 54.31], [54.0, 57.65], [58.0, 59.73], [60.0, 71.34], [72.0, 74.06], [79.0, 79.71], [81.0, 81.53], [84.0, 86.26], [87.0, 88.13], [90.0, 90.12], [91.0, 91.02], [92.0, 92.91], [93.0, 93.82], [99.0, 100.55], [101.0, 104.01], [104.0, 105.39], [106.0, 107.89], [108.0, 110.71], [111.0, 111.97], [113.0, 113.27], [115.0, 115.37], [116.0, 116.92], [118.0, 120.56], [121.0, 125.12], [127.0, 128.48], [130.0, 132.31], [148.0, 147.95], [157.0, 158.09], [160.0, 160.73], [161.0, 161.94], [164.0, 166.94], [180.0, 200.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [32.04, 0.0, 0.0, 30.26, 0.0, 0.0, 0.0, 0.0, 0.0, 59.59, 0.0, 0.0, 0.0, 0.0, 39.96, 0.0, 41.81, 44.78, 0.0, 0.0, 45.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 80.46, 0.0, 0.0, 0.0, 0.0, 78.89, 98.19, 0.0, 71.29, 0.0, 0.0, 0.0, 0.0, 28.98, 48.48], "audiomae_on_audioset": [[["speech", 83.36], ["whack, thwack", 4.76], ["fart", 2.28]], null, null, [["speech", 78.53], ["whack, thwack", 4.29], ["inside, large room or hall", 2.19]], null, null, null, null, null, null, null, null, null, null, [["speech", 69.21], ["music", 4.49], ["sidetone", 3.33]], null, [["music", 33.32], ["electric shaver, electric razor", 19.91], ["speech", 12.85]], [["music", 46.75], ["speech", 35.13], ["musical instrument", 1.35]], null, null, [["music", 46.78], ["sheep", 5.89], ["livestock, farm animals, working animals", 5.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sound effect", 19.47], ["whack, thwack", 18.57], ["speech", 14.32]], [["music", 54.37], ["hum", 11.81], ["throbbing", 6.74]]], "duration": [6.82, -0.06, 0.06, 12.84, 1.46, 0.5, 0.63, 0.61, 1.56, 5.4, 1.85, 1.85, 0.23, 0.31, 3.65, 1.73, 11.34, 2.06, 0.71, 0.53, 2.26, 1.13, 0.12, 0.02, 0.91, 0.82, 1.55, 3.01, 1.39, 1.89, 2.71, 0.97, 0.27, 0.37, 0.92, 2.56, 4.12, 1.48, 2.31, -0.05, 1.09, 0.73, 0.94, 2.94, 20.82]} \ No newline at end of file diff --git a/annotations_1/dZjgSYTxWsY_filtered.json b/annotations_1/dZjgSYTxWsY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5958bdc350bb22c68f898b373775042ddf80ed0 --- /dev/null +++ b/annotations_1/dZjgSYTxWsY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.88], [12.0, 13.66], [23.0, 23.33], [31.0, 35.33], [36.0, 37.5], [39.0, 40.17], [42.0, 42.89], [44.0, 44.52], [47.0, 47.48], [55.0, 56.12], [58.0, 58.75], [63.0, 64.62], [85.0, 85.16], [95.0, 95.44], [103.0, 103.5], [109.0, 110.17], [110.0, 111.18], [112.0, 112.29], [117.0, 117.34], [118.0, 119.7], [124.0, 124.33], [125.0, 125.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 80.73], ["sidetone", 6.47], ["hum", 1.99]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 1.66, 0.33, 4.33, 1.5, 1.17, 0.89, 0.52, 0.48, 1.12, 0.75, 1.62, 0.16, 0.44, 0.5, 1.17, 1.18, 0.29, 0.34, 1.7, 0.33, 0.59]} \ No newline at end of file diff --git a/annotations_1/dZmGh0bXqqw_filtered.json b/annotations_1/dZmGh0bXqqw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2605fe8a8e3614fca745ad4de7f121ef96973a5 --- /dev/null +++ b/annotations_1/dZmGh0bXqqw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.91], [20.0, 21.09], [24.0, 24.61], [27.0, 28.09], [33.0, 36.17], [39.0, 41.81], [44.0, 44.27], [46.0, 46.84], [77.0, 78.46], [80.0, 81.08], [86.0, 86.02], [90.0, 90.22], [94.0, 98.22], [100.0, 101.36], [105.0, 105.66], [108.0, 109.78], [117.0, 118.18], [131.0, 132.53], [150.0, 151.38], [158.0, 159.16], [163.0, 162.68], [163.0, 165.5], [170.0, 173.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [78.89, 0.0, 0.0, 0.0, 92.48, 65.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.21, 34.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.11], ["theremin", 40.57], ["musical instrument", 1.71]], null, null, null, null, null, null, null, null, [["music", 63.26], ["electronica", 2.08], ["didgeridoo", 1.58]], [["music", 58.85], ["disco", 3.0], ["pop music", 1.84]]], "duration": [3.91, 1.09, 0.61, 1.09, 3.17, 2.81, 0.27, 0.84, 1.46, 1.08, 0.02, 0.22, 4.22, 1.36, 0.66, 1.78, 1.18, 1.53, 1.38, 1.16, -0.32, 2.5, 3.1]} \ No newline at end of file diff --git a/annotations_1/d_A4tfEukp4_filtered.json b/annotations_1/d_A4tfEukp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d6dd27f1e8738a6cdab6efd9bf35b25f34f5128 --- /dev/null +++ b/annotations_1/d_A4tfEukp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [9.0, 10.57], [11.0, 12.8], [14.0, 18.18], [24.0, 25.83], [29.0, 30.5], [31.0, 32.48], [34.0, 35.31], [36.0, 41.94], [51.0, 78.46], [80.0, 81.55], [83.0, 139.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.25, 0.0, 0.0, 0.0, 0.0, 33.5, 29.36, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 77.28], ["hum", 4.74], ["throbbing", 2.26]], null, null, null, null, [["speech", 59.06], ["animal", 14.67], ["music", 2.81]], [["music", 48.74], ["speech", 31.65], ["throbbing", 6.24]], null, null], "duration": [0.5, 1.57, 1.8, 4.18, 1.83, 1.5, 1.48, 1.31, 5.94, 27.46, 1.55, 56.09]} \ No newline at end of file diff --git a/annotations_1/d_hNjBBdcyU_filtered.json b/annotations_1/d_hNjBBdcyU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b37e63c10a5e97de9c801142295fa86cdc88013b --- /dev/null +++ b/annotations_1/d_hNjBBdcyU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.31], [8.0, 11.13], [16.0, 16.83], [19.0, 19.43], [21.0, 22.27], [23.0, 25.2], [26.0, 27.28], [31.0, 31.67], [35.0, 35.55], [39.0, 38.91], [46.0, 46.7], [58.0, 59.68], [65.0, 65.92], [75.0, 75.05], [82.0, 82.49], [83.0, 87.39], [88.0, 101.43], [102.0, 103.1], [104.0, 104.14], [106.0, 106.14], [108.0, 110.1], [114.0, 115.77], [119.0, 119.7], [121.0, 128.53], [139.0, 141.88], [145.0, 151.12], [163.0, 172.44]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [37.8, 46.12, 0.0, 0.0, 0.0, 77.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 43.69, 0.0, 0.0, 0.0, 51.99, 0.0, 0.0, 29.08, 42.33, 30.87, 30.09], "audiomae_on_audioset": [[["speech", 62.87], ["telephone bell ringing", 10.19], ["telephone", 6.65]], [["music", 24.1], ["didgeridoo", 11.61], ["speech", 7.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.5], ["singing bowl", 20.19], ["sonar", 5.09]], null, null, null, null, null, null, [["whack, thwack", 27.26], ["speech", 23.95], ["music", 9.25]], [["music", 24.51], ["rumble", 12.53], ["hum", 7.11]], [["music", 26.06], ["rumble", 25.78], ["mains hum", 21.92]], [["hum", 19.69], ["buzz", 18.71], ["mains hum", 10.86]]], "duration": [2.31, 3.13, 0.83, 0.43, 1.27, 2.2, 1.28, 0.67, 0.55, -0.09, 0.7, 1.68, 0.92, 0.05, 0.49, 4.39, 13.43, 1.1, 0.14, 0.14, 2.1, 1.77, 0.7, 7.53, 2.88, 6.12, 9.44]} \ No newline at end of file diff --git a/annotations_1/daVOnsL2wkU_filtered.json b/annotations_1/daVOnsL2wkU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bafdcb773bd9398b9696945e6a7bd4f1bcee1777 --- /dev/null +++ b/annotations_1/daVOnsL2wkU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.23], [10.0, 10.69], [12.0, 12.12], [13.0, 14.44], [15.0, 26.59], [27.0, 29.22], [30.0, 31.11], [32.0, 34.47], [36.0, 38.15], [39.0, 42.15], [43.0, 46.04], [47.0, 49.37], [50.0, 52.03], [53.0, 54.46], [55.0, 56.86], [59.0, 77.67], [79.0, 85.18], [87.0, 89.65], [90.0, 94.37], [96.0, 99.47], [101.0, 123.38], [124.0, 125.29], [126.0, 129.44]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [37.82, 0.0, 0.0, 0.0, 46.4, 53.84, 0.0, 61.97, 68.41, 53.04, 72.46, 70.44, 54.04, 0.0, 0.0, 40.48, 71.57, 63.96, 61.37, 59.42, 56.18, 0.0, 45.62], "audiomae_on_audioset": [[["fly, housefly", 28.21], ["sidetone", 15.96], ["insect", 14.24]], null, null, null, [["fly, housefly", 30.93], ["bee, wasp, etc.", 24.31], ["animal", 11.68]], null, null, null, null, null, null, null, null, null, null, [["speech", 25.1], ["radio", 17.86], ["hum", 10.28]], null, null, null, null, null, null, [["music", 52.51], ["musical instrument", 7.35], ["guitar", 6.08]]], "duration": [2.23, 0.69, 0.12, 1.44, 11.59, 2.22, 1.11, 2.47, 2.15, 3.15, 3.04, 2.37, 2.03, 1.46, 1.86, 18.67, 6.18, 2.65, 4.37, 3.47, 22.38, 1.29, 3.44]} \ No newline at end of file diff --git a/annotations_1/dapP5W153YE_filtered.json b/annotations_1/dapP5W153YE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..231d6b068247a45c1899830b0c043b9186c25d3f --- /dev/null +++ b/annotations_1/dapP5W153YE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 32.59], [37.0, 45.99], [48.0, 58.28], [59.0, 77.65], [79.0, 94.42], [97.0, 98.63], [100.0, 118.96], [121.0, 126.57], [127.0, 136.29], [139.0, 148.04], [150.0, 153.25], [155.0, 157.59], [159.0, 177.31], [180.0, 205.97], [208.0, 207.81], [209.0, 209.65]], "keep_status": [false, true, true, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [30.38, 30.75, 30.43, 30.47, 29.95, 0.0, 30.36, 30.28, 30.24, 30.52, 30.47, 31.05, 30.33, 30.12, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.1], ["speech", 8.81], ["throbbing", 5.54]], [["music", 38.89], ["hum", 18.22], ["throbbing", 11.78]], [["livestock, farm animals, working animals", 24.52], ["music", 22.15], ["cattle, bovinae", 20.11]], [["music", 37.81], ["hum", 24.28], ["throbbing", 10.07]], [["music", 67.24], ["speech", 12.29], ["synthesizer", 5.43]], null, [["music", 37.96], ["hum", 25.14], ["throbbing", 13.09]], [["music", 47.43], ["throbbing", 6.46], ["hum", 4.49]], [["music", 49.72], ["speech", 15.64], ["synthesizer", 10.57]], [["vehicle", 21.38], ["speech", 19.3], ["car", 17.06]], [["music", 75.76], ["electronic music", 2.79], ["hum", 1.98]], [["music", 54.06], ["throbbing", 13.44], ["hum", 12.13]], [["music", 71.5], ["speech", 9.38], ["synthesizer", 4.08]], [["throbbing", 34.24], ["hum", 28.8], ["music", 15.58]], null, null], "duration": [13.59, 8.99, 10.28, 18.65, 15.42, 1.63, 18.96, 5.57, 9.29, 9.04, 3.25, 2.59, 18.31, 25.97, -0.19, 0.65]} \ No newline at end of file diff --git a/annotations_1/db1o8mTCBXU_filtered.json b/annotations_1/db1o8mTCBXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e5e59f62aea65ca54ee6d77f893da2d7a8eaba3 --- /dev/null +++ b/annotations_1/db1o8mTCBXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.66], [14.0, 17.14], [18.0, 19.18], [20.0, 22.65], [24.0, 27.58], [29.0, 40.78], [41.0, 41.13], [41.0, 41.2], [42.0, 50.33], [53.0, 52.95], [56.0, 61.7], [64.0, 64.96], [66.0, 67.04], [69.0, 71.52], [72.0, 73.99], [75.0, 78.27], [79.0, 79.76], [82.0, 83.3], [86.0, 87.49], [88.0, 90.31], [91.0, 91.64], [94.0, 95.62], [98.0, 99.1], [103.0, 102.64], [108.0, 108.26], [111.0, 112.36], [114.0, 115.32], [117.0, 116.95], [118.0, 120.73], [121.0, 126.39], [128.0, 128.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 73.51, 0.0, 82.25, 62.47, 50.36, 0.0, 0.0, 62.89, 0.0, 46.33, 0.0, 0.0, 48.91, 0.0, 62.47, 0.0, 0.0, 0.0, 70.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.31, 60.89, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 19.63], ["electric shaver, electric razor", 18.18], ["hum", 10.09]], null, null, [["speech", 33.63], ["music", 24.01], ["musical instrument", 8.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 22.31], ["throbbing", 9.39], ["musical instrument", 6.25]], null, null], "duration": [0.66, 3.14, 1.18, 2.65, 3.58, 11.78, 0.13, 0.2, 8.33, -0.05, 5.7, 0.96, 1.04, 2.52, 1.99, 3.27, 0.76, 1.3, 1.49, 2.31, 0.64, 1.62, 1.1, -0.36, 0.26, 1.36, 1.32, -0.05, 2.73, 5.39, 0.19]} \ No newline at end of file diff --git a/annotations_1/dbX-ekoWGWE_filtered.json b/annotations_1/dbX-ekoWGWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d2bfebf10ace4a5ea304b067bb5ea577c030caa --- /dev/null +++ b/annotations_1/dbX-ekoWGWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.81], [11.0, 11.65], [15.0, 17.0], [21.0, 22.5], [26.0, 27.92], [34.0, 34.59], [36.0, 36.44], [39.0, 40.34], [42.0, 43.16], [45.0, 45.89], [52.0, 54.85], [56.0, 56.59], [61.0, 62.4], [67.0, 68.1], [74.0, 74.04], [78.0, 79.74], [81.0, 82.56], [84.0, 85.4], [88.0, 88.13], [92.0, 96.08], [101.0, 102.0], [107.0, 107.84], [113.0, 113.71], [117.0, 118.99], [121.0, 122.17], [124.0, 124.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 49.39], ["speech", 13.22], ["musical instrument", 10.09]], null, null, null, null, null, null, null, null, [["music", 72.97], ["guitar", 7.76], ["musical instrument", 4.84]], null, null, null, null, null, null], "duration": [0.81, 0.65, 2.0, 1.5, 1.92, 0.59, 0.44, 1.34, 1.16, 0.89, 2.85, 0.59, 1.4, 1.1, 0.04, 1.74, 1.56, 1.4, 0.13, 4.08, 1.0, 0.84, 0.71, 1.99, 1.17, 0.85]} \ No newline at end of file diff --git a/annotations_1/dc8glsGbIus_filtered.json b/annotations_1/dc8glsGbIus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c7755a150c30e0f8a8a996ca1e2fd37ddf2f45f --- /dev/null +++ b/annotations_1/dc8glsGbIus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.01], [6.0, 6.47], [7.0, 8.51], [9.0, 9.75], [11.0, 11.28], [13.0, 15.18], [18.0, 20.92], [25.0, 29.03], [33.0, 53.89], [54.0, 54.77], [55.0, 55.81], [56.0, 56.51], [58.0, 64.57], [65.0, 85.77], [87.0, 88.13], [89.0, 110.29], [114.0, 119.45], [120.0, 120.55], [124.0, 124.6], [126.0, 127.23], [130.0, 130.13], [131.0, 132.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, true, false, false, false, false, false], "silence_prob": [52.56, 0.0, 0.0, 0.0, 0.0, 59.07, 71.14, 53.65, 29.26, 0.0, 0.0, 0.0, 29.18, 30.81, 0.0, 30.32, 31.89, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 49.06], ["buzz", 24.06], ["cacophony", 6.51]], null, null, null, [["speech", 33.27], ["music", 21.47], ["explosion", 10.38]], [["cattle, bovinae", 19.01], ["explosion", 9.91], ["speech", 8.48]], null, [["music", 38.18], ["musical instrument", 3.74], ["explosion", 3.51]], [["music", 30.99], ["hum", 8.82], ["cacophony", 7.78]], null, null, null, null, null], "duration": [2.01, 0.47, 1.51, 0.75, 0.28, 2.18, 2.92, 4.03, 20.89, 0.77, 0.81, 0.51, 6.57, 20.77, 1.13, 21.29, 5.45, 0.55, 0.6, 1.23, 0.13, 1.12]} \ No newline at end of file diff --git a/annotations_1/dcCsAQTY9lQ_filtered.json b/annotations_1/dcCsAQTY9lQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de89f9faf7c3c6f07bf661705a2b9dc75c084d3d --- /dev/null +++ b/annotations_1/dcCsAQTY9lQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.26], [10.0, 10.79], [22.0, 21.83], [26.0, 27.82], [29.0, 29.29], [31.0, 38.26], [43.0, 43.21], [59.0, 67.91], [71.0, 71.2], [75.0, 78.73], [81.0, 83.17], [91.0, 95.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.78, 0.0, 29.22, 0.0, 29.06, 28.86, 29.04], "audiomae_on_audioset": [null, null, null, null, null, [["music", 45.69], ["crowd", 22.23], ["electronic music", 6.24]], null, [["music", 68.48], ["speech", 14.74], ["boing", 6.09]], null, [["music", 76.94], ["electronic music", 2.3], ["reggae", 1.37]], [["music", 85.04], ["speech", 1.93], ["boing", 0.95]], [["music", 82.81], ["middle eastern music", 1.79], ["singing", 1.7]]], "duration": [0.26, 0.79, -0.17, 1.82, 0.29, 7.26, 0.21, 8.91, 0.2, 3.73, 2.17, 4.05]} \ No newline at end of file diff --git a/annotations_1/dcSalZZ5YjM_filtered.json b/annotations_1/dcSalZZ5YjM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7cd220b99904ba195027a9f3c0f7ff6b438d2478 --- /dev/null +++ b/annotations_1/dcSalZZ5YjM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.11], [4.0, 12.29], [25.0, 28.22], [36.0, 46.92], [47.0, 54.7], [70.0, 71.86], [76.0, 76.65], [80.0, 81.4], [82.0, 82.68], [87.0, 87.49], [95.0, 95.22], [97.0, 97.87], [99.0, 101.66], [104.0, 108.36], [112.0, 113.8], [117.0, 118.29], [122.0, 136.93], [142.0, 145.05], [145.0, 148.8], [150.0, 150.5], [151.0, 151.6], [152.0, 153.66], [154.0, 162.06]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 32.61, 35.01, 37.41, 40.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.52, 34.57, 0.0, 0.0, 34.46, 32.2, 31.3, 0.0, 0.0, 0.0, 30.34], "audiomae_on_audioset": [null, [["music", 33.69], ["hum", 28.99], ["throbbing", 18.63]], [["music", 23.46], ["throbbing", 15.88], ["speech", 13.92]], [["music", 46.15], ["throbbing", 17.38], ["hum", 12.87]], [["music", 55.87], ["throbbing", 13.85], ["hum", 12.7]], null, null, null, null, null, null, null, [["music", 34.16], ["hum", 14.53], ["throbbing", 13.18]], [["music", 23.45], ["insect", 16.98], ["fly, housefly", 14.46]], null, null, [["hum", 46.38], ["mains hum", 17.48], ["throbbing", 12.32]], [["hum", 47.19], ["mains hum", 26.15], ["throbbing", 15.57]], [["music", 30.12], ["hum", 18.01], ["throbbing", 15.21]], null, null, null, [["throbbing", 30.15], ["music", 29.46], ["hum", 28.38]]], "duration": [0.11, 8.29, 3.22, 10.92, 7.7, 1.86, 0.65, 1.4, 0.68, 0.49, 0.22, 0.87, 2.66, 4.36, 1.8, 1.29, 14.93, 3.05, 3.8, 0.5, 0.6, 1.66, 8.06]} \ No newline at end of file diff --git a/annotations_1/ddQe0gG79zk_filtered.json b/annotations_1/ddQe0gG79zk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..977830a516156378e8b2db85dabea6b20b63b85b --- /dev/null +++ b/annotations_1/ddQe0gG79zk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[97.0, 100.97], [101.0, 102.22], [104.0, 132.07], [133.0, 138.94], [140.0, 150.25], [151.0, 158.97], [160.0, 170.43], [171.0, 171.75], [173.0, 174.88], [175.0, 176.35]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [99.87, 0.0, 99.98, 70.44, 96.54, 96.89, 29.96, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["tuning fork", 46.88], ["sine wave", 6.68], ["music", 4.89]], null, null, null], "duration": [3.97, 1.22, 28.07, 5.94, 10.25, 7.97, 10.43, 0.75, 1.88, 1.35]} \ No newline at end of file diff --git a/annotations_1/de1vEYiEMro_filtered.json b/annotations_1/de1vEYiEMro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d82beb217167a1ff9cf9835fcd4fef837a90d9a --- /dev/null +++ b/annotations_1/de1vEYiEMro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.88], [30.0, 37.79], [40.0, 76.77], [78.0, 111.47], [113.0, 151.43]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 41.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 28.84], ["didgeridoo", 25.1], ["music", 13.18]], null, null, null], "duration": [0.88, 7.79, 36.77, 33.47, 38.43]} \ No newline at end of file diff --git a/annotations_1/deUgUoJ4z5I_filtered.json b/annotations_1/deUgUoJ4z5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e5612526f2d37aaec1351948b0da9c5f32d50ab --- /dev/null +++ b/annotations_1/deUgUoJ4z5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 5.98], [8.0, 9.22], [13.0, 13.93], [14.0, 14.91], [17.0, 18.13], [21.0, 24.14], [25.0, 27.18], [35.0, 36.63], [38.0, 41.1], [44.0, 44.85], [49.0, 50.62], [52.0, 52.96], [56.0, 58.24], [70.0, 73.89], [76.0, 77.53], [85.0, 86.95], [88.0, 89.41], [91.0, 91.1], [91.0, 91.56], [98.0, 100.45], [102.0, 104.35], [105.0, 106.37], [110.0, 111.43], [112.0, 113.31], [116.0, 118.32], [155.0, 163.48], [164.0, 170.31], [171.0, 177.89], [179.0, 182.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.59, 0.0, 0.0, 0.0, 0.0, 59.42, 54.23, 0.0, 87.74, 0.0, 0.0, 0.0, 63.85, 95.51, 0.0, 0.0, 0.0, 0.0, 0.0, 64.07, 94.07, 0.0, 0.0, 0.0, 45.62, 30.73, 77.87, 89.72, 95.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 57.58], ["musical instrument", 7.73], ["brass instrument", 5.57]], [["music", 62.05], ["theremin", 22.21], ["synthesizer", 2.39]], null, null, null], "duration": [5.98, 1.22, 0.93, 0.91, 1.13, 3.14, 2.18, 1.63, 3.1, 0.85, 1.62, 0.96, 2.24, 3.89, 1.53, 1.95, 1.41, 0.1, 0.56, 2.45, 2.35, 1.37, 1.43, 1.31, 2.32, 8.48, 6.31, 6.89, 3.02]} \ No newline at end of file diff --git a/annotations_1/deUroRuOCwM_filtered.json b/annotations_1/deUroRuOCwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42a8d484c2eb77545f5b43fad39f5b55e07a0093 --- /dev/null +++ b/annotations_1/deUroRuOCwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.22], [22.0, 22.32], [24.0, 25.27], [27.0, 27.97], [29.0, 30.38], [33.0, 33.93], [35.0, 35.16], [35.0, 37.25], [38.0, 38.85], [40.0, 41.39], [42.0, 43.63], [45.0, 47.34], [48.0, 49.08], [53.0, 54.18], [61.0, 63.07], [64.0, 64.96], [67.0, 70.11], [71.0, 72.84], [74.0, 79.84], [81.0, 85.62], [87.0, 86.98], [95.0, 96.23], [114.0, 114.37], [115.0, 115.37], [123.0, 129.66], [134.0, 134.99], [135.0, 135.18], [136.0, 135.73], [136.0, 136.58], [142.0, 151.73], [152.0, 153.99], [155.0, 155.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.06, 0.0, 0.0, 0.0, 49.4, 0.0, 0.0, 99.99, 0.0, 100.0, 0.0, 67.13, 100.0, 0.0, 0.0, 0.0, 0.0, 30.2, 0.0, 0.0, 0.0, 0.0, 38.54, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 91.72], ["speech", 4.41], ["dial tone", 0.92]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.99], ["explosion", 6.49], ["screaming", 5.61]], null, null, null, null, [["fly, housefly", 23.38], ["mosquito", 11.07], ["insect", 9.56]], null, null], "duration": [0.22, 0.32, 1.27, 0.97, 1.38, 0.93, 0.16, 2.25, 0.85, 1.39, 1.63, 2.34, 1.08, 1.18, 2.07, 0.96, 3.11, 1.84, 5.84, 4.62, -0.02, 1.23, 0.37, 0.37, 6.66, 0.99, 0.18, -0.27, 0.58, 9.73, 1.99, 0.66]} \ No newline at end of file diff --git a/annotations_1/de_Dik7HT6E_filtered.json b/annotations_1/de_Dik7HT6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..590544eb1139b70e6a56916534fd8f0b8f1ce76b --- /dev/null +++ b/annotations_1/de_Dik7HT6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 17.27], [18.0, 21.37], [22.0, 32.05], [32.0, 33.1], [38.0, 39.99], [46.0, 47.93], [55.0, 55.46], [56.0, 56.74], [70.0, 69.96], [72.0, 72.17], [81.0, 81.55], [85.0, 85.56], [89.0, 89.5], [99.0, 99.69], [105.0, 108.72], [112.0, 116.6], [119.0, 124.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [87.74, 89.36, 41.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.77, 83.88, 45.33], "audiomae_on_audioset": [null, null, [["speech", 37.86], ["hum", 21.47], ["music", 11.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 28.02], ["mains hum", 26.63], ["hum", 7.19]]], "duration": [14.27, 3.37, 10.05, 1.1, 1.99, 1.93, 0.46, 0.74, -0.04, 0.17, 0.55, 0.56, 0.5, 0.69, 3.72, 4.6, 5.14]} \ No newline at end of file diff --git a/annotations_1/df2QdWqKC6Q_filtered.json b/annotations_1/df2QdWqKC6Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..accda8097195bc4378a268a526b6eb2c0bbf8827 --- /dev/null +++ b/annotations_1/df2QdWqKC6Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [27.0, 28.09], [32.0, 32.19], [36.0, 56.46], [58.0, 58.51], [61.0, 62.56], [63.0, 64.42], [68.0, 68.45], [91.0, 91.42], [132.0, 132.92], [134.0, 133.84], [147.0, 148.61], [150.0, 151.39], [168.0, 168.62], [170.0, 171.49], [172.0, 172.64], [173.0, 175.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.09, 0.19, 20.46, 0.51, 1.56, 1.42, 0.45, 0.42, 0.92, -0.16, 1.61, 1.39, 0.62, 1.49, 0.64, 2.2]} \ No newline at end of file diff --git a/annotations_1/dfLN2aPZ5sM_filtered.json b/annotations_1/dfLN2aPZ5sM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..389bb16fd52c4b9027a3667fd8ff9a2cea04957c --- /dev/null +++ b/annotations_1/dfLN2aPZ5sM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 34.08], [35.0, 96.25], [97.0, 97.12], [102.0, 104.09], [106.0, 107.67], [108.0, 111.96], [112.0, 117.58], [121.0, 121.42], [125.0, 130.47], [131.0, 131.53], [135.0, 135.55]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 41.03, 0.0, 65.55, 38.43, 0.0, 52.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 52.13], ["pulse", 17.9], ["synthesizer", 7.1]], null, null, [["music", 30.84], ["speech", 28.8], ["siren", 5.05]], null, null, null, null], "duration": [31.08, 61.25, 0.12, 2.09, 1.67, 3.96, 5.58, 0.42, 5.47, 0.53, 0.55]} \ No newline at end of file diff --git a/annotations_1/dfWdmxCHwfc_filtered.json b/annotations_1/dfWdmxCHwfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ab265c9fce1bcb93130bd316308066c6f34e2d0 --- /dev/null +++ b/annotations_1/dfWdmxCHwfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 28.58], [30.0, 31.63], [33.0, 35.14], [38.0, 38.42], [42.0, 56.24], [67.0, 69.92], [78.0, 89.87], [90.0, 89.9], [91.0, 91.64], [94.0, 98.32], [99.0, 106.35], [108.0, 109.49], [112.0, 114.37], [116.0, 117.64], [119.0, 121.78], [123.0, 128.09], [129.0, 130.08], [132.0, 132.33], [134.0, 133.84], [136.0, 136.66], [144.0, 145.05], [149.0, 166.46]], "keep_status": [false, false, true, false, true, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [29.78, 0.0, 39.8, 0.0, 35.61, 37.17, 29.93, 0.0, 0.0, 34.8, 41.42, 0.0, 49.22, 0.0, 46.83, 34.89, 0.0, 0.0, 0.0, 0.0, 0.0, 29.79], "audiomae_on_audioset": [[["speech", 41.2], ["music", 33.71], ["trombone", 4.23]], null, [["fly, housefly", 15.15], ["music", 14.32], ["bee, wasp, etc.", 7.4]], null, [["fly, housefly", 28.35], ["insect", 15.4], ["bee, wasp, etc.", 13.08]], [["music", 19.53], ["speech", 17.57], ["foghorn", 4.96]], [["moo", 41.15], ["cattle, bovinae", 35.48], ["livestock, farm animals, working animals", 14.11]], null, null, [["hum", 41.07], ["music", 19.97], ["mains hum", 19.94]], [["insect", 18.3], ["fly, housefly", 17.01], ["hum", 11.89]], null, [["music", 26.62], ["hum", 13.26], ["mains hum", 9.08]], null, [["mains hum", 54.5], ["hum", 36.08], ["livestock, farm animals, working animals", 2.23]], [["mains hum", 43.67], ["hum", 34.32], ["noise", 3.92]], null, null, null, null, null, [["speech", 34.75], ["music", 15.88], ["livestock, farm animals, working animals", 9.18]]], "duration": [24.58, 1.63, 2.14, 0.42, 14.24, 2.92, 11.87, -0.1, 0.64, 4.32, 7.35, 1.49, 2.37, 1.64, 2.78, 5.09, 1.08, 0.33, -0.16, 0.66, 1.05, 17.46]} \ No newline at end of file diff --git a/annotations_1/dfofju459FA_filtered.json b/annotations_1/dfofju459FA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36eb8f7a79cf8f41888591423dd3b259e55c5ad7 --- /dev/null +++ b/annotations_1/dfofju459FA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.2], [40.0, 40.86], [61.0, 69.94], [70.0, 70.12], [76.0, 76.59], [80.0, 80.54], [82.0, 85.94], [89.0, 89.94], [98.0, 99.22], [101.0, 101.53], [104.0, 105.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.61, 0.0, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.2, 0.86, 8.94, 0.12, 0.59, 0.54, 3.94, 0.94, 1.22, 0.53, 1.44]} \ No newline at end of file diff --git a/annotations_1/dfrJhivMJJY_filtered.json b/annotations_1/dfrJhivMJJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb0bbb3e76c2a4bbfbde6cf46980ebca0b162937 --- /dev/null +++ b/annotations_1/dfrJhivMJJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.89], [7.0, 7.7], [13.0, 14.07], [16.0, 17.73], [21.0, 22.79], [24.0, 24.7], [27.0, 27.33], [33.0, 33.29], [35.0, 34.96], [35.0, 37.56], [39.0, 38.75], [39.0, 40.81], [44.0, 45.32], [47.0, 48.0], [51.0, 52.83], [59.0, 59.73], [62.0, 62.99], [68.0, 71.39], [74.0, 75.29], [80.0, 83.44], [84.0, 88.64]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0, 63.64, 71.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 29.54], ["music", 7.82], ["throbbing", 4.52]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 0.7, 1.07, 1.73, 1.79, 0.7, 0.33, 0.29, -0.04, 2.56, -0.25, 1.81, 1.32, 1.0, 1.83, 0.73, 0.99, 3.39, 1.29, 3.44, 4.64]} \ No newline at end of file diff --git a/annotations_1/dg6PaO0e6wA_filtered.json b/annotations_1/dg6PaO0e6wA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c64c59805437a4be6d8cf27396499beed359a49 --- /dev/null +++ b/annotations_1/dg6PaO0e6wA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 24.21], [24.0, 29.73], [31.0, 49.81], [52.0, 55.49], [58.0, 62.48], [63.0, 73.09], [75.0, 87.29], [92.0, 94.24], [96.0, 101.43], [103.0, 110.81], [112.0, 114.93], [116.0, 121.12], [122.0, 126.55], [127.0, 168.29], [169.0, 177.8], [179.0, 196.6]], "keep_status": [true, false, false, true, false, false, true, true, false, false, true, true, true, false, true, true], "silence_prob": [35.8, 35.83, 33.73, 33.41, 35.43, 36.52, 29.14, 29.81, 29.51, 29.95, 29.57, 29.61, 29.23, 0.0, 34.36, 36.79], "audiomae_on_audioset": [[["music", 45.07], ["synthesizer", 11.58], ["keyboard (musical)", 7.75]], [["music", 65.63], ["musical instrument", 13.56], ["keyboard (musical)", 3.79]], [["music", 51.9], ["keyboard (musical)", 9.82], ["electric piano", 9.05]], [["music", 50.86], ["synthesizer", 12.09], ["mains hum", 4.65]], [["music", 65.17], ["guitar", 6.61], ["musical instrument", 6.45]], [["music", 64.38], ["ambient music", 5.9], ["synthesizer", 4.18]], [["music", 59.93], ["breaking", 3.3], ["didgeridoo", 3.22]], [["music", 46.85], ["theremin", 9.09], ["electronic music", 4.03]], [["music", 57.21], ["throbbing", 8.54], ["mechanisms", 4.54]], [["music", 89.8], ["synthesizer", 1.39], ["electronic music", 1.17]], [["cattle, bovinae", 24.91], ["livestock, farm animals, working animals", 18.31], ["moo", 16.17]], [["music", 38.51], ["foghorn", 21.12], ["theremin", 4.37]], [["hum", 24.31], ["music", 23.36], ["mains hum", 21.8]], null, [["music", 47.32], ["speech", 16.49], ["singing bowl", 4.96]], [["music", 58.87], ["musical instrument", 5.57], ["synthesizer", 4.56]]], "duration": [18.21, 5.73, 18.81, 3.49, 4.48, 10.09, 12.29, 2.24, 5.43, 7.81, 2.93, 5.12, 4.55, 41.29, 8.8, 17.6]} \ No newline at end of file diff --git a/annotations_1/dgM9V3lEZvE_filtered.json b/annotations_1/dgM9V3lEZvE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ced4b2eb9efc2018ad1ca2ff6822c557a75b900 --- /dev/null +++ b/annotations_1/dgM9V3lEZvE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.93], [11.0, 20.01], [22.0, 22.82], [24.0, 25.07], [26.0, 26.2], [28.0, 28.43], [32.0, 31.77], [32.0, 32.71], [33.0, 33.78], [36.0, 37.3], [41.0, 45.1], [48.0, 48.15], [50.0, 52.05], [53.0, 53.64], [59.0, 59.22], [60.0, 64.35], [66.0, 65.8], [67.0, 67.56], [69.0, 68.66], [70.0, 75.24], [77.0, 77.67], [79.0, 82.24], [85.0, 87.84], [89.0, 90.63], [91.0, 92.16], [107.0, 106.98], [112.0, 112.19], [114.0, 115.16], [117.0, 122.08], [122.0, 122.3], [122.0, 122.77], [134.0, 135.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [76.53, 44.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 84.43, 0.0, 0.0, 67.76, 0.0, 0.0, 0.0, 72.46, 0.0, 52.27, 34.04, 0.0, 0.0, 0.0, 0.0, 0.0, 47.43, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 34.53], ["speech", 23.89], ["hum", 13.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.12], ["hum", 6.26], ["throbbing", 5.36]], null, null, null, null, null, [["speech", 49.91], ["busy signal", 4.75], ["radio", 4.69]], null, null, null], "duration": [2.93, 9.01, 0.82, 1.07, 0.2, 0.43, -0.23, 0.71, 0.78, 1.3, 4.1, 0.15, 2.05, 0.64, 0.22, 4.35, -0.2, 0.56, -0.34, 5.24, 0.67, 3.24, 2.84, 1.63, 1.16, -0.02, 0.19, 1.16, 5.08, 0.3, 0.77, 1.57]} \ No newline at end of file diff --git a/annotations_1/dgdEr-mXQT4_filtered.json b/annotations_1/dgdEr-mXQT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..084a2039bc9911eb0653d02b21b0cd023001eeef --- /dev/null +++ b/annotations_1/dgdEr-mXQT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.72], [14.0, 14.4], [19.0, 19.68], [21.0, 20.98], [26.0, 26.45], [27.0, 27.7], [29.0, 28.88], [35.0, 35.5], [36.0, 36.86], [37.0, 37.93], [47.0, 47.07], [70.0, 71.42], [86.0, 86.86], [91.0, 91.37], [94.0, 94.54], [97.0, 97.5], [98.0, 98.58], [107.0, 107.28], [108.0, 108.57], [111.0, 111.37], [118.0, 117.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 0.4, 0.68, -0.02, 0.45, 0.7, -0.12, 0.5, 0.86, 0.93, 0.07, 1.42, 0.86, 0.37, 0.54, 0.5, 0.58, 0.28, 0.57, 0.37, -0.14]} \ No newline at end of file diff --git a/annotations_1/dhJPm7NolLc_filtered.json b/annotations_1/dhJPm7NolLc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3957b9541de7188e88a0d1ae220bd47937f3a515 --- /dev/null +++ b/annotations_1/dhJPm7NolLc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.11], [7.0, 10.72], [12.0, 12.7], [19.0, 19.16], [27.0, 33.22], [38.0, 37.99], [42.0, 43.01], [57.0, 56.96], [58.0, 59.02], [60.0, 60.52], [69.0, 71.59], [79.0, 80.54], [90.0, 90.46], [91.0, 93.31], [94.0, 103.25], [105.0, 104.95], [107.0, 107.33], [110.0, 113.02], [115.0, 116.8], [118.0, 118.57], [128.0, 128.48], [132.0, 132.48], [135.0, 138.82], [139.0, 146.79], [148.0, 147.92]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.1, 36.24, 0.0, 0.0, 48.95, 0.0, 0.0, 0.0, 0.0, 0.0, 79.76, 0.0, 0.0, 48.95, 39.11, 0.0, 0.0, 46.33, 0.0, 0.0, 0.0, 0.0, 44.55, 32.27, 0.0], "audiomae_on_audioset": [[["music", 24.02], ["hum", 6.76], ["throbbing", 6.45]], [["animal", 39.94], ["dog", 27.21], ["domestic animals, pets", 16.25]], null, null, [["sine wave", 67.1], ["chirp tone", 17.53], ["crying, sobbing", 1.65]], null, null, null, null, null, null, null, null, [["music", 40.45], ["speech", 39.0], ["didgeridoo", 2.25]], [["music", 74.84], ["speech", 13.65], ["didgeridoo", 1.71]], null, null, [["music", 58.62], ["speech", 21.49], ["sidetone", 3.82]], null, null, null, null, [["music", 78.19], ["didgeridoo", 4.62], ["musical instrument", 2.57]], [["music", 74.28], ["speech", 18.47], ["smash, crash", 0.73]], null], "duration": [2.11, 3.72, 0.7, 0.16, 6.22, -0.01, 1.01, -0.04, 1.02, 0.52, 2.59, 1.54, 0.46, 2.31, 9.25, -0.05, 0.33, 3.02, 1.8, 0.57, 0.48, 0.48, 3.82, 7.79, -0.08]} \ No newline at end of file diff --git a/annotations_1/di3Xh95aXp8_filtered.json b/annotations_1/di3Xh95aXp8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aab3900408105fd9f65648d7b9b066c036e15274 --- /dev/null +++ b/annotations_1/di3Xh95aXp8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.17], [9.0, 9.96], [12.0, 12.92], [15.0, 16.65], [18.0, 19.21], [24.0, 25.25], [27.0, 29.12], [30.0, 33.47], [36.0, 37.47], [45.0, 45.76], [47.0, 47.73], [50.0, 51.31], [53.0, 52.96], [54.0, 54.62], [58.0, 59.93], [63.0, 63.34], [72.0, 72.77], [75.0, 76.47], [77.0, 78.75], [80.0, 81.55], [82.0, 83.88], [85.0, 86.21], [89.0, 90.05], [97.0, 98.42], [101.0, 101.46], [106.0, 106.71], [111.0, 111.52], [117.0, 117.17], [119.0, 120.11], [122.0, 127.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13, 89.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.17, 0.96, 0.92, 1.65, 1.21, 1.25, 2.12, 3.47, 1.47, 0.76, 0.73, 1.31, -0.04, 0.62, 1.93, 0.34, 0.77, 1.47, 1.75, 1.55, 1.88, 1.21, 1.05, 1.42, 0.46, 0.71, 0.52, 0.17, 1.11, 5.97]} \ No newline at end of file diff --git a/annotations_1/diNo0cO2Je0_filtered.json b/annotations_1/diNo0cO2Je0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebd3d2946e9c90004ff014714247a31b15e6206f --- /dev/null +++ b/annotations_1/diNo0cO2Je0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 41.82], [45.0, 101.22], [103.0, 127.47], [128.0, 128.53], [129.0, 129.51], [134.0, 142.89], [145.0, 166.92], [169.0, 185.25], [188.0, 204.9], [206.0, 213.6]], "keep_status": [false, false, true, false, false, true, false, false, true, false], "silence_prob": [28.6, 0.0, 30.64, 0.0, 0.0, 29.77, 29.47, 28.75, 28.61, 28.18], "audiomae_on_audioset": [[["hum", 42.75], ["mains hum", 30.81], ["throbbing", 13.35]], null, [["music", 40.6], ["whack, thwack", 11.82], ["whip", 8.05]], null, null, [["music", 55.0], ["throbbing", 7.96], ["didgeridoo", 6.29]], [["music", 66.85], ["hum", 7.85], ["throbbing", 7.25]], [["music", 45.81], ["speech", 33.43], ["machine gun", 2.93]], [["cacophony", 26.45], ["mains hum", 21.55], ["hum", 20.61]], [["music", 66.75], ["buzz", 3.77], ["throbbing", 3.71]]], "duration": [21.82, 56.22, 24.47, 0.53, 0.51, 8.89, 21.92, 16.25, 16.9, 7.6]} \ No newline at end of file diff --git a/annotations_1/dj0MEV7d1NE_filtered.json b/annotations_1/dj0MEV7d1NE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3ff48419577ada6ba4e15f55e4de0f2cfb6490c --- /dev/null +++ b/annotations_1/dj0MEV7d1NE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 23.79], [25.0, 27.26], [29.0, 43.68], [49.0, 49.13], [53.0, 53.11], [60.0, 62.31], [68.0, 87.67], [94.0, 97.43]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [91.13, 77.36, 36.19, 0.0, 0.0, 42.35, 30.33, 50.97], "audiomae_on_audioset": [null, null, [["music", 71.72], ["hum", 5.12], ["mains hum", 2.77]], null, null, [["speech", 22.89], ["mains hum", 22.06], ["hum", 21.41]], [["hum", 43.02], ["music", 21.06], ["mains hum", 19.59]], null], "duration": [20.79, 2.26, 14.68, 0.13, 0.11, 2.31, 19.67, 3.43]} \ No newline at end of file diff --git a/annotations_1/djPS3AC9DKk_filtered.json b/annotations_1/djPS3AC9DKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d10d60d8d58227b3cee3998cc2c3268ccd634e47 --- /dev/null +++ b/annotations_1/djPS3AC9DKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.29], [7.0, 7.57], [9.0, 9.96], [43.0, 44.02], [72.0, 75.22], [78.0, 84.27], [88.0, 88.42], [90.0, 90.69], [93.0, 92.72]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.67, 35.08, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["applause", 19.54], ["clapping", 17.0], ["fart", 14.54]], [["moo", 30.56], ["cattle, bovinae", 29.93], ["livestock, farm animals, working animals", 13.62]], null, null, null], "duration": [1.29, 0.57, 0.96, 1.02, 3.22, 6.27, 0.42, 0.69, -0.28]} \ No newline at end of file diff --git a/annotations_1/djTx7slpfHI_filtered.json b/annotations_1/djTx7slpfHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..390211033a78318cc055d46b2175cc039f4dd0db --- /dev/null +++ b/annotations_1/djTx7slpfHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 43.04], [44.0, 90.36], [92.0, 102.59], [103.0, 103.28]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 32.31, 0.0], "audiomae_on_audioset": [null, null, [["whack, thwack", 34.53], ["music", 12.27], ["mechanisms", 7.07]], null], "duration": [42.04, 46.36, 10.59, 0.28]} \ No newline at end of file diff --git a/annotations_1/djh21tkgGJ4_filtered.json b/annotations_1/djh21tkgGJ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76d604763bb6d8f1b2e174d12bce0cab7bdab283 --- /dev/null +++ b/annotations_1/djh21tkgGJ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.43], [14.0, 15.08], [22.0, 22.65], [26.0, 27.16], [28.0, 35.55], [38.0, 37.76], [38.0, 39.55], [41.0, 40.91], [48.0, 52.59], [54.0, 54.46], [56.0, 57.01], [58.0, 58.02], [58.0, 59.66], [61.0, 61.28], [74.0, 81.57], [83.0, 83.88], [86.0, 89.45], [90.0, 90.32], [93.0, 96.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.64, 0.0, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 85.35, 0.0, 91.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.43, 1.08, 0.65, 1.16, 7.55, -0.24, 1.55, -0.09, 4.59, 0.46, 1.01, 0.02, 1.66, 0.28, 7.57, 0.88, 3.45, 0.32, 3.18]} \ No newline at end of file diff --git a/annotations_1/djr5QNJG73k_filtered.json b/annotations_1/djr5QNJG73k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb139d2b1d1190ffbee730b10ca34e0370e81834 --- /dev/null +++ b/annotations_1/djr5QNJG73k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.81], [35.0, 35.6], [39.0, 39.19], [40.0, 40.37], [41.0, 41.15], [42.0, 42.45], [48.0, 48.15], [59.0, 60.56], [70.0, 70.01]], "keep_status": [true, false, false, false, false, false, false, false, false], "silence_prob": [32.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 15.39], ["music", 8.6], ["explosion", 1.97]], null, null, null, null, null, null, null, null], "duration": [2.81, 0.6, 0.19, 0.37, 0.15, 0.45, 0.15, 1.56, 0.01]} \ No newline at end of file diff --git a/annotations_1/dkAv65bo8a8_filtered.json b/annotations_1/dkAv65bo8a8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e58b75c16c39f7656119fba999026c350e5e7ecb --- /dev/null +++ b/annotations_1/dkAv65bo8a8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 18.25], [19.0, 21.49], [24.0, 24.88], [28.0, 28.75], [29.0, 30.84], [32.0, 33.25], [36.0, 37.71], [41.0, 41.49], [46.0, 46.06], [49.0, 50.06], [51.0, 52.41], [53.0, 53.97], [55.0, 55.85], [58.0, 59.97], [61.0, 61.16], [62.0, 64.47], [67.0, 68.42], [69.0, 70.29], [71.0, 71.39], [75.0, 75.44], [77.0, 77.9], [80.0, 80.76], [84.0, 88.05], [88.0, 91.52], [93.0, 96.03], [98.0, 100.18], [101.0, 103.0], [105.0, 107.5], [108.0, 112.67], [114.0, 115.79], [117.0, 118.96], [120.0, 123.58], [127.0, 127.67], [130.0, 132.14], [134.0, 136.09], [137.0, 137.27], [138.0, 139.99], [143.0, 144.36], [146.0, 149.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [51.44, 57.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.51, 77.03, 73.06, 91.3, 67.89, 56.48, 65.55, 0.0, 0.0, 49.68, 0.0, 57.48, 55.25, 0.0, 0.0, 0.0, 84.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.42], ["didgeridoo", 22.54], ["musical instrument", 2.65]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.86], ["musical instrument", 6.07], ["hum", 6.03]], null, null, null, null, null, null, null], "duration": [2.25, 2.49, 0.88, 0.75, 1.84, 1.25, 1.71, 0.49, 0.06, 1.06, 1.41, 0.97, 0.85, 1.97, 0.16, 2.47, 1.42, 1.29, 0.39, 0.44, 0.9, 0.76, 4.05, 3.52, 3.03, 2.18, 2.0, 2.5, 4.67, 1.79, 1.96, 3.58, 0.67, 2.14, 2.09, 0.27, 1.99, 1.36, 3.69]} \ No newline at end of file diff --git a/annotations_1/dkjBBdHZNUs_filtered.json b/annotations_1/dkjBBdHZNUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2470e5b53de23f2591fa6faaa7012578bd02760d --- /dev/null +++ b/annotations_1/dkjBBdHZNUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 33.24], [34.0, 35.46], [40.0, 40.74], [44.0, 46.21], [69.0, 69.23], [70.0, 70.01], [70.0, 73.11], [81.0, 83.88]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 56.78, 0.0, 0.0, 46.72, 68.54], "audiomae_on_audioset": [null, null, null, null, null, null, [["theremin", 38.32], ["wind instrument, woodwind instrument", 29.04], ["music", 9.26]], null], "duration": [1.24, 1.46, 0.74, 2.21, 0.23, 0.01, 3.11, 2.88]} \ No newline at end of file diff --git a/annotations_1/dmASD5tRwV4_filtered.json b/annotations_1/dmASD5tRwV4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f584b9f4ca3f00d21cae564340aa049cb625cc7 --- /dev/null +++ b/annotations_1/dmASD5tRwV4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 10.35], [11.0, 21.44], [23.0, 23.6], [24.0, 27.04], [28.0, 29.13], [30.0, 30.77], [33.0, 49.2], [51.0, 57.99], [59.0, 61.15], [66.0, 66.63], [68.0, 69.62], [71.0, 75.54], [77.0, 77.35], [79.0, 118.25], [118.0, 118.3], [118.0, 118.44], [118.0, 164.94]], "keep_status": [false, true, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [29.48, 30.14, 0.0, 39.17, 0.0, 0.0, 33.64, 33.48, 32.91, 0.0, 0.0, 31.8, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 47.23], ["music", 22.59], ["rumble", 6.55]], [["speech", 51.45], ["rumble", 12.66], ["hum", 5.12]], null, [["speech", 61.85], ["whale vocalization", 11.68], ["sidetone", 7.99]], null, null, [["whale vocalization", 30.65], ["insect", 13.97], ["fly, housefly", 13.29]], [["whale vocalization", 23.54], ["rumble", 21.51], ["hum", 14.53]], [["music", 63.03], ["hum", 6.07], ["electronic music", 1.93]], null, null, [["rumble", 19.71], ["hum", 19.53], ["music", 9.79]], null, null, null, null, null], "duration": [9.35, 10.44, 0.6, 3.04, 1.13, 0.77, 16.2, 6.99, 2.15, 0.63, 1.62, 4.54, 0.35, 39.25, 0.3, 0.44, 46.94]} \ No newline at end of file diff --git a/annotations_1/dmqo-EuR8Cw_filtered.json b/annotations_1/dmqo-EuR8Cw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c03b5ac9856b9238a948c7580869273018b36e33 --- /dev/null +++ b/annotations_1/dmqo-EuR8Cw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.1], [9.0, 12.65], [13.0, 15.35], [17.0, 19.35], [27.0, 35.5], [36.0, 38.15], [39.0, 40.96], [42.0, 42.31], [42.0, 42.5], [44.0, 44.12], [45.0, 48.42], [49.0, 51.41], [59.0, 59.09], [61.0, 62.5], [69.0, 73.08], [75.0, 82.49], [85.0, 86.8], [89.0, 104.72], [109.0, 109.12]], "keep_status": [false, true, false, true, true, true, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 29.74, 33.24, 32.55, 29.72, 29.59, 0.0, 0.0, 0.0, 0.0, 30.78, 31.56, 0.0, 0.0, 33.4, 30.45, 0.0, 29.9, 0.0], "audiomae_on_audioset": [null, [["music", 46.04], ["hum", 6.83], ["noise", 6.36]], [["music", 31.21], ["throbbing", 22.13], ["hum", 22.01]], [["speech", 32.95], ["music", 18.82], ["croak", 8.14]], [["music", 48.18], ["groan", 7.77], ["throbbing", 5.66]], [["music", 47.24], ["tabla", 9.1], ["musical instrument", 6.21]], null, null, null, null, [["boing", 55.34], ["music", 14.54], ["speech", 5.48]], [["music", 28.93], ["crowd", 7.46], ["speech", 6.94]], null, null, [["music", 42.26], ["livestock, farm animals, working animals", 15.52], ["cattle, bovinae", 5.23]], [["music", 49.94], ["throbbing", 17.3], ["cacophony", 6.07]], null, [["music", 52.71], ["whack, thwack", 18.09], ["smash, crash", 6.57]], null], "duration": [0.1, 3.65, 2.35, 2.35, 8.5, 2.15, 1.96, 0.31, 0.5, 0.12, 3.42, 2.41, 0.09, 1.5, 4.08, 7.49, 1.8, 15.72, 0.12]} \ No newline at end of file diff --git a/annotations_1/dmy8Lcf_TiE_filtered.json b/annotations_1/dmy8Lcf_TiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94fc5fb8186489c5048c3881b2ed28207698fa19 --- /dev/null +++ b/annotations_1/dmy8Lcf_TiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.94], [10.0, 10.0], [11.0, 11.69], [14.0, 15.11], [15.0, 15.3], [15.0, 15.33], [16.0, 16.5], [17.0, 16.68], [17.0, 17.91], [19.0, 19.79], [23.0, 23.26], [25.0, 25.3], [30.0, 30.91], [32.0, 36.41], [37.0, 38.55], [40.0, 41.23], [42.0, 42.82], [45.0, 45.01], [46.0, 48.96], [58.0, 59.09], [60.0, 61.18], [64.0, 64.81], [70.0, 71.85], [75.0, 75.98], [81.0, 81.18], [83.0, 82.88], [88.0, 88.11], [96.0, 96.79], [101.0, 101.28], [102.0, 104.73], [105.0, 104.77], [109.0, 109.95], [113.0, 112.89], [116.0, 116.23], [118.0, 118.62], [120.0, 126.18], [129.0, 129.81], [131.0, 140.9], [147.0, 149.01], [152.0, 161.25], [164.0, 166.04], [168.0, 168.24], [173.0, 173.06], [174.0, 174.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.13, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 0.0, 30.72, 38.47, 29.12, 41.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.07], ["fart", 5.51], ["crackle", 4.88]], null, null, null, null, null, null, null, [["speech", 64.14], ["whack, thwack", 9.88], ["smash, crash", 8.54]], [["music", 14.34], ["beatboxing", 13.12], ["boing", 9.45]], [["speech", 38.29], ["vehicle", 14.14], ["car", 8.72]], [["speech", 42.74], ["music", 21.33], ["boing", 14.98]], null, null, null], "duration": [1.94, 0.0, 0.69, 1.11, 0.3, 0.33, 0.5, -0.32, 0.91, 0.79, 0.26, 0.3, 0.91, 4.41, 1.55, 1.23, 0.82, 0.01, 2.96, 1.09, 1.18, 0.81, 1.85, 0.98, 0.18, -0.12, 0.11, 0.79, 0.28, 2.73, -0.23, 0.95, -0.11, 0.23, 0.62, 6.18, 0.81, 9.9, 2.01, 9.25, 2.04, 0.24, 0.06, 0.45]} \ No newline at end of file diff --git a/annotations_1/dnrJELv76n4_filtered.json b/annotations_1/dnrJELv76n4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6ead8c25989442fc7becb410b87015421d4dae3 --- /dev/null +++ b/annotations_1/dnrJELv76n4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.34], [10.0, 10.13], [19.0, 18.98], [31.0, 35.43], [44.0, 45.1], [45.0, 61.48], [75.0, 76.71], [84.0, 86.17], [93.0, 93.5], [95.0, 97.88], [111.0, 115.13], [119.0, 120.85], [127.0, 127.67], [134.0, 134.57], [135.0, 135.09], [135.0, 138.2], [143.0, 147.04], [151.0, 156.09], [168.0, 167.91], [172.0, 172.0], [178.0, 179.15], [180.0, 180.49], [187.0, 188.38], [194.0, 194.22], [194.0, 194.36], [200.0, 200.48], [205.0, 206.9], [209.0, 214.41], [218.0, 221.68], [224.0, 225.61]], "keep_status": [false, false, false, true, false, false, false, true, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.61, 0.0, 33.49, 0.0, 35.65, 0.0, 30.93, 34.74, 0.0, 0.0, 0.0, 0.0, 31.74, 30.03, 29.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.78, 31.71, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 57.54], ["synthesizer", 4.35], ["musical instrument", 2.2]], null, [["music", 69.53], ["quack", 3.14], ["buzz", 2.38]], null, [["music", 57.55], ["synthesizer", 4.1], ["musical instrument", 3.58]], null, [["music", 46.81], ["speech", 11.5], ["electronic music", 4.83]], [["speech", 28.03], ["music", 26.18], ["bleat", 5.64]], null, null, null, null, [["speech", 49.69], ["music", 28.75], ["throbbing", 5.54]], [["music", 70.18], ["synthesizer", 7.69], ["musical instrument", 3.61]], [["speech", 37.19], ["music", 19.22], ["sound effect", 5.47]], null, null, null, null, null, null, null, null, null, [["groan", 40.93], ["speech", 13.92], ["music", 9.46]], [["didgeridoo", 25.94], ["livestock, farm animals, working animals", 16.11], ["cattle, bovinae", 13.05]], null], "duration": [0.34, 0.13, -0.02, 4.43, 1.1, 16.48, 1.71, 2.17, 0.5, 2.88, 4.13, 1.85, 0.67, 0.57, 0.09, 3.2, 4.04, 5.09, -0.09, 0.0, 1.15, 0.49, 1.38, 0.22, 0.36, 0.48, 1.9, 5.41, 3.68, 1.61]} \ No newline at end of file diff --git a/annotations_1/doKP3Il9R1k_filtered.json b/annotations_1/doKP3Il9R1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16e7769c03b0e77897126353984b43b355f8a460 --- /dev/null +++ b/annotations_1/doKP3Il9R1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.65], [4.0, 4.28], [5.0, 6.29], [7.0, 8.34], [10.0, 10.13], [12.0, 15.6], [17.0, 17.12], [24.0, 23.99], [24.0, 25.1], [26.0, 26.25], [28.0, 28.46], [34.0, 34.28], [35.0, 36.02], [37.0, 37.57], [56.0, 56.22], [66.0, 66.28], [68.0, 68.01], [73.0, 73.04], [78.0, 78.04], [78.0, 78.27], [78.0, 79.47], [80.0, 81.11], [92.0, 91.94], [95.0, 95.0], [95.0, 97.23], [105.0, 105.9]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.14, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["radio", 15.39], ["speech", 11.67], ["moo", 7.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.13], ["speech", 25.58], ["beatboxing", 5.37]], null], "duration": [0.65, 0.28, 1.29, 1.34, 0.13, 3.6, 0.12, -0.01, 1.1, 0.25, 0.46, 0.28, 1.02, 0.57, 0.22, 0.28, 0.01, 0.04, 0.04, 0.27, 1.47, 1.11, -0.06, 0.0, 2.23, 0.9]} \ No newline at end of file diff --git a/annotations_1/dp2MR9fswWk_filtered.json b/annotations_1/dp2MR9fswWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3024bd13c986cc4a72c17bb4f6120eac1d7cd6a2 --- /dev/null +++ b/annotations_1/dp2MR9fswWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.7], [7.0, 8.21], [13.0, 14.2], [36.0, 36.54], [38.0, 42.2], [47.0, 46.92], [54.0, 54.28], [56.0, 55.92], [69.0, 69.13], [75.0, 76.13], [85.0, 85.73], [89.0, 89.16], [108.0, 108.08], [128.0, 129.61], [131.0, 130.86], [133.0, 133.73], [135.0, 137.46], [138.0, 139.18], [147.0, 147.11], [156.0, 156.37], [161.0, 161.22], [163.0, 170.87], [171.0, 179.76]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.88, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.06, 0.0, 0.0, 0.0, 0.0, 80.82, 48.39], "audiomae_on_audioset": [[["speech", 38.38], ["music", 25.01], ["hum", 3.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 59.91], ["arrow", 7.05], ["thunk", 6.38]]], "duration": [4.7, 1.21, 1.2, 0.54, 4.2, -0.08, 0.28, -0.08, 0.13, 1.13, 0.73, 0.16, 0.08, 1.61, -0.14, 0.73, 2.46, 1.18, 0.11, 0.37, 0.22, 7.87, 8.76]} \ No newline at end of file diff --git a/annotations_1/dq_RCN3esGk_filtered.json b/annotations_1/dq_RCN3esGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcddc91619aaf29da3708f7b29c46e047428aa38 --- /dev/null +++ b/annotations_1/dq_RCN3esGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.25], [7.0, 7.65], [12.0, 26.65], [38.0, 43.06], [49.0, 49.01], [52.0, 85.9], [92.0, 99.93]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [48.1, 0.0, 44.69, 29.72, 0.0, 0.0, 29.93], "audiomae_on_audioset": [[["fly, housefly", 27.28], ["insect", 11.14], ["bee, wasp, etc.", 7.33]], null, [["cattle, bovinae", 48.08], ["livestock, farm animals, working animals", 30.9], ["moo", 20.11]], [["cattle, bovinae", 50.52], ["moo", 30.79], ["livestock, farm animals, working animals", 12.5]], null, null, [["cattle, bovinae", 35.4], ["moo", 34.09], ["livestock, farm animals, working animals", 12.46]]], "duration": [2.25, 0.65, 14.65, 5.06, 0.01, 33.9, 7.93]} \ No newline at end of file diff --git a/annotations_1/droww43JVyA_filtered.json b/annotations_1/droww43JVyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9664ee3479f2993bcf3a75c2b404a971762df9f4 --- /dev/null +++ b/annotations_1/droww43JVyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.48], [4.0, 9.17], [14.0, 15.16], [16.0, 17.39], [18.0, 18.37], [21.0, 21.52], [23.0, 23.52], [24.0, 25.49], [26.0, 29.37], [30.0, 33.34], [36.0, 37.07], [40.0, 40.54], [41.0, 41.69], [43.0, 44.54], [46.0, 47.11], [48.0, 49.47], [51.0, 51.93], [52.0, 53.5], [54.0, 55.32], [64.0, 66.23], [71.0, 73.08], [74.0, 76.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 89.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 5.17, 1.16, 1.39, 0.37, 0.52, 0.52, 1.49, 3.37, 3.34, 1.07, 0.54, 0.69, 1.54, 1.11, 1.47, 0.93, 1.5, 1.32, 2.23, 2.08, 2.69]} \ No newline at end of file diff --git a/annotations_1/dry7kY2BMlk_filtered.json b/annotations_1/dry7kY2BMlk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67348b1af2ca6d4de0efc3c25d7fee39e0ab580c --- /dev/null +++ b/annotations_1/dry7kY2BMlk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [8.0, 10.57], [12.0, 24.88], [25.0, 57.15], [59.0, 65.65], [67.0, 67.53], [70.0, 75.42], [77.0, 77.94], [88.0, 89.34], [91.0, 91.64], [93.0, 94.17], [95.0, 97.16], [100.0, 100.52], [102.0, 103.69], [105.0, 107.52], [110.0, 110.61], [112.0, 114.49], [122.0, 123.18], [137.0, 146.62], [148.0, 155.28], [156.0, 159.81], [160.0, 161.25], [164.0, 164.61]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 37.53, 31.56, 0.0, 36.79, 0.0, 48.44, 0.0, 0.0, 0.0, 0.0, 50.11, 0.0, 0.0, 41.28, 0.0, 35.92, 0.0, 30.04, 36.25, 43.4, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 27.78], ["music", 25.78], ["didgeridoo", 6.07]], [["music", 72.97], ["hum", 6.52], ["throbbing", 3.88]], null, [["speech", 43.19], ["music", 5.47], ["car", 4.96]], null, [["music", 36.39], ["speech", 23.88], ["hum", 10.02]], null, null, null, null, null, null, null, [["music", 35.38], ["throbbing", 9.24], ["hum", 7.63]], null, [["music", 65.4], ["throbbing", 6.75], ["electronic music", 3.81]], null, [["speech", 41.79], ["machine gun", 23.22], ["music", 15.33]], [["music", 54.03], ["hum", 9.0], ["throbbing", 6.35]], [["music", 55.07], ["speech", 17.75], ["didgeridoo", 9.92]], null, null], "duration": [0.51, 2.57, 12.88, 32.15, 6.65, 0.53, 5.42, 0.94, 1.34, 0.64, 1.17, 2.16, 0.52, 1.69, 2.52, 0.61, 2.49, 1.18, 9.62, 7.28, 3.81, 1.25, 0.61]} \ No newline at end of file diff --git a/annotations_1/dshJG5PEOqY_filtered.json b/annotations_1/dshJG5PEOqY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b7cfa17f4ebf2d11bd17efc1d9e3881d4c1bfbb --- /dev/null +++ b/annotations_1/dshJG5PEOqY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.97], [9.0, 18.3], [20.0, 22.91], [23.0, 24.66], [25.0, 25.98], [26.0, 27.36], [28.0, 29.54], [30.0, 33.25], [34.0, 35.18], [36.0, 36.69], [40.0, 41.18], [42.0, 42.85], [44.0, 45.33], [50.0, 51.14], [52.0, 52.3], [55.0, 56.3], [58.0, 58.62], [60.0, 61.52], [63.0, 64.69], [66.0, 66.58], [69.0, 69.84], [72.0, 78.54], [80.0, 81.24], [82.0, 86.95], [92.0, 95.0], [95.0, 98.29], [99.0, 100.6], [103.0, 104.46], [105.0, 106.57], [107.0, 108.26], [109.0, 109.61], [111.0, 113.31], [116.0, 116.38], [122.0, 123.97], [124.0, 125.95], [127.0, 128.29], [129.0, 130.74], [134.0, 134.42], [138.0, 140.73], [141.0, 141.74], [143.0, 143.83], [145.0, 145.22], [147.0, 148.07], [149.0, 149.44], [150.0, 150.77], [154.0, 156.93], [158.0, 158.25], [159.0, 159.29], [169.0, 169.2], [170.0, 173.84], [181.0, 181.03], [189.0, 192.1], [195.0, 195.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 91.64, 99.97, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 0.0, 90.08, 100.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0, 52.98, 0.0, 96.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.97, 9.3, 2.91, 1.66, 0.98, 1.36, 1.54, 3.25, 1.18, 0.69, 1.18, 0.85, 1.33, 1.14, 0.3, 1.3, 0.62, 1.52, 1.69, 0.58, 0.84, 6.54, 1.24, 4.95, 3.0, 3.29, 1.6, 1.46, 1.57, 1.26, 0.61, 2.31, 0.38, 1.97, 1.95, 1.29, 1.74, 0.42, 2.73, 0.74, 0.83, 0.22, 1.07, 0.44, 0.77, 2.93, 0.25, 0.29, 0.2, 3.84, 0.03, 3.1, 0.24]} \ No newline at end of file diff --git a/annotations_1/dtgOzzBMl2o_filtered.json b/annotations_1/dtgOzzBMl2o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67fbc3ee17dfccfe3e421c0c392ba45a8e620894 --- /dev/null +++ b/annotations_1/dtgOzzBMl2o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.42], [14.0, 14.72], [16.0, 16.11], [20.0, 20.73], [22.0, 22.82], [23.0, 25.2], [31.0, 31.55], [37.0, 38.42], [39.0, 41.55], [43.0, 42.97], [48.0, 48.34], [50.0, 51.0], [53.0, 54.21], [55.0, 60.03], [68.0, 68.89], [72.0, 72.22], [73.0, 75.37], [78.0, 78.36], [83.0, 82.63], [84.0, 86.04], [109.0, 109.53], [128.0, 128.98], [130.0, 131.31], [132.0, 131.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 80.82, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 78.55, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.42, 0.72, 0.11, 0.73, 0.82, 2.2, 0.55, 1.42, 2.55, -0.03, 0.34, 1.0, 1.21, 5.03, 0.89, 0.22, 2.37, 0.36, -0.37, 2.04, 0.53, 0.98, 1.31, -0.13]} \ No newline at end of file diff --git a/annotations_1/duEErwP8eds_filtered.json b/annotations_1/duEErwP8eds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d74072edad544c61be2d4a295635a8eb0bb5dd0e --- /dev/null +++ b/annotations_1/duEErwP8eds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 31.68], [33.0, 46.79], [49.0, 54.38], [56.0, 59.24], [62.0, 79.57], [83.0, 89.94], [93.0, 115.97], [118.0, 118.89], [119.0, 120.09]], "keep_status": [true, true, false, false, false, false, true, false, false], "silence_prob": [37.72, 38.16, 70.02, 48.78, 33.83, 33.01, 36.82, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 7.26], ["music", 6.52], ["whale vocalization", 5.35]], [["groan", 25.89], ["speech", 21.78], ["grunt", 18.38]], null, [["music", 53.75], ["electronic music", 14.79], ["hum", 5.84]], [["mains hum", 27.26], ["music", 21.72], ["hum", 21.5]], [["fly, housefly", 55.67], ["insect", 27.61], ["mosquito", 5.63]], [["speech", 27.97], ["buzz", 27.59], ["hum", 8.89]], null, null], "duration": [3.68, 13.79, 5.38, 3.24, 17.57, 6.94, 22.97, 0.89, 1.09]} \ No newline at end of file diff --git a/annotations_1/duU5cdQtpSE_filtered.json b/annotations_1/duU5cdQtpSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b57f536be37306121ce725a7729efd82503b2fea --- /dev/null +++ b/annotations_1/duU5cdQtpSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.85], [18.0, 26.45], [27.0, 32.09], [36.0, 36.44], [36.0, 40.24], [41.0, 41.17], [43.0, 43.48], [44.0, 44.31], [45.0, 45.79], [47.0, 48.9], [52.0, 52.34], [57.0, 62.75], [64.0, 80.67], [84.0, 84.37], [86.0, 93.56], [97.0, 96.9], [98.0, 99.3], [101.0, 101.36], [104.0, 104.52], [106.0, 106.17], [107.0, 107.79], [109.0, 109.92], [111.0, 120.65], [121.0, 121.42], [122.0, 122.77], [123.0, 126.01], [126.0, 130.64], [131.0, 132.41]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [99.21, 81.53, 89.36, 0.0, 45.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.23, 40.77, 0.0, 29.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0, 54.76, 38.09, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 30.82], ["radio", 13.0], ["noise", 5.96]], null, null, null, null, null, null, [["music", 35.91], ["hum", 14.53], ["throbbing", 10.45]], [["hum", 49.76], ["mains hum", 33.11], ["throbbing", 6.81]], null, [["speech", 49.08], ["music", 31.91], ["synthesizer", 5.26]], null, null, null, null, null, null, null, null, null, null, null, [["frog", 43.02], ["speech", 11.07], ["croak", 10.38]], null], "duration": [3.85, 8.45, 5.09, 0.44, 4.24, 0.17, 0.48, 0.31, 0.79, 1.9, 0.34, 5.75, 16.67, 0.37, 7.56, -0.1, 1.3, 0.36, 0.52, 0.17, 0.79, 0.92, 9.65, 0.42, 0.77, 3.01, 4.64, 1.41]} \ No newline at end of file diff --git a/annotations_1/duZLaW_6qLc_filtered.json b/annotations_1/duZLaW_6qLc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e7ec67aa9b0b4dbdd1327167947f80ecd72d4c1 --- /dev/null +++ b/annotations_1/duZLaW_6qLc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.86], [9.0, 9.93], [12.0, 12.87], [17.0, 17.09], [19.0, 19.67], [25.0, 25.76], [26.0, 27.65], [31.0, 31.21], [32.0, 32.39], [33.0, 34.32], [39.0, 39.72], [42.0, 41.82], [50.0, 50.25], [51.0, 51.66], [53.0, 52.73], [54.0, 54.99], [56.0, 55.93], [59.0, 59.44], [61.0, 61.79], [64.0, 65.8], [66.0, 66.45], [68.0, 70.78], [73.0, 73.9]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [33.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.22, 0.0], "audiomae_on_audioset": [[["speech", 10.79], ["vehicle", 9.87], ["car", 9.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 25.71], ["boing", 7.4], ["fart", 6.22]], null], "duration": [2.86, 0.93, 0.87, 0.09, 0.67, 0.76, 1.65, 0.21, 0.39, 1.32, 0.72, -0.18, 0.25, 0.66, -0.27, 0.99, -0.07, 0.44, 0.79, 1.8, 0.45, 2.78, 0.9]} \ No newline at end of file diff --git a/annotations_1/dudDh8KZiTE_filtered.json b/annotations_1/dudDh8KZiTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9af911d3071ab8141c4b9e33bded11a0a5f1a828 --- /dev/null +++ b/annotations_1/dudDh8KZiTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.71], [10.0, 9.75], [11.0, 13.41], [22.0, 22.38], [28.0, 28.16], [42.0, 42.08], [44.0, 51.27], [52.0, 52.66], [56.0, 56.46], [62.0, 61.94], [66.0, 67.32], [71.0, 71.19], [72.0, 72.35], [75.0, 75.25], [86.0, 86.21], [88.0, 88.72], [90.0, 90.68], [99.0, 100.77], [102.0, 103.13], [105.0, 106.14], [108.0, 109.04], [113.0, 114.35], [116.0, 116.48], [122.0, 122.98], [124.0, 124.7], [131.0, 131.82], [134.0, 134.59], [136.0, 137.07], [138.0, 139.06], [140.0, 140.8], [142.0, 143.4], [146.0, 146.87], [157.0, 157.17], [160.0, 160.32], [168.0, 168.71], [169.0, 172.0], [173.0, 173.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.16, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.06, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.71, -0.25, 2.41, 0.38, 0.16, 0.08, 7.27, 0.66, 0.46, -0.06, 1.32, 0.19, 0.35, 0.25, 0.21, 0.72, 0.68, 1.77, 1.13, 1.14, 1.04, 1.35, 0.48, 0.98, 0.7, 0.82, 0.59, 1.07, 1.06, 0.8, 1.4, 0.87, 0.17, 0.32, 0.71, 3.0, 0.79]} \ No newline at end of file diff --git a/annotations_1/dvIzAdqrb4U_filtered.json b/annotations_1/dvIzAdqrb4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d85554c4874b0486f40501a5e88288da78f2a15 --- /dev/null +++ b/annotations_1/dvIzAdqrb4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.59], [26.0, 26.59], [50.0, 50.63], [64.0, 65.18], [66.0, 66.28], [78.0, 79.1], [84.0, 84.33], [93.0, 94.17], [102.0, 102.24], [109.0, 109.14], [111.0, 113.07], [119.0, 120.09], [128.0, 128.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.28, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 0.59, 0.63, 1.18, 0.28, 1.1, 0.33, 1.17, 0.24, 0.14, 2.07, 1.09, 0.44]} \ No newline at end of file diff --git a/annotations_1/dw95Qsj59NA_filtered.json b/annotations_1/dw95Qsj59NA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfe3398ec46fe30f79db049be0244341feadaa5e --- /dev/null +++ b/annotations_1/dw95Qsj59NA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.46], [15.0, 17.64], [19.0, 37.05], [40.0, 95.49], [98.0, 143.26], [149.0, 150.26]], "keep_status": [true, false, false, false, false, false], "silence_prob": [28.84, 30.7, 28.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 35.85], ["hum", 12.42], ["music", 11.83]], [["music", 31.43], ["throbbing", 26.4], ["hum", 22.26]], [["hum", 36.96], ["music", 18.94], ["mains hum", 18.63]], null, null, null], "duration": [8.46, 2.64, 18.05, 55.49, 45.26, 1.26]} \ No newline at end of file diff --git a/annotations_1/dwK_rODYMrY_filtered.json b/annotations_1/dwK_rODYMrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30fe9dd2880fcae96e020bb1fe14d28c0f82f4f3 --- /dev/null +++ b/annotations_1/dwK_rODYMrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.83], [11.0, 11.7], [12.0, 52.08], [54.0, 54.04], [56.0, 80.13], [83.0, 84.87], [85.0, 89.26], [90.0, 93.99], [96.0, 98.51], [100.0, 102.03], [106.0, 108.7], [110.0, 111.62], [115.0, 116.65], [120.0, 121.56], [126.0, 130.17], [131.0, 136.38], [140.0, 141.71], [146.0, 146.42], [147.0, 147.6], [149.0, 149.54], [152.0, 153.98], [159.0, 160.59], [162.0, 163.0], [165.0, 167.98], [170.0, 171.58], [173.0, 173.31], [175.0, 175.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [80.46, 0.0, 0.0, 0.0, 51.23, 0.0, 58.72, 56.55, 79.41, 76.86, 36.71, 0.0, 0.0, 0.0, 64.97, 52.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.98, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 30.96], ["speech", 11.73], ["throbbing", 9.18]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.88], ["gasp", 7.43], ["hum", 6.0]], null, null, null], "duration": [3.83, 0.7, 40.08, 0.04, 24.13, 1.87, 4.26, 3.99, 2.51, 2.03, 2.7, 1.62, 1.65, 1.56, 4.17, 5.38, 1.71, 0.42, 0.6, 0.54, 1.98, 1.59, 1.0, 2.98, 1.58, 0.31, 0.8]} \ No newline at end of file diff --git a/annotations_1/dwufX9GKI_4_filtered.json b/annotations_1/dwufX9GKI_4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8b0c432feb699890fc9e9ca1f24d203dd0ccf2c --- /dev/null +++ b/annotations_1/dwufX9GKI_4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.07], [19.0, 19.47], [20.0, 26.33], [26.0, 26.69], [30.0, 29.78], [32.0, 34.48], [39.0, 38.94], [40.0, 40.32], [40.0, 40.47], [40.0, 50.97], [66.0, 67.59], [68.0, 69.26], [71.0, 70.71], [93.0, 93.11], [95.0, 95.54], [98.0, 98.22], [101.0, 102.81], [105.0, 105.97], [108.0, 124.5], [132.0, 133.22], [135.0, 137.66], [144.0, 148.32], [152.0, 151.77], [154.0, 159.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [51.44, 0.0, 34.48, 0.0, 0.0, 42.19, 0.0, 0.0, 0.0, 34.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.14, 0.0, 33.38, 35.26, 0.0, 36.57], "audiomae_on_audioset": [null, null, [["speech", 61.89], ["fart", 8.07], ["boing", 4.13]], null, null, [["music", 36.77], ["speech", 31.59], ["didgeridoo", 14.27]], null, null, null, [["music", 61.04], ["speech", 9.57], ["synthesizer", 2.48]], null, null, null, null, null, null, null, null, [["music", 65.2], ["speech", 10.34], ["didgeridoo", 3.1]], null, [["music", 45.05], ["boing", 9.57], ["speech", 9.08]], [["music", 38.21], ["fly, housefly", 11.48], ["mosquito", 7.59]], null, [["music", 52.45], ["didgeridoo", 27.17], ["hum", 1.74]]], "duration": [3.07, 0.47, 6.33, 0.69, -0.22, 2.48, -0.06, 0.32, 0.47, 10.97, 1.59, 1.26, -0.29, 0.11, 0.54, 0.22, 1.81, 0.97, 16.5, 1.22, 2.66, 4.32, -0.23, 5.43]} \ No newline at end of file diff --git a/annotations_1/dwzoyEaHxSM_filtered.json b/annotations_1/dwzoyEaHxSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eca81f9597d0524946d3d8617ac7b9226ee5730 --- /dev/null +++ b/annotations_1/dwzoyEaHxSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [7.0, 7.72], [18.0, 18.45], [19.0, 18.93], [21.0, 21.59], [24.0, 24.46], [26.0, 26.57], [28.0, 29.13], [30.0, 30.75], [34.0, 34.23], [36.0, 38.03], [39.0, 40.17], [42.0, 43.43], [45.0, 45.5], [47.0, 47.44], [50.0, 50.4], [51.0, 52.56], [61.0, 61.2], [63.0, 65.01], [65.0, 66.99], [68.0, 69.97], [71.0, 73.16], [74.0, 75.27], [77.0, 78.41], [80.0, 81.84], [83.0, 83.98], [89.0, 90.02], [93.0, 93.8], [94.0, 95.74], [98.0, 98.05], [99.0, 100.6], [102.0, 104.04], [105.0, 107.01], [108.0, 108.65], [109.0, 110.2], [113.0, 114.03], [115.0, 116.31], [120.0, 121.73], [124.0, 125.79], [127.0, 128.33], [132.0, 133.22], [136.0, 137.56], [140.0, 141.08], [141.0, 142.5], [144.0, 144.15], [147.0, 148.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.64, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 69.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.72, 0.45, -0.07, 0.59, 0.46, 0.57, 1.13, 0.75, 0.23, 2.03, 1.17, 1.43, 0.5, 0.44, 0.4, 1.56, 0.2, 2.01, 1.99, 1.97, 2.16, 1.27, 1.41, 1.84, 0.98, 1.02, 0.8, 1.74, 0.05, 1.6, 2.04, 2.01, 0.65, 1.2, 1.03, 1.31, 1.73, 1.79, 1.33, 1.22, 1.56, 1.08, 1.5, 0.15, 1.2]} \ No newline at end of file diff --git a/annotations_1/dy3yjv2YLh0_filtered.json b/annotations_1/dy3yjv2YLh0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a29cd97d7a6b915d2875a52e1c6cc30e16f7b44 --- /dev/null +++ b/annotations_1/dy3yjv2YLh0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.17], [15.0, 15.57], [21.0, 32.24], [49.0, 50.5], [55.0, 57.18], [76.0, 77.35], [83.0, 85.83], [95.0, 98.61], [100.0, 101.28], [103.0, 104.16], [108.0, 108.65], [116.0, 117.14], [123.0, 126.01], [127.0, 128.17], [130.0, 132.48], [134.0, 135.6], [139.0, 139.23], [141.0, 141.49], [143.0, 143.31]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 38.97, 0.0, 54.23, 0.0, 56.03, 52.74, 0.0, 0.0, 0.0, 0.0, 46.33, 0.0, 38.14, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["glass", 16.4], ["music", 15.42], ["coin (dropping)", 6.78]], null, null, null, null, null, null, null, null, null, [["speech", 24.85], ["music", 15.4], ["boing", 11.16]], null, [["music", 15.45], ["speech", 13.97], ["singing bowl", 6.0]], null, null, null, null], "duration": [1.17, 0.57, 11.24, 1.5, 2.18, 1.35, 2.83, 3.61, 1.28, 1.16, 0.65, 1.14, 3.01, 1.17, 2.48, 1.6, 0.23, 0.49, 0.31]} \ No newline at end of file diff --git a/annotations_1/dyXlsD7Gx0Y_filtered.json b/annotations_1/dyXlsD7Gx0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ac8a2d63ace8872bde4eb515bc779ee1e2f34c1 --- /dev/null +++ b/annotations_1/dyXlsD7Gx0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [4.0, 7.21], [8.0, 15.35], [16.0, 68.62], [70.0, 71.73], [72.0, 75.05], [75.0, 76.72], [79.0, 81.04], [82.0, 90.32], [92.0, 105.22], [106.0, 106.66], [107.0, 111.47], [112.0, 112.65], [113.0, 128.76], [131.0, 131.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 89.19, 100.0, 0.0, 0.0, 99.92, 0.0, 100.0, 97.64, 97.11, 0.0, 91.3, 0.0, 84.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.38, 3.21, 7.35, 52.62, 1.73, 3.05, 1.72, 2.04, 8.32, 13.22, 0.66, 4.47, 0.65, 15.76, 0.8]} \ No newline at end of file diff --git a/annotations_1/dzzijuZof1w_filtered.json b/annotations_1/dzzijuZof1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46ce546f63bcd3b24d2072b9d8a62bb1dfc32cfb --- /dev/null +++ b/annotations_1/dzzijuZof1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.48], [28.0, 28.66], [29.0, 29.98], [31.0, 40.42], [41.0, 52.64], [59.0, 78.14], [79.0, 103.65], [105.0, 113.24], [114.0, 114.78], [116.0, 132.75], [135.0, 139.6], [143.0, 144.29], [148.0, 148.58]], "keep_status": [false, false, false, true, false, true, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.43, 29.18, 28.88, 29.03, 29.09, 0.0, 28.84, 28.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 24.37], ["speech", 22.91], ["hum", 21.42]], [["throbbing", 39.55], ["music", 30.28], ["hum", 15.94]], [["music", 28.51], ["speech", 15.98], ["hum", 9.39]], [["music", 27.05], ["machine gun", 20.18], ["hum", 11.68]], [["music", 27.45], ["rumble", 11.59], ["gong", 9.81]], null, [["music", 43.81], ["hum", 10.74], ["mains hum", 6.94]], [["music", 30.02], ["hum", 19.1], ["mains hum", 10.97]], null, null], "duration": [0.48, 0.66, 0.98, 9.42, 11.64, 19.14, 24.65, 8.24, 0.78, 16.75, 4.6, 1.29, 0.58]} \ No newline at end of file diff --git a/annotations_1/e-NMI6o5ynk_filtered.json b/annotations_1/e-NMI6o5ynk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2bb5390e82e0d15dd6ba2d9fcbc565ce242aad8 --- /dev/null +++ b/annotations_1/e-NMI6o5ynk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.82], [12.0, 13.2], [14.0, 15.67], [16.0, 27.33], [31.0, 32.07], [33.0, 51.56]], "keep_status": [false, false, false, false, false, false], "silence_prob": [35.1, 0.0, 0.0, 33.47, 0.0, 32.65], "audiomae_on_audioset": [[["music", 80.14], ["synthesizer", 1.36], ["sampler", 1.24]], null, null, [["music", 79.07], ["throbbing", 1.48], ["sampler", 1.31]], null, [["music", 71.27], ["singing", 3.02], ["didgeridoo", 2.96]]], "duration": [2.82, 1.2, 1.67, 11.33, 1.07, 18.56]} \ No newline at end of file diff --git a/annotations_1/e0HzBST_794_filtered.json b/annotations_1/e0HzBST_794_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..779a2e2191018a8b0206d12dd87a89ceb49791c1 --- /dev/null +++ b/annotations_1/e0HzBST_794_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.86], [6.0, 15.9], [18.0, 19.84], [27.0, 34.37], [35.0, 49.94], [66.0, 66.11], [68.0, 69.35], [90.0, 90.17], [94.0, 99.76], [105.0, 112.06], [124.0, 157.06], [157.0, 157.1], [157.0, 157.13], [157.0, 157.17]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 31.34, 0.0, 30.99, 32.63, 0.0, 0.0, 0.0, 35.36, 32.15, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 46.24], ["cattle, bovinae", 21.08], ["moo", 11.12]], null, [["moo", 35.5], ["cattle, bovinae", 33.52], ["livestock, farm animals, working animals", 25.6]], [["animal", 63.47], ["grunt", 17.72], ["livestock, farm animals, working animals", 3.93]], null, null, null, [["music", 22.85], ["whack, thwack", 14.08], ["speech", 13.15]], [["boing", 24.17], ["speech", 15.59], ["music", 14.44]], null, null, null, null], "duration": [-0.14, 9.9, 1.84, 7.37, 14.94, 0.11, 1.35, 0.17, 5.76, 7.06, 33.06, 0.1, 0.13, 0.17]} \ No newline at end of file diff --git a/annotations_1/e0UZ0rc0KH4_filtered.json b/annotations_1/e0UZ0rc0KH4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3b51e72f765c63077da9ce45390b815fc3b5662 --- /dev/null +++ b/annotations_1/e0UZ0rc0KH4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.88], [10.0, 10.5], [11.0, 11.67], [13.0, 13.1], [13.0, 14.88], [16.0, 23.33], [24.0, 34.57], [37.0, 36.98], [37.0, 37.66], [44.0, 50.04], [52.0, 51.83], [52.0, 56.54], [57.0, 59.61], [61.0, 61.75], [63.0, 63.42], [64.0, 65.31], [66.0, 75.52], [78.0, 80.69], [82.0, 82.73], [86.0, 86.12], [87.0, 87.02], [90.0, 92.18], [93.0, 98.05], [99.0, 99.44], [100.0, 100.84], [104.0, 105.29], [106.0, 115.64], [119.0, 119.65], [120.0, 125.27], [126.0, 130.0], [131.0, 133.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 52.56, 57.32, 0.0, 0.0, 58.89, 0.0, 52.45, 60.14, 0.0, 0.0, 0.0, 46.43, 58.89, 0.0, 0.0, 0.0, 77.7, 64.07, 0.0, 0.0, 0.0, 78.89, 0.0, 71.43, 69.2, 63.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.08], ["hum", 20.56], ["throbbing", 8.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.5, 0.67, 0.1, 1.88, 7.33, 10.57, -0.02, 0.66, 6.04, -0.17, 4.54, 2.61, 0.75, 0.42, 1.31, 9.52, 2.69, 0.73, 0.12, 0.02, 2.18, 5.05, 0.44, 0.84, 1.29, 9.64, 0.65, 5.27, 4.0, 2.02]} \ No newline at end of file diff --git a/annotations_1/e198XToyAkk_filtered.json b/annotations_1/e198XToyAkk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f3f3a094afcbbba59d2555e3da78de62b17ab4f --- /dev/null +++ b/annotations_1/e198XToyAkk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.1], [35.0, 35.58], [41.0, 41.47], [49.0, 49.72], [52.0, 51.75], [64.0, 65.48], [67.0, 66.93], [68.0, 74.49], [76.0, 75.96], [78.0, 77.95], [95.0, 97.78], [103.0, 103.84], [115.0, 115.52], [136.0, 136.81], [138.0, 138.43], [146.0, 148.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.07, 0.0, 0.0, 35.91, 0.0, 0.0, 0.0, 0.0, 35.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 72.9], ["speech", 11.73], ["wail, moan", 3.73]], null, null, [["music", 77.4], ["musical instrument", 5.51], ["synthesizer", 3.79]], null, null, null, null, [["boing", 36.42], ["speech", 18.1], ["ding", 6.88]]], "duration": [0.1, 0.58, 0.47, 0.72, -0.25, 1.48, -0.07, 6.49, -0.04, -0.05, 2.78, 0.84, 0.52, 0.81, 0.43, 2.22]} \ No newline at end of file diff --git a/annotations_1/e1FWoMLjAU0_filtered.json b/annotations_1/e1FWoMLjAU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..536c72b9ab7c550cdaf7649ed71db5e75e50b3dc --- /dev/null +++ b/annotations_1/e1FWoMLjAU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 61.79], [63.0, 63.86], [65.0, 65.97], [71.0, 72.82], [73.0, 74.76], [76.0, 77.41], [79.0, 81.35], [83.0, 84.21], [86.0, 86.54], [88.0, 90.14], [90.0, 93.43], [94.0, 95.3], [97.0, 97.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 77.03, 50.61, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.79, 0.86, 0.97, 1.82, 1.76, 1.41, 2.35, 1.21, 0.54, 2.14, 3.43, 1.3, 0.43]} \ No newline at end of file diff --git a/annotations_1/e2dAiCB6igE_filtered.json b/annotations_1/e2dAiCB6igE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f068ad82f8c2fba909e4acfc89c68cb0292185f --- /dev/null +++ b/annotations_1/e2dAiCB6igE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.0], [16.0, 16.44], [22.0, 22.64], [24.0, 24.75], [28.0, 29.44], [30.0, 31.21], [33.0, 34.42], [39.0, 40.61], [52.0, 52.44], [57.0, 57.84], [61.0, 64.77], [67.0, 69.38], [71.0, 70.87], [72.0, 73.79], [82.0, 88.25], [91.0, 91.84], [93.0, 93.68], [101.0, 107.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 99.91, 0.0, 0.0, 42.67, 0.0, 0.0, 30.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.51], ["fly, housefly", 8.75], ["buzz", 3.29]], null, null, [["music", 30.06], ["fly, housefly", 7.36], ["mosquito", 6.73]]], "duration": [1.0, 0.44, 0.64, 0.75, 1.44, 1.21, 1.42, 1.61, 0.44, 0.84, 3.77, 2.38, -0.13, 1.79, 6.25, 0.84, 0.68, 6.86]} \ No newline at end of file diff --git a/annotations_1/e3BZn-XJ4mU_filtered.json b/annotations_1/e3BZn-XJ4mU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2529c6881564014a6fafbcd77b29321b31553cbe --- /dev/null +++ b/annotations_1/e3BZn-XJ4mU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 35.53], [36.0, 35.58], [36.0, 44.9], [46.0, 49.57], [50.0, 73.52], [75.0, 74.87], [76.0, 78.11], [80.0, 93.9], [97.0, 97.77], [100.0, 111.28], [112.0, 114.76], [117.0, 120.88], [121.0, 129.71], [130.0, 134.22], [137.0, 142.28], [143.0, 143.77]], "keep_status": [true, false, false, true, false, false, true, true, false, false, true, true, true, true, true, false], "silence_prob": [28.15, 0.0, 31.04, 31.14, 29.69, 0.0, 29.67, 27.86, 0.0, 28.48, 29.48, 29.45, 29.51, 28.81, 29.46, 0.0], "audiomae_on_audioset": [[["explosion", 20.85], ["music", 10.57], ["whack, thwack", 7.35]], null, [["speech", 66.87], ["music", 7.8], ["breaking", 2.28]], [["music", 52.39], ["hum", 2.64], ["vehicle", 2.21]], [["livestock, farm animals, working animals", 40.85], ["cattle, bovinae", 28.52], ["moo", 9.5]], null, [["sound effect", 13.32], ["whale vocalization", 12.86], ["roar", 8.7]], [["explosion", 15.17], ["rumble", 14.42], ["music", 6.74]], null, [["music", 72.89], ["throbbing", 6.81], ["hum", 6.34]], [["speech", 10.31], ["hum", 9.14], ["whack, thwack", 8.64]], [["music", 28.39], ["whack, thwack", 8.72], ["throbbing", 8.18]], [["music", 36.92], ["whack, thwack", 9.25], ["clang", 8.34]], [["music", 54.73], ["speech", 7.26], ["boing", 5.89]], [["ding", 31.02], ["boing", 11.6], ["music", 11.59]], null], "duration": [12.53, -0.42, 8.9, 3.57, 23.52, -0.13, 2.11, 13.9, 0.77, 11.28, 2.76, 3.88, 8.71, 4.22, 5.28, 0.77]} \ No newline at end of file diff --git a/annotations_1/e48T01eVXtU_filtered.json b/annotations_1/e48T01eVXtU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80d23c29423f83d21063b1a26b88032ce4027483 --- /dev/null +++ b/annotations_1/e48T01eVXtU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.52], [12.0, 12.23], [21.0, 22.49], [37.0, 44.41], [48.0, 49.92], [52.0, 56.61], [57.0, 58.36], [65.0, 68.84], [73.0, 74.48], [75.0, 75.22], [76.0, 81.7], [91.0, 91.47], [92.0, 94.53], [96.0, 99.2], [102.0, 103.32], [104.0, 108.65], [109.0, 108.9], [110.0, 110.17], [113.0, 114.52], [117.0, 118.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, true, false, false, false, false], "silence_prob": [38.15, 0.0, 0.0, 30.13, 0.0, 30.45, 0.0, 29.71, 0.0, 0.0, 30.93, 0.0, 30.46, 32.8, 0.0, 30.68, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 43.41], ["cattle, bovinae", 28.68], ["moo", 14.11]], null, null, [["music", 42.17], ["speech", 24.34], ["cattle, bovinae", 5.57]], null, [["moo", 42.12], ["cattle, bovinae", 26.57], ["livestock, farm animals, working animals", 9.8]], null, [["music", 59.82], ["speech", 17.54], ["boing", 5.08]], null, null, [["fly, housefly", 24.32], ["mosquito", 18.31], ["music", 16.1]], null, [["music", 45.94], ["boing", 12.05], ["speech", 5.94]], [["music", 40.04], ["speech", 9.65], ["musical instrument", 9.28]], null, [["cattle, bovinae", 23.48], ["moo", 21.46], ["fart", 11.48]], null, null, null, null], "duration": [7.52, 0.23, 1.49, 7.41, 1.92, 4.61, 1.36, 3.84, 1.48, 0.22, 5.7, 0.47, 2.53, 3.2, 1.32, 4.65, -0.1, 0.17, 1.52, 1.47]} \ No newline at end of file diff --git a/annotations_1/e4Dlc6yqJuA_filtered.json b/annotations_1/e4Dlc6yqJuA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..235efaa26013283e0a0b96fba1839414e0e6722c --- /dev/null +++ b/annotations_1/e4Dlc6yqJuA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.73], [14.0, 16.58], [18.0, 42.06], [45.0, 45.47], [47.0, 48.05]], "keep_status": [false, false, true, false, false], "silence_prob": [90.43, 89.9, 31.58, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 40.2], ["hum", 19.74], ["mains hum", 7.03]], null, null], "duration": [4.73, 2.58, 24.06, 0.47, 1.05]} \ No newline at end of file diff --git a/annotations_1/e56FOw5rIhw_filtered.json b/annotations_1/e56FOw5rIhw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..707598d521f5aed2cf1ece65c944a5435a51886c --- /dev/null +++ b/annotations_1/e56FOw5rIhw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 50.28], [51.0, 77.95]], "keep_status": [false, false], "silence_prob": [0.0, 30.83], "audiomae_on_audioset": [null, [["music", 56.45], ["throbbing", 10.65], ["musical instrument", 4.5]]], "duration": [0.28, 26.95]} \ No newline at end of file diff --git a/annotations_1/e5LZR3vCkzo_filtered.json b/annotations_1/e5LZR3vCkzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af3689afb1730ee77c57ec550a720ecf591eecf1 --- /dev/null +++ b/annotations_1/e5LZR3vCkzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.13], [10.0, 10.88], [13.0, 14.5], [16.0, 20.17], [27.0, 64.5], [66.0, 66.46], [70.0, 78.75], [79.0, 80.33], [81.0, 108.63]], "keep_status": [false, false, false, true, false, false, false, false, true], "silence_prob": [60.42, 0.0, 0.0, 35.0, 0.0, 0.0, 32.52, 0.0, 30.57], "audiomae_on_audioset": [null, null, null, [["music", 36.42], ["throbbing", 16.46], ["hum", 16.37]], null, null, [["music", 68.46], ["speech", 5.44], ["throbbing", 4.54]], null, [["music", 42.24], ["speech", 12.1], ["whack, thwack", 10.14]]], "duration": [3.13, 0.88, 1.5, 4.17, 37.5, 0.46, 8.75, 1.33, 27.63]} \ No newline at end of file diff --git a/annotations_1/e5cg1EeFISo_filtered.json b/annotations_1/e5cg1EeFISo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91d8d4497fbfe35fb60226aabcabb30a65f078db --- /dev/null +++ b/annotations_1/e5cg1EeFISo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.04], [9.0, 9.07], [30.0, 30.27], [39.0, 40.47], [50.0, 50.77], [74.0, 74.6], [76.0, 75.83], [91.0, 91.03], [103.0, 106.86], [109.0, 109.76], [127.0, 127.01], [128.0, 128.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.5, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.07, 0.27, 1.47, 0.77, 0.6, -0.17, 0.03, 3.86, 0.76, 0.01, 0.33]} \ No newline at end of file diff --git a/annotations_1/e6B-T4KYIFQ_filtered.json b/annotations_1/e6B-T4KYIFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..815885a22353b1ce15a8abb21898376c1b1c10e1 --- /dev/null +++ b/annotations_1/e6B-T4KYIFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.64], [8.0, 29.32], [32.0, 33.89], [36.0, 38.58], [39.0, 38.75], [39.0, 39.04], [39.0, 49.54], [54.0, 56.76], [58.0, 59.64], [63.0, 73.3], [77.0, 98.63], [103.0, 105.61], [106.0, 118.56], [126.0, 126.32], [127.0, 143.04]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 49.04, 0.0, 46.19, 0.0, 0.0, 48.74, 94.22, 0.0, 47.78, 35.4, 30.67, 33.5, 0.0, 39.91], "audiomae_on_audioset": [null, [["music", 32.85], ["speech", 9.39], ["boing", 8.27]], null, [["speech", 20.76], ["music", 6.79], ["singing bowl", 3.8]], null, null, [["music", 35.7], ["speech", 29.53], ["whack, thwack", 6.13]], null, null, [["music", 66.71], ["electronic music", 4.64], ["thunk", 3.67]], [["music", 60.17], ["electronic music", 6.74], ["ambient music", 5.88]], [["speech", 32.66], ["sheep", 22.94], ["bleat", 13.85]], [["music", 71.56], ["scary music", 6.47], ["speech", 4.28]], null, [["speech", 58.1], ["animal", 14.81], ["dog", 5.38]]], "duration": [1.64, 21.32, 1.89, 2.58, -0.25, 0.04, 10.54, 2.76, 1.64, 10.3, 21.63, 2.61, 12.56, 0.32, 16.04]} \ No newline at end of file diff --git a/annotations_1/e7qjmOp9G34_filtered.json b/annotations_1/e7qjmOp9G34_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c2f9bd802ffed71bd588d578847a61db7a6f522 --- /dev/null +++ b/annotations_1/e7qjmOp9G34_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 51.98], [54.0, 80.22], [81.0, 85.62], [87.0, 88.48], [90.0, 90.22], [96.0, 97.8], [99.0, 107.5], [110.0, 111.82], [115.0, 125.29], [127.0, 130.92], [131.0, 136.7], [137.0, 139.85], [140.0, 141.66]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 32.25, 37.76, 0.0, 0.0, 0.0, 30.35, 0.0, 29.97, 40.45, 40.59, 44.01, 0.0], "audiomae_on_audioset": [null, [["music", 38.4], ["throbbing", 25.24], ["hum", 22.43]], [["music", 58.09], ["throbbing", 10.74], ["hum", 6.82]], null, null, null, [["throbbing", 55.86], ["hum", 17.57], ["music", 11.31]], null, [["speech", 42.21], ["music", 17.63], ["throbbing", 12.82]], [["music", 28.99], ["throbbing", 23.65], ["hum", 14.09]], [["throbbing", 24.47], ["hum", 23.09], ["music", 16.9]], [["music", 37.44], ["throbbing", 19.49], ["hum", 12.31]], null], "duration": [47.98, 26.22, 4.62, 1.48, 0.22, 1.8, 8.5, 1.82, 10.29, 3.92, 5.7, 2.85, 1.66]} \ No newline at end of file diff --git a/annotations_1/e80zdJ6pWlI_filtered.json b/annotations_1/e80zdJ6pWlI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..573ea4c1b1d99d488122c051e5bcb2ab5e65d138 --- /dev/null +++ b/annotations_1/e80zdJ6pWlI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 40.68], [44.0, 83.86]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [35.68, 39.86]} \ No newline at end of file diff --git a/annotations_1/e8EAVtsvfxc_filtered.json b/annotations_1/e8EAVtsvfxc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76e0d9b311f4e62772e0554e3b8360256662a226 --- /dev/null +++ b/annotations_1/e8EAVtsvfxc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.9], [11.0, 13.63], [15.0, 16.46], [22.0, 24.34], [25.0, 27.01], [28.0, 28.46], [31.0, 31.9], [33.0, 34.05], [35.0, 36.02], [40.0, 39.95], [50.0, 52.08], [56.0, 81.03], [84.0, 85.36], [86.0, 87.35], [89.0, 89.68], [91.0, 91.45], [93.0, 120.28], [121.0, 122.67], [125.0, 127.03], [128.0, 128.95], [131.0, 132.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.8, 0.0, 99.97, 60.6, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 77.87, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 89.01, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.9, 2.63, 1.46, 2.34, 2.01, 0.46, 0.9, 1.05, 1.02, -0.05, 2.08, 25.03, 1.36, 1.35, 0.68, 0.45, 27.28, 1.67, 2.03, 0.95, 1.06]} \ No newline at end of file diff --git a/annotations_1/e96_1NxL9no_filtered.json b/annotations_1/e96_1NxL9no_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad2919183fa313e40ece60403dcc508101218f4c --- /dev/null +++ b/annotations_1/e96_1NxL9no_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [9.0, 10.57], [12.0, 11.99], [13.0, 13.91], [17.0, 17.37], [20.0, 24.66], [33.0, 35.07], [37.0, 39.36], [43.0, 43.58], [45.0, 45.45], [47.0, 48.44], [49.0, 50.11], [54.0, 54.45], [58.0, 58.56], [59.0, 60.37], [61.0, 62.95], [65.0, 66.01], [71.0, 82.56], [84.0, 86.04], [87.0, 88.28], [92.0, 92.47], [93.0, 99.28], [100.0, 102.27], [115.0, 115.64], [116.0, 133.95], [138.0, 139.94], [141.0, 141.64], [143.0, 143.9], [154.0, 165.89]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 53.1, 34.12, 33.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.34, 38.93, 0.0, 0.0, 32.85, 48.82, 0.0, 34.01, 0.0, 0.0, 0.0, 33.66], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 15.13], ["speech", 15.11], ["boing", 14.92]], [["music", 36.97], ["speech", 21.62], ["boing", 16.77]], null, null, null, null, null, null, null, null, null, [["music", 81.96], ["livestock, farm animals, working animals", 1.69], ["musical instrument", 1.47]], [["music", 50.34], ["speech", 9.22], ["oink", 7.07]], null, null, [["music", 29.97], ["livestock, farm animals, working animals", 13.03], ["animal", 7.64]], [["bleat", 14.17], ["owl", 13.46], ["speech", 13.45]], null, [["music", 82.37], ["hum", 2.29], ["speech", 1.82]], null, null, null, [["music", 33.85], ["livestock, farm animals, working animals", 14.9], ["moo", 9.37]]], "duration": [0.5, 1.57, -0.01, 0.91, 0.37, 4.66, 2.07, 2.36, 0.58, 0.45, 1.44, 1.11, 0.45, 0.56, 1.37, 1.95, 1.01, 11.56, 2.04, 1.28, 0.47, 6.28, 2.27, 0.64, 17.95, 1.94, 0.64, 0.9, 11.89]} \ No newline at end of file diff --git a/annotations_1/e9_4oS3hTPk_filtered.json b/annotations_1/e9_4oS3hTPk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e94a3dd15c22a68715517a35a499504b69a4e8c --- /dev/null +++ b/annotations_1/e9_4oS3hTPk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.92], [10.0, 9.88], [12.0, 14.4], [16.0, 16.75], [18.0, 19.55], [20.0, 21.78], [23.0, 25.41], [27.0, 27.82], [29.0, 30.05], [32.0, 32.43], [34.0, 39.26], [48.0, 106.19], [108.0, 109.04], [110.0, 110.51], [112.0, 112.31], [113.0, 115.6], [120.0, 122.64], [126.0, 125.83], [127.0, 128.68], [133.0, 134.69], [138.0, 139.94], [142.0, 143.94], [145.0, 145.72], [147.0, 148.74], [150.0, 151.34], [153.0, 155.38]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 44.66, 0.0, 0.0, 0.0, 33.72, 0.0, 0.0, 0.0, 0.0, 47.74, 45.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.81], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 28.05], ["speech", 16.41], ["hum", 14.15]], null, null, null, [["music", 32.58], ["speech", 29.92], ["hum", 7.6]], null, null, null, null, [["speech", 48.76], ["singing bowl", 14.51], ["gong", 7.26]], [["speech", 33.68], ["sidetone", 33.62], ["music", 3.02]], null, null, null, null, null, null, null, null, null], "duration": [0.92, -0.12, 2.4, 0.75, 1.55, 1.78, 2.41, 0.82, 1.05, 0.43, 5.26, 58.19, 1.04, 0.51, 0.31, 2.6, 2.64, -0.17, 1.68, 1.69, 1.94, 1.94, 0.72, 1.74, 1.34, 2.38]} \ No newline at end of file diff --git a/annotations_1/eA-V5wUcWos_filtered.json b/annotations_1/eA-V5wUcWos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08f07cc030232a21f05f3e84c29572d68f2d547b --- /dev/null +++ b/annotations_1/eA-V5wUcWos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 16.28], [18.0, 54.82], [59.0, 95.2], [95.0, 96.11], [104.0, 105.41], [106.0, 106.51], [108.0, 130.62], [131.0, 135.24]], "keep_status": [false, false, false, false, false, false, true, true], "silence_prob": [28.29, 0.0, 0.0, 0.0, 0.0, 0.0, 28.59, 29.02], "audiomae_on_audioset": [[["speech", 54.0], ["artillery fire", 9.21], ["explosion", 8.35]], null, null, null, null, null, [["eruption", 17.85], ["white noise", 7.54], ["livestock, farm animals, working animals", 6.92]], [["cattle, bovinae", 33.77], ["speech", 14.51], ["moo", 11.81]]], "duration": [8.28, 36.82, 36.2, 1.11, 1.41, 0.51, 22.62, 4.24]} \ No newline at end of file diff --git a/annotations_1/eAC2kNiKuEg_filtered.json b/annotations_1/eAC2kNiKuEg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6169d05caa53ca068376259080b208f896206b21 --- /dev/null +++ b/annotations_1/eAC2kNiKuEg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 55.19], [57.0, 67.41], [68.0, 69.13], [71.0, 71.47], [74.0, 80.37], [81.0, 82.12], [83.0, 87.88], [92.0, 94.53], [98.0, 112.48]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 32.82, 0.0, 0.0, 52.74, 0.0, 32.48, 37.24, 33.67], "audiomae_on_audioset": [null, [["music", 48.34], ["speech", 28.58], ["electronic music", 4.45]], null, null, null, null, [["music", 69.74], ["throbbing", 5.18], ["speech", 4.13]], [["music", 36.06], ["throbbing", 15.39], ["speech", 13.13]], [["music", 63.48], ["speech", 15.1], ["electronic music", 1.8]]], "duration": [38.19, 10.41, 1.13, 0.47, 6.37, 1.12, 4.88, 2.53, 14.48]} \ No newline at end of file diff --git a/annotations_1/eAp8Vm19uQU_filtered.json b/annotations_1/eAp8Vm19uQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a19b8330a184452b00433c61412dea0f6dc1ebf --- /dev/null +++ b/annotations_1/eAp8Vm19uQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[80.0, 80.38], [83.0, 82.81], [84.0, 85.75], [86.0, 109.61], [113.0, 120.18], [120.0, 133.25]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.93, 29.9, 29.67], "audiomae_on_audioset": [null, null, null, [["music", 36.81], ["throbbing", 18.51], ["hum", 12.39]], [["hum", 43.1], ["throbbing", 37.64], ["music", 9.01]], [["music", 74.61], ["cacophony", 7.85], ["hum", 2.75]]], "duration": [0.38, -0.19, 1.75, 23.61, 7.18, 13.25]} \ No newline at end of file diff --git a/annotations_1/eB-ldQkL--0_filtered.json b/annotations_1/eB-ldQkL--0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba67f7cc920ae313d9c8552b611bbcc7b11e339f --- /dev/null +++ b/annotations_1/eB-ldQkL--0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.54], [7.0, 15.18], [19.0, 27.63], [31.0, 31.45], [35.0, 36.73], [38.0, 46.72], [51.0, 52.47], [53.0, 54.04], [57.0, 62.09], [64.0, 70.06], [72.0, 75.05], [76.0, 79.37], [81.0, 82.16], [83.0, 83.71], [86.0, 116.67], [118.0, 118.34], [126.0, 135.78], [138.0, 139.45], [140.0, 150.04], [153.0, 152.95], [156.0, 156.66], [157.0, 158.65], [166.0, 169.16], [170.0, 170.65], [183.0, 184.03], [187.0, 188.33], [189.0, 193.35], [196.0, 201.21], [203.0, 203.1], [205.0, 206.71], [207.0, 208.84], [218.0, 234.55], [235.0, 236.7], [240.0, 240.21]], "keep_status": [false, true, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 30.97, 31.23, 0.0, 0.0, 30.28, 0.0, 0.0, 30.22, 30.45, 31.83, 29.39, 0.0, 0.0, 0.0, 0.0, 31.07, 0.0, 29.74, 0.0, 0.0, 0.0, 30.19, 0.0, 0.0, 0.0, 28.68, 28.36, 0.0, 0.0, 0.0, 28.31, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 27.81], ["music", 23.73], ["sidetone", 11.04]], [["speech", 29.26], ["music", 24.22], ["throbbing", 17.9]], null, null, [["throbbing", 48.4], ["music", 24.91], ["hum", 17.83]], null, null, [["speech", 39.22], ["music", 12.57], ["throbbing", 7.95]], [["throbbing", 46.64], ["hum", 21.88], ["music", 14.31]], [["throbbing", 26.87], ["hum", 21.73], ["music", 20.72]], [["music", 32.64], ["speech", 22.99], ["didgeridoo", 13.37]], null, null, null, null, [["music", 70.28], ["throbbing", 11.22], ["hum", 2.13]], null, [["music", 45.76], ["speech", 31.33], ["didgeridoo", 12.5]], null, null, null, [["speech", 45.04], ["music", 29.92], ["throbbing", 7.63]], null, null, null, [["music", 60.89], ["throbbing", 11.13], ["hum", 7.15]], [["music", 44.9], ["speech", 35.9], ["electronic music", 2.51]], null, null, null, [["buzz", 20.94], ["electric shaver, electric razor", 10.85], ["music", 8.22]], null, null], "duration": [0.54, 8.18, 8.63, 0.45, 1.73, 8.72, 1.47, 1.04, 5.09, 6.06, 3.05, 3.37, 1.16, 0.71, 30.67, 0.34, 9.78, 1.45, 10.04, -0.05, 0.66, 1.65, 3.16, 0.65, 1.03, 1.33, 4.35, 5.21, 0.1, 1.71, 1.84, 16.55, 1.7, 0.21]} \ No newline at end of file diff --git a/annotations_1/eBVqcDJbl5A_filtered.json b/annotations_1/eBVqcDJbl5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4894fba56aa44d7e80973fd24f4c4b51d30397e1 --- /dev/null +++ b/annotations_1/eBVqcDJbl5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.97], [21.0, 31.97], [35.0, 46.01], [50.0, 61.35], [62.0, 63.44], [65.0, 77.89], [78.0, 91.17], [92.0, 100.53], [103.0, 114.05], [119.0, 119.52], [122.0, 122.71], [125.0, 129.22], [135.0, 138.74], [140.0, 141.17], [141.0, 146.2], [147.0, 153.55], [158.0, 161.64]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 32.23, 30.83, 31.32, 0.0, 62.27, 39.11, 31.67, 68.41, 0.0, 0.0, 59.07, 34.0, 0.0, 32.56, 36.26, 31.68], "audiomae_on_audioset": [null, [["mains hum", 37.19], ["hum", 34.01], ["music", 14.56]], [["music", 45.39], ["electronic music", 7.23], ["cacophony", 5.57]], [["buzz", 39.63], ["electric shaver, electric razor", 37.1], ["speech", 8.44]], null, null, [["hum", 71.31], ["mains hum", 12.63], ["throbbing", 8.77]], [["music", 32.65], ["hum", 16.51], ["breaking", 7.69]], null, null, null, null, [["music", 39.99], ["theremin", 34.58], ["musical instrument", 5.54]], null, [["music", 30.6], ["didgeridoo", 19.83], ["theremin", 17.95]], [["music", 39.37], ["theremin", 20.95], ["musical instrument", 7.53]], [["music", 30.66], ["theremin", 18.33], ["noise", 10.59]]], "duration": [0.97, 10.97, 11.01, 11.35, 1.44, 12.89, 13.17, 8.53, 11.05, 0.52, 0.71, 4.22, 3.74, 1.17, 5.2, 6.55, 3.64]} \ No newline at end of file diff --git a/annotations_1/eCvY-ualWwY_filtered.json b/annotations_1/eCvY-ualWwY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f85a3b82dbd0f70d33c13d3189fbc26cb4ab038 --- /dev/null +++ b/annotations_1/eCvY-ualWwY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 47.9], [50.0, 78.04], [82.0, 88.59], [98.0, 181.3]], "keep_status": [true, false, true, false], "silence_prob": [28.85, 28.38, 28.41, 0.0], "audiomae_on_audioset": [[["music", 30.89], ["buzz", 12.74], ["hum", 6.82]], [["music", 29.11], ["mains hum", 26.39], ["hum", 21.4]], [["music", 45.49], ["hum", 7.48], ["whale vocalization", 6.96]], null], "duration": [12.9, 28.04, 6.59, 83.3]} \ No newline at end of file diff --git a/annotations_1/eDPbu2vNrWk_filtered.json b/annotations_1/eDPbu2vNrWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0061c1e1d3f93ebdc1de735ff0bd97a18daa61b7 --- /dev/null +++ b/annotations_1/eDPbu2vNrWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[96.0, 108.09], [109.0, 147.19], [148.0, 152.86], [154.0, 158.41]], "keep_status": [true, false, true, true], "silence_prob": [43.3, 0.0, 47.74, 38.64], "audiomae_on_audioset": [[["hum", 25.53], ["mains hum", 15.2], ["music", 10.05]], null, [["music", 38.16], ["whale vocalization", 21.74], ["musical instrument", 3.92]], [["music", 16.52], ["speech", 16.14], ["hum", 13.92]]], "duration": [12.09, 38.19, 4.86, 4.41]} \ No newline at end of file diff --git a/annotations_1/eFF1grhBvsE_filtered.json b/annotations_1/eFF1grhBvsE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da5a29835f56db664b3d3b9d33b67b3adce9a022 --- /dev/null +++ b/annotations_1/eFF1grhBvsE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [8.0, 10.93], [11.0, 12.72], [13.0, 16.68], [18.0, 21.96], [24.0, 25.81], [30.0, 31.67], [38.0, 39.51], [53.0, 53.52], [56.0, 58.41], [60.0, 63.12], [73.0, 73.35], [76.0, 76.74], [85.0, 85.95], [87.0, 88.64], [90.0, 90.09], [96.0, 96.11], [107.0, 107.94], [117.0, 117.15], [119.0, 119.48], [131.0, 131.25], [134.0, 135.35], [136.0, 136.02], [137.0, 138.5], [142.0, 143.04], [150.0, 151.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.08, 0.0, 40.22, 100.0, 0.0, 0.0, 0.0, 0.0, 87.37, 42.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 66.64], ["domestic animals, pets", 3.77], ["dog", 3.3]], null, null, null, null, null, null, [["speech", 38.72], ["fly, housefly", 14.21], ["mosquito", 13.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.35, 2.93, 1.72, 3.68, 3.96, 1.81, 1.67, 1.51, 0.52, 2.41, 3.12, 0.35, 0.74, 0.95, 1.64, 0.09, 0.11, 0.94, 0.15, 0.48, 0.25, 1.35, 0.02, 1.5, 1.04, 1.02]} \ No newline at end of file diff --git a/annotations_1/eG2Yo0l78tM_filtered.json b/annotations_1/eG2Yo0l78tM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..171f7b70a6d13ec8a62314e46331f7ec56a5dc37 --- /dev/null +++ b/annotations_1/eG2Yo0l78tM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.81], [14.0, 14.94], [16.0, 16.75], [24.0, 24.19], [33.0, 34.08], [35.0, 36.17], [37.0, 38.69], [40.0, 40.64], [41.0, 43.34], [47.0, 48.09], [53.0, 55.38], [59.0, 60.61], [65.0, 65.67], [71.0, 76.91], [82.0, 82.11], [82.0, 83.25], [88.0, 89.28], [97.0, 97.48], [113.0, 113.91], [115.0, 116.46], [118.0, 120.21], [124.0, 124.53], [125.0, 128.07], [134.0, 134.79], [139.0, 143.4], [146.0, 148.15], [154.0, 155.76]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.97, 0.0, 57.64, 0.0, 0.0, 31.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.07, 0.0, 29.42, 0.0, 39.83, 39.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["chirp tone", 25.76], ["speech", 22.94], ["sidetone", 18.31]], null, null, null, null, [["music", 49.29], ["synthesizer", 9.16], ["drum machine", 7.46]], null, null, null, null, null, null, [["music", 74.92], ["grunt", 2.49], ["caw", 1.84]], null, [["music", 22.7], ["bleat", 13.71], ["livestock, farm animals, working animals", 9.2]], null, [["animal", 22.13], ["speech", 20.15], ["wild animals", 17.33]], [["speech", 57.31], ["dial tone", 9.27], ["sidetone", 4.63]], null], "duration": [0.81, 0.94, 0.75, 0.19, 1.08, 1.17, 1.69, 0.64, 2.34, 1.09, 2.38, 1.61, 0.67, 5.91, 0.11, 1.25, 1.28, 0.48, 0.91, 1.46, 2.21, 0.53, 3.07, 0.79, 4.4, 2.15, 1.76]} \ No newline at end of file diff --git a/annotations_1/eGLC0vhemeA_filtered.json b/annotations_1/eGLC0vhemeA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3c7e0b269bab06f145453c3aa3a31668fdc1b4e8 --- /dev/null +++ b/annotations_1/eGLC0vhemeA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 37.94], [41.0, 75.59], [77.0, 88.45], [91.0, 91.52], [92.0, 94.22], [94.0, 101.09], [103.0, 104.25], [104.0, 105.58], [107.0, 108.21], [108.0, 111.67], [112.0, 141.66], [143.0, 166.28], [167.0, 170.75]], "keep_status": [true, false, false, false, false, true, false, false, false, false, true, false, true], "silence_prob": [31.38, 0.0, 29.41, 0.0, 33.0, 34.77, 0.0, 0.0, 0.0, 53.53, 31.08, 35.22, 36.15], "audiomae_on_audioset": [[["hum", 36.53], ["music", 14.65], ["throbbing", 14.64]], null, [["hum", 41.11], ["mains hum", 20.33], ["music", 16.98]], null, [["music", 64.41], ["gong", 11.93], ["ambient music", 6.85]], [["music", 28.48], ["pulse", 8.79], ["hum", 8.42]], null, null, null, null, [["hum", 30.54], ["music", 14.58], ["breaking", 12.9]], [["music", 58.41], ["crack", 8.6], ["electronic music", 4.14]], [["music", 28.43], ["throbbing", 15.32], ["hum", 10.56]]], "duration": [9.94, 34.59, 11.45, 0.52, 2.22, 7.09, 1.25, 1.58, 1.21, 3.67, 29.66, 23.28, 3.75]} \ No newline at end of file diff --git a/annotations_1/eGXnEeW_KdA_filtered.json b/annotations_1/eGXnEeW_KdA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7523bd52a3a3436e47d6f4bdb672ecd7bdecc0c2 --- /dev/null +++ b/annotations_1/eGXnEeW_KdA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.36], [10.0, 12.33], [21.0, 38.69], [47.0, 73.31], [80.0, 83.66], [85.0, 102.37]], "keep_status": [false, false, true, true, false, false], "silence_prob": [0.0, 29.9, 30.5, 30.34, 29.92, 29.9], "audiomae_on_audioset": [null, [["cattle, bovinae", 40.9], ["livestock, farm animals, working animals", 25.47], ["moo", 25.28]], [["whale vocalization", 42.74], ["animal", 7.48], ["sidetone", 6.01]], [["music", 21.05], ["speech", 5.3], ["throbbing", 4.38]], [["cattle, bovinae", 44.53], ["livestock, farm animals, working animals", 31.29], ["moo", 20.86]], [["livestock, farm animals, working animals", 45.07], ["animal", 21.11], ["cattle, bovinae", 16.54]]], "duration": [1.36, 2.33, 17.69, 26.31, 3.66, 17.37]} \ No newline at end of file diff --git a/annotations_1/eGtDmvtBZQY_filtered.json b/annotations_1/eGtDmvtBZQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b9b33d67d8fa84b190452ac964d50474ec27f05 --- /dev/null +++ b/annotations_1/eGtDmvtBZQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 22.03], [26.0, 32.05], [38.0, 50.09], [51.0, 54.35], [56.0, 56.22], [66.0, 67.9], [77.0, 78.19], [79.0, 79.44], [90.0, 90.31], [90.0, 94.12], [96.0, 98.61], [99.0, 102.81], [113.0, 114.71], [127.0, 129.05], [131.0, 132.65], [133.0, 133.46], [142.0, 143.14], [144.0, 145.1]], "keep_status": [false, true, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [36.38, 38.49, 44.29, 39.58, 0.0, 0.0, 0.0, 0.0, 0.0, 41.74, 42.22, 47.94, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whack, thwack", 49.29], ["speech", 15.07], ["boing", 9.39]], [["music", 18.53], ["thunk", 11.17], ["sound effect", 8.84]], [["music", 43.54], ["speech", 23.19], ["thunk", 5.3]], [["groan", 36.3], ["whack, thwack", 9.85], ["sound effect", 7.58]], null, null, null, null, null, [["music", 44.35], ["scratching (performance technique)", 16.27], ["speech", 10.86]], [["beatboxing", 34.35], ["grunt", 16.34], ["music", 7.74]], [["music", 27.32], ["whack, thwack", 18.49], ["thunk", 10.89]], null, null, null, null, null, null], "duration": [3.03, 6.05, 12.09, 3.35, 0.22, 1.9, 1.19, 0.44, 0.31, 4.12, 2.61, 3.81, 1.71, 2.05, 1.65, 0.46, 1.14, 1.1]} \ No newline at end of file diff --git a/annotations_1/eI1dAmDZrZE_filtered.json b/annotations_1/eI1dAmDZrZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3332fcfa134e2d143b1cf275bfd94964c75b0ac --- /dev/null +++ b/annotations_1/eI1dAmDZrZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.53], [49.0, 49.98], [53.0, 53.11], [56.0, 58.08], [59.0, 61.08], [80.0, 79.81], [80.0, 91.23], [92.0, 92.6], [93.0, 94.31], [95.0, 96.11], [96.0, 103.6], [105.0, 115.16], [122.0, 122.71]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 87.37, 73.67, 0.0, 42.88, 0.0, 0.0, 0.0, 34.75, 34.23, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 20.06], ["music", 17.86], ["hum", 14.49]], null, null, null, [["grunt", 46.36], ["groan", 7.39], ["livestock, farm animals, working animals", 7.03]], [["grunt", 28.0], ["music", 18.9], ["speech", 14.37]], null], "duration": [0.53, 0.98, 0.11, 2.08, 2.08, -0.19, 11.23, 0.6, 1.31, 1.11, 7.6, 10.16, 0.71]} \ No newline at end of file diff --git a/annotations_1/eIlzY-UcYZU_filtered.json b/annotations_1/eIlzY-UcYZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..566b3a4f33e7eb36801a5e5261eb882eb1edb49c --- /dev/null +++ b/annotations_1/eIlzY-UcYZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.77], [6.0, 9.51], [12.0, 13.09], [15.0, 15.85], [17.0, 21.22], [24.0, 24.11], [26.0, 26.52], [29.0, 29.17], [31.0, 31.26], [33.0, 33.51], [40.0, 40.04], [43.0, 43.46], [45.0, 46.87], [49.0, 49.13], [51.0, 53.42], [54.0, 55.27], [62.0, 62.24], [65.0, 66.34], [67.0, 68.2], [70.0, 70.61], [71.0, 79.61], [81.0, 82.46], [83.0, 83.74], [93.0, 93.93], [95.0, 95.49], [98.0, 98.73], [99.0, 99.91], [102.0, 104.3], [105.0, 107.42], [108.0, 109.0], [111.0, 112.24], [113.0, 113.86], [115.0, 115.65], [122.0, 122.28], [123.0, 125.83], [127.0, 127.06], [128.0, 130.47], [132.0, 132.34], [133.0, 135.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.89, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 55.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.23, 99.87, 0.0, 0.0, 0.0, 0.0, 0.0, 60.79, 0.0, 40.28, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 10.92], ["speech", 5.29], ["walk, footsteps", 4.5]], null, null, null, null, null, null, null, null, [["speech", 73.1], ["sidetone", 3.68], ["radio", 2.34]], null, null], "duration": [-0.23, 3.51, 1.09, 0.85, 4.22, 0.11, 0.52, 0.17, 0.26, 0.51, 0.04, 0.46, 1.87, 0.13, 2.42, 1.27, 0.24, 1.34, 1.2, 0.61, 8.61, 1.46, 0.74, 0.93, 0.49, 0.73, 0.91, 2.3, 2.42, 1.0, 1.24, 0.86, 0.65, 0.28, 2.83, 0.06, 2.47, 0.34, 2.46]} \ No newline at end of file diff --git a/annotations_1/eJ93IIgvVyI_filtered.json b/annotations_1/eJ93IIgvVyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74d1a686b226a6faa14eced0387faa50dae87262 --- /dev/null +++ b/annotations_1/eJ93IIgvVyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.77], [14.0, 15.82], [20.0, 20.83], [22.0, 21.84], [26.0, 27.01], [28.0, 28.73], [29.0, 33.84], [34.0, 37.1], [39.0, 46.6], [50.0, 51.09], [54.0, 56.39], [57.0, 58.55], [61.0, 61.94], [68.0, 70.34], [73.0, 74.09], [78.0, 78.07], [79.0, 79.84], [80.0, 94.12], [95.0, 95.77], [98.0, 100.85], [106.0, 114.99], [116.0, 117.61], [119.0, 119.72], [121.0, 123.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [80.82, 0.0, 0.0, 0.0, 0.0, 0.0, 52.68, 74.92, 48.19, 0.0, 78.55, 0.0, 0.0, 80.64, 0.0, 0.0, 0.0, 62.99, 0.0, 42.67, 35.87, 0.0, 0.0, 40.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["didgeridoo", 46.52], ["music", 23.37], ["speech", 10.71]], null, null, null, null, null, null, null, null, null, null, [["music", 41.82], ["speech", 7.39], ["mantra", 5.16]], [["clang", 23.01], ["ding", 18.63], ["speech", 18.15]], null, null, [["throbbing", 22.82], ["hum", 17.2], ["sidetone", 13.07]]], "duration": [8.77, 1.82, 0.83, -0.16, 1.01, 0.73, 4.84, 3.1, 7.6, 1.09, 2.39, 1.55, 0.94, 2.34, 1.09, 0.07, 0.84, 14.12, 0.77, 2.85, 8.99, 1.61, 0.72, 2.33]} \ No newline at end of file diff --git a/annotations_1/eJPXQfvokV8_filtered.json b/annotations_1/eJPXQfvokV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a78dd354bccbf13110b5d3c64f74c36a0b36014f --- /dev/null +++ b/annotations_1/eJPXQfvokV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.71], [26.0, 27.89], [29.0, 31.92], [32.0, 37.96], [42.0, 43.73], [45.0, 46.48], [47.0, 51.93], [52.0, 64.93], [66.0, 81.46], [83.0, 88.11]], "keep_status": [false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 65.91, 42.67, 0.0, 0.0, 60.05, 30.62, 29.89, 33.24], "audiomae_on_audioset": [null, null, null, [["mains hum", 62.58], ["hum", 23.7], ["speech", 4.07]], null, null, null, [["speech", 21.44], ["music", 13.18], ["sidetone", 7.08]], [["music", 35.6], ["speech", 8.07], ["whip", 3.77]], [["hum", 36.64], ["mains hum", 36.3], ["speech", 8.12]]], "duration": [1.71, 1.89, 2.92, 5.96, 1.73, 1.48, 4.93, 12.93, 15.46, 5.11]} \ No newline at end of file diff --git a/annotations_1/eK20uOpc_AM_filtered.json b/annotations_1/eK20uOpc_AM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81168fdc8ba14967e84ee4720bc7a99070475f56 --- /dev/null +++ b/annotations_1/eK20uOpc_AM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.78], [18.0, 18.89], [20.0, 38.48], [40.0, 42.18], [43.0, 44.46], [45.0, 45.39], [48.0, 48.22], [50.0, 55.9], [57.0, 57.57], [59.0, 59.12], [64.0, 64.54], [84.0, 84.32], [88.0, 87.93], [89.0, 91.3], [93.0, 94.12], [95.0, 95.61], [98.0, 98.52], [101.0, 102.41], [103.0, 105.66], [110.0, 112.19], [115.0, 115.75], [119.0, 119.21], [121.0, 123.18], [124.0, 126.72], [132.0, 132.75], [133.0, 134.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.27, 0.0, 35.62, 45.49, 0.0, 0.0, 0.0, 44.18, 0.0, 0.0, 0.0, 0.0, 0.0, 50.66, 0.0, 0.0, 0.0, 0.0, 90.43, 32.87, 0.0, 0.0, 35.12, 40.4, 0.0, 0.0], "audiomae_on_audioset": [[["music", 31.46], ["whack, thwack", 28.79], ["thunk", 11.25]], null, [["music", 46.28], ["speech", 20.4], ["whack, thwack", 16.95]], [["music", 59.58], ["throbbing", 8.45], ["hum", 5.17]], null, null, null, [["music", 59.98], ["speech", 13.75], ["theremin", 3.6]], null, null, null, null, null, null, null, null, null, null, null, [["music", 61.69], ["thunk", 4.35], ["bang", 4.16]], null, null, [["music", 36.4], ["burping, eructation", 27.93], ["grunt", 16.09]], [["music", 72.98], ["grunt", 9.28], ["didgeridoo", 3.45]], null, null], "duration": [3.78, 0.89, 18.48, 2.18, 1.46, 0.39, 0.22, 5.9, 0.57, 0.12, 0.54, 0.32, -0.07, 2.3, 1.12, 0.61, 0.52, 1.41, 2.66, 2.19, 0.75, 0.21, 2.18, 2.72, 0.75, 1.79]} \ No newline at end of file diff --git a/annotations_1/eKCkxzJFP5M_filtered.json b/annotations_1/eKCkxzJFP5M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62f6ab4193a6246db2ecd86e2758e1f974f99902 --- /dev/null +++ b/annotations_1/eKCkxzJFP5M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.26], [17.0, 18.1], [19.0, 20.7], [24.0, 26.23], [28.0, 29.57], [32.0, 32.8], [35.0, 35.99], [37.0, 39.26], [41.0, 42.11], [44.0, 44.24], [49.0, 50.67], [54.0, 56.08], [59.0, 76.22], [79.0, 80.57], [84.0, 85.23], [86.0, 86.71], [90.0, 90.58], [92.0, 93.61], [95.0, 95.27], [96.0, 97.6], [99.0, 100.23], [104.0, 104.48], [106.0, 107.5], [120.0, 121.56], [122.0, 123.53], [126.0, 127.38], [129.0, 129.44], [131.0, 131.45], [133.0, 133.69], [135.0, 135.95], [145.0, 147.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 54.76, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 94.07, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 62.23], ["electronic music", 11.27], ["pulse", 4.45]]], "duration": [1.26, 1.1, 1.7, 2.23, 1.57, 0.8, 0.99, 2.26, 1.11, 0.24, 1.67, 2.08, 17.22, 1.57, 1.23, 0.71, 0.58, 1.61, 0.27, 1.6, 1.23, 0.48, 1.5, 1.56, 1.53, 1.38, 0.44, 0.45, 0.69, 0.95, 2.75]} \ No newline at end of file diff --git a/annotations_1/eKxv7whkFMM_filtered.json b/annotations_1/eKxv7whkFMM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb7dfcda99a6bb2bb7f8b26c257987cb13b7cba0 --- /dev/null +++ b/annotations_1/eKxv7whkFMM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 25.62], [27.0, 27.21], [30.0, 30.37], [30.0, 30.42], [47.0, 48.63], [51.0, 51.88], [55.0, 56.35], [63.0, 64.18], [65.0, 79.62], [81.0, 82.07]], "keep_status": [true, false, false, false, false, false, false, false, true, false], "silence_prob": [31.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.75, 0.0], "audiomae_on_audioset": [[["speech", 17.58], ["moo", 16.89], ["cattle, bovinae", 13.61]], null, null, null, null, null, null, null, [["speech", 50.68], ["whale vocalization", 6.55], ["animal", 5.46]], null], "duration": [4.62, 0.21, 0.37, 0.42, 1.63, 0.88, 1.35, 1.18, 14.62, 1.07]} \ No newline at end of file diff --git a/annotations_1/eL62rDiuqDE_filtered.json b/annotations_1/eL62rDiuqDE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51d069d3abd02b3c7ef776efd7ebedc70cc414fc --- /dev/null +++ b/annotations_1/eL62rDiuqDE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[80.0, 94.76], [95.0, 95.08], [97.0, 100.23], [103.0, 119.5], [120.0, 121.12], [126.0, 127.53], [130.0, 130.64], [133.0, 133.74], [135.0, 136.32], [139.0, 140.66], [141.0, 145.89]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [46.36, 0.0, 81.89, 40.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.43], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 41.91], ["cattle, bovinae", 22.05], ["moo", 17.95]], null, null, [["livestock, farm animals, working animals", 27.36], ["moo", 18.07], ["cattle, bovinae", 15.9]], null, null, null, null, null, null, null], "duration": [14.76, 0.08, 3.23, 16.5, 1.12, 1.53, 0.64, 0.74, 1.32, 1.66, 4.89]} \ No newline at end of file diff --git a/annotations_1/eMHv9pPuDiI_filtered.json b/annotations_1/eMHv9pPuDiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c3c600c8f916379cb8d008c21b561ad5f4d6ef0 --- /dev/null +++ b/annotations_1/eMHv9pPuDiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.26], [12.0, 15.6], [17.0, 18.44], [19.0, 23.4], [24.0, 25.62], [31.0, 34.01], [36.0, 37.49], [40.0, 49.25], [51.0, 67.53], [69.0, 73.79], [77.0, 77.28], [82.0, 83.47], [85.0, 86.83], [88.0, 95.98], [101.0, 105.95], [107.0, 113.54]], "keep_status": [true, false, false, false, false, true, false, true, false, true, false, false, false, false, false, true], "silence_prob": [29.44, 31.23, 0.0, 30.76, 0.0, 32.33, 0.0, 29.21, 29.86, 29.59, 0.0, 0.0, 0.0, 29.68, 29.73, 29.81], "audiomae_on_audioset": [[["music", 56.71], ["cacophony", 3.45], ["electronic music", 2.12]], [["fly, housefly", 57.16], ["insect", 18.37], ["bee, wasp, etc.", 10.87]], null, [["throbbing", 41.6], ["hum", 17.09], ["music", 12.92]], null, [["music", 45.68], ["buzz", 10.62], ["scary music", 4.65]], null, [["music", 29.95], ["explosion", 18.01], ["hum", 9.87]], [["hum", 40.16], ["music", 22.54], ["throbbing", 18.92]], [["music", 41.28], ["speech", 22.49], ["throbbing", 5.1]], null, null, null, [["hum", 39.2], ["throbbing", 20.23], ["mains hum", 18.13]], [["speech", 30.9], ["hum", 24.07], ["mains hum", 21.47]], [["speech", 43.04], ["music", 11.9], ["eruption", 3.8]]], "duration": [5.26, 3.6, 1.44, 4.4, 1.62, 3.01, 1.49, 9.25, 16.53, 4.79, 0.28, 1.47, 1.83, 7.98, 4.95, 6.54]} \ No newline at end of file diff --git a/annotations_1/eMgfTq1Z2n8_filtered.json b/annotations_1/eMgfTq1Z2n8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e945aeb5d3713de4716d832bac89e6a73573d9fd --- /dev/null +++ b/annotations_1/eMgfTq1Z2n8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.62], [8.0, 8.6], [11.0, 17.46], [18.0, 30.97], [34.0, 34.33], [42.0, 49.44], [54.0, 55.0], [66.0, 72.39], [75.0, 81.51], [84.0, 83.96], [84.0, 85.94], [87.0, 89.56], [91.0, 91.2], [92.0, 92.53], [95.0, 95.98], [97.0, 98.22], [99.0, 98.96], [103.0, 110.81], [112.0, 122.49], [123.0, 131.25], [133.0, 138.96], [141.0, 141.59], [144.0, 146.04], [149.0, 151.63]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 75.07, 37.67, 0.0, 49.68, 0.0, 41.87, 51.18, 0.0, 0.0, 46.09, 0.0, 0.0, 0.0, 0.0, 0.0, 33.91, 54.23, 97.22, 97.92, 0.0, 53.4, 94.52], "audiomae_on_audioset": [null, null, null, [["hum", 27.76], ["speech", 19.05], ["mains hum", 17.94]], null, [["hum", 32.76], ["mains hum", 21.87], ["buzz", 11.86]], null, [["speech", 40.83], ["music", 33.21], ["animal", 4.3]], null, null, null, [["music", 45.83], ["hum", 11.49], ["electronic music", 6.85]], null, null, null, null, null, [["music", 40.99], ["didgeridoo", 17.3], ["hum", 7.88]], null, null, null, null, null, null], "duration": [1.62, 0.6, 6.46, 12.97, 0.33, 7.44, 1.0, 6.39, 6.51, -0.04, 1.94, 2.56, 0.2, 0.53, 0.98, 1.22, -0.04, 7.81, 10.49, 8.25, 5.96, 0.59, 2.04, 2.63]} \ No newline at end of file diff --git a/annotations_1/eMyuRmZNaTk_filtered.json b/annotations_1/eMyuRmZNaTk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c308f687939d8f7ddd5a8ea7996a511056f1dc26 --- /dev/null +++ b/annotations_1/eMyuRmZNaTk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[149.0, 150.58], [154.0, 219.77]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.58, 65.77]} \ No newline at end of file diff --git a/annotations_1/eNCK08cInIE_filtered.json b/annotations_1/eNCK08cInIE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb5cb08847cf8559b9ccfeb4c85d778e3cba7cd4 --- /dev/null +++ b/annotations_1/eNCK08cInIE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.73], [19.0, 29.05], [30.0, 30.5], [31.0, 32.85], [37.0, 37.42], [41.0, 42.5], [47.0, 48.51], [50.0, 50.97], [54.0, 57.5], [62.0, 64.03], [68.0, 69.4], [73.0, 72.84], [73.0, 75.59], [77.0, 77.36], [79.0, 80.84], [85.0, 84.69], [86.0, 88.37], [89.0, 91.03], [92.0, 92.6], [98.0, 101.61], [102.0, 102.3], [103.0, 109.81], [110.0, 110.39], [115.0, 116.01], [117.0, 117.49], [121.0, 122.01]], "keep_status": [false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 33.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.59, 34.65, 0.0, 0.0, 32.23, 0.0, 0.0, 0.0, 31.86, 34.04, 0.0, 29.7, 0.0, 28.76, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 25.76], ["mosquito", 19.3], ["ding", 6.99]], null, null, null, null, null, null, [["music", 15.56], ["speech", 15.37], ["vehicle", 9.32]], [["hum", 31.73], ["throbbing", 19.64], ["mains hum", 17.67]], null, null, [["speech", 64.56], ["music", 4.3], ["sidetone", 2.8]], null, null, null, [["speech", 28.65], ["sidetone", 20.52], ["music", 13.26]], [["throbbing", 40.5], ["music", 23.11], ["hum", 21.02]], null, [["music", 37.38], ["didgeridoo", 29.39], ["beatboxing", 10.85]], null, [["cattle, bovinae", 33.74], ["livestock, farm animals, working animals", 17.59], ["moo", 15.71]], null, null, null, null], "duration": [0.73, 10.05, 0.5, 1.85, 0.42, 1.5, 1.51, 0.97, 3.5, 2.03, 1.4, -0.16, 2.59, 0.36, 1.84, -0.31, 2.37, 2.03, 0.6, 3.61, 0.3, 6.81, 0.39, 1.01, 0.49, 1.01]} \ No newline at end of file diff --git a/annotations_1/eOYwXi0B6KQ_filtered.json b/annotations_1/eOYwXi0B6KQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53b6aa3747b3ba2c169fbcc8178e22e9f9840584 --- /dev/null +++ b/annotations_1/eOYwXi0B6KQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.85], [14.0, 14.37], [15.0, 24.93], [27.0, 27.06], [35.0, 36.46], [39.0, 39.9], [42.0, 42.65], [47.0, 48.47], [54.0, 54.35], [56.0, 64.32], [67.0, 72.01], [74.0, 76.23], [81.0, 81.48], [82.0, 87.54], [89.0, 89.09], [91.0, 108.82], [113.0, 130.11], [132.0, 137.81], [140.0, 140.1]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [34.65, 0.0, 34.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.55, 34.89, 38.84, 0.0, 78.04, 0.0, 47.46, 35.91, 41.89, 0.0], "audiomae_on_audioset": [[["music", 45.57], ["speech", 14.78], ["music of latin america", 4.79]], null, [["music", 49.47], ["didgeridoo", 5.9], ["throbbing", 4.44]], null, null, null, null, null, null, [["music", 68.26], ["speech", 5.3], ["boing", 5.26]], [["music", 55.63], ["fly, housefly", 9.64], ["insect", 7.67]], [["speech", 52.53], ["thunk", 9.75], ["whack, thwack", 5.85]], null, null, null, [["music", 68.36], ["boing", 7.18], ["synthesizer", 4.1]], [["music", 51.36], ["didgeridoo", 11.29], ["speech", 9.24]], [["speech", 62.57], ["whack, thwack", 27.35], ["groan", 1.82]], null], "duration": [4.85, 0.37, 9.93, 0.06, 1.46, 0.9, 0.65, 1.47, 0.35, 8.32, 5.01, 2.23, 0.48, 5.54, 0.09, 17.82, 17.11, 5.81, 0.1]} \ No newline at end of file diff --git a/annotations_1/ePgiRqRIdwg_filtered.json b/annotations_1/ePgiRqRIdwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..185ca67762f000f58275f0ccb8685bff8e3d2272 --- /dev/null +++ b/annotations_1/ePgiRqRIdwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.15], [7.0, 8.7], [11.0, 12.72], [16.0, 16.8], [23.0, 24.6], [33.0, 33.05], [34.0, 35.02], [39.0, 40.26], [42.0, 42.38], [44.0, 44.37], [50.0, 62.8], [80.0, 81.01], [85.0, 85.62], [86.0, 90.26], [91.0, 91.99], [100.0, 101.29], [102.0, 106.57], [107.0, 107.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 31.93, 0.0, 0.0, 49.82, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["a capella", 20.82], ["music", 17.86], ["mantra", 11.94]], null, null, [["speech", 13.96], ["fart", 12.41], ["livestock, farm animals, working animals", 10.53]], null], "duration": [0.15, 1.7, 1.72, 0.8, 1.6, 0.05, 1.02, 1.26, 0.38, 0.37, 12.8, 1.01, 0.62, 4.26, 0.99, 1.29, 4.57, 0.96]} \ No newline at end of file diff --git a/annotations_1/ePlb7b2nQm4_filtered.json b/annotations_1/ePlb7b2nQm4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00b8df92952021a973833d17e4237cbaeacb55bb --- /dev/null +++ b/annotations_1/ePlb7b2nQm4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.18], [15.0, 20.7], [26.0, 27.46], [32.0, 33.18], [34.0, 34.75], [39.0, 39.29], [40.0, 41.22], [41.0, 42.67], [43.0, 46.5], [47.0, 51.36], [52.0, 53.72], [56.0, 58.67], [66.0, 66.43], [71.0, 71.32], [72.0, 73.2], [75.0, 76.11], [78.0, 83.2], [84.0, 91.88], [93.0, 97.97], [99.0, 119.96], [121.0, 123.58], [130.0, 131.43], [134.0, 135.36]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [45.95, 64.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 60.7, 0.0, 34.1, 0.0, 0.0, 0.0, 0.0, 47.23, 29.07, 31.15, 29.67, 92.31, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 12.63], ["vehicle", 5.73], ["hum", 5.36]], null, null, null, null, null, null, null, null, null, null, [["speech", 41.26], ["whale vocalization", 11.72], ["music", 6.73]], null, null, null, null, [["fly, housefly", 42.99], ["insect", 28.68], ["bee, wasp, etc.", 17.34]], [["livestock, farm animals, working animals", 30.87], ["cattle, bovinae", 21.41], ["speech", 10.29]], [["speech", 71.72], ["crowd", 7.26], ["outside, urban or manmade", 5.23]], [["music", 27.69], ["hum", 25.08], ["whale vocalization", 13.15]], null, null, null], "duration": [10.18, 5.7, 1.46, 1.18, 0.75, 0.29, 1.22, 1.67, 3.5, 4.36, 1.72, 2.67, 0.43, 0.32, 1.2, 1.11, 5.2, 7.88, 4.97, 20.96, 2.58, 1.43, 1.36]} \ No newline at end of file diff --git a/annotations_1/ePtwxRF1WZA_filtered.json b/annotations_1/ePtwxRF1WZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5036db55d30df075a7f2676f0928e2dc2982c71c --- /dev/null +++ b/annotations_1/ePtwxRF1WZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 16.88], [22.0, 27.55], [30.0, 35.31], [46.0, 52.15], [53.0, 53.81], [56.0, 64.3], [74.0, 77.18], [81.0, 81.82], [83.0, 85.65], [87.0, 97.7], [103.0, 111.92], [115.0, 122.49], [126.0, 136.07], [140.0, 143.23]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [31.18, 30.62, 30.81, 30.35, 0.0, 30.84, 31.32, 0.0, 33.95, 30.58, 30.57, 31.66, 30.51, 32.19], "audiomae_on_audioset": [[["speech", 40.99], ["music", 38.09], ["hum", 2.07]], [["music", 52.82], ["speech", 10.63], ["didgeridoo", 6.47]], [["music", 52.84], ["throbbing", 12.33], ["hum", 12.21]], [["music", 67.96], ["speech", 9.6], ["didgeridoo", 2.38]], null, [["throbbing", 58.34], ["music", 17.84], ["hum", 12.38]], [["throbbing", 30.79], ["music", 29.24], ["hum", 17.99]], null, [["music", 58.65], ["boing", 11.9], ["speech", 4.59]], [["music", 40.84], ["hum", 18.1], ["throbbing", 12.89]], [["music", 63.09], ["speech", 12.15], ["throbbing", 5.39]], [["music", 60.71], ["theremin", 9.5], ["hum", 3.05]], [["music", 33.81], ["throbbing", 21.27], ["speech", 9.01]], [["music", 50.64], ["boing", 11.61], ["throbbing", 7.04]]], "duration": [7.88, 5.55, 5.31, 6.15, 0.81, 8.3, 3.18, 0.82, 2.65, 10.7, 8.92, 7.49, 10.07, 3.23]} \ No newline at end of file diff --git a/annotations_1/eQSqgubHzn0_filtered.json b/annotations_1/eQSqgubHzn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66b722f4e4af1395e709e71fb2852958a3413a7c --- /dev/null +++ b/annotations_1/eQSqgubHzn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[79.0, 112.51], [114.0, 114.94]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [33.51, 0.94]} \ No newline at end of file diff --git a/annotations_1/eRITzdlHJXA_filtered.json b/annotations_1/eRITzdlHJXA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..009ed5fea152d0aed481e2435c690c95131719a4 --- /dev/null +++ b/annotations_1/eRITzdlHJXA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.15], [15.0, 15.89], [16.0, 19.5], [26.0, 26.59], [31.0, 31.9], [33.0, 33.57], [35.0, 36.76], [37.0, 39.48], [48.0, 48.47], [50.0, 51.65], [56.0, 56.51], [58.0, 60.13], [66.0, 66.48], [71.0, 71.69], [80.0, 81.18]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 39.52, 0.0, 0.0, 0.0, 0.0, 39.69, 0.0, 0.0, 0.0, 37.84, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 29.64], ["music", 28.48], ["rumble", 6.87]], null, null, null, null, [["speech", 42.1], ["music", 12.7], ["mains hum", 6.24]], null, null, null, [["music", 44.86], ["scary music", 8.8], ["speech", 5.43]], null, null, null], "duration": [0.15, 0.89, 3.5, 0.59, 0.9, 0.57, 1.76, 2.48, 0.47, 1.65, 0.51, 2.13, 0.48, 0.69, 1.18]} \ No newline at end of file diff --git a/annotations_1/eRNCIg86DKs_filtered.json b/annotations_1/eRNCIg86DKs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52f06c6cfb1b9dfd7dc253513be7ec8ec23ba8d9 --- /dev/null +++ b/annotations_1/eRNCIg86DKs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.0], [6.0, 6.99], [8.0, 8.13], [15.0, 14.89], [17.0, 17.98], [19.0, 20.41], [21.0, 22.27], [23.0, 24.48], [26.0, 27.85], [43.0, 43.55], [44.0, 44.74], [57.0, 57.72], [60.0, 60.13], [61.0, 61.72], [62.0, 63.56], [65.0, 65.6], [67.0, 67.05], [69.0, 69.38], [72.0, 72.45], [75.0, 76.11], [78.0, 79.56], [80.0, 81.77], [83.0, 83.96], [87.0, 87.64], [90.0, 90.19], [94.0, 94.46], [95.0, 96.16], [99.0, 100.79], [102.0, 102.42], [107.0, 107.6], [110.0, 110.2], [118.0, 118.72], [126.0, 126.27], [127.0, 127.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 0.99, 0.13, -0.11, 0.98, 1.41, 1.27, 1.48, 1.85, 0.55, 0.74, 0.72, 0.13, 0.72, 1.56, 0.6, 0.05, 0.38, 0.45, 1.11, 1.56, 1.77, 0.96, 0.64, 0.19, 0.46, 1.16, 1.79, 0.42, 0.6, 0.2, 0.72, 0.27, 0.94]} \ No newline at end of file diff --git a/annotations_1/eTepvIyKhIo_filtered.json b/annotations_1/eTepvIyKhIo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..549e313637fe74765937a54ec6216a1c79dc5ed7 --- /dev/null +++ b/annotations_1/eTepvIyKhIo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.26], [6.0, 8.24], [10.0, 20.04], [24.0, 34.77], [36.0, 83.17], [86.0, 88.72], [89.0, 162.87]], "keep_status": [false, false, true, true, false, true, false], "silence_prob": [0.0, 94.22, 42.39, 34.33, 0.0, 35.84, 0.0], "audiomae_on_audioset": [null, null, [["music", 37.07], ["speech", 24.93], ["hum", 5.04]], [["music", 21.04], ["rumble", 14.08], ["sonar", 6.84]], null, [["speech", 30.36], ["sidetone", 25.65], ["music", 13.69]], null], "duration": [1.26, 2.24, 10.04, 10.77, 47.17, 2.72, 73.87]} \ No newline at end of file diff --git a/annotations_1/eU4-wIieuWU_filtered.json b/annotations_1/eU4-wIieuWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ade88518da8669469005def5dded8e58cfcc1b3a --- /dev/null +++ b/annotations_1/eU4-wIieuWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.88], [13.0, 13.91], [18.0, 18.86], [20.0, 20.38], [23.0, 23.84], [27.0, 27.01], [33.0, 34.21], [35.0, 35.9], [37.0, 37.22], [40.0, 41.0], [47.0, 47.41], [52.0, 53.67], [56.0, 56.39], [60.0, 60.24], [64.0, 67.8], [72.0, 73.38], [75.0, 76.62], [80.0, 80.7], [85.0, 85.5], [87.0, 87.18], [92.0, 93.36], [100.0, 103.01], [103.0, 104.38], [109.0, 110.22], [114.0, 117.85], [120.0, 120.34], [123.0, 123.26], [125.0, 125.81], [128.0, 128.16], [130.0, 130.79], [133.0, 134.4], [140.0, 140.53], [143.0, 144.05], [148.0, 149.12], [154.0, 155.68], [157.0, 157.96], [159.0, 163.38], [165.0, 165.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.57, 0.0, 0.0, 76.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.59, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.91, 0.86, 0.38, 0.84, 0.01, 1.21, 0.9, 0.22, 1.0, 0.41, 1.67, 0.39, 0.24, 3.8, 1.38, 1.62, 0.7, 0.5, 0.18, 1.36, 3.01, 1.38, 1.22, 3.85, 0.34, 0.26, 0.81, 0.16, 0.79, 1.4, 0.53, 1.05, 1.12, 1.68, 0.96, 4.38, 0.67]} \ No newline at end of file diff --git a/annotations_1/eUogxXRPC7E_filtered.json b/annotations_1/eUogxXRPC7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdee989d55bcaffb73827bfbafebbd41408711bc --- /dev/null +++ b/annotations_1/eUogxXRPC7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.12], [11.0, 10.54], [11.0, 20.19], [27.0, 27.68], [29.0, 30.15], [42.0, 42.92], [45.0, 45.89], [46.0, 46.57], [48.0, 48.03], [52.0, 84.82], [85.0, 86.04], [87.0, 89.06], [90.0, 103.76], [107.0, 111.75]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 99.62, 99.73], "audiomae_on_audioset": [null, null, [["music", 56.68], ["didgeridoo", 8.57], ["cattle, bovinae", 4.55]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.12, -0.46, 9.19, 0.68, 1.15, 0.92, 0.89, 0.57, 0.03, 32.82, 1.04, 2.06, 13.76, 4.75]} \ No newline at end of file diff --git a/annotations_1/eVJhlVgr9lM_filtered.json b/annotations_1/eVJhlVgr9lM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8eb1b913449a270be5a22f1a3d2daeee9d9e7987 --- /dev/null +++ b/annotations_1/eVJhlVgr9lM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 8.92], [10.0, 89.55]], "keep_status": [false, false], "silence_prob": [99.92, 0.0], "audiomae_on_audioset": [null, null], "duration": [7.92, 79.55]} \ No newline at end of file diff --git a/annotations_1/eVmYZJQxawo_filtered.json b/annotations_1/eVmYZJQxawo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa0d37ad54fb13933612d683eca5a7c536438067 --- /dev/null +++ b/annotations_1/eVmYZJQxawo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 28.85], [36.0, 36.53], [37.0, 37.61], [47.0, 48.24], [50.0, 49.77], [51.0, 64.83], [66.0, 88.37], [96.0, 97.04], [98.0, 105.21], [112.0, 118.3], [123.0, 134.76], [136.0, 137.83], [145.0, 146.72], [153.0, 181.8], [187.0, 186.8]], "keep_status": [true, false, false, false, false, true, false, false, true, true, true, false, false, false, false], "silence_prob": [30.72, 0.0, 0.0, 0.0, 0.0, 29.89, 30.21, 0.0, 30.0, 33.3, 32.44, 0.0, 0.0, 29.52, 0.0], "audiomae_on_audioset": [[["music", 43.36], ["speech", 15.65], ["didgeridoo", 8.12]], null, null, null, null, [["music", 39.17], ["breaking", 18.45], ["hum", 5.3]], [["music", 49.69], ["theremin", 27.76], ["musical instrument", 2.8]], null, [["music", 46.68], ["speech", 7.56], ["throbbing", 7.36]], [["music", 46.23], ["foghorn", 8.76], ["didgeridoo", 6.03]], [["music", 25.08], ["moo", 13.72], ["cattle, bovinae", 12.34]], null, null, [["music", 89.22], ["musical instrument", 2.26], ["brass instrument", 1.17]], null], "duration": [25.85, 0.53, 0.61, 1.24, -0.23, 13.83, 22.37, 1.04, 7.21, 6.3, 11.76, 1.83, 1.72, 28.8, -0.2]} \ No newline at end of file diff --git a/annotations_1/eVzxDwu506A_filtered.json b/annotations_1/eVzxDwu506A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a3dafb2e935dee27bc887101157ea30679c020a --- /dev/null +++ b/annotations_1/eVzxDwu506A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.18], [23.0, 23.73], [33.0, 33.98], [35.0, 34.94], [44.0, 47.31], [50.0, 57.86], [58.0, 59.91], [63.0, 62.78], [63.0, 62.83], [65.0, 91.18], [92.0, 94.17], [96.0, 101.17], [104.0, 107.97], [108.0, 110.81], [115.0, 115.65]], "keep_status": [false, false, false, false, true, false, false, false, false, true, true, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 28.92, 29.18, 0.0, 0.0, 0.0, 28.89, 44.81, 30.15, 31.07, 44.63, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 50.86], ["horse", 9.33], ["music", 9.21]], [["music", 56.31], ["speech", 14.22], ["smash, crash", 2.84]], null, null, null, [["music", 24.84], ["speech", 19.02], ["livestock, farm animals, working animals", 14.92]], [["throbbing", 16.82], ["noise", 12.4], ["hum", 5.69]], [["breaking", 24.97], ["car alarm", 17.56], ["cattle, bovinae", 11.66]], [["speech", 18.76], ["whack, thwack", 14.26], ["explosion", 7.08]], [["noise", 19.93], ["speech", 13.11], ["sidetone", 10.68]], null], "duration": [0.18, 0.73, 0.98, -0.06, 3.31, 7.86, 1.91, -0.22, -0.17, 26.18, 2.17, 5.17, 3.97, 2.81, 0.65]} \ No newline at end of file diff --git a/annotations_1/eWP8JMcy3O0_filtered.json b/annotations_1/eWP8JMcy3O0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbae7e77b1ef787ee8f9771b237a32a085449a97 --- /dev/null +++ b/annotations_1/eWP8JMcy3O0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.71], [7.0, 11.92], [21.0, 20.98], [24.0, 24.09], [28.0, 28.7], [29.0, 31.13], [32.0, 33.22], [38.0, 39.24], [45.0, 45.37], [51.0, 51.65], [53.0, 54.43], [55.0, 55.46], [59.0, 61.96], [63.0, 64.59], [67.0, 68.44], [70.0, 70.6], [77.0, 77.58], [79.0, 79.64], [87.0, 88.5], [96.0, 96.8], [100.0, 100.4], [105.0, 105.54], [109.0, 109.44], [116.0, 116.88], [117.0, 126.84], [131.0, 132.22], [134.0, 134.5], [135.0, 135.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.91, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["wail, moan", 81.33], ["gasp", 5.07], ["speech", 3.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.6], ["beatboxing", 12.33], ["music", 3.68]], null, null, null], "duration": [0.71, 4.92, -0.02, 0.09, 0.7, 2.13, 1.22, 1.24, 0.37, 0.65, 1.43, 0.46, 2.96, 1.59, 1.44, 0.6, 0.58, 0.64, 1.5, 0.8, 0.4, 0.54, 0.44, 0.88, 9.84, 1.22, 0.5, 0.04]} \ No newline at end of file diff --git a/annotations_1/eYrt5n8DA2M_filtered.json b/annotations_1/eYrt5n8DA2M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3fb5c7952009c3696674c94d8b7d6f91e61e0f65 --- /dev/null +++ b/annotations_1/eYrt5n8DA2M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.05], [8.0, 13.09], [13.0, 15.08], [16.0, 16.38], [17.0, 17.95], [21.0, 21.83], [23.0, 30.52], [31.0, 34.13], [36.0, 36.9], [37.0, 39.55], [40.0, 41.15], [42.0, 43.11], [44.0, 43.78], [45.0, 106.02], [108.0, 119.43], [120.0, 124.63], [125.0, 141.22], [142.0, 146.87], [147.0, 158.21], [159.0, 161.5], [162.0, 172.12], [173.0, 175.42]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, true, false, false, false], "silence_prob": [100.0, 43.13, 37.57, 0.0, 0.0, 0.0, 89.54, 34.19, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 30.1, 99.97, 38.46, 100.0, 29.68, 43.66, 28.06, 30.86], "audiomae_on_audioset": [null, [["sidetone", 27.96], ["sine wave", 17.31], ["dial tone", 13.82]], [["sidetone", 32.88], ["speech", 19.7], ["busy signal", 9.67]], null, null, null, null, [["speech", 41.96], ["animal", 10.32], ["domestic animals, pets", 8.12]], null, null, null, null, null, null, [["music", 12.12], ["rumble", 11.8], ["sonar", 3.79]], null, [["whale vocalization", 12.72], ["sidetone", 11.94], ["boing", 8.95]], null, [["speech", 26.51], ["burst, pop", 8.12], ["beep, bleep", 7.06]], [["sidetone", 57.63], ["hum", 11.21], ["speech", 4.96]], [["speech", 61.63], ["screaming", 8.58], ["burst, pop", 5.8]], [["moo", 35.69], ["cattle, bovinae", 30.78], ["speech", 8.69]]], "duration": [4.05, 5.09, 2.08, 0.38, 0.95, 0.83, 7.52, 3.13, 0.9, 2.55, 1.15, 1.11, -0.22, 61.02, 11.43, 4.63, 16.22, 4.87, 11.21, 2.5, 10.12, 2.42]} \ No newline at end of file diff --git a/annotations_1/eZc3GMgzwyk_filtered.json b/annotations_1/eZc3GMgzwyk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..680948c6c43ad180ebb660d0df87b8163ed643a5 --- /dev/null +++ b/annotations_1/eZc3GMgzwyk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 16.51], [31.0, 35.58], [40.0, 50.9], [51.0, 51.92], [53.0, 60.44], [65.0, 77.21], [78.0, 78.98], [85.0, 85.5], [87.0, 87.96], [89.0, 90.12], [90.0, 92.16], [93.0, 93.02]], "keep_status": [true, true, true, false, true, true, false, false, false, false, false, false], "silence_prob": [33.0, 32.88, 33.0, 0.0, 32.82, 32.73, 0.0, 0.0, 0.0, 0.0, 50.21, 0.0], "audiomae_on_audioset": [[["music", 22.26], ["synthesizer", 15.56], ["buzz", 9.36]], [["music", 18.16], ["speech", 11.42], ["fly, housefly", 5.09]], [["music", 51.93], ["cacophony", 4.37], ["speech", 3.42]], null, [["music", 26.43], ["vehicle", 18.6], ["speech", 8.04]], [["music", 29.26], ["cattle, bovinae", 9.61], ["moo", 8.75]], null, null, null, null, null, null], "duration": [10.51, 4.58, 10.9, 0.92, 7.44, 12.21, 0.98, 0.5, 0.96, 1.12, 2.16, 0.02]} \ No newline at end of file diff --git a/annotations_1/e_S58iPZYu8_filtered.json b/annotations_1/e_S58iPZYu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd7266a6ecbc78b61b11249ef27207663f579b64 --- /dev/null +++ b/annotations_1/e_S58iPZYu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.91], [19.0, 20.01], [23.0, 23.26], [28.0, 28.7], [31.0, 36.0], [48.0, 48.68], [49.0, 63.15], [67.0, 70.33], [71.0, 71.86], [73.0, 115.8], [117.0, 118.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 50.46, 0.0, 53.84, 55.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.09, 1.01, 0.26, 0.7, 5.0, 0.68, 14.15, 3.33, 0.86, 42.8, 1.96]} \ No newline at end of file diff --git a/annotations_1/ebHQ50ZRvM4_filtered.json b/annotations_1/ebHQ50ZRvM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97f100b0d2d324821d12f0ac98cdec8e8a7eb722 --- /dev/null +++ b/annotations_1/ebHQ50ZRvM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.71], [10.0, 10.54], [15.0, 17.49], [19.0, 41.27], [43.0, 44.19], [47.0, 47.44], [50.0, 50.97], [52.0, 51.75], [52.0, 51.87], [55.0, 54.95], [57.0, 95.17], [96.0, 97.56], [98.0, 101.61], [102.0, 107.47], [111.0, 112.9], [115.0, 115.7], [116.0, 118.83], [121.0, 125.69], [127.0, 128.14], [129.0, 130.42], [132.0, 149.94]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 47.43, 39.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.31, 47.62, 0.0, 0.0, 51.23, 52.62, 0.0, 0.0, 62.89], "audiomae_on_audioset": [null, null, [["music", 68.7], ["guitar", 7.66], ["musical instrument", 6.12]], [["music", 55.3], ["livestock, farm animals, working animals", 6.46], ["sheep", 6.12]], null, null, null, null, null, null, null, null, null, [["music", 50.44], ["speech", 23.44], ["synthesizer", 1.5]], null, null, null, null, null, null, null], "duration": [0.71, 0.54, 2.49, 22.27, 1.19, 0.44, 0.97, -0.25, -0.13, -0.05, 38.17, 1.56, 3.61, 5.47, 1.9, 0.7, 2.83, 4.69, 1.14, 1.42, 17.94]} \ No newline at end of file diff --git a/annotations_1/ebkY0u1-NKk_filtered.json b/annotations_1/ebkY0u1-NKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bca25d2594ab280702db763835f0bf82c2779da --- /dev/null +++ b/annotations_1/ebkY0u1-NKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.34], [15.0, 21.1], [26.0, 26.1], [27.0, 28.76], [31.0, 32.97], [34.0, 34.8], [36.0, 36.21], [38.0, 38.37], [40.0, 46.5], [48.0, 49.38], [50.0, 51.19], [52.0, 52.1], [53.0, 53.72], [55.0, 56.05], [57.0, 57.84], [59.0, 59.64], [63.0, 63.78], [68.0, 67.93], [68.0, 70.19], [71.0, 72.59], [76.0, 76.2], [78.0, 78.85], [82.0, 82.32], [85.0, 85.77], [96.0, 101.82], [102.0, 102.9], [105.0, 105.92], [107.0, 110.71], [111.0, 112.63], [114.0, 114.59], [120.0, 124.65]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 48.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.74, 0.0, 0.0, 0.0, 0.0, 0.0, 30.07, 0.0, 0.0, 39.86, 0.0, 0.0, 47.9], "audiomae_on_audioset": [null, [["hum", 40.81], ["throbbing", 15.34], ["radio", 7.47]], null, null, null, null, null, null, [["speech", 70.53], ["echo", 5.65], ["wail, moan", 5.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.45], ["fart", 11.46], ["whack, thwack", 5.39]], null, null, [["sidetone", 44.18], ["speech", 30.67], ["radio", 14.96]], null, null, [["hum", 19.34], ["fart", 11.96], ["speech", 7.94]]], "duration": [0.34, 6.1, 0.1, 1.76, 1.97, 0.8, 0.21, 0.37, 6.5, 1.38, 1.19, 0.1, 0.72, 1.05, 0.84, 0.64, 0.78, -0.07, 2.19, 1.59, 0.2, 0.85, 0.32, 0.77, 5.82, 0.9, 0.92, 3.71, 1.63, 0.59, 4.65]} \ No newline at end of file diff --git a/annotations_1/ec9h1IjltJg_filtered.json b/annotations_1/ec9h1IjltJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..666014ec76183e8ffe5e8af842593e986c5313d8 --- /dev/null +++ b/annotations_1/ec9h1IjltJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 16.34], [22.0, 30.28], [31.0, 98.93], [102.0, 102.46], [103.0, 104.67], [105.0, 107.42], [109.0, 109.66], [111.0, 116.78], [118.0, 119.47], [121.0, 123.79], [124.0, 127.14], [128.0, 129.1], [131.0, 131.41]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.22, 41.22, 0.0, 0.0, 0.0, 87.74, 0.0, 99.59, 0.0, 99.62, 55.74, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.37], ["singing bowl", 15.42], ["speech", 10.14]], [["music", 37.2], ["hum", 14.41], ["mains hum", 9.79]], null, null, null, null, null, null, null, null, null, null, null], "duration": [13.34, 8.28, 67.93, 0.46, 1.67, 2.42, 0.66, 5.78, 1.47, 2.79, 3.14, 1.1, 0.41]} \ No newline at end of file diff --git a/annotations_1/eclUi6kVFcM_filtered.json b/annotations_1/eclUi6kVFcM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abc7ea596200b2baf4cfcfa1e546a11e9fbc7b2b --- /dev/null +++ b/annotations_1/eclUi6kVFcM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.75], [10.0, 11.69], [30.0, 33.47], [36.0, 41.15], [43.0, 46.58], [56.0, 57.15], [61.0, 61.89], [64.0, 64.72], [78.0, 83.61], [84.0, 84.32], [86.0, 86.44], [89.0, 89.14], [93.0, 93.39], [94.0, 95.01], [96.0, 96.57], [98.0, 98.47], [100.0, 100.84], [107.0, 106.88], [114.0, 114.94], [115.0, 116.31], [117.0, 123.26], [130.0, 130.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.33, 37.95, 39.37, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07, 0.0], "audiomae_on_audioset": [null, null, [["music", 64.18], ["chorus effect", 9.98], ["effects unit", 4.24]], [["music", 80.75], ["singing", 1.75], ["country", 1.26]], [["music", 76.22], ["middle eastern music", 2.14], ["musical instrument", 1.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 1.69, 3.47, 5.15, 3.58, 1.15, 0.89, 0.72, 5.61, 0.32, 0.44, 0.14, 0.39, 1.01, 0.57, 0.47, 0.84, -0.12, 0.94, 1.31, 6.26, 0.5]} \ No newline at end of file diff --git a/annotations_1/ecmDPqCP8ms_filtered.json b/annotations_1/ecmDPqCP8ms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..648f49308d26ed08d815634200c336f6f7b47e9d --- /dev/null +++ b/annotations_1/ecmDPqCP8ms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [16.0, 17.07], [18.0, 18.39], [19.0, 20.88], [22.0, 23.95], [25.0, 26.74], [27.0, 29.79], [30.0, 31.77], [32.0, 33.93], [37.0, 39.5], [41.0, 42.23], [46.0, 46.58], [48.0, 49.74], [52.0, 51.83], [54.0, 54.97], [57.0, 57.59], [59.0, 59.04], [61.0, 71.59], [77.0, 78.83], [80.0, 82.04], [86.0, 87.93], [88.0, 92.85], [93.0, 95.69], [96.0, 99.82], [101.0, 103.32], [106.0, 106.84], [107.0, 108.53], [112.0, 111.75], [114.0, 115.64], [119.0, 119.57], [125.0, 124.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.96, 0.0, 99.78, 0.0, 99.31, 98.01, 99.92, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 1.07, 0.39, 1.88, 1.95, 1.74, 2.79, 1.77, 1.93, 2.5, 1.23, 0.58, 1.74, -0.17, 0.97, 0.59, 0.04, 10.59, 1.83, 2.04, 1.93, 4.85, 2.69, 3.82, 2.32, 0.84, 1.53, -0.25, 1.64, 0.57, -0.15]} \ No newline at end of file diff --git a/annotations_1/edHmOaS0lRU_filtered.json b/annotations_1/edHmOaS0lRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c119e136408e6906cf79375a9198122a98e8e112 --- /dev/null +++ b/annotations_1/edHmOaS0lRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.99], [12.0, 35.48], [41.0, 61.43], [65.0, 77.33], [81.0, 81.67], [83.0, 93.43], [96.0, 95.82], [97.0, 99.47], [102.0, 126.86], [129.0, 134.89], [137.0, 158.62], [160.0, 159.63]], "keep_status": [true, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [28.74, 28.9, 29.57, 30.19, 0.0, 29.66, 0.0, 30.53, 29.37, 29.8, 29.65, 0.0], "audiomae_on_audioset": [[["speech", 27.97], ["explosion", 15.54], ["burst, pop", 13.17]], [["music", 29.9], ["cacophony", 10.32], ["explosion", 10.18]], [["music", 47.88], ["smash, crash", 8.98], ["clang", 6.64]], [["music", 67.72], ["speech", 18.13], ["gunshot, gunfire", 2.28]], null, [["machine gun", 28.65], ["speech", 26.78], ["music", 19.87]], null, [["music", 65.01], ["throbbing", 8.76], ["trance music", 3.52]], [["music", 83.11], ["smash, crash", 2.2], ["cacophony", 1.97]], [["music", 63.24], ["speech", 17.65], ["throbbing", 4.84]], [["music", 47.91], ["speech", 34.04], ["breaking", 2.05]], null], "duration": [5.99, 23.48, 20.43, 12.33, 0.67, 10.43, -0.18, 2.47, 24.86, 5.89, 21.62, -0.37]} \ No newline at end of file diff --git a/annotations_1/edQy5jBxhV8_filtered.json b/annotations_1/edQy5jBxhV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49cccc5fd2e0b09430e14bee90fec8d68ebf743a --- /dev/null +++ b/annotations_1/edQy5jBxhV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [8.0, 9.12], [14.0, 14.59], [17.0, 18.77], [20.0, 20.01], [26.0, 28.41], [29.0, 30.06], [34.0, 34.55], [35.0, 35.67], [39.0, 44.68], [45.0, 45.47], [46.0, 47.17], [48.0, 55.05], [57.0, 58.87], [61.0, 65.85], [67.0, 72.08], [73.0, 73.16], [74.0, 74.71], [75.0, 75.81], [76.0, 80.18], [81.0, 84.69], [92.0, 95.91], [97.0, 97.77], [99.0, 101.14], [102.0, 106.91], [108.0, 108.26], [114.0, 114.96], [116.0, 116.26], [119.0, 122.74], [124.0, 127.89], [128.0, 129.59], [133.0, 135.57], [138.0, 138.67], [143.0, 144.29], [145.0, 145.22], [146.0, 146.89], [148.0, 149.03], [154.0, 153.93], [156.0, 159.7], [168.0, 167.88], [171.0, 174.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 100.0, 68.02, 0.0, 0.0, 0.0, 98.66, 76.2, 100.0, 0.0, 99.97, 98.66, 0.0, 0.0, 0.0, 100.0, 87.55, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 62.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 1.12, 0.59, 1.77, 0.01, 2.41, 1.06, 0.55, 0.67, 5.68, 0.47, 1.17, 7.05, 1.87, 4.85, 5.08, 0.16, 0.71, 0.81, 4.18, 3.69, 3.91, 0.77, 2.14, 4.91, 0.26, 0.96, 0.26, 3.74, 3.89, 1.59, 2.57, 0.67, 1.29, 0.22, 0.89, 1.03, -0.07, 3.7, -0.12, 3.18]} \ No newline at end of file diff --git a/annotations_1/edaHyeIxzcI_filtered.json b/annotations_1/edaHyeIxzcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12c1143b2b2782f7534150f0bc8759a5138d72b6 --- /dev/null +++ b/annotations_1/edaHyeIxzcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 33.03], [35.0, 52.41], [87.0, 93.61], [98.0, 106.59], [108.0, 130.13], [131.0, 131.89]], "keep_status": [true, true, false, false, true, false], "silence_prob": [28.77, 28.5, 28.49, 28.67, 28.72, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 23.73], ["moo", 16.47], ["livestock, farm animals, working animals", 10.87]], [["sidetone", 30.71], ["speech", 12.96], ["music", 8.55]], [["cattle, bovinae", 37.13], ["moo", 31.01], ["livestock, farm animals, working animals", 30.37]], [["livestock, farm animals, working animals", 52.48], ["cattle, bovinae", 29.5], ["moo", 14.9]], [["music", 19.75], ["speech", 11.15], ["hum", 8.0]], null], "duration": [2.03, 17.41, 6.61, 8.59, 22.13, 0.89]} \ No newline at end of file diff --git a/annotations_1/edhJGqAjG7s_filtered.json b/annotations_1/edhJGqAjG7s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2d9997db706aca3e96db6c0b11d5af303248d1b --- /dev/null +++ b/annotations_1/edhJGqAjG7s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.01], [8.0, 12.31], [13.0, 51.22], [57.0, 62.85], [64.0, 64.08], [66.0, 66.53], [69.0, 68.89], [70.0, 71.47], [72.0, 75.81], [77.0, 82.9], [84.0, 85.5], [93.0, 94.86], [96.0, 96.04], [96.0, 98.88], [100.0, 102.37], [103.0, 104.63], [106.0, 107.2]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [33.63, 29.83, 0.0, 35.74, 0.0, 0.0, 0.0, 0.0, 58.22, 76.37, 0.0, 0.0, 0.0, 45.05, 59.24, 0.0, 0.0], "audiomae_on_audioset": [[["music", 65.87], ["musical instrument", 6.78], ["speech", 3.82]], [["mains hum", 31.88], ["hum", 28.72], ["music", 13.64]], null, [["hum", 40.61], ["music", 16.84], ["throbbing", 9.73]], null, null, null, null, null, null, null, null, null, [["music", 34.79], ["speech", 24.44], ["hum", 5.28]], null, null, null], "duration": [4.01, 4.31, 38.22, 5.85, 0.08, 0.53, -0.11, 1.47, 3.81, 5.9, 1.5, 1.86, 0.04, 2.88, 2.37, 1.63, 1.2]} \ No newline at end of file diff --git a/annotations_1/eeWPnGsY-Xc_filtered.json b/annotations_1/eeWPnGsY-Xc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..664b6e4bb3769c6ea34bcdd937dc02b42c5a3ff1 --- /dev/null +++ b/annotations_1/eeWPnGsY-Xc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.17], [6.0, 6.66], [8.0, 8.77], [10.0, 10.62], [12.0, 12.46], [13.0, 13.49], [15.0, 15.75], [17.0, 16.75], [18.0, 18.03], [22.0, 22.08], [25.0, 25.05], [27.0, 27.46], [29.0, 29.24], [32.0, 31.95], [35.0, 35.07], [38.0, 38.96], [40.0, 40.15], [41.0, 41.34], [42.0, 42.75], [47.0, 47.87], [51.0, 51.24], [52.0, 52.2], [56.0, 57.59], [60.0, 61.37], [63.0, 65.13], [67.0, 67.53], [70.0, 70.39], [71.0, 71.59], [75.0, 75.19], [76.0, 75.78], [80.0, 80.76], [83.0, 84.15], [87.0, 87.64], [89.0, 90.51], [94.0, 93.95], [95.0, 95.08], [97.0, 97.73], [99.0, 99.55], [101.0, 101.39], [104.0, 104.52], [108.0, 108.18], [110.0, 110.46], [113.0, 113.54], [115.0, 115.52], [117.0, 117.88], [120.0, 135.38], [136.0, 136.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.75, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 42.77], ["music", 26.28], ["mains hum", 13.99]], null], "duration": [2.17, 0.66, 0.77, 0.62, 0.46, 0.49, 0.75, -0.25, 0.03, 0.08, 0.05, 0.46, 0.24, -0.05, 0.07, 0.96, 0.15, 0.34, 0.75, 0.87, 0.24, 0.2, 1.59, 1.37, 2.13, 0.53, 0.39, 0.59, 0.19, -0.22, 0.76, 1.15, 0.64, 1.51, -0.05, 0.08, 0.73, 0.55, 0.39, 0.52, 0.18, 0.46, 0.54, 0.52, 0.88, 15.38, 0.16]} \ No newline at end of file diff --git a/annotations_1/ef7rQniaz5c_filtered.json b/annotations_1/ef7rQniaz5c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ff6f1d59e20e3b78024f237ab2e563223ee7879 --- /dev/null +++ b/annotations_1/ef7rQniaz5c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.24], [2.0, 3.64], [6.0, 6.47], [11.0, 12.72], [15.0, 16.34], [22.0, 22.23], [25.0, 26.42], [28.0, 31.13], [32.0, 33.56], [34.0, 34.74], [37.0, 39.77], [41.0, 45.99], [46.0, 50.25], [53.0, 56.59], [58.0, 59.56], [62.0, 62.8], [64.0, 64.98], [66.0, 68.4], [69.0, 70.14], [72.0, 79.27], [80.0, 83.1], [84.0, 86.66], [88.0, 99.32], [101.0, 115.86], [117.0, 122.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 84.8, 99.98, 83.52, 96.29, 0.0, 0.0, 0.0, 73.82, 0.0, 99.97, 100.0, 77.03, 95.91, 83.7, 74.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 1.64, 0.47, 1.72, 1.34, 0.23, 1.42, 3.13, 1.56, 0.74, 2.77, 4.99, 4.25, 3.59, 1.56, 0.8, 0.98, 2.4, 1.14, 7.27, 3.1, 2.66, 11.32, 14.86, 5.94]} \ No newline at end of file diff --git a/annotations_1/efkuXTpfxhc_filtered.json b/annotations_1/efkuXTpfxhc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b43e67bc40dc2dc788b11c5f89012637efde9c85 --- /dev/null +++ b/annotations_1/efkuXTpfxhc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.81], [13.0, 14.5], [18.0, 18.52], [22.0, 22.28], [24.0, 25.44], [26.0, 26.79], [31.0, 31.45], [40.0, 42.16], [43.0, 43.87], [45.0, 49.28], [54.0, 58.09], [59.0, 61.03], [63.0, 69.43], [70.0, 91.89], [92.0, 103.01], [105.0, 108.09], [111.0, 112.56], [116.0, 116.19], [118.0, 121.83], [122.0, 124.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.92, 0.0, 82.25, 57.81, 75.55, 87.37, 47.94, 40.09, 99.26, 0.0, 0.0, 82.07, 39.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 60.18], ["radio", 8.42], ["music", 3.84]], null, null, null, null, null, [["music", 46.55], ["effects unit", 5.9], ["mains hum", 4.71]], [["music", 60.63], ["effects unit", 11.34], ["guitar", 4.68]], null, null, null, null, [["music", 39.07], ["fart", 12.6], ["speech", 6.43]]], "duration": [1.81, 1.5, 0.52, 0.28, 1.44, 0.79, 0.45, 2.16, 0.87, 4.28, 4.09, 2.03, 6.43, 21.89, 11.01, 3.09, 1.56, 0.19, 3.83, 2.68]} \ No newline at end of file diff --git a/annotations_1/eg8WzaSrZpg_filtered.json b/annotations_1/eg8WzaSrZpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c73494e2604208ba2f71549068033224a83e61b3 --- /dev/null +++ b/annotations_1/eg8WzaSrZpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 39.95], [43.0, 84.23], [88.0, 101.44], [104.0, 105.58], [112.0, 113.56], [114.0, 117.15], [118.0, 117.98]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 29.95, 0.0, 0.0, 29.89, 0.0], "audiomae_on_audioset": [null, null, [["music", 68.42], ["throbbing", 2.78], ["hum", 2.65]], null, null, [["hum", 21.25], ["throbbing", 21.17], ["music", 19.66]], null], "duration": [-0.05, 41.23, 13.44, 1.58, 1.56, 3.15, -0.02]} \ No newline at end of file diff --git a/annotations_1/egB-SG97EcI_filtered.json b/annotations_1/egB-SG97EcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a1b487628f3f9932486111e7594c88083a567fe --- /dev/null +++ b/annotations_1/egB-SG97EcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.55], [21.0, 20.87], [28.0, 28.61], [36.0, 36.53], [37.0, 41.86], [45.0, 45.57], [46.0, 55.11], [56.0, 56.15], [62.0, 73.82], [75.0, 75.25], [79.0, 80.37], [81.0, 82.43], [84.0, 83.83], [84.0, 85.48], [89.0, 90.05], [93.0, 93.55], [95.0, 95.66], [97.0, 98.76], [99.0, 100.4], [102.0, 106.0], [107.0, 108.23], [109.0, 109.51], [117.0, 118.4], [119.0, 121.54], [124.0, 123.63], [125.0, 126.86], [129.0, 129.96], [132.0, 132.02], [133.0, 135.65], [138.0, 139.33], [140.0, 142.91], [149.0, 150.04], [152.0, 152.54], [154.0, 155.55], [156.0, 156.57], [158.0, 158.57], [160.0, 160.32], [161.0, 161.32], [162.0, 171.36], [173.0, 173.96], [175.0, 175.32], [176.0, 181.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [81.17, 0.0, 0.0, 0.0, 84.43, 0.0, 66.88, 0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 96.54, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 39.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 38.59], ["burst, pop", 15.24], ["speech", 8.26]]], "duration": [4.55, -0.13, 0.61, 0.53, 4.86, 0.57, 9.11, 0.15, 11.82, 0.25, 1.37, 1.43, -0.17, 1.48, 1.05, 0.55, 0.66, 1.76, 1.4, 4.0, 1.23, 0.51, 1.4, 2.54, -0.37, 1.86, 0.96, 0.02, 2.65, 1.33, 2.91, 1.04, 0.54, 1.55, 0.57, 0.57, 0.32, 0.32, 9.36, 0.96, 0.32, 5.77]} \ No newline at end of file diff --git a/annotations_1/egTtyS-PlRM_filtered.json b/annotations_1/egTtyS-PlRM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d49cef1f9fd2ca47a404f2496c3b216c523432fe --- /dev/null +++ b/annotations_1/egTtyS-PlRM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.25], [12.0, 13.2], [15.0, 15.87], [18.0, 19.26], [21.0, 27.65], [32.0, 32.21], [40.0, 58.24], [60.0, 61.91], [64.0, 68.27], [71.0, 71.04], [71.0, 71.1], [85.0, 85.58], [91.0, 90.68], [91.0, 98.12], [104.0, 119.23], [122.0, 122.28], [126.0, 127.63], [128.0, 129.3], [131.0, 132.71], [135.0, 137.74], [139.0, 140.48], [154.0, 153.93], [166.0, 173.23]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [44.15, 0.0, 0.0, 0.0, 45.05, 0.0, 33.08, 0.0, 38.95, 0.0, 0.0, 0.0, 0.0, 34.84, 32.14, 0.0, 0.0, 0.0, 0.0, 81.53, 0.0, 0.0, 35.57], "audiomae_on_audioset": [[["music", 57.83], ["synthesizer", 7.37], ["musical instrument", 3.73]], null, null, null, [["music", 54.69], ["hum", 10.07], ["mains hum", 7.16]], null, [["music", 45.72], ["hum", 16.16], ["speech", 10.32]], null, [["music", 30.09], ["synthesizer", 10.75], ["speech", 6.3]], null, null, null, null, [["speech", 37.1], ["music", 21.23], ["fart", 5.73]], [["music", 53.74], ["speech", 12.29], ["didgeridoo", 8.46]], null, null, null, null, null, null, null, [["mains hum", 52.76], ["hum", 18.66], ["noise", 9.55]]], "duration": [2.25, 1.2, 0.87, 1.26, 6.65, 0.21, 18.24, 1.91, 4.27, 0.04, 0.1, 0.58, -0.32, 7.12, 15.23, 0.28, 1.63, 1.3, 1.71, 2.74, 1.48, -0.07, 7.23]} \ No newline at end of file diff --git a/annotations_1/egrmjjy2Pgo_filtered.json b/annotations_1/egrmjjy2Pgo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f7e009b58b72d25b2c839c0f99f0b458ebdfc22 --- /dev/null +++ b/annotations_1/egrmjjy2Pgo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 26.62], [28.0, 28.46], [30.0, 30.5], [31.0, 37.32], [38.0, 38.08], [39.0, 39.26], [40.0, 41.2], [42.0, 42.8], [44.0, 44.98], [46.0, 46.03], [48.0, 51.19], [52.0, 53.03], [54.0, 54.62], [58.0, 58.89], [60.0, 61.33], [63.0, 64.2], [66.0, 67.31], [68.0, 70.56], [71.0, 70.93], [72.0, 72.77], [74.0, 74.82], [78.0, 80.2], [81.0, 82.63], [83.0, 84.47], [85.0, 86.31], [87.0, 88.87], [90.0, 91.93], [95.0, 95.76], [97.0, 97.31], [100.0, 102.79], [107.0, 109.22]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [36.74, 0.0, 0.0, 50.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 68.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 47.94], "audiomae_on_audioset": [[["music", 40.09], ["speech", 25.03], ["didgeridoo", 3.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.73], ["speech", 10.4], ["musical instrument", 7.43]]], "duration": [10.62, 0.46, 0.5, 6.32, 0.08, 0.26, 1.2, 0.8, 0.98, 0.03, 3.19, 1.03, 0.62, 0.89, 1.33, 1.2, 1.31, 2.56, -0.07, 0.77, 0.82, 2.2, 1.63, 1.47, 1.31, 1.87, 1.93, 0.76, 0.31, 2.79, 2.22]} \ No newline at end of file diff --git a/annotations_1/egwR6gS9UMM_filtered.json b/annotations_1/egwR6gS9UMM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/egwR6gS9UMM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/ejD-W0F0hr8_filtered.json b/annotations_1/ejD-W0F0hr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecea21fc728383a77c7fc0264d3306dde7df817f --- /dev/null +++ b/annotations_1/ejD-W0F0hr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.81], [23.0, 23.82], [24.0, 30.21], [31.0, 41.18], [44.0, 45.5], [47.0, 47.31], [48.0, 48.36], [49.0, 49.71], [51.0, 72.08], [73.0, 73.65], [74.0, 74.26], [79.0, 84.91], [86.0, 87.91], [89.0, 90.81], [92.0, 121.61], [122.0, 122.76], [125.0, 126.18], [127.0, 130.81], [133.0, 141.4], [146.0, 147.18], [147.0, 159.78]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 37.27, 94.81, 0.0, 0.0, 0.0, 0.0, 66.63, 0.0, 0.0, 78.04, 0.0, 0.0, 67.0, 0.0, 0.0, 46.36, 41.16, 0.0, 38.93], "audiomae_on_audioset": [null, null, [["speech", 25.52], ["fart", 9.46], ["throbbing", 7.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.36], ["theremin", 12.87], ["hum", 10.68]], [["music", 72.26], ["hum", 5.67], ["synthesizer", 4.0]], null, [["music", 56.53], ["speech", 32.29], ["fart", 1.56]]], "duration": [0.81, 0.82, 6.21, 10.18, 1.5, 0.31, 0.36, 0.71, 21.08, 0.65, 0.26, 5.91, 1.91, 1.81, 29.61, 0.76, 1.18, 3.81, 8.4, 1.18, 12.78]} \ No newline at end of file diff --git a/annotations_1/ek0jTQAdN8Y_filtered.json b/annotations_1/ek0jTQAdN8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bed3388e1d61ba283898087eb611cc99b17f5cb --- /dev/null +++ b/annotations_1/ek0jTQAdN8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.78], [3.0, 4.09], [4.0, 5.78], [9.0, 8.94], [9.0, 10.35], [11.0, 12.07], [15.0, 17.14], [18.0, 18.37], [19.0, 19.94], [22.0, 24.93], [25.0, 27.09], [30.0, 30.94], [32.0, 32.91], [36.0, 37.49], [43.0, 43.39], [44.0, 50.48], [56.0, 58.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0, 99.56, 91.98, 0.0, 0.0, 0.0, 0.0, 46.9, 38.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 30.77], ["music", 17.8], ["mains hum", 15.61]], [["hum", 39.08], ["mains hum", 22.27], ["throbbing", 7.13]]], "duration": [0.78, 1.09, 1.78, -0.06, 1.35, 1.07, 2.14, 0.37, 0.94, 2.93, 2.09, 0.94, 0.91, 1.49, 0.39, 6.48, 2.19]} \ No newline at end of file diff --git a/annotations_1/ekSSp-zvdgk_filtered.json b/annotations_1/ekSSp-zvdgk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad12f9dffd27adf73d0b01bbc97f2ec2e794c421 --- /dev/null +++ b/annotations_1/ekSSp-zvdgk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.88], [18.0, 18.01], [24.0, 23.85], [25.0, 28.78], [30.0, 30.37], [32.0, 50.31], [52.0, 115.15], [121.0, 120.93], [123.0, 130.59], [132.0, 132.68]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 41.56, 0.0, 32.92, 0.0, 0.0, 47.16, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 47.94], ["sidetone", 17.01], ["radio", 15.26]], null, [["music", 32.94], ["throbbing", 28.05], ["hum", 22.12]], null, null, [["music", 28.64], ["didgeridoo", 22.21], ["speech", 10.65]], null], "duration": [1.88, 0.01, -0.15, 3.78, 0.37, 18.31, 63.15, -0.07, 7.59, 0.68]} \ No newline at end of file diff --git a/annotations_1/ekqjBZdbYJU_filtered.json b/annotations_1/ekqjBZdbYJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fa45ede8110f320a477217b5a275e2da3cf1260 --- /dev/null +++ b/annotations_1/ekqjBZdbYJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [8.0, 9.26], [10.0, 11.84], [13.0, 15.16], [16.0, 17.41], [19.0, 26.25], [27.0, 35.87], [37.0, 37.99], [39.0, 40.53], [41.0, 57.65], [59.0, 70.51], [71.0, 80.2], [84.0, 83.86], [96.0, 97.78], [98.0, 101.75], [103.0, 105.48], [106.0, 106.56], [107.0, 107.62], [109.0, 109.43], [110.0, 110.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 60.89, 0.0, 50.86, 84.43, 0.0, 0.0, 91.81, 65.67, 30.66, 0.0, 0.0, 49.31, 58.64, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["explosion", 15.77], ["rumble", 12.29], ["whack, thwack", 11.87]], null, null, [["speech", 67.49], ["grunt", 5.43], ["animal", 4.31]], null, null, null, null, null], "duration": [0.13, 1.26, 1.84, 2.16, 1.41, 7.25, 8.87, 0.99, 1.53, 16.65, 11.51, 9.2, -0.14, 1.78, 3.75, 2.48, 0.56, 0.62, 0.43, 0.78]} \ No newline at end of file diff --git a/annotations_1/elcYyXvJF7U_filtered.json b/annotations_1/elcYyXvJF7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36d4d1cc5034a882e46cd49274ddb691e90a4907 --- /dev/null +++ b/annotations_1/elcYyXvJF7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.62], [12.0, 146.35]], "keep_status": [false, false], "silence_prob": [32.0, 0.0], "audiomae_on_audioset": [[["speech", 38.25], ["music", 29.52], ["sonar", 7.81]], null], "duration": [5.62, 134.35]} \ No newline at end of file diff --git a/annotations_1/elmk8Hsbw_0_filtered.json b/annotations_1/elmk8Hsbw_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f5154bd215bbeb0f8ce5cbc90dbeff9571e1543 --- /dev/null +++ b/annotations_1/elmk8Hsbw_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.98], [7.0, 7.18], [10.0, 10.12], [16.0, 15.97], [17.0, 17.56], [18.0, 19.85], [20.0, 21.07], [23.0, 24.54], [27.0, 27.78], [29.0, 29.35], [39.0, 39.75], [41.0, 41.89], [43.0, 43.68], [45.0, 46.16], [49.0, 51.8], [54.0, 55.21], [58.0, 58.7], [59.0, 60.03], [60.0, 60.12], [60.0, 60.49], [66.0, 72.05], [83.0, 84.25], [89.0, 88.8], [90.0, 89.99], [90.0, 91.02], [92.0, 93.9], [95.0, 95.55], [97.0, 101.44], [103.0, 105.73], [106.0, 107.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.47, 0.0, 0.0, 0.0, 0.0, 0.0, 30.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 55.11, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.72], ["electronic music", 8.41], ["hum", 4.47]], null, null, null, null, null, [["speech", 37.92], ["music", 27.14], ["fly, housefly", 3.63]], null, null, null, null, null, null, null, null, null], "duration": [0.98, 0.18, 0.12, -0.03, 0.56, 1.85, 1.07, 1.54, 0.78, 0.35, 0.75, 0.89, 0.68, 1.16, 2.8, 1.21, 0.7, 1.03, 0.12, 0.49, 6.05, 1.25, -0.2, -0.01, 1.02, 1.9, 0.55, 4.44, 2.73, 1.62]} \ No newline at end of file diff --git a/annotations_1/elpUGB9Ap1Y_filtered.json b/annotations_1/elpUGB9Ap1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..532448da6a841820dade7ba5b34395fb6d2e91db --- /dev/null +++ b/annotations_1/elpUGB9Ap1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.6], [10.0, 10.54], [12.0, 27.13], [35.0, 48.61], [51.0, 65.87], [70.0, 78.33], [78.0, 85.67], [92.0, 97.12], [100.0, 100.16]], "keep_status": [false, false, false, true, true, true, true, false, false], "silence_prob": [0.0, 0.0, 29.4, 29.56, 29.8, 29.77, 29.74, 30.71, 0.0], "audiomae_on_audioset": [null, null, [["music", 35.1], ["hum", 19.61], ["throbbing", 15.62]], [["speech", 43.8], ["music", 12.18], ["aircraft", 9.61]], [["vehicle", 19.66], ["music", 18.64], ["aircraft", 5.31]], [["music", 40.67], ["insect", 10.26], ["fly, housefly", 10.24]], [["speech", 39.79], ["music", 18.17], ["vehicle", 7.72]], [["music", 73.18], ["throbbing", 8.33], ["hum", 3.84]], null], "duration": [1.6, 0.54, 15.13, 13.61, 14.87, 8.33, 7.67, 5.12, 0.16]} \ No newline at end of file diff --git a/annotations_1/em9lziI07M4_filtered.json b/annotations_1/em9lziI07M4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b756ab977f3698f3c49f64a3702ac7b48cb6cd8 --- /dev/null +++ b/annotations_1/em9lziI07M4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 43.98], [46.0, 65.45], [70.0, 108.75], [112.0, 127.2], [136.0, 136.54], [158.0, 162.23], [163.0, 179.69]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [0.0, 30.84, 0.0, 31.99, 0.0, 74.29, 30.53], "audiomae_on_audioset": [null, [["music", 67.11], ["electronic music", 3.01], ["throbbing", 2.21]], null, [["music", 68.48], ["sampler", 3.12], ["electronic music", 2.87]], null, null, [["animal", 35.71], ["whale vocalization", 8.55], ["howl", 7.25]]], "duration": [31.98, 19.45, 38.75, 15.2, 0.54, 4.23, 16.69]} \ No newline at end of file diff --git a/annotations_1/emW6qKMxIUU_filtered.json b/annotations_1/emW6qKMxIUU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3e059e1eb140a948c33c92dea8f7e8799379e6c --- /dev/null +++ b/annotations_1/emW6qKMxIUU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 88.94], [90.0, 99.0]], "keep_status": [false, false], "silence_prob": [0.0, 28.98], "audiomae_on_audioset": [null, [["music", 59.45], ["throbbing", 15.23], ["hum", 4.91]]], "duration": [58.94, 9.0]} \ No newline at end of file diff --git a/annotations_1/enG1CfTbT08_filtered.json b/annotations_1/enG1CfTbT08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60f025edf198c02a83119d173ea3b611ed361236 --- /dev/null +++ b/annotations_1/enG1CfTbT08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 100.26], [103.0, 103.86], [107.0, 119.67], [121.0, 123.92], [125.0, 126.3], [128.0, 130.28], [132.0, 134.18]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 44.46, 79.24, 0.0, 76.37, 82.43], "audiomae_on_audioset": [null, null, [["sidetone", 19.67], ["busy signal", 18.54], ["speech", 11.85]], null, null, null, null], "duration": [39.26, 0.86, 12.67, 2.92, 1.3, 2.28, 2.18]} \ No newline at end of file diff --git a/annotations_1/enNm82zd1Ho_filtered.json b/annotations_1/enNm82zd1Ho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e966248680d9d83b65499b6159ee86346b29b852 --- /dev/null +++ b/annotations_1/enNm82zd1Ho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.52], [7.0, 25.56], [29.0, 31.36], [33.0, 39.99], [41.0, 42.04], [45.0, 45.55], [46.0, 76.4], [79.0, 79.54], [81.0, 104.43], [105.0, 111.91], [112.0, 114.51], [116.0, 117.07], [118.0, 119.7], [121.0, 123.13], [125.0, 128.01], [129.0, 129.3], [131.0, 130.62], [134.0, 134.01], [137.0, 137.27], [138.0, 139.87], [141.0, 143.43], [144.0, 146.23], [151.0, 173.06], [174.0, 174.31], [176.0, 175.96]], "keep_status": [false, true, false, true, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.9, 29.12, 29.57, 0.0, 0.0, 0.0, 0.0, 29.76, 33.15, 36.16, 0.0, 0.0, 38.19, 40.88, 0.0, 0.0, 0.0, 0.0, 0.0, 63.42, 55.53, 29.55, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 33.23], ["music", 15.14], ["fart", 12.14]], [["music", 60.44], ["hum", 9.36], ["throbbing", 7.53]], [["music", 25.2], ["throbbing", 20.44], ["hum", 16.93]], null, null, null, null, [["music", 53.14], ["buzz", 13.32], ["mains hum", 10.25]], [["speech", 59.5], ["music", 10.73], ["synthesizer", 3.71]], [["speech", 21.48], ["mains hum", 14.95], ["music", 13.8]], null, null, [["music", 30.52], ["electronic music", 11.21], ["hum", 4.62]], [["music", 17.75], ["speech", 12.97], ["mains hum", 9.34]], null, null, null, null, null, null, null, [["music", 54.9], ["speech", 16.39], ["groan", 10.3]], null, null], "duration": [-0.48, 18.56, 2.36, 6.99, 1.04, 0.55, 30.4, 0.54, 23.43, 6.91, 2.51, 1.07, 1.7, 2.13, 3.01, 0.3, -0.38, 0.01, 0.27, 1.87, 2.43, 2.23, 22.06, 0.31, -0.04]} \ No newline at end of file diff --git a/annotations_1/engSFG20kaA_filtered.json b/annotations_1/engSFG20kaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6314f7d226a00bcd2e8dd4bf4f20c03c615a326 --- /dev/null +++ b/annotations_1/engSFG20kaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.4], [20.0, 38.69], [45.0, 45.17], [48.0, 86.73], [91.0, 90.75], [93.0, 150.72], [152.0, 152.27]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [0.0, 35.74, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 40.25], ["hum", 15.71], ["throbbing", 7.89]], null, null, null, null, null], "duration": [0.4, 18.69, 0.17, 38.73, -0.25, 57.72, 0.27]} \ No newline at end of file diff --git a/annotations_1/eoREjwjeH30_filtered.json b/annotations_1/eoREjwjeH30_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c887436f625f56a59c330b116e599b971afcd5d --- /dev/null +++ b/annotations_1/eoREjwjeH30_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.97], [5.0, 36.0], [53.0, 53.81], [54.0, 54.58], [55.0, 56.24], [59.0, 59.75], [75.0, 75.68], [78.0, 79.37], [95.0, 96.09], [107.0, 107.5], [108.0, 108.89], [117.0, 130.35], [130.0, 130.38], [130.0, 130.45], [130.0, 130.49], [131.0, 130.52], [131.0, 146.75], [150.0, 164.51], [167.0, 188.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.17, 0.0, 0.0, 0.0, 0.0, 30.63, 31.39, 34.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 37.68], ["boing", 6.65], ["livestock, farm animals, working animals", 3.89]], null, null, null, null, [["music", 58.09], ["speech", 15.1], ["boing", 7.88]], [["music", 40.14], ["speech", 19.52], ["groan", 3.61]], [["music", 75.91], ["electronic music", 4.52], ["synthesizer", 2.63]]], "duration": [2.97, 31.0, 0.81, 0.58, 1.24, 0.75, 0.68, 1.37, 1.09, 0.5, 0.89, 13.35, 0.38, 0.45, 0.49, -0.48, 15.75, 14.51, 21.72]} \ No newline at end of file diff --git a/annotations_1/eoffuyXUhLs_filtered.json b/annotations_1/eoffuyXUhLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28d925c3f4757a1217fb3f12ce0d3bf1e9de9419 --- /dev/null +++ b/annotations_1/eoffuyXUhLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [8.0, 12.63], [13.0, 12.66], [13.0, 12.7], [13.0, 12.73], [13.0, 12.77], [13.0, 12.8], [13.0, 12.83], [13.0, 12.87], [15.0, 66.61], [69.0, 72.87], [73.0, 76.38], [80.0, 82.98], [84.0, 84.84], [87.0, 88.03], [88.0, 90.07], [92.0, 106.17], [111.0, 135.09], [136.0, 138.43], [139.0, 140.09], [141.0, 147.92], [149.0, 156.47], [157.0, 157.74], [163.0, 163.04]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, true, false, false, false], "silence_prob": [0.0, 29.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.08, 52.8, 71.0, 0.0, 0.0, 56.86, 42.76, 40.97, 36.89, 0.0, 31.79, 40.66, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 13.92], ["rumble", 11.67], ["hum", 10.97]], null, null, null, null, null, null, null, null, [["music", 13.62], ["singing bowl", 11.92], ["speech", 9.84]], null, null, null, null, null, [["speech", 48.15], ["music", 22.02], ["sonar", 16.62]], [["music", 26.9], ["speech", 19.46], ["electronic music", 8.3]], [["whale vocalization", 41.31], ["music", 13.1], ["hum", 4.93]], null, [["speech", 48.5], ["hum", 14.14], ["music", 7.26]], [["music", 43.73], ["hum", 23.69], ["mains hum", 12.1]], null, null], "duration": [0.48, 4.63, -0.34, -0.3, -0.27, -0.23, -0.2, -0.17, -0.13, 51.61, 3.87, 3.38, 2.98, 0.84, 1.03, 2.07, 14.17, 24.09, 2.43, 1.09, 6.92, 7.47, 0.74, 0.04]} \ No newline at end of file diff --git a/annotations_1/epupZLvDDts_filtered.json b/annotations_1/epupZLvDDts_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f83a107cfefed98c733d12efb32af925ddd4409 --- /dev/null +++ b/annotations_1/epupZLvDDts_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.41], [6.0, 7.52], [10.0, 21.12], [22.0, 40.63], [42.0, 43.14], [45.0, 47.01], [49.0, 50.5], [51.0, 55.65], [59.0, 94.53], [95.0, 99.27], [100.0, 101.41], [102.0, 104.14], [106.0, 112.16], [113.0, 128.49], [129.0, 130.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.43, 0.0, 53.59, 96.66, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 0.0, 100.0, 99.1, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.41, 1.52, 11.12, 18.63, 1.14, 2.01, 1.5, 4.65, 35.53, 4.27, 1.41, 2.14, 6.16, 15.49, 1.98]} \ No newline at end of file diff --git a/annotations_1/eq3vD93GgLs_filtered.json b/annotations_1/eq3vD93GgLs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11ade6fc935cfefb35aa00789ba9691a6e3eb02f --- /dev/null +++ b/annotations_1/eq3vD93GgLs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.49], [12.0, 12.29], [13.0, 13.91], [18.0, 20.39], [21.0, 23.41], [26.0, 26.25], [35.0, 35.75], [38.0, 45.22], [46.0, 46.74], [49.0, 49.69], [52.0, 109.63]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.02, 38.16, 0.0, 0.0, 32.37, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 56.37], ["didgeridoo", 7.36], ["musical instrument", 5.59]], [["music", 45.83], ["hum", 2.54], ["musical instrument", 2.45]], null, null, [["speech", 45.44], ["rumble", 13.62], ["music", 10.65]], null, null, null], "duration": [0.49, 0.29, 0.91, 2.39, 2.41, 0.25, 0.75, 7.22, 0.74, 0.69, 57.63]} \ No newline at end of file diff --git a/annotations_1/erE6UlOi3E0_filtered.json b/annotations_1/erE6UlOi3E0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39eb21559151c3d8d36a0d6729d25644bd983e9c --- /dev/null +++ b/annotations_1/erE6UlOi3E0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 49.77], [52.0, 55.21], [59.0, 62.09], [63.0, 74.19], [75.0, 75.17], [76.0, 99.37], [100.0, 114.15], [117.0, 124.56]], "keep_status": [true, true, true, true, false, false, false, true], "silence_prob": [31.3, 31.33, 32.86, 31.07, 0.0, 31.21, 31.33, 32.56], "audiomae_on_audioset": [[["music", 36.3], ["vehicle", 7.24], ["hum", 7.13]], [["music", 29.47], ["mosquito", 25.06], ["fly, housefly", 7.75]], [["music", 49.56], ["cacophony", 8.77], ["musical instrument", 4.84]], [["music", 36.99], ["speech", 15.96], ["buzz", 8.37]], null, [["music", 46.71], ["buzz", 26.32], ["vehicle", 4.09]], [["mains hum", 40.99], ["hum", 30.25], ["music", 16.36]], [["music", 40.47], ["foghorn", 20.53], ["trombone", 5.31]]], "duration": [11.77, 3.21, 3.09, 11.19, 0.17, 23.37, 14.15, 7.56]} \ No newline at end of file diff --git a/annotations_1/erX0T5r5xbE_filtered.json b/annotations_1/erX0T5r5xbE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..420326a8b7270db5e3605a57a1213965a017e4b3 --- /dev/null +++ b/annotations_1/erX0T5r5xbE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.36], [25.0, 26.05], [28.0, 28.61], [32.0, 32.9], [39.0, 39.93], [41.0, 47.24], [50.0, 52.86], [55.0, 56.44], [60.0, 61.26], [65.0, 67.56], [73.0, 73.74], [74.0, 74.51], [75.0, 77.68], [84.0, 84.28], [91.0, 91.07], [93.0, 93.55], [94.0, 95.42], [106.0, 106.74], [108.0, 108.4], [113.0, 113.58], [117.0, 116.94], [118.0, 118.96], [120.0, 121.39], [122.0, 122.62], [123.0, 148.17], [150.0, 150.53], [172.0, 172.29], [173.0, 174.19], [182.0, 181.89], [184.0, 184.03], [185.0, 189.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.98, 44.87, 0.0, 0.0, 80.82, 0.0, 0.0, 31.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.82, 0.0, 0.0, 0.0, 0.0, 0.0, 99.8], "audiomae_on_audioset": [null, null, null, null, null, [["music", 60.41], ["theremin", 8.72], ["musical instrument", 3.54]], [["speech", 41.85], ["music", 28.97], ["theremin", 4.05]], null, null, null, null, null, [["music", 54.11], ["speech", 13.18], ["didgeridoo", 2.39]], null, null, null, null, null, null, null, null, null, null, null, [["music", 45.58], ["didgeridoo", 18.34], ["wind instrument, woodwind instrument", 7.27]], null, null, null, null, null, null], "duration": [0.36, 1.05, 0.61, 0.9, 0.93, 6.24, 2.86, 1.44, 1.26, 2.56, 0.74, 0.51, 2.68, 0.28, 0.07, 0.55, 1.42, 0.74, 0.4, 0.58, -0.06, 0.96, 1.39, 0.62, 25.17, 0.53, 0.29, 1.19, -0.11, 0.03, 4.7]} \ No newline at end of file diff --git a/annotations_1/ermD7PGA3Do_filtered.json b/annotations_1/ermD7PGA3Do_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe2cc183c35d6693968293239969b99d693db97e --- /dev/null +++ b/annotations_1/ermD7PGA3Do_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 28.39], [32.0, 51.48], [53.0, 53.96], [57.0, 59.54], [64.0, 64.39], [66.0, 68.13], [69.0, 70.02], [71.0, 73.2], [80.0, 82.76], [84.0, 95.94], [97.0, 100.26], [103.0, 104.73], [111.0, 112.65], [114.0, 115.15], [119.0, 119.38], [120.0, 156.9], [158.0, 158.06], [159.0, 159.63], [162.0, 164.91], [166.0, 172.83]], "keep_status": [true, true, false, true, false, false, false, true, true, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [31.84, 30.2, 0.0, 33.46, 0.0, 31.71, 0.0, 31.86, 32.78, 28.89, 31.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 70.58], "audiomae_on_audioset": [[["music", 14.26], ["hum", 11.14], ["car", 10.5]], [["rumble", 50.81], ["hum", 9.7], ["speech", 8.91]], null, [["hum", 26.98], ["music", 11.52], ["sonar", 8.63]], null, [["hum", 51.98], ["mains hum", 10.76], ["throbbing", 8.26]], null, [["hum", 47.71], ["throbbing", 7.25], ["chirp tone", 6.42]], [["hum", 37.31], ["rumble", 12.6], ["throbbing", 10.94]], [["speech", 42.34], ["hum", 17.54], ["rumble", 6.79]], [["whale vocalization", 26.31], ["hum", 24.91], ["chirp tone", 8.82]], null, null, null, null, null, null, null, null, null], "duration": [11.39, 19.48, 0.96, 2.54, 0.39, 2.13, 1.02, 2.2, 2.76, 11.94, 3.26, 1.73, 1.65, 1.15, 0.38, 36.9, 0.06, 0.63, 2.91, 6.83]} \ No newline at end of file diff --git a/annotations_1/esFVrrZCvwA_filtered.json b/annotations_1/esFVrrZCvwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bba2b4f607837f2ddebe859e1bae44828568e6a3 --- /dev/null +++ b/annotations_1/esFVrrZCvwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 30.5], [36.0, 35.87]], "keep_status": [true, false], "silence_prob": [28.98, 0.0], "audiomae_on_audioset": [[["music", 62.49], ["car", 3.49], ["motorcycle", 3.02]], null], "duration": [11.5, -0.13]} \ No newline at end of file diff --git a/annotations_1/esg4w4b2xvc_filtered.json b/annotations_1/esg4w4b2xvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edf89ec225afe5aa1dba351b3ee82f53d496f763 --- /dev/null +++ b/annotations_1/esg4w4b2xvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.59], [6.0, 12.12], [15.0, 15.45], [18.0, 18.05], [19.0, 19.72], [25.0, 29.39], [31.0, 31.6], [37.0, 37.86], [39.0, 40.53], [43.0, 52.39], [57.0, 56.69], [64.0, 68.81], [69.0, 70.17], [74.0, 80.37], [85.0, 86.68], [91.0, 95.71], [100.0, 100.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 35.84, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 30.43, 0.0, 44.69, 0.0, 30.38, 0.0, 34.55, 0.0], "audiomae_on_audioset": [null, [["speech", 47.22], ["music", 28.73], ["sidetone", 10.83]], null, null, null, null, null, null, null, [["music", 52.01], ["throbbing", 28.43], ["hum", 8.1]], null, [["hum", 16.12], ["throbbing", 14.32], ["music", 11.77]], null, [["music", 61.65], ["squish", 13.47], ["drip", 5.16]], null, [["music", 47.05], ["throbbing", 34.56], ["hum", 6.02]], null], "duration": [1.59, 6.12, 0.45, 0.05, 0.72, 4.39, 0.6, 0.86, 1.53, 9.39, -0.31, 4.81, 1.17, 6.37, 1.68, 4.71, 0.92]} \ No newline at end of file diff --git a/annotations_1/etixMqUt8Ak_filtered.json b/annotations_1/etixMqUt8Ak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b53914c4eea26aa5e301dc92d1d3a30822740db --- /dev/null +++ b/annotations_1/etixMqUt8Ak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.33], [11.0, 11.42], [15.0, 18.62], [38.0, 47.66], [71.0, 71.47]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 60.89, 37.55, 0.0], "audiomae_on_audioset": [null, null, null, [["cattle, bovinae", 24.82], ["snicker", 20.73], ["livestock, farm animals, working animals", 14.4]], null], "duration": [0.33, 0.42, 3.62, 9.66, 0.47]} \ No newline at end of file diff --git a/annotations_1/euCWQcrBwPY_filtered.json b/annotations_1/euCWQcrBwPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3dd2d70514a95a785f67baee44b5e583ab09d92 --- /dev/null +++ b/annotations_1/euCWQcrBwPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.49], [14.0, 14.23], [15.0, 15.38], [16.0, 16.56], [17.0, 131.3]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.49, 0.23, 0.38, 0.56, 114.3]} \ No newline at end of file diff --git a/annotations_1/euJyO4E3FzE_filtered.json b/annotations_1/euJyO4E3FzE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86922ba6d099510a8f44aec19fbb24c841af243f --- /dev/null +++ b/annotations_1/euJyO4E3FzE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.42], [8.0, 9.39], [11.0, 12.02], [31.0, 34.13], [35.0, 42.77], [47.0, 48.42], [51.0, 50.97], [53.0, 53.2], [58.0, 82.93], [84.0, 85.51], [89.0, 90.86], [91.0, 90.9], [91.0, 93.5], [99.0, 111.45], [114.0, 124.07], [124.0, 130.64], [131.0, 139.24]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, true, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 33.36, 45.11, 0.0, 0.0, 0.0, 30.85, 0.0, 0.0, 0.0, 31.27, 31.67, 31.66, 31.11, 31.13], "audiomae_on_audioset": [null, null, null, [["music", 46.61], ["didgeridoo", 16.39], ["speech", 12.84]], [["fly, housefly", 22.1], ["speech", 10.09], ["hum", 9.85]], null, null, null, [["music", 18.7], ["hum", 14.18], ["mains hum", 11.04]], null, null, null, [["music", 25.54], ["throbbing", 21.62], ["hum", 9.42]], [["music", 23.32], ["hum", 17.75], ["speech", 6.72]], [["vehicle", 22.12], ["speech", 8.49], ["car", 7.19]], [["cattle, bovinae", 41.98], ["livestock, farm animals, working animals", 29.57], ["moo", 22.31]], [["music", 27.82], ["speech", 11.5], ["whack, thwack", 7.72]]], "duration": [0.42, 1.39, 1.02, 3.13, 7.77, 1.42, -0.03, 0.2, 24.93, 1.51, 1.86, -0.1, 2.5, 12.45, 10.07, 6.64, 8.24]} \ No newline at end of file diff --git a/annotations_1/ev-4cz3hlr0_filtered.json b/annotations_1/ev-4cz3hlr0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18219cf8d29420790fc23980bc7ec5fbd0d6a2ec --- /dev/null +++ b/annotations_1/ev-4cz3hlr0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.44], [7.0, 8.01], [10.0, 10.93], [12.0, 22.05], [23.0, 25.03], [26.0, 27.85], [30.0, 32.05], [34.0, 35.38], [37.0, 37.72], [41.0, 42.31], [48.0, 48.81], [52.0, 53.1], [54.0, 59.54], [61.0, 63.22], [65.0, 65.4], [67.0, 69.96], [72.0, 85.36], [87.0, 87.32]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [35.05, 0.0, 0.0, 93.13, 99.52, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 43.4, 0.0, 51.18, 45.88, 0.0], "audiomae_on_audioset": [[["hum", 19.79], ["music", 8.76], ["insect", 8.22]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.35], ["speech", 17.01], ["hum", 9.19]], null, null, [["hum", 44.46], ["music", 15.7], ["mains hum", 14.05]], null], "duration": [3.44, 1.01, 0.93, 10.05, 2.03, 1.85, 2.05, 1.38, 0.72, 1.31, 0.81, 1.1, 5.54, 2.22, 0.4, 2.96, 13.36, 0.32]} \ No newline at end of file diff --git a/annotations_1/evJPzjgv-2s_filtered.json b/annotations_1/evJPzjgv-2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea0c341e0073cf4a677f90cbc6cf074f61ed1ee7 --- /dev/null +++ b/annotations_1/evJPzjgv-2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 75.71], [76.0, 83.08], [85.0, 87.88], [89.0, 91.77], [95.0, 98.63], [102.0, 110.93], [117.0, 120.78], [123.0, 123.35], [124.0, 124.51]], "keep_status": [false, true, true, false, true, false, true, false, false], "silence_prob": [0.0, 31.37, 30.42, 30.72, 30.44, 30.4, 31.24, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 26.3], ["motorcycle", 17.75], ["vehicle", 6.36]], [["music", 51.21], ["cacophony", 10.96], ["boing", 4.47]], [["music", 66.43], ["electronic music", 3.75], ["didgeridoo", 3.32]], [["music", 52.42], ["throbbing", 5.59], ["hum", 4.39]], [["music", 65.69], ["throbbing", 3.51], ["foghorn", 1.75]], [["music", 38.6], ["speech", 14.08], ["throbbing", 8.93]], null, null], "duration": [0.71, 7.08, 2.88, 2.77, 3.63, 8.93, 3.78, 0.35, 0.51]} \ No newline at end of file diff --git a/annotations_1/evM3k7ep4wo_filtered.json b/annotations_1/evM3k7ep4wo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6590105c7ad45caff2998a6ebf8d57c54e856088 --- /dev/null +++ b/annotations_1/evM3k7ep4wo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 82.56], [85.0, 128.16], [132.0, 145.34]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 28.82], "audiomae_on_audioset": [null, null, [["speech", 27.61], ["music", 22.1], ["buzz", 9.26]]], "duration": [77.56, 43.16, 13.34]} \ No newline at end of file diff --git a/annotations_1/evQcKvkQCl0_filtered.json b/annotations_1/evQcKvkQCl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9d370b9acf92f398ae9d97305f097e1f42f1a9d --- /dev/null +++ b/annotations_1/evQcKvkQCl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [3.0, 3.59], [5.0, 5.46], [8.0, 8.92], [16.0, 15.75], [43.0, 44.1], [51.0, 50.9], [53.0, 53.06], [53.0, 53.35], [55.0, 55.0], [63.0, 63.39], [82.0, 82.11], [82.0, 90.15], [91.0, 91.91], [99.0, 100.92], [102.0, 102.57], [104.0, 106.73], [110.0, 110.59], [118.0, 137.57], [140.0, 149.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.19, 0.0, 0.0, 0.0, 97.0, 0.0, 34.52, 29.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.68], ["thump, thud", 7.35], ["reverberation", 4.77]], null, null, null, null, null, [["speech", 31.69], ["music", 15.61], ["whack, thwack", 5.22]], [["music", 78.63], ["didgeridoo", 3.11], ["electronic music", 2.88]]], "duration": [1.17, 0.59, 0.46, 0.92, -0.25, 1.1, -0.1, 0.06, 0.35, 0.0, 0.39, 0.11, 8.15, 0.91, 1.92, 0.57, 2.73, 0.59, 19.57, 9.89]} \ No newline at end of file diff --git a/annotations_1/ewbUaMvCaYg_filtered.json b/annotations_1/ewbUaMvCaYg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd7d10210c485a037c05c67b6200f46a37b6ae0e --- /dev/null +++ b/annotations_1/ewbUaMvCaYg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 72.67]], "keep_status": [false], "silence_prob": [35.39], "audiomae_on_audioset": [[["speech", 61.85], ["breaking", 8.67], ["groan", 7.34]]], "duration": [25.67]} \ No newline at end of file diff --git a/annotations_1/ewiNzru8Kek_filtered.json b/annotations_1/ewiNzru8Kek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..027878543ab42a34e42227b63bea12b595de78f5 --- /dev/null +++ b/annotations_1/ewiNzru8Kek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.98], [7.0, 9.8], [10.0, 10.2], [11.0, 11.85], [14.0, 15.15], [16.0, 16.6], [20.0, 19.94], [20.0, 32.95], [33.0, 33.3], [34.0, 39.18], [41.0, 42.2], [45.0, 62.29], [69.0, 73.41], [77.0, 79.96], [84.0, 89.33], [94.0, 97.61], [98.0, 98.59], [101.0, 103.6], [104.0, 106.56], [108.0, 126.03], [127.0, 127.99], [130.0, 131.85], [134.0, 134.87], [135.0, 137.79], [139.0, 140.9]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, true, true, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 30.26, 0.0, 32.34, 0.0, 31.59, 29.99, 36.35, 29.19, 49.27, 0.0, 29.72, 31.56, 31.38, 0.0, 0.0, 0.0, 72.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 63.56], ["whale vocalization", 20.39], ["music", 2.44]], null, [["speech", 47.82], ["boing", 12.44], ["hum", 5.79]], null, [["music", 50.5], ["speech", 14.63], ["didgeridoo", 9.11]], [["mains hum", 40.12], ["hum", 17.59], ["electric shaver, electric razor", 10.13]], [["whale vocalization", 61.01], ["roar", 4.72], ["sound effect", 3.31]], [["hum", 26.72], ["music", 10.61], ["mains hum", 8.02]], [["speech", 50.74], ["cough", 20.71], ["music", 3.64]], null, [["music", 30.12], ["speech", 19.01], ["cattle, bovinae", 11.5]], [["cattle, bovinae", 29.78], ["moo", 18.46], ["livestock, farm animals, working animals", 16.83]], [["speech", 48.08], ["music", 19.28], ["didgeridoo", 8.5]], null, null, null, null, null], "duration": [-0.02, 2.8, 0.2, 0.85, 1.15, 0.6, -0.06, 12.95, 0.3, 5.18, 1.2, 17.29, 4.41, 2.96, 5.33, 3.61, 0.59, 2.6, 2.56, 18.03, 0.99, 1.85, 0.87, 2.79, 1.9]} \ No newline at end of file diff --git a/annotations_1/exCuIisMWl0_filtered.json b/annotations_1/exCuIisMWl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fcca5eebf945aab5c7d407327d029624ac6c78e4 --- /dev/null +++ b/annotations_1/exCuIisMWl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.91], [7.0, 8.8], [11.0, 17.02], [19.0, 20.06], [20.0, 20.8], [21.0, 22.71], [24.0, 29.44], [31.0, 32.53], [34.0, 34.92], [35.0, 40.53], [43.0, 48.52], [50.0, 50.75], [51.0, 52.44], [55.0, 56.66], [58.0, 59.53], [61.0, 65.74], [66.0, 68.81], [71.0, 70.98], [71.0, 71.74], [73.0, 74.43], [76.0, 78.27], [78.0, 81.89], [83.0, 83.4], [85.0, 86.05], [86.0, 86.76], [87.0, 87.67], [88.0, 91.0], [92.0, 92.79], [94.0, 93.72], [95.0, 103.52], [104.0, 118.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 0.0, 100.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 100.0, 99.95, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 99.21, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.91, 1.8, 6.02, 1.06, 0.8, 1.71, 5.44, 1.53, 0.92, 5.53, 5.52, 0.75, 1.44, 1.66, 1.53, 4.74, 2.81, -0.02, 0.74, 1.43, 2.27, 3.89, 0.4, 1.05, 0.76, 0.67, 3.0, 0.79, -0.28, 8.52, 14.5]} \ No newline at end of file diff --git a/annotations_1/exFv7Srgwpk_filtered.json b/annotations_1/exFv7Srgwpk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75bb211d956f0be33cec4e0c0e151cdfe8c51da3 --- /dev/null +++ b/annotations_1/exFv7Srgwpk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.5], [11.0, 11.75], [16.0, 15.75], [18.0, 19.4], [25.0, 26.22], [28.0, 28.98], [30.0, 32.93], [46.0, 55.76], [56.0, 60.4], [67.0, 76.94], [81.0, 82.63], [83.0, 84.2], [86.0, 89.46], [94.0, 124.44]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.5, 37.52, 93.76, 54.3, 0.0, 0.0, 96.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 26.13], ["mains hum", 24.48], ["throbbing", 9.54]], [["music", 27.18], ["wind instrument, woodwind instrument", 17.36], ["speech", 11.41]], null, null, null, null, null, null], "duration": [1.5, 0.75, -0.25, 1.4, 1.22, 0.98, 2.93, 9.76, 4.4, 9.94, 1.63, 1.2, 3.46, 30.44]} \ No newline at end of file diff --git a/annotations_1/exu61pb5X68_filtered.json b/annotations_1/exu61pb5X68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8b9a86c5d14e22ae6742c559888d5dfce3f15cc --- /dev/null +++ b/annotations_1/exu61pb5X68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.41], [13.0, 13.51], [15.0, 16.92], [29.0, 29.86], [31.0, 33.18], [43.0, 43.9], [50.0, 51.27], [58.0, 58.65], [71.0, 72.57], [75.0, 75.02], [78.0, 82.75], [84.0, 85.4]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.68, 0.0, 0.0, 0.0, 0.0, 0.0, 41.12, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 36.63], ["music", 20.23], ["synthesizer", 5.09]], null, null, null, null, null, [["music", 73.85], ["grunt", 3.83], ["synthesizer", 2.56]], null], "duration": [0.41, 0.51, 1.92, 0.86, 2.18, 0.9, 1.27, 0.65, 1.57, 0.02, 4.75, 1.4]} \ No newline at end of file diff --git a/annotations_1/ezOyoEG6GW8_filtered.json b/annotations_1/ezOyoEG6GW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..531a2f3737a91f27e68c2364d92b8b352d2c6f7e --- /dev/null +++ b/annotations_1/ezOyoEG6GW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.95], [3.0, 4.09], [5.0, 5.44], [5.0, 5.98], [8.0, 9.05], [11.0, 11.52], [13.0, 14.08], [23.0, 23.68], [27.0, 28.11], [34.0, 35.55], [38.0, 39.24], [44.0, 45.1], [51.0, 52.12], [57.0, 58.43], [66.0, 66.63], [69.0, 69.21], [70.0, 70.44], [72.0, 72.81], [74.0, 76.23], [95.0, 96.08], [97.0, 97.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.88, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.05, 1.09, 0.44, 0.98, 1.05, 0.52, 1.08, 0.68, 1.11, 1.55, 1.24, 1.1, 1.12, 1.43, 0.63, 0.21, 0.44, 0.81, 2.23, 1.08, 0.56]} \ No newline at end of file diff --git a/annotations_1/f-3Bldu8BJ4_filtered.json b/annotations_1/f-3Bldu8BJ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9848ec3a303b5eee661e37f01b35ed22aef2be6 --- /dev/null +++ b/annotations_1/f-3Bldu8BJ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.09], [8.0, 10.2], [12.0, 15.55], [17.0, 19.48], [21.0, 26.1], [27.0, 31.06], [33.0, 36.26], [37.0, 43.83], [44.0, 46.18], [46.0, 46.21], [64.0, 64.45], [66.0, 70.31], [75.0, 77.09], [82.0, 81.92], [85.0, 89.72], [93.0, 98.47], [100.0, 99.94], [103.0, 109.32], [110.0, 111.86], [113.0, 115.91], [117.0, 127.53], [128.0, 130.23], [132.0, 133.1], [137.0, 137.61], [138.0, 141.12], [144.0, 150.92], [153.0, 156.61], [157.0, 158.53], [159.0, 160.78], [162.0, 162.58], [164.0, 163.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [73.51, 87.92, 82.07, 81.35, 79.41, 78.38, 82.07, 94.81, 73.97, 0.0, 0.0, 62.68, 80.82, 0.0, 68.67, 74.44, 0.0, 57.64, 0.0, 99.59, 64.63, 84.98, 0.0, 0.0, 81.35, 68.8, 75.88, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.09, 2.2, 3.55, 2.48, 5.1, 4.06, 3.26, 6.83, 2.18, 0.21, 0.45, 4.31, 2.09, -0.08, 4.72, 5.47, -0.06, 6.32, 1.86, 2.91, 10.53, 2.23, 1.1, 0.61, 3.12, 6.92, 3.61, 1.53, 1.78, 0.58, -0.14]} \ No newline at end of file diff --git a/annotations_1/f-DiniX_1mI_filtered.json b/annotations_1/f-DiniX_1mI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bf08c41fc2b79477fdacee974b9fbb27f01d0d0 --- /dev/null +++ b/annotations_1/f-DiniX_1mI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.78], [17.0, 17.74], [18.0, 20.87], [28.0, 29.39], [30.0, 30.75], [33.0, 35.83], [37.0, 37.66], [39.0, 39.78], [41.0, 44.93], [48.0, 54.73], [69.0, 72.22]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 64.41, 0.0, 0.0, 31.25, 0.0, 0.0, 32.17, 29.61, 60.42], "audiomae_on_audioset": [null, null, null, null, null, [["explosion", 38.09], ["gunshot, gunfire", 18.54], ["burst, pop", 18.34]], null, null, [["explosion", 36.08], ["burst, pop", 14.05], ["gunshot, gunfire", 9.82]], [["gunshot, gunfire", 29.6], ["explosion", 13.98], ["clang", 9.46]], null], "duration": [0.78, 0.74, 2.87, 1.39, 0.75, 2.83, 0.66, 0.78, 3.93, 6.73, 3.22]} \ No newline at end of file diff --git a/annotations_1/f-EjBwpuVFI_filtered.json b/annotations_1/f-EjBwpuVFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..327a97dac1267e092dd2c587ff0fac2615669909 --- /dev/null +++ b/annotations_1/f-EjBwpuVFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 23.82], [30.0, 43.38], [46.0, 49.06], [51.0, 51.31], [54.0, 56.74], [66.0, 66.99], [74.0, 75.71], [77.0, 76.96], [79.0, 80.43], [84.0, 86.26], [89.0, 99.25], [99.0, 103.98], [104.0, 118.42], [123.0, 134.65], [139.0, 141.72], [149.0, 149.93], [151.0, 152.76], [158.0, 158.43], [171.0, 173.94]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, true, true, false, false, false, false, true], "silence_prob": [34.94, 37.89, 43.56, 0.0, 37.98, 0.0, 0.0, 0.0, 0.0, 40.9, 38.84, 48.31, 37.31, 34.63, 44.55, 0.0, 0.0, 0.0, 39.61], "audiomae_on_audioset": [[["music", 56.38], ["hum", 8.73], ["musical instrument", 5.93]], [["music", 59.06], ["didgeridoo", 17.49], ["insect", 3.35]], [["music", 76.92], ["didgeridoo", 3.25], ["musical instrument", 2.48]], null, [["music", 67.29], ["electronic music", 6.86], ["synthesizer", 3.75]], null, null, null, null, [["speech", 32.91], ["music", 15.78], ["hum", 15.63]], [["music", 70.01], ["hum", 5.02], ["electronic music", 3.41]], [["music", 35.05], ["speech", 24.42], ["whale vocalization", 8.18]], [["music", 35.91], ["speech", 21.4], ["whale vocalization", 5.14]], [["music", 31.24], ["hum", 25.55], ["throbbing", 11.53]], [["music", 49.66], ["pulse", 18.57], ["theremin", 6.33]], null, null, null, [["music", 42.22], ["buzz", 9.42], ["didgeridoo", 4.76]]], "duration": [16.82, 13.38, 3.06, 0.31, 2.74, 0.99, 1.71, -0.04, 1.43, 2.26, 10.25, 4.98, 14.42, 11.65, 2.72, 0.93, 1.76, 0.43, 2.94]} \ No newline at end of file diff --git a/annotations_1/f0-Ea9Ki7YU_filtered.json b/annotations_1/f0-Ea9Ki7YU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cf71aaa6185c4382b70c3a038ce1aa5a68d25d7 --- /dev/null +++ b/annotations_1/f0-Ea9Ki7YU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.48], [15.0, 35.48], [40.0, 96.01], [97.0, 98.04], [100.0, 120.31], [121.0, 121.78], [127.0, 127.33], [129.0, 130.23], [132.0, 132.21], [133.0, 133.93], [138.0, 138.33], [139.0, 140.86], [141.0, 148.05], [149.0, 151.87], [153.0, 154.65], [156.0, 179.29], [180.0, 180.76]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [28.68, 28.37, 0.0, 0.0, 31.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.79, 64.52, 0.0, 29.87, 0.0], "audiomae_on_audioset": [[["music", 43.22], ["buzzer", 10.91], ["theremin", 8.38]], [["music", 71.47], ["didgeridoo", 8.21], ["musical instrument", 3.24]], null, null, [["trombone", 23.01], ["music", 22.49], ["brass instrument", 21.31]], null, null, null, null, null, null, null, null, null, null, [["theremin", 60.98], ["music", 30.85], ["musical instrument", 0.87]], null], "duration": [3.48, 20.48, 56.01, 1.04, 20.31, 0.78, 0.33, 1.23, 0.21, 0.93, 0.33, 1.86, 7.05, 2.87, 1.65, 23.29, 0.76]} \ No newline at end of file diff --git a/annotations_1/f06qimixOOI_filtered.json b/annotations_1/f06qimixOOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39bf11a64bc30e5bd67f7fde2bcca26fcb93a4bf --- /dev/null +++ b/annotations_1/f06qimixOOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.31], [5.0, 6.67], [9.0, 18.32], [20.0, 28.16], [31.0, 51.14], [52.0, 51.71], [55.0, 55.05], [56.0, 65.67], [67.0, 69.21], [73.0, 83.49], [86.0, 91.59]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 81.53, 72.31, 33.6, 0.0, 0.0, 30.5, 50.56, 46.47, 29.07], "audiomae_on_audioset": [null, null, null, null, [["music", 61.82], ["musical instrument", 4.5], ["singing bowl", 2.76]], null, null, [["music", 18.4], ["livestock, farm animals, working animals", 17.67], ["cattle, bovinae", 10.12]], null, [["music", 61.56], ["effects unit", 9.36], ["guitar", 6.42]], [["didgeridoo", 33.32], ["speech", 28.02], ["music", 23.54]]], "duration": [1.31, 1.67, 9.32, 8.16, 20.14, -0.29, 0.05, 9.67, 2.21, 10.49, 5.59]} \ No newline at end of file diff --git a/annotations_1/f0sDG0nnftw_filtered.json b/annotations_1/f0sDG0nnftw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aab1ab2850bfafa19bcefcfeb0439425c6815270 --- /dev/null +++ b/annotations_1/f0sDG0nnftw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 40.37], [51.0, 51.85], [53.0, 53.25], [54.0, 62.99], [79.0, 86.36], [91.0, 91.88], [95.0, 99.27], [101.0, 105.53]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.42, 80.82, 0.0, 78.21, 63.96], "audiomae_on_audioset": [null, null, null, [["music", 43.94], ["didgeridoo", 10.07], ["musical instrument", 9.0]], null, null, null, null], "duration": [33.37, 0.85, 0.25, 8.99, 7.36, 0.88, 4.27, 4.53]} \ No newline at end of file diff --git a/annotations_1/f1bk5a_jaEA_filtered.json b/annotations_1/f1bk5a_jaEA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66a26ddd90f09051a41dd89b48c7e148e2a6efdd --- /dev/null +++ b/annotations_1/f1bk5a_jaEA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.83], [31.0, 31.97], [34.0, 38.6], [40.0, 40.49], [41.0, 57.16], [58.0, 62.01], [77.0, 76.65], [79.0, 78.93], [83.0, 85.68], [89.0, 101.06], [102.0, 102.93], [103.0, 103.81], [104.0, 150.63], [152.0, 154.8], [157.0, 158.16], [161.0, 172.3], [177.0, 177.15], [177.0, 178.09], [179.0, 179.0], [180.0, 179.86], [188.0, 212.45], [218.0, 225.9]], "keep_status": [false, false, true, false, false, true, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 36.86, 0.0, 34.94, 30.54, 0.0, 0.0, 30.66, 31.95, 0.0, 0.0, 0.0, 31.69, 0.0, 29.96, 0.0, 0.0, 0.0, 0.0, 31.57, 30.94], "audiomae_on_audioset": [null, null, [["music", 48.99], ["marimba, xylophone", 6.3], ["glockenspiel", 4.12]], null, [["music", 71.17], ["brass instrument", 4.08], ["echo", 2.93]], [["music", 34.83], ["effects unit", 6.56], ["musical instrument", 5.73]], null, null, [["chant", 28.32], ["choir", 12.67], ["music", 12.61]], [["music", 46.92], ["musical instrument", 13.39], ["brass instrument", 5.44]], null, null, null, [["sidetone", 29.36], ["music", 12.03], ["fly, housefly", 10.36]], null, [["music", 73.8], ["theremin", 4.44], ["singing", 2.16]], null, null, null, null, [["music", 36.68], ["didgeridoo", 33.97], ["theremin", 14.9]], [["music", 42.67], ["animal", 11.55], ["noise", 10.9]]], "duration": [1.83, 0.97, 4.6, 0.49, 16.16, 4.01, -0.35, -0.07, 2.68, 12.06, 0.93, 0.81, 46.63, 2.8, 1.16, 11.3, 0.15, 1.09, 0.0, -0.14, 24.45, 7.9]} \ No newline at end of file diff --git a/annotations_1/f1mbRj3ejAk_filtered.json b/annotations_1/f1mbRj3ejAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e74efa0197d77af7ace0001d20a95c3ac937f93a --- /dev/null +++ b/annotations_1/f1mbRj3ejAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.45], [25.0, 26.62], [28.0, 28.31], [30.0, 31.53], [33.0, 33.08], [35.0, 35.19], [36.0, 36.61], [38.0, 38.37], [45.0, 50.4], [51.0, 51.93], [55.0, 57.77], [58.0, 58.13], [59.0, 61.33], [62.0, 76.59], [80.0, 83.1]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, true, true], "silence_prob": [56.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.31, 0.0, 34.73, 0.0, 32.89, 33.06, 32.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 27.47], ["music", 15.36], ["tick-tock", 5.7]], null, [["music", 30.57], ["throbbing", 29.6], ["hum", 13.84]], null, [["music", 50.36], ["didgeridoo", 12.81], ["speech", 3.37]], [["music", 26.82], ["hum", 19.1], ["throbbing", 14.77]], [["speech", 28.3], ["hum", 12.41], ["music", 11.35]]], "duration": [2.45, 1.62, 0.31, 1.53, 0.08, 0.19, 0.61, 0.37, 5.4, 0.93, 2.77, 0.13, 2.33, 14.59, 3.1]} \ No newline at end of file diff --git a/annotations_1/f2FzrfnfQPY_filtered.json b/annotations_1/f2FzrfnfQPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e5be64a0c96034bab94ed0b1c3fac0b74580cb1 --- /dev/null +++ b/annotations_1/f2FzrfnfQPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.55], [10.0, 11.21], [13.0, 13.8], [16.0, 17.46], [20.0, 21.95], [25.0, 25.14], [26.0, 26.25], [32.0, 31.95], [33.0, 33.54], [36.0, 37.32], [38.0, 38.52], [42.0, 42.74], [44.0, 45.96], [47.0, 48.9], [54.0, 54.8], [64.0, 65.43], [76.0, 79.15], [81.0, 84.2], [86.0, 88.03], [95.0, 106.95], [112.0, 112.24], [114.0, 116.16], [118.0, 121.17], [124.0, 128.17], [133.0, 135.38], [137.0, 139.04], [145.0, 146.4], [149.0, 150.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, true, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.31, 31.92, 38.16, 29.65, 0.0, 29.59, 32.8, 46.33, 28.92, 40.75, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.92], ["mains hum", 29.22], ["fly, housefly", 7.01]], [["whack, thwack", 14.03], ["vehicle", 10.43], ["car", 8.64]], [["throbbing", 24.06], ["music", 23.79], ["hum", 19.79]], [["music", 35.49], ["hum", 12.77], ["mains hum", 8.48]], null, [["music", 63.44], ["theremin", 4.51], ["sound effect", 3.46]], [["music", 25.91], ["hum", 10.22], ["pulse", 6.58]], [["music", 33.48], ["hum", 16.28], ["throbbing", 7.46]], [["music", 54.86], ["musical instrument", 3.91], ["whale vocalization", 3.62]], [["speech", 32.0], ["hum", 16.13], ["music", 15.54]], null, null], "duration": [1.55, 1.21, 0.8, 1.46, 1.95, 0.14, 0.25, -0.05, 0.54, 1.32, 0.52, 0.74, 1.96, 1.9, 0.8, 1.43, 3.15, 3.2, 2.03, 11.95, 0.24, 2.16, 3.17, 4.17, 2.38, 2.04, 1.4, 1.43]} \ No newline at end of file diff --git a/annotations_1/f2Hz2k2PcfI_filtered.json b/annotations_1/f2Hz2k2PcfI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27a3e49abaaaa6d267ea25144b61e9f3c77ad14c --- /dev/null +++ b/annotations_1/f2Hz2k2PcfI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 29.66], [30.0, 32.16], [35.0, 38.03], [39.0, 40.88], [61.0, 62.55], [64.0, 64.71], [74.0, 75.07], [81.0, 81.84], [84.0, 86.04], [90.0, 90.46], [96.0, 97.34], [99.0, 100.41], [102.0, 102.3], [116.0, 117.86], [119.0, 120.19], [121.0, 122.52], [123.0, 123.57], [125.0, 125.07], [136.0, 136.76], [143.0, 143.45], [145.0, 148.63], [150.0, 151.55], [153.0, 154.75], [159.0, 159.71], [164.0, 167.88], [170.0, 170.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.07, 87.37, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 95.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.66, 2.16, 3.03, 1.88, 1.55, 0.71, 1.07, 0.84, 2.04, 0.46, 1.34, 1.41, 0.3, 1.86, 1.19, 1.52, 0.57, 0.07, 0.76, 0.45, 3.63, 1.55, 1.75, 0.71, 3.88, 0.73]} \ No newline at end of file diff --git a/annotations_1/f4LEgmt0roE_filtered.json b/annotations_1/f4LEgmt0roE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6971f69435405ce0cbe2dee87e7129b36aeb9d54 --- /dev/null +++ b/annotations_1/f4LEgmt0roE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.86], [18.0, 18.15], [22.0, 22.67], [79.0, 79.25], [88.0, 90.15], [95.0, 94.96], [99.0, 99.71], [106.0, 107.76], [108.0, 108.75]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.15, 0.67, 0.25, 2.15, -0.04, 0.71, 1.76, 0.75]} \ No newline at end of file diff --git a/annotations_1/f4gmgTebHog_filtered.json b/annotations_1/f4gmgTebHog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ecc79f3b3a0686f5f2e17d7b3378155362bedf38 --- /dev/null +++ b/annotations_1/f4gmgTebHog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [6.0, 6.96], [9.0, 25.51], [26.0, 64.93], [69.0, 71.09], [72.0, 74.53], [77.0, 78.68], [80.0, 87.57], [88.0, 89.04], [90.0, 94.95], [99.0, 140.54], [141.0, 155.22], [158.0, 158.57], [162.0, 161.99], [163.0, 164.62], [168.0, 169.67], [174.0, 175.41], [179.0, 180.76], [182.0, 182.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.9, 0.0, 75.23, 55.81, 0.0, 40.31, 0.0, 34.39, 0.0, 30.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.35], ["hum", 9.54], ["sonar", 6.95]], null, null, null, null, [["music", 65.75], ["hum", 8.59], ["throbbing", 4.94]], null, [["music", 73.53], ["musical instrument", 6.1], ["guitar", 2.16]], null, [["music", 80.6], ["theremin", 5.71], ["scary music", 2.48]], null, null, null, null, null, null, null], "duration": [0.94, 0.96, 16.51, 38.93, 2.09, 2.53, 1.68, 7.57, 1.04, 4.95, 41.54, 14.22, 0.57, -0.01, 1.62, 1.67, 1.41, 1.76, 0.28]} \ No newline at end of file diff --git a/annotations_1/f4wmj-Nq9xA_filtered.json b/annotations_1/f4wmj-Nq9xA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba272ed2de4d8fdd257da8624ed29b16d7f2c4f1 --- /dev/null +++ b/annotations_1/f4wmj-Nq9xA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.26], [13.0, 13.44], [23.0, 22.79], [51.0, 51.49], [66.0, 66.77], [69.0, 69.72], [73.0, 75.57], [77.0, 78.44]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.3, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.26, 0.44, -0.21, 0.49, 0.77, 0.72, 2.57, 1.44]} \ No newline at end of file diff --git a/annotations_1/f6Dan7z0p4c_filtered.json b/annotations_1/f6Dan7z0p4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/f6Dan7z0p4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/f6F6MzMT2g8_filtered.json b/annotations_1/f6F6MzMT2g8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00649e2cc13bb03957e77a57ce3d9f145a56c040 --- /dev/null +++ b/annotations_1/f6F6MzMT2g8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 12.09], [13.0, 16.93], [18.0, 18.32], [19.0, 21.0], [24.0, 27.57], [28.0, 31.51], [35.0, 34.82], [43.0, 44.64], [46.0, 48.1], [57.0, 63.44], [72.0, 72.12], [74.0, 75.52], [78.0, 78.16], [80.0, 79.96], [82.0, 84.06], [92.0, 91.69], [95.0, 94.95], [96.0, 100.28], [113.0, 113.43], [114.0, 118.67], [120.0, 121.12], [122.0, 123.35], [126.0, 126.2], [130.0, 130.15], [144.0, 144.64]], "keep_status": [true, true, false, true, true, true, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [33.03, 32.04, 0.0, 44.72, 37.2, 38.27, 0.0, 0.0, 35.5, 34.92, 0.0, 0.0, 0.0, 0.0, 35.03, 0.0, 0.0, 32.3, 0.0, 35.62, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.26], ["speech", 20.99], ["throbbing", 11.58]], [["music", 43.75], ["speech", 15.22], ["hum", 3.44]], null, [["speech", 20.27], ["music", 14.68], ["fly, housefly", 7.36]], [["music", 19.69], ["foghorn", 18.88], ["speech", 10.07]], [["music", 30.89], ["speech", 26.63], ["radio", 7.85]], null, null, [["music", 55.66], ["speech", 10.33], ["musical instrument", 3.42]], [["music", 63.02], ["throbbing", 5.72], ["noise", 5.58]], null, null, null, null, [["music", 74.66], ["synthesizer", 10.35], ["musical instrument", 4.21]], null, null, [["music", 38.66], ["speech", 17.93], ["hum", 11.79]], null, [["speech", 36.69], ["music", 28.19], ["hum", 9.87]], null, null, null, null, null], "duration": [6.09, 3.93, 0.32, 2.0, 3.57, 3.51, -0.18, 1.64, 2.1, 6.44, 0.12, 1.52, 0.16, -0.04, 2.06, -0.31, -0.05, 4.28, 0.43, 4.67, 1.12, 1.35, 0.2, 0.15, 0.64]} \ No newline at end of file diff --git a/annotations_1/f7l5I6ZPt_Y_filtered.json b/annotations_1/f7l5I6ZPt_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25ea6f117d624d49322552c6b42deaef9d8f3cb1 --- /dev/null +++ b/annotations_1/f7l5I6ZPt_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 44.93], [48.0, 56.34], [59.0, 59.91], [61.0, 62.55], [64.0, 73.94], [75.0, 77.11], [78.0, 85.09], [88.0, 89.65], [91.0, 91.29], [92.0, 92.42], [93.0, 94.83], [96.0, 97.75], [100.0, 100.2], [101.0, 101.63], [103.0, 105.58], [107.0, 108.38], [111.0, 114.12], [115.0, 115.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.48, 0.0, 0.0, 97.22, 74.76, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.79, 0.0, 78.55, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.93, 8.34, 0.91, 1.55, 9.94, 2.11, 7.09, 1.65, 0.29, 0.42, 1.83, 1.75, 0.2, 0.63, 2.58, 1.38, 3.12, 0.86]} \ No newline at end of file diff --git a/annotations_1/f8-6UgJ6dSo_filtered.json b/annotations_1/f8-6UgJ6dSo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de342df75d9ccead19319dbdaff5be0cb87a1734 --- /dev/null +++ b/annotations_1/f8-6UgJ6dSo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.28], [1.0, 0.78], [2.0, 3.45], [5.0, 6.64], [10.0, 10.61], [11.0, 11.42], [12.0, 13.88], [14.0, 15.28], [17.0, 17.86], [20.0, 20.48], [25.0, 25.47], [27.0, 27.84], [28.0, 29.07], [30.0, 30.32], [32.0, 34.6], [35.0, 35.6], [38.0, 38.87], [39.0, 40.36], [42.0, 43.16], [44.0, 44.86], [46.0, 47.09], [49.0, 49.2], [52.0, 54.24], [55.0, 58.73], [59.0, 63.19], [64.0, 65.69], [66.0, 69.3], [69.0, 69.33], [70.0, 69.89], [71.0, 72.05], [74.0, 76.84], [78.0, 78.78], [80.0, 80.43], [81.0, 82.59], [83.0, 84.28], [85.0, 85.8], [86.0, 87.39], [92.0, 92.57], [98.0, 99.23], [100.0, 100.89], [101.0, 102.66], [103.0, 103.52], [104.0, 108.45], [110.0, 121.15], [123.0, 124.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.98, 98.1, 0.0, 65.32, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, -0.22, 1.45, 1.64, 0.61, 0.42, 1.88, 1.28, 0.86, 0.48, 0.47, 0.84, 1.07, 0.32, 2.6, 0.6, 0.87, 1.36, 1.16, 0.86, 1.09, 0.2, 2.24, 3.73, 4.19, 1.69, 3.3, 0.33, -0.11, 1.05, 2.84, 0.78, 0.43, 1.59, 1.28, 0.8, 1.39, 0.57, 1.23, 0.89, 1.66, 0.52, 4.45, 11.15, 1.68]} \ No newline at end of file diff --git a/annotations_1/f86_fLGHu6M_filtered.json b/annotations_1/f86_fLGHu6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..814d31f90c8cb72d23dab44744705340be017312 --- /dev/null +++ b/annotations_1/f86_fLGHu6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [4.0, 5.0], [8.0, 12.46], [13.0, 12.99], [21.0, 21.86], [27.0, 27.97], [36.0, 36.15], [40.0, 40.09], [50.0, 50.8], [53.0, 53.77], [55.0, 55.26], [60.0, 61.16], [62.0, 63.41], [65.0, 66.02], [71.0, 71.91], [73.0, 74.75], [78.0, 79.29], [87.0, 87.37], [89.0, 95.39], [97.0, 100.63], [101.0, 102.12], [110.0, 110.03], [112.0, 116.28], [119.0, 120.29], [130.0, 131.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 99.98, 0.0, 0.0, 82.43, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 1.0, 4.46, -0.01, 0.86, 0.97, 0.15, 0.09, 0.8, 0.77, 0.26, 1.16, 1.41, 1.02, 0.91, 1.75, 1.29, 0.37, 6.39, 3.63, 1.12, 0.03, 4.28, 1.29, 1.43]} \ No newline at end of file diff --git a/annotations_1/f8P51JbIp9g_filtered.json b/annotations_1/f8P51JbIp9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eda4d559fe70cbc8cde790417ae16f26797ebf1d --- /dev/null +++ b/annotations_1/f8P51JbIp9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.28], [19.0, 75.42], [75.0, 75.96]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.28, 56.42, 0.96]} \ No newline at end of file diff --git a/annotations_1/f8dkNziRlHg_filtered.json b/annotations_1/f8dkNziRlHg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94b5980eb6d5590cd63b881b7251f71b903910c1 --- /dev/null +++ b/annotations_1/f8dkNziRlHg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 10.49], [11.0, 19.74], [20.0, 42.84], [44.0, 43.97], [48.0, 49.35], [51.0, 51.9], [54.0, 55.85], [59.0, 60.05], [60.0, 65.94], [66.0, 72.01], [72.0, 78.0], [81.0, 83.52], [86.0, 87.78], [88.0, 92.45], [93.0, 98.66], [99.0, 102.41], [111.0, 111.92], [112.0, 116.01], [117.0, 117.44], [117.0, 118.0], [124.0, 129.19]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, true, false, true, true, true, false, true, false, false, true], "silence_prob": [72.16, 55.74, 36.31, 0.0, 0.0, 0.0, 0.0, 0.0, 41.62, 32.91, 30.21, 44.37, 0.0, 38.25, 40.47, 41.56, 0.0, 36.72, 0.0, 0.0, 42.42], "audiomae_on_audioset": [null, null, [["music", 44.71], ["theremin", 22.98], ["hum", 3.82]], null, null, null, null, null, [["speech", 31.85], ["music", 26.14], ["fart", 7.43]], [["music", 48.82], ["speech", 9.1], ["theremin", 8.51]], [["theremin", 65.6], ["music", 21.11], ["musical instrument", 2.52]], [["music", 36.57], ["didgeridoo", 18.87], ["hum", 7.65]], null, [["music", 37.83], ["didgeridoo", 19.62], ["speech", 6.09]], [["music", 43.94], ["didgeridoo", 9.61], ["theremin", 8.22]], [["music", 62.13], ["brass instrument", 3.78], ["musical instrument", 2.54]], null, [["speech", 26.19], ["music", 21.22], ["foghorn", 12.33]], null, null, [["music", 37.39], ["throbbing", 17.2], ["heart sounds, heartbeat", 9.28]]], "duration": [6.49, 8.74, 22.84, -0.03, 1.35, 0.9, 1.85, 1.05, 5.94, 6.01, 6.0, 2.52, 1.78, 4.45, 5.66, 3.41, 0.92, 4.01, 0.44, 1.0, 5.19]} \ No newline at end of file diff --git a/annotations_1/f96ppJ3DSGE_filtered.json b/annotations_1/f96ppJ3DSGE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa5330686d4ec74b6fc0f55a541db13f25e77096 --- /dev/null +++ b/annotations_1/f96ppJ3DSGE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 53.01], [55.0, 67.66], [72.0, 93.39], [94.0, 143.02], [144.0, 148.09], [149.0, 152.05]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 39.24, 32.66, 0.0, 81.71, 89.36], "audiomae_on_audioset": [null, [["music", 47.56], ["hum", 21.63], ["mains hum", 11.45]], [["hum", 22.04], ["music", 14.05], ["burping, eructation", 6.51]], null, null, null], "duration": [33.01, 12.66, 21.39, 49.02, 4.09, 3.05]} \ No newline at end of file diff --git a/annotations_1/f9Od8yx9gmg_filtered.json b/annotations_1/f9Od8yx9gmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95f657ce81ff9dfa9c340c3b213593178bcf0147 --- /dev/null +++ b/annotations_1/f9Od8yx9gmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 41.59], [44.0, 53.03], [54.0, 80.37], [82.0, 85.83], [88.0, 101.9], [104.0, 125.93], [134.0, 151.36], [154.0, 158.45], [161.0, 166.8], [171.0, 170.67], [173.0, 175.74], [179.0, 180.49], [184.0, 194.17]], "keep_status": [true, false, false, true, false, true, false, true, false, false, false, false, true], "silence_prob": [29.05, 29.18, 28.73, 29.13, 28.85, 29.53, 29.13, 32.96, 36.31, 0.0, 30.12, 0.0, 29.62], "audiomae_on_audioset": [[["music", 26.51], ["hum", 23.71], ["speech", 16.45]], [["music", 64.12], ["noise", 7.23], ["speech", 5.76]], [["speech", 44.05], ["music", 32.21], ["buzz", 2.12]], [["explosion", 24.84], ["rumble", 15.01], ["speech", 6.58]], [["music", 40.66], ["mains hum", 19.94], ["hum", 12.82]], [["music", 22.45], ["whack, thwack", 16.52], ["speech", 9.12]], [["throbbing", 53.38], ["hum", 17.23], ["music", 16.41]], [["music", 36.56], ["hum", 14.01], ["mains hum", 7.85]], [["throbbing", 33.58], ["music", 30.02], ["hum", 20.65]], null, [["music", 73.37], ["electronic music", 4.71], ["speech", 2.75]], null, [["music", 57.41], ["hum", 6.96], ["mains hum", 5.59]]], "duration": [27.59, 9.03, 26.37, 3.83, 13.9, 21.93, 17.36, 4.45, 5.8, -0.33, 2.74, 1.49, 10.17]} \ No newline at end of file diff --git a/annotations_1/f9Wq05WVXiQ_filtered.json b/annotations_1/f9Wq05WVXiQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4eefd62c4ebbfddead142e324adfd8e0d643ae02 --- /dev/null +++ b/annotations_1/f9Wq05WVXiQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.97], [7.0, 8.07], [9.0, 8.78], [17.0, 16.95], [18.0, 19.84], [20.0, 20.36], [24.0, 25.83], [27.0, 28.11], [29.0, 40.02], [42.0, 42.03], [43.0, 44.71], [47.0, 48.78], [49.0, 52.62], [54.0, 69.09], [70.0, 158.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.42, 0.0, 0.0, 0.0, 44.46, 59.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["fly, housefly", 47.39], ["mosquito", 17.37], ["insect", 16.99]], null, null, null, [["speech", 48.4], ["hum", 19.67], ["mains hum", 7.91]], null, null], "duration": [1.97, 1.07, -0.22, -0.05, 1.84, 0.36, 1.83, 1.11, 11.02, 0.03, 1.71, 1.78, 3.62, 15.09, 88.7]} \ No newline at end of file diff --git a/annotations_1/f9wFKCfic8Q_filtered.json b/annotations_1/f9wFKCfic8Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e0b983a81a38fa950d797f45450901858a4c57e --- /dev/null +++ b/annotations_1/f9wFKCfic8Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 10.59], [11.0, 19.6], [20.0, 25.35], [27.0, 28.39], [29.0, 30.37], [33.0, 59.56], [64.0, 72.47], [76.0, 86.91], [92.0, 95.18]], "keep_status": [false, true, true, false, false, true, false, false, false], "silence_prob": [38.46, 34.2, 32.22, 0.0, 0.0, 31.09, 31.76, 35.24, 35.51], "audiomae_on_audioset": [[["music", 41.56], ["hum", 19.26], ["throbbing", 9.51]], [["livestock, farm animals, working animals", 32.62], ["speech", 14.61], ["cattle, bovinae", 10.16]], [["speech", 33.5], ["music", 32.94], ["electronic music", 3.14]], null, null, [["music", 28.44], ["speech", 16.65], ["livestock, farm animals, working animals", 9.59]], [["music", 41.18], ["speech", 32.05], ["explosion", 6.13]], [["music", 44.23], ["throbbing", 21.7], ["hum", 19.04]], [["speech", 51.17], ["music", 18.92], ["boing", 8.17]]], "duration": [5.59, 8.6, 5.35, 1.39, 1.37, 26.56, 8.47, 10.91, 3.18]} \ No newline at end of file diff --git a/annotations_1/fAaVf_wel0c_filtered.json b/annotations_1/fAaVf_wel0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0eda908f7d469aa0d9fdcef67c1fa07d83dfed7d --- /dev/null +++ b/annotations_1/fAaVf_wel0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.26], [9.0, 8.58], [13.0, 14.32], [25.0, 27.4], [29.0, 29.0], [37.0, 39.92], [41.0, 42.74], [44.0, 44.66], [47.0, 47.83], [49.0, 49.77], [51.0, 51.04], [55.0, 55.41], [57.0, 56.89], [57.0, 56.93], [57.0, 57.0], [57.0, 57.59], [58.0, 57.81], [58.0, 57.94], [59.0, 59.58], [75.0, 75.41], [85.0, 87.24], [90.0, 93.77], [111.0, 110.64], [113.0, 114.57], [117.0, 118.4], [126.0, 126.23], [128.0, 130.05], [131.0, 133.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 94.81, 0.0, 32.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.87, 30.44, 0.0, 0.0, 0.0, 0.0, 29.47, 29.17], "audiomae_on_audioset": [null, null, null, null, null, [["music", 66.24], ["musical instrument", 11.32], ["harp", 6.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.26], ["musical instrument", 6.99], ["didgeridoo", 6.73]], [["music", 66.87], ["singing", 2.51], ["synthetic singing", 1.97]], null, null, null, null, [["music", 57.47], ["musical instrument", 4.25], ["didgeridoo", 3.49]], [["music", 52.68], ["theremin", 5.64], ["musical instrument", 4.11]]], "duration": [0.26, -0.42, 1.32, 2.4, 0.0, 2.92, 1.74, 0.66, 0.83, 0.77, 0.04, 0.41, -0.11, -0.07, 0.0, 0.59, -0.19, -0.06, 0.58, 0.41, 2.24, 3.77, -0.36, 1.57, 1.4, 0.23, 2.05, 2.83]} \ No newline at end of file diff --git a/annotations_1/fAdsL7AXW6A_filtered.json b/annotations_1/fAdsL7AXW6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0eda811c1a6b994e97a7766eac51b33272fce15 --- /dev/null +++ b/annotations_1/fAdsL7AXW6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [5.0, 6.0], [7.0, 7.6], [9.0, 10.17], [30.0, 31.53], [32.0, 32.88], [38.0, 39.34], [42.0, 90.34], [91.0, 119.94]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 16.54], ["buzz", 10.57], ["cattle, bovinae", 10.18]]], "duration": [0.83, 1.0, 0.6, 1.17, 1.53, 0.88, 1.34, 48.34, 28.94]} \ No newline at end of file diff --git a/annotations_1/fAiJAcgjWeQ_filtered.json b/annotations_1/fAiJAcgjWeQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f5706b119fdebdf9c3356a623b61fe531da9b56 --- /dev/null +++ b/annotations_1/fAiJAcgjWeQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.72], [15.0, 15.35], [17.0, 19.03], [19.0, 20.97], [22.0, 23.43], [25.0, 25.76], [27.0, 27.6], [29.0, 31.14], [33.0, 33.35], [35.0, 36.1], [36.0, 38.58], [41.0, 41.17], [52.0, 54.38], [55.0, 57.69], [63.0, 63.27], [65.0, 65.35], [67.0, 66.97], [67.0, 67.31], [68.0, 70.17], [73.0, 73.58], [76.0, 76.18], [78.0, 78.33], [79.0, 79.39], [80.0, 80.55], [81.0, 81.5], [87.0, 87.35], [91.0, 92.31], [94.0, 97.48], [98.0, 99.87], [100.0, 106.25], [113.0, 114.29], [116.0, 119.13], [120.0, 122.18], [123.0, 128.63], [129.0, 129.81], [131.0, 131.4], [132.0, 133.25], [134.0, 134.92], [140.0, 141.96], [143.0, 143.63], [146.0, 145.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 78.89, 0.0, 0.0, 0.0, 0.0, 95.23, 0.0, 0.0, 86.27, 0.0, 88.46, 95.91, 0.0, 0.0, 0.0, 0.0, 89.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 87.55, 0.0, 99.16, 98.99, 60.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 0.35, 2.03, 1.97, 1.43, 0.76, 0.6, 2.14, 0.35, 1.1, 2.58, 0.17, 2.38, 2.69, 0.27, 0.35, -0.03, 0.31, 2.17, 0.58, 0.18, 0.33, 0.39, 0.55, 0.5, 0.35, 1.31, 3.48, 1.87, 6.25, 1.29, 3.13, 2.18, 5.63, 0.81, 0.4, 1.25, 0.92, 1.96, 0.63, -0.07]} \ No newline at end of file diff --git a/annotations_1/fB5HTcFhCso_filtered.json b/annotations_1/fB5HTcFhCso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b8b98e88d942d4c8f8f93c2038d3818b7f31c26 --- /dev/null +++ b/annotations_1/fB5HTcFhCso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.84], [11.0, 11.55], [12.0, 12.56], [18.0, 18.54], [20.0, 20.82], [23.0, 24.24], [31.0, 39.73], [42.0, 43.16], [44.0, 45.6], [50.0, 53.16], [56.0, 59.29], [61.0, 64.91], [66.0, 71.17], [73.0, 88.45], [89.0, 89.73], [90.0, 90.81], [91.0, 92.69], [97.0, 98.95], [102.0, 102.41], [104.0, 107.27], [109.0, 114.66], [115.0, 116.61], [117.0, 118.18], [124.0, 126.0], [128.0, 131.94], [132.0, 133.57], [142.0, 143.61], [148.0, 148.78], [149.0, 150.47], [154.0, 155.46], [156.0, 157.92], [159.0, 160.68], [165.0, 167.34], [168.0, 170.09], [173.0, 175.76], [176.0, 177.2], [178.0, 179.19], [184.0, 185.45]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.49, 0.0, 0.0, 42.3, 56.18, 45.65, 42.3, 31.5, 0.0, 0.0, 0.0, 0.0, 0.0, 42.39, 51.55, 0.0, 0.0, 48.52, 50.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.25, 69.74, 57.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 52.15], ["hum", 7.67], ["throbbing", 6.32]], null, null, [["cattle, bovinae", 42.3], ["moo", 32.14], ["livestock, farm animals, working animals", 12.26]], null, [["music", 16.22], ["mains hum", 14.85], ["hum", 12.14]], [["whale vocalization", 37.9], ["music", 24.06], ["theremin", 7.26]], [["music", 66.47], ["throbbing", 16.9], ["didgeridoo", 2.71]], null, null, null, null, null, [["music", 25.64], ["hum", 9.0], ["speech", 8.1]], null, null, null, [["speech", 32.17], ["hum", 9.95], ["mains hum", 8.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 0.55, 0.56, 0.54, 0.82, 1.24, 8.73, 1.16, 1.6, 3.16, 3.29, 3.91, 5.17, 15.45, 0.73, 0.81, 1.69, 1.95, 0.41, 3.27, 5.66, 1.61, 1.18, 2.0, 3.94, 1.57, 1.61, 0.78, 1.47, 1.46, 1.92, 1.68, 2.34, 2.09, 2.76, 1.2, 1.19, 1.45]} \ No newline at end of file diff --git a/annotations_1/fB8_lNQJ-JM_filtered.json b/annotations_1/fB8_lNQJ-JM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35b7a1cbcd5b5b805884e2530f502a1a58ced305 --- /dev/null +++ b/annotations_1/fB8_lNQJ-JM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.86], [18.0, 18.23], [18.0, 28.9], [32.0, 31.97], [32.0, 32.53], [36.0, 36.31], [38.0, 39.24], [40.0, 40.76], [43.0, 43.21], [45.0, 45.81], [48.0, 51.95], [62.0, 62.67], [65.0, 65.52], [66.0, 66.48], [67.0, 68.15], [69.0, 69.92], [71.0, 72.33], [75.0, 76.25], [82.0, 82.97], [84.0, 85.8], [88.0, 89.02], [89.0, 89.97], [92.0, 92.89], [94.0, 95.66], [99.0, 99.15], [101.0, 102.69], [104.0, 107.99], [109.0, 110.66], [111.0, 114.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 44.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.14, 0.0, 47.82], "audiomae_on_audioset": [null, null, [["boat, water vehicle", 33.02], ["speech", 26.9], ["rowboat, canoe, kayak", 20.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 10.73], ["music", 8.25], ["speech", 7.61]]], "duration": [1.86, 0.23, 10.9, -0.03, 0.53, 0.31, 1.24, 0.76, 0.21, 0.81, 3.95, 0.67, 0.52, 0.48, 1.15, 0.92, 1.33, 1.25, 0.97, 1.8, 1.02, 0.97, 0.89, 1.66, 0.15, 1.69, 3.99, 1.66, 3.56]} \ No newline at end of file diff --git a/annotations_1/fBNzgfFkvEo_filtered.json b/annotations_1/fBNzgfFkvEo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a34a374e7e6780da9a131313701a93a14f9a31d --- /dev/null +++ b/annotations_1/fBNzgfFkvEo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 108.77], [110.0, 147.78]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [58.77, 37.78]} \ No newline at end of file diff --git a/annotations_1/fBTODK66ymw_filtered.json b/annotations_1/fBTODK66ymw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7f6766c4794f78be559b108f93e6a8734f66c05 --- /dev/null +++ b/annotations_1/fBTODK66ymw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.37], [6.0, 7.35], [10.0, 15.65], [17.0, 63.05], [67.0, 73.63], [76.0, 81.55], [83.0, 85.31], [89.0, 106.0], [111.0, 111.91], [113.0, 115.25], [117.0, 118.44], [119.0, 119.79], [120.0, 121.29], [122.0, 134.67], [135.0, 149.55], [153.0, 153.54], [154.0, 153.62], [154.0, 154.74], [157.0, 157.05], [161.0, 160.83], [164.0, 164.81], [170.0, 183.78], [185.0, 186.19]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 28.64, 0.0, 30.09, 30.04, 31.37, 28.78, 0.0, 29.08, 0.0, 0.0, 0.0, 28.64, 29.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.15, 0.0], "audiomae_on_audioset": [null, null, [["buzz", 26.54], ["electric shaver, electric razor", 15.6], ["hum", 13.94]], null, [["throbbing", 54.53], ["music", 20.72], ["hum", 15.67]], [["hum", 42.97], ["throbbing", 26.99], ["mains hum", 18.21]], [["music", 44.37], ["throbbing", 18.72], ["hum", 10.08]], [["music", 71.55], ["buzz", 3.53], ["cacophony", 2.91]], null, [["electric shaver, electric razor", 38.33], ["music", 24.27], ["mains hum", 9.4]], null, null, null, [["music", 26.71], ["buzz", 16.99], ["hum", 15.83]], [["music", 29.35], ["hum", 23.21], ["mains hum", 21.07]], null, null, null, null, null, null, [["mains hum", 33.89], ["hum", 27.65], ["music", 19.9]], null], "duration": [0.37, 1.35, 5.65, 46.05, 6.63, 5.55, 2.31, 17.0, 0.91, 2.25, 1.44, 0.79, 1.29, 12.67, 14.55, 0.54, -0.38, 0.74, 0.05, -0.17, 0.81, 13.78, 1.19]} \ No newline at end of file diff --git a/annotations_1/fBXXvn4s-74_filtered.json b/annotations_1/fBXXvn4s-74_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2cc97b6e1a1dee6edc0ce0dc4d00b6777510852c --- /dev/null +++ b/annotations_1/fBXXvn4s-74_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.49], [34.0, 34.7], [37.0, 37.86], [52.0, 51.97], [86.0, 86.32], [98.0, 98.15], [110.0, 112.35], [120.0, 120.56], [136.0, 136.75], [143.0, 142.86], [145.0, 146.1], [149.0, 148.8], [153.0, 153.91], [175.0, 176.15], [207.0, 209.22], [213.0, 216.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.98, 91.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.49, 0.7, 0.86, -0.03, 0.32, 0.15, 2.35, 0.56, 0.75, -0.14, 1.1, -0.2, 0.91, 1.15, 2.22, 3.57]} \ No newline at end of file diff --git a/annotations_1/fB_fwuJOx7I_filtered.json b/annotations_1/fB_fwuJOx7I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b82114dcc07741991bf311b69fb2c4680a1a3b60 --- /dev/null +++ b/annotations_1/fB_fwuJOx7I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.02], [28.0, 40.53], [41.0, 41.88], [43.0, 45.77], [47.0, 48.14], [49.0, 49.42], [53.0, 54.06], [55.0, 56.12], [57.0, 58.72], [60.0, 65.08], [66.0, 68.5], [70.0, 70.43], [71.0, 71.64], [74.0, 79.56], [84.0, 87.86], [88.0, 88.92], [90.0, 94.51], [100.0, 100.35], [102.0, 101.98], [103.0, 105.31], [107.0, 107.08], [109.0, 121.12]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.65, 0.0, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 66.51, 99.73, 0.0, 0.0, 88.28, 29.92, 0.0, 52.39, 0.0, 0.0, 95.91, 0.0, 38.84], "audiomae_on_audioset": [null, [["music", 18.16], ["thunk", 11.38], ["speech", 10.65]], null, null, null, null, null, null, null, null, null, null, null, null, [["clang", 45.4], ["music", 17.06], ["ding", 16.73]], null, null, null, null, null, null, [["music", 77.98], ["hip hop music", 2.57], ["dubstep", 2.34]]], "duration": [1.02, 12.53, 0.88, 2.77, 1.14, 0.42, 1.06, 1.12, 1.72, 5.08, 2.5, 0.43, 0.64, 5.56, 3.86, 0.92, 4.51, 0.35, -0.02, 2.31, 0.08, 12.12]} \ No newline at end of file diff --git a/annotations_1/fBpNFLngzT4_filtered.json b/annotations_1/fBpNFLngzT4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc3c80b9452615ab118d6bff9d469a6e8bc73231 --- /dev/null +++ b/annotations_1/fBpNFLngzT4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.02], [7.0, 8.14], [10.0, 13.98], [18.0, 18.66], [20.0, 20.49], [23.0, 27.94], [29.0, 45.4], [48.0, 64.44], [65.0, 65.52], [68.0, 77.58], [83.0, 82.78], [83.0, 83.39], [84.0, 86.14], [87.0, 87.13], [90.0, 96.23], [105.0, 106.51], [108.0, 108.28], [113.0, 116.88], [117.0, 117.59], [127.0, 129.05], [131.0, 130.94]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [61.97, 0.0, 38.93, 0.0, 0.0, 33.67, 33.36, 33.33, 0.0, 37.53, 0.0, 0.0, 33.92, 0.0, 33.28, 0.0, 0.0, 34.96, 0.0, 34.39, 0.0], "audiomae_on_audioset": [null, null, [["music", 18.0], ["speech", 13.17], ["hum", 7.43]], null, null, [["speech", 63.91], ["throbbing", 3.74], ["fart", 3.45]], [["speech", 62.22], ["music", 9.92], ["hum", 5.29]], [["music", 20.08], ["hum", 15.62], ["throbbing", 11.94]], null, [["music", 72.25], ["musical instrument", 3.86], ["speech", 2.94]], null, null, [["music", 69.12], ["boing", 8.06], ["musical instrument", 2.59]], null, [["boing", 42.29], ["music", 32.03], ["speech", 3.26]], null, null, [["music", 69.28], ["musical instrument", 6.64], ["saxophone", 4.1]], null, [["music", 42.1], ["boing", 12.44], ["musical instrument", 4.41]], null], "duration": [2.02, 1.14, 3.98, 0.66, 0.49, 4.94, 16.4, 16.44, 0.52, 9.58, -0.22, 0.39, 2.14, 0.13, 6.23, 1.51, 0.28, 3.88, 0.59, 2.05, -0.06]} \ No newline at end of file diff --git a/annotations_1/fC1zzL9DjdU_filtered.json b/annotations_1/fC1zzL9DjdU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c4c80bf4e9da3e13158ba73fa0711393d226ef9 --- /dev/null +++ b/annotations_1/fC1zzL9DjdU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.41], [18.0, 19.68], [24.0, 24.54], [39.0, 39.07], [48.0, 49.23], [50.0, 51.93], [56.0, 57.43], [58.0, 57.97], [58.0, 59.66], [61.0, 61.89], [65.0, 65.69], [68.0, 68.67], [70.0, 73.55], [80.0, 81.58], [83.0, 84.21], [87.0, 87.88], [89.0, 89.02], [89.0, 90.1], [96.0, 100.18], [101.0, 103.3], [105.0, 108.48], [112.0, 117.63], [118.0, 124.8], [135.0, 135.68], [137.0, 138.3], [140.0, 145.1], [154.0, 153.82], [154.0, 155.26], [156.0, 160.56], [165.0, 165.57], [168.0, 168.88], [172.0, 173.77], [176.0, 176.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.09, 81.71, 74.44, 52.1, 87.92, 0.0, 0.0, 83.52, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.41, 1.68, 0.54, 0.07, 1.23, 1.93, 1.43, -0.03, 1.66, 0.89, 0.69, 0.67, 3.55, 1.58, 1.21, 0.88, 0.02, 1.1, 4.18, 2.3, 3.48, 5.63, 6.8, 0.68, 1.3, 5.1, -0.18, 1.26, 4.56, 0.57, 0.88, 1.77, 0.0]} \ No newline at end of file diff --git a/annotations_1/fCNsIYsWjXo_filtered.json b/annotations_1/fCNsIYsWjXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..baf4b2d001cce142a26aa77f6e0c0bcf14047160 --- /dev/null +++ b/annotations_1/fCNsIYsWjXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 19.63], [22.0, 23.03], [24.0, 24.71], [26.0, 26.6], [27.0, 27.46], [30.0, 30.27], [31.0, 31.51], [33.0, 33.84], [35.0, 35.56], [36.0, 37.76], [42.0, 42.99], [45.0, 45.82], [51.0, 51.7], [53.0, 53.38], [56.0, 56.03], [57.0, 56.94], [58.0, 58.77], [67.0, 66.9], [69.0, 69.18], [70.0, 69.97], [71.0, 71.09], [73.0, 73.75], [76.0, 76.54], [82.0, 82.31], [83.0, 83.39], [85.0, 85.94], [86.0, 87.56], [88.0, 89.16], [90.0, 90.96], [97.0, 97.82], [100.0, 99.79], [100.0, 101.66], [106.0, 106.68], [108.0, 109.27], [111.0, 113.04], [114.0, 115.87], [117.0, 118.94], [123.0, 123.48]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [30.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.23, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 41.02], ["speech", 11.08], ["hum", 8.17]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 16.77], ["cattle, bovinae", 9.87], ["moo", 6.28]], null, null, null], "duration": [15.63, 1.03, 0.71, 0.6, 0.46, 0.27, 0.51, 0.84, 0.56, 1.76, 0.99, 0.82, 0.7, 0.38, 0.03, -0.06, 0.77, -0.1, 0.18, -0.03, 0.09, 0.75, 0.54, 0.31, 0.39, 0.94, 1.56, 1.16, 0.96, 0.82, -0.21, 1.66, 0.68, 1.27, 2.04, 1.87, 1.94, 0.48]} \ No newline at end of file diff --git a/annotations_1/fDcZoI_wy_w_filtered.json b/annotations_1/fDcZoI_wy_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..169b89fd874c8f7022b44956eca8db838bac2485 --- /dev/null +++ b/annotations_1/fDcZoI_wy_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[91.0, 110.42], [111.0, 111.59], [113.0, 113.88], [117.0, 129.44]], "keep_status": [false, false, false, true], "silence_prob": [33.41, 0.0, 0.0, 32.2], "audiomae_on_audioset": [[["music", 74.51], ["glass", 5.73], ["smash, crash", 5.25]], null, null, [["mains hum", 21.2], ["hum", 20.6], ["noise", 14.92]]], "duration": [19.42, 0.59, 0.88, 12.44]} \ No newline at end of file diff --git a/annotations_1/fDeQjTPTlDE_filtered.json b/annotations_1/fDeQjTPTlDE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42cba589f3cb07c8a4103e5b12a1431aa97b2987 --- /dev/null +++ b/annotations_1/fDeQjTPTlDE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.4], [12.0, 12.36], [18.0, 18.03], [24.0, 24.17], [28.0, 31.89], [38.0, 38.48], [40.0, 40.05], [40.0, 40.83], [45.0, 45.45], [50.0, 51.93], [54.0, 57.05], [68.0, 68.08], [71.0, 72.44], [80.0, 80.16], [81.0, 82.16], [88.0, 89.01], [91.0, 91.29], [92.0, 92.85], [94.0, 94.53], [100.0, 100.65], [105.0, 105.56], [114.0, 113.63], [121.0, 121.85], [133.0, 133.1], [138.0, 139.11], [146.0, 158.6], [160.0, 160.79], [162.0, 165.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.62, 0.0, 0.0, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.76, 0.0, 42.69], "audiomae_on_audioset": [null, null, null, null, [["cattle, bovinae", 27.03], ["livestock, farm animals, working animals", 25.57], ["animal", 18.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.47], ["speech", 20.12], ["hum", 12.83]], null, [["speech", 51.03], ["hum", 15.11], ["music", 5.07]]], "duration": [0.4, 0.36, 0.03, 0.17, 3.89, 0.48, 0.05, 0.83, 0.45, 1.93, 3.05, 0.08, 1.44, 0.16, 1.16, 1.01, 0.29, 0.85, 0.53, 0.65, 0.56, -0.37, 0.85, 0.1, 1.11, 12.6, 0.79, 3.75]} \ No newline at end of file diff --git a/annotations_1/fEA9BJfaaYA_filtered.json b/annotations_1/fEA9BJfaaYA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58d20bcd81a2a222ac6eb18f5d3733e4f0c367b3 --- /dev/null +++ b/annotations_1/fEA9BJfaaYA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 62.88], [64.0, 69.47], [70.0, 71.04], [72.0, 80.16], [83.0, 98.96], [99.0, 162.87], [173.0, 174.75], [176.0, 177.9]], "keep_status": [true, false, false, false, false, false, false, false], "silence_prob": [36.48, 99.98, 0.0, 79.94, 54.04, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 27.53], ["groan", 9.07], ["music", 7.23]], null, null, null, null, null, null, null], "duration": [14.88, 5.47, 1.04, 8.16, 15.96, 63.87, 1.75, 1.9]} \ No newline at end of file diff --git a/annotations_1/fEsN1FMfBvI_filtered.json b/annotations_1/fEsN1FMfBvI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c34c56157c3d730607fcfd0c3052ba173081b2b1 --- /dev/null +++ b/annotations_1/fEsN1FMfBvI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.52], [3.0, 4.09], [7.0, 9.66], [11.0, 12.82], [14.0, 14.4], [16.0, 16.55], [21.0, 22.01], [23.0, 23.43], [26.0, 26.15], [29.0, 30.18], [30.0, 38.45], [39.0, 40.74], [44.0, 53.74], [57.0, 58.99], [64.0, 64.83], [68.0, 117.05], [118.0, 152.96], [154.0, 159.34], [160.0, 160.51], [163.0, 175.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 69.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.87, 0.0, 31.32, 0.0, 0.0, 0.0, 0.0, 40.7, 0.0, 38.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 18.92], ["fly, housefly", 9.7], ["speech", 7.58]], null, [["mains hum", 48.62], ["hum", 42.33], ["throbbing", 6.27]], null, null, null, null, [["music", 31.13], ["hum", 20.79], ["mains hum", 18.49]], null, [["mains hum", 31.02], ["hum", 26.92], ["music", 21.94]]], "duration": [0.52, 1.09, 2.66, 1.82, 0.4, 0.55, 1.01, 0.43, 0.15, 1.18, 8.45, 1.74, 9.74, 1.99, 0.83, 49.05, 34.96, 5.34, 0.51, 12.78]} \ No newline at end of file diff --git a/annotations_1/fEwSNiZ3zn4_filtered.json b/annotations_1/fEwSNiZ3zn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53051f32d62c0cf503d97963132da6962ea9f292 --- /dev/null +++ b/annotations_1/fEwSNiZ3zn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.23], [9.0, 9.02], [10.0, 10.0], [13.0, 13.46], [14.0, 14.34], [17.0, 17.63], [19.0, 19.48], [21.0, 21.79], [28.0, 28.31], [29.0, 29.62], [32.0, 32.34], [38.0, 41.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 73.69], ["speech", 9.45], ["hum", 7.37]]], "duration": [0.23, 0.02, 0.0, 0.46, 0.34, 0.63, 0.48, 0.79, 0.31, 0.62, 0.34, 3.66]} \ No newline at end of file diff --git a/annotations_1/fFE8_U07a5I_filtered.json b/annotations_1/fFE8_U07a5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78be30610782bc77aa7e40dc6bcba99d58ac3310 --- /dev/null +++ b/annotations_1/fFE8_U07a5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.18], [6.0, 6.49], [7.0, 18.59], [19.0, 19.95], [20.0, 20.78], [25.0, 25.74], [29.0, 29.44], [31.0, 31.85], [35.0, 35.5], [45.0, 45.42], [49.0, 50.19], [52.0, 53.18], [54.0, 57.74], [59.0, 61.28], [63.0, 68.25], [69.0, 71.02], [71.0, 73.23], [74.0, 74.09], [76.0, 76.74], [78.0, 78.92], [80.0, 81.82], [85.0, 90.26], [93.0, 92.85], [94.0, 94.58], [96.0, 97.19], [97.0, 99.17], [101.0, 103.38], [104.0, 111.13], [112.0, 112.82], [113.0, 115.3], [116.0, 120.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 100.0, 99.84, 100.0, 99.99, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 63.85, 100.0, 100.0, 0.0, 71.87, 57.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.18, 0.49, 11.59, 0.95, 0.78, 0.74, 0.44, 0.85, 0.5, 0.42, 1.19, 1.18, 3.74, 2.28, 5.25, 2.02, 2.23, 0.09, 0.74, 0.92, 1.82, 5.26, -0.15, 0.58, 1.19, 2.17, 2.38, 7.13, 0.82, 2.3, 4.34]} \ No newline at end of file diff --git a/annotations_1/fHerVxCsbyc_filtered.json b/annotations_1/fHerVxCsbyc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44ed62312ebe93c1d4f4e5b6da7ee89076d45550 --- /dev/null +++ b/annotations_1/fHerVxCsbyc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.9], [5.0, 11.15], [20.0, 22.27], [23.0, 24.49], [26.0, 26.97], [37.0, 37.57], [38.0, 38.99], [39.0, 39.46], [40.0, 41.94], [45.0, 47.28], [47.0, 47.49], [48.0, 48.66], [50.0, 50.16], [54.0, 55.92], [58.0, 59.43], [65.0, 65.25], [72.0, 73.04], [76.0, 77.6], [78.0, 83.74], [85.0, 86.34], [88.0, 88.38], [89.0, 89.65], [92.0, 91.66]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.83, 77.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 65.98], ["fart", 7.99], ["radio", 4.37]], null, null, null, null, null, null, null, [["speech", 34.68], ["radio", 26.95], ["sidetone", 6.02]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.9, 6.15, 2.27, 1.49, 0.97, 0.57, 0.99, 0.46, 1.94, 2.28, 0.49, 0.66, 0.16, 1.92, 1.43, 0.25, 1.04, 1.6, 5.74, 1.34, 0.38, 0.65, -0.34]} \ No newline at end of file diff --git a/annotations_1/fIfQbocblZc_filtered.json b/annotations_1/fIfQbocblZc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..725bec80814ab09a4ef3d15345be2f6dbd167a81 --- /dev/null +++ b/annotations_1/fIfQbocblZc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.63], [20.0, 20.49], [21.0, 24.0], [26.0, 26.67], [29.0, 30.13], [31.0, 34.62], [35.0, 36.88], [39.0, 50.95], [56.0, 55.61], [56.0, 58.82], [59.0, 65.87], [67.0, 114.57], [115.0, 131.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 79.94, 0.0, 0.0, 85.17, 0.0, 74.44, 0.0, 81.17, 73.51, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.63, 0.49, 3.0, 0.67, 1.13, 3.62, 1.88, 11.95, -0.39, 2.82, 6.87, 47.57, 16.79]} \ No newline at end of file diff --git a/annotations_1/fJV0KtMZ7x8_filtered.json b/annotations_1/fJV0KtMZ7x8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9b4cbb9f3a2661a3a2dc30a66098b97b85a6d89 --- /dev/null +++ b/annotations_1/fJV0KtMZ7x8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.01], [15.0, 16.24], [17.0, 18.08], [18.0, 18.47], [19.0, 24.93], [26.0, 25.83], [26.0, 26.2], [27.0, 27.33], [35.0, 35.75], [37.0, 37.59], [39.0, 40.85], [41.0, 42.16], [53.0, 53.0], [55.0, 58.43], [79.0, 79.66], [92.0, 92.2], [95.0, 96.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [99.97, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.52, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 16.35], ["moo", 15.58], ["cattle, bovinae", 9.85]], null, null, null], "duration": [5.01, 1.24, 1.08, 0.47, 5.93, -0.17, 0.2, 0.33, 0.75, 0.59, 1.85, 1.16, 0.0, 3.43, 0.66, 0.2, 1.4]} \ No newline at end of file diff --git a/annotations_1/fJlJX4Rj_WU_filtered.json b/annotations_1/fJlJX4Rj_WU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f7158b2a30fbbef9411cfe3761e1a6ca4a24cee --- /dev/null +++ b/annotations_1/fJlJX4Rj_WU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.72], [12.0, 12.82], [14.0, 15.03], [16.0, 16.14], [18.0, 19.23], [23.0, 22.84], [25.0, 26.54], [28.0, 28.07], [28.0, 28.95], [29.0, 29.07], [33.0, 48.69], [51.0, 57.52], [60.0, 60.34], [61.0, 70.51], [76.0, 76.32], [81.0, 81.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.16, 30.63, 0.0, 30.04, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 61.02], ["quack", 24.13], ["boing", 5.88]], [["music", 56.39], ["didgeridoo", 5.85], ["boing", 5.69]], null, [["music", 19.55], ["siren", 16.69], ["emergency vehicle", 13.44]], null, null], "duration": [0.72, 0.82, 1.03, 0.14, 1.23, -0.16, 1.54, 0.07, 0.95, 0.07, 15.69, 6.52, 0.34, 9.51, 0.32, 0.24]} \ No newline at end of file diff --git a/annotations_1/fKGjSXtCou4_filtered.json b/annotations_1/fKGjSXtCou4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..301da6ecfc9bb51ca72d26ceac25daae71e0ed69 --- /dev/null +++ b/annotations_1/fKGjSXtCou4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.55], [5.0, 6.56], [7.0, 7.42], [9.0, 9.36], [11.0, 16.68], [19.0, 21.81], [22.0, 22.23], [22.0, 22.47], [22.0, 25.03], [26.0, 31.04], [34.0, 39.04], [40.0, 59.44], [59.0, 59.51], [60.0, 60.84], [61.0, 61.15], [61.0, 64.22], [65.0, 76.52], [79.0, 80.72], [82.0, 89.48], [91.0, 94.83], [99.0, 100.82], [102.0, 102.91], [105.0, 106.08], [111.0, 121.83]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true, false, true, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.82, 31.79, 0.0, 0.0, 29.74, 63.74, 67.76, 47.12, 0.0, 0.0, 0.0, 48.69, 31.48, 0.0, 28.98, 36.31, 0.0, 0.0, 0.0, 28.68], "audiomae_on_audioset": [null, null, null, null, [["didgeridoo", 58.49], ["music", 30.43], ["electronic music", 2.25]], [["music", 28.12], ["whale vocalization", 18.84], ["didgeridoo", 11.14]], null, null, [["didgeridoo", 45.21], ["whale vocalization", 13.65], ["speech", 6.66]], null, null, [["music", 60.36], ["hum", 8.74], ["mains hum", 2.05]], null, null, null, [["music", 70.75], ["theremin", 14.19], ["shofar", 2.3]], [["music", 32.7], ["didgeridoo", 12.03], ["hum", 11.47]], null, [["music", 48.87], ["hum", 10.75], ["mains hum", 7.09]], [["music", 49.84], ["didgeridoo", 15.34], ["theremin", 4.52]], null, null, null, [["speech", 40.09], ["music", 12.13], ["explosion", 10.2]]], "duration": [0.55, 1.56, 0.42, 0.36, 5.68, 2.81, 0.23, 0.47, 3.03, 5.04, 5.04, 19.44, 0.51, 0.84, 0.15, 3.22, 11.52, 1.72, 7.48, 3.83, 1.82, 0.91, 1.08, 10.83]} \ No newline at end of file diff --git a/annotations_1/fKaiHVTL5nQ_filtered.json b/annotations_1/fKaiHVTL5nQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cab9717ec2863bd04bb0c1db975cce23034b6a4 --- /dev/null +++ b/annotations_1/fKaiHVTL5nQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 62.02], [64.0, 65.08], [67.0, 78.88]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 32.26], "audiomae_on_audioset": [null, null, [["throbbing", 35.51], ["mains hum", 18.72], ["hum", 17.4]]], "duration": [56.02, 1.08, 11.88]} \ No newline at end of file diff --git a/annotations_1/fKpKz3dysY0_filtered.json b/annotations_1/fKpKz3dysY0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bfde46f16cf0153628b184ed29e74e870467a30 --- /dev/null +++ b/annotations_1/fKpKz3dysY0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.53], [11.0, 20.01], [21.0, 26.94], [33.0, 39.43], [47.0, 47.43], [57.0, 57.84], [67.0, 67.85], [71.0, 71.51], [73.0, 89.33], [92.0, 96.65], [100.0, 101.76], [105.0, 116.68]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [40.33, 43.38, 66.15, 37.49, 0.0, 0.0, 0.0, 0.0, 28.38, 33.08, 0.0, 29.49], "audiomae_on_audioset": [[["music", 54.65], ["ambient music", 4.27], ["musical instrument", 3.55]], [["hum", 36.31], ["speech", 22.1], ["mains hum", 13.92]], null, [["speech", 56.96], ["music", 18.95], ["hum", 6.01]], null, null, null, null, [["music", 50.46], ["speech", 11.82], ["hum", 7.89]], [["mains hum", 27.35], ["hum", 24.83], ["music", 19.31]], null, [["music", 56.0], ["buzz", 5.52], ["hum", 5.28]]], "duration": [2.53, 9.01, 5.94, 6.43, 0.43, 0.84, 0.85, 0.51, 16.33, 4.65, 1.76, 11.68]} \ No newline at end of file diff --git a/annotations_1/fLswSc81mw8_filtered.json b/annotations_1/fLswSc81mw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bf877ccba06f256464fe879e1b80db4fa002bfd --- /dev/null +++ b/annotations_1/fLswSc81mw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 34.23], [36.0, 46.52], [47.0, 59.31], [60.0, 63.48], [64.0, 67.41], [68.0, 77.03], [79.0, 79.64], [84.0, 85.11], [90.0, 92.52], [97.0, 100.94], [102.0, 104.87], [106.0, 107.4], [114.0, 113.88], [115.0, 124.95]], "keep_status": [true, false, false, false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [31.26, 30.58, 36.58, 49.64, 85.54, 46.64, 0.0, 0.0, 97.54, 32.1, 33.65, 0.0, 0.0, 41.95], "audiomae_on_audioset": [[["music", 31.39], ["grunt", 21.09], ["burping, eructation", 15.74]], [["music", 66.69], ["speech", 5.46], ["boing", 3.03]], [["music", 75.38], ["speech", 5.04], ["buzz", 1.91]], [["music", 65.52], ["speech", 3.52], ["electronic music", 2.32]], null, [["music", 57.16], ["music for children", 12.17], ["boing", 10.51]], null, null, null, [["music", 23.27], ["fly, housefly", 17.91], ["mosquito", 10.5]], [["speech", 19.84], ["fart", 15.5], ["hum", 7.0]], null, null, [["music", 62.46], ["speech", 2.78], ["musical instrument", 2.49]]], "duration": [9.23, 10.52, 12.31, 3.48, 3.41, 9.03, 0.64, 1.11, 2.52, 3.94, 2.87, 1.4, -0.12, 9.95]} \ No newline at end of file diff --git a/annotations_1/fM3FUot8TCY_filtered.json b/annotations_1/fM3FUot8TCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1710394383eac4d6baa264ac7ea6b0b97cc7be0d --- /dev/null +++ b/annotations_1/fM3FUot8TCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.7], [7.0, 7.94], [10.0, 10.5], [14.0, 15.89], [36.0, 37.44], [39.0, 38.97], [39.0, 41.64], [43.0, 48.79], [51.0, 51.51], [56.0, 57.13], [60.0, 60.3], [87.0, 87.88], [93.0, 93.41], [110.0, 110.76], [113.0, 121.27]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.14, 35.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.15], "audiomae_on_audioset": [null, null, null, null, null, null, [["fly, housefly", 41.02], ["bee, wasp, etc.", 19.33], ["insect", 18.28]], [["music", 51.08], ["musical instrument", 8.02], ["theremin", 4.06]], null, null, null, null, null, null, [["vehicle", 42.79], ["speech", 13.39], ["car", 13.37]]], "duration": [1.7, 0.94, 0.5, 1.89, 1.44, -0.03, 2.64, 5.79, 0.51, 1.13, 0.3, 0.88, 0.41, 0.76, 8.27]} \ No newline at end of file diff --git a/annotations_1/fNjMYPeG8IU_filtered.json b/annotations_1/fNjMYPeG8IU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a33c37346176589e94bf01fb5298342c0d4419ce --- /dev/null +++ b/annotations_1/fNjMYPeG8IU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.2], [3.0, 3.75], [4.0, 11.13], [13.0, 19.43], [23.0, 26.27], [27.0, 40.64], [62.0, 63.76], [67.0, 66.88], [74.0, 77.03], [78.0, 80.69], [81.0, 82.49], [86.0, 87.02], [88.0, 88.11], [89.0, 89.78], [96.0, 97.53], [98.0, 98.95], [102.0, 103.0], [109.0, 109.54], [111.0, 111.67], [113.0, 116.36], [119.0, 121.68], [122.0, 121.71], [122.0, 121.74], [122.0, 121.9], [125.0, 125.91]], "keep_status": [false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 48.78, 45.27, 47.94, 45.65, 0.0, 0.0, 44.23, 43.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 41.76, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 47.86], ["musical instrument", 6.19], ["theremin", 6.11]], [["music", 20.5], ["cello", 17.9], ["bowed string instrument", 14.32]], [["music", 67.02], ["musical instrument", 2.24], ["hum", 2.03]], [["music", 61.79], ["musical instrument", 6.69], ["foghorn", 5.54]], null, null, [["insect", 17.55], ["fly, housefly", 16.32], ["speech", 14.49]], [["sidetone", 51.96], ["speech", 26.03], ["radio", 5.04]], null, null, null, null, null, null, null, null, null, null, [["speech", 67.59], ["animal", 3.3], ["music", 2.07]], null, null, null, null], "duration": [0.2, 0.75, 7.13, 6.43, 3.27, 13.64, 1.76, -0.12, 3.03, 2.69, 1.49, 1.02, 0.11, 0.78, 1.53, 0.95, 1.0, 0.54, 0.67, 3.36, 2.68, -0.29, -0.26, -0.1, 0.91]} \ No newline at end of file diff --git a/annotations_1/fO8fKHbg4kw_filtered.json b/annotations_1/fO8fKHbg4kw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14ebefc45f2d4270a38194f398deea18c773550e --- /dev/null +++ b/annotations_1/fO8fKHbg4kw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.06], [7.0, 12.55], [19.0, 18.84], [25.0, 29.42], [32.0, 32.85], [63.0, 64.3]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 30.67, 0.0, 29.89, 0.0, 0.0], "audiomae_on_audioset": [null, [["applause", 31.03], ["speech", 29.12], ["crowd", 15.94]], null, [["speech", 35.84], ["music", 10.11], ["crowd", 8.08]], null, null], "duration": [1.06, 5.55, -0.16, 4.42, 0.85, 1.3]} \ No newline at end of file diff --git a/annotations_1/fPEGcx4MFHI_filtered.json b/annotations_1/fPEGcx4MFHI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3a1049a96065bed641a5949ff66565654d816e1 --- /dev/null +++ b/annotations_1/fPEGcx4MFHI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.51], [17.0, 17.95], [20.0, 20.53], [29.0, 30.59], [32.0, 84.64], [85.0, 109.04], [110.0, 110.49]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 40.08], ["hum", 24.21], ["mains hum", 16.98]], null], "duration": [1.51, 0.95, 0.53, 1.59, 52.64, 24.04, 0.49]} \ No newline at end of file diff --git a/annotations_1/fPcbyFeefXs_filtered.json b/annotations_1/fPcbyFeefXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..498cf21057354211af86f907a4d183fa3219e8b2 --- /dev/null +++ b/annotations_1/fPcbyFeefXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.91], [36.0, 37.54], [43.0, 43.9], [60.0, 59.73], [60.0, 61.1], [63.0, 63.29], [64.0, 64.18], [77.0, 77.57], [81.0, 80.82], [82.0, 84.72], [85.0, 86.14], [90.0, 90.59], [114.0, 114.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.91, 1.54, 0.9, -0.27, 1.1, 0.29, 0.18, 0.57, -0.18, 2.72, 1.14, 0.59, 0.69]} \ No newline at end of file diff --git a/annotations_1/fQ09ePfYLpU_filtered.json b/annotations_1/fQ09ePfYLpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..01f32f41e0768f6414246232e39f3b9b9f023448 --- /dev/null +++ b/annotations_1/fQ09ePfYLpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.82], [25.0, 25.95], [29.0, 29.54], [30.0, 30.5], [46.0, 60.44], [71.0, 72.66], [77.0, 78.11], [85.0, 86.91], [99.0, 100.04], [103.0, 103.28], [104.0, 105.97], [111.0, 111.74], [116.0, 117.78], [118.0, 118.96], [122.0, 122.66], [125.0, 125.14], [125.0, 127.13], [131.0, 135.3], [144.0, 144.22], [145.0, 146.85], [153.0, 155.95], [163.0, 164.47], [165.0, 166.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.79, 31.05, 0.0, 0.0, 29.82, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 72.26], ["livestock, farm animals, working animals", 10.85], ["cattle, bovinae", 2.47]], null, null, null, null, null, null, null, null, null, null, null, [["music", 32.48], ["mains hum", 10.14], ["buzz", 9.86]], [["hum", 31.77], ["mains hum", 25.91], ["music", 14.92]], null, null, [["music", 21.43], ["noise", 14.16], ["boing", 10.64]], null, null], "duration": [-0.18, 0.95, 0.54, 0.5, 14.44, 1.66, 1.11, 1.91, 1.04, 0.28, 1.97, 0.74, 1.78, 0.96, 0.66, 0.14, 2.13, 4.3, 0.22, 1.85, 2.95, 1.47, 1.11]} \ No newline at end of file diff --git a/annotations_1/fQEGMNLTYPs_filtered.json b/annotations_1/fQEGMNLTYPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4848754edccac86f9d82800fdf62f6045d1d5320 --- /dev/null +++ b/annotations_1/fQEGMNLTYPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 126.94], [127.0, 129.78], [132.0, 137.1]], "keep_status": [false, true, true], "silence_prob": [0.0, 28.92, 31.64], "audiomae_on_audioset": [null, [["noise", 32.81], ["music", 17.66], ["didgeridoo", 10.81]], [["vehicle", 35.17], ["car", 10.01], ["speech", 5.54]]], "duration": [77.94, 2.78, 5.1]} \ No newline at end of file diff --git a/annotations_1/fQWMKUF7dvA_filtered.json b/annotations_1/fQWMKUF7dvA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eac71f5041df06cdd16da42ee73cab129b2a237 --- /dev/null +++ b/annotations_1/fQWMKUF7dvA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [4.0, 6.3], [7.0, 7.1], [7.0, 9.26], [10.0, 10.4], [11.0, 12.93], [14.0, 14.76], [17.0, 17.68], [19.0, 21.52], [30.0, 30.84], [41.0, 42.77], [44.0, 46.79], [48.0, 53.57], [67.0, 67.85], [72.0, 73.16], [77.0, 77.25], [78.0, 78.38], [81.0, 81.19], [82.0, 83.03], [86.0, 86.88], [88.0, 88.92], [90.0, 90.78], [96.0, 96.36], [98.0, 99.1], [100.0, 99.81], [100.0, 101.09], [107.0, 107.52], [108.0, 107.57], [110.0, 111.11], [112.0, 112.89], [115.0, 116.92], [118.0, 118.77], [122.0, 121.98]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.96, 0.0, 89.19, 0.0, 0.0, 0.0, 0.0, 31.74, 0.0, 0.0, 84.98, 30.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 44.54], ["owl", 5.69], ["hoot", 4.19]], null, null, null, [["whale vocalization", 72.81], ["speech", 14.06], ["sidetone", 1.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.04, 2.3, 0.1, 2.26, 0.4, 1.93, 0.76, 0.68, 2.52, 0.84, 1.77, 2.79, 5.57, 0.85, 1.16, 0.25, 0.38, 0.19, 1.03, 0.88, 0.92, 0.78, 0.36, 1.1, -0.19, 1.09, 0.52, -0.43, 1.11, 0.89, 1.92, 0.77, -0.02]} \ No newline at end of file diff --git a/annotations_1/fQy1yr_K_L4_filtered.json b/annotations_1/fQy1yr_K_L4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1ecf2ee095215472356a3603ace580dda91e337 --- /dev/null +++ b/annotations_1/fQy1yr_K_L4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.61], [8.0, 11.2], [13.0, 15.94], [18.0, 20.75], [23.0, 23.25], [24.0, 26.32], [31.0, 33.76], [35.0, 37.18], [38.0, 39.39], [41.0, 42.63], [44.0, 46.85], [50.0, 51.27], [52.0, 53.23], [55.0, 61.5], [63.0, 64.42], [65.0, 67.27], [68.0, 71.98], [75.0, 74.8], [75.0, 76.71], [78.0, 82.59], [83.0, 88.43], [89.0, 93.51], [94.0, 95.61], [96.0, 104.57], [106.0, 108.08], [109.0, 110.34], [113.0, 123.13], [125.0, 127.08], [128.0, 133.52], [135.0, 139.51], [141.0, 142.11], [143.0, 153.49], [155.0, 156.98], [158.0, 160.62], [162.0, 164.32], [167.0, 168.74], [170.0, 174.07], [175.0, 178.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.01, 100.0, 99.99, 100.0, 0.0, 98.36, 99.88, 99.95, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 91.3, 99.96, 0.0, 0.0, 99.36, 78.72, 98.27, 0.0, 77.36, 99.92, 0.0, 99.52, 99.78, 85.35, 86.45, 0.0, 98.66, 0.0, 99.36, 99.93, 0.0, 99.99, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.61, 3.2, 2.94, 2.75, 0.25, 2.32, 2.76, 2.18, 1.39, 1.63, 2.85, 1.27, 1.23, 6.5, 1.42, 2.27, 3.98, -0.2, 1.71, 4.59, 5.43, 4.51, 1.61, 8.57, 2.08, 1.34, 10.13, 2.08, 5.52, 4.51, 1.11, 10.49, 1.98, 2.62, 2.32, 1.74, 4.07, 3.95]} \ No newline at end of file diff --git a/annotations_1/fRF7InV7TfI_filtered.json b/annotations_1/fRF7InV7TfI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e6cd9b44438477cb8181a72642230b9a8b90eda --- /dev/null +++ b/annotations_1/fRF7InV7TfI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 25.37], [28.0, 28.41], [32.0, 33.29], [33.0, 33.35], [39.0, 40.09], [50.0, 51.61], [53.0, 54.13], [57.0, 57.81], [62.0, 64.35], [66.0, 66.36], [67.0, 68.99], [70.0, 70.93], [74.0, 80.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [33.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 31.74], "audiomae_on_audioset": [[["cattle, bovinae", 28.33], ["livestock, farm animals, working animals", 26.6], ["moo", 18.98]], null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 22.45], ["livestock, farm animals, working animals", 17.5], ["music", 16.89]]], "duration": [2.37, 0.41, 1.29, 0.35, 1.09, 1.61, 1.13, 0.81, 2.35, 0.36, 1.99, 0.93, 6.89]} \ No newline at end of file diff --git a/annotations_1/fRNR8-FqzM4_filtered.json b/annotations_1/fRNR8-FqzM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc5956a6e446c09349dac6702e0270054f8e573f --- /dev/null +++ b/annotations_1/fRNR8-FqzM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 34.5], [38.0, 38.13], [65.0, 66.5], [72.0, 74.14], [85.0, 85.83], [87.0, 87.17], [92.0, 92.82], [101.0, 103.71], [116.0, 116.43]], "keep_status": [true, false, false, false, false, false, false, true, false], "silence_prob": [31.74, 0.0, 0.0, 31.99, 0.0, 0.0, 0.0, 35.67, 0.0], "audiomae_on_audioset": [[["hum", 26.26], ["theremin", 17.57], ["music", 17.3]], null, null, [["music", 80.4], ["guitar", 6.32], ["musical instrument", 4.4]], null, null, null, [["music", 52.61], ["effects unit", 10.0], ["distortion", 4.73]], null], "duration": [10.5, 0.13, 1.5, 2.14, 0.83, 0.17, 0.82, 2.71, 0.43]} \ No newline at end of file diff --git a/annotations_1/fRhJPuDCXRk_filtered.json b/annotations_1/fRhJPuDCXRk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b73f458814b0da0ccb426a6806b7c88f138f791b --- /dev/null +++ b/annotations_1/fRhJPuDCXRk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.3], [5.0, 5.22], [9.0, 14.82], [19.0, 20.88], [22.0, 22.4], [23.0, 25.71], [26.0, 28.53], [33.0, 35.13], [37.0, 41.01], [42.0, 48.36], [49.0, 51.0], [53.0, 53.32], [55.0, 56.03], [57.0, 59.17], [59.0, 60.56], [63.0, 63.42], [65.0, 66.11], [79.0, 80.37], [91.0, 97.5], [101.0, 101.17], [102.0, 102.51], [113.0, 113.0], [115.0, 115.4], [115.0, 115.5], [116.0, 115.62], [121.0, 122.0], [128.0, 128.01], [133.0, 132.95], [136.0, 139.83]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 96.42, 0.0, 0.0, 74.6, 99.82, 99.4, 86.09, 31.02, 33.14, 0.0, 0.0, 32.4, 0.0, 0.0, 0.0, 0.0, 36.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 28.59], ["hum", 17.22], ["electric shaver, electric razor", 9.88]], [["music", 63.77], ["didgeridoo", 7.17], ["musical instrument", 2.95]], null, null, [["music", 67.4], ["throbbing", 2.79], ["guitar", 1.63]], null, null, null, null, [["music", 65.1], ["throbbing", 3.96], ["musical instrument", 2.29]], null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 0.22, 5.82, 1.88, 0.4, 2.71, 2.53, 2.13, 4.01, 6.36, 2.0, 0.32, 1.03, 2.17, 1.56, 0.42, 1.11, 1.37, 6.5, 0.17, 0.51, 0.0, 0.4, 0.5, -0.38, 1.0, 0.01, -0.05, 3.83]} \ No newline at end of file diff --git a/annotations_1/fTIIhYZ_CzA_filtered.json b/annotations_1/fTIIhYZ_CzA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b34f27f4a4564afd371543d87392ff6a6b2dbdae --- /dev/null +++ b/annotations_1/fTIIhYZ_CzA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.77], [14.0, 25.03], [27.0, 27.6], [43.0, 53.03], [54.0, 59.43], [62.0, 65.1], [66.0, 67.81], [69.0, 68.89], [69.0, 70.36], [73.0, 82.07], [83.0, 85.35], [87.0, 88.32], [95.0, 100.8], [101.0, 104.31], [104.0, 114.37], [116.0, 132.6]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [40.99, 41.22, 0.0, 38.64, 36.6, 38.93, 0.0, 0.0, 0.0, 34.14, 31.92, 0.0, 31.16, 30.06, 31.54, 31.85], "audiomae_on_audioset": [[["heart sounds, heartbeat", 38.86], ["throbbing", 30.1], ["hum", 10.3]], [["hum", 54.25], ["mains hum", 16.09], ["throbbing", 12.92]], null, [["hum", 46.79], ["mains hum", 21.58], ["throbbing", 8.74]], [["speech", 70.82], ["sidetone", 8.4], ["hum", 7.31]], [["hum", 32.69], ["throbbing", 23.95], ["gong", 9.99]], null, null, null, [["hum", 55.86], ["mains hum", 16.49], ["throbbing", 15.61]], [["sidetone", 74.72], ["speech", 16.61], ["music", 1.51]], null, [["throbbing", 37.33], ["hum", 33.65], ["sidetone", 11.07]], [["speech", 24.81], ["hum", 19.09], ["throbbing", 15.71]], [["speech", 44.67], ["hum", 16.06], ["gong", 15.62]], [["hum", 37.52], ["sidetone", 21.93], ["mains hum", 20.06]]], "duration": [4.77, 11.03, 0.6, 10.03, 5.43, 3.1, 1.81, -0.11, 1.36, 9.07, 2.35, 1.32, 5.8, 3.31, 10.37, 16.6]} \ No newline at end of file diff --git a/annotations_1/fUKoBAi7qCg_filtered.json b/annotations_1/fUKoBAi7qCg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e58d5935c3bffc3cda6d7ae817493ad57200461e --- /dev/null +++ b/annotations_1/fUKoBAi7qCg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.59], [4.0, 5.54], [6.0, 13.05], [15.0, 15.16], [15.0, 23.03], [24.0, 24.71], [26.0, 75.22], [77.0, 88.87], [89.0, 94.17], [96.0, 101.46], [104.0, 122.88]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 29.9, 0.0, 28.43, 0.0, 0.0, 30.5, 30.02, 39.64, 32.72], "audiomae_on_audioset": [null, null, [["music", 50.77], ["speech", 25.56], ["theremin", 8.33]], null, [["music", 60.01], ["speech", 22.11], ["throbbing", 2.65]], null, null, [["music", 85.66], ["theremin", 1.3], ["didgeridoo", 1.24]], [["livestock, farm animals, working animals", 38.36], ["cattle, bovinae", 14.95], ["moo", 11.39]], [["music", 53.03], ["musical instrument", 4.94], ["guitar", 2.7]], [["music", 55.0], ["theremin", 9.88], ["synthesizer", 6.89]]], "duration": [1.59, 1.54, 7.05, 0.16, 8.03, 0.71, 49.22, 11.87, 5.17, 5.46, 18.88]} \ No newline at end of file diff --git a/annotations_1/fV-wb1gZOyo_filtered.json b/annotations_1/fV-wb1gZOyo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..131354adf53f14861a9c613adf076c9df2f1dfe0 --- /dev/null +++ b/annotations_1/fV-wb1gZOyo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.33], [8.0, 9.05], [11.0, 13.54], [15.0, 16.33], [19.0, 19.01], [20.0, 24.04], [26.0, 28.66], [29.0, 34.47], [35.0, 39.09], [41.0, 42.9], [44.0, 47.43], [48.0, 51.92], [52.0, 67.26], [68.0, 70.02], [72.0, 71.68], [73.0, 73.72], [76.0, 75.69], [78.0, 80.37], [80.0, 81.72], [84.0, 84.57], [86.0, 86.17], [87.0, 88.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [98.8, 0.0, 99.44, 0.0, 0.0, 96.77, 90.95, 84.8, 95.51, 0.0, 77.2, 47.98, 33.82, 34.31, 0.0, 0.0, 0.0, 31.67, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 46.76], ["speech", 17.72], ["theremin", 7.33]], [["music", 61.31], ["hum", 7.63], ["theremin", 4.47]], [["music", 28.22], ["didgeridoo", 25.84], ["speech", 4.7]], null, null, null, [["speech", 51.95], ["mains hum", 11.62], ["radio", 7.1]], null, null, null, null], "duration": [5.33, 1.05, 2.54, 1.33, 0.01, 4.04, 2.66, 5.47, 4.09, 1.9, 3.43, 3.92, 15.26, 2.02, -0.32, 0.72, -0.31, 2.37, 1.72, 0.57, 0.17, 1.3]} \ No newline at end of file diff --git a/annotations_1/fVoHEZb6imE_filtered.json b/annotations_1/fVoHEZb6imE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6922225ae5d55b27f2781b328ae43c692b2f5d3 --- /dev/null +++ b/annotations_1/fVoHEZb6imE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 37.25], [38.0, 43.75], [45.0, 60.99], [63.0, 63.27], [65.0, 65.89], [71.0, 72.49]], "keep_status": [true, false, true, false, false, false], "silence_prob": [44.63, 58.81, 45.52, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.76], ["electronic music", 3.52], ["thunk", 2.4]], null, [["music", 38.07], ["hum", 20.5], ["rumble", 9.94]], null, null, null], "duration": [5.25, 5.75, 15.99, 0.27, 0.89, 1.49]} \ No newline at end of file diff --git a/annotations_1/fWYs-bFK9_s_filtered.json b/annotations_1/fWYs-bFK9_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07b2516216cd201a24ace86c057e398a2ca66433 --- /dev/null +++ b/annotations_1/fWYs-bFK9_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.96], [18.0, 30.13], [34.0, 34.84], [42.0, 60.99], [70.0, 70.71], [99.0, 121.07], [122.0, 124.41], [141.0, 141.4], [141.0, 141.47], [144.0, 147.88], [149.0, 150.5]], "keep_status": [false, true, false, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 31.93, 0.0, 33.0, 0.0, 31.93, 33.19, 0.0, 0.0, 32.53, 0.0], "audiomae_on_audioset": [null, [["speech", 36.99], ["vehicle", 15.41], ["boat, water vehicle", 6.17]], null, [["speech", 56.19], ["buzz", 11.3], ["vehicle", 8.0]], null, [["speech", 52.64], ["vehicle", 10.7], ["boat, water vehicle", 4.89]], [["speech", 47.27], ["vehicle", 5.97], ["music", 4.49]], null, null, [["speech", 32.66], ["explosion", 13.71], ["buzz", 6.16]], null], "duration": [0.96, 12.13, 0.84, 18.99, 0.71, 22.07, 2.41, 0.4, 0.47, 3.88, 1.5]} \ No newline at end of file diff --git a/annotations_1/fWgpZ_2oYfE_filtered.json b/annotations_1/fWgpZ_2oYfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bc3eb39c85b91bd61ad71051b50b856e64ec146 --- /dev/null +++ b/annotations_1/fWgpZ_2oYfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.63], [20.0, 21.29], [24.0, 37.05], [40.0, 66.14]], "keep_status": [false, false, false, true], "silence_prob": [32.41, 0.0, 31.48, 29.79], "audiomae_on_audioset": [[["speech", 66.16], ["foghorn", 3.84], ["outside, urban or manmade", 3.12]], null, [["speech", 57.54], ["electric shaver, electric razor", 11.74], ["buzz", 10.17]], [["speech", 45.91], ["music", 7.44], ["hubbub, speech noise, speech babble", 7.16]]], "duration": [2.63, 1.29, 13.05, 26.14]} \ No newline at end of file diff --git a/annotations_1/fWx9V0xoYsI_filtered.json b/annotations_1/fWx9V0xoYsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00bd38e26b05204a24e9b6032b90df8b9f2dbb6d --- /dev/null +++ b/annotations_1/fWx9V0xoYsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 36.75], [38.0, 38.58], [39.0, 40.51], [42.0, 41.86], [42.0, 43.36], [46.0, 46.09], [47.0, 47.55], [53.0, 54.46], [57.0, 58.62], [59.0, 60.0], [61.0, 63.39], [66.0, 67.31], [68.0, 68.77], [69.0, 69.74], [71.0, 72.22], [78.0, 79.05], [81.0, 81.55], [83.0, 83.13], [85.0, 88.59], [90.0, 91.62], [93.0, 94.05], [97.0, 98.17], [101.0, 101.34], [104.0, 104.03], [107.0, 108.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.75, 0.58, 1.51, -0.14, 1.36, 0.09, 0.55, 1.46, 1.62, 1.0, 2.39, 1.31, 0.77, 0.74, 1.22, 1.05, 0.55, 0.13, 3.59, 1.62, 1.05, 1.17, 0.34, 0.03, 1.41]} \ No newline at end of file diff --git a/annotations_1/fYNZsz9o3Sg_filtered.json b/annotations_1/fYNZsz9o3Sg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8db0c38e4d02a5e93dde6fec96466fca0bbf88c --- /dev/null +++ b/annotations_1/fYNZsz9o3Sg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.19], [2.0, 1.92], [14.0, 14.62], [26.0, 26.91], [40.0, 41.12], [42.0, 43.01], [44.0, 48.66], [50.0, 50.55], [66.0, 66.95], [67.0, 67.46], [68.0, 70.14], [71.0, 72.81], [76.0, 77.23], [91.0, 91.84], [99.0, 99.87], [102.0, 103.55], [104.0, 104.84], [105.0, 106.88], [108.0, 108.5], [110.0, 110.15], [112.0, 122.62], [123.0, 123.82], [125.0, 125.68], [137.0, 136.92], [138.0, 138.59], [139.0, 139.65], [141.0, 141.56], [145.0, 145.45], [149.0, 149.01], [153.0, 153.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 59.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, -0.08, 0.62, 0.91, 1.12, 1.01, 4.66, 0.55, 0.95, 0.46, 2.14, 1.81, 1.23, 0.84, 0.87, 1.55, 0.84, 1.88, 0.5, 0.15, 10.62, 0.82, 0.68, -0.08, 0.59, 0.65, 0.56, 0.45, 0.01, 0.06]} \ No newline at end of file diff --git a/annotations_1/fYVAGoTb8w4_filtered.json b/annotations_1/fYVAGoTb8w4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdb3cb88578ec0736ada5743ffda2b1fff51db49 --- /dev/null +++ b/annotations_1/fYVAGoTb8w4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.34], [19.0, 26.54], [30.0, 31.48], [32.0, 39.51], [41.0, 41.35], [44.0, 44.15], [51.0, 51.39], [56.0, 57.11], [58.0, 59.05], [60.0, 63.0], [64.0, 64.3], [65.0, 66.06], [67.0, 67.46], [69.0, 69.26], [70.0, 77.89], [78.0, 79.91], [81.0, 81.5], [83.0, 121.14], [130.0, 132.16], [133.0, 137.17], [138.0, 144.24], [145.0, 175.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 71.29, 0.0, 59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 49.18, 0.0, 0.0, 0.0, 99.98, 94.95, 82.61, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.24], ["music", 28.59], ["fly, housefly", 3.58]], null, null, null, null, null, null, null], "duration": [1.34, 7.54, 1.48, 7.51, 0.35, 0.15, 0.39, 1.11, 1.05, 3.0, 0.3, 1.06, 0.46, 0.26, 7.89, 1.91, 0.5, 38.14, 2.16, 4.17, 6.24, 30.58]} \ No newline at end of file diff --git a/annotations_1/fYbbxzLGpbI_filtered.json b/annotations_1/fYbbxzLGpbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e6991e976c0b29344f5a8efdb9485a139ff5064 --- /dev/null +++ b/annotations_1/fYbbxzLGpbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.81], [15.0, 21.91], [24.0, 24.56], [27.0, 47.44], [51.0, 81.38], [83.0, 94.66], [96.0, 103.65], [105.0, 133.46], [134.0, 138.5], [139.0, 149.64]], "keep_status": [true, true, false, true, false, false, false, false, true, true], "silence_prob": [33.23, 28.61, 0.0, 28.3, 0.0, 28.31, 28.36, 28.43, 28.54, 28.32], "audiomae_on_audioset": [[["hum", 28.14], ["music", 14.98], ["throbbing", 11.9]], [["music", 45.37], ["throbbing", 12.14], ["speech", 7.62]], null, [["music", 22.99], ["explosion", 9.16], ["speech", 8.41]], null, [["speech", 51.13], ["music", 12.43], ["vehicle", 6.66]], [["speech", 48.45], ["music", 25.73], ["vehicle", 4.84]], [["music", 35.11], ["speech", 31.38], ["burst, pop", 3.77]], [["music", 33.35], ["hum", 14.33], ["throbbing", 13.81]], [["speech", 45.82], ["buzz", 8.25], ["music", 7.77]]], "duration": [4.81, 6.91, 0.56, 20.44, 30.38, 11.66, 7.65, 28.46, 4.5, 10.64]} \ No newline at end of file diff --git a/annotations_1/fZB65wj9nz8_filtered.json b/annotations_1/fZB65wj9nz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0bd600bbd3c375a64b85c633f52954c30f55d9b --- /dev/null +++ b/annotations_1/fZB65wj9nz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.28], [42.0, 42.43], [65.0, 65.3], [74.0, 74.38], [85.0, 85.29], [91.0, 91.15], [92.0, 92.87], [104.0, 104.85], [106.0, 106.64], [109.0, 123.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 0.43, 0.3, 0.38, 0.29, 0.15, 0.87, 0.85, 0.64, 14.16]} \ No newline at end of file diff --git a/annotations_1/fZNHk9DKvtM_filtered.json b/annotations_1/fZNHk9DKvtM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce0f559336b1fa6626679eb37c28a20c54130aad --- /dev/null +++ b/annotations_1/fZNHk9DKvtM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.54], [5.0, 5.9], [7.0, 7.55], [9.0, 10.02], [11.0, 12.21], [13.0, 16.71], [21.0, 21.74], [23.0, 24.43], [26.0, 26.15], [27.0, 26.99], [29.0, 29.3], [30.0, 40.02], [43.0, 43.09], [47.0, 48.73], [51.0, 52.29], [54.0, 55.71], [60.0, 77.5], [80.0, 85.9], [89.0, 90.32], [93.0, 96.31], [97.0, 97.33], [98.0, 104.14], [115.0, 115.33], [121.0, 123.38], [130.0, 130.17], [135.0, 135.01], [135.0, 135.04], [135.0, 135.23], [135.0, 135.26], [135.0, 141.79], [148.0, 151.23], [154.0, 154.38], [156.0, 155.82], [159.0, 160.17], [160.0, 161.86], [163.0, 163.17], [166.0, 179.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 59.15, 96.77, 0.0, 83.88, 0.0, 31.13, 0.0, 30.94, 0.0, 0.0, 0.0, 0.0, 0.0, 30.16, 33.79, 0.0, 0.0, 0.0, 0.0, 0.0, 32.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 13.68], ["livestock, farm animals, working animals", 11.78], ["cattle, bovinae", 10.94]], null, [["speech", 31.35], ["skateboard", 6.9], ["fart", 6.11]], null, null, null, null, null, [["throbbing", 24.08], ["speech", 15.71], ["sidetone", 12.81]], [["speech", 22.86], ["sidetone", 22.17], ["music", 21.68]], null, null, null, null, null, [["music", 42.91], ["hum", 25.1], ["throbbing", 23.49]]], "duration": [0.54, 0.9, 0.55, 1.02, 1.21, 3.71, 0.74, 1.43, 0.15, -0.01, 0.3, 10.02, 0.09, 1.73, 1.29, 1.71, 17.5, 5.9, 1.32, 3.31, 0.33, 6.14, 0.33, 2.38, 0.17, 0.01, 0.04, 0.23, 0.26, 6.79, 3.23, 0.38, -0.18, 1.17, 1.86, 0.17, 13.46]} \ No newline at end of file diff --git a/annotations_1/fZflzybv5T0_filtered.json b/annotations_1/fZflzybv5T0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd1ed48c3948c5cf9a3d35bc19b88a7a871260cc --- /dev/null +++ b/annotations_1/fZflzybv5T0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.35], [12.0, 13.17], [13.0, 13.64], [19.0, 20.46], [21.0, 22.57], [28.0, 29.62], [32.0, 32.75], [38.0, 41.77], [47.0, 48.0]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.35, 1.17, 0.64, 1.46, 1.57, 1.62, 0.75, 3.77, 1.0]} \ No newline at end of file diff --git a/annotations_1/fZrN9LabLQQ_filtered.json b/annotations_1/fZrN9LabLQQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b534775b38f3793ac0a274829310e855a95fb9d2 --- /dev/null +++ b/annotations_1/fZrN9LabLQQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 17.41], [21.0, 23.63], [28.0, 32.58], [36.0, 39.33], [43.0, 58.16], [62.0, 102.68], [107.0, 110.13], [112.0, 114.34], [116.0, 146.97], [149.0, 149.42], [161.0, 162.87], [164.0, 165.3], [167.0, 167.61]], "keep_status": [true, true, false, true, true, false, true, true, false, false, false, false, false], "silence_prob": [29.14, 29.13, 34.72, 30.83, 29.05, 0.0, 31.62, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.82], ["hum", 7.05], ["mains hum", 6.28]], [["mains hum", 30.76], ["hum", 24.9], ["throbbing", 11.58]], [["music", 40.23], ["speech", 28.37], ["hum", 5.28]], [["music", 17.71], ["mains hum", 16.32], ["buzz", 10.05]], [["music", 55.85], ["whip", 4.84], ["whoosh, swoosh, swish", 3.73]], null, [["speech", 41.1], ["vehicle", 7.75], ["hum", 7.4]], [["speech", 54.3], ["vehicle", 9.85], ["music", 2.98]], null, null, null, null, null], "duration": [8.41, 2.63, 4.58, 3.33, 15.16, 40.68, 3.13, 2.34, 30.97, 0.42, 1.87, 1.3, 0.61]} \ No newline at end of file diff --git a/annotations_1/f_LDdElm9fc_filtered.json b/annotations_1/f_LDdElm9fc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb3d421efb26f3488ad169b38f717f7e803797fa --- /dev/null +++ b/annotations_1/f_LDdElm9fc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.35], [20.0, 48.17], [49.0, 51.19], [51.0, 60.44], [63.0, 63.39], [64.0, 102.32], [107.0, 110.25], [117.0, 129.47], [130.0, 130.77], [132.0, 138.15], [139.0, 139.78], [141.0, 143.41], [145.0, 145.5]], "keep_status": [true, true, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [29.24, 28.49, 34.44, 29.55, 0.0, 0.0, 28.21, 29.03, 0.0, 29.65, 0.0, 96.42, 0.0], "audiomae_on_audioset": [[["mains hum", 33.1], ["hum", 22.2], ["music", 13.89]], [["speech", 47.4], ["music", 15.51], ["hum", 6.18]], [["music", 35.49], ["speech", 24.0], ["electronic music", 4.87]], [["mains hum", 46.37], ["hum", 42.12], ["music", 2.9]], null, null, [["music", 14.94], ["hum", 13.72], ["mains hum", 9.28]], [["speech", 54.72], ["music", 21.99], ["sidetone", 6.46]], null, [["music", 39.7], ["throbbing", 22.17], ["hum", 20.15]], null, null, null], "duration": [7.35, 28.17, 2.19, 9.44, 0.39, 38.32, 3.25, 12.47, 0.77, 6.15, 0.78, 2.41, 0.5]} \ No newline at end of file diff --git a/annotations_1/fb-9_MV15I4_filtered.json b/annotations_1/fb-9_MV15I4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/fb-9_MV15I4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/fbDgv4huUp4_filtered.json b/annotations_1/fbDgv4huUp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa44cfaa29d7f9b4c7465bf84d7fee9e68258d85 --- /dev/null +++ b/annotations_1/fbDgv4huUp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 55.11], [55.0, 56.05], [58.0, 64.45], [68.0, 70.53], [72.0, 72.82], [77.0, 77.06], [80.0, 80.42], [83.0, 86.56], [87.0, 88.6], [92.0, 101.51], [104.0, 105.98], [107.0, 115.1], [117.0, 138.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 38.62, 92.64, 0.0, 0.0, 0.0, 43.13, 0.0, 29.37, 0.0, 30.41, 31.32], "audiomae_on_audioset": [null, null, [["music", 47.2], ["hum", 16.46], ["throbbing", 13.69]], null, null, null, null, [["hum", 44.46], ["throbbing", 14.59], ["music", 12.22]], null, [["speech", 38.06], ["music", 30.58], ["crowd", 4.98]], null, [["music", 48.08], ["speech", 14.88], ["thunk", 3.83]], [["music", 20.52], ["gong", 14.62], ["speech", 10.63]]], "duration": [48.11, 1.05, 6.45, 2.53, 0.82, 0.06, 0.42, 3.56, 1.6, 9.51, 1.98, 8.1, 21.6]} \ No newline at end of file diff --git a/annotations_1/fbR1gtlY7FM_filtered.json b/annotations_1/fbR1gtlY7FM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40454eb811f461b4681b8438027526950cbf0d3b --- /dev/null +++ b/annotations_1/fbR1gtlY7FM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 73.38]], "keep_status": [false], "silence_prob": [30.58], "audiomae_on_audioset": [[["vehicle", 44.31], ["skidding", 21.74], ["car", 15.11]]], "duration": [25.38]} \ No newline at end of file diff --git a/annotations_1/fbkfr-S420o_filtered.json b/annotations_1/fbkfr-S420o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ec8da8ed604e2b9600ea410b6b6c67b47b356a0 --- /dev/null +++ b/annotations_1/fbkfr-S420o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.86], [20.0, 21.73], [22.0, 23.09], [28.0, 28.07], [29.0, 31.06], [32.0, 36.66], [38.0, 39.12], [41.0, 42.52], [45.0, 47.97], [49.0, 50.68], [52.0, 51.68], [54.0, 53.91], [55.0, 55.66], [57.0, 58.24], [60.0, 63.69], [66.0, 67.58], [69.0, 71.81], [75.0, 75.14], [77.0, 78.36], [79.0, 82.16], [85.0, 88.92], [92.0, 93.6], [96.0, 97.63]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.11, 95.64, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.4, 0.0, 33.48, 0.0, 0.0, 33.43, 34.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 20.68], ["livestock, farm animals, working animals", 17.78], ["moo", 9.18]], null, null, null, null, null, null, null, null, null, [["music", 28.23], ["boing", 18.25], ["sidetone", 11.08]], null, [["music", 53.36], ["speech", 26.8], ["boing", 1.51]], null, null, [["music", 54.58], ["speech", 32.76], ["synthesizer", 3.55]], [["music", 57.48], ["speech", 30.24], ["synthesizer", 2.75]], null, null], "duration": [0.86, 1.73, 1.09, 0.07, 2.06, 4.66, 1.12, 1.52, 2.97, 1.68, -0.32, -0.09, 0.66, 1.24, 3.69, 1.58, 2.81, 0.14, 1.36, 3.16, 3.92, 1.6, 1.63]} \ No newline at end of file diff --git a/annotations_1/fcFKVVHQn7o_filtered.json b/annotations_1/fcFKVVHQn7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65a0fce49901011f421145d92fe725e4f5a173f3 --- /dev/null +++ b/annotations_1/fcFKVVHQn7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.0], [10.0, 12.02], [13.0, 25.24], [27.0, 26.76], [29.0, 29.19], [30.0, 31.04], [34.0, 34.89], [35.0, 38.57], [39.0, 42.72], [43.0, 44.09], [48.0, 69.4], [74.0, 75.44], [78.0, 80.69], [81.0, 81.84], [82.0, 84.67], [88.0, 91.1], [95.0, 95.34], [96.0, 104.8], [107.0, 118.89], [120.0, 128.11], [132.0, 149.05]], "keep_status": [false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, true, false, true, true, false, false], "silence_prob": [55.11, 44.99, 35.28, 0.0, 0.0, 0.0, 0.0, 49.97, 38.09, 0.0, 33.9, 0.0, 60.6, 0.0, 59.77, 35.76, 0.0, 35.01, 35.46, 35.36, 32.54], "audiomae_on_audioset": [null, [["music", 28.84], ["trombone", 22.62], ["brass instrument", 21.05]], [["music", 73.88], ["wind instrument, woodwind instrument", 4.13], ["musical instrument", 3.14]], null, null, null, null, [["music", 44.5], ["musical instrument", 7.62], ["foghorn", 6.35]], [["music", 28.29], ["mains hum", 11.77], ["hum", 9.12]], null, [["music", 54.11], ["tabla", 7.45], ["drum", 3.86]], null, null, null, null, [["music", 53.05], ["musical instrument", 6.58], ["drum", 5.41]], null, [["music", 31.99], ["speech", 30.07], ["buzz", 7.0]], [["music", 58.48], ["horse", 4.59], ["brass instrument", 4.56]], [["music", 73.45], ["fart", 3.05], ["didgeridoo", 2.47]], [["music", 75.19], ["theremin", 4.59], ["musical instrument", 2.9]]], "duration": [2.0, 2.02, 12.24, -0.24, 0.19, 1.04, 0.89, 3.57, 3.72, 1.09, 21.4, 1.44, 2.69, 0.84, 2.67, 3.1, 0.34, 8.8, 11.89, 8.11, 17.05]} \ No newline at end of file diff --git a/annotations_1/fegOYb4_PSk_filtered.json b/annotations_1/fegOYb4_PSk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cca285b134cd25edd9d71c0614a8bac914d9ac0 --- /dev/null +++ b/annotations_1/fegOYb4_PSk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 22.38], [23.0, 24.81], [26.0, 27.28], [36.0, 36.0], [39.0, 39.02], [40.0, 45.28], [52.0, 52.62], [54.0, 55.98], [57.0, 57.15], [58.0, 68.89], [69.0, 75.36], [76.0, 80.38], [86.0, 89.28], [92.0, 92.16], [106.0, 106.79], [109.0, 114.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [61.47, 0.0, 0.0, 0.0, 0.0, 42.79, 0.0, 0.0, 0.0, 32.63, 38.28, 46.64, 54.7, 0.0, 0.0, 84.43], "audiomae_on_audioset": [null, null, null, null, null, [["music", 67.15], ["electronic music", 4.89], ["synthesizer", 2.7]], null, null, null, [["music", 47.76], ["synthesizer", 12.63], ["hum", 11.76]], [["music", 32.87], ["throbbing", 22.49], ["hum", 8.68]], [["music", 33.52], ["throbbing", 15.49], ["hum", 12.65]], null, null, null, null], "duration": [20.38, 1.81, 1.28, 0.0, 0.02, 5.28, 0.62, 1.98, 0.15, 10.89, 6.36, 4.38, 3.28, 0.16, 0.79, 5.4]} \ No newline at end of file diff --git a/annotations_1/ffknf2fIpiY_filtered.json b/annotations_1/ffknf2fIpiY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16abd547edf6abc87a6d93e5a404d782c9eecff9 --- /dev/null +++ b/annotations_1/ffknf2fIpiY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.13], [27.0, 27.45], [28.0, 33.37], [35.0, 36.68], [38.0, 38.18], [38.0, 40.91], [42.0, 46.16], [47.0, 47.83], [48.0, 48.56], [50.0, 63.91], [65.0, 65.03], [65.0, 70.06], [71.0, 76.52], [77.0, 79.02], [80.0, 79.79], [80.0, 81.19], [84.0, 84.45], [87.0, 90.48], [91.0, 90.98], [92.0, 93.7]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.73, 0.0, 0.0, 38.17, 40.01, 0.0, 0.0, 45.14, 0.0, 48.02, 48.14, 51.6, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 61.21], ["sidetone", 22.53], ["telephone", 8.84]], [["speech", 45.39], ["grunt", 5.54], ["burping, eructation", 3.67]], null, null, [["sidetone", 12.07], ["speech", 9.22], ["radio", 8.65]], null, [["speech", 58.33], ["sidetone", 8.12], ["radio", 7.55]], [["crushing", 41.49], ["bouncing", 25.04], ["thunk", 6.3]], null, null, null, null, null, null, null], "duration": [1.13, 0.45, 5.37, 1.68, 0.18, 2.91, 4.16, 0.83, 0.56, 13.91, 0.03, 5.06, 5.52, 2.02, -0.21, 1.19, 0.45, 3.48, -0.02, 1.7]} \ No newline at end of file diff --git a/annotations_1/ffmSFNEG6pM_filtered.json b/annotations_1/ffmSFNEG6pM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e343dbba815487713d11b4701698e0a64399fdfc --- /dev/null +++ b/annotations_1/ffmSFNEG6pM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 38.11], [40.0, 73.57], [76.0, 100.09], [100.0, 131.06], [134.0, 138.28], [139.0, 148.49], [149.0, 149.89], [152.0, 168.39], [170.0, 170.77]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 28.87, 0.0, 57.48, 29.57, 0.0, 51.12, 0.0], "audiomae_on_audioset": [null, null, [["music", 66.12], ["throbbing", 8.86], ["didgeridoo", 6.45]], null, null, [["speech", 71.41], ["music", 8.56], ["rumble", 8.33]], null, null, null], "duration": [1.11, 33.57, 24.09, 31.06, 4.28, 9.49, 0.89, 16.39, 0.77]} \ No newline at end of file diff --git a/annotations_1/fgDgZGePcwk_filtered.json b/annotations_1/fgDgZGePcwk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0939206360eae6556047421ba8d83125662e8ecb --- /dev/null +++ b/annotations_1/fgDgZGePcwk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.69], [3.0, 3.96], [4.0, 4.94], [10.0, 10.17], [14.0, 84.94], [85.0, 119.57], [121.0, 120.99]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.69, 0.96, 0.94, 0.17, 70.94, 34.57, -0.01]} \ No newline at end of file diff --git a/annotations_1/fgbjvvCPa88_filtered.json b/annotations_1/fgbjvvCPa88_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b68c0cc217a26d824dfc4f21100a08e7ce2f5074 --- /dev/null +++ b/annotations_1/fgbjvvCPa88_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.78], [17.0, 19.31], [20.0, 24.88], [29.0, 29.08], [30.0, 39.48], [41.0, 41.45], [45.0, 45.44], [50.0, 50.68], [54.0, 54.53], [55.0, 61.42], [68.0, 68.55], [74.0, 74.88], [80.0, 81.35], [82.0, 83.98], [86.0, 91.71], [93.0, 97.5]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true], "silence_prob": [0.0, 54.04, 29.68, 0.0, 28.75, 0.0, 0.0, 0.0, 0.0, 46.15, 0.0, 0.0, 0.0, 0.0, 36.12, 30.6], "audiomae_on_audioset": [null, null, [["music", 66.65], ["speech", 9.76], ["vehicle", 3.53]], null, [["hum", 52.73], ["throbbing", 32.29], ["mains hum", 6.15]], null, null, null, null, [["music", 34.87], ["speech", 16.55], ["musical instrument", 5.11]], null, null, null, null, [["speech", 53.27], ["music", 11.93], ["animal", 3.11]], [["noise", 48.25], ["mains hum", 12.57], ["hum", 9.0]]], "duration": [0.78, 2.31, 4.88, 0.08, 9.48, 0.45, 0.44, 0.68, 0.53, 6.42, 0.55, 0.88, 1.35, 1.98, 5.71, 4.5]} \ No newline at end of file diff --git a/annotations_1/fhK8qpO-iD4_filtered.json b/annotations_1/fhK8qpO-iD4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86f6c45157dfaef64e2a98493e5fbd2cc6d055e7 --- /dev/null +++ b/annotations_1/fhK8qpO-iD4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.33], [5.0, 5.91], [6.0, 9.39], [11.0, 10.86], [12.0, 12.63], [15.0, 16.23], [18.0, 18.23], [19.0, 42.72], [44.0, 47.46], [53.0, 53.65], [55.0, 60.59], [61.0, 64.23], [66.0, 66.21], [68.0, 70.44], [74.0, 74.78], [78.0, 80.7], [81.0, 83.29], [90.0, 90.27], [93.0, 94.9], [105.0, 105.51], [110.0, 113.17], [115.0, 116.21], [117.0, 116.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 30.22, 60.51, 0.0, 99.99, 91.13, 0.0, 79.94, 0.0, 67.51, 47.43, 0.0, 0.0, 0.0, 32.03, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 77.44], ["throbbing", 4.87], ["hum", 2.27]], null, null, null, null, null, null, null, null, [["music", 65.39], ["musical instrument", 3.37], ["synthesizer", 3.24]], null, null, null, [["music", 60.98], ["throbbing", 15.01], ["hum", 4.98]], null, null], "duration": [1.33, 0.91, 3.39, -0.14, 0.63, 1.23, 0.23, 23.72, 3.46, 0.65, 5.59, 3.23, 0.21, 2.44, 0.78, 2.7, 2.29, 0.27, 1.9, 0.51, 3.17, 1.21, -0.01]} \ No newline at end of file diff --git a/annotations_1/fi7cppyGPPw_filtered.json b/annotations_1/fi7cppyGPPw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc6f9f2c73938b031d1fbdfc9bbc2ab83213dbca --- /dev/null +++ b/annotations_1/fi7cppyGPPw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.32], [19.0, 20.39], [21.0, 21.91], [28.0, 28.73], [34.0, 35.11], [38.0, 38.18], [39.0, 41.32], [45.0, 45.54], [48.0, 48.51], [51.0, 51.33], [53.0, 54.4], [55.0, 55.75], [56.0, 60.1], [61.0, 61.11], [64.0, 65.04], [66.0, 67.14], [71.0, 71.98], [75.0, 75.17], [76.0, 76.27], [79.0, 85.63], [91.0, 94.26], [102.0, 163.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 0.0, 0.0, 37.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.44, 47.7, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.93], ["fart", 9.46], ["inside, small room", 2.43]], null, null, null, null, null, null, [["speech", 92.89], ["burst, pop", 1.06], ["explosion", 1.0]], [["fart", 39.03], ["speech", 27.45], ["clip-clop", 5.89]], null], "duration": [1.32, 1.39, 0.91, 0.73, 1.11, 0.18, 2.32, 0.54, 0.51, 0.33, 1.4, 0.75, 4.1, 0.11, 1.04, 1.14, 0.98, 0.17, 0.27, 6.63, 3.26, 61.07]} \ No newline at end of file diff --git a/annotations_1/fkiY6TBT4mo_filtered.json b/annotations_1/fkiY6TBT4mo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..010e2910f1ff5e642da0b72deb4d7f7be711bca1 --- /dev/null +++ b/annotations_1/fkiY6TBT4mo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.59], [2.0, 2.88], [4.0, 4.7], [5.0, 6.67], [8.0, 13.9], [15.0, 15.3], [16.0, 29.73], [33.0, 33.0], [34.0, 35.26], [38.0, 38.8], [40.0, 40.95], [42.0, 42.85], [47.0, 48.02], [50.0, 49.98], [52.0, 52.83], [57.0, 58.16], [61.0, 62.41], [64.0, 66.24], [67.0, 73.6], [74.0, 76.82], [79.0, 81.46], [83.0, 82.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 57.72, 0.0, 50.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 72.46, 61.18, 85.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.41, 0.88, 0.7, 1.67, 5.9, 0.3, 13.73, 0.0, 1.26, 0.8, 0.95, 0.85, 1.02, -0.02, 0.83, 1.16, 1.41, 2.24, 6.6, 2.82, 2.46, -0.07]} \ No newline at end of file diff --git a/annotations_1/fmMPmWO6b4E_filtered.json b/annotations_1/fmMPmWO6b4E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da1001f034c14273c33524713e05854e1825f5c9 --- /dev/null +++ b/annotations_1/fmMPmWO6b4E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 101.33], [103.0, 127.48], [129.0, 151.29]], "keep_status": [false, true, true], "silence_prob": [0.0, 33.17, 31.71], "audiomae_on_audioset": [null, [["music", 44.09], ["throbbing", 10.47], ["whack, thwack", 8.66]], [["music", 29.21], ["whack, thwack", 23.64], ["mosquito", 8.59]]], "duration": [92.33, 24.48, 22.29]} \ No newline at end of file diff --git a/annotations_1/fmRWWrBqiJE_filtered.json b/annotations_1/fmRWWrBqiJE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adfaf2292993cdd4caa7bcb438a4d3ca6a2ffc53 --- /dev/null +++ b/annotations_1/fmRWWrBqiJE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.36], [17.0, 26.5], [27.0, 28.49], [32.0, 38.45], [42.0, 66.56], [68.0, 85.11], [87.0, 86.95], [87.0, 87.4], [89.0, 89.77], [91.0, 161.03], [166.0, 166.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [70.44, 94.95, 0.0, 74.76, 91.81, 71.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [11.36, 9.5, 1.49, 6.45, 24.56, 17.11, -0.05, 0.4, 0.77, 70.03, 0.48]} \ No newline at end of file diff --git a/annotations_1/fn5dXUu_qxM_filtered.json b/annotations_1/fn5dXUu_qxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c987772d9f4be6d4dd929ea39e052a2e3a2cabe --- /dev/null +++ b/annotations_1/fn5dXUu_qxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 43.87], [45.0, 46.52], [51.0, 52.1], [53.0, 54.01], [54.0, 61.37], [62.0, 62.33], [67.0, 68.79], [79.0, 82.09], [85.0, 84.57], [85.0, 85.06], [87.0, 89.38], [91.0, 94.69], [97.0, 97.46], [101.0, 104.11], [107.0, 107.64], [108.0, 109.49], [116.0, 116.8], [120.0, 120.21], [131.0, 132.49], [133.0, 134.7], [136.0, 138.91], [143.0, 144.68], [147.0, 150.13], [151.0, 152.19], [153.0, 154.6], [179.0, 180.64], [183.0, 184.38], [217.0, 217.54], [219.0, 219.6], [224.0, 224.46], [227.0, 227.65], [230.0, 229.78], [235.0, 235.74], [237.0, 239.8], [240.0, 240.58], [252.0, 252.0], [253.0, 253.84], [259.0, 261.32], [265.0, 265.4], [266.0, 266.72]], "keep_status": [true, false, false, false, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.31, 0.0, 0.0, 0.0, 43.98, 0.0, 0.0, 44.81, 0.0, 0.0, 95.09, 91.64, 0.0, 43.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.22, 0.0, 81.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0], "audiomae_on_audioset": [[["insect", 26.21], ["fly, housefly", 22.97], ["mosquito", 15.69]], null, null, null, [["hum", 34.82], ["mains hum", 20.05], ["dishes, pots, and pans", 4.92]], null, null, [["speech", 39.63], ["whale vocalization", 13.57], ["chirp tone", 7.68]], null, null, null, null, null, [["speech", 24.16], ["hum", 20.31], ["mains hum", 14.24]], null, null, null, null, null, null, [["speech", 43.18], ["music", 13.03], ["electronic music", 3.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.87, 1.52, 1.1, 1.01, 7.37, 0.33, 1.79, 3.09, -0.43, 0.06, 2.38, 3.69, 0.46, 3.11, 0.64, 1.49, 0.8, 0.21, 1.49, 1.7, 2.91, 1.68, 3.13, 1.19, 1.6, 1.64, 1.38, 0.54, 0.6, 0.46, 0.65, -0.22, 0.74, 2.8, 0.58, 0.0, 0.84, 2.32, 0.4, 0.72]} \ No newline at end of file diff --git a/annotations_1/fnpUxSXWy6I_filtered.json b/annotations_1/fnpUxSXWy6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1c1fe33c38e6a080dbaa6b6faeb1aa0fee585c9 --- /dev/null +++ b/annotations_1/fnpUxSXWy6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.75], [15.0, 15.03], [15.0, 15.99], [18.0, 18.1], [21.0, 21.12], [27.0, 27.53], [29.0, 28.93], [32.0, 32.66], [55.0, 55.58], [57.0, 57.69], [59.0, 59.49], [60.0, 64.59], [71.0, 71.83], [73.0, 72.94], [74.0, 74.98], [75.0, 77.31], [78.0, 78.98], [85.0, 84.99], [104.0, 104.41], [104.0, 105.9], [106.0, 107.81], [111.0, 111.4], [117.0, 118.18], [119.0, 120.9], [122.0, 123.67], [130.0, 141.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 0.0, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 0.03, 0.99, 0.1, 0.12, 0.53, -0.07, 0.66, 0.58, 0.69, 0.49, 4.59, 0.83, -0.06, 0.98, 2.31, 0.98, -0.01, 0.41, 1.9, 1.81, 0.4, 1.18, 1.9, 1.67, 11.2]} \ No newline at end of file diff --git a/annotations_1/fo0KBFhChFU_filtered.json b/annotations_1/fo0KBFhChFU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..840163d9fba73610c449db64fbd5e40d611d97ea --- /dev/null +++ b/annotations_1/fo0KBFhChFU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.76], [13.0, 13.73], [17.0, 17.14], [19.0, 20.06], [21.0, 25.51], [27.0, 27.36], [31.0, 32.02], [33.0, 80.27], [82.0, 90.73]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.24, 0.0, 0.0, 0.0, 32.6], "audiomae_on_audioset": [null, null, null, null, [["music", 29.42], ["hum", 16.5], ["throbbing", 11.04]], null, null, null, [["music", 47.85], ["speech", 22.97], ["throbbing", 4.47]]], "duration": [0.76, 0.73, 0.14, 1.06, 4.51, 0.36, 1.02, 47.27, 8.73]} \ No newline at end of file diff --git a/annotations_1/foQnR1eZO-Y_filtered.json b/annotations_1/foQnR1eZO-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dca8d6a91d2765959797122d525f7f15b732da2a --- /dev/null +++ b/annotations_1/foQnR1eZO-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.15], [4.0, 3.86], [12.0, 12.72], [15.0, 15.43], [17.0, 17.93], [20.0, 20.09], [21.0, 22.0], [25.0, 31.31], [33.0, 34.48], [37.0, 38.13], [38.0, 43.93], [45.0, 48.03], [49.0, 49.67], [50.0, 50.19], [61.0, 63.21], [64.0, 64.89], [68.0, 68.27], [69.0, 71.31], [77.0, 82.9], [85.0, 84.97], [92.0, 91.93], [95.0, 95.82], [105.0, 106.47], [110.0, 110.62], [112.0, 113.07], [117.0, 117.81], [128.0, 129.32], [133.0, 134.7], [138.0, 138.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 0.0, 0.0, 42.79, 53.16, 0.0, 0.0, 70.3, 0.0, 0.0, 49.45, 33.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["cough", 19.87], ["speech", 18.83], ["music", 7.78]], null, null, null, null, null, null, [["whale vocalization", 23.58], ["speech", 23.39], ["hum", 7.98]], [["music", 84.67], ["musical instrument", 3.6], ["guitar", 1.98]], null, null, null, null, null, null, null, null, null, null], "duration": [0.15, -0.14, 0.72, 0.43, 0.93, 0.09, 1.0, 6.31, 1.48, 1.13, 5.93, 3.03, 0.67, 0.19, 2.21, 0.89, 0.27, 2.31, 5.9, -0.03, -0.07, 0.82, 1.47, 0.62, 1.07, 0.81, 1.32, 1.7, 0.86]} \ No newline at end of file diff --git a/annotations_1/foV6LGohzBI_filtered.json b/annotations_1/foV6LGohzBI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b12869198bddbf047e8a6aa503997a40e5dd6ebe --- /dev/null +++ b/annotations_1/foV6LGohzBI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 26.32], [28.0, 29.93], [31.0, 44.79], [50.0, 53.87], [61.0, 64.34], [72.0, 74.63], [81.0, 85.41], [106.0, 109.81], [115.0, 131.7], [133.0, 158.09], [159.0, 191.39], [193.0, 208.67]], "keep_status": [false, false, false, false, true, false, true, true, false, true, false, true], "silence_prob": [40.28, 0.0, 35.05, 38.12, 42.84, 38.04, 35.91, 28.85, 29.13, 28.99, 0.0, 28.77], "audiomae_on_audioset": [[["humming", 83.85], ["theremin", 7.14], ["music", 6.58]], null, [["music", 59.83], ["humming", 19.68], ["theremin", 5.13]], [["music", 71.04], ["theremin", 8.75], ["musical instrument", 2.86]], [["music", 50.8], ["guitar", 3.93], ["plucked string instrument", 3.8]], [["music", 48.73], ["carnatic music", 25.66], ["singing", 4.45]], [["music", 49.86], ["tabla", 11.09], ["carnatic music", 6.56]], [["music", 34.5], ["carnatic music", 20.01], ["tabla", 5.86]], [["music", 93.93], ["singing", 0.68], ["didgeridoo", 0.49]], [["music", 64.8], ["singing", 2.44], ["didgeridoo", 1.61]], null, [["music", 58.58], ["gospel music", 3.65], ["didgeridoo", 3.41]]], "duration": [16.32, 1.93, 13.79, 3.87, 3.34, 2.63, 4.41, 3.81, 16.7, 25.09, 32.39, 15.67]} \ No newline at end of file diff --git a/annotations_1/fpK36FZmTFY_filtered.json b/annotations_1/fpK36FZmTFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1ce36b899971538e8cca21b348ce58ff0f49ab8 --- /dev/null +++ b/annotations_1/fpK36FZmTFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.21], [25.0, 25.19], [26.0, 27.19], [28.0, 28.8], [29.0, 33.44], [79.0, 80.57], [81.0, 82.41], [95.0, 99.59], [100.0, 100.33], [101.0, 131.31], [132.0, 141.1], [143.0, 147.38], [148.0, 152.44], [154.0, 154.04], [159.0, 159.09], [167.0, 167.02], [171.0, 171.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.82, 0.0, 0.0, 99.99, 0.0, 0.0, 83.52, 98.1, 99.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 79.36], ["sidetone", 3.72], ["radio", 3.43]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 0.19, 1.19, 0.8, 4.44, 1.57, 1.41, 4.59, 0.33, 30.31, 9.1, 4.38, 4.44, 0.04, 0.09, 0.02, 0.14]} \ No newline at end of file diff --git a/annotations_1/fpwM2-jDwQU_filtered.json b/annotations_1/fpwM2-jDwQU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa7cc2edacd01fc3236fc3d041d2266d2bda6579 --- /dev/null +++ b/annotations_1/fpwM2-jDwQU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 37.42], [44.0, 44.85], [50.0, 50.38], [51.0, 52.86], [59.0, 65.69], [66.0, 65.94], [66.0, 66.01], [67.0, 68.4], [76.0, 76.94], [88.0, 87.83], [96.0, 96.7], [100.0, 103.44], [112.0, 114.91], [117.0, 119.79], [125.0, 126.62], [129.0, 132.0], [135.0, 134.96], [139.0, 151.71], [153.0, 154.97], [156.0, 155.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [31.79, 0.0, 0.0, 0.0, 32.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.57, 31.32, 37.85, 0.0, 51.77, 0.0, 36.05, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 77.6], ["beatboxing", 5.53], ["boing", 2.56]], null, null, null, [["speech", 76.83], ["mains hum", 4.4], ["electric shaver, electric razor", 3.54]], null, null, null, null, null, null, [["whack, thwack", 50.74], ["breaking", 18.13], ["smash, crash", 7.32]], [["speech", 29.62], ["music", 28.26], ["boing", 10.88]], [["music", 26.87], ["hum", 24.04], ["mains hum", 15.14]], null, null, null, [["music", 33.68], ["hum", 22.64], ["mains hum", 13.88]], null, null], "duration": [2.42, 0.85, 0.38, 1.86, 6.69, -0.06, 0.01, 1.4, 0.94, -0.17, 0.7, 3.44, 2.91, 2.79, 1.62, 3.0, -0.04, 12.71, 1.97, -0.13]} \ No newline at end of file diff --git a/annotations_1/fq5JFon-LOs_filtered.json b/annotations_1/fq5JFon-LOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15fb2dda16d91627722bdaab10e551cb38725c33 --- /dev/null +++ b/annotations_1/fq5JFon-LOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [2.0, 2.62], [4.0, 4.85], [7.0, 7.26], [8.0, 8.56], [9.0, 9.66], [11.0, 12.82], [27.0, 27.43], [29.0, 30.1], [31.0, 31.85], [34.0, 34.3], [45.0, 45.08], [46.0, 45.76], [48.0, 48.86], [55.0, 55.02], [56.0, 56.27], [58.0, 59.12], [60.0, 60.62], [79.0, 79.32], [82.0, 82.58], [87.0, 87.67], [89.0, 89.36], [90.0, 90.34], [92.0, 97.46], [98.0, 98.88], [100.0, 100.97], [105.0, 105.17], [107.0, 108.89], [113.0, 114.2], [119.0, 119.15], [120.0, 119.99], [121.0, 121.12], [125.0, 125.37], [127.0, 127.16], [128.0, 129.14], [130.0, 130.5], [134.0, 134.82], [135.0, 135.53], [140.0, 140.16], [141.0, 140.91], [142.0, 141.69], [148.0, 147.83], [149.0, 148.93], [153.0, 153.06], [160.0, 161.03], [168.0, 170.28], [173.0, 173.25], [176.0, 176.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.65, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 56.08], ["music", 30.73], ["thunk", 4.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 17.74], ["speech", 12.15], ["animal", 7.43]], null, null], "duration": [0.51, 0.62, 0.85, 0.26, 0.56, 0.66, 1.82, 0.43, 1.1, 0.85, 0.3, 0.08, -0.24, 0.86, 0.02, 0.27, 1.12, 0.62, 0.32, 0.58, 0.67, 0.36, 0.34, 5.46, 0.88, 0.97, 0.17, 1.89, 1.2, 0.15, -0.01, 0.12, 0.37, 0.16, 1.14, 0.5, 0.82, 0.53, 0.16, -0.09, -0.31, -0.17, -0.07, 0.06, 1.03, 2.28, 0.25, 0.13]} \ No newline at end of file diff --git a/annotations_1/fqKdFZ1jKMY_filtered.json b/annotations_1/fqKdFZ1jKMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3050ff85e2e6cd13bfb0506e86e79ded70adeb20 --- /dev/null +++ b/annotations_1/fqKdFZ1jKMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.36], [13.0, 14.93], [16.0, 20.76], [24.0, 24.09], [26.0, 26.3], [29.0, 29.17], [41.0, 42.33], [48.0, 49.49], [51.0, 53.84], [57.0, 59.86], [64.0, 65.31], [69.0, 71.39], [75.0, 75.76], [77.0, 81.72], [84.0, 92.21], [95.0, 96.67], [98.0, 111.21], [115.0, 118.83], [120.0, 123.16], [125.0, 128.24], [129.0, 132.16], [136.0, 136.17], [140.0, 141.03], [144.0, 153.35], [154.0, 154.85], [155.0, 159.76], [160.0, 159.97]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [34.07, 0.0, 33.02, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 33.38, 0.0, 31.39, 0.0, 31.46, 30.18, 0.0, 29.78, 31.91, 35.78, 30.08, 32.85, 0.0, 0.0, 29.7, 0.0, 28.76, 0.0], "audiomae_on_audioset": [[["music", 49.91], ["throbbing", 20.36], ["frog", 4.3]], null, [["music", 47.04], ["speech", 21.13], ["propeller, airscrew", 2.33]], null, null, null, null, null, null, [["music", 26.96], ["speech", 20.65], ["throbbing", 6.4]], null, [["speech", 64.37], ["music", 10.0], ["vehicle", 4.44]], null, [["fly, housefly", 45.33], ["insect", 39.59], ["mosquito", 10.77]], [["music", 81.21], ["didgeridoo", 5.36], ["musical instrument", 3.4]], null, [["music", 36.96], ["speech", 11.21], ["groan", 6.96]], [["music", 64.42], ["speech", 19.44], ["throbbing", 1.14]], [["music", 63.62], ["throbbing", 2.79], ["sampler", 2.64]], [["speech", 43.16], ["music", 24.47], ["whack, thwack", 6.41]], [["music", 78.63], ["creak", 4.52], ["grunt", 4.27]], null, null, [["music", 73.84], ["speech", 16.62], ["electronic music", 1.43]], null, [["music", 33.03], ["speech", 22.94], ["hum", 15.15]], null], "duration": [9.36, 1.93, 4.76, 0.09, 0.3, 0.17, 1.33, 1.49, 2.84, 2.86, 1.31, 2.39, 0.76, 4.72, 8.21, 1.67, 13.21, 3.83, 3.16, 3.24, 3.16, 0.17, 1.03, 9.35, 0.85, 4.76, -0.03]} \ No newline at end of file diff --git a/annotations_1/fqnhqkXclUk_filtered.json b/annotations_1/fqnhqkXclUk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5087727e2b2475d4efbe7585a9af22a9c2f70917 --- /dev/null +++ b/annotations_1/fqnhqkXclUk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 48.91], [52.0, 51.98], [52.0, 52.02], [53.0, 66.51], [67.0, 67.31], [67.0, 67.37], [69.0, 108.57], [109.0, 112.67], [113.0, 113.48], [115.0, 119.42], [120.0, 121.2], [122.0, 122.47], [125.0, 141.66], [144.0, 170.8], [171.0, 172.44], [174.0, 174.8]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.2, 0.0, 0.0, 0.0, 37.12, 0.0, 57.48, 0.0, 0.0, 35.64, 33.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 54.42], ["speech", 20.04], ["didgeridoo", 4.03]], null, null, null, [["speech", 21.21], ["mosquito", 18.37], ["fly, housefly", 14.96]], null, null, null, null, [["music", 30.88], ["fireworks", 11.78], ["speech", 11.57]], [["music", 35.28], ["fly, housefly", 5.39], ["vehicle", 4.32]], null, null], "duration": [31.91, -0.02, 0.02, 13.51, 0.31, 0.37, 39.57, 3.67, 0.48, 4.42, 1.2, 0.47, 16.66, 26.8, 1.44, 0.8]} \ No newline at end of file diff --git a/annotations_1/fr93wwtiKQM_filtered.json b/annotations_1/fr93wwtiKQM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..888a60bd2623c06bb2acb67cd2d45c9889aba7c9 --- /dev/null +++ b/annotations_1/fr93wwtiKQM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.99], [5.0, 6.32], [7.0, 7.91], [11.0, 11.47], [14.0, 15.35], [17.0, 18.47], [21.0, 22.54], [24.0, 24.56], [26.0, 28.04], [29.0, 33.17], [34.0, 35.51], [37.0, 39.56], [41.0, 52.57], [53.0, 62.56], [66.0, 92.85], [95.0, 106.29], [108.0, 136.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 99.99, 63.31, 65.91, 56.63, 61.67, 31.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.96], ["hum", 8.39], ["mains hum", 7.65]]], "duration": [-0.01, 1.32, 0.91, 0.47, 1.35, 1.47, 1.54, 0.56, 2.04, 4.17, 1.51, 2.56, 11.57, 9.56, 26.85, 11.29, 28.24]} \ No newline at end of file diff --git a/annotations_1/frV4tvni8H0_filtered.json b/annotations_1/frV4tvni8H0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a17d3838378b6e5167c4dd6387782f23954c9d3 --- /dev/null +++ b/annotations_1/frV4tvni8H0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.59], [16.0, 16.41], [18.0, 18.1], [23.0, 23.23], [24.0, 24.87], [27.0, 27.41], [29.0, 33.34], [36.0, 43.6], [44.0, 44.44], [45.0, 46.01], [48.0, 57.05], [63.0, 64.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.83, 0.0, 0.0, 0.0, 0.0, 0.0, 29.39, 28.83, 0.0, 0.0, 29.38, 0.0], "audiomae_on_audioset": [[["music", 61.69], ["speech", 6.77], ["sheep", 6.73]], null, null, null, null, null, [["music", 74.47], ["static", 1.93], ["didgeridoo", 1.91]], [["music", 79.03], ["static", 1.7], ["hum", 1.54]], null, null, [["music", 77.62], ["singing", 4.23], ["rhythm and blues", 1.41]], null], "duration": [3.59, 0.41, 0.1, 0.23, 0.87, 0.41, 4.34, 7.6, 0.44, 1.01, 9.05, 1.57]} \ No newline at end of file diff --git a/annotations_1/frZrAIZrOI8_filtered.json b/annotations_1/frZrAIZrOI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c70f2e3cbe1e969c2ac72d9de33f686a499b0104 --- /dev/null +++ b/annotations_1/frZrAIZrOI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.66], [8.0, 8.07], [16.0, 22.45], [23.0, 24.36], [31.0, 31.41], [43.0, 42.75], [49.0, 49.28], [52.0, 52.68], [55.0, 55.51], [62.0, 62.11], [64.0, 65.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.38], ["speech", 35.03], ["musical instrument", 3.5]], null, null, null, null, null, null, null, null], "duration": [-0.34, 0.07, 6.45, 1.36, 0.41, -0.25, 0.28, 0.68, 0.51, 0.11, 1.7]} \ No newline at end of file diff --git a/annotations_1/ftDkeswkEYU_filtered.json b/annotations_1/ftDkeswkEYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d9f957ca80d83362615dd9e7726941717cbb2b2 --- /dev/null +++ b/annotations_1/ftDkeswkEYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.16], [10.0, 13.2], [15.0, 18.12], [20.0, 22.84], [27.0, 29.76], [38.0, 38.67], [39.0, 40.98], [45.0, 56.56], [59.0, 58.99], [60.0, 61.13], [62.0, 75.14], [80.0, 83.59], [86.0, 92.13], [98.0, 126.86], [127.0, 130.5], [135.0, 134.96], [135.0, 135.06], [135.0, 135.19], [135.0, 136.85], [138.0, 139.77], [141.0, 166.5], [172.0, 172.98], [177.0, 177.45], [178.0, 191.51], [194.0, 197.24], [198.0, 200.97], [201.0, 201.04], [201.0, 203.54], [204.0, 211.96], [214.0, 219.87], [222.0, 223.26], [224.0, 237.84], [240.0, 245.86], [246.0, 249.4], [250.0, 250.87], [253.0, 256.07]], "keep_status": [true, false, true, true, false, false, false, true, false, false, false, true, false, true, true, false, false, false, false, false, true, false, false, false, true, true, false, true, true, true, false, true, false, false, false, false], "silence_prob": [44.6, 44.96, 40.92, 30.19, 32.03, 0.0, 0.0, 33.0, 0.0, 0.0, 33.34, 46.19, 31.8, 31.34, 32.46, 0.0, 0.0, 0.0, 0.0, 0.0, 35.28, 0.0, 0.0, 33.56, 30.68, 31.63, 0.0, 29.45, 29.22, 29.23, 0.0, 30.5, 30.68, 58.05, 0.0, 54.56], "audiomae_on_audioset": [[["music", 24.75], ["frog", 16.1], ["animal", 6.72]], [["music", 32.44], ["speech", 28.51], ["quack", 11.4]], [["music", 29.52], ["whale vocalization", 14.82], ["frog", 3.21]], [["music", 34.27], ["speech", 28.81], ["throbbing", 5.67]], [["speech", 51.09], ["music", 18.41], ["throbbing", 5.38]], null, null, [["hum", 31.54], ["music", 15.24], ["throbbing", 14.35]], null, null, [["fly, housefly", 56.22], ["insect", 18.12], ["mosquito", 9.71]], [["music", 30.45], ["frog", 11.77], ["animal", 10.78]], [["speech", 47.73], ["music", 18.0], ["explosion", 4.73]], [["throbbing", 28.1], ["speech", 22.35], ["hum", 18.2]], [["music", 29.13], ["speech", 24.43], ["throbbing", 5.72]], null, null, null, null, null, [["throbbing", 24.93], ["music", 13.39], ["quack", 12.16]], null, null, [["music", 55.21], ["speech", 13.7], ["hum", 7.25]], [["speech", 25.04], ["music", 14.97], ["fly, housefly", 5.39]], [["music", 26.15], ["hum", 13.2], ["throbbing", 6.34]], null, [["music", 36.58], ["whale vocalization", 8.79], ["didgeridoo", 5.36]], [["vehicle", 22.98], ["hum", 17.39], ["car", 13.78]], [["music", 31.58], ["vehicle", 15.07], ["car", 6.38]], null, [["hum", 29.72], ["mains hum", 18.48], ["throbbing", 15.49]], [["speech", 60.99], ["music", 6.44], ["explosion", 4.55]], null, null, null], "duration": [2.16, 3.2, 3.12, 2.84, 2.76, 0.67, 1.98, 11.56, -0.01, 1.13, 13.14, 3.59, 6.13, 28.86, 3.5, -0.04, 0.06, 0.19, 1.85, 1.77, 25.5, 0.98, 0.45, 13.51, 3.24, 2.97, 0.04, 2.54, 7.96, 5.87, 1.26, 13.84, 5.86, 3.4, 0.87, 3.07]} \ No newline at end of file diff --git a/annotations_1/fuCe9uaRx_0_filtered.json b/annotations_1/fuCe9uaRx_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ab8abaeb6661cf581e8ffd8c186f005f1c04742 --- /dev/null +++ b/annotations_1/fuCe9uaRx_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 31.65], [32.0, 86.68], [88.0, 91.27], [92.0, 96.03], [96.0, 96.92], [98.0, 98.36], [101.0, 106.46]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 62.99, 34.26, 0.0, 0.0, 44.52], "audiomae_on_audioset": [null, null, null, [["speech", 82.08], ["inside, small room", 1.65], ["sidetone", 1.48]], null, null, [["throbbing", 49.51], ["hum", 26.68], ["heart sounds, heartbeat", 5.74]]], "duration": [0.65, 54.68, 3.27, 4.03, 0.92, 0.36, 5.46]} \ No newline at end of file diff --git a/annotations_1/futultLrWms_filtered.json b/annotations_1/futultLrWms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6021c4d9ae3e3a844865e11966615026e62d89ce --- /dev/null +++ b/annotations_1/futultLrWms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [5.0, 9.26], [14.0, 26.11], [28.0, 30.72], [32.0, 35.51], [41.0, 43.43], [45.0, 47.93], [50.0, 50.84], [51.0, 52.37], [55.0, 54.82], [58.0, 60.79], [63.0, 63.41], [68.0, 68.5], [72.0, 72.82], [74.0, 79.96], [84.0, 90.68], [94.0, 98.0], [102.0, 107.92], [109.0, 109.65], [112.0, 115.01], [117.0, 118.13], [122.0, 123.33], [130.0, 131.08], [134.0, 134.74], [138.0, 140.53], [143.0, 148.95], [150.0, 150.52], [152.0, 153.93], [157.0, 157.32], [159.0, 182.55], [186.0, 187.39], [195.0, 196.18], [199.0, 207.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 86.82, 70.44, 72.31, 84.98, 82.79, 70.72, 0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 0.0, 52.92, 39.67, 40.54, 41.66, 0.0, 47.82, 0.0, 0.0, 0.0, 0.0, 33.24, 32.51, 0.0, 0.0, 0.0, 34.61, 0.0, 0.0, 32.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 81.58], ["synthesizer", 3.43], ["ambient music", 1.6]], [["music", 70.96], ["synthesizer", 4.39], ["didgeridoo", 4.16]], [["hum", 49.33], ["throbbing", 13.65], ["music", 13.54]], null, [["music", 64.82], ["singing bowl", 4.39], ["synthesizer", 4.09]], null, null, null, null, [["music", 68.04], ["speech", 2.02], ["didgeridoo", 1.79]], [["music", 78.92], ["hum", 2.08], ["throbbing", 1.5]], null, null, null, [["music", 70.83], ["throbbing", 4.99], ["hum", 4.52]], null, null, [["hum", 39.37], ["music", 18.19], ["mains hum", 12.68]]], "duration": [0.51, 4.26, 12.11, 2.72, 3.51, 2.43, 2.93, 0.84, 1.37, -0.18, 2.79, 0.41, 0.5, 0.82, 5.96, 6.68, 4.0, 5.92, 0.65, 3.01, 1.13, 1.33, 1.08, 0.74, 2.53, 5.95, 0.52, 1.93, 0.32, 23.55, 1.39, 1.18, 8.99]} \ No newline at end of file diff --git a/annotations_1/fuwfQJrMgLI_filtered.json b/annotations_1/fuwfQJrMgLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f488a288de783335325be26454d739f95edc1c8f --- /dev/null +++ b/annotations_1/fuwfQJrMgLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.13], [2.0, 3.67], [6.0, 11.7], [12.0, 13.34], [22.0, 25.08], [47.0, 47.26], [57.0, 61.15], [79.0, 79.27], [80.0, 80.74], [83.0, 83.73], [90.0, 91.08], [91.0, 93.53], [96.0, 96.9], [98.0, 102.32], [106.0, 107.23], [110.0, 116.33], [122.0, 123.58], [125.0, 125.56]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 32.3, 0.0, 31.38, 0.0, 31.19, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 45.27, 0.0, 54.56, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 18.89], ["speech", 14.7], ["sheep", 14.03]], null, [["moo", 40.97], ["cattle, bovinae", 39.28], ["livestock, farm animals, working animals", 19.24]], null, [["livestock, farm animals, working animals", 70.77], ["cattle, bovinae", 17.31], ["moo", 9.0]], null, null, null, null, null, null, [["music", 31.39], ["speech", 13.09], ["glass", 9.82]], null, null, null, null], "duration": [0.13, 1.67, 5.7, 1.34, 3.08, 0.26, 4.15, 0.27, 0.74, 0.73, 1.08, 2.53, 0.9, 4.32, 1.23, 6.33, 1.58, 0.56]} \ No newline at end of file diff --git a/annotations_1/fvHgXzOY12Y_filtered.json b/annotations_1/fvHgXzOY12Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3e82862e94038892bd54a05ccfa9edf48090429 --- /dev/null +++ b/annotations_1/fvHgXzOY12Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.59], [15.0, 16.31], [18.0, 23.41], [29.0, 29.79], [31.0, 47.33], [51.0, 51.24], [53.0, 72.81], [85.0, 100.4]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 44.34, 0.0, 35.95, 0.0, 31.47, 33.91], "audiomae_on_audioset": [null, null, [["music", 74.09], ["musical instrument", 5.19], ["synthesizer", 4.15]], null, [["music", 51.29], ["synthesizer", 12.0], ["musical instrument", 4.73]], null, [["music", 69.83], ["speech", 7.19], ["didgeridoo", 2.31]], [["music", 73.02], ["beatboxing", 5.32], ["singing", 2.86]]], "duration": [-0.41, 1.31, 5.41, 0.79, 16.33, 0.24, 19.81, 15.4]} \ No newline at end of file diff --git a/annotations_1/fvNfhUZ-5z8_filtered.json b/annotations_1/fvNfhUZ-5z8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e78c3cfd357394e204ea52ee2d948119c1843789 --- /dev/null +++ b/annotations_1/fvNfhUZ-5z8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 47.26], [49.0, 54.01], [55.0, 57.18], [63.0, 64.47], [66.0, 68.2], [69.0, 69.74], [75.0, 76.52], [77.0, 79.74], [81.0, 81.35], [82.0, 83.07], [86.0, 86.04], [88.0, 96.28], [97.0, 99.2], [103.0, 104.26], [106.0, 107.3], [108.0, 109.56], [114.0, 114.29], [116.0, 117.09], [123.0, 124.38], [125.0, 125.83], [128.0, 130.64], [138.0, 155.46]], "keep_status": [true, true, true, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [32.92, 34.82, 46.09, 0.0, 49.36, 0.0, 0.0, 49.22, 0.0, 0.0, 0.0, 53.47, 41.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.19, 31.96], "audiomae_on_audioset": [[["hum", 24.94], ["mains hum", 24.57], ["music", 19.84]], [["music", 31.89], ["knock", 24.02], ["speech", 7.45]], [["hum", 15.1], ["speech", 12.63], ["hiccup", 9.13]], null, [["speech", 43.65], ["music", 9.24], ["hum", 8.99]], null, null, [["speech", 28.14], ["music", 8.28], ["didgeridoo", 7.28]], null, null, null, null, [["speech", 29.02], ["music", 24.47], ["synthesizer", 5.49]], null, null, null, null, null, null, null, [["music", 25.9], ["hum", 12.16], ["mains hum", 9.01]], [["fly, housefly", 49.23], ["insect", 22.31], ["buzz", 10.27]]], "duration": [16.26, 5.01, 2.18, 1.47, 2.2, 0.74, 1.52, 2.74, 0.35, 1.07, 0.04, 8.28, 2.2, 1.26, 1.3, 1.56, 0.29, 1.09, 1.38, 0.83, 2.64, 17.46]} \ No newline at end of file diff --git a/annotations_1/fwITaMQj7S8_filtered.json b/annotations_1/fwITaMQj7S8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f57cb0bbb1fdc0328b1fc25de2b8b8dafea09f9a --- /dev/null +++ b/annotations_1/fwITaMQj7S8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 55.31]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [1.31]} \ No newline at end of file diff --git a/annotations_1/fwZw8vujVMU_filtered.json b/annotations_1/fwZw8vujVMU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38585f18734427c4c849a256883dcdc951296869 --- /dev/null +++ b/annotations_1/fwZw8vujVMU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.78], [30.0, 31.62], [42.0, 47.29], [59.0, 59.14], [70.0, 72.32], [75.0, 78.44], [79.0, 105.04], [107.0, 107.97], [112.0, 113.88], [117.0, 130.74], [131.0, 132.0], [142.0, 145.88], [151.0, 155.58], [156.0, 156.74], [158.0, 163.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 33.97, 0.0, 34.78, 34.43, 38.63, 0.0, 0.0, 33.81, 0.0, 31.74, 39.25, 0.0, 30.55], "audiomae_on_audioset": [null, null, [["music", 64.33], ["throbbing", 4.65], ["hum", 3.76]], null, [["music", 42.03], ["didgeridoo", 29.36], ["hum", 5.57]], [["music", 58.39], ["hum", 7.72], ["throbbing", 4.81]], [["music", 53.79], ["hum", 18.2], ["throbbing", 6.45]], null, null, [["music", 83.09], ["electronic music", 3.55], ["throbbing", 2.9]], null, [["music", 20.09], ["boing", 18.5], ["groan", 9.56]], [["music", 34.98], ["throbbing", 20.55], ["hum", 9.5]], null, [["music", 73.62], ["speech", 8.53], ["electronic music", 3.7]]], "duration": [0.78, 1.62, 5.29, 0.14, 2.32, 3.44, 26.04, 0.97, 1.88, 13.74, 1.0, 3.88, 4.58, 0.74, 5.92]} \ No newline at end of file diff --git a/annotations_1/fwkB6wAxNVM_filtered.json b/annotations_1/fwkB6wAxNVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..942acc6b9a0dd777b829b763d65e917fd71be354 --- /dev/null +++ b/annotations_1/fwkB6wAxNVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [3.0, 7.38], [8.0, 9.66], [11.0, 18.08], [18.0, 24.11], [24.0, 44.44], [45.0, 94.36], [97.0, 113.44], [115.0, 115.57]], "keep_status": [false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 66.88, 0.0, 34.29, 32.66, 33.62, 0.0, 34.7, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 42.6], ["didgeridoo", 18.33], ["timpani", 6.03]], [["didgeridoo", 60.86], ["music", 21.6], ["speech", 7.05]], [["music", 84.89], ["trombone", 3.17], ["brass instrument", 1.77]], null, [["music", 78.98], ["video game music", 1.82], ["vibraphone", 1.73]], null], "duration": [1.05, 4.38, 1.66, 7.08, 6.11, 20.44, 49.36, 16.44, 0.57]} \ No newline at end of file diff --git a/annotations_1/fwkzz6A_Qv4_filtered.json b/annotations_1/fwkzz6A_Qv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e62288284e8d9b58a89e906a7dc03c8775f052eb --- /dev/null +++ b/annotations_1/fwkzz6A_Qv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.46], [9.0, 12.43], [13.0, 14.61], [15.0, 16.71], [18.0, 18.87], [20.0, 20.93], [26.0, 26.59], [29.0, 28.66], [29.0, 29.94], [34.0, 33.67], [36.0, 35.72], [37.0, 37.08], [38.0, 38.38], [43.0, 44.19], [52.0, 53.05], [54.0, 54.33], [55.0, 55.85], [59.0, 59.24], [62.0, 62.18], [63.0, 64.4], [72.0, 72.86], [76.0, 77.09], [79.0, 79.93], [81.0, 82.19], [83.0, 83.94], [85.0, 89.04], [93.0, 93.6], [95.0, 94.69], [95.0, 96.69], [99.0, 99.94], [101.0, 101.66], [104.0, 104.6], [109.0, 115.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.46, 3.43, 1.61, 1.71, 0.87, 0.93, 0.59, -0.34, 0.94, -0.33, -0.28, 0.08, 0.38, 1.19, 1.05, 0.33, 0.85, 0.24, 0.18, 1.4, 0.86, 1.09, 0.93, 1.19, 0.94, 4.04, 0.6, -0.31, 1.69, 0.94, 0.66, 0.6, 6.55]} \ No newline at end of file diff --git a/annotations_1/fxBoqr7OicA_filtered.json b/annotations_1/fxBoqr7OicA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1548813a403242d1e6d9c70468866f185bdce5d1 --- /dev/null +++ b/annotations_1/fxBoqr7OicA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.66], [16.0, 20.87], [26.0, 26.38], [34.0, 34.15], [35.0, 34.62], [35.0, 37.15], [38.0, 39.95], [41.0, 42.77], [46.0, 51.9], [58.0, 57.82], [62.0, 62.92], [64.0, 71.73], [72.0, 74.48], [85.0, 86.85], [88.0, 88.23], [91.0, 91.45], [94.0, 98.07], [101.0, 101.75], [114.0, 114.84], [117.0, 119.11], [126.0, 127.38], [130.0, 131.53]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.98, 0.0, 0.0, 0.0, 57.17, 0.0, 0.0, 39.67, 0.0, 0.0, 52.39, 33.43, 0.0, 0.0, 0.0, 39.83, 0.0, 0.0, 54.83, 0.0, 0.0], "audiomae_on_audioset": [null, [["thunk", 39.97], ["telephone", 14.26], ["door", 7.84]], null, null, null, null, null, null, [["speech", 44.74], ["music", 34.48], ["didgeridoo", 6.07]], null, null, null, [["cowbell", 38.94], ["speech", 17.07], ["animal", 14.44]], null, null, null, [["speech", 43.25], ["beatboxing", 18.84], ["music", 10.46]], null, null, null, null, null], "duration": [-0.34, 4.87, 0.38, 0.15, -0.38, 2.15, 1.95, 1.77, 5.9, -0.18, 0.92, 7.73, 2.48, 1.85, 0.23, 0.45, 4.07, 0.75, 0.84, 2.11, 1.38, 1.53]} \ No newline at end of file diff --git a/annotations_1/fxVsGcxK1nc_filtered.json b/annotations_1/fxVsGcxK1nc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3af05747bf10bcb69168b7e5244c4fd1caa9620 --- /dev/null +++ b/annotations_1/fxVsGcxK1nc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.75], [14.0, 76.59], [78.0, 83.07], [84.0, 85.33], [86.0, 89.73], [91.0, 92.38], [95.0, 102.39]], "keep_status": [true, false, true, false, true, false, true], "silence_prob": [30.65, 0.0, 31.38, 0.0, 40.33, 0.0, 29.32], "audiomae_on_audioset": [[["explosion", 29.51], ["eruption", 14.48], ["hum", 13.42]], null, [["vehicle", 15.13], ["rumble", 11.65], ["creak", 10.69]], null, [["hum", 13.26], ["rumble", 9.79], ["creak", 8.91]], null, [["explosion", 27.86], ["speech", 13.72], ["music", 12.73]]], "duration": [6.75, 62.59, 5.07, 1.33, 3.73, 1.38, 7.39]} \ No newline at end of file diff --git a/annotations_1/fyOv0TB4lXU_filtered.json b/annotations_1/fyOv0TB4lXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7e797cedb2ba4d81079311cff9ac6f294e0120c --- /dev/null +++ b/annotations_1/fyOv0TB4lXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.48], [2.0, 2.0], [5.0, 5.36], [12.0, 12.9], [14.0, 14.13], [27.0, 38.33], [39.0, 39.87], [45.0, 45.67], [46.0, 49.79], [54.0, 58.01], [58.0, 58.72], [60.0, 63.09], [65.0, 65.65], [67.0, 67.9], [69.0, 69.47], [71.0, 72.0], [73.0, 74.09], [75.0, 75.74], [83.0, 83.34], [84.0, 84.86], [86.0, 91.1], [91.0, 93.99], [95.0, 95.44], [113.0, 114.24], [117.0, 117.1], [135.0, 135.57], [139.0, 142.43], [143.0, 146.13], [149.0, 153.64], [157.0, 157.74], [159.0, 159.09], [176.0, 176.49], [183.0, 184.69], [188.0, 190.16]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.17, 0.0, 0.0, 32.38, 34.72, 0.0, 32.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.03, 31.41, 0.0, 0.0, 0.0, 0.0, 29.91, 32.36, 32.0, 0.0, 0.0, 0.0, 0.0, 31.32], "audiomae_on_audioset": [null, null, null, null, null, [["music", 36.49], ["speech", 35.62], ["boing", 9.05]], null, null, [["cattle, bovinae", 47.85], ["moo", 33.61], ["livestock, farm animals, working animals", 13.35]], [["frog", 26.23], ["animal", 12.25], ["chirp, tweet", 9.65]], null, [["animal", 32.95], ["wild animals", 9.68], ["whale vocalization", 8.84]], null, null, null, null, null, null, null, null, [["boing", 70.37], ["moo", 7.13], ["cattle, bovinae", 5.39]], [["boing", 23.31], ["speech", 14.65], ["cattle, bovinae", 9.66]], null, null, null, null, [["music", 27.24], ["carnatic music", 7.13], ["musical instrument", 5.76]], [["boing", 21.88], ["music", 18.55], ["music for children", 9.33]], [["boing", 45.07], ["sheep", 8.97], ["music", 8.25]], null, null, null, null, [["music", 54.49], ["speech", 8.37], ["musical instrument", 1.97]]], "duration": [0.48, 0.0, 0.36, 0.9, 0.13, 11.33, 0.87, 0.67, 3.79, 4.01, 0.72, 3.09, 0.65, 0.9, 0.47, 1.0, 1.09, 0.74, 0.34, 0.86, 5.1, 2.99, 0.44, 1.24, 0.1, 0.57, 3.43, 3.13, 4.64, 0.74, 0.09, 0.49, 1.69, 2.16]} \ No newline at end of file diff --git a/annotations_1/fz_9uPJnGEQ_filtered.json b/annotations_1/fz_9uPJnGEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3643de0711122e2eb8c6d27d383ccfb0dc83d0e8 --- /dev/null +++ b/annotations_1/fz_9uPJnGEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.36], [6.0, 7.64], [9.0, 11.48], [12.0, 23.06], [24.0, 24.39], [25.0, 29.05], [29.0, 29.62], [30.0, 30.32], [31.0, 32.56], [34.0, 39.7], [40.0, 41.86], [42.0, 43.66], [44.0, 45.64], [47.0, 49.87], [51.0, 55.86], [58.0, 58.77], [59.0, 60.35], [61.0, 62.46], [64.0, 65.06], [67.0, 66.93], [68.0, 70.09], [73.0, 74.28], [75.0, 75.44], [76.0, 76.3], [78.0, 78.09], [79.0, 78.68], [79.0, 79.83], [82.0, 82.38], [83.0, 83.88], [84.0, 85.23], [87.0, 87.17], [88.0, 88.84], [89.0, 89.33], [90.0, 90.63], [91.0, 92.96], [94.0, 95.62], [96.0, 99.22], [102.0, 103.98], [105.0, 108.11], [110.0, 110.62], [111.0, 112.01], [112.0, 112.87], [113.0, 115.7], [116.0, 123.18], [124.0, 125.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [91.13, 0.0, 97.92, 96.89, 0.0, 78.72, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 0.0, 80.82, 49.82, 0.0, 0.0, 0.0, 0.0, 0.0, 41.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 0.0, 73.82, 0.0, 0.0, 0.0, 81.71, 46.19, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 40.27], ["cattle, bovinae", 18.98], ["moo", 15.45]], null, null, null, null, null, [["music", 45.31], ["speech", 18.81], ["theremin", 3.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.9], ["crow", 15.76], ["caw", 8.57]], null], "duration": [2.36, 1.64, 2.48, 11.06, 0.39, 4.05, 0.62, 0.32, 1.56, 5.7, 1.86, 1.66, 1.64, 2.87, 4.86, 0.77, 1.35, 1.46, 1.06, -0.07, 2.09, 1.28, 0.44, 0.3, 0.09, -0.32, 0.83, 0.38, 0.88, 1.23, 0.17, 0.84, 0.33, 0.63, 1.96, 1.62, 3.22, 1.98, 3.11, 0.62, 1.01, 0.87, 2.7, 7.18, 1.25]} \ No newline at end of file diff --git a/annotations_1/g0nhEzoCkJo_filtered.json b/annotations_1/g0nhEzoCkJo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e190ef944fd23ed6d514d2488a68ba4c4c280a26 --- /dev/null +++ b/annotations_1/g0nhEzoCkJo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[89.0, 93.16], [94.0, 114.67], [117.0, 117.75], [119.0, 122.08], [123.0, 129.0], [130.0, 131.28]], "keep_status": [true, true, false, true, false, false], "silence_prob": [38.51, 32.24, 0.0, 29.39, 55.89, 0.0], "audiomae_on_audioset": [[["whale vocalization", 13.65], ["livestock, farm animals, working animals", 11.27], ["music", 10.4]], [["music", 27.56], ["cattle, bovinae", 14.43], ["livestock, farm animals, working animals", 14.33]], null, [["mosquito", 22.21], ["insect", 18.74], ["fly, housefly", 16.96]], null, null], "duration": [4.16, 20.67, 0.75, 3.08, 6.0, 1.28]} \ No newline at end of file diff --git a/annotations_1/g1jO4_HQQX4_filtered.json b/annotations_1/g1jO4_HQQX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..952fc6a3e384303fcfc8aa7cf9ccd8691b2a028f --- /dev/null +++ b/annotations_1/g1jO4_HQQX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.35], [9.0, 12.9], [21.0, 21.29], [25.0, 25.76], [28.0, 28.32], [39.0, 39.63], [41.0, 41.89], [42.0, 43.6], [45.0, 45.47], [46.0, 62.29], [67.0, 67.24], [74.0, 87.1], [88.0, 93.07]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [0.0, 31.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.48, 0.0, 29.71, 28.67], "audiomae_on_audioset": [null, [["hum", 31.29], ["speech", 11.97], ["music", 9.27]], null, null, null, null, null, null, null, [["music", 46.74], ["hum", 10.28], ["throbbing", 9.32]], null, [["hum", 30.43], ["mains hum", 15.89], ["speech", 12.65]], [["fly, housefly", 33.14], ["mosquito", 11.65], ["whack, thwack", 10.69]]], "duration": [0.35, 3.9, 0.29, 0.76, 0.32, 0.63, 0.89, 1.6, 0.47, 16.29, 0.24, 13.1, 5.07]} \ No newline at end of file diff --git a/annotations_1/g1lpI9wZtiI_filtered.json b/annotations_1/g1lpI9wZtiI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31a2e1d60acb30b2c088989b156325f0b3784cce --- /dev/null +++ b/annotations_1/g1lpI9wZtiI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.36], [20.0, 28.56], [31.0, 48.39], [52.0, 53.32], [58.0, 58.08], [72.0, 84.74], [86.0, 173.25]], "keep_status": [false, false, false, false, false, true, false], "silence_prob": [29.85, 31.44, 64.75, 0.0, 0.0, 35.16, 0.0], "audiomae_on_audioset": [[["music", 43.07], ["hum", 25.29], ["mains hum", 13.43]], [["hum", 40.97], ["mains hum", 20.74], ["music", 11.19]], null, null, null, [["music", 44.82], ["theremin", 19.12], ["didgeridoo", 2.72]], null], "duration": [9.36, 8.56, 17.39, 1.32, 0.08, 12.74, 87.25]} \ No newline at end of file diff --git a/annotations_1/g1r-B5ZGZWY_filtered.json b/annotations_1/g1r-B5ZGZWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17099f8c58832901c850c1ac20ff7a04d8c7695a --- /dev/null +++ b/annotations_1/g1r-B5ZGZWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 51.44], [52.0, 52.73], [54.0, 54.23], [55.0, 56.29], [57.0, 59.0], [60.0, 66.29], [68.0, 89.51], [91.0, 119.03], [120.0, 138.47], [139.0, 140.8], [143.0, 143.02], [144.0, 145.1], [148.0, 148.53], [154.0, 154.5], [157.0, 164.22], [175.0, 188.94], [190.0, 196.55], [197.0, 198.36], [201.0, 201.75]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 87.74, 32.56, 32.42, 32.89, 80.11, 0.0, 0.0, 0.0, 0.0, 0.0, 38.98, 35.96, 93.13, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 25.45], ["music", 18.08], ["throbbing", 17.42]], [["music", 33.56], ["speech", 25.97], ["buzz", 4.36]], [["music", 31.59], ["throbbing", 30.15], ["hum", 17.59]], null, null, null, null, null, null, [["music", 57.22], ["speech", 9.47], ["frog", 2.85]], [["music", 64.38], ["speech", 12.64], ["bleat", 2.03]], null, null, null], "duration": [0.44, 0.73, 0.23, 1.29, 2.0, 6.29, 21.51, 28.03, 18.47, 1.8, 0.02, 1.1, 0.53, 0.5, 7.22, 13.94, 6.55, 1.36, 0.75]} \ No newline at end of file diff --git a/annotations_1/g2tNQ_6-kpg_filtered.json b/annotations_1/g2tNQ_6-kpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b0018c51301ba55612032f5ac37fb6e43a11421 --- /dev/null +++ b/annotations_1/g2tNQ_6-kpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.22], [7.0, 8.13], [10.0, 11.3], [13.0, 14.25], [15.0, 15.75], [17.0, 25.17], [26.0, 29.74], [30.0, 33.71], [36.0, 40.58], [42.0, 43.75], [44.0, 46.38], [47.0, 49.72], [51.0, 51.85], [55.0, 57.15], [59.0, 60.76], [62.0, 62.5], [63.0, 63.76], [65.0, 65.42], [67.0, 72.66], [75.0, 85.16], [86.0, 91.52], [92.0, 91.57], [92.0, 96.47], [98.0, 100.35], [101.0, 104.48], [107.0, 107.74], [109.0, 110.76], [113.0, 112.94], [114.0, 115.5], [117.0, 123.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [72.9, 0.0, 0.0, 0.0, 0.0, 65.67, 66.15, 59.15, 78.38, 0.0, 65.55, 53.65, 0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 55.18, 53.1, 61.67, 0.0, 44.84, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 41.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 21.25], ["noise", 12.27], ["hum", 11.54]], null, null, null, null, null, null, [["noise", 35.53], ["speech", 11.33], ["music", 7.73]]], "duration": [2.22, 1.13, 1.3, 1.25, 0.75, 8.17, 3.74, 3.71, 4.58, 1.75, 2.38, 2.72, 0.85, 2.15, 1.76, 0.5, 0.76, 0.42, 5.66, 10.16, 5.52, -0.43, 4.47, 2.35, 3.48, 0.74, 1.76, -0.06, 1.5, 6.69]} \ No newline at end of file diff --git a/annotations_1/g3D2eGiLoeI_filtered.json b/annotations_1/g3D2eGiLoeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e287aec50b6f774cc84b05f8606e5caf459d777 --- /dev/null +++ b/annotations_1/g3D2eGiLoeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 36.73], [39.0, 53.43], [55.0, 55.16], [56.0, 63.29], [67.0, 68.57], [76.0, 77.08], [78.0, 78.92], [85.0, 86.48], [88.0, 88.94], [90.0, 92.11], [93.0, 95.54], [98.0, 98.76], [99.0, 100.77], [101.0, 102.74], [104.0, 106.19]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [75.55, 33.94, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 99.99, 0.0, 0.0, 0.0, 66.15], "audiomae_on_audioset": [null, [["speech", 51.88], ["fart", 5.09], ["aircraft", 3.92]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [25.73, 14.43, 0.16, 7.29, 1.57, 1.08, 0.92, 1.48, 0.94, 2.11, 2.54, 0.76, 1.77, 1.74, 2.19]} \ No newline at end of file diff --git a/annotations_1/g3FFfmWvyAk_filtered.json b/annotations_1/g3FFfmWvyAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd5564e4ba36e03e2b4082da5e40325057dcd75a --- /dev/null +++ b/annotations_1/g3FFfmWvyAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.48], [9.0, 10.45], [11.0, 11.99], [18.0, 19.45], [22.0, 24.16], [27.0, 27.18], [28.0, 30.7], [38.0, 39.5], [43.0, 50.48], [51.0, 53.27], [54.0, 61.7], [63.0, 63.41], [64.0, 64.49], [71.0, 71.64], [72.0, 74.31], [98.0, 99.47], [111.0, 111.05], [114.0, 114.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 65.2, 0.0, 68.15, 99.94, 80.29, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 1.45, 0.99, 1.45, 2.16, 0.18, 2.7, 1.5, 7.48, 2.27, 7.7, 0.41, 0.49, 0.64, 2.31, 1.47, 0.05, 0.64]} \ No newline at end of file diff --git a/annotations_1/g3WSsm57iVM_filtered.json b/annotations_1/g3WSsm57iVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06546f538eb4feb7aacb53807b6952da5ba52096 --- /dev/null +++ b/annotations_1/g3WSsm57iVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 13.56], [16.0, 21.1], [22.0, 23.46], [26.0, 27.6], [29.0, 34.37], [35.0, 39.04], [41.0, 40.85], [44.0, 44.56], [46.0, 48.02], [49.0, 51.33], [52.0, 65.3], [66.0, 70.12], [72.0, 72.35], [73.0, 79.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.95, 100.0, 0.0, 0.0, 94.07, 90.08, 0.0, 0.0, 99.94, 99.97, 99.96, 98.51, 0.0, 91.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.56, 5.1, 1.46, 1.6, 5.37, 4.04, -0.15, 0.56, 2.02, 2.33, 13.3, 4.12, 0.35, 6.49]} \ No newline at end of file diff --git a/annotations_1/g3kYdbqIwBE_filtered.json b/annotations_1/g3kYdbqIwBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0d0fd94c14d15f02076da9481dd9372e9500123 --- /dev/null +++ b/annotations_1/g3kYdbqIwBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.33], [17.0, 18.25], [21.0, 25.22], [35.0, 36.39], [49.0, 51.8], [55.0, 55.51], [64.0, 64.35], [68.0, 68.45], [88.0, 88.89], [90.0, 90.93]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.5, 0.0, 33.62, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["mosquito", 23.43], ["fly, housefly", 17.39], ["insect", 12.71]], null, [["boing", 73.83], ["speech", 8.73], ["cattle, bovinae", 2.73]], null, null, null, null, null], "duration": [0.33, 1.25, 4.22, 1.39, 2.8, 0.51, 0.35, 0.45, 0.89, 0.93]} \ No newline at end of file diff --git a/annotations_1/g425SDBoDBI_filtered.json b/annotations_1/g425SDBoDBI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c28410c3efc7e15a20cea07cd77dbf69a8a9ee75 --- /dev/null +++ b/annotations_1/g425SDBoDBI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.57], [9.0, 9.48], [15.0, 15.58], [18.0, 20.6], [24.0, 25.19], [29.0, 29.22], [31.0, 31.68], [32.0, 32.88], [40.0, 42.28], [44.0, 45.5], [58.0, 58.35], [60.0, 60.0], [61.0, 61.53], [62.0, 63.26], [64.0, 64.52], [65.0, 65.5], [66.0, 67.34], [68.0, 69.55], [73.0, 76.06], [80.0, 80.32], [82.0, 86.95], [92.0, 92.58], [97.0, 96.77], [104.0, 104.45], [105.0, 105.88], [107.0, 201.11], [203.0, 205.34], [207.0, 208.26], [208.0, 211.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [59.59, 0.0, 0.0, 63.64, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.07, 0.0, 40.62, 0.0, 0.0, 0.0, 0.0, 0.0, 39.63, 0.0, 31.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.9], ["throbbing", 13.75], ["hum", 9.29]], null, null, null, null, null, [["music", 43.05], ["ambient music", 12.78], ["hum", 9.34]], null, [["music", 40.59], ["ambient music", 14.58], ["gong", 7.39]]], "duration": [2.57, 0.48, 0.58, 2.6, 1.19, 0.22, 0.68, 0.88, 2.28, 1.5, 0.35, 0.0, 0.53, 1.26, 0.52, 0.5, 1.34, 1.55, 3.06, 0.32, 4.95, 0.58, -0.23, 0.45, 0.88, 94.11, 2.34, 1.26, 3.67]} \ No newline at end of file diff --git a/annotations_1/g4FOpeshqA8_filtered.json b/annotations_1/g4FOpeshqA8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30c00d7e8698efbe8b1346813cccb70d4bd5b4d0 --- /dev/null +++ b/annotations_1/g4FOpeshqA8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.7], [6.0, 8.95], [11.0, 12.65], [15.0, 17.98], [19.0, 20.34], [22.0, 22.82], [36.0, 36.29], [49.0, 49.37], [51.0, 51.33], [56.0, 56.98], [58.0, 60.39], [65.0, 66.19], [72.0, 73.01], [82.0, 85.16], [89.0, 90.86], [94.0, 95.2], [97.0, 98.27], [104.0, 105.02], [111.0, 112.83], [116.0, 117.91], [120.0, 122.25], [124.0, 126.94], [129.0, 131.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 91.13, 0.0, 68.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.42, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.17, 52.22, 50.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 73.36], ["synthesizer", 5.3], ["electronic music", 3.06]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.7, 2.95, 1.65, 2.98, 1.34, 0.82, 0.29, 0.37, 0.33, 0.98, 2.39, 1.19, 1.01, 3.16, 1.86, 1.2, 1.27, 1.02, 1.83, 1.91, 2.25, 2.94, 2.04]} \ No newline at end of file diff --git a/annotations_1/g5-KsABvVzU_filtered.json b/annotations_1/g5-KsABvVzU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8e2501e85c33a48197d6c613abc72904b985320 --- /dev/null +++ b/annotations_1/g5-KsABvVzU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [4.0, 6.25], [7.0, 9.27], [9.0, 11.16], [13.0, 13.88], [15.0, 16.44], [18.0, 18.45], [20.0, 24.46], [26.0, 26.86], [28.0, 39.53], [40.0, 47.95], [51.0, 55.93], [58.0, 61.91], [67.0, 68.28], [70.0, 70.65], [79.0, 98.44], [100.0, 104.55], [106.0, 121.96], [123.0, 125.44], [128.0, 132.98], [134.0, 135.46], [139.0, 141.08], [146.0, 147.61], [151.0, 150.94], [152.0, 169.35], [171.0, 171.26], [171.0, 174.51]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 89.01, 98.51, 0.0, 0.0, 0.0, 45.72, 0.0, 50.31, 75.88, 96.42, 82.43, 0.0, 0.0, 53.34, 100.0, 62.07, 75.72, 67.51, 0.0, 50.41, 0.0, 0.0, 41.16, 0.0, 35.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["stomach rumble", 50.44], ["whale vocalization", 7.97], ["burping, eructation", 5.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.8], ["throbbing", 12.29], ["hum", 5.3]], null, [["speech", 54.32], ["whale vocalization", 13.08], ["music", 6.62]]], "duration": [1.38, 2.25, 2.27, 2.16, 0.88, 1.44, 0.45, 4.46, 0.86, 11.53, 7.95, 4.93, 3.91, 1.28, 0.65, 19.44, 4.55, 15.96, 2.44, 4.98, 1.46, 2.08, 1.61, -0.06, 17.35, 0.26, 3.51]} \ No newline at end of file diff --git a/annotations_1/g511NYTRiOE_filtered.json b/annotations_1/g511NYTRiOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61e13f1de9afbf806e0d2115222bb2e2d5f87e8b --- /dev/null +++ b/annotations_1/g511NYTRiOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.97], [6.0, 7.52], [8.0, 12.38], [13.0, 14.07], [15.0, 16.6], [17.0, 17.2], [17.0, 29.94], [32.0, 35.94], [37.0, 39.7], [40.0, 42.65], [45.0, 46.77], [50.0, 54.08], [59.0, 60.59], [61.0, 63.81], [65.0, 67.78], [68.0, 69.89], [83.0, 85.46], [90.0, 93.39], [95.0, 95.61], [98.0, 98.14], [99.0, 99.42], [101.0, 101.65], [104.0, 105.09], [114.0, 113.9], [122.0, 127.3], [128.0, 131.63], [132.0, 134.22], [135.0, 136.0], [138.0, 140.29], [146.0, 147.28], [151.0, 151.75], [154.0, 154.08], [169.0, 168.59], [169.0, 169.87], [190.0, 189.94], [192.0, 191.91], [196.0, 196.57], [198.0, 198.68], [201.0, 201.99], [203.0, 203.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [68.67, 0.0, 62.78, 0.0, 0.0, 0.0, 55.89, 97.92, 96.54, 59.07, 0.0, 98.8, 0.0, 98.66, 47.5, 0.0, 96.04, 74.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 97.22, 39.54, 0.0, 35.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 53.62], ["speech", 19.83], ["sine wave", 5.3]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.49], ["hum", 11.99], ["throbbing", 5.89]], null, [["music", 28.54], ["musical instrument", 21.74], ["drum", 10.62]], null, null, null, null, null, null, null, null, null, null, null], "duration": [4.97, 1.52, 4.38, 1.07, 1.6, 0.2, 12.94, 3.94, 2.7, 2.65, 1.77, 4.08, 1.59, 2.81, 2.78, 1.89, 2.46, 3.39, 0.61, 0.14, 0.42, 0.65, 1.09, -0.1, 5.3, 3.63, 2.22, 1.0, 2.29, 1.28, 0.75, 0.08, -0.41, 0.87, -0.06, -0.09, 0.57, 0.68, 0.99, 0.23]} \ No newline at end of file diff --git a/annotations_1/g6DnsZvudTI_filtered.json b/annotations_1/g6DnsZvudTI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63002ff5e4247fb49c980b55888c5f7481299124 --- /dev/null +++ b/annotations_1/g6DnsZvudTI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.76], [17.0, 21.95], [25.0, 28.0], [29.0, 50.06], [53.0, 54.23], [58.0, 61.25]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 79.94, 33.06, 69.47, 0.0, 72.75], "audiomae_on_audioset": [null, null, [["thunk", 53.01], ["speech", 28.62], ["telephone", 2.35]], null, null, null], "duration": [0.76, 4.95, 3.0, 21.06, 1.23, 3.25]} \ No newline at end of file diff --git a/annotations_1/g7bQ7ynurn8_filtered.json b/annotations_1/g7bQ7ynurn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8623a008a7afdd3a293c9a7ede0f138820626dc --- /dev/null +++ b/annotations_1/g7bQ7ynurn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.83], [16.0, 18.52], [19.0, 22.17], [27.0, 27.75], [32.0, 33.57], [42.0, 44.96], [50.0, 51.44], [54.0, 54.4], [58.0, 57.97], [60.0, 62.43], [64.0, 64.67]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 59.86, 33.65, 0.0, 0.0, 29.74, 0.0, 0.0, 0.0, 31.11, 0.0], "audiomae_on_audioset": [null, null, [["music", 59.93], ["guitar", 6.3], ["musical instrument", 6.21]], null, null, [["music", 88.43], ["rock music", 1.15], ["musical instrument", 0.85]], null, null, null, [["music", 34.36], ["didgeridoo", 20.89], ["synthesizer", 7.97]], null], "duration": [0.83, 2.52, 3.17, 0.75, 1.57, 2.96, 1.44, 0.4, -0.03, 2.43, 0.67]} \ No newline at end of file diff --git a/annotations_1/g8hPeRFRiHY_filtered.json b/annotations_1/g8hPeRFRiHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ccc394846fe809222cf5ac47d7c45ec8582dd17 --- /dev/null +++ b/annotations_1/g8hPeRFRiHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.8], [6.0, 7.25], [8.0, 8.61], [11.0, 12.6], [16.0, 17.46], [23.0, 24.06], [26.0, 25.74], [28.0, 28.26], [31.0, 31.77], [33.0, 34.08], [35.0, 35.55], [37.0, 38.48], [41.0, 42.47], [46.0, 46.65], [48.0, 65.64], [66.0, 72.91], [74.0, 74.68], [77.0, 78.65], [79.0, 92.67], [96.0, 98.39], [99.0, 101.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [39.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.71, 33.49, 0.0, 0.0, 46.02, 69.34, 40.48], "audiomae_on_audioset": [[["moo", 37.02], ["cattle, bovinae", 35.33], ["livestock, farm animals, working animals", 20.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.74], ["cattle, bovinae", 4.51], ["moo", 3.62]], null, null, [["music", 56.46], ["theremin", 11.32], ["bleat", 9.11]], null, [["didgeridoo", 19.03], ["music", 13.75], ["throbbing", 7.44]]], "duration": [2.8, 1.25, 0.61, 1.6, 1.46, 1.06, -0.26, 0.26, 0.77, 1.08, 0.55, 1.48, 1.47, 0.65, 17.64, 6.91, 0.68, 1.65, 13.67, 2.39, 2.92]} \ No newline at end of file diff --git a/annotations_1/g8pt9OoaPlY_filtered.json b/annotations_1/g8pt9OoaPlY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5d8c25ccf9af345223455f1db38faba1b734b5b --- /dev/null +++ b/annotations_1/g8pt9OoaPlY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [4.0, 6.08], [8.0, 10.88], [16.0, 26.06], [33.0, 33.54], [35.0, 35.18], [40.0, 45.52], [48.0, 50.35], [56.0, 72.6], [74.0, 74.33], [75.0, 75.47], [76.0, 76.87], [78.0, 80.72], [84.0, 101.12], [102.0, 103.72], [107.0, 115.06]], "keep_status": [false, true, true, true, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 46.12, 28.83, 28.72, 0.0, 0.0, 28.97, 28.87, 29.49, 0.0, 0.0, 0.0, 31.0, 29.73, 0.0, 29.37], "audiomae_on_audioset": [null, [["speech", 34.59], ["music", 18.02], ["sidetone", 14.17]], [["music", 39.76], ["burst, pop", 7.14], ["whack, thwack", 5.48]], [["music", 20.02], ["whip", 15.59], ["speech", 12.58]], null, null, [["music", 42.08], ["speech", 35.95], ["sidetone", 5.74]], [["music", 46.48], ["speech", 24.86], ["sound effect", 2.21]], [["sonar", 28.78], ["music", 21.29], ["gong", 10.37]], null, null, null, [["foghorn", 44.64], ["music", 28.15], ["speech", 13.91]], [["speech", 53.34], ["whack, thwack", 10.04], ["groan", 4.98]], null, [["music", 59.76], ["breaking", 9.06], ["speech", 4.58]]], "duration": [0.5, 2.08, 2.88, 10.06, 0.54, 0.18, 5.52, 2.35, 16.6, 0.33, 0.47, 0.87, 2.72, 17.12, 1.72, 8.06]} \ No newline at end of file diff --git a/annotations_1/g9S5GndUhko_filtered.json b/annotations_1/g9S5GndUhko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa13fb79062e7e2937c3624a1634c0b907cd385a --- /dev/null +++ b/annotations_1/g9S5GndUhko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[158.0, 157.94], [158.0, 170.31]], "keep_status": [false, true], "silence_prob": [0.0, 28.15], "audiomae_on_audioset": [null, [["music", 52.27], ["drum and bass", 10.79], ["electronic music", 5.9]]], "duration": [-0.06, 12.31]} \ No newline at end of file diff --git a/annotations_1/g9d1TR6Lb9g_filtered.json b/annotations_1/g9d1TR6Lb9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4087d6ef78fd6cfcf435cd22e2117e130574f210 --- /dev/null +++ b/annotations_1/g9d1TR6Lb9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 49.89], [52.0, 51.95], [52.0, 55.36], [59.0, 73.13], [74.0, 73.94], [74.0, 84.94], [85.0, 172.29]], "keep_status": [false, false, true, true, false, true, false], "silence_prob": [31.37, 0.0, 29.96, 31.36, 0.0, 30.89, 0.0], "audiomae_on_audioset": [[["music", 65.38], ["speech", 8.9], ["breaking", 3.23]], null, [["music", 21.57], ["cacophony", 19.1], ["noise", 13.15]], [["music", 25.53], ["speech", 25.02], ["hum", 13.49]], null, [["music", 25.77], ["hum", 25.3], ["mains hum", 16.29]], null], "duration": [15.89, -0.05, 3.36, 14.13, -0.06, 10.94, 87.29]} \ No newline at end of file diff --git a/annotations_1/g9hEJv2uZLM_filtered.json b/annotations_1/g9hEJv2uZLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1fa0267ed529846b6b8d926eea30e4d8d23cf564 --- /dev/null +++ b/annotations_1/g9hEJv2uZLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 32.66], [38.0, 40.32], [41.0, 46.65], [47.0, 48.98], [50.0, 50.97], [51.0, 52.93], [57.0, 87.1], [89.0, 89.19], [96.0, 101.95], [102.0, 102.54]], "keep_status": [false, false, true, false, false, false, false, false, true, false], "silence_prob": [30.85, 30.31, 30.38, 0.0, 0.0, 0.0, 0.0, 0.0, 33.8, 0.0], "audiomae_on_audioset": [[["music", 55.67], ["didgeridoo", 19.12], ["speech", 10.12]], [["didgeridoo", 43.87], ["music", 23.97], ["cattle, bovinae", 2.32]], [["music", 47.81], ["animal", 4.94], ["speech", 3.3]], null, null, null, null, null, [["breaking", 44.97], ["glass", 18.74], ["livestock, farm animals, working animals", 5.02]], null], "duration": [6.66, 2.32, 5.65, 1.98, 0.97, 1.93, 30.1, 0.19, 5.95, 0.54]} \ No newline at end of file diff --git a/annotations_1/gA-VU0mczSI_filtered.json b/annotations_1/gA-VU0mczSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e05c546cb74cfae35d4600a9c83536c1c6af2c73 --- /dev/null +++ b/annotations_1/gA-VU0mczSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.82], [18.0, 20.46], [21.0, 22.49], [23.0, 57.16], [57.0, 57.94], [59.0, 68.67], [69.0, 70.92], [73.0, 73.82], [79.0, 80.91], [89.0, 92.1], [92.0, 92.82], [93.0, 92.94], [93.0, 96.52], [97.0, 108.9], [111.0, 114.54], [117.0, 122.77]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [42.69, 60.6, 0.0, 0.0, 0.0, 33.04, 0.0, 0.0, 0.0, 29.88, 0.0, 0.0, 31.07, 48.06, 53.34, 49.27], "audiomae_on_audioset": [[["civil defense siren", 53.47], ["music", 11.42], ["siren", 8.35]], null, null, null, null, [["music", 35.47], ["theremin", 11.86], ["speech", 10.85]], null, null, null, [["cattle, bovinae", 50.46], ["moo", 18.74], ["livestock, farm animals, working animals", 12.01]], null, null, [["speech", 46.46], ["music", 7.22], ["hum", 5.99]], [["music", 59.89], ["frog", 11.18], ["croak", 8.37]], null, [["music", 44.51], ["theremin", 7.58], ["musical instrument", 4.67]]], "duration": [9.82, 2.46, 1.49, 34.16, 0.94, 9.67, 1.92, 0.82, 1.91, 3.1, 0.82, -0.06, 3.52, 11.9, 3.54, 5.77]} \ No newline at end of file diff --git a/annotations_1/gA0u3Iir0CU_filtered.json b/annotations_1/gA0u3Iir0CU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1915720bfaf3ca5f5dcfb48cb6b23840a43d31ff --- /dev/null +++ b/annotations_1/gA0u3Iir0CU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.71], [21.0, 23.11], [28.0, 69.97], [70.0, 70.24], [70.0, 70.38], [70.0, 95.35], [96.0, 97.46], [98.0, 111.64], [112.0, 138.79], [139.0, 167.16]], "keep_status": [true, true, false, false, false, false, false, false, true, false], "silence_prob": [32.0, 31.07, 0.0, 0.0, 0.0, 44.46, 0.0, 48.82, 36.9, 74.6], "audiomae_on_audioset": [[["throbbing", 28.97], ["hum", 17.53], ["speech", 14.49]], [["music", 24.53], ["hum", 20.1], ["throbbing", 14.74]], null, null, null, [["throbbing", 39.18], ["hum", 37.5], ["music", 10.05]], null, [["hum", 45.3], ["throbbing", 44.8], ["heart sounds, heartbeat", 3.47]], [["speech", 37.2], ["hum", 10.61], ["throbbing", 4.92]], null], "duration": [3.71, 2.11, 41.97, 0.24, 0.38, 25.35, 1.46, 13.64, 26.79, 28.16]} \ No newline at end of file diff --git a/annotations_1/gA3wJRuClks_filtered.json b/annotations_1/gA3wJRuClks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1616f23a9787ea6296cc2e9813112973b3454a5 --- /dev/null +++ b/annotations_1/gA3wJRuClks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.71], [11.0, 11.5], [13.0, 13.09], [14.0, 14.74], [19.0, 19.57], [21.0, 26.84], [27.0, 27.77], [28.0, 28.95], [30.0, 30.28], [32.0, 31.8], [34.0, 34.57], [35.0, 39.61], [43.0, 43.48], [48.0, 48.1], [49.0, 49.81], [51.0, 50.99], [51.0, 51.6], [53.0, 54.8], [57.0, 57.77], [58.0, 58.45], [60.0, 60.13], [61.0, 61.3], [63.0, 63.14], [67.0, 67.42], [69.0, 69.18], [71.0, 70.71], [72.0, 72.22], [74.0, 74.93], [75.0, 75.64], [79.0, 79.41], [87.0, 88.08], [92.0, 92.82], [94.0, 94.2], [96.0, 97.23], [101.0, 101.93], [114.0, 114.78], [117.0, 117.42], [119.0, 119.2], [121.0, 121.53], [123.0, 124.04], [126.0, 126.32], [127.0, 130.49], [132.0, 133.07], [135.0, 135.57], [139.0, 139.23], [140.0, 141.07], [142.0, 142.3], [144.0, 144.19], [145.0, 144.96], [148.0, 150.18], [151.0, 151.04], [152.0, 152.88], [154.0, 155.71], [156.0, 157.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.71, 0.5, 0.09, 0.74, 0.57, 5.84, 0.77, 0.95, 0.28, -0.2, 0.57, 4.61, 0.48, 0.1, 0.81, -0.01, 0.6, 1.8, 0.77, 0.45, 0.13, 0.3, 0.14, 0.42, 0.18, -0.29, 0.22, 0.93, 0.64, 0.41, 1.08, 0.82, 0.2, 1.23, 0.93, 0.78, 0.42, 0.2, 0.53, 1.04, 0.32, 3.49, 1.07, 0.57, 0.23, 1.07, 0.3, 0.19, -0.04, 2.18, 0.04, 0.88, 1.71, 1.77]} \ No newline at end of file diff --git a/annotations_1/gBdbUMTXKIA_filtered.json b/annotations_1/gBdbUMTXKIA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..838f37130402f6ec0fce12cccbc9bed52831e643 --- /dev/null +++ b/annotations_1/gBdbUMTXKIA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[88.0, 88.5], [90.0, 114.84], [117.0, 126.0], [126.0, 126.23], [126.0, 126.72], [127.0, 127.68], [130.0, 130.06]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [0.0, 33.93, 38.62, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["cattle, bovinae", 20.39], ["moo", 20.21], ["whale vocalization", 17.59]], [["speech", 64.96], ["whale vocalization", 16.27], ["noise", 4.38]], null, null, null, null], "duration": [0.5, 24.84, 9.0, 0.23, 0.72, 0.68, 0.06]} \ No newline at end of file diff --git a/annotations_1/gC672314kEU_filtered.json b/annotations_1/gC672314kEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2aaced5c502d1ac40c0bc7f0c4f88cfdfa5da6a3 --- /dev/null +++ b/annotations_1/gC672314kEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.65], [17.0, 17.68], [23.0, 23.09], [29.0, 29.22], [32.0, 32.59], [36.0, 40.0], [47.0, 47.87], [49.0, 63.39], [65.0, 65.26], [67.0, 66.78], [69.0, 70.78], [74.0, 73.99], [75.0, 84.72], [88.0, 87.94], [91.0, 90.8], [92.0, 92.38], [96.0, 97.8], [102.0, 102.66], [103.0, 103.37], [106.0, 105.85], [108.0, 116.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0, 44.93, 0.0, 0.0, 0.0, 0.0, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 44.21], ["music", 28.04], ["hum", 4.4]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.05], ["throbbing", 7.48], ["hum", 5.86]]], "duration": [0.65, 0.68, 0.09, 0.22, 0.59, 4.0, 0.87, 14.39, 0.26, -0.22, 1.78, -0.01, 9.72, -0.06, -0.2, 0.38, 1.8, 0.66, 0.37, -0.15, 8.26]} \ No newline at end of file diff --git a/annotations_1/gC6gD7Qzry8_filtered.json b/annotations_1/gC6gD7Qzry8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4aca73613a494db29d430c00a73f0ff912b189b --- /dev/null +++ b/annotations_1/gC6gD7Qzry8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 55.71], [58.0, 60.0], [60.0, 61.13], [70.0, 70.56], [79.0, 79.1], [86.0, 87.44], [104.0, 103.77], [111.0, 114.89], [117.0, 128.51], [131.0, 131.94], [134.0, 135.11], [140.0, 145.2], [146.0, 148.76], [151.0, 151.01], [152.0, 155.01], [159.0, 159.29], [161.0, 161.38], [162.0, 196.3]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 0.0, 40.16, 57.81, 0.0, 0.0, 99.95, 92.15, 0.0, 68.28, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 30.63], ["sidetone", 14.02], ["hum", 11.68]], null, null, null, null, null, null, null, null, null, null], "duration": [41.71, 2.0, 1.13, 0.56, 0.1, 1.44, -0.23, 3.89, 11.51, 0.94, 1.11, 5.2, 2.76, 0.01, 3.01, 0.29, 0.38, 34.3]} \ No newline at end of file diff --git a/annotations_1/gCE5175IkoY_filtered.json b/annotations_1/gCE5175IkoY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d5a05026df8684a7cdcd41d48779b6829a691b67 --- /dev/null +++ b/annotations_1/gCE5175IkoY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 22.35], [29.0, 32.16], [42.0, 42.85], [45.0, 121.56], [123.0, 130.11], [133.0, 133.73], [149.0, 152.25], [158.0, 158.94], [178.0, 179.9]], "keep_status": [false, true, false, false, false, false, false, false, false], "silence_prob": [54.3, 43.74, 0.0, 0.0, 32.28, 0.0, 61.47, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 39.2], ["speech", 17.17], ["musical instrument", 5.29]], null, null, [["music", 84.72], ["musical instrument", 3.11], ["synthesizer", 2.07]], null, null, null, null], "duration": [10.35, 3.16, 0.85, 76.56, 7.11, 0.73, 3.25, 0.94, 1.9]} \ No newline at end of file diff --git a/annotations_1/gCHCR0wZclg_filtered.json b/annotations_1/gCHCR0wZclg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..376d2396f3b184a7a152d436574c7958d35fbbf8 --- /dev/null +++ b/annotations_1/gCHCR0wZclg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.5], [8.0, 9.46], [13.0, 17.59], [19.0, 21.57], [23.0, 25.95], [29.0, 30.32], [31.0, 32.76], [34.0, 35.73], [38.0, 38.77], [42.0, 42.72], [51.0, 52.24], [61.0, 61.33], [62.0, 62.72], [65.0, 66.21], [67.0, 67.78], [71.0, 71.39], [73.0, 73.01], [79.0, 78.76], [86.0, 86.48], [105.0, 106.69], [110.0, 116.04], [117.0, 118.07], [130.0, 130.54], [132.0, 132.73], [138.0, 139.65], [141.0, 142.57], [143.0, 144.31], [145.0, 146.5], [150.0, 151.66], [153.0, 152.91], [164.0, 172.94], [178.0, 178.46], [180.0, 182.63], [186.0, 187.51], [201.0, 204.94], [205.0, 205.44]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 97.33, 98.99, 41.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.09, 0.0, 99.8, 0.0, 29.33, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 49.49], ["hiccup", 5.92], ["chirp tone", 4.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 37.75], ["livestock, farm animals, working animals", 28.18], ["moo", 19.55]], null, null, null, [["speech", 66.86], ["crowd", 7.34], ["outside, urban or manmade", 2.94]], null], "duration": [0.5, 1.46, 4.59, 2.57, 2.95, 1.32, 1.76, 1.73, 0.77, 0.72, 1.24, 0.33, 0.72, 1.21, 0.78, 0.39, 0.01, -0.24, 0.48, 1.69, 6.04, 1.07, 0.54, 0.73, 1.65, 1.57, 1.31, 1.5, 1.66, -0.09, 8.94, 0.46, 2.63, 1.51, 3.94, 0.44]} \ No newline at end of file diff --git a/annotations_1/gDOSJkcKPbo_filtered.json b/annotations_1/gDOSJkcKPbo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a9c3c4306693699807d7bdc9e48f522e18b3145 --- /dev/null +++ b/annotations_1/gDOSJkcKPbo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [6.0, 5.9], [7.0, 8.11], [12.0, 12.23], [13.0, 13.24], [15.0, 15.67], [20.0, 20.41], [23.0, 23.6], [25.0, 25.42], [26.0, 26.25], [27.0, 27.65], [31.0, 30.91], [35.0, 35.46], [36.0, 36.26], [43.0, 43.34], [48.0, 48.09], [58.0, 58.72], [60.0, 60.3], [69.0, 69.8], [73.0, 73.45], [77.0, 82.26], [83.0, 85.4], [97.0, 101.41], [106.0, 106.14], [114.0, 114.94], [119.0, 119.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.09, 47.46, 71.87, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 22.68], ["speech", 10.79], ["frog", 9.21]], [["speech", 50.64], ["radio", 12.04], ["sidetone", 8.2]], null, null, null, null], "duration": [0.57, -0.1, 1.11, 0.23, 0.24, 0.67, 0.41, 0.6, 0.42, 0.25, 0.65, -0.09, 0.46, 0.26, 0.34, 0.09, 0.72, 0.3, 0.8, 0.45, 5.26, 2.4, 4.41, 0.14, 0.94, 0.42]} \ No newline at end of file diff --git a/annotations_1/gDPJG9FP3iM_filtered.json b/annotations_1/gDPJG9FP3iM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd82778675541676888aa779886d285ce1d88965 --- /dev/null +++ b/annotations_1/gDPJG9FP3iM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.13], [8.0, 9.42], [12.0, 14.88], [15.0, 20.76], [27.0, 37.37], [40.0, 57.37], [58.0, 59.05], [61.0, 61.64], [64.0, 65.5], [66.0, 69.92], [72.0, 71.85], [75.0, 77.6], [80.0, 82.48], [84.0, 88.5], [94.0, 94.39], [101.0, 105.73], [107.0, 109.14], [110.0, 112.18], [114.0, 119.25], [120.0, 120.9], [122.0, 125.22], [126.0, 128.09], [132.0, 138.67], [140.0, 140.75], [142.0, 146.47], [148.0, 148.14], [149.0, 158.52], [161.0, 164.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.51, 0.0, 52.8, 30.11, 30.83, 53.72, 0.0, 0.0, 0.0, 54.43, 0.0, 67.25, 60.6, 71.43, 0.0, 54.7, 75.07, 62.99, 73.67, 0.0, 75.88, 95.51, 60.23, 0.0, 73.21, 0.0, 50.56, 52.45], "audiomae_on_audioset": [null, null, null, [["speech", 62.5], ["music", 12.81], ["outside, rural or natural", 5.75]], [["hum", 39.85], ["mains hum", 26.83], ["music", 17.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.13, 1.42, 2.88, 5.76, 10.37, 17.37, 1.05, 0.64, 1.5, 3.92, -0.15, 2.6, 2.48, 4.5, 0.39, 4.73, 2.14, 2.18, 5.25, 0.9, 3.22, 2.09, 6.67, 0.75, 4.47, 0.14, 9.52, 3.44]} \ No newline at end of file diff --git a/annotations_1/gDSrAm2CKdU_filtered.json b/annotations_1/gDSrAm2CKdU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe43afa6b1f40b2b1f2c3bc6be9051123a375646 --- /dev/null +++ b/annotations_1/gDSrAm2CKdU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.73], [7.0, 7.4], [8.0, 9.05], [12.0, 12.04], [33.0, 34.08], [55.0, 56.73], [58.0, 58.29], [58.0, 58.99], [60.0, 60.96], [67.0, 67.02], [78.0, 79.14], [82.0, 82.97], [84.0, 84.35], [89.0, 91.37], [97.0, 97.63], [99.0, 100.06], [101.0, 101.28], [102.0, 101.92], [103.0, 104.53], [105.0, 105.85], [107.0, 108.45], [110.0, 111.15], [113.0, 114.0], [115.0, 115.89], [131.0, 131.13], [139.0, 138.99], [156.0, 157.22], [159.0, 159.44], [161.0, 162.67], [164.0, 164.83], [166.0, 165.92], [167.0, 167.71], [169.0, 169.64], [175.0, 175.02], [181.0, 182.44], [186.0, 185.92], [187.0, 189.92], [191.0, 192.42], [194.0, 195.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.4, 1.05, 0.04, 1.08, 1.73, 0.29, 0.99, 0.96, 0.02, 1.14, 0.97, 0.35, 2.37, 0.63, 1.06, 0.28, -0.08, 1.53, 0.85, 1.45, 1.15, 1.0, 0.89, 0.13, -0.01, 1.22, 0.44, 1.67, 0.83, -0.08, 0.71, 0.64, 0.02, 1.44, -0.08, 2.92, 1.42, 1.17]} \ No newline at end of file diff --git a/annotations_1/gDVyEzQNvhU_filtered.json b/annotations_1/gDVyEzQNvhU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1586c8b9225bec467d2482bfdea40075f8c8b0a5 --- /dev/null +++ b/annotations_1/gDVyEzQNvhU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [6.0, 7.42], [8.0, 8.28], [15.0, 17.02], [19.0, 19.18], [19.0, 52.84], [53.0, 55.93], [58.0, 65.7], [67.0, 73.68], [76.0, 82.07], [84.0, 89.04], [90.0, 111.1], [113.0, 113.09], [119.0, 129.47]], "keep_status": [false, false, false, true, false, false, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 48.35, 0.0, 0.0, 30.06, 30.18, 30.0, 30.15, 32.35, 31.08, 0.0, 31.09], "audiomae_on_audioset": [null, null, null, [["music", 24.76], ["didgeridoo", 6.88], ["effects unit", 5.61]], null, null, [["music", 60.87], ["speech", 11.26], ["dubstep", 4.76]], [["music", 44.38], ["whack, thwack", 16.92], ["whip", 6.39]], [["music", 42.54], ["livestock, farm animals, working animals", 15.27], ["cattle, bovinae", 9.04]], [["speech", 30.55], ["music", 18.75], ["whack, thwack", 8.15]], [["music", 69.83], ["throbbing", 5.83], ["electronic music", 2.33]], [["music", 46.33], ["throbbing", 31.78], ["hum", 7.38]], null, [["music", 46.49], ["carnatic music", 15.5], ["musical instrument", 9.85]]], "duration": [0.98, 1.42, 0.28, 2.02, 0.18, 33.84, 2.93, 7.7, 6.68, 6.07, 5.04, 21.1, 0.09, 10.47]} \ No newline at end of file diff --git a/annotations_1/gDtB0Sr8sbY_filtered.json b/annotations_1/gDtB0Sr8sbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b4b7027e30634d2ea558808f205c3037cfc6059 --- /dev/null +++ b/annotations_1/gDtB0Sr8sbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.53], [17.0, 18.22], [19.0, 20.07], [22.0, 25.25], [29.0, 30.47], [33.0, 43.48], [45.0, 127.31], [127.0, 127.45], [127.0, 127.58], [130.0, 142.69], [153.0, 154.52], [158.0, 161.08], [170.0, 172.37], [176.0, 176.42], [184.0, 186.0]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 38.03, 0.0, 37.05, 0.0, 0.0, 0.0, 45.62, 0.0, 37.58, 31.02, 0.0, 32.78], "audiomae_on_audioset": [null, null, null, [["speech", 57.7], ["radio", 16.75], ["sidetone", 5.67]], null, [["livestock, farm animals, working animals", 28.08], ["animal", 9.69], ["cattle, bovinae", 8.82]], null, null, null, [["music", 61.02], ["effects unit", 6.21], ["synthesizer", 5.21]], null, [["speech", 14.53], ["music", 14.53], ["inside, small room", 6.52]], [["frog", 25.32], ["whale vocalization", 18.57], ["speech", 17.06]], null, [["whale vocalization", 30.11], ["cattle, bovinae", 13.33], ["moo", 10.47]]], "duration": [0.53, 1.22, 1.07, 3.25, 1.47, 10.48, 82.31, 0.45, 0.58, 12.69, 1.52, 3.08, 2.37, 0.42, 2.0]} \ No newline at end of file diff --git a/annotations_1/gFJT9ziRAUI_filtered.json b/annotations_1/gFJT9ziRAUI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7d1804cb69dc634d1fe2b6389307e366c9140f6 --- /dev/null +++ b/annotations_1/gFJT9ziRAUI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.71], [16.0, 17.36], [19.0, 65.15], [68.0, 69.99], [72.0, 71.85], [74.0, 75.49], [78.0, 90.86], [95.0, 98.91], [99.0, 101.78], [104.0, 104.62], [106.0, 108.09], [115.0, 115.86], [119.0, 120.75], [121.0, 121.34], [125.0, 125.58], [130.0, 130.71], [131.0, 135.41], [139.0, 151.41], [157.0, 156.78], [158.0, 159.17], [160.0, 164.76], [167.0, 167.91], [170.0, 170.75]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true, true, false, false, true, false, false], "silence_prob": [35.41, 0.0, 0.0, 0.0, 0.0, 0.0, 30.82, 31.07, 34.18, 0.0, 48.48, 0.0, 0.0, 0.0, 0.0, 0.0, 31.16, 29.76, 0.0, 0.0, 29.38, 0.0, 0.0], "audiomae_on_audioset": [[["music", 39.89], ["throbbing", 14.45], ["speech", 12.78]], null, null, null, null, null, [["speech", 35.56], ["music", 21.52], ["whack, thwack", 10.17]], [["speech", 35.2], ["music", 31.93], ["throbbing", 7.35]], [["speech", 42.78], ["music", 16.19], ["aircraft", 5.77]], null, [["mains hum", 58.71], ["hum", 23.44], ["speech", 4.59]], null, null, null, null, null, [["music", 40.42], ["throbbing", 8.01], ["hum", 5.63]], [["music", 43.18], ["speech", 11.5], ["hum", 9.54]], null, null, [["music", 39.82], ["throbbing", 6.89], ["electronic music", 5.61]], null, null], "duration": [5.71, 1.36, 46.15, 1.99, -0.15, 1.49, 12.86, 3.91, 2.78, 0.62, 2.09, 0.86, 1.75, 0.34, 0.58, 0.71, 4.41, 12.41, -0.22, 1.17, 4.76, 0.91, 0.75]} \ No newline at end of file diff --git a/annotations_1/gFX14TEiBOw_filtered.json b/annotations_1/gFX14TEiBOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d5d14dd2a3d4d8f94aa464ba447a63a19f3f868 --- /dev/null +++ b/annotations_1/gFX14TEiBOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.01], [5.0, 5.24], [16.0, 16.58], [38.0, 38.52], [48.0, 49.06], [73.0, 74.33], [95.0, 97.6], [99.0, 101.58], [103.0, 103.18], [103.0, 103.42], [105.0, 104.9], [108.0, 108.55], [110.0, 110.46], [110.0, 110.54], [111.0, 156.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 0.24, 0.58, 0.52, 1.06, 1.33, 2.6, 2.58, 0.18, 0.42, -0.1, 0.55, 0.46, 0.54, 45.64]} \ No newline at end of file diff --git a/annotations_1/gFocZQa78ho_filtered.json b/annotations_1/gFocZQa78ho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8db7b574fbe70752524b6ae0c02cdd9e08d64c --- /dev/null +++ b/annotations_1/gFocZQa78ho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.2], [20.0, 22.89], [23.0, 25.15], [25.0, 40.98], [46.0, 47.9], [49.0, 51.85], [54.0, 54.9], [61.0, 64.98], [66.0, 66.21], [70.0, 86.8], [89.0, 90.19], [97.0, 98.64], [100.0, 99.87], [108.0, 112.11], [113.0, 113.91], [118.0, 118.93], [120.0, 126.96], [130.0, 134.74], [135.0, 136.66], [164.0, 165.45]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 28.79, 28.71, 30.13, 0.0, 31.54, 0.0, 32.43, 0.0, 32.08, 0.0, 0.0, 0.0, 39.05, 0.0, 0.0, 34.71, 35.95, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 65.81], ["electronic music", 6.21], ["whale vocalization", 4.26]], [["music", 78.31], ["musical instrument", 2.84], ["electronic music", 1.36]], [["music", 82.65], ["brass instrument", 4.17], ["musical instrument", 3.06]], null, [["music", 66.53], ["foghorn", 3.74], ["theremin", 3.21]], null, [["music", 31.12], ["cacophony", 5.86], ["fly, housefly", 5.51]], null, [["music", 59.66], ["speech", 6.72], ["crowd", 6.1]], null, null, null, [["music", 42.0], ["throbbing", 15.82], ["hum", 12.77]], null, null, [["music", 60.66], ["throbbing", 3.67], ["trombone", 3.37]], [["music", 64.54], ["foghorn", 10.45], ["throbbing", 3.03]], null, null], "duration": [1.2, 2.89, 2.15, 15.98, 1.9, 2.85, 0.9, 3.98, 0.21, 16.8, 1.19, 1.64, -0.13, 4.11, 0.91, 0.93, 6.96, 4.74, 1.66, 1.45]} \ No newline at end of file diff --git a/annotations_1/gH1kstAfb5g_filtered.json b/annotations_1/gH1kstAfb5g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31b56773e734e3ba0b67170235308e7d6b3b38b6 --- /dev/null +++ b/annotations_1/gH1kstAfb5g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.81], [17.0, 16.78], [19.0, 21.14], [21.0, 21.17], [22.0, 23.97], [35.0, 35.13], [36.0, 36.1], [37.0, 37.32], [44.0, 50.89], [52.0, 52.39], [56.0, 56.3], [63.0, 75.57], [83.0, 98.71], [100.0, 100.9], [101.0, 100.97], [101.0, 101.04], [101.0, 103.6], [104.0, 103.87], [104.0, 106.2], [108.0, 114.25], [115.0, 116.29]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 89.19, 0.0, 0.0, 0.0, 0.0, 0.0, 35.59, 0.0, 0.0, 29.84, 29.18, 0.0, 0.0, 0.0, 29.56, 0.0, 28.83, 38.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 44.97], ["fart", 11.01], ["fly, housefly", 9.93]], null, null, [["music", 62.63], ["speech", 10.72], ["boing", 9.12]], [["music", 70.02], ["speech", 9.71], ["cacophony", 2.37]], null, null, null, [["music", 89.59], ["boing", 0.6], ["funny music", 0.47]], null, [["music", 81.69], ["throbbing", 2.1], ["boing", 1.26]], [["music", 31.07], ["didgeridoo", 10.47], ["gong", 7.41]], null], "duration": [-0.19, -0.22, 2.14, 0.17, 1.97, 0.13, 0.1, 0.32, 6.89, 0.39, 0.3, 12.57, 15.71, 0.9, -0.03, 0.04, 2.6, -0.13, 2.2, 6.25, 1.29]} \ No newline at end of file diff --git a/annotations_1/gH4dw-S1esk_filtered.json b/annotations_1/gH4dw-S1esk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f8c54c652094f2e8ce88ce0f088e7d9faa9edff --- /dev/null +++ b/annotations_1/gH4dw-S1esk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 80.27], [81.0, 82.24], [87.0, 95.12], [97.0, 104.63], [106.0, 106.44], [106.0, 150.58], [153.0, 175.73]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 30.96, 29.0, 0.0, 0.0, 28.16], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 31.3], ["speech", 11.21], ["cattle, bovinae", 8.39]], [["music", 50.54], ["mains hum", 11.78], ["hum", 11.71]], null, null, [["music", 59.18], ["speech", 13.67], ["musical instrument", 2.75]]], "duration": [76.27, 1.24, 8.12, 7.63, 0.44, 44.58, 22.73]} \ No newline at end of file diff --git a/annotations_1/gHJwn_JEazA_filtered.json b/annotations_1/gHJwn_JEazA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eccfac2a197778a74d2f389e89344b7db25c15ac --- /dev/null +++ b/annotations_1/gHJwn_JEazA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.44], [8.0, 18.2], [19.0, 24.83], [25.0, 26.11], [27.0, 28.63], [31.0, 31.67], [34.0, 34.64], [37.0, 37.56], [38.0, 39.5], [41.0, 48.57], [49.0, 49.69], [50.0, 51.44], [52.0, 53.03], [53.0, 56.67], [58.0, 59.37], [60.0, 61.4], [63.0, 64.02], [65.0, 66.88], [70.0, 72.52], [73.0, 73.82], [75.0, 75.84], [76.0, 80.45], [81.0, 82.09], [83.0, 85.56], [87.0, 88.21], [91.0, 91.18], [92.0, 92.33], [94.0, 94.59], [96.0, 99.06], [100.0, 103.23], [103.0, 103.35], [103.0, 104.55], [105.0, 105.36], [106.0, 110.3], [117.0, 120.82], [122.0, 124.04], [126.0, 126.96], [128.0, 131.72]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [35.39, 38.46, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.1, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 0.0, 46.19, 0.0, 54.97, 0.0, 0.0, 0.0, 0.0, 89.36, 49.31, 0.0, 0.0, 0.0, 42.37, 57.81, 99.96, 0.0, 55.53], "audiomae_on_audioset": [[["speech", 35.73], ["music", 9.14], ["moo", 5.34]], [["speech", 12.83], ["hum", 11.09], ["music", 10.76]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 59.07], ["radio", 7.98], ["music", 4.93]], null, null, null, null, null, null, null, [["speech", 33.56], ["music", 27.15], ["hum", 4.26]], null, null, null, null, null, null, null, [["music", 43.25], ["hum", 6.24], ["throbbing", 4.96]], null, null, null, [["music", 39.2], ["speech", 21.78], ["synthesizer", 10.0]], null, null, null, null], "duration": [2.44, 10.2, 5.83, 1.11, 1.63, 0.67, 0.64, 0.56, 1.5, 7.57, 0.69, 1.44, 1.03, 3.67, 1.37, 1.4, 1.02, 1.88, 2.52, 0.82, 0.84, 4.45, 1.09, 2.56, 1.21, 0.18, 0.33, 0.59, 3.06, 3.23, 0.35, 1.55, 0.36, 4.3, 3.82, 2.04, 0.96, 3.72]} \ No newline at end of file diff --git a/annotations_1/gIZ64_sZbCY_filtered.json b/annotations_1/gIZ64_sZbCY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73d14f094cdb352f9a1274bb94caa2ad62699fda --- /dev/null +++ b/annotations_1/gIZ64_sZbCY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.43], [5.0, 5.02], [5.0, 9.71], [15.0, 27.51], [28.0, 36.22], [40.0, 43.93], [47.0, 47.6], [59.0, 60.52], [64.0, 64.72], [66.0, 67.73], [75.0, 76.01], [78.0, 79.78], [82.0, 97.44], [98.0, 102.63], [103.0, 104.55], [108.0, 126.64], [128.0, 130.91], [132.0, 133.54], [145.0, 145.84]], "keep_status": [false, false, true, true, true, true, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 35.01, 37.28, 36.42, 40.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7, 64.75, 0.0, 42.02, 34.2, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 33.93], ["fart", 12.09], ["cattle, bovinae", 6.92]], [["music", 56.16], ["speech", 8.23], ["smash, crash", 3.44]], [["speech", 44.28], ["crack", 7.61], ["music", 7.05]], [["speech", 19.11], ["fart", 13.33], ["thunk", 8.17]], null, null, null, null, null, null, null, null, null, [["music", 40.29], ["didgeridoo", 13.32], ["theremin", 5.65]], [["music", 25.39], ["speech", 15.36], ["sheep", 3.04]], null, null], "duration": [0.43, 0.02, 4.71, 12.51, 8.22, 3.93, 0.6, 1.52, 0.72, 1.73, 1.01, 1.78, 15.44, 4.63, 1.55, 18.64, 2.91, 1.54, 0.84]} \ No newline at end of file diff --git a/annotations_1/gIaqrkn0ymo_filtered.json b/annotations_1/gIaqrkn0ymo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..514e2057a476dfc66c3369ecb61165db33c8ce43 --- /dev/null +++ b/annotations_1/gIaqrkn0ymo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.96], [14.0, 14.45], [20.0, 20.28], [37.0, 38.53], [53.0, 53.25], [54.0, 53.74], [69.0, 69.21], [80.0, 83.91], [87.0, 88.21], [92.0, 92.13], [113.0, 114.71], [117.0, 120.29], [122.0, 123.69], [125.0, 125.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 0.0, 0.0, 0.0, 35.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.19], ["music", 24.58], ["sidetone", 2.46]], null, null], "duration": [-0.04, 0.45, 0.28, 1.53, 0.25, -0.26, 0.21, 3.91, 1.21, 0.13, 1.71, 3.29, 1.69, 0.51]} \ No newline at end of file diff --git a/annotations_1/gJDpyQ1Efto_filtered.json b/annotations_1/gJDpyQ1Efto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..654115c39eaddc40334354b13d938a4c82e4a992 --- /dev/null +++ b/annotations_1/gJDpyQ1Efto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.1], [17.0, 19.33], [24.0, 25.39], [30.0, 34.69], [35.0, 35.26], [36.0, 38.1], [47.0, 48.95], [56.0, 58.82], [70.0, 71.32], [72.0, 73.2], [80.0, 80.86], [95.0, 95.69], [96.0, 96.99], [98.0, 98.85], [104.0, 103.99], [105.0, 105.04], [105.0, 105.51], [111.0, 113.83], [115.0, 116.73], [121.0, 121.56], [122.0, 122.55]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [31.73, 32.85, 0.0, 38.52, 0.0, 33.57, 0.0, 30.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.18], ["speech", 20.0], ["boing", 8.21]], [["music", 31.74], ["didgeridoo", 14.1], ["clarinet", 11.03]], null, [["music", 49.03], ["brass instrument", 13.75], ["trombone", 9.8]], null, [["music", 45.79], ["speech", 12.34], ["saxophone", 7.61]], null, [["music", 40.2], ["speech", 35.05], ["musical instrument", 5.29]], null, null, null, null, null, null, null, null, null, [["echo", 14.78], ["wild animals", 9.78], ["speech", 7.63]], null, null, null], "duration": [4.1, 2.33, 1.39, 4.69, 0.26, 2.1, 1.95, 2.82, 1.32, 1.2, 0.86, 0.69, 0.99, 0.85, -0.01, 0.04, 0.51, 2.83, 1.73, 0.56, 0.55]} \ No newline at end of file diff --git a/annotations_1/gJvoeKHjuvE_filtered.json b/annotations_1/gJvoeKHjuvE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fb1624f0f66be872ffdc89b8303aaab0fdecdfc --- /dev/null +++ b/annotations_1/gJvoeKHjuvE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.94], [11.0, 13.0], [14.0, 17.14], [18.0, 18.87], [23.0, 26.4], [29.0, 30.08], [35.0, 35.67], [39.0, 39.58], [40.0, 41.42], [42.0, 46.6], [55.0, 56.89], [60.0, 61.69], [65.0, 72.3], [73.0, 73.89], [77.0, 77.19], [82.0, 81.92], [92.0, 97.63], [100.0, 103.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 50.36, 52.27, 0.0, 45.65, 0.0, 0.0, 0.0, 0.0, 33.32, 0.0, 0.0, 36.67, 0.0, 0.0, 0.0, 35.23, 36.65], "audiomae_on_audioset": [null, null, null, null, [["music", 80.37], ["bass guitar", 1.73], ["ding-dong", 1.09]], null, null, null, null, [["boing", 47.88], ["speech", 15.07], ["music", 14.97]], null, null, [["music", 24.75], ["effects unit", 7.19], ["boing", 6.64]], null, null, null, [["music", 35.72], ["speech", 31.98], ["boing", 4.45]], [["moo", 40.88], ["cattle, bovinae", 17.64], ["livestock, farm animals, working animals", 7.66]]], "duration": [1.94, 2.0, 3.14, 0.87, 3.4, 1.08, 0.67, 0.58, 1.42, 4.6, 1.89, 1.69, 7.3, 0.89, 0.19, -0.08, 5.63, 3.03]} \ No newline at end of file diff --git a/annotations_1/gK6JyAanVNE_filtered.json b/annotations_1/gK6JyAanVNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7af846a6fa957f36868cde733411e0cb51f5a45e --- /dev/null +++ b/annotations_1/gK6JyAanVNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.36], [13.0, 14.01], [14.0, 15.31], [20.0, 19.95], [20.0, 34.06], [47.0, 57.35], [58.0, 58.6], [62.0, 65.96], [66.0, 66.06], [66.0, 66.11], [66.0, 66.21], [66.0, 74.38], [79.0, 82.21], [86.0, 89.16], [95.0, 97.28], [105.0, 107.82], [109.0, 109.41], [111.0, 111.87], [115.0, 118.08], [122.0, 125.69], [127.0, 130.57], [133.0, 133.59]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, true, true, true, false], "silence_prob": [31.56, 0.0, 0.0, 0.0, 29.95, 30.54, 0.0, 29.7, 0.0, 0.0, 0.0, 29.89, 30.17, 30.58, 30.43, 30.41, 0.0, 0.0, 37.84, 35.24, 30.72, 0.0], "audiomae_on_audioset": [[["music", 24.94], ["throbbing", 13.85], ["electronic music", 9.61]], null, null, null, [["music", 79.95], ["electronic music", 3.69], ["shout", 1.49]], [["music", 72.25], ["speech", 10.91], ["didgeridoo", 2.62]], null, [["music", 41.6], ["boing", 10.59], ["cattle, bovinae", 6.36]], null, null, null, [["cattle, bovinae", 31.89], ["music", 26.67], ["moo", 19.86]], [["music", 56.31], ["sidetone", 8.8], ["speech", 6.77]], [["music", 44.7], ["fly, housefly", 15.48], ["mosquito", 10.31]], [["music", 51.64], ["speech", 18.37], ["musical instrument", 2.66]], [["music", 27.8], ["livestock, farm animals, working animals", 15.25], ["cattle, bovinae", 11.11]], null, null, [["music", 37.58], ["frog", 9.58], ["croak", 8.98]], [["music", 54.0], ["theremin", 6.31], ["musical instrument", 3.49]], [["music", 23.36], ["cattle, bovinae", 11.62], ["moo", 9.67]], null], "duration": [2.36, 1.01, 1.31, -0.05, 14.06, 10.35, 0.6, 3.96, 0.06, 0.11, 0.21, 8.38, 3.21, 3.16, 2.28, 2.82, 0.41, 0.87, 3.08, 3.69, 3.57, 0.59]} \ No newline at end of file diff --git a/annotations_1/gKJerAxfSzw_filtered.json b/annotations_1/gKJerAxfSzw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0e54e0e4b0289ca7f829ad53c6f3c72f4ee4673 --- /dev/null +++ b/annotations_1/gKJerAxfSzw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 52.27], [52.0, 53.08], [53.0, 54.6], [56.0, 56.57], [58.0, 58.08], [60.0, 65.8], [66.0, 67.26], [70.0, 73.4], [74.0, 74.55], [76.0, 78.51], [79.0, 83.57], [84.0, 85.82], [87.0, 87.42], [89.0, 89.01], [90.0, 90.85], [91.0, 93.39], [94.0, 95.35], [98.0, 98.88], [100.0, 102.25], [110.0, 110.37], [116.0, 117.12], [127.0, 127.97], [128.0, 128.07], [128.0, 134.1], [135.0, 136.95], [138.0, 140.44], [142.0, 143.26], [146.0, 154.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 60.14, 0.0, 56.25, 0.0, 51.99, 66.76, 0.0, 0.0, 0.0, 0.0, 32.21, 0.0, 0.0, 49.73, 0.0, 0.0, 0.0, 0.0, 33.66, 0.0, 32.48, 0.0, 37.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.35], ["music", 14.93], ["didgeridoo", 6.53]], null, null, [["hum", 33.3], ["throbbing", 29.4], ["music", 13.41]], null, null, null, null, [["hum", 29.67], ["throbbing", 20.32], ["music", 18.97]], null, [["music", 72.48], ["speech", 8.52], ["didgeridoo", 6.6]], null, [["music", 58.69], ["theremin", 6.04], ["musical instrument", 3.6]]], "duration": [36.27, 1.08, 1.6, 0.57, 0.08, 5.8, 1.26, 3.4, 0.55, 2.51, 4.57, 1.82, 0.42, 0.01, 0.85, 2.39, 1.35, 0.88, 2.25, 0.37, 1.12, 0.97, 0.07, 6.1, 1.95, 2.44, 1.26, 8.87]} \ No newline at end of file diff --git a/annotations_1/gM8trQSURdg_filtered.json b/annotations_1/gM8trQSURdg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb1b1d31dbc05b9597d8ff1bc5b4ee8a3baab584 --- /dev/null +++ b/annotations_1/gM8trQSURdg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.95], [6.0, 8.31], [10.0, 13.12], [14.0, 18.03], [19.0, 23.09], [25.0, 27.9], [32.0, 32.68], [34.0, 41.54], [42.0, 43.33], [48.0, 50.25], [52.0, 53.38], [55.0, 56.52], [62.0, 63.98], [67.0, 68.81], [71.0, 74.04], [77.0, 78.26], [80.0, 80.42], [81.0, 82.88], [91.0, 91.94], [93.0, 95.23], [97.0, 98.54], [100.0, 101.83], [107.0, 108.5], [113.0, 113.95], [115.0, 115.59], [131.0, 131.09], [139.0, 139.95], [144.0, 146.26], [148.0, 149.81], [153.0, 154.84], [162.0, 163.17], [166.0, 167.73], [168.0, 169.69], [171.0, 174.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 100.0, 100.0, 99.97, 99.99, 0.0, 99.21, 0.0, 86.45, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.95, 2.31, 3.12, 4.03, 4.09, 2.9, 0.68, 7.54, 1.33, 2.25, 1.38, 1.52, 1.98, 1.81, 3.04, 1.26, 0.42, 1.88, 0.94, 2.23, 1.54, 1.83, 1.5, 0.95, 0.59, 0.09, 0.95, 2.26, 1.81, 1.84, 1.17, 1.73, 1.69, 3.16]} \ No newline at end of file diff --git a/annotations_1/gMCgkXpEOIY_filtered.json b/annotations_1/gMCgkXpEOIY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d819d2866f174c216ccab57c811ef4bf4af0b17 --- /dev/null +++ b/annotations_1/gMCgkXpEOIY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.66], [12.0, 21.93], [26.0, 26.74], [28.0, 32.21], [33.0, 35.87], [37.0, 53.08], [54.0, 53.79], [56.0, 57.5], [63.0, 63.17], [64.0, 64.74], [68.0, 69.62], [71.0, 71.78], [72.0, 73.58], [76.0, 77.36], [81.0, 81.73], [83.0, 91.23], [93.0, 93.68], [96.0, 98.39], [102.0, 102.63], [104.0, 105.24], [107.0, 107.6], [110.0, 137.35], [139.0, 140.61], [158.0, 158.58], [159.0, 161.64], [164.0, 165.55], [166.0, 167.36], [169.0, 169.05], [172.0, 172.27], [176.0, 182.75], [191.0, 190.63], [192.0, 200.15], [201.0, 201.78], [204.0, 204.53]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.51, 0.0, 47.9, 98.8, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.94, 0.0, 99.52, 0.0, 0.0, 0.0, 32.23, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 38.74, 0.0, 72.9, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 41.5], ["fly, housefly", 16.55], ["insect", 5.69]], null, [["theremin", 79.49], ["music", 13.41], ["musical instrument", 1.25]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 94.16], ["cough", 2.8], ["noise", 0.52]], null, null, null, null, null, [["vehicle", 24.34], ["buzz", 17.39], ["race car, auto racing", 11.85]], null, null, null, null, null, null, null, [["snicker", 35.39], ["laughter", 33.03], ["baby laughter", 8.02]], null, null, null, null], "duration": [0.66, 9.93, 0.74, 4.21, 2.87, 16.08, -0.21, 1.5, 0.17, 0.74, 1.62, 0.78, 1.58, 1.36, 0.73, 8.23, 0.68, 2.39, 0.63, 1.24, 0.6, 27.35, 1.61, 0.58, 2.64, 1.55, 1.36, 0.05, 0.27, 6.75, -0.37, 8.15, 0.78, 0.53]} \ No newline at end of file diff --git a/annotations_1/gMdTl2R354A_filtered.json b/annotations_1/gMdTl2R354A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10c67be9fa6959c90f2002195bbcc3e7416698de --- /dev/null +++ b/annotations_1/gMdTl2R354A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.38], [44.0, 45.0], [52.0, 53.22], [68.0, 67.91], [70.0, 70.97], [83.0, 83.07], [86.0, 86.95], [91.0, 91.89], [93.0, 94.91], [102.0, 104.4], [111.0, 110.94], [120.0, 120.65], [123.0, 124.7], [127.0, 128.48], [138.0, 138.55], [157.0, 157.98], [167.0, 168.05], [174.0, 175.59], [209.0, 210.56], [213.0, 213.14], [235.0, 236.21], [237.0, 238.17], [239.0, 241.64], [244.0, 246.27]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.52, 34.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["didgeridoo", 14.64], ["speech", 11.17], ["music", 7.17]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 63.49], ["hum", 5.57], ["busy signal", 5.49]], [["music", 32.48], ["musical instrument", 17.54], ["hum", 12.84]]], "duration": [0.38, 1.0, 1.22, -0.09, 0.97, 0.07, 0.95, 0.89, 1.91, 2.4, -0.06, 0.65, 1.7, 1.48, 0.55, 0.98, 1.05, 1.59, 1.56, 0.14, 1.21, 1.17, 2.64, 2.27]} \ No newline at end of file diff --git a/annotations_1/gNCkFkii-tA_filtered.json b/annotations_1/gNCkFkii-tA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..602a8045f794eb87741eb5b733be4a254f78c68d --- /dev/null +++ b/annotations_1/gNCkFkii-tA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.85], [7.0, 7.57], [9.0, 10.17], [15.0, 15.45], [18.0, 20.41], [24.0, 27.28], [29.0, 31.46], [38.0, 45.89], [48.0, 50.25], [55.0, 55.54], [56.0, 56.56], [58.0, 60.25], [64.0, 64.76], [65.0, 66.02], [75.0, 79.08], [82.0, 86.46], [86.0, 86.51], [94.0, 99.12], [107.0, 108.28], [113.0, 113.56], [116.0, 116.85], [125.0, 126.55], [129.0, 131.08]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, true, false, false, true, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.66, 33.57, 35.29, 34.89, 30.43, 0.0, 0.0, 30.35, 0.0, 0.0, 29.04, 30.72, 0.0, 30.5, 0.0, 0.0, 0.0, 0.0, 34.07], "audiomae_on_audioset": [null, null, null, null, [["speech", 44.04], ["sidetone", 17.38], ["rumble", 7.13]], [["whale vocalization", 36.97], ["speech", 31.21], ["stomach rumble", 10.89]], [["speech", 20.89], ["creak", 11.1], ["animal", 8.19]], [["speech", 48.91], ["mains hum", 15.18], ["hum", 13.98]], [["sidetone", 40.96], ["speech", 22.93], ["radio", 11.66]], null, null, [["music", 27.16], ["whale vocalization", 17.43], ["hum", 3.85]], null, null, [["whale vocalization", 29.7], ["hum", 13.32], ["throbbing", 10.32]], [["throbbing", 20.43], ["speech", 18.2], ["hum", 14.15]], null, [["speech", 47.43], ["car", 8.44], ["vehicle", 6.77]], null, null, null, null, [["music", 67.67], ["musical instrument", 6.2], ["synthesizer", 3.58]]], "duration": [0.85, 0.57, 1.17, 0.45, 2.41, 3.28, 2.46, 7.89, 2.25, 0.54, 0.56, 2.25, 0.76, 1.02, 4.08, 4.46, 0.51, 5.12, 1.28, 0.56, 0.85, 1.55, 2.08]} \ No newline at end of file diff --git a/annotations_1/gNbqn47rt3M_filtered.json b/annotations_1/gNbqn47rt3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c83cd3d2085304d2b09b7d1aa2fd68f1d870a49e --- /dev/null +++ b/annotations_1/gNbqn47rt3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.88], [13.0, 13.54], [39.0, 55.81], [79.0, 79.59], [82.0, 81.65], [84.0, 84.35], [87.0, 88.59], [90.0, 93.99], [95.0, 96.7], [108.0, 109.92], [114.0, 114.51], [119.0, 119.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.69, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 81.47], ["psychedelic rock", 1.11], ["musical instrument", 0.79]], null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.54, 16.81, 0.59, -0.35, 0.35, 1.59, 3.99, 1.7, 1.92, 0.51, 0.31]} \ No newline at end of file diff --git a/annotations_1/gO6qemCFhEU_filtered.json b/annotations_1/gO6qemCFhEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbc7bb37dabd592a750932d6dfa60e8df66315c9 --- /dev/null +++ b/annotations_1/gO6qemCFhEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.23], [6.0, 6.59], [10.0, 36.41], [38.0, 39.73], [42.0, 42.63], [43.0, 43.9], [45.0, 46.03], [47.0, 49.91], [50.0, 53.37], [54.0, 64.22], [70.0, 73.95], [75.0, 78.26], [79.0, 80.5], [81.0, 82.24], [83.0, 83.15], [85.0, 85.02], [86.0, 88.33], [89.0, 98.24], [99.0, 111.42], [112.0, 111.55], [112.0, 112.46], [113.0, 128.38], [132.0, 133.95], [135.0, 136.53], [148.0, 156.39], [157.0, 158.43]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.93, 0.0, 0.0, 0.0, 0.0, 41.34, 40.73, 37.92, 82.97, 85.17, 0.0, 0.0, 0.0, 0.0, 71.72, 38.9, 36.48, 0.0, 0.0, 38.36, 0.0, 0.0, 33.12, 0.0], "audiomae_on_audioset": [null, null, [["music", 44.39], ["speech", 10.45], ["musical instrument", 7.13]], null, null, null, null, [["music", 66.45], ["theremin", 5.59], ["wind instrument, woodwind instrument", 3.93]], [["music", 35.17], ["theremin", 23.36], ["wind instrument, woodwind instrument", 8.95]], [["music", 48.34], ["wind instrument, woodwind instrument", 16.85], ["speech", 9.21]], null, null, null, null, null, null, null, [["music", 33.3], ["whale vocalization", 19.37], ["wind instrument, woodwind instrument", 13.21]], [["music", 37.18], ["wind instrument, woodwind instrument", 25.57], ["musical instrument", 9.72]], null, null, [["music", 45.12], ["theremin", 22.23], ["musical instrument", 10.59]], null, null, [["music", 34.05], ["clarinet", 27.0], ["wind instrument, woodwind instrument", 13.47]], null], "duration": [1.23, 0.59, 26.41, 1.73, 0.63, 0.9, 1.03, 2.91, 3.37, 10.22, 3.95, 3.26, 1.5, 1.24, 0.15, 0.02, 2.33, 9.24, 12.42, -0.45, 0.46, 15.38, 1.95, 1.53, 8.39, 1.43]} \ No newline at end of file diff --git a/annotations_1/gPAI19a84KU_filtered.json b/annotations_1/gPAI19a84KU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0544fa8591782c6f6c265209c67a9f69ef973111 --- /dev/null +++ b/annotations_1/gPAI19a84KU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.03], [8.0, 8.88], [13.0, 16.66], [18.0, 32.7], [33.0, 33.84], [34.0, 34.99], [40.0, 42.08], [44.0, 48.44], [49.0, 52.52], [54.0, 75.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.99, 53.72, 0.0, 0.0, 98.1, 99.26, 95.51, 99.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 0.88, 3.66, 14.7, 0.84, 0.99, 2.08, 4.44, 3.52, 21.07]} \ No newline at end of file diff --git a/annotations_1/gPJFxEvmHpQ_filtered.json b/annotations_1/gPJFxEvmHpQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02ae43f335342554fda7d7a3024ef5725a6180a4 --- /dev/null +++ b/annotations_1/gPJFxEvmHpQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[132.0, 135.62], [137.0, 138.03], [142.0, 142.23], [145.0, 146.25], [151.0, 160.84]], "keep_status": [true, false, false, false, true], "silence_prob": [42.84, 0.0, 0.0, 0.0, 39.88], "audiomae_on_audioset": [[["music", 26.6], ["synthesizer", 11.01], ["sine wave", 7.9]], null, null, null, [["music", 30.3], ["speech", 29.08], ["synthesizer", 10.39]]], "duration": [3.62, 1.03, 0.23, 1.25, 9.84]} \ No newline at end of file diff --git a/annotations_1/gQ48-nl8wwc_filtered.json b/annotations_1/gQ48-nl8wwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a872c78a25fc7072da5f930c59781d548eccf5b8 --- /dev/null +++ b/annotations_1/gQ48-nl8wwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [4.0, 12.63], [15.0, 22.23], [25.0, 60.51], [64.0, 66.87], [68.0, 68.17], [70.0, 70.88], [72.0, 75.0], [84.0, 84.94], [91.0, 92.37], [99.0, 99.25], [101.0, 114.64]], "keep_status": [false, false, true, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 29.99, 29.95, 0.0, 48.19, 0.0, 0.0, 33.99, 0.0, 0.0, 0.0, 31.58], "audiomae_on_audioset": [null, [["music", 69.51], ["fart", 5.42], ["speech", 2.79]], [["music", 37.46], ["speech", 15.57], ["vehicle", 7.59]], null, [["hum", 25.17], ["music", 19.35], ["throbbing", 10.63]], null, null, [["whale vocalization", 24.62], ["speech", 16.99], ["hum", 5.7]], null, null, null, [["music", 72.48], ["speech", 4.37], ["synthesizer", 3.78]]], "duration": [1.05, 8.63, 7.23, 35.51, 2.87, 0.17, 0.88, 3.0, 0.94, 1.37, 0.25, 13.64]} \ No newline at end of file diff --git a/annotations_1/gQ5KDSBMFRU_filtered.json b/annotations_1/gQ5KDSBMFRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27c3c979771484ddca6f3b46f292e7e5c8f034ab --- /dev/null +++ b/annotations_1/gQ5KDSBMFRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.8], [2.0, 2.49], [4.0, 5.19], [6.0, 12.83], [17.0, 18.2], [20.0, 20.93], [24.0, 26.13], [28.0, 29.56], [31.0, 33.47], [36.0, 36.46], [38.0, 41.22], [41.0, 41.91], [42.0, 42.8], [44.0, 44.81], [46.0, 49.22], [50.0, 50.63], [53.0, 53.65], [55.0, 54.95], [58.0, 60.54], [62.0, 62.82], [67.0, 68.94], [71.0, 72.77], [74.0, 77.04], [79.0, 79.12], [80.0, 80.99], [84.0, 85.21], [89.0, 90.39], [92.0, 92.85], [96.0, 96.23], [96.0, 100.41], [100.0, 103.06], [106.0, 106.73], [108.0, 110.96], [113.0, 115.05], [116.0, 119.82], [121.0, 127.52], [130.0, 131.25], [132.0, 133.15], [136.0, 136.66], [138.0, 140.22], [145.0, 146.2], [149.0, 151.24], [154.0, 154.68], [157.0, 159.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 96.04, 0.0, 0.0, 99.97, 0.0, 96.42, 0.0, 79.24, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 99.26, 0.0, 99.94, 100.0, 86.82, 99.65, 0.0, 0.0, 0.0, 99.26, 0.0, 94.95, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.2, 0.49, 1.19, 6.83, 1.2, 0.93, 2.13, 1.56, 2.47, 0.46, 3.22, 0.91, 0.8, 0.81, 3.22, 0.63, 0.65, -0.05, 2.54, 0.82, 1.94, 1.77, 3.04, 0.12, 0.99, 1.21, 1.39, 0.85, 0.23, 4.41, 3.06, 0.73, 2.96, 2.05, 3.82, 6.52, 1.25, 1.15, 0.66, 2.22, 1.2, 2.24, 0.68, 2.73]} \ No newline at end of file diff --git a/annotations_1/gQATrdAXELg_filtered.json b/annotations_1/gQATrdAXELg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea760fb48498da72c699bf772ca317d016f9c046 --- /dev/null +++ b/annotations_1/gQATrdAXELg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.21], [1.0, 25.52], [27.0, 46.53], [47.0, 48.49], [50.0, 50.9], [54.0, 54.77], [60.0, 62.21], [63.0, 103.59], [104.0, 110.0], [115.0, 115.64], [116.0, 116.97], [118.0, 133.07], [135.0, 134.97], [137.0, 137.62], [142.0, 143.68], [145.0, 145.96], [146.0, 146.1], [147.0, 150.84], [153.0, 155.29]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 30.41, 30.04, 0.0, 0.0, 0.0, 42.48, 0.0, 59.15, 0.0, 0.0, 31.03, 0.0, 0.0, 0.0, 0.0, 0.0, 28.54, 36.91], "audiomae_on_audioset": [null, [["music", 54.36], ["speech", 14.99], ["hum", 4.69]], [["music", 48.24], ["hum", 15.78], ["mains hum", 10.68]], null, null, null, [["helicopter", 15.42], ["vehicle", 11.92], ["hum", 8.78]], null, null, null, null, [["music", 63.4], ["speech", 7.4], ["throbbing", 6.9]], null, null, null, null, null, [["music", 40.65], ["eruption", 13.57], ["explosion", 8.63]], [["music", 56.5], ["ambient music", 6.11], ["scary music", 4.11]]], "duration": [0.21, 24.52, 19.53, 1.49, 0.9, 0.77, 2.21, 40.59, 6.0, 0.64, 0.97, 15.07, -0.03, 0.62, 1.68, 0.96, 0.1, 3.84, 2.29]} \ No newline at end of file diff --git a/annotations_1/gQMtp2WxEA4_filtered.json b/annotations_1/gQMtp2WxEA4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe069e9fcdc8099d7f8e3397d47fdb78570aabe4 --- /dev/null +++ b/annotations_1/gQMtp2WxEA4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.26], [5.0, 5.1], [6.0, 7.74], [16.0, 15.75], [18.0, 19.53], [26.0, 26.43], [29.0, 29.62], [32.0, 32.68], [52.0, 56.89], [66.0, 66.78], [70.0, 70.66], [97.0, 98.1], [101.0, 104.7], [134.0, 134.99], [153.0, 159.07], [165.0, 169.94], [173.0, 177.35], [180.0, 179.91]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.81, 0.0, 0.0, 0.0, 46.97, 0.0, 42.6, 31.5, 30.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["grunt", 53.87], ["fart", 6.97], ["animal", 5.01]], null, null, null, [["speech", 11.33], ["music", 8.4], ["bleat", 7.48]], null, [["music", 16.68], ["speech", 12.94], ["didgeridoo", 12.29]], [["music", 79.12], ["didgeridoo", 4.25], ["musical instrument", 3.74]], [["music", 58.02], ["foghorn", 9.23], ["trombone", 8.39]], null], "duration": [0.26, 0.1, 1.74, -0.25, 1.53, 0.43, 0.62, 0.68, 4.89, 0.78, 0.66, 1.1, 3.7, 0.99, 6.07, 4.94, 4.35, -0.09]} \ No newline at end of file diff --git a/annotations_1/gQNFCRom7c0_filtered.json b/annotations_1/gQNFCRom7c0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ba7df57a7d1e7df69f26fea8f27a48fc1d5f467 --- /dev/null +++ b/annotations_1/gQNFCRom7c0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.99], [8.0, 7.92], [10.0, 14.4], [16.0, 16.21], [21.0, 22.42], [24.0, 26.65], [28.0, 31.11], [31.0, 41.52], [42.0, 41.55], [42.0, 41.59], [42.0, 41.62], [42.0, 45.28], [46.0, 45.94], [46.0, 49.54], [51.0, 51.46], [54.0, 55.0], [56.0, 58.26], [61.0, 68.18], [74.0, 75.88], [79.0, 78.87], [79.0, 78.95], [89.0, 90.86], [93.0, 92.8], [93.0, 93.43], [94.0, 96.85], [99.0, 101.83], [117.0, 118.23], [121.0, 124.23], [126.0, 125.74], [128.0, 128.92], [129.0, 131.73], [132.0, 133.51], [134.0, 135.19], [135.0, 142.89], [144.0, 145.12]], "keep_status": [false, false, true, false, false, true, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 42.04, 0.0, 0.0, 41.91, 37.57, 42.24, 0.0, 0.0, 0.0, 45.43, 0.0, 39.7, 0.0, 0.0, 37.99, 40.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.8, 49.31, 0.0, 40.97, 0.0, 0.0, 40.28, 0.0, 0.0, 39.4, 0.0], "audiomae_on_audioset": [null, null, [["music", 49.18], ["musical instrument", 7.22], ["guitar", 7.17]], null, null, [["music", 53.33], ["electric piano", 3.97], ["keyboard (musical)", 3.34]], [["music", 40.45], ["musical instrument", 9.35], ["plucked string instrument", 7.37]], [["music", 78.81], ["musical instrument", 6.79], ["keyboard (musical)", 2.11]], null, null, null, [["music", 52.15], ["speech", 9.91], ["keyboard (musical)", 5.56]], null, [["music", 37.13], ["harp", 6.75], ["pizzicato", 5.27]], null, null, [["music", 65.01], ["musical instrument", 7.08], ["plucked string instrument", 4.44]], [["music", 65.27], ["musical instrument", 5.53], ["double bass", 4.98]], null, null, null, null, null, null, [["music", 49.34], ["musical instrument", 15.84], ["piano", 5.44]], [["music", 72.97], ["didgeridoo", 8.22], ["musical instrument", 5.2]], null, [["music", 43.4], ["musical instrument", 19.46], ["piano", 15.99]], null, null, [["music", 49.95], ["musical instrument", 10.78], ["double bass", 7.67]], null, null, [["music", 50.78], ["musical instrument", 11.46], ["plucked string instrument", 7.21]], null], "duration": [1.99, -0.08, 4.4, 0.21, 1.42, 2.65, 3.11, 10.52, -0.45, -0.41, -0.38, 3.28, -0.06, 3.54, 0.46, 1.0, 2.26, 7.18, 1.88, -0.13, -0.05, 1.86, -0.2, 0.43, 2.85, 2.83, 1.23, 3.23, -0.26, 0.92, 2.73, 1.51, 1.19, 7.89, 1.12]} \ No newline at end of file diff --git a/annotations_1/gQO9bgOLhmg_filtered.json b/annotations_1/gQO9bgOLhmg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..806adc9577dd85bd1fe8bbc2f0fc1f09741cd290 --- /dev/null +++ b/annotations_1/gQO9bgOLhmg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.9], [6.0, 6.37], [9.0, 16.87], [22.0, 29.27], [31.0, 35.07], [36.0, 36.68], [38.0, 38.55], [39.0, 40.14], [42.0, 44.24], [51.0, 52.02], [53.0, 58.83], [61.0, 62.41], [64.0, 65.82], [67.0, 69.47], [72.0, 116.13], [117.0, 136.07], [138.0, 138.82], [143.0, 146.82], [148.0, 152.32]], "keep_status": [false, false, true, true, true, false, false, false, true, false, true, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 38.45, 31.12, 43.23, 0.0, 0.0, 0.0, 30.75, 0.0, 30.87, 0.0, 0.0, 34.53, 0.0, 30.75, 0.0, 57.48, 37.41], "audiomae_on_audioset": [null, null, [["speech", 26.89], ["hum", 21.71], ["mains hum", 17.79]], [["hum", 23.38], ["mains hum", 20.36], ["music", 16.6]], [["music", 38.03], ["hum", 11.93], ["throbbing", 11.49]], null, null, null, [["speech", 25.2], ["vehicle", 13.51], ["mains hum", 7.98]], null, [["music", 31.5], ["hum", 14.44], ["mains hum", 8.69]], null, null, [["music", 55.86], ["throbbing", 9.0], ["hum", 6.28]], null, [["music", 28.38], ["hum", 17.58], ["speech", 10.76]], null, null, [["hum", 30.31], ["speech", 18.34], ["mains hum", 14.1]]], "duration": [0.9, 0.37, 7.87, 7.27, 4.07, 0.68, 0.55, 1.14, 2.24, 1.02, 5.83, 1.41, 1.82, 2.47, 44.13, 19.07, 0.82, 3.82, 4.32]} \ No newline at end of file diff --git a/annotations_1/gQgdweybPwk_filtered.json b/annotations_1/gQgdweybPwk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c820bbc6371a85007b9a948bbb12577eb7db9fa9 --- /dev/null +++ b/annotations_1/gQgdweybPwk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [5.0, 5.58], [6.0, 6.76], [8.0, 9.69], [16.0, 17.2], [22.0, 22.82], [23.0, 23.09], [23.0, 23.14], [23.0, 23.23], [23.0, 23.4], [23.0, 23.75], [24.0, 23.97], [26.0, 29.02], [31.0, 32.64], [33.0, 33.83], [43.0, 54.53], [56.0, 56.83], [62.0, 62.5], [66.0, 66.58], [94.0, 97.07], [100.0, 99.84], [105.0, 105.16], [109.0, 111.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.53, 0.0, 0.0, 40.04, 0.0, 0.0, 0.0, 37.32, 0.0, 0.0, 38.31], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 75.27], ["radio", 4.29], ["noise", 3.27]], null, null, [["speech", 85.92], ["animal", 3.02], ["electric shaver, electric razor", 2.42]], null, null, null, [["moo", 23.67], ["livestock, farm animals, working animals", 20.37], ["cattle, bovinae", 19.28]], null, null, [["music", 28.39], ["moo", 13.13], ["livestock, farm animals, working animals", 11.52]]], "duration": [0.45, 0.58, 0.76, 1.69, 1.2, 0.82, 0.09, 0.14, 0.23, 0.4, 0.75, -0.03, 3.02, 1.64, 0.83, 11.53, 0.83, 0.5, 0.58, 3.07, -0.16, 0.16, 2.45]} \ No newline at end of file diff --git a/annotations_1/gRP3sdjszlQ_filtered.json b/annotations_1/gRP3sdjszlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..360380962c4eed01698851764b80421759784a3f --- /dev/null +++ b/annotations_1/gRP3sdjszlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.87], [22.0, 27.62], [28.0, 27.8], [28.0, 34.28], [44.0, 47.19], [50.0, 50.14], [52.0, 53.0], [54.0, 61.99], [71.0, 72.12], [73.0, 75.74], [78.0, 79.2], [83.0, 84.72], [87.0, 91.79], [100.0, 104.87], [110.0, 114.59], [119.0, 120.36], [128.0, 136.04], [138.0, 143.33], [145.0, 146.97], [147.0, 151.38]], "keep_status": [true, false, false, true, true, false, false, true, false, false, false, false, true, true, true, false, true, true, false, true], "silence_prob": [40.62, 34.04, 0.0, 35.27, 32.97, 0.0, 0.0, 30.12, 0.0, 33.3, 0.0, 0.0, 31.55, 30.49, 32.43, 0.0, 31.49, 30.26, 0.0, 33.19], "audiomae_on_audioset": [[["music", 48.35], ["speech", 5.05], ["boing", 3.22]], [["music", 52.9], ["speech", 19.22], ["thunk", 2.68]], null, [["music", 43.69], ["thunk", 8.05], ["sound effect", 7.73]], [["music", 15.56], ["speech", 12.49], ["boing", 9.37]], null, null, [["fly, housefly", 20.69], ["music", 15.85], ["mosquito", 11.35]], null, [["speech", 36.68], ["music", 31.75], ["effects unit", 4.77]], null, null, [["livestock, farm animals, working animals", 17.46], ["cattle, bovinae", 15.42], ["mosquito", 10.14]], [["music", 40.7], ["boing", 7.72], ["cacophony", 6.16]], [["music", 25.38], ["speech", 11.84], ["musical instrument", 3.14]], null, [["music", 24.6], ["speech", 18.53], ["mosquito", 12.27]], [["music", 33.13], ["throbbing", 5.7], ["fart", 4.53]], null, [["music", 57.19], ["musical instrument", 8.15], ["synthesizer", 3.2]]], "duration": [2.87, 5.62, -0.2, 6.28, 3.19, 0.14, 1.0, 7.99, 1.12, 2.74, 1.2, 1.72, 4.79, 4.87, 4.59, 1.36, 8.04, 5.33, 1.97, 4.38]} \ No newline at end of file diff --git a/annotations_1/gSG9bZu1NtM_filtered.json b/annotations_1/gSG9bZu1NtM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5c265f3bd61dd6785c07ea1ee562dd48bab5f31 --- /dev/null +++ b/annotations_1/gSG9bZu1NtM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.64], [4.0, 7.33], [9.0, 13.68], [20.0, 20.14], [23.0, 23.92], [25.0, 27.5], [29.0, 57.89], [59.0, 60.59], [66.0, 67.09], [68.0, 68.4], [70.0, 70.29], [71.0, 71.56], [72.0, 81.23], [83.0, 84.28], [86.0, 87.99], [90.0, 92.18], [96.0, 103.81], [106.0, 106.66], [110.0, 114.78], [118.0, 118.12], [122.0, 124.16], [131.0, 130.94], [133.0, 136.43], [137.0, 137.83], [140.0, 146.67], [150.0, 161.0], [164.0, 178.19]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 52.74, 51.6, 0.0, 0.0, 39.74, 33.99, 0.0, 0.0, 0.0, 0.0, 0.0, 31.36, 0.0, 0.0, 86.45, 31.63, 0.0, 34.67, 0.0, 35.51, 0.0, 33.19, 0.0, 31.96, 33.89, 32.52], "audiomae_on_audioset": [null, null, null, null, null, [["music", 46.8], ["musical instrument", 11.56], ["foghorn", 7.42]], [["whale vocalization", 25.95], ["speech", 23.25], ["noise", 13.49]], null, null, null, null, null, [["music", 48.02], ["speech", 17.33], ["thump, thud", 4.59]], null, null, null, [["music", 39.13], ["mains hum", 7.31], ["hum", 6.78]], null, [["music", 29.04], ["throbbing", 20.97], ["hum", 12.36]], null, [["music", 71.75], ["throbbing", 7.38], ["hum", 3.07]], null, [["music", 38.91], ["hum", 8.45], ["throbbing", 7.97]], null, [["music", 56.02], ["hum", 7.41], ["throbbing", 5.61]], [["hum", 37.85], ["throbbing", 28.02], ["music", 18.74]], [["hum", 46.71], ["music", 19.05], ["mains hum", 12.91]]], "duration": [0.64, 3.33, 4.68, 0.14, 0.92, 2.5, 28.89, 1.59, 1.09, 0.4, 0.29, 0.56, 9.23, 1.28, 1.99, 2.18, 7.81, 0.66, 4.78, 0.12, 2.16, -0.06, 3.43, 0.83, 6.67, 11.0, 14.19]} \ No newline at end of file diff --git a/annotations_1/gSZ82TOHWc0_filtered.json b/annotations_1/gSZ82TOHWc0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6ef2889234d47070c29bad698536a98385b3668 --- /dev/null +++ b/annotations_1/gSZ82TOHWc0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.61], [13.0, 13.83], [21.0, 21.64], [45.0, 45.86], [46.0, 46.47], [48.0, 48.76], [49.0, 49.71], [50.0, 50.38], [51.0, 51.63], [55.0, 56.93], [78.0, 78.63], [80.0, 80.0], [85.0, 86.54], [90.0, 91.59], [99.0, 100.7], [112.0, 112.43], [113.0, 114.62], [115.0, 120.07], [121.0, 125.22], [127.0, 128.58], [130.0, 130.27], [133.0, 136.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.53, 79.41, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.62], ["music", 16.04], ["fart", 6.58]], null, null, null, null], "duration": [1.61, 0.83, 0.64, 0.86, 0.47, 0.76, 0.71, 0.38, 0.63, 1.93, 0.63, 0.0, 1.54, 1.59, 1.7, 0.43, 1.62, 5.07, 4.22, 1.58, 0.27, 3.53]} \ No newline at end of file diff --git a/annotations_1/gT7MQhe8gRE_filtered.json b/annotations_1/gT7MQhe8gRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec24fae43ef41e48f583056adc6a2ef3a8640dc9 --- /dev/null +++ b/annotations_1/gT7MQhe8gRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.97], [12.0, 62.8], [65.0, 68.55], [70.0, 84.94], [92.0, 92.16], [93.0, 94.09], [99.0, 99.32], [100.0, 101.51], [104.0, 104.75], [106.0, 106.52], [107.0, 109.56], [111.0, 111.87], [113.0, 113.75], [117.0, 133.62], [134.0, 136.48], [139.0, 141.29], [142.0, 161.15]], "keep_status": [false, false, true, true, false, false, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [46.68, 0.0, 39.91, 46.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.65, 0.0, 0.0, 31.09, 30.66, 29.88, 34.63], "audiomae_on_audioset": [[["speech", 73.26], ["music", 8.1], ["hum", 3.71]], null, [["music", 34.18], ["speech", 29.32], ["didgeridoo", 6.32]], [["music", 40.27], ["buzz", 6.66], ["male singing", 5.74]], null, null, null, null, null, null, [["music", 60.03], ["synthesizer", 2.82], ["singing", 2.74]], null, null, [["music", 51.69], ["cattle, bovinae", 8.72], ["moo", 7.05]], [["music", 38.19], ["didgeridoo", 35.59], ["synthesizer", 3.94]], [["moo", 42.55], ["cattle, bovinae", 33.51], ["livestock, farm animals, working animals", 13.39]], [["fly, housefly", 23.4], ["mosquito", 13.17], ["hum", 12.57]]], "duration": [8.97, 50.8, 3.55, 14.94, 0.16, 1.09, 0.32, 1.51, 0.75, 0.52, 2.56, 0.87, 0.75, 16.62, 2.48, 2.29, 19.15]} \ No newline at end of file diff --git a/annotations_1/gTakZ13l8xY_filtered.json b/annotations_1/gTakZ13l8xY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bf2c089522e7bf118d64db09dc97cb3222dc947 --- /dev/null +++ b/annotations_1/gTakZ13l8xY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.47], [4.0, 4.23], [14.0, 14.89], [18.0, 18.57], [20.0, 20.38], [25.0, 25.74], [28.0, 28.41], [38.0, 38.79], [46.0, 46.3], [48.0, 48.68], [52.0, 54.65], [56.0, 56.37], [59.0, 60.24], [66.0, 67.56], [72.0, 73.18], [75.0, 75.2], [76.0, 77.35], [83.0, 83.13], [84.0, 86.37], [88.0, 88.7], [93.0, 92.8], [100.0, 99.98], [102.0, 102.79], [107.0, 107.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.08, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 17.05], ["throbbing", 12.74], ["speech", 7.43]], null, null, null, null, null, null, null, [["music", 35.8], ["whale vocalization", 9.83], ["hum", 6.49]], null, null, null, null, null], "duration": [0.47, 0.23, 0.89, 0.57, 0.38, 0.74, 0.41, 0.79, 0.3, 0.68, 2.65, 0.37, 1.24, 1.56, 1.18, 0.2, 1.35, 0.13, 2.37, 0.7, -0.2, -0.02, 0.79, 0.69]} \ No newline at end of file diff --git a/annotations_1/gTt8yvw4MJE_filtered.json b/annotations_1/gTt8yvw4MJE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bdab74c8d1af68307b989fca7ce1e88b32d7fab --- /dev/null +++ b/annotations_1/gTt8yvw4MJE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.32], [13.0, 16.04], [18.0, 20.85], [23.0, 23.8], [29.0, 29.1], [41.0, 41.28], [47.0, 49.44], [50.0, 49.62], [50.0, 51.39], [53.0, 55.83], [65.0, 65.45], [76.0, 77.09], [83.0, 82.97], [86.0, 88.03], [89.0, 91.84], [94.0, 95.44], [105.0, 106.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 100.0, 39.34, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 38.67, 0.0, 0.0, 0.0, 44.09, 44.23, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["stomach rumble", 30.71], ["speech", 28.24], ["crack", 12.79]], null, null, null, null, null, null, [["hum", 28.2], ["music", 26.8], ["throbbing", 16.47]], null, null, null, [["music", 37.17], ["throbbing", 19.28], ["hum", 15.5]], [["music", 29.17], ["hum", 19.18], ["speech", 7.7]], null, null], "duration": [1.32, 3.04, 2.85, 0.8, 0.1, 0.28, 2.44, -0.38, 1.39, 2.83, 0.45, 1.09, -0.03, 2.03, 2.84, 1.44, 1.15]} \ No newline at end of file diff --git a/annotations_1/gU886wmXhQo_filtered.json b/annotations_1/gU886wmXhQo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..577051a1e717400bb81775de2bb9efbbb0249b1d --- /dev/null +++ b/annotations_1/gU886wmXhQo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.99], [35.0, 36.32], [58.0, 58.7]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.99, 1.32, 0.7]} \ No newline at end of file diff --git a/annotations_1/gUKbFeHjYX8_filtered.json b/annotations_1/gUKbFeHjYX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e59fe727db9e3c5a3368ac0ce71d2b4472564d3 --- /dev/null +++ b/annotations_1/gUKbFeHjYX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.67], [12.0, 62.45], [65.0, 134.4], [135.0, 138.96], [142.0, 153.69]], "keep_status": [false, false, false, false, true], "silence_prob": [38.67, 0.0, 0.0, 59.96, 33.31], "audiomae_on_audioset": [[["music", 38.96], ["hum", 23.32], ["mains hum", 10.62]], null, null, null, [["music", 21.27], ["explosion", 16.32], ["rumble", 13.52]]], "duration": [2.67, 50.45, 69.4, 3.96, 11.69]} \ No newline at end of file diff --git a/annotations_1/gUeHamRZkSY_filtered.json b/annotations_1/gUeHamRZkSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89000d6cb04e750cded316431994c13c19fd6ee1 --- /dev/null +++ b/annotations_1/gUeHamRZkSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.08], [9.0, 12.41], [15.0, 16.36], [17.0, 17.81], [21.0, 20.93], [21.0, 22.08], [24.0, 27.77], [29.0, 29.44], [32.0, 32.05], [36.0, 44.34], [46.0, 48.27], [49.0, 61.7], [64.0, 66.65], [67.0, 67.81], [70.0, 70.58], [72.0, 72.69], [73.0, 74.26], [81.0, 81.67], [83.0, 83.05], [84.0, 85.11], [86.0, 85.75], [91.0, 91.17], [97.0, 98.31], [100.0, 101.44], [102.0, 103.81], [116.0, 138.75], [143.0, 142.77], [150.0, 150.77], [154.0, 154.63], [157.0, 156.95]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [48.91, 47.2, 0.0, 0.0, 0.0, 0.0, 40.4, 0.0, 0.0, 82.07, 86.82, 92.15, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.6, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 41.43], ["animal", 11.9], ["speech", 5.73]], [["music", 36.21], ["hum", 11.42], ["mains hum", 6.49]], null, null, null, null, [["sidetone", 36.9], ["speech", 29.69], ["mains hum", 10.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.44], ["speech", 14.68], ["animal", 6.6]], null, null, null, null], "duration": [6.08, 3.41, 1.36, 0.81, -0.07, 1.08, 3.77, 0.44, 0.05, 8.34, 2.27, 12.7, 2.65, 0.81, 0.58, 0.69, 1.26, 0.67, 0.05, 1.11, -0.25, 0.17, 1.31, 1.44, 1.81, 22.75, -0.23, 0.77, 0.63, -0.05]} \ No newline at end of file diff --git a/annotations_1/gV6Y3OwR2n0_filtered.json b/annotations_1/gV6Y3OwR2n0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27d6e127f09b8cac0d180181a0228e8ae6d12ebb --- /dev/null +++ b/annotations_1/gV6Y3OwR2n0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.24], [7.0, 11.8], [12.0, 14.52], [15.0, 17.41], [19.0, 22.86], [23.0, 96.11], [98.0, 98.74], [100.0, 101.43], [105.0, 105.41], [108.0, 108.68], [110.0, 111.06], [112.0, 113.86], [116.0, 116.95], [118.0, 118.94], [122.0, 122.69], [123.0, 124.24], [126.0, 125.95], [129.0, 129.66], [131.0, 132.65], [133.0, 152.66], [154.0, 156.02], [158.0, 158.46], [167.0, 167.14], [169.0, 169.59], [174.0, 174.68], [176.0, 177.03], [178.0, 179.07]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.45, 41.6, 52.27, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.53, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 45.21], ["hum", 6.72], ["fly, housefly", 5.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.61], ["synthesizer", 8.76], ["musical instrument", 4.97]], null, null, null, null, null, null, null], "duration": [1.24, 4.8, 2.52, 2.41, 3.86, 73.11, 0.74, 1.43, 0.41, 0.68, 1.06, 1.86, 0.95, 0.94, 0.69, 1.24, -0.05, 0.66, 1.65, 19.66, 2.02, 0.46, 0.14, 0.59, 0.68, 1.03, 1.07]} \ No newline at end of file diff --git a/annotations_1/gVdIiTE1ykg_filtered.json b/annotations_1/gVdIiTE1ykg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7dbff3b08e36792516677de853ec9e7cfb06e9c8 --- /dev/null +++ b/annotations_1/gVdIiTE1ykg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.28], [6.0, 6.89], [9.0, 10.02], [14.0, 14.96], [17.0, 17.95], [19.0, 18.87], [24.0, 25.08], [28.0, 28.22], [30.0, 31.68], [32.0, 34.2], [45.0, 46.65], [49.0, 49.82], [50.0, 53.22], [55.0, 56.46], [59.0, 59.24], [60.0, 66.18], [67.0, 78.22], [88.0, 88.42], [90.0, 91.76], [94.0, 95.22], [96.0, 97.7], [104.0, 125.02], [128.0, 129.51], [131.0, 131.5], [133.0, 137.0], [140.0, 144.63], [147.0, 149.22], [152.0, 153.05], [156.0, 157.64], [159.0, 161.91], [162.0, 163.83], [166.0, 168.44]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.86, 0.0, 0.0, 33.12, 0.0, 0.0, 31.22, 31.43, 0.0, 0.0, 0.0, 0.0, 32.68, 0.0, 0.0, 81.89, 31.97, 36.81, 0.0, 0.0, 63.64, 0.0, 93.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 37.01], ["speech", 21.22], ["bee, wasp, etc.", 5.05]], null, null, [["speech", 32.39], ["music", 27.8], ["hum", 9.44]], null, null, [["music", 52.38], ["hum", 8.99], ["speech", 6.01]], [["music", 72.07], ["synthesizer", 7.66], ["timpani", 2.98]], null, null, null, null, [["music", 82.3], ["hum", 1.58], ["thunk", 1.55]], null, null, null, [["clang", 22.5], ["ding", 18.18], ["gunshot, gunfire", 12.25]], [["speech", 63.36], ["breaking", 21.55], ["outside, rural or natural", 2.26]], null, null, null, null, null], "duration": [1.28, 0.89, 1.02, 0.96, 0.95, -0.13, 1.08, 0.22, 1.68, 2.2, 1.65, 0.82, 3.22, 1.46, 0.24, 6.18, 11.22, 0.42, 1.76, 1.22, 1.7, 21.02, 1.51, 0.5, 4.0, 4.63, 2.22, 1.05, 1.64, 2.91, 1.83, 2.44]} \ No newline at end of file diff --git a/annotations_1/gW7ozVNSL8k_filtered.json b/annotations_1/gW7ozVNSL8k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2207c8e21162dd4fda648dd267654a6dd7058b2e --- /dev/null +++ b/annotations_1/gW7ozVNSL8k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [7.0, 7.7], [14.0, 14.61], [15.0, 15.99], [24.0, 25.79], [26.0, 26.91], [31.0, 32.1], [35.0, 35.06], [36.0, 38.57], [41.0, 44.61], [46.0, 47.53], [53.0, 56.71], [64.0, 64.71], [68.0, 68.84], [70.0, 70.75], [71.0, 73.67], [75.0, 80.45], [81.0, 81.77], [83.0, 84.62], [86.0, 86.95], [88.0, 89.29], [95.0, 97.97], [104.0, 104.89], [105.0, 106.34], [112.0, 112.26], [113.0, 127.97], [129.0, 129.36], [138.0, 147.19], [149.0, 150.67]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.96, 42.46, 0.0, 80.11, 0.0, 0.0, 0.0, 60.32, 62.47, 0.0, 0.0, 0.0, 0.0, 31.05, 0.0, 0.0, 0.0, 42.55, 0.0, 37.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["whale vocalization", 49.71], ["speech", 8.28], ["mosquito", 5.58]], [["moo", 41.38], ["cattle, bovinae", 34.4], ["livestock, farm animals, working animals", 11.43]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 21.8], ["music", 12.84], ["fly, housefly", 9.61]], null, null, null, [["speech", 61.83], ["buzz", 7.13], ["sheep", 5.08]], null, [["music", 65.0], ["scary music", 12.55], ["whale vocalization", 6.1]], null], "duration": [0.35, 0.7, 0.61, 0.99, 1.79, 0.91, 1.1, 0.06, 2.57, 3.61, 1.53, 3.71, 0.71, 0.84, 0.75, 2.67, 5.45, 0.77, 1.62, 0.95, 1.29, 2.97, 0.89, 1.34, 0.26, 14.97, 0.36, 9.19, 1.67]} \ No newline at end of file diff --git a/annotations_1/gWGhsJWFOrU_filtered.json b/annotations_1/gWGhsJWFOrU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/gWGhsJWFOrU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/gWHvF157sFI_filtered.json b/annotations_1/gWHvF157sFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a348c8fc320b925952f30781afb1ce39b867050 --- /dev/null +++ b/annotations_1/gWHvF157sFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [7.0, 7.72], [10.0, 10.44], [14.0, 15.9], [17.0, 17.74], [18.0, 18.86], [19.0, 19.8], [20.0, 20.71], [22.0, 23.11], [25.0, 25.32], [33.0, 33.24], [35.0, 35.48], [36.0, 36.09], [38.0, 38.69], [43.0, 44.9], [50.0, 56.69], [59.0, 59.07], [61.0, 61.82], [64.0, 65.13], [68.0, 68.39], [70.0, 75.1], [81.0, 81.23], [85.0, 86.37], [88.0, 87.93], [111.0, 169.48], [170.0, 170.19], [174.0, 176.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.07, 0.0, 0.0, 0.0, 0.0, 43.43, 0.0, 0.0, 0.0, 0.0, 0.0, 41.24], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.21], ["speech", 11.35], ["synthesizer", 7.14]], null, null, null, null, [["music", 58.25], ["synthesizer", 4.47], ["hum", 4.44]], null, null, null, null, null, [["music", 61.13], ["theremin", 8.67], ["bass guitar", 8.6]]], "duration": [0.51, 0.72, 0.44, 1.9, 0.74, 0.86, 0.8, 0.71, 1.11, 0.32, 0.24, 0.48, 0.09, 0.69, 1.9, 6.69, 0.07, 0.82, 1.13, 0.39, 5.1, 0.23, 1.37, -0.07, 58.48, 0.19, 2.79]} \ No newline at end of file diff --git a/annotations_1/gZ-QU3KT1PE_filtered.json b/annotations_1/gZ-QU3KT1PE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afcd6ca75ac335e554272139d1d8ee2f0f6d96a7 --- /dev/null +++ b/annotations_1/gZ-QU3KT1PE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [2.0, 2.34], [3.0, 3.79], [4.0, 4.62], [6.0, 8.51], [9.0, 13.59], [15.0, 18.28], [20.0, 53.49], [55.0, 81.77], [83.0, 87.61], [91.0, 116.5], [117.0, 116.77], [117.0, 116.8], [117.0, 116.83], [119.0, 119.21], [123.0, 125.46], [126.0, 126.77], [130.0, 131.4], [134.0, 135.51], [136.0, 149.08], [155.0, 160.49]], "keep_status": [false, false, false, false, true, true, true, false, true, true, true, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.69, 40.47, 33.37, 0.0, 33.63, 31.63, 32.69, 0.0, 0.0, 0.0, 0.0, 46.61, 0.0, 0.0, 0.0, 33.35, 73.82], "audiomae_on_audioset": [null, null, null, null, [["aircraft", 19.51], ["music", 13.91], ["fixed-wing aircraft, airplane", 12.2]], [["mains hum", 25.7], ["hum", 22.01], ["music", 17.87]], [["speech", 12.67], ["grunt", 12.1], ["music", 9.53]], null, [["music", 38.88], ["throbbing", 21.33], ["hum", 7.97]], [["music", 32.35], ["hum", 15.05], ["mains hum", 10.48]], [["music", 29.44], ["hum", 25.44], ["throbbing", 11.5]], null, null, null, null, [["fly, housefly", 37.0], ["insect", 11.4], ["music", 9.06]], null, null, null, [["music", 45.96], ["fly, housefly", 6.23], ["throbbing", 5.62]], null], "duration": [0.29, 0.34, 0.79, 0.62, 2.51, 4.59, 3.28, 33.49, 26.77, 4.61, 25.5, -0.23, -0.2, -0.17, 0.21, 2.46, 0.77, 1.4, 1.51, 13.08, 5.49]} \ No newline at end of file diff --git a/annotations_1/g_C56llGC1E_filtered.json b/annotations_1/g_C56llGC1E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cebd18ea90fcc7d37f39393642e288d4144d2509 --- /dev/null +++ b/annotations_1/g_C56llGC1E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.88], [7.0, 10.32], [15.0, 34.8], [50.0, 50.25], [58.0, 57.74], [58.0, 64.3], [68.0, 69.7], [74.0, 89.68], [94.0, 97.48], [100.0, 101.48], [108.0, 136.63], [144.0, 145.89], [150.0, 161.05], [169.0, 169.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.76, 32.72, 0.0, 0.0, 33.56, 0.0, 31.36, 31.6, 0.0, 36.26, 0.0, 31.59, 0.0], "audiomae_on_audioset": [null, [["music", 66.54], ["musical instrument", 9.95], ["carnatic music", 8.83]], [["music", 55.11], ["effects unit", 12.83], ["guitar", 7.53]], null, null, [["music", 71.09], ["theremin", 7.33], ["musical instrument", 4.26]], null, [["music", 78.42], ["theremin", 3.39], ["musical instrument", 2.94]], [["music", 71.87], ["electronic music", 1.72], ["musical instrument", 1.5]], null, [["music", 57.26], ["effects unit", 9.35], ["theremin", 6.5]], null, [["theremin", 55.98], ["music", 18.14], ["crowd", 3.39]], null], "duration": [1.88, 3.32, 19.8, 0.25, -0.26, 6.3, 1.7, 15.68, 3.48, 1.48, 28.63, 1.89, 11.05, 0.4]} \ No newline at end of file diff --git a/annotations_1/g_O0J66490k_filtered.json b/annotations_1/g_O0J66490k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/g_O0J66490k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/g_fIDwoORl4_filtered.json b/annotations_1/g_fIDwoORl4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79a1312a28d8c4331baa1870dcace4833f079a2d --- /dev/null +++ b/annotations_1/g_fIDwoORl4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.15], [10.0, 15.38], [16.0, 19.33], [21.0, 24.43], [26.0, 29.24], [30.0, 32.7], [35.0, 36.93], [39.0, 40.74], [46.0, 50.33], [51.0, 57.62], [59.0, 63.59], [65.0, 69.08], [70.0, 76.38], [77.0, 86.14], [87.0, 114.22], [116.0, 142.05], [143.0, 157.94], [159.0, 166.33], [167.0, 174.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [79.76, 61.18, 99.92, 92.97, 99.87, 64.41, 0.0, 0.0, 99.97, 72.16, 66.88, 88.46, 98.36, 95.91, 78.21, 81.71, 44.6, 77.87, 72.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.52], ["hum", 13.07], ["mains hum", 8.02]], null, null], "duration": [2.15, 5.38, 3.33, 3.43, 3.24, 2.7, 1.93, 1.74, 4.33, 6.62, 4.59, 4.08, 6.38, 9.14, 27.22, 26.05, 14.94, 7.33, 7.28]} \ No newline at end of file diff --git a/annotations_1/g_wEMoy_wi0_filtered.json b/annotations_1/g_wEMoy_wi0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fdd6be91165a026d60a571cbfacfa6ca3a15453 --- /dev/null +++ b/annotations_1/g_wEMoy_wi0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.08], [8.0, 12.83], [16.0, 18.96], [26.0, 36.91], [42.0, 44.63], [47.0, 49.72], [52.0, 55.26], [60.0, 60.18], [62.0, 62.83], [68.0, 69.48], [79.0, 79.15], [81.0, 82.21], [86.0, 86.9], [88.0, 90.49], [92.0, 95.98], [96.0, 98.14], [103.0, 108.04], [109.0, 112.78], [115.0, 117.51], [120.0, 122.12], [124.0, 127.01], [129.0, 153.52], [154.0, 153.94]], "keep_status": [false, false, true, true, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [99.95, 99.98, 44.55, 46.97, 37.8, 69.34, 50.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.88, 46.68, 53.1, 96.77, 85.17, 83.16, 84.43, 92.31, 65.79, 0.0], "audiomae_on_audioset": [null, null, [["speech", 17.04], ["noise", 9.06], ["hum", 8.57]], [["hiccup", 24.36], ["gasp", 18.65], ["groan", 13.95]], [["thunk", 44.6], ["glass", 14.41], ["arrow", 6.4]], null, null, null, null, null, null, null, null, [["sine wave", 32.05], ["chirp tone", 30.77], ["music", 4.31]], [["chink, clink", 27.58], ["speech", 10.8], ["cutlery, silverware", 6.07]], null, null, null, null, null, null, null, null], "duration": [4.08, 4.83, 2.96, 10.91, 2.63, 2.72, 3.26, 0.18, 0.83, 1.48, 0.15, 1.21, 0.9, 2.49, 3.98, 2.14, 5.04, 3.78, 2.51, 2.12, 3.01, 24.52, -0.06]} \ No newline at end of file diff --git a/annotations_1/gap2gWQy77A_filtered.json b/annotations_1/gap2gWQy77A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40a44b261b83d124c950325471b42848043e29ce --- /dev/null +++ b/annotations_1/gap2gWQy77A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.58], [16.0, 19.67], [20.0, 21.34], [22.0, 29.3], [33.0, 37.79], [40.0, 40.31], [41.0, 42.3], [45.0, 46.33], [47.0, 48.39], [50.0, 50.46], [53.0, 53.87], [56.0, 57.08], [58.0, 58.6], [60.0, 62.26], [74.0, 78.34], [79.0, 81.03], [82.0, 83.44], [84.0, 85.08], [104.0, 106.47], [111.0, 111.2], [113.0, 115.06], [118.0, 118.96], [119.0, 122.69], [124.0, 124.33], [128.0, 145.96]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, true, false, true], "silence_prob": [0.0, 32.54, 0.0, 29.88, 35.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.9, 45.05, 60.89, 0.0, 0.0, 35.33, 0.0, 29.1, 0.0, 30.85, 0.0, 28.14], "audiomae_on_audioset": [null, [["music", 22.4], ["throbbing", 21.93], ["hum", 13.4]], null, [["speech", 50.7], ["hum", 7.37], ["music", 5.67]], [["speech", 70.88], ["music", 14.13], ["sidetone", 3.72]], null, null, null, null, null, null, null, null, null, [["speech", 41.6], ["hum", 6.12], ["music", 6.06]], null, null, null, [["music", 32.06], ["hum", 27.89], ["mains hum", 9.21]], null, [["hum", 30.82], ["mains hum", 15.11], ["throbbing", 12.32]], null, [["music", 21.81], ["mains hum", 19.92], ["hum", 18.19]], null, [["music", 43.99], ["throbbing", 11.94], ["didgeridoo", 8.29]]], "duration": [1.58, 3.67, 1.34, 7.3, 4.79, 0.31, 1.3, 1.33, 1.39, 0.46, 0.87, 1.08, 0.6, 2.26, 4.34, 2.03, 1.44, 1.08, 2.47, 0.2, 2.06, 0.96, 3.69, 0.33, 17.96]} \ No newline at end of file diff --git a/annotations_1/gcPY3RIvtCw_filtered.json b/annotations_1/gcPY3RIvtCw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6df5faf994ef206edfefed274a3a4aa37fa3ef4 --- /dev/null +++ b/annotations_1/gcPY3RIvtCw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.54], [21.0, 23.41], [33.0, 34.08], [38.0, 38.28], [41.0, 43.14], [53.0, 53.62], [58.0, 57.96], [69.0, 69.25], [73.0, 74.36], [85.0, 86.85], [93.0, 99.05], [101.0, 102.73], [103.0, 103.71], [113.0, 114.17], [115.0, 115.05], [115.0, 119.77], [121.0, 123.23], [130.0, 133.37], [172.0, 175.07], [186.0, 187.19], [193.0, 215.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.57, 0.0, 0.0, 35.7, 0.0, 0.0, 0.0, 0.0, 0.0, 34.22, 0.0, 0.0, 0.0, 0.0, 31.56, 33.41, 31.28, 31.8, 0.0, 31.5], "audiomae_on_audioset": [null, [["music", 66.47], ["musical instrument", 3.12], ["electric piano", 2.13]], null, null, [["music", 63.35], ["musical instrument", 6.88], ["guitar", 6.01]], null, null, null, null, null, [["music", 74.88], ["theremin", 3.2], ["effects unit", 3.12]], null, null, null, null, [["music", 79.74], ["musical instrument", 4.06], ["guitar", 2.36]], [["music", 73.35], ["musical instrument", 3.69], ["guitar", 3.67]], [["music", 75.7], ["carnatic music", 2.27], ["musical instrument", 1.48]], [["music", 65.12], ["musical instrument", 5.31], ["guitar", 4.1]], null, [["music", 77.41], ["musical instrument", 2.44], ["guitar", 0.97]]], "duration": [0.54, 2.41, 1.08, 0.28, 2.14, 0.62, -0.04, 0.25, 1.36, 1.85, 6.05, 1.73, 0.71, 1.17, 0.05, 4.77, 2.23, 3.37, 3.07, 1.19, 22.49]} \ No newline at end of file diff --git a/annotations_1/ge9ahoqNSLE_filtered.json b/annotations_1/ge9ahoqNSLE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0666161ae0ea57f63734944a91a99a27c2fb19bf --- /dev/null +++ b/annotations_1/ge9ahoqNSLE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 37.54], [39.0, 43.01], [46.0, 48.41], [51.0, 52.17], [54.0, 61.23]], "keep_status": [false, true, true, false, true], "silence_prob": [0.0, 30.83, 33.62, 0.0, 30.4], "audiomae_on_audioset": [null, [["music", 12.11], ["hum", 11.78], ["mains hum", 7.67]], [["music", 31.74], ["musical instrument", 6.66], ["theremin", 3.99]], null, [["brass instrument", 23.93], ["music", 21.48], ["foghorn", 19.26]]], "duration": [0.54, 4.01, 2.41, 1.17, 7.23]} \ No newline at end of file diff --git a/annotations_1/geGO_emEsqs_filtered.json b/annotations_1/geGO_emEsqs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c97edb74a86329e3721f29a55545aa4d84ca30d9 --- /dev/null +++ b/annotations_1/geGO_emEsqs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.62], [34.0, 34.21], [38.0, 38.15], [53.0, 53.01], [100.0, 101.6], [110.0, 109.88], [113.0, 113.31], [125.0, 125.41], [144.0, 144.0], [154.0, 154.99], [171.0, 171.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.21, 0.15, 0.01, 1.6, -0.12, 0.31, 0.41, 0.0, 0.99, 0.46]} \ No newline at end of file diff --git a/annotations_1/geiub8WP_XE_filtered.json b/annotations_1/geiub8WP_XE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54114841171d99b7bce4128e738afc7e054f1b5d --- /dev/null +++ b/annotations_1/geiub8WP_XE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.31], [9.0, 10.03], [13.0, 14.34], [17.0, 18.84], [25.0, 25.3], [26.0, 29.64], [32.0, 33.29], [35.0, 39.33], [41.0, 41.57], [43.0, 43.39], [47.0, 48.63], [50.0, 53.03], [53.0, 54.78], [57.0, 57.99], [59.0, 71.96], [75.0, 77.85], [87.0, 88.35], [93.0, 94.9], [96.0, 97.19], [99.0, 100.58], [103.0, 104.33], [107.0, 107.76], [109.0, 109.59], [115.0, 116.65], [118.0, 118.34], [119.0, 120.06], [122.0, 123.09], [128.0, 133.02], [134.0, 137.83], [139.0, 141.02], [143.0, 143.09], [145.0, 145.86], [150.0, 150.96], [171.0, 171.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 73.67, 0.0, 67.89, 0.0, 0.0, 0.0, 89.9, 0.0, 0.0, 45.95, 44.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 75.23, 55.89, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.26], ["musical instrument", 7.38], ["buzz", 5.93]], [["music", 42.17], ["double bass", 9.58], ["cello", 9.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 1.03, 1.34, 1.84, 0.3, 3.64, 1.29, 4.33, 0.57, 0.39, 1.63, 3.03, 1.78, 0.99, 12.96, 2.85, 1.35, 1.9, 1.19, 1.58, 1.33, 0.76, 0.59, 1.65, 0.34, 1.06, 1.09, 5.02, 3.83, 2.02, 0.09, 0.86, 0.96, 0.51]} \ No newline at end of file diff --git a/annotations_1/geoi6Sxyg7g_filtered.json b/annotations_1/geoi6Sxyg7g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fb1ed733def18077144d1cea41d332d7f0255dc --- /dev/null +++ b/annotations_1/geoi6Sxyg7g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.16], [8.0, 10.27], [12.0, 18.15], [19.0, 22.52], [28.0, 30.1], [31.0, 38.64], [45.0, 46.03], [49.0, 50.13], [52.0, 53.33], [57.0, 59.29], [61.0, 61.92], [67.0, 69.33], [72.0, 77.18], [80.0, 81.68], [82.0, 82.75], [83.0, 87.59], [88.0, 91.29], [93.0, 95.05], [95.0, 97.31], [99.0, 103.25], [104.0, 106.93], [109.0, 109.56], [112.0, 112.04], [113.0, 116.56], [118.0, 123.26], [125.0, 129.05], [129.0, 131.19], [133.0, 153.84], [154.0, 157.01], [159.0, 161.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [89.01, 59.33, 81.71, 69.34, 98.36, 96.54, 0.0, 0.0, 0.0, 90.95, 0.0, 93.29, 96.66, 0.0, 0.0, 59.59, 87.0, 95.51, 51.28, 97.0, 76.86, 0.0, 0.0, 96.66, 95.91, 37.09, 32.02, 44.26, 45.95, 52.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 60.2], ["speech", 16.3], ["hum", 8.67]], [["speech", 42.85], ["sidetone", 34.72], ["telephone", 3.75]], [["hum", 44.3], ["mains hum", 43.48], ["speech", 2.15]], [["speech", 62.67], ["music", 7.75], ["hum", 4.96]], null], "duration": [2.16, 2.27, 6.15, 3.52, 2.1, 7.64, 1.03, 1.13, 1.33, 2.29, 0.92, 2.33, 5.18, 1.68, 0.75, 4.59, 3.29, 2.05, 2.31, 4.25, 2.93, 0.56, 0.04, 3.56, 5.26, 4.05, 2.19, 20.84, 3.01, 2.91]} \ No newline at end of file diff --git a/annotations_1/gfXns_cU8I8_filtered.json b/annotations_1/gfXns_cU8I8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..587c0100dfa0c15affcb1084bee7c3f697943ced --- /dev/null +++ b/annotations_1/gfXns_cU8I8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 17.44], [18.0, 17.64], [18.0, 37.13], [41.0, 53.27], [56.0, 56.13], [58.0, 59.9], [61.0, 65.72]], "keep_status": [true, false, false, true, false, false, false], "silence_prob": [29.01, 0.0, 29.26, 29.63, 0.0, 0.0, 30.16], "audiomae_on_audioset": [[["buzz", 22.66], ["music", 14.25], ["hum", 9.84]], null, [["mains hum", 46.87], ["hum", 24.66], ["noise", 4.11]], [["music", 34.66], ["hum", 13.97], ["buzz", 7.42]], null, null, [["fly, housefly", 36.81], ["insect", 31.54], ["mosquito", 6.61]]], "duration": [9.44, -0.36, 19.13, 12.27, 0.13, 1.9, 4.72]} \ No newline at end of file diff --git a/annotations_1/ghUFMbHmw8s_filtered.json b/annotations_1/ghUFMbHmw8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e342994547eae92c346f12d61650e7a5581a2239 --- /dev/null +++ b/annotations_1/ghUFMbHmw8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [2.0, 4.43], [7.0, 18.22], [42.0, 43.12], [51.0, 51.12], [52.0, 61.96], [62.0, 75.76], [76.0, 84.82], [85.0, 85.56], [91.0, 93.51], [95.0, 98.34], [104.0, 104.92], [122.0, 122.81], [125.0, 126.33], [143.0, 143.4], [144.0, 144.19], [169.0, 169.16], [174.0, 175.34], [194.0, 202.96], [204.0, 209.56], [210.0, 210.25], [213.0, 213.6], [217.0, 217.71], [219.0, 219.3], [221.0, 221.43], [228.0, 228.77]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 70.72, 30.79, 0.0, 0.0, 33.99, 32.84, 31.91, 0.0, 49.59, 49.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.59, 32.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 44.45], ["moo", 34.21], ["livestock, farm animals, working animals", 19.15]], null, null, [["music", 80.8], ["electronic music", 2.95], ["didgeridoo", 2.85]], [["whack, thwack", 21.98], ["music", 12.41], ["fly, housefly", 9.94]], [["speech", 18.81], ["groan", 8.57], ["moo", 7.38]], null, [["speech", 35.17], ["music", 34.86], ["boing", 8.62]], [["music", 64.57], ["synthesizer", 6.65], ["musical instrument", 5.76]], null, null, null, null, null, null, null, [["music", 29.15], ["noise", 15.72], ["hum", 12.44]], [["music", 24.39], ["crowd", 6.97], ["whale vocalization", 6.82]], null, null, null, null, null, null], "duration": [0.53, 2.43, 11.22, 1.12, 0.12, 9.96, 13.76, 8.82, 0.56, 2.51, 3.34, 0.92, 0.81, 1.33, 0.4, 0.19, 0.16, 1.34, 8.96, 5.56, 0.25, 0.6, 0.71, 0.3, 0.43, 0.77]} \ No newline at end of file diff --git a/annotations_1/ghZ6ntXQp3E_filtered.json b/annotations_1/ghZ6ntXQp3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87c6dd4e7dce1ccfe970e84947af0bfe8ae8fd0b --- /dev/null +++ b/annotations_1/ghZ6ntXQp3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.97], [22.0, 22.5], [28.0, 29.78], [31.0, 31.43], [45.0, 45.32], [46.0, 47.22], [49.0, 49.82], [52.0, 57.94], [72.0, 74.06], [79.0, 80.1], [81.0, 82.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.45, 84.07, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 58.34], ["electronic music", 7.77], ["synthesizer", 4.34]], null, null, null], "duration": [0.97, 0.5, 1.78, 0.43, 0.32, 1.22, 0.82, 5.94, 2.06, 1.1, 1.53]} \ No newline at end of file diff --git a/annotations_1/ghfqnmL0d_A_filtered.json b/annotations_1/ghfqnmL0d_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a0959f9818bd6cee3781a6f68188bf0918d1cfa --- /dev/null +++ b/annotations_1/ghfqnmL0d_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.77], [13.0, 15.03], [17.0, 17.83], [19.0, 19.77], [27.0, 28.65], [30.0, 35.26], [38.0, 62.21], [66.0, 66.85], [71.0, 70.8], [97.0, 97.83], [98.0, 97.87], [109.0, 116.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.82, 0.0, 0.0, 0.0, 34.06, 31.74, 0.0, 0.0, 0.0, 0.0, 35.7], "audiomae_on_audioset": [null, [["speech", 63.37], ["telephone", 7.94], ["radio", 6.21]], null, null, null, [["music", 59.61], ["boing", 12.8], ["didgeridoo", 3.35]], [["music", 88.53], ["musical instrument", 1.49], ["funny music", 1.4]], null, null, null, null, [["speech", 65.04], ["music", 17.89], ["radio", 9.26]]], "duration": [0.77, 2.03, 0.83, 0.77, 1.65, 5.26, 24.21, 0.85, -0.2, 0.83, -0.13, 7.48]} \ No newline at end of file diff --git a/annotations_1/gi9EwdK-6L4_filtered.json b/annotations_1/gi9EwdK-6L4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1fe647d3c175c2ec899f0d9f037845f47e69f30 --- /dev/null +++ b/annotations_1/gi9EwdK-6L4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.83], [15.0, 16.14], [19.0, 21.46], [22.0, 29.24], [36.0, 36.41], [38.0, 38.01], [39.0, 41.32], [42.0, 45.22], [50.0, 50.65], [54.0, 53.74], [57.0, 58.11], [63.0, 64.05], [80.0, 88.6], [94.0, 96.65], [98.0, 97.58], [98.0, 97.88], [98.0, 99.5], [107.0, 107.4], [112.0, 113.56], [114.0, 115.26], [117.0, 119.57], [121.0, 137.66], [140.0, 142.11], [143.0, 145.15]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 94.52, 36.34, 0.0, 0.0, 40.81, 38.6, 0.0, 0.0, 0.0, 0.0, 31.09, 41.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 33.04, 39.8, 30.73], "audiomae_on_audioset": [null, null, null, [["singing bowl", 29.06], ["music", 20.98], ["speech", 15.11]], null, null, [["speech", 32.79], ["music", 22.12], ["sidetone", 14.9]], [["didgeridoo", 49.06], ["music", 29.19], ["livestock, farm animals, working animals", 2.48]], null, null, null, null, [["hum", 24.61], ["mains hum", 23.62], ["music", 16.91]], [["music", 61.82], ["didgeridoo", 13.86], ["speech", 2.97]], null, null, null, null, null, null, null, [["hum", 22.06], ["gong", 22.03], ["music", 15.69]], [["music", 51.07], ["electronic music", 5.94], ["gong", 4.49]], [["speech", 44.32], ["boom", 11.91], ["gunshot, gunfire", 5.02]]], "duration": [1.83, 1.14, 2.46, 7.24, 0.41, 0.01, 2.32, 3.22, 0.65, -0.26, 1.11, 1.05, 8.6, 2.65, -0.42, -0.12, 1.5, 0.4, 1.56, 1.26, 2.57, 16.66, 2.11, 2.15]} \ No newline at end of file diff --git a/annotations_1/giajSDY8kCs_filtered.json b/annotations_1/giajSDY8kCs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df14689e1a3248e379dfc1dcbb7f96ba6cc715d3 --- /dev/null +++ b/annotations_1/giajSDY8kCs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [4.0, 4.41], [6.0, 6.61], [10.0, 10.25], [11.0, 12.7], [14.0, 15.82], [16.0, 23.35], [25.0, 26.55], [27.0, 29.51], [32.0, 32.02], [35.0, 36.41], [41.0, 41.5], [61.0, 62.72], [63.0, 65.47], [68.0, 71.29], [74.0, 74.82], [76.0, 76.45], [77.0, 77.95], [79.0, 80.92], [82.0, 84.5], [92.0, 96.87], [103.0, 106.24], [107.0, 108.95], [111.0, 111.99], [116.0, 126.22], [130.0, 130.96], [139.0, 140.27], [142.0, 142.65], [151.0, 152.69], [153.0, 154.47], [156.0, 159.12], [164.0, 163.88], [169.0, 170.36], [172.0, 172.23], [173.0, 173.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 54.3, 0.0, 0.0, 0.0, 0.0, 99.98, 94.07, 0.0, 0.0, 0.0, 0.0, 61.67, 68.93, 98.8, 0.0, 0.0, 94.95, 0.0, 0.0, 0.0, 0.0, 0.0, 61.97, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 0.41, 0.61, 0.25, 1.7, 1.82, 7.35, 1.55, 2.51, 0.02, 1.41, 0.5, 1.72, 2.47, 3.29, 0.82, 0.45, 0.95, 1.92, 2.5, 4.87, 3.24, 1.95, 0.99, 10.22, 0.96, 1.27, 0.65, 1.69, 1.47, 3.12, -0.12, 1.36, 0.23, 0.03]} \ No newline at end of file diff --git a/annotations_1/gj_BH6Suku0_filtered.json b/annotations_1/gj_BH6Suku0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50f5679b009fa7055fe66886cf2286ad05dbf5ed --- /dev/null +++ b/annotations_1/gj_BH6Suku0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.28], [9.0, 10.81], [12.0, 12.97], [16.0, 15.8], [38.0, 39.21], [41.0, 42.31], [46.0, 47.83], [52.0, 52.05], [59.0, 60.22], [67.0, 67.36], [88.0, 88.43], [92.0, 92.15], [99.0, 99.79], [103.0, 103.0], [105.0, 105.29], [108.0, 107.86], [127.0, 128.63], [131.0, 131.72], [140.0, 140.93], [146.0, 148.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.28, 1.81, 0.97, -0.2, 1.21, 1.31, 1.83, 0.05, 1.22, 0.36, 0.43, 0.15, 0.79, 0.0, 0.29, -0.14, 1.63, 0.72, 0.93, 2.34]} \ No newline at end of file diff --git a/annotations_1/gjjJePytKig_filtered.json b/annotations_1/gjjJePytKig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59ed6393b2e3da19a1b8e3a2636f3680bbd9bdad --- /dev/null +++ b/annotations_1/gjjJePytKig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[89.0, 91.96], [93.0, 95.74], [96.0, 99.23], [100.0, 100.35], [101.0, 113.68], [114.0, 114.51], [115.0, 115.57], [116.0, 117.59], [120.0, 123.57], [124.0, 125.79], [129.0, 129.37], [131.0, 132.24], [135.0, 139.92], [141.0, 141.56], [142.0, 169.03], [170.0, 170.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.44, 95.37, 85.72, 0.0, 99.52, 0.0, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 61.27, 0.0, 40.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.3], ["noise", 24.78], ["theremin", 20.77]], null], "duration": [2.96, 2.74, 3.23, 0.35, 12.68, 0.51, 0.57, 1.59, 3.57, 1.79, 0.37, 1.24, 4.92, 0.56, 27.03, 0.55]} \ No newline at end of file diff --git a/annotations_1/gjmt7I1OJfw_filtered.json b/annotations_1/gjmt7I1OJfw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d44217f613e3c80f021fa0135c2584d507fc0851 --- /dev/null +++ b/annotations_1/gjmt7I1OJfw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.03], [11.0, 13.15], [14.0, 14.94], [17.0, 18.08], [19.0, 19.99], [22.0, 22.47], [26.0, 26.65], [29.0, 29.15], [61.0, 61.37], [65.0, 65.55], [101.0, 106.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 49.82], ["cattle, bovinae", 27.43], ["moo", 17.53]], null, null, null, null, null, null, null, null, null], "duration": [0.03, 2.15, 0.94, 1.08, 0.99, 0.47, 0.65, 0.15, 0.37, 0.55, 5.32]} \ No newline at end of file diff --git a/annotations_1/gjuizikJ2bk_filtered.json b/annotations_1/gjuizikJ2bk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2ca4dd43c60773beb2355abb3f63e9f77f57c43 --- /dev/null +++ b/annotations_1/gjuizikJ2bk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.96], [15.0, 21.91], [23.0, 24.04], [27.0, 28.24], [30.0, 31.08], [33.0, 40.83], [47.0, 48.56], [50.0, 52.08], [54.0, 55.58], [58.0, 60.2], [66.0, 69.01], [72.0, 73.47], [76.0, 79.57], [82.0, 83.2], [84.0, 85.53], [87.0, 91.37], [93.0, 93.41], [95.0, 122.89], [125.0, 125.95], [127.0, 134.49], [136.0, 138.89], [141.0, 177.74]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [45.14, 54.17, 0.0, 0.0, 0.0, 70.44, 0.0, 61.57, 0.0, 65.2, 66.03, 0.0, 78.55, 0.0, 0.0, 44.78, 0.0, 55.39, 0.0, 51.99, 78.04, 0.0], "audiomae_on_audioset": [[["sine wave", 36.9], ["chirp tone", 18.55], ["hum", 6.03]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.04], ["mains hum", 27.98], ["music", 9.87]], null, null, null, null, null, null], "duration": [6.96, 6.91, 1.04, 1.24, 1.08, 7.83, 1.56, 2.08, 1.58, 2.2, 3.01, 1.47, 3.57, 1.2, 1.53, 4.37, 0.41, 27.89, 0.95, 7.49, 2.89, 36.74]} \ No newline at end of file diff --git a/annotations_1/gm-sqEK2InM_filtered.json b/annotations_1/gm-sqEK2InM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..698cd64d78a2456e701d9941b08ee0ef8bb8e862 --- /dev/null +++ b/annotations_1/gm-sqEK2InM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.43], [14.0, 15.77], [17.0, 17.32], [19.0, 19.21], [19.0, 30.64], [32.0, 33.44], [34.0, 62.97], [65.0, 66.48], [72.0, 73.63], [74.0, 74.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 93.29, 0.0, 96.17, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.43, 1.77, 0.32, 0.21, 11.64, 1.44, 28.97, 1.48, 1.63, 0.24]} \ No newline at end of file diff --git a/annotations_1/gm0I_zdgs8o_filtered.json b/annotations_1/gm0I_zdgs8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d918513d26d880186f831d9c855ea7b61b9db030 --- /dev/null +++ b/annotations_1/gm0I_zdgs8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.07], [10.0, 9.75], [10.0, 42.11], [44.0, 56.66], [58.0, 61.65], [65.0, 64.71], [67.0, 96.31], [103.0, 106.54], [111.0, 113.97], [116.0, 145.89]], "keep_status": [true, false, false, false, false, false, true, false, false, false], "silence_prob": [47.2, 0.0, 0.0, 87.92, 99.82, 0.0, 31.48, 46.26, 64.97, 52.98], "audiomae_on_audioset": [[["speech", 28.37], ["music", 15.36], ["buzz", 5.68]], null, null, null, null, null, [["music", 47.49], ["whale vocalization", 9.78], ["hum", 8.78]], [["mosquito", 58.02], ["fly, housefly", 14.72], ["throbbing", 4.8]], null, null], "duration": [6.07, -0.25, 32.11, 12.66, 3.65, -0.29, 29.31, 3.54, 2.97, 29.89]} \ No newline at end of file diff --git a/annotations_1/gmElew2NIS8_filtered.json b/annotations_1/gmElew2NIS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f34e075987c2f1494f34da60718ad9371da07ea3 --- /dev/null +++ b/annotations_1/gmElew2NIS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.9], [7.0, 7.82], [14.0, 14.98], [16.0, 16.75], [18.0, 18.96], [20.0, 20.63], [27.0, 27.19], [30.0, 29.88], [47.0, 51.66], [52.0, 53.54], [56.0, 56.79], [58.0, 58.01], [58.0, 58.72], [60.0, 59.71], [60.0, 59.81], [60.0, 59.85], [60.0, 60.66], [63.0, 72.93], [73.0, 74.07], [75.0, 75.39], [77.0, 77.79], [79.0, 84.55], [90.0, 103.89], [105.0, 107.52], [110.0, 121.47], [125.0, 141.22]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.24, 0.0, 0.0, 0.0, 42.65, 36.8, 43.33, 34.31, 31.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["baby cry, infant cry", 17.26], ["moo", 14.65], ["cattle, bovinae", 14.35]], null, null, null, null, null, null, null, null, null, null, null, null, [["dog", 13.53], ["fart", 11.0], ["animal", 7.82]], [["speech", 29.72], ["fart", 5.87], ["explosion", 5.33]], [["fly, housefly", 15.48], ["insect", 12.95], ["speech", 11.24]], [["speech", 40.13], ["wail, moan", 8.15], ["groan", 3.52]], [["livestock, farm animals, working animals", 32.47], ["cattle, bovinae", 31.07], ["moo", 17.17]]], "duration": [1.9, 0.82, 0.98, 0.75, 0.96, 0.63, 0.19, -0.12, 4.66, 1.54, 0.79, 0.01, 0.72, -0.29, -0.19, -0.15, 0.66, 9.93, 1.07, 0.39, 0.79, 5.55, 13.89, 2.52, 11.47, 16.22]} \ No newline at end of file diff --git a/annotations_1/gmJtNjLjsNQ_filtered.json b/annotations_1/gmJtNjLjsNQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f26d9e514315f2f0516997787757a034e276aca8 --- /dev/null +++ b/annotations_1/gmJtNjLjsNQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 71.91], [73.0, 76.28], [77.0, 80.23], [81.0, 83.05], [83.0, 84.55], [86.0, 86.71], [88.0, 91.12], [92.0, 99.99], [100.0, 107.03], [107.0, 124.78], [127.0, 127.18], [128.0, 134.28], [135.0, 141.22], [142.0, 157.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.81, 95.23, 92.15, 95.23, 0.0, 0.0, 97.43, 97.0, 80.46, 72.6, 0.0, 73.51, 78.21, 70.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.91, 3.28, 3.23, 2.05, 1.55, 0.71, 3.12, 7.99, 7.03, 17.78, 0.18, 6.28, 6.22, 15.76]} \ No newline at end of file diff --git a/annotations_1/gmSeaKdO9IQ_filtered.json b/annotations_1/gmSeaKdO9IQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ed58bd7e2a62e5c04e2b29dcb0e51c01f41260d --- /dev/null +++ b/annotations_1/gmSeaKdO9IQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 24.98], [27.0, 28.07], [29.0, 30.4], [35.0, 34.77], [36.0, 36.44], [41.0, 41.32], [43.0, 46.68], [48.0, 49.98], [51.0, 52.81], [54.0, 62.8], [64.0, 75.14], [77.0, 82.68], [84.0, 108.94], [110.0, 111.03], [114.0, 116.24], [117.0, 117.64]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, true, false], "silence_prob": [47.5, 0.0, 0.0, 0.0, 0.0, 0.0, 60.23, 0.0, 0.0, 33.62, 73.36, 54.63, 38.2, 0.0, 44.32, 0.0], "audiomae_on_audioset": [[["speech", 73.61], ["sidetone", 5.37], ["speech synthesizer", 3.8]], null, null, null, null, null, null, null, null, [["music", 44.91], ["gong", 5.54], ["fly, housefly", 5.13]], null, null, [["music", 14.99], ["effects unit", 14.09], ["singing bowl", 13.14]], null, [["music", 35.16], ["noise", 7.58], ["hum", 6.17]], null], "duration": [4.98, 1.07, 1.4, -0.23, 0.44, 0.32, 3.68, 1.98, 1.81, 8.8, 11.14, 5.68, 24.94, 1.03, 2.24, 0.64]} \ No newline at end of file diff --git a/annotations_1/gmnU4tK8GOo_filtered.json b/annotations_1/gmnU4tK8GOo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b863e4493786c06d708a5d926d0f8335ec9384c --- /dev/null +++ b/annotations_1/gmnU4tK8GOo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 38.28], [39.0, 66.21], [74.0, 75.84], [76.0, 119.82], [120.0, 121.17], [124.0, 128.12], [139.0, 141.32], [142.0, 144.58], [146.0, 146.62], [147.0, 147.82]], "keep_status": [true, true, false, false, false, true, false, false, false, false], "silence_prob": [39.74, 32.14, 0.0, 0.0, 0.0, 31.46, 62.07, 59.77, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 32.5], ["throbbing", 13.37], ["hum", 8.0]], [["breaking", 30.82], ["glass", 19.01], ["music", 13.27]], null, null, null, [["whack, thwack", 21.19], ["thunk", 15.31], ["speech", 9.09]], null, null, null, null], "duration": [2.28, 27.21, 1.84, 43.82, 1.17, 4.12, 2.32, 2.58, 0.62, 0.82]} \ No newline at end of file diff --git a/annotations_1/gnWkYf8Peo8_filtered.json b/annotations_1/gnWkYf8Peo8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cea6ef870f3bd58e0058055fd2be921c66e4673a --- /dev/null +++ b/annotations_1/gnWkYf8Peo8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.64], [17.0, 17.17], [17.0, 17.98], [21.0, 32.12], [33.0, 38.42], [39.0, 40.24], [42.0, 42.47], [43.0, 45.28], [46.0, 47.9], [49.0, 49.32], [50.0, 51.56], [53.0, 68.64], [72.0, 113.12], [113.0, 117.0], [120.0, 158.03]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 35.56, 81.89, 0.0, 0.0, 82.43, 0.0, 0.0, 0.0, 40.38, 0.0, 30.39, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 42.21], ["hum", 9.96], ["breaking", 9.36]], null, null, null, null, null, null, null, [["music", 18.13], ["fart", 8.88], ["ambient music", 8.73]], null, [["whale vocalization", 15.09], ["music", 14.18], ["buzz", 9.16]], null], "duration": [1.64, 0.17, 0.98, 11.12, 5.42, 1.24, 0.47, 2.28, 1.9, 0.32, 1.56, 15.64, 41.12, 4.0, 38.03]} \ No newline at end of file diff --git a/annotations_1/gnallHWgupY_filtered.json b/annotations_1/gnallHWgupY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4abc0a73a098e3b2c6d08e8ffe99e5bea44e1c4 --- /dev/null +++ b/annotations_1/gnallHWgupY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.17], [4.0, 4.72], [6.0, 6.64], [8.0, 15.97], [17.0, 18.77], [22.0, 21.86], [26.0, 26.84], [28.0, 30.0], [30.0, 30.99], [33.0, 33.54], [43.0, 43.93], [47.0, 48.59], [52.0, 53.15], [57.0, 57.86], [63.0, 65.08], [69.0, 75.63], [80.0, 81.38], [83.0, 84.13], [86.0, 85.99], [88.0, 89.38], [93.0, 93.48], [95.0, 97.83], [99.0, 99.06], [103.0, 116.94], [119.0, 120.45], [121.0, 130.62], [131.0, 175.71], [179.0, 179.96], [181.0, 181.72], [184.0, 184.28], [186.0, 186.49], [188.0, 193.5], [195.0, 195.83], [198.0, 199.13], [202.0, 202.53], [204.0, 208.14], [208.0, 212.95], [213.0, 214.68], [216.0, 217.17]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.14, 0.0, 0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.12, 33.06, 0.0, 0.0, 0.0, 0.0, 0.0, 31.03, 0.0, 30.81, 0.0, 30.63, 0.0, 0.0, 0.0, 0.0, 0.0, 53.1, 0.0, 0.0, 0.0, 37.15, 34.02, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 24.61], ["synthesizer", 14.57], ["whale vocalization", 5.99]], null, null, null, null, null, null, null, null, null, null, [["speech", 32.9], ["music", 14.16], ["vehicle", 7.28]], [["cattle, bovinae", 30.3], ["moo", 27.05], ["livestock, farm animals, working animals", 14.49]], null, null, null, null, null, [["music", 28.74], ["vehicle", 10.32], ["speech", 4.47]], null, [["music", 40.12], ["whale vocalization", 3.76], ["buzz", 3.15]], null, [["music", 51.47], ["speech", 6.16], ["whack, thwack", 4.68]], null, null, null, null, null, null, null, null, null, [["hum", 32.16], ["glass", 21.03], ["mains hum", 11.64]], [["music", 38.37], ["speech", 32.85], ["electronic music", 1.44]], null, null], "duration": [1.17, 0.72, 0.64, 7.97, 1.77, -0.14, 0.84, 2.0, 0.99, 0.54, 0.93, 1.59, 1.15, 0.86, 2.08, 6.63, 1.38, 1.13, -0.01, 1.38, 0.48, 2.83, 0.06, 13.94, 1.45, 9.62, 44.71, 0.96, 0.72, 0.28, 0.49, 5.5, 0.83, 1.13, 0.53, 4.14, 4.95, 1.68, 1.17]} \ No newline at end of file diff --git a/annotations_1/gnbjy2tWfd4_filtered.json b/annotations_1/gnbjy2tWfd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94d42bf6cbcc9aa45b54957d18d18a93497a9e79 --- /dev/null +++ b/annotations_1/gnbjy2tWfd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.77], [50.0, 51.34], [86.0, 87.76]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [0.77, 1.34, 1.76]} \ No newline at end of file diff --git a/annotations_1/gnfp7yyQgH8_filtered.json b/annotations_1/gnfp7yyQgH8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dad5d13aaf9af920594ec3e3fe786bb42339da37 --- /dev/null +++ b/annotations_1/gnfp7yyQgH8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 30.91], [31.0, 34.72], [36.0, 38.18], [49.0, 60.08], [61.0, 64.22], [66.0, 66.65], [82.0, 82.41], [85.0, 90.31], [93.0, 101.12], [104.0, 120.36], [131.0, 131.35]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [47.39, 45.3, 49.09, 48.74, 34.3, 0.0, 0.0, 42.39, 33.77, 31.0, 0.0], "audiomae_on_audioset": [[["music", 86.54], ["speech", 1.75], ["electronic music", 1.07]], [["music", 71.41], ["hum", 7.14], ["musical instrument", 3.91]], [["music", 37.52], ["gong", 21.0], ["singing bowl", 9.54]], [["throbbing", 48.04], ["hum", 32.25], ["music", 6.26]], [["music", 27.37], ["synthesizer", 24.01], ["sonar", 12.25]], null, null, [["hum", 46.68], ["sidetone", 19.51], ["speech", 11.61]], [["music", 52.55], ["speech", 24.09], ["hum", 4.07]], [["hum", 52.52], ["mains hum", 23.73], ["throbbing", 6.89]], null], "duration": [12.91, 3.72, 2.18, 11.08, 3.22, 0.65, 0.41, 5.31, 8.12, 16.36, 0.35]} \ No newline at end of file diff --git a/annotations_1/gnlvKhPzx5A_filtered.json b/annotations_1/gnlvKhPzx5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/gnlvKhPzx5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/go4K4rCFjMQ_filtered.json b/annotations_1/go4K4rCFjMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97ca9fba01d9cc826a0764b19077352e1d5582a2 --- /dev/null +++ b/annotations_1/go4K4rCFjMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 31.68], [35.0, 35.94], [37.0, 40.0], [50.0, 50.55], [53.0, 55.11], [60.0, 60.37], [64.0, 64.61], [69.0, 72.59], [76.0, 75.93], [80.0, 80.33], [82.0, 82.24], [84.0, 84.18], [95.0, 96.01], [97.0, 96.97], [98.0, 98.02], [101.0, 103.84], [112.0, 112.31], [113.0, 113.63], [115.0, 115.48], [117.0, 117.07], [119.0, 119.23], [119.0, 120.18], [120.0, 124.85], [126.0, 133.02], [134.0, 134.97], [137.0, 151.17], [174.0, 174.33], [190.0, 190.48], [197.0, 199.18], [203.0, 202.8], [207.0, 210.19], [214.0, 214.29], [223.0, 225.17], [226.0, 226.47]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 41.66, 0.0, 36.37, 0.0, 0.0, 33.32, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.11, 33.48, 0.0, 31.67, 0.0, 0.0, 31.79, 0.0, 32.83, 0.0, 35.15, 0.0], "audiomae_on_audioset": [null, null, [["music", 46.23], ["didgeridoo", 18.28], ["musical instrument", 5.53]], null, [["music", 62.25], ["musical instrument", 10.52], ["theremin", 9.78]], null, null, [["music", 26.65], ["didgeridoo", 23.55], ["effects unit", 6.22]], null, null, null, null, null, null, null, [["music", 48.0], ["musical instrument", 6.55], ["synthesizer", 6.11]], null, null, null, null, null, null, [["music", 32.19], ["hum", 13.52], ["synthesizer", 9.17]], [["theremin", 33.86], ["music", 31.86], ["quack", 5.29]], null, [["music", 72.38], ["musical instrument", 3.71], ["quack", 3.16]], null, null, [["music", 50.91], ["didgeridoo", 28.59], ["theremin", 5.06]], null, [["music", 35.42], ["gong", 20.91], ["musical instrument", 6.18]], null, [["theremin", 60.77], ["music", 20.91], ["ambient music", 5.21]], null], "duration": [-0.32, 0.94, 3.0, 0.55, 2.11, 0.37, 0.61, 3.59, -0.07, 0.33, 0.24, 0.18, 1.01, -0.03, 0.02, 2.84, 0.31, 0.63, 0.48, 0.07, 0.23, 1.18, 4.85, 7.02, 0.97, 14.17, 0.33, 0.48, 2.18, -0.2, 3.19, 0.29, 2.17, 0.47]} \ No newline at end of file diff --git a/annotations_1/goEiURelfsM_filtered.json b/annotations_1/goEiURelfsM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e953a4e0c11d6eeb9401c1a2abe91ce6d3568c1 --- /dev/null +++ b/annotations_1/goEiURelfsM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.86], [8.0, 8.29], [11.0, 11.8], [13.0, 13.63], [15.0, 16.46], [18.0, 19.25], [21.0, 22.11], [28.0, 33.57], [35.0, 35.95], [38.0, 40.51], [41.0, 41.89], [42.0, 41.99], [42.0, 42.4], [47.0, 48.09], [53.0, 53.86], [58.0, 58.82], [63.0, 65.57], [67.0, 67.56], [70.0, 71.64], [77.0, 77.65], [78.0, 78.83], [82.0, 82.36], [85.0, 85.33], [86.0, 86.32], [87.0, 90.19], [97.0, 99.18], [99.0, 102.73], [105.0, 106.76], [109.0, 111.82], [115.0, 115.21], [117.0, 123.58], [125.0, 128.21], [130.0, 130.87], [134.0, 134.81], [137.0, 137.44], [142.0, 142.74], [149.0, 150.03], [153.0, 153.77]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.14, 0.0, 32.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.38, 32.91, 31.32, 0.0, 30.83, 0.0, 31.04, 32.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 46.55], ["bleat", 6.54], ["speech", 6.34]], null, [["livestock, farm animals, working animals", 36.74], ["cattle, bovinae", 12.95], ["moo", 11.72]], null, null, null, null, null, null, [["moo", 24.12], ["cattle, bovinae", 21.08], ["music", 13.76]], null, null, null, null, null, null, null, [["speech", 39.17], ["music", 15.01], ["mosquito", 5.72]], [["music", 28.34], ["didgeridoo", 10.59], ["speech", 4.39]], [["speech", 44.65], ["music", 29.61], ["boing", 6.83]], null, [["music", 64.35], ["singing", 7.36], ["saxophone", 3.7]], null, [["music", 54.5], ["singing", 7.62], ["bleat", 6.85]], [["moo", 36.45], ["livestock, farm animals, working animals", 34.73], ["cattle, bovinae", 20.46]], null, null, null, null, null, null], "duration": [1.86, 0.29, 0.8, 0.63, 1.46, 1.25, 1.11, 5.57, 0.95, 2.51, 0.89, -0.01, 0.4, 1.09, 0.86, 0.82, 2.57, 0.56, 1.64, 0.65, 0.83, 0.36, 0.33, 0.32, 3.19, 2.18, 3.73, 1.76, 2.82, 0.21, 6.58, 3.21, 0.87, 0.81, 0.44, 0.74, 1.03, 0.77]} \ No newline at end of file diff --git a/annotations_1/gp6FX1H99NA_filtered.json b/annotations_1/gp6FX1H99NA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/gp6FX1H99NA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/gp7K6ZwuDow_filtered.json b/annotations_1/gp7K6ZwuDow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfb6cf83cc5c38270acb42af53f0b3618754b693 --- /dev/null +++ b/annotations_1/gp7K6ZwuDow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.24], [11.0, 12.95], [13.0, 14.88], [16.0, 22.77], [24.0, 24.76], [26.0, 28.88], [31.0, 31.8], [33.0, 33.45], [37.0, 39.93], [43.0, 43.04], [44.0, 44.24], [57.0, 57.54], [59.0, 59.1], [77.0, 78.11], [79.0, 79.76]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.1, 0.0, 46.75, 0.0, 0.0, 59.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 29.7], ["music", 14.43], ["rumble", 9.84]], null, [["speech", 69.94], ["thunk", 5.83], ["hum", 5.64]], null, null, null, null, null, null, null, null, null], "duration": [0.24, 1.95, 1.88, 6.77, 0.76, 2.88, 0.8, 0.45, 2.93, 0.04, 0.24, 0.54, 0.1, 1.11, 0.76]} \ No newline at end of file diff --git a/annotations_1/gp8OWUqg4r4_filtered.json b/annotations_1/gp8OWUqg4r4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93046af204c39fe878b44ca73bacab34ad2f0d5c --- /dev/null +++ b/annotations_1/gp8OWUqg4r4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.41], [14.0, 14.45], [17.0, 17.32], [22.0, 21.64], [30.0, 31.67], [35.0, 39.82], [42.0, 42.08], [47.0, 51.92], [54.0, 58.94], [63.0, 69.55], [85.0, 85.97], [88.0, 88.03], [92.0, 94.49], [98.0, 99.08], [106.0, 106.84], [109.0, 110.12], [116.0, 115.89], [118.0, 118.56], [119.0, 120.36], [121.0, 121.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 98.73, 91.13, 94.52, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, 0.45, 0.32, -0.36, 1.67, 4.82, 0.08, 4.92, 4.94, 6.55, 0.97, 0.03, 2.49, 1.08, 0.84, 1.12, -0.11, 0.56, 1.36, 0.88]} \ No newline at end of file diff --git a/annotations_1/gpjYU0C2yrY_filtered.json b/annotations_1/gpjYU0C2yrY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..164f7da682b854881d3db8e5c64197b561e3a536 --- /dev/null +++ b/annotations_1/gpjYU0C2yrY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 62.14], [64.0, 93.11], [94.0, 93.93], [94.0, 103.59], [105.0, 139.63], [142.0, 162.24]], "keep_status": [false, false, false, false, false, false], "silence_prob": [29.33, 29.14, 0.0, 33.56, 0.0, 70.02], "audiomae_on_audioset": [[["hum", 40.38], ["throbbing", 25.5], ["music", 14.62]], [["music", 44.15], ["hum", 20.26], ["throbbing", 7.66]], null, [["music", 71.12], ["electronic music", 6.65], ["hum", 4.53]], null, null], "duration": [26.14, 29.11, -0.07, 9.59, 34.63, 20.24]} \ No newline at end of file diff --git a/annotations_1/gq1gSTF2oyA_filtered.json b/annotations_1/gq1gSTF2oyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c6e4c01b3b6317a70a044135625266ac90a1204 --- /dev/null +++ b/annotations_1/gq1gSTF2oyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 28.17], [29.0, 31.55], [33.0, 39.02], [44.0, 46.75], [51.0, 53.28], [56.0, 57.5], [64.0, 66.66], [68.0, 68.62], [71.0, 72.54], [73.0, 79.78], [84.0, 85.45], [87.0, 97.29], [101.0, 102.3], [104.0, 104.55], [106.0, 107.4], [112.0, 113.64], [120.0, 119.97], [121.0, 122.54], [124.0, 124.39], [125.0, 127.52], [130.0, 131.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [81.17, 54.7, 67.51, 60.05, 94.52, 0.0, 55.67, 0.0, 0.0, 62.37, 0.0, 74.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.17, 2.55, 6.02, 2.75, 2.28, 1.5, 2.66, 0.62, 1.54, 6.78, 1.45, 10.29, 1.3, 0.55, 1.4, 1.64, -0.03, 1.54, 0.39, 2.52, 1.7]} \ No newline at end of file diff --git a/annotations_1/gq5WIcSz2ko_filtered.json b/annotations_1/gq5WIcSz2ko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/gq5WIcSz2ko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/gq6JKq3Q_uw_filtered.json b/annotations_1/gq6JKq3Q_uw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..638549fc6050d6d74869d1f6fba37df4ea856157 --- /dev/null +++ b/annotations_1/gq6JKq3Q_uw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 25.25], [45.0, 46.6], [62.0, 62.29], [67.0, 68.2], [85.0, 84.92], [88.0, 88.92]], "keep_status": [false, false, false, false, false, false], "silence_prob": [40.21, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 40.85], ["synthesizer", 33.32], ["keyboard (musical)", 5.13]], null, null, null, null, null], "duration": [11.25, 1.6, 0.29, 1.2, -0.08, 0.92]} \ No newline at end of file diff --git a/annotations_1/gqe-oAUoEto_filtered.json b/annotations_1/gqe-oAUoEto_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62acf0e2aa79ee0b12218197d1c2cb132670d51f --- /dev/null +++ b/annotations_1/gqe-oAUoEto_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.22], [15.0, 15.48], [17.0, 26.6], [27.0, 28.68], [29.0, 52.56], [55.0, 55.29], [63.0, 73.95], [77.0, 85.83], [98.0, 99.12], [101.0, 105.71], [113.0, 114.17], [114.0, 115.42], [119.0, 119.58], [122.0, 122.34], [138.0, 145.54], [148.0, 149.34], [154.0, 155.63], [157.0, 159.58], [160.0, 160.19], [161.0, 164.64]], "keep_status": [false, false, true, false, true, false, false, true, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 28.78, 0.0, 29.16, 0.0, 28.78, 31.44, 0.0, 37.49, 0.0, 0.0, 0.0, 0.0, 31.41, 0.0, 0.0, 49.64, 0.0, 73.21], "audiomae_on_audioset": [null, null, [["speech", 46.43], ["whale vocalization", 13.11], ["rumble", 5.84]], null, [["speech", 50.02], ["frog", 9.59], ["whale vocalization", 4.52]], null, [["speech", 65.85], ["music", 13.16], ["whale vocalization", 10.93]], [["music", 23.74], ["speech", 18.17], ["livestock, farm animals, working animals", 11.92]], null, [["speech", 28.32], ["animal", 8.48], ["sidetone", 7.15]], null, null, null, null, [["cattle, bovinae", 26.82], ["livestock, farm animals, working animals", 23.64], ["speech", 19.99]], null, null, [["cattle, bovinae", 26.52], ["speech", 17.38], ["moo", 13.28]], null, null], "duration": [1.22, 0.48, 9.6, 1.68, 23.56, 0.29, 10.95, 8.83, 1.12, 4.71, 1.17, 1.42, 0.58, 0.34, 7.54, 1.34, 1.63, 2.58, 0.19, 3.64]} \ No newline at end of file diff --git a/annotations_1/grdxSWSHJaY_filtered.json b/annotations_1/grdxSWSHJaY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8442dfd72ff44acab5f8305a963ca72a6ccf4fc8 --- /dev/null +++ b/annotations_1/grdxSWSHJaY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.9], [23.0, 51.51], [52.0, 54.9], [58.0, 60.44], [61.0, 62.6], [69.0, 68.81], [69.0, 68.98], [69.0, 69.36], [70.0, 70.09], [72.0, 72.59], [73.0, 72.96], [77.0, 77.21], [80.0, 80.0], [87.0, 89.77], [90.0, 91.56], [94.0, 96.23], [96.0, 103.03], [104.0, 104.5], [105.0, 106.19], [107.0, 109.56], [110.0, 110.2], [111.0, 114.59], [115.0, 116.83], [120.0, 120.83], [121.0, 124.5], [130.0, 130.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 97.54, 99.99, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.38, 0.0, 32.96, 32.28, 0.0, 0.0, 79.41, 0.0, 99.97, 0.0, 0.0, 43.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["canidae, dogs, wolves", 17.38], ["animal", 16.82], ["music", 10.77]], null, [["vehicle", 27.54], ["speech", 18.55], ["car", 11.35]], [["music", 25.18], ["effects unit", 6.2], ["echo", 6.05]], null, null, null, null, null, null, null, [["speech", 50.89], ["inside, small room", 7.16], ["whimper", 5.8]], null], "duration": [0.9, 28.51, 2.9, 2.44, 1.6, -0.19, -0.02, 0.36, 0.09, 0.59, -0.04, 0.21, 0.0, 2.77, 1.56, 2.23, 7.03, 0.5, 1.19, 2.56, 0.2, 3.59, 1.83, 0.83, 3.5, 0.59]} \ No newline at end of file diff --git a/annotations_1/grpGRWYL6mQ_filtered.json b/annotations_1/grpGRWYL6mQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34d0e0d3e44c8af229ee840d5408c721d6f104b4 --- /dev/null +++ b/annotations_1/grpGRWYL6mQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 41.71], [42.0, 43.7], [45.0, 60.17], [62.0, 63.1], [63.0, 64.84], [66.0, 66.36], [71.0, 71.52], [72.0, 72.87], [76.0, 78.02], [79.0, 80.06], [81.0, 81.24], [82.0, 86.16], [88.0, 88.75], [92.0, 92.67], [94.0, 94.71], [99.0, 98.88], [105.0, 105.41], [106.0, 108.5], [112.0, 120.7], [124.0, 125.12], [126.0, 126.59], [132.0, 131.77], [137.0, 137.84], [139.0, 139.04], [143.0, 150.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.56, 0.0, 0.0, 0.0, 0.0, 0.0, 88.64, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 0.0, 61.37, 42.39, 0.0, 0.0, 0.0, 0.0, 0.0, 36.11], "audiomae_on_audioset": [null, null, [["music", 68.93], ["speech", 19.75], ["sound effect", 1.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.69], ["didgeridoo", 19.81], ["musical instrument", 1.88]], null, null, null, null, null, [["theremin", 50.26], ["speech", 19.64], ["music", 13.94]]], "duration": [38.71, 1.7, 15.17, 1.1, 1.84, 0.36, 0.52, 0.87, 2.02, 1.06, 0.24, 4.16, 0.75, 0.67, 0.71, -0.12, 0.41, 2.5, 8.7, 1.12, 0.59, -0.23, 0.84, 0.04, 7.82]} \ No newline at end of file diff --git a/annotations_1/grwlYBNyMk4_filtered.json b/annotations_1/grwlYBNyMk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0114a5f1a3a7d1d0cce2f1a92f93f995a23a7ebc --- /dev/null +++ b/annotations_1/grwlYBNyMk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.1], [19.0, 19.95], [23.0, 27.65], [31.0, 31.01], [38.0, 40.42], [44.0, 44.69], [51.0, 51.12], [53.0, 55.9], [59.0, 59.48], [60.0, 60.34], [61.0, 62.88], [65.0, 66.85], [72.0, 76.33], [80.0, 81.65], [83.0, 85.9], [90.0, 89.94], [90.0, 94.29], [95.0, 96.06], [97.0, 97.56], [125.0, 151.65], [155.0, 157.99], [160.0, 162.03], [168.0, 168.25], [173.0, 178.7], [185.0, 189.48], [192.0, 192.4]], "keep_status": [false, false, true, false, true, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, true, false], "silence_prob": [0.0, 0.0, 31.06, 0.0, 30.34, 0.0, 0.0, 29.55, 0.0, 0.0, 0.0, 0.0, 32.18, 0.0, 29.59, 0.0, 30.74, 0.0, 0.0, 30.2, 28.58, 53.59, 0.0, 33.17, 32.98, 0.0], "audiomae_on_audioset": [null, null, [["whip", 16.37], ["hum", 15.8], ["speech", 15.47]], null, [["whale vocalization", 16.87], ["fly, housefly", 16.13], ["hum", 6.19]], null, null, [["sound effect", 21.01], ["whale vocalization", 17.2], ["boing", 10.29]], null, null, null, null, [["music", 64.84], ["speech", 9.67], ["mosquito", 6.74]], null, [["whack, thwack", 25.54], ["speech", 15.46], ["sound effect", 8.93]], null, [["music", 49.12], ["speech", 26.23], ["thunk", 4.86]], null, null, [["speech", 46.06], ["music", 18.57], ["whack, thwack", 8.39]], [["speech", 57.17], ["boing", 4.31], ["music", 3.57]], null, null, [["music", 29.28], ["speech", 21.62], ["synthesizer", 10.98]], [["speech", 31.23], ["sidetone", 13.6], ["music", 13.19]], null], "duration": [1.1, 0.95, 4.65, 0.01, 2.42, 0.69, 0.12, 2.9, 0.48, 0.34, 1.88, 1.85, 4.33, 1.65, 2.9, -0.06, 4.29, 1.06, 0.56, 26.65, 2.99, 2.03, 0.25, 5.7, 4.48, 0.4]} \ No newline at end of file diff --git a/annotations_1/gs0WQmW1icQ_filtered.json b/annotations_1/gs0WQmW1icQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be39a29d924014b43ae565151788aca962c5b0ca --- /dev/null +++ b/annotations_1/gs0WQmW1icQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.56], [8.0, 10.17], [11.0, 37.74], [38.0, 84.0]], "keep_status": [false, true, true, false], "silence_prob": [47.2, 47.82, 42.26, 0.0], "audiomae_on_audioset": [[["gong", 43.8], ["music", 23.07], ["sonar", 13.32]], [["chirp tone", 27.34], ["sine wave", 24.64], ["ambient music", 9.54]], [["music", 45.41], ["sonar", 6.41], ["glass", 5.29]], null], "duration": [5.56, 2.17, 26.74, 46.0]} \ No newline at end of file diff --git a/annotations_1/gs3GHB24IaM_filtered.json b/annotations_1/gs3GHB24IaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c899f790e8c50640e87008761451a2706c7e5fe --- /dev/null +++ b/annotations_1/gs3GHB24IaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.2], [12.0, 20.76], [28.0, 29.51], [53.0, 53.1], [54.0, 54.57], [61.0, 66.19], [68.0, 74.02], [81.0, 88.94], [95.0, 95.76], [99.0, 99.52], [104.0, 104.73], [113.0, 114.32], [121.0, 121.56]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [29.56, 30.54, 0.0, 0.0, 0.0, 32.13, 29.62, 29.85, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 60.32], ["speech", 9.21], ["throbbing", 3.92]], [["music", 44.92], ["hum", 19.02], ["mains hum", 12.78]], null, null, null, [["music", 80.03], ["groan", 3.78], ["hum", 2.47]], [["music", 73.84], ["throbbing", 5.49], ["cacophony", 3.49]], [["music", 47.0], ["sonar", 9.73], ["hum", 7.37]], null, null, null, null, null], "duration": [4.2, 8.76, 1.51, 0.1, 0.57, 5.19, 6.02, 7.94, 0.76, 0.52, 0.73, 1.32, 0.56]} \ No newline at end of file diff --git a/annotations_1/gsG8sEK2md8_filtered.json b/annotations_1/gsG8sEK2md8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca82d90a4656905713159054e15db0810a21856f --- /dev/null +++ b/annotations_1/gsG8sEK2md8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.11], [32.0, 34.84], [35.0, 35.43], [36.0, 40.39], [41.0, 41.57], [42.0, 42.72], [45.0, 55.61], [56.0, 63.48], [64.0, 63.95], [64.0, 64.07], [64.0, 64.94], [67.0, 69.43], [70.0, 71.29], [73.0, 77.87], [85.0, 95.28], [97.0, 128.71], [130.0, 130.33], [131.0, 131.94], [132.0, 152.96], [153.0, 154.06], [155.0, 169.2], [170.0, 186.58], [187.0, 189.4]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 33.16, 0.0, 30.99, 0.0, 0.0, 31.03, 34.25, 0.0, 0.0, 0.0, 59.68, 0.0, 50.51, 29.27, 0.0, 0.0, 0.0, 29.74, 0.0, 29.32, 29.01, 33.09], "audiomae_on_audioset": [null, [["music", 46.79], ["didgeridoo", 9.71], ["whale vocalization", 3.95]], null, [["didgeridoo", 36.58], ["music", 18.96], ["theremin", 18.57]], null, null, [["music", 20.54], ["didgeridoo", 11.88], ["hum", 10.32]], [["music", 62.95], ["didgeridoo", 10.0], ["speech", 6.79]], null, null, null, null, null, null, [["hum", 33.71], ["throbbing", 15.01], ["music", 11.69]], null, null, null, [["speech", 64.17], ["music", 20.48], ["breaking", 2.39]], null, [["hum", 23.2], ["music", 21.35], ["throbbing", 16.27]], [["music", 69.38], ["didgeridoo", 5.24], ["animal", 3.28]], [["speech", 18.26], ["electric shaver, electric razor", 11.3], ["mains hum", 7.21]]], "duration": [0.11, 2.84, 0.43, 4.39, 0.57, 0.72, 10.61, 7.48, -0.05, 0.07, 0.94, 2.43, 1.29, 4.87, 10.28, 31.71, 0.33, 0.94, 20.96, 1.06, 14.2, 16.58, 2.4]} \ No newline at end of file diff --git a/annotations_1/gt6_2qd75F8_filtered.json b/annotations_1/gt6_2qd75F8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58493056258ac0024b1b554eb8d5bdfd455d784c --- /dev/null +++ b/annotations_1/gt6_2qd75F8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.21], [6.0, 14.01], [17.0, 17.85], [24.0, 56.34], [63.0, 105.07], [107.0, 121.58], [122.0, 124.17], [127.0, 129.66], [130.0, 133.34], [136.0, 162.95]], "keep_status": [false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 29.89, 0.0, 0.0, 0.0, 51.5, 40.57, 30.93, 34.98, 30.23], "audiomae_on_audioset": [null, [["music", 43.15], ["didgeridoo", 41.07], ["noise", 1.54]], null, null, null, null, [["speech", 35.31], ["hum", 12.76], ["whale vocalization", 9.07]], [["music", 23.94], ["speech", 16.86], ["eruption", 5.02]], [["speech", 35.26], ["frog", 18.04], ["noise", 6.16]], [["music", 65.67], ["hum", 4.89], ["throbbing", 3.31]]], "duration": [0.21, 8.01, 0.85, 32.34, 42.07, 14.58, 2.17, 2.66, 3.34, 26.95]} \ No newline at end of file diff --git a/annotations_1/gtHhlD6p8BY_filtered.json b/annotations_1/gtHhlD6p8BY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb500dc1c3f37d839e14b9dc909a64e03d3a958c --- /dev/null +++ b/annotations_1/gtHhlD6p8BY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[78.0, 79.64], [81.0, 81.67], [83.0, 83.39], [87.0, 89.01], [93.0, 94.1], [95.0, 95.69], [101.0, 119.35], [120.0, 131.19], [135.0, 134.89], [136.0, 155.83], [157.0, 163.92], [165.0, 172.56], [177.0, 196.94], [200.0, 200.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 92.31, 0.0, 0.0, 30.51, 31.55, 0.0, 31.85, 31.97, 30.87, 33.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 36.48], ["music", 31.22], ["throbbing", 15.45]], [["fart", 39.6], ["speech", 31.22], ["music", 6.13]], null, [["speech", 55.43], ["music", 14.71], ["outside, rural or natural", 4.02]], [["speech", 61.48], ["music", 7.51], ["fart", 3.55]], [["cattle, bovinae", 36.54], ["livestock, farm animals, working animals", 30.71], ["moo", 27.53]], [["cattle, bovinae", 37.69], ["moo", 35.08], ["livestock, farm animals, working animals", 11.96]], null], "duration": [1.64, 0.67, 0.39, 2.01, 1.1, 0.69, 18.35, 11.19, -0.11, 19.83, 6.92, 7.56, 19.94, 0.84]} \ No newline at end of file diff --git a/annotations_1/gtngV41jpcw_filtered.json b/annotations_1/gtngV41jpcw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec772b7f1dcbe86c41d4e6f3dc84bd395d83cd45 --- /dev/null +++ b/annotations_1/gtngV41jpcw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 13.58], [15.0, 16.55], [20.0, 28.44], [29.0, 30.21], [33.0, 34.62], [36.0, 39.38], [44.0, 45.45], [47.0, 47.55], [50.0, 50.65], [56.0, 55.83], [60.0, 61.2], [63.0, 64.74], [66.0, 67.85], [69.0, 68.76], [71.0, 72.22]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [49.92, 0.0, 58.47, 0.0, 0.0, 32.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 84.17], ["synthesizer", 1.78], ["noise", 1.26]], null, null, null, null, [["fart", 38.93], ["sound effect", 13.56], ["explosion", 11.28]], null, null, null, null, null, null, null, null, null], "duration": [9.58, 1.55, 8.44, 1.21, 1.62, 3.38, 1.45, 0.55, 0.65, -0.17, 1.2, 1.74, 1.85, -0.24, 1.22]} \ No newline at end of file diff --git a/annotations_1/gvTCSxLPy0Q_filtered.json b/annotations_1/gvTCSxLPy0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c250e61cf39d206a60cc143aa7b1db87d000454f --- /dev/null +++ b/annotations_1/gvTCSxLPy0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.15], [5.0, 6.35], [7.0, 7.47], [8.0, 9.17], [15.0, 15.04], [16.0, 17.47], [20.0, 21.2], [22.0, 22.45], [27.0, 28.05], [32.0, 35.38], [37.0, 38.13], [41.0, 52.32], [53.0, 68.79]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [43.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.04, 0.0, 34.08, 30.28], "audiomae_on_audioset": [[["cattle, bovinae", 10.56], ["moo", 8.92], ["livestock, farm animals, working animals", 8.25]], null, null, null, null, null, null, null, null, [["music", 47.65], ["hum", 15.07], ["throbbing", 7.06]], null, [["music", 65.05], ["echo", 6.76], ["synthesizer", 6.4]], [["music", 59.49], ["speech", 9.82], ["thump, thud", 3.4]]], "duration": [2.15, 1.35, 0.47, 1.17, 0.04, 1.47, 1.2, 0.45, 1.05, 3.38, 1.13, 11.32, 15.79]} \ No newline at end of file diff --git a/annotations_1/gvuZShYhzX8_filtered.json b/annotations_1/gvuZShYhzX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f057894ed237090734a956e20fd8a01354e2793a --- /dev/null +++ b/annotations_1/gvuZShYhzX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 57.94], [63.0, 66.88], [69.0, 70.41], [72.0, 83.17], [84.0, 83.83], [84.0, 89.9], [97.0, 97.71], [101.0, 102.07], [105.0, 106.57], [111.0, 114.86], [116.0, 115.87], [117.0, 117.34], [119.0, 119.94], [124.0, 124.61], [131.0, 133.89], [141.0, 140.76], [148.0, 149.08], [150.0, 150.3], [154.0, 154.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 29.86, 0.0, 28.21, 0.0, 30.81, 0.0, 0.0, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 45.52, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 74.07], ["didgeridoo", 5.64], ["whale vocalization", 4.34]], null, [["music", 63.29], ["synthesizer", 4.32], ["throbbing", 3.82]], null, [["music", 54.92], ["electronic music", 11.11], ["throbbing", 5.2]], null, null, null, null, null, null, null, null, [["music", 20.82], ["hum", 15.55], ["noise", 6.93]], null, null, null, null], "duration": [32.94, 3.88, 1.41, 11.17, -0.17, 5.9, 0.71, 1.07, 1.57, 3.86, -0.13, 0.34, 0.94, 0.61, 2.89, -0.24, 1.08, 0.3, 0.87]} \ No newline at end of file diff --git a/annotations_1/gwEoo0r_8EY_filtered.json b/annotations_1/gwEoo0r_8EY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1f9716f1c77e07b9d81842975c1f4692e883f2f --- /dev/null +++ b/annotations_1/gwEoo0r_8EY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.76], [16.0, 18.13], [20.0, 21.51], [23.0, 23.4], [25.0, 25.71], [26.0, 28.07], [29.0, 29.79], [31.0, 32.91], [33.0, 33.64], [34.0, 55.04], [62.0, 81.26], [86.0, 91.99], [96.0, 98.74], [102.0, 102.44], [105.0, 117.69], [119.0, 120.46], [122.0, 122.18], [123.0, 127.13], [128.0, 129.1], [141.0, 142.1], [151.0, 151.28], [159.0, 160.52]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [55.81, 65.44, 0.0, 0.0, 0.0, 49.22, 0.0, 0.0, 0.0, 35.37, 30.7, 31.5, 35.39, 0.0, 32.56, 0.0, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 39.15], ["singing bowl", 23.81], ["music", 7.73]], null, null, null, [["music", 40.09], ["rumble", 11.13], ["hum", 11.12]], [["speech", 58.98], ["music", 5.9], ["groan", 5.15]], [["whack, thwack", 36.28], ["music", 24.36], ["speech", 6.57]], [["rumble", 36.46], ["music", 19.25], ["speech", 17.22]], null, [["speech", 23.29], ["music", 18.87], ["hum", 7.91]], null, null, null, null, null, null, null], "duration": [6.76, 2.13, 1.51, 0.4, 0.71, 2.07, 0.79, 1.91, 0.64, 21.04, 19.26, 5.99, 2.74, 0.44, 12.69, 1.46, 0.18, 4.13, 1.1, 1.1, 0.28, 1.52]} \ No newline at end of file diff --git a/annotations_1/gx-03rUq-1Q_filtered.json b/annotations_1/gx-03rUq-1Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8670847ca0589d7e40f5ea1f80879365e553b1e7 --- /dev/null +++ b/annotations_1/gx-03rUq-1Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.46], [10.0, 11.79], [29.0, 30.15], [32.0, 32.07], [39.0, 39.28], [43.0, 45.1], [48.0, 48.79], [60.0, 60.34], [63.0, 63.04], [65.0, 65.25], [68.0, 68.44], [69.0, 69.38], [72.0, 72.15], [74.0, 74.58], [77.0, 77.21], [78.0, 79.15], [81.0, 82.93], [84.0, 88.72], [98.0, 98.44], [105.0, 109.43], [111.0, 111.67], [112.0, 120.12], [125.0, 126.18], [127.0, 128.75], [130.0, 130.59], [146.0, 146.26], [149.0, 149.96], [151.0, 152.05], [154.0, 154.6], [160.0, 160.62], [163.0, 164.81], [170.0, 170.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.61, 0.0, 44.81, 0.0, 66.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 82.55], ["noise", 2.6], ["effects unit", 0.9]], null, [["thunk", 16.11], ["cattle, bovinae", 10.03], ["moo", 9.61]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.46, 1.79, 1.15, 0.07, 0.28, 2.1, 0.79, 0.34, 0.04, 0.25, 0.44, 0.38, 0.15, 0.58, 0.21, 1.15, 1.93, 4.72, 0.44, 4.43, 0.67, 8.12, 1.18, 1.75, 0.59, 0.26, 0.96, 1.05, 0.6, 0.62, 1.81, 0.16]} \ No newline at end of file diff --git a/annotations_1/gxacglqQMqE_filtered.json b/annotations_1/gxacglqQMqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa245fb381388f25fb5a3a3cf5a5693a444c712a --- /dev/null +++ b/annotations_1/gxacglqQMqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 22.15], [25.0, 33.99], [34.0, 34.03], [34.0, 34.06], [34.0, 34.13], [34.0, 34.21], [34.0, 34.26], [34.0, 34.32], [34.0, 35.4], [36.0, 38.57], [40.0, 47.21], [52.0, 54.14], [71.0, 87.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [35.88, 54.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.86, 41.58, 51.88, 30.86], "audiomae_on_audioset": [[["mains hum", 35.91], ["hum", 32.23], ["music", 11.13]], null, null, null, null, null, null, null, null, null, [["music", 41.29], ["hum", 18.07], ["throbbing", 13.99]], null, [["buzz", 25.27], ["hum", 14.96], ["music", 11.44]]], "duration": [13.15, 8.99, 0.03, 0.06, 0.13, 0.21, 0.26, 0.32, 1.4, 2.57, 7.21, 2.14, 16.4]} \ No newline at end of file diff --git a/annotations_1/gxhMfM0QlwM_filtered.json b/annotations_1/gxhMfM0QlwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1de28eb0534a28666d169c64e51be0d75eb0dce6 --- /dev/null +++ b/annotations_1/gxhMfM0QlwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.75], [40.0, 40.51], [45.0, 44.93], [45.0, 45.03], [45.0, 45.27], [49.0, 49.38], [52.0, 56.42], [57.0, 56.69], [72.0, 72.45], [78.0, 80.23], [81.0, 86.56], [87.0, 86.7], [88.0, 102.07], [108.0, 109.11], [114.0, 114.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.15, 0.0, 0.0, 48.19, 40.09, 0.0, 41.62, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 48.51], ["didgeridoo", 31.84], ["speech", 5.91]], null, null, [["didgeridoo", 63.14], ["music", 20.0], ["synthesizer", 2.15]], [["music", 33.69], ["didgeridoo", 16.63], ["fly, housefly", 4.32]], null, [["music", 62.77], ["didgeridoo", 15.18], ["throbbing", 3.67]], null, null], "duration": [1.75, 0.51, -0.07, 0.03, 0.27, 0.38, 4.42, -0.31, 0.45, 2.23, 5.56, -0.3, 14.07, 1.11, 0.29]} \ No newline at end of file diff --git a/annotations_1/gxqt6x5ThcU_filtered.json b/annotations_1/gxqt6x5ThcU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/gxqt6x5ThcU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/gxsDfmzU-Lo_filtered.json b/annotations_1/gxsDfmzU-Lo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c349b715ed2022f7716be4490abf7b22b34ef16b --- /dev/null +++ b/annotations_1/gxsDfmzU-Lo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 57.87], [60.0, 66.48], [68.0, 78.76], [87.0, 102.14], [104.0, 116.46], [119.0, 120.26], [121.0, 121.39], [125.0, 126.28]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 32.93, 28.54, 29.08, 30.44, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 31.74], ["theremin", 21.49], ["musical instrument", 5.03]], [["music", 51.42], ["speech", 17.9], ["explosion", 9.78]], [["music", 40.9], ["hum", 23.42], ["throbbing", 17.31]], [["music", 42.49], ["hum", 19.72], ["throbbing", 16.28]], null, null, null], "duration": [50.87, 6.48, 10.76, 15.14, 12.46, 1.26, 0.39, 1.28]} \ No newline at end of file diff --git a/annotations_1/gxuEGIzZrGc_filtered.json b/annotations_1/gxuEGIzZrGc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3162807b79214f508459d154ced4c8c725f1cce --- /dev/null +++ b/annotations_1/gxuEGIzZrGc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.6], [21.0, 26.1], [34.0, 40.73], [43.0, 46.36], [48.0, 54.82], [56.0, 60.59], [62.0, 66.61], [71.0, 76.17], [78.0, 163.34]], "keep_status": [false, true, false, false, false, true, true, false, false], "silence_prob": [63.85, 45.78, 73.51, 69.07, 39.89, 32.49, 44.18, 32.83, 0.0], "audiomae_on_audioset": [null, [["music", 43.29], ["speech", 12.28], ["fly, housefly", 8.17]], null, null, [["music", 45.56], ["effects unit", 16.87], ["musical instrument", 13.39]], [["crack", 32.36], ["breaking", 16.23], ["crushing", 12.39]], [["grunt", 44.66], ["music", 4.1], ["fart", 3.15]], [["music", 34.25], ["speech", 33.01], ["breaking", 16.24]], null], "duration": [5.6, 5.1, 6.73, 3.36, 6.82, 4.59, 4.61, 5.17, 85.34]} \ No newline at end of file diff --git a/annotations_1/gzPiBOc_Nfs_filtered.json b/annotations_1/gzPiBOc_Nfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f74218857608756809d71843e31c839eb67a7df --- /dev/null +++ b/annotations_1/gzPiBOc_Nfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.18], [15.0, 25.07], [28.0, 35.13], [37.0, 48.14], [50.0, 82.53], [85.0, 88.92], [89.0, 91.59], [92.0, 93.73], [98.0, 104.26], [107.0, 156.88], [159.0, 162.95], [167.0, 166.89], [167.0, 168.94], [171.0, 170.95]], "keep_status": [true, true, false, true, false, true, true, false, true, false, false, false, false, false], "silence_prob": [30.47, 39.17, 99.62, 31.73, 0.0, 30.33, 32.81, 0.0, 29.41, 0.0, 53.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.45], ["mains hum", 16.8], ["hum", 11.62]], [["music", 28.24], ["hum", 23.13], ["mains hum", 14.45]], null, [["music", 24.02], ["speech", 9.73], ["foghorn", 8.25]], null, [["music", 45.5], ["speech", 14.47], ["didgeridoo", 5.09]], [["foghorn", 48.34], ["speech", 15.63], ["music", 3.49]], null, [["music", 25.56], ["noise", 21.98], ["hum", 10.12]], null, null, null, null, null], "duration": [2.18, 10.07, 7.13, 11.14, 32.53, 3.92, 2.59, 1.73, 6.26, 49.88, 3.95, -0.11, 1.94, -0.05]} \ No newline at end of file diff --git a/annotations_1/gzbYTUXZkSI_filtered.json b/annotations_1/gzbYTUXZkSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83e9281c6e2d9f44dc5fb0d21e6575033db6c44a --- /dev/null +++ b/annotations_1/gzbYTUXZkSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.24], [2.0, 1.85], [7.0, 11.37], [13.0, 14.93], [16.0, 30.97], [33.0, 33.37], [44.0, 45.47], [47.0, 59.61], [63.0, 81.51], [83.0, 121.22], [122.0, 135.65], [137.0, 146.87], [150.0, 150.5], [154.0, 155.56], [159.0, 206.71]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 51.44, 0.0, 30.65, 0.0, 0.0, 31.04, 31.77, 0.0, 32.54, 30.69, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 36.52], ["speech", 26.49], ["sound effect", 3.43]], null, null, [["music", 34.71], ["didgeridoo", 16.46], ["hum", 13.85]], [["fly, housefly", 45.69], ["mosquito", 23.24], ["insect", 22.45]], null, [["music", 77.97], ["throbbing", 5.06], ["electronic music", 4.38]], [["music", 83.24], ["speech", 3.38], ["didgeridoo", 1.55]], null, null, null], "duration": [0.24, -0.15, 4.37, 1.93, 14.97, 0.37, 1.47, 12.61, 18.51, 38.22, 13.65, 9.87, 0.5, 1.56, 47.71]} \ No newline at end of file diff --git a/annotations_1/h0i2KfT2SB0_filtered.json b/annotations_1/h0i2KfT2SB0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bd4a39f5ccc0476f95affacf73d4db388a728dc --- /dev/null +++ b/annotations_1/h0i2KfT2SB0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.9], [16.0, 16.39], [16.0, 21.0], [24.0, 25.3], [27.0, 28.07], [30.0, 31.18], [32.0, 34.1], [42.0, 43.5], [45.0, 45.37], [48.0, 51.04], [54.0, 56.91], [58.0, 61.16], [61.0, 72.93], [76.0, 76.44], [77.0, 94.15], [95.0, 109.54], [110.0, 109.58], [110.0, 109.61], [113.0, 129.66]], "keep_status": [false, false, false, false, false, false, true, false, false, true, true, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 52.16, 0.0, 0.0, 0.0, 41.85, 0.0, 0.0, 47.62, 41.52, 50.26, 42.72, 0.0, 33.14, 32.33, 0.0, 0.0, 32.15], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 24.04], ["music", 23.09], ["throbbing", 10.22]], null, null, [["music", 15.65], ["hum", 11.85], ["speech", 11.17]], [["music", 38.01], ["electronic music", 11.39], ["hum", 11.1]], null, [["hum", 47.09], ["mains hum", 15.08], ["music", 15.05]], null, [["music", 27.1], ["speech", 17.89], ["didgeridoo", 7.98]], [["music", 22.3], ["throbbing", 19.26], ["whack, thwack", 17.18]], null, null, [["music", 58.59], ["didgeridoo", 4.55], ["speech", 3.73]]], "duration": [1.9, 0.39, 5.0, 1.3, 1.07, 1.18, 2.1, 1.5, 0.37, 3.04, 2.91, 3.16, 11.93, 0.44, 17.15, 14.54, -0.42, -0.39, 16.66]} \ No newline at end of file diff --git a/annotations_1/h0qniQTX3r8_filtered.json b/annotations_1/h0qniQTX3r8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55bba2a99b9a194fe851dbfc9c880ab86b359995 --- /dev/null +++ b/annotations_1/h0qniQTX3r8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 45.45], [46.0, 45.99], [47.0, 73.04], [73.0, 78.19], [81.0, 80.65], [82.0, 86.59], [88.0, 91.18], [93.0, 96.01], [98.0, 98.76], [102.0, 104.57], [105.0, 108.08], [109.0, 123.26], [127.0, 128.83], [130.0, 134.96], [137.0, 142.65], [145.0, 148.88]], "keep_status": [false, false, true, true, false, true, false, false, false, true, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 35.25, 34.54, 0.0, 38.74, 42.11, 54.56, 0.0, 47.16, 92.31, 40.59, 0.0, 47.98, 33.88, 35.38], "audiomae_on_audioset": [null, null, [["hum", 22.25], ["buzz", 14.08], ["music", 12.33]], [["music", 12.52], ["mains hum", 12.33], ["hum", 9.4]], null, [["grunt", 32.61], ["music", 17.54], ["throbbing", 8.97]], [["livestock, farm animals, working animals", 39.8], ["moo", 19.39], ["cattle, bovinae", 18.7]], null, null, [["mains hum", 17.22], ["hum", 12.92], ["bow-wow", 10.71]], null, [["speech", 33.11], ["music", 32.6], ["didgeridoo", 4.01]], null, [["music", 31.24], ["didgeridoo", 12.39], ["speech", 7.23]], [["music", 25.94], ["hum", 19.4], ["mains hum", 11.57]], [["throbbing", 46.64], ["music", 24.96], ["hum", 14.1]]], "duration": [0.45, -0.01, 26.04, 5.19, -0.35, 4.59, 3.18, 3.01, 0.76, 2.57, 3.08, 14.26, 1.83, 4.96, 5.65, 3.88]} \ No newline at end of file diff --git a/annotations_1/h1aJoWg4vGo_filtered.json b/annotations_1/h1aJoWg4vGo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee4ead3006c5f7f42ec5b02e3c6b309eb555fd5a --- /dev/null +++ b/annotations_1/h1aJoWg4vGo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.2], [7.0, 7.79], [11.0, 11.2], [13.0, 13.56], [16.0, 16.56], [18.0, 19.89], [20.0, 21.2], [22.0, 25.03], [26.0, 26.38], [27.0, 28.88], [32.0, 34.4], [36.0, 36.58], [37.0, 37.72], [38.0, 38.79], [39.0, 40.07], [42.0, 42.06], [43.0, 43.88], [49.0, 54.08], [56.0, 57.03], [59.0, 59.64], [60.0, 72.71], [74.0, 75.03], [76.0, 77.79], [80.0, 81.5], [82.0, 83.91], [88.0, 88.35], [89.0, 90.17], [92.0, 92.47], [93.0, 93.55], [94.0, 95.2], [96.0, 96.45], [97.0, 101.34], [102.0, 109.14], [114.0, 114.98], [116.0, 123.13], [125.0, 126.17], [128.0, 127.8], [129.0, 129.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.78, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.91, 99.95, 0.0, 68.67, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.2, 0.79, 0.2, 0.56, 0.56, 1.89, 1.2, 3.03, 0.38, 1.88, 2.4, 0.58, 0.72, 0.79, 1.07, 0.06, 0.88, 5.08, 1.03, 0.64, 12.71, 1.03, 1.79, 1.5, 1.91, 0.35, 1.17, 0.47, 0.55, 1.2, 0.45, 4.34, 7.14, 0.98, 7.13, 1.17, -0.2, 0.64]} \ No newline at end of file diff --git a/annotations_1/h36wtoBcAS8_filtered.json b/annotations_1/h36wtoBcAS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3544a14a1c2052bb675d549f19b7819755dbf9ec --- /dev/null +++ b/annotations_1/h36wtoBcAS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.76], [4.0, 7.13], [14.0, 14.82], [15.0, 15.58], [21.0, 22.5], [31.0, 30.86], [32.0, 32.41], [33.0, 35.51], [36.0, 37.76], [42.0, 42.09], [44.0, 44.25], [54.0, 54.55], [56.0, 56.67], [58.0, 59.75], [60.0, 62.04], [64.0, 64.18], [66.0, 66.9], [68.0, 68.57], [70.0, 71.22], [72.0, 72.86], [74.0, 75.17], [76.0, 77.5], [80.0, 81.28], [83.0, 83.67], [85.0, 85.08], [86.0, 86.66], [87.0, 88.05], [90.0, 91.57], [92.0, 92.91], [98.0, 99.35], [100.0, 101.19], [101.0, 101.97], [103.0, 103.45], [105.0, 105.09], [107.0, 109.11], [117.0, 116.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 68.67, 0.0, 0.0, 0.0, 0.0, 0.0, 43.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 49.99], ["sidetone", 19.34], ["telephone", 6.11]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 34.69], ["throbbing", 19.02], ["speech", 14.88]], null], "duration": [0.76, 3.13, 0.82, 0.58, 1.5, -0.14, 0.41, 2.51, 1.76, 0.09, 0.25, 0.55, 0.67, 1.75, 2.04, 0.18, 0.9, 0.57, 1.22, 0.86, 1.17, 1.5, 1.28, 0.67, 0.08, 0.66, 1.05, 1.57, 0.91, 1.35, 1.19, 0.97, 0.45, 0.09, 2.11, -0.1]} \ No newline at end of file diff --git a/annotations_1/h3AqOR2Ru1s_filtered.json b/annotations_1/h3AqOR2Ru1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51e1c26cd1dc68f1404784f0d332a45e8e091f5f --- /dev/null +++ b/annotations_1/h3AqOR2Ru1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.61], [13.0, 13.17], [13.0, 13.22], [14.0, 14.42], [16.0, 17.02], [29.0, 30.3], [31.0, 31.75], [35.0, 38.53], [39.0, 38.58], [41.0, 43.73], [54.0, 54.45], [60.0, 60.61], [63.0, 65.7], [73.0, 82.17], [85.0, 94.46], [98.0, 108.01], [116.0, 124.31], [126.0, 127.89], [131.0, 134.57], [138.0, 137.94], [149.0, 149.3], [153.0, 153.79], [156.0, 155.55], [180.0, 184.55], [193.0, 194.83], [196.0, 200.21], [207.0, 209.22], [213.0, 214.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.02, 0.0, 68.54, 0.0, 0.0, 61.08, 55.89, 45.49, 40.54, 33.53, 0.0, 39.57, 0.0, 0.0, 0.0, 0.0, 35.45, 0.0, 39.38, 36.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 36.74], ["music", 31.03], ["thunk", 11.34]], null, null, null, null, null, null, [["music", 37.88], ["speech", 6.8], ["musical instrument", 3.92]], [["music", 43.81], ["hum", 13.97], ["throbbing", 7.65]], [["whack, thwack", 39.53], ["groan", 24.1], ["music", 15.48]], null, [["music", 45.74], ["synthesizer", 8.64], ["hum", 7.36]], null, null, null, null, [["music", 46.93], ["boing", 14.76], ["speech", 13.02]], null, [["music", 57.5], ["theremin", 6.44], ["synthesizer", 5.54]], [["music", 53.27], ["speech", 7.32], ["quack", 3.24]], null], "duration": [1.61, 0.17, 0.22, 0.42, 1.02, 1.3, 0.75, 3.53, -0.42, 2.73, 0.45, 0.61, 2.7, 9.17, 9.46, 10.01, 8.31, 1.89, 3.57, -0.06, 0.3, 0.79, -0.45, 4.55, 1.83, 4.21, 2.22, 1.62]} \ No newline at end of file diff --git a/annotations_1/h3g5B5JhFcY_filtered.json b/annotations_1/h3g5B5JhFcY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45afd4a0052d04c2779895b24747081132b55143 --- /dev/null +++ b/annotations_1/h3g5B5JhFcY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 51.21], [66.0, 66.39], [68.0, 67.93], [79.0, 79.69], [83.0, 83.56], [85.0, 86.97], [89.0, 112.78], [113.0, 114.79], [116.0, 133.12], [133.0, 133.24]], "keep_status": [false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.55, 0.0, 39.05, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["whale vocalization", 31.38], ["stomach rumble", 12.99], ["animal", 11.51]], null, [["hum", 40.7], ["music", 13.71], ["mains hum", 12.94]], null], "duration": [1.21, 0.39, -0.07, 0.69, 0.56, 1.97, 23.78, 1.79, 17.12, 0.24]} \ No newline at end of file diff --git a/annotations_1/h41ylpWhV1I_filtered.json b/annotations_1/h41ylpWhV1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a50aa29c280ed18eaaa71ab9d5ae010cb63bb46c --- /dev/null +++ b/annotations_1/h41ylpWhV1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.71], [33.0, 34.06], [37.0, 89.95], [95.0, 105.92]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.55], "audiomae_on_audioset": [null, null, null, null], "duration": [1.71, 1.06, 52.95, 10.92]} \ No newline at end of file diff --git a/annotations_1/h4lbn5nDXwY_filtered.json b/annotations_1/h4lbn5nDXwY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6c57ff8702ccf915473589b2f9877efbec0579d --- /dev/null +++ b/annotations_1/h4lbn5nDXwY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.85], [10.0, 11.69], [14.0, 14.91], [15.0, 16.04], [17.0, 17.32], [35.0, 46.18], [47.0, 47.09], [53.0, 54.45], [62.0, 63.64], [66.0, 67.07], [89.0, 90.44], [99.0, 100.16], [102.0, 103.69]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 57.01], ["whack, thwack", 3.63], ["mosquito", 2.7]], null, null, null, null, null, null, null], "duration": [0.85, 1.69, 0.91, 1.04, 0.32, 11.18, 0.09, 1.45, 1.64, 1.07, 1.44, 1.16, 1.69]} \ No newline at end of file diff --git a/annotations_1/h5KBS20Ke6U_filtered.json b/annotations_1/h5KBS20Ke6U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2dd207567f14a56218383251620149ba6be3f12f --- /dev/null +++ b/annotations_1/h5KBS20Ke6U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 28.02], [29.0, 30.08], [32.0, 32.81], [37.0, 37.81], [38.0, 39.55], [41.0, 41.81], [45.0, 48.39], [54.0, 55.61], [56.0, 59.1], [62.0, 62.68], [63.0, 63.54], [81.0, 81.45], [86.0, 87.03], [103.0, 103.06], [104.0, 104.08], [110.0, 110.35], [112.0, 112.28], [113.0, 113.24], [114.0, 123.11], [125.0, 139.97], [143.0, 142.89], [144.0, 145.52]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [67.89, 0.0, 0.0, 0.0, 0.0, 0.0, 49.13, 0.0, 48.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.94, 44.12, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["sine wave", 29.16], ["chirp tone", 25.45], ["noise", 8.28]], null, [["sidetone", 30.77], ["speech", 22.99], ["whale vocalization", 9.98]], null, null, null, null, null, null, null, null, null, [["animal", 15.49], ["music", 14.86], ["buzz", 7.42]], [["speech", 10.61], ["crow", 9.88], ["animal", 8.94]], null, null], "duration": [2.02, 1.08, 0.81, 0.81, 1.55, 0.81, 3.39, 1.61, 3.1, 0.68, 0.54, 0.45, 1.03, 0.06, 0.08, 0.35, 0.28, 0.24, 9.11, 14.97, -0.11, 1.52]} \ No newline at end of file diff --git a/annotations_1/h5OjSHDUn8c_filtered.json b/annotations_1/h5OjSHDUn8c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96b454912652b8d5520cb1f7f398cb9489397b16 --- /dev/null +++ b/annotations_1/h5OjSHDUn8c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [5.0, 12.92], [14.0, 15.26], [16.0, 16.53], [18.0, 18.84], [21.0, 21.37], [23.0, 24.75], [27.0, 27.92], [34.0, 37.57], [43.0, 44.46], [46.0, 47.14], [54.0, 55.97], [57.0, 58.5], [60.0, 59.93], [64.0, 63.8], [68.0, 68.67], [73.0, 72.87], [80.0, 81.03], [84.0, 84.7], [87.0, 89.01], [94.0, 95.72], [102.0, 108.89], [116.0, 115.79], [116.0, 115.96], [122.0, 122.69], [141.0, 143.24], [149.0, 150.23], [156.0, 157.27], [160.0, 161.64], [164.0, 165.11], [166.0, 168.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 36.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.11, 0.0, 98.99, 0.0, 0.0, 0.0, 50.41, 0.0, 0.0, 0.0, 0.0, 40.81], "audiomae_on_audioset": [null, [["applause", 90.09], ["clapping", 1.27], ["eruption", 1.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.73], ["hum", 14.9], ["theremin", 9.43]], null, null, null, null, null, null, null, null, null, null, [["music", 48.89], ["musical instrument", 6.53], ["sidetone", 4.56]]], "duration": [0.5, 7.92, 1.26, 0.53, 0.84, 0.37, 1.75, 0.92, 3.57, 1.46, 1.14, 1.97, 1.5, -0.07, -0.2, 0.67, -0.13, 1.03, 0.7, 2.01, 1.72, 6.89, -0.21, -0.04, 0.69, 2.24, 1.23, 1.27, 1.64, 1.11, 2.12]} \ No newline at end of file diff --git a/annotations_1/h5UGcMYOaaU_filtered.json b/annotations_1/h5UGcMYOaaU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d201505495f7dbc0d0b34c9d016bc4cd959c71a6 --- /dev/null +++ b/annotations_1/h5UGcMYOaaU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.78], [6.0, 13.98], [19.0, 19.45], [20.0, 20.93], [22.0, 26.0], [30.0, 30.06], [31.0, 31.23], [33.0, 34.74], [60.0, 60.29], [61.0, 62.02], [77.0, 78.06], [94.0, 97.95], [104.0, 105.02], [108.0, 122.2], [123.0, 122.82], [126.0, 126.15], [127.0, 127.31]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 33.28, 0.0, 0.0, 37.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.11, 0.0, 34.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 76.82], ["smash, crash", 4.99], ["breaking", 4.03]], null, null, [["speech", 27.94], ["music", 23.04], ["didgeridoo", 13.53]], null, null, null, null, null, null, [["snicker", 30.41], ["laughter", 26.11], ["speech", 11.65]], null, [["music", 52.07], ["hum", 13.93], ["throbbing", 13.05]], null, null, null], "duration": [-0.22, 7.98, 0.45, 0.93, 4.0, 0.06, 0.23, 1.74, 0.29, 1.02, 1.06, 3.95, 1.02, 14.2, -0.18, 0.15, 0.31]} \ No newline at end of file diff --git a/annotations_1/h5dCFGJp__0_filtered.json b/annotations_1/h5dCFGJp__0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..485590f70e10137777923a92e145232657c13a55 --- /dev/null +++ b/annotations_1/h5dCFGJp__0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.41], [7.0, 7.05], [8.0, 8.09], [9.0, 9.95], [12.0, 12.45], [13.0, 14.82], [16.0, 17.56], [18.0, 20.88], [22.0, 27.13], [31.0, 33.07], [37.0, 52.0], [52.0, 54.21], [55.0, 59.75], [63.0, 63.42], [68.0, 69.31], [72.0, 72.71], [74.0, 74.34], [77.0, 77.21], [78.0, 79.49], [80.0, 81.43], [82.0, 86.12], [87.0, 94.17], [97.0, 99.12], [100.0, 102.07], [103.0, 102.79], [111.0, 110.96], [112.0, 112.35], [114.0, 114.37], [115.0, 116.75], [117.0, 116.82], [117.0, 117.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.6, 37.75, 98.01, 99.99, 49.64, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 99.99, 32.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 76.12], ["sidetone", 6.68], ["hum", 4.22]], null, null, [["speech", 32.17], ["sine wave", 16.38], ["dial tone", 8.95]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 63.9], ["fart", 12.51], ["inside, small room", 3.52]], null, null, null, null, null, null, null], "duration": [1.41, 0.05, 0.09, 0.95, 0.45, 1.82, 1.56, 2.88, 5.13, 2.07, 15.0, 2.21, 4.75, 0.42, 1.31, 0.71, 0.34, 0.21, 1.49, 1.43, 4.12, 7.17, 2.12, 2.07, -0.21, -0.04, 0.35, 0.37, 1.75, -0.18, 0.54]} \ No newline at end of file diff --git a/annotations_1/h5f5GgqVWes_filtered.json b/annotations_1/h5f5GgqVWes_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2136c73d253f6c8f41a85dcc97979848129dc876 --- /dev/null +++ b/annotations_1/h5f5GgqVWes_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.3], [3.0, 3.15], [4.0, 4.94], [6.0, 6.42], [9.0, 9.58], [11.0, 11.11], [13.0, 13.85], [15.0, 17.17], [19.0, 18.71], [24.0, 24.0], [27.0, 27.18], [29.0, 29.54], [30.0, 31.87], [32.0, 33.47], [35.0, 35.4], [38.0, 39.39], [40.0, 42.74], [46.0, 47.09], [50.0, 50.25], [51.0, 53.47], [59.0, 65.5], [66.0, 72.37], [75.0, 75.88], [77.0, 85.23], [87.0, 87.79], [90.0, 91.22], [92.0, 93.87], [98.0, 101.68], [103.0, 104.23], [105.0, 106.49], [110.0, 110.51], [119.0, 118.69], [119.0, 126.37], [128.0, 129.27], [135.0, 152.95], [154.0, 154.47], [156.0, 157.42], [158.0, 159.97], [161.0, 163.21], [165.0, 166.77], [168.0, 168.88], [172.0, 181.6], [185.0, 184.87], [186.0, 187.29]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.43, 0.0, 0.0, 35.45, 36.25, 35.84, 0.0, 40.73, 0.0, 0.0, 0.0, 50.97, 0.0, 0.0, 0.0, 0.0, 28.73, 0.0, 29.69, 0.0, 0.0, 0.0, 91.98, 0.0, 0.0, 42.06, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 42.9], ["theremin", 8.67], ["didgeridoo", 4.23]], null, null, null, null, null, null, null, null, [["whale vocalization", 55.35], ["hum", 7.65], ["music", 7.25]], null, null, [["speech", 40.57], ["clip-clop", 7.25], ["horse", 6.04]], [["music", 35.22], ["burping, eructation", 13.38], ["hum", 8.14]], [["music", 38.14], ["speech", 26.11], ["sidetone", 6.84]], null, [["music", 61.67], ["speech", 8.9], ["throbbing", 7.37]], null, null, null, null, null, null, null, null, [["gong", 20.22], ["music", 19.82], ["speech", 18.24]], null, [["music", 46.78], ["breaking", 13.87], ["buzz", 4.32]], null, null, null, null, null, null, [["music", 28.27], ["hum", 22.99], ["mains hum", 10.87]], null, null], "duration": [0.3, 0.15, 0.94, 0.42, 0.58, 0.11, 0.85, 2.17, -0.29, 0.0, 0.18, 0.54, 1.87, 1.47, 0.4, 1.39, 2.74, 1.09, 0.25, 2.47, 6.5, 6.37, 0.88, 8.23, 0.79, 1.22, 1.87, 3.68, 1.23, 1.49, 0.51, -0.31, 7.37, 1.27, 17.95, 0.47, 1.42, 1.97, 2.21, 1.77, 0.88, 9.6, -0.13, 1.29]} \ No newline at end of file diff --git a/annotations_1/h5nhyFFSweU_filtered.json b/annotations_1/h5nhyFFSweU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9ce3a4d2250912c428947e574af5366ee7f22fe --- /dev/null +++ b/annotations_1/h5nhyFFSweU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.54], [10.0, 11.08], [13.0, 13.26], [14.0, 15.28], [18.0, 19.58], [21.0, 22.05], [23.0, 23.08], [25.0, 25.89], [27.0, 27.72], [28.0, 29.22], [30.0, 30.99], [31.0, 32.88], [35.0, 35.02], [35.0, 36.91], [41.0, 41.91], [43.0, 43.06], [45.0, 46.31], [47.0, 48.03], [50.0, 50.85], [54.0, 54.85], [57.0, 57.69], [60.0, 60.37], [62.0, 68.82], [70.0, 71.0], [71.0, 73.74], [77.0, 81.77], [83.0, 84.75], [87.0, 88.1], [89.0, 89.95], [91.0, 98.85], [101.0, 101.39], [105.0, 105.81], [107.0, 108.19], [112.0, 112.23], [114.0, 115.99], [119.0, 120.26], [129.0, 130.27], [131.0, 132.68], [133.0, 134.15], [135.0, 135.68], [136.0, 137.69], [138.0, 139.55], [141.0, 141.35], [142.0, 143.21], [145.0, 146.26], [147.0, 147.34], [150.0, 150.75], [151.0, 151.88], [153.0, 154.5], [156.0, 160.07], [161.0, 174.48], [176.0, 177.09], [180.0, 180.57], [181.0, 201.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.35, 0.0, 67.89, 92.48, 0.0, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 71.43, 0.0, 0.0, 80.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 45.37], ["speech", 16.63], ["radio", 12.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 1.08, 0.26, 1.28, 1.58, 1.05, 0.08, 0.89, 0.72, 1.22, 0.99, 1.88, 0.02, 1.91, 0.91, 0.06, 1.31, 1.03, 0.85, 0.85, 0.69, 0.37, 6.82, 1.0, 2.74, 4.77, 1.75, 1.1, 0.95, 7.85, 0.39, 0.81, 1.19, 0.23, 1.99, 1.26, 1.27, 1.68, 1.15, 0.68, 1.69, 1.55, 0.35, 1.21, 1.26, 0.34, 0.75, 0.88, 1.5, 4.07, 13.48, 1.09, 0.57, 20.92]} \ No newline at end of file diff --git a/annotations_1/h6iHbAju1cI_filtered.json b/annotations_1/h6iHbAju1cI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea5417cea2f3cbf4ad69e90f6730cb4aa09cb4dc --- /dev/null +++ b/annotations_1/h6iHbAju1cI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.59], [19.0, 20.63], [22.0, 35.29], [54.0, 54.48], [55.0, 57.0], [58.0, 58.38], [79.0, 82.22], [83.0, 85.13], [86.0, 86.63]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [34.4, 0.0, 30.86, 0.0, 99.97, 0.0, 30.75, 98.51, 0.0], "audiomae_on_audioset": [[["music", 39.17], ["speech", 34.89], ["sidetone", 4.09]], null, [["music", 71.91], ["throbbing", 7.47], ["smash, crash", 3.99]], null, null, null, [["cattle, bovinae", 33.1], ["moo", 22.97], ["livestock, farm animals, working animals", 22.9]], null, null], "duration": [3.59, 1.63, 13.29, 0.48, 2.0, 0.38, 3.22, 2.13, 0.63]} \ No newline at end of file diff --git a/annotations_1/h7NG9ZEfyKo_filtered.json b/annotations_1/h7NG9ZEfyKo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/h7NG9ZEfyKo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/h7ZUKB_zYQ0_filtered.json b/annotations_1/h7ZUKB_zYQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6447a40526001aacce22265aa69217c6468cad26 --- /dev/null +++ b/annotations_1/h7ZUKB_zYQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.54], [8.0, 13.34], [15.0, 14.91], [18.0, 21.66], [22.0, 24.22], [34.0, 36.78], [37.0, 38.1], [41.0, 43.48], [45.0, 45.79], [47.0, 49.42], [55.0, 57.59], [85.0, 85.95], [90.0, 93.23], [94.0, 98.39], [105.0, 106.1], [113.0, 115.2], [117.0, 118.35], [120.0, 120.45]], "keep_status": [false, true, false, false, false, false, false, false, false, true, true, false, true, false, false, true, false, false], "silence_prob": [0.0, 36.11, 0.0, 33.37, 62.68, 58.47, 0.0, 64.63, 0.0, 49.64, 35.47, 0.0, 40.52, 69.2, 0.0, 43.93, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 29.2], ["whale vocalization", 13.55], ["speech", 10.12]], null, [["music", 60.05], ["theremin", 12.25], ["synthesizer", 5.57]], null, null, null, null, null, [["music", 49.07], ["didgeridoo", 8.61], ["theremin", 7.96]], [["speech", 31.37], ["vehicle", 11.38], ["field recording", 7.32]], null, [["music", 45.23], ["foghorn", 9.39], ["theremin", 6.1]], null, null, [["speech", 36.54], ["hum", 11.3], ["telephone", 8.46]], null, null], "duration": [0.54, 5.34, -0.09, 3.66, 2.22, 2.78, 1.1, 2.48, 0.79, 2.42, 2.59, 0.95, 3.23, 4.39, 1.1, 2.2, 1.35, 0.45]} \ No newline at end of file diff --git a/annotations_1/h8Rxb-9snJQ_filtered.json b/annotations_1/h8Rxb-9snJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c85a18809aa38da4ce1c46f7f654f330d6fb1b84 --- /dev/null +++ b/annotations_1/h8Rxb-9snJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.87], [6.0, 8.48], [9.0, 10.13], [12.0, 13.86], [15.0, 19.57], [21.0, 22.74], [24.0, 26.43], [28.0, 28.75], [30.0, 31.72], [33.0, 33.37], [34.0, 36.15], [37.0, 38.65], [39.0, 40.69], [42.0, 43.26], [47.0, 47.12], [49.0, 49.5], [52.0, 52.98], [54.0, 55.36], [56.0, 56.61], [58.0, 58.45], [60.0, 60.03], [62.0, 61.75], [64.0, 66.21], [70.0, 72.17], [74.0, 74.01], [74.0, 74.34], [78.0, 82.68], [84.0, 87.94], [93.0, 94.36], [95.0, 96.89], [99.0, 99.93], [101.0, 101.65], [102.0, 105.97], [113.0, 115.5], [119.0, 122.64], [124.0, 125.69], [127.0, 128.63]], "keep_status": [true, false, false, false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, true, true, true, false, false], "silence_prob": [34.1, 33.0, 0.0, 0.0, 38.23, 0.0, 37.02, 0.0, 0.0, 0.0, 35.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.72, 31.84, 0.0, 0.0, 35.68, 36.89, 0.0, 0.0, 0.0, 0.0, 33.12, 41.64, 36.11, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 32.54], ["music", 15.58], ["hum", 9.35]], [["speech", 65.18], ["music", 12.02], ["throbbing", 7.75]], null, null, [["fly, housefly", 23.16], ["bee, wasp, etc.", 18.88], ["throbbing", 14.45]], null, [["throbbing", 24.22], ["hum", 23.67], ["music", 20.48]], null, null, null, [["speech", 14.62], ["music", 11.39], ["fly, housefly", 8.61]], null, null, null, null, null, null, null, null, null, null, null, [["music", 46.45], ["hum", 9.7], ["mains hum", 9.21]], [["fly, housefly", 53.61], ["mosquito", 16.98], ["insect", 16.62]], null, null, [["hum", 26.72], ["throbbing", 21.24], ["music", 13.32]], [["music", 33.06], ["didgeridoo", 14.58], ["throbbing", 8.44]], null, null, null, null, [["speech", 38.21], ["hum", 12.64], ["bee, wasp, etc.", 9.93]], [["fly, housefly", 23.38], ["bee, wasp, etc.", 18.43], ["insect", 12.3]], [["throbbing", 20.62], ["hum", 11.72], ["music", 7.99]], null, null], "duration": [2.87, 2.48, 1.13, 1.86, 4.57, 1.74, 2.43, 0.75, 1.72, 0.37, 2.15, 1.65, 1.69, 1.26, 0.12, 0.5, 0.98, 1.36, 0.61, 0.45, 0.03, -0.25, 2.21, 2.17, 0.01, 0.34, 4.68, 3.94, 1.36, 1.89, 0.93, 0.65, 3.97, 2.5, 3.64, 1.69, 1.63]} \ No newline at end of file diff --git a/annotations_1/h8wzJimC5Zc_filtered.json b/annotations_1/h8wzJimC5Zc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..14e79bfa9bcb37ae34f81329bedaaf114b7b5fa1 --- /dev/null +++ b/annotations_1/h8wzJimC5Zc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.37], [19.0, 55.78], [57.0, 59.48], [62.0, 75.64], [77.0, 78.54], [80.0, 81.7], [83.0, 84.99]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.4, 37.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 43.5], ["hum", 28.14], ["mains hum", 13.88]], null, null, null], "duration": [1.37, 36.78, 2.48, 13.64, 1.54, 1.7, 1.99]} \ No newline at end of file diff --git a/annotations_1/h9GHe5K0kOI_filtered.json b/annotations_1/h9GHe5K0kOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dc2c046969f876254c71d61106efd3e1443ed2f --- /dev/null +++ b/annotations_1/h9GHe5K0kOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.32], [8.0, 7.89], [16.0, 16.6], [17.0, 17.64], [26.0, 29.49], [34.0, 34.92], [36.0, 36.32], [37.0, 37.47], [49.0, 50.36], [68.0, 70.77], [84.0, 83.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 0.0, 0.0, 61.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, -0.11, 0.6, 0.64, 3.49, 0.92, 0.32, 0.47, 1.36, 2.77, -0.21]} \ No newline at end of file diff --git a/annotations_1/h9WDm1k4Hz4_filtered.json b/annotations_1/h9WDm1k4Hz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1181efcf2eae0326c5bcfe0ee3aaa79eff5a9540 --- /dev/null +++ b/annotations_1/h9WDm1k4Hz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 25.57], [28.0, 29.76], [31.0, 32.9], [35.0, 36.9], [39.0, 45.25], [46.0, 51.95], [52.0, 56.61], [58.0, 60.76], [62.0, 64.94], [66.0, 66.11], [67.0, 72.67], [73.0, 77.97], [79.0, 82.85], [84.0, 87.3], [90.0, 93.04], [95.0, 97.11], [99.0, 100.89], [102.0, 111.0], [112.0, 120.12], [121.0, 122.32], [123.0, 124.93], [126.0, 127.67], [129.0, 129.71], [132.0, 134.42], [136.0, 141.72], [143.0, 164.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [78.89, 0.0, 0.0, 0.0, 99.99, 99.84, 55.04, 100.0, 100.0, 0.0, 99.98, 100.0, 98.66, 65.91, 55.74, 100.0, 0.0, 100.0, 99.92, 0.0, 0.0, 0.0, 0.0, 100.0, 81.53, 92.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [17.57, 1.76, 1.9, 1.9, 6.25, 5.95, 4.61, 2.76, 2.94, 0.11, 5.67, 4.97, 3.85, 3.3, 3.04, 2.11, 1.89, 9.0, 8.12, 1.32, 1.93, 1.67, 0.71, 2.42, 5.72, 21.17]} \ No newline at end of file diff --git a/annotations_1/hA063IaOHyQ_filtered.json b/annotations_1/hA063IaOHyQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a91809a6080cfecff724544566841c917923a2d4 --- /dev/null +++ b/annotations_1/hA063IaOHyQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [5.0, 7.69], [10.0, 10.52], [15.0, 14.99], [29.0, 29.93], [33.0, 38.48], [49.0, 49.4], [50.0, 50.48], [59.0, 62.31], [67.0, 68.34], [77.0, 81.92], [86.0, 87.39], [94.0, 94.41], [94.0, 96.01], [100.0, 100.55], [105.0, 105.14], [110.0, 113.39], [121.0, 121.29], [129.0, 129.64], [133.0, 134.1]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 60.14, 0.0, 0.0, 0.0, 39.25, 0.0, 0.0, 99.65, 0.0, 90.78, 0.0, 0.0, 70.86, 0.0, 0.0, 54.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 45.17], ["timpani", 8.42], ["foghorn", 7.26]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 2.69, 0.52, -0.01, 0.93, 5.48, 0.4, 0.48, 3.31, 1.34, 4.92, 1.39, 0.41, 2.01, 0.55, 0.14, 3.39, 0.29, 0.64, 1.1]} \ No newline at end of file diff --git a/annotations_1/hAU8AQ6xlw8_filtered.json b/annotations_1/hAU8AQ6xlw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40fe8756bed6f49a30c43970a2843368aa20c080 --- /dev/null +++ b/annotations_1/hAU8AQ6xlw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.66], [11.0, 11.87], [13.0, 14.15], [15.0, 15.43], [18.0, 18.33], [19.0, 21.44], [22.0, 23.04], [31.0, 30.92], [32.0, 34.53], [35.0, 36.05], [37.0, 39.83], [47.0, 48.42], [55.0, 55.17], [60.0, 60.49], [65.0, 67.49], [70.0, 70.93], [76.0, 76.35], [107.0, 108.06], [114.0, 115.89], [117.0, 118.15], [121.0, 121.44], [123.0, 123.43], [124.0, 123.84], [140.0, 140.34], [144.0, 145.99], [148.0, 148.51], [149.0, 148.59], [149.0, 149.13], [151.0, 151.26], [154.0, 154.85], [158.0, 158.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.29, 0.0, 0.0, 0.0, 0.0, 60.51, 0.0, 0.0, 100.0, 0.0, 99.99, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.66, 0.87, 1.15, 0.43, 0.33, 2.44, 1.04, -0.08, 2.53, 1.05, 2.83, 1.42, 0.17, 0.49, 2.49, 0.93, 0.35, 1.06, 1.89, 1.15, 0.44, 0.43, -0.16, 0.34, 1.99, 0.51, -0.41, 0.13, 0.26, 0.85, 0.19]} \ No newline at end of file diff --git a/annotations_1/hAbVFxYi_q0_filtered.json b/annotations_1/hAbVFxYi_q0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..088ee49b8ed653114aa1f2c584d49eb90a6b0b70 --- /dev/null +++ b/annotations_1/hAbVFxYi_q0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.79], [9.0, 14.13], [27.0, 27.28], [49.0, 49.0], [59.0, 59.76], [61.0, 61.35], [63.0, 63.27], [65.0, 65.99], [68.0, 68.13], [79.0, 79.02], [80.0, 80.11], [83.0, 84.37], [85.0, 85.14], [96.0, 96.99], [108.0, 108.21], [116.0, 118.18], [120.0, 120.97], [121.0, 124.66], [127.0, 127.82], [132.0, 132.6], [143.0, 143.4], [144.0, 145.1], [147.0, 146.67], [158.0, 159.76], [162.0, 162.41], [167.0, 167.46], [172.0, 172.05], [173.0, 173.18], [177.0, 179.83], [183.0, 185.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.0, 92.8], "audiomae_on_audioset": [null, [["speech", 69.16], ["tap", 5.81], ["music", 4.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 5.13, 0.28, 0.0, 0.76, 0.35, 0.27, 0.99, 0.13, 0.02, 0.11, 1.37, 0.14, 0.99, 0.21, 2.18, 0.97, 3.66, 0.82, 0.6, 0.4, 1.1, -0.33, 1.76, 0.41, 0.46, 0.05, 0.18, 2.83, 2.23]} \ No newline at end of file diff --git a/annotations_1/hAf3IBKWubo_filtered.json b/annotations_1/hAf3IBKWubo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c8d02b0dca194ccf88bb1ce7c949a21a897dff5 --- /dev/null +++ b/annotations_1/hAf3IBKWubo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 50.8], [56.0, 95.59], [104.0, 117.58], [120.0, 119.96], [122.0, 122.35], [127.0, 146.62], [152.0, 154.04], [156.0, 166.95], [176.0, 179.88], [182.0, 239.92], [241.0, 242.28], [248.0, 253.0]], "keep_status": [false, false, false, false, false, true, true, true, true, false, false, true], "silence_prob": [0.0, 0.0, 29.94, 0.0, 0.0, 31.09, 29.77, 29.19, 30.07, 0.0, 0.0, 28.67], "audiomae_on_audioset": [null, null, [["hum", 34.65], ["mains hum", 28.47], ["speech", 15.61]], null, null, [["music", 53.17], ["sonar", 8.6], ["synthesizer", 7.76]], [["hum", 20.91], ["music", 15.68], ["buzz", 11.16]], [["speech", 40.29], ["eruption", 14.21], ["explosion", 9.09]], [["music", 36.92], ["speech", 22.46], ["hum", 4.5]], null, null, [["speech", 27.51], ["vehicle", 13.24], ["motorcycle", 6.43]]], "duration": [47.8, 39.59, 13.58, -0.04, 0.35, 19.62, 2.04, 10.95, 3.88, 57.92, 1.28, 5.0]} \ No newline at end of file diff --git a/annotations_1/hCN8UAdH55A_filtered.json b/annotations_1/hCN8UAdH55A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb3199b64f905e9dabdff9064243a4b3999a0a10 --- /dev/null +++ b/annotations_1/hCN8UAdH55A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 80.67], [82.0, 82.16], [83.0, 84.67], [89.0, 89.48], [91.0, 97.17], [98.0, 98.78], [99.0, 99.47], [100.0, 100.2], [101.0, 101.87], [103.0, 105.19], [106.0, 106.47], [108.0, 108.13], [109.0, 110.32], [111.0, 111.38], [114.0, 115.65], [119.0, 121.07], [122.0, 123.55], [127.0, 128.01], [129.0, 129.36], [140.0, 143.58], [145.0, 145.96], [147.0, 146.96], [149.0, 149.79], [153.0, 153.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 66.63, 0.0, 0.0, 0.0, 0.0, 69.61, 0.0, 0.0, 0.0, 0.0, 0.0, 32.53, 0.0, 0.0, 0.0, 31.53, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 15.87], ["hum", 7.6], ["rumble", 6.23]], null, null, null, [["bee, wasp, etc.", 22.64], ["insect", 8.47], ["vehicle", 6.24]], null, null, null, null], "duration": [63.67, 0.16, 1.67, 0.48, 6.17, 0.78, 0.47, 0.2, 0.87, 2.19, 0.47, 0.13, 1.32, 0.38, 1.65, 2.07, 1.55, 1.01, 0.36, 3.58, 0.96, -0.04, 0.79, 0.57]} \ No newline at end of file diff --git a/annotations_1/hD7KaqFoSq0_filtered.json b/annotations_1/hD7KaqFoSq0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d6690765d9290d511ebe78f1d30979dc3303edf --- /dev/null +++ b/annotations_1/hD7KaqFoSq0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.51], [34.0, 61.82]], "keep_status": [false, false], "silence_prob": [0.0, 31.2], "audiomae_on_audioset": [null, [["music", 66.19], ["didgeridoo", 9.58], ["musical instrument", 3.16]]], "duration": [0.51, 27.82]} \ No newline at end of file diff --git a/annotations_1/hDA_Bn7UhlA_filtered.json b/annotations_1/hDA_Bn7UhlA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..667b9c284098f410b89af2f39169ad7381867e92 --- /dev/null +++ b/annotations_1/hDA_Bn7UhlA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 37.2], [37.0, 37.81], [39.0, 39.45], [40.0, 40.81], [42.0, 43.12], [44.0, 44.07], [46.0, 45.86], [48.0, 49.44], [50.0, 50.85], [52.0, 54.87], [56.0, 56.91], [58.0, 59.48], [60.0, 63.1], [66.0, 66.5], [67.0, 68.13], [69.0, 69.53], [71.0, 73.14], [77.0, 79.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [94.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.13, 0.0, 0.0, 37.26, 0.0, 0.0, 0.0, 43.33, 36.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.84], ["crow", 21.63], ["animal", 16.82]], null, null, null, [["speech", 31.25], ["fart", 22.33], ["hum", 5.66]], [["speech", 47.18], ["animal", 7.25], ["sheep", 7.1]]], "duration": [11.2, 0.81, 0.45, 0.81, 1.12, 0.07, -0.14, 1.44, 0.85, 2.87, 0.91, 1.48, 3.1, 0.5, 1.13, 0.53, 2.14, 2.17]} \ No newline at end of file diff --git a/annotations_1/hE5rsmIsYPA_filtered.json b/annotations_1/hE5rsmIsYPA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..393f74ae66ed48c2b7c00b2c1dd8daa078e05720 --- /dev/null +++ b/annotations_1/hE5rsmIsYPA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 67.22], [68.0, 95.76], [96.0, 97.82], [99.0, 100.11]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 47.5, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 23.23], ["speech", 14.7], ["mains hum", 11.86]], null, null], "duration": [1.22, 27.76, 1.82, 1.11]} \ No newline at end of file diff --git a/annotations_1/hEZcqWRB2iU_filtered.json b/annotations_1/hEZcqWRB2iU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aca13d1354cc0448fe797ed0fd5cd0ed3dc2004c --- /dev/null +++ b/annotations_1/hEZcqWRB2iU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.55], [15.0, 15.79], [23.0, 25.19], [27.0, 27.7], [29.0, 29.71], [31.0, 34.47], [36.0, 36.86], [39.0, 39.7], [43.0, 43.66], [45.0, 46.36], [48.0, 131.6]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.88, 0.0, 0.0, 32.44, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 26.55], ["music", 7.75], ["fly, housefly", 5.08]], null, null, [["animal", 20.99], ["whale vocalization", 18.93], ["wild animals", 10.19]], null, null, null, null, null], "duration": [0.55, 0.79, 2.19, 0.7, 0.71, 3.47, 0.86, 0.7, 0.66, 1.36, 83.6]} \ No newline at end of file diff --git a/annotations_1/hF_9GQFISow_filtered.json b/annotations_1/hF_9GQFISow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b34f39dfa7db41564337ee72694bbf2e9b8b3356 --- /dev/null +++ b/annotations_1/hF_9GQFISow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.16], [24.0, 25.15], [28.0, 28.54], [31.0, 38.69], [44.0, 44.19], [48.0, 50.3], [50.0, 52.02], [71.0, 71.25], [86.0, 86.41], [104.0, 105.14], [109.0, 118.98], [130.0, 130.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.83, 0.0, 0.0, 29.66, 0.0, 31.89, 30.99, 0.0, 0.0, 0.0, 31.72, 0.0], "audiomae_on_audioset": [[["music", 81.39], ["synthesizer", 2.44], ["sampler", 1.79]], null, null, [["music", 68.12], ["synthesizer", 7.63], ["musical instrument", 3.36]], null, [["music", 57.87], ["speech", 23.91], ["livestock, farm animals, working animals", 1.14]], [["speech", 43.17], ["music", 34.31], ["synthesizer", 3.4]], null, null, null, [["music", 62.02], ["synthesizer", 10.06], ["speech", 7.39]], null], "duration": [2.16, 1.15, 0.54, 7.69, 0.19, 2.3, 2.02, 0.25, 0.41, 1.14, 9.98, 0.42]} \ No newline at end of file diff --git a/annotations_1/hFfQhVgQU44_filtered.json b/annotations_1/hFfQhVgQU44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97596821912127285637cea331dca26855616048 --- /dev/null +++ b/annotations_1/hFfQhVgQU44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.82], [13.0, 13.53], [15.0, 14.99], [22.0, 22.44], [25.0, 25.42], [30.0, 31.31], [40.0, 45.05], [46.0, 46.8], [80.0, 83.32], [86.0, 86.39], [96.0, 97.95], [99.0, 100.45], [155.0, 155.53], [158.0, 158.58], [160.0, 161.37], [166.0, 167.41], [187.0, 189.85], [193.0, 195.12], [202.0, 202.69], [204.0, 206.42], [219.0, 221.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 46.68, 0.0, 50.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.66, 31.04, 0.0, 35.47, 37.35], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 75.03], ["synthesizer", 8.75], ["throbbing", 2.96]], null, null, null, null, null, null, null, null, null, [["music", 24.42], ["mosquito", 4.85], ["carnatic music", 3.97]], [["music", 49.01], ["speech", 16.79], ["synthesizer", 5.8]], null, [["speech", 58.8], ["music", 21.93], ["quack", 6.46]], [["music", 72.39], ["effects unit", 6.26], ["guitar", 5.21]]], "duration": [4.82, 0.53, -0.01, 0.44, 0.42, 1.31, 5.05, 0.8, 3.32, 0.39, 1.95, 1.45, 0.53, 0.58, 1.37, 1.41, 2.85, 2.12, 0.69, 2.42, 2.19]} \ No newline at end of file diff --git a/annotations_1/hH0av1iDYVI_filtered.json b/annotations_1/hH0av1iDYVI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..188d9589f3037ad4ceaab265d520cdf3b420a82f --- /dev/null +++ b/annotations_1/hH0av1iDYVI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.07], [17.0, 19.03], [20.0, 21.27], [23.0, 23.08], [25.0, 29.88], [33.0, 54.9], [61.0, 62.31], [63.0, 63.9], [65.0, 80.1], [81.0, 85.99], [87.0, 107.59], [109.0, 111.97], [112.0, 127.58]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, true], "silence_prob": [0.0, 76.86, 0.0, 0.0, 51.18, 40.82, 0.0, 0.0, 34.49, 37.46, 35.68, 39.52, 34.46], "audiomae_on_audioset": [null, null, null, null, null, [["music", 58.98], ["synthesizer", 5.06], ["musical instrument", 4.77]], null, null, [["music", 40.02], ["fly, housefly", 12.11], ["groan", 12.05]], [["boing", 60.55], ["music", 21.9], ["speech", 3.03]], [["music", 43.94], ["fly, housefly", 21.93], ["insect", 6.0]], [["music", 78.0], ["synthesizer", 2.02], ["musical instrument", 1.58]], [["music", 27.46], ["boing", 16.27], ["whack, thwack", 13.0]]], "duration": [1.07, 2.03, 1.27, 0.08, 4.88, 21.9, 1.31, 0.9, 15.1, 4.99, 20.59, 2.97, 15.58]} \ No newline at end of file diff --git a/annotations_1/hH1TgDvC7sY_filtered.json b/annotations_1/hH1TgDvC7sY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe286a82b2211f6dee38899166fd2e0eff3c9605 --- /dev/null +++ b/annotations_1/hH1TgDvC7sY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 20.76], [21.0, 21.0], [21.0, 22.2], [24.0, 56.29], [57.0, 69.18], [71.0, 71.56], [74.0, 119.94], [120.0, 120.99], [123.0, 154.7], [157.0, 157.81], [159.0, 161.03], [162.0, 162.8], [163.0, 164.94], [169.0, 169.92], [170.0, 181.45]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [32.26, 0.0, 0.0, 0.0, 45.43, 0.0, 0.0, 0.0, 0.0, 0.0, 59.86, 0.0, 0.0, 0.0, 34.43], "audiomae_on_audioset": [[["speech", 19.33], ["electric shaver, electric razor", 13.22], ["groan", 8.52]], null, null, null, [["hum", 48.58], ["mains hum", 16.4], ["throbbing", 15.72]], null, null, null, null, null, null, null, null, null, [["bee, wasp, etc.", 23.87], ["fly, housefly", 11.02], ["buzz", 9.47]]], "duration": [11.76, 0.0, 1.2, 32.29, 12.18, 0.56, 45.94, 0.99, 31.7, 0.81, 2.03, 0.8, 1.94, 0.92, 11.45]} \ No newline at end of file diff --git a/annotations_1/hH3peh07eq4_filtered.json b/annotations_1/hH3peh07eq4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a22fa9d5b872159f8a42448a6c18e200862d19d --- /dev/null +++ b/annotations_1/hH3peh07eq4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.09], [3.0, 3.84], [15.0, 16.31], [18.0, 18.37], [31.0, 32.09], [36.0, 36.54], [41.0, 41.84], [44.0, 44.61], [56.0, 56.39], [57.0, 58.19], [65.0, 65.01], [67.0, 67.24], [78.0, 80.38], [82.0, 83.46], [95.0, 95.25], [112.0, 112.26], [113.0, 114.22], [115.0, 115.74], [134.0, 134.03], [146.0, 152.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.09, 0.84, 1.31, 0.37, 1.09, 0.54, 0.84, 0.61, 0.39, 1.19, 0.01, 0.24, 2.38, 1.46, 0.25, 0.26, 1.22, 0.74, 0.03, 6.68]} \ No newline at end of file diff --git a/annotations_1/hIHC635Q9dc_filtered.json b/annotations_1/hIHC635Q9dc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38b1ef476583aa6cf240857551f14d82df82b33b --- /dev/null +++ b/annotations_1/hIHC635Q9dc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.86], [14.0, 15.09], [29.0, 30.82], [71.0, 72.69], [81.0, 82.32], [103.0, 104.62], [133.0, 134.74]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.86, 1.09, 1.82, 1.69, 1.32, 1.62, 1.74]} \ No newline at end of file diff --git a/annotations_1/hIJ0gMDZT_4_filtered.json b/annotations_1/hIJ0gMDZT_4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a4c055eb11d5ba2654bb4e17adcc094b0fec690 --- /dev/null +++ b/annotations_1/hIJ0gMDZT_4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.58], [7.0, 33.64], [57.0, 57.6], [61.0, 61.47], [63.0, 63.81], [71.0, 71.54], [74.0, 76.27], [78.0, 79.59], [82.0, 85.21], [87.0, 88.8], [89.0, 102.56], [103.0, 102.86], [104.0, 104.7], [108.0, 108.51], [114.0, 122.15], [123.0, 125.79], [131.0, 140.21], [143.0, 159.8], [172.0, 183.44], [184.0, 189.03]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 33.66, 0.0, 0.0, 0.0, 0.0, 91.13, 0.0, 88.83, 0.0, 56.03, 0.0, 0.0, 0.0, 31.26, 30.84, 31.19, 31.75, 30.69, 33.01], "audiomae_on_audioset": [null, [["music", 28.93], ["speech", 11.34], ["groan", 8.64]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 70.91], ["musical instrument", 5.04], ["guitar", 1.81]], [["music", 55.9], ["didgeridoo", 4.63], ["electronic music", 4.37]], [["music", 58.45], ["speech", 16.08], ["electronic music", 3.44]], [["music", 65.19], ["synthesizer", 4.51], ["throbbing", 4.49]], [["music", 50.72], ["animal", 24.56], ["neigh, whinny", 13.48]], [["music", 25.04], ["speech", 24.59], ["boing", 18.02]]], "duration": [0.58, 26.64, 0.6, 0.47, 0.81, 0.54, 2.27, 1.59, 3.21, 1.8, 13.56, -0.14, 0.7, 0.51, 8.15, 2.79, 9.21, 16.8, 11.44, 5.03]} \ No newline at end of file diff --git a/annotations_1/hIMv_pWXqFY_filtered.json b/annotations_1/hIMv_pWXqFY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c916c63b39bcd0b881a480d9ce3324b07be21a1 --- /dev/null +++ b/annotations_1/hIMv_pWXqFY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 14.39], [15.0, 17.31], [18.0, 31.06], [31.0, 36.8], [40.0, 40.19], [41.0, 42.16], [43.0, 44.0], [45.0, 46.01], [47.0, 51.68], [52.0, 62.63], [64.0, 66.45], [71.0, 81.26], [82.0, 83.64], [85.0, 87.51], [89.0, 99.49], [100.0, 101.11], [102.0, 104.94], [105.0, 112.7], [113.0, 118.32], [122.0, 123.65], [125.0, 126.08], [128.0, 129.57], [136.0, 136.76], [139.0, 141.72], [143.0, 151.48]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [97.43, 99.88, 92.15, 46.19, 0.0, 0.0, 0.0, 0.0, 93.45, 59.96, 57.97, 88.83, 0.0, 82.07, 50.97, 0.0, 57.25, 48.61, 52.68, 0.0, 0.0, 0.0, 0.0, 81.17, 74.76], "audiomae_on_audioset": [null, null, null, [["speech", 33.69], ["music", 21.14], ["singing bowl", 14.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.49], ["singing bowl", 15.42], ["theremin", 10.72]], null, null, null, null, null, null, null], "duration": [12.39, 2.31, 13.06, 5.8, 0.19, 1.16, 1.0, 1.01, 4.68, 10.63, 2.45, 10.26, 1.64, 2.51, 10.49, 1.11, 2.94, 7.7, 5.32, 1.65, 1.08, 1.57, 0.76, 2.72, 8.48]} \ No newline at end of file diff --git a/annotations_1/hITWJ6vE1os_filtered.json b/annotations_1/hITWJ6vE1os_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a3455024fe3eacdde38a648d260d8ed8954fd40 --- /dev/null +++ b/annotations_1/hITWJ6vE1os_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.55], [9.0, 9.37], [11.0, 10.84], [12.0, 12.9], [16.0, 64.59], [65.0, 102.56], [106.0, 107.32], [108.0, 116.97], [125.0, 126.18], [129.0, 128.55], [129.0, 129.78], [131.0, 132.63]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.45, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 35.44], ["music", 20.0], ["whack, thwack", 13.59]], null, null, null, null], "duration": [0.55, 0.37, -0.16, 0.9, 48.59, 37.56, 1.32, 8.97, 1.18, -0.45, 0.78, 1.63]} \ No newline at end of file diff --git a/annotations_1/hIUrt0AsTjw_filtered.json b/annotations_1/hIUrt0AsTjw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4424255afe160bc1adf42be25bf6361cec1bbdf --- /dev/null +++ b/annotations_1/hIUrt0AsTjw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.1], [14.0, 14.71], [16.0, 16.04], [17.0, 17.85], [18.0, 18.64], [19.0, 19.74], [22.0, 27.82], [30.0, 30.81], [32.0, 34.21], [35.0, 39.77], [41.0, 41.72], [42.0, 50.75], [52.0, 71.78], [74.0, 77.33], [79.0, 83.47], [85.0, 92.3], [96.0, 101.26], [103.0, 105.26], [106.0, 108.43]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.38, 0.0, 34.53, 30.8, 0.0, 31.67, 29.89, 30.68, 31.95, 31.56, 30.1, 36.97, 32.85], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 62.63], ["speech", 4.06], ["hum", 2.31]], null, [["mains hum", 44.0], ["hum", 21.7], ["electric shaver, electric razor", 7.24]], [["whack, thwack", 25.72], ["mosquito", 6.04], ["speech", 5.88]], null, [["music", 46.44], ["throbbing", 16.0], ["hum", 15.56]], [["music", 56.11], ["throbbing", 16.65], ["hum", 7.6]], [["throbbing", 27.33], ["hum", 24.42], ["mains hum", 18.62]], [["cattle, bovinae", 45.1], ["moo", 33.43], ["livestock, farm animals, working animals", 15.81]], [["throbbing", 35.3], ["music", 35.03], ["hum", 12.67]], [["music", 68.91], ["hum", 6.03], ["throbbing", 5.73]], [["music", 34.36], ["hum", 19.29], ["mains hum", 10.56]], [["hum", 43.1], ["sidetone", 15.15], ["mains hum", 14.08]]], "duration": [1.1, 0.71, 0.04, 0.85, 0.64, 0.74, 5.82, 0.81, 2.21, 4.77, 0.72, 8.75, 19.78, 3.33, 4.47, 7.3, 5.26, 2.26, 2.43]} \ No newline at end of file diff --git a/annotations_1/hIokX-nhQd8_filtered.json b/annotations_1/hIokX-nhQd8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bb43f3106c1090011395a43d1f705e4d12619be --- /dev/null +++ b/annotations_1/hIokX-nhQd8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 13.8], [16.0, 16.29], [41.0, 41.22], [43.0, 43.71], [47.0, 55.44], [57.0, 57.57], [59.0, 60.32], [63.0, 63.26], [65.0, 66.78], [72.0, 73.45], [77.0, 78.38], [81.0, 82.36], [84.0, 84.13], [86.0, 86.91], [88.0, 88.37], [89.0, 90.17], [92.0, 93.29], [95.0, 95.1], [97.0, 96.99], [99.0, 101.31], [103.0, 103.32], [105.0, 105.66], [108.0, 113.76], [114.0, 115.69], [117.0, 119.64], [121.0, 122.86], [124.0, 124.95], [126.0, 127.13], [130.0, 132.66]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [48.56, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 98.01, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [[["bouncing", 30.15], ["speech", 9.2], ["noise", 6.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [11.8, 0.29, 0.22, 0.71, 8.44, 0.57, 1.32, 0.26, 1.78, 1.45, 1.38, 1.36, 0.13, 0.91, 0.37, 1.17, 1.29, 0.1, -0.01, 2.31, 0.32, 0.66, 5.76, 1.69, 2.64, 1.86, 0.95, 1.13, 2.66]} \ No newline at end of file diff --git a/annotations_1/hKuh_h2nzN8_filtered.json b/annotations_1/hKuh_h2nzN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9e4eb848b148bcb07fc9413a7c0e8be6425e4df --- /dev/null +++ b/annotations_1/hKuh_h2nzN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 68.71], [70.0, 75.03], [78.0, 82.39], [84.0, 88.05], [96.0, 97.7], [98.0, 100.26], [102.0, 102.69], [104.0, 103.86], [107.0, 144.26], [148.0, 148.59]], "keep_status": [false, true, false, true, false, false, false, false, false, false], "silence_prob": [28.06, 31.11, 36.98, 35.17, 0.0, 59.96, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 81.69], ["electronic music", 1.5], ["song", 0.92]], [["speech", 40.01], ["crowd", 13.15], ["outside, urban or manmade", 4.97]], [["cattle, bovinae", 42.06], ["moo", 38.43], ["livestock, farm animals, working animals", 19.13]], [["speech", 16.93], ["sheep", 11.03], ["bleat", 6.1]], null, null, null, null, null, null], "duration": [23.71, 5.03, 4.39, 4.05, 1.7, 2.26, 0.69, -0.14, 37.26, 0.59]} \ No newline at end of file diff --git a/annotations_1/hM1OunX-QBg_filtered.json b/annotations_1/hM1OunX-QBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f17d015c54bbf9e41771fb2d14ecad3370d6337 --- /dev/null +++ b/annotations_1/hM1OunX-QBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[79.0, 83.88], [85.0, 84.94], [85.0, 90.88], [92.0, 100.38], [106.0, 128.95]], "keep_status": [false, false, true, true, false], "silence_prob": [31.25, 0.0, 31.23, 29.42, 29.88], "audiomae_on_audioset": [[["speech", 35.27], ["music", 30.19], ["quack", 7.77]], null, [["hum", 27.13], ["speech", 19.95], ["throbbing", 15.43]], [["music", 38.14], ["speech", 11.73], ["burst, pop", 4.57]], [["speech", 36.29], ["music", 33.69], ["gunshot, gunfire", 4.78]]], "duration": [4.88, -0.06, 5.88, 8.38, 22.95]} \ No newline at end of file diff --git a/annotations_1/hM3nn30NxCE_filtered.json b/annotations_1/hM3nn30NxCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a6574311a9231b2d2a7940745ec1949568a11798 --- /dev/null +++ b/annotations_1/hM3nn30NxCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.01], [13.0, 13.02], [17.0, 18.13], [22.0, 22.03], [24.0, 24.85], [26.0, 27.09], [44.0, 44.41], [69.0, 69.5], [70.0, 70.46], [79.0, 79.73], [85.0, 85.87], [87.0, 87.1], [91.0, 91.56], [95.0, 95.98], [99.0, 101.44], [108.0, 108.35], [111.0, 124.34], [125.0, 126.45], [126.0, 126.87], [129.0, 133.02], [134.0, 135.78], [136.0, 136.8], [137.0, 138.59], [139.0, 141.84], [142.0, 147.88], [149.0, 148.91], [151.0, 163.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 0.0, 49.5, 0.0, 0.0, 62.07, 0.0, 0.0, 0.0, 33.6, 36.52, 0.0, 30.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 25.54], ["insect", 11.35], ["frog", 8.6]], null, null, null, null, null, null, [["speech", 26.27], ["whistling", 4.9], ["radio", 4.05]], [["animal", 18.46], ["livestock, farm animals, working animals", 12.53], ["speech", 11.38]], null, [["speech", 12.23], ["animal", 9.1], ["hum", 5.96]]], "duration": [1.01, 0.02, 1.13, 0.03, 0.85, 1.09, 0.41, 0.5, 0.46, 0.73, 0.87, 0.1, 0.56, 0.98, 2.44, 0.35, 13.34, 1.45, 0.87, 4.02, 1.78, 0.8, 1.59, 2.84, 5.88, -0.09, 12.14]} \ No newline at end of file diff --git a/annotations_1/hM6KNsz7_mk_filtered.json b/annotations_1/hM6KNsz7_mk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44ffd61e75acd39a9ff3107991149161d08dfa1d --- /dev/null +++ b/annotations_1/hM6KNsz7_mk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.47], [8.0, 9.12], [11.0, 12.58], [14.0, 15.25], [21.0, 21.07], [30.0, 31.41], [33.0, 34.13], [37.0, 37.4], [39.0, 40.42], [42.0, 42.57], [44.0, 47.73], [51.0, 51.33], [56.0, 57.55], [58.0, 58.24], [84.0, 84.43], [86.0, 89.13], [90.0, 91.45], [93.0, 94.22], [105.0, 105.75], [107.0, 107.08], [117.0, 117.64], [121.0, 121.34], [122.0, 122.32], [123.0, 123.16], [125.0, 125.52], [134.0, 134.86], [135.0, 136.32], [141.0, 141.2], [143.0, 143.11], [143.0, 144.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.59, 0.0, 0.0, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 26.32], ["speech", 20.02], ["electronic music", 14.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 1.12, 1.58, 1.25, 0.07, 1.41, 1.13, 0.4, 1.42, 0.57, 3.73, 0.33, 1.55, 0.24, 0.43, 3.13, 1.45, 1.22, 0.75, 0.08, 0.64, 0.34, 0.32, 0.16, 0.52, 0.86, 1.32, 0.2, 0.11, 1.19]} \ No newline at end of file diff --git a/annotations_1/hMGHJFVuqpg_filtered.json b/annotations_1/hMGHJFVuqpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d027acd110c88820a225f85f7f94c901af5d387 --- /dev/null +++ b/annotations_1/hMGHJFVuqpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.28], [21.0, 21.96], [23.0, 25.08], [27.0, 27.01], [33.0, 34.06], [35.0, 36.26], [37.0, 38.1], [39.0, 60.72], [61.0, 85.7], [88.0, 98.88], [102.0, 102.46], [105.0, 108.21], [114.0, 133.68], [134.0, 148.59], [151.0, 158.08], [160.0, 167.46], [171.0, 172.47], [175.0, 182.31], [184.0, 186.81], [190.0, 199.12], [200.0, 202.86], [203.0, 204.58], [205.0, 206.81], [210.0, 214.59], [218.0, 221.21], [226.0, 228.78], [233.0, 235.48], [238.0, 238.01], [241.0, 245.49], [248.0, 252.83], [254.0, 259.17], [263.0, 265.69]], "keep_status": [false, false, true, false, false, false, false, false, true, true, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 42.88, 0.0, 0.0, 0.0, 0.0, 34.68, 34.55, 33.64, 0.0, 36.2, 35.66, 30.97, 31.35, 33.99, 0.0, 31.94, 32.15, 46.29, 42.62, 0.0, 0.0, 72.01, 43.79, 85.54, 93.29, 0.0, 73.51, 48.44, 41.78, 72.31], "audiomae_on_audioset": [null, null, [["music", 45.19], ["throbbing", 7.36], ["hum", 6.57]], null, null, null, null, [["music", 71.44], ["speech", 5.61], ["theremin", 5.17]], [["music", 44.2], ["buzz", 18.5], ["speech", 6.84]], [["music", 49.59], ["speech", 11.38], ["hum", 5.08]], null, [["throbbing", 53.96], ["music", 32.6], ["hum", 5.02]], [["music", 67.38], ["throbbing", 4.96], ["hum", 4.72]], [["music", 61.5], ["throbbing", 12.8], ["hum", 3.27]], [["music", 40.9], ["throbbing", 7.58], ["hum", 6.95]], [["music", 35.59], ["hum", 27.24], ["mains hum", 15.1]], null, [["music", 39.44], ["speech", 21.0], ["throbbing", 7.9]], [["speech", 15.41], ["vehicle", 7.51], ["cattle, bovinae", 6.16]], [["music", 59.83], ["ambient music", 11.81], ["electronic music", 5.5]], [["ambient music", 34.0], ["music", 32.98], ["synthesizer", 7.32]], null, null, null, [["music", 68.58], ["synthesizer", 2.47], ["keyboard (musical)", 2.27]], null, null, null, null, [["music", 43.71], ["electric piano", 7.28], ["piano", 5.96]], [["music", 74.23], ["singing", 4.84], ["lullaby", 2.57]], null], "duration": [0.28, 0.96, 2.08, 0.01, 1.06, 1.26, 1.1, 21.72, 24.7, 10.88, 0.46, 3.21, 19.68, 14.59, 7.08, 7.46, 1.47, 7.31, 2.81, 9.12, 2.86, 1.58, 1.81, 4.59, 3.21, 2.78, 2.48, 0.01, 4.49, 4.83, 5.17, 2.69]} \ No newline at end of file diff --git a/annotations_1/hMbcMlAVxeg_filtered.json b/annotations_1/hMbcMlAVxeg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ded20533a58204d923ecdf005a319213c0dc5f1 --- /dev/null +++ b/annotations_1/hMbcMlAVxeg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 10.71], [11.0, 12.18], [14.0, 19.21], [21.0, 21.86], [26.0, 27.11], [29.0, 33.51], [34.0, 40.95], [45.0, 50.97], [51.0, 55.7], [58.0, 70.09], [70.0, 72.39], [73.0, 74.43], [75.0, 96.04]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [79.76, 0.0, 85.17, 0.0, 0.0, 42.65, 40.57, 35.18, 35.68, 38.15, 55.31, 0.0, 36.5], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 52.64], ["mains hum", 25.65], ["throbbing", 10.52]], [["hum", 25.48], ["speech", 22.0], ["mains hum", 15.87]], [["hum", 42.84], ["music", 22.25], ["throbbing", 6.8]], [["hum", 56.43], ["mains hum", 20.32], ["throbbing", 8.47]], [["hum", 62.93], ["throbbing", 14.2], ["mains hum", 7.21]], null, null, [["hum", 13.64], ["grunt", 13.19], ["noise", 5.78]]], "duration": [8.71, 1.18, 5.21, 0.86, 1.11, 4.51, 6.95, 5.97, 4.7, 12.09, 2.39, 1.43, 21.04]} \ No newline at end of file diff --git a/annotations_1/hN5We42pLhs_filtered.json b/annotations_1/hN5We42pLhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d375251d2c76f2aeed50c88e1c289998b6580015 --- /dev/null +++ b/annotations_1/hN5We42pLhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 59.73], [76.0, 76.57], [77.0, 83.15], [90.0, 90.56], [92.0, 93.19], [99.0, 99.62], [101.0, 102.54], [103.0, 104.11], [106.0, 107.1], [109.0, 110.1], [111.0, 111.72], [114.0, 114.13], [115.0, 118.66], [124.0, 123.6], [126.0, 126.17], [127.0, 127.65], [129.0, 133.22], [134.0, 136.16], [136.0, 137.73], [139.0, 140.66], [141.0, 150.65], [153.0, 152.95]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [30.97, 0.0, 33.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.68, 0.0, 0.0, 0.0, 41.76, 34.86, 0.0, 0.0, 30.28, 0.0], "audiomae_on_audioset": [[["thunk", 25.42], ["breaking", 14.07], ["music", 12.32]], null, [["music", 55.04], ["speech", 11.53], ["mains hum", 7.87]], null, null, null, null, null, null, null, null, null, [["breaking", 46.67], ["speech", 26.08], ["music", 13.84]], null, null, null, [["music", 36.53], ["singing bowl", 10.5], ["musical instrument", 5.42]], [["music", 48.62], ["speech", 12.87], ["didgeridoo", 8.27]], null, null, [["music", 42.41], ["speech", 32.47], ["didgeridoo", 7.83]], null], "duration": [27.73, 0.57, 6.15, 0.56, 1.19, 0.62, 1.54, 1.11, 1.1, 1.1, 0.72, 0.13, 3.66, -0.4, 0.17, 0.65, 4.22, 2.16, 1.73, 1.66, 9.65, -0.05]} \ No newline at end of file diff --git a/annotations_1/hOB4Qm1IiOY_filtered.json b/annotations_1/hOB4Qm1IiOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6abb8bf131f33a583a44ff77e73f6a137fc3b73 --- /dev/null +++ b/annotations_1/hOB4Qm1IiOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.36], [2.0, 4.89], [9.0, 9.19], [15.0, 16.31], [20.0, 21.49], [25.0, 27.67], [34.0, 35.73], [42.0, 43.9], [47.0, 48.71], [49.0, 49.76], [52.0, 52.81], [55.0, 56.05], [68.0, 68.44], [71.0, 71.25], [74.0, 78.09], [84.0, 85.09], [89.0, 91.62], [94.0, 96.94], [98.0, 102.69], [104.0, 112.04], [113.0, 115.42], [116.0, 116.88], [118.0, 124.48], [127.0, 128.9], [132.0, 138.21], [139.0, 141.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 70.58, 0.0, 0.0, 0.0, 64.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.71, 0.0, 47.66, 41.68, 72.31, 68.8, 69.88, 0.0, 74.76, 0.0, 81.35, 84.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.62], ["gong", 21.9], ["singing bowl", 20.09]], [["music", 53.87], ["ambient music", 10.51], ["sonar", 4.83]], null, null, null, null, null, null, null, null], "duration": [0.36, 2.89, 0.19, 1.31, 1.49, 2.67, 1.73, 1.9, 1.71, 0.76, 0.81, 1.05, 0.44, 0.25, 4.09, 1.09, 2.62, 2.94, 4.69, 8.04, 2.42, 0.88, 6.48, 1.9, 6.21, 2.08]} \ No newline at end of file diff --git a/annotations_1/hOH-oOCfsX4_filtered.json b/annotations_1/hOH-oOCfsX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b9e7837ef5e3bdd8f03a277f3bfca833737c473 --- /dev/null +++ b/annotations_1/hOH-oOCfsX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.38], [11.0, 11.47], [12.0, 12.48], [16.0, 19.92], [21.0, 48.51], [53.0, 67.12], [107.0, 157.01], [158.0, 159.54], [162.0, 164.39], [165.0, 168.34]], "keep_status": [true, false, false, true, true, true, false, false, true, true], "silence_prob": [33.71, 0.0, 0.0, 31.08, 34.29, 33.1, 0.0, 0.0, 31.05, 31.75], "audiomae_on_audioset": [[["speech", 47.41], ["creak", 7.09], ["livestock, farm animals, working animals", 6.93]], null, null, [["livestock, farm animals, working animals", 30.6], ["cattle, bovinae", 21.2], ["moo", 12.77]], [["animal", 24.77], ["horse", 20.29], ["clip-clop", 18.36]], [["speech", 37.4], ["clip-clop", 7.17], ["animal", 6.69]], null, null, [["hum", 21.87], ["speech", 16.82], ["throbbing", 16.41]], [["cattle, bovinae", 36.39], ["moo", 14.44], ["livestock, farm animals, working animals", 10.29]]], "duration": [3.38, 0.47, 0.48, 3.92, 27.51, 14.12, 50.01, 1.54, 2.39, 3.34]} \ No newline at end of file diff --git a/annotations_1/hQIL99lP484_filtered.json b/annotations_1/hQIL99lP484_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2020207d29bffea14deeced76f7b23ef3931d5b3 --- /dev/null +++ b/annotations_1/hQIL99lP484_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.74], [19.0, 19.26], [30.0, 31.53], [32.0, 32.27], [38.0, 38.72], [40.0, 40.85], [45.0, 50.08], [52.0, 56.64], [63.0, 63.04], [67.0, 72.52], [76.0, 77.25], [80.0, 80.54], [82.0, 82.56], [84.0, 87.54], [92.0, 99.5], [103.0, 105.38], [106.0, 111.16], [115.0, 124.82], [126.0, 131.68], [132.0, 134.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true, true], "silence_prob": [90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 55.53, 54.23, 0.0, 70.02, 0.0, 0.0, 0.0, 65.79, 60.6, 45.69, 33.51, 30.5, 35.2, 36.4], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.41], ["speech", 7.85], ["theremin", 5.95]], [["speech", 25.99], ["groan", 23.86], ["music", 18.32]], [["music", 23.68], ["vehicle", 22.56], ["car", 15.98]], [["music", 34.16], ["speech", 15.05], ["livestock, farm animals, working animals", 7.08]], [["moo", 18.41], ["music", 17.97], ["speech", 16.36]]], "duration": [2.74, 0.26, 1.53, 0.27, 0.72, 0.85, 5.08, 4.64, 0.04, 5.52, 1.25, 0.54, 0.56, 3.54, 7.5, 2.38, 5.16, 9.82, 5.68, 2.7]} \ No newline at end of file diff --git a/annotations_1/hQUBid6LIPU_filtered.json b/annotations_1/hQUBid6LIPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29b9694a9094fc8eee7b23fd99a393a1398714ef --- /dev/null +++ b/annotations_1/hQUBid6LIPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.56], [34.0, 39.11], [42.0, 43.14], [45.0, 48.05], [51.0, 52.71], [54.0, 57.28], [61.0, 62.99], [64.0, 65.92], [66.0, 67.39], [69.0, 71.24], [74.0, 75.81], [78.0, 84.65], [88.0, 89.85], [92.0, 93.85], [96.0, 99.15], [103.0, 105.33], [107.0, 107.0], [109.0, 111.25], [114.0, 115.84], [117.0, 118.2], [119.0, 120.97], [122.0, 127.01], [128.0, 129.32], [130.0, 131.43], [132.0, 134.72], [136.0, 143.01], [143.0, 151.44], [154.0, 154.95], [159.0, 159.46], [160.0, 162.94], [166.0, 167.85], [169.0, 174.93], [177.0, 183.95], [185.0, 188.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.41, 0.0, 99.92, 0.0, 79.41, 0.0, 0.0, 0.0, 94.37, 0.0, 86.45, 0.0, 0.0, 99.95, 99.95, 0.0, 99.78, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 99.05, 77.2, 93.29, 0.0, 0.0, 56.18, 0.0, 99.96, 99.97, 99.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 5.11, 1.14, 3.05, 1.71, 3.28, 1.99, 1.92, 1.39, 2.24, 1.81, 6.65, 1.85, 1.85, 3.15, 2.33, 0.0, 2.25, 1.84, 1.2, 1.97, 5.01, 1.32, 1.43, 2.72, 7.01, 8.44, 0.95, 0.46, 2.94, 1.85, 5.93, 6.95, 3.3]} \ No newline at end of file diff --git a/annotations_1/hQmDmh3qA6s_filtered.json b/annotations_1/hQmDmh3qA6s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1569b72b3a07196b9422a8aee332d358e3bdaedc --- /dev/null +++ b/annotations_1/hQmDmh3qA6s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 40.24], [42.0, 42.89], [47.0, 47.73], [49.0, 49.92], [54.0, 61.3], [63.0, 76.25], [79.0, 78.97], [82.0, 84.3], [85.0, 85.73], [87.0, 87.49], [89.0, 90.29], [91.0, 91.81], [94.0, 94.91], [100.0, 100.72], [107.0, 107.6], [115.0, 115.89], [117.0, 118.22], [121.0, 126.94], [127.0, 131.46]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.88, 0.0, 0.0, 0.0, 50.56, 32.0, 0.0, 38.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.16, 34.31], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 43.24], ["music", 30.16], ["explosion", 5.38]], null, [["speech", 51.27], ["eruption", 4.83], ["hum", 2.5]], null, null, null, null, null, null, null, null, null, [["speech", 92.67], ["fart", 1.61], ["whack, thwack", 0.67]], [["speech", 42.51], ["animal", 15.51], ["dog", 13.35]]], "duration": [5.24, 0.89, 0.73, 0.92, 7.3, 13.25, -0.03, 2.3, 0.73, 0.49, 1.29, 0.81, 0.91, 0.72, 0.6, 0.89, 1.22, 5.94, 4.46]} \ No newline at end of file diff --git a/annotations_1/hR4oc1us1aU_filtered.json b/annotations_1/hR4oc1us1aU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf6cf1a3c7d574b2362f625a1996c810d812535c --- /dev/null +++ b/annotations_1/hR4oc1us1aU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.4], [10.0, 10.02], [10.0, 11.16], [12.0, 12.29], [13.0, 13.39], [24.0, 25.1], [44.0, 44.85], [47.0, 53.03], [54.0, 54.97], [60.0, 61.23], [63.0, 64.66], [67.0, 67.2], [71.0, 71.17], [75.0, 80.28], [90.0, 92.82], [98.0, 101.98], [104.0, 109.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.43, 0.0, 0.0, 0.0, 0.0, 0.0, 31.91, 29.86, 29.52, 29.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["explosion", 45.36], ["speech", 20.66], ["burst, pop", 8.14]], null, null, null, null, null, [["speech", 65.18], ["groan", 5.43], ["music", 5.24]], [["music", 30.61], ["speech", 27.36], ["whack, thwack", 12.88]], [["speech", 37.32], ["explosion", 9.47], ["whack, thwack", 9.06]], [["whack, thwack", 48.64], ["speech", 10.46], ["thunk", 7.69]]], "duration": [0.4, 0.02, 1.16, 0.29, 0.39, 1.1, 0.85, 6.03, 0.97, 1.23, 1.66, 0.2, 0.17, 5.28, 2.82, 3.98, 5.21]} \ No newline at end of file diff --git a/annotations_1/hRfF8Kes77E_filtered.json b/annotations_1/hRfF8Kes77E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55014348cd1511c261217b2d2c37301f133262cb --- /dev/null +++ b/annotations_1/hRfF8Kes77E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.85], [12.0, 19.82], [22.0, 24.73], [25.0, 26.5], [31.0, 32.58], [49.0, 49.13], [49.0, 53.45], [54.0, 54.26], [61.0, 74.44], [77.0, 77.84], [82.0, 83.51], [89.0, 114.47], [115.0, 117.64], [119.0, 119.1], [119.0, 136.61]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 35.76, 31.23, 0.0, 0.0, 0.0, 38.8, 0.0, 33.02, 0.0, 0.0, 32.13, 36.89, 0.0, 44.09], "audiomae_on_audioset": [null, [["music", 18.0], ["whale vocalization", 14.99], ["noise", 10.6]], [["noise", 31.76], ["grunt", 12.71], ["whale vocalization", 12.45]], null, null, null, [["speech", 43.37], ["music", 34.79], ["electronic music", 2.22]], null, [["speech", 51.42], ["music", 23.18], ["noise", 5.15]], null, null, [["music", 26.87], ["buzz", 16.64], ["speech", 7.39]], [["whale vocalization", 11.03], ["music", 10.39], ["mosquito", 5.55]], null, [["music", 49.78], ["electronic music", 9.79], ["ambient music", 4.97]]], "duration": [1.85, 7.82, 2.73, 1.5, 1.58, 0.13, 4.45, 0.26, 13.44, 0.84, 1.51, 25.47, 2.64, 0.1, 17.61]} \ No newline at end of file diff --git a/annotations_1/hRg2HEpwD5A_filtered.json b/annotations_1/hRg2HEpwD5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfa6152dfe8dc796de959bc15a842d3f7224073d --- /dev/null +++ b/annotations_1/hRg2HEpwD5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [7.0, 8.46], [9.0, 10.05], [12.0, 12.09], [13.0, 14.49], [16.0, 17.59], [23.0, 49.96], [53.0, 58.06], [64.0, 82.44], [82.0, 82.48], [82.0, 82.51], [83.0, 119.91], [120.0, 120.26], [121.0, 138.69], [139.0, 143.16], [144.0, 150.25], [153.0, 161.5], [163.0, 168.67]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.62, 33.14, 30.91, 0.0, 0.0, 0.0, 0.0, 30.78, 30.77, 31.48, 38.94, 57.17], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 50.33], ["whack, thwack", 7.67], ["hum", 4.26]], [["boing", 25.77], ["crowd", 18.94], ["speech", 10.96]], [["music", 27.81], ["whack, thwack", 6.6], ["speech", 3.9]], null, null, null, null, [["music", 56.03], ["speech", 9.94], ["animal", 5.01]], [["vehicle", 34.54], ["motorcycle", 9.94], ["car", 7.87]], [["music", 46.87], ["speech", 7.57], ["explosion", 6.4]], [["sidetone", 26.51], ["noise", 6.58], ["cacophony", 6.44]], null], "duration": [0.74, 1.46, 1.05, 0.09, 1.49, 1.59, 26.96, 5.06, 18.44, 0.48, 0.51, 36.91, 0.26, 17.69, 4.16, 6.25, 8.5, 5.67]} \ No newline at end of file diff --git a/annotations_1/hSBoEivF-hk_filtered.json b/annotations_1/hSBoEivF-hk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29b1d0ccbc8f18c31c075b8791df88ba75732a06 --- /dev/null +++ b/annotations_1/hSBoEivF-hk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 34.8], [36.0, 36.54], [37.0, 50.85], [52.0, 78.14], [87.0, 89.02], [91.0, 97.34], [99.0, 99.52], [102.0, 103.57], [104.0, 111.18], [111.0, 111.52], [112.0, 114.08], [115.0, 115.3], [116.0, 116.45], [119.0, 122.89], [125.0, 126.45]], "keep_status": [false, false, true, true, true, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 30.44, 30.09, 29.49, 31.37, 0.0, 0.0, 30.55, 0.0, 33.62, 0.0, 0.0, 31.65, 0.0], "audiomae_on_audioset": [null, null, [["music", 29.98], ["buzz", 8.04], ["radio", 5.41]], [["music", 60.45], ["livestock, farm animals, working animals", 4.83], ["moo", 4.44]], [["music", 52.76], ["musical instrument", 6.42], ["trombone", 3.89]], [["music", 32.47], ["brass instrument", 18.27], ["speech", 11.0]], null, null, [["music", 47.31], ["speech", 28.52], ["foghorn", 5.95]], null, [["speech", 14.56], ["music", 13.8], ["moo", 5.78]], null, null, [["music", 70.42], ["theremin", 7.87], ["musical instrument", 6.05]], null], "duration": [30.8, 0.54, 13.85, 26.14, 2.02, 6.34, 0.52, 1.57, 7.18, 0.52, 2.08, 0.3, 0.45, 3.89, 1.45]} \ No newline at end of file diff --git a/annotations_1/hT_CiaTcnN8_filtered.json b/annotations_1/hT_CiaTcnN8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..077a548041060754c53887194022e334d50e2795 --- /dev/null +++ b/annotations_1/hT_CiaTcnN8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 22.15], [23.0, 30.0], [30.0, 32.16], [32.0, 33.98], [40.0, 41.59], [48.0, 58.6]], "keep_status": [true, false, false, false, false, true], "silence_prob": [29.99, 28.94, 30.07, 0.0, 0.0, 29.24], "audiomae_on_audioset": [[["music", 36.18], ["speech", 18.08], ["didgeridoo", 11.79]], [["mains hum", 34.1], ["music", 20.53], ["hum", 15.9]], [["music", 43.76], ["speech", 21.93], ["sidetone", 13.01]], null, null, [["speech", 21.27], ["music", 20.28], ["throbbing", 19.16]]], "duration": [11.15, 7.0, 2.16, 1.98, 1.59, 10.6]} \ No newline at end of file diff --git a/annotations_1/hT_G4j4nI-8_filtered.json b/annotations_1/hT_G4j4nI-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6ac2f2b38e14c1fb983f32cfb087dad7ddc743e --- /dev/null +++ b/annotations_1/hT_G4j4nI-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.08], [23.0, 25.46], [32.0, 32.66], [45.0, 50.95], [57.0, 60.25]], "keep_status": [false, true, false, true, true], "silence_prob": [0.0, 40.24, 0.0, 32.29, 30.71], "audiomae_on_audioset": [null, [["music", 20.18], ["fart", 9.66], ["speech", 8.36]], null, [["speech", 35.1], ["music", 7.83], ["sidetone", 6.26]], [["crowd", 15.83], ["echo", 11.27], ["cheering", 10.92]]], "duration": [1.08, 2.46, 0.66, 5.95, 3.25]} \ No newline at end of file diff --git a/annotations_1/hTpVCu5DzpA_filtered.json b/annotations_1/hTpVCu5DzpA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8958d44d8245339b1c83b68cc0de7e61e834dc18 --- /dev/null +++ b/annotations_1/hTpVCu5DzpA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 26.62], [28.0, 28.16], [30.0, 30.48], [32.0, 33.57], [35.0, 72.93], [76.0, 78.02], [79.0, 105.61], [106.0, 113.51], [117.0, 118.39], [119.0, 148.76], [150.0, 158.01]], "keep_status": [true, false, false, false, false, true, false, true, false, false, true], "silence_prob": [31.48, 0.0, 0.0, 0.0, 0.0, 31.66, 31.98, 30.83, 0.0, 31.36, 32.9], "audiomae_on_audioset": [[["music", 54.31], ["vehicle", 6.63], ["carnatic music", 4.27]], null, null, null, null, [["music", 48.03], ["throbbing", 11.77], ["roar", 9.11]], [["boing", 77.74], ["music", 12.76], ["cattle, bovinae", 2.38]], [["music", 26.53], ["sidetone", 26.3], ["throbbing", 10.28]], null, [["speech", 41.31], ["music", 27.3], ["throbbing", 4.04]], [["livestock, farm animals, working animals", 38.05], ["cattle, bovinae", 16.28], ["moo", 10.29]]], "duration": [18.62, 0.16, 0.48, 1.57, 37.93, 2.02, 26.61, 7.51, 1.39, 29.76, 8.01]} \ No newline at end of file diff --git a/annotations_1/hTzUYt__ogY_filtered.json b/annotations_1/hTzUYt__ogY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d248a78efdac0411978a997ff02929cef89816c --- /dev/null +++ b/annotations_1/hTzUYt__ogY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 21.57], [22.0, 23.72], [24.0, 24.93]], "keep_status": [false, false, false], "silence_prob": [60.42, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [3.57, 1.72, 0.93]} \ No newline at end of file diff --git a/annotations_1/hV55sjy1QFI_filtered.json b/annotations_1/hV55sjy1QFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ad3e10d5a9ef7d9c98197e1a62304fcfff71208 --- /dev/null +++ b/annotations_1/hV55sjy1QFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [6.0, 6.83], [15.0, 17.44], [35.0, 35.8], [36.0, 36.85], [38.0, 44.31], [60.0, 60.54], [65.0, 65.08], [68.0, 69.58], [76.0, 91.32], [94.0, 94.85], [96.0, 96.79], [98.0, 99.1], [103.0, 103.44], [104.0, 108.35], [112.0, 112.67], [122.0, 135.41], [136.0, 138.81], [140.0, 144.85], [146.0, 146.96], [150.0, 154.75], [156.0, 166.18]], "keep_status": [false, false, true, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 29.66, 0.0, 0.0, 28.86, 0.0, 0.0, 0.0, 29.98, 0.0, 0.0, 0.0, 0.0, 34.95, 0.0, 30.67, 34.48, 30.11, 0.0, 30.59, 30.14], "audiomae_on_audioset": [null, null, [["music", 25.73], ["smash, crash", 18.21], ["speech", 14.23]], null, null, [["music", 30.26], ["skidding", 17.45], ["vehicle", 14.04]], null, null, null, [["music", 72.44], ["throbbing", 6.23], ["didgeridoo", 4.95]], null, null, null, null, [["speech", 21.53], ["music", 19.89], ["throbbing", 13.12]], null, [["music", 71.59], ["hum", 6.78], ["speech", 5.89]], [["music", 39.38], ["speech", 22.66], ["throbbing", 8.44]], [["music", 44.92], ["throbbing", 8.31], ["techno", 6.89]], null, [["music", 36.58], ["speech", 18.54], ["throbbing", 16.99]], [["music", 69.53], ["throbbing", 11.0], ["soundtrack music", 3.8]]], "duration": [0.5, 0.83, 2.44, 0.8, 0.85, 6.31, 0.54, 0.08, 1.58, 15.32, 0.85, 0.79, 1.1, 0.44, 4.35, 0.67, 13.41, 2.81, 4.85, 0.96, 4.75, 10.18]} \ No newline at end of file diff --git a/annotations_1/hX-ezXejcU0_filtered.json b/annotations_1/hX-ezXejcU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..808566eee2af3aeb88e29e43f5ed39783a259f2f --- /dev/null +++ b/annotations_1/hX-ezXejcU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 28.36], [37.0, 38.92], [39.0, 38.96], [39.0, 39.41], [39.0, 78.95], [81.0, 89.88], [90.0, 90.69], [92.0, 92.69], [94.0, 94.74], [97.0, 98.0], [98.0, 155.66]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [29.63, 0.0, 0.0, 0.0, 0.0, 30.48, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 38.6], ["drum", 6.31], ["speech", 5.3]], null, null, null, null, [["music", 23.46], ["boing", 15.11], ["whack, thwack", 13.81]], null, null, null, null, null], "duration": [15.36, 1.92, -0.04, 0.41, 39.95, 8.88, 0.69, 0.69, 0.74, 1.0, 57.66]} \ No newline at end of file diff --git a/annotations_1/hYIWCm-Lpj0_filtered.json b/annotations_1/hYIWCm-Lpj0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96b28153575eb8c0d9075a2f41262cdf03c27521 --- /dev/null +++ b/annotations_1/hYIWCm-Lpj0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.71], [14.0, 19.99], [28.0, 28.83], [32.0, 43.28], [45.0, 45.55], [47.0, 47.75], [51.0, 51.56], [55.0, 55.88], [59.0, 63.78], [69.0, 69.25], [73.0, 76.62], [78.0, 78.81], [80.0, 87.81], [90.0, 90.59], [107.0, 106.83], [112.0, 114.47], [116.0, 117.9], [119.0, 121.34], [126.0, 126.98], [130.0, 130.77], [132.0, 132.02], [134.0, 134.77], [137.0, 137.25], [144.0, 143.75], [150.0, 152.29], [153.0, 154.52], [165.0, 165.82]], "keep_status": [false, true, false, false, false, false, false, false, true, false, true, false, true, false, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.92, 0.0, 30.75, 0.0, 0.0, 0.0, 0.0, 29.8, 0.0, 29.92, 0.0, 34.98, 0.0, 0.0, 49.73, 0.0, 46.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.1, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 47.87], ["vehicle", 12.39], ["boat, water vehicle", 2.92]], null, [["speech", 73.62], ["crowd", 2.57], ["horse", 2.46]], null, null, null, null, [["cattle, bovinae", 35.2], ["moo", 15.12], ["speech", 14.59]], null, [["zipper (clothing)", 12.76], ["music", 9.28], ["cacophony", 7.65]], null, [["hum", 26.16], ["noise", 21.96], ["mains hum", 7.98]], null, null, [["hum", 22.96], ["music", 10.83], ["mains hum", 8.11]], null, [["theremin", 19.18], ["music", 17.08], ["speech", 14.24]], null, null, null, null, null, null, null, null, null], "duration": [0.71, 5.99, 0.83, 11.28, 0.55, 0.75, 0.56, 0.88, 4.78, 0.25, 3.62, 0.81, 7.81, 0.59, -0.17, 2.47, 1.9, 2.34, 0.98, 0.77, 0.02, 0.77, 0.25, -0.25, 2.29, 1.52, 0.82]} \ No newline at end of file diff --git a/annotations_1/hYvxbtiGvrk_filtered.json b/annotations_1/hYvxbtiGvrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dc827a8e782c07f5690eac1c3324252f01353bf --- /dev/null +++ b/annotations_1/hYvxbtiGvrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.11], [24.0, 24.44], [26.0, 26.4], [28.0, 29.0], [29.0, 29.66], [30.0, 31.87], [33.0, 44.9], [46.0, 51.04], [53.0, 142.74]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.77, 30.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 36.58], ["didgeridoo", 24.67], ["speech", 14.35]], [["music", 63.34], ["speech", 11.99], ["musical instrument", 6.25]], null], "duration": [0.11, 0.44, 0.4, 1.0, 0.66, 1.87, 11.9, 5.04, 89.74]} \ No newline at end of file diff --git a/annotations_1/hZPz4w3jLXI_filtered.json b/annotations_1/hZPz4w3jLXI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..328cf06263ae313c23e526456119047eb0231297 --- /dev/null +++ b/annotations_1/hZPz4w3jLXI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.83], [6.0, 6.83], [8.0, 8.65], [14.0, 21.34], [23.0, 24.17], [30.0, 35.45], [38.0, 39.7], [42.0, 42.85], [43.0, 46.89], [47.0, 49.45], [50.0, 50.84], [51.0, 52.3], [55.0, 55.66], [56.0, 56.24], [59.0, 60.03], [64.0, 64.84], [69.0, 74.98], [75.0, 75.02], [76.0, 88.6], [93.0, 93.66], [94.0, 94.31], [95.0, 96.48], [98.0, 99.52], [102.0, 104.01], [106.0, 106.19], [106.0, 114.44], [116.0, 119.03], [122.0, 123.28], [126.0, 127.52], [129.0, 130.0], [131.0, 131.99], [134.0, 135.58], [136.0, 140.09], [141.0, 142.28], [144.0, 144.41], [146.0, 150.03], [153.0, 153.12], [154.0, 154.23]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 58.3, 0.0, 63.53, 0.0, 0.0, 40.55, 40.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.92, 0.0, 36.85, 0.0, 0.0, 0.0, 0.0, 41.44, 0.0, 30.34, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 91.13, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["cattle, bovinae", 37.56], ["moo", 21.32], ["livestock, farm animals, working animals", 14.79]], [["speech", 24.41], ["cattle, bovinae", 10.49], ["moo", 9.48]], null, null, null, null, null, null, null, null, [["music", 69.61], ["musical instrument", 5.45], ["effects unit", 2.87]], null, null, null, null, [["speech", 26.01], ["breaking", 19.97], ["smash, crash", 6.83]], null, [["whack, thwack", 10.79], ["livestock, farm animals, working animals", 8.66], ["boing", 8.31]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 0.83, 0.65, 7.34, 1.17, 5.45, 1.7, 0.85, 3.89, 2.45, 0.84, 1.3, 0.66, 0.24, 1.03, 0.84, 5.98, 0.02, 12.6, 0.66, 0.31, 1.48, 1.52, 2.01, 0.19, 8.44, 3.03, 1.28, 1.52, 1.0, 0.99, 1.58, 4.09, 1.28, 0.41, 4.03, 0.12, 0.23]} \ No newline at end of file diff --git a/annotations_1/hZvud4MnaQ0_filtered.json b/annotations_1/hZvud4MnaQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef73b3da0ce680289af3ae6d1b20e4075e25d89 --- /dev/null +++ b/annotations_1/hZvud4MnaQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.4], [12.0, 11.75], [13.0, 13.19], [16.0, 17.0], [20.0, 20.46], [22.0, 22.92], [26.0, 27.75], [31.0, 33.84], [38.0, 46.9], [47.0, 48.27], [49.0, 49.62], [50.0, 51.24], [58.0, 79.17], [80.0, 82.78], [85.0, 86.12], [88.0, 88.3], [93.0, 96.03], [97.0, 98.32], [99.0, 101.58], [102.0, 102.24], [102.0, 105.56], [106.0, 108.53], [110.0, 114.45], [116.0, 124.19], [125.0, 135.99], [138.0, 143.77], [146.0, 147.16], [149.0, 150.06], [151.0, 151.93]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [29.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.33, 32.35, 0.0, 0.0, 0.0, 28.47, 35.45, 0.0, 0.0, 86.82, 0.0, 98.1, 0.0, 68.67, 87.92, 76.37, 68.02, 63.42, 46.83, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 40.31], ["rumble", 6.58], ["speech", 5.59]], null, null, null, null, null, null, null, [["speech", 70.26], ["music", 12.47], ["breaking", 5.26]], null, null, null, [["hum", 40.87], ["throbbing", 22.56], ["mains hum", 20.06]], [["music", 41.98], ["musical instrument", 8.45], ["ambient music", 6.42]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 23.07], ["music", 20.1], ["speech", 15.23]], null, null, null], "duration": [4.4, -0.25, 0.19, 1.0, 0.46, 0.92, 1.75, 2.84, 8.9, 1.27, 0.62, 1.24, 21.17, 2.78, 1.12, 0.3, 3.03, 1.32, 2.58, 0.24, 3.56, 2.53, 4.45, 8.19, 10.99, 5.77, 1.16, 1.06, 0.93]} \ No newline at end of file diff --git a/annotations_1/haX0ACElUQc_filtered.json b/annotations_1/haX0ACElUQc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49545b65ffef7d847d7fe29899b5a41a15313706 --- /dev/null +++ b/annotations_1/haX0ACElUQc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.22], [16.0, 22.37], [32.0, 33.54], [38.0, 38.1], [39.0, 39.73], [40.0, 40.14], [42.0, 46.43], [50.0, 50.18], [54.0, 54.77], [61.0, 68.35], [71.0, 71.66], [72.0, 73.09], [73.0, 74.49], [75.0, 76.37], [77.0, 84.1], [86.0, 86.86], [88.0, 98.07], [102.0, 103.23]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.44, 0.0, 0.0, 0.0, 0.0, 63.53, 0.0, 0.0, 55.46, 0.0, 0.0, 0.0, 0.0, 38.68, 0.0, 32.37, 0.0], "audiomae_on_audioset": [null, [["speech", 35.92], ["tap", 15.64], ["clapping", 9.87]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.8], ["hum", 30.96], ["mains hum", 15.32]], null, [["hum", 39.68], ["mains hum", 36.23], ["white noise", 3.05]], null], "duration": [0.22, 6.37, 1.54, 0.1, 0.73, 0.14, 4.43, 0.18, 0.77, 7.35, 0.66, 1.09, 1.49, 1.37, 7.1, 0.86, 10.07, 1.23]} \ No newline at end of file diff --git a/annotations_1/hbDdiPNS3ck_filtered.json b/annotations_1/hbDdiPNS3ck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa4a606c51e3a2f4494e1a3ce782f0bac85aa3c7 --- /dev/null +++ b/annotations_1/hbDdiPNS3ck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.93], [21.0, 28.48], [33.0, 33.42], [36.0, 36.42], [38.0, 38.33], [42.0, 41.96], [46.0, 45.96], [48.0, 49.03], [54.0, 54.6], [56.0, 57.01], [61.0, 60.76]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["whack, thwack", 13.14], ["throbbing", 11.0], ["breaking", 10.86]], null, null, null, null, null, null, null, null, null], "duration": [0.93, 7.48, 0.42, 0.42, 0.33, -0.04, -0.04, 1.03, 0.6, 1.01, -0.24]} \ No newline at end of file diff --git a/annotations_1/hcWY1CYRCsw_filtered.json b/annotations_1/hcWY1CYRCsw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37045782e42e9921f4742dab20efd3c717f1cbba --- /dev/null +++ b/annotations_1/hcWY1CYRCsw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 37.49], [42.0, 43.09], [48.0, 48.66], [52.0, 68.28], [72.0, 92.25], [94.0, 100.38]], "keep_status": [true, false, false, false, false, false], "silence_prob": [29.41, 0.0, 0.0, 28.87, 31.65, 52.92], "audiomae_on_audioset": [[["music", 42.77], ["synthesizer", 9.65], ["hum", 8.61]], null, null, [["music", 36.64], ["speech", 34.95], ["fart", 2.1]], [["music", 48.54], ["sonar", 17.59], ["synthesizer", 4.04]], null], "duration": [14.49, 1.09, 0.66, 16.28, 20.25, 6.38]} \ No newline at end of file diff --git a/annotations_1/hcb0vROvmWk_filtered.json b/annotations_1/hcb0vROvmWk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e09e8d286fb55c7bf396154fb20c58a128d36d74 --- /dev/null +++ b/annotations_1/hcb0vROvmWk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 45.55], [49.0, 50.28], [52.0, 90.44], [92.0, 106.52], [107.0, 107.59]], "keep_status": [false, false, false, true, false], "silence_prob": [30.53, 0.0, 0.0, 38.88, 0.0], "audiomae_on_audioset": [[["music", 56.92], ["boing", 30.71], ["echo", 1.58]], null, null, [["hum", 18.19], ["music", 15.01], ["fly, housefly", 12.62]], null], "duration": [9.55, 1.28, 38.44, 14.52, 0.59]} \ No newline at end of file diff --git a/annotations_1/hck3C2VMRzk_filtered.json b/annotations_1/hck3C2VMRzk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4aac57e2c000d1a2c4424163fc6b6b5e51917c3 --- /dev/null +++ b/annotations_1/hck3C2VMRzk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.13], [10.0, 14.35], [24.0, 25.03], [28.0, 33.27], [41.0, 46.53], [51.0, 57.3], [58.0, 58.75], [71.0, 77.38], [81.0, 81.97], [89.0, 89.11], [99.0, 102.69], [107.0, 121.81], [124.0, 126.66], [127.0, 131.11]], "keep_status": [true, true, false, true, true, true, false, true, false, false, false, true, true, false], "silence_prob": [35.57, 35.16, 0.0, 31.04, 31.02, 30.4, 0.0, 33.14, 0.0, 0.0, 30.53, 30.3, 31.33, 31.06], "audiomae_on_audioset": [[["creak", 25.05], ["music", 9.17], ["smash, crash", 7.1]], [["music", 23.96], ["fly, housefly", 19.43], ["insect", 19.27]], null, [["music", 35.78], ["speech", 30.37], ["fart", 3.27]], [["music", 33.65], ["speech", 20.78], ["throbbing", 10.83]], [["speech", 37.93], ["music", 13.98], ["hum", 9.87]], null, [["music", 43.38], ["fly, housefly", 11.53], ["speech", 4.51]], null, null, [["music", 71.43], ["speech", 12.51], ["scratching (performance technique)", 3.31]], [["music", 48.52], ["tabla", 9.35], ["percussion", 5.9]], [["music", 22.19], ["fly, housefly", 13.33], ["boing", 12.65]], [["music", 58.17], ["thunk", 8.43], ["speech", 5.9]]], "duration": [3.13, 4.35, 1.03, 5.27, 5.53, 6.3, 0.75, 6.38, 0.97, 0.11, 3.69, 14.81, 2.66, 4.11]} \ No newline at end of file diff --git a/annotations_1/hdQOL2aFufE_filtered.json b/annotations_1/hdQOL2aFufE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fdceb9e607de23aa08f9a6d226edc6752af1ab0 --- /dev/null +++ b/annotations_1/hdQOL2aFufE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [6.0, 6.99], [12.0, 12.43], [16.0, 16.12], [38.0, 38.42], [54.0, 54.53], [55.0, 55.78], [58.0, 58.82], [63.0, 64.35], [67.0, 67.41], [69.0, 69.2], [71.0, 71.73], [73.0, 73.77], [74.0, 76.4], [78.0, 78.48], [88.0, 88.48], [91.0, 91.57], [98.0, 98.25], [102.0, 102.96], [104.0, 103.87], [105.0, 105.29], [109.0, 109.32], [110.0, 110.98], [113.0, 113.95], [116.0, 115.96], [117.0, 118.62], [122.0, 122.17], [123.0, 124.61], [127.0, 127.92], [132.0, 133.27], [135.0, 136.16], [138.0, 140.78], [143.0, 144.48], [146.0, 147.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.99, 0.43, 0.12, 0.42, 0.53, 0.78, 0.82, 1.35, 0.41, 0.2, 0.73, 0.77, 2.4, 0.48, 0.48, 0.57, 0.25, 0.96, -0.13, 0.29, 0.32, 0.98, 0.95, -0.04, 1.62, 0.17, 1.61, 0.92, 1.27, 1.16, 2.78, 1.48, 1.26]} \ No newline at end of file diff --git a/annotations_1/hdnrorjl0WM_filtered.json b/annotations_1/hdnrorjl0WM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5858776ba293db95241a421df92462f3475a8b13 --- /dev/null +++ b/annotations_1/hdnrorjl0WM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 21.68], [23.0, 24.78], [31.0, 32.12], [37.0, 37.94], [42.0, 42.9], [44.0, 47.29], [49.0, 53.05], [54.0, 55.97], [57.0, 57.15], [58.0, 59.88], [61.0, 60.59], [61.0, 60.79], [62.0, 64.12], [65.0, 65.35], [68.0, 69.92], [71.0, 72.45], [77.0, 77.48], [79.0, 84.99], [89.0, 92.06], [95.0, 95.27], [96.0, 96.75], [99.0, 101.31], [105.0, 106.66], [114.0, 115.6], [117.0, 118.79], [121.0, 121.41], [127.0, 130.13], [132.0, 132.71], [137.0, 136.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.8, 0.0, 0.0, 0.0, 0.0, 100.0, 90.25, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.91, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 72.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.68, 1.78, 1.12, 0.94, 0.9, 3.29, 4.05, 1.97, 0.15, 1.88, -0.41, -0.21, 2.12, 0.35, 1.92, 1.45, 0.48, 5.99, 3.06, 0.27, 0.75, 2.31, 1.66, 1.6, 1.79, 0.41, 3.13, 0.71, -0.08]} \ No newline at end of file diff --git a/annotations_1/hf1wQVWs0DA_filtered.json b/annotations_1/hf1wQVWs0DA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7d1fd5f0c5c0eac33b5ca51fd1239ba8683aafb --- /dev/null +++ b/annotations_1/hf1wQVWs0DA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.59], [4.0, 4.63], [8.0, 8.83], [15.0, 15.13], [18.0, 18.23], [19.0, 20.39], [21.0, 21.17], [23.0, 23.87], [25.0, 25.78], [28.0, 29.79], [31.0, 31.36], [33.0, 33.88], [34.0, 35.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 0.63, 0.83, 0.13, 0.23, 1.39, 0.17, 0.87, 0.78, 1.79, 0.36, 0.88, 1.75]} \ No newline at end of file diff --git a/annotations_1/hfNlv4HLZ5k_filtered.json b/annotations_1/hfNlv4HLZ5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1696f38f44983753c248e21a3b1bd5e7b6e6c28e --- /dev/null +++ b/annotations_1/hfNlv4HLZ5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.05], [14.0, 15.35], [17.0, 17.88], [19.0, 20.38], [21.0, 22.99], [23.0, 24.21], [28.0, 29.98], [32.0, 33.29], [34.0, 37.71], [38.0, 47.48], [49.0, 51.29], [53.0, 55.09], [56.0, 56.13], [57.0, 57.87], [59.0, 60.35], [63.0, 64.02], [66.0, 67.07], [68.0, 68.86], [70.0, 70.33], [71.0, 72.18], [74.0, 76.03], [77.0, 80.1], [82.0, 83.27], [85.0, 86.9], [87.0, 93.6], [95.0, 96.01]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.95, 50.02, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 98.19, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["dial tone", 44.93], ["busy signal", 9.39], ["speech", 6.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 1.35, 0.88, 1.38, 1.99, 1.21, 1.98, 1.29, 3.71, 9.48, 2.29, 2.09, 0.13, 0.87, 1.35, 1.02, 1.07, 0.86, 0.33, 1.18, 2.03, 3.1, 1.27, 1.9, 6.6, 1.01]} \ No newline at end of file diff --git a/annotations_1/hfzsR-3PLcg_filtered.json b/annotations_1/hfzsR-3PLcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73caf0da8920f660d32f7904eef9886b2a01a46b --- /dev/null +++ b/annotations_1/hfzsR-3PLcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [9.0, 10.03], [12.0, 12.29], [13.0, 14.22], [17.0, 18.84], [20.0, 20.92], [27.0, 33.29], [34.0, 33.88], [35.0, 35.14], [44.0, 45.81], [50.0, 55.0], [60.0, 60.4], [61.0, 63.53], [64.0, 84.65]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.24, 0.0, 0.0, 0.0, 60.51, 0.0, 34.93, 33.36], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 23.62], ["speech", 19.08], ["hum", 11.88]], null, null, null, null, null, [["fart", 80.08], ["music", 6.38], ["musical instrument", 0.97]], [["music", 59.13], ["speech", 19.56], ["musical instrument", 3.1]]], "duration": [0.38, 1.03, 0.29, 1.22, 1.84, 0.92, 6.29, -0.12, 0.14, 1.81, 5.0, 0.4, 2.53, 20.65]} \ No newline at end of file diff --git a/annotations_1/hgGi1ODlBBo_filtered.json b/annotations_1/hgGi1ODlBBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd74cedc989df879e73ec6e71e88822fcbaf935c --- /dev/null +++ b/annotations_1/hgGi1ODlBBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.5], [12.0, 13.0], [15.0, 16.29], [19.0, 21.56], [23.0, 24.58], [26.0, 27.97], [30.0, 32.71], [34.0, 34.65], [39.0, 43.97], [47.0, 48.78], [51.0, 61.28], [63.0, 67.37], [68.0, 87.76], [88.0, 95.44], [98.0, 144.51]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, false, true, false], "silence_prob": [40.28, 0.0, 0.0, 35.35, 0.0, 0.0, 55.6, 0.0, 29.69, 0.0, 28.47, 29.16, 29.05, 28.62, 0.0], "audiomae_on_audioset": [[["coin (dropping)", 67.94], ["music", 12.48], ["breaking", 6.62]], null, null, [["music", 32.63], ["mains hum", 22.35], ["hum", 20.51]], null, null, null, null, [["music", 41.23], ["didgeridoo", 13.99], ["speech", 6.05]], null, [["music", 28.9], ["mains hum", 13.7], ["hum", 12.8]], [["music", 28.97], ["mains hum", 16.52], ["hum", 15.36]], [["music", 52.31], ["speech", 22.87], ["throbbing", 5.77]], [["music", 52.24], ["hum", 6.2], ["mains hum", 5.89]], null], "duration": [5.5, 1.0, 1.29, 2.56, 1.58, 1.97, 2.71, 0.65, 4.97, 1.78, 10.28, 4.37, 19.76, 7.44, 46.51]} \ No newline at end of file diff --git a/annotations_1/hgLkypdC6wo_filtered.json b/annotations_1/hgLkypdC6wo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca2cccc736f739b937a226b768c7bde417482f2a --- /dev/null +++ b/annotations_1/hgLkypdC6wo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 22.57], [23.0, 24.75], [26.0, 38.48], [43.0, 44.58], [45.0, 85.83], [88.0, 91.17], [93.0, 97.44], [98.0, 98.96], [100.0, 100.33], [102.0, 103.57], [107.0, 107.18], [110.0, 109.85], [112.0, 112.77], [113.0, 113.81]], "keep_status": [false, false, true, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [37.74, 0.0, 36.02, 0.0, 0.0, 38.32, 39.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.96], ["speech", 19.98], ["sidetone", 4.09]], null, [["music", 46.35], ["speech", 8.35], ["radio", 4.48]], null, null, [["music", 37.33], ["whip", 5.23], ["rattle (instrument)", 5.18]], [["music", 49.94], ["synthesizer", 6.3], ["hum", 5.12]], null, null, null, null, null, null, null], "duration": [16.57, 1.75, 12.48, 1.58, 40.83, 3.17, 4.44, 0.96, 0.33, 1.57, 0.18, -0.15, 0.77, 0.81]} \ No newline at end of file diff --git a/annotations_1/hgqJjr7pBa0_filtered.json b/annotations_1/hgqJjr7pBa0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1f2bd388d8350c01e91e2bf983aa09dcaaf2574 --- /dev/null +++ b/annotations_1/hgqJjr7pBa0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.56], [8.0, 7.57], [11.0, 11.04], [16.0, 16.06], [27.0, 30.97], [31.0, 33.79], [35.0, 39.56], [40.0, 41.64], [42.0, 43.92], [46.0, 46.04], [48.0, 48.69], [50.0, 53.5], [55.0, 55.41], [56.0, 66.97], [69.0, 70.68], [71.0, 72.01], [73.0, 74.22], [77.0, 78.43], [84.0, 84.99], [86.0, 87.69], [88.0, 89.04], [97.0, 97.55], [99.0, 110.02], [111.0, 111.16], [112.0, 129.05], [130.0, 131.53]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [32.23, 0.0, 0.0, 0.0, 32.81, 36.18, 36.77, 0.0, 0.0, 0.0, 0.0, 43.05, 0.0, 32.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.1, 0.0, 29.65, 0.0], "audiomae_on_audioset": [[["speech", 20.83], ["music", 16.84], ["didgeridoo", 13.91]], null, null, null, [["hum", 28.64], ["mains hum", 15.4], ["speech", 14.98]], [["speech", 64.93], ["mains hum", 8.5], ["hum", 6.86]], [["speech", 17.91], ["hum", 11.94], ["mains hum", 11.26]], null, null, null, null, [["music", 43.62], ["didgeridoo", 13.7], ["musical instrument", 5.44]], null, [["speech", 37.34], ["music", 35.46], ["electronic music", 2.31]], null, null, null, null, null, null, null, null, [["music", 47.06], ["scary music", 13.23], ["ambient music", 9.0]], null, [["hum", 38.96], ["throbbing", 35.1], ["mains hum", 9.27]], null], "duration": [2.56, -0.43, 0.04, 0.06, 3.97, 2.79, 4.56, 1.64, 1.92, 0.04, 0.69, 3.5, 0.41, 10.97, 1.68, 1.01, 1.22, 1.43, 0.99, 1.69, 1.04, 0.55, 11.02, 0.16, 17.05, 1.53]} \ No newline at end of file diff --git a/annotations_1/hhmPqQpJWks_filtered.json b/annotations_1/hhmPqQpJWks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70ccd3dfd76ca89cbbbdaaaef910f5eb1fd13c7d --- /dev/null +++ b/annotations_1/hhmPqQpJWks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.26], [20.0, 20.43], [23.0, 23.36], [25.0, 25.39], [29.0, 36.1], [41.0, 41.93], [45.0, 45.03], [45.0, 47.63], [55.0, 55.81], [60.0, 60.57], [67.0, 68.96], [73.0, 73.38], [74.0, 75.39], [78.0, 78.88], [80.0, 80.86], [108.0, 112.04], [112.0, 113.1], [119.0, 120.56], [122.0, 123.09], [123.0, 124.98], [125.0, 127.94], [128.0, 130.5]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.17, 0.0, 0.0, 49.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.09, 0.0, 0.0, 0.0, 0.0, 84.43, 57.72], "audiomae_on_audioset": [null, null, null, null, [["thump, thud", 23.04], ["throbbing", 14.0], ["whack, thwack", 10.4]], null, null, [["speech", 27.38], ["bee, wasp, etc.", 8.44], ["fly, housefly", 7.5]], null, null, null, null, null, null, null, [["speech", 66.53], ["noise", 7.52], ["sidetone", 4.39]], null, null, null, null, null, null], "duration": [0.26, 0.43, 0.36, 0.39, 7.1, 0.93, 0.03, 2.63, 0.81, 0.57, 1.96, 0.38, 1.39, 0.88, 0.86, 4.04, 1.1, 1.56, 1.09, 1.98, 2.94, 2.5]} \ No newline at end of file diff --git a/annotations_1/hjhBzRH-plo_filtered.json b/annotations_1/hjhBzRH-plo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1406b20e0476b73406b0e3b883202235c5379de --- /dev/null +++ b/annotations_1/hjhBzRH-plo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.19], [12.0, 13.31], [15.0, 15.08], [15.0, 15.67], [17.0, 18.39], [19.0, 22.98], [27.0, 27.23], [42.0, 42.01], [45.0, 45.47], [51.0, 53.86], [54.0, 54.7], [56.0, 56.76], [58.0, 58.85], [60.0, 60.29], [63.0, 64.0], [70.0, 72.42], [74.0, 74.34], [76.0, 75.59], [80.0, 81.08], [83.0, 83.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 61.67, 0.0, 0.0, 0.0, 35.62, 0.0, 0.0, 0.0, 0.0, 0.0, 33.38, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["boing", 44.36], ["animal", 19.35], ["grunt", 7.32]], null, null, null, null, null, [["wail, moan", 9.35], ["groan", 6.78], ["honk", 6.53]], null, null, null, null], "duration": [0.19, 1.31, 0.08, 0.67, 1.39, 3.98, 0.23, 0.01, 0.47, 2.86, 0.7, 0.76, 0.85, 0.29, 1.0, 2.42, 0.34, -0.41, 1.08, 0.51]} \ No newline at end of file diff --git a/annotations_1/hjuvr5uGA4s_filtered.json b/annotations_1/hjuvr5uGA4s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f38dd0034648164fa9aab52214585dd606147ba --- /dev/null +++ b/annotations_1/hjuvr5uGA4s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.79], [5.0, 5.85], [6.0, 8.38], [9.0, 9.61], [10.0, 10.77], [11.0, 12.29], [13.0, 15.42], [16.0, 16.93], [17.0, 18.44], [19.0, 19.7], [21.0, 21.51], [22.0, 22.76], [29.0, 29.17], [31.0, 31.35], [35.0, 36.48], [37.0, 37.59], [39.0, 40.37], [41.0, 42.01], [42.0, 43.11], [44.0, 44.25], [47.0, 47.28], [49.0, 49.71], [51.0, 51.51], [52.0, 52.83], [55.0, 55.59], [56.0, 56.74], [57.0, 58.35], [59.0, 59.66], [62.0, 61.72], [62.0, 62.36], [63.0, 66.75], [68.0, 68.34], [70.0, 70.38], [72.0, 85.41], [86.0, 87.15], [88.0, 88.45], [91.0, 99.13], [100.0, 101.61], [102.0, 104.13], [105.0, 105.97], [110.0, 110.69], [126.0, 126.67], [129.0, 128.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 79.24, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.58, 0.0, 0.0, 34.98, 0.0, 0.0, 99.97, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.78], ["dial tone", 21.87], ["sidetone", 15.0]], null, null, [["animal", 26.66], ["cattle, bovinae", 8.6], ["dog", 7.09]], null, null, null, null, null, null, null, null, null], "duration": [-0.21, 0.85, 2.38, 0.61, 0.77, 1.29, 2.42, 0.93, 1.44, 0.7, 0.51, 0.76, 0.17, 0.35, 1.48, 0.59, 1.37, 1.01, 1.11, 0.25, 0.28, 0.71, 0.51, 0.83, 0.59, 0.74, 1.35, 0.66, -0.28, 0.36, 3.75, 0.34, 0.38, 13.41, 1.15, 0.45, 8.13, 1.61, 2.13, 0.97, 0.69, 0.67, -0.02]} \ No newline at end of file diff --git a/annotations_1/hjyWtmbAyco_filtered.json b/annotations_1/hjyWtmbAyco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19ad8c7eb63cd565d88286e708745835efe4763b --- /dev/null +++ b/annotations_1/hjyWtmbAyco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.89], [6.0, 7.05], [10.0, 11.23], [12.0, 13.24], [14.0, 15.99], [17.0, 18.35], [20.0, 24.46], [27.0, 28.71], [30.0, 34.48], [35.0, 41.5], [43.0, 44.17], [45.0, 48.14], [50.0, 50.8], [54.0, 55.04], [59.0, 64.25], [68.0, 67.73], [69.0, 70.12], [71.0, 73.06], [82.0, 82.51], [85.0, 86.8], [88.0, 88.62], [95.0, 96.16], [97.0, 100.77], [104.0, 104.48], [105.0, 106.39], [115.0, 115.59], [120.0, 126.66], [140.0, 147.87]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.95, 0.0, 44.87, 39.54, 0.0, 46.4, 0.0, 0.0, 46.22, 0.0, 0.0, 40.12, 0.0, 0.0, 0.0, 0.0, 46.05, 0.0, 0.0, 0.0, 33.28, 32.66], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 47.53], ["speech", 22.73], ["bass guitar", 2.24]], null, [["music", 35.66], ["hum", 11.73], ["mains hum", 10.32]], [["music", 51.08], ["speech", 10.51], ["didgeridoo", 5.88]], null, [["mains hum", 42.71], ["hum", 33.65], ["throbbing", 5.72]], null, null, [["music", 71.41], ["didgeridoo", 4.03], ["hum", 3.0]], null, null, [["music", 30.33], ["hum", 13.23], ["throbbing", 11.69]], null, null, null, null, [["music", 40.87], ["hum", 10.22], ["throbbing", 9.74]], null, null, null, [["music", 31.04], ["speech", 23.39], ["boing", 9.39]], [["music", 27.77], ["throbbing", 23.08], ["hum", 17.82]]], "duration": [-0.11, 1.05, 1.23, 1.24, 1.99, 1.35, 4.46, 1.71, 4.48, 6.5, 1.17, 3.14, 0.8, 1.04, 5.25, -0.27, 1.12, 2.06, 0.51, 1.8, 0.62, 1.16, 3.77, 0.48, 1.39, 0.59, 6.66, 7.87]} \ No newline at end of file diff --git a/annotations_1/hkEXnpQ_c5I_filtered.json b/annotations_1/hkEXnpQ_c5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edc72c07cfe57781981dadbaeb997734a7a27843 --- /dev/null +++ b/annotations_1/hkEXnpQ_c5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.81], [12.0, 13.04], [28.0, 40.51], [47.0, 90.22], [94.0, 97.28], [102.0, 102.42], [104.0, 104.7], [107.0, 106.98], [107.0, 113.05], [114.0, 115.55], [122.0, 122.5], [124.0, 124.78], [128.0, 130.4], [131.0, 133.02], [138.0, 138.1]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.27, 0.0, 30.67, 0.0, 37.27, 0.0, 0.0, 0.0, 59.96, 0.0, 0.0, 0.0, 78.55, 59.42, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 42.8], ["hum", 27.6], ["music", 17.17]], null, [["moo", 20.99], ["music", 17.45], ["cattle, bovinae", 15.9]], null, null, null, null, null, null, null, null, null, null], "duration": [2.81, 1.04, 12.51, 43.22, 3.28, 0.42, 0.7, -0.02, 6.05, 1.55, 0.5, 0.78, 2.4, 2.02, 0.1]} \ No newline at end of file diff --git a/annotations_1/hktlkG0QuKY_filtered.json b/annotations_1/hktlkG0QuKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a512e3fad5fe530b9cc69a83da2c1acf6ae14182 --- /dev/null +++ b/annotations_1/hktlkG0QuKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 25.71], [29.0, 42.75], [45.0, 51.54], [54.0, 61.74], [64.0, 75.74], [77.0, 77.92], [83.0, 84.21], [85.0, 85.68], [90.0, 91.64], [93.0, 94.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.66, 31.2, 31.99, 41.76, 38.97, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 74.83], ["throbbing", 7.52], ["hum", 4.07]], [["music", 61.98], ["speech", 14.5], ["didgeridoo", 7.3]], [["speech", 58.02], ["music", 20.88], ["hum", 4.5]], [["fly, housefly", 38.63], ["bee, wasp, etc.", 20.81], ["insect", 19.16]], [["music", 50.09], ["hum", 20.9], ["throbbing", 5.5]], null, null, null, null, null], "duration": [2.71, 13.75, 6.54, 7.74, 11.74, 0.92, 1.21, 0.68, 1.64, 1.17]} \ No newline at end of file diff --git a/annotations_1/hl1z_vp3kXg_filtered.json b/annotations_1/hl1z_vp3kXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4665ce593e12741b239830311168566ccf4cd36 --- /dev/null +++ b/annotations_1/hl1z_vp3kXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.66], [9.0, 9.85], [23.0, 37.32], [45.0, 46.67], [48.0, 48.37], [53.0, 54.57], [62.0, 61.77], [74.0, 76.4], [79.0, 99.18]], "keep_status": [false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.24, 0.0, 0.0, 0.0, 0.0, 92.8, 32.54], "audiomae_on_audioset": [null, null, [["music", 21.88], ["livestock, farm animals, working animals", 14.01], ["cattle, bovinae", 11.97]], null, null, null, null, null, [["music", 47.35], ["didgeridoo", 17.23], ["theremin", 14.69]]], "duration": [1.66, 0.85, 14.32, 1.67, 0.37, 1.57, -0.23, 2.4, 20.18]} \ No newline at end of file diff --git a/annotations_1/hlWL5Az4pow_filtered.json b/annotations_1/hlWL5Az4pow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76bbcbc2113417d8f05ddb1b710ecfbd2bd68c63 --- /dev/null +++ b/annotations_1/hlWL5Az4pow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.12], [9.0, 14.22], [16.0, 23.31], [27.0, 30.94], [34.0, 35.5], [38.0, 38.3], [40.0, 43.01], [57.0, 58.63], [61.0, 67.27], [72.0, 72.55], [74.0, 73.99], [83.0, 83.69], [89.0, 99.32], [102.0, 103.65], [105.0, 106.81], [108.0, 110.27], [125.0, 126.93], [129.0, 133.79], [136.0, 136.65], [175.0, 175.59], [178.0, 183.34], [185.0, 195.3], [198.0, 199.62]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [98.01, 53.91, 40.29, 33.31, 0.0, 0.0, 34.6, 0.0, 33.3, 0.0, 0.0, 0.0, 33.23, 0.0, 0.0, 36.82, 0.0, 34.89, 0.0, 0.0, 33.02, 33.26, 0.0], "audiomae_on_audioset": [null, null, [["music", 26.27], ["speech", 24.59], ["fly, housefly", 7.96]], [["music", 77.08], ["throbbing", 3.55], ["cacophony", 2.18]], null, null, [["music", 83.62], ["musical instrument", 1.91], ["guitar", 1.5]], null, [["music", 72.31], ["didgeridoo", 2.96], ["funny music", 1.83]], null, null, null, [["music", 42.78], ["livestock, farm animals, working animals", 7.34], ["speech", 7.25]], null, null, [["music", 68.83], ["video game music", 3.06], ["throbbing", 2.8]], null, [["music", 78.65], ["reggae", 2.54], ["electronic music", 1.33]], null, null, [["music", 71.09], ["throbbing", 8.48], ["hum", 3.32]], [["music", 40.68], ["animal", 6.72], ["speech", 5.22]], null], "duration": [2.12, 5.22, 7.31, 3.94, 1.5, 0.3, 3.01, 1.63, 6.27, 0.55, -0.01, 0.69, 10.32, 1.65, 1.81, 2.27, 1.93, 4.79, 0.65, 0.59, 5.34, 10.3, 1.62]} \ No newline at end of file diff --git a/annotations_1/hn3XR4o8M4c_filtered.json b/annotations_1/hn3XR4o8M4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73744fed5d2f6944728e0293f4b4ad3326b528e3 --- /dev/null +++ b/annotations_1/hn3XR4o8M4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.41], [12.0, 12.21], [14.0, 14.4], [17.0, 18.87], [24.0, 28.58], [36.0, 36.8], [38.0, 38.91], [43.0, 45.47], [48.0, 50.92], [52.0, 53.7], [56.0, 57.15], [58.0, 58.53], [59.0, 59.61], [61.0, 61.1], [64.0, 64.84], [65.0, 66.36], [68.0, 68.59], [74.0, 74.39], [77.0, 78.75], [85.0, 93.48], [100.0, 100.5], [103.0, 102.88], [105.0, 132.44], [137.0, 145.15], [145.0, 149.76], [150.0, 150.74], [170.0, 170.83], [172.0, 172.13], [172.0, 176.18]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.31, 0.0, 0.0, 31.81, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.83, 0.0, 0.0, 41.1, 61.97, 41.07, 0.0, 0.0, 0.0, 37.33], "audiomae_on_audioset": [null, null, null, null, [["speech", 38.6], ["music", 34.15], ["hum", 3.72]], null, null, [["speech", 9.58], ["whack, thwack", 8.24], ["squeak", 7.47]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.68], ["music", 27.89], ["whack, thwack", 6.34]], null, null, [["music", 50.21], ["hum", 7.33], ["mains hum", 6.64]], null, [["cattle, bovinae", 23.86], ["music", 18.21], ["livestock, farm animals, working animals", 16.8]], null, null, null, [["music", 37.54], ["speech", 24.96], ["didgeridoo", 9.38]]], "duration": [1.41, 0.21, 0.4, 1.87, 4.58, 0.8, 0.91, 2.47, 2.92, 1.7, 1.15, 0.53, 0.61, 0.1, 0.84, 1.36, 0.59, 0.39, 1.75, 8.48, 0.5, -0.12, 27.44, 8.15, 4.76, 0.74, 0.83, 0.13, 4.18]} \ No newline at end of file diff --git a/annotations_1/hoKvbJSMShA_filtered.json b/annotations_1/hoKvbJSMShA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74e2d9356fa285ca884147114b004e5cfb2d929a --- /dev/null +++ b/annotations_1/hoKvbJSMShA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.89], [4.0, 14.05], [14.0, 15.63], [17.0, 17.14], [18.0, 17.86], [20.0, 20.21], [21.0, 22.4], [24.0, 24.54], [27.0, 27.04], [27.0, 29.83], [30.0, 30.43], [31.0, 31.77], [33.0, 35.02], [36.0, 38.06], [39.0, 42.06], [43.0, 44.39], [45.0, 46.65], [48.0, 48.56], [50.0, 50.58], [51.0, 51.29], [52.0, 52.73], [53.0, 53.45], [54.0, 56.51], [58.0, 59.54], [60.0, 62.11], [62.0, 64.18], [65.0, 72.32], [73.0, 74.93], [75.0, 76.0], [78.0, 82.38], [83.0, 83.59], [85.0, 85.58], [86.0, 86.64], [95.0, 96.62], [99.0, 99.59], [102.0, 103.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.27, 0.0, 0.0, 89.36, 74.29, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.98, 0.0, 47.62, 54.36, 33.64, 0.0, 0.0, 51.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["theremin", 29.17], ["music", 27.31], ["speech", 19.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.21], ["vehicle", 3.86], ["cattle, bovinae", 3.77]], null, [["vehicle", 20.61], ["whale vocalization", 11.84], ["speech", 6.66]], null, null, null, null, null, null, null, null, null], "duration": [1.89, 10.05, 1.63, 0.14, -0.14, 0.21, 1.4, 0.54, 0.04, 2.83, 0.43, 0.77, 2.02, 2.06, 3.06, 1.39, 1.65, 0.56, 0.58, 0.29, 0.73, 0.45, 2.51, 1.54, 2.11, 2.18, 7.32, 1.93, 1.0, 4.38, 0.59, 0.58, 0.64, 1.62, 0.59, 1.59]} \ No newline at end of file diff --git a/annotations_1/hoWEYBSlctc_filtered.json b/annotations_1/hoWEYBSlctc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8d7a459d4f38f99c2fb34e57cfbf104bf370f98b --- /dev/null +++ b/annotations_1/hoWEYBSlctc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.23], [15.0, 18.05], [19.0, 20.16], [26.0, 25.83], [28.0, 30.28], [36.0, 36.64], [38.0, 38.79], [41.0, 41.62], [48.0, 48.44], [50.0, 50.79], [52.0, 52.14], [59.0, 58.75], [61.0, 68.5], [69.0, 69.72], [83.0, 83.54], [88.0, 89.77], [92.0, 92.48], [94.0, 94.95], [96.0, 96.5], [98.0, 98.25], [106.0, 106.56], [108.0, 108.03], [114.0, 115.26], [116.0, 116.63], [120.0, 120.63], [125.0, 125.91], [126.0, 127.41], [129.0, 129.56], [134.0, 135.21], [141.0, 141.35], [145.0, 145.99], [148.0, 150.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.73, 49.54, 0.0, 0.0, 42.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.67], "audiomae_on_audioset": [[["music", 77.39], ["speech", 8.26], ["musical instrument", 3.65]], [["telephone dialing, dtmf", 37.13], ["telephone", 17.66], ["speech", 15.71]], null, null, [["music", 46.35], ["speech", 29.71], ["radio", 2.3]], null, null, null, null, null, null, null, [["sidetone", 30.4], ["music", 26.24], ["hum", 9.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [10.23, 3.05, 1.16, -0.17, 2.28, 0.64, 0.79, 0.62, 0.44, 0.79, 0.14, -0.25, 7.5, 0.72, 0.54, 1.77, 0.48, 0.95, 0.5, 0.25, 0.56, 0.03, 1.26, 0.63, 0.63, 0.91, 1.41, 0.56, 1.21, 0.35, 0.99, 2.55]} \ No newline at end of file diff --git a/annotations_1/hoe24aSvLtw_filtered.json b/annotations_1/hoe24aSvLtw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22f65a276191383c6c588a4400955dab08ea52ab --- /dev/null +++ b/annotations_1/hoe24aSvLtw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.64], [14.0, 14.44], [15.0, 15.45], [17.0, 17.9], [20.0, 20.73], [30.0, 32.32], [39.0, 38.77], [40.0, 40.07], [41.0, 41.69], [42.0, 43.17], [55.0, 55.71], [60.0, 61.16], [63.0, 63.71], [64.0, 66.5], [68.0, 68.35], [69.0, 69.87], [70.0, 72.96], [73.0, 74.7], [75.0, 75.36], [76.0, 76.55], [82.0, 85.01], [90.0, 90.22], [91.0, 91.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.97, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.7, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.64, 0.44, 0.45, 0.9, 0.73, 2.32, -0.23, 0.07, 0.69, 1.17, 0.71, 1.16, 0.71, 2.5, 0.35, 0.87, 2.96, 1.7, 0.36, 0.55, 3.01, 0.22, 0.4]} \ No newline at end of file diff --git a/annotations_1/honAzu3xOP0_filtered.json b/annotations_1/honAzu3xOP0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2651e170a2e608322230387840bd93a52ab71398 --- /dev/null +++ b/annotations_1/honAzu3xOP0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [14.0, 14.82], [17.0, 18.89], [20.0, 21.22], [22.0, 23.21], [27.0, 27.31], [28.0, 28.54], [30.0, 30.21], [31.0, 34.53], [36.0, 36.29], [45.0, 49.99], [61.0, 60.86], [89.0, 91.5], [92.0, 93.78], [102.0, 104.85], [108.0, 116.21], [118.0, 118.49], [124.0, 123.99], [126.0, 126.0], [153.0, 153.79], [165.0, 165.59], [194.0, 194.04]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.22, 0.0, 43.1, 0.0, 33.88, 0.0, 39.52, 45.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 21.38], ["speech", 16.92], ["sidetone", 9.33]], null, [["music", 45.13], ["speech", 15.32], ["sidetone", 5.69]], null, [["speech", 45.37], ["radio", 10.47], ["sidetone", 7.03]], null, [["music", 45.58], ["speech", 14.73], ["sidetone", 5.19]], [["music", 67.55], ["bass guitar", 8.2], ["guitar", 4.7]], null, null, null, null, null, null], "duration": [0.51, 0.82, 1.89, 1.22, 1.21, 0.31, 0.54, 0.21, 3.53, 0.29, 4.99, -0.14, 2.5, 1.78, 2.85, 8.21, 0.49, -0.01, 0.0, 0.79, 0.59, 0.04]} \ No newline at end of file diff --git a/annotations_1/howhfMAoEt0_filtered.json b/annotations_1/howhfMAoEt0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fda3e6488a353f00c4aa190c896f68e329e0cff --- /dev/null +++ b/annotations_1/howhfMAoEt0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.03], [7.0, 24.16], [24.0, 26.91], [28.0, 29.0], [30.0, 31.21], [34.0, 34.53], [35.0, 48.14], [50.0, 62.56], [64.0, 65.31], [65.0, 72.72], [73.0, 73.45], [75.0, 77.9], [81.0, 93.72], [94.0, 95.86], [97.0, 99.12], [101.0, 101.98], [102.0, 103.6], [105.0, 107.86], [108.0, 108.9], [109.0, 111.06], [112.0, 116.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.97, 53.78, 97.54, 0.0, 0.0, 0.0, 100.0, 97.64, 0.0, 99.95, 0.0, 99.78, 80.64, 0.0, 97.11, 0.0, 0.0, 95.51, 0.0, 99.1, 91.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.03, 17.16, 2.91, 1.0, 1.21, 0.53, 13.14, 12.56, 1.31, 7.72, 0.45, 2.9, 12.72, 1.86, 2.12, 0.98, 1.6, 2.86, 0.9, 2.06, 4.36]} \ No newline at end of file diff --git a/annotations_1/hp3HX9PAkcA_filtered.json b/annotations_1/hp3HX9PAkcA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..55544402fd2a2be5c946b03e018f8251a0ca55c5 --- /dev/null +++ b/annotations_1/hp3HX9PAkcA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.97], [7.0, 8.87], [9.0, 10.42], [11.0, 12.8], [13.0, 14.17], [14.0, 15.38], [23.0, 25.51], [26.0, 29.08], [29.0, 30.48], [31.0, 32.97], [34.0, 37.86], [44.0, 44.79], [48.0, 48.98], [51.0, 52.62], [54.0, 54.78], [57.0, 59.0], [60.0, 61.33], [64.0, 64.39], [70.0, 71.63], [73.0, 74.22], [79.0, 79.59], [81.0, 81.85], [85.0, 85.72], [87.0, 88.42], [99.0, 99.89], [100.0, 102.78], [111.0, 111.72], [112.0, 113.02], [116.0, 119.2], [121.0, 121.95], [125.0, 126.32], [128.0, 128.63], [130.0, 129.88], [130.0, 131.16], [135.0, 141.34], [143.0, 142.72], [145.0, 145.27], [146.0, 145.54], [146.0, 147.39], [151.0, 151.48], [168.0, 168.4], [169.0, 171.17], [174.0, 176.28], [184.0, 184.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.8, 77.87, 0.0, 0.0, 51.77, 0.0, 0.0, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.77, 0.0, 0.0, 56.93, 0.0, 0.0, 0.0, 0.0, 0.0, 72.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 52.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 1.87, 1.42, 1.8, 1.17, 1.38, 2.51, 3.08, 1.48, 1.97, 3.86, 0.79, 0.98, 1.62, 0.78, 2.0, 1.33, 0.39, 1.63, 1.22, 0.59, 0.85, 0.72, 1.42, 0.89, 2.78, 0.72, 1.02, 3.2, 0.95, 1.32, 0.63, -0.12, 1.16, 6.34, -0.28, 0.27, -0.46, 1.39, 0.48, 0.4, 2.17, 2.28, 0.62]} \ No newline at end of file diff --git a/annotations_1/hp3n_sA4Sqo_filtered.json b/annotations_1/hp3n_sA4Sqo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff75e6a8b956e9cb125e7a854dfd2a18fc0ea0c4 --- /dev/null +++ b/annotations_1/hp3n_sA4Sqo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 61.53], [68.0, 81.21], [86.0, 88.13], [90.0, 90.41], [92.0, 93.53], [94.0, 94.51], [102.0, 103.32], [106.0, 106.88], [108.0, 108.55], [110.0, 110.03], [112.0, 112.48], [113.0, 116.29], [119.0, 118.89], [119.0, 124.97]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.82, 31.72, 44.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.81, 0.0, 37.17], "audiomae_on_audioset": [[["music", 61.99], ["throbbing", 10.32], ["sampler", 2.88]], [["music", 79.7], ["cacophony", 2.57], ["synthesizer", 2.11]], [["music", 51.21], ["speech", 5.25], ["electronic music", 4.87]], null, null, null, null, null, null, null, null, [["music", 65.05], ["electronic music", 3.96], ["electronica", 3.26]], null, [["music", 61.09], ["speech", 9.1], ["throbbing", 4.17]]], "duration": [23.53, 13.21, 2.13, 0.41, 1.53, 0.51, 1.32, 0.88, 0.55, 0.03, 0.48, 3.29, -0.11, 5.97]} \ No newline at end of file diff --git a/annotations_1/hprw4GtCu1w_filtered.json b/annotations_1/hprw4GtCu1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..603244ddec9ac3323c25bee9b4e34aa2a897c7e6 --- /dev/null +++ b/annotations_1/hprw4GtCu1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.49], [11.0, 19.03], [19.0, 19.09], [19.0, 19.47], [19.0, 25.59], [26.0, 26.54], [31.0, 31.18], [35.0, 35.24], [36.0, 36.27], [39.0, 40.12], [43.0, 52.66], [53.0, 53.72], [54.0, 55.04], [56.0, 56.86], [58.0, 58.21], [59.0, 60.93], [61.0, 61.33], [65.0, 65.16], [65.0, 66.55], [68.0, 68.32], [73.0, 74.66], [76.0, 79.49], [80.0, 82.05], [83.0, 83.22], [84.0, 93.63], [97.0, 97.41], [100.0, 103.03], [104.0, 106.17], [107.0, 108.8], [112.0, 113.78], [116.0, 116.67], [119.0, 120.61], [123.0, 125.46], [130.0, 139.58], [142.0, 147.26], [149.0, 153.94], [158.0, 162.7]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [37.67, 32.89, 0.0, 0.0, 33.73, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.92, 62.27, 0.0, 37.02, 0.0, 55.67, 98.1, 0.0, 0.0, 0.0, 0.0, 98.51, 42.79, 39.07, 56.86, 36.39], "audiomae_on_audioset": [[["music", 37.8], ["synthesizer", 10.64], ["effects unit", 8.49]], [["music", 51.15], ["didgeridoo", 18.71], ["speech", 12.67]], null, null, [["didgeridoo", 52.26], ["music", 11.12], ["mantra", 8.04]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 25.83], ["speech", 17.17], ["telephone", 13.85]], null, null, [["music", 66.98], ["speech", 6.82], ["timpani", 3.54]], null, null, null, null, null, null, null, null, [["music", 55.16], ["theremin", 25.86], ["singing bowl", 2.89]], [["music", 66.56], ["theremin", 5.96], ["musical instrument", 4.09]], null, [["music", 25.21], ["throbbing", 14.93], ["hum", 14.09]]], "duration": [2.49, 8.03, 0.09, 0.47, 6.59, 0.54, 0.18, 0.24, 0.27, 1.12, 9.66, 0.72, 1.04, 0.86, 0.21, 1.93, 0.33, 0.16, 1.55, 0.32, 1.66, 3.49, 2.05, 0.22, 9.63, 0.41, 3.03, 2.17, 1.8, 1.78, 0.67, 1.61, 2.46, 9.58, 5.26, 4.94, 4.7]} \ No newline at end of file diff --git a/annotations_1/hq4lKhTXzXQ_filtered.json b/annotations_1/hq4lKhTXzXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..948c005ff8f0aee70b9ba04083b548af59a22a97 --- /dev/null +++ b/annotations_1/hq4lKhTXzXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.74], [11.0, 19.84], [20.0, 20.48], [23.0, 23.48], [25.0, 25.03], [27.0, 43.33], [46.0, 46.72], [52.0, 52.46], [57.0, 57.91], [60.0, 60.03], [61.0, 74.53], [78.0, 85.09], [85.0, 85.14], [87.0, 87.49], [90.0, 98.76]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [31.23, 31.24, 0.0, 0.0, 0.0, 29.07, 0.0, 0.0, 0.0, 0.0, 30.53, 30.65, 0.0, 0.0, 29.9], "audiomae_on_audioset": [[["music", 39.32], ["didgeridoo", 23.37], ["electric shaver, electric razor", 6.98]], [["music", 50.42], ["didgeridoo", 33.23], ["musical instrument", 6.93]], null, null, null, [["music", 34.21], ["noise", 21.54], ["didgeridoo", 7.99]], null, null, null, null, [["throbbing", 55.92], ["hum", 25.01], ["music", 12.0]], [["throbbing", 57.02], ["hum", 37.74], ["mains hum", 2.48]], null, null, [["hum", 33.77], ["throbbing", 17.19], ["speech", 10.4]]], "duration": [4.74, 8.84, 0.48, 0.48, 0.03, 16.33, 0.72, 0.46, 0.91, 0.03, 13.53, 7.09, 0.14, 0.49, 8.76]} \ No newline at end of file diff --git a/annotations_1/hqqlSTB5CfU_filtered.json b/annotations_1/hqqlSTB5CfU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3606ddf89e94962f9b4f4c22c2412db6bdde15ec --- /dev/null +++ b/annotations_1/hqqlSTB5CfU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.0], [7.0, 7.52], [9.0, 9.24], [11.0, 11.82], [13.0, 13.51], [14.0, 15.69], [22.0, 23.63], [26.0, 26.27], [28.0, 28.92], [30.0, 30.2], [31.0, 32.24], [33.0, 34.28], [36.0, 36.66], [40.0, 41.47], [42.0, 42.6], [43.0, 44.32], [45.0, 45.37], [46.0, 49.47], [50.0, 51.14], [53.0, 54.03], [57.0, 58.06], [60.0, 62.55], [63.0, 63.69], [65.0, 66.24], [68.0, 69.58], [71.0, 72.13], [72.0, 72.72], [74.0, 74.63], [76.0, 77.16], [78.0, 78.61], [79.0, 80.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 0.52, 0.24, 0.82, 0.51, 1.69, 1.63, 0.27, 0.92, 0.2, 1.24, 1.28, 0.66, 1.47, 0.6, 1.32, 0.37, 3.47, 1.14, 1.03, 1.06, 2.55, 0.69, 1.24, 1.58, 1.13, 0.72, 0.63, 1.16, 0.61, 1.7]} \ No newline at end of file diff --git a/annotations_1/hqslb1FVoQQ_filtered.json b/annotations_1/hqslb1FVoQQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d66d3c31b3cf276b167fd02289e792c48bf1ad7 --- /dev/null +++ b/annotations_1/hqslb1FVoQQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 21.46], [25.0, 33.44], [37.0, 37.54], [43.0, 46.01], [49.0, 49.22], [58.0, 59.59], [66.0, 66.82], [70.0, 72.39], [82.0, 86.68], [89.0, 92.1], [112.0, 113.17], [114.0, 115.6]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [34.56, 35.2, 0.0, 93.6, 0.0, 0.0, 0.0, 77.2, 39.54, 33.88, 0.0, 0.0], "audiomae_on_audioset": [[["music", 46.06], ["hum", 11.87], ["synthesizer", 10.76]], [["hum", 46.12], ["music", 17.15], ["mains hum", 13.87]], null, null, null, null, null, null, [["speech", 42.78], ["music", 37.77], ["timpani", 2.78]], [["music", 47.61], ["speech", 10.72], ["drum", 2.66]], null, null], "duration": [13.46, 8.44, 0.54, 3.01, 0.22, 1.59, 0.82, 2.39, 4.68, 3.1, 1.17, 1.6]} \ No newline at end of file diff --git a/annotations_1/htHKbsUKDDw_filtered.json b/annotations_1/htHKbsUKDDw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca486ccdf7f9a280d82dfe65fd73ad1042bc5036 --- /dev/null +++ b/annotations_1/htHKbsUKDDw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.42], [13.0, 13.93], [17.0, 17.27], [21.0, 20.75], [23.0, 24.76], [30.0, 31.06], [36.0, 36.32], [39.0, 41.86], [50.0, 52.64], [53.0, 53.81], [58.0, 58.4], [63.0, 67.8], [77.0, 77.16], [83.0, 83.13], [86.0, 86.85], [88.0, 88.62], [91.0, 96.58], [99.0, 105.87], [107.0, 108.31], [115.0, 115.69], [120.0, 121.31], [127.0, 127.58], [133.0, 133.12], [141.0, 143.65], [147.0, 148.47], [154.0, 155.12], [158.0, 159.44], [172.0, 173.03], [175.0, 175.56], [178.0, 178.75], [184.0, 184.37], [187.0, 187.83], [191.0, 191.39], [194.0, 195.76], [196.0, 197.5], [200.0, 200.3], [204.0, 204.15], [212.0, 212.21], [215.0, 232.61], [237.0, 241.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.26, 49.0, 0.0, 0.0, 36.29, 0.0, 0.0, 0.0, 0.0, 38.55, 34.83, 0.0, 0.0, 0.0, 0.0, 0.0, 30.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.91, 47.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 82.75], ["musical instrument", 1.14], ["electronic music", 1.04]], [["music", 59.66], ["throbbing", 9.77], ["hum", 5.6]], null, null, [["speech", 47.86], ["typewriter", 13.85], ["music", 13.56]], null, null, null, null, [["speech", 40.1], ["music", 15.72], ["whale vocalization", 4.06]], [["music", 59.07], ["speech", 16.17], ["musical instrument", 5.76]], null, null, null, null, null, [["coin (dropping)", 33.69], ["ding", 26.97], ["clang", 13.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.78], ["throbbing", 24.15], ["hum", 20.69]], [["bee, wasp, etc.", 22.17], ["fly, housefly", 13.52], ["hum", 8.62]]], "duration": [3.42, 0.93, 0.27, -0.25, 1.76, 1.06, 0.32, 2.86, 2.64, 0.81, 0.4, 4.8, 0.16, 0.13, 0.85, 0.62, 5.58, 6.87, 1.31, 0.69, 1.31, 0.58, 0.12, 2.65, 1.47, 1.12, 1.44, 1.03, 0.56, 0.75, 0.37, 0.83, 0.39, 1.76, 1.5, 0.3, 0.15, 0.21, 17.61, 4.78]} \ No newline at end of file diff --git a/annotations_1/hudgzkYfSvU_filtered.json b/annotations_1/hudgzkYfSvU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97803a59c4c655345609a148dbac5b8090fd56ad --- /dev/null +++ b/annotations_1/hudgzkYfSvU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 12.38], [14.0, 15.69], [21.0, 23.75], [32.0, 31.92], [35.0, 38.33], [41.0, 41.81], [47.0, 48.37], [57.0, 57.18], [59.0, 59.37], [76.0, 76.72], [79.0, 81.77], [84.0, 85.23], [94.0, 94.14], [104.0, 104.75], [106.0, 107.08], [109.0, 111.57], [114.0, 115.5], [124.0, 124.56], [128.0, 129.22]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [54.43, 0.0, 38.36, 0.0, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 33.88, 0.0, 0.0, 0.0, 0.0, 33.94, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 23.12], ["mains hum", 18.41], ["didgeridoo", 17.61]], null, null, null, null, null, null, null, [["speech", 23.63], ["music", 19.0], ["hum", 6.01]], null, null, null, null, [["speech", 32.8], ["civil defense siren", 27.92], ["siren", 12.17]], null, null, null], "duration": [7.38, 1.69, 2.75, -0.08, 3.33, 0.81, 1.37, 0.18, 0.37, 0.72, 2.77, 1.23, 0.14, 0.75, 1.08, 2.57, 1.5, 0.56, 1.22]} \ No newline at end of file diff --git a/annotations_1/huxXgcGvTPk_filtered.json b/annotations_1/huxXgcGvTPk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e900fb3b3da6d40a23527704808fea4f3dbdef7 --- /dev/null +++ b/annotations_1/huxXgcGvTPk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 19.48], [21.0, 21.1], [22.0, 40.1], [41.0, 51.95], [54.0, 60.56], [66.0, 66.46], [79.0, 79.27], [81.0, 81.7], [85.0, 85.26], [87.0, 88.03], [97.0, 97.75], [107.0, 107.35], [108.0, 108.65], [110.0, 110.89], [120.0, 120.9], [122.0, 123.67], [124.0, 125.19], [127.0, 127.57], [129.0, 130.0], [133.0, 134.81], [136.0, 139.24], [139.0, 139.48], [139.0, 139.51], [140.0, 141.05], [146.0, 145.79], [146.0, 148.07], [151.0, 160.19], [165.0, 165.42], [166.0, 166.95], [169.0, 169.13]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [54.04, 0.0, 68.15, 41.1, 39.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.63, 0.0, 0.0, 0.0, 0.0, 40.36, 30.27, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 59.2], ["hum", 6.35], ["mains hum", 2.32]], [["hum", 40.69], ["music", 25.37], ["throbbing", 9.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.57], ["throbbing", 11.19], ["hum", 10.15]], null, null, null, null, [["music", 54.5], ["speech", 8.66], ["hum", 6.43]], [["music", 52.22], ["hum", 11.03], ["mains hum", 8.05]], null, null, null], "duration": [8.48, 0.1, 18.1, 10.95, 6.56, 0.46, 0.27, 0.7, 0.26, 1.03, 0.75, 0.35, 0.65, 0.89, 0.9, 1.67, 1.19, 0.57, 1.0, 1.81, 3.24, 0.48, 0.51, 1.05, -0.21, 2.07, 9.19, 0.42, 0.95, 0.13]} \ No newline at end of file diff --git a/annotations_1/hv_mYkUEGko_filtered.json b/annotations_1/hv_mYkUEGko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abf7924a11a4c84d152424592bab5bb6b8055bc2 --- /dev/null +++ b/annotations_1/hv_mYkUEGko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.7], [26.0, 31.38], [36.0, 36.78], [39.0, 39.11], [46.0, 49.81], [52.0, 51.87], [53.0, 53.54], [54.0, 54.82], [56.0, 56.79], [71.0, 71.02], [73.0, 73.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.61, 0.0, 0.0, 32.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 64.27], ["synthesizer", 20.27], ["musical instrument", 4.89]], null, null, [["fart", 52.4], ["speech", 14.12], ["boing", 6.9]], null, null, null, null, null, null], "duration": [0.7, 5.38, 0.78, 0.11, 3.81, -0.13, 0.54, 0.82, 0.79, 0.02, 0.5]} \ No newline at end of file diff --git a/annotations_1/hvuQCnADQRM_filtered.json b/annotations_1/hvuQCnADQRM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edf4688ef420a5d4609c47285d5e6d73e58588d3 --- /dev/null +++ b/annotations_1/hvuQCnADQRM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [4.0, 4.51], [7.0, 7.37], [10.0, 11.21], [14.0, 14.74], [16.0, 23.35], [26.0, 29.39], [30.0, 34.25], [36.0, 36.36], [40.0, 61.75], [62.0, 72.71], [73.0, 74.26], [77.0, 77.45], [78.0, 83.56], [84.0, 85.67], [87.0, 86.7], [87.0, 88.62], [89.0, 89.18], [93.0, 96.01]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 35.54, 82.97, 0.0, 40.88, 30.47, 0.0, 0.0, 61.87, 0.0, 0.0, 0.0, 0.0, 36.93], "audiomae_on_audioset": [null, null, null, null, null, null, [["cattle, bovinae", 62.26], ["moo", 27.02], ["livestock, farm animals, working animals", 9.05]], null, null, [["howl", 32.86], ["animal", 9.17], ["livestock, farm animals, working animals", 7.32]], [["car", 18.59], ["vehicle", 16.72], ["skidding", 15.23]], null, null, null, null, null, null, null, [["speech", 27.0], ["snicker", 13.41], ["animal", 6.9]]], "duration": [0.89, 0.51, 0.37, 1.21, 0.74, 7.35, 3.39, 4.25, 0.36, 21.75, 10.71, 1.26, 0.45, 5.56, 1.67, -0.3, 1.62, 0.18, 3.01]} \ No newline at end of file diff --git a/annotations_1/hw3lBV-89M0_filtered.json b/annotations_1/hw3lBV-89M0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0734ab3431ec925cc8e29de7c94d3d629d8243f9 --- /dev/null +++ b/annotations_1/hw3lBV-89M0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.53], [9.0, 9.53], [11.0, 13.54], [17.0, 17.36], [20.0, 20.7], [23.0, 23.46], [27.0, 28.7], [35.0, 35.19], [47.0, 47.39], [54.0, 56.54], [58.0, 58.5], [60.0, 60.64], [62.0, 63.05], [64.0, 64.71], [74.0, 74.85]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.47, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 34.87], ["synthesizer", 5.02], ["fart", 3.62]], null, null, null, null, null, null, [["music", 56.31], ["synthesizer", 12.79], ["sampler", 3.2]], null, null, null, null, null], "duration": [0.53, 0.53, 2.54, 0.36, 0.7, 0.46, 1.7, 0.19, 0.39, 2.54, 0.5, 0.64, 1.05, 0.71, 0.85]} \ No newline at end of file diff --git a/annotations_1/hwTf9WurF4U_filtered.json b/annotations_1/hwTf9WurF4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f2bc5b8e2636f2a00ba5c56b552f579b0b28657 --- /dev/null +++ b/annotations_1/hwTf9WurF4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.31], [12.0, 14.94], [16.0, 16.73], [21.0, 29.44], [35.0, 35.61], [37.0, 37.91], [39.0, 41.44], [47.0, 47.24], [49.0, 57.45], [58.0, 83.24], [84.0, 125.91], [129.0, 131.82], [134.0, 154.36]], "keep_status": [false, true, false, false, false, false, true, false, true, true, false, true, false], "silence_prob": [51.99, 38.8, 0.0, 30.17, 0.0, 0.0, 30.59, 0.0, 31.11, 30.25, 0.0, 28.67, 29.82], "audiomae_on_audioset": [null, [["fly, housefly", 32.96], ["mosquito", 15.18], ["insect", 14.27]], null, [["music", 63.19], ["drum", 5.72], ["theremin", 5.32]], null, null, [["music", 39.45], ["boing", 12.76], ["whip", 6.2]], null, [["speech", 25.92], ["music", 23.2], ["hum", 10.21]], [["mains hum", 29.36], ["speech", 17.18], ["hum", 14.24]], null, [["hum", 34.06], ["mains hum", 22.84], ["throbbing", 6.99]], [["music", 63.3], ["buzz", 8.59], ["mains hum", 6.0]]], "duration": [4.31, 2.94, 0.73, 8.44, 0.61, 0.91, 2.44, 0.24, 8.45, 25.24, 41.91, 2.82, 20.36]} \ No newline at end of file diff --git a/annotations_1/hwb1MK66new_filtered.json b/annotations_1/hwb1MK66new_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cadd8c51a8fe2ac84a79c25f67e74e8bef07e26a --- /dev/null +++ b/annotations_1/hwb1MK66new_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 73.7], [81.0, 84.67], [89.0, 90.75], [93.0, 118.15]], "keep_status": [false, true, false, true], "silence_prob": [0.0, 29.05, 0.0, 31.0], "audiomae_on_audioset": [null, [["music", 12.81], ["speech", 12.64], ["fly, housefly", 12.05]], null, [["rumble", 23.2], ["speech", 14.06], ["whale vocalization", 11.04]]], "duration": [54.7, 3.67, 1.75, 25.15]} \ No newline at end of file diff --git a/annotations_1/hwevrtap9AY_filtered.json b/annotations_1/hwevrtap9AY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3f234356862f12ba67b6bb295598b61bd1297fc --- /dev/null +++ b/annotations_1/hwevrtap9AY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[72.0, 71.52], [73.0, 76.15], [80.0, 90.81]], "keep_status": [false, false, false], "silence_prob": [0.0, 31.13, 30.87], "audiomae_on_audioset": [null, [["music", 71.54], ["throbbing", 4.14], ["noise", 3.32]], [["throbbing", 39.63], ["hum", 22.6], ["music", 22.29]]], "duration": [-0.48, 3.15, 10.81]} \ No newline at end of file diff --git a/annotations_1/hxi06yeErvk_filtered.json b/annotations_1/hxi06yeErvk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4c4c24217cbbe1c06cb9bb7824672fddacad8ac --- /dev/null +++ b/annotations_1/hxi06yeErvk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.63], [1.0, 0.67], [1.0, 1.97], [2.0, 2.42], [3.0, 2.86], [3.0, 4.26], [4.0, 11.91], [14.0, 14.13], [14.0, 36.27], [48.0, 48.37], [51.0, 52.68], [54.0, 57.18], [62.0, 62.63], [70.0, 73.87], [75.0, 80.11]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.18, 0.0, 35.88, 0.0, 0.0, 60.51, 0.0, 39.25, 38.36], "audiomae_on_audioset": [null, null, null, null, null, null, [["whale vocalization", 31.47], ["livestock, farm animals, working animals", 13.03], ["hum", 12.31]], null, [["music", 49.69], ["musical instrument", 13.78], ["didgeridoo", 4.93]], null, null, null, null, [["music", 71.8], ["boing", 4.84], ["musical instrument", 3.57]], [["music", 64.8], ["musical instrument", 7.16], ["brass instrument", 6.94]]], "duration": [0.63, -0.33, 0.97, 0.42, -0.14, 1.26, 7.91, 0.13, 22.27, 0.37, 1.68, 3.18, 0.63, 3.87, 5.11]} \ No newline at end of file diff --git a/annotations_1/hzmZJcPlJlE_filtered.json b/annotations_1/hzmZJcPlJlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c1d1ef8c8576d0bd6bc850e243b80dfe5fc52c8 --- /dev/null +++ b/annotations_1/hzmZJcPlJlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.94], [12.0, 15.25], [16.0, 24.11], [25.0, 25.81], [28.0, 29.98], [32.0, 32.0], [33.0, 33.47], [34.0, 43.16], [48.0, 52.37], [55.0, 55.07], [56.0, 56.86], [58.0, 107.42], [110.0, 123.47], [127.0, 132.17], [135.0, 142.15], [144.0, 148.24], [155.0, 156.09], [158.0, 159.0], [161.0, 164.42]], "keep_status": [false, true, true, false, false, false, false, true, true, false, false, false, true, false, true, true, false, false, true], "silence_prob": [0.0, 29.61, 33.93, 0.0, 0.0, 0.0, 0.0, 28.54, 29.25, 0.0, 0.0, 0.0, 28.34, 29.25, 28.78, 28.87, 0.0, 0.0, 29.61], "audiomae_on_audioset": [null, [["sound effect", 16.12], ["speech", 10.61], ["echo", 9.85]], [["music", 29.24], ["noise", 9.61], ["buzz", 7.5]], null, null, null, null, [["music", 12.68], ["fly, housefly", 12.58], ["mosquito", 10.96]], [["foghorn", 36.99], ["theremin", 11.83], ["music", 9.95]], null, null, null, [["speech", 14.55], ["music", 13.34], ["buzz", 9.68]], [["music", 69.45], ["speech", 5.01], ["animal", 3.07]], [["music", 19.2], ["pulse", 6.21], ["sound effect", 5.88]], [["music", 39.21], ["hum", 6.98], ["musical instrument", 6.66]], null, null, [["foghorn", 24.99], ["music", 17.64], ["trombone", 16.74]]], "duration": [0.94, 3.25, 8.11, 0.81, 1.98, 0.0, 0.47, 9.16, 4.37, 0.07, 0.86, 49.42, 13.47, 5.17, 7.15, 4.24, 1.09, 1.0, 3.42]} \ No newline at end of file diff --git a/annotations_1/i-2kXcQgs_w_filtered.json b/annotations_1/i-2kXcQgs_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6800b234e211ce713747d1ed25f7a95c685de8ac --- /dev/null +++ b/annotations_1/i-2kXcQgs_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.78], [5.0, 5.75], [10.0, 13.36], [14.0, 15.01], [16.0, 16.77], [18.0, 20.82], [21.0, 21.03], [21.0, 21.07], [21.0, 21.44], [22.0, 22.6], [25.0, 30.13], [33.0, 34.37], [35.0, 36.96], [38.0, 44.36], [45.0, 49.72], [53.0, 53.11], [55.0, 55.92], [60.0, 64.03], [67.0, 68.57], [70.0, 71.25], [73.0, 74.63], [76.0, 85.65], [90.0, 91.76]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.81, 0.0, 0.0, 76.37, 0.0, 0.0, 0.0, 0.0, 29.86, 0.0, 0.0, 100.0, 99.85, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 49.05], ["sidetone", 14.96], ["crackle", 3.11]], null, null, null, null, null, null, null, [["speech", 48.12], ["whack, thwack", 13.41], ["music", 5.62]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 0.75, 3.36, 1.01, 0.77, 2.82, 0.03, 0.07, 0.44, 0.6, 5.13, 1.37, 1.96, 6.36, 4.72, 0.11, 0.92, 4.03, 1.57, 1.25, 1.63, 9.65, 1.76]} \ No newline at end of file diff --git a/annotations_1/i07yEczcujQ_filtered.json b/annotations_1/i07yEczcujQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fef55c8bd8975f654568b00e668849d0e4a18e9a --- /dev/null +++ b/annotations_1/i07yEczcujQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.65], [13.0, 15.03], [16.0, 16.73], [18.0, 18.17], [19.0, 19.8], [21.0, 21.84], [27.0, 27.11], [29.0, 30.05], [34.0, 37.25], [42.0, 42.9], [44.0, 45.25], [49.0, 50.06], [55.0, 55.12], [57.0, 57.72], [65.0, 65.06], [77.0, 78.24], [80.0, 80.76], [85.0, 86.91], [88.0, 88.69], [90.0, 90.53], [91.0, 92.33], [93.0, 93.99], [97.0, 97.46], [100.0, 100.62], [104.0, 104.33], [107.0, 107.43], [108.0, 108.99]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 30.49], ["whale vocalization", 15.65], ["hum", 7.21]], null, null, null, null, null, null, [["music", 58.09], ["theremin", 13.29], ["musical instrument", 6.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 2.03, 0.73, 0.17, 0.8, 0.84, 0.11, 1.05, 3.25, 0.9, 1.25, 1.06, 0.12, 0.72, 0.06, 1.24, 0.76, 1.91, 0.69, 0.53, 1.33, 0.99, 0.46, 0.62, 0.33, 0.43, 0.99]} \ No newline at end of file diff --git a/annotations_1/i1igdJh44yU_filtered.json b/annotations_1/i1igdJh44yU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ed6adcd8b04ea7423a8761403bbf52a47ce90ff --- /dev/null +++ b/annotations_1/i1igdJh44yU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 34.18], [70.0, 71.42], [74.0, 96.31], [97.0, 97.78], [98.0, 99.49], [101.0, 102.41], [109.0, 111.42], [116.0, 117.12], [123.0, 124.95], [130.0, 131.48], [141.0, 143.45], [148.0, 148.09], [156.0, 158.3]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, true], "silence_prob": [28.51, 0.0, 28.83, 0.0, 0.0, 0.0, 32.82, 0.0, 0.0, 0.0, 37.04, 0.0, 34.88], "audiomae_on_audioset": [[["music", 62.8], ["electronic music", 11.65], ["speech", 4.74]], null, [["music", 92.84], ["techno", 1.69], ["electronic music", 1.42]], null, null, null, [["livestock, farm animals, working animals", 18.75], ["moo", 16.55], ["sheep", 15.99]], null, null, null, [["speech", 26.5], ["fly, housefly", 15.29], ["insect", 10.15]], null, [["sheep", 13.73], ["bleat", 11.43], ["fly, housefly", 10.85]]], "duration": [25.18, 1.42, 22.31, 0.78, 1.49, 1.41, 2.42, 1.12, 1.95, 1.48, 2.45, 0.09, 2.3]} \ No newline at end of file diff --git a/annotations_1/i2xyQnF1kro_filtered.json b/annotations_1/i2xyQnF1kro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b73a6af2d0bdcc62c443e4636d02d5550b367abf --- /dev/null +++ b/annotations_1/i2xyQnF1kro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.04], [5.0, 21.29], [25.0, 26.33], [27.0, 28.92], [30.0, 30.52], [39.0, 43.39], [44.0, 44.09], [45.0, 45.74], [47.0, 47.51], [53.0, 54.41], [55.0, 56.69], [61.0, 61.26], [62.0, 67.83], [83.0, 84.32], [86.0, 87.13], [88.0, 89.18], [91.0, 93.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 73.21, 0.0, 0.0, 0.0, 78.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.02, 0.0, 0.0, 0.0, 98.27], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.01], ["fly, housefly", 17.05], ["insect", 9.94]], null, null, null, null], "duration": [0.04, 16.29, 1.33, 1.92, 0.52, 4.39, 0.09, 0.74, 0.51, 1.41, 1.69, 0.26, 5.83, 1.32, 1.13, 1.18, 2.23]} \ No newline at end of file diff --git a/annotations_1/i31XFSORRfc_filtered.json b/annotations_1/i31XFSORRfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3bdf27a1003d57e9ad5141a1c68aa02e02bce97 --- /dev/null +++ b/annotations_1/i31XFSORRfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 35.72], [37.0, 45.1], [46.0, 51.04], [58.0, 64.05], [66.0, 66.5], [68.0, 95.77], [96.0, 106.76], [108.0, 111.96], [113.0, 123.42], [125.0, 125.27], [126.0, 131.52], [133.0, 135.58], [139.0, 159.33]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [28.83, 29.49, 29.61, 34.56, 0.0, 32.56, 30.6, 42.58, 30.03, 0.0, 61.18, 29.71, 29.77], "audiomae_on_audioset": [[["music", 31.67], ["hum", 21.22], ["rumble", 10.66]], [["hum", 30.48], ["mains hum", 24.58], ["rumble", 15.42]], [["music", 60.87], ["hum", 5.59], ["mains hum", 4.6]], [["hum", 29.71], ["music", 24.93], ["mains hum", 21.21]], null, [["music", 43.6], ["hum", 29.88], ["mains hum", 12.04]], [["hum", 41.93], ["mains hum", 14.03], ["music", 14.03]], [["music", 67.71], ["sonar", 4.39], ["synthesizer", 3.43]], [["music", 57.83], ["scary music", 16.85], ["speech", 9.69]], null, null, [["music", 51.76], ["speech", 23.55], ["mains hum", 6.43]], [["music", 44.19], ["buzz", 9.36], ["mains hum", 5.14]]], "duration": [8.72, 8.1, 5.04, 6.05, 0.5, 27.77, 10.76, 3.96, 10.42, 0.27, 5.52, 2.58, 20.33]} \ No newline at end of file diff --git a/annotations_1/i3VNgECX8Ko_filtered.json b/annotations_1/i3VNgECX8Ko_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e335a6d1b95ca7e954f444259faf8b305b3c0b5 --- /dev/null +++ b/annotations_1/i3VNgECX8Ko_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.49], [24.0, 26.49], [29.0, 61.16], [63.0, 70.71], [71.0, 71.0], [72.0, 72.13], [76.0, 111.48], [112.0, 111.52]], "keep_status": [false, true, false, true, false, false, false, false], "silence_prob": [0.0, 36.41, 0.0, 34.15, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 42.58], ["hum", 8.19], ["vehicle", 6.54]], null, [["music", 45.39], ["speech", 14.19], ["throbbing", 6.81]], null, null, null, null], "duration": [1.49, 2.49, 32.16, 7.71, 0.0, 0.13, 35.48, -0.48]} \ No newline at end of file diff --git a/annotations_1/i3yO0OagpNY_filtered.json b/annotations_1/i3yO0OagpNY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6df3013821b5a1252ee6035f000eb7c97479aeb0 --- /dev/null +++ b/annotations_1/i3yO0OagpNY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 23.45], [24.0, 33.45], [34.0, 34.2], [37.0, 37.77], [41.0, 41.76], [42.0, 59.95], [61.0, 83.2], [83.0, 86.21], [91.0, 116.95], [118.0, 123.75], [124.0, 124.88], [128.0, 154.95]], "keep_status": [true, true, false, false, false, true, true, true, true, true, false, true], "silence_prob": [30.42, 33.9, 0.0, 0.0, 0.0, 35.73, 42.13, 33.85, 30.39, 28.88, 0.0, 28.82], "audiomae_on_audioset": [[["music", 34.23], ["brass instrument", 16.41], ["foghorn", 7.97]], [["music", 50.74], ["brass instrument", 8.72], ["didgeridoo", 8.42]], null, null, null, [["music", 47.46], ["effects unit", 10.6], ["musical instrument", 7.21]], [["music", 51.33], ["synthesizer", 11.76], ["theremin", 5.42]], [["music", 47.53], ["musical instrument", 6.59], ["foghorn", 2.95]], [["music", 26.82], ["theremin", 10.71], ["trombone", 7.77]], [["machine gun", 16.76], ["synthesizer", 13.69], ["music", 11.99]], null, [["music", 62.02], ["electronic music", 3.5], ["eruption", 2.69]]], "duration": [6.45, 9.45, 0.2, 0.77, 0.76, 17.95, 22.2, 3.21, 25.95, 5.75, 0.88, 26.95]} \ No newline at end of file diff --git a/annotations_1/i4NIiCSEiTg_filtered.json b/annotations_1/i4NIiCSEiTg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c72f7d29f5f10340fb025a7a62dc6e56307ccbcd --- /dev/null +++ b/annotations_1/i4NIiCSEiTg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.48], [6.0, 6.08], [11.0, 11.65], [20.0, 20.83], [21.0, 30.48], [32.0, 32.44], [35.0, 41.69], [44.0, 45.0], [46.0, 47.71], [48.0, 48.86], [49.0, 52.07], [53.0, 54.09], [54.0, 54.67], [55.0, 56.13], [57.0, 57.82], [59.0, 61.33], [64.0, 65.67], [68.0, 73.84], [79.0, 87.59], [88.0, 91.74], [93.0, 96.15], [97.0, 98.54], [100.0, 111.79], [113.0, 114.12], [115.0, 123.87], [126.0, 126.1], [129.0, 130.77]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 66.15, 0.0, 49.87, 0.0, 0.0, 0.0, 58.98, 0.0, 0.0, 0.0, 0.0, 73.97, 0.0, 84.07, 61.97, 76.53, 83.7, 0.0, 38.72, 0.0, 40.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 46.88], ["guitar", 9.8], ["singing bowl", 6.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.5], ["hum", 7.69], ["cello", 4.24]], null, [["music", 45.64], ["hum", 4.52], ["musical instrument", 3.6]], null, null], "duration": [0.48, 0.08, 0.65, 0.83, 9.48, 0.44, 6.69, 1.0, 1.71, 0.86, 3.07, 1.09, 0.67, 1.13, 0.82, 2.33, 1.67, 5.84, 8.59, 3.74, 3.15, 1.54, 11.79, 1.12, 8.87, 0.1, 1.77]} \ No newline at end of file diff --git a/annotations_1/i4NRgUeziqA_filtered.json b/annotations_1/i4NRgUeziqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..733c6ec958d40182a22a7fc9a3baaade45095a32 --- /dev/null +++ b/annotations_1/i4NRgUeziqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 79.54], [84.0, 116.07], [117.0, 120.28], [121.0, 121.54], [124.0, 125.05]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 29.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 46.52], ["eruption", 11.52], ["explosion", 5.15]], null, null], "duration": [75.54, 32.07, 3.28, 0.54, 1.05]} \ No newline at end of file diff --git a/annotations_1/i5dTE5dgWOw_filtered.json b/annotations_1/i5dTE5dgWOw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b96b967e4703cc639dc5bdded1beaee811e3bbe --- /dev/null +++ b/annotations_1/i5dTE5dgWOw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[84.0, 93.66], [95.0, 179.34], [184.0, 184.5], [187.0, 188.03], [189.0, 190.38], [191.0, 208.95]], "keep_status": [false, false, false, false, false, false], "silence_prob": [29.22, 0.0, 0.0, 0.0, 0.0, 30.58], "audiomae_on_audioset": [[["music", 40.22], ["hum", 24.9], ["throbbing", 9.57]], null, null, null, null, [["speech", 63.8], ["hum", 11.05], ["music", 7.46]]], "duration": [9.66, 84.34, 0.5, 1.03, 1.38, 17.95]} \ No newline at end of file diff --git a/annotations_1/i6oNzS6kCR8_filtered.json b/annotations_1/i6oNzS6kCR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..938ec32a033bc4a9e36482ad1105607487383dd4 --- /dev/null +++ b/annotations_1/i6oNzS6kCR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.41], [9.0, 11.57], [14.0, 13.88], [15.0, 16.01], [19.0, 20.78], [23.0, 23.7], [25.0, 28.71], [31.0, 31.97], [33.0, 33.52], [34.0, 100.47], [102.0, 101.83]], "keep_status": [true, true, false, false, false, false, true, false, false, false, false], "silence_prob": [35.46, 42.74, 0.0, 0.0, 0.0, 0.0, 44.26, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 24.62], ["insect", 16.06], ["mains hum", 9.96]], [["speech", 14.46], ["music", 12.95], ["electric shaver, electric razor", 12.1]], null, null, null, null, [["music", 29.52], ["speech", 18.63], ["ding", 4.24]], null, null, null, null], "duration": [5.41, 2.57, -0.12, 1.01, 1.78, 0.7, 3.71, 0.97, 0.52, 66.47, -0.17]} \ No newline at end of file diff --git a/annotations_1/i7Jg_6-fYF8_filtered.json b/annotations_1/i7Jg_6-fYF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c603b9c662a3b6532b97e01632555dc8a937a9f --- /dev/null +++ b/annotations_1/i7Jg_6-fYF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.24], [6.0, 11.72], [14.0, 32.58], [35.0, 36.88], [41.0, 41.05], [42.0, 42.72], [45.0, 45.08], [46.0, 46.5], [48.0, 50.04], [54.0, 54.08], [56.0, 56.57], [62.0, 67.98], [69.0, 76.77], [80.0, 81.26], [86.0, 86.31], [88.0, 118.2], [120.0, 152.44]], "keep_status": [false, true, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 32.58, 30.45, 0.0, 0.0, 0.0, 0.0, 0.0, 33.56, 0.0, 0.0, 46.29, 51.02, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 44.86], ["livestock, farm animals, working animals", 6.42], ["fly, housefly", 5.37]], [["speech", 27.71], ["explosion", 21.89], ["artillery fire", 11.64]], null, null, null, null, null, [["speech", 32.85], ["whack, thwack", 23.92], ["hum", 5.26]], null, null, [["speech", 49.74], ["hum", 11.0], ["mains hum", 5.22]], null, null, null, null, null], "duration": [0.24, 5.72, 18.58, 1.88, 0.05, 0.72, 0.08, 0.5, 2.04, 0.08, 0.57, 5.98, 7.77, 1.26, 0.31, 30.2, 32.44]} \ No newline at end of file diff --git a/annotations_1/iA_KZwlnrcI_filtered.json b/annotations_1/iA_KZwlnrcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c44f17dd7a31daf0b0d8623b860b16e889f2e1f2 --- /dev/null +++ b/annotations_1/iA_KZwlnrcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.9], [10.0, 11.11], [12.0, 14.94], [15.0, 18.87], [20.0, 22.15], [23.0, 29.25], [31.0, 34.1], [37.0, 43.65], [44.0, 57.54], [61.0, 64.3], [65.0, 66.12], [68.0, 78.78], [81.0, 126.49], [127.0, 127.79]], "keep_status": [false, false, false, true, false, false, false, true, true, true, false, false, false, false], "silence_prob": [67.0, 0.0, 63.42, 44.93, 57.72, 74.44, 72.16, 31.39, 35.03, 30.71, 0.0, 31.55, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 46.88], ["whale vocalization", 8.01], ["music", 7.29]], null, null, null, [["music", 27.31], ["electric shaver, electric razor", 19.58], ["speech", 9.52]], [["music", 40.95], ["didgeridoo", 14.58], ["hum", 10.4]], [["hum", 22.51], ["throbbing", 18.8], ["speech", 15.09]], null, [["throbbing", 52.77], ["hum", 17.72], ["music", 11.24]], null, null], "duration": [2.9, 1.11, 2.94, 3.87, 2.15, 6.25, 3.1, 6.65, 13.54, 3.3, 1.12, 10.78, 45.49, 0.79]} \ No newline at end of file diff --git a/annotations_1/iAlU6xt7Y_s_filtered.json b/annotations_1/iAlU6xt7Y_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3601bb7d165c4645408cc04f0aaeb44bf89b37ee --- /dev/null +++ b/annotations_1/iAlU6xt7Y_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.89], [4.0, 5.24], [9.0, 10.35], [11.0, 12.11], [16.0, 15.9], [18.0, 18.91], [19.0, 20.38], [23.0, 25.24], [26.0, 26.42], [27.0, 28.97], [36.0, 37.29], [39.0, 39.16], [41.0, 41.96], [44.0, 45.81], [46.0, 48.59], [49.0, 58.02], [61.0, 65.26], [70.0, 70.39], [78.0, 79.81], [82.0, 85.21], [95.0, 96.21], [97.0, 100.5], [102.0, 106.52], [108.0, 109.86], [114.0, 116.04], [118.0, 119.97], [121.0, 128.78], [130.0, 130.23], [131.0, 138.27], [140.0, 140.05], [140.0, 141.56], [144.0, 144.15], [146.0, 146.7], [147.0, 148.39], [149.0, 149.01], [150.0, 150.87], [152.0, 154.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 87.92, 95.91, 0.0, 0.0, 96.77, 0.0, 85.35, 87.55, 0.0, 50.02, 0.0, 99.26, 0.0, 43.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.09], ["sidetone", 34.01], ["hum", 7.22]], null, null, null, null, null, null, null, null], "duration": [0.89, 1.24, 1.35, 1.11, -0.1, 0.91, 1.38, 2.24, 0.42, 1.97, 1.29, 0.16, 0.96, 1.81, 2.59, 9.02, 4.26, 0.39, 1.81, 3.21, 1.21, 3.5, 4.52, 1.86, 2.04, 1.97, 7.78, 0.23, 7.27, 0.05, 1.56, 0.15, 0.7, 1.39, 0.01, 0.87, 2.41]} \ No newline at end of file diff --git a/annotations_1/iAzMFB3QaBk_filtered.json b/annotations_1/iAzMFB3QaBk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e4d22e2e43f627c211b0b45500fcf1c3c70ebb4 --- /dev/null +++ b/annotations_1/iAzMFB3QaBk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.06], [4.0, 5.04], [9.0, 9.73], [13.0, 14.22], [17.0, 17.58], [22.0, 22.0], [24.0, 25.66], [42.0, 43.7], [45.0, 45.91], [54.0, 54.4], [63.0, 63.61], [66.0, 67.12], [68.0, 70.01], [73.0, 74.61], [76.0, 76.99], [77.0, 78.06], [78.0, 84.69], [85.0, 85.67], [86.0, 90.02], [94.0, 95.54], [97.0, 97.73], [98.0, 100.01], [112.0, 112.51], [113.0, 114.79], [121.0, 121.9], [126.0, 128.28], [129.0, 129.44], [141.0, 142.23], [144.0, 147.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 0.0, 0.0, 93.6, 0.0, 48.39, 0.0, 0.0, 70.44, 0.0, 0.0, 0.0, 47.39, 0.0, 0.0, 48.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.26], ["burping, eructation", 14.17], ["speech", 5.18]], null, null, null, null, null, null, [["noise", 18.82], ["whale vocalization", 14.95], ["hum", 12.18]], null, null, [["speech", 47.35], ["hum", 11.26], ["mains hum", 8.43]]], "duration": [1.06, 1.04, 0.73, 1.22, 0.58, 0.0, 1.66, 1.7, 0.91, 0.4, 0.61, 1.12, 2.01, 1.61, 0.99, 1.06, 6.69, 0.67, 4.02, 1.54, 0.73, 2.01, 0.51, 1.79, 0.9, 2.28, 0.44, 1.23, 3.23]} \ No newline at end of file diff --git a/annotations_1/iBptyagVaEQ_filtered.json b/annotations_1/iBptyagVaEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b32bb220dfa3d981fae4b0e8e6b5a64bed92b0e4 --- /dev/null +++ b/annotations_1/iBptyagVaEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 23.36], [24.0, 26.76], [28.0, 33.61], [36.0, 44.14], [46.0, 51.12], [52.0, 73.16], [74.0, 90.61], [91.0, 99.67]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [97.64, 98.1, 96.42, 97.83, 97.83, 97.11, 93.45, 95.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [6.36, 2.76, 5.61, 8.14, 5.12, 21.16, 16.61, 8.67]} \ No newline at end of file diff --git a/annotations_1/iDnE3PV4YNc_filtered.json b/annotations_1/iDnE3PV4YNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd272334f2a9d9142ff8981bd01d0430001555a3 --- /dev/null +++ b/annotations_1/iDnE3PV4YNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.6], [5.0, 7.5], [9.0, 10.15], [12.0, 18.49], [20.0, 21.83], [23.0, 24.92], [26.0, 27.01], [29.0, 38.38], [43.0, 43.46], [45.0, 45.35], [51.0, 51.63], [55.0, 55.44], [57.0, 62.5], [63.0, 69.62], [70.0, 81.35], [83.0, 89.75], [93.0, 97.33], [98.0, 98.63], [101.0, 100.85], [102.0, 103.84], [108.0, 108.9], [112.0, 116.7], [119.0, 129.95]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, true, true, true, false, false, false, false, false, true, true], "silence_prob": [0.0, 41.83, 0.0, 40.28, 0.0, 0.0, 0.0, 38.22, 0.0, 0.0, 0.0, 0.0, 42.26, 29.14, 29.59, 30.57, 48.19, 0.0, 0.0, 0.0, 0.0, 27.9, 28.48], "audiomae_on_audioset": [null, [["speech", 57.59], ["music", 14.68], ["sidetone", 3.59]], null, [["music", 35.84], ["hum", 14.51], ["throbbing", 11.16]], null, null, null, [["music", 54.63], ["hum", 14.04], ["mains hum", 6.63]], null, null, null, null, [["speech", 29.01], ["music", 22.72], ["hum", 8.43]], [["speech", 23.44], ["music", 20.54], ["rumble", 19.28]], [["music", 39.29], ["speech", 16.64], ["sound effect", 4.57]], [["music", 14.36], ["crack", 11.33], ["speech", 10.97]], [["theremin", 42.57], ["music", 36.77], ["synthesizer", 4.75]], null, null, null, null, [["music", 19.89], ["zipper (clothing)", 18.75], ["mosquito", 13.49]], [["mains hum", 27.65], ["hum", 23.95], ["electric shaver, electric razor", 12.47]]], "duration": [1.6, 2.5, 1.15, 6.49, 1.83, 1.92, 1.01, 9.38, 0.46, 0.35, 0.63, 0.44, 5.5, 6.62, 11.35, 6.75, 4.33, 0.63, -0.15, 1.84, 0.9, 4.7, 10.95]} \ No newline at end of file diff --git a/annotations_1/iErVeElswus_filtered.json b/annotations_1/iErVeElswus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8774e6a5661ca0ad80dc199d1cfb40b2e7832a52 --- /dev/null +++ b/annotations_1/iErVeElswus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.8], [8.0, 9.39], [13.0, 13.71], [19.0, 28.09], [28.0, 31.87], [33.0, 44.59], [45.0, 45.57], [47.0, 61.75], [63.0, 64.27], [65.0, 66.12], [69.0, 70.58], [71.0, 78.63], [79.0, 80.55], [82.0, 84.28], [85.0, 86.86], [88.0, 93.33], [94.0, 131.31]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 89.19, 98.51, 77.87, 0.0, 46.9, 0.0, 0.0, 0.0, 73.36, 0.0, 62.58, 0.0, 59.42, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["singing bowl", 28.09], ["speech", 27.43], ["hum", 8.78]], null, null, null, null, null, null, null, null, null], "duration": [0.8, 1.39, 0.71, 9.09, 3.87, 11.59, 0.57, 14.75, 1.27, 1.12, 1.58, 7.63, 1.55, 2.28, 1.86, 5.33, 37.31]} \ No newline at end of file diff --git a/annotations_1/iG5M3WSF1DY_filtered.json b/annotations_1/iG5M3WSF1DY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..797f90cdf0bdc7b5ba77212e26dedc333309397d --- /dev/null +++ b/annotations_1/iG5M3WSF1DY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.17], [10.0, 10.62], [11.0, 17.54], [19.0, 20.02], [22.0, 26.13], [28.0, 29.08], [30.0, 32.1], [35.0, 40.85], [42.0, 43.85], [46.0, 47.51], [50.0, 66.77], [68.0, 71.09], [72.0, 73.03], [74.0, 76.18], [77.0, 77.95], [79.0, 80.54], [82.0, 88.97], [91.0, 91.45], [94.0, 95.23], [96.0, 99.22], [100.0, 101.53], [104.0, 110.44], [112.0, 112.5], [117.0, 145.99], [149.0, 150.42], [152.0, 153.45]], "keep_status": [false, false, true, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 34.16, 0.0, 35.57, 0.0, 35.26, 29.45, 0.0, 0.0, 40.48, 94.37, 0.0, 40.17, 0.0, 0.0, 61.18, 0.0, 0.0, 58.13, 0.0, 29.96, 0.0, 31.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 22.1], ["cattle, bovinae", 20.15], ["moo", 12.1]], null, [["hum", 46.99], ["mains hum", 25.02], ["throbbing", 19.48]], null, [["speech", 56.38], ["vehicle", 6.31], ["music", 2.62]], [["music", 21.47], ["speech", 16.82], ["whip", 6.23]], null, null, [["music", 45.09], ["hum", 9.03], ["throbbing", 4.82]], null, null, [["speech", 45.14], ["fart", 37.06], ["music", 2.04]], null, null, null, null, null, null, null, [["music", 31.17], ["speech", 25.55], ["theremin", 2.18]], null, [["music", 18.23], ["thump, thud", 7.1], ["whack, thwack", 6.4]], null, null], "duration": [1.17, 0.62, 6.54, 1.02, 4.13, 1.08, 2.1, 5.85, 1.85, 1.51, 16.77, 3.09, 1.03, 2.18, 0.95, 1.54, 6.97, 0.45, 1.23, 3.22, 1.53, 6.44, 0.5, 28.99, 1.42, 1.45]} \ No newline at end of file diff --git a/annotations_1/iG5oSrAW9FQ_filtered.json b/annotations_1/iG5oSrAW9FQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6376f3dcfc6762fc3390c6293bfda4f6bf7d999d --- /dev/null +++ b/annotations_1/iG5oSrAW9FQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 46.45], [48.0, 90.14], [90.0, 92.5], [95.0, 107.38]], "keep_status": [true, false, false, true], "silence_prob": [30.4, 0.0, 30.75, 38.83], "audiomae_on_audioset": [[["music", 55.97], ["didgeridoo", 8.66], ["cattle, bovinae", 3.3]], null, [["speech", 59.65], ["buzzer", 14.96], ["music", 5.55]], [["cattle, bovinae", 18.97], ["moo", 14.52], ["sidetone", 10.94]]], "duration": [6.45, 42.14, 2.5, 12.38]} \ No newline at end of file diff --git a/annotations_1/iGVsptoMsKE_filtered.json b/annotations_1/iGVsptoMsKE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68232e726d5d899036be4b5d37c4879672d0aa72 --- /dev/null +++ b/annotations_1/iGVsptoMsKE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.59], [14.0, 14.67], [19.0, 31.35], [34.0, 43.11], [44.0, 44.74], [46.0, 94.96], [97.0, 105.93], [107.0, 107.43], [110.0, 110.74], [111.0, 112.97], [118.0, 118.15], [118.0, 119.37], [122.0, 129.84], [131.0, 142.26], [154.0, 154.99], [160.0, 160.79], [166.0, 175.05]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 35.73, 36.98, 0.0, 0.0, 30.01, 0.0, 0.0, 0.0, 0.0, 0.0, 30.04, 30.4, 0.0, 0.0, 31.7], "audiomae_on_audioset": [null, null, [["music", 48.66], ["fart", 7.24], ["hum", 5.22]], [["music", 71.57], ["wild animals", 7.95], ["animal", 4.3]], null, null, [["music", 43.11], ["hum", 12.51], ["theremin", 6.59]], null, null, null, null, null, [["music", 43.19], ["theremin", 35.74], ["speech", 2.43]], [["music", 61.32], ["theremin", 21.29], ["ambient music", 1.49]], null, null, [["music", 25.53], ["speech", 22.45], ["theremin", 9.75]]], "duration": [1.59, 0.67, 12.35, 9.11, 0.74, 48.96, 8.93, 0.43, 0.74, 1.97, 0.15, 1.37, 7.84, 11.26, 0.99, 0.79, 9.05]} \ No newline at end of file diff --git a/annotations_1/iGawlpfe6a0_filtered.json b/annotations_1/iGawlpfe6a0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73e4503191192b610f172ad6deafa863f46f66f9 --- /dev/null +++ b/annotations_1/iGawlpfe6a0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[53.0, 53.28], [66.0, 67.27], [84.0, 83.71], [87.0, 87.13], [88.0, 87.98]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.28, 1.27, -0.29, 0.13, -0.02]} \ No newline at end of file diff --git a/annotations_1/iGk7QYThMTk_filtered.json b/annotations_1/iGk7QYThMTk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f74fa908bc549397220eb4f699f972e55596d4d --- /dev/null +++ b/annotations_1/iGk7QYThMTk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 34.38], [35.0, 36.07], [38.0, 71.15], [72.0, 88.05], [88.0, 118.0], [120.0, 143.94], [145.0, 144.96], [145.0, 145.25], [146.0, 151.34], [151.0, 151.38], [152.0, 161.65], [164.0, 168.12]], "keep_status": [true, false, false, false, false, false, false, false, true, false, true, true], "silence_prob": [39.54, 0.0, 0.0, 30.31, 29.42, 30.42, 0.0, 0.0, 30.94, 0.0, 29.72, 36.16], "audiomae_on_audioset": [[["music", 31.51], ["effects unit", 5.94], ["frog", 3.93]], null, null, [["music", 75.01], ["mains hum", 7.01], ["hum", 6.95]], [["music", 50.79], ["speech", 13.39], ["fireworks", 6.89]], [["music", 57.44], ["effects unit", 7.16], ["musical instrument", 6.24]], null, null, [["music", 61.86], ["mains hum", 3.93], ["hum", 3.51]], null, [["music", 55.59], ["speech", 9.44], ["buzz", 4.53]], [["speech", 44.88], ["music", 11.06], ["fly, housefly", 4.08]]], "duration": [2.38, 1.07, 33.15, 16.05, 30.0, 23.94, -0.04, 0.25, 5.34, 0.38, 9.65, 4.12]} \ No newline at end of file diff --git a/annotations_1/iGsce-w4TtY_filtered.json b/annotations_1/iGsce-w4TtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddd9c10694396ec5705593091630c9c77f50f531 --- /dev/null +++ b/annotations_1/iGsce-w4TtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.99], [17.0, 36.36], [39.0, 40.05], [41.0, 43.65], [45.0, 61.35], [65.0, 83.07], [84.0, 84.43], [85.0, 92.75], [94.0, 97.53], [100.0, 109.65], [110.0, 110.27], [110.0, 110.79], [111.0, 125.9]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, true], "silence_prob": [30.21, 30.83, 0.0, 31.07, 30.23, 30.99, 0.0, 30.05, 29.97, 30.89, 0.0, 0.0, 29.16], "audiomae_on_audioset": [[["cattle, bovinae", 30.26], ["moo", 20.86], ["livestock, farm animals, working animals", 19.28]], [["cattle, bovinae", 58.38], ["moo", 23.1], ["livestock, farm animals, working animals", 15.53]], null, [["music", 34.59], ["speech", 34.37], ["electronic music", 4.24]], [["speech", 32.31], ["explosion", 14.52], ["whack, thwack", 5.86]], [["speech", 43.59], ["fart", 32.67], ["music", 5.16]], null, [["explosion", 39.01], ["speech", 25.4], ["eruption", 8.03]], [["speech", 26.47], ["fart", 24.86], ["explosion", 19.57]], [["hum", 21.05], ["rumble", 10.63], ["speech", 8.85]], null, null, [["grunt", 11.85], ["music", 8.36], ["hum", 6.14]]], "duration": [2.99, 19.36, 1.05, 2.65, 16.35, 18.07, 0.43, 7.75, 3.53, 9.65, 0.27, 0.79, 14.9]} \ No newline at end of file diff --git a/annotations_1/iHQZhYadNwQ_filtered.json b/annotations_1/iHQZhYadNwQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47e6cf46920bcdcf19f687b243661b9ac9f0d37a --- /dev/null +++ b/annotations_1/iHQZhYadNwQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 27.57], [28.0, 58.7], [62.0, 65.33], [66.0, 67.1], [68.0, 73.45], [74.0, 76.35], [77.0, 79.57], [80.0, 83.12], [84.0, 91.37], [93.0, 99.81], [101.0, 103.6], [106.0, 111.47], [113.0, 133.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.38, 0.0, 75.39, 0.0, 94.52, 96.66, 93.91, 93.91, 85.72, 96.29, 96.66, 82.07, 66.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.57, 30.7, 3.33, 1.1, 5.45, 2.35, 2.57, 3.12, 7.37, 6.81, 2.6, 5.47, 20.1]} \ No newline at end of file diff --git a/annotations_1/iJDnG2RAlzk_filtered.json b/annotations_1/iJDnG2RAlzk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab9c04ce9deaeb35607de7a4d45861294715b2ec --- /dev/null +++ b/annotations_1/iJDnG2RAlzk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.33], [16.0, 16.92], [21.0, 20.63], [21.0, 30.25], [31.0, 59.93], [61.0, 71.46], [72.0, 73.35], [74.0, 76.69], [79.0, 80.45], [82.0, 83.4], [84.0, 85.99], [87.0, 95.1]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 32.52, 31.67, 30.88, 0.0, 40.71, 0.0, 0.0, 0.0, 32.2], "audiomae_on_audioset": [null, null, null, [["speech", 49.88], ["sidetone", 13.96], ["electric shaver, electric razor", 11.86]], [["livestock, farm animals, working animals", 30.08], ["cattle, bovinae", 19.19], ["moo", 17.59]], [["speech", 28.08], ["music", 8.45], ["fly, housefly", 8.26]], null, [["whale vocalization", 38.83], ["speech", 33.58], ["music", 3.42]], null, null, null, [["speech", 45.84], ["explosion", 12.3], ["rumble", 7.59]]], "duration": [0.33, 0.92, -0.37, 9.25, 28.93, 10.46, 1.35, 2.69, 1.45, 1.4, 1.99, 8.1]} \ No newline at end of file diff --git a/annotations_1/iJGazi2EdrQ_filtered.json b/annotations_1/iJGazi2EdrQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..172fdc62f6b87303566499b7b7c4e8842f1972f6 --- /dev/null +++ b/annotations_1/iJGazi2EdrQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.83], [5.0, 6.49], [7.0, 8.34], [9.0, 9.1], [11.0, 11.25], [14.0, 15.26], [16.0, 16.51], [19.0, 19.36], [21.0, 23.62], [25.0, 30.57], [32.0, 75.46], [77.0, 84.59], [85.0, 99.3], [102.0, 107.13], [107.0, 111.6], [113.0, 116.72], [120.0, 120.6], [122.0, 124.44], [125.0, 135.14], [136.0, 141.35], [142.0, 144.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.16, 0.0, 98.44, 83.16, 94.66, 83.7, 85.72, 0.0, 95.37, 72.75, 81.53, 56.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.83, 1.49, 1.34, 0.1, 0.25, 1.26, 0.51, 0.36, 2.62, 5.57, 43.46, 7.59, 14.3, 5.13, 4.6, 3.72, 0.6, 2.44, 10.14, 5.35, 2.37]} \ No newline at end of file diff --git a/annotations_1/iJKQl3uGg0I_filtered.json b/annotations_1/iJKQl3uGg0I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26928dc7bd547ec40cd1c0a157d433fb2c09281b --- /dev/null +++ b/annotations_1/iJKQl3uGg0I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [3.0, 4.13], [6.0, 7.11], [8.0, 9.53], [10.0, 11.31], [12.0, 12.78], [14.0, 18.35], [20.0, 20.68], [25.0, 25.88], [27.0, 28.44], [29.0, 29.42], [31.0, 33.32], [34.0, 34.55], [37.0, 43.5], [45.0, 45.64], [50.0, 50.79], [52.0, 56.27], [59.0, 59.24], [62.0, 63.02], [65.0, 65.08], [66.0, 67.69], [69.0, 69.31], [70.0, 71.36], [73.0, 74.14], [76.0, 77.85], [80.0, 80.86], [82.0, 83.12], [84.0, 85.63], [87.0, 87.24], [88.0, 99.22], [101.0, 102.12], [103.0, 103.87], [104.0, 107.4], [110.0, 110.37], [120.0, 121.68], [123.0, 123.96], [125.0, 125.83], [129.0, 129.02], [130.0, 131.46], [133.0, 132.87], [137.0, 139.14], [142.0, 143.29], [145.0, 145.32], [146.0, 146.48], [148.0, 149.23], [150.0, 151.43], [153.0, 154.14], [155.0, 156.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.96, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 37.21, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 56.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 63.58], ["hum", 4.11], ["radio", 3.43]], null, null, null, null, null, null, [["music", 17.13], ["fart", 14.13], ["speech", 10.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.44, 1.13, 1.11, 1.53, 1.31, 0.78, 4.35, 0.68, 0.88, 1.44, 0.42, 2.32, 0.55, 6.5, 0.64, 0.79, 4.27, 0.24, 1.02, 0.08, 1.69, 0.31, 1.36, 1.14, 1.85, 0.86, 1.12, 1.63, 0.24, 11.22, 1.12, 0.87, 3.4, 0.37, 1.68, 0.96, 0.83, 0.02, 1.46, -0.13, 2.14, 1.29, 0.32, 0.48, 1.23, 1.43, 1.14, 1.66]} \ No newline at end of file diff --git a/annotations_1/iJ_DrM05hp4_filtered.json b/annotations_1/iJ_DrM05hp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf10cda20fe0ab35244e0c8731e1773ade72b6a2 --- /dev/null +++ b/annotations_1/iJ_DrM05hp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.19], [9.0, 9.54], [15.0, 15.31], [17.0, 17.51], [24.0, 26.05], [29.0, 30.0], [35.0, 35.56], [37.0, 37.66], [41.0, 41.05], [44.0, 44.24], [50.0, 50.9], [54.0, 53.7], [60.0, 61.8], [89.0, 89.55], [90.0, 91.1], [92.0, 92.38], [122.0, 123.09], [140.0, 140.29], [145.0, 145.47], [147.0, 148.26], [150.0, 150.47], [154.0, 155.01], [162.0, 162.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 0.54, 0.31, 0.51, 2.05, 1.0, 0.56, 0.66, 0.05, 0.24, 0.9, -0.3, 1.8, 0.55, 1.1, 0.38, 1.09, 0.29, 0.47, 1.26, 0.47, 1.01, 0.77]} \ No newline at end of file diff --git a/annotations_1/iJrgXYnUVe8_filtered.json b/annotations_1/iJrgXYnUVe8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d95d6c089f27f0010d0e6f69c5efe411cf8a60ab --- /dev/null +++ b/annotations_1/iJrgXYnUVe8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 27.35], [29.0, 30.54], [33.0, 33.81], [37.0, 39.29], [41.0, 41.2], [42.0, 79.69], [82.0, 82.56], [88.0, 87.72], [93.0, 95.01], [96.0, 98.27], [102.0, 102.86], [104.0, 104.77], [114.0, 118.02], [120.0, 124.28], [126.0, 128.68]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [30.94, 0.0, 0.0, 32.73, 0.0, 0.0, 0.0, 0.0, 100.0, 94.52, 0.0, 0.0, 30.83, 30.21, 32.64], "audiomae_on_audioset": [[["hum", 46.47], ["throbbing", 43.11], ["music", 6.14]], null, null, [["music", 19.19], ["hum", 14.31], ["rumble", 7.31]], null, null, null, null, null, null, null, null, [["boom", 24.09], ["whack, thwack", 9.47], ["explosion", 9.43]], [["speech", 30.7], ["boing", 21.92], ["music", 11.72]], [["music", 41.53], ["boing", 21.77], ["speech", 5.51]]], "duration": [17.35, 1.54, 0.81, 2.29, 0.2, 37.69, 0.56, -0.28, 2.01, 2.27, 0.86, 0.77, 4.02, 4.28, 2.68]} \ No newline at end of file diff --git a/annotations_1/iK03b228mmo_filtered.json b/annotations_1/iK03b228mmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f73cf951c694189ff4769083751fa7fc2952c41e --- /dev/null +++ b/annotations_1/iK03b228mmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.85], [11.0, 17.74], [18.0, 19.63], [22.0, 25.62], [27.0, 29.37], [31.0, 32.04], [33.0, 39.68], [40.0, 41.13], [43.0, 44.2], [45.0, 54.51], [55.0, 55.9], [56.0, 68.79], [70.0, 86.02], [89.0, 90.24], [94.0, 110.94], [117.0, 118.56], [122.0, 125.44], [131.0, 130.87], [132.0, 140.09], [142.0, 152.68], [157.0, 166.24]], "keep_status": [true, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true], "silence_prob": [29.13, 29.07, 0.0, 30.24, 32.05, 0.0, 30.73, 0.0, 0.0, 30.33, 0.0, 30.85, 29.43, 0.0, 31.63, 0.0, 32.77, 0.0, 36.35, 34.66, 35.37], "audiomae_on_audioset": [[["music", 47.5], ["hum", 8.65], ["throbbing", 8.04]], [["music", 30.56], ["hum", 13.73], ["throbbing", 12.16]], null, [["music", 21.14], ["hum", 17.92], ["throbbing", 7.06]], [["music", 46.54], ["hum", 11.33], ["throbbing", 8.23]], null, [["music", 31.96], ["hum", 22.62], ["speech", 18.78]], null, null, [["speech", 34.61], ["hum", 20.0], ["music", 18.54]], null, [["didgeridoo", 72.48], ["music", 11.04], ["gong", 2.44]], [["hum", 29.3], ["didgeridoo", 23.52], ["music", 19.48]], null, [["music", 45.04], ["hum", 27.01], ["throbbing", 9.71]], null, [["music", 35.98], ["hum", 7.37], ["speech", 6.82]], null, [["hum", 33.84], ["mains hum", 23.41], ["music", 20.84]], [["mains hum", 34.7], ["hum", 19.0], ["speech", 8.17]], [["music", 25.51], ["mains hum", 14.37], ["hum", 8.57]]], "duration": [5.85, 6.74, 1.63, 3.62, 2.37, 1.04, 6.68, 1.13, 1.2, 9.51, 0.9, 12.79, 16.02, 1.24, 16.94, 1.56, 3.44, -0.13, 8.09, 10.68, 9.24]} \ No newline at end of file diff --git a/annotations_1/iKRpMjVJKZc_filtered.json b/annotations_1/iKRpMjVJKZc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f0fc91a0d223c0eb66cb62a86457d13eb46ae1f --- /dev/null +++ b/annotations_1/iKRpMjVJKZc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.73], [12.0, 12.16], [16.0, 16.34], [19.0, 20.38], [23.0, 24.09], [25.0, 25.42], [27.0, 27.8], [29.0, 29.51], [36.0, 36.58], [42.0, 45.27], [49.0, 48.64], [50.0, 50.77], [52.0, 53.87], [55.0, 55.66], [60.0, 60.03], [64.0, 64.5], [65.0, 66.18], [67.0, 68.32], [77.0, 79.79], [81.0, 81.53], [83.0, 84.5], [97.0, 97.38], [99.0, 99.59], [100.0, 103.42], [105.0, 118.12], [123.0, 125.59], [135.0, 151.7], [154.0, 154.55], [156.0, 161.45], [163.0, 170.16], [172.0, 175.85], [177.0, 177.9]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.96, 0.0, 0.0, 0.0, 0.0, 30.72, 32.46, 39.44, 30.42, 0.0, 32.15, 33.92, 39.15, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 33.17], ["frog", 15.14], ["sidetone", 7.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["moo", 23.99], ["cattle, bovinae", 22.16], ["music", 15.88]], [["music", 53.39], ["electronic music", 6.27], ["techno", 5.91]], [["fly, housefly", 25.48], ["insect", 14.55], ["music", 11.41]], [["music", 46.82], ["speech", 10.53], ["theremin", 3.96]], null, [["music", 63.06], ["trance music", 7.07], ["speech", 5.71]], [["music", 45.01], ["sidetone", 30.87], ["speech", 9.5]], [["music", 28.33], ["speech", 17.68], ["fly, housefly", 9.37]], null], "duration": [0.73, 0.16, 0.34, 1.38, 1.09, 0.42, 0.8, 0.51, 0.58, 3.27, -0.36, 0.77, 1.87, 0.66, 0.03, 0.5, 1.18, 1.32, 2.79, 0.53, 1.5, 0.38, 0.59, 3.42, 13.12, 2.59, 16.7, 0.55, 5.45, 7.16, 3.85, 0.9]} \ No newline at end of file diff --git a/annotations_1/iKS_327EF84_filtered.json b/annotations_1/iKS_327EF84_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c05d7f2a37cb41e5fa3dc55572db75f139090c01 --- /dev/null +++ b/annotations_1/iKS_327EF84_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.7], [15.0, 16.11], [17.0, 20.14], [21.0, 25.46], [30.0, 31.94], [33.0, 40.63], [47.0, 49.37], [66.0, 71.71], [82.0, 84.62], [86.0, 87.72], [90.0, 96.09], [99.0, 101.09], [110.0, 116.95], [125.0, 168.98], [173.0, 174.09], [174.0, 174.24], [177.0, 176.89]], "keep_status": [false, false, true, true, false, true, true, true, true, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 32.08, 30.08, 0.0, 29.25, 31.32, 29.91, 33.34, 0.0, 31.36, 30.68, 30.08, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 31.67], ["music", 27.9], ["speech", 6.95]], [["speech", 35.46], ["music", 24.92], ["electronic music", 6.76]], null, [["music", 24.12], ["electronic music", 16.81], ["speech", 9.92]], [["music", 29.05], ["throbbing", 19.26], ["hum", 7.23]], [["music", 24.72], ["throbbing", 13.05], ["hum", 7.24]], [["fly, housefly", 20.14], ["mosquito", 16.67], ["groan", 11.6]], null, [["music", 60.43], ["didgeridoo", 3.97], ["throbbing", 2.8]], [["speech", 32.47], ["music", 17.61], ["outside, urban or manmade", 3.71]], [["buzz", 31.55], ["fly, housefly", 12.15], ["mosquito", 12.15]], null, null, null, null], "duration": [1.7, 1.11, 3.14, 4.46, 1.94, 7.63, 2.37, 5.71, 2.62, 1.72, 6.09, 2.09, 6.95, 43.98, 1.09, 0.24, -0.11]} \ No newline at end of file diff --git a/annotations_1/iKduvC0uNs8_filtered.json b/annotations_1/iKduvC0uNs8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dce2d841152e643e2e96d88d3c3a3b1a6bacb455 --- /dev/null +++ b/annotations_1/iKduvC0uNs8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 61.8], [62.0, 73.55], [78.0, 80.79], [82.0, 101.44], [104.0, 110.1], [115.0, 123.31], [123.0, 137.35], [140.0, 142.11], [145.0, 150.87], [152.0, 152.31]], "keep_status": [false, false, true, false, false, false, true, false, false, false], "silence_prob": [35.8, 32.23, 29.51, 29.02, 28.78, 29.04, 29.01, 55.74, 48.69, 0.0], "audiomae_on_audioset": [[["music", 53.32], ["mains hum", 21.54], ["hum", 15.75]], [["music", 66.64], ["didgeridoo", 6.62], ["throbbing", 3.27]], [["music", 33.88], ["shofar", 15.88], ["wind instrument, woodwind instrument", 4.61]], [["music", 72.05], ["synthesizer", 6.48], ["musical instrument", 3.69]], [["music", 71.57], ["musical instrument", 3.08], ["vehicle", 2.23]], [["music", 52.55], ["theremin", 15.68], ["speech", 2.88]], [["music", 21.94], ["wind instrument, woodwind instrument", 15.07], ["shofar", 8.64]], null, [["music", 42.94], ["didgeridoo", 27.73], ["musical instrument", 3.78]], null], "duration": [13.8, 11.55, 2.79, 19.44, 6.1, 8.31, 14.35, 2.11, 5.87, 0.31]} \ No newline at end of file diff --git a/annotations_1/iKi2wYZNAnE_filtered.json b/annotations_1/iKi2wYZNAnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80f724378da20af00726f9443c8af7a66f553f68 --- /dev/null +++ b/annotations_1/iKi2wYZNAnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.31], [12.0, 13.83], [19.0, 20.19], [23.0, 26.45], [30.0, 32.54], [34.0, 34.89], [39.0, 39.51], [48.0, 51.34], [52.0, 53.52], [54.0, 54.5], [55.0, 56.17], [67.0, 66.97], [69.0, 69.5], [79.0, 80.13], [81.0, 81.5], [82.0, 83.39], [103.0, 103.94], [113.0, 113.68]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.39, 41.64, 0.0, 0.0, 32.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 20.12], ["livestock, farm animals, working animals", 19.33], ["cattle, bovinae", 17.62]], [["speech", 15.41], ["mains hum", 7.01], ["moo", 5.41]], null, null, [["music", 37.76], ["didgeridoo", 14.12], ["speech", 8.97]], null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 1.83, 1.19, 3.45, 2.54, 0.89, 0.51, 3.34, 1.52, 0.5, 1.17, -0.03, 0.5, 1.13, 0.5, 1.39, 0.94, 0.68]} \ No newline at end of file diff --git a/annotations_1/iKp5ARBBpyc_filtered.json b/annotations_1/iKp5ARBBpyc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c076a4e2faa8ab99f6af5bf55b3634a086793851 --- /dev/null +++ b/annotations_1/iKp5ARBBpyc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.68], [16.0, 20.51], [21.0, 22.03], [31.0, 31.68], [40.0, 40.36], [43.0, 44.04], [45.0, 46.33], [52.0, 54.11], [64.0, 65.21], [72.0, 72.22], [73.0, 74.04], [74.0, 74.98], [79.0, 80.62], [82.0, 83.46], [94.0, 94.14], [100.0, 103.0], [110.0, 111.0], [124.0, 124.98], [125.0, 125.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 42.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["tuning fork", 48.87], ["speech", 28.73], ["busy signal", 4.88]], null, null, null, null, null, null, null, [["sidetone", 38.08], ["noise", 17.7], ["music", 6.87]], null, null, null], "duration": [0.68, 4.51, 1.03, 0.68, 0.36, 1.04, 1.33, 2.11, 1.21, 0.22, 1.04, 0.98, 1.62, 1.46, 0.14, 3.0, 1.0, 0.98, 0.64]} \ No newline at end of file diff --git a/annotations_1/iKscMa0XRXo_filtered.json b/annotations_1/iKscMa0XRXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d04a2c2e7a08abf9437ed2d4e9d2f1f8a7d515b --- /dev/null +++ b/annotations_1/iKscMa0XRXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.53], [10.0, 10.15], [13.0, 12.66], [29.0, 31.04], [39.0, 39.01], [41.0, 41.76], [51.0, 52.59], [54.0, 55.53], [94.0, 94.61], [124.0, 124.78], [125.0, 125.52], [163.0, 164.42]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 42.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["single-lens reflex camera", 36.51], ["music", 10.69], ["noise", 9.08]], null, null, null, null, null, null, null, null], "duration": [0.53, 0.15, -0.34, 2.04, 0.01, 0.76, 1.59, 1.53, 0.61, 0.78, 0.52, 1.42]} \ No newline at end of file diff --git a/annotations_1/iLFMRsi07_I_filtered.json b/annotations_1/iLFMRsi07_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/iLFMRsi07_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/iLJtz-2nkGk_filtered.json b/annotations_1/iLJtz-2nkGk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..143cf5e937c5782a9171f4809b8e1ad3db266e70 --- /dev/null +++ b/annotations_1/iLJtz-2nkGk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.28], [17.0, 17.47], [19.0, 20.19], [22.0, 23.68], [27.0, 35.85], [38.0, 58.28], [63.0, 63.29], [65.0, 80.37], [82.0, 84.33], [85.0, 86.32], [94.0, 102.68], [103.0, 107.79], [108.0, 109.05], [110.0, 111.03], [112.0, 112.4], [114.0, 116.6], [121.0, 125.74], [127.0, 126.87], [129.0, 130.54], [131.0, 132.06], [134.0, 157.0], [161.0, 161.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 54.83, 30.04, 0.0, 30.38, 29.64, 0.0, 30.83, 31.5, 0.0, 0.0, 0.0, 30.14, 30.63, 0.0, 0.0, 0.0, 32.15, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 48.94], ["speech", 22.95], ["thump, thud", 5.02]], null, [["music", 49.38], ["speech", 42.72], ["electronic music", 0.53]], [["music", 47.85], ["cacophony", 33.54], ["throbbing", 6.25]], null, [["music", 55.03], ["didgeridoo", 12.44], ["speech", 12.31]], [["speech", 41.94], ["music", 38.22], ["musical instrument", 2.24]], null, null, null, [["music", 65.64], ["musical instrument", 3.85], ["drum", 1.95]], [["speech", 49.72], ["music", 14.9], ["vehicle", 3.36]], null, null, null, [["speech", 39.5], ["music", 14.56], ["sound effect", 4.48]], null], "duration": [0.28, 0.47, 1.19, 1.68, 8.85, 20.28, 0.29, 15.37, 2.33, 1.32, 8.68, 4.79, 1.05, 1.03, 0.4, 2.6, 4.74, -0.13, 1.54, 1.06, 23.0, 0.76]} \ No newline at end of file diff --git a/annotations_1/iLN9GLRC5is_filtered.json b/annotations_1/iLN9GLRC5is_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec132a116b6006c1da9d6406e4ae5ca615a1d94e --- /dev/null +++ b/annotations_1/iLN9GLRC5is_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.41], [16.0, 18.17], [21.0, 21.96], [30.0, 30.33], [30.0, 30.5], [31.0, 31.78], [49.0, 49.27], [54.0, 55.09], [72.0, 72.23], [76.0, 76.27], [82.0, 83.84], [85.0, 86.66], [87.0, 90.9], [93.0, 93.34], [97.0, 98.14], [112.0, 112.72], [145.0, 146.99], [147.0, 148.46], [150.0, 154.13], [157.0, 158.75], [160.0, 161.82], [165.0, 165.67], [166.0, 166.5], [168.0, 168.99], [176.0, 176.89], [187.0, 187.3], [190.0, 190.97], [192.0, 192.62], [199.0, 199.37], [201.0, 201.87], [212.0, 216.57]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.85, 0.0, 0.0, 0.0, 0.0, 0.0, 50.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.99], "audiomae_on_audioset": [null, [["music", 35.88], ["didgeridoo", 10.96], ["musical instrument", 6.66]], null, null, null, null, null, null, null, null, null, null, [["music", 57.22], ["boing", 6.01], ["didgeridoo", 4.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 48.18], ["moo", 38.63], ["livestock, farm animals, working animals", 8.96]]], "duration": [1.41, 2.17, 0.96, 0.33, 0.5, 0.78, 0.27, 1.09, 0.23, 0.27, 1.84, 1.66, 3.9, 0.34, 1.14, 0.72, 1.99, 1.46, 4.13, 1.75, 1.82, 0.67, 0.5, 0.99, 0.89, 0.3, 0.97, 0.62, 0.37, 0.87, 4.57]} \ No newline at end of file diff --git a/annotations_1/iM0hP-LZIvI_filtered.json b/annotations_1/iM0hP-LZIvI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66356d2c75e62207ea1b381baa8bb0c35f49412c --- /dev/null +++ b/annotations_1/iM0hP-LZIvI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 42.89], [44.0, 45.59], [46.0, 59.19], [60.0, 73.65]], "keep_status": [false, false, false, false], "silence_prob": [28.71, 0.0, 28.11, 28.2], "audiomae_on_audioset": [[["music", 91.64], ["electronic music", 1.41], ["didgeridoo", 1.26]], null, [["music", 38.21], ["throbbing", 22.85], ["hum", 16.04]], [["music", 79.37], ["electronic music", 3.28], ["hum", 1.9]]], "duration": [7.89, 1.59, 13.19, 13.65]} \ No newline at end of file diff --git a/annotations_1/iMPV0eFLxbQ_filtered.json b/annotations_1/iMPV0eFLxbQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f824e770b9d23741cfb65332b3ee211b82430b1a --- /dev/null +++ b/annotations_1/iMPV0eFLxbQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.39], [15.0, 15.7], [17.0, 16.98], [19.0, 19.06], [20.0, 25.05], [35.0, 35.02], [37.0, 40.44], [41.0, 43.77], [52.0, 54.04], [56.0, 56.27], [64.0, 65.11], [68.0, 69.65], [73.0, 73.65], [75.0, 76.49], [82.0, 82.53], [88.0, 89.06], [95.0, 95.34], [100.0, 102.05], [105.0, 115.28], [116.0, 117.22], [119.0, 119.57], [121.0, 121.64]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.75, 0.0, 35.97, 35.93, 47.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.13, 36.32, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 63.93], ["drum", 4.86], ["musical instrument", 3.92]], null, [["foghorn", 42.13], ["music", 24.1], ["trombone", 4.54]], [["music", 48.16], ["trombone", 11.35], ["foghorn", 10.66]], [["music", 60.28], ["foghorn", 4.47], ["musical instrument", 2.78]], null, null, null, null, null, null, null, null, null, [["music", 70.46], ["musical instrument", 6.76], ["wind instrument, woodwind instrument", 3.0]], null, null, null], "duration": [0.39, 0.7, -0.02, 0.06, 5.05, 0.02, 3.44, 2.77, 2.04, 0.27, 1.11, 1.65, 0.65, 1.49, 0.53, 1.06, 0.34, 2.05, 10.28, 1.22, 0.57, 0.64]} \ No newline at end of file diff --git a/annotations_1/iN0ZnG7yo6o_filtered.json b/annotations_1/iN0ZnG7yo6o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ba09679bceadffb683e5938ead19d1ba7f27a4f --- /dev/null +++ b/annotations_1/iN0ZnG7yo6o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [5.0, 12.18], [14.0, 14.35], [16.0, 18.94], [20.0, 20.26], [21.0, 22.01], [27.0, 30.74], [37.0, 36.86], [44.0, 44.05], [49.0, 50.11], [51.0, 50.77], [54.0, 56.46], [58.0, 57.84], [60.0, 63.91], [65.0, 65.67], [67.0, 67.68], [70.0, 70.73], [72.0, 73.72], [77.0, 77.48], [78.0, 79.56], [81.0, 85.23], [86.0, 86.73], [93.0, 106.51], [112.0, 127.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.76, 0.0, 98.44, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 94.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 0.0, 30.78, 30.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 72.47], ["singing", 2.82], ["rock and roll", 1.48]], [["music", 77.37], ["singing", 5.04], ["song", 2.06]]], "duration": [0.51, 7.18, 0.35, 2.94, 0.26, 1.01, 3.74, -0.14, 0.05, 1.11, -0.23, 2.46, -0.16, 3.91, 0.67, 0.68, 0.73, 1.72, 0.48, 1.56, 4.23, 0.73, 13.51, 15.25]} \ No newline at end of file diff --git a/annotations_1/iNQYIdE6DOg_filtered.json b/annotations_1/iNQYIdE6DOg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2382046f39e854c358d126e279013ca1e2d67ded --- /dev/null +++ b/annotations_1/iNQYIdE6DOg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 35.19], [44.0, 44.17], [46.0, 46.8], [49.0, 48.9], [51.0, 51.14], [52.0, 52.62], [54.0, 55.14], [56.0, 57.35], [58.0, 57.84], [58.0, 70.43], [73.0, 73.03], [74.0, 76.17], [78.0, 78.43], [81.0, 81.45], [84.0, 128.38], [131.0, 131.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.16, 0.0, 50.16, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 50.0], ["hum", 12.21], ["mains hum", 11.43]], null, null, null, null, null, null], "duration": [0.19, 0.17, 0.8, -0.1, 0.14, 0.62, 1.14, 1.35, -0.16, 12.43, 0.03, 2.17, 0.43, 0.45, 44.38, 0.11]} \ No newline at end of file diff --git a/annotations_1/iNg7uRYtqLA_filtered.json b/annotations_1/iNg7uRYtqLA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de42fb29d09f614922dc4d52906a72c0d9c60d23 --- /dev/null +++ b/annotations_1/iNg7uRYtqLA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 17.79], [18.0, 20.43], [25.0, 26.62], [27.0, 37.67], [38.0, 38.47], [42.0, 48.86], [52.0, 58.21], [60.0, 75.36], [78.0, 97.55], [98.0, 107.03], [109.0, 132.07], [142.0, 145.44], [153.0, 156.46], [164.0, 165.69], [178.0, 179.69], [193.0, 196.72], [197.0, 198.29]], "keep_status": [false, false, false, true, false, true, true, true, false, false, false, false, false, false, false, true, false], "silence_prob": [40.81, 46.43, 0.0, 38.63, 0.0, 32.36, 30.49, 31.31, 31.69, 35.87, 42.19, 33.04, 33.88, 0.0, 0.0, 32.25, 0.0], "audiomae_on_audioset": [[["music", 42.66], ["speech", 31.83], ["theremin", 4.13]], [["speech", 40.16], ["music", 34.45], ["hum", 4.63]], null, [["music", 23.12], ["fly, housefly", 12.33], ["speech", 7.66]], null, [["speech", 14.67], ["mosquito", 11.63], ["whack, thwack", 10.97]], [["music", 25.1], ["hum", 17.48], ["throbbing", 12.71]], [["music", 23.19], ["speech", 19.57], ["throbbing", 13.49]], [["speech", 61.13], ["music", 18.55], ["explosion", 1.68]], [["livestock, farm animals, working animals", 41.55], ["cattle, bovinae", 31.81], ["moo", 20.57]], [["music", 74.15], ["electronic music", 3.89], ["techno", 2.95]], [["music", 61.91], ["electronic music", 5.18], ["speech", 4.81]], [["music", 77.83], ["didgeridoo", 5.8], ["musical instrument", 3.94]], null, null, [["music", 26.32], ["cattle, bovinae", 17.57], ["moo", 10.78]], null], "duration": [5.79, 2.43, 1.62, 10.67, 0.47, 6.86, 6.21, 15.36, 19.55, 9.03, 23.07, 3.44, 3.46, 1.69, 1.69, 3.72, 1.29]} \ No newline at end of file diff --git a/annotations_1/iP7_QcV9Q9s_filtered.json b/annotations_1/iP7_QcV9Q9s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76c38f91cd2add1dfa934963f9f025f1eba02d2e --- /dev/null +++ b/annotations_1/iP7_QcV9Q9s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.43], [9.0, 10.32], [21.0, 23.62], [40.0, 40.96], [42.0, 43.11], [45.0, 45.69], [48.0, 48.51], [50.0, 50.31], [57.0, 58.04], [60.0, 61.16], [62.0, 62.33], [63.0, 63.68], [66.0, 69.97], [76.0, 80.05], [83.0, 84.84], [87.0, 87.25], [92.0, 93.51], [94.0, 96.36], [98.0, 103.47], [111.0, 112.63], [118.0, 135.89], [140.0, 139.82], [141.0, 145.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 49.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.07, 29.35, 0.0, 0.0, 0.0, 30.47, 28.78, 0.0, 28.68, 0.0, 29.06], "audiomae_on_audioset": [null, null, [["cattle, bovinae", 42.81], ["moo", 40.6], ["livestock, farm animals, working animals", 14.68]], null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 37.72], ["livestock, farm animals, working animals", 34.95], ["moo", 26.95]], [["music", 66.32], ["speech", 5.64], ["boing", 3.85]], null, null, null, [["music", 37.74], ["speech", 18.44], ["sidetone", 9.07]], [["cattle, bovinae", 38.4], ["livestock, farm animals, working animals", 31.4], ["moo", 27.33]], null, [["music", 86.77], ["cattle, bovinae", 2.37], ["speech", 1.48]], null, [["music", 58.63], ["speech", 8.87], ["throbbing", 7.62]]], "duration": [1.43, 1.32, 2.62, 0.96, 1.11, 0.69, 0.51, 0.31, 1.04, 1.16, 0.33, 0.68, 3.97, 4.05, 1.84, 0.25, 1.51, 2.36, 5.47, 1.63, 17.89, -0.18, 4.29]} \ No newline at end of file diff --git a/annotations_1/iPcAns5pKVw_filtered.json b/annotations_1/iPcAns5pKVw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b99a5b722d0c12f6fa69a112872804eee35eaf9 --- /dev/null +++ b/annotations_1/iPcAns5pKVw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.97], [20.0, 19.89], [24.0, 27.36], [28.0, 29.69], [31.0, 36.15], [41.0, 43.93], [46.0, 52.59], [56.0, 57.2], [62.0, 64.83], [66.0, 66.95], [72.0, 90.22], [92.0, 93.39], [94.0, 98.79], [105.0, 125.83]], "keep_status": [false, false, true, false, true, true, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 30.16, 0.0, 30.08, 29.95, 29.49, 0.0, 29.58, 0.0, 29.56, 0.0, 29.67, 33.46], "audiomae_on_audioset": [null, null, [["sidetone", 29.26], ["speech", 14.49], ["vehicle", 11.04]], null, [["speech", 52.06], ["vehicle", 7.75], ["fixed-wing aircraft, airplane", 6.15]], [["cattle, bovinae", 16.77], ["moo", 14.72], ["livestock, farm animals, working animals", 10.88]], [["cattle, bovinae", 43.7], ["livestock, farm animals, working animals", 30.29], ["moo", 20.44]], null, [["speech", 16.06], ["vehicle", 9.58], ["noise", 5.16]], null, [["cattle, bovinae", 45.92], ["livestock, farm animals, working animals", 30.05], ["moo", 17.95]], null, [["livestock, farm animals, working animals", 42.48], ["cattle, bovinae", 34.51], ["moo", 19.46]], [["grunt", 39.95], ["speech", 11.87], ["sound effect", 9.24]]], "duration": [1.97, -0.11, 3.36, 1.69, 5.15, 2.93, 6.59, 1.2, 2.83, 0.95, 18.22, 1.39, 4.79, 20.83]} \ No newline at end of file diff --git a/annotations_1/iPgcg3DVoUY_filtered.json b/annotations_1/iPgcg3DVoUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37e4dd9ad8748b4f7d5926a58474dd18d1c03a03 --- /dev/null +++ b/annotations_1/iPgcg3DVoUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.24], [14.0, 16.61], [20.0, 20.53], [23.0, 23.84], [26.0, 27.21], [32.0, 39.5], [41.0, 42.16], [45.0, 55.39], [63.0, 64.77], [66.0, 66.16], [67.0, 69.11], [73.0, 76.01], [77.0, 79.88], [82.0, 83.52], [87.0, 87.99], [89.0, 89.63], [91.0, 95.0], [98.0, 100.01], [103.0, 103.5], [105.0, 106.17], [108.0, 110.54], [114.0, 116.5], [120.0, 123.36]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, true, false, true], "silence_prob": [0.0, 30.36, 0.0, 0.0, 0.0, 29.54, 0.0, 28.32, 0.0, 0.0, 29.17, 30.41, 31.22, 0.0, 0.0, 0.0, 30.44, 32.84, 0.0, 0.0, 31.55, 31.06, 31.17], "audiomae_on_audioset": [null, [["music", 18.2], ["hum", 13.3], ["rumble", 11.14]], null, null, null, [["hum", 48.62], ["throbbing", 22.18], ["mains hum", 17.12]], null, [["hum", 38.76], ["mains hum", 37.22], ["music", 6.62]], null, null, [["music", 63.03], ["throbbing", 5.35], ["hum", 5.02]], [["hum", 51.17], ["mains hum", 20.49], ["throbbing", 12.41]], [["speech", 33.3], ["hum", 20.47], ["music", 11.71]], null, null, null, [["music", 31.42], ["hum", 26.02], ["mains hum", 9.59]], [["mains hum", 16.11], ["hum", 14.05], ["music", 11.7]], null, null, [["speech", 34.56], ["hum", 14.86], ["mains hum", 10.37]], [["hum", 47.47], ["mains hum", 33.78], ["throbbing", 6.57]], [["music", 24.81], ["speech", 21.28], ["hum", 13.02]]], "duration": [0.24, 2.61, 0.53, 0.84, 1.21, 7.5, 1.16, 10.39, 1.77, 0.16, 2.11, 3.01, 2.88, 1.52, 0.99, 0.63, 4.0, 2.01, 0.5, 1.17, 2.54, 2.5, 3.36]} \ No newline at end of file diff --git a/annotations_1/iQJh6I8kH_E_filtered.json b/annotations_1/iQJh6I8kH_E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/iQJh6I8kH_E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/iRIIcZuSiBo_filtered.json b/annotations_1/iRIIcZuSiBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8e465b4beedeedec3575a55d46ad754efa62264 --- /dev/null +++ b/annotations_1/iRIIcZuSiBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.99], [6.0, 6.64], [9.0, 14.61], [15.0, 14.99], [16.0, 43.88], [44.0, 79.86]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.35, 0.0, 33.63, 0.0], "audiomae_on_audioset": [null, null, [["livestock, farm animals, working animals", 34.21], ["moo", 23.61], ["cattle, bovinae", 22.54]], null, [["music", 64.45], ["speech", 8.87], ["electronic music", 4.11]], null], "duration": [0.99, 0.64, 5.61, -0.01, 27.88, 35.86]} \ No newline at end of file diff --git a/annotations_1/iRdSH-u1wWI_filtered.json b/annotations_1/iRdSH-u1wWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99ef1ed4d38b8c70d42e6de9240ac89e8d0a59ea --- /dev/null +++ b/annotations_1/iRdSH-u1wWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 43.34], [44.0, 44.64], [66.0, 66.24], [71.0, 81.45]], "keep_status": [true, false, false, true], "silence_prob": [30.21, 0.0, 0.0, 28.25], "audiomae_on_audioset": [[["didgeridoo", 27.86], ["music", 20.62], ["foghorn", 8.54]], null, null, [["music", 27.59], ["speech", 20.49], ["fly, housefly", 4.98]]], "duration": [19.34, 0.64, 0.24, 10.45]} \ No newline at end of file diff --git a/annotations_1/iSio5xjSYqs_filtered.json b/annotations_1/iSio5xjSYqs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5eea7217cdb76ced5bd0bb440b1a2f91bca3938e --- /dev/null +++ b/annotations_1/iSio5xjSYqs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 24.41], [26.0, 76.89], [79.0, 86.14], [91.0, 103.32], [107.0, 126.3]], "keep_status": [false, false, true, true, true], "silence_prob": [30.03, 0.0, 29.38, 29.56, 29.11], "audiomae_on_audioset": [[["hum", 44.72], ["throbbing", 24.36], ["mains hum", 14.49]], null, [["hum", 27.01], ["mains hum", 25.65], ["music", 10.89]], [["music", 31.96], ["hum", 15.15], ["mains hum", 12.85]], [["buzz", 14.22], ["electric shaver, electric razor", 13.21], ["music", 12.33]]], "duration": [19.41, 50.89, 7.14, 12.32, 19.3]} \ No newline at end of file diff --git a/annotations_1/iTQ4b0d3HxM_filtered.json b/annotations_1/iTQ4b0d3HxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..478192bfffb3ffbcd3fd969894d7355c90393a75 --- /dev/null +++ b/annotations_1/iTQ4b0d3HxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.27], [9.0, 9.58], [11.0, 12.07], [17.0, 17.09], [19.0, 18.79], [21.0, 21.42], [23.0, 23.38], [28.0, 28.65], [34.0, 34.87], [37.0, 37.57], [38.0, 39.82], [51.0, 51.63], [53.0, 53.7], [59.0, 60.13], [66.0, 69.4], [70.0, 71.39], [73.0, 73.75], [77.0, 78.16], [80.0, 80.7], [83.0, 83.49], [87.0, 92.91], [104.0, 110.19], [113.0, 117.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.1, 0.0, 0.0, 0.0, 0.0, 0.0, 40.68, 48.52, 54.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 23.29], ["mains hum", 15.95], ["throbbing", 6.95]], null, null, null, null, null, [["hum", 40.54], ["mains hum", 24.51], ["speech", 11.41]], [["hum", 62.34], ["mains hum", 19.0], ["throbbing", 9.37]], null], "duration": [1.27, 0.58, 1.07, 0.09, -0.21, 0.42, 0.38, 0.65, 0.87, 0.57, 1.82, 0.63, 0.7, 1.13, 3.4, 1.39, 0.75, 1.16, 0.7, 0.49, 5.91, 6.19, 4.66]} \ No newline at end of file diff --git a/annotations_1/iVsfWht3zmo_filtered.json b/annotations_1/iVsfWht3zmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b01bc4fa5d9cb3a904f498d9a18670852a5836c --- /dev/null +++ b/annotations_1/iVsfWht3zmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.31], [15.0, 17.47], [18.0, 22.22], [25.0, 47.95], [60.0, 60.35], [62.0, 62.18], [75.0, 106.35]], "keep_status": [true, false, true, true, false, false, false], "silence_prob": [39.37, 32.46, 32.33, 29.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 50.64], ["didgeridoo", 8.98], ["speech", 6.97]], [["music", 57.67], ["didgeridoo", 13.05], ["musical instrument", 2.58]], [["music", 54.45], ["didgeridoo", 8.86], ["noise", 5.4]], [["music", 25.74], ["hum", 23.14], ["mains hum", 18.55]], null, null, null], "duration": [7.31, 2.47, 4.22, 22.95, 0.35, 0.18, 31.35]} \ No newline at end of file diff --git a/annotations_1/iXo8qxLvcSs_filtered.json b/annotations_1/iXo8qxLvcSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13d8305ccec3e5dbb5e103e98cfdf22852a00b67 --- /dev/null +++ b/annotations_1/iXo8qxLvcSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 39.58], [41.0, 40.93], [42.0, 43.5], [44.0, 44.85], [49.0, 49.91], [51.0, 51.11], [53.0, 54.08], [54.0, 61.94], [63.0, 65.5], [67.0, 70.55], [71.0, 75.93], [77.0, 81.28], [82.0, 83.88], [85.0, 132.53], [137.0, 155.78], [158.0, 167.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.99, 89.9, 99.99, 97.64, 99.95, 0.0, 0.0, 30.76, 30.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.26], ["buzz", 15.14], ["throbbing", 7.55]], [["speech", 52.48], ["radio", 5.47], ["electric shaver, electric razor", 4.93]]], "duration": [0.58, -0.07, 1.5, 0.85, 0.91, 0.11, 1.08, 7.94, 2.5, 3.55, 4.93, 4.28, 1.88, 47.53, 18.78, 9.64]} \ No newline at end of file diff --git a/annotations_1/i_9mM4F_JVI_filtered.json b/annotations_1/i_9mM4F_JVI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5664806c3b05c20f97f8469293a69335d377ecec --- /dev/null +++ b/annotations_1/i_9mM4F_JVI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.93], [14.0, 14.1], [14.0, 14.93], [22.0, 30.59], [35.0, 35.92], [39.0, 39.66], [45.0, 55.53], [56.0, 58.26], [61.0, 81.45], [84.0, 85.5], [86.0, 87.45], [89.0, 90.21], [91.0, 93.43], [95.0, 104.13], [106.0, 106.68], [108.0, 109.31]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [45.24, 0.0, 0.0, 35.89, 0.0, 0.0, 31.82, 34.19, 30.47, 0.0, 0.0, 0.0, 43.64, 39.37, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 19.66], ["insect", 14.99], ["speech", 12.41]], null, null, [["speech", 88.04], ["radio", 2.1], ["animal", 1.38]], null, null, [["speech", 92.83], ["applause", 2.7], ["animal", 0.64]], [["speech", 26.81], ["clapping", 11.85], ["applause", 7.15]], [["speech", 56.03], ["vehicle", 7.94], ["boat, water vehicle", 6.66]], null, null, null, [["music", 35.34], ["speech", 28.22], ["sheep", 7.2]], [["speech", 20.81], ["music", 17.31], ["hum", 14.72]], null, null], "duration": [2.93, 0.1, 0.93, 8.59, 0.92, 0.66, 10.53, 2.26, 20.45, 1.5, 1.45, 1.21, 2.43, 9.13, 0.68, 1.31]} \ No newline at end of file diff --git a/annotations_1/i_Rupd9NU4E_filtered.json b/annotations_1/i_Rupd9NU4E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3602f2702df65413fd7d89a0cb90a101d43969c4 --- /dev/null +++ b/annotations_1/i_Rupd9NU4E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.75], [11.0, 11.65], [20.0, 20.41], [26.0, 26.1], [33.0, 33.37], [34.0, 34.38], [36.0, 37.52], [39.0, 40.15], [45.0, 46.35], [47.0, 47.38], [48.0, 49.11], [72.0, 72.05], [73.0, 73.31], [75.0, 75.52], [76.0, 76.92], [80.0, 80.2], [82.0, 82.63], [86.0, 88.26], [92.0, 92.79], [101.0, 103.94], [111.0, 116.7], [118.0, 118.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.46, 0.0, 37.35, 29.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 61.14], ["throbbing", 9.53], ["hum", 5.42]], [["music", 36.49], ["speech", 17.75], ["vehicle", 7.78]], null], "duration": [0.75, 0.65, 0.41, 0.1, 0.37, 0.38, 1.52, 1.15, 1.35, 0.38, 1.11, 0.05, 0.31, 0.52, 0.92, 0.2, 0.63, 2.26, 0.79, 2.94, 5.7, 0.42]} \ No newline at end of file diff --git a/annotations_1/i_SnR25Zoho_filtered.json b/annotations_1/i_SnR25Zoho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6974ccc113d40255881fc240010a9edfff77d48 --- /dev/null +++ b/annotations_1/i_SnR25Zoho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 3.28], [4.0, 8.02], [9.0, 12.5], [15.0, 16.9], [19.0, 21.2], [22.0, 23.7], [25.0, 25.56], [27.0, 27.26], [29.0, 30.42], [32.0, 32.29], [36.0, 36.51], [39.0, 40.42], [41.0, 45.17], [46.0, 48.34], [50.0, 50.82], [52.0, 53.82], [56.0, 56.46], [57.0, 58.56], [63.0, 63.68], [65.0, 65.79], [69.0, 69.11], [71.0, 72.98], [86.0, 88.25], [105.0, 105.53], [108.0, 109.14], [111.0, 110.98], [113.0, 113.21], [114.0, 115.43], [120.0, 120.6], [121.0, 121.78], [123.0, 122.89], [124.0, 124.44], [126.0, 128.87], [132.0, 132.02], [134.0, 134.4], [135.0, 135.92], [137.0, 137.07], [138.0, 138.23], [140.0, 139.87], [140.0, 141.22], [143.0, 143.19], [144.0, 145.27], [149.0, 149.13], [151.0, 151.53], [161.0, 162.89], [164.0, 164.17], [165.0, 169.16], [176.0, 176.18], [181.0, 180.67], [188.0, 188.28], [191.0, 191.02], [192.0, 193.62], [199.0, 200.69], [201.0, 201.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [80.11, 75.07, 99.98, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 90.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 23.65], ["throbbing", 20.9], ["music", 15.4]], null, null, null, null, null, null, null], "duration": [3.28, 4.02, 3.5, 1.9, 2.2, 1.7, 0.56, 0.26, 1.42, 0.29, 0.51, 1.42, 4.17, 2.34, 0.82, 1.82, 0.46, 1.56, 0.68, 0.79, 0.11, 1.98, 2.25, 0.53, 1.14, -0.02, 0.21, 1.43, 0.6, 0.78, -0.11, 0.44, 2.87, 0.02, 0.4, 0.92, 0.07, 0.23, -0.13, 1.22, 0.19, 1.27, 0.13, 0.53, 1.89, 0.17, 4.16, 0.18, -0.33, 0.28, 0.02, 1.62, 1.69, 0.95]} \ No newline at end of file diff --git a/annotations_1/i_rch_cy7dM_filtered.json b/annotations_1/i_rch_cy7dM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5533c8939b71ec263bba04a9272cf2a3d81ce275 --- /dev/null +++ b/annotations_1/i_rch_cy7dM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.75], [20.0, 21.47], [24.0, 25.1], [31.0, 31.48], [33.0, 39.56], [41.0, 43.92], [44.0, 44.79], [46.0, 53.25], [54.0, 58.82], [61.0, 81.8], [83.0, 84.64], [86.0, 95.4], [96.0, 96.89], [98.0, 98.31], [99.0, 113.58]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 89.72, 80.46, 0.0, 40.9, 38.5, 40.26, 0.0, 39.91, 0.0, 0.0, 34.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 73.03], ["brass instrument", 6.84], ["foghorn", 4.37]], [["music", 61.42], ["musical instrument", 6.73], ["brass instrument", 6.11]], [["music", 41.54], ["brass instrument", 19.92], ["trombone", 8.33]], null, [["music", 75.44], ["theremin", 6.47], ["didgeridoo", 4.28]], null, null, [["music", 56.1], ["brass instrument", 13.38], ["trombone", 7.08]]], "duration": [0.75, 1.47, 1.1, 0.48, 6.56, 2.92, 0.79, 7.25, 4.82, 20.8, 1.64, 9.4, 0.89, 0.31, 14.58]} \ No newline at end of file diff --git a/annotations_1/i_uA0oZ3xnI_filtered.json b/annotations_1/i_uA0oZ3xnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/i_uA0oZ3xnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/i_zdyGw0tEo_filtered.json b/annotations_1/i_zdyGw0tEo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab073231207cb84f2df1730e87a97948bf1ca62a --- /dev/null +++ b/annotations_1/i_zdyGw0tEo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 19.03], [21.0, 30.16], [31.0, 42.3], [45.0, 44.58], [46.0, 47.04], [50.0, 50.55], [52.0, 52.56], [53.0, 52.86], [56.0, 57.1], [64.0, 64.84], [71.0, 80.22], [84.0, 84.37], [85.0, 86.91], [90.0, 90.78], [96.0, 96.01], [99.0, 101.24], [105.0, 106.52], [110.0, 112.77], [114.0, 114.74], [116.0, 120.73], [125.0, 129.14], [130.0, 130.2], [130.0, 130.87], [132.0, 133.02], [135.0, 135.14], [137.0, 139.68], [143.0, 144.17], [145.0, 146.35], [147.0, 147.83], [150.0, 149.84], [151.0, 151.16], [152.0, 158.14], [159.0, 164.46], [167.0, 173.7], [177.0, 180.57], [182.0, 183.91], [193.0, 204.45]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [34.05, 32.91, 33.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.23, 0.0, 0.0, 0.0, 0.0, 41.76, 0.0, 32.75, 0.0, 32.56, 32.05, 0.0, 0.0, 0.0, 0.0, 55.96, 0.0, 0.0, 0.0, 0.0, 0.0, 31.95, 33.87, 31.55, 35.32, 0.0, 36.36], "audiomae_on_audioset": [[["music", 74.69], ["didgeridoo", 4.29], ["funny music", 1.32]], [["music", 56.01], ["speech", 4.36], ["whimper", 3.55]], [["music", 66.49], ["speech", 6.51], ["boing", 2.15]], null, null, null, null, null, null, null, [["music", 22.2], ["livestock, farm animals, working animals", 16.94], ["speech", 10.1]], null, null, null, null, [["music", 26.81], ["speech", 20.86], ["synthesizer", 10.85]], null, [["moo", 18.91], ["cattle, bovinae", 18.14], ["livestock, farm animals, working animals", 11.31]], null, [["music", 37.87], ["speech", 12.91], ["throbbing", 11.57]], [["music", 35.9], ["groan", 32.09], ["bleat", 3.5]], null, null, null, null, null, null, null, null, null, null, [["music", 45.9], ["didgeridoo", 7.98], ["theremin", 4.6]], [["livestock, farm animals, working animals", 36.54], ["cattle, bovinae", 23.93], ["music", 13.47]], [["music", 37.85], ["cattle, bovinae", 18.9], ["moo", 13.57]], [["speech", 49.23], ["music", 23.4], ["fart", 4.42]], null, [["theremin", 49.84], ["music", 35.32], ["musical instrument", 2.05]]], "duration": [16.03, 9.16, 11.3, -0.42, 1.04, 0.55, 0.56, -0.14, 1.1, 0.84, 9.22, 0.37, 1.91, 0.78, 0.01, 2.24, 1.52, 2.77, 0.74, 4.73, 4.14, 0.2, 0.87, 1.02, 0.14, 2.68, 1.17, 1.35, 0.83, -0.16, 0.16, 6.14, 5.46, 6.7, 3.57, 1.91, 11.45]} \ No newline at end of file diff --git a/annotations_1/iaCvBhskyk0_filtered.json b/annotations_1/iaCvBhskyk0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8baa792b216c914305e85789569453e0e1c72f89 --- /dev/null +++ b/annotations_1/iaCvBhskyk0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.88], [3.0, 3.3], [5.0, 5.59], [6.0, 6.91], [9.0, 9.14], [10.0, 11.28], [12.0, 26.38], [28.0, 47.66], [51.0, 140.66], [141.0, 142.13], [143.0, 143.92], [145.0, 148.12], [150.0, 161.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.53, 36.26, 0.0, 0.0, 0.0, 78.55, 64.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["throbbing", 31.06], ["heart sounds, heartbeat", 26.24], ["hum", 24.56]], null, null, null, null, null], "duration": [0.88, 0.3, 0.59, 0.91, 0.14, 1.28, 14.38, 19.66, 89.66, 1.13, 0.92, 3.12, 11.94]} \ No newline at end of file diff --git a/annotations_1/iaTG4JflfqM_filtered.json b/annotations_1/iaTG4JflfqM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c68023fcc0ba136605e85c1e7cc9848378d7ae0 --- /dev/null +++ b/annotations_1/iaTG4JflfqM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.21], [1.0, 1.32], [1.0, 1.92], [9.0, 9.93], [20.0, 20.33], [29.0, 30.69], [35.0, 37.91], [40.0, 41.28], [44.0, 44.58], [45.0, 46.31], [48.0, 48.84], [51.0, 52.56], [59.0, 58.67], [59.0, 62.21], [65.0, 65.16], [69.0, 70.65], [76.0, 77.84], [79.0, 79.03], [82.0, 82.32], [83.0, 83.2], [84.0, 85.6], [89.0, 89.5], [92.0, 93.04], [94.0, 96.38], [98.0, 99.4], [102.0, 102.91], [103.0, 102.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 21.02], ["speech", 6.07], ["crow", 4.76]], null, null, null], "duration": [0.21, 0.32, 0.92, 0.93, 0.33, 1.69, 2.91, 1.28, 0.58, 1.31, 0.84, 1.56, -0.33, 3.21, 0.16, 1.65, 1.84, 0.03, 0.32, 0.2, 1.6, 0.5, 1.04, 2.38, 1.4, 0.91, -0.05]} \ No newline at end of file diff --git a/annotations_1/ibAU8weiUOI_filtered.json b/annotations_1/ibAU8weiUOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d653c669b820ef402bfc446cde611b794169db58 --- /dev/null +++ b/annotations_1/ibAU8weiUOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.44], [19.0, 18.99], [25.0, 30.54], [33.0, 35.18], [39.0, 41.08], [42.0, 42.58], [49.0, 49.52], [56.0, 55.66], [60.0, 75.36], [78.0, 82.34], [86.0, 86.85], [88.0, 89.33], [93.0, 95.62], [100.0, 104.95], [108.0, 109.51], [111.0, 113.22], [116.0, 116.97], [118.0, 118.05], [124.0, 125.04], [126.0, 126.71], [128.0, 137.51], [140.0, 140.61], [141.0, 142.75], [144.0, 144.53], [147.0, 150.6], [151.0, 172.42]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 28.99, 29.31, 30.78, 0.0, 0.0, 0.0, 30.45, 35.82, 0.0, 0.0, 47.31, 30.75, 0.0, 32.19, 0.0, 0.0, 0.0, 0.0, 28.57, 0.0, 0.0, 0.0, 35.68, 28.91], "audiomae_on_audioset": [null, null, [["music", 40.04], ["mains hum", 14.57], ["hum", 9.01]], [["music", 70.3], ["cacophony", 9.85], ["throbbing", 2.48]], [["music", 22.42], ["throbbing", 14.79], ["hum", 13.56]], null, null, null, [["hum", 56.24], ["mains hum", 26.32], ["throbbing", 12.57]], [["hum", 32.45], ["throbbing", 19.94], ["music", 19.73]], null, null, [["music", 56.45], ["throbbing", 8.34], ["hum", 6.5]], [["hum", 44.15], ["throbbing", 22.97], ["music", 13.06]], null, [["throbbing", 24.32], ["hum", 18.02], ["music", 9.83]], null, null, null, null, [["speech", 49.55], ["music", 21.8], ["throbbing", 6.48]], null, null, null, [["music", 31.5], ["throbbing", 22.07], ["hum", 9.88]], [["hum", 44.22], ["throbbing", 24.41], ["mains hum", 15.63]]], "duration": [0.44, -0.01, 5.54, 2.18, 2.08, 0.58, 0.52, -0.34, 15.36, 4.34, 0.85, 1.33, 2.62, 4.95, 1.51, 2.22, 0.97, 0.05, 1.04, 0.71, 9.51, 0.61, 1.75, 0.53, 3.6, 21.42]} \ No newline at end of file diff --git a/annotations_1/ibcYEwzgai8_filtered.json b/annotations_1/ibcYEwzgai8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/ibcYEwzgai8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/iddBzE3syI4_filtered.json b/annotations_1/iddBzE3syI4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f3792ff9500a61d721e0aced4cae748c37076e7 --- /dev/null +++ b/annotations_1/iddBzE3syI4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.05], [18.0, 21.0], [23.0, 23.04], [23.0, 35.68], [38.0, 39.21], [41.0, 41.07], [41.0, 59.24], [60.0, 61.62], [65.0, 64.56]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.15, 0.0, 59.51, 0.0, 0.0, 63.42, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.05, 3.0, 0.04, 12.68, 1.21, 0.07, 18.24, 1.62, -0.44]} \ No newline at end of file diff --git a/annotations_1/idvqLiOeLgc_filtered.json b/annotations_1/idvqLiOeLgc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..682f369a6eea986dcb1039a78d0dd4b01e288fdc --- /dev/null +++ b/annotations_1/idvqLiOeLgc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.91], [8.0, 7.91], [9.0, 40.49], [49.0, 74.06], [92.0, 108.87], [111.0, 122.89], [128.0, 141.08], [144.0, 147.53], [151.0, 151.63], [152.0, 176.22], [179.0, 179.64]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.21, 29.91, 31.1, 30.37, 32.52, 0.0, 29.88, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 69.33], ["throbbing", 7.7], ["hum", 2.65]], [["music", 61.71], ["burst, pop", 4.65], ["bang", 3.09]], [["music", 68.67], ["speech", 9.08], ["didgeridoo", 5.02]], [["music", 48.88], ["groan", 10.76], ["buzz", 5.35]], [["music", 34.46], ["trombone", 33.17], ["brass instrument", 8.23]], null, [["music", 81.24], ["buzz", 2.43], ["cacophony", 1.67]], null], "duration": [-0.09, -0.09, 31.49, 25.06, 16.87, 11.89, 13.08, 3.53, 0.63, 24.22, 0.64]} \ No newline at end of file diff --git a/annotations_1/ieVPPV5S0Ps_filtered.json b/annotations_1/ieVPPV5S0Ps_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbe48fe6f5ba7b606af0fdebd83b03ee5243d27f --- /dev/null +++ b/annotations_1/ieVPPV5S0Ps_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 35.31], [38.0, 41.39], [42.0, 42.45], [42.0, 42.63], [43.0, 84.45], [88.0, 123.82], [126.0, 132.49]], "keep_status": [false, true, false, false, false, false, true], "silence_prob": [0.0, 31.2, 0.0, 0.0, 0.0, 0.0, 31.0], "audiomae_on_audioset": [null, [["wild animals", 25.37], ["roaring cats (lions, tigers)", 19.26], ["animal", 11.88]], null, null, null, null, [["music", 40.9], ["hum", 18.72], ["mains hum", 10.29]]], "duration": [35.31, 3.39, 0.45, 0.63, 41.45, 35.82, 6.49]} \ No newline at end of file diff --git a/annotations_1/iga0_T5B8dU_filtered.json b/annotations_1/iga0_T5B8dU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58f9ce3b0d1724ccbe48eb296c535f4c2dc8d2bb --- /dev/null +++ b/annotations_1/iga0_T5B8dU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.69], [14.0, 15.4], [24.0, 26.32], [28.0, 29.25], [31.0, 35.01], [38.0, 46.13], [53.0, 55.86], [57.0, 61.2], [63.0, 74.7], [75.0, 74.76], [76.0, 84.05], [87.0, 96.5], [97.0, 97.23], [100.0, 108.41], [109.0, 109.19]], "keep_status": [false, false, false, false, true, false, false, true, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 36.17, 0.0, 40.26, 36.32, 35.92, 30.74, 31.86, 0.0, 30.81, 31.96, 0.0, 33.55, 0.0], "audiomae_on_audioset": [null, null, [["didgeridoo", 48.42], ["music", 19.02], ["theremin", 9.64]], null, [["music", 52.3], ["hum", 7.83], ["throbbing", 7.82]], [["mains hum", 50.2], ["hum", 33.81], ["music", 6.02]], [["music", 63.39], ["bleat", 11.12], ["sheep", 6.29]], [["bleat", 29.61], ["sheep", 18.52], ["livestock, farm animals, working animals", 16.68]], [["animal", 30.84], ["horse", 18.52], ["neigh, whinny", 17.52]], null, [["fart", 29.45], ["animal", 16.67], ["livestock, farm animals, working animals", 14.8]], [["animal", 32.76], ["roaring cats (lions, tigers)", 20.25], ["speech", 17.94]], null, [["fart", 19.89], ["speech", 11.96], ["animal", 11.38]], null], "duration": [0.69, 1.4, 2.32, 1.25, 4.01, 8.13, 2.86, 4.2, 11.7, -0.24, 8.05, 9.5, 0.23, 8.41, 0.19]} \ No newline at end of file diff --git a/annotations_1/ih9NffWqWgM_filtered.json b/annotations_1/ih9NffWqWgM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f98ad11cfd95f455e25a0f0998d44814f1155cd --- /dev/null +++ b/annotations_1/ih9NffWqWgM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.75], [11.0, 14.08], [16.0, 17.98], [19.0, 26.54], [27.0, 31.78], [34.0, 37.22], [38.0, 44.79], [48.0, 67.09], [71.0, 133.47], [135.0, 136.19], [137.0, 138.82], [140.0, 141.03], [142.0, 143.02], [145.0, 145.61]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [72.31, 34.83, 0.0, 35.21, 30.73, 34.84, 32.39, 28.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 44.11], ["mains hum", 14.28], ["music", 14.12]], null, [["music", 48.79], ["hum", 20.53], ["mains hum", 7.23]], [["hum", 34.78], ["music", 22.96], ["mains hum", 16.45]], [["hum", 43.1], ["throbbing", 28.36], ["mains hum", 14.16]], [["hum", 54.05], ["throbbing", 25.75], ["mains hum", 17.47]], [["music", 37.19], ["cacophony", 23.9], ["noise", 3.97]], null, null, null, null, null, null], "duration": [2.75, 3.08, 1.98, 7.54, 4.78, 3.22, 6.79, 19.09, 62.47, 1.19, 1.82, 1.03, 1.02, 0.61]} \ No newline at end of file diff --git a/annotations_1/ihKHvNOTcwk_filtered.json b/annotations_1/ihKHvNOTcwk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..565983128772759741c57c73b829693fdc057b76 --- /dev/null +++ b/annotations_1/ihKHvNOTcwk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.94], [16.0, 16.9], [20.0, 22.84], [24.0, 38.5], [40.0, 41.03], [43.0, 65.67], [66.0, 79.83], [80.0, 81.94], [82.0, 86.07], [87.0, 89.29], [95.0, 95.18], [97.0, 97.34], [100.0, 100.38], [102.0, 104.4], [105.0, 105.54], [106.0, 106.66], [115.0, 125.64], [128.0, 137.89], [151.0, 152.04], [153.0, 166.6], [168.0, 168.52]], "keep_status": [true, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [47.66, 0.0, 47.43, 35.8, 0.0, 30.99, 32.75, 0.0, 41.22, 78.89, 0.0, 0.0, 0.0, 91.98, 0.0, 0.0, 33.43, 33.08, 0.0, 34.6, 0.0], "audiomae_on_audioset": [[["music", 61.62], ["soundtrack music", 4.05], ["synthesizer", 3.91]], null, [["fly, housefly", 64.98], ["insect", 16.88], ["mosquito", 14.11]], [["insect", 25.19], ["fly, housefly", 23.34], ["mosquito", 23.11]], null, [["speech", 35.74], ["music", 21.61], ["synthesizer", 5.04]], [["music", 30.95], ["groan", 15.24], ["sound effect", 6.59]], null, [["music", 27.87], ["speech", 11.11], ["animal", 7.12]], null, null, null, null, null, null, null, [["music", 60.76], ["boing", 13.18], ["speech", 4.1]], [["music", 55.28], ["fly, housefly", 11.33], ["insect", 4.67]], null, [["fly, housefly", 25.51], ["music", 22.82], ["fart", 6.77]], null], "duration": [2.94, 0.9, 2.84, 14.5, 1.03, 22.67, 13.83, 1.94, 4.07, 2.29, 0.18, 0.34, 0.38, 2.4, 0.54, 0.66, 10.64, 9.89, 1.04, 13.6, 0.52]} \ No newline at end of file diff --git a/annotations_1/ij0JLKDJOrc_filtered.json b/annotations_1/ij0JLKDJOrc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab8be65755a8a056692e4f4191053132b8741084 --- /dev/null +++ b/annotations_1/ij0JLKDJOrc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [4.0, 4.62], [5.0, 5.71], [9.0, 9.59], [10.0, 10.79], [20.0, 22.94], [30.0, 30.81], [34.0, 34.25], [35.0, 35.48], [38.0, 53.22], [60.0, 61.79], [92.0, 93.51], [95.0, 95.76]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 42.67, 0.0, 0.0, 0.0, 30.14, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 26.53], ["frog", 13.5], ["inside, small room", 5.07]], null, null, null, [["music", 51.76], ["speech", 18.73], ["tubular bells", 2.95]], null, null, null], "duration": [0.44, 0.62, 0.71, 0.59, 0.79, 2.94, 0.81, 0.25, 0.48, 15.22, 1.79, 1.51, 0.76]} \ No newline at end of file diff --git a/annotations_1/ijBU9q7fb3U_filtered.json b/annotations_1/ijBU9q7fb3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10538e3cd8f1af6637d1ab80fb6e2d3121847895 --- /dev/null +++ b/annotations_1/ijBU9q7fb3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.04], [6.0, 8.01], [9.0, 9.95], [10.0, 10.45], [11.0, 13.54], [16.0, 16.48], [21.0, 21.39], [22.0, 22.76], [25.0, 25.51], [27.0, 27.06], [31.0, 31.16], [34.0, 34.79], [36.0, 36.86], [39.0, 39.41], [40.0, 40.69], [42.0, 43.6], [45.0, 45.59], [52.0, 55.11], [55.0, 56.84], [57.0, 57.92], [59.0, 59.75], [61.0, 61.53], [65.0, 65.37], [67.0, 67.53], [69.0, 71.41], [75.0, 75.03], [79.0, 80.15], [85.0, 85.87], [93.0, 96.04], [100.0, 119.5], [122.0, 130.32], [137.0, 137.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 100.0, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.76, 0.0, 0.0, 0.0, 47.27, 30.51, 29.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["boing", 20.91], ["moo", 13.95], ["cattle, bovinae", 13.27]], null, null, null, null, null, null, [["boing", 46.88], ["cattle, bovinae", 10.34], ["moo", 8.23]], null, null, null, [["speech", 19.34], ["explosion", 16.43], ["burst, pop", 12.08]], [["speech", 60.92], ["explosion", 6.62], ["music", 1.94]], [["vehicle", 52.33], ["car", 19.4], ["skidding", 9.43]], null], "duration": [1.04, 2.01, 0.95, 0.45, 2.54, 0.48, 0.39, 0.76, 0.51, 0.06, 0.16, 0.79, 0.86, 0.41, 0.69, 1.6, 0.59, 3.11, 1.84, 0.92, 0.75, 0.53, 0.37, 0.53, 2.41, 0.03, 1.15, 0.87, 3.04, 19.5, 8.32, 0.25]} \ No newline at end of file diff --git a/annotations_1/ijaNlufpcMs_filtered.json b/annotations_1/ijaNlufpcMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..046ab8ee905e0183c1afa0b6f78adcfab16ebc9d --- /dev/null +++ b/annotations_1/ijaNlufpcMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.39], [14.0, 47.06], [54.0, 105.38], [114.0, 126.89], [140.0, 140.51]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.71, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 82.74], ["cacophony", 5.61], ["musical instrument", 1.06]], null], "duration": [1.39, 33.06, 51.38, 12.89, 0.51]} \ No newline at end of file diff --git a/annotations_1/ik-n-L9UNTY_filtered.json b/annotations_1/ik-n-L9UNTY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd3517c4842e8a982b37c2922f58bf0d112ce4ad --- /dev/null +++ b/annotations_1/ik-n-L9UNTY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.77], [30.0, 30.37], [31.0, 118.86], [120.0, 119.89], [120.0, 120.53], [121.0, 136.41]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.73], "audiomae_on_audioset": [null, null, null, null, null, [["music", 79.57], ["musical instrument", 3.61], ["didgeridoo", 2.56]]], "duration": [0.77, 0.37, 87.86, -0.11, 0.53, 15.41]} \ No newline at end of file diff --git a/annotations_1/ikcKKvKkf4Y_filtered.json b/annotations_1/ikcKKvKkf4Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f87ca9e826e28891676e168b3857b125af398d4 --- /dev/null +++ b/annotations_1/ikcKKvKkf4Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.93], [12.0, 11.77], [17.0, 18.23], [19.0, 21.29], [22.0, 22.59], [24.0, 25.19], [26.0, 26.55], [37.0, 39.07], [40.0, 42.26], [44.0, 47.76], [52.0, 60.42], [61.0, 62.83], [63.0, 63.73], [65.0, 65.03], [67.0, 67.31], [70.0, 72.67], [73.0, 73.33], [81.0, 82.27], [83.0, 85.02], [91.0, 90.96], [105.0, 105.21], [107.0, 108.43], [119.0, 119.28], [121.0, 125.27], [140.0, 140.56], [151.0, 151.43], [153.0, 152.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 100.0, 53.34, 58.13, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0, 0.0, 55.46, 0.0, 0.0, 0.0, 0.0, 29.15, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.63], ["cattle, bovinae", 7.37], ["livestock, farm animals, working animals", 7.35]], null, null, null], "duration": [-0.07, -0.23, 1.23, 2.29, 0.59, 1.19, 0.55, 2.07, 2.26, 3.76, 8.42, 1.83, 0.73, 0.03, 0.31, 2.67, 0.33, 1.27, 2.02, -0.04, 0.21, 1.43, 0.28, 4.27, 0.56, 0.43, -0.02]} \ No newline at end of file diff --git a/annotations_1/ikqLKMZ86d8_filtered.json b/annotations_1/ikqLKMZ86d8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6227bb7c4d57674862f81e567ad386f8e063a173 --- /dev/null +++ b/annotations_1/ikqLKMZ86d8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.05], [14.0, 22.13], [22.0, 23.13], [26.0, 26.23], [27.0, 27.41], [38.0, 39.43], [39.0, 39.46], [39.0, 41.99], [45.0, 48.42], [51.0, 51.92], [53.0, 53.16], [54.0, 55.54], [57.0, 60.34], [63.0, 66.5], [67.0, 69.36], [71.0, 74.21], [75.0, 74.85], [75.0, 83.22], [87.0, 87.35], [90.0, 90.17], [91.0, 94.85], [101.0, 106.08], [110.0, 115.03], [119.0, 118.79], [119.0, 119.97], [120.0, 120.95], [121.0, 121.69], [128.0, 128.24]], "keep_status": [true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [40.12, 33.26, 0.0, 0.0, 0.0, 0.0, 0.0, 38.9, 48.19, 0.0, 0.0, 0.0, 98.51, 50.11, 89.72, 47.27, 0.0, 33.48, 0.0, 0.0, 34.27, 33.37, 32.11, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 17.75], ["mosquito", 12.7], ["speech", 12.46]], [["music", 28.86], ["speech", 12.66], ["animal", 8.67]], null, null, null, null, null, [["music", 50.55], ["speech", 22.48], ["boing", 16.66]], [["music", 47.77], ["frog", 7.83], ["animal", 6.13]], null, null, null, null, null, null, [["stomach rumble", 13.96], ["hum", 9.79], ["moo", 6.08]], null, [["speech", 83.53], ["screaming", 2.06], ["crying, sobbing", 1.19]], null, null, [["speech", 60.44], ["boing", 5.41], ["sidetone", 3.9]], [["animal", 32.49], ["domestic animals, pets", 12.24], ["dog", 10.53]], [["speech", 22.34], ["livestock, farm animals, working animals", 13.89], ["sidetone", 11.02]], null, null, null, null, null], "duration": [2.05, 8.13, 1.13, 0.23, 0.41, 1.43, 0.46, 2.99, 3.42, 0.92, 0.16, 1.54, 3.34, 3.5, 2.36, 3.21, -0.15, 8.22, 0.35, 0.17, 3.85, 5.08, 5.03, -0.21, 0.97, 0.95, 0.69, 0.24]} \ No newline at end of file diff --git a/annotations_1/iktC8imMBnw_filtered.json b/annotations_1/iktC8imMBnw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e69a55ad3d3be917da02e32253e1a4b111ebd19 --- /dev/null +++ b/annotations_1/iktC8imMBnw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.78], [3.0, 31.28], [33.0, 37.32], [39.0, 39.36], [39.0, 39.58], [41.0, 42.63], [51.0, 54.5], [59.0, 61.86], [63.0, 63.26], [68.0, 68.64], [70.0, 74.88], [79.0, 79.89], [84.0, 85.85], [89.0, 99.4], [100.0, 112.53], [115.0, 117.05], [120.0, 120.7]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 29.95, 36.15, 0.0, 0.0, 0.0, 31.39, 39.88, 0.0, 0.0, 43.79, 0.0, 0.0, 30.96, 28.89, 35.72, 0.0], "audiomae_on_audioset": [null, [["music", 19.54], ["speech", 18.89], ["throbbing", 8.41]], [["frog", 16.62], ["croak", 14.75], ["music", 14.13]], null, null, null, [["music", 37.93], ["speech", 30.35], ["grunt", 7.04]], [["music", 19.58], ["frog", 17.23], ["croak", 16.02]], null, null, [["music", 75.92], ["didgeridoo", 8.3], ["musical instrument", 4.47]], null, null, [["music", 45.5], ["hum", 14.52], ["throbbing", 6.3]], [["music", 36.17], ["throbbing", 9.42], ["hum", 7.78]], [["hum", 45.52], ["throbbing", 40.96], ["music", 4.82]], null], "duration": [0.78, 28.28, 4.32, 0.36, 0.58, 1.63, 3.5, 2.86, 0.26, 0.64, 4.88, 0.89, 1.85, 10.4, 12.53, 2.05, 0.7]} \ No newline at end of file diff --git a/annotations_1/ilCjx9gigWI_filtered.json b/annotations_1/ilCjx9gigWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b7d2f28939730f239b471708aeef219a2d4c9f4 --- /dev/null +++ b/annotations_1/ilCjx9gigWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 25.32], [28.0, 27.75], [29.0, 32.86], [35.0, 38.18], [39.0, 40.83], [42.0, 44.32], [46.0, 47.43], [51.0, 53.59], [59.0, 58.83], [62.0, 62.09], [63.0, 63.54], [66.0, 67.53], [69.0, 69.04], [70.0, 70.7], [72.0, 72.55], [74.0, 74.28], [76.0, 76.32], [84.0, 85.09], [94.0, 96.33]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.57, 0.0, 97.11, 99.92, 0.0, 54.3, 0.0, 66.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.1], "audiomae_on_audioset": [[["music", 38.48], ["theremin", 24.81], ["didgeridoo", 4.85]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.32, -0.25, 3.86, 3.18, 1.83, 2.32, 1.43, 2.59, -0.17, 0.09, 0.54, 1.53, 0.04, 0.7, 0.55, 0.28, 0.32, 1.09, 2.33]} \ No newline at end of file diff --git a/annotations_1/ilRq_PR6oi4_filtered.json b/annotations_1/ilRq_PR6oi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17ee91601ccaadf047fff8e27cb1ee3c3957d6c8 --- /dev/null +++ b/annotations_1/ilRq_PR6oi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 71.52], [72.0, 75.34], [76.0, 78.63], [81.0, 83.51], [87.0, 89.45], [91.0, 128.78]], "keep_status": [true, true, true, true, true, false], "silence_prob": [30.42, 35.19, 37.67, 42.74, 42.08, 0.0], "audiomae_on_audioset": [[["music", 40.87], ["synthesizer", 16.83], ["musical instrument", 12.14]], [["music", 19.38], ["mains hum", 16.45], ["hum", 15.17]], [["music", 37.59], ["synthesizer", 16.13], ["hum", 12.05]], [["music", 41.9], ["hum", 8.39], ["mains hum", 7.02]], [["fly, housefly", 15.88], ["music", 14.19], ["insect", 11.89]], null], "duration": [26.52, 3.34, 2.63, 2.51, 2.45, 37.78]} \ No newline at end of file diff --git a/annotations_1/ilXtCX0-CkE_filtered.json b/annotations_1/ilXtCX0-CkE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58235276692975de656e0a89d03b5c8ffda9dfe9 --- /dev/null +++ b/annotations_1/ilXtCX0-CkE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.34], [11.0, 11.65], [13.0, 13.14], [14.0, 14.3], [16.0, 16.48], [17.0, 18.12], [20.0, 24.53], [26.0, 26.81], [32.0, 41.07], [44.0, 45.28], [46.0, 46.62], [49.0, 51.6], [52.0, 58.14], [60.0, 63.68], [64.0, 70.02], [71.0, 72.37], [77.0, 77.65], [78.0, 79.96], [81.0, 81.21], [82.0, 84.84], [90.0, 90.34], [91.0, 91.61], [92.0, 109.83], [111.0, 111.52], [112.0, 114.54], [125.0, 128.85], [129.0, 131.14], [132.0, 134.01], [135.0, 138.54], [139.0, 139.38]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.16, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44, 0.0, 99.99, 0.0, 0.0, 92.97, 82.97, 100.0, 98.44, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 84.98, 0.0, 95.78, 67.89, 63.64, 49.09, 69.2, 0.0], "audiomae_on_audioset": [[["thunk", 47.07], ["hum", 6.89], ["breaking", 6.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.46], ["music", 19.83], ["whale vocalization", 11.18]], null, null], "duration": [7.34, 0.65, 0.14, 0.3, 0.48, 1.12, 4.53, 0.81, 9.07, 1.28, 0.62, 2.6, 6.14, 3.68, 6.02, 1.37, 0.65, 1.96, 0.21, 2.84, 0.34, 0.61, 17.83, 0.52, 2.54, 3.85, 2.14, 2.01, 3.54, 0.38]} \ No newline at end of file diff --git a/annotations_1/io-hA6pxffU_filtered.json b/annotations_1/io-hA6pxffU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35a4b238719209beaf6720af3808d4a5c53581d7 --- /dev/null +++ b/annotations_1/io-hA6pxffU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.47], [3.0, 2.54], [11.0, 12.02], [14.0, 14.62], [17.0, 18.12], [27.0, 27.4], [28.0, 28.98], [30.0, 30.92], [33.0, 33.42], [37.0, 37.4], [38.0, 38.82], [41.0, 43.14], [46.0, 48.05], [49.0, 49.27], [56.0, 55.76], [56.0, 57.35], [59.0, 59.46], [61.0, 61.38], [65.0, 66.65], [84.0, 84.1], [90.0, 91.64], [93.0, 93.46], [101.0, 102.54], [107.0, 109.78], [111.0, 110.86], [114.0, 113.9], [121.0, 120.9], [122.0, 121.81], [122.0, 123.57], [134.0, 134.01], [134.0, 139.28], [141.0, 141.99], [147.0, 146.97], [148.0, 148.2], [151.0, 151.17], [152.0, 152.46], [154.0, 155.12], [159.0, 159.36], [164.0, 168.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.85, 58.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.87], "audiomae_on_audioset": [[["music", 49.45], ["boing", 20.46], ["speech", 10.39]], null, null, null, null, null, null, null, null, null, null, [["music", 27.75], ["speech", 17.69], ["synthesizer", 5.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 39.06], ["insect", 22.68], ["mosquito", 12.52]], null, null, null, null, null, null, null, [["cattle, bovinae", 28.39], ["moo", 25.62], ["speech", 19.27]]], "duration": [2.47, -0.46, 1.02, 0.62, 1.12, 0.4, 0.98, 0.92, 0.42, 0.4, 0.82, 2.14, 2.05, 0.27, -0.24, 1.35, 0.46, 0.38, 1.65, 0.1, 1.64, 0.46, 1.54, 2.78, -0.14, -0.1, -0.1, -0.19, 1.57, 0.01, 5.28, 0.99, -0.03, 0.2, 0.17, 0.46, 1.12, 0.36, 4.74]} \ No newline at end of file diff --git a/annotations_1/ioE_djgs810_filtered.json b/annotations_1/ioE_djgs810_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f68ddd956f01a9b25db6b3beb2877cf2003d105b --- /dev/null +++ b/annotations_1/ioE_djgs810_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 26.47], [28.0, 156.12]], "keep_status": [false, false], "silence_prob": [30.22, 0.0], "audiomae_on_audioset": [[["music", 62.44], ["throbbing", 7.92], ["whack, thwack", 4.59]], null], "duration": [16.47, 128.12]} \ No newline at end of file diff --git a/annotations_1/ioQQ3gbY0vY_filtered.json b/annotations_1/ioQQ3gbY0vY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/ioQQ3gbY0vY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/ioUedV29CQE_filtered.json b/annotations_1/ioUedV29CQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2369a0cddb0e854a937d3fa46d9e62c5ffe8aa7b --- /dev/null +++ b/annotations_1/ioUedV29CQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.47], [8.0, 14.52], [16.0, 79.54], [80.0, 88.37], [89.0, 90.36], [91.0, 102.39]], "keep_status": [false, false, false, true, false, true], "silence_prob": [0.0, 56.1, 0.0, 34.2, 0.0, 37.63], "audiomae_on_audioset": [null, null, null, [["hum", 26.31], ["music", 15.28], ["throbbing", 14.86]], null, [["music", 50.86], ["sonar", 9.64], ["hum", 6.95]]], "duration": [1.47, 6.52, 63.54, 8.37, 1.36, 11.39]} \ No newline at end of file diff --git a/annotations_1/ipb0Bfg_FTs_filtered.json b/annotations_1/ipb0Bfg_FTs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1e9e042d4666fa468cad848c080706f5ca3153e --- /dev/null +++ b/annotations_1/ipb0Bfg_FTs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.08], [5.0, 10.23], [12.0, 12.9], [14.0, 16.01], [18.0, 20.51], [23.0, 40.22], [43.0, 43.8], [44.0, 56.34], [57.0, 58.04], [60.0, 71.96], [75.0, 75.36], [76.0, 76.89], [79.0, 79.91], [82.0, 84.03], [86.0, 125.2]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [66.63, 61.27, 0.0, 36.99, 68.67, 69.74, 0.0, 34.74, 0.0, 45.85, 0.0, 0.0, 0.0, 54.97, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 15.24], ["noise", 8.07], ["whale vocalization", 6.42]], null, null, null, [["speech", 38.82], ["music", 21.62], ["thump, thud", 5.16]], null, [["music", 61.56], ["speech", 12.63], ["didgeridoo", 12.43]], null, null, null, null, null], "duration": [2.08, 5.23, 0.9, 2.01, 2.51, 17.22, 0.8, 12.34, 1.04, 11.96, 0.36, 0.89, 0.91, 2.03, 39.2]} \ No newline at end of file diff --git a/annotations_1/iqZmwwUvgVU_filtered.json b/annotations_1/iqZmwwUvgVU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae92d0c63c40719998526ce597cdb51498713472 --- /dev/null +++ b/annotations_1/iqZmwwUvgVU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.02], [16.0, 17.2], [60.0, 60.57], [68.0, 74.09], [75.0, 75.46], [77.0, 82.44], [83.0, 91.39], [93.0, 101.63], [107.0, 109.65], [115.0, 120.01], [126.0, 127.13], [130.0, 131.08], [140.0, 142.48]], "keep_status": [true, false, false, false, false, true, true, true, true, false, false, false, true], "silence_prob": [28.76, 0.0, 0.0, 28.62, 0.0, 28.66, 29.29, 29.2, 29.08, 29.42, 0.0, 0.0, 28.78], "audiomae_on_audioset": [[["whale vocalization", 25.54], ["speech", 17.68], ["music", 7.46]], null, null, [["fly, housefly", 35.32], ["mosquito", 30.96], ["insect", 13.8]], null, [["vehicle", 16.27], ["speech", 15.77], ["outside, rural or natural", 4.03]], [["speech", 50.53], ["music", 6.07], ["groan", 5.82]], [["speech", 38.28], ["music", 22.12], ["explosion", 4.92]], [["groan", 54.19], ["speech", 4.42], ["music", 4.33]], [["music", 57.7], ["theremin", 12.51], ["mosquito", 5.57]], null, null, [["animal", 19.99], ["roaring cats (lions, tigers)", 11.84], ["wild animals", 10.4]]], "duration": [2.02, 1.2, 0.57, 6.09, 0.46, 5.44, 8.39, 8.63, 2.65, 5.01, 1.13, 1.08, 2.48]} \ No newline at end of file diff --git a/annotations_1/irnju0G-lBg_filtered.json b/annotations_1/irnju0G-lBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..590191f59a028aee525c9d1415a0587f50d2a2ec --- /dev/null +++ b/annotations_1/irnju0G-lBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.45], [15.0, 61.32], [62.0, 70.23], [71.0, 71.91], [73.0, 131.68], [136.0, 136.8], [139.0, 144.51], [146.0, 153.4], [154.0, 157.1], [161.0, 170.95], [171.0, 206.88], [208.0, 208.62], [214.0, 217.11], [219.0, 221.31], [222.0, 223.38], [224.0, 224.65], [226.0, 226.15], [227.0, 228.5], [232.0, 234.66], [237.0, 238.28], [243.0, 243.77]], "keep_status": [true, false, true, false, false, false, true, true, true, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [30.8, 0.0, 30.92, 0.0, 0.0, 0.0, 31.24, 33.76, 42.67, 85.72, 0.0, 0.0, 88.1, 46.09, 0.0, 0.0, 0.0, 0.0, 28.96, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 29.89], ["music", 16.57], ["sidetone", 5.28]], null, [["music", 41.79], ["speech", 10.65], ["foghorn", 6.82]], null, null, null, [["music", 25.97], ["theremin", 22.9], ["synthesizer", 13.3]], [["music", 23.02], ["whale vocalization", 17.33], ["synthesizer", 8.59]], [["music", 49.97], ["pulse", 7.52], ["didgeridoo", 5.14]], null, null, null, null, [["speech", 32.76], ["whale vocalization", 16.94], ["sine wave", 8.19]], null, null, null, null, [["moo", 12.76], ["cattle, bovinae", 9.61], ["livestock, farm animals, working animals", 7.25]], null, null], "duration": [2.45, 46.32, 8.23, 0.91, 58.68, 0.8, 5.51, 7.4, 3.1, 9.95, 35.88, 0.62, 3.11, 2.31, 1.38, 0.65, 0.15, 1.5, 2.66, 1.28, 0.77]} \ No newline at end of file diff --git a/annotations_1/iropsnsCEjA_filtered.json b/annotations_1/iropsnsCEjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..767df24d427f7c60279b62d38b815658bb59d058 --- /dev/null +++ b/annotations_1/iropsnsCEjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.7], [20.0, 51.29], [52.0, 51.81], [60.0, 91.69], [122.0, 122.2], [124.0, 123.77], [125.0, 125.09], [131.0, 131.79], [133.0, 172.64], [176.0, 176.74], [178.0, 178.73], [192.0, 192.5], [202.0, 202.32], [205.0, 208.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [61.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.86], ["speech", 15.68], ["foghorn", 14.04]]], "duration": [3.7, 31.29, -0.19, 31.69, 0.2, -0.23, 0.09, 0.79, 39.64, 0.74, 0.73, 0.5, 0.32, 3.08]} \ No newline at end of file diff --git a/annotations_1/is4ZtB0U7Vo_filtered.json b/annotations_1/is4ZtB0U7Vo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8abda3a737a041e823d2314c4787662a4c030f1 --- /dev/null +++ b/annotations_1/is4ZtB0U7Vo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 26.45], [28.0, 29.71], [31.0, 31.45], [38.0, 51.41], [67.0, 88.8], [93.0, 115.75], [117.0, 127.74], [129.0, 129.95], [131.0, 156.96], [157.0, 157.03], [157.0, 205.14], [206.0, 207.76], [209.0, 209.97], [211.0, 214.66]], "keep_status": [true, false, false, true, true, true, false, false, false, false, false, false, false, true], "silence_prob": [28.95, 0.0, 0.0, 29.27, 28.73, 28.63, 29.22, 0.0, 29.06, 0.0, 0.0, 0.0, 0.0, 32.5], "audiomae_on_audioset": [[["music", 32.08], ["vehicle", 7.03], ["race car, auto racing", 3.49]], null, null, [["music", 39.1], ["explosion", 8.01], ["speech", 6.49]], [["music", 26.51], ["speech", 21.96], ["hum", 7.57]], [["music", 45.48], ["speech", 12.31], ["hum", 3.16]], [["speech", 43.16], ["music", 34.4], ["throbbing", 6.04]], null, [["speech", 57.83], ["music", 13.57], ["explosion", 7.86]], null, null, null, null, [["speech", 19.81], ["music", 15.43], ["hum", 15.12]]], "duration": [9.45, 1.71, 0.45, 13.41, 21.8, 22.75, 10.74, 0.95, 25.96, 0.03, 48.14, 1.76, 0.97, 3.66]} \ No newline at end of file diff --git a/annotations_1/isFVKJA4E-k_filtered.json b/annotations_1/isFVKJA4E-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59e9268b9c7476419285ac6fe173f4738805d630 --- /dev/null +++ b/annotations_1/isFVKJA4E-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.16], [15.0, 16.01], [20.0, 20.61], [33.0, 34.06], [36.0, 36.68], [37.0, 38.85], [59.0, 59.22], [60.0, 60.08], [63.0, 63.31], [64.0, 65.1], [66.0, 66.02], [68.0, 69.13], [75.0, 76.89], [79.0, 85.28], [86.0, 86.81], [87.0, 104.63], [105.0, 104.67], [106.0, 107.22], [108.0, 108.99], [111.0, 112.38], [113.0, 113.81], [114.0, 114.0], [114.0, 119.58], [121.0, 131.4], [133.0, 133.95], [136.0, 137.3], [139.0, 139.9], [141.0, 141.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.72, 0.0, 77.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 66.39, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.71], ["cattle, bovinae", 13.82], ["moo", 13.23]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 1.01, 0.61, 1.06, 0.68, 1.85, 0.22, 0.08, 0.31, 1.1, 0.02, 1.13, 1.89, 6.28, 0.81, 17.63, -0.33, 1.22, 0.99, 1.38, 0.81, 0.0, 5.58, 10.4, 0.95, 1.3, 0.9, 0.4]} \ No newline at end of file diff --git a/annotations_1/isct-XNu38E_filtered.json b/annotations_1/isct-XNu38E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30fca7df9443da7de8059c28dfebb3b0c0dd663f --- /dev/null +++ b/annotations_1/isct-XNu38E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.28], [11.0, 12.58], [14.0, 41.49], [42.0, 54.14], [55.0, 57.0], [58.0, 65.74], [67.0, 76.18], [79.0, 79.59], [82.0, 82.44], [86.0, 85.89], [90.0, 93.19], [94.0, 95.25], [97.0, 99.42], [104.0, 106.47], [107.0, 110.1], [111.0, 115.37], [125.0, 128.53], [132.0, 171.41], [172.0, 182.41], [183.0, 183.95], [187.0, 190.58], [191.0, 191.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 91.47, 95.91, 99.97, 99.62, 91.98, 0.0, 0.0, 0.0, 64.75, 0.0, 97.73, 96.04, 87.55, 99.87, 38.35, 0.0, 34.73, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 16.84], ["hum", 9.83], ["music", 6.65]], null, [["whack, thwack", 33.44], ["speech", 32.91], ["music", 8.18]], null, null, null], "duration": [1.28, 1.58, 27.49, 12.14, 2.0, 7.74, 9.18, 0.59, 0.44, -0.11, 3.19, 1.25, 2.42, 2.47, 3.1, 4.37, 3.53, 39.41, 10.41, 0.95, 3.58, 0.62]} \ No newline at end of file diff --git a/annotations_1/iswgTDjihrU_filtered.json b/annotations_1/iswgTDjihrU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bd9bc5dc5d9d21e8162a759fddf5f2c5f8c3a37 --- /dev/null +++ b/annotations_1/iswgTDjihrU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 53.25], [64.0, 81.57], [90.0, 118.0], [118.0, 152.78], [155.0, 167.95], [170.0, 181.99], [182.0, 189.31]], "keep_status": [false, true, false, false, true, true, false], "silence_prob": [28.73, 28.52, 28.74, 0.0, 28.75, 28.56, 29.76], "audiomae_on_audioset": [[["music", 62.4], ["throbbing", 18.08], ["hum", 6.56]], [["music", 34.13], ["siren", 19.71], ["vehicle", 6.7]], [["music", 50.66], ["throbbing", 28.29], ["hum", 10.56]], null, [["music", 18.31], ["hum", 17.38], ["buzz", 15.27]], [["speech", 34.3], ["music", 18.7], ["burst, pop", 3.45]], [["speech", 59.24], ["music", 16.88], ["explosion", 5.47]]], "duration": [29.25, 17.57, 28.0, 34.78, 12.95, 11.99, 7.31]} \ No newline at end of file diff --git a/annotations_1/iuPDl6n2vO0_filtered.json b/annotations_1/iuPDl6n2vO0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64c3f20e83333e381de0e222d99a8bc6004a6223 --- /dev/null +++ b/annotations_1/iuPDl6n2vO0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.99], [12.0, 13.09], [15.0, 16.6], [17.0, 17.78], [18.0, 19.92], [21.0, 21.47], [23.0, 26.47], [28.0, 28.8], [32.0, 32.12], [35.0, 36.19], [43.0, 43.87], [47.0, 51.63], [52.0, 52.54], [60.0, 60.47], [62.0, 62.04], [62.0, 64.02], [65.0, 66.87], [68.0, 71.9], [73.0, 74.24], [76.0, 76.92], [85.0, 86.58], [88.0, 89.73], [92.0, 92.91], [97.0, 97.19], [99.0, 99.0], [104.0, 105.48], [109.0, 112.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [41.28, 0.0, 0.0, 0.0, 0.0, 0.0, 53.53, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 68.54, 0.0, 77.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52], "audiomae_on_audioset": [[["music", 74.06], ["musical instrument", 4.02], ["speech", 3.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.99, 1.09, 1.6, 0.78, 1.92, 0.47, 3.47, 0.8, 0.12, 1.19, 0.87, 4.63, 0.54, 0.47, 0.04, 2.02, 1.87, 3.9, 1.24, 0.92, 1.58, 1.73, 0.91, 0.19, 0.0, 1.48, 3.21]} \ No newline at end of file diff --git a/annotations_1/ivG26TnBWGI_filtered.json b/annotations_1/ivG26TnBWGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18308e37d1f6d22994505ffe26b685222a5f3717 --- /dev/null +++ b/annotations_1/ivG26TnBWGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.85], [10.0, 20.73], [22.0, 24.24], [27.0, 30.7], [32.0, 32.26], [34.0, 41.15], [43.0, 44.27], [45.0, 52.71], [58.0, 58.67], [59.0, 63.15], [66.0, 71.07], [71.0, 71.68], [74.0, 82.95], [84.0, 84.57], [86.0, 97.14], [106.0, 123.52]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [33.05, 29.86, 30.06, 31.35, 0.0, 29.5, 0.0, 29.18, 0.0, 34.22, 30.0, 0.0, 30.37, 0.0, 29.61, 29.28], "audiomae_on_audioset": [[["music", 37.84], ["speech", 37.49], ["throbbing", 8.06]], [["music", 27.45], ["speech", 24.49], ["fly, housefly", 3.64]], [["music", 38.06], ["speech", 10.47], ["vehicle", 7.57]], [["music", 35.23], ["hum", 17.8], ["mains hum", 17.5]], null, [["music", 41.13], ["speech", 40.05], ["theremin", 1.77]], null, [["music", 42.25], ["didgeridoo", 21.36], ["theremin", 9.6]], null, [["music", 69.77], ["speech", 5.97], ["electronic music", 3.25]], [["music", 49.43], ["thunk", 12.9], ["whack, thwack", 9.84]], null, [["speech", 29.95], ["mains hum", 13.25], ["animal", 10.46]], null, [["music", 65.19], ["throbbing", 4.34], ["musical instrument", 2.29]], [["fly, housefly", 40.62], ["insect", 37.16], ["mosquito", 16.52]]], "duration": [3.85, 10.73, 2.24, 3.7, 0.26, 7.15, 1.27, 7.71, 0.67, 4.15, 5.07, 0.68, 8.95, 0.57, 11.14, 17.52]} \ No newline at end of file diff --git a/annotations_1/iv_Q51lofKM_filtered.json b/annotations_1/iv_Q51lofKM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ecd9f5b4d0977f8073d2e6dcd32e8617b425b1e --- /dev/null +++ b/annotations_1/iv_Q51lofKM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.47], [16.0, 16.77], [17.0, 17.78], [20.0, 22.27], [29.0, 29.57], [30.0, 36.53], [40.0, 40.86], [41.0, 41.5], [45.0, 48.0], [48.0, 48.03], [48.0, 48.07], [49.0, 48.71], [54.0, 55.54], [57.0, 58.46], [71.0, 71.44], [79.0, 80.35], [95.0, 95.2], [96.0, 96.3], [97.0, 97.75], [98.0, 98.24], [101.0, 104.58], [110.0, 111.03], [112.0, 115.52], [116.0, 116.04], [118.0, 117.68], [130.0, 133.52], [134.0, 134.62], [145.0, 145.17], [148.0, 148.36]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [42.39, 0.0, 0.0, 46.09, 0.0, 39.96, 0.0, 0.0, 35.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.07, 0.0, 42.67, 0.0, 0.0, 35.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 48.01], ["thunk", 31.35], ["breaking", 3.38]], null, null, [["speech", 29.54], ["music", 18.66], ["noise", 5.76]], null, [["music", 40.74], ["speech", 35.31], ["sidetone", 2.39]], null, null, [["speech", 53.35], ["music", 16.3], ["speech synthesizer", 6.57]], null, null, null, null, null, null, null, null, null, null, null, [["music", 53.78], ["throbbing", 5.97], ["hum", 3.77]], null, [["music", 60.01], ["throbbing", 17.12], ["hum", 5.68]], null, null, [["cattle, bovinae", 26.92], ["music", 21.48], ["moo", 19.27]], null, null, null], "duration": [3.47, 0.77, 0.78, 2.27, 0.57, 6.53, 0.86, 0.5, 3.0, 0.03, 0.07, -0.29, 1.54, 1.46, 0.44, 1.35, 0.2, 0.3, 0.75, 0.24, 3.58, 1.03, 3.52, 0.04, -0.32, 3.52, 0.62, 0.17, 0.36]} \ No newline at end of file diff --git a/annotations_1/iw-0Y6HWb9Q_filtered.json b/annotations_1/iw-0Y6HWb9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33451406383d552e601f69be10390a8a38b061f3 --- /dev/null +++ b/annotations_1/iw-0Y6HWb9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.16], [8.0, 10.32], [12.0, 13.15], [17.0, 17.9], [19.0, 24.02], [25.0, 25.61], [27.0, 27.7], [30.0, 31.29], [32.0, 32.66], [33.0, 33.89], [35.0, 35.56], [38.0, 38.47], [39.0, 39.75], [44.0, 44.98], [45.0, 47.61], [48.0, 51.34], [52.0, 55.0], [62.0, 64.05], [67.0, 113.44], [114.0, 114.79], [115.0, 120.65], [122.0, 123.74], [124.0, 127.25], [128.0, 128.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [91.47, 67.51, 0.0, 0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.16, 81.89, 29.52, 61.27, 0.0, 0.0, 30.76, 0.0, 35.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.25], ["hum", 13.46], ["music", 7.81]], null, [["speech", 34.28], ["music", 18.98], ["thump, thud", 12.16]], null, null, null, [["explosion", 44.66], ["speech", 23.58], ["burst, pop", 13.68]], null, [["speech", 68.16], ["groan", 7.35], ["animal", 2.87]], null], "duration": [4.16, 2.32, 1.15, 0.9, 5.02, 0.61, 0.7, 1.29, 0.66, 0.89, 0.56, 0.47, 0.75, 0.98, 2.61, 3.34, 3.0, 2.05, 46.44, 0.79, 5.65, 1.74, 3.25, 0.82]} \ No newline at end of file diff --git a/annotations_1/iwGU5hY6stw_filtered.json b/annotations_1/iwGU5hY6stw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..806ca80c4619f0edd5fafcb73e57e3bb9ad0ea6a --- /dev/null +++ b/annotations_1/iwGU5hY6stw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.54], [13.0, 15.48], [19.0, 19.77], [23.0, 24.06], [31.0, 32.34], [42.0, 72.57], [73.0, 78.04], [78.0, 89.99], [95.0, 120.72], [121.0, 126.3], [128.0, 129.76], [130.0, 130.35], [131.0, 132.06], [132.0, 134.27]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 30.78, 0.0, 0.0, 0.0, 0.0, 28.97, 29.06, 29.01, 27.93, 0.0, 0.0, 0.0, 28.2], "audiomae_on_audioset": [null, [["music", 55.17], ["mains hum", 10.64], ["hum", 9.38]], null, null, null, null, [["music", 36.66], ["theremin", 17.07], ["didgeridoo", 12.62]], [["music", 53.56], ["hum", 7.22], ["throbbing", 4.64]], [["music", 51.08], ["didgeridoo", 16.89], ["hum", 10.73]], [["livestock, farm animals, working animals", 51.7], ["cattle, bovinae", 38.16], ["moo", 7.14]], null, null, null, [["rumble", 20.11], ["fly, housefly", 17.94], ["insect", 12.93]]], "duration": [1.54, 2.48, 0.77, 1.06, 1.34, 30.57, 5.04, 11.99, 25.72, 5.3, 1.76, 0.35, 1.06, 2.27]} \ No newline at end of file diff --git a/annotations_1/iwxe2sIgQL0_filtered.json b/annotations_1/iwxe2sIgQL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c278db80deb9879b50f54fbfb03eada121d16121 --- /dev/null +++ b/annotations_1/iwxe2sIgQL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.26], [5.0, 7.6], [17.0, 18.17], [24.0, 24.19], [30.0, 31.35], [37.0, 36.76], [41.0, 41.42], [49.0, 48.84], [50.0, 51.51], [52.0, 53.91], [55.0, 56.05], [57.0, 57.77], [59.0, 60.12], [62.0, 63.49], [66.0, 67.64], [69.0, 70.51], [75.0, 76.47]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["fly, housefly", 16.81], ["insect", 10.74], ["crushing", 6.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 2.6, 1.17, 0.19, 1.35, -0.24, 0.42, -0.16, 1.51, 1.91, 1.05, 0.77, 1.12, 1.49, 1.64, 1.51, 1.47]} \ No newline at end of file diff --git a/annotations_1/iy-SmSGYYBM_filtered.json b/annotations_1/iy-SmSGYYBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13a524713cce6c1fb1fffb67c3f849801ac16f58 --- /dev/null +++ b/annotations_1/iy-SmSGYYBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 33.64], [47.0, 47.22], [51.0, 57.54], [67.0, 99.52], [103.0, 104.18]], "keep_status": [false, false, false, false, false], "silence_prob": [30.84, 0.0, 31.18, 0.0, 0.0], "audiomae_on_audioset": [[["music", 65.1], ["speech", 8.83], ["boing", 5.98]], null, [["music", 80.82], ["boing", 5.03], ["didgeridoo", 2.44]], null, null], "duration": [25.64, 0.22, 6.54, 32.52, 1.18]} \ No newline at end of file diff --git a/annotations_1/iz3ETniN1NI_filtered.json b/annotations_1/iz3ETniN1NI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da67efc296f07bdebd6b7f71d35f4eea1147b675 --- /dev/null +++ b/annotations_1/iz3ETniN1NI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.28], [19.0, 21.3], [22.0, 22.89], [23.0, 25.57], [27.0, 29.1], [31.0, 31.99], [43.0, 46.85], [47.0, 51.44], [53.0, 53.97], [56.0, 57.11], [58.0, 60.69], [62.0, 63.54], [74.0, 74.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.29, 0.0, 94.66, 95.91, 0.0, 100.0, 98.93, 0.0, 0.0, 99.93, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 2.3, 0.89, 2.57, 2.1, 0.99, 3.85, 4.44, 0.97, 1.11, 2.69, 1.54, 0.39]} \ No newline at end of file diff --git a/annotations_1/izLhF-Oodrg_filtered.json b/annotations_1/izLhF-Oodrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86c76a5d9d709ea9a8d7bac94b2432f81929fca4 --- /dev/null +++ b/annotations_1/izLhF-Oodrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.12], [6.0, 8.67], [10.0, 13.04], [14.0, 16.39], [22.0, 23.57], [25.0, 25.68], [28.0, 27.68], [30.0, 30.32], [33.0, 36.02], [45.0, 46.2], [49.0, 48.96], [55.0, 55.68], [57.0, 57.13], [58.0, 59.24], [61.0, 61.92], [66.0, 67.1], [69.0, 71.41], [72.0, 72.0], [73.0, 73.4], [75.0, 76.22], [80.0, 82.19], [86.0, 86.83], [90.0, 91.18], [92.0, 93.45], [99.0, 101.12], [103.0, 103.64], [105.0, 108.58], [112.0, 113.44], [116.0, 119.3], [121.0, 123.9], [125.0, 128.07], [134.0, 140.9], [146.0, 149.08], [151.0, 152.1], [153.0, 154.97], [156.0, 160.37], [161.0, 160.96], [161.0, 165.91], [167.0, 174.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.8, 74.44, 73.36, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 0.0, 78.89, 0.0, 0.0, 0.0, 78.38, 0.0, 74.92, 0.0, 76.04, 90.08, 82.43, 95.51, 83.7, 0.0, 0.0, 70.44, 0.0, 65.44, 80.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 2.67, 3.04, 2.39, 1.57, 0.68, -0.32, 0.32, 3.02, 1.2, -0.04, 0.68, 0.13, 1.24, 0.92, 1.1, 2.41, 0.0, 0.4, 1.22, 2.19, 0.83, 1.18, 1.45, 2.12, 0.64, 3.58, 1.44, 3.3, 2.9, 3.07, 6.9, 3.08, 1.1, 1.97, 4.37, -0.04, 4.91, 7.51]} \ No newline at end of file diff --git a/annotations_1/izP8mDH8XOc_filtered.json b/annotations_1/izP8mDH8XOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2edc67451d09ce229d078533995c7ae844c3e2e --- /dev/null +++ b/annotations_1/izP8mDH8XOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.12], [4.0, 5.64], [7.0, 82.22], [83.0, 121.88], [125.0, 151.7], [152.0, 152.73], [156.0, 156.15], [160.0, 161.42]], "keep_status": [false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 28.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 20.62], ["hum", 16.04], ["mains hum", 12.24]], null, null, null], "duration": [0.12, 1.64, 75.22, 38.88, 26.7, 0.73, 0.15, 1.42]} \ No newline at end of file diff --git a/annotations_1/izWrKfUUP9o_filtered.json b/annotations_1/izWrKfUUP9o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..576c48adad1a481065163f48f667f6ad4110007f --- /dev/null +++ b/annotations_1/izWrKfUUP9o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.88], [20.0, 27.18], [31.0, 31.99], [35.0, 37.03], [43.0, 44.39], [47.0, 48.88], [52.0, 57.59], [72.0, 73.53], [78.0, 78.7], [81.0, 82.0], [98.0, 98.79], [101.0, 100.99], [107.0, 108.33], [110.0, 110.73], [112.0, 113.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.36, 30.98, 0.0, 30.06, 0.0, 0.0, 30.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 37.57], ["throbbing", 30.1], ["hum", 4.05]], [["music", 62.13], ["speech", 6.65], ["animal", 2.53]], null, [["music", 37.43], ["speech", 30.61], ["fart", 5.08]], null, null, [["music", 53.98], ["speech", 27.6], ["musical instrument", 3.4]], null, null, null, null, null, null, null, null], "duration": [3.88, 7.18, 0.99, 2.03, 1.39, 1.88, 5.59, 1.53, 0.7, 1.0, 0.79, -0.01, 1.33, 0.73, 1.21]} \ No newline at end of file diff --git a/annotations_1/j-7pVks8avo_filtered.json b/annotations_1/j-7pVks8avo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2639ad4e822d856c5089d1953a4e5205274ca7d7 --- /dev/null +++ b/annotations_1/j-7pVks8avo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.42], [16.0, 16.11], [38.0, 38.35], [41.0, 40.88], [47.0, 47.71], [51.0, 52.22], [57.0, 57.01], [63.0, 63.95], [66.0, 66.7], [67.0, 67.49], [77.0, 77.94], [84.0, 84.82], [132.0, 132.09], [133.0, 133.44], [144.0, 145.03], [146.0, 147.39], [148.0, 152.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.47], ["radio", 24.87], ["speech", 19.64]]], "duration": [0.42, 0.11, 0.35, -0.12, 0.71, 1.22, 0.01, 0.95, 0.7, 0.49, 0.94, 0.82, 0.09, 0.44, 1.03, 1.39, 4.31]} \ No newline at end of file diff --git a/annotations_1/j-TPDJFWErg_filtered.json b/annotations_1/j-TPDJFWErg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52ce7f027cb48f9c66f689496c2ec31dc41b5765 --- /dev/null +++ b/annotations_1/j-TPDJFWErg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.23], [5.0, 8.53], [12.0, 12.51], [14.0, 55.49], [57.0, 62.99], [63.0, 64.15], [65.0, 70.8], [71.0, 72.03], [73.0, 74.29], [75.0, 81.58], [84.0, 92.01], [96.0, 120.68], [123.0, 136.92], [138.0, 138.38], [141.0, 141.17], [143.0, 145.2], [146.0, 146.5], [147.0, 148.44], [149.0, 151.01], [151.0, 152.79], [153.0, 160.17], [162.0, 163.51], [164.0, 167.59], [168.0, 170.78], [171.0, 172.52], [173.0, 174.04]], "keep_status": [false, false, false, false, true, false, true, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.81, 0.0, 0.0, 33.3, 0.0, 34.98, 0.0, 0.0, 34.14, 32.26, 34.07, 33.98, 0.0, 0.0, 63.1, 0.0, 0.0, 74.44, 0.0, 51.6, 0.0, 63.64, 79.24, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 58.52], ["speech", 21.63], ["animal", 1.21]], null, null, [["music", 27.81], ["noise", 14.59], ["theremin", 8.23]], null, [["speech", 22.75], ["music", 19.09], ["noise", 10.49]], null, null, [["music", 17.3], ["noise", 16.54], ["speech", 13.02]], [["music", 38.99], ["smash, crash", 14.07], ["whack, thwack", 9.83]], [["music", 54.57], ["speech", 20.23], ["throbbing", 8.14]], [["music", 41.43], ["throbbing", 11.01], ["hum", 10.99]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 3.53, 0.51, 41.49, 5.99, 1.15, 5.8, 1.03, 1.29, 6.58, 8.01, 24.68, 13.92, 0.38, 0.17, 2.2, 0.5, 1.44, 2.01, 1.79, 7.17, 1.51, 3.59, 2.78, 1.52, 1.04]} \ No newline at end of file diff --git a/annotations_1/j0IXQIUh3jQ_filtered.json b/annotations_1/j0IXQIUh3jQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/j0IXQIUh3jQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/j0c_RQDfjSM_filtered.json b/annotations_1/j0c_RQDfjSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d791adac4962f9c273399a74b2152edddd6920dc --- /dev/null +++ b/annotations_1/j0c_RQDfjSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.82], [6.0, 6.1], [14.0, 13.91], [18.0, 18.57], [23.0, 23.28], [24.0, 24.95], [35.0, 35.65], [38.0, 38.97], [42.0, 42.77], [46.0, 47.56], [52.0, 52.51], [57.0, 57.18], [63.0, 63.04], [63.0, 63.91], [65.0, 66.43], [68.0, 68.96], [69.0, 81.09], [82.0, 83.37], [84.0, 84.94], [88.0, 88.96], [93.0, 100.36], [102.0, 108.38], [110.0, 121.05], [121.0, 121.17], [121.0, 136.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.63, 0.0, 0.0, 0.0, 29.35, 29.12, 29.18, 0.0, 30.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 88.64], ["boing", 4.79], ["speech", 1.66]], null, null, null, [["music", 82.08], ["fly, housefly", 2.34], ["sidetone", 1.7]], [["music", 50.23], ["didgeridoo", 15.0], ["hum", 3.49]], [["music", 62.88], ["electric shaver, electric razor", 9.88], ["electronic music", 3.1]], null, [["music", 88.33], ["throbbing", 1.83], ["speech", 1.33]]], "duration": [1.82, 0.1, -0.09, 0.57, 0.28, 0.95, 0.65, 0.97, 0.77, 1.56, 0.51, 0.18, 0.04, 0.91, 1.43, 0.96, 12.09, 1.37, 0.94, 0.96, 7.36, 6.38, 11.05, 0.17, 15.71]} \ No newline at end of file diff --git a/annotations_1/j0cqqCpIZHE_filtered.json b/annotations_1/j0cqqCpIZHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09f0fb70bc35010ddd106faa10b54eab7f103c3e --- /dev/null +++ b/annotations_1/j0cqqCpIZHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.4], [6.0, 7.32], [11.0, 11.77], [26.0, 25.89], [26.0, 26.0], [26.0, 26.18], [26.0, 26.22], [26.0, 26.45], [26.0, 27.18], [27.0, 27.23], [28.0, 28.59], [30.0, 30.18], [32.0, 33.52], [35.0, 35.34], [40.0, 44.71], [45.0, 46.23], [48.0, 48.51], [50.0, 50.23], [54.0, 54.55], [60.0, 67.51], [69.0, 70.73], [72.0, 72.93], [75.0, 77.4], [79.0, 81.04], [88.0, 88.48], [89.0, 90.41], [97.0, 97.56], [98.0, 98.36], [99.0, 99.84], [115.0, 115.32], [118.0, 118.84], [120.0, 120.51], [122.0, 123.74], [125.0, 126.1], [127.0, 128.46], [135.0, 136.81], [138.0, 140.12], [141.0, 143.63], [144.0, 147.7], [149.0, 150.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.35, 0.0, 0.0, 0.0, 0.0, 30.6, 0.0, 0.0, 40.55, 37.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.1, 57.89, 50.21, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.82], ["mains hum", 8.46], ["hum", 6.42]], null, null, null, null, [["speech", 67.69], ["music", 12.28], ["breaking", 2.32]], null, null, [["music", 55.71], ["didgeridoo", 8.39], ["hum", 6.08]], [["music", 35.96], ["musical instrument", 5.33], ["vehicle", 3.29]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.76], ["speech", 24.3], ["theremin", 16.26]], null, null, null], "duration": [0.4, 1.32, 0.77, -0.11, 0.0, 0.18, 0.22, 0.45, 1.18, 0.23, 0.59, 0.18, 1.52, 0.34, 4.71, 1.23, 0.51, 0.23, 0.55, 7.51, 1.73, 0.93, 2.4, 2.04, 0.48, 1.41, 0.56, 0.36, 0.84, 0.32, 0.84, 0.51, 1.74, 1.1, 1.46, 1.81, 2.12, 2.63, 3.7, 1.04]} \ No newline at end of file diff --git a/annotations_1/j0iplsU1qa4_filtered.json b/annotations_1/j0iplsU1qa4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3aef6da62c77721baa8e3032eb9f03575fc9bad --- /dev/null +++ b/annotations_1/j0iplsU1qa4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.04], [7.0, 7.25], [8.0, 8.68], [13.0, 14.0], [21.0, 21.47], [24.0, 24.54], [26.0, 30.47], [32.0, 34.74], [36.0, 45.22], [50.0, 50.35], [52.0, 53.16], [56.0, 58.01], [59.0, 60.79], [61.0, 62.68], [68.0, 68.39], [73.0, 73.41], [77.0, 80.32], [81.0, 81.19], [86.0, 86.68], [88.0, 88.57], [90.0, 97.31], [98.0, 102.96], [103.0, 104.21], [108.0, 108.87], [114.0, 114.35], [115.0, 119.45], [120.0, 120.97], [123.0, 126.47], [128.0, 129.83], [132.0, 133.69], [135.0, 137.15], [138.0, 138.97], [140.0, 141.24], [145.0, 145.94], [152.0, 153.55], [155.0, 155.88], [157.0, 157.96], [159.0, 159.92], [164.0, 164.73]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.22, 53.1, 28.98, 0.0, 0.0, 33.19, 0.0, 0.0, 0.0, 0.0, 30.42, 0.0, 0.0, 0.0, 30.69, 30.38, 0.0, 0.0, 0.0, 28.81, 0.0, 34.07, 0.0, 0.0, 31.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 32.17], ["music", 16.16], ["throbbing", 13.5]], null, [["hum", 46.09], ["mains hum", 17.32], ["whale vocalization", 8.72]], null, null, [["music", 14.26], ["hum", 13.45], ["mains hum", 9.15]], null, null, null, null, [["hum", 35.76], ["mains hum", 24.92], ["throbbing", 6.9]], null, null, null, [["hum", 29.61], ["fly, housefly", 11.37], ["bee, wasp, etc.", 10.02]], [["bee, wasp, etc.", 36.47], ["insect", 16.69], ["fly, housefly", 14.32]], null, null, null, [["speech", 63.13], ["music", 5.4], ["rumble", 3.59]], null, [["music", 18.39], ["hum", 15.08], ["speech", 11.99]], null, null, [["noise", 29.61], ["white noise", 10.44], ["hum", 8.41]], null, null, null, null, null, null, null, null], "duration": [1.04, 0.25, 0.68, 1.0, 0.47, 0.54, 4.47, 2.74, 9.22, 0.35, 1.16, 2.01, 1.79, 1.68, 0.39, 0.41, 3.32, 0.19, 0.68, 0.57, 7.31, 4.96, 1.21, 0.87, 0.35, 4.45, 0.97, 3.47, 1.83, 1.69, 2.15, 0.97, 1.24, 0.94, 1.55, 0.88, 0.96, 0.92, 0.73]} \ No newline at end of file diff --git a/annotations_1/j0z0V2JJ5II_filtered.json b/annotations_1/j0z0V2JJ5II_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2292ed294fb524e35f407c67c0d2c41f6f01047 --- /dev/null +++ b/annotations_1/j0z0V2JJ5II_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.32], [1.0, 1.36], [1.0, 1.39], [1.0, 1.43], [2.0, 1.53], [3.0, 13.76], [17.0, 18.12], [21.0, 21.32], [26.0, 44.07], [46.0, 54.48], [56.0, 70.04], [71.0, 73.8], [76.0, 79.56], [80.0, 94.05], [95.0, 101.24], [108.0, 110.78], [113.0, 121.59]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.76, 0.0, 0.0, 38.6, 31.11, 35.96, 40.9, 63.1, 38.49, 33.13, 30.14, 30.44], "audiomae_on_audioset": [null, null, null, null, null, [["music", 24.18], ["sidetone", 22.43], ["throbbing", 14.22]], null, null, [["hum", 27.49], ["throbbing", 16.24], ["mains hum", 11.34]], [["music", 49.98], ["noise", 20.77], ["grunt", 6.91]], [["grunt", 49.69], ["noise", 19.04], ["groan", 16.39]], [["sidetone", 49.17], ["speech", 26.68], ["radio", 6.35]], null, [["insect", 40.06], ["fly, housefly", 28.57], ["music", 9.94]], [["music", 49.71], ["theremin", 6.06], ["musical instrument", 4.44]], [["cattle, bovinae", 38.42], ["moo", 31.73], ["speech", 9.58]], [["speech", 46.58], ["electric shaver, electric razor", 10.67], ["hum", 10.19]]], "duration": [0.32, 0.36, 0.39, 0.43, -0.47, 10.76, 1.12, 0.32, 18.07, 8.48, 14.04, 2.8, 3.56, 14.05, 6.24, 2.78, 8.59]} \ No newline at end of file diff --git a/annotations_1/j1tXIl0snEk_filtered.json b/annotations_1/j1tXIl0snEk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2c4473114cdb61fd52a020d255226838828477b --- /dev/null +++ b/annotations_1/j1tXIl0snEk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 25.95], [27.0, 28.29], [30.0, 30.65], [33.0, 34.35], [36.0, 36.75], [39.0, 45.69], [47.0, 48.17], [56.0, 57.4], [73.0, 77.48], [83.0, 83.83], [100.0, 101.58], [105.0, 116.6], [118.0, 121.09]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, true, true], "silence_prob": [29.46, 0.0, 0.0, 0.0, 0.0, 29.41, 0.0, 0.0, 28.69, 0.0, 0.0, 30.37, 30.08], "audiomae_on_audioset": [[["hum", 55.57], ["throbbing", 19.32], ["mains hum", 13.19]], null, null, null, null, [["hum", 28.02], ["music", 20.58], ["throbbing", 17.62]], null, null, [["hum", 35.29], ["mains hum", 22.22], ["music", 9.84]], null, null, [["music", 34.68], ["electronic music", 8.95], ["speech", 6.93]], [["hum", 36.85], ["ambient music", 17.32], ["music", 12.99]]], "duration": [5.95, 1.29, 0.65, 1.35, 0.75, 6.69, 1.17, 1.4, 4.48, 0.83, 1.58, 11.6, 3.09]} \ No newline at end of file diff --git a/annotations_1/j21idqW08wU_filtered.json b/annotations_1/j21idqW08wU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50e1c32ea39da6e66b66438c1eb6ecad62d7b2bd --- /dev/null +++ b/annotations_1/j21idqW08wU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 33.86], [35.0, 35.4], [40.0, 46.55], [50.0, 50.79], [52.0, 61.74], [64.0, 70.83], [73.0, 86.04], [101.0, 114.15], [115.0, 115.57], [117.0, 122.72], [128.0, 128.39], [129.0, 130.15], [134.0, 135.38], [136.0, 137.0], [141.0, 141.02], [142.0, 146.31], [152.0, 156.84], [161.0, 161.97], [167.0, 172.66], [173.0, 174.9]], "keep_status": [false, false, true, false, false, true, false, true, false, true, false, false, false, false, false, true, false, false, true, false], "silence_prob": [32.22, 0.0, 32.6, 0.0, 34.22, 33.96, 34.56, 33.99, 0.0, 34.91, 0.0, 0.0, 0.0, 0.0, 0.0, 36.75, 63.64, 0.0, 35.58, 0.0], "audiomae_on_audioset": [[["music", 44.84], ["speech", 19.84], ["throbbing", 10.25]], null, [["music", 37.8], ["speech", 26.58], ["hum", 4.77]], null, [["music", 51.83], ["speech", 21.56], ["hum", 5.21]], [["music", 37.02], ["hum", 18.68], ["mains hum", 12.15]], [["hum", 38.0], ["throbbing", 18.42], ["music", 18.25]], [["speech", 32.13], ["buzz", 25.72], ["vehicle", 9.6]], null, [["hum", 22.53], ["music", 22.48], ["mains hum", 21.9]], null, null, null, null, null, [["speech", 40.96], ["music", 17.52], ["hum", 6.61]], null, null, [["speech", 57.15], ["music", 7.3], ["rumble", 3.78]], null], "duration": [19.86, 0.4, 6.55, 0.79, 9.74, 6.83, 13.04, 13.15, 0.57, 5.72, 0.39, 1.15, 1.38, 1.0, 0.02, 4.31, 4.84, 0.97, 5.66, 1.9]} \ No newline at end of file diff --git a/annotations_1/j2JFTz9KQhk_filtered.json b/annotations_1/j2JFTz9KQhk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d64d5ff58e67ee36dff1cbc5f5dc33cacf1ad403 --- /dev/null +++ b/annotations_1/j2JFTz9KQhk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.85], [14.0, 32.04], [37.0, 38.26], [40.0, 47.98], [50.0, 51.44], [53.0, 63.09], [63.0, 72.32], [73.0, 73.28], [74.0, 74.26], [77.0, 83.13], [84.0, 85.21], [86.0, 88.89], [90.0, 93.21], [94.0, 94.24], [96.0, 98.51], [99.0, 99.13], [101.0, 101.21], [103.0, 102.76], [109.0, 109.29], [123.0, 124.5], [129.0, 130.23], [133.0, 132.68], [137.0, 137.13], [138.0, 139.68]], "keep_status": [false, true, false, true, false, true, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.72, 0.0, 34.88, 0.0, 32.09, 30.54, 0.0, 0.0, 32.85, 0.0, 30.19, 31.94, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 55.43], ["throbbing", 8.11], ["hum", 5.67]], null, [["music", 23.4], ["throbbing", 15.32], ["hum", 5.86]], null, [["fly, housefly", 29.84], ["insect", 18.46], ["mosquito", 17.36]], [["hum", 23.12], ["speech", 20.18], ["music", 19.81]], null, null, [["hum", 49.85], ["music", 19.37], ["throbbing", 17.11]], null, [["hum", 27.64], ["music", 15.93], ["throbbing", 15.17]], [["vehicle", 17.77], ["music", 16.51], ["hum", 10.52]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.85, 18.04, 1.26, 7.98, 1.44, 10.09, 9.32, 0.28, 0.26, 6.13, 1.21, 2.89, 3.21, 0.24, 2.51, 0.13, 0.21, -0.24, 0.29, 1.5, 1.23, -0.32, 0.13, 1.68]} \ No newline at end of file diff --git a/annotations_1/j2MbvFYy_8Y_filtered.json b/annotations_1/j2MbvFYy_8Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4723294235a641e7c067252076d81aa7efbe2d5 --- /dev/null +++ b/annotations_1/j2MbvFYy_8Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.86], [11.0, 11.23], [13.0, 13.32], [15.0, 14.91], [19.0, 22.06], [26.0, 26.81], [29.0, 29.73], [31.0, 48.03], [48.0, 48.44], [50.0, 49.92], [54.0, 58.48], [64.0, 65.43], [67.0, 67.42], [69.0, 69.74], [73.0, 75.02], [76.0, 76.79], [77.0, 78.19], [81.0, 82.22], [83.0, 83.86], [86.0, 91.67], [94.0, 98.02], [99.0, 99.57], [101.0, 101.43], [102.0, 102.41], [104.0, 105.19], [119.0, 119.31], [120.0, 121.04], [122.0, 123.08], [125.0, 141.0], [144.0, 155.76]], "keep_status": [false, false, false, false, true, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.71, 0.0, 0.0, 30.07, 0.0, 0.0, 41.62, 0.0, 0.0, 0.0, 47.12, 0.0, 0.0, 0.0, 0.0, 73.06, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.68, 32.52], "audiomae_on_audioset": [null, null, null, null, [["music", 51.0], ["musical instrument", 7.89], ["percussion", 4.2]], null, null, [["music", 27.78], ["noise", 15.02], ["mains hum", 9.2]], null, null, [["breaking", 22.9], ["crushing", 14.49], ["thunk", 12.59]], null, null, null, [["sidetone", 46.67], ["speech", 41.12], ["echo", 1.99]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.85], ["musical instrument", 6.8], ["effects unit", 2.0]], [["music", 62.93], ["speech", 11.34], ["guitar", 3.87]]], "duration": [0.86, 0.23, 0.32, -0.09, 3.06, 0.81, 0.73, 17.03, 0.44, -0.08, 4.48, 1.43, 0.42, 0.74, 2.02, 0.79, 1.19, 1.22, 0.86, 5.67, 4.02, 0.57, 0.43, 0.41, 1.19, 0.31, 1.04, 1.08, 16.0, 11.76]} \ No newline at end of file diff --git a/annotations_1/j2ZsEQ4Fr4c_filtered.json b/annotations_1/j2ZsEQ4Fr4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c49880a9fad71d77fc1a6f5cd1717e22e5d7be4 --- /dev/null +++ b/annotations_1/j2ZsEQ4Fr4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 8.19], [41.0, 40.78], [73.0, 73.43], [77.0, 78.02], [79.0, 80.74], [82.0, 83.66], [87.0, 87.07], [88.0, 89.29], [90.0, 92.2], [93.0, 93.02], [94.0, 95.57], [96.0, 98.54], [99.0, 100.67]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.23, 0.0, 0.0, 77.36, 0.0], "audiomae_on_audioset": [[["speech", 22.34], ["music", 17.83], ["mosquito", 11.07]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.19, -0.22, 0.43, 1.02, 1.74, 1.66, 0.07, 1.29, 2.2, 0.02, 1.57, 2.54, 1.67]} \ No newline at end of file diff --git a/annotations_1/j4onAJ-3FAM_filtered.json b/annotations_1/j4onAJ-3FAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89184e3c218aaee5a07f776bcf927dd61f172acd --- /dev/null +++ b/annotations_1/j4onAJ-3FAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.44], [5.0, 4.94], [5.0, 7.65], [8.0, 7.86], [8.0, 8.01], [9.0, 8.56], [10.0, 9.63], [11.0, 24.88], [28.0, 36.85], [43.0, 52.2], [52.0, 54.19], [55.0, 60.15], [61.0, 77.97], [79.0, 83.86]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, true, true], "silence_prob": [0.0, 0.0, 32.68, 0.0, 0.0, 0.0, 0.0, 31.84, 32.89, 33.3, 40.38, 30.89, 29.1, 29.22], "audiomae_on_audioset": [null, null, [["music", 59.93], ["speech", 10.05], ["electronic music", 6.49]], null, null, null, null, [["throbbing", 33.85], ["hum", 27.74], ["music", 25.22]], [["music", 39.41], ["throbbing", 18.43], ["fart", 5.85]], [["music", 46.49], ["throbbing", 23.09], ["hum", 15.45]], [["music", 74.41], ["throbbing", 11.33], ["hum", 2.95]], [["music", 49.95], ["speech", 7.65], ["electronic music", 4.5]], [["music", 44.19], ["throbbing", 13.42], ["buzz", 10.64]], [["explosion", 30.12], ["whack, thwack", 10.38], ["music", 5.6]]], "duration": [0.44, -0.06, 2.65, -0.14, 0.01, -0.44, -0.37, 13.88, 8.85, 9.2, 2.19, 5.15, 16.97, 4.86]} \ No newline at end of file diff --git a/annotations_1/j66Fsl_q5Ig_filtered.json b/annotations_1/j66Fsl_q5Ig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d803ebec844b67b00447dc13a0639572b69c517 --- /dev/null +++ b/annotations_1/j66Fsl_q5Ig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 16.04], [19.0, 21.76], [23.0, 23.36], [25.0, 25.95], [28.0, 29.08], [32.0, 34.87], [38.0, 38.04], [39.0, 53.35], [59.0, 59.98], [63.0, 74.9], [76.0, 90.21], [92.0, 94.04], [99.0, 99.98], [102.0, 105.02], [106.0, 107.05], [111.0, 112.13], [113.0, 113.7], [115.0, 115.48], [119.0, 142.5], [146.0, 151.43], [154.0, 166.62], [168.0, 198.41]], "keep_status": [false, false, false, false, false, true, false, true, false, true, false, true, false, true, false, false, false, false, false, true, false, false], "silence_prob": [31.03, 43.58, 0.0, 0.0, 0.0, 31.17, 0.0, 31.2, 0.0, 30.56, 30.17, 32.12, 0.0, 31.42, 0.0, 0.0, 0.0, 0.0, 30.91, 31.26, 30.95, 0.0], "audiomae_on_audioset": [[["music", 41.92], ["throbbing", 19.18], ["hum", 9.42]], [["music", 68.98], ["synthesizer", 3.41], ["musical instrument", 2.98]], null, null, null, [["speech", 22.66], ["music", 21.91], ["eruption", 3.77]], null, [["music", 56.6], ["electronic music", 6.76], ["cacophony", 4.1]], null, [["music", 38.69], ["speech", 25.57], ["hum", 4.62]], [["mains hum", 34.69], ["music", 24.04], ["hum", 16.33]], [["music", 33.04], ["hum", 8.99], ["throbbing", 8.05]], null, [["music", 52.22], ["hum", 6.57], ["cacophony", 5.99]], null, null, null, null, [["music", 55.75], ["throbbing", 14.39], ["hum", 10.11]], [["music", 36.34], ["throbbing", 20.42], ["hum", 12.54]], [["music", 46.95], ["speech", 26.96], ["electric shaver, electric razor", 2.43]], null], "duration": [5.04, 2.76, 0.36, 0.95, 1.08, 2.87, 0.04, 14.35, 0.98, 11.9, 14.21, 2.04, 0.98, 3.02, 1.05, 1.13, 0.7, 0.48, 23.5, 5.43, 12.62, 30.41]} \ No newline at end of file diff --git a/annotations_1/j71oHN1i2pU_filtered.json b/annotations_1/j71oHN1i2pU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85e96644f3fecfb6ef412ddd8ab38d16e595f6ea --- /dev/null +++ b/annotations_1/j71oHN1i2pU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 18.98], [29.0, 29.34], [30.0, 30.45], [31.0, 31.48], [32.0, 35.43], [38.0, 38.5], [55.0, 66.9], [67.0, 68.82], [70.0, 82.27], [86.0, 85.95], [89.0, 108.94]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.08, 0.0, 28.95, 0.0, 31.53, 0.0, 29.8], "audiomae_on_audioset": [null, null, null, null, [["music", 14.46], ["grunt", 14.01], ["groan", 13.98]], null, [["music", 65.78], ["speech", 4.59], ["hum", 4.4]], null, [["music", 48.5], ["speech", 19.42], ["foghorn", 4.17]], null, [["livestock, farm animals, working animals", 41.39], ["cattle, bovinae", 12.81], ["moo", 8.54]]], "duration": [-0.02, 0.34, 0.45, 0.48, 3.43, 0.5, 11.9, 1.82, 12.27, -0.05, 19.94]} \ No newline at end of file diff --git a/annotations_1/j7m47I9BuuY_filtered.json b/annotations_1/j7m47I9BuuY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3300fae37101dd5d7c47a91e925ae7c9a8980f60 --- /dev/null +++ b/annotations_1/j7m47I9BuuY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[209.0, 214.22]], "keep_status": [false], "silence_prob": [60.89], "audiomae_on_audioset": [null], "duration": [5.22]} \ No newline at end of file diff --git a/annotations_1/j8cGENcePl0_filtered.json b/annotations_1/j8cGENcePl0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..547838df3d080f02fef44f39d34097d09e949e86 --- /dev/null +++ b/annotations_1/j8cGENcePl0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.88], [12.0, 16.31], [19.0, 29.2], [35.0, 41.03], [45.0, 45.94], [47.0, 56.94], [58.0, 63.95], [66.0, 68.22], [69.0, 95.52], [97.0, 104.3], [105.0, 122.62], [124.0, 124.09]], "keep_status": [false, false, false, false, false, false, false, true, false, true, true, false], "silence_prob": [0.0, 39.35, 37.88, 36.86, 0.0, 34.37, 32.47, 33.1, 32.05, 34.01, 32.45, 0.0], "audiomae_on_audioset": [null, [["music", 60.89], ["musical instrument", 6.27], ["guitar", 3.35]], [["boing", 39.0], ["music", 17.9], ["fly, housefly", 17.11]], [["music", 74.93], ["speech", 10.38], ["boing", 3.53]], null, [["music", 56.58], ["speech", 17.04], ["throbbing", 2.8]], [["music", 63.24], ["boing", 6.66], ["electronic music", 4.09]], [["sidetone", 44.04], ["music", 14.19], ["moo", 4.78]], [["music", 50.53], ["speech", 15.63], ["boing", 5.15]], [["music", 47.04], ["boing", 8.9], ["throbbing", 3.24]], [["livestock, farm animals, working animals", 44.18], ["cattle, bovinae", 13.58], ["moo", 11.36]], null], "duration": [0.88, 4.31, 10.2, 6.03, 0.94, 9.94, 5.95, 2.22, 26.52, 7.3, 17.62, 0.09]} \ No newline at end of file diff --git a/annotations_1/j8nLPMys3b8_filtered.json b/annotations_1/j8nLPMys3b8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86a92ca104f8112798a9b823e57865c065717794 --- /dev/null +++ b/annotations_1/j8nLPMys3b8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 44.07], [48.0, 80.43], [81.0, 106.91], [109.0, 122.57], [125.0, 137.19], [139.0, 139.06], [141.0, 142.48], [145.0, 184.2]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.55, 41.26, 31.33, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 56.01], ["breaking", 20.63], ["glass", 3.69]], [["music", 80.66], ["theremin", 6.27], ["scary music", 2.77]], [["music", 40.54], ["hum", 20.14], ["mains hum", 10.92]], null, null, null], "duration": [38.07, 32.43, 25.91, 13.57, 12.19, 0.06, 1.48, 39.2]} \ No newline at end of file diff --git a/annotations_1/j91qPMHaqbg_filtered.json b/annotations_1/j91qPMHaqbg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ad105e4a68637f05e2e8c17901885efd5f2393b --- /dev/null +++ b/annotations_1/j91qPMHaqbg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.92], [1.0, 2.84], [6.0, 7.94], [15.0, 15.99], [17.0, 20.51], [22.0, 22.45], [23.0, 24.09], [28.0, 32.44], [33.0, 35.24], [40.0, 42.96], [56.0, 58.48], [60.0, 60.76], [61.0, 61.5], [72.0, 72.35], [83.0, 85.43], [87.0, 89.02], [91.0, 92.62], [95.0, 97.68], [100.0, 104.58], [105.0, 108.53], [110.0, 110.69], [114.0, 115.11], [129.0, 133.42], [135.0, 140.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 0.0, 56.4, 40.41, 54.83, 59.07, 0.0, 0.0, 0.0, 51.44, 98.8, 0.0, 100.0, 44.93, 38.72, 0.0, 0.0, 97.0, 77.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 71.96], ["sidetone", 8.41], ["noise", 2.6]], null, null, null, null, null, null, null, null, null, [["speech", 94.31], ["music", 0.83], ["inside, small room", 0.76]], [["speech", 35.54], ["music", 29.46], ["inside, small room", 5.11]], null, null, null, null], "duration": [-0.08, 1.84, 1.94, 0.99, 3.51, 0.45, 1.09, 4.44, 2.24, 2.96, 2.48, 0.76, 0.5, 0.35, 2.43, 2.02, 1.62, 2.68, 4.58, 3.53, 0.69, 1.11, 4.42, 5.26]} \ No newline at end of file diff --git a/annotations_1/jA83iWbczFc_filtered.json b/annotations_1/jA83iWbczFc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92d08bc1d6f9b507ee200e044cfa43d814a73ca1 --- /dev/null +++ b/annotations_1/jA83iWbczFc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 22.3], [23.0, 24.19], [25.0, 26.15], [27.0, 27.8], [29.0, 29.15], [33.0, 34.21], [36.0, 37.18], [37.0, 38.47], [40.0, 41.71], [43.0, 46.67], [48.0, 48.05], [48.0, 48.39], [49.0, 48.93], [49.0, 50.79], [51.0, 52.42], [53.0, 53.47], [56.0, 57.3], [59.0, 59.66], [61.0, 89.01], [92.0, 99.22], [100.0, 100.72], [110.0, 114.08], [116.0, 121.56], [123.0, 130.74], [132.0, 144.91], [146.0, 146.45], [147.0, 148.34], [151.0, 152.42], [153.0, 158.82], [161.0, 161.64], [162.0, 161.69], [162.0, 162.28], [163.0, 165.75], [168.0, 168.45], [170.0, 169.96], [171.0, 171.49]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.51, 33.47, 0.0, 42.53, 44.26, 29.69, 29.35, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 0.0, 31.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 27.47], ["siren", 14.91], ["emergency vehicle", 13.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 28.81], ["hum", 27.02], ["music", 23.89]], [["music", 70.99], ["scary music", 6.73], ["ambient music", 4.59]], null, [["music", 57.71], ["hum", 10.23], ["mains hum", 9.1]], [["music", 36.57], ["scary music", 23.98], ["mains hum", 12.85]], [["music", 83.19], ["speech", 2.78], ["burst, pop", 2.42]], [["speech", 24.23], ["music", 15.29], ["throbbing", 12.8]], null, null, null, [["mains hum", 22.07], ["hum", 17.08], ["speech", 6.62]], null, null, null, [["speech", 58.98], ["music", 10.54], ["whack, thwack", 5.24]], null, null, null], "duration": [20.3, 1.19, 1.15, 0.8, 0.15, 1.21, 1.18, 1.47, 1.71, 3.67, 0.05, 0.39, -0.07, 1.79, 1.42, 0.47, 1.3, 0.66, 28.01, 7.22, 0.72, 4.08, 5.56, 7.74, 12.91, 0.45, 1.34, 1.42, 5.82, 0.64, -0.31, 0.28, 2.75, 0.45, -0.04, 0.49]} \ No newline at end of file diff --git a/annotations_1/jB9WGpVrYBs_filtered.json b/annotations_1/jB9WGpVrYBs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d3b666822a84850a50f1cf644612e25cc98044e --- /dev/null +++ b/annotations_1/jB9WGpVrYBs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.19], [8.0, 21.88], [23.0, 23.65], [25.0, 29.15], [29.0, 31.16], [35.0, 38.25], [44.0, 112.45]], "keep_status": [true, false, false, true, true, true, false], "silence_prob": [28.64, 29.06, 0.0, 29.45, 32.41, 29.52, 0.0], "audiomae_on_audioset": [[["music", 52.09], ["speech", 11.2], ["explosion", 3.62]], [["music", 48.57], ["speech", 26.72], ["burst, pop", 2.89]], null, [["speech", 28.26], ["mains hum", 21.67], ["music", 16.06]], [["music", 23.79], ["throbbing", 17.96], ["mains hum", 13.98]], [["speech", 28.73], ["music", 19.31], ["mains hum", 5.78]], null], "duration": [2.19, 13.88, 0.65, 4.15, 2.16, 3.25, 68.45]} \ No newline at end of file diff --git a/annotations_1/jBMZnAIY_Ng_filtered.json b/annotations_1/jBMZnAIY_Ng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d0f8c9324f30b3a444a6355694b57c8c6c29a3d --- /dev/null +++ b/annotations_1/jBMZnAIY_Ng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 58.41], [62.0, 80.23], [81.0, 111.25]], "keep_status": [true, false, false], "silence_prob": [42.28, 33.66, 0.0], "audiomae_on_audioset": [[["throbbing", 31.67], ["hum", 24.78], ["mains hum", 9.06]], [["music", 58.66], ["throbbing", 9.74], ["didgeridoo", 6.27]], null], "duration": [2.41, 18.23, 30.25]} \ No newline at end of file diff --git a/annotations_1/jBotZTDEcP8_filtered.json b/annotations_1/jBotZTDEcP8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04a39cc6a3353c234e2c50131833dd5945036d50 --- /dev/null +++ b/annotations_1/jBotZTDEcP8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.0], [21.0, 21.25], [22.0, 23.31], [27.0, 26.91], [30.0, 31.19], [32.0, 32.78], [34.0, 33.99], [38.0, 39.16], [40.0, 40.51], [41.0, 41.91], [43.0, 45.22], [52.0, 59.86], [65.0, 65.89], [68.0, 69.13], [71.0, 77.41], [89.0, 88.97], [91.0, 92.94], [95.0, 95.81], [98.0, 98.85], [104.0, 109.56], [111.0, 115.75], [122.0, 122.88], [125.0, 125.91], [145.0, 145.91], [147.0, 148.39], [152.0, 152.0], [158.0, 158.65]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.54, 30.73, 0.0, 0.0, 30.66, 0.0, 0.0, 0.0, 0.0, 46.97, 38.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 33.97], ["croak", 12.46], ["speech", 7.82]], null, null, null, null, null, null, null, null, null, null, [["music", 70.25], ["speech", 10.68], ["thunk", 2.43]], null, null, [["music", 48.66], ["thunk", 29.06], ["whack, thwack", 4.65]], null, null, null, null, [["music", 42.55], ["theremin", 16.25], ["speech", 15.0]], [["livestock, farm animals, working animals", 36.08], ["moo", 32.43], ["cattle, bovinae", 24.06]], null, null, null, null, null, null], "duration": [2.0, 0.25, 1.31, -0.09, 1.19, 0.78, -0.01, 1.16, 0.51, 0.91, 2.22, 7.86, 0.89, 1.13, 6.41, -0.03, 1.94, 0.81, 0.85, 5.56, 4.75, 0.88, 0.91, 0.91, 1.39, 0.0, 0.65]} \ No newline at end of file diff --git a/annotations_1/jCSsP6ooQf8_filtered.json b/annotations_1/jCSsP6ooQf8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1c0664fafb0575a5f426ab4f0f5d1f1d82b5c62 --- /dev/null +++ b/annotations_1/jCSsP6ooQf8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.65], [4.0, 4.82], [10.0, 11.57], [12.0, 13.53], [14.0, 34.05], [37.0, 42.82], [43.0, 56.39], [59.0, 63.91], [67.0, 72.84], [82.0, 99.86], [100.0, 100.48], [101.0, 103.62], [105.0, 120.02], [121.0, 123.04], [130.0, 139.99], [142.0, 150.96], [152.0, 162.3], [166.0, 173.15], [174.0, 174.72]], "keep_status": [false, false, false, false, true, true, true, true, false, true, false, true, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.93, 30.1, 30.09, 30.32, 30.51, 29.49, 0.0, 29.99, 29.87, 29.62, 29.99, 30.12, 30.08, 29.81, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 24.32], ["hum", 22.91], ["mains hum", 7.44]], [["speech", 39.67], ["music", 18.61], ["mains hum", 6.97]], [["speech", 38.22], ["hum", 10.57], ["music", 9.53]], [["music", 31.25], ["speech", 12.84], ["hum", 10.07]], [["throbbing", 45.17], ["hum", 40.95], ["mains hum", 8.35]], [["speech", 27.76], ["music", 25.37], ["hum", 14.02]], null, [["speech", 39.53], ["eruption", 12.26], ["explosion", 6.64]], [["music", 38.46], ["throbbing", 8.04], ["hum", 5.89]], [["throbbing", 34.64], ["music", 23.51], ["hum", 17.48]], [["speech", 34.19], ["throbbing", 21.87], ["music", 18.23]], [["speech", 42.97], ["music", 27.04], ["throbbing", 7.44]], [["music", 24.36], ["speech", 21.29], ["hum", 21.27]], [["mains hum", 37.32], ["music", 22.1], ["hum", 21.68]], null], "duration": [0.65, 0.82, 1.57, 1.53, 20.05, 5.82, 13.39, 4.91, 5.84, 17.86, 0.48, 2.62, 15.02, 2.04, 9.99, 8.96, 10.3, 7.15, 0.72]} \ No newline at end of file diff --git a/annotations_1/jCh_3SFr7M4_filtered.json b/annotations_1/jCh_3SFr7M4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00b4ca43185e7f01a4844b2f2563ee77819b6755 --- /dev/null +++ b/annotations_1/jCh_3SFr7M4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.96], [14.0, 16.92], [19.0, 25.83], [26.0, 36.05], [38.0, 45.84], [47.0, 50.77], [51.0, 52.1], [54.0, 56.47], [58.0, 63.83], [64.0, 64.22], [65.0, 65.79], [66.0, 77.95], [78.0, 81.72], [85.0, 85.94]], "keep_status": [false, true, true, true, false, true, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 35.04, 41.81, 36.14, 69.88, 34.45, 0.0, 37.18, 38.2, 0.0, 0.0, 37.98, 76.37, 0.0], "audiomae_on_audioset": [null, [["boing", 24.75], ["thunk", 22.18], ["clang", 11.52]], [["speech", 26.6], ["hum", 20.97], ["synthesizer", 11.26]], [["music", 27.49], ["throbbing", 7.61], ["thunk", 5.71]], null, [["speech", 30.08], ["music", 22.15], ["clang", 9.91]], null, [["music", 24.69], ["speech", 10.16], ["synthesizer", 6.47]], [["speech", 48.38], ["music", 6.89], ["ping", 5.59]], null, null, [["speech", 39.05], ["music", 38.2], ["musical instrument", 4.49]], null, null], "duration": [1.96, 2.92, 6.83, 10.05, 7.84, 3.77, 1.1, 2.47, 5.83, 0.22, 0.79, 11.95, 3.72, 0.94]} \ No newline at end of file diff --git a/annotations_1/jDD8IQgUPEU_filtered.json b/annotations_1/jDD8IQgUPEU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b032567901b8be5c298c520f60726c73003760b3 --- /dev/null +++ b/annotations_1/jDD8IQgUPEU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.81], [7.0, 7.82], [10.0, 11.08], [12.0, 12.48], [14.0, 14.35], [16.0, 17.04], [20.0, 20.49], [25.0, 25.86], [29.0, 29.03], [30.0, 30.62], [51.0, 52.08], [55.0, 56.02], [57.0, 63.19], [65.0, 65.45], [78.0, 78.7], [103.0, 102.71], [106.0, 105.53], [106.0, 106.66], [108.0, 108.99], [110.0, 110.24], [112.0, 113.41], [114.0, 114.67], [128.0, 128.22], [134.0, 135.78], [140.0, 143.11], [146.0, 146.67], [149.0, 149.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.64], ["quack", 3.67], ["honk", 2.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 0.82, 1.08, 0.48, 0.35, 1.04, 0.49, 0.86, 0.03, 0.62, 1.08, 1.02, 6.19, 0.45, 0.7, -0.29, -0.47, 0.66, 0.99, 0.24, 1.41, 0.67, 0.22, 1.78, 3.11, 0.67, 0.34]} \ No newline at end of file diff --git a/annotations_1/jEKFfdQEbcg_filtered.json b/annotations_1/jEKFfdQEbcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24808308a122df0233cf76e89dc3adf322ef19cf --- /dev/null +++ b/annotations_1/jEKFfdQEbcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.34], [3.0, 5.17], [7.0, 7.84], [9.0, 8.75], [11.0, 11.57], [13.0, 13.59], [15.0, 17.74], [29.0, 30.45], [35.0, 35.53], [46.0, 47.38], [48.0, 49.2], [50.0, 50.92], [53.0, 53.33], [57.0, 57.54], [62.0, 62.75], [64.0, 64.4], [65.0, 67.51], [70.0, 70.21], [71.0, 71.93], [78.0, 79.37], [80.0, 81.35], [85.0, 88.1], [91.0, 93.28], [95.0, 95.47], [97.0, 97.71], [98.0, 99.2], [102.0, 103.13], [104.0, 104.53], [105.0, 107.16], [111.0, 111.72], [116.0, 117.21], [122.0, 123.16], [123.0, 124.68], [128.0, 130.27], [134.0, 135.46], [144.0, 145.49], [146.0, 146.65], [150.0, 152.63], [154.0, 153.96], [158.0, 158.48], [160.0, 161.67], [162.0, 162.87], [164.0, 164.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 63.64, 0.0, 0.0, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.38, 0.0, 0.0, 0.0, 0.0, 92.15, 76.2, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.52, 0.0, 0.0, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 2.17, 0.84, -0.25, 0.57, 0.59, 2.74, 1.45, 0.53, 1.38, 1.2, 0.92, 0.33, 0.54, 0.75, 0.4, 2.51, 0.21, 0.93, 1.37, 1.35, 3.1, 2.28, 0.47, 0.71, 1.2, 1.13, 0.53, 2.16, 0.72, 1.21, 1.16, 1.68, 2.27, 1.46, 1.49, 0.65, 2.63, -0.04, 0.48, 1.67, 0.87, 0.07]} \ No newline at end of file diff --git a/annotations_1/jEav9DdL4iI_filtered.json b/annotations_1/jEav9DdL4iI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6dc8eb66ae81c7a5f2f7db1a9ab7b8e745127516 --- /dev/null +++ b/annotations_1/jEav9DdL4iI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.68], [38.0, 38.06], [44.0, 46.08], [51.0, 51.75], [53.0, 53.03], [54.0, 55.07], [59.0, 59.61], [64.0, 64.83], [68.0, 71.24], [71.0, 71.37], [77.0, 85.21], [104.0, 105.63], [108.0, 108.14], [116.0, 117.22], [117.0, 118.39], [119.0, 124.34], [131.0, 137.78], [138.0, 138.62], [142.0, 149.12]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false], "silence_prob": [34.2, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0, 0.0, 35.25, 0.0, 43.45, 0.0, 0.0, 0.0, 0.0, 49.31, 58.81, 0.0, 47.05], "audiomae_on_audioset": [[["speech", 67.41], ["music", 21.02], ["animal", 1.21]], null, null, null, null, null, null, null, [["music", 17.42], ["livestock, farm animals, working animals", 13.72], ["cattle, bovinae", 12.59]], null, [["hum", 37.0], ["music", 17.55], ["speech", 14.27]], null, null, null, null, [["music", 40.0], ["clip-clop", 5.01], ["horse", 4.18]], null, null, [["music", 67.52], ["speech", 4.87], ["synthesizer", 3.67]]], "duration": [2.68, 0.06, 2.08, 0.75, 0.03, 1.07, 0.61, 0.83, 3.24, 0.37, 8.21, 1.63, 0.14, 1.22, 1.39, 5.34, 6.78, 0.62, 7.12]} \ No newline at end of file diff --git a/annotations_1/jEveVtZmPu0_filtered.json b/annotations_1/jEveVtZmPu0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce73b5f57c88c8eb1fdf742e76d840e1a9ea29a1 --- /dev/null +++ b/annotations_1/jEveVtZmPu0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.75], [7.0, 8.51], [9.0, 10.12], [11.0, 12.72], [13.0, 14.34], [16.0, 25.66], [27.0, 38.82], [39.0, 43.85], [47.0, 65.26], [69.0, 69.48], [73.0, 74.02], [78.0, 78.26], [84.0, 87.44], [89.0, 92.01], [93.0, 96.23], [98.0, 99.2], [101.0, 107.69], [110.0, 114.34], [126.0, 126.69], [129.0, 131.19], [132.0, 133.39], [134.0, 134.5], [135.0, 160.56], [163.0, 165.91], [167.0, 166.94], [168.0, 168.72]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, true, true, false, false, false, true, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.78, 56.18, 38.51, 32.49, 0.0, 0.0, 0.0, 35.11, 43.38, 61.67, 0.0, 35.71, 35.32, 0.0, 48.65, 0.0, 0.0, 31.32, 31.53, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 49.76], ["livestock, farm animals, working animals", 6.62], ["sheep", 5.03]], null, [["whale vocalization", 88.98], ["music", 1.15], ["animal", 0.91]], [["music", 45.08], ["speech", 11.58], ["throbbing", 8.06]], null, null, null, [["music", 43.36], ["hum", 9.83], ["throbbing", 8.2]], [["reverberation", 12.71], ["music", 11.81], ["speech", 10.31]], null, null, [["throbbing", 31.56], ["hum", 27.38], ["music", 17.06]], [["speech", 33.43], ["music", 29.18], ["electronic music", 1.85]], null, [["music", 47.43], ["foghorn", 22.69], ["theremin", 5.74]], null, null, [["fly, housefly", 23.85], ["music", 21.4], ["insect", 15.0]], [["speech", 40.04], ["music", 16.03], ["sidetone", 6.84]], null, null], "duration": [-0.25, 1.51, 1.12, 1.72, 1.34, 9.66, 11.82, 4.85, 18.26, 0.48, 1.02, 0.26, 3.44, 3.01, 3.23, 1.2, 6.69, 4.34, 0.69, 2.19, 1.39, 0.5, 25.56, 2.91, -0.06, 0.72]} \ No newline at end of file diff --git a/annotations_1/jF6JN1VSpmY_filtered.json b/annotations_1/jF6JN1VSpmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e54551c482fb1f1b6fe1911a86d5ac21b694e13a --- /dev/null +++ b/annotations_1/jF6JN1VSpmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.15], [20.0, 21.69], [24.0, 25.22], [35.0, 35.36], [36.0, 36.19], [38.0, 38.58], [42.0, 43.85], [45.0, 47.41], [48.0, 49.47], [50.0, 52.54], [53.0, 64.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.69, 0.0, 90.25, 58.22], "audiomae_on_audioset": [[["music", 57.27], ["throbbing", 15.5], ["hum", 9.28]], null, null, null, null, null, null, [["breaking", 55.99], ["music", 29.31], ["speech", 2.07]], null, null, null], "duration": [3.15, 1.69, 1.22, 0.36, 0.19, 0.58, 1.85, 2.41, 1.47, 2.54, 11.25]} \ No newline at end of file diff --git a/annotations_1/jFQAy28o7Kc_filtered.json b/annotations_1/jFQAy28o7Kc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca7ba27312c346524df4996869f587354c214b78 --- /dev/null +++ b/annotations_1/jFQAy28o7Kc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.45], [30.0, 29.93], [34.0, 36.0], [45.0, 44.79], [49.0, 49.18], [50.0, 59.58], [62.0, 78.92], [81.0, 91.96], [93.0, 93.83], [95.0, 95.12], [96.0, 96.03], [104.0, 104.79], [105.0, 107.2], [108.0, 108.36], [111.0, 110.86], [111.0, 111.82]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 47.66, 0.0, 0.0, 30.15, 29.41, 30.71, 0.0, 0.0, 0.0, 0.0, 43.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 17.48], ["music", 17.15], ["throbbing", 16.27]], null, null, [["speech", 45.19], ["music", 35.56], ["musical instrument", 2.39]], [["cattle, bovinae", 32.99], ["livestock, farm animals, working animals", 27.98], ["moo", 16.69]], [["music", 69.87], ["whack, thwack", 3.44], ["sound effect", 3.29]], null, null, null, null, [["sidetone", 18.46], ["hum", 15.44], ["speech", 12.77]], null, null, null], "duration": [0.45, -0.07, 2.0, -0.21, 0.18, 9.58, 16.92, 10.96, 0.83, 0.12, 0.03, 0.79, 2.2, 0.36, -0.14, 0.82]} \ No newline at end of file diff --git a/annotations_1/jFQUE_6Zhn0_filtered.json b/annotations_1/jFQUE_6Zhn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b368b2eb4f5ee9602530c46ea16f0e3e17c8589 --- /dev/null +++ b/annotations_1/jFQUE_6Zhn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.71], [7.0, 9.27], [10.0, 39.8], [41.0, 42.5], [51.0, 54.09], [62.0, 67.63], [75.0, 88.53], [91.0, 135.53], [137.0, 143.92], [146.0, 155.41]], "keep_status": [false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 40.26, 32.08, 0.0, 39.3, 53.59, 36.84, 0.0, 29.64, 29.78], "audiomae_on_audioset": [null, [["music", 54.16], ["theremin", 18.29], ["didgeridoo", 4.04]], [["music", 42.43], ["theremin", 17.18], ["hum", 7.79]], null, [["whale vocalization", 85.31], ["stomach rumble", 4.84], ["liquid", 1.31]], null, [["music", 59.0], ["didgeridoo", 8.92], ["speech", 5.05]], null, [["throbbing", 31.1], ["music", 22.97], ["hum", 18.71]], [["music", 30.36], ["animal", 4.84], ["throbbing", 4.21]]], "duration": [0.71, 2.27, 29.8, 1.5, 3.09, 5.63, 13.53, 44.53, 6.92, 9.41]} \ No newline at end of file diff --git a/annotations_1/jFWnVdsSgxs_filtered.json b/annotations_1/jFWnVdsSgxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8777c4841dc462eebc7e536c946847b87ba6111 --- /dev/null +++ b/annotations_1/jFWnVdsSgxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 28.61], [29.0, 36.17], [38.0, 41.12], [44.0, 45.52], [47.0, 47.92], [49.0, 56.47], [59.0, 66.51], [69.0, 76.77], [83.0, 86.49], [98.0, 126.3], [129.0, 142.25], [145.0, 145.62], [147.0, 154.14], [155.0, 196.97]], "keep_status": [false, false, true, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [33.0, 31.48, 30.87, 0.0, 0.0, 33.09, 31.73, 32.97, 33.08, 30.76, 31.39, 0.0, 31.86, 0.0], "audiomae_on_audioset": [[["hum", 44.34], ["music", 22.87], ["mains hum", 8.44]], [["hum", 37.56], ["throbbing", 22.85], ["music", 17.65]], [["music", 43.0], ["boing", 9.76], ["hum", 9.72]], null, null, [["music", 23.62], ["didgeridoo", 14.05], ["sound effect", 9.57]], [["music", 52.69], ["hum", 11.34], ["throbbing", 5.25]], [["music", 49.38], ["speech", 19.59], ["throbbing", 5.85]], [["music", 48.91], ["didgeridoo", 19.49], ["singing", 4.11]], [["music", 71.04], ["house music", 4.66], ["electronic music", 3.81]], [["music", 63.44], ["throbbing", 4.91], ["electronic music", 4.31]], null, [["music", 63.79], ["house music", 4.03], ["synthetic singing", 3.71]], null], "duration": [14.61, 7.17, 3.12, 1.52, 0.92, 7.47, 7.51, 7.77, 3.49, 28.3, 13.25, 0.62, 7.14, 41.97]} \ No newline at end of file diff --git a/annotations_1/jFjy1RkmXUg_filtered.json b/annotations_1/jFjy1RkmXUg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca9d2233ffcb7bc4ce185c967bc2eadd7c24aa02 --- /dev/null +++ b/annotations_1/jFjy1RkmXUg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.71], [8.0, 8.24], [13.0, 13.73], [18.0, 19.52], [23.0, 24.12], [26.0, 26.69], [30.0, 29.83], [32.0, 32.34], [34.0, 35.6], [37.0, 38.89], [40.0, 40.63], [43.0, 43.9], [49.0, 49.27], [59.0, 60.05], [62.0, 64.5], [67.0, 67.76], [69.0, 69.85], [84.0, 92.84], [100.0, 99.72], [102.0, 106.57], [107.0, 108.63], [110.0, 110.62], [113.0, 113.39], [119.0, 121.19], [127.0, 128.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.98, 0.0, 0.0, 29.07, 0.0, 29.43, 0.0, 0.0, 0.0, 29.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.89], ["livestock, farm animals, working animals", 15.1], ["cattle, bovinae", 12.49]], null, [["music", 54.11], ["choir", 17.04], ["singing", 8.99]], null, null, null, [["music", 30.85], ["electric shaver, electric razor", 13.55], ["buzzer", 10.11]], null], "duration": [1.71, 0.24, 0.73, 1.52, 1.12, 0.69, -0.17, 0.34, 1.6, 1.89, 0.63, 0.9, 0.27, 1.05, 2.5, 0.76, 0.85, 8.84, -0.28, 4.57, 1.63, 0.62, 0.39, 2.19, 1.26]} \ No newline at end of file diff --git a/annotations_1/jG7W6jwCSd0_filtered.json b/annotations_1/jG7W6jwCSd0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86f822eef418d43f4851bb76647d93a075ccdbf5 --- /dev/null +++ b/annotations_1/jG7W6jwCSd0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.25], [11.0, 19.82], [21.0, 23.45], [25.0, 26.94], [31.0, 34.1], [36.0, 37.83], [40.0, 41.32], [46.0, 46.2], [47.0, 46.7], [47.0, 48.63], [50.0, 55.7], [57.0, 59.07], [59.0, 60.74], [68.0, 69.09], [74.0, 83.0], [85.0, 85.89], [90.0, 90.54], [93.0, 94.17]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.35, 36.7, 0.0, 35.66, 0.0, 0.0, 0.0, 0.0, 0.0, 33.18, 32.24, 0.0, 0.0, 32.55, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 65.86], ["guitar", 4.24], ["speech", 3.94]], [["music", 51.41], ["guitar", 6.21], ["bass guitar", 5.88]], null, [["music", 65.69], ["guitar", 8.09], ["musical instrument", 6.93]], null, null, null, null, null, [["music", 72.5], ["guitar", 2.75], ["singing", 2.63]], [["music", 70.29], ["musical instrument", 4.03], ["plucked string instrument", 2.76]], null, null, [["music", 81.8], ["singing", 2.14], ["folk music", 1.64]], null, null, null], "duration": [0.25, 8.82, 2.45, 1.94, 3.1, 1.83, 1.32, 0.2, -0.3, 1.63, 5.7, 2.07, 1.74, 1.09, 9.0, 0.89, 0.54, 1.17]} \ No newline at end of file diff --git a/annotations_1/jGXpyMDIZ_U_filtered.json b/annotations_1/jGXpyMDIZ_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3fcb5c1caff429d00155f03d181a25b145a649b --- /dev/null +++ b/annotations_1/jGXpyMDIZ_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.26], [15.0, 16.07], [20.0, 22.25], [24.0, 24.11], [26.0, 26.86], [30.0, 31.11], [32.0, 32.51], [35.0, 35.7], [37.0, 37.67], [39.0, 39.33], [41.0, 48.17], [50.0, 52.86], [54.0, 56.94], [58.0, 59.37], [61.0, 63.14], [67.0, 69.03], [70.0, 74.55], [76.0, 83.32], [87.0, 92.5], [97.0, 100.65], [101.0, 100.72], [101.0, 107.16], [108.0, 111.72], [112.0, 112.31], [112.0, 115.75], [118.0, 134.86], [137.0, 138.52], [140.0, 141.27], [143.0, 144.12], [148.0, 149.54], [156.0, 157.84], [160.0, 161.69], [162.0, 163.07], [167.0, 168.27], [171.0, 172.67], [174.0, 177.53], [178.0, 181.68], [187.0, 190.09], [193.0, 195.49], [200.0, 202.36], [203.0, 206.59], [212.0, 212.97], [219.0, 221.93], [224.0, 225.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.31, 82.25, 78.21, 0.0, 91.47, 64.41, 55.46, 48.82, 28.38, 28.04, 0.0, 29.43, 30.39, 0.0, 30.49, 32.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 47.7, 49.78, 51.71, 66.88, 83.16, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["sidetone", 81.77], ["speech", 12.99], ["music", 1.2]], null, null, null, null, null, null, [["speech", 43.26], ["music", 25.3], ["didgeridoo", 5.16]], [["speech", 69.68], ["fart", 6.78], ["music", 4.66]], [["speech", 24.64], ["mains hum", 12.92], ["hum", 6.3]], null, [["breaking", 33.72], ["whack, thwack", 14.14], ["fart", 5.04]], [["frog", 39.47], ["fart", 7.74], ["croak", 6.27]], null, [["fart", 39.0], ["didgeridoo", 23.29], ["theremin", 5.55]], [["sound effect", 10.12], ["fart", 9.5], ["boing", 9.47]], null, null, null, null, null, null, null, null, null, null, [["speech", 77.91], ["telephone bell ringing", 6.61], ["music", 2.96]], [["dog", 46.04], ["animal", 11.68], ["domestic animals, pets", 10.97]], null, null, null, null, null, null], "duration": [2.26, 1.07, 2.25, 0.11, 0.86, 1.11, 0.51, 0.7, 0.67, 0.33, 7.17, 2.86, 2.94, 1.37, 2.14, 2.03, 4.55, 7.32, 5.5, 3.65, -0.28, 6.16, 3.72, 0.31, 3.75, 16.86, 1.52, 1.27, 1.12, 1.54, 1.84, 1.69, 1.07, 1.27, 1.67, 3.53, 3.68, 3.09, 2.49, 2.36, 3.59, 0.97, 2.93, 1.58]} \ No newline at end of file diff --git a/annotations_1/jH07BdMRP0g_filtered.json b/annotations_1/jH07BdMRP0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..892a93006bf2c2bf259876b4b7efc45f63768042 --- /dev/null +++ b/annotations_1/jH07BdMRP0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.67], [31.0, 32.83], [43.0, 45.1], [55.0, 55.26], [58.0, 58.41], [62.0, 61.92], [64.0, 64.59], [73.0, 73.13], [85.0, 90.39], [94.0, 95.44], [98.0, 99.52], [111.0, 111.3], [123.0, 129.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.4, 0.0, 0.0, 0.0, 0.0, 0.0, 44.34, 0.0, 0.0, 0.0, 47.58], "audiomae_on_audioset": [null, null, [["music", 71.65], ["drip", 2.31], ["whale vocalization", 2.24]], null, null, null, null, null, [["music", 61.78], ["electronic music", 7.06], ["throbbing", 5.36]], null, null, null, [["music", 73.98], ["speech", 3.84], ["musical instrument", 2.0]]], "duration": [1.67, 1.83, 2.1, 0.26, 0.41, -0.08, 0.59, 0.13, 5.39, 1.44, 1.52, 0.3, 6.73]} \ No newline at end of file diff --git a/annotations_1/jJ8rgMkWFWA_filtered.json b/annotations_1/jJ8rgMkWFWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da17b7d982c26870d72e108732cab7ebeace005d --- /dev/null +++ b/annotations_1/jJ8rgMkWFWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [5.0, 7.6], [10.0, 10.25], [15.0, 15.52], [21.0, 21.69], [23.0, 23.08], [24.0, 24.75], [26.0, 26.49], [28.0, 28.09], [30.0, 30.45], [37.0, 38.75], [39.0, 41.15], [42.0, 45.1], [47.0, 49.44], [50.0, 51.36], [55.0, 55.48], [57.0, 57.4], [61.0, 62.61], [68.0, 84.13], [86.0, 102.84], [103.0, 105.71], [106.0, 109.59], [110.0, 111.11], [113.0, 114.02], [115.0, 114.99], [118.0, 120.53], [126.0, 126.32], [129.0, 130.03], [132.0, 132.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.17, 32.12, 32.07, 0.0, 0.0, 0.0, 0.0, 47.12, 60.05, 58.13, 54.04, 0.0, 0.0, 0.0, 36.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.71], ["fly, housefly", 6.17], ["sidetone", 5.95]], [["cattle, bovinae", 35.48], ["moo", 34.76], ["livestock, farm animals, working animals", 29.23]], null, null, null, null, [["music", 47.74], ["trombone", 17.1], ["brass instrument", 12.59]], null, null, null, null, null, null, [["speech", 79.08], ["sidetone", 14.75], ["radio", 2.31]], null, null, null], "duration": [1.42, 2.6, 0.25, 0.52, 0.69, 0.08, 0.75, 0.49, 0.09, 0.45, 1.75, 2.15, 3.1, 2.44, 1.36, 0.48, 0.4, 1.61, 16.13, 16.84, 2.71, 3.59, 1.11, 1.02, -0.01, 2.53, 0.32, 1.03, 0.87]} \ No newline at end of file diff --git a/annotations_1/jJvvT_Sb0jo_filtered.json b/annotations_1/jJvvT_Sb0jo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf8dffa56a8a1f9a7bf55f22b0ea4cdd9827f33d --- /dev/null +++ b/annotations_1/jJvvT_Sb0jo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.51], [19.0, 19.82], [20.0, 22.3], [23.0, 25.07], [27.0, 30.3], [35.0, 36.64], [40.0, 40.83], [45.0, 45.39], [62.0, 61.72], [62.0, 68.28], [71.0, 72.4], [75.0, 75.34], [79.0, 80.28], [86.0, 88.06], [90.0, 100.74], [102.0, 111.5], [113.0, 113.58], [120.0, 121.07], [125.0, 126.33], [128.0, 127.72], [136.0, 136.8], [140.0, 148.49], [150.0, 152.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 93.91, 96.17, 59.86, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 0.0, 0.0, 59.07, 41.87, 42.22, 0.0, 0.0, 0.0, 0.0, 0.0, 33.26, 37.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.07], ["hum", 17.51], ["music", 11.26]], [["music", 36.37], ["burping, eructation", 14.79], ["fart", 11.76]], null, null, null, null, null, [["hum", 24.41], ["music", 23.24], ["mains hum", 16.38]], [["music", 28.88], ["mains hum", 25.15], ["hum", 19.68]]], "duration": [1.51, 0.82, 2.3, 2.07, 3.3, 1.64, 0.83, 0.39, -0.28, 6.28, 1.4, 0.34, 1.28, 2.06, 10.74, 9.5, 0.58, 1.07, 1.33, -0.28, 0.8, 8.49, 2.36]} \ No newline at end of file diff --git a/annotations_1/jKIG_-544gY_filtered.json b/annotations_1/jKIG_-544gY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad6fd9969664938e1a9783d343fd7f14a8d2edbf --- /dev/null +++ b/annotations_1/jKIG_-544gY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.55], [20.0, 38.42], [40.0, 46.3], [55.0, 67.37], [68.0, 68.34], [70.0, 70.58], [72.0, 84.57], [86.0, 89.02], [92.0, 92.75], [95.0, 95.66], [96.0, 103.71], [105.0, 107.08], [109.0, 121.37], [123.0, 123.45], [125.0, 124.87], [126.0, 127.23], [130.0, 130.01], [131.0, 131.48], [132.0, 134.25], [135.0, 135.19], [138.0, 139.16], [142.0, 150.15], [150.0, 150.94], [151.0, 156.24], [158.0, 158.5], [159.0, 165.7], [168.0, 169.33]], "keep_status": [false, false, true, true, false, false, true, true, false, false, false, true, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 37.07, 35.13, 32.85, 0.0, 0.0, 30.31, 34.05, 0.0, 0.0, 33.02, 36.47, 29.55, 0.0, 0.0, 0.0, 0.0, 0.0, 30.87, 0.0, 0.0, 29.33, 0.0, 30.64, 0.0, 31.13, 0.0], "audiomae_on_audioset": [null, [["hum", 30.15], ["music", 25.72], ["mains hum", 18.78]], [["music", 40.1], ["didgeridoo", 6.89], ["speech", 4.09]], [["speech", 44.44], ["fart", 11.59], ["animal", 6.81]], null, null, [["speech", 24.91], ["fart", 14.64], ["music", 12.95]], [["music", 47.81], ["theremin", 4.65], ["musical instrument", 3.97]], null, null, [["fly, housefly", 49.4], ["fart", 21.92], ["insect", 13.92]], [["music", 31.2], ["hum", 7.4], ["mains hum", 6.44]], [["speech", 34.41], ["music", 10.23], ["groan", 10.07]], null, null, null, null, null, [["vehicle", 29.93], ["boat, water vehicle", 15.39], ["motorboat, speedboat", 9.95]], null, null, [["music", 34.47], ["speech", 21.11], ["rumble", 7.41]], null, [["music", 55.28], ["speech", 21.34], ["didgeridoo", 5.59]], null, [["music", 45.14], ["foghorn", 20.15], ["fly, housefly", 5.52]], null], "duration": [1.55, 18.42, 6.3, 12.37, 0.34, 0.58, 12.57, 3.02, 0.75, 0.66, 7.71, 2.08, 12.37, 0.45, -0.13, 1.23, 0.01, 0.48, 2.25, 0.19, 1.16, 8.15, 0.94, 5.24, 0.5, 6.7, 1.33]} \ No newline at end of file diff --git a/annotations_1/jL6rrLaw6rc_filtered.json b/annotations_1/jL6rrLaw6rc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13c2923b02724eeea9a062ad0698bb2da3482a54 --- /dev/null +++ b/annotations_1/jL6rrLaw6rc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.19], [9.0, 17.96], [18.0, 33.56], [37.0, 38.55], [42.0, 41.99], [48.0, 48.63], [50.0, 65.82], [67.0, 69.4], [72.0, 74.02], [75.0, 90.29], [91.0, 92.2], [93.0, 93.39], [94.0, 103.77], [104.0, 140.68], [142.0, 142.69], [146.0, 155.7], [158.0, 163.78], [165.0, 170.77]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.66, 45.85, 0.0, 0.0, 0.0, 54.7, 92.64, 92.15, 77.87, 0.0, 0.0, 59.68, 0.0, 0.0, 46.12, 72.01, 85.17], "audiomae_on_audioset": [null, [["hum", 29.69], ["music", 25.01], ["throbbing", 24.92]], [["music", 20.3], ["speech", 13.84], ["theremin", 9.75]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 58.43], ["ambient music", 11.64], ["hum", 3.28]], null, null], "duration": [1.19, 8.96, 15.56, 1.55, -0.01, 0.63, 15.82, 2.4, 2.02, 15.29, 1.2, 0.39, 9.77, 36.68, 0.69, 9.7, 5.78, 5.77]} \ No newline at end of file diff --git a/annotations_1/jME-000LFNY_filtered.json b/annotations_1/jME-000LFNY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3541c4d182678a39960ba598cae60b009e0ea8dc --- /dev/null +++ b/annotations_1/jME-000LFNY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.26], [16.0, 16.93], [32.0, 32.24], [36.0, 36.8], [54.0, 56.64], [63.0, 63.76], [67.0, 73.31], [77.0, 77.67], [92.0, 91.98], [93.0, 93.97]], "keep_status": [false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.15, 0.0, 34.77, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 49.93], ["speech", 6.94], ["didgeridoo", 2.72]], null, [["music", 37.41], ["throbbing", 21.56], ["fly, housefly", 11.19]], null, null, null], "duration": [0.26, 0.93, 0.24, 0.8, 2.64, 0.76, 6.31, 0.67, -0.02, 0.97]} \ No newline at end of file diff --git a/annotations_1/jMqI9UV3ob4_filtered.json b/annotations_1/jMqI9UV3ob4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dde8352a3d7c2b391137190cd8395e7b61552b9a --- /dev/null +++ b/annotations_1/jMqI9UV3ob4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.64], [20.0, 21.91], [22.0, 22.62], [23.0, 23.9], [27.0, 26.76], [32.0, 33.67], [36.0, 36.61], [37.0, 37.45], [39.0, 42.57], [47.0, 46.9], [48.0, 48.66], [53.0, 53.59], [55.0, 55.29], [61.0, 60.79]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.29, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["whale vocalization", 19.19], ["sidetone", 15.25], ["frog", 7.67]], null, null, null, null, null], "duration": [0.64, 1.91, 0.62, 0.9, -0.24, 1.67, 0.61, 0.45, 3.57, -0.1, 0.66, 0.59, 0.29, -0.21]} \ No newline at end of file diff --git a/annotations_1/jMvR4K4QICQ_filtered.json b/annotations_1/jMvR4K4QICQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..028dd8f5d45776bf20914352031c38965bc2d84b --- /dev/null +++ b/annotations_1/jMvR4K4QICQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 15.42], [17.0, 27.82], [32.0, 33.37], [35.0, 38.6], [41.0, 43.41], [44.0, 44.98], [46.0, 51.73], [52.0, 52.89], [54.0, 55.14], [56.0, 57.89], [59.0, 59.73], [60.0, 63.59], [65.0, 121.66], [123.0, 123.48], [126.0, 144.96], [146.0, 164.74], [165.0, 165.18]], "keep_status": [false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.77, 38.76, 0.0, 33.3, 44.96, 0.0, 28.71, 0.0, 0.0, 0.0, 0.0, 29.98, 0.0, 0.0, 28.52, 28.57, 0.0], "audiomae_on_audioset": [[["music", 40.88], ["hum", 27.09], ["throbbing", 13.31]], [["music", 69.3], ["hum", 2.72], ["scary music", 2.51]], null, [["music", 26.97], ["hum", 20.43], ["shuffling cards", 11.84]], [["music", 38.77], ["hum", 14.81], ["mains hum", 8.52]], null, [["music", 44.1], ["speech", 6.46], ["whack, thwack", 5.6]], null, null, null, null, [["speech", 50.42], ["music", 16.33], ["sidetone", 8.17]], null, null, [["music", 69.09], ["speech", 5.37], ["electric shaver, electric razor", 4.88]], [["music", 62.65], ["groan", 7.11], ["whack, thwack", 5.32]], null], "duration": [14.42, 10.82, 1.37, 3.6, 2.41, 0.98, 5.73, 0.89, 1.14, 1.89, 0.73, 3.59, 56.66, 0.48, 18.96, 18.74, 0.18]} \ No newline at end of file diff --git a/annotations_1/jMxYv05A7B0_filtered.json b/annotations_1/jMxYv05A7B0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de058c46c4b965c95ee0b186877a1af5bedee7da --- /dev/null +++ b/annotations_1/jMxYv05A7B0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.8], [6.0, 6.57], [11.0, 12.99], [17.0, 17.58], [18.0, 18.17], [27.0, 27.04], [35.0, 36.26], [38.0, 38.33], [41.0, 41.05], [51.0, 51.41], [66.0, 66.82], [73.0, 73.84], [76.0, 77.19], [78.0, 81.16], [84.0, 85.45], [86.0, 87.24], [88.0, 89.61], [91.0, 91.1], [91.0, 92.94], [96.0, 96.7], [97.0, 98.41], [105.0, 105.87], [114.0, 115.25], [119.0, 120.38], [121.0, 122.98], [124.0, 125.76], [127.0, 130.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 0.57, 1.99, 0.58, 0.17, 0.04, 1.26, 0.33, 0.05, 0.41, 0.82, 0.84, 1.19, 3.16, 1.45, 1.24, 1.61, 0.1, 1.94, 0.7, 1.41, 0.87, 1.25, 1.38, 1.98, 1.76, 3.82]} \ No newline at end of file diff --git a/annotations_1/jNNX5a8ogr8_filtered.json b/annotations_1/jNNX5a8ogr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92c9efe97be7af0e7560818d3b215f2efeb40460 --- /dev/null +++ b/annotations_1/jNNX5a8ogr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 64.56], [66.0, 95.99], [100.0, 105.33], [109.0, 111.81], [114.0, 116.87], [120.0, 121.91], [123.0, 129.07], [130.0, 140.95], [146.0, 149.17], [151.0, 163.14], [164.0, 165.96], [168.0, 168.62], [169.0, 171.68]], "keep_status": [false, false, true, false, true, false, true, false, true, true, false, false, true], "silence_prob": [0.0, 32.37, 42.22, 59.68, 45.95, 0.0, 38.62, 36.18, 34.82, 34.48, 0.0, 0.0, 48.06], "audiomae_on_audioset": [null, [["music", 79.73], ["theremin", 8.76], ["musical instrument", 1.07]], [["music", 45.62], ["theremin", 9.62], ["hum", 6.41]], null, [["music", 41.91], ["synthesizer", 9.58], ["didgeridoo", 8.31]], null, [["music", 43.6], ["electronic music", 12.8], ["whale vocalization", 8.75]], [["theremin", 62.29], ["music", 19.73], ["musical instrument", 2.53]], [["music", 26.85], ["ambient music", 16.39], ["gong", 11.4]], [["music", 28.85], ["ambient music", 22.98], ["hum", 11.04]], null, null, [["music", 45.32], ["electronic music", 11.82], ["ambient music", 7.14]]], "duration": [44.56, 29.99, 5.33, 2.81, 2.87, 1.91, 6.07, 10.95, 3.17, 12.14, 1.96, 0.62, 2.68]} \ No newline at end of file diff --git a/annotations_1/jNPBfvcLIMs_filtered.json b/annotations_1/jNPBfvcLIMs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0948bac0984dde69213be175659afe14ed36a7e2 --- /dev/null +++ b/annotations_1/jNPBfvcLIMs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [5.0, 6.29], [12.0, 15.38], [16.0, 29.2], [31.0, 39.78], [42.0, 58.65], [59.0, 62.5], [64.0, 102.51], [103.0, 103.98], [108.0, 117.31], [119.0, 120.66]], "keep_status": [false, false, true, true, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 28.02, 28.37, 31.79, 28.68, 28.73, 0.0, 0.0, 28.35, 0.0], "audiomae_on_audioset": [null, null, [["music", 59.35], ["sound effect", 3.34], ["boom", 2.56]], [["music", 55.11], ["sound effect", 6.88], ["hum", 3.5]], [["throbbing", 40.15], ["hum", 22.53], ["mains hum", 19.03]], [["music", 40.94], ["hum", 7.51], ["mains hum", 6.41]], [["fly, housefly", 22.08], ["speech", 14.54], ["insect", 11.49]], null, null, [["hum", 25.79], ["mains hum", 16.15], ["music", 14.08]], null], "duration": [1.05, 1.29, 3.38, 13.2, 8.78, 16.65, 3.5, 38.51, 0.98, 9.31, 1.66]} \ No newline at end of file diff --git a/annotations_1/jPH8I5QWFUU_filtered.json b/annotations_1/jPH8I5QWFUU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54c130451b48ba9ab3abb8c10f5bdf3901d9cb6a --- /dev/null +++ b/annotations_1/jPH8I5QWFUU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 25.91], [26.0, 28.58], [31.0, 34.32], [35.0, 35.63], [36.0, 54.28], [56.0, 56.44], [65.0, 72.71], [75.0, 75.54], [79.0, 94.66]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [40.93, 58.64, 52.86, 0.0, 33.4, 0.0, 36.87, 0.0, 39.12], "audiomae_on_audioset": [[["music", 68.97], ["synthesizer", 4.01], ["musical instrument", 3.25]], null, null, null, [["music", 57.98], ["hum", 11.29], ["rumble", 4.96]], null, [["hum", 36.59], ["mains hum", 29.48], ["music", 13.1]], null, [["music", 74.67], ["musical instrument", 3.37], ["synthesizer", 2.78]]], "duration": [2.91, 2.58, 3.32, 0.63, 18.28, 0.44, 7.71, 0.54, 15.66]} \ No newline at end of file diff --git a/annotations_1/jPRiyRmsLBo_filtered.json b/annotations_1/jPRiyRmsLBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..988571a8317384a7efa81a4e5b98f2f9dae06807 --- /dev/null +++ b/annotations_1/jPRiyRmsLBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [4.0, 4.19], [6.0, 6.59], [8.0, 8.24], [11.0, 13.02], [13.0, 15.18], [17.0, 19.48], [20.0, 20.56], [24.0, 24.81], [26.0, 26.49], [31.0, 31.46], [35.0, 35.92], [37.0, 41.03], [42.0, 47.16], [49.0, 50.58], [52.0, 52.69], [56.0, 56.94], [60.0, 61.28], [65.0, 66.06], [69.0, 69.16], [71.0, 72.22], [74.0, 75.05], [76.0, 77.16], [82.0, 82.98], [85.0, 86.02], [87.0, 88.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.0, 57.81, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 41.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 83.75], ["telephone", 5.7], ["radio", 1.96]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 0.19, 0.59, 0.24, 2.02, 2.18, 2.48, 0.56, 0.81, 0.49, 0.46, 0.92, 4.03, 5.16, 1.58, 0.69, 0.94, 1.28, 1.06, 0.16, 1.22, 1.05, 1.16, 0.98, 1.02, 1.06]} \ No newline at end of file diff --git a/annotations_1/jPfje0jZeMo_filtered.json b/annotations_1/jPfje0jZeMo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73211c8aa9bc414532e4e3706cd8e01de75eb7c6 --- /dev/null +++ b/annotations_1/jPfje0jZeMo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.97], [8.0, 9.63], [22.0, 24.75], [32.0, 32.97], [42.0, 57.23], [59.0, 64.69], [66.0, 66.26], [67.0, 67.98], [70.0, 70.19], [72.0, 72.57], [77.0, 77.63], [79.0, 81.09], [88.0, 89.19], [93.0, 102.66], [106.0, 106.42], [108.0, 108.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 48.31, 0.0, 41.3, 55.67, 0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 33.12, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 60.92], ["synthesizer", 11.63], ["musical instrument", 4.19]], null, [["music", 62.0], ["musical instrument", 8.8], ["theremin", 7.0]], null, null, null, null, null, null, null, null, [["music", 62.76], ["breaking", 5.97], ["speech", 5.88]], null, null], "duration": [1.97, 1.63, 2.75, 0.97, 15.23, 5.69, 0.26, 0.98, 0.19, 0.57, 0.63, 2.09, 1.19, 9.66, 0.42, 0.65]} \ No newline at end of file diff --git a/annotations_1/jPgV4d4ZmZo_filtered.json b/annotations_1/jPgV4d4ZmZo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3be9d245f41585fd9a23887ddd0d6b36e34075d6 --- /dev/null +++ b/annotations_1/jPgV4d4ZmZo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.65], [10.0, 10.86], [13.0, 14.15], [22.0, 24.36], [26.0, 26.77], [28.0, 28.88], [31.0, 31.23], [36.0, 36.61], [37.0, 37.72], [40.0, 39.92], [42.0, 43.43], [44.0, 44.37], [45.0, 52.86], [54.0, 55.44], [57.0, 57.79], [59.0, 61.38], [68.0, 69.2], [72.0, 73.57], [77.0, 78.06], [82.0, 82.46], [93.0, 96.06], [102.0, 101.68], [103.0, 103.45], [112.0, 112.7], [114.0, 115.13], [121.0, 121.09], [125.0, 125.76], [126.0, 127.03], [128.0, 128.56], [130.0, 130.98], [132.0, 132.83], [133.0, 134.25], [136.0, 137.79], [138.0, 140.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.65, 0.86, 1.15, 2.36, 0.77, 0.88, 0.23, 0.61, 0.72, -0.08, 1.43, 0.37, 7.86, 1.44, 0.79, 2.38, 1.2, 1.57, 1.06, 0.46, 3.06, -0.32, 0.45, 0.7, 1.13, 0.09, 0.76, 1.03, 0.56, 0.98, 0.83, 1.25, 1.79, 2.17]} \ No newline at end of file diff --git a/annotations_1/jQp4IlURoNg_filtered.json b/annotations_1/jQp4IlURoNg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00880e19c37de5037bf98b5c3b53303387b3046b --- /dev/null +++ b/annotations_1/jQp4IlURoNg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 29.0], [40.0, 41.4], [44.0, 45.67], [56.0, 62.8], [65.0, 86.58], [94.0, 94.83], [96.0, 97.28], [100.0, 100.7], [102.0, 102.52], [104.0, 107.0], [116.0, 117.49], [125.0, 129.37], [133.0, 133.07]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [30.49, 0.0, 0.0, 31.84, 30.53, 0.0, 0.0, 0.0, 0.0, 33.04, 0.0, 37.33, 0.0], "audiomae_on_audioset": [[["music", 62.85], ["throbbing", 10.5], ["electronic music", 5.59]], null, null, [["music", 48.83], ["speech", 19.63], ["throbbing", 5.34]], [["music", 43.37], ["speech", 34.86], ["electronic music", 5.45]], null, null, null, null, [["music", 29.4], ["hum", 16.64], ["mains hum", 15.02]], null, [["moo", 42.93], ["cattle, bovinae", 29.04], ["livestock, farm animals, working animals", 13.68]], null], "duration": [22.0, 1.4, 1.67, 6.8, 21.58, 0.83, 1.28, 0.7, 0.52, 3.0, 1.49, 4.37, 0.07]} \ No newline at end of file diff --git a/annotations_1/jRSw_0zpNE8_filtered.json b/annotations_1/jRSw_0zpNE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae19ef4154956fc906428e188392ece9745e6568 --- /dev/null +++ b/annotations_1/jRSw_0zpNE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.77], [5.0, 5.49], [6.0, 8.46], [9.0, 11.94], [13.0, 16.48], [17.0, 21.63], [22.0, 22.47], [23.0, 31.56], [33.0, 34.53], [36.0, 38.25], [40.0, 41.76], [43.0, 43.9], [45.0, 48.96], [50.0, 52.1], [54.0, 56.51], [57.0, 67.39], [71.0, 76.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 99.71, 100.0, 82.79, 100.0, 0.0, 99.84, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 76.2, 90.95, 49.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.24], ["singing bowl", 14.14], ["mains hum", 13.12]]], "duration": [0.77, 0.49, 2.46, 2.94, 3.48, 4.63, 0.47, 8.56, 1.53, 2.25, 1.76, 0.9, 3.96, 2.1, 2.51, 10.39, 5.5]} \ No newline at end of file diff --git a/annotations_1/jR_kxdUm1bc_filtered.json b/annotations_1/jR_kxdUm1bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a84a86042a3e6eeb1b9169052e89bb4c991ff4f6 --- /dev/null +++ b/annotations_1/jR_kxdUm1bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 40.73], [41.0, 41.44], [41.0, 70.55], [73.0, 77.8], [79.0, 79.61], [80.0, 81.36], [82.0, 82.8]], "keep_status": [false, false, true, false, false, false, false], "silence_prob": [30.67, 0.0, 30.8, 31.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.34], ["speech", 18.11], ["electronic music", 5.56]], null, [["hum", 18.48], ["music", 15.08], ["mains hum", 14.58]], [["music", 42.16], ["sidetone", 30.68], ["speech", 7.69]], null, null, null], "duration": [22.73, 0.44, 29.55, 4.8, 0.61, 1.36, 0.8]} \ No newline at end of file diff --git a/annotations_1/jSnvLrw4YR0_filtered.json b/annotations_1/jSnvLrw4YR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54dbf40ec48cd467c882ffc7dc2c1e2be1060b4c --- /dev/null +++ b/annotations_1/jSnvLrw4YR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.51], [8.0, 9.32], [12.0, 12.58], [17.0, 18.86], [33.0, 34.45], [36.0, 36.86], [42.0, 41.77], [48.0, 49.4], [52.0, 51.85], [56.0, 56.56], [65.0, 65.6], [70.0, 69.97], [73.0, 75.57], [77.0, 77.45], [79.0, 79.61], [80.0, 81.43], [83.0, 83.19], [85.0, 84.82], [92.0, 91.62], [96.0, 96.3], [102.0, 102.02], [103.0, 104.13], [107.0, 108.31], [110.0, 110.25], [114.0, 114.18], [117.0, 118.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 1.32, 0.58, 1.86, 1.45, 0.86, -0.23, 1.4, -0.15, 0.56, 0.6, -0.03, 2.57, 0.45, 0.61, 1.43, 0.19, -0.18, -0.38, 0.3, 0.02, 1.13, 1.31, 0.25, 0.18, 1.13]} \ No newline at end of file diff --git a/annotations_1/jTkt23CfSp4_filtered.json b/annotations_1/jTkt23CfSp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..104b50538a4071c9f30e938a82a384e3e5595a87 --- /dev/null +++ b/annotations_1/jTkt23CfSp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.49], [38.0, 39.11], [40.0, 48.41], [52.0, 53.82], [62.0, 63.63], [64.0, 65.15], [71.0, 73.3], [83.0, 85.68], [88.0, 89.24], [90.0, 95.25], [98.0, 98.36], [102.0, 103.69], [105.0, 105.27]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.19, 0.0, 0.0, 0.0, 68.02, 100.0, 0.0, 46.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["mosquito", 52.61], ["fly, housefly", 28.7], ["insect", 6.69]], null, null, null, null, null, null, [["fart", 26.67], ["speech", 22.7], ["noise", 20.3]], null, null, null], "duration": [0.49, 1.11, 8.41, 1.82, 1.63, 1.15, 2.3, 2.68, 1.24, 5.25, 0.36, 1.69, 0.27]} \ No newline at end of file diff --git a/annotations_1/jTz_VNAGqog_filtered.json b/annotations_1/jTz_VNAGqog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3edc13eb9f398236a4f38c286e86ca1c7f2964c8 --- /dev/null +++ b/annotations_1/jTz_VNAGqog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.35], [12.0, 15.4], [19.0, 20.01], [21.0, 33.96], [34.0, 34.47], [35.0, 34.94], [36.0, 36.41], [37.0, 41.57], [43.0, 43.36], [48.0, 51.98], [56.0, 56.05], [57.0, 57.28], [58.0, 58.62], [59.0, 70.78], [73.0, 73.52], [82.0, 87.81], [93.0, 94.02], [96.0, 97.17], [100.0, 100.28], [102.0, 108.09], [110.0, 111.84], [114.0, 114.66], [115.0, 116.28], [119.0, 123.77], [126.0, 127.14], [130.0, 130.27], [132.0, 132.43], [134.0, 134.13], [140.0, 140.12], [141.0, 141.03], [145.0, 145.81], [147.0, 147.53], [149.0, 149.82]], "keep_status": [false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 64.18, 0.0, 42.26, 0.0, 0.0, 0.0, 41.14, 0.0, 35.91, 0.0, 0.0, 0.0, 32.78, 0.0, 37.27, 0.0, 0.0, 0.0, 47.35, 0.0, 0.0, 0.0, 45.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 24.08], ["glockenspiel", 11.24], ["mallet percussion", 10.46]], null, null, null, [["music", 44.8], ["wind instrument, woodwind instrument", 19.75], ["musical instrument", 5.32]], null, [["music", 41.45], ["musical instrument", 6.72], ["didgeridoo", 5.42]], null, null, null, [["wind instrument, woodwind instrument", 26.84], ["music", 24.69], ["harmonica", 20.37]], null, [["mains hum", 34.12], ["music", 22.21], ["hum", 22.15]], null, null, null, [["music", 35.83], ["tick-tock", 10.58], ["musical instrument", 6.42]], null, null, null, [["music", 68.03], ["theremin", 13.83], ["musical instrument", 1.92]], null, null, null, null, null, null, null, null, null], "duration": [0.35, 3.4, 1.01, 12.96, 0.47, -0.06, 0.41, 4.57, 0.36, 3.98, 0.05, 0.28, 0.62, 11.78, 0.52, 5.81, 1.02, 1.17, 0.28, 6.09, 1.84, 0.66, 1.28, 4.77, 1.14, 0.27, 0.43, 0.13, 0.12, 0.03, 0.81, 0.53, 0.82]} \ No newline at end of file diff --git a/annotations_1/jUYCTHwAQvw_filtered.json b/annotations_1/jUYCTHwAQvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8c5d9a79697fb27a2df9975d0abffee7b8d4956 --- /dev/null +++ b/annotations_1/jUYCTHwAQvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 32.37], [36.0, 73.84], [76.0, 76.59], [88.0, 90.22], [91.0, 94.15], [95.0, 97.53], [100.0, 99.84], [100.0, 100.62], [102.0, 121.95]], "keep_status": [false, false, false, true, true, true, false, false, true], "silence_prob": [31.47, 0.0, 0.0, 39.17, 37.44, 35.74, 0.0, 0.0, 29.74], "audiomae_on_audioset": [[["throbbing", 49.35], ["hum", 36.93], ["music", 3.91]], null, null, [["whale vocalization", 19.25], ["throbbing", 12.68], ["hum", 8.9]], [["breaking", 35.86], ["speech", 14.23], ["hum", 4.96]], [["speech", 19.41], ["eruption", 9.16], ["hum", 6.97]], null, null, [["speech", 19.35], ["explosion", 12.83], ["music", 8.85]]], "duration": [2.37, 37.84, 0.59, 2.22, 3.15, 2.53, -0.16, 0.62, 19.95]} \ No newline at end of file diff --git a/annotations_1/jUkqho3OUos_filtered.json b/annotations_1/jUkqho3OUos_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..071aa5d56b560ce6918e1313efbe97365aad58bd --- /dev/null +++ b/annotations_1/jUkqho3OUos_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.4], [6.0, 5.83], [13.0, 16.33], [20.0, 20.82], [39.0, 39.6], [40.0, 40.8], [76.0, 76.94], [95.0, 95.44]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [99.36, 0.0, 43.85, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["frog", 14.83], ["radio", 9.8], ["wheeze", 7.11]], null, null, null, null, null], "duration": [3.4, -0.17, 3.33, 0.82, 0.6, 0.8, 0.94, 0.44]} \ No newline at end of file diff --git a/annotations_1/jVH_NN7phnA_filtered.json b/annotations_1/jVH_NN7phnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..829ed704ecf60fc857054b8965abc7eafbaba49c --- /dev/null +++ b/annotations_1/jVH_NN7phnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.91], [10.0, 10.13], [15.0, 15.36], [23.0, 24.76], [28.0, 28.65], [37.0, 36.9], [44.0, 44.34], [49.0, 48.74], [54.0, 54.03], [55.0, 57.86], [59.0, 59.12], [61.0, 61.67], [65.0, 65.3], [71.0, 71.29], [81.0, 80.77], [84.0, 84.43], [88.0, 88.79], [90.0, 90.49], [91.0, 95.52], [97.0, 97.44], [100.0, 100.4], [101.0, 101.98], [107.0, 108.36], [109.0, 111.82], [117.0, 117.54], [118.0, 118.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 0.0, 0.0, 0.0, 0.0, 35.24, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["dog", 25.2], ["bark", 18.16], ["domestic animals, pets", 10.16]], null, null], "duration": [-0.09, 0.13, 0.36, 1.76, 0.65, -0.1, 0.34, -0.26, 0.03, 2.86, 0.12, 0.67, 0.3, 0.29, -0.23, 0.43, 0.79, 0.49, 4.52, 0.44, 0.4, 0.98, 1.36, 2.82, 0.54, 0.84]} \ No newline at end of file diff --git a/annotations_1/jVu_cuFHZnc_filtered.json b/annotations_1/jVu_cuFHZnc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..260c56405c09768b68efb7ab6e63e9a2dcd34c5f --- /dev/null +++ b/annotations_1/jVu_cuFHZnc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.33], [6.0, 6.42], [9.0, 9.58], [12.0, 12.39], [13.0, 13.85], [16.0, 16.48], [24.0, 25.95], [28.0, 34.28], [40.0, 45.82], [48.0, 51.39], [52.0, 53.28], [54.0, 55.98], [57.0, 58.58], [60.0, 60.61], [64.0, 65.16], [68.0, 68.82], [71.0, 71.86], [74.0, 76.77], [77.0, 79.76], [82.0, 82.93], [85.0, 86.31], [89.0, 90.1], [93.0, 95.23], [96.0, 97.24], [98.0, 99.62], [100.0, 101.11], [102.0, 102.93], [107.0, 108.55], [110.0, 113.24], [115.0, 116.48], [117.0, 117.36], [123.0, 124.36], [128.0, 127.77], [129.0, 129.83], [132.0, 132.53], [133.0, 133.08], [134.0, 136.11], [137.0, 138.99], [140.0, 140.88], [143.0, 143.31]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.08, 40.14, 38.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 49.5, 0.0, 0.0, 0.0, 54.1, 0.0, 0.0, 0.0, 0.0, 0.0, 48.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.99, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 45.08], ["ambient music", 15.46], ["hum", 6.67]], [["music", 59.79], ["ambient music", 19.69], ["gong", 2.09]], [["music", 48.3], ["harmonic", 5.09], ["ambient music", 4.55]], null, null, null, null, null, null, null, null, [["music", 29.92], ["effects unit", 3.71], ["musical instrument", 3.23]], null, null, null, null, null, null, null, null, null, [["music", 50.21], ["ambient music", 15.93], ["singing bowl", 5.29]], null, null, null, null, null, null, null, [["speech", 77.69], ["telephone", 8.83], ["sidetone", 3.96]], null, null, null], "duration": [1.33, 0.42, 0.58, 0.39, 0.85, 0.48, 1.95, 6.28, 5.82, 3.39, 1.28, 1.98, 1.58, 0.61, 1.16, 0.82, 0.86, 2.77, 2.76, 0.93, 1.31, 1.1, 2.23, 1.24, 1.62, 1.11, 0.93, 1.55, 3.24, 1.48, 0.36, 1.36, -0.23, 0.83, 0.53, 0.08, 2.11, 1.99, 0.88, 0.31]} \ No newline at end of file diff --git a/annotations_1/jW2zOdceqr8_filtered.json b/annotations_1/jW2zOdceqr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a029933b2008a5c6c73a440589bac034048f8b4 --- /dev/null +++ b/annotations_1/jW2zOdceqr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.87], [20.0, 20.95], [22.0, 40.96], [44.0, 45.45], [49.0, 50.03], [51.0, 52.08], [56.0, 64.15], [65.0, 66.31], [68.0, 86.22], [87.0, 145.56]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 34.01, 0.0, 0.0, 0.0, 31.06, 0.0, 31.03, 0.0], "audiomae_on_audioset": [null, null, [["music", 61.48], ["musical instrument", 6.7], ["didgeridoo", 3.94]], null, null, null, [["throbbing", 24.38], ["speech", 21.64], ["music", 20.3]], null, [["music", 40.26], ["throbbing", 36.77], ["hum", 9.91]], null], "duration": [0.87, 0.95, 18.96, 1.45, 1.03, 1.08, 8.15, 1.31, 18.22, 58.56]} \ No newline at end of file diff --git a/annotations_1/jXIFh5Gwqno_filtered.json b/annotations_1/jXIFh5Gwqno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d5c57cae09c4ffd213b5a4d750f640f289b1f40 --- /dev/null +++ b/annotations_1/jXIFh5Gwqno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.98], [35.0, 38.94], [39.0, 39.46], [46.0, 51.75], [56.0, 62.82], [65.0, 68.01], [76.0, 76.47], [80.0, 80.33], [84.0, 90.95], [94.0, 96.42], [99.0, 105.44], [107.0, 106.64], [108.0, 111.25], [130.0, 130.82], [132.0, 142.57], [150.0, 152.09], [154.0, 162.65], [163.0, 163.75], [164.0, 164.47], [166.0, 167.54], [169.0, 170.24]], "keep_status": [false, false, false, true, true, false, false, false, false, true, true, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 37.21, 0.0, 31.26, 43.35, 82.61, 0.0, 0.0, 64.29, 32.33, 31.52, 0.0, 34.11, 0.0, 30.26, 99.71, 31.26, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 35.58], ["boing", 29.42], ["music", 13.03]], null, [["music", 39.42], ["boing", 23.6], ["cattle, bovinae", 4.42]], [["music", 58.01], ["speech", 6.39], ["hum", 5.21]], null, null, null, null, [["music", 33.29], ["speech", 14.36], ["cattle, bovinae", 11.85]], [["music", 33.0], ["boing", 26.22], ["speech", 10.25]], null, [["music", 56.57], ["groan", 4.82], ["cattle, bovinae", 3.96]], null, [["music", 59.28], ["noise", 5.28], ["theremin", 4.6]], null, [["music", 68.99], ["hum", 5.99], ["foghorn", 2.89]], null, null, null, null], "duration": [-0.02, 3.94, 0.46, 5.75, 6.82, 3.01, 0.47, 0.33, 6.95, 2.42, 6.44, -0.36, 3.25, 0.82, 10.57, 2.09, 8.65, 0.75, 0.47, 1.54, 1.24]} \ No newline at end of file diff --git a/annotations_1/jXKc-0nVIkQ_filtered.json b/annotations_1/jXKc-0nVIkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bddb5fbe4ff10f28bfbc4dd5768a32e10d016cc5 --- /dev/null +++ b/annotations_1/jXKc-0nVIkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.59], [17.0, 18.42], [19.0, 20.36], [22.0, 23.3], [24.0, 24.46], [26.0, 29.39], [31.0, 33.07], [46.0, 47.01], [48.0, 69.8], [70.0, 79.07], [84.0, 87.51], [89.0, 90.14], [97.0, 101.93], [103.0, 107.47], [108.0, 108.92], [116.0, 118.52], [129.0, 128.82], [132.0, 132.78], [137.0, 137.12], [137.0, 141.79], [142.0, 141.83], [142.0, 141.86], [142.0, 141.89], [142.0, 141.93], [142.0, 141.96], [142.0, 141.99], [142.0, 142.03], [144.0, 150.35], [151.0, 152.66], [154.0, 154.33], [154.0, 161.32], [162.0, 166.68], [169.0, 169.75], [171.0, 171.93], [173.0, 174.12], [175.0, 177.21]], "keep_status": [false, false, false, false, false, false, false, false, true, true, true, false, true, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.78, 55.18, 0.0, 30.91, 28.42, 28.8, 0.0, 29.03, 29.11, 0.0, 29.16, 0.0, 0.0, 0.0, 28.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.32, 0.0, 0.0, 35.44, 35.87, 0.0, 0.0, 0.0, 50.02], "audiomae_on_audioset": [null, null, null, null, null, [["fly, housefly", 44.4], ["mosquito", 38.37], ["insect", 7.71]], null, null, [["noise", 31.35], ["grunt", 14.19], ["speech", 8.34]], [["music", 28.63], ["hum", 11.15], ["mains hum", 11.08]], [["speech", 20.74], ["vehicle", 16.45], ["cacophony", 5.04]], null, [["vehicle", 28.05], ["speech", 23.46], ["car", 8.79]], [["speech", 40.3], ["buzzer", 9.12], ["buzz", 7.66]], null, [["vehicle", 43.41], ["car", 8.22], ["whir", 4.98]], null, null, null, [["speech", 18.92], ["roaring cats (lions, tigers)", 16.91], ["fart", 11.4]], null, null, null, null, null, null, null, [["hum", 48.38], ["mains hum", 35.42], ["electric shaver, electric razor", 3.23]], null, null, [["creak", 31.69], ["mechanisms", 8.19], ["animal", 6.61]], [["music", 55.98], ["hum", 8.19], ["mains hum", 5.73]], null, null, null, null], "duration": [0.59, 1.42, 1.36, 1.3, 0.46, 3.39, 2.07, 1.01, 21.8, 9.07, 3.51, 1.14, 4.93, 4.47, 0.92, 2.52, -0.18, 0.78, 0.12, 4.79, -0.17, -0.14, -0.11, -0.07, -0.04, -0.01, 0.03, 6.35, 1.66, 0.33, 7.32, 4.68, 0.75, 0.93, 1.12, 2.21]} \ No newline at end of file diff --git a/annotations_1/jXReN1Nzlws_filtered.json b/annotations_1/jXReN1Nzlws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..369499a1466a7c13af386a85477f681d9f0c8607 --- /dev/null +++ b/annotations_1/jXReN1Nzlws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.02], [30.0, 30.67], [42.0, 43.63], [45.0, 50.3], [52.0, 52.22], [61.0, 62.19], [63.0, 63.61], [64.0, 64.93], [67.0, 82.22], [82.0, 82.29], [82.0, 83.05], [86.0, 98.29], [101.0, 103.5], [138.0, 139.63], [145.0, 146.82], [149.0, 149.44], [151.0, 155.09]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.72, 0.0, 0.0, 0.0, 0.0, 30.72, 0.0, 0.0, 30.54, 31.07, 0.0, 0.0, 0.0, 34.82], "audiomae_on_audioset": [null, null, null, [["speech", 27.63], ["animal", 19.54], ["frog", 14.99]], null, null, null, null, [["music", 76.41], ["cacophony", 8.27], ["synthesizer", 3.1]], null, null, [["music", 71.99], ["boing", 8.41], ["speech", 6.69]], [["music", 35.2], ["speech", 13.41], ["boing", 7.11]], null, null, null, [["music", 44.18], ["speech", 21.88], ["boing", 8.78]]], "duration": [1.02, 0.67, 1.63, 5.3, 0.22, 1.19, 0.61, 0.93, 15.22, 0.29, 1.05, 12.29, 2.5, 1.63, 1.82, 0.44, 4.09]} \ No newline at end of file diff --git a/annotations_1/jY2PzzjO3zo_filtered.json b/annotations_1/jY2PzzjO3zo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed2710d1fa26516cb3c1596cb6d45ea3d61658d8 --- /dev/null +++ b/annotations_1/jY2PzzjO3zo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.84], [12.0, 12.55], [18.0, 18.4], [37.0, 37.59], [42.0, 42.96], [54.0, 54.18], [61.0, 61.72], [64.0, 64.23], [65.0, 65.5], [78.0, 78.02], [85.0, 86.27], [92.0, 95.3], [96.0, 96.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 33.67], ["hum", 22.07], ["mains hum", 15.84]], null], "duration": [0.84, 0.55, 0.4, 0.59, 0.96, 0.18, 0.72, 0.23, 0.5, 0.02, 1.27, 3.3, 0.48]} \ No newline at end of file diff --git a/annotations_1/jY4nU1rwWv8_filtered.json b/annotations_1/jY4nU1rwWv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f9cc925ffbf9693256f33392b32435e16fb5869 --- /dev/null +++ b/annotations_1/jY4nU1rwWv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 15.6], [23.0, 26.65], [36.0, 37.18], [42.0, 42.11], [43.0, 43.21], [43.0, 43.41], [44.0, 56.29], [67.0, 69.62], [84.0, 84.55], [90.0, 92.26], [93.0, 94.53], [95.0, 128.07], [128.0, 128.53], [134.0, 143.01], [146.0, 146.7]], "keep_status": [false, true, false, false, false, false, true, true, false, true, false, false, false, false, false], "silence_prob": [33.09, 45.69, 0.0, 0.0, 0.0, 0.0, 34.35, 36.79, 0.0, 33.57, 0.0, 0.0, 0.0, 37.03, 0.0], "audiomae_on_audioset": [[["music", 54.47], ["speech", 15.63], ["explosion", 3.51]], [["music", 24.0], ["speech", 12.05], ["breaking", 8.45]], null, null, null, null, [["music", 29.41], ["speech", 20.07], ["whack, thwack", 6.95]], [["music", 23.27], ["thunk", 10.97], ["animal", 6.46]], null, [["speech", 26.65], ["music", 24.3], ["sidetone", 7.48]], null, null, null, [["speech", 44.51], ["music", 31.88], ["whack, thwack", 4.07]], null], "duration": [12.6, 3.65, 1.18, 0.11, 0.21, 0.41, 12.29, 2.62, 0.55, 2.26, 1.53, 33.07, 0.53, 9.01, 0.7]} \ No newline at end of file diff --git a/annotations_1/jYbI8iVYCpc_filtered.json b/annotations_1/jYbI8iVYCpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..345c23471a525385719128207de8c7eb53c10cb2 --- /dev/null +++ b/annotations_1/jYbI8iVYCpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.56], [9.0, 9.12], [13.0, 14.03], [14.0, 16.95], [18.0, 19.01], [20.0, 21.15], [23.0, 27.31], [28.0, 29.71], [30.0, 35.06], [38.0, 54.36], [55.0, 64.15]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 45.88, 0.0, 63.85, 92.64, 29.76], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 35.13], ["hum", 5.96], ["chirp tone", 5.78]], null, null, null, [["mains hum", 34.66], ["hum", 16.62], ["noise", 14.66]]], "duration": [1.56, 0.12, 1.03, 2.95, 1.01, 1.15, 4.31, 1.71, 5.06, 16.36, 9.15]} \ No newline at end of file diff --git a/annotations_1/jZXuLQdIrEg_filtered.json b/annotations_1/jZXuLQdIrEg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d22bd873b3c3835a17d3628c6ad68e5aba78bec --- /dev/null +++ b/annotations_1/jZXuLQdIrEg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [5.0, 5.8], [6.0, 7.55], [9.0, 9.73], [12.0, 12.51], [13.0, 13.32], [14.0, 15.15], [16.0, 17.02], [20.0, 20.71], [22.0, 23.01], [26.0, 26.0], [29.0, 30.43], [31.0, 32.39], [34.0, 35.31], [38.0, 41.69], [43.0, 43.68], [45.0, 45.4], [46.0, 47.01], [49.0, 51.63], [53.0, 52.89], [54.0, 59.36], [60.0, 61.25], [63.0, 63.9], [64.0, 64.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 96.29, 0.0, 57.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 0.8, 1.55, 0.73, 0.51, 0.32, 1.15, 1.02, 0.71, 1.01, 0.0, 1.43, 1.39, 1.31, 3.69, 0.68, 0.4, 1.01, 2.63, -0.11, 5.36, 1.25, 0.9, 0.35]} \ No newline at end of file diff --git a/annotations_1/j_1k-SzcOrs_filtered.json b/annotations_1/j_1k-SzcOrs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb2f3a68085855fd2ad980409a6cc4869eb6415d --- /dev/null +++ b/annotations_1/j_1k-SzcOrs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 25.96], [34.0, 38.04], [38.0, 38.08], [42.0, 45.27], [49.0, 49.52], [55.0, 55.58], [59.0, 65.1], [70.0, 72.35], [97.0, 97.85], [99.0, 101.14], [108.0, 108.33], [112.0, 114.44], [118.0, 117.58], [118.0, 118.42], [119.0, 119.91], [123.0, 124.71], [126.0, 127.04], [128.0, 131.58], [132.0, 133.0], [135.0, 137.61], [138.0, 139.67], [144.0, 144.9], [146.0, 145.62], [155.0, 155.6], [158.0, 158.09], [162.0, 163.27], [165.0, 165.94]], "keep_status": [true, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.73, 41.85, 0.0, 42.11, 0.0, 0.0, 32.07, 45.14, 0.0, 58.98, 0.0, 52.33, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 82.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 20.74], ["vehicle", 15.53], ["car", 9.59]], [["speech", 33.28], ["sidetone", 32.61], ["music", 5.96]], null, [["speech", 26.92], ["music", 15.39], ["sidetone", 7.3]], null, null, [["speech", 61.26], ["vehicle", 6.98], ["hum", 4.77]], [["speech", 38.54], ["music", 20.34], ["sidetone", 10.85]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [19.96, 4.04, 0.08, 3.27, 0.52, 0.58, 6.1, 2.35, 0.85, 2.14, 0.33, 2.44, -0.42, 0.42, 0.91, 1.71, 1.04, 3.58, 1.0, 2.61, 1.67, 0.9, -0.38, 0.6, 0.09, 1.27, 0.94]} \ No newline at end of file diff --git a/annotations_1/j_3wS3OIgc8_filtered.json b/annotations_1/j_3wS3OIgc8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6787197433cb968f3ad5201a6e00c95dd00226b9 --- /dev/null +++ b/annotations_1/j_3wS3OIgc8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 29.39], [31.0, 83.96], [91.0, 98.74], [115.0, 116.21], [117.0, 116.97], [117.0, 130.37], [135.0, 141.47], [143.0, 143.21], [149.0, 160.41]], "keep_status": [false, false, true, false, false, true, true, false, true], "silence_prob": [32.81, 0.0, 30.54, 0.0, 0.0, 34.19, 33.06, 0.0, 39.09], "audiomae_on_audioset": [[["speech", 48.38], ["music", 22.93], ["boing", 3.45]], null, [["speech", 56.42], ["frog", 7.23], ["fart", 3.81]], null, null, [["fart", 30.62], ["speech", 23.95], ["livestock, farm animals, working animals", 7.95]], [["speech", 20.79], ["laughter", 12.71], ["animal", 5.63]], null, [["speech", 38.39], ["animal", 11.83], ["livestock, farm animals, working animals", 9.64]]], "duration": [4.39, 52.96, 7.74, 1.21, -0.03, 13.37, 6.47, 0.21, 11.41]} \ No newline at end of file diff --git a/annotations_1/j_sD0t5L8kE_filtered.json b/annotations_1/j_sD0t5L8kE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdfc6fa07f98a0e10684d6249fdaa278525dc455 --- /dev/null +++ b/annotations_1/j_sD0t5L8kE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 20.16], [29.0, 32.0], [33.0, 37.25], [38.0, 41.86], [47.0, 48.0], [50.0, 50.62], [53.0, 53.77], [57.0, 58.09], [61.0, 62.61], [63.0, 65.08], [66.0, 70.19], [72.0, 72.89], [75.0, 76.05], [80.0, 81.31], [83.0, 85.62], [87.0, 89.02], [90.0, 91.62], [92.0, 92.65], [93.0, 95.37], [98.0, 99.27], [101.0, 104.4], [105.0, 107.32], [109.0, 113.51], [117.0, 118.5], [122.0, 123.79], [125.0, 126.55], [128.0, 128.58], [131.0, 133.05], [135.0, 136.02], [138.0, 139.72], [148.0, 149.2], [150.0, 151.38], [154.0, 156.05], [158.0, 158.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.0, 80.29, 95.09, 62.78, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 74.29, 0.0, 0.0, 0.0, 96.42, 52.51, 0.0, 0.0, 100.0, 0.0, 99.16, 42.22, 72.75, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.54], ["telephone", 8.26], ["radio", 5.26]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.16, 3.0, 4.25, 3.86, 1.0, 0.62, 0.77, 1.09, 1.61, 2.08, 4.19, 0.89, 1.05, 1.31, 2.62, 2.02, 1.62, 0.65, 2.37, 1.27, 3.4, 2.32, 4.51, 1.5, 1.79, 1.55, 0.58, 2.05, 1.02, 1.72, 1.2, 1.38, 2.05, 0.53]} \ No newline at end of file diff --git a/annotations_1/j_txRPwTvpk_filtered.json b/annotations_1/j_txRPwTvpk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..771b42fca4b0fe6bc0005e997bb9180b56f3a10d --- /dev/null +++ b/annotations_1/j_txRPwTvpk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.66], [9.0, 8.97], [16.0, 16.61], [18.0, 19.35], [20.0, 22.55], [24.0, 25.35], [26.0, 27.72], [29.0, 29.76], [34.0, 34.15], [35.0, 35.9], [49.0, 49.05], [50.0, 50.45], [55.0, 55.71], [63.0, 81.87], [83.0, 85.5], [86.0, 86.8], [88.0, 91.64], [93.0, 93.38], [94.0, 96.16], [97.0, 98.25], [99.0, 100.18]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.9, 28.72, 0.0, 29.89, 0.0, 35.71, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 18.54], ["telephone", 14.49], ["hum", 14.3]], null, null, null, null, null, null, null, null, [["music", 41.63], ["noise", 15.58], ["hum", 6.0]], [["speech", 11.4], ["music", 6.57], ["insect", 5.26]], null, [["throbbing", 12.52], ["hum", 11.87], ["fly, housefly", 11.84]], null, [["cattle, bovinae", 50.41], ["moo", 26.23], ["livestock, farm animals, working animals", 21.5]], null, null], "duration": [0.66, -0.03, 0.61, 1.35, 2.55, 1.35, 1.72, 0.76, 0.15, 0.9, 0.05, 0.45, 0.71, 18.87, 2.5, 0.8, 3.64, 0.38, 2.16, 1.25, 1.18]} \ No newline at end of file diff --git a/annotations_1/j_z70ZaqWUE_filtered.json b/annotations_1/j_z70ZaqWUE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1419d676ec3cceac97a9c2502c7af669e6c1dd1f --- /dev/null +++ b/annotations_1/j_z70ZaqWUE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.26], [13.0, 16.41], [20.0, 21.59], [24.0, 24.98], [25.0, 26.0], [27.0, 37.08], [45.0, 44.81], [50.0, 50.58], [58.0, 58.43], [60.0, 60.37], [61.0, 61.32], [78.0, 78.61], [83.0, 84.0], [88.0, 89.02], [90.0, 90.56], [91.0, 92.15], [94.0, 96.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.83, 0.0, 0.0, 0.0, 98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.26, 3.41, 1.59, 0.98, 1.0, 10.08, -0.19, 0.58, 0.43, 0.37, 0.32, 0.61, 1.0, 1.02, 0.56, 1.15, 2.82]} \ No newline at end of file diff --git a/annotations_1/ja00D_L5tm8_filtered.json b/annotations_1/ja00D_L5tm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a2ef8f0d0683038b1bf5eda033763681b4fcec8 --- /dev/null +++ b/annotations_1/ja00D_L5tm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.51], [15.0, 24.12], [26.0, 28.49], [30.0, 35.24], [36.0, 37.89], [39.0, 40.04], [42.0, 43.9], [44.0, 44.85], [46.0, 58.56], [63.0, 71.68], [72.0, 75.47], [78.0, 79.83], [82.0, 81.7], [84.0, 85.24], [89.0, 90.14], [92.0, 92.69], [93.0, 93.23], [94.0, 95.44], [99.0, 100.08], [101.0, 102.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [76.2, 53.4, 75.39, 72.16, 0.0, 0.0, 0.0, 0.0, 91.13, 53.84, 64.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.51, 9.12, 2.49, 5.24, 1.89, 1.04, 1.9, 0.85, 12.56, 8.68, 3.47, 1.83, -0.3, 1.24, 1.14, 0.69, 0.23, 1.44, 1.08, 1.66]} \ No newline at end of file diff --git a/annotations_1/jaM0sgoi0vw_filtered.json b/annotations_1/jaM0sgoi0vw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/jaM0sgoi0vw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/jaSSXV5AFHk_filtered.json b/annotations_1/jaSSXV5AFHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a50400734df721ab07294453cbf865041e03c77a --- /dev/null +++ b/annotations_1/jaSSXV5AFHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 49.98], [50.0, 59.51], [60.0, 67.78], [70.0, 72.1], [74.0, 74.41], [75.0, 77.03], [81.0, 83.17], [86.0, 91.2], [92.0, 94.64], [96.0, 96.85], [97.0, 97.43], [100.0, 100.68], [102.0, 102.76], [104.0, 106.32], [107.0, 108.35], [110.0, 112.6], [113.0, 113.97], [115.0, 116.45], [118.0, 120.43]], "keep_status": [false, false, true, false, false, false, true, true, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 33.9, 37.65, 56.86, 0.0, 39.34, 38.28, 41.1, 43.15, 0.0, 0.0, 0.0, 0.0, 49.45, 0.0, 37.44, 0.0, 0.0, 32.83], "audiomae_on_audioset": [null, [["music", 49.89], ["synthesizer", 18.67], ["musical instrument", 9.95]], [["music", 55.02], ["effects unit", 8.59], ["chorus effect", 6.33]], null, null, [["sidetone", 43.6], ["speech", 17.34], ["music", 12.73]], [["music", 48.39], ["musical instrument", 9.83], ["synthesizer", 9.27]], [["music", 32.94], ["hum", 19.89], ["mains hum", 9.05]], [["hum", 29.03], ["mains hum", 15.03], ["music", 11.26]], null, null, null, null, [["hum", 35.94], ["mains hum", 35.46], ["speech", 2.8]], null, [["music", 34.11], ["speech", 14.75], ["sidetone", 7.78]], null, null, [["hum", 32.38], ["gong", 18.74], ["mains hum", 12.63]]], "duration": [0.98, 9.51, 7.78, 2.1, 0.41, 2.03, 2.17, 5.2, 2.64, 0.85, 0.43, 0.68, 0.76, 2.32, 1.35, 2.6, 0.97, 1.45, 2.43]} \ No newline at end of file diff --git a/annotations_1/jbvQvJV_97M_filtered.json b/annotations_1/jbvQvJV_97M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6a3f937cef5c7422ad173b25e40abcac764a719 --- /dev/null +++ b/annotations_1/jbvQvJV_97M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 38.48], [40.0, 41.07], [43.0, 43.85], [46.0, 46.89], [48.0, 48.59], [54.0, 54.5], [57.0, 57.86], [59.0, 60.05], [69.0, 71.04], [72.0, 85.09], [90.0, 90.95], [92.0, 92.47], [96.0, 122.61], [123.0, 124.5], [125.0, 127.87], [130.0, 132.7], [133.0, 144.44]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.98, 28.21, 0.0, 0.0, 28.62, 0.0, 28.43, 30.86, 29.49], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 39.96], ["music", 15.73], ["synthesizer", 5.07]], [["music", 42.95], ["hum", 17.24], ["mains hum", 10.58]], null, null, [["music", 30.96], ["hum", 16.89], ["mains hum", 10.45]], null, [["speech", 28.45], ["explosion", 25.07], ["burst, pop", 14.81]], [["music", 28.96], ["theremin", 16.47], ["didgeridoo", 7.62]], [["livestock, farm animals, working animals", 24.32], ["cattle, bovinae", 19.98], ["moo", 15.47]]], "duration": [1.48, 1.07, 0.85, 0.89, 0.59, 0.5, 0.86, 1.05, 2.04, 13.09, 0.95, 0.47, 26.61, 1.5, 2.87, 2.7, 11.44]} \ No newline at end of file diff --git a/annotations_1/jc2T3qbPJNI_filtered.json b/annotations_1/jc2T3qbPJNI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d884b6cdb1d5be09218621e1efaa1ade2d66f87 --- /dev/null +++ b/annotations_1/jc2T3qbPJNI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.58], [9.0, 8.56], [9.0, 9.04], [9.0, 9.07], [9.0, 30.54], [35.0, 56.57], [59.0, 61.16], [62.0, 66.23], [73.0, 73.36], [75.0, 75.09], [77.0, 78.21], [84.0, 84.28], [87.0, 86.97], [88.0, 88.84], [90.0, 92.4], [94.0, 95.39], [98.0, 108.65], [111.0, 124.53]], "keep_status": [false, false, false, false, true, false, true, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.54, 30.0, 32.56, 30.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.93, 0.0, 29.66, 29.82], "audiomae_on_audioset": [null, null, null, null, [["speech", 49.58], ["music", 14.47], ["whack, thwack", 4.74]], [["music", 67.57], ["synthesizer", 7.18], ["electronic music", 4.52]], [["music", 29.34], ["hum", 10.66], ["synthesizer", 10.57]], [["music", 53.04], ["throbbing", 6.48], ["hum", 6.45]], null, null, null, null, null, null, [["speech", 26.68], ["whale vocalization", 23.22], ["music", 10.08]], null, [["music", 64.8], ["musical instrument", 7.58], ["livestock, farm animals, working animals", 6.16]], [["whale vocalization", 11.76], ["music", 10.16], ["buzz", 8.28]]], "duration": [0.58, -0.44, 0.04, 0.07, 21.54, 21.57, 2.16, 4.23, 0.36, 0.09, 1.21, 0.28, -0.03, 0.84, 2.4, 1.39, 10.65, 13.53]} \ No newline at end of file diff --git a/annotations_1/jcmTZfv5z-k_filtered.json b/annotations_1/jcmTZfv5z-k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1551a5c0614d23b66b664cd93c1debd0b4b1e27e --- /dev/null +++ b/annotations_1/jcmTZfv5z-k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 23.09]], "keep_status": [true], "silence_prob": [31.52], "audiomae_on_audioset": [[["hum", 23.23], ["music", 13.28], ["mains hum", 6.67]]], "duration": [22.09]} \ No newline at end of file diff --git a/annotations_1/jdd1py-ilwc_filtered.json b/annotations_1/jdd1py-ilwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ecb3d17d0606713bda21acb9e0e23355200d035 --- /dev/null +++ b/annotations_1/jdd1py-ilwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.43], [23.0, 24.22], [25.0, 26.4], [31.0, 31.75], [33.0, 33.44], [37.0, 38.1], [41.0, 42.06], [45.0, 45.89], [47.0, 47.49], [52.0, 52.93], [62.0, 66.53], [77.0, 88.53], [89.0, 90.8], [94.0, 105.85], [113.0, 112.68], [114.0, 117.39], [122.0, 125.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.14, 37.24, 0.0, 46.05, 0.0, 77.7, 34.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 63.79], ["animal", 3.88], ["dog", 3.76]], [["music", 63.99], ["didgeridoo", 14.48], ["speech", 13.21]], null, [["music", 66.77], ["synthesizer", 5.17], ["ding", 3.02]], null, null, [["speech", 37.01], ["music", 28.57], ["musical instrument", 4.0]]], "duration": [3.43, 1.22, 1.4, 0.75, 0.44, 1.1, 1.06, 0.89, 0.49, 0.93, 4.53, 11.53, 1.8, 11.85, -0.32, 3.39, 3.17]} \ No newline at end of file diff --git a/annotations_1/jeYdR_r0iGo_filtered.json b/annotations_1/jeYdR_r0iGo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f567873396044dcbd5fc951f24938253f5018246 --- /dev/null +++ b/annotations_1/jeYdR_r0iGo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 21.37], [22.0, 23.97], [25.0, 27.5], [30.0, 31.28], [34.0, 34.69], [36.0, 36.02], [39.0, 39.34], [47.0, 48.07], [49.0, 58.06], [61.0, 61.45], [70.0, 104.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.97, 0.0, 97.54, 0.0, 0.0, 0.0, 0.0, 0.0, 50.51, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [5.37, 1.97, 2.5, 1.28, 0.69, 0.02, 0.34, 1.07, 9.06, 0.45, 34.19]} \ No newline at end of file diff --git a/annotations_1/jfhEIIK-jB8_filtered.json b/annotations_1/jfhEIIK-jB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5590bc869c913da6ea6d685f474467c4b66cc652 --- /dev/null +++ b/annotations_1/jfhEIIK-jB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [4.0, 4.41], [8.0, 9.98], [17.0, 17.17], [19.0, 19.85], [34.0, 34.13], [35.0, 35.72], [39.0, 39.78], [41.0, 42.35], [43.0, 43.9], [45.0, 47.06], [54.0, 55.02], [58.0, 64.52], [70.0, 84.72], [87.0, 101.88], [105.0, 105.9], [107.0, 108.16], [109.0, 114.61], [118.0, 146.48], [149.0, 179.12], [185.0, 191.71], [201.0, 216.33], [219.0, 222.3], [223.0, 224.06], [225.0, 229.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.64, 0.0, 33.63, 29.63, 28.42, 0.0, 0.0, 28.5, 27.94, 0.0, 29.73, 28.67, 94.07, 0.0, 61.57], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.84], ["music", 34.05], ["thunk", 12.08]], [["music", 53.48], ["throbbing", 12.64], ["hum", 10.28]], [["music", 62.45], ["synthesizer", 10.71], ["musical instrument", 4.78]], null, null, [["music", 66.33], ["throbbing", 7.15], ["didgeridoo", 5.05]], [["music", 67.63], ["speech", 16.02], ["theremin", 2.3]], null, [["speech", 31.96], ["music", 23.1], ["buzz", 8.06]], [["music", 32.51], ["mains hum", 7.98], ["hum", 6.49]], null, null, null], "duration": [0.13, 0.41, 1.98, 0.17, 0.85, 0.13, 0.72, 0.78, 1.35, 0.9, 2.06, 1.02, 6.52, 14.72, 14.88, 0.9, 1.16, 5.61, 28.48, 30.12, 6.71, 15.33, 3.3, 1.06, 4.63]} \ No newline at end of file diff --git a/annotations_1/jgBGoS4a5rc_filtered.json b/annotations_1/jgBGoS4a5rc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da9a43b822d2cb18b028a9e75a351d34b7fa64b5 --- /dev/null +++ b/annotations_1/jgBGoS4a5rc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.45], [13.0, 17.05], [18.0, 19.14], [22.0, 21.69], [23.0, 26.5], [28.0, 28.41], [31.0, 31.82], [33.0, 32.93], [35.0, 35.09], [40.0, 41.72], [46.0, 46.36], [48.0, 51.16], [54.0, 55.27], [57.0, 58.09], [59.0, 58.82], [60.0, 60.35], [61.0, 70.77], [81.0, 81.65], [90.0, 90.49], [93.0, 95.5], [98.0, 99.13], [107.0, 107.77], [110.0, 110.93], [112.0, 112.02], [115.0, 116.16], [118.0, 119.31], [121.0, 122.5], [125.0, 127.06], [131.0, 131.4], [132.0, 132.27], [133.0, 133.12], [133.0, 134.13], [135.0, 135.9], [136.0, 154.65], [158.0, 159.8], [163.0, 165.08], [171.0, 174.72], [177.0, 182.49], [184.0, 184.67]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [47.27, 46.57, 0.0, 0.0, 56.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 50.16, 0.0, 0.0, 52.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.74, 0.0, 0.0, 0.0, 0.0, 0.0, 33.32, 0.0, 32.38, 31.33, 30.98, 0.0], "audiomae_on_audioset": [[["music", 14.67], ["burping, eructation", 13.82], ["sine wave", 13.45]], [["speech", 55.06], ["gears", 3.85], ["mechanisms", 3.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 39.46], ["hum", 18.08], ["music", 12.13]], null, null, null, null, null, [["music", 51.59], ["speech", 16.0], ["synthesizer", 7.23]], null, [["music", 48.03], ["throbbing", 8.84], ["drum machine", 7.7]], [["music", 66.51], ["electronic music", 9.18], ["dubstep", 6.0]], [["music", 75.85], ["electronic music", 2.69], ["speech", 2.53]], null], "duration": [4.45, 4.05, 1.14, -0.31, 3.5, 0.41, 0.82, -0.07, 0.09, 1.72, 0.36, 3.16, 1.27, 1.09, -0.18, 0.35, 9.77, 0.65, 0.49, 2.5, 1.13, 0.77, 0.93, 0.02, 1.16, 1.31, 1.5, 2.06, 0.4, 0.27, 0.12, 1.13, 0.9, 18.65, 1.8, 2.08, 3.72, 5.49, 0.67]} \ No newline at end of file diff --git a/annotations_1/jgk96izcJbw_filtered.json b/annotations_1/jgk96izcJbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6741e8bcb89549bc509807bdda6aefb3c05a5059 --- /dev/null +++ b/annotations_1/jgk96izcJbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.84], [10.0, 10.79], [15.0, 33.54], [34.0, 37.15], [41.0, 43.95], [45.0, 46.23], [47.0, 69.11], [72.0, 100.48], [102.0, 149.1]], "keep_status": [false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 42.53, 50.61, 77.36, 0.0, 31.45, 29.4, 0.0], "audiomae_on_audioset": [null, null, [["music", 38.53], ["speech", 10.23], ["hum", 8.81]], null, null, null, [["throbbing", 30.89], ["music", 29.81], ["hum", 14.54]], [["throbbing", 36.48], ["hum", 35.54], ["music", 16.35]], null], "duration": [0.84, 0.79, 18.54, 3.15, 2.95, 1.23, 22.11, 28.48, 47.1]} \ No newline at end of file diff --git a/annotations_1/jgosH8zc83Q_filtered.json b/annotations_1/jgosH8zc83Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34de6f5a7ee7c7ef80a1a06297011ed149ecd191 --- /dev/null +++ b/annotations_1/jgosH8zc83Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.16], [6.0, 7.16], [8.0, 8.51], [10.0, 11.84], [13.0, 13.02], [15.0, 17.64], [19.0, 20.09], [27.0, 27.51], [29.0, 29.52], [31.0, 31.16], [32.0, 35.58], [39.0, 39.63], [40.0, 41.42], [44.0, 44.04], [45.0, 44.93], [46.0, 46.3], [46.0, 46.77], [52.0, 52.84], [54.0, 54.95], [58.0, 59.29], [61.0, 61.48], [62.0, 62.7], [63.0, 63.95], [64.0, 64.91], [66.0, 65.87], [66.0, 67.56], [69.0, 69.85], [73.0, 87.56], [89.0, 90.12], [93.0, 93.31], [95.0, 95.3], [96.0, 96.92], [98.0, 98.78], [101.0, 101.93], [105.0, 105.46], [106.0, 106.73], [109.0, 111.43], [116.0, 116.46], [118.0, 118.72], [120.0, 120.19], [125.0, 125.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 67.51, 0.0, 0.0, 0.0, 0.0, 48.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["mains hum", 20.41], ["hum", 18.47], ["music", 8.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.88], ["foghorn", 5.62], ["brass instrument", 5.21]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 1.16, 0.51, 1.84, 0.02, 2.64, 1.09, 0.51, 0.52, 0.16, 3.58, 0.63, 1.42, 0.04, -0.07, 0.3, 0.77, 0.84, 0.95, 1.29, 0.48, 0.7, 0.95, 0.91, -0.13, 1.56, 0.85, 14.56, 1.12, 0.31, 0.3, 0.92, 0.78, 0.93, 0.46, 0.73, 2.43, 0.46, 0.72, 0.19, 0.73]} \ No newline at end of file diff --git a/annotations_1/jh_EME9M-mg_filtered.json b/annotations_1/jh_EME9M-mg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fb92a8487641ef380b35c8004bccbbc1b0c8646 --- /dev/null +++ b/annotations_1/jh_EME9M-mg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 39.09], [40.0, 40.61], [42.0, 57.0], [60.0, 60.96], [64.0, 65.62], [67.0, 69.9], [75.0, 84.97], [87.0, 87.35]], "keep_status": [true, false, false, false, false, true, true, false], "silence_prob": [43.9, 0.0, 68.8, 0.0, 0.0, 39.64, 37.02, 0.0], "audiomae_on_audioset": [[["speech", 35.25], ["animal", 7.72], ["fart", 4.48]], null, null, null, null, [["speech", 27.29], ["sidetone", 20.35], ["music", 6.27]], [["music", 33.96], ["pant", 17.45], ["beatboxing", 5.83]], null], "duration": [14.09, 0.61, 15.0, 0.96, 1.62, 2.9, 9.97, 0.35]} \ No newline at end of file diff --git a/annotations_1/jiHXahhmzjw_filtered.json b/annotations_1/jiHXahhmzjw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f5cec812587d2828a802d92df353876ae56d2fc --- /dev/null +++ b/annotations_1/jiHXahhmzjw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.6], [15.0, 16.34], [17.0, 17.34], [20.0, 21.42], [24.0, 39.24], [41.0, 46.33], [47.0, 47.06], [49.0, 49.55], [55.0, 55.71], [57.0, 58.04], [63.0, 63.22], [67.0, 68.23], [75.0, 75.57], [78.0, 78.22], [84.0, 85.55], [88.0, 89.43], [106.0, 106.91], [109.0, 110.61], [114.0, 114.51], [119.0, 119.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [95.64, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.6, 1.34, 0.34, 1.42, 15.24, 5.33, 0.06, 0.55, 0.71, 1.04, 0.22, 1.23, 0.57, 0.22, 1.55, 1.43, 0.91, 1.61, 0.51, 0.99]} \ No newline at end of file diff --git a/annotations_1/jjDuR4d7Iik_filtered.json b/annotations_1/jjDuR4d7Iik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a97d5984ed55b29ee34a89ebe227dc233d071db7 --- /dev/null +++ b/annotations_1/jjDuR4d7Iik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.84], [26.0, 27.46], [31.0, 32.63], [56.0, 56.51], [64.0, 63.78], [69.0, 74.12], [77.0, 77.6], [81.0, 81.31], [84.0, 86.9], [92.0, 93.14], [104.0, 104.04], [109.0, 109.14], [112.0, 112.68], [116.0, 116.14], [116.0, 117.51], [118.0, 119.52], [126.0, 126.87], [144.0, 150.2], [151.0, 152.81], [155.0, 155.76], [158.0, 158.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 54.56, 0.0, 0.0, 97.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 1.46, 1.63, 0.51, -0.22, 5.12, 0.6, 0.31, 2.9, 1.14, 0.04, 0.14, 0.68, 0.14, 1.51, 1.52, 0.87, 6.2, 1.81, 0.76, 0.82]} \ No newline at end of file diff --git a/annotations_1/jjPq-r91oB4_filtered.json b/annotations_1/jjPq-r91oB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfd79ff37842787eef01675c63aa1c8703337f7f --- /dev/null +++ b/annotations_1/jjPq-r91oB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.86], [16.0, 20.39], [21.0, 23.31], [25.0, 27.7], [51.0, 51.49], [54.0, 56.29], [82.0, 83.22], [84.0, 85.67], [86.0, 87.03], [94.0, 97.11], [102.0, 103.79], [106.0, 107.94], [120.0, 119.92], [126.0, 127.62], [129.0, 130.17], [151.0, 160.27], [162.0, 169.26], [171.0, 171.76], [176.0, 176.01], [177.0, 182.63], [190.0, 192.11]], "keep_status": [true, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [30.05, 32.43, 85.9, 34.26, 0.0, 32.13, 0.0, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 43.64, 40.97, 0.0, 0.0, 37.86, 38.94], "audiomae_on_audioset": [[["siren", 24.5], ["emergency vehicle", 23.1], ["police car (siren)", 19.24]], [["whack, thwack", 27.43], ["breaking", 12.65], ["speech", 8.08]], null, [["speech", 28.18], ["music", 13.29], ["hum", 6.45]], null, [["music", 50.83], ["vehicle", 6.44], ["hum", 5.47]], null, null, null, null, null, null, null, null, null, [["music", 52.27], ["theremin", 19.52], ["ambient music", 6.42]], [["music", 56.12], ["ambient music", 16.09], ["theremin", 11.56]], null, null, [["speech", 29.51], ["music", 24.56], ["didgeridoo", 10.16]], [["music", 32.45], ["hum", 13.65], ["throbbing", 7.54]]], "duration": [2.86, 4.39, 2.31, 2.7, 0.49, 2.29, 1.22, 1.67, 1.03, 3.11, 1.79, 1.94, -0.08, 1.62, 1.17, 9.27, 7.26, 0.76, 0.01, 5.63, 2.11]} \ No newline at end of file diff --git a/annotations_1/jjpQORCD0ZU_filtered.json b/annotations_1/jjpQORCD0ZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..628739a49b26e470f896d3d010a73ebfefef2907 --- /dev/null +++ b/annotations_1/jjpQORCD0ZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.39], [7.0, 6.88], [8.0, 8.48], [11.0, 11.45], [13.0, 13.17], [18.0, 18.93], [20.0, 20.98], [22.0, 21.86], [30.0, 30.81], [36.0, 36.14], [39.0, 39.04], [40.0, 40.59], [48.0, 48.0], [51.0, 51.71], [52.0, 52.79], [55.0, 55.9], [58.0, 57.86], [64.0, 64.17], [66.0, 65.82], [67.0, 67.14], [73.0, 73.26], [75.0, 76.55], [79.0, 79.95], [106.0, 107.96], [109.0, 110.25], [118.0, 118.98], [121.0, 122.52], [126.0, 126.99], [128.0, 128.85], [129.0, 130.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.39, -0.12, 0.48, 0.45, 0.17, 0.93, 0.98, -0.14, 0.81, 0.14, 0.04, 0.59, 0.0, 0.71, 0.79, 0.9, -0.14, 0.17, -0.18, 0.14, 0.26, 1.55, 0.95, 1.96, 1.25, 0.98, 1.52, 0.99, 0.85, 1.05]} \ No newline at end of file diff --git a/annotations_1/jjwg2PeDUxM_filtered.json b/annotations_1/jjwg2PeDUxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39ad2b7c5a1c82eb4dfe3e2f3b70c9ac345fa691 --- /dev/null +++ b/annotations_1/jjwg2PeDUxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.5], [9.0, 10.57], [12.0, 17.37], [23.0, 31.51], [32.0, 33.45], [36.0, 36.73], [38.0, 38.69], [40.0, 42.58], [43.0, 53.32], [54.0, 54.43], [55.0, 55.34], [57.0, 58.19], [62.0, 66.04], [70.0, 70.04], [71.0, 72.03], [74.0, 74.14], [75.0, 75.66], [78.0, 77.68], [78.0, 82.92], [94.0, 102.93], [103.0, 103.82], [104.0, 109.85], [115.0, 127.3], [128.0, 138.25], [141.0, 140.63], [141.0, 142.37], [143.0, 143.29], [145.0, 145.67], [147.0, 149.49], [153.0, 153.94], [154.0, 154.53], [155.0, 173.16], [173.0, 174.07], [175.0, 183.61]], "keep_status": [true, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [33.15, 0.0, 33.54, 30.06, 0.0, 0.0, 0.0, 31.22, 29.34, 0.0, 0.0, 0.0, 28.91, 0.0, 0.0, 0.0, 0.0, 0.0, 28.59, 29.32, 0.0, 28.85, 30.99, 28.76, 0.0, 0.0, 0.0, 0.0, 29.05, 0.0, 0.0, 28.93, 0.0, 29.51], "audiomae_on_audioset": [[["didgeridoo", 38.71], ["mains hum", 14.13], ["hum", 12.75]], null, [["music", 20.2], ["throbbing", 15.75], ["speech", 15.18]], [["speech", 23.88], ["hum", 12.54], ["music", 11.59]], null, null, null, [["oink", 12.49], ["beatboxing", 10.08], ["pig", 8.59]], [["speech", 61.24], ["music", 10.87], ["hum", 3.56]], null, null, null, [["music", 48.92], ["speech", 20.21], ["didgeridoo", 14.43]], null, null, null, null, null, [["speech", 40.53], ["buzz", 27.1], ["electric shaver, electric razor", 4.11]], [["music", 53.44], ["throbbing", 6.63], ["electronic music", 4.22]], null, [["speech", 59.31], ["music", 9.22], ["whack, thwack", 6.53]], [["didgeridoo", 22.67], ["music", 22.42], ["hum", 20.31]], [["music", 34.56], ["throbbing", 15.91], ["hum", 9.36]], null, null, null, null, [["music", 62.45], ["speech", 10.79], ["electronic music", 2.45]], null, null, [["music", 49.41], ["speech", 7.41], ["livestock, farm animals, working animals", 7.12]], null, [["grunt", 67.45], ["speech", 5.01], ["groan", 4.99]]], "duration": [4.5, 1.57, 5.37, 8.51, 1.45, 0.73, 0.69, 2.58, 10.32, 0.43, 0.34, 1.19, 4.04, 0.04, 1.03, 0.14, 0.66, -0.32, 4.92, 8.93, 0.82, 5.85, 12.3, 10.25, -0.37, 1.37, 0.29, 0.67, 2.49, 0.94, 0.53, 18.16, 1.07, 8.61]} \ No newline at end of file diff --git a/annotations_1/jk2mjuWhQ_0_filtered.json b/annotations_1/jk2mjuWhQ_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8e6ec14b217b264ce0a9d9acdf7128bbea4fefe --- /dev/null +++ b/annotations_1/jk2mjuWhQ_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.08], [7.0, 15.13], [16.0, 16.9], [19.0, 21.61], [22.0, 31.26], [37.0, 60.61], [61.0, 62.28], [63.0, 72.23], [73.0, 73.67], [75.0, 84.0], [86.0, 88.72], [89.0, 91.34], [93.0, 93.92], [95.0, 113.88], [115.0, 121.02], [124.0, 131.77]], "keep_status": [true, false, false, false, true, false, false, false, false, false, true, false, false, false, true, true], "silence_prob": [37.37, 36.14, 0.0, 43.93, 35.27, 32.71, 0.0, 36.1, 0.0, 35.54, 33.42, 32.56, 0.0, 33.36, 35.42, 38.86], "audiomae_on_audioset": [[["music", 19.21], ["throbbing", 15.1], ["hum", 13.81]], [["hum", 50.91], ["music", 18.94], ["throbbing", 10.16]], null, [["music", 42.79], ["throbbing", 17.85], ["hum", 14.72]], [["hum", 22.08], ["mains hum", 18.18], ["music", 11.14]], [["music", 79.19], ["hum", 4.37], ["throbbing", 3.76]], null, [["hum", 54.28], ["mains hum", 17.5], ["speech", 8.13]], null, [["music", 36.98], ["speech", 18.74], ["hum", 17.92]], [["mains hum", 28.98], ["hum", 21.65], ["speech", 15.14]], [["music", 64.13], ["speech", 9.54], ["throbbing", 2.23]], null, [["music", 63.93], ["hum", 5.11], ["coin (dropping)", 4.59]], [["hum", 21.84], ["music", 15.86], ["mains hum", 14.43]], [["hum", 29.94], ["music", 27.26], ["mains hum", 12.57]]], "duration": [2.08, 8.13, 0.9, 2.61, 9.26, 23.61, 1.28, 9.23, 0.67, 9.0, 2.72, 2.34, 0.92, 18.88, 6.02, 7.77]} \ No newline at end of file diff --git a/annotations_1/jkmyjHYMH0Q_filtered.json b/annotations_1/jkmyjHYMH0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29984b95c4b20cc53ad42dff92d8feb69f7b05c7 --- /dev/null +++ b/annotations_1/jkmyjHYMH0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[120.0, 121.68], [123.0, 127.92], [147.0, 147.92], [158.0, 158.65], [169.0, 170.28], [171.0, 173.89]], "keep_status": [false, true, false, false, false, true], "silence_prob": [0.0, 30.88, 0.0, 0.0, 0.0, 40.14], "audiomae_on_audioset": [null, [["music", 45.89], ["synthesizer", 13.2], ["speech", 8.65]], null, null, null, [["music", 32.52], ["sonar", 14.73], ["synthesizer", 13.09]]], "duration": [1.68, 4.92, 0.92, 0.65, 1.28, 2.89]} \ No newline at end of file diff --git a/annotations_1/jlCEAJXSwJc_filtered.json b/annotations_1/jlCEAJXSwJc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef749447f645e36e855442aafdac83bc9e61fece --- /dev/null +++ b/annotations_1/jlCEAJXSwJc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[134.0, 133.95]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [-0.05]} \ No newline at end of file diff --git a/annotations_1/jlcZPO2FhGE_filtered.json b/annotations_1/jlcZPO2FhGE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12949b5a1c72a506e8155ad8dc60ce8c67552834 --- /dev/null +++ b/annotations_1/jlcZPO2FhGE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.01], [4.0, 9.76], [10.0, 24.92], [27.0, 26.96], [27.0, 28.21], [30.0, 34.16], [35.0, 39.85], [41.0, 41.62], [45.0, 46.58], [47.0, 48.39], [55.0, 56.08], [57.0, 58.06], [59.0, 59.7], [61.0, 62.92], [64.0, 64.15], [68.0, 68.03], [70.0, 71.52], [72.0, 72.28], [76.0, 84.62], [85.0, 86.88], [88.0, 93.36], [94.0, 95.1], [99.0, 102.79], [106.0, 105.98], [106.0, 107.1], [112.0, 112.95], [114.0, 114.64], [115.0, 116.58], [117.0, 118.07], [119.0, 120.06], [121.0, 121.22], [122.0, 122.98]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [88.46, 54.7, 46.4, 0.0, 0.0, 34.76, 40.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.83, 0.0, 38.97, 0.0, 44.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 33.08], ["speech", 17.2], ["ping", 8.39]], null, null, [["music", 56.05], ["didgeridoo", 21.42], ["speech", 3.91]], [["music", 48.24], ["didgeridoo", 9.73], ["hum", 8.04]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.36], ["music", 29.5], ["musical instrument", 4.38]], null, [["music", 60.15], ["didgeridoo", 16.78], ["musical instrument", 8.86]], null, [["music", 21.39], ["throbbing", 9.43], ["hum", 9.08]], null, null, null, null, null, null, null, null, null], "duration": [2.01, 5.76, 14.92, -0.04, 1.21, 4.16, 4.85, 0.62, 1.58, 1.39, 1.08, 1.06, 0.7, 1.92, 0.15, 0.03, 1.52, 0.28, 8.62, 1.88, 5.36, 1.1, 3.79, -0.02, 1.1, 0.95, 0.64, 1.58, 1.07, 1.06, 0.22, 0.98]} \ No newline at end of file diff --git a/annotations_1/jmC2y7EsXqk_filtered.json b/annotations_1/jmC2y7EsXqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17e9fea5205700744703478d66e77e2c18a3b823 --- /dev/null +++ b/annotations_1/jmC2y7EsXqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.45], [13.0, 12.53], [14.0, 32.05], [32.0, 35.68], [40.0, 42.58], [45.0, 46.01], [49.0, 49.35], [50.0, 63.09], [63.0, 63.15]], "keep_status": [false, false, false, true, false, false, false, false, false], "silence_prob": [31.8, 0.0, 32.68, 37.22, 75.55, 0.0, 0.0, 58.3, 0.0], "audiomae_on_audioset": [[["music", 65.51], ["synthesizer", 3.9], ["sampler", 3.46]], null, [["music", 55.52], ["speech", 12.68], ["sidetone", 6.55]], [["music", 23.76], ["thunk", 21.46], ["whack, thwack", 10.09]], null, null, null, null, null], "duration": [5.45, -0.47, 18.05, 3.68, 2.58, 1.01, 0.35, 13.09, 0.15]} \ No newline at end of file diff --git a/annotations_1/jmuC1ebmYQg_filtered.json b/annotations_1/jmuC1ebmYQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6cf304acbb46e3aa9414929e87a0a76d7bf789d8 --- /dev/null +++ b/annotations_1/jmuC1ebmYQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [5.0, 13.14], [15.0, 15.82], [18.0, 22.3], [39.0, 39.58], [43.0, 43.58], [45.0, 46.31], [47.0, 47.24], [54.0, 54.46], [55.0, 56.81], [59.0, 59.58], [60.0, 61.4], [62.0, 62.94], [67.0, 69.94], [72.0, 73.47], [74.0, 79.64], [85.0, 86.7], [90.0, 90.15], [93.0, 93.83], [94.0, 94.07], [95.0, 96.01], [97.0, 97.53], [98.0, 110.42], [111.0, 112.97], [116.0, 117.37], [119.0, 119.38], [124.0, 127.57], [128.0, 130.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 74.29, 0.0, 79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 0.0, 34.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 77.53, 62.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.58], ["speech", 14.92], ["scratching (performance technique)", 2.69]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.35, 8.14, 0.82, 4.3, 0.58, 0.58, 1.31, 0.24, 0.46, 1.81, 0.58, 1.4, 0.94, 2.94, 1.47, 5.64, 1.7, 0.15, 0.83, 0.07, 1.01, 0.53, 12.42, 1.97, 1.37, 0.38, 3.57, 2.89]} \ No newline at end of file diff --git a/annotations_1/jn_D02Tvr4k_filtered.json b/annotations_1/jn_D02Tvr4k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb7e6ce3625fa7e0c6a0d1389dac7fcc92a5fa93 --- /dev/null +++ b/annotations_1/jn_D02Tvr4k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.33], [5.0, 5.93], [7.0, 7.21], [10.0, 12.7], [14.0, 15.67], [17.0, 17.95], [19.0, 19.33], [21.0, 22.2], [25.0, 26.3], [27.0, 29.42], [31.0, 31.99], [34.0, 34.65], [37.0, 37.47], [39.0, 39.43], [40.0, 42.15], [44.0, 46.63], [48.0, 47.9], [51.0, 51.83], [57.0, 59.37], [63.0, 66.26], [68.0, 70.39], [75.0, 79.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.97, 99.62, 0.0, 0.0, 76.86, 58.38, 100.0, 91.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.33, 0.93, 0.21, 2.7, 1.67, 0.95, 0.33, 1.2, 1.3, 2.42, 0.99, 0.65, 0.47, 0.43, 2.15, 2.63, -0.1, 0.83, 2.37, 3.26, 2.39, 4.91]} \ No newline at end of file diff --git a/annotations_1/jo-aQkgNMKQ_filtered.json b/annotations_1/jo-aQkgNMKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..921b78ec8a45848bbf824e58168b0ac389bca388 --- /dev/null +++ b/annotations_1/jo-aQkgNMKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.62], [10.0, 10.98], [11.0, 14.69], [19.0, 38.55], [40.0, 39.99], [41.0, 41.76], [42.0, 44.59], [47.0, 47.93], [50.0, 51.61], [55.0, 56.54], [58.0, 58.56], [62.0, 62.94], [66.0, 66.83], [67.0, 67.59], [69.0, 69.85], [70.0, 70.55], [80.0, 80.06], [82.0, 83.05], [88.0, 89.72], [92.0, 92.42], [95.0, 95.96], [97.0, 98.9], [106.0, 106.54], [111.0, 111.5], [115.0, 117.96], [119.0, 122.0], [124.0, 125.0], [126.0, 126.84], [130.0, 131.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 57.97, 54.7, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.86, 74.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.98, 3.69, 19.55, -0.01, 0.76, 2.59, 0.93, 1.61, 1.54, 0.56, 0.94, 0.83, 0.59, 0.85, 0.55, 0.06, 1.05, 1.72, 0.42, 0.96, 1.9, 0.54, 0.5, 2.96, 3.0, 1.0, 0.84, 1.53]} \ No newline at end of file diff --git a/annotations_1/jojFdN-oysU_filtered.json b/annotations_1/jojFdN-oysU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e53897332db113ec72177cd6566f319f07b6dfc --- /dev/null +++ b/annotations_1/jojFdN-oysU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 41.72], [42.0, 45.87], [52.0, 52.29], [53.0, 98.24], [103.0, 103.82], [105.0, 116.06], [128.0, 130.79]], "keep_status": [false, false, false, false, false, true, true], "silence_prob": [29.71, 32.03, 0.0, 0.0, 0.0, 29.18, 30.45], "audiomae_on_audioset": [[["music", 71.34], ["throbbing", 10.16], ["electronic music", 3.54]], [["livestock, farm animals, working animals", 43.81], ["cattle, bovinae", 35.45], ["moo", 18.13]], null, null, null, [["music", 45.25], ["didgeridoo", 9.0], ["speech", 3.69]], [["music", 31.74], ["theremin", 24.36], ["mains hum", 11.85]]], "duration": [12.72, 3.87, 0.29, 45.24, 0.82, 11.06, 2.79]} \ No newline at end of file diff --git a/annotations_1/jpEfgrff8z0_filtered.json b/annotations_1/jpEfgrff8z0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c97f90fe567006b5b7f2c5f9e258e0d7764fd814 --- /dev/null +++ b/annotations_1/jpEfgrff8z0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 4.72], [23.0, 23.38], [32.0, 35.94], [51.0, 51.31], [54.0, 54.09], [61.0, 61.8], [64.0, 63.78], [74.0, 73.99], [81.0, 85.06], [94.0, 95.07], [98.0, 103.28], [135.0, 136.56], [140.0, 140.17], [148.0, 149.52], [174.0, 177.5]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [99.98, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 31.02, 0.0, 65.67, 0.0, 0.0, 0.0, 32.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 19.37], ["music", 15.54], ["speech", 15.19]], null, null, null, null, null, [["music", 40.03], ["speech", 32.56], ["thunk", 10.13]]], "duration": [4.72, 0.38, 3.94, 0.31, 0.09, 0.8, -0.22, -0.01, 4.06, 1.07, 5.28, 1.56, 0.17, 1.52, 3.5]} \ No newline at end of file diff --git a/annotations_1/jpTj6qTyIwY_filtered.json b/annotations_1/jpTj6qTyIwY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..640d0e5ef69ab8fa73b4697a232d15ab657bb457 --- /dev/null +++ b/annotations_1/jpTj6qTyIwY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.74], [16.0, 16.63], [17.0, 17.9], [19.0, 19.62], [28.0, 36.95], [37.0, 47.92], [48.0, 52.2], [55.0, 64.5], [66.0, 67.24], [70.0, 76.5], [77.0, 78.38], [81.0, 81.84], [83.0, 87.2], [90.0, 102.93], [105.0, 104.72], [105.0, 105.31], [106.0, 113.53], [116.0, 133.74], [135.0, 135.55], [139.0, 141.34], [143.0, 143.8], [144.0, 156.34]], "keep_status": [false, false, false, false, false, true, true, true, false, false, false, false, true, false, false, false, true, true, false, false, false, false], "silence_prob": [52.05, 0.0, 0.0, 0.0, 36.6, 39.4, 42.72, 40.19, 0.0, 45.4, 0.0, 0.0, 35.99, 36.04, 0.0, 0.0, 34.58, 40.43, 0.0, 36.62, 0.0, 35.37], "audiomae_on_audioset": [null, null, null, null, [["music", 69.91], ["hum", 5.26], ["throbbing", 3.66]], [["hum", 27.91], ["speech", 19.81], ["mains hum", 12.1]], [["music", 25.18], ["hum", 22.7], ["speech", 9.51]], [["speech", 24.87], ["music", 22.35], ["sheep", 4.47]], null, [["speech", 41.93], ["music", 33.44], ["sidetone", 3.88]], null, null, [["didgeridoo", 25.15], ["groan", 17.71], ["music", 14.87]], [["livestock, farm animals, working animals", 33.01], ["cattle, bovinae", 30.35], ["moo", 24.11]], null, null, [["music", 29.43], ["fly, housefly", 11.49], ["cattle, bovinae", 8.38]], [["speech", 42.2], ["cattle, bovinae", 8.57], ["livestock, farm animals, working animals", 6.31]], null, [["whale vocalization", 88.98], ["moo", 1.33], ["livestock, farm animals, working animals", 0.85]], null, [["music", 50.17], ["speech", 26.75], ["musical instrument", 1.28]]], "duration": [4.74, 0.63, 0.9, 0.62, 8.95, 10.92, 4.2, 9.5, 1.24, 6.5, 1.38, 0.84, 4.2, 12.93, -0.28, 0.31, 7.53, 17.74, 0.55, 2.34, 0.8, 12.34]} \ No newline at end of file diff --git a/annotations_1/jpoR10Zh0ig_filtered.json b/annotations_1/jpoR10Zh0ig_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c146f91cef5b4512bd4e8793b08f5de78abc97d --- /dev/null +++ b/annotations_1/jpoR10Zh0ig_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [6.0, 6.59], [8.0, 10.12], [12.0, 14.18], [16.0, 16.88], [19.0, 19.26], [21.0, 22.17], [24.0, 34.4], [37.0, 37.79], [40.0, 41.07], [45.0, 45.99], [48.0, 48.84], [50.0, 51.63], [56.0, 57.6], [61.0, 61.42], [62.0, 62.11], [63.0, 64.05], [66.0, 66.6], [67.0, 69.01], [71.0, 72.91], [74.0, 74.51], [75.0, 76.28], [79.0, 80.47], [88.0, 88.3], [94.0, 95.45], [97.0, 97.43], [98.0, 99.23], [108.0, 111.06], [117.0, 117.9], [121.0, 122.32], [123.0, 124.24], [126.0, 126.91], [128.0, 128.85], [132.0, 132.07], [133.0, 134.0], [139.0, 138.99], [145.0, 158.75], [160.0, 161.3], [163.0, 163.78], [165.0, 166.23], [167.0, 171.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.95, 66.51, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.01, 0.0, 0.0, 0.0, 79.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.67, 0.59, 2.12, 2.18, 0.88, 0.26, 1.17, 10.4, 0.79, 1.07, 0.99, 0.84, 1.63, 1.6, 0.42, 0.11, 1.05, 0.6, 2.01, 1.91, 0.51, 1.28, 1.47, 0.3, 1.45, 0.43, 1.23, 3.06, 0.9, 1.32, 1.24, 0.91, 0.85, 0.07, 1.0, -0.01, 13.75, 1.3, 0.78, 1.23, 4.83]} \ No newline at end of file diff --git a/annotations_1/jq_tO6NAlPI_filtered.json b/annotations_1/jq_tO6NAlPI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..958f09e3f3d437cbc7364f020e633fbc1de93e81 --- /dev/null +++ b/annotations_1/jq_tO6NAlPI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.54], [21.0, 31.29], [34.0, 35.77], [38.0, 39.63], [43.0, 43.97], [46.0, 48.39], [51.0, 51.49], [53.0, 54.41], [55.0, 56.64], [66.0, 66.82], [67.0, 66.85], [75.0, 75.17], [87.0, 90.63], [106.0, 111.45], [116.0, 119.3], [124.0, 125.51], [126.0, 127.67], [131.0, 140.16], [174.0, 178.51], [179.0, 179.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.52, 85.54, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.28, 32.19, 31.37, 0.0, 0.0, 30.52, 30.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.95], ["boing", 18.1], ["didgeridoo", 13.41]], [["music", 57.83], ["speech", 18.45], ["musical instrument", 2.7]], [["music", 60.21], ["didgeridoo", 17.0], ["boing", 5.39]], null, null, [["music", 90.58], ["didgeridoo", 1.97], ["electronic music", 1.28]], [["music", 61.35], ["boing", 9.33], ["didgeridoo", 3.69]], null], "duration": [2.54, 10.29, 1.77, 1.63, 0.97, 2.39, 0.49, 1.41, 1.64, 0.82, -0.15, 0.17, 3.63, 5.45, 3.3, 1.51, 1.67, 9.16, 4.51, 0.41]} \ No newline at end of file diff --git a/annotations_1/jqpkvCebSmU_filtered.json b/annotations_1/jqpkvCebSmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09226084c53d3dc14f670445c75080e208911350 --- /dev/null +++ b/annotations_1/jqpkvCebSmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 18.79], [20.0, 61.69], [62.0, 80.84], [82.0, 82.21], [87.0, 91.57], [92.0, 92.65]], "keep_status": [false, false, false, false, false, false], "silence_prob": [64.07, 0.0, 83.16, 0.0, 67.13, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [6.79, 41.69, 18.84, 0.21, 4.57, 0.65]} \ No newline at end of file diff --git a/annotations_1/jqzTeVVmTvc_filtered.json b/annotations_1/jqzTeVVmTvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..517139ccb57e5af66684dbe575dd08e2b23fffd6 --- /dev/null +++ b/annotations_1/jqzTeVVmTvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.58], [8.0, 8.94], [12.0, 15.06], [16.0, 31.72], [32.0, 33.56], [34.0, 153.57]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.95, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.58, 0.94, 3.06, 15.72, 1.56, 119.57]} \ No newline at end of file diff --git a/annotations_1/js11RqXLkZg_filtered.json b/annotations_1/js11RqXLkZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10f102616a04dfce4fb5d58746f7d9fc0ed14c0b --- /dev/null +++ b/annotations_1/js11RqXLkZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.58], [14.0, 29.07], [32.0, 33.39], [35.0, 37.1], [41.0, 42.47], [45.0, 46.01], [47.0, 49.23], [50.0, 52.86], [55.0, 56.98], [62.0, 64.5], [65.0, 68.0], [69.0, 74.38], [75.0, 79.56], [81.0, 84.82], [86.0, 86.78], [88.0, 89.85], [91.0, 95.3], [98.0, 100.67], [102.0, 106.19], [107.0, 109.16], [111.0, 121.66], [123.0, 126.81], [128.0, 129.22], [130.0, 132.7], [135.0, 139.08]], "keep_status": [false, false, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 46.57, 0.0, 0.0, 69.07, 40.07, 0.0, 98.99, 38.67, 99.91, 67.0, 53.22, 0.0, 0.0, 96.04, 51.28, 99.87, 98.51, 97.22, 72.16, 0.0, 93.45, 60.6], "audiomae_on_audioset": [null, null, null, [["sidetone", 24.88], ["speech", 17.51], ["music", 12.72]], null, null, null, [["music", 44.89], ["musical instrument", 6.47], ["hum", 6.27]], null, null, [["didgeridoo", 15.87], ["cattle, bovinae", 12.13], ["moo", 11.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.42, 15.07, 1.39, 2.1, 1.47, 1.01, 2.23, 2.86, 1.98, 2.5, 3.0, 5.38, 4.56, 3.82, 0.78, 1.85, 4.3, 2.67, 4.19, 2.16, 10.66, 3.81, 1.22, 2.7, 4.08]} \ No newline at end of file diff --git a/annotations_1/jsUGvhq2MLM_filtered.json b/annotations_1/jsUGvhq2MLM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f2b2cf476a0d51839d24e78ddd42dc2807621ff --- /dev/null +++ b/annotations_1/jsUGvhq2MLM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 18.0], [18.0, 19.14], [20.0, 25.37], [26.0, 26.92], [27.0, 32.49], [34.0, 41.59], [44.0, 47.06], [52.0, 55.68], [56.0, 60.13], [62.0, 65.37], [66.0, 66.92], [67.0, 86.51], [91.0, 93.65], [101.0, 104.13], [107.0, 111.74], [112.0, 122.98], [126.0, 142.15], [146.0, 147.07], [149.0, 162.38], [163.0, 167.68]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [30.35, 0.0, 30.38, 0.0, 30.55, 30.14, 40.55, 59.15, 63.53, 71.14, 0.0, 48.56, 41.09, 48.35, 41.48, 51.07, 32.94, 0.0, 32.18, 32.03], "audiomae_on_audioset": [[["music", 86.1], ["musical instrument", 1.23], ["singing", 1.2]], null, [["music", 38.15], ["moo", 12.18], ["cattle, bovinae", 10.04]], null, [["music", 78.48], ["theremin", 1.52], ["funk", 1.25]], [["music", 71.37], ["didgeridoo", 8.41], ["theremin", 2.11]], [["music", 21.43], ["snicker", 18.44], ["chuckle, chortle", 14.97]], null, null, null, null, [["music", 58.47], ["speech", 18.73], ["inside, small room", 4.95]], [["music", 21.09], ["didgeridoo", 18.38], ["tabla", 9.68]], [["speech", 23.02], ["music", 20.87], ["didgeridoo", 4.28]], [["speech", 24.72], ["sidetone", 17.91], ["didgeridoo", 10.0]], null, [["music", 79.56], ["musical instrument", 2.92], ["synthesizer", 1.77]], null, [["music", 82.73], ["swing music", 2.61], ["musical instrument", 2.3]], [["music", 57.6], ["musical instrument", 10.86], ["brass instrument", 4.85]]], "duration": [14.0, 1.14, 5.37, 0.92, 5.49, 7.59, 3.06, 3.68, 4.13, 3.37, 0.92, 19.51, 2.65, 3.13, 4.74, 10.98, 16.15, 1.07, 13.38, 4.68]} \ No newline at end of file diff --git a/annotations_1/jsbjmWo3c38_filtered.json b/annotations_1/jsbjmWo3c38_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58a0f66b299d93738408ef49873be4f4b26512c9 --- /dev/null +++ b/annotations_1/jsbjmWo3c38_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 23.92], [25.0, 32.12], [37.0, 37.94], [41.0, 56.17], [58.0, 64.98], [67.0, 72.54], [74.0, 79.32], [81.0, 81.38], [83.0, 87.08], [90.0, 101.11]], "keep_status": [true, false, false, true, true, true, true, false, true, false], "silence_prob": [46.15, 30.68, 0.0, 30.28, 29.69, 30.16, 34.18, 0.0, 33.61, 30.66], "audiomae_on_audioset": [[["music", 46.71], ["synthesizer", 5.98], ["hum", 4.36]], [["speech", 56.75], ["music", 18.04], ["sidetone", 5.35]], null, [["music", 27.84], ["hum", 17.39], ["mains hum", 10.17]], [["music", 54.81], ["electronic music", 5.96], ["synthesizer", 4.8]], [["music", 46.66], ["noise", 7.29], ["cacophony", 6.34]], [["music", 41.15], ["hum", 8.08], ["mains hum", 5.6]], null, [["music", 21.47], ["speech", 9.23], ["vehicle", 2.32]], [["speech", 62.17], ["music", 11.0], ["didgeridoo", 4.95]]], "duration": [9.92, 7.12, 0.94, 15.17, 6.98, 5.54, 5.32, 0.38, 4.08, 11.11]} \ No newline at end of file diff --git a/annotations_1/jsyzJJFZzsg_filtered.json b/annotations_1/jsyzJJFZzsg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a523935cc8def32ada980c19f86f6ef1c5eab0ec --- /dev/null +++ b/annotations_1/jsyzJJFZzsg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [10.0, 15.94], [25.0, 26.03], [27.0, 40.05], [65.0, 75.73], [77.0, 81.8], [83.0, 86.51], [87.0, 90.26]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [0.0, 54.5, 0.0, 40.64, 46.83, 67.13, 70.72, 66.03], "audiomae_on_audioset": [null, null, null, [["music", 52.1], ["cello", 4.96], ["double bass", 3.89]], [["music", 56.54], ["theremin", 14.67], ["musical instrument", 4.03]], null, null, null], "duration": [0.43, 5.94, 1.03, 13.05, 10.73, 4.8, 3.51, 3.26]} \ No newline at end of file diff --git a/annotations_1/jt2BPBAWiEQ_filtered.json b/annotations_1/jt2BPBAWiEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eb22cf7620b93323fbd5f1ac7991f54aa5526c4 --- /dev/null +++ b/annotations_1/jt2BPBAWiEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.55], [15.0, 15.63], [19.0, 20.49], [34.0, 36.61], [56.0, 59.24], [61.0, 61.26], [62.0, 62.83], [70.0, 74.31], [79.0, 78.95], [80.0, 80.99], [85.0, 88.38], [90.0, 91.15], [92.0, 95.4]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 49.54, 50.21, 0.0, 0.0, 46.26, 0.0, 0.0, 34.6, 0.0, 35.77], "audiomae_on_audioset": [null, null, null, [["hum", 33.27], ["throbbing", 25.51], ["music", 20.51]], null, null, null, [["music", 42.14], ["throbbing", 11.67], ["boing", 3.53]], null, null, [["hum", 25.93], ["speech", 18.82], ["mains hum", 10.99]], null, [["speech", 54.35], ["hum", 12.72], ["throbbing", 4.78]]], "duration": [1.55, 0.63, 1.49, 2.61, 3.24, 0.26, 0.83, 4.31, -0.05, 0.99, 3.38, 1.15, 3.4]} \ No newline at end of file diff --git a/annotations_1/jtSnHOkSJxM_filtered.json b/annotations_1/jtSnHOkSJxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/jtSnHOkSJxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/ju9K6nk07iE_filtered.json b/annotations_1/ju9K6nk07iE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4c09bcaeb2618060424021e71116d9ff14393be --- /dev/null +++ b/annotations_1/ju9K6nk07iE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.77], [19.0, 27.68], [32.0, 44.19], [46.0, 49.82], [51.0, 182.36], [182.0, 186.87], [188.0, 188.32], [191.0, 192.13], [194.0, 199.3], [201.0, 205.11], [206.0, 212.33], [214.0, 218.98], [221.0, 223.13], [225.0, 226.83]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.94, 35.67, 38.47, 0.0, 62.47, 0.0, 0.0, 90.25, 93.13, 87.55, 82.79, 79.59, 0.0], "audiomae_on_audioset": [null, [["music", 71.36], ["theremin", 9.08], ["musical instrument", 2.44]], [["music", 42.62], ["theremin", 8.84], ["piano", 6.32]], [["music", 45.59], ["theremin", 16.92], ["cello", 3.22]], null, null, null, null, null, null, null, null, null, null], "duration": [1.77, 8.68, 12.19, 3.82, 131.36, 4.87, 0.32, 1.13, 5.3, 4.11, 6.33, 4.98, 2.13, 1.83]} \ No newline at end of file diff --git a/annotations_1/jv6-p4kphmc_filtered.json b/annotations_1/jv6-p4kphmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59975c974620a2320a328ceeb4cabfa661be0865 --- /dev/null +++ b/annotations_1/jv6-p4kphmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.18], [16.0, 19.09], [21.0, 21.68], [23.0, 23.4], [24.0, 26.45], [28.0, 34.79], [36.0, 37.79], [39.0, 58.38], [59.0, 60.69], [61.0, 69.74], [75.0, 76.06], [79.0, 81.48], [82.0, 87.27], [89.0, 89.36], [96.0, 97.95], [100.0, 101.26], [102.0, 102.68], [107.0, 107.25], [108.0, 108.24], [109.0, 109.59], [111.0, 116.83], [118.0, 120.38], [121.0, 125.88], [129.0, 130.11], [131.0, 131.85], [133.0, 133.78], [134.0, 135.18]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 85.72, 0.0, 0.0, 42.11, 85.9, 0.0, 96.54, 0.0, 87.19, 0.0, 51.23, 51.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.63, 42.22, 63.1, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 21.62], ["hum", 20.74], ["music", 14.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.83], ["musical instrument", 6.72], ["speech", 3.94]], null, null, null, null, null], "duration": [1.18, 3.09, 0.68, 0.4, 2.45, 6.79, 1.79, 19.38, 1.69, 8.74, 1.06, 2.48, 5.27, 0.36, 1.95, 1.26, 0.68, 0.25, 0.24, 0.59, 5.83, 2.38, 4.88, 1.11, 0.85, 0.78, 1.18]} \ No newline at end of file diff --git a/annotations_1/jvBp6TqoHWw_filtered.json b/annotations_1/jvBp6TqoHWw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95e81567ed467e6a5a615beb33e98cd609e28daf --- /dev/null +++ b/annotations_1/jvBp6TqoHWw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [3.0, 3.79], [5.0, 5.19], [11.0, 14.2], [15.0, 18.62], [22.0, 22.25], [24.0, 25.44], [27.0, 27.36], [30.0, 31.36], [34.0, 34.38], [34.0, 34.42], [34.0, 35.26], [44.0, 44.46], [48.0, 48.03], [50.0, 50.38], [51.0, 51.12], [52.0, 52.51], [55.0, 55.36], [56.0, 63.53], [65.0, 65.45], [75.0, 74.97], [76.0, 76.65], [87.0, 87.83], [89.0, 89.43], [89.0, 89.46], [90.0, 90.46], [93.0, 97.26], [100.0, 102.52], [109.0, 110.44], [111.0, 111.37], [112.0, 111.97], [115.0, 117.14], [118.0, 119.26], [120.0, 120.83], [123.0, 129.78], [131.0, 132.0], [132.0, 133.83], [135.0, 136.11], [138.0, 137.64], [140.0, 140.81], [143.0, 143.82], [144.0, 146.42], [150.0, 152.66], [154.0, 154.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 95.23, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 87.0, 0.0, 0.0, 0.0, 45.24, 0.0, 0.0, 38.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 39.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.97], ["music", 32.79], ["sidetone", 3.99]], null, null, [["music", 50.79], ["thunk", 18.93], ["musical instrument", 4.15]], null, null, null, null, null, null, null, [["music", 38.54], ["trombone", 12.03], ["brass instrument", 6.25]], null], "duration": [0.51, 0.79, 0.19, 3.2, 3.62, 0.25, 1.44, 0.36, 1.36, 0.38, 0.42, 1.26, 0.46, 0.03, 0.38, 0.12, 0.51, 0.36, 7.53, 0.45, -0.03, 0.65, 0.83, 0.43, 0.46, 0.46, 4.26, 2.52, 1.44, 0.37, -0.03, 2.14, 1.26, 0.83, 6.78, 1.0, 1.83, 1.11, -0.36, 0.81, 0.82, 2.42, 2.66, 0.35]} \ No newline at end of file diff --git a/annotations_1/jwjCPSUGPXU_filtered.json b/annotations_1/jwjCPSUGPXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd04fc0b908ee03dd9e7bb51ca9c35abb44e8706 --- /dev/null +++ b/annotations_1/jwjCPSUGPXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.28], [10.0, 11.69], [16.0, 17.58], [21.0, 22.38], [23.0, 24.58], [25.0, 27.04], [32.0, 32.58], [34.0, 34.4], [40.0, 40.74], [48.0, 49.5], [52.0, 52.56], [54.0, 56.03], [61.0, 60.69], [70.0, 72.23], [75.0, 78.44]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 44.84, 0.0, 0.0, 0.0, 0.0, 0.0, 42.44, 0.0, 36.27, 57.01], "audiomae_on_audioset": [null, null, null, null, null, [["sidetone", 29.39], ["music", 17.39], ["hum", 10.42]], null, null, null, null, null, [["whale vocalization", 30.24], ["music", 13.29], ["frog", 6.99]], null, [["grunt", 34.34], ["speech", 9.8], ["animal", 6.29]], null], "duration": [0.28, 1.69, 1.58, 1.38, 1.58, 2.04, 0.58, 0.4, 0.74, 1.5, 0.56, 2.03, -0.31, 2.23, 3.44]} \ No newline at end of file diff --git a/annotations_1/jwnPI-d36vU_filtered.json b/annotations_1/jwnPI-d36vU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34e027c639309c03de8dd9e1e645b2a2d15295a2 --- /dev/null +++ b/annotations_1/jwnPI-d36vU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 30.25], [31.0, 32.22], [33.0, 34.57], [36.0, 37.54], [38.0, 41.99], [43.0, 44.09], [45.0, 63.42], [64.0, 69.65], [70.0, 71.69], [72.0, 74.63], [77.0, 78.36], [80.0, 97.71], [98.0, 98.52], [101.0, 108.73], [110.0, 115.28], [118.0, 120.7], [122.0, 121.98], [122.0, 122.12], [122.0, 132.53], [133.0, 134.6], [136.0, 136.11], [141.0, 142.06], [144.0, 152.49]], "keep_status": [true, false, false, false, false, false, true, true, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [31.9, 0.0, 0.0, 0.0, 34.16, 0.0, 37.13, 39.01, 0.0, 34.98, 0.0, 31.04, 0.0, 30.18, 37.43, 36.57, 0.0, 0.0, 40.36, 0.0, 0.0, 0.0, 62.17], "audiomae_on_audioset": [[["music", 17.98], ["sound effect", 7.57], ["roar", 6.03]], null, null, null, [["noise", 77.11], ["music", 7.52], ["synthesizer", 1.63]], null, [["music", 38.95], ["didgeridoo", 10.51], ["noise", 9.83]], [["whale vocalization", 29.69], ["music", 25.91], ["speech", 7.88]], null, [["thunk", 42.94], ["whack, thwack", 15.0], ["music", 13.4]], null, [["music", 20.3], ["hum", 16.83], ["livestock, farm animals, working animals", 10.39]], null, [["music", 13.58], ["electric shaver, electric razor", 7.24], ["whack, thwack", 6.96]], [["hum", 28.71], ["music", 18.65], ["throbbing", 10.2]], [["speech", 43.58], ["music", 25.39], ["fart", 7.2]], null, null, [["speech", 44.61], ["music", 35.73], ["hum", 3.48]], null, null, null, null], "duration": [3.25, 1.22, 1.57, 1.54, 3.99, 1.09, 18.42, 5.65, 1.69, 2.63, 1.36, 17.71, 0.52, 7.73, 5.28, 2.7, -0.02, 0.12, 10.53, 1.6, 0.11, 1.06, 8.49]} \ No newline at end of file diff --git a/annotations_1/jyDUZd-Orlc_filtered.json b/annotations_1/jyDUZd-Orlc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba04fcb6c4968a359bec10154a7ed616f3404682 --- /dev/null +++ b/annotations_1/jyDUZd-Orlc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.42], [15.0, 20.49], [21.0, 26.08], [27.0, 27.26], [30.0, 68.22], [69.0, 82.98], [84.0, 86.46], [92.0, 92.94], [95.0, 96.23], [98.0, 106.2], [107.0, 107.45], [108.0, 109.36], [110.0, 113.66], [115.0, 160.42], [161.0, 161.25], [162.0, 162.99], [163.0, 175.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [99.4, 67.13, 92.31, 0.0, 0.0, 28.91, 30.12, 0.0, 0.0, 28.65, 0.0, 0.0, 29.12, 0.0, 0.0, 0.0, 41.91], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 73.13], ["music", 11.7], ["electronic music", 1.35]], [["music", 55.89], ["throbbing", 9.53], ["speech", 4.94]], null, null, [["speech", 46.06], ["music", 40.55], ["hum", 3.02]], null, null, [["music", 27.55], ["speech", 18.95], ["hum", 13.48]], null, null, null, [["music", 33.02], ["gasp", 11.33], ["groan", 10.0]]], "duration": [4.42, 5.49, 5.08, 0.26, 38.22, 13.98, 2.46, 0.94, 1.23, 8.2, 0.45, 1.36, 3.66, 45.42, 0.25, 0.99, 12.85]} \ No newline at end of file diff --git a/annotations_1/jyNtMzHeJ6I_filtered.json b/annotations_1/jyNtMzHeJ6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1294b72e7b253889550d8c08c77dc42a3e6439ee --- /dev/null +++ b/annotations_1/jyNtMzHeJ6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.09], [16.0, 16.97], [26.0, 26.7], [29.0, 30.27], [33.0, 34.42], [35.0, 36.9], [41.0, 43.28], [43.0, 43.46], [43.0, 47.12], [49.0, 50.08], [51.0, 51.83], [60.0, 61.16], [64.0, 64.5], [66.0, 67.76], [69.0, 74.38], [77.0, 77.82], [79.0, 79.93], [82.0, 82.46], [85.0, 95.44], [98.0, 99.45], [102.0, 102.74], [103.0, 110.0], [113.0, 116.72], [119.0, 120.73], [122.0, 123.08], [129.0, 130.67], [134.0, 135.45], [138.0, 138.01], [141.0, 141.71], [150.0, 150.42], [154.0, 154.99], [161.0, 161.4], [167.0, 172.35], [173.0, 175.24]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 96.42, 0.0, 46.22, 0.0, 0.0, 0.0, 0.0, 0.0, 32.24, 0.0, 0.0, 0.0, 30.53, 0.0, 0.0, 29.95, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.57, 63.85], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 45.33], ["hum", 15.34], ["music", 9.02]], null, null, null, null, null, [["speech", 38.53], ["music", 18.76], ["thunk", 3.15]], null, null, null, [["music", 70.5], ["hip hop music", 4.92], ["electronic music", 4.55]], null, null, [["music", 77.46], ["electronic music", 4.33], ["hip hop music", 2.73]], null, null, null, null, null, null, null, null, null, null, [["speech", 67.21], ["sidetone", 5.21], ["music", 3.99]], null], "duration": [7.09, 0.97, 0.7, 1.27, 1.42, 1.9, 2.28, 0.46, 4.12, 1.08, 0.83, 1.16, 0.5, 1.76, 5.38, 0.82, 0.93, 0.46, 10.44, 1.45, 0.74, 7.0, 3.72, 1.73, 1.08, 1.67, 1.45, 0.01, 0.71, 0.42, 0.99, 0.4, 5.35, 2.24]} \ No newline at end of file diff --git a/annotations_1/jypAc6XYFfA_filtered.json b/annotations_1/jypAc6XYFfA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d11ffd1b76ac30754270cb23058b39f15b390ad --- /dev/null +++ b/annotations_1/jypAc6XYFfA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.43], [7.0, 8.11], [17.0, 20.31], [23.0, 23.95], [28.0, 29.3], [33.0, 39.95], [40.0, 51.53], [53.0, 54.46], [57.0, 57.81], [61.0, 64.23], [65.0, 68.67], [70.0, 78.88], [81.0, 84.65], [85.0, 85.72], [86.0, 102.05], [106.0, 112.62], [115.0, 116.23]], "keep_status": [true, false, true, false, false, false, true, false, false, true, false, false, true, false, false, true, false], "silence_prob": [45.3, 0.0, 43.77, 0.0, 0.0, 39.41, 44.43, 0.0, 0.0, 43.08, 43.82, 41.4, 32.87, 0.0, 34.65, 34.08, 0.0], "audiomae_on_audioset": [[["hum", 20.99], ["mains hum", 17.67], ["speech", 12.99]], null, [["speech", 18.92], ["rumble", 17.02], ["hum", 7.17]], null, null, [["speech", 58.7], ["music", 9.64], ["didgeridoo", 9.54]], [["hum", 35.68], ["mains hum", 29.23], ["throbbing", 4.19]], null, null, [["music", 14.19], ["hum", 13.34], ["sine wave", 7.57]], [["sine wave", 61.98], ["chirp tone", 14.44], ["singing bowl", 8.59]], [["hum", 36.9], ["music", 21.9], ["mains hum", 20.86]], [["music", 44.92], ["musical instrument", 6.49], ["hum", 4.61]], null, [["speech", 34.52], ["throbbing", 29.07], ["hum", 15.25]], [["music", 33.06], ["hum", 18.28], ["throbbing", 10.28]], null], "duration": [3.43, 1.11, 3.31, 0.95, 1.3, 6.95, 11.53, 1.46, 0.81, 3.23, 3.67, 8.88, 3.65, 0.72, 16.05, 6.62, 1.23]} \ No newline at end of file diff --git a/annotations_1/jzhXtCHYrAM_filtered.json b/annotations_1/jzhXtCHYrAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b624f04b1f0e96d700f49e85623e9ceb72f9c9f3 --- /dev/null +++ b/annotations_1/jzhXtCHYrAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 16.98], [20.0, 22.06], [23.0, 26.76], [28.0, 37.61], [38.0, 38.69], [40.0, 48.05], [50.0, 50.62], [54.0, 54.36], [55.0, 56.03], [58.0, 59.44], [60.0, 61.25], [63.0, 62.73], [65.0, 66.09], [68.0, 67.71], [69.0, 68.82], [70.0, 70.68], [73.0, 73.01], [76.0, 77.41], [78.0, 80.77], [92.0, 94.32], [96.0, 97.23], [100.0, 108.26], [111.0, 113.83], [119.0, 121.05], [130.0, 130.64], [145.0, 148.71], [153.0, 154.3], [156.0, 159.41], [164.0, 166.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [93.45, 90.25, 95.23, 92.31, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 89.19, 0.0, 99.92, 81.89, 95.51, 0.0, 99.76, 0.0, 96.54, 39.46], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 36.19], ["moo", 34.27], ["livestock, farm animals, working animals", 24.83]]], "duration": [5.98, 2.06, 3.76, 9.61, 0.69, 8.05, 0.62, 0.36, 1.03, 1.44, 1.25, -0.27, 1.09, -0.29, -0.18, 0.68, 0.01, 1.41, 2.77, 2.32, 1.23, 8.26, 2.83, 2.05, 0.64, 3.71, 1.3, 3.41, 2.82]} \ No newline at end of file diff --git a/annotations_1/jzxMo2UKUKM_filtered.json b/annotations_1/jzxMo2UKUKM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef9cee8507871329c8e2e4985401d3109005672 --- /dev/null +++ b/annotations_1/jzxMo2UKUKM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 81.57], [83.0, 83.61], [88.0, 90.0], [92.0, 117.12], [123.0, 126.22], [133.0, 136.22], [141.0, 143.65], [144.0, 146.13], [148.0, 149.07]], "keep_status": [false, false, true, true, true, false, true, true, false], "silence_prob": [0.0, 0.0, 29.79, 28.87, 28.99, 31.08, 30.92, 32.06, 0.0], "audiomae_on_audioset": [null, null, [["music", 24.07], ["speech", 21.76], ["mains hum", 10.93]], [["music", 29.78], ["hum", 17.72], ["mains hum", 14.57]], [["sound effect", 13.48], ["explosion", 11.14], ["cacophony", 10.47]], [["music", 47.0], ["hum", 13.44], ["throbbing", 10.68]], [["music", 35.33], ["hum", 14.81], ["throbbing", 13.01]], [["noise", 26.38], ["hum", 16.36], ["music", 11.65]], null], "duration": [72.57, 0.61, 2.0, 25.12, 3.22, 3.22, 2.65, 2.13, 1.07]} \ No newline at end of file diff --git a/annotations_1/k01VcZkKDME_filtered.json b/annotations_1/k01VcZkKDME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de91ae67ce46e87a181ff7d3bde49dfec26b11c0 --- /dev/null +++ b/annotations_1/k01VcZkKDME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.14], [10.0, 10.4], [12.0, 12.63], [16.0, 17.36], [20.0, 20.34], [23.0, 23.87], [24.0, 26.22], [28.0, 28.14], [33.0, 37.86], [40.0, 42.84], [45.0, 45.55], [46.0, 46.85], [48.0, 48.41], [49.0, 49.89], [53.0, 53.42], [56.0, 55.9], [56.0, 56.54], [61.0, 61.69], [63.0, 63.81], [65.0, 66.36], [69.0, 69.5], [71.0, 71.71], [74.0, 74.85], [78.0, 78.8], [91.0, 91.18], [93.0, 93.39], [98.0, 99.81], [106.0, 106.44]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.39, 0.0, 99.99, 61.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 47.18], ["animal", 4.89], ["livestock, farm animals, working animals", 4.07]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.14, 0.4, 0.63, 1.36, 0.34, 0.87, 2.22, 0.14, 4.86, 2.84, 0.55, 0.85, 0.41, 0.89, 0.42, -0.1, 0.54, 0.69, 0.81, 1.36, 0.5, 0.71, 0.85, 0.8, 0.18, 0.39, 1.81, 0.44]} \ No newline at end of file diff --git a/annotations_1/k0LLcRLSSlE_filtered.json b/annotations_1/k0LLcRLSSlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8044e47670aefdb9bbd54328c490444264d3047e --- /dev/null +++ b/annotations_1/k0LLcRLSSlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.92], [4.0, 5.31], [6.0, 6.91], [20.0, 20.39], [24.0, 25.88], [29.0, 30.32], [32.0, 32.85], [44.0, 45.91], [49.0, 51.88], [65.0, 66.18], [69.0, 70.41], [71.0, 81.67], [92.0, 92.69], [97.0, 97.93], [100.0, 102.57], [108.0, 117.22], [120.0, 121.34], [124.0, 126.2], [126.0, 129.34], [130.0, 133.66], [135.0, 154.63], [160.0, 161.89], [167.0, 181.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 100.0, 100.0, 30.38, 0.0, 31.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["insect", 27.52], ["speech", 14.97], ["cricket", 11.27]], null, [["music", 69.83], ["speech", 11.43], ["didgeridoo", 7.3]]], "duration": [0.92, 1.31, 0.91, 0.39, 1.88, 1.32, 0.85, 1.91, 2.88, 1.18, 1.41, 10.67, 0.69, 0.93, 2.57, 9.22, 1.34, 2.2, 3.34, 3.66, 19.63, 1.89, 14.14]} \ No newline at end of file diff --git a/annotations_1/k2-SBnbz7pE_filtered.json b/annotations_1/k2-SBnbz7pE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e8bbf237f65e698f2e66944de2ccba85d6b2f198 --- /dev/null +++ b/annotations_1/k2-SBnbz7pE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 67.07], [68.0, 75.88], [79.0, 80.25], [83.0, 84.11], [87.0, 89.4], [90.0, 90.56], [91.0, 94.39], [95.0, 95.3], [96.0, 96.5], [97.0, 96.99], [99.0, 100.09], [102.0, 103.49], [108.0, 117.44], [120.0, 145.98], [151.0, 155.63], [156.0, 161.08], [162.0, 162.95], [164.0, 164.3], [165.0, 166.16]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 33.59, 0.0, 0.0, 50.71, 0.0, 33.04, 0.0, 0.0, 0.0, 0.0, 0.0, 44.34, 31.89, 37.09, 38.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["buzz", 20.19], ["insect", 12.99], ["hum", 11.88]], null, null, null, null, [["whale vocalization", 53.52], ["fly, housefly", 13.02], ["mosquito", 12.94]], null, null, null, null, null, [["whale vocalization", 53.7], ["rumble", 11.36], ["fart", 4.93]], [["music", 36.14], ["speech", 33.88], ["throbbing", 3.18]], [["speech", 25.45], ["music", 21.06], ["whale vocalization", 14.33]], [["hum", 24.02], ["music", 16.4], ["mains hum", 12.89]], null, null, null], "duration": [1.07, 7.88, 1.25, 1.11, 2.4, 0.56, 3.39, 0.3, 0.5, -0.01, 1.09, 1.49, 9.44, 25.98, 4.63, 5.08, 0.95, 0.3, 1.16]} \ No newline at end of file diff --git a/annotations_1/k2s7U_7gHtE_filtered.json b/annotations_1/k2s7U_7gHtE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb4fc3339b6a8dd415ce92e4ed058c51173e61d1 --- /dev/null +++ b/annotations_1/k2s7U_7gHtE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.03], [3.0, 4.26], [16.0, 17.36], [19.0, 20.29], [22.0, 23.7], [26.0, 28.32], [31.0, 33.84], [35.0, 36.27], [38.0, 38.43], [42.0, 45.72], [47.0, 51.95], [53.0, 60.78], [62.0, 66.02], [69.0, 71.47], [76.0, 76.5], [78.0, 80.18], [82.0, 91.66], [93.0, 95.98], [99.0, 101.21], [105.0, 109.09], [109.0, 110.24], [114.0, 116.75], [117.0, 118.67], [123.0, 123.74], [125.0, 126.08], [140.0, 140.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 83.7, 0.0, 0.0, 97.92, 91.3, 100.0, 63.64, 92.8, 0.0, 99.52, 89.9, 39.09, 88.28, 87.55, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.9], ["music", 20.99], ["hum", 8.65]], null, null, null, null, null, null, null, null], "duration": [0.03, 1.26, 1.36, 1.29, 1.7, 2.32, 2.84, 1.27, 0.43, 3.72, 4.95, 7.78, 4.02, 2.47, 0.5, 2.18, 9.66, 2.98, 2.21, 4.09, 1.24, 2.75, 1.67, 0.74, 1.08, 0.98]} \ No newline at end of file diff --git a/annotations_1/k3KR3Wz29FY_filtered.json b/annotations_1/k3KR3Wz29FY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4cdb63c563651a9f82a7bd8bdbafaf0d9893181 --- /dev/null +++ b/annotations_1/k3KR3Wz29FY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.87], [13.0, 17.71], [18.0, 20.24], [31.0, 31.7], [37.0, 39.02], [42.0, 42.72], [45.0, 56.94], [60.0, 63.24], [82.0, 82.39], [83.0, 89.26], [91.0, 94.54], [99.0, 106.49], [107.0, 107.81], [111.0, 112.14], [116.0, 126.25], [136.0, 136.78], [160.0, 160.61]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 29.81, 43.79, 0.0, 32.76, 0.0, 29.09, 32.23, 0.0, 29.61, 35.77, 33.55, 0.0, 0.0, 31.54, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 36.5], ["speech", 14.71], ["mains hum", 12.98]], [["music", 55.59], ["throbbing", 9.09], ["speech", 4.47]], null, [["music", 52.25], ["throbbing", 15.33], ["hum", 3.77]], null, [["music", 66.17], ["hum", 6.33], ["throbbing", 5.33]], [["music", 38.87], ["throbbing", 28.43], ["hum", 16.44]], null, [["music", 47.81], ["speech", 37.15], ["musical instrument", 4.34]], [["music", 36.32], ["throbbing", 27.86], ["hum", 11.27]], [["music", 50.35], ["throbbing", 17.23], ["hum", 5.48]], null, null, [["music", 45.81], ["throbbing", 27.47], ["hum", 13.13]], null, null], "duration": [0.87, 4.71, 2.24, 0.7, 2.02, 0.72, 11.94, 3.24, 0.39, 6.26, 3.54, 7.49, 0.81, 1.14, 10.25, 0.78, 0.61]} \ No newline at end of file diff --git a/annotations_1/k3TpBfnaEmI_filtered.json b/annotations_1/k3TpBfnaEmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73c356494ef58cb33412fe54a1e40f5a271766e3 --- /dev/null +++ b/annotations_1/k3TpBfnaEmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.8], [11.0, 12.06], [13.0, 18.74], [19.0, 29.03], [30.0, 49.28], [50.0, 54.11], [55.0, 59.7], [61.0, 61.62], [63.0, 69.06], [70.0, 70.78], [72.0, 74.73], [77.0, 77.68], [80.0, 81.24], [83.0, 83.17], [85.0, 86.85], [89.0, 89.68], [91.0, 93.97], [100.0, 101.82], [106.0, 109.54], [111.0, 111.32], [112.0, 115.77], [117.0, 125.95], [129.0, 129.76], [132.0, 135.58], [140.0, 142.92], [144.0, 146.37], [147.0, 148.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 84.25, 56.7, 100.0, 99.98, 65.55, 0.0, 99.99, 0.0, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 48.27, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 100.0, 92.31, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 56.89], ["chirp tone", 19.06], ["sidetone", 6.72]], null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 1.06, 5.74, 10.03, 19.28, 4.11, 4.7, 0.62, 6.06, 0.78, 2.73, 0.68, 1.24, 0.17, 1.85, 0.68, 2.97, 1.82, 3.54, 0.32, 3.77, 8.95, 0.76, 3.58, 2.92, 2.37, 1.93]} \ No newline at end of file diff --git a/annotations_1/k3oMPqUTxCE_filtered.json b/annotations_1/k3oMPqUTxCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..987bd871d70a827e4f0f5b76c14061c5abd00baa --- /dev/null +++ b/annotations_1/k3oMPqUTxCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.29], [10.0, 14.22], [16.0, 17.93], [28.0, 28.68], [35.0, 35.23], [44.0, 45.72], [46.0, 47.28], [48.0, 48.49], [59.0, 59.22], [67.0, 67.19], [68.0, 69.8], [81.0, 81.99], [83.0, 86.29], [98.0, 98.79], [102.0, 102.36], [104.0, 105.75], [107.0, 109.38], [112.0, 112.35], [121.0, 132.81], [141.0, 150.53], [152.0, 152.25], [153.0, 154.23], [154.0, 154.97], [156.0, 155.98], [156.0, 156.91], [159.0, 159.46]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 44.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.84, 0.0, 0.0, 0.0, 37.3, 0.0, 31.52, 32.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 45.11], ["musical instrument", 10.42], ["guitar", 9.65]], null, null, null, null, null, null, null, null, null, null, [["music", 47.74], ["didgeridoo", 24.14], ["speech", 11.07]], null, null, null, [["music", 45.14], ["speech", 20.32], ["guitar", 6.82]], null, [["moo", 41.81], ["cattle, bovinae", 37.03], ["livestock, farm animals, working animals", 14.26]], [["speech", 14.1], ["moo", 12.65], ["cattle, bovinae", 11.16]], null, null, null, null, null, null], "duration": [1.29, 4.22, 1.93, 0.68, 0.23, 1.72, 1.28, 0.49, 0.22, 0.19, 1.8, 0.99, 3.29, 0.79, 0.36, 1.75, 2.38, 0.35, 11.81, 9.53, 0.25, 1.23, 0.97, -0.02, 0.91, 0.46]} \ No newline at end of file diff --git a/annotations_1/k5bN73OnGmo_filtered.json b/annotations_1/k5bN73OnGmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0de2bc67e9122145eb02605e209d41e4950de5be --- /dev/null +++ b/annotations_1/k5bN73OnGmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.02], [14.0, 17.41], [18.0, 25.19], [27.0, 30.43], [31.0, 58.95], [60.0, 63.53]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 97.64, 100.0, 100.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.02, 3.41, 7.19, 3.43, 27.95, 3.53]} \ No newline at end of file diff --git a/annotations_1/k5fJmkv02is_filtered.json b/annotations_1/k5fJmkv02is_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef194f6d2dd80ef9c373063d01ed6c6c31f803ec --- /dev/null +++ b/annotations_1/k5fJmkv02is_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [36.0, 36.27], [48.0, 48.66], [51.0, 53.59], [72.0, 71.66], [98.0, 100.16], [120.0, 123.74], [125.0, 128.9], [130.0, 130.49], [134.0, 134.64], [161.0, 160.73], [164.0, 165.05], [167.0, 167.98], [175.0, 177.77]], "keep_status": [false, false, false, true, false, true, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 43.74, 0.0, 45.36, 39.72, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.81], "audiomae_on_audioset": [null, null, null, [["music", 41.01], ["throbbing", 13.01], ["hum", 11.07]], null, [["music", 40.95], ["throbbing", 18.64], ["hum", 10.01]], [["music", 35.12], ["throbbing", 17.14], ["hum", 14.33]], null, null, null, null, null, null, [["music", 30.08], ["throbbing", 27.05], ["hum", 7.1]]], "duration": [0.63, 0.27, 0.66, 2.59, -0.34, 2.16, 3.74, 3.9, 0.49, 0.64, -0.27, 1.05, 0.98, 2.77]} \ No newline at end of file diff --git a/annotations_1/k67i1cISzsI_filtered.json b/annotations_1/k67i1cISzsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba1569d9fa65ead4f6f9ca597e3f79c9badc9f94 --- /dev/null +++ b/annotations_1/k67i1cISzsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.82], [6.0, 7.74], [8.0, 13.85], [15.0, 17.41], [19.0, 19.77], [21.0, 23.09], [23.0, 24.46], [27.0, 28.92], [32.0, 35.65], [38.0, 40.05], [41.0, 41.88], [43.0, 46.21], [47.0, 48.98], [52.0, 65.3], [67.0, 74.38], [77.0, 86.46], [88.0, 89.46], [90.0, 121.53], [124.0, 129.22], [130.0, 135.73], [137.0, 138.1], [139.0, 141.17], [142.0, 165.79], [167.0, 169.37], [170.0, 171.1], [172.0, 172.34], [173.0, 174.58], [175.0, 183.69], [184.0, 184.76], [185.0, 184.99], [185.0, 185.09]], "keep_status": [false, false, false, true, false, false, false, false, true, true, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.18, 0.0, 43.08, 43.56, 0.0, 38.36, 0.0, 0.0, 44.55, 45.62, 0.0, 43.82, 0.0, 38.9, 39.82, 38.71, 0.0, 0.0, 32.19, 35.29, 0.0, 54.83, 49.64, 34.46, 0.0, 0.0, 0.0, 50.97, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 54.85], ["throbbing", 11.82], ["bow-wow", 3.65]], null, [["hum", 35.8], ["music", 23.29], ["throbbing", 12.67]], [["music", 41.01], ["throbbing", 13.33], ["didgeridoo", 9.99]], null, [["music", 64.27], ["hum", 6.69], ["throbbing", 6.12]], null, null, [["music", 40.3], ["throbbing", 19.24], ["hum", 9.93]], [["music", 46.33], ["throbbing", 14.04], ["hum", 6.45]], null, [["music", 42.35], ["throbbing", 11.16], ["synthesizer", 10.68]], null, [["music", 44.4], ["throbbing", 14.44], ["hum", 11.94]], [["music", 45.76], ["didgeridoo", 13.93], ["throbbing", 13.54]], [["music", 68.88], ["didgeridoo", 14.59], ["throbbing", 2.93]], null, null, [["music", 33.76], ["didgeridoo", 23.33], ["hum", 11.7]], [["music", 34.2], ["didgeridoo", 11.76], ["hum", 10.98]], null, null, [["hum", 49.4], ["mains hum", 23.74], ["throbbing", 13.95]], [["speech", 54.17], ["fart", 22.87], ["inside, small room", 3.09]], null, null, null, null, null, null, null], "duration": [2.82, 1.74, 5.85, 2.41, 0.77, 2.09, 1.46, 1.92, 3.65, 2.05, 0.88, 3.21, 1.98, 13.3, 7.38, 9.46, 1.46, 31.53, 5.22, 5.73, 1.1, 2.17, 23.79, 2.37, 1.1, 0.34, 1.58, 8.69, 0.76, -0.01, 0.09]} \ No newline at end of file diff --git a/annotations_1/k6dRH6fO3Xw_filtered.json b/annotations_1/k6dRH6fO3Xw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a24d7c6573d0f7829f34fbddcbccb4b90179685 --- /dev/null +++ b/annotations_1/k6dRH6fO3Xw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 33.56], [34.0, 34.57], [35.0, 35.7], [37.0, 96.47], [98.0, 122.37], [125.0, 139.28]], "keep_status": [false, false, false, false, true, false], "silence_prob": [31.72, 0.0, 0.0, 0.0, 31.75, 31.72], "audiomae_on_audioset": [[["hum", 35.97], ["throbbing", 22.6], ["music", 16.54]], null, null, null, [["music", 16.5], ["vehicle", 14.14], ["race car, auto racing", 13.77]], [["speech", 50.34], ["buzz", 12.47], ["vehicle", 8.93]]], "duration": [24.56, 0.57, 0.7, 59.47, 24.37, 14.28]} \ No newline at end of file diff --git a/annotations_1/k6u3YvvvgjQ_filtered.json b/annotations_1/k6u3YvvvgjQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dff6ad67a8f91fe81867e6673b7a342350f5ce7b --- /dev/null +++ b/annotations_1/k6u3YvvvgjQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.31], [7.0, 8.19], [12.0, 12.18], [13.0, 13.42], [19.0, 19.87], [28.0, 31.48], [33.0, 34.13], [35.0, 36.69], [37.0, 38.92], [42.0, 47.12], [49.0, 61.35], [62.0, 64.57], [65.0, 66.97], [68.0, 68.62], [70.0, 70.48], [71.0, 73.21], [75.0, 75.73], [77.0, 77.84], [79.0, 80.42], [81.0, 81.6], [83.0, 86.09], [88.0, 90.51], [91.0, 91.81], [93.0, 94.44], [95.0, 96.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 99.48, 84.62, 53.22, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 0.0, 0.0, 46.43, 38.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 18.21], ["thunk", 12.7], ["hum", 8.89]], [["music", 50.57], ["theremin", 15.41], ["walk, footsteps", 2.07]], null, null, null], "duration": [1.31, 1.19, 0.18, 0.42, 0.87, 3.48, 1.13, 1.69, 1.92, 5.12, 12.35, 2.57, 1.97, 0.62, 0.48, 2.21, 0.73, 0.84, 1.42, 0.6, 3.09, 2.51, 0.81, 1.44, 1.01]} \ No newline at end of file diff --git a/annotations_1/k7_V-3ApEiM_filtered.json b/annotations_1/k7_V-3ApEiM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aad4df210fd012a9831cf5b7b9b3db9efa588149 --- /dev/null +++ b/annotations_1/k7_V-3ApEiM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.85], [7.0, 8.36], [9.0, 17.69], [19.0, 19.92], [21.0, 21.73], [23.0, 23.84], [26.0, 26.69], [30.0, 31.68], [32.0, 82.98], [85.0, 96.45], [98.0, 101.12], [102.0, 103.98], [105.0, 111.2], [112.0, 158.08]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 59.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.64, 51.99, 0.0, 30.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 35.65], ["music", 18.38], ["mains hum", 13.64]], null, null, [["hum", 26.91], ["music", 24.8], ["throbbing", 9.52]], null], "duration": [1.85, 1.36, 8.69, 0.92, 0.73, 0.84, 0.69, 1.68, 50.98, 11.45, 3.12, 1.98, 6.2, 46.08]} \ No newline at end of file diff --git a/annotations_1/k7ej9E5b8js_filtered.json b/annotations_1/k7ej9E5b8js_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..323fdcaabd94651403f5d222eca6689a303a29a7 --- /dev/null +++ b/annotations_1/k7ej9E5b8js_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.45], [20.0, 21.44], [22.0, 24.24], [25.0, 26.3], [27.0, 28.02], [30.0, 30.23], [31.0, 33.29], [34.0, 38.8], [41.0, 41.96], [43.0, 44.39], [46.0, 63.49], [64.0, 64.66], [69.0, 71.19], [73.0, 82.61], [83.0, 102.42], [103.0, 104.31], [105.0, 116.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 53.34, 0.0, 0.0, 0.0, 49.78, 41.76, 0.0, 0.0, 38.19, 0.0, 76.37, 36.9, 34.25, 0.0, 36.45], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 51.92], ["whale vocalization", 11.05], ["mains hum", 7.98]], [["hum", 55.87], ["mains hum", 24.74], ["throbbing", 11.41]], null, null, [["hum", 29.3], ["mains hum", 23.31], ["speech", 7.82]], null, null, [["hum", 34.12], ["mains hum", 18.14], ["throbbing", 7.54]], [["hum", 39.81], ["throbbing", 21.93], ["mains hum", 13.27]], null, [["throbbing", 47.18], ["hum", 27.8], ["heart sounds, heartbeat", 5.08]]], "duration": [1.45, 1.44, 2.24, 1.3, 1.02, 0.23, 2.29, 4.8, 0.96, 1.39, 17.49, 0.66, 2.19, 9.61, 19.42, 1.31, 11.58]} \ No newline at end of file diff --git a/annotations_1/k8Vn9zLollY_filtered.json b/annotations_1/k8Vn9zLollY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/k8Vn9zLollY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/k8bJrJ7_LKI_filtered.json b/annotations_1/k8bJrJ7_LKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5176d384b94693a21bc49b43ed934099979397f8 --- /dev/null +++ b/annotations_1/k8bJrJ7_LKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.15], [13.0, 24.33], [36.0, 36.66], [39.0, 39.31], [58.0, 58.73], [59.0, 60.12], [62.0, 65.18], [66.0, 66.92], [71.0, 73.58], [75.0, 75.2], [77.0, 77.45], [79.0, 78.7], [79.0, 79.98], [83.0, 83.1], [91.0, 91.25], [94.0, 94.58], [98.0, 98.58], [99.0, 99.98], [100.0, 101.49], [106.0, 105.71], [106.0, 107.64], [109.0, 109.14], [111.0, 110.89], [111.0, 111.4], [113.0, 113.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.55, 53.78, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.15, 11.33, 0.66, 0.31, 0.73, 1.12, 3.18, 0.92, 2.58, 0.2, 0.45, -0.3, 0.98, 0.1, 0.25, 0.58, 0.58, 0.98, 1.49, -0.29, 1.64, 0.14, -0.11, 0.4, 0.71]} \ No newline at end of file diff --git a/annotations_1/k96h1dYQrj0_filtered.json b/annotations_1/k96h1dYQrj0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97a04bcef27d1c4be57b9f7171d3ffe556dc0032 --- /dev/null +++ b/annotations_1/k96h1dYQrj0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.66], [13.0, 18.64], [21.0, 22.13], [24.0, 25.32], [31.0, 31.4], [33.0, 32.95], [34.0, 34.35], [38.0, 37.94], [39.0, 39.29], [41.0, 41.42], [53.0, 54.09], [58.0, 66.97], [72.0, 71.88], [75.0, 76.62], [77.0, 78.58], [80.0, 81.11], [82.0, 88.84], [89.0, 91.98], [93.0, 96.01], [97.0, 99.0], [100.0, 100.57], [102.0, 106.1], [107.0, 107.57], [108.0, 111.2], [113.0, 114.29], [116.0, 117.91], [120.0, 123.11], [125.0, 128.43], [129.0, 129.93], [130.0, 131.55], [137.0, 145.72], [146.0, 146.92], [149.0, 150.45], [152.0, 153.69], [158.0, 160.78]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [33.95, 46.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 91.81, 77.03, 100.0, 43.69, 0.0, 35.59, 0.0, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 42.35], "audiomae_on_audioset": [[["speech", 19.0], ["music", 14.63], ["cattle, bovinae", 8.48]], [["mosquito", 23.23], ["fly, housefly", 13.09], ["speech", 11.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 78.43], ["music", 3.06], ["inside, small room", 2.62]], null, [["speech", 27.96], ["baby laughter", 10.0], ["belly laugh", 8.24]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.29], ["hum", 7.12], ["whale vocalization", 5.08]]], "duration": [9.66, 5.64, 1.13, 1.32, 0.4, -0.05, 0.35, -0.06, 0.29, 0.42, 1.09, 8.97, -0.12, 1.62, 1.58, 1.11, 6.84, 2.98, 3.01, 2.0, 0.57, 4.1, 0.57, 3.2, 1.29, 1.91, 3.11, 3.43, 0.93, 1.55, 8.72, 0.92, 1.45, 1.69, 2.78]} \ No newline at end of file diff --git a/annotations_1/k9DO26O6dIg_filtered.json b/annotations_1/k9DO26O6dIg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1191b4ee6f7935e1bff6782e3424be884dd90615 --- /dev/null +++ b/annotations_1/k9DO26O6dIg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [3.0, 4.14], [5.0, 5.66], [11.0, 12.33], [15.0, 15.74], [19.0, 18.94], [24.0, 24.41], [26.0, 25.61], [30.0, 29.79], [32.0, 33.07], [39.0, 41.84], [49.0, 53.86], [55.0, 57.32], [62.0, 62.65], [81.0, 81.55], [83.0, 84.18], [90.0, 90.88], [93.0, 98.68], [102.0, 103.59], [106.0, 107.06], [110.0, 110.98], [120.0, 123.77], [127.0, 127.48], [135.0, 136.71], [137.0, 139.04], [140.0, 141.39], [143.0, 144.34], [146.0, 149.55], [151.0, 151.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 100.0, 98.99, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 0.0, 0.0, 32.21, 0.0, 0.0, 79.76, 0.0, 0.0, 97.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["radio", 43.91], ["speech", 38.11], ["inside, small room", 2.11]], null, null, null, null, null, null, null], "duration": [0.7, 1.14, 0.66, 1.33, 0.74, -0.06, 0.41, -0.39, -0.21, 1.07, 2.84, 4.86, 2.32, 0.65, 0.55, 1.18, 0.88, 5.68, 1.59, 1.06, 0.98, 3.77, 0.48, 1.71, 2.04, 1.39, 1.34, 3.55, 0.21]} \ No newline at end of file diff --git a/annotations_1/k9utcDoerr0_filtered.json b/annotations_1/k9utcDoerr0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c51ed02f65ad8b3a56832c8b60ac5bd2935392c --- /dev/null +++ b/annotations_1/k9utcDoerr0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.75], [12.0, 24.0], [28.0, 27.77], [28.0, 31.53], [34.0, 40.07], [46.0, 48.81], [49.0, 50.65], [54.0, 53.99], [58.0, 59.56], [61.0, 63.37], [67.0, 70.31], [71.0, 72.2], [75.0, 76.59], [77.0, 78.51], [81.0, 81.72], [84.0, 84.37], [88.0, 88.47], [90.0, 91.18], [92.0, 95.45], [97.0, 97.19], [99.0, 99.66], [101.0, 101.49], [102.0, 101.53], [103.0, 104.31], [107.0, 108.41], [111.0, 112.41], [113.0, 114.4], [120.0, 121.07], [126.0, 127.04], [129.0, 130.22], [135.0, 136.85], [141.0, 141.29], [143.0, 143.34], [147.0, 147.31], [151.0, 151.75], [153.0, 153.47], [155.0, 162.95], [164.0, 166.7], [169.0, 169.5], [172.0, 172.54], [179.0, 181.65]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 37.15, 0.0, 39.21, 99.62, 97.11, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.72, 33.03, 0.0, 0.0, 97.43], "audiomae_on_audioset": [null, [["frog", 23.67], ["animal", 9.65], ["livestock, farm animals, working animals", 6.99]], null, [["speech", 22.43], ["frog", 18.76], ["noise", 11.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.74], ["music", 5.52], ["hum", 5.26]], [["dog", 21.43], ["domestic animals, pets", 14.08], ["animal", 10.55]], null, null, null], "duration": [1.75, 12.0, -0.23, 3.53, 6.07, 2.81, 1.65, -0.01, 1.56, 2.37, 3.31, 1.2, 1.59, 1.51, 0.72, 0.37, 0.47, 1.18, 3.45, 0.19, 0.66, 0.49, -0.47, 1.31, 1.41, 1.41, 1.4, 1.07, 1.04, 1.22, 1.85, 0.29, 0.34, 0.31, 0.75, 0.47, 7.95, 2.7, 0.5, 0.54, 2.65]} \ No newline at end of file diff --git a/annotations_1/kARcfM_M6VE_filtered.json b/annotations_1/kARcfM_M6VE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3102e6abb616fe264bd9a515e7163af9993ea2ed --- /dev/null +++ b/annotations_1/kARcfM_M6VE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.77], [28.0, 28.36], [43.0, 43.01], [53.0, 55.29], [57.0, 58.73], [59.0, 60.78], [68.0, 68.62], [81.0, 85.75], [90.0, 90.88], [101.0, 101.75], [104.0, 105.36], [110.0, 110.17], [114.0, 113.95], [117.0, 117.1], [125.0, 129.64]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [29.6, 0.0, 0.0, 28.65, 0.0, 0.0, 0.0, 29.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.64], "audiomae_on_audioset": [[["music", 58.75], ["didgeridoo", 17.94], ["musical instrument", 5.87]], null, null, [["throbbing", 31.13], ["hum", 29.33], ["music", 14.24]], null, null, null, [["music", 49.07], ["musical instrument", 8.4], ["synthesizer", 7.86]], null, null, null, null, null, null, [["sidetone", 29.94], ["hum", 21.43], ["mains hum", 18.46]]], "duration": [2.77, 0.36, 0.01, 2.29, 1.73, 1.78, 0.62, 4.75, 0.88, 0.75, 1.36, 0.17, -0.05, 0.1, 4.64]} \ No newline at end of file diff --git a/annotations_1/kBErrmmqnkI_filtered.json b/annotations_1/kBErrmmqnkI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc7b8e9f07b7ca43e5dac68639387495b53d1198 --- /dev/null +++ b/annotations_1/kBErrmmqnkI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 51.26], [52.0, 78.81], [83.0, 97.88], [105.0, 106.2], [114.0, 114.22], [118.0, 127.94], [131.0, 162.28], [165.0, 180.94], [182.0, 185.36], [189.0, 190.49], [193.0, 193.5], [194.0, 199.94], [200.0, 200.26], [201.0, 201.24], [203.0, 204.25]], "keep_status": [true, false, true, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [30.12, 30.1, 29.29, 0.0, 0.0, 29.25, 0.0, 29.19, 33.17, 0.0, 0.0, 32.75, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 52.21], ["theremin", 7.94], ["musical instrument", 6.19]], [["music", 43.91], ["clarinet", 17.14], ["trombone", 14.0]], [["music", 19.99], ["boing", 10.47], ["cattle, bovinae", 9.42]], null, null, [["livestock, farm animals, working animals", 31.73], ["cattle, bovinae", 24.42], ["moo", 18.21]], null, [["music", 27.27], ["trombone", 15.39], ["brass instrument", 9.26]], [["speech", 66.24], ["whimper", 10.46], ["crying, sobbing", 6.09]], null, null, [["speech", 38.06], ["clip-clop", 10.01], ["horse", 8.01]], null, null, null], "duration": [22.26, 26.81, 14.88, 1.2, 0.22, 9.94, 31.28, 15.94, 3.36, 1.49, 0.5, 5.94, 0.26, 0.24, 1.25]} \ No newline at end of file diff --git a/annotations_1/kBTPEpA8BzU_filtered.json b/annotations_1/kBTPEpA8BzU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ab374097817636fc4e83f6fffb653179b6c4ebc --- /dev/null +++ b/annotations_1/kBTPEpA8BzU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 78.39], [79.0, 79.12], [86.0, 93.16], [94.0, 103.72], [106.0, 162.35], [167.0, 168.24]], "keep_status": [false, false, false, false, false, false], "silence_prob": [30.83, 0.0, 29.84, 31.88, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 29.48], ["hum", 27.65], ["speech", 17.34]], null, [["speech", 62.22], ["explosion", 7.94], ["music", 4.17]], [["speech", 59.69], ["electric shaver, electric razor", 10.1], ["noise", 5.27]], null, null], "duration": [24.39, 0.12, 7.16, 9.72, 56.35, 1.24]} \ No newline at end of file diff --git a/annotations_1/kBwVWrBk_uo_filtered.json b/annotations_1/kBwVWrBk_uo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9efc0491713b8049a5b295426953256d967bcb98 --- /dev/null +++ b/annotations_1/kBwVWrBk_uo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 13.93], [16.0, 19.33], [20.0, 20.83], [22.0, 25.78], [27.0, 28.83], [30.0, 32.43], [35.0, 36.61], [39.0, 39.56], [40.0, 41.99], [43.0, 44.98], [46.0, 54.51], [55.0, 57.37], [58.0, 59.43], [62.0, 64.3], [65.0, 66.19], [68.0, 69.67], [72.0, 73.63], [74.0, 85.55], [87.0, 92.26], [93.0, 100.74], [102.0, 103.2], [104.0, 104.65], [105.0, 104.85], [105.0, 104.89], [105.0, 104.92], [108.0, 113.19], [114.0, 116.01], [119.0, 175.31], [175.0, 194.22]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [65.55, 40.41, 0.0, 75.72, 0.0, 75.39, 0.0, 0.0, 0.0, 0.0, 54.43, 78.55, 0.0, 48.91, 0.0, 0.0, 0.0, 43.96, 54.43, 45.46, 0.0, 0.0, 0.0, 0.0, 0.0, 58.72, 67.76, 0.0, 36.85], "audiomae_on_audioset": [null, [["music", 18.8], ["whale vocalization", 9.78], ["chime", 8.31]], null, null, null, null, null, null, null, null, null, null, null, [["chime", 21.17], ["wind chime", 16.96], ["glass", 8.32]], null, null, null, [["hum", 16.8], ["music", 16.11], ["speech", 15.41]], null, [["hum", 28.69], ["music", 25.35], ["mains hum", 10.66]], null, null, null, null, null, null, null, null, [["music", 43.71], ["singing bowl", 13.6], ["chirp tone", 5.68]]], "duration": [11.93, 3.33, 0.83, 3.78, 1.83, 2.43, 1.61, 0.56, 1.99, 1.98, 8.51, 2.37, 1.43, 2.3, 1.19, 1.67, 1.63, 11.55, 5.26, 7.74, 1.2, 0.65, -0.15, -0.11, -0.08, 5.19, 2.01, 56.31, 19.22]} \ No newline at end of file diff --git a/annotations_1/kCrtP_gPMwk_filtered.json b/annotations_1/kCrtP_gPMwk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..501020f55a9e2dd35422d46643baff12848e363a --- /dev/null +++ b/annotations_1/kCrtP_gPMwk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.16], [3.0, 3.65], [4.0, 4.29], [5.0, 6.76], [7.0, 12.41], [15.0, 15.6], [17.0, 19.4], [21.0, 21.39], [22.0, 22.33], [23.0, 23.43], [24.0, 25.62], [29.0, 32.61], [33.0, 33.91], [38.0, 41.79], [42.0, 44.39], [45.0, 45.45], [48.0, 48.09], [50.0, 54.5], [65.0, 68.0], [69.0, 71.25], [74.0, 78.24], [79.0, 81.03], [85.0, 85.33], [89.0, 91.62], [94.0, 95.42], [97.0, 97.38], [98.0, 101.6], [107.0, 110.49], [114.0, 116.7], [118.0, 118.79], [121.0, 121.44], [123.0, 124.28], [126.0, 125.76], [130.0, 131.55], [138.0, 138.11], [140.0, 140.19], [147.0, 151.12], [151.0, 154.48], [158.0, 162.13], [162.0, 162.82], [164.0, 164.78], [169.0, 169.97], [181.0, 180.74], [191.0, 192.23], [194.0, 194.56], [195.0, 195.91], [196.0, 196.6], [202.0, 202.2], [203.0, 204.08], [212.0, 212.26], [214.0, 216.01], [216.0, 217.88], [222.0, 222.84], [229.0, 229.51], [230.0, 231.09], [231.0, 234.52], [235.0, 234.82], [237.0, 237.69], [240.0, 240.61], [244.0, 245.27], [245.0, 245.44], [250.0, 252.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 88.83, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 50.26, 0.0, 60.89, 52.51, 0.0, 0.0, 34.37, 99.92, 95.91, 40.66, 73.82, 0.0, 60.6, 0.0, 0.0, 36.11, 33.95, 39.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.74, 44.46, 79.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.05, 0.0, 0.0, 0.0, 0.0, 42.51, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 74.52], ["beatboxing", 6.13], ["laughter", 2.26]], null, null, [["howl", 29.99], ["animal", 12.13], ["domestic animals, pets", 10.04]], null, null, null, null, null, [["music", 33.58], ["clarinet", 13.47], ["wind instrument, woodwind instrument", 12.75]], [["music", 43.42], ["musical instrument", 11.0], ["wind instrument, woodwind instrument", 9.77]], [["music", 61.45], ["musical instrument", 7.12], ["whimper", 3.45]], null, null, null, null, null, null, null, [["thunk", 14.41], ["music", 10.26], ["speech", 7.91]], [["tuning fork", 34.44], ["speech", 32.29], ["sine wave", 10.76]], null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 40.09], ["bouncing", 8.89], ["music", 6.59]], null, null, null, null, [["speech", 36.75], ["whimper", 7.67], ["owl", 5.32]], null, null, null, null, null, null], "duration": [1.16, 0.65, 0.29, 1.76, 5.41, 0.6, 2.4, 0.39, 0.33, 0.43, 1.62, 3.61, 0.91, 3.79, 2.39, 0.45, 0.09, 4.5, 3.0, 2.25, 4.24, 2.03, 0.33, 2.62, 1.42, 0.38, 3.6, 3.49, 2.7, 0.79, 0.44, 1.28, -0.24, 1.55, 0.11, 0.19, 4.12, 3.48, 4.13, 0.82, 0.78, 0.97, -0.26, 1.23, 0.56, 0.91, 0.6, 0.2, 1.08, 0.26, 2.01, 1.88, 0.84, 0.51, 1.09, 3.52, -0.18, 0.69, 0.61, 1.27, 0.44, 2.73]} \ No newline at end of file diff --git a/annotations_1/kCxqmweKXZ0_filtered.json b/annotations_1/kCxqmweKXZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d49eb477d59f739c4d228e3562cbe3ec7baa5047 --- /dev/null +++ b/annotations_1/kCxqmweKXZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.76], [16.0, 29.52], [30.0, 30.75], [32.0, 34.62], [39.0, 40.34], [42.0, 45.01], [47.0, 47.7], [49.0, 50.82], [54.0, 57.25], [59.0, 61.52], [63.0, 62.94], [73.0, 73.87], [76.0, 94.56], [96.0, 96.42], [98.0, 98.04], [100.0, 140.19]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [29.98, 32.38, 0.0, 29.43, 0.0, 38.4, 0.0, 0.0, 30.49, 30.43, 0.0, 0.0, 29.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 32.26], ["mains hum", 25.16], ["electric shaver, electric razor", 14.82]], [["music", 48.35], ["throbbing", 19.65], ["hum", 16.66]], null, [["livestock, farm animals, working animals", 36.89], ["moo", 35.81], ["cattle, bovinae", 25.54]], null, [["hum", 65.74], ["throbbing", 12.68], ["mains hum", 12.01]], null, null, [["music", 22.84], ["hum", 12.47], ["mains hum", 10.01]], [["hum", 32.17], ["music", 18.71], ["mains hum", 14.46]], null, null, [["hum", 38.74], ["throbbing", 24.84], ["music", 16.58]], null, null, null], "duration": [7.76, 13.52, 0.75, 2.62, 1.34, 3.01, 0.7, 1.82, 3.25, 2.52, -0.06, 0.87, 18.56, 0.42, 0.04, 40.19]} \ No newline at end of file diff --git a/annotations_1/kD0zHgK3BJ8_filtered.json b/annotations_1/kD0zHgK3BJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bc71b96463b3d93d48570c65b37b3c779e34cbf --- /dev/null +++ b/annotations_1/kD0zHgK3BJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.89], [4.0, 4.75], [6.0, 10.77], [12.0, 12.9], [15.0, 18.76], [22.0, 22.33], [24.0, 24.36], [31.0, 31.06], [37.0, 38.35], [40.0, 41.25], [43.0, 43.53], [44.0, 49.35], [54.0, 57.06], [63.0, 64.07], [65.0, 66.31], [67.0, 67.64], [69.0, 69.52], [71.0, 71.46], [75.0, 75.25], [80.0, 80.43], [83.0, 83.37], [84.0, 84.94], [87.0, 87.86], [89.0, 89.4], [90.0, 92.8], [94.0, 94.88], [97.0, 98.17], [99.0, 99.72], [102.0, 105.43], [108.0, 108.97], [113.0, 115.43], [120.0, 122.1], [124.0, 129.27], [131.0, 131.89], [133.0, 135.82], [137.0, 144.61], [145.0, 145.88], [148.0, 149.61], [151.0, 151.48], [153.0, 154.33], [156.0, 157.3], [158.0, 160.41], [162.0, 163.34], [169.0, 175.32], [177.0, 179.07], [180.0, 182.21], [183.0, 183.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 95.09, 0.0, 89.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 67.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.64, 0.0, 0.0, 0.0, 96.42, 0.0, 82.79, 99.05, 78.04, 0.0, 90.43, 83.7, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 0.0, 76.86, 93.76, 87.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 36.48], ["mains hum", 13.63], ["throbbing", 10.52]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 0.75, 4.77, 0.9, 3.76, 0.33, 0.36, 0.06, 1.35, 1.25, 0.53, 5.35, 3.06, 1.07, 1.31, 0.64, 0.52, 0.46, 0.25, 0.43, 0.37, 0.94, 0.86, 0.4, 2.8, 0.88, 1.17, 0.72, 3.43, 0.97, 2.43, 2.1, 5.27, 0.89, 2.82, 7.61, 0.88, 1.61, 0.48, 1.33, 1.3, 2.41, 1.34, 6.32, 2.07, 2.21, 0.51]} \ No newline at end of file diff --git a/annotations_1/kDDU-k-5v6s_filtered.json b/annotations_1/kDDU-k-5v6s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07cbc9d44932cf66fc68abef344b6cd6ed45dfb1 --- /dev/null +++ b/annotations_1/kDDU-k-5v6s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.0], [29.0, 29.29], [30.0, 32.09], [35.0, 36.64], [38.0, 50.41], [54.0, 77.94], [78.0, 103.03], [105.0, 105.21], [105.0, 108.46], [113.0, 115.18], [116.0, 118.5], [121.0, 121.09], [122.0, 122.27], [128.0, 128.65], [129.0, 135.31], [138.0, 148.83]], "keep_status": [false, false, true, false, true, true, true, false, false, true, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 33.14, 0.0, 28.88, 29.15, 29.35, 0.0, 29.32, 30.0, 32.76, 0.0, 0.0, 0.0, 29.86, 28.71], "audiomae_on_audioset": [null, null, [["music", 26.44], ["speech", 20.39], ["inside, small room", 4.16]], null, [["music", 43.15], ["speech", 3.45], ["animal", 3.1]], [["music", 44.82], ["buzz", 9.6], ["fly, housefly", 4.75]], [["music", 35.05], ["roaring cats (lions, tigers)", 8.34], ["animal", 7.4]], null, [["speech", 33.89], ["music", 25.6], ["electric shaver, electric razor", 15.66]], [["music", 40.41], ["fart", 5.86], ["fly, housefly", 4.06]], [["hum", 41.8], ["throbbing", 17.25], ["music", 14.55]], null, null, null, [["music", 23.81], ["speech", 20.92], ["mains hum", 14.55]], [["speech", 32.36], ["music", 13.49], ["vehicle", 8.68]]], "duration": [1.0, 0.29, 2.09, 1.64, 12.41, 23.94, 25.03, 0.21, 3.46, 2.18, 2.5, 0.09, 0.27, 0.65, 6.31, 10.83]} \ No newline at end of file diff --git a/annotations_1/kDSiyU72RpA_filtered.json b/annotations_1/kDSiyU72RpA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f06761400f8a665b28a8be0f4069e0aeb63507d --- /dev/null +++ b/annotations_1/kDSiyU72RpA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.95], [11.0, 11.8], [13.0, 17.71], [18.0, 19.11], [20.0, 21.25], [24.0, 24.44], [27.0, 27.62], [28.0, 29.49], [41.0, 41.25], [51.0, 55.11], [59.0, 59.17], [60.0, 60.57], [63.0, 62.92], [66.0, 66.73], [68.0, 68.84], [73.0, 73.03], [77.0, 76.84], [78.0, 78.48], [79.0, 79.95], [81.0, 81.11], [85.0, 85.72], [90.0, 91.05], [92.0, 92.35], [93.0, 102.03], [104.0, 109.54], [111.0, 112.02], [113.0, 117.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [87.0, 0.0, 95.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 35.94, 0.0, 98.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 14.38], ["wood", 13.74], ["splinter", 13.39]], null, null], "duration": [5.95, 0.8, 4.71, 1.11, 1.25, 0.44, 0.62, 1.49, 0.25, 4.11, 0.17, 0.57, -0.08, 0.73, 0.84, 0.03, -0.16, 0.48, 0.95, 0.11, 0.72, 1.05, 0.35, 9.03, 5.54, 1.02, 4.29]} \ No newline at end of file diff --git a/annotations_1/kDTjN5dVCzg_filtered.json b/annotations_1/kDTjN5dVCzg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26482692417579631dd86d735cc4326802471183 --- /dev/null +++ b/annotations_1/kDTjN5dVCzg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.38], [15.0, 15.08], [20.0, 23.26], [41.0, 41.62], [47.0, 58.28], [82.0, 83.4], [87.0, 101.09], [102.0, 102.54], [104.0, 109.17], [118.0, 120.51], [121.0, 122.2], [124.0, 124.77]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 49.36, 0.0, 29.81, 0.0, 70.86, 0.0, 34.03, 99.95, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 82.69], ["sidetone", 2.24], ["music", 2.23]], null, [["throbbing", 34.24], ["music", 27.85], ["didgeridoo", 13.15]], null, null, null, [["speech", 53.34], ["arrow", 5.4], ["door", 3.35]], null, null, null], "duration": [0.38, 0.08, 3.26, 0.62, 11.28, 1.4, 14.09, 0.54, 5.17, 2.51, 1.2, 0.77]} \ No newline at end of file diff --git a/annotations_1/kEL5reRoNk8_filtered.json b/annotations_1/kEL5reRoNk8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aa8eb6a137475bfacf4070887912b86a0d4ab12 --- /dev/null +++ b/annotations_1/kEL5reRoNk8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.88], [18.0, 20.38], [22.0, 24.78], [26.0, 28.97], [31.0, 39.72], [53.0, 54.23], [56.0, 72.71]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 78.72, 74.44, 77.36, 52.68, 0.0, 30.84], "audiomae_on_audioset": [null, null, null, null, null, null, [["cattle, bovinae", 28.81], ["livestock, farm animals, working animals", 24.34], ["moo", 23.84]]], "duration": [0.88, 2.38, 2.78, 2.97, 8.72, 1.23, 16.71]} \ No newline at end of file diff --git a/annotations_1/kEnK0ZdMThc_filtered.json b/annotations_1/kEnK0ZdMThc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..682fb180f6a0aeff5687419940455ca345646680 --- /dev/null +++ b/annotations_1/kEnK0ZdMThc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[68.0, 74.24], [76.0, 82.51], [85.0, 84.99], [86.0, 87.42], [88.0, 88.37], [91.0, 92.37], [93.0, 97.11], [102.0, 103.18], [105.0, 113.66], [116.0, 115.94], [120.0, 131.19], [133.0, 168.44], [169.0, 168.81], [169.0, 169.6]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [30.14, 35.62, 0.0, 0.0, 0.0, 0.0, 35.7, 0.0, 34.85, 0.0, 27.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.49], ["hum", 13.41], ["ambient music", 8.34]], [["throbbing", 31.3], ["hum", 23.67], ["music", 20.64]], null, null, null, null, [["music", 29.09], ["throbbing", 23.55], ["hum", 18.54]], null, [["throbbing", 37.46], ["music", 35.27], ["hum", 8.76]], null, [["eruption", 14.76], ["breaking", 12.17], ["smash, crash", 7.08]], null, null, null], "duration": [6.24, 6.51, -0.01, 1.42, 0.37, 1.37, 4.11, 1.18, 8.66, -0.06, 11.19, 35.44, -0.19, 0.6]} \ No newline at end of file diff --git a/annotations_1/kFbDy90VZQY_filtered.json b/annotations_1/kFbDy90VZQY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60c9af075d6c5fa557e0a465abfc7a24969a49f6 --- /dev/null +++ b/annotations_1/kFbDy90VZQY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.94], [8.0, 8.83], [10.0, 9.85], [19.0, 20.02], [21.0, 22.2], [23.0, 38.42], [39.0, 46.99], [51.0, 53.99], [60.0, 62.45], [71.0, 77.5], [79.0, 78.87], [84.0, 88.53], [89.0, 100.04], [104.0, 105.56], [108.0, 109.26], [117.0, 118.32], [120.0, 123.38], [130.0, 132.73], [133.0, 133.47]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.08, 31.52, 33.61, 34.75, 29.68, 0.0, 30.3, 39.35, 0.0, 0.0, 0.0, 44.04, 43.35, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 54.93], ["speech", 15.72], ["buzz", 3.78]], [["music", 31.28], ["hum", 25.75], ["throbbing", 13.6]], [["music", 34.22], ["noise", 8.94], ["hum", 6.5]], [["music", 42.82], ["brass instrument", 8.63], ["trombone", 6.24]], [["music", 79.62], ["musical instrument", 4.22], ["foghorn", 2.22]], null, [["music", 50.5], ["didgeridoo", 14.47], ["pulse", 6.28]], [["music", 50.43], ["speech", 24.03], ["hum", 6.72]], null, null, null, [["music", 42.25], ["whale vocalization", 11.23], ["theremin", 6.07]], [["music", 49.09], ["hum", 7.15], ["ambient music", 4.7]], null], "duration": [0.94, 0.83, -0.15, 1.02, 1.2, 15.42, 7.99, 2.99, 2.45, 6.5, -0.13, 4.53, 11.04, 1.56, 1.26, 1.32, 3.38, 2.73, 0.47]} \ No newline at end of file diff --git a/annotations_1/kFeduM49hBY_filtered.json b/annotations_1/kFeduM49hBY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e585a0211eb4d31a7c41156e33e619d1a9233776 --- /dev/null +++ b/annotations_1/kFeduM49hBY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.12], [3.0, 6.3], [7.0, 7.52], [8.0, 8.45], [9.0, 24.53], [26.0, 26.49], [29.0, 95.72], [96.0, 95.77]], "keep_status": [false, true, false, false, true, false, false, false], "silence_prob": [0.0, 30.95, 0.0, 0.0, 29.82, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 44.76], ["buzz", 10.84], ["sound effect", 5.23]], null, null, [["speech", 47.21], ["buzz", 10.32], ["fly, housefly", 9.27]], null, null, null], "duration": [0.12, 3.3, 0.52, 0.45, 15.53, 0.49, 66.72, -0.23]} \ No newline at end of file diff --git a/annotations_1/kFhDGoJh4O4_filtered.json b/annotations_1/kFhDGoJh4O4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b81dfd50631831245d9f390e09b28a732396df9a --- /dev/null +++ b/annotations_1/kFhDGoJh4O4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [7.0, 9.78], [11.0, 13.09], [15.0, 16.58], [19.0, 23.75], [25.0, 26.5], [28.0, 29.81], [32.0, 35.61], [37.0, 38.26], [39.0, 39.45], [41.0, 47.78], [51.0, 53.86], [54.0, 56.66], [59.0, 71.59], [72.0, 73.2], [74.0, 75.34], [77.0, 77.84], [78.0, 79.41], [81.0, 84.03], [85.0, 86.9], [88.0, 88.35], [90.0, 90.22], [91.0, 95.61], [97.0, 97.01], [98.0, 98.83], [99.0, 101.14], [102.0, 102.34], [103.0, 105.11], [108.0, 108.11], [111.0, 112.08], [113.0, 114.54], [115.0, 116.8], [120.0, 121.46], [125.0, 125.1], [125.0, 125.46], [127.0, 128.39], [131.0, 136.98], [139.0, 140.07], [141.0, 142.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.97, 80.82, 0.0, 98.1, 0.0, 0.0, 98.36, 0.0, 0.0, 95.91, 99.44, 57.64, 99.1, 0.0, 0.0, 0.0, 0.0, 89.19, 0.0, 0.0, 0.0, 38.33, 0.0, 0.0, 98.27, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.05], ["dial tone", 16.53], ["sine wave", 16.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 2.78, 2.09, 1.58, 4.75, 1.5, 1.81, 3.61, 1.26, 0.45, 6.78, 2.86, 2.66, 12.59, 1.2, 1.34, 0.84, 1.41, 3.03, 1.9, 0.35, 0.22, 4.61, 0.01, 0.83, 2.14, 0.34, 2.11, 0.11, 1.08, 1.54, 1.8, 1.46, 0.1, 0.46, 1.39, 5.98, 1.07, 1.67]} \ No newline at end of file diff --git a/annotations_1/kFuzbEylajA_filtered.json b/annotations_1/kFuzbEylajA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d736725f5741ba5396e622c66417748714734425 --- /dev/null +++ b/annotations_1/kFuzbEylajA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.15], [30.0, 33.18], [38.0, 38.38], [39.0, 39.11], [41.0, 41.64], [49.0, 49.37], [53.0, 57.08], [60.0, 60.98], [64.0, 64.3], [66.0, 69.13], [84.0, 84.75], [85.0, 86.68], [92.0, 94.2], [98.0, 97.85], [105.0, 105.33], [115.0, 115.35]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 31.92, 0.0, 0.0, 34.63, 0.0, 0.0, 87.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 48.78], ["boing", 9.18], ["musical instrument", 7.31]], null, null, [["music", 42.91], ["speech", 12.99], ["musical instrument", 2.79]], null, null, null, null, null, null], "duration": [0.15, 3.18, 0.38, 0.11, 0.64, 0.37, 4.08, 0.98, 0.3, 3.13, 0.75, 1.68, 2.2, -0.15, 0.33, 0.35]} \ No newline at end of file diff --git a/annotations_1/kHQq6ri9MDI_filtered.json b/annotations_1/kHQq6ri9MDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41e59d2df508d8e4dd0059a71e1d4499d78020ba --- /dev/null +++ b/annotations_1/kHQq6ri9MDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.94], [15.0, 16.63], [18.0, 19.52], [20.0, 21.37], [23.0, 31.02], [32.0, 33.42], [34.0, 36.17], [37.0, 100.06], [102.0, 112.11], [113.0, 115.32], [117.0, 129.44], [132.0, 133.74], [135.0, 136.43], [138.0, 139.83], [141.0, 143.88], [146.0, 145.77]], "keep_status": [false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.12, 0.0, 55.89, 0.0, 28.74, 35.96, 31.14, 0.0, 0.0, 0.0, 69.07, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 69.9], ["hum", 5.24], ["ambient music", 2.88]], null, null, null, [["clang", 18.59], ["music", 17.56], ["ding", 13.24]], [["chirp tone", 20.62], ["speech", 14.16], ["music", 9.41]], [["music", 30.17], ["burst, pop", 21.98], ["explosion", 9.68]], null, null, null, null, null], "duration": [-0.06, 1.63, 1.52, 1.37, 8.02, 1.42, 2.17, 63.06, 10.11, 2.32, 12.44, 1.74, 1.43, 1.83, 2.88, -0.23]} \ No newline at end of file diff --git a/annotations_1/kIIY1-f_rBg_filtered.json b/annotations_1/kIIY1-f_rBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..185fc877e1d26f497a1b6101a038f4d774456c53 --- /dev/null +++ b/annotations_1/kIIY1-f_rBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.27], [2.0, 2.79], [3.0, 5.43], [9.0, 12.33], [28.0, 28.75], [36.0, 40.95], [41.0, 42.74], [44.0, 44.93], [47.0, 49.18], [51.0, 52.1], [55.0, 56.64], [58.0, 58.7], [61.0, 62.11], [64.0, 64.93], [67.0, 68.64], [70.0, 94.14], [95.0, 100.84], [106.0, 107.16], [110.0, 124.23], [129.0, 147.51], [150.0, 154.58]], "keep_status": [false, false, true, true, false, true, false, false, true, false, false, false, false, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 31.08, 29.0, 0.0, 33.07, 0.0, 0.0, 37.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.5, 28.48, 0.0, 28.93, 28.96, 29.2], "audiomae_on_audioset": [null, null, [["music", 11.82], ["whale vocalization", 5.38], ["buzz", 5.22]], [["whack, thwack", 29.28], ["fly, housefly", 8.3], ["groan", 5.69]], null, [["livestock, farm animals, working animals", 32.27], ["whale vocalization", 12.34], ["cattle, bovinae", 8.08]], null, null, [["whale vocalization", 34.35], ["speech", 14.41], ["cattle, bovinae", 11.36]], null, null, null, null, null, null, [["music", 29.34], ["speech", 18.19], ["didgeridoo", 8.85]], [["music", 52.0], ["electronic music", 7.93], ["buzz", 4.38]], null, [["music", 40.76], ["cattle, bovinae", 11.36], ["speech", 11.29]], [["music", 72.39], ["electronic music", 4.21], ["throbbing", 3.83]], [["music", 63.66], ["speech", 5.25], ["electronic music", 4.44]]], "duration": [1.27, 0.79, 2.43, 3.33, 0.75, 4.95, 1.74, 0.93, 2.18, 1.1, 1.64, 0.7, 1.11, 0.93, 1.64, 24.14, 5.84, 1.16, 14.23, 18.51, 4.58]} \ No newline at end of file diff --git a/annotations_1/kJ-UZ4DvYBg_filtered.json b/annotations_1/kJ-UZ4DvYBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3b802ae738f97bbe235e1cebd8aaf552a9270e2 --- /dev/null +++ b/annotations_1/kJ-UZ4DvYBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 36.07], [37.0, 37.4], [39.0, 38.92], [40.0, 41.55], [44.0, 44.56], [47.0, 49.74], [51.0, 58.24], [60.0, 63.36], [67.0, 67.19], [69.0, 69.04], [70.0, 71.63], [73.0, 73.7], [76.0, 78.61], [80.0, 81.01], [83.0, 86.14], [88.0, 89.21], [90.0, 91.88], [94.0, 95.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 36.8, 100.0, 0.0, 0.0, 0.0, 0.0, 70.86, 0.0, 53.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["noise", 47.7], ["music", 23.31], ["hum", 8.85]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.07, 0.4, -0.08, 1.55, 0.56, 2.74, 7.24, 3.36, 0.19, 0.04, 1.63, 0.7, 2.61, 1.01, 3.14, 1.21, 1.88, 1.25]} \ No newline at end of file diff --git a/annotations_1/kJEvR6GEb7U_filtered.json b/annotations_1/kJEvR6GEb7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00baf8a4753cd63967ecf9c7b5f173ca8c51c3b4 --- /dev/null +++ b/annotations_1/kJEvR6GEb7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 67.58], [71.0, 74.02], [75.0, 82.58], [85.0, 86.34], [88.0, 90.56], [94.0, 95.57], [96.0, 101.34], [102.0, 105.76], [109.0, 114.83], [115.0, 116.23]], "keep_status": [false, true, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 29.18, 33.33, 0.0, 33.49, 0.0, 33.04, 31.58, 31.01, 0.0], "audiomae_on_audioset": [null, [["music", 34.57], ["vehicle", 12.54], ["car", 9.97]], [["screaming", 40.48], ["groan", 21.79], ["music", 14.28]], null, [["music", 23.59], ["mains hum", 20.01], ["hum", 18.82]], null, [["music", 56.78], ["synthesizer", 5.68], ["cacophony", 4.79]], [["fly, housefly", 18.14], ["insect", 17.47], ["speech", 14.62]], [["music", 41.83], ["mains hum", 29.64], ["hum", 13.86]], null], "duration": [32.58, 3.02, 7.58, 1.34, 2.56, 1.57, 5.34, 3.76, 5.83, 1.23]} \ No newline at end of file diff --git a/annotations_1/kJKWjeMtEDM_filtered.json b/annotations_1/kJKWjeMtEDM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b10868da6f192622d00918b704559a021dcbd508 --- /dev/null +++ b/annotations_1/kJKWjeMtEDM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.12], [3.0, 3.37], [5.0, 6.0], [7.0, 7.79], [10.0, 12.7], [17.0, 27.33], [28.0, 28.9], [31.0, 40.17], [40.0, 41.62], [42.0, 42.82], [45.0, 45.5], [48.0, 48.22], [50.0, 51.58], [53.0, 55.43], [60.0, 84.4], [89.0, 144.75], [146.0, 165.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.31, 52.74, 0.0, 57.81, 0.0, 0.0, 0.0, 0.0, 0.0, 95.23, 33.73, 0.0, 35.87], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 77.53], ["electronic music", 4.77], ["throbbing", 4.7]], null, [["music", 48.85], ["speech", 14.54], ["cacophony", 7.66]]], "duration": [1.12, 0.37, 1.0, 0.79, 2.7, 10.33, 0.9, 9.17, 1.62, 0.82, 0.5, 0.22, 1.58, 2.43, 24.4, 55.75, 19.18]} \ No newline at end of file diff --git a/annotations_1/kJlqNXhZE_I_filtered.json b/annotations_1/kJlqNXhZE_I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e874411dc5d432b8cc9cc4040dd0ae4ab5c4d39a --- /dev/null +++ b/annotations_1/kJlqNXhZE_I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.67], [8.0, 7.77], [10.0, 12.56], [13.0, 19.74], [23.0, 24.97], [28.0, 29.61], [32.0, 32.37], [41.0, 40.74], [41.0, 41.54], [42.0, 44.51], [45.0, 47.65], [49.0, 50.87], [53.0, 82.09], [88.0, 87.81], [93.0, 104.04], [105.0, 107.79], [122.0, 130.77], [169.0, 171.22]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false], "silence_prob": [55.39, 0.0, 62.47, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 34.18, 48.52, 0.0, 42.58, 0.0, 33.97, 32.0, 34.06, 36.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 41.53], ["music", 10.84], ["speech synthesizer", 6.51]], [["mains hum", 32.02], ["hum", 18.71], ["busy signal", 12.53]], null, [["music", 77.22], ["boing", 2.34], ["thunk", 1.64]], null, [["sheep", 16.21], ["bleat", 10.11], ["screaming", 9.89]], [["livestock, farm animals, working animals", 78.88], ["moo", 9.71], ["cattle, bovinae", 5.87]], [["moo", 47.24], ["cattle, bovinae", 23.32], ["livestock, farm animals, working animals", 11.82]], [["music", 67.57], ["musical instrument", 3.62], ["cacophony", 2.4]]], "duration": [3.67, -0.23, 2.56, 6.74, 1.97, 1.61, 0.37, -0.26, 0.54, 2.51, 2.65, 1.87, 29.09, -0.19, 11.04, 2.79, 8.77, 2.22]} \ No newline at end of file diff --git a/annotations_1/kJnH45GslL0_filtered.json b/annotations_1/kJnH45GslL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c488781e4d62feb2a4cc2f670e95e53e950fd573 --- /dev/null +++ b/annotations_1/kJnH45GslL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.62], [8.0, 9.27], [14.0, 33.99], [35.0, 36.69], [41.0, 41.39], [45.0, 45.66], [49.0, 52.59], [57.0, 70.61], [72.0, 71.86], [74.0, 75.19], [76.0, 76.82], [79.0, 79.2], [79.0, 79.24], [82.0, 82.71], [86.0, 90.91], [92.0, 102.84], [105.0, 105.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 96.54, 0.0, 0.0, 0.0, 88.46, 71.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.81, 30.69, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.79], ["mains hum", 5.67], ["sonar", 3.45]], [["music", 76.82], ["speech", 6.74], ["throbbing", 2.09]], null], "duration": [1.62, 1.27, 19.99, 1.69, 0.39, 0.66, 3.59, 13.61, -0.14, 1.19, 0.82, 0.2, 0.24, 0.71, 4.91, 10.84, 0.27]} \ No newline at end of file diff --git a/annotations_1/kKBsDfBDmG0_filtered.json b/annotations_1/kKBsDfBDmG0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8b8fed6a04d890887c399b3bc623e56a69d6f0c --- /dev/null +++ b/annotations_1/kKBsDfBDmG0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.07], [15.0, 14.93], [21.0, 23.84], [28.0, 28.56], [34.0, 36.27], [39.0, 39.92], [42.0, 44.0], [45.0, 45.77], [50.0, 52.3], [53.0, 53.32], [56.0, 65.35], [67.0, 67.46], [70.0, 69.74], [72.0, 74.07], [81.0, 81.77], [87.0, 89.75], [96.0, 95.84], [101.0, 101.73], [104.0, 103.84], [104.0, 105.14], [107.0, 107.45], [114.0, 114.54], [115.0, 116.73], [129.0, 130.77], [142.0, 143.56], [144.0, 145.2], [147.0, 149.71], [152.0, 152.58], [153.0, 154.92], [157.0, 157.64], [163.0, 165.86]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 39.52, 0.0, 99.98, 0.0, 100.0, 0.0, 45.78, 0.0, 43.43, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 40.55], "audiomae_on_audioset": [null, null, [["whack, thwack", 41.61], ["smash, crash", 19.55], ["breaking", 14.18]], null, null, null, null, null, [["speech", 49.86], ["inside, small room", 3.42], ["animal", 3.35]], null, [["mains hum", 26.7], ["hum", 25.91], ["speech", 21.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.05], ["singing bowl", 14.06], ["hum", 7.69]]], "duration": [1.07, -0.07, 2.84, 0.56, 2.27, 0.92, 2.0, 0.77, 2.3, 0.32, 9.35, 0.46, -0.26, 2.07, 0.77, 2.75, -0.16, 0.73, -0.16, 1.14, 0.45, 0.54, 1.73, 1.77, 1.56, 1.2, 2.71, 0.58, 1.92, 0.64, 2.86]} \ No newline at end of file diff --git a/annotations_1/kKUsYDTykUQ_filtered.json b/annotations_1/kKUsYDTykUQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86770e89d2c350824c66c64df2368029a361dd10 --- /dev/null +++ b/annotations_1/kKUsYDTykUQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 62.36], [64.0, 64.67], [66.0, 67.86], [68.0, 120.8]], "keep_status": [true, false, false, false], "silence_prob": [28.78, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 40.43], ["buzz", 12.07], ["music", 9.29]], null, null, null], "duration": [29.36, 0.67, 1.86, 52.8]} \ No newline at end of file diff --git a/annotations_1/kL8e9CEgm6A_filtered.json b/annotations_1/kL8e9CEgm6A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45d79d27da9accd9bba413ebd0868c55e152a272 --- /dev/null +++ b/annotations_1/kL8e9CEgm6A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.78], [6.0, 6.71], [9.0, 9.9], [11.0, 13.14], [19.0, 19.79], [22.0, 26.54], [27.0, 28.7], [29.0, 29.83], [32.0, 33.3], [35.0, 37.23], [40.0, 40.71], [44.0, 49.45], [50.0, 50.97], [53.0, 53.23], [54.0, 54.57], [56.0, 56.56], [58.0, 59.17], [65.0, 65.18], [72.0, 72.57], [89.0, 101.09], [103.0, 116.14], [117.0, 130.52], [133.0, 134.27], [135.0, 135.73], [138.0, 138.57], [140.0, 140.7], [141.0, 142.84], [144.0, 150.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 82.97, 0.0, 86.09, 0.0, 0.0, 0.0, 75.72, 0.0, 72.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.32, 29.41, 30.66, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.28], ["hum", 23.51], ["mains hum", 11.92]], [["music", 47.09], ["speech", 40.72], ["hum", 2.3]], [["music", 78.87], ["hum", 5.74], ["throbbing", 2.85]], null, null, null, null, null, null], "duration": [0.78, 0.71, 0.9, 2.14, 0.79, 4.54, 1.7, 0.83, 1.3, 2.23, 0.71, 5.45, 0.97, 0.23, 0.57, 0.56, 1.17, 0.18, 0.57, 12.09, 13.14, 13.52, 1.27, 0.73, 0.57, 0.7, 1.84, 6.97]} \ No newline at end of file diff --git a/annotations_1/kLjET9nE2dQ_filtered.json b/annotations_1/kLjET9nE2dQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ade54b575db6870eb12fd46770aeccadffd16051 --- /dev/null +++ b/annotations_1/kLjET9nE2dQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.34], [18.0, 31.43], [35.0, 47.71], [48.0, 51.51], [54.0, 54.51], [57.0, 60.44], [69.0, 78.14], [79.0, 80.38], [81.0, 83.81]], "keep_status": [false, false, true, true, false, true, false, false, true], "silence_prob": [31.31, 31.9, 32.47, 30.95, 0.0, 35.47, 36.89, 0.0, 30.67], "audiomae_on_audioset": [[["speech", 37.11], ["whack, thwack", 24.01], ["groan", 14.0]], [["speech", 59.68], ["whack, thwack", 16.75], ["thump, thud", 3.94]], [["speech", 32.68], ["whack, thwack", 23.74], ["breaking", 10.47]], [["whack, thwack", 29.01], ["music", 18.1], ["smash, crash", 11.14]], null, [["speech", 40.44], ["hum", 14.32], ["mains hum", 8.48]], [["throbbing", 43.52], ["music", 16.68], ["hum", 13.0]], null, [["music", 32.99], ["hum", 8.8], ["reverberation", 5.96]]], "duration": [7.34, 13.43, 12.71, 3.51, 0.51, 3.44, 9.14, 1.38, 2.81]} \ No newline at end of file diff --git a/annotations_1/kMcvRpOOIwY_filtered.json b/annotations_1/kMcvRpOOIwY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9c3a56b40987c7e9956d8ded776b529d6d0f972 --- /dev/null +++ b/annotations_1/kMcvRpOOIwY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.34], [13.0, 13.83], [17.0, 56.57], [60.0, 95.2], [96.0, 98.59], [102.0, 106.64], [108.0, 118.59], [122.0, 122.28], [123.0, 129.61], [131.0, 153.06], [155.0, 164.61]], "keep_status": [false, false, false, false, true, true, false, false, true, true, false], "silence_prob": [29.78, 0.0, 0.0, 0.0, 31.7, 28.87, 29.24, 0.0, 29.19, 29.38, 28.93], "audiomae_on_audioset": [[["music", 84.23], ["quack", 3.29], ["animal", 1.67]], null, null, null, [["music", 21.35], ["sine wave", 7.38], ["moo", 7.02]], [["cattle, bovinae", 20.72], ["moo", 20.5], ["speech", 14.16]], [["groan", 38.75], ["music", 27.34], ["whack, thwack", 4.76]], null, [["music", 25.44], ["cattle, bovinae", 10.1], ["sheep", 7.78]], [["music", 54.89], ["speech", 5.67], ["didgeridoo", 4.2]], [["music", 76.01], ["cacophony", 2.25], ["speech", 1.5]]], "duration": [5.34, 0.83, 39.57, 35.2, 2.59, 4.64, 10.59, 0.28, 6.61, 22.06, 9.61]} \ No newline at end of file diff --git a/annotations_1/kNtopT3-5t0_filtered.json b/annotations_1/kNtopT3-5t0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..889c310a0ad0dfdcb959271ac078c46ae2abd017 --- /dev/null +++ b/annotations_1/kNtopT3-5t0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 45.3], [47.0, 47.51], [54.0, 56.61], [75.0, 75.56], [76.0, 76.76], [78.0, 82.59], [85.0, 86.7], [90.0, 91.13], [102.0, 103.45], [113.0, 113.88], [117.0, 117.69], [125.0, 126.17], [134.0, 134.28], [137.0, 138.18], [143.0, 143.02], [159.0, 160.44], [163.0, 165.42], [175.0, 175.59], [177.0, 182.73]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.17, 0.0, 0.0, 41.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.29, 0.0, 69.47], "audiomae_on_audioset": [null, null, [["speech", 44.92], ["music", 16.11], ["boing", 9.86]], null, null, [["music", 39.96], ["synthesizer", 19.04], ["musical instrument", 8.49]], null, null, null, null, null, null, null, null, null, null, [["music", 56.27], ["synthesizer", 9.44], ["speech", 5.64]], null, null], "duration": [0.3, 0.51, 2.61, 0.56, 0.76, 4.59, 1.7, 1.13, 1.45, 0.88, 0.69, 1.17, 0.28, 1.18, 0.02, 1.44, 2.42, 0.59, 5.73]} \ No newline at end of file diff --git a/annotations_1/kOe-yLCbA4E_filtered.json b/annotations_1/kOe-yLCbA4E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4eeb0e18030af615f8f2835a4cd70af810196098 --- /dev/null +++ b/annotations_1/kOe-yLCbA4E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.96], [5.0, 6.3], [10.0, 16.31], [18.0, 36.88], [38.0, 38.3], [44.0, 44.68], [46.0, 46.06], [48.0, 48.56], [49.0, 55.32], [56.0, 55.93], [57.0, 58.18], [60.0, 69.7], [72.0, 73.28], [74.0, 76.49], [82.0, 81.58], [84.0, 84.35], [86.0, 88.13], [92.0, 95.71], [96.0, 96.38], [100.0, 100.52], [102.0, 102.79], [103.0, 103.57], [108.0, 110.07], [111.0, 111.94], [113.0, 112.9], [114.0, 116.94], [117.0, 117.61], [118.0, 128.58], [133.0, 142.5], [144.0, 144.37], [145.0, 145.77], [150.0, 153.96], [155.0, 155.92]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 78.04, 46.19, 0.0, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 32.61, 0.0, 38.75, 0.0, 0.0, 66.51, 35.31, 0.0, 0.0, 0.0, 0.0, 58.05, 0.0, 0.0, 49.22, 0.0, 50.97, 38.88, 0.0, 0.0, 37.02, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 22.52], ["speech", 10.61], ["hum", 8.81]], null, null, null, null, null, null, null, [["music", 73.43], ["brass instrument", 2.92], ["musical instrument", 2.54]], null, [["didgeridoo", 43.9], ["music", 16.68], ["chop", 4.35]], null, null, null, [["music", 27.1], ["speech", 22.34], ["didgeridoo", 18.85]], null, null, null, null, null, null, null, [["noise", 14.61], ["music", 8.65], ["mains hum", 6.11]], null, null, [["music", 64.47], ["wind instrument, woodwind instrument", 4.45], ["brass instrument", 3.19]], null, null, [["noise", 18.82], ["mains hum", 16.67], ["hum", 16.48]], null], "duration": [1.96, 1.3, 6.31, 18.88, 0.3, 0.68, 0.06, 0.56, 6.32, -0.07, 1.18, 9.7, 1.28, 2.49, -0.42, 0.35, 2.13, 3.71, 0.38, 0.52, 0.79, 0.57, 2.07, 0.94, -0.1, 2.94, 0.61, 10.58, 9.5, 0.37, 0.77, 3.96, 0.92]} \ No newline at end of file diff --git a/annotations_1/kOfY6wIKT40_filtered.json b/annotations_1/kOfY6wIKT40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71b544fafc805a4dd67c9ccc853ebc6273da2b63 --- /dev/null +++ b/annotations_1/kOfY6wIKT40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.49], [4.0, 4.09], [5.0, 9.42], [11.0, 11.25], [13.0, 15.38], [16.0, 17.64], [20.0, 20.14], [21.0, 21.68], [27.0, 26.62], [32.0, 32.41], [33.0, 43.44], [45.0, 45.89], [47.0, 47.48], [48.0, 48.49], [49.0, 49.84], [51.0, 51.17], [52.0, 52.84], [54.0, 54.97], [58.0, 59.19], [60.0, 61.3], [62.0, 62.51], [64.0, 64.93], [65.0, 67.46], [68.0, 75.56], [77.0, 77.8], [79.0, 79.66], [84.0, 84.2], [85.0, 85.33], [88.0, 88.82], [91.0, 91.69], [95.0, 94.91], [96.0, 96.2], [97.0, 98.29], [99.0, 100.04], [103.0, 104.6], [105.0, 105.43], [105.0, 106.39], [108.0, 109.17], [110.0, 110.05], [110.0, 110.59], [111.0, 112.11], [113.0, 113.24], [114.0, 114.89], [116.0, 116.95], [119.0, 118.93], [120.0, 120.7], [122.0, 123.84], [125.0, 129.78], [130.0, 130.81], [132.0, 133.08], [134.0, 134.96], [137.0, 144.46], [146.0, 146.57], [152.0, 156.02], [158.0, 158.62], [159.0, 161.64], [165.0, 166.01], [166.0, 167.29], [168.0, 177.09], [178.0, 179.41]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.2, 0.0, 41.4, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.25, 97.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.25, 0.0, 0.0, 0.0, 48.35, 0.0, 48.44, 0.0, 60.14, 0.0, 0.0, 49.45, 0.0], "audiomae_on_audioset": [null, null, [["music", 26.8], ["musical instrument", 11.14], ["guitar", 10.74]], null, [["theremin", 55.33], ["music", 19.16], ["speech", 14.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 55.38], ["music", 24.99], ["synthesizer", 3.99]], null, [["theremin", 47.35], ["music", 34.1], ["synthesizer", 5.32]], null, null, null, null, [["theremin", 56.85], ["music", 20.41], ["synthesizer", 6.3]], null], "duration": [0.49, 0.09, 4.42, 0.25, 2.38, 1.64, 0.14, 0.68, -0.38, 0.41, 10.44, 0.89, 0.48, 0.49, 0.84, 0.17, 0.84, 0.97, 1.19, 1.3, 0.51, 0.93, 2.46, 7.56, 0.8, 0.66, 0.2, 0.33, 0.82, 0.69, -0.09, 0.2, 1.29, 1.04, 1.6, 0.43, 1.39, 1.17, 0.05, 0.59, 1.11, 0.24, 0.89, 0.95, -0.07, 0.7, 1.84, 4.78, 0.81, 1.08, 0.96, 7.46, 0.57, 4.02, 0.62, 2.64, 1.01, 1.29, 9.09, 1.41]} \ No newline at end of file diff --git a/annotations_1/kP5GKIrGoeQ_filtered.json b/annotations_1/kP5GKIrGoeQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d28419f9ba27271ebc67af7d76dde4e782e44f22 --- /dev/null +++ b/annotations_1/kP5GKIrGoeQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.48], [11.0, 12.21], [13.0, 22.2], [24.0, 25.91], [27.0, 28.98], [30.0, 35.56], [36.0, 44.91], [46.0, 46.5], [47.0, 49.91], [52.0, 53.91], [55.0, 57.45], [58.0, 59.78], [60.0, 61.72], [62.0, 66.34], [68.0, 71.12], [73.0, 74.17], [74.0, 77.38], [79.0, 82.34], [84.0, 86.76], [88.0, 89.58], [90.0, 94.71], [96.0, 96.79], [97.0, 99.87], [104.0, 105.29], [107.0, 107.99], [112.0, 115.97], [117.0, 119.69], [122.0, 123.7], [124.0, 125.88], [127.0, 129.76], [131.0, 135.65], [138.0, 139.72], [141.0, 149.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.81, 0.0, 81.89, 0.0, 0.0, 99.16, 78.55, 0.0, 71.72, 0.0, 99.44, 0.0, 0.0, 57.89, 97.33, 0.0, 71.29, 98.73, 69.34, 0.0, 76.53, 0.0, 81.17, 0.0, 0.0, 70.86, 92.15, 0.0, 0.0, 98.01, 97.83, 0.0, 87.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.48, 1.21, 9.2, 1.91, 1.98, 5.56, 8.91, 0.5, 2.91, 1.91, 2.45, 1.78, 1.72, 4.34, 3.12, 1.17, 3.38, 3.34, 2.76, 1.58, 4.71, 0.79, 2.87, 1.29, 0.99, 3.97, 2.69, 1.7, 1.88, 2.76, 4.65, 1.72, 8.49]} \ No newline at end of file diff --git a/annotations_1/kPE7ZCGjw4o_filtered.json b/annotations_1/kPE7ZCGjw4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77b3e79024c3b049f99959d069627b091af09ad6 --- /dev/null +++ b/annotations_1/kPE7ZCGjw4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.27], [7.0, 27.01], [30.0, 41.37], [47.0, 48.19], [54.0, 56.12], [60.0, 60.0], [61.0, 61.32], [62.0, 65.69], [67.0, 67.32], [83.0, 83.94], [99.0, 99.3], [99.0, 99.77], [100.0, 107.18], [109.0, 117.91], [120.0, 125.46], [126.0, 125.71], [126.0, 129.07], [131.0, 132.83], [136.0, 136.41], [141.0, 142.33], [159.0, 159.21], [165.0, 168.74], [170.0, 171.05], [172.0, 172.5], [173.0, 173.8], [179.0, 179.49], [180.0, 185.46], [187.0, 195.2], [196.0, 196.08], [197.0, 196.75], [199.0, 198.8], [200.0, 200.35], [204.0, 204.87], [207.0, 207.66], [212.0, 214.91], [216.0, 217.24]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.6, 34.14, 0.0, 31.48, 0.0, 0.0, 31.32, 0.0, 0.0, 0.0, 0.0, 34.03, 34.65, 39.47, 0.0, 72.46, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 33.38, 48.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.09, 0.0], "audiomae_on_audioset": [null, [["music", 69.13], ["speech", 18.15], ["throbbing", 3.53]], [["speech", 38.44], ["animal", 8.62], ["music", 5.31]], null, [["music", 62.96], ["speech", 15.16], ["skidding", 1.07]], null, null, [["speech", 58.35], ["music", 19.33], ["didgeridoo", 2.4]], null, null, null, null, [["music", 71.09], ["speech", 4.31], ["fart", 2.94]], [["music", 42.92], ["speech", 9.95], ["throbbing", 5.18]], [["speech", 53.49], ["crack", 13.34], ["sidetone", 12.66]], null, null, null, null, null, null, null, null, null, null, null, [["roar", 42.3], ["creak", 19.98], ["whale vocalization", 6.75]], [["music", 51.24], ["fly, housefly", 8.73], ["mosquito", 7.51]], null, null, null, null, null, null, [["music", 69.96], ["didgeridoo", 2.19], ["wind instrument, woodwind instrument", 1.98]], null], "duration": [0.27, 20.01, 11.37, 1.19, 2.12, 0.0, 0.32, 3.69, 0.32, 0.94, 0.3, 0.77, 7.18, 8.91, 5.46, -0.29, 3.07, 1.83, 0.41, 1.33, 0.21, 3.74, 1.05, 0.5, 0.8, 0.49, 5.46, 8.2, 0.08, -0.25, -0.2, 0.35, 0.87, 0.66, 2.91, 1.24]} \ No newline at end of file diff --git a/annotations_1/kPNy_yGvpKI_filtered.json b/annotations_1/kPNy_yGvpKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4126b8d4f157a070ba94a56a30b75a297cd02ee4 --- /dev/null +++ b/annotations_1/kPNy_yGvpKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.81], [15.0, 14.89], [19.0, 19.65], [21.0, 21.3], [25.0, 56.96], [58.0, 58.41], [59.0, 60.15], [62.0, 72.64], [79.0, 100.36], [105.0, 105.71], [106.0, 107.11]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.72, 43.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 39.34], ["cattle, bovinae", 15.26], ["moo", 9.32]], [["speech", 31.95], ["fly, housefly", 8.49], ["hum", 7.32]], null, null], "duration": [1.81, -0.11, 0.65, 0.3, 31.96, 0.41, 1.15, 10.64, 21.36, 0.71, 1.11]} \ No newline at end of file diff --git a/annotations_1/kPXFWplmSyA_filtered.json b/annotations_1/kPXFWplmSyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32f155d20a355d232fa0d2f2e764547f2657a9a5 --- /dev/null +++ b/annotations_1/kPXFWplmSyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 24.48], [26.0, 27.89], [29.0, 30.21], [36.0, 39.72], [41.0, 41.86], [43.0, 43.93], [45.0, 46.16], [47.0, 50.18], [55.0, 55.32], [57.0, 57.59], [59.0, 62.5], [63.0, 63.54], [66.0, 66.56], [68.0, 68.88], [69.0, 72.12], [75.0, 79.08], [83.0, 83.29], [85.0, 88.05], [91.0, 92.72], [95.0, 96.01], [98.0, 100.09], [102.0, 103.52], [105.0, 112.19], [112.0, 112.23], [114.0, 113.68], [114.0, 113.85], [118.0, 129.02], [130.0, 130.92], [132.0, 133.22], [134.0, 134.84], [138.0, 140.17], [144.0, 163.53], [165.0, 165.55], [166.0, 166.8], [167.0, 170.23], [171.0, 176.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.11, 0.0, 0.0, 95.09, 0.0, 0.0, 0.0, 75.23, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 44.07, 51.71, 0.0, 77.87, 0.0, 0.0, 67.38, 0.0, 32.39, 0.0, 0.0, 0.0, 31.31, 0.0, 0.0, 0.0, 57.48, 52.05, 0.0, 0.0, 61.67, 80.11], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.38], ["music", 13.76], ["hum", 5.14]], null, null, null, null, null, null, null, [["speech", 51.32], ["radio", 5.86], ["noise", 5.75]], null, null, null, [["music", 53.57], ["cacophony", 10.27], ["speech", 9.07]], null, null, null, null, null, null, null, null, null], "duration": [2.48, 1.89, 1.21, 3.72, 0.86, 0.93, 1.16, 3.18, 0.32, 0.59, 3.5, 0.54, 0.56, 0.88, 3.12, 4.08, 0.29, 3.05, 1.72, 1.01, 2.09, 1.52, 7.19, 0.23, -0.32, -0.15, 11.02, 0.92, 1.22, 0.84, 2.17, 19.53, 0.55, 0.8, 3.23, 5.89]} \ No newline at end of file diff --git a/annotations_1/kPiMgLB7S7c_filtered.json b/annotations_1/kPiMgLB7S7c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..372316319d0aa6ec4c700bfa606ba3236fcaf950 --- /dev/null +++ b/annotations_1/kPiMgLB7S7c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.06], [9.0, 24.58], [26.0, 28.41], [29.0, 31.53], [32.0, 32.71], [38.0, 40.29], [45.0, 46.31], [48.0, 48.66], [49.0, 49.1], [50.0, 50.33], [65.0, 82.54], [93.0, 94.32], [100.0, 99.94], [102.0, 106.37], [107.0, 118.72], [120.0, 120.87], [124.0, 125.64], [137.0, 139.53], [141.0, 142.45], [143.0, 145.37], [146.0, 168.69]], "keep_status": [false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.38, 30.74, 29.89, 0.0, 29.55, 0.0, 0.0, 0.0, 0.0, 29.89, 0.0, 0.0, 38.84, 55.18, 0.0, 0.0, 37.82, 0.0, 91.64, 67.13], "audiomae_on_audioset": [null, [["hum", 42.94], ["mains hum", 23.44], ["music", 16.86]], [["music", 47.47], ["theremin", 27.44], ["musical instrument", 3.43]], [["speech", 42.81], ["explosion", 12.44], ["whack, thwack", 10.85]], null, [["music", 18.22], ["speech", 14.48], ["whoosh, swoosh, swish", 12.7]], null, null, null, null, [["music", 30.84], ["hum", 14.51], ["electronic music", 7.64]], null, null, [["mains hum", 37.07], ["hum", 36.0], ["throbbing", 9.22]], null, null, null, [["hum", 29.83], ["music", 21.79], ["mains hum", 21.09]], null, null, null], "duration": [1.06, 15.58, 2.41, 2.53, 0.71, 2.29, 1.31, 0.66, 0.1, 0.33, 17.54, 1.32, -0.06, 4.37, 11.72, 0.87, 1.64, 2.53, 1.45, 2.37, 22.69]} \ No newline at end of file diff --git a/annotations_1/kRNhyHiBUXs_filtered.json b/annotations_1/kRNhyHiBUXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34e54b964e1f47cf9f3882dfba060b49f104d4c0 --- /dev/null +++ b/annotations_1/kRNhyHiBUXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.79], [20.0, 22.18], [23.0, 24.06], [25.0, 26.84], [35.0, 35.45], [43.0, 43.24], [49.0, 48.95], [50.0, 51.02], [59.0, 59.81], [61.0, 62.61], [82.0, 83.52], [86.0, 86.97], [102.0, 102.63], [104.0, 105.78], [109.0, 109.56], [110.0, 112.73], [114.0, 114.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 89.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 2.18, 1.06, 1.84, 0.45, 0.24, -0.05, 1.02, 0.81, 1.61, 1.52, 0.97, 0.63, 1.78, 0.56, 2.73, 0.56]} \ No newline at end of file diff --git a/annotations_1/kRuKg_khl8Q_filtered.json b/annotations_1/kRuKg_khl8Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..435795a403c3dba48e06fe55754bb56363bacc1c --- /dev/null +++ b/annotations_1/kRuKg_khl8Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 17.68], [22.0, 25.08], [28.0, 28.27], [31.0, 39.16], [45.0, 48.17], [54.0, 55.14], [55.0, 55.17], [55.0, 55.21], [55.0, 55.34], [55.0, 55.49], [58.0, 61.45], [65.0, 66.8], [68.0, 68.66], [69.0, 69.57], [72.0, 71.73], [72.0, 83.44], [92.0, 100.65], [103.0, 108.6], [111.0, 110.86], [111.0, 114.3], [122.0, 121.9], [123.0, 124.77], [127.0, 129.81], [130.0, 131.11], [134.0, 139.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [59.33, 52.45, 0.0, 53.28, 43.45, 0.0, 0.0, 0.0, 0.0, 0.0, 43.66, 0.0, 0.0, 0.0, 0.0, 38.62, 36.52, 39.6, 0.0, 90.43, 0.0, 0.0, 71.43, 0.0, 87.19], "audiomae_on_audioset": [null, null, null, null, [["music", 59.95], ["bass guitar", 7.16], ["guitar", 5.7]], null, null, null, null, null, [["music", 84.01], ["musical instrument", 2.45], ["guitar", 1.47]], null, null, null, null, [["music", 83.26], ["bass guitar", 4.38], ["musical instrument", 1.57]], [["music", 87.96], ["musical instrument", 1.3], ["soundtrack music", 0.41]], [["music", 42.41], ["bass guitar", 8.44], ["guitar", 8.18]], null, null, null, null, null, null, null], "duration": [5.68, 3.08, 0.27, 8.16, 3.17, 1.14, 0.17, 0.21, 0.34, 0.49, 3.45, 1.8, 0.66, 0.57, -0.27, 11.44, 8.65, 5.6, -0.14, 3.3, -0.1, 1.77, 2.81, 1.11, 5.67]} \ No newline at end of file diff --git a/annotations_1/kSQaXjYkZpc_filtered.json b/annotations_1/kSQaXjYkZpc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcc142c942463220d1db8f25574c01043fe596d1 --- /dev/null +++ b/annotations_1/kSQaXjYkZpc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 21.47], [29.0, 48.96], [63.0, 63.68], [76.0, 87.22], [90.0, 94.34], [100.0, 100.57], [113.0, 122.81], [124.0, 124.38], [127.0, 133.17], [138.0, 143.04], [146.0, 148.86], [149.0, 159.26], [163.0, 163.58], [165.0, 166.6], [168.0, 172.64]], "keep_status": [true, true, false, true, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [29.67, 29.43, 0.0, 29.07, 31.15, 0.0, 29.8, 0.0, 31.24, 30.51, 28.81, 30.4, 0.0, 0.0, 30.69], "audiomae_on_audioset": [[["speech", 31.9], ["music", 18.68], ["boing", 16.88]], [["livestock, farm animals, working animals", 24.51], ["cattle, bovinae", 23.1], ["moo", 13.79]], null, [["music", 45.43], ["speech", 4.91], ["sound effect", 4.81]], [["music", 34.68], ["speech", 33.7], ["sidetone", 3.17]], null, [["speech", 59.46], ["music", 16.32], ["outside, rural or natural", 2.79]], null, [["music", 52.74], ["cattle, bovinae", 5.07], ["moo", 4.95]], [["cattle, bovinae", 44.85], ["moo", 21.23], ["livestock, farm animals, working animals", 7.82]], [["music", 36.57], ["mosquito", 15.94], ["fly, housefly", 12.35]], [["music", 39.51], ["speech", 35.93], ["vehicle", 1.96]], null, null, [["music", 18.81], ["hum", 12.46], ["noise", 11.6]]], "duration": [16.47, 19.96, 0.68, 11.22, 4.34, 0.57, 9.81, 0.38, 6.17, 5.04, 2.86, 10.26, 0.58, 1.6, 4.64]} \ No newline at end of file diff --git a/annotations_1/kS_QskTI8WI_filtered.json b/annotations_1/kS_QskTI8WI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40e9defc43bc143c78aa810cf451971b319a9e09 --- /dev/null +++ b/annotations_1/kS_QskTI8WI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 47.22], [50.0, 54.94], [62.0, 80.77], [81.0, 84.55], [86.0, 87.08], [88.0, 95.34], [99.0, 100.35], [101.0, 104.85], [106.0, 106.46], [109.0, 124.95], [127.0, 128.11], [133.0, 139.26], [141.0, 142.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [78.04, 65.67, 59.15, 83.16, 0.0, 72.46, 0.0, 63.42, 0.0, 51.18, 0.0, 65.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.22, 4.94, 18.77, 3.55, 1.08, 7.34, 1.35, 3.85, 0.46, 15.95, 1.11, 6.26, 1.57]} \ No newline at end of file diff --git a/annotations_1/kSaOMRXiLVA_filtered.json b/annotations_1/kSaOMRXiLVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..247eb6fb9fb8e59911cbe7f7a1241b08363f2bed --- /dev/null +++ b/annotations_1/kSaOMRXiLVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.19], [16.0, 17.32], [18.0, 18.49], [27.0, 27.99], [29.0, 29.25], [31.0, 36.66], [41.0, 41.76], [43.0, 46.94], [48.0, 49.81], [51.0, 77.21], [79.0, 84.84], [89.0, 96.06], [97.0, 98.71], [103.0, 113.14], [116.0, 116.94], [120.0, 123.67]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.84, 0.0, 39.8, 0.0, 29.6, 31.05, 36.58, 0.0, 44.26, 0.0, 57.17], "audiomae_on_audioset": [null, null, null, null, null, [["music", 53.26], ["theremin", 11.21], ["effects unit", 7.9]], null, [["hum", 36.13], ["mains hum", 15.25], ["speech", 11.32]], null, [["music", 61.47], ["speech", 10.93], ["synthesizer", 4.6]], [["music", 47.31], ["sidetone", 11.93], ["speech", 10.59]], [["music", 39.43], ["fart", 4.57], ["synthesizer", 4.18]], null, [["insect", 39.31], ["music", 13.61], ["mosquito", 9.17]], null, null], "duration": [1.19, 1.32, 0.49, 0.99, 0.25, 5.66, 0.76, 3.94, 1.81, 26.21, 5.84, 7.06, 1.71, 10.14, 0.94, 3.67]} \ No newline at end of file diff --git a/annotations_1/kSmAfIP9CoQ_filtered.json b/annotations_1/kSmAfIP9CoQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4928f950ca646f4c00d6cdd08218ad887e6e50dd --- /dev/null +++ b/annotations_1/kSmAfIP9CoQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.21], [12.0, 12.36], [14.0, 15.16], [19.0, 19.65], [22.0, 25.61], [28.0, 28.49], [30.0, 31.67], [33.0, 33.99], [36.0, 35.82], [39.0, 42.65], [44.0, 49.4], [50.0, 55.34], [57.0, 59.61], [62.0, 83.39], [84.0, 98.46], [102.0, 103.01], [104.0, 103.92], [104.0, 145.23], [146.0, 146.42]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, true, false, false, false, false, false, false], "silence_prob": [40.28, 0.0, 0.0, 0.0, 45.11, 0.0, 0.0, 0.0, 0.0, 34.82, 33.4, 33.1, 33.36, 32.42, 34.42, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 64.14], ["pulse", 5.68], ["croak", 2.68]], null, null, null, [["music", 63.73], ["hum", 3.2], ["ambient music", 3.18]], null, null, null, null, [["music", 23.42], ["mains hum", 23.38], ["hum", 18.4]], [["speech", 33.26], ["vehicle", 12.49], ["hum", 8.34]], [["hum", 24.01], ["music", 23.56], ["mains hum", 10.87]], [["music", 45.47], ["whip", 11.61], ["electronic music", 4.0]], [["music", 67.37], ["electronic music", 5.38], ["speech", 5.06]], [["hum", 36.58], ["mains hum", 25.09], ["throbbing", 22.45]], null, null, null, null], "duration": [2.21, 0.36, 1.16, 0.65, 3.61, 0.49, 1.67, 0.99, -0.18, 3.65, 5.4, 5.34, 2.61, 21.39, 14.46, 1.01, -0.08, 41.23, 0.42]} \ No newline at end of file diff --git a/annotations_1/kTNDYiONld8_filtered.json b/annotations_1/kTNDYiONld8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92c5c59500a48559a2e00bf733db7dd1024d33ab --- /dev/null +++ b/annotations_1/kTNDYiONld8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 133.96], [134.0, 162.51]], "keep_status": [false, false], "silence_prob": [0.0, 29.04], "audiomae_on_audioset": [null, [["music", 66.75], ["throbbing", 10.65], ["hum", 4.99]]], "duration": [88.96, 28.51]} \ No newline at end of file diff --git a/annotations_1/kTUnQubJMoc_filtered.json b/annotations_1/kTUnQubJMoc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e0d249262e4abf6357525c60032f6c16ba3275c --- /dev/null +++ b/annotations_1/kTUnQubJMoc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.67], [26.0, 26.38], [31.0, 32.95], [37.0, 39.46], [40.0, 65.6], [66.0, 67.39], [68.0, 71.85], [72.0, 92.94], [94.0, 111.97], [115.0, 116.92], [118.0, 119.89], [121.0, 121.41], [127.0, 127.67], [129.0, 130.49]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 78.55, 34.73, 0.0, 98.8, 96.42, 67.89, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sine wave", 19.76], ["music", 13.78], ["noise", 11.87]], null, null, null, null, null, null, null, null, null], "duration": [0.67, 0.38, 1.95, 2.46, 25.6, 1.39, 3.85, 20.94, 17.97, 1.92, 1.89, 0.41, 0.67, 1.49]} \ No newline at end of file diff --git a/annotations_1/kT_dXxp7eAo_filtered.json b/annotations_1/kT_dXxp7eAo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..815c10429a1ce3a949595c895f755e086cb11c91 --- /dev/null +++ b/annotations_1/kT_dXxp7eAo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.5], [14.0, 15.01], [16.0, 20.01], [27.0, 30.33], [33.0, 51.02], [52.0, 52.98], [55.0, 56.32], [61.0, 72.25], [76.0, 76.99], [80.0, 92.6], [99.0, 102.03], [103.0, 103.03], [103.0, 103.5], [104.0, 104.53], [105.0, 107.72]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [41.03, 0.0, 31.08, 35.35, 32.07, 0.0, 0.0, 31.71, 0.0, 32.96, 32.59, 0.0, 0.0, 0.0, 31.0], "audiomae_on_audioset": [[["music", 24.34], ["throbbing", 6.82], ["hum", 4.49]], null, [["music", 60.33], ["sidetone", 7.07], ["throbbing", 4.1]], [["music", 75.78], ["sidetone", 3.3], ["electronic music", 2.34]], [["music", 42.78], ["speech", 31.22], ["throbbing", 2.55]], null, null, [["music", 39.62], ["speech", 23.26], ["hum", 10.08]], null, [["music", 72.83], ["speech", 6.01], ["musical instrument", 3.72]], [["music", 44.87], ["electronic music", 10.81], ["throbbing", 7.29]], null, null, null, [["music", 46.46], ["throbbing", 9.1], ["fly, housefly", 4.98]]], "duration": [2.5, 1.01, 4.01, 3.33, 18.02, 0.98, 1.32, 11.25, 0.99, 12.6, 3.03, 0.03, 0.5, 0.53, 2.72]} \ No newline at end of file diff --git a/annotations_1/kTtxe4pWpfQ_filtered.json b/annotations_1/kTtxe4pWpfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/kTtxe4pWpfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/kU74wgKk8lo_filtered.json b/annotations_1/kU74wgKk8lo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6a204622030dc7c55fb08215cf1576f2c3e4d968 --- /dev/null +++ b/annotations_1/kU74wgKk8lo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.56], [18.0, 20.53], [26.0, 26.08], [28.0, 31.11], [32.0, 32.93], [34.0, 35.21], [39.0, 40.83], [43.0, 43.5], [45.0, 45.1], [49.0, 49.86], [51.0, 52.17], [53.0, 61.65], [63.0, 65.04], [65.0, 83.94], [85.0, 89.65], [92.0, 122.61]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 48.95, 0.0, 36.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.51, 29.62, 30.83, 30.03, 0.0], "audiomae_on_audioset": [null, [["speech", 24.99], ["whale vocalization", 13.64], ["fly, housefly", 9.16]], null, [["speech", 53.42], ["hum", 8.01], ["music", 6.09]], null, null, null, null, null, null, null, null, [["music", 65.77], ["breaking", 12.18], ["thump, thud", 3.5]], [["hum", 23.54], ["speech", 14.82], ["music", 10.5]], [["whale vocalization", 50.8], ["livestock, farm animals, working animals", 12.78], ["music", 7.56]], null], "duration": [0.56, 2.53, 0.08, 3.11, 0.93, 1.21, 1.83, 0.5, 0.1, 0.86, 1.17, 8.65, 2.04, 18.94, 4.65, 30.61]} \ No newline at end of file diff --git a/annotations_1/kVbmTKqZ31M_filtered.json b/annotations_1/kVbmTKqZ31M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a00a605d4c2710e835281435810e0616cca93e9 --- /dev/null +++ b/annotations_1/kVbmTKqZ31M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.94], [11.0, 11.8], [13.0, 17.39], [19.0, 24.17], [25.0, 32.85], [34.0, 35.8], [37.0, 42.87], [47.0, 50.48], [51.0, 55.78], [58.0, 58.92], [61.0, 62.18], [63.0, 64.81], [66.0, 72.2], [73.0, 74.49], [76.0, 76.35], [78.0, 81.51], [86.0, 86.78], [89.0, 93.46]], "keep_status": [true, false, true, true, true, false, true, true, true, false, false, false, true, false, false, true, false, true], "silence_prob": [43.43, 0.0, 44.93, 36.73, 39.91, 0.0, 36.47, 48.74, 35.84, 0.0, 0.0, 0.0, 39.15, 0.0, 0.0, 39.24, 0.0, 41.03], "audiomae_on_audioset": [[["music", 36.62], ["sonar", 25.49], ["whale vocalization", 4.23]], null, [["sine wave", 25.21], ["hum", 24.36], ["chirp tone", 12.02]], [["hum", 18.12], ["sonar", 14.22], ["music", 13.98]], [["sonar", 28.09], ["hum", 26.91], ["music", 11.04]], null, [["throbbing", 22.98], ["rumble", 14.12], ["hum", 14.04]], [["music", 22.65], ["speech", 21.68], ["rumble", 5.53]], [["speech", 38.4], ["music", 9.2], ["hum", 9.15]], null, null, null, [["speech", 31.49], ["gong", 12.54], ["music", 11.5]], null, null, [["speech", 32.32], ["music", 18.91], ["whale vocalization", 5.07]], null, [["music", 53.33], ["musical instrument", 4.39], ["theremin", 4.02]]], "duration": [3.94, 0.8, 4.39, 5.17, 7.85, 1.8, 5.87, 3.48, 4.78, 0.92, 1.18, 1.81, 6.2, 1.49, 0.35, 3.51, 0.78, 4.46]} \ No newline at end of file diff --git a/annotations_1/kVujmsfAIUk_filtered.json b/annotations_1/kVujmsfAIUk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..effd36ef0659e2f3bf200f7979f89bf4e6bf3904 --- /dev/null +++ b/annotations_1/kVujmsfAIUk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.11], [26.0, 27.11], [28.0, 47.75], [48.0, 48.93], [51.0, 51.63], [54.0, 54.55], [55.0, 56.32], [58.0, 64.03], [65.0, 65.74], [70.0, 70.24], [71.0, 71.39], [80.0, 80.15], [82.0, 81.84], [83.0, 87.56], [89.0, 89.67], [99.0, 99.5], [102.0, 102.9], [110.0, 114.91], [117.0, 117.44], [125.0, 125.56], [127.0, 127.68], [131.0, 131.45], [132.0, 136.61], [137.0, 136.71], [137.0, 137.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 54.7, 0.0, 0.0, 0.0, 0.0, 39.82, 0.0, 0.0, 0.0, 0.0, 0.0, 38.35, 0.0, 0.0, 0.0, 41.7, 0.0, 0.0, 0.0, 0.0, 40.55, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 60.48], ["sidetone", 13.09], ["noise", 10.35]], null, null, null, null, null, [["speech", 77.13], ["sidetone", 5.67], ["speech synthesizer", 5.23]], null, null, null, [["speech", 78.7], ["sidetone", 2.03], ["grunt", 1.56]], null, null, null, null, [["speech", 71.56], ["radio", 8.18], ["male speech, man speaking", 3.25]], null, null], "duration": [1.11, 1.11, 19.75, 0.93, 0.63, 0.55, 1.32, 6.03, 0.74, 0.24, 0.39, 0.15, -0.16, 4.56, 0.67, 0.5, 0.9, 4.91, 0.44, 0.56, 0.68, 0.45, 4.61, -0.29, 0.37]} \ No newline at end of file diff --git a/annotations_1/kWHOafRR0Sk_filtered.json b/annotations_1/kWHOafRR0Sk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9d8bc2e434f279e6266cab8e84d1d625e022cf4 --- /dev/null +++ b/annotations_1/kWHOafRR0Sk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 31.95], [33.0, 33.32], [34.0, 37.59], [43.0, 43.44], [47.0, 48.61], [50.0, 52.89], [90.0, 91.0]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.71, 0.0, 0.0, 87.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.95, 0.32, 3.59, 0.44, 1.61, 2.89, 1.0]} \ No newline at end of file diff --git a/annotations_1/kXXnZuu72DA_filtered.json b/annotations_1/kXXnZuu72DA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aaf5cd179e3390457e19e45129f917695172209d --- /dev/null +++ b/annotations_1/kXXnZuu72DA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.49], [13.0, 20.41], [21.0, 20.61], [21.0, 20.93], [22.0, 41.2], [42.0, 59.97], [62.0, 78.04], [80.0, 80.22], [81.0, 95.22], [96.0, 96.2], [100.0, 107.42]], "keep_status": [false, true, false, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 30.78, 0.0, 0.0, 31.54, 30.62, 30.74, 0.0, 30.02, 0.0, 30.79], "audiomae_on_audioset": [null, [["music", 43.16], ["didgeridoo", 17.54], ["animal", 7.38]], null, null, [["music", 63.67], ["speech", 16.1], ["whack, thwack", 3.03]], [["music", 52.41], ["speech", 11.34], ["fly, housefly", 4.39]], [["music", 59.38], ["speech", 4.39], ["musical instrument", 4.11]], null, [["music", 66.07], ["animal", 8.24], ["ding", 2.56]], null, [["music", 42.29], ["trombone", 14.86], ["musical instrument", 6.36]]], "duration": [0.49, 7.41, -0.39, -0.07, 19.2, 17.97, 16.04, 0.22, 14.22, 0.2, 7.42]} \ No newline at end of file diff --git a/annotations_1/kXvNxXDDHSY_filtered.json b/annotations_1/kXvNxXDDHSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37b88c37d0ab56c0a443e5bda67b1434f32dfe4c --- /dev/null +++ b/annotations_1/kXvNxXDDHSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.59], [21.0, 21.78], [24.0, 24.71], [29.0, 29.74], [32.0, 32.88], [41.0, 41.94], [43.0, 42.99], [52.0, 51.75], [64.0, 64.76], [68.0, 69.13], [73.0, 73.48], [81.0, 80.77], [90.0, 90.44], [102.0, 101.88], [124.0, 124.23], [125.0, 126.55], [149.0, 150.6], [152.0, 151.75], [153.0, 159.73], [163.0, 164.52], [166.0, 166.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.44, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 83.63], ["boing", 3.51], ["theremin", 0.91]], null, null], "duration": [0.59, 0.78, 0.71, 0.74, 0.88, 0.94, -0.01, -0.25, 0.76, 1.13, 0.48, -0.23, 0.44, -0.12, 0.23, 1.55, 1.6, -0.25, 6.73, 1.52, 0.75]} \ No newline at end of file diff --git a/annotations_1/kYFrx0jdcoY_filtered.json b/annotations_1/kYFrx0jdcoY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1ab74cb50b00d2bfd9f76042f4c35f7be856d09 --- /dev/null +++ b/annotations_1/kYFrx0jdcoY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.52], [13.0, 13.51], [16.0, 16.48], [18.0, 17.85], [26.0, 26.97], [29.0, 31.14], [33.0, 33.47], [37.0, 37.86], [38.0, 38.62], [43.0, 43.33], [50.0, 51.65], [53.0, 56.52], [62.0, 77.62], [83.0, 96.55], [98.0, 97.82], [98.0, 99.23], [100.0, 100.97], [103.0, 103.79], [109.0, 109.56], [110.0, 113.81], [114.0, 116.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 95.91, 36.59, 37.26, 0.0, 0.0, 0.0, 0.0, 0.0, 35.4, 50.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["vehicle", 15.73], ["hum", 13.09], ["car", 9.56]], [["buzz", 21.48], ["hum", 12.0], ["noise", 8.64]], null, null, null, null, null, [["vehicle", 49.06], ["car", 17.53], ["speech", 11.45]], null], "duration": [0.52, 0.51, 0.48, -0.15, 0.97, 2.14, 0.47, 0.86, 0.62, 0.33, 1.65, 3.52, 15.62, 13.55, -0.18, 1.23, 0.97, 0.79, 0.56, 3.81, 2.33]} \ No newline at end of file diff --git a/annotations_1/kYlPBN4yMe0_filtered.json b/annotations_1/kYlPBN4yMe0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8163b4b119a07ae8b6f700574394f1a0aa8f8e2b --- /dev/null +++ b/annotations_1/kYlPBN4yMe0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 19.25], [35.0, 35.82], [41.0, 69.06], [71.0, 98.56], [102.0, 128.93], [131.0, 147.45], [148.0, 158.33], [158.0, 158.63], [159.0, 159.16], [159.0, 169.26]], "keep_status": [false, false, false, true, true, false, false, false, false, false], "silence_prob": [29.72, 0.0, 29.04, 29.37, 29.64, 29.56, 33.49, 0.0, 0.0, 35.07], "audiomae_on_audioset": [[["speech", 81.07], ["vehicle", 2.46], ["music", 1.8]], null, [["cattle, bovinae", 49.99], ["moo", 28.35], ["livestock, farm animals, working animals", 15.06]], [["hum", 21.72], ["music", 16.97], ["mains hum", 9.18]], [["music", 21.59], ["grunt", 18.12], ["groan", 14.18]], [["speech", 36.24], ["music", 20.36], ["hum", 14.36]], [["hum", 51.9], ["mains hum", 16.49], ["throbbing", 10.49]], null, null, [["music", 33.71], ["grunt", 27.88], ["hum", 12.79]]], "duration": [9.25, 0.82, 28.06, 27.56, 26.93, 16.45, 10.33, 0.63, 0.16, 10.26]} \ No newline at end of file diff --git a/annotations_1/kZCgrTDVRbI_filtered.json b/annotations_1/kZCgrTDVRbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2beb562a57f7a67e8c0eefae0b495df85962ae9b --- /dev/null +++ b/annotations_1/kZCgrTDVRbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.21], [6.0, 6.76], [8.0, 9.34], [11.0, 11.82], [12.0, 14.25], [19.0, 20.33], [22.0, 23.45], [28.0, 29.66], [38.0, 47.33], [50.0, 51.12], [64.0, 68.96], [76.0, 76.5], [77.0, 76.71], [77.0, 77.26], [88.0, 94.07], [108.0, 111.08], [112.0, 112.75], [114.0, 116.11], [118.0, 118.22], [127.0, 130.18], [135.0, 135.58], [136.0, 137.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.63, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 73.36, 0.0, 48.87, 0.0, 0.0, 0.0, 98.99, 91.98, 0.0, 99.62, 0.0, 56.63, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 80.04], ["speech synthesizer", 6.6], ["music", 3.05]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.21, 0.76, 1.34, 0.82, 2.25, 1.33, 1.45, 1.66, 9.33, 1.12, 4.96, 0.5, -0.29, 0.26, 6.07, 3.08, 0.75, 2.11, 0.22, 3.18, 0.58, 1.22]} \ No newline at end of file diff --git a/annotations_1/kZRq9scxIWM_filtered.json b/annotations_1/kZRq9scxIWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..05d036e702ff0ebef5649fc0ae24f93b0528e920 --- /dev/null +++ b/annotations_1/kZRq9scxIWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 14.93], [32.0, 33.67], [40.0, 40.53], [41.0, 41.25], [44.0, 44.73], [45.0, 46.3], [57.0, 58.83], [74.0, 74.01], [108.0, 109.22], [110.0, 110.76], [113.0, 113.0], [124.0, 124.83], [128.0, 128.75], [164.0, 164.61], [167.0, 167.51], [174.0, 175.71], [180.0, 182.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.07, 1.67, 0.53, 0.25, 0.73, 1.3, 1.83, 0.01, 1.22, 0.76, 0.0, 0.83, 0.75, 0.61, 0.51, 1.71, 2.75]} \ No newline at end of file diff --git a/annotations_1/kZcr7bw6k_k_filtered.json b/annotations_1/kZcr7bw6k_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d86a09dfa3c735603059b0f572082a2cb57a126d --- /dev/null +++ b/annotations_1/kZcr7bw6k_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.17], [19.0, 19.92], [21.0, 21.51], [22.0, 23.53], [25.0, 27.84], [30.0, 29.86], [34.0, 34.23], [36.0, 36.36], [41.0, 41.27], [42.0, 42.74], [44.0, 46.45], [48.0, 48.0], [49.0, 49.42], [54.0, 54.14], [57.0, 57.03], [61.0, 63.83], [66.0, 74.65], [75.0, 82.59], [87.0, 88.33], [89.0, 92.25], [100.0, 100.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 56.03, 88.46, 87.37, 0.0, 94.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.17, 0.92, 0.51, 1.53, 2.84, -0.14, 0.23, 0.36, 0.27, 0.74, 2.45, 0.0, 0.42, 0.14, 0.03, 2.83, 8.65, 7.59, 1.33, 3.25, 0.5]} \ No newline at end of file diff --git a/annotations_1/kZg0_oypRpU_filtered.json b/annotations_1/kZg0_oypRpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddaefe35dcd25b67c13ca117f2c1e54464331273 --- /dev/null +++ b/annotations_1/kZg0_oypRpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.09], [7.0, 6.88], [9.0, 8.85], [13.0, 13.68], [20.0, 20.7], [21.0, 22.27], [24.0, 23.79], [26.0, 27.35], [32.0, 31.85], [32.0, 35.23], [38.0, 39.07], [41.0, 41.18], [42.0, 42.36], [46.0, 46.74], [50.0, 50.33], [53.0, 53.86], [54.0, 54.53], [55.0, 54.92], [58.0, 58.08], [59.0, 59.95], [61.0, 61.15], [62.0, 63.05], [71.0, 73.11], [74.0, 74.41], [76.0, 76.38], [77.0, 78.53], [80.0, 83.07], [87.0, 87.44], [88.0, 89.09], [94.0, 94.53], [98.0, 98.15], [99.0, 100.89], [102.0, 102.84], [104.0, 104.23], [108.0, 108.7], [114.0, 114.45], [117.0, 119.21], [121.0, 124.58], [129.0, 133.68], [142.0, 142.62], [147.0, 148.85], [151.0, 152.25], [152.0, 154.77], [159.0, 161.01], [167.0, 168.99]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 0.0, 33.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 55.11, 40.48, 0.0, 0.0, 0.0, 97.33, 40.41, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hammer", 22.37], ["speech", 18.2], ["tuning fork", 9.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 50.76], ["music", 11.47], ["groan", 6.02]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.05], ["music", 9.66], ["noise", 7.97]], null, null, null, null, [["beatboxing", 37.12], ["speech", 26.11], ["music", 8.98]], null], "duration": [1.09, -0.12, -0.15, 0.68, 0.7, 1.27, -0.21, 1.35, -0.15, 3.23, 1.07, 0.18, 0.36, 0.74, 0.33, 0.86, 0.53, -0.08, 0.08, 0.95, 0.15, 1.05, 2.11, 0.41, 0.38, 1.53, 3.07, 0.44, 1.09, 0.53, 0.15, 1.89, 0.84, 0.23, 0.7, 0.45, 2.21, 3.58, 4.68, 0.62, 1.85, 1.25, 2.77, 2.01, 1.99]} \ No newline at end of file diff --git a/annotations_1/kZz5k_xsG0Q_filtered.json b/annotations_1/kZz5k_xsG0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ccaa95c94fd2439df6f852111ca5eb3efa94696c --- /dev/null +++ b/annotations_1/kZz5k_xsG0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.73], [6.0, 10.22], [11.0, 12.11], [14.0, 13.96], [14.0, 15.23], [16.0, 45.69], [48.0, 48.12], [50.0, 55.12], [57.0, 57.94], [60.0, 66.14], [67.0, 68.42], [69.0, 80.74], [86.0, 91.67], [96.0, 104.67], [105.0, 106.79], [107.0, 107.96], [111.0, 112.72], [113.0, 114.72], [120.0, 120.72], [125.0, 125.15], [125.0, 126.01], [127.0, 128.38], [129.0, 130.33], [132.0, 133.02]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.65, 0.0, 0.0, 0.0, 28.58, 0.0, 36.15, 0.0, 33.19, 0.0, 33.25, 29.23, 29.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 19.72], ["throbbing", 13.41], ["music", 11.04]], null, null, null, [["speech", 48.77], ["buzz", 13.77], ["music", 9.21]], null, [["speech", 38.03], ["hum", 12.02], ["music", 11.92]], null, [["speech", 74.58], ["hum", 5.05], ["mains hum", 4.42]], null, [["hum", 49.07], ["mains hum", 26.03], ["throbbing", 11.99]], [["music", 27.48], ["throbbing", 22.89], ["hum", 15.73]], [["music", 24.04], ["speech", 20.11], ["sidetone", 5.97]], null, null, null, null, null, null, null, null, null, null], "duration": [1.73, 4.22, 1.11, -0.04, 1.23, 29.69, 0.12, 5.12, 0.94, 6.14, 1.42, 11.74, 5.67, 8.67, 1.79, 0.96, 1.72, 1.72, 0.72, 0.15, 1.01, 1.38, 1.33, 1.02]} \ No newline at end of file diff --git a/annotations_1/k_pB_zV6kVw_filtered.json b/annotations_1/k_pB_zV6kVw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a580bec3bce1ac5ee14072781a4ff138cf2625ba --- /dev/null +++ b/annotations_1/k_pB_zV6kVw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.72], [5.0, 12.87], [15.0, 16.73], [20.0, 21.17], [22.0, 25.32], [28.0, 29.32], [31.0, 34.06], [37.0, 36.86], [39.0, 39.39], [42.0, 42.72], [44.0, 46.09], [48.0, 60.02], [64.0, 65.64], [69.0, 68.98], [72.0, 72.1], [73.0, 75.05], [77.0, 76.6], [79.0, 79.22], [82.0, 82.07], [84.0, 85.31], [87.0, 87.51], [89.0, 90.39], [92.0, 92.28], [94.0, 96.28], [98.0, 98.98], [100.0, 100.57], [102.0, 105.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 63.1, 0.0, 0.0, 62.27, 0.0, 78.38, 0.0, 0.0, 0.0, 86.27, 41.16, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 91.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 23.17], ["electric shaver, electric razor", 10.89], ["mosquito", 7.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.72, 7.87, 1.73, 1.17, 3.32, 1.32, 3.06, -0.14, 0.39, 0.72, 2.09, 12.02, 1.64, -0.02, 0.1, 2.05, -0.4, 0.22, 0.07, 1.31, 0.51, 1.39, 0.28, 2.28, 0.98, 0.57, 3.26]} \ No newline at end of file diff --git a/annotations_1/kaJbWpMZdwM_filtered.json b/annotations_1/kaJbWpMZdwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0547d1c2657e30c3d9298ef4a594b65e7c7fc1d --- /dev/null +++ b/annotations_1/kaJbWpMZdwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.21], [7.0, 7.2], [8.0, 9.85], [10.0, 16.5], [17.0, 63.44], [70.0, 83.84], [87.0, 123.28]], "keep_status": [true, false, false, true, false, false, false], "silence_prob": [47.43, 0.0, 0.0, 38.43, 0.0, 28.82, 0.0], "audiomae_on_audioset": [[["music", 13.27], ["hum", 13.02], ["mains hum", 9.72]], null, null, [["speech", 46.15], ["mains hum", 15.08], ["hum", 8.56]], null, [["speech", 52.71], ["music", 14.31], ["fireworks", 3.7]], null], "duration": [2.21, 0.2, 1.85, 6.5, 46.44, 13.84, 36.28]} \ No newline at end of file diff --git a/annotations_1/kbGvnI1qIz8_filtered.json b/annotations_1/kbGvnI1qIz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d85d315fb83c3a60a9bb5b3d57f41c6afce5d144 --- /dev/null +++ b/annotations_1/kbGvnI1qIz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.47], [3.0, 3.75], [6.0, 7.06], [8.0, 8.33], [11.0, 11.64], [13.0, 13.29], [16.0, 18.23], [19.0, 20.29], [22.0, 22.33], [25.0, 25.27], [27.0, 27.28], [32.0, 32.66], [35.0, 35.67], [37.0, 38.03], [40.0, 40.34], [45.0, 45.18], [46.0, 46.89], [48.0, 48.32], [51.0, 51.61], [63.0, 64.0], [64.0, 64.74], [66.0, 66.61], [69.0, 68.86], [71.0, 71.41], [74.0, 74.17], [75.0, 76.87], [79.0, 81.31], [84.0, 84.37], [91.0, 93.6], [95.0, 95.47], [96.0, 96.9], [99.0, 99.59], [102.0, 103.05], [105.0, 105.34], [106.0, 107.18], [108.0, 111.2], [112.0, 113.12], [114.0, 122.07], [123.0, 123.63], [125.0, 126.81], [129.0, 129.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 0.0, 44.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.85, 0.0, 74.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.63], ["radio", 12.8], ["noise", 5.35]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.75, 1.06, 0.33, 0.64, 0.29, 2.23, 1.29, 0.33, 0.27, 0.28, 0.66, 0.67, 1.03, 0.34, 0.18, 0.89, 0.32, 0.61, 1.0, 0.74, 0.61, -0.14, 0.41, 0.17, 1.87, 2.31, 0.37, 2.6, 0.47, 0.9, 0.59, 1.05, 0.34, 1.18, 3.2, 1.12, 8.07, 0.63, 1.81, 0.88]} \ No newline at end of file diff --git a/annotations_1/kbVtjc-ygTM_filtered.json b/annotations_1/kbVtjc-ygTM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e44bd2a883cf8a6a655992ca378ab4602696724a --- /dev/null +++ b/annotations_1/kbVtjc-ygTM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.13], [8.0, 7.65], [12.0, 12.36], [15.0, 15.79], [32.0, 32.95], [34.0, 36.09], [37.0, 38.01], [50.0, 51.17], [55.0, 58.58], [60.0, 60.18], [66.0, 66.65], [70.0, 70.83], [73.0, 72.57], [77.0, 77.99], [85.0, 85.21], [97.0, 98.41], [100.0, 101.29], [102.0, 102.02], [103.0, 104.18], [113.0, 113.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, -0.35, 0.36, 0.79, 0.95, 2.09, 1.01, 1.17, 3.58, 0.18, 0.65, 0.83, -0.43, 0.99, 0.21, 1.41, 1.29, 0.02, 1.18, 0.07]} \ No newline at end of file diff --git a/annotations_1/kbb1MUQmusU_filtered.json b/annotations_1/kbb1MUQmusU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbe21a1be9cba0714761614041403f610e5755f7 --- /dev/null +++ b/annotations_1/kbb1MUQmusU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.29], [21.0, 25.15], [28.0, 31.4], [34.0, 58.26], [59.0, 78.19], [81.0, 82.49], [83.0, 84.21], [88.0, 88.91], [92.0, 92.69], [96.0, 98.78], [100.0, 103.87], [104.0, 107.86], [109.0, 109.86], [112.0, 113.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [85.72, 66.15, 85.72, 73.51, 51.94, 0.0, 0.0, 0.0, 0.0, 72.16, 45.3, 41.6, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 50.74], ["musical instrument", 4.15], ["synthesizer", 4.01]], [["music", 30.29], ["speech", 21.79], ["theremin", 7.42]], null, null], "duration": [2.29, 4.15, 3.4, 24.26, 19.19, 1.49, 1.21, 0.91, 0.69, 2.78, 3.87, 3.86, 0.86, 1.78]} \ No newline at end of file diff --git a/annotations_1/kbpdM9ORaI8_filtered.json b/annotations_1/kbpdM9ORaI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..478be32f2a89df6ae48e30dd1d2a9da88116af9d --- /dev/null +++ b/annotations_1/kbpdM9ORaI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 23.67], [25.0, 45.87], [47.0, 60.96], [62.0, 75.93]], "keep_status": [false, true, true, false], "silence_prob": [33.5, 31.53, 31.9, 30.35], "audiomae_on_audioset": [[["music", 78.52], ["speech", 3.7], ["musical instrument", 2.03]], [["music", 34.62], ["whack, thwack", 9.97], ["mosquito", 8.9]], [["music", 64.99], ["musical instrument", 2.47], ["whack, thwack", 2.32]], [["music", 57.23], ["synthesizer", 7.47], ["electronic music", 5.48]]], "duration": [11.67, 20.87, 13.96, 13.93]} \ No newline at end of file diff --git a/annotations_1/kcrHhDoUS1k_filtered.json b/annotations_1/kcrHhDoUS1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce5ca57329adb24780167781bf584447628ff360 --- /dev/null +++ b/annotations_1/kcrHhDoUS1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.5], [17.0, 17.27], [19.0, 19.2], [24.0, 36.24], [37.0, 37.32], [39.0, 40.32], [46.0, 46.75], [50.0, 49.92], [52.0, 52.39], [64.0, 66.7], [70.0, 70.7], [75.0, 75.17], [76.0, 78.76], [82.0, 90.22], [94.0, 106.05], [106.0, 113.63], [116.0, 125.34], [127.0, 132.02], [138.0, 139.31], [140.0, 141.3], [143.0, 151.41], [152.0, 153.0], [153.0, 154.14], [160.0, 164.19], [165.0, 173.96]], "keep_status": [true, false, false, true, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false, true, false, false, true, false], "silence_prob": [35.4, 0.0, 0.0, 28.8, 0.0, 0.0, 0.0, 0.0, 0.0, 32.15, 0.0, 0.0, 41.81, 34.64, 32.4, 33.91, 30.98, 29.3, 0.0, 0.0, 29.89, 0.0, 0.0, 33.56, 29.76], "audiomae_on_audioset": [[["music", 54.57], ["hum", 4.46], ["musical instrument", 3.39]], null, null, [["music", 23.42], ["cattle, bovinae", 17.76], ["livestock, farm animals, working animals", 12.74]], null, null, null, null, null, [["music", 48.75], ["theremin", 12.44], ["hum", 5.71]], null, null, [["throbbing", 46.85], ["hum", 24.3], ["music", 17.93]], [["throbbing", 51.63], ["hum", 19.73], ["music", 17.62]], [["music", 31.84], ["whack, thwack", 12.06], ["hum", 8.24]], [["hum", 41.16], ["mains hum", 17.27], ["throbbing", 13.5]], [["hum", 38.41], ["throbbing", 24.23], ["mains hum", 22.77]], [["breaking", 13.54], ["whack, thwack", 8.52], ["music", 6.02]], null, null, [["music", 25.38], ["didgeridoo", 10.24], ["livestock, farm animals, working animals", 5.98]], null, null, [["music", 40.89], ["whale vocalization", 13.92], ["throbbing", 5.92]], [["speech", 54.21], ["music", 14.46], ["fly, housefly", 8.31]]], "duration": [9.5, 0.27, 0.2, 12.24, 0.32, 1.32, 0.75, -0.08, 0.39, 2.7, 0.7, 0.17, 2.76, 8.22, 12.05, 7.63, 9.34, 5.02, 1.31, 1.3, 8.41, 1.0, 1.14, 4.19, 8.96]} \ No newline at end of file diff --git a/annotations_1/kd01w5eLVwo_filtered.json b/annotations_1/kd01w5eLVwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..846b12ff166215eed7e5268d962b083229a71a3c --- /dev/null +++ b/annotations_1/kd01w5eLVwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 97.68], [98.0, 102.05], [103.0, 104.85], [106.0, 107.2], [108.0, 112.28], [113.0, 114.78], [115.0, 117.36], [118.0, 122.81], [123.0, 125.24], [126.0, 129.1], [130.0, 133.08], [134.0, 137.2], [138.0, 142.67], [144.0, 148.34], [149.0, 151.33], [152.0, 153.77], [155.0, 158.08], [159.0, 167.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.95, 0.0, 0.0, 99.26, 0.0, 78.21, 99.05, 98.73, 99.87, 97.33, 97.43, 95.64, 99.56, 99.88, 0.0, 99.92, 94.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [70.68, 4.05, 1.85, 1.2, 4.28, 1.78, 2.36, 4.81, 2.24, 3.1, 3.08, 3.2, 4.67, 4.34, 2.33, 1.77, 3.08, 8.0]} \ No newline at end of file diff --git a/annotations_1/kdbRwpxZHJY_filtered.json b/annotations_1/kdbRwpxZHJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e89f00d8346f5731ae19cc5053c5be8b4b97ff2 --- /dev/null +++ b/annotations_1/kdbRwpxZHJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.69], [17.0, 17.56], [31.0, 32.1], [44.0, 44.34], [73.0, 72.91]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.69, 0.56, 1.1, 0.34, -0.09]} \ No newline at end of file diff --git a/annotations_1/kdrPUm5zBqA_filtered.json b/annotations_1/kdrPUm5zBqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84852f4aeb7d3237cf26f75d9a551e8af3807a77 --- /dev/null +++ b/annotations_1/kdrPUm5zBqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.1], [11.0, 11.53], [18.0, 18.52], [49.0, 51.16], [54.0, 56.56], [62.0, 65.16], [68.0, 71.76], [75.0, 80.86], [81.0, 82.27], [89.0, 89.78], [92.0, 92.53], [93.0, 93.95], [106.0, 108.97], [113.0, 125.81], [134.0, 134.45], [137.0, 138.77], [139.0, 139.56], [146.0, 146.18], [150.0, 151.21], [151.0, 159.75]], "keep_status": [false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.92, 36.66, 39.82, 37.75, 35.77, 0.0, 0.0, 0.0, 0.0, 33.39, 34.63, 0.0, 0.0, 0.0, 0.0, 0.0, 36.18], "audiomae_on_audioset": [null, null, null, [["speech", 30.5], ["music", 22.85], ["didgeridoo", 7.93]], [["music", 60.27], ["electronic music", 5.68], ["grunt", 3.88]], [["music", 52.89], ["throbbing", 18.92], ["synthesizer", 6.98]], [["music", 47.14], ["speech", 10.46], ["didgeridoo", 8.91]], [["music", 58.9], ["throbbing", 12.44], ["speech", 8.63]], null, null, null, null, [["fart", 76.89], ["music", 16.16], ["fly, housefly", 0.78]], [["music", 82.33], ["electronic music", 1.7], ["synthesizer", 1.34]], null, null, null, null, null, [["music", 70.88], ["electronic music", 4.01], ["didgeridoo", 2.85]]], "duration": [1.1, 0.53, 0.52, 2.16, 2.56, 3.16, 3.76, 5.86, 1.27, 0.78, 0.53, 0.95, 2.97, 12.81, 0.45, 1.77, 0.56, 0.18, 1.21, 8.75]} \ No newline at end of file diff --git a/annotations_1/kevJJDQloNE_filtered.json b/annotations_1/kevJJDQloNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f972268705b2f9e15b2ba85254af46e3d59e3fae --- /dev/null +++ b/annotations_1/kevJJDQloNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 13.93], [20.0, 22.0], [25.0, 77.46], [82.0, 85.62]], "keep_status": [false, false, false, false], "silence_prob": [31.08, 30.34, 0.0, 30.44], "audiomae_on_audioset": [[["music", 80.83], ["disco", 3.47], ["synthesizer", 2.05]], [["music", 69.23], ["house music", 4.88], ["electronic music", 2.14]], null, [["music", 71.98], ["disco", 4.47], ["house music", 2.47]]], "duration": [12.93, 2.0, 52.46, 3.62]} \ No newline at end of file diff --git a/annotations_1/kfdeG-hRX7A_filtered.json b/annotations_1/kfdeG-hRX7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9ab5868578811130dd3e79a6f4a27b080c47759 --- /dev/null +++ b/annotations_1/kfdeG-hRX7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.02], [10.0, 10.83], [11.0, 11.79], [13.0, 14.45], [27.0, 26.69], [29.0, 29.29], [30.0, 30.5], [32.0, 32.97], [34.0, 37.0], [37.0, 39.02], [44.0, 46.47], [47.0, 47.63], [49.0, 49.1], [50.0, 50.45], [51.0, 54.92], [58.0, 58.26], [59.0, 60.79], [67.0, 69.9], [71.0, 72.15], [73.0, 89.94], [97.0, 106.03], [107.0, 108.94], [116.0, 117.8], [118.0, 119.1], [120.0, 120.39], [131.0, 139.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.84, 50.71, 83.7, 0.0, 0.0, 0.0, 34.86, 0.0, 0.0, 29.65, 0.0, 32.77, 32.29, 0.0, 0.0, 0.0, 0.0, 30.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 31.78], ["hum", 25.41], ["music", 13.98]], null, null, [["music", 52.86], ["speech", 14.29], ["synthesizer", 9.4]], null, [["music", 69.73], ["musical instrument", 6.68], ["effects unit", 5.37]], [["music", 81.91], ["boing", 2.44], ["rock and roll", 1.91]], null, null, null, null, [["hum", 36.83], ["throbbing", 31.31], ["music", 14.75]]], "duration": [0.02, 0.83, 0.79, 1.45, -0.31, 0.29, 0.5, 0.97, 3.0, 2.02, 2.47, 0.63, 0.1, 0.45, 3.92, 0.26, 1.79, 2.9, 1.15, 16.94, 9.03, 1.94, 1.8, 1.1, 0.39, 8.72]} \ No newline at end of file diff --git a/annotations_1/kg2o35acq4c_filtered.json b/annotations_1/kg2o35acq4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27772631567c93481d7f8b360dd9df3d2bb35e52 --- /dev/null +++ b/annotations_1/kg2o35acq4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.53], [11.0, 13.51], [15.0, 15.97], [18.0, 20.22], [21.0, 25.14], [30.0, 30.47], [36.0, 38.1], [40.0, 40.73], [42.0, 43.98], [45.0, 46.28], [51.0, 50.75], [53.0, 55.81], [58.0, 70.23], [71.0, 71.12], [73.0, 74.83], [78.0, 80.13], [83.0, 85.78], [88.0, 88.86], [89.0, 90.49], [92.0, 94.85], [98.0, 98.15], [103.0, 104.19], [106.0, 106.1], [110.0, 112.38], [114.0, 114.59], [115.0, 115.57], [119.0, 120.72], [122.0, 131.67], [140.0, 141.1], [141.0, 142.77], [150.0, 150.36], [151.0, 151.11], [153.0, 152.88], [155.0, 155.06], [158.0, 157.76], [160.0, 159.81], [160.0, 161.7], [163.0, 163.32], [164.0, 164.34], [165.0, 165.86], [167.0, 167.71], [174.0, 175.07], [176.0, 176.71], [177.0, 178.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 66.03, 0.0, 69.07, 47.98, 0.0, 78.21, 0.0, 0.0, 0.0, 0.0, 53.22, 68.02, 0.0, 0.0, 50.26, 57.97, 0.0, 0.0, 43.87, 0.0, 0.0, 0.0, 83.16, 0.0, 0.0, 0.0, 35.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 71.13], ["hum", 7.24], ["rumble", 2.97]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.56], ["music", 12.17], ["gong", 10.63]], null, null, null, null, null, null, null, [["whale vocalization", 43.73], ["noise", 16.35], ["animal", 4.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 2.51, 0.97, 2.22, 4.14, 0.47, 2.1, 0.73, 1.98, 1.28, -0.25, 2.81, 12.23, 0.12, 1.83, 2.13, 2.78, 0.86, 1.49, 2.85, 0.15, 1.19, 0.1, 2.38, 0.59, 0.57, 1.72, 9.67, 1.1, 1.77, 0.36, 0.11, -0.12, 0.06, -0.24, -0.19, 1.7, 0.32, 0.34, 0.86, 0.71, 1.07, 0.71, 1.55]} \ No newline at end of file diff --git a/annotations_1/kg3erAXOz34_filtered.json b/annotations_1/kg3erAXOz34_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9c663706f98f58d0ccb5d7592b430166716d8a6 --- /dev/null +++ b/annotations_1/kg3erAXOz34_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.23], [14.0, 14.49], [19.0, 19.6], [32.0, 33.66], [41.0, 40.76], [41.0, 44.09], [49.0, 51.34], [61.0, 61.35], [63.0, 63.73], [64.0, 64.03], [67.0, 67.88], [72.0, 72.77], [74.0, 74.39], [74.0, 74.87], [78.0, 79.3], [88.0, 96.92], [103.0, 103.6], [106.0, 106.59], [108.0, 108.3], [109.0, 110.57], [113.0, 113.27], [114.0, 115.52], [117.0, 118.2], [124.0, 124.16], [126.0, 127.75], [139.0, 139.43], [140.0, 142.87], [149.0, 149.12], [151.0, 150.79], [152.0, 152.93], [155.0, 155.24], [157.0, 158.04], [159.0, 160.51], [161.0, 164.66], [165.0, 168.05]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.12, 29.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.87, 32.94], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 31.99], ["music", 26.49], ["hum", 6.42]], [["music", 33.41], ["speech", 12.31], ["cattle, bovinae", 10.94]], null, null, null, null, null, null, null, null, [["boing", 66.74], ["music", 26.36], ["speech", 4.43]], null, null, null, null, null, null, null, null, null, null, [["music", 41.2], ["speech", 33.44], ["boing", 16.41]], null, null, null, null, null, null, [["music", 23.53], ["bleat", 20.84], ["sheep", 17.24]], [["speech", 58.24], ["electric shaver, electric razor", 18.36], ["music", 4.6]]], "duration": [0.23, 0.49, 0.6, 1.66, -0.24, 3.09, 2.34, 0.35, 0.73, 0.03, 0.88, 0.77, 0.39, 0.87, 1.3, 8.92, 0.6, 0.59, 0.3, 1.57, 0.27, 1.52, 1.2, 0.16, 1.75, 0.43, 2.87, 0.12, -0.21, 0.93, 0.24, 1.04, 1.51, 3.66, 3.05]} \ No newline at end of file diff --git a/annotations_1/kgwjR-pQ29o_filtered.json b/annotations_1/kgwjR-pQ29o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..532c89c29beeeba1707ba53f923e58ce1fb3ee40 --- /dev/null +++ b/annotations_1/kgwjR-pQ29o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.5], [8.0, 8.92], [10.0, 10.81], [15.0, 29.35], [34.0, 37.32], [43.0, 43.23], [46.0, 45.98], [57.0, 57.96], [66.0, 66.72], [67.0, 69.84], [82.0, 82.31], [85.0, 85.83], [87.0, 90.81], [94.0, 97.01], [145.0, 146.31], [149.0, 150.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.31, 31.1, 0.0, 0.0, 0.0, 0.0, 31.73, 0.0, 0.0, 28.89, 31.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 47.27], ["music", 26.29], ["vehicle", 4.47]], [["music", 78.07], ["synthesizer", 4.43], ["musical instrument", 3.96]], null, null, null, null, [["speech", 53.53], ["boing", 30.73], ["fart", 2.19]], null, null, [["speech", 53.38], ["vehicle", 15.2], ["car", 5.69]], [["fly, housefly", 19.55], ["hum", 12.25], ["insect", 4.87]], null, null], "duration": [0.5, 0.92, 0.81, 14.35, 3.32, 0.23, -0.02, 0.96, 0.72, 2.84, 0.31, 0.83, 3.81, 3.01, 1.31, 1.16]} \ No newline at end of file diff --git a/annotations_1/khX9fjqlf40_filtered.json b/annotations_1/khX9fjqlf40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e1d1f37640d20e611971ffab2f20a101f9662dc --- /dev/null +++ b/annotations_1/khX9fjqlf40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [5.0, 6.3], [8.0, 8.41], [14.0, 17.93], [21.0, 22.74], [25.0, 26.72], [29.0, 29.69], [32.0, 32.86], [35.0, 40.46], [41.0, 43.31], [44.0, 46.99], [48.0, 51.41], [52.0, 53.1], [55.0, 57.75], [60.0, 62.83], [65.0, 66.99], [68.0, 69.35], [72.0, 76.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 41.3, 0.0, 0.0, 0.0, 0.0, 74.76, 60.23, 72.16, 67.63, 0.0, 71.29, 44.96, 0.0, 0.0, 40.24], "audiomae_on_audioset": [null, null, null, [["speech", 49.47], ["hum", 15.12], ["mains hum", 6.71]], null, null, null, null, null, null, null, null, null, null, [["speech", 39.22], ["hum", 15.79], ["whale vocalization", 7.46]], null, null, [["whale vocalization", 90.38], ["hum", 4.57], ["mains hum", 1.25]]], "duration": [0.33, 1.3, 0.41, 3.93, 1.74, 1.72, 0.69, 0.86, 5.46, 2.31, 2.99, 3.41, 1.1, 2.75, 2.83, 1.99, 1.35, 4.87]} \ No newline at end of file diff --git a/annotations_1/kheP3iy8-6E_filtered.json b/annotations_1/kheP3iy8-6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5650aab3292e0c99d50674ac17c1124336355ca6 --- /dev/null +++ b/annotations_1/kheP3iy8-6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.24], [10.0, 10.15], [11.0, 11.85], [13.0, 14.22], [15.0, 15.11], [19.0, 20.01], [20.0, 21.9], [24.0, 24.11], [25.0, 25.71], [27.0, 28.0], [30.0, 30.62], [33.0, 33.22], [34.0, 34.65], [45.0, 44.73], [46.0, 47.34], [52.0, 53.18], [55.0, 55.86], [61.0, 61.16], [63.0, 63.41], [64.0, 67.09], [67.0, 69.28], [70.0, 71.56], [73.0, 73.53], [77.0, 83.96], [88.0, 97.7], [99.0, 99.33], [101.0, 104.43], [108.0, 108.14], [119.0, 119.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 62.89, 0.0, 0.0, 61.57, 38.74, 0.0, 56.1, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.92], ["brass instrument", 10.79], ["trombone", 8.27]], null, null, null, null], "duration": [5.24, 0.15, 0.85, 1.22, 0.11, 1.01, 1.9, 0.11, 0.71, 1.0, 0.62, 0.22, 0.65, -0.27, 1.34, 1.18, 0.86, 0.16, 0.41, 3.09, 2.28, 1.56, 0.53, 6.96, 9.7, 0.33, 3.43, 0.14, 0.28]} \ No newline at end of file diff --git a/annotations_1/ki3zzZ-GsGI_filtered.json b/annotations_1/ki3zzZ-GsGI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e50730b605d427a9d81f5e17b37cff458c57528 --- /dev/null +++ b/annotations_1/ki3zzZ-GsGI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 19.92], [21.0, 26.84], [28.0, 62.01], [63.0, 65.64], [67.0, 67.95], [69.0, 72.67], [75.0, 78.66], [82.0, 83.17], [84.0, 85.72], [91.0, 102.52], [104.0, 105.49], [107.0, 107.6], [110.0, 118.72], [122.0, 156.78], [158.0, 158.62], [159.0, 160.1]], "keep_status": [true, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.11, 65.44, 0.0, 30.5, 0.0, 30.22, 30.46, 0.0, 0.0, 29.92, 0.0, 0.0, 30.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["applause", 22.77], ["crowd", 19.05], ["speech", 9.91]], null, null, [["music", 55.48], ["trombone", 5.73], ["musical instrument", 4.7]], null, [["music", 43.87], ["reggae", 9.09], ["swing music", 6.45]], [["music", 64.27], ["saxophone", 7.33], ["swing music", 6.93]], null, null, [["music", 72.08], ["musical instrument", 3.54], ["harmonica", 2.06]], null, null, [["music", 79.78], ["brass instrument", 2.34], ["reggae", 1.87]], null, null, null], "duration": [15.92, 5.84, 34.01, 2.64, 0.95, 3.67, 3.66, 1.17, 1.72, 11.52, 1.49, 0.6, 8.72, 34.78, 0.62, 1.1]} \ No newline at end of file diff --git a/annotations_1/kjLqB63ihJE_filtered.json b/annotations_1/kjLqB63ihJE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4265bf6d62e1003bd7da59e2874be61ce129dfa1 --- /dev/null +++ b/annotations_1/kjLqB63ihJE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 24.68], [26.0, 49.84], [52.0, 53.94], [55.0, 58.5], [60.0, 64.61], [66.0, 74.92], [79.0, 82.68], [91.0, 93.06], [95.0, 97.43], [99.0, 102.81], [110.0, 111.38], [113.0, 114.54], [115.0, 118.69]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [32.75, 37.49, 0.0, 46.94, 53.4, 30.47, 30.39, 33.57, 49.0, 41.24, 0.0, 0.0, 32.85], "audiomae_on_audioset": [[["hum", 41.08], ["throbbing", 25.91], ["music", 8.3]], [["music", 36.57], ["hum", 29.31], ["throbbing", 22.82]], null, [["music", 50.97], ["speech", 16.83], ["throbbing", 5.76]], null, [["music", 18.86], ["speech", 17.63], ["throbbing", 16.42]], [["music", 68.08], ["musical instrument", 3.63], ["throbbing", 3.15]], [["music", 54.6], ["speech", 26.21], ["throbbing", 5.39]], [["music", 62.31], ["quack", 7.12], ["fart", 3.04]], [["music", 40.83], ["throbbing", 17.62], ["hum", 9.39]], null, null, [["music", 57.33], ["speech", 10.61], ["throbbing", 7.92]]], "duration": [13.68, 23.84, 1.94, 3.5, 4.61, 8.92, 3.68, 2.06, 2.43, 3.81, 1.38, 1.54, 3.69]} \ No newline at end of file diff --git a/annotations_1/kjtPUnPa0LQ_filtered.json b/annotations_1/kjtPUnPa0LQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2457c0166b620f8d99b4ea11da8df9b287890557 --- /dev/null +++ b/annotations_1/kjtPUnPa0LQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[85.0, 135.7], [138.0, 147.65], [148.0, 150.36], [151.0, 150.63], [151.0, 153.06]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 34.68, 46.26, 0.0, 84.07], "audiomae_on_audioset": [null, [["music", 30.61], ["hum", 16.86], ["explosion", 9.22]], [["fly, housefly", 36.72], ["insect", 33.35], ["bee, wasp, etc.", 9.07]], null, null], "duration": [50.7, 9.65, 2.36, -0.37, 2.06]} \ No newline at end of file diff --git a/annotations_1/klnVwzouc_k_filtered.json b/annotations_1/klnVwzouc_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..598539a48ebd4f2a72de72c4c54f38daab95c305 --- /dev/null +++ b/annotations_1/klnVwzouc_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.51], [10.0, 11.33], [15.0, 20.63], [22.0, 25.27], [26.0, 27.73], [31.0, 42.11], [43.0, 50.77], [55.0, 56.1], [58.0, 59.16], [60.0, 62.4], [65.0, 64.99], [70.0, 70.77], [72.0, 72.22], [74.0, 75.93], [87.0, 87.39], [97.0, 96.85], [100.0, 100.33], [107.0, 108.08], [116.0, 116.61], [122.0, 123.04], [128.0, 129.09], [138.0, 138.92], [144.0, 144.64], [150.0, 150.3], [152.0, 153.32]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.59, 0.0, 96.42, 44.55, 0.0, 99.36, 43.53, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 33.64], ["thunk", 5.58], ["cello", 5.47]], null, null, [["music", 19.42], ["hum", 16.76], ["mains hum", 15.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.51, 1.33, 5.63, 3.27, 1.73, 11.11, 7.77, 1.1, 1.16, 2.4, -0.01, 0.77, 0.22, 1.93, 0.39, -0.15, 0.33, 1.08, 0.61, 1.04, 1.09, 0.92, 0.64, 0.3, 1.32]} \ No newline at end of file diff --git a/annotations_1/klpN-W3Z8Cw_filtered.json b/annotations_1/klpN-W3Z8Cw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72db48ed7064c22f99dfd8192fbe8b7ded122c78 --- /dev/null +++ b/annotations_1/klpN-W3Z8Cw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 37.91], [40.0, 45.15], [46.0, 59.56], [60.0, 81.24], [84.0, 96.33], [97.0, 97.71], [98.0, 99.94], [100.0, 117.19], [118.0, 119.25], [120.0, 123.72]], "keep_status": [true, false, true, true, true, false, false, true, false, false], "silence_prob": [31.34, 31.91, 31.19, 31.2, 30.84, 0.0, 0.0, 31.91, 0.0, 33.83], "audiomae_on_audioset": [[["music", 53.57], ["cacophony", 7.97], ["throbbing", 7.2]], [["music", 35.98], ["speech", 30.12], ["mains hum", 8.88]], [["cacophony", 33.08], ["music", 23.9], ["throbbing", 6.69]], [["music", 30.39], ["speech", 22.68], ["machine gun", 10.96]], [["music", 36.14], ["machine gun", 20.2], ["cacophony", 9.56]], null, null, [["music", 35.53], ["speech", 12.28], ["hum", 7.37]], null, [["music", 40.5], ["throbbing", 16.05], ["pulse", 14.44]]], "duration": [17.91, 5.15, 13.56, 21.24, 12.33, 0.71, 1.94, 17.19, 1.25, 3.72]} \ No newline at end of file diff --git a/annotations_1/klt86blKwaA_filtered.json b/annotations_1/klt86blKwaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65a679ddab6ec10813b431ab3550573251d9ffcc --- /dev/null +++ b/annotations_1/klt86blKwaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.88], [12.0, 17.49], [19.0, 19.52], [28.0, 29.74], [31.0, 31.8], [37.0, 37.27], [43.0, 44.93], [48.0, 48.05], [49.0, 49.81], [58.0, 69.2], [77.0, 77.23], [78.0, 78.39], [79.0, 79.12], [82.0, 82.7], [85.0, 84.91], [86.0, 86.71], [88.0, 89.07], [91.0, 91.98], [93.0, 92.94], [94.0, 96.13], [97.0, 98.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.71, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.12, 5.49, 0.52, 1.74, 0.8, 0.27, 1.93, 0.05, 0.81, 11.2, 0.23, 0.39, 0.12, 0.7, -0.09, 0.71, 1.07, 0.98, -0.06, 2.13, 1.36]} \ No newline at end of file diff --git a/annotations_1/kn5Sc8o9YTM_filtered.json b/annotations_1/kn5Sc8o9YTM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d93969d00524eae5c281d63c01aea389d645970 --- /dev/null +++ b/annotations_1/kn5Sc8o9YTM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [3.0, 8.01], [10.0, 11.65], [12.0, 13.19], [15.0, 15.45], [19.0, 19.95], [20.0, 21.68], [27.0, 31.13], [32.0, 33.67], [40.0, 40.53], [49.0, 50.53], [58.0, 62.04], [63.0, 64.07], [64.0, 64.77], [66.0, 66.83], [68.0, 69.28], [70.0, 71.51], [73.0, 73.38], [74.0, 74.38], [75.0, 75.88], [78.0, 78.8], [81.0, 81.84], [83.0, 84.25], [90.0, 91.18], [92.0, 92.37], [94.0, 94.76], [95.0, 96.58], [99.0, 100.28], [103.0, 105.21], [107.0, 108.67], [112.0, 112.77], [129.0, 129.91], [137.0, 138.94]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.7, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 0.0, 0.0, 0.0, 46.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.56, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 33.76], ["music", 19.3], ["hum", 7.77]], null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 27.17], ["cattle, bovinae", 23.86], ["moo", 18.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["moo", 34.07], ["cattle, bovinae", 31.59], ["music", 11.23]], null, null, null, null], "duration": [0.66, 5.01, 1.65, 1.19, 0.45, 0.95, 1.68, 4.13, 1.67, 0.53, 1.53, 4.04, 1.07, 0.77, 0.83, 1.28, 1.51, 0.38, 0.38, 0.88, 0.8, 0.84, 1.25, 1.18, 0.37, 0.76, 1.58, 1.28, 2.21, 1.67, 0.77, 0.91, 1.94]} \ No newline at end of file diff --git a/annotations_1/kn8k_ox5OXs_filtered.json b/annotations_1/kn8k_ox5OXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b400ac6ef875deef23b694b3ae5eceaf3e96a17 --- /dev/null +++ b/annotations_1/kn8k_ox5OXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.66], [18.0, 32.29], [36.0, 38.3], [40.0, 50.01], [51.0, 52.35], [53.0, 52.84], [53.0, 53.0], [53.0, 55.34], [56.0, 56.88], [63.0, 64.47], [67.0, 78.58], [81.0, 97.46], [101.0, 107.06], [108.0, 111.91], [115.0, 115.1], [117.0, 117.09], [121.0, 121.54], [123.0, 123.94], [125.0, 132.22], [134.0, 149.37], [151.0, 163.14]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [41.18, 36.01, 35.59, 36.17, 0.0, 0.0, 0.0, 38.4, 0.0, 0.0, 33.29, 32.09, 32.92, 56.55, 0.0, 0.0, 0.0, 0.0, 39.99, 32.92, 31.6], "audiomae_on_audioset": [[["music", 64.74], ["didgeridoo", 11.36], ["musical instrument", 8.03]], [["music", 40.31], ["hum", 14.26], ["mains hum", 6.46]], [["music", 34.92], ["hum", 22.39], ["throbbing", 7.14]], [["music", 62.4], ["theremin", 12.16], ["hum", 5.94]], null, null, null, [["music", 64.49], ["speech", 6.45], ["musical instrument", 3.79]], null, null, [["music", 69.68], ["theremin", 5.64], ["electronic music", 5.23]], [["throbbing", 39.31], ["hum", 27.91], ["music", 20.49]], [["music", 53.25], ["throbbing", 6.82], ["ambient music", 5.98]], null, null, null, null, null, [["mains hum", 36.62], ["hum", 19.6], ["music", 16.37]], [["music", 29.16], ["hum", 21.48], ["speech", 11.74]], [["music", 66.89], ["cello", 3.61], ["bowed string instrument", 2.59]]], "duration": [6.66, 14.29, 2.3, 10.01, 1.35, -0.16, 0.0, 2.34, 0.88, 1.47, 11.58, 16.46, 6.06, 3.91, 0.1, 0.09, 0.54, 0.94, 7.22, 15.37, 12.14]} \ No newline at end of file diff --git a/annotations_1/knJ438gN25k_filtered.json b/annotations_1/knJ438gN25k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4ceb7a680ac45ba5815ddf4064351c7aecf2eed --- /dev/null +++ b/annotations_1/knJ438gN25k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.01], [14.0, 14.27], [20.0, 20.34], [24.0, 24.6], [25.0, 25.68], [28.0, 38.16], [39.0, 39.36], [42.0, 69.84], [71.0, 77.82], [80.0, 80.08], [80.0, 80.67]], "keep_status": [false, false, false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 38.54, 0.0, 41.85, 46.61, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 21.3], ["hum", 20.85], ["mains hum", 9.88]], null, [["music", 49.83], ["flute", 6.59], ["wind instrument, woodwind instrument", 4.73]], [["music", 53.13], ["musical instrument", 3.75], ["theremin", 3.18]], null, null], "duration": [1.01, 0.27, 0.34, 0.6, 0.68, 10.16, 0.36, 27.84, 6.82, 0.08, 0.67]} \ No newline at end of file diff --git a/annotations_1/kndeWhsNlJs_filtered.json b/annotations_1/kndeWhsNlJs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c88eb13346cbccce33abba2f3db98c2a72ce13c --- /dev/null +++ b/annotations_1/kndeWhsNlJs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 26.27], [27.0, 34.91], [35.0, 37.89], [39.0, 46.13], [47.0, 47.66], [49.0, 54.68], [56.0, 83.25], [84.0, 93.07], [93.0, 106.81]], "keep_status": [true, true, true, false, false, false, false, false, true], "silence_prob": [31.14, 32.42, 31.4, 39.33, 0.0, 30.99, 30.93, 60.89, 29.56], "audiomae_on_audioset": [[["music", 26.4], ["mains hum", 22.18], ["hum", 19.79]], [["didgeridoo", 30.29], ["music", 24.04], ["musical instrument", 6.59]], [["speech", 34.12], ["music", 16.65], ["didgeridoo", 10.41]], [["music", 55.93], ["didgeridoo", 11.42], ["musical instrument", 4.93]], null, [["music", 83.61], ["musical instrument", 4.02], ["guitar", 2.8]], [["music", 60.2], ["didgeridoo", 12.35], ["musical instrument", 6.52]], null, [["music", 28.39], ["mains hum", 17.26], ["hum", 8.75]]], "duration": [19.27, 7.91, 2.89, 7.13, 0.66, 5.68, 27.25, 9.07, 13.81]} \ No newline at end of file diff --git a/annotations_1/koWhZSL1Kwo_filtered.json b/annotations_1/koWhZSL1Kwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae006cd0ff6c35added2ce2cb61c71bdc0ad782e --- /dev/null +++ b/annotations_1/koWhZSL1Kwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.1], [10.0, 10.05], [33.0, 33.03], [35.0, 35.88], [37.0, 37.39], [40.0, 40.17], [42.0, 42.31], [59.0, 62.16], [68.0, 70.85], [71.0, 71.32], [72.0, 72.17], [72.0, 73.43], [75.0, 75.24], [76.0, 76.38], [81.0, 81.14], [83.0, 89.23], [93.0, 96.43], [97.0, 101.6], [102.0, 104.87], [105.0, 116.04], [118.0, 118.18], [122.0, 123.08], [129.0, 129.41], [134.0, 134.15]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.44, 40.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.52, 80.11, 57.81, 69.88, 37.22, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 18.35], ["roaring cats (lions, tigers)", 15.65], ["whale vocalization", 14.59]], null, null, null, null, null, null, [["music", 42.52], ["theremin", 12.47], ["animal", 6.37]], null, null, null, [["grunt", 20.22], ["music", 7.77], ["sound effect", 7.22]], null, null, null, null], "duration": [4.1, 0.05, 0.03, 0.88, 0.39, 0.17, 0.31, 3.16, 2.85, 0.32, 0.17, 1.43, 0.24, 0.38, 0.14, 6.23, 3.43, 4.6, 2.87, 11.04, 0.18, 1.08, 0.41, 0.15]} \ No newline at end of file diff --git a/annotations_1/koZie6TLz3s_filtered.json b/annotations_1/koZie6TLz3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ee5d533b4d40b00d279dbdbc66fccdb77c3f4f1 --- /dev/null +++ b/annotations_1/koZie6TLz3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.21], [13.0, 12.93], [16.0, 16.06], [17.0, 17.17], [17.0, 17.78], [20.0, 20.71], [22.0, 22.05], [22.0, 22.72], [25.0, 25.34], [25.0, 25.46], [26.0, 26.49], [27.0, 28.16], [30.0, 31.78], [33.0, 34.77], [39.0, 39.26], [46.0, 45.66], [47.0, 48.69], [50.0, 52.0], [54.0, 54.06], [80.0, 81.63], [90.0, 90.07], [125.0, 125.78], [143.0, 143.78], [145.0, 146.31], [147.0, 153.96], [155.0, 156.61], [157.0, 157.71], [167.0, 168.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.21, -0.07, 0.06, 0.17, 0.78, 0.71, 0.05, 0.72, 0.34, 0.46, 0.49, 1.16, 1.78, 1.77, 0.26, -0.34, 1.69, 2.0, 0.06, 1.63, 0.07, 0.78, 0.78, 1.31, 6.96, 1.61, 0.71, 1.62]} \ No newline at end of file diff --git a/annotations_1/kokQDLJ1104_filtered.json b/annotations_1/kokQDLJ1104_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/kokQDLJ1104_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/kpFSJhQ_30c_filtered.json b/annotations_1/kpFSJhQ_30c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fdfe69110d837a068441ffcf16421a2af9ec6eb --- /dev/null +++ b/annotations_1/kpFSJhQ_30c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.08], [17.0, 22.17], [24.0, 24.49], [27.0, 27.87], [31.0, 31.87], [33.0, 95.32], [95.0, 95.4], [95.0, 96.31], [97.0, 116.09], [126.0, 127.31], [131.0, 131.58], [142.0, 142.69]], "keep_status": [true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [32.84, 31.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 33.9], ["music", 17.61], ["vehicle", 7.63]], [["cattle, bovinae", 44.25], ["livestock, farm animals, working animals", 29.92], ["moo", 22.94]], null, null, null, null, null, null, [["speech", 34.55], ["vehicle", 22.33], ["motorcycle", 6.8]], null, null, null], "duration": [5.08, 5.17, 0.49, 0.87, 0.87, 62.32, 0.4, 1.31, 19.09, 1.31, 0.58, 0.69]} \ No newline at end of file diff --git a/annotations_1/kpYZ4G1AQ0c_filtered.json b/annotations_1/kpYZ4G1AQ0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7531ddad88061528d66d31e69a7fd91c8be2bd5d --- /dev/null +++ b/annotations_1/kpYZ4G1AQ0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.51], [21.0, 22.6], [24.0, 26.92], [31.0, 37.03], [37.0, 38.15], [39.0, 49.49], [54.0, 54.68], [55.0, 66.99], [68.0, 76.44], [79.0, 80.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 71.43, 57.09, 0.0, 61.67, 0.0, 58.05, 60.32, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 1.6, 2.92, 6.03, 1.15, 10.49, 0.68, 11.99, 8.44, 1.28]} \ No newline at end of file diff --git a/annotations_1/kqBMHRX-c-4_filtered.json b/annotations_1/kqBMHRX-c-4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2ace522b73e148434aff52778646d545e5cc768 --- /dev/null +++ b/annotations_1/kqBMHRX-c-4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.28], [9.0, 9.44], [11.0, 11.25], [14.0, 15.9], [18.0, 18.52], [20.0, 20.14], [28.0, 29.73], [35.0, 35.36], [40.0, 40.41], [45.0, 45.2], [50.0, 50.5], [53.0, 53.47], [59.0, 60.3], [61.0, 62.14], [67.0, 67.2], [74.0, 75.02], [78.0, 79.02], [84.0, 85.08], [88.0, 88.26], [92.0, 92.11], [94.0, 94.36], [101.0, 101.85], [103.0, 104.04], [107.0, 107.57], [133.0, 133.42], [136.0, 137.32], [143.0, 143.94], [149.0, 149.3], [151.0, 151.6], [160.0, 160.54], [162.0, 162.51], [165.0, 166.06], [172.0, 173.58], [175.0, 179.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 0.44, 0.25, 1.9, 0.52, 0.14, 1.73, 0.36, 0.41, 0.2, 0.5, 0.47, 1.3, 1.14, 0.2, 1.02, 1.02, 1.08, 0.26, 0.11, 0.36, 0.85, 1.04, 0.57, 0.42, 1.32, 0.94, 0.3, 0.6, 0.54, 0.51, 1.06, 1.58, 4.37]} \ No newline at end of file diff --git a/annotations_1/kqFgnN10khg_filtered.json b/annotations_1/kqFgnN10khg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..665bb053537e1646bbbdd9b067c06c1d5dc89794 --- /dev/null +++ b/annotations_1/kqFgnN10khg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.81], [11.0, 24.63], [26.0, 79.44], [84.0, 84.5], [87.0, 87.52], [88.0, 100.45], [101.0, 102.41], [110.0, 112.77], [114.0, 121.1], [121.0, 121.24], [124.0, 123.92], [125.0, 128.09], [129.0, 160.61], [164.0, 164.84], [168.0, 179.51], [181.0, 183.3], [184.0, 185.26], [186.0, 187.66], [189.0, 189.9], [192.0, 193.5]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [37.51, 31.01, 0.0, 0.0, 0.0, 34.81, 0.0, 45.62, 34.95, 0.0, 0.0, 42.42, 0.0, 0.0, 61.08, 57.48, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 34.31], ["music", 26.49], ["hum", 22.85]], [["music", 53.59], ["hum", 14.66], ["throbbing", 11.3]], null, null, null, [["speech", 26.84], ["music", 15.76], ["thunk", 11.35]], null, [["speech", 27.59], ["music", 18.96], ["hum", 4.95]], [["speech", 54.5], ["single-lens reflex camera", 11.74], ["music", 9.97]], null, null, [["speech", 31.56], ["music", 19.38], ["sheep", 6.21]], null, null, null, null, null, null, null, null], "duration": [4.81, 13.63, 53.44, 0.5, 0.52, 12.45, 1.41, 2.77, 7.1, 0.24, -0.08, 3.09, 31.61, 0.84, 11.51, 2.3, 1.26, 1.66, 0.9, 1.5]} \ No newline at end of file diff --git a/annotations_1/kr2k20G3hCc_filtered.json b/annotations_1/kr2k20G3hCc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c4a84c59421e6c4fc02fb3f8d0d320b0d330c2f --- /dev/null +++ b/annotations_1/kr2k20G3hCc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [2.0, 2.83], [4.0, 4.97], [9.0, 12.02], [13.0, 14.25], [14.0, 15.5], [17.0, 20.83], [22.0, 23.9], [26.0, 26.89], [34.0, 35.31], [41.0, 41.35], [43.0, 43.73], [45.0, 45.42], [51.0, 51.33], [62.0, 62.18], [63.0, 68.74], [69.0, 72.39], [74.0, 74.21], [77.0, 78.58], [79.0, 85.6], [92.0, 93.34], [98.0, 99.49], [104.0, 113.1], [113.0, 115.99], [120.0, 121.24], [122.0, 129.27], [131.0, 133.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 74.44, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.03, 46.54, 0.0, 0.0, 34.42, 0.0, 0.0, 30.2, 32.91, 0.0, 30.83, 68.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.66], ["speech", 24.71], ["hum", 4.76]], null, null, [["speech", 46.35], ["hum", 15.73], ["music", 7.43]], null, null, [["speech", 43.19], ["music", 11.93], ["fart", 4.85]], [["speech", 20.05], ["music", 13.17], ["cattle, bovinae", 11.78]], null, [["music", 15.83], ["rumble", 12.41], ["siren", 5.68]], null], "duration": [0.49, 0.83, 0.97, 3.02, 1.25, 1.5, 3.83, 1.9, 0.89, 1.31, 0.35, 0.73, 0.42, 0.33, 0.18, 5.74, 3.39, 0.21, 1.58, 6.6, 1.34, 1.49, 9.1, 2.99, 1.24, 7.27, 2.89]} \ No newline at end of file diff --git a/annotations_1/kswPGoPPdwE_filtered.json b/annotations_1/kswPGoPPdwE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4df6baa2d2db30ce9a73cdc8f138801c2cc3bbaf --- /dev/null +++ b/annotations_1/kswPGoPPdwE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.92], [6.0, 8.5], [9.0, 14.82], [16.0, 17.09], [18.0, 19.2], [20.0, 20.63], [23.0, 23.4], [25.0, 25.83], [31.0, 35.11], [37.0, 37.29], [39.0, 40.1], [41.0, 42.33], [44.0, 44.42], [48.0, 48.61], [52.0, 52.34], [59.0, 67.47], [70.0, 70.92], [73.0, 83.15], [88.0, 91.22], [92.0, 93.58], [95.0, 96.21], [97.0, 97.85], [99.0, 100.06], [101.0, 101.71], [103.0, 103.03], [104.0, 106.57], [108.0, 110.17], [112.0, 112.85], [114.0, 114.89], [119.0, 124.36], [127.0, 129.49], [130.0, 131.06], [131.0, 132.33], [137.0, 137.08]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 54.3, 62.47, 0.0, 0.0, 0.0, 0.0, 0.0, 48.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.53, 0.0, 54.23, 78.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61, 85.17, 0.0, 0.0, 50.76, 89.19, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 46.44], ["sidetone", 11.71], ["bee, wasp, etc.", 5.12]], null, null, null, null, null, null, [["mains hum", 48.07], ["hum", 42.88], ["speech", 3.77]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.92, 2.5, 5.82, 1.09, 1.2, 0.63, 0.4, 0.83, 4.11, 0.29, 1.1, 1.33, 0.42, 0.61, 0.34, 8.47, 0.92, 10.15, 3.22, 1.58, 1.21, 0.85, 1.06, 0.71, 0.03, 2.57, 2.17, 0.85, 0.89, 5.36, 2.49, 1.06, 1.33, 0.08]} \ No newline at end of file diff --git a/annotations_1/kt1aHAlXi4g_filtered.json b/annotations_1/kt1aHAlXi4g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aeb139386f3ba738b30a743a901886694ab5ebc1 --- /dev/null +++ b/annotations_1/kt1aHAlXi4g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [3.0, 3.27], [3.0, 12.26], [19.0, 30.33], [34.0, 35.04], [39.0, 53.38], [56.0, 56.29], [57.0, 57.79], [63.0, 67.22], [73.0, 77.97], [79.0, 79.15], [80.0, 86.53], [88.0, 89.99], [92.0, 98.15]], "keep_status": [false, false, true, true, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 35.65, 33.12, 0.0, 31.11, 0.0, 0.0, 36.66, 39.57, 0.0, 45.02, 0.0, 50.81], "audiomae_on_audioset": [null, null, [["hum", 26.37], ["whale vocalization", 15.65], ["music", 10.85]], [["music", 46.43], ["sidetone", 9.2], ["throbbing", 8.35]], null, [["cattle, bovinae", 49.94], ["moo", 26.0], ["livestock, farm animals, working animals", 19.67]], null, null, [["music", 31.23], ["speech", 28.74], ["hum", 4.2]], [["music", 40.02], ["speech", 23.75], ["hum", 6.4]], null, [["fly, housefly", 15.35], ["music", 14.95], ["bee, wasp, etc.", 13.07]], null, null], "duration": [1.08, 0.27, 9.26, 11.33, 1.04, 14.38, 0.29, 0.79, 4.22, 4.97, 0.15, 6.53, 1.99, 6.15]} \ No newline at end of file diff --git a/annotations_1/ktCIr_DMGOI_filtered.json b/annotations_1/ktCIr_DMGOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa51a9f89a51a5c324322b16bb23af96b2b2b339 --- /dev/null +++ b/annotations_1/ktCIr_DMGOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 33.39], [51.0, 51.53], [78.0, 78.8], [80.0, 86.85], [89.0, 90.69], [92.0, 103.57], [104.0, 103.71], [104.0, 104.95], [112.0, 113.49], [124.0, 125.17], [127.0, 127.21], [129.0, 129.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.22, 0.0, 30.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 49.89], ["applause", 20.43], ["music", 6.52]], null, [["explosion", 39.29], ["speech", 29.7], ["burst, pop", 10.21]], null, null, null, null, null, null], "duration": [0.39, 0.53, 0.8, 6.85, 1.69, 11.57, -0.29, 0.95, 1.49, 1.17, 0.21, 0.07]} \ No newline at end of file diff --git a/annotations_1/ktt64clTkj4_filtered.json b/annotations_1/ktt64clTkj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32aa6a13da30c85a0ac088ee74db1e5e9ec57262 --- /dev/null +++ b/annotations_1/ktt64clTkj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.69], [6.0, 6.49], [8.0, 9.56], [15.0, 15.31], [20.0, 21.71], [24.0, 24.38], [25.0, 25.89], [26.0, 27.35], [29.0, 29.61], [31.0, 32.97], [35.0, 35.83], [41.0, 41.22], [66.0, 65.96], [71.0, 70.88], [72.0, 73.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.69, 0.49, 1.56, 0.31, 1.71, 0.38, 0.89, 1.35, 0.61, 1.97, 0.83, 0.22, -0.04, -0.12, 1.03]} \ No newline at end of file diff --git a/annotations_1/kv-hhf-kPkw_filtered.json b/annotations_1/kv-hhf-kPkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e905753656de65f0b4fb2d341928942d2ce34f02 --- /dev/null +++ b/annotations_1/kv-hhf-kPkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.14], [18.0, 19.25], [22.0, 23.94], [27.0, 27.06], [29.0, 30.35], [40.0, 44.86], [50.0, 50.08], [56.0, 57.28], [58.0, 59.93], [64.0, 64.02], [71.0, 75.9], [79.0, 81.13], [90.0, 97.53], [98.0, 103.6], [105.0, 105.68], [108.0, 108.55], [110.0, 113.27], [116.0, 120.41], [121.0, 122.39], [125.0, 133.96], [135.0, 136.59], [137.0, 137.49], [141.0, 143.23], [144.0, 145.25], [146.0, 153.77], [155.0, 156.1], [157.0, 157.69], [159.0, 161.91]], "keep_status": [true, false, false, false, false, true, false, false, false, false, true, false, true, false, false, false, true, true, false, false, false, false, true, false, true, false, false, true], "silence_prob": [32.6, 0.0, 0.0, 0.0, 0.0, 30.49, 0.0, 0.0, 0.0, 0.0, 29.95, 29.74, 29.36, 29.47, 0.0, 0.0, 29.11, 28.95, 0.0, 31.01, 0.0, 0.0, 41.81, 0.0, 35.73, 0.0, 0.0, 34.97], "audiomae_on_audioset": [[["music", 43.76], ["musical instrument", 4.15], ["speech", 3.57]], null, null, null, null, [["music", 36.57], ["speech", 14.84], ["explosion", 7.8]], null, null, null, null, [["frog", 31.6], ["fly, housefly", 16.59], ["mosquito", 15.0]], [["speech", 67.41], ["music", 6.91], ["groan", 2.77]], [["buzz", 23.22], ["speech", 19.46], ["music", 6.82]], [["speech", 37.63], ["music", 27.16], ["sidetone", 14.31]], null, null, [["music", 39.04], ["boing", 8.27], ["sound effect", 7.45]], [["music", 44.12], ["carnatic music", 8.73], ["speech", 4.93]], null, [["speech", 68.07], ["boing", 7.82], ["music", 7.44]], null, null, [["music", 34.28], ["didgeridoo", 11.77], ["hum", 6.64]], null, [["speech", 43.11], ["hum", 14.39], ["music", 7.97]], null, null, [["music", 28.93], ["didgeridoo", 11.33], ["insect", 6.07]]], "duration": [2.14, 1.25, 1.94, 0.06, 1.35, 4.86, 0.08, 1.28, 1.93, 0.02, 4.9, 2.13, 7.53, 5.6, 0.68, 0.55, 3.27, 4.41, 1.39, 8.96, 1.59, 0.49, 2.23, 1.25, 7.77, 1.1, 0.69, 2.91]} \ No newline at end of file diff --git a/annotations_1/kvtsZ1Edkk4_filtered.json b/annotations_1/kvtsZ1Edkk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cee472719f1467e678b62fb3b6f8196b74a58a77 --- /dev/null +++ b/annotations_1/kvtsZ1Edkk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [10.0, 10.08], [15.0, 15.72], [19.0, 19.06], [21.0, 21.36], [35.0, 35.02], [42.0, 42.36], [58.0, 57.96], [60.0, 61.21], [69.0, 70.28], [91.0, 94.22], [97.0, 98.34], [101.0, 101.38], [105.0, 106.15], [110.0, 110.81], [113.0, 114.08], [117.0, 118.56], [122.0, 122.59], [126.0, 128.12], [128.0, 128.19], [128.0, 128.22], [128.0, 128.26], [128.0, 128.29], [128.0, 128.33], [128.0, 128.36], [130.0, 130.72], [148.0, 160.22], [168.0, 168.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.02, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 63.87], ["musical instrument", 10.09], ["guitar", 9.6]], null, null, null, null, null, null, null, [["music", 76.08], ["musical instrument", 2.41], ["guitar", 2.3]], null, null, null, null, null, null, null, [["music", 80.52], ["musical instrument", 4.51], ["guitar", 2.56]], null], "duration": [0.6, 0.08, 0.72, 0.06, 0.36, 0.02, 0.36, -0.04, 1.21, 1.28, 3.22, 1.34, 0.38, 1.15, 0.81, 1.08, 1.56, 0.59, 2.12, 0.19, 0.22, 0.26, 0.29, 0.33, 0.36, 0.72, 12.22, 0.44]} \ No newline at end of file diff --git a/annotations_1/kvzzBebEAHQ_filtered.json b/annotations_1/kvzzBebEAHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..919de983e9ee276fbbee646decd75bcf3bfc684e --- /dev/null +++ b/annotations_1/kvzzBebEAHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 63.59], [64.0, 91.47], [94.0, 96.48], [96.0, 96.53]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 31.81, 34.12, 0.0], "audiomae_on_audioset": [null, [["music", 37.13], ["hum", 7.74], ["throbbing", 5.76]], [["throbbing", 41.19], ["hum", 25.07], ["music", 15.93]], null], "duration": [35.59, 27.47, 2.48, 0.53]} \ No newline at end of file diff --git a/annotations_1/kwvSRZG285g_filtered.json b/annotations_1/kwvSRZG285g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e60cf8f982c0eb1cbab22e4fc004d2ce2a2e373 --- /dev/null +++ b/annotations_1/kwvSRZG285g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.74], [8.0, 8.24], [12.0, 13.69], [20.0, 21.83], [25.0, 25.44], [27.0, 28.92], [34.0, 36.12], [38.0, 40.93], [45.0, 45.2], [46.0, 46.43], [49.0, 52.0], [56.0, 56.35], [59.0, 60.17], [66.0, 66.85], [69.0, 70.58], [76.0, 76.01], [81.0, 82.02], [83.0, 84.92], [89.0, 96.09], [102.0, 104.43], [105.0, 105.92], [112.0, 115.94], [121.0, 121.49], [124.0, 129.29], [133.0, 132.95], [139.0, 139.92], [147.0, 148.15], [157.0, 158.04], [158.0, 159.21], [164.0, 165.3], [166.0, 166.7], [168.0, 170.63], [173.0, 175.54], [179.0, 181.97], [184.0, 186.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 99.16, 100.0, 0.0, 0.0, 87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.83, 99.31, 0.0, 100.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.74, 98.01, 100.0, 92.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.74, 0.24, 1.69, 1.83, 0.44, 1.92, 2.12, 2.93, 0.2, 0.43, 3.0, 0.35, 1.17, 0.85, 1.58, 0.01, 1.02, 1.92, 7.09, 2.43, 0.92, 3.94, 0.49, 5.29, -0.05, 0.92, 1.15, 1.04, 1.21, 1.3, 0.7, 2.63, 2.54, 2.97, 2.17]} \ No newline at end of file diff --git a/annotations_1/kxvkI8K7fTo_filtered.json b/annotations_1/kxvkI8K7fTo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7d7fd1e934b4afe29d3f66a39a02ea264daf912 --- /dev/null +++ b/annotations_1/kxvkI8K7fTo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.21], [13.0, 15.4], [26.0, 26.13], [27.0, 30.57], [32.0, 32.07], [33.0, 34.45], [38.0, 38.85], [42.0, 44.12], [47.0, 48.3], [50.0, 50.67], [56.0, 56.61], [57.0, 57.7], [58.0, 59.53], [76.0, 77.36], [91.0, 91.88], [105.0, 106.71], [113.0, 113.34], [113.0, 114.12], [118.0, 123.69], [126.0, 127.06], [135.0, 136.31], [140.0, 140.9], [143.0, 143.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 79.59, 0.0, 63.42, 0.0, 0.0, 0.0, 61.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.66, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 14.65], ["moo", 12.4], ["mosquito", 11.65]], null, null, null, null], "duration": [0.21, 2.4, 0.13, 3.57, 0.07, 1.45, 0.85, 2.12, 1.3, 0.67, 0.61, 0.7, 1.53, 1.36, 0.88, 1.71, 0.34, 1.12, 5.69, 1.06, 1.31, 0.9, 0.16]} \ No newline at end of file diff --git a/annotations_1/kyfMjDlcisQ_filtered.json b/annotations_1/kyfMjDlcisQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee7e7bc4451f91a3089d3682dfd10f961e647bb8 --- /dev/null +++ b/annotations_1/kyfMjDlcisQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.99], [16.0, 18.12], [19.0, 41.74], [45.0, 46.41], [48.0, 55.88], [58.0, 68.22], [75.0, 82.39]], "keep_status": [true, false, false, false, false, false, false], "silence_prob": [30.41, 29.3, 29.64, 0.0, 29.55, 29.76, 29.34], "audiomae_on_audioset": [[["music", 58.27], ["guitar", 4.39], ["musical instrument", 3.92]], [["music", 69.32], ["guitar", 5.87], ["plucked string instrument", 4.08]], [["music", 63.3], ["hum", 5.12], ["synthesizer", 4.78]], null, [["music", 67.39], ["sitar", 13.35], ["carnatic music", 7.55]], [["music", 53.99], ["hum", 13.91], ["throbbing", 11.6]], [["music", 59.75], ["sitar", 9.18], ["carnatic music", 7.96]]], "duration": [4.99, 2.12, 22.74, 1.41, 7.88, 10.22, 7.39]} \ No newline at end of file diff --git a/annotations_1/kzVO5JrnEJ8_filtered.json b/annotations_1/kzVO5JrnEJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3caefeaa8657d212ab40c762e8d3f70ef5e69381 --- /dev/null +++ b/annotations_1/kzVO5JrnEJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.38], [10.0, 10.29], [11.0, 11.82], [20.0, 20.01], [22.0, 23.08], [24.0, 24.8], [27.0, 27.33], [28.0, 32.56], [34.0, 33.86], [38.0, 40.98], [49.0, 51.26], [56.0, 57.0], [64.0, 64.57], [69.0, 71.68], [75.0, 75.22], [77.0, 79.79], [84.0, 85.26], [96.0, 98.56], [100.0, 104.41], [107.0, 108.41], [110.0, 110.66], [112.0, 116.94], [122.0, 123.03], [124.0, 124.56], [125.0, 124.6], [125.0, 126.17], [134.0, 135.92], [137.0, 143.29], [144.0, 144.49], [152.0, 153.0]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 0.0, 42.84, 50.41, 0.0, 0.0, 60.6, 0.0, 35.73, 0.0, 70.44, 99.1, 0.0, 0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 66.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 35.95], ["music", 23.96], ["hum", 9.06]], null, null, null, null, null, [["music", 42.56], ["applause", 24.52], ["crowd", 3.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.38, 0.29, 0.82, 0.01, 1.08, 0.8, 0.33, 4.56, -0.14, 2.98, 2.26, 1.0, 0.57, 2.68, 0.22, 2.79, 1.26, 2.56, 4.41, 1.41, 0.66, 4.94, 1.03, 0.56, -0.4, 1.17, 1.92, 6.29, 0.49, 1.0]} \ No newline at end of file diff --git a/annotations_1/kzZQYnvw-6E_filtered.json b/annotations_1/kzZQYnvw-6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e250924417f5bd5e6271b8f793e8e8ac862bf49 --- /dev/null +++ b/annotations_1/kzZQYnvw-6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 27.04], [28.0, 30.62], [35.0, 36.56], [38.0, 40.59], [42.0, 42.74], [44.0, 51.06], [55.0, 58.97], [62.0, 65.37], [79.0, 79.02], [83.0, 82.63], [92.0, 92.62], [103.0, 103.96], [106.0, 106.0], [108.0, 108.24], [113.0, 117.14], [119.0, 127.31], [132.0, 132.63], [134.0, 137.71], [151.0, 151.88], [153.0, 162.89], [164.0, 166.18], [171.0, 171.69]], "keep_status": [true, true, false, true, false, false, true, false, false, false, false, false, false, false, true, true, false, true, false, false, true, false], "silence_prob": [31.87, 33.45, 0.0, 30.33, 0.0, 31.69, 34.35, 42.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.65, 30.95, 0.0, 32.0, 0.0, 30.54, 29.93, 0.0], "audiomae_on_audioset": [[["speech", 26.01], ["thunk", 11.18], ["explosion", 8.42]], [["roaring cats (lions, tigers)", 17.26], ["animal", 15.75], ["roar", 13.9]], null, [["speech", 46.09], ["grunt", 14.66], ["fart", 8.91]], null, [["cattle, bovinae", 46.48], ["moo", 25.63], ["livestock, farm animals, working animals", 16.75]], [["groan", 50.44], ["grunt", 11.14], ["roar", 4.96]], [["speech", 79.75], ["sine wave", 2.76], ["sidetone", 1.68]], null, null, null, null, null, null, [["whack, thwack", 27.44], ["speech", 18.8], ["music", 9.42]], [["music", 33.3], ["speech", 17.03], ["groan", 17.0]], null, [["speech", 16.28], ["music", 6.88], ["hum", 6.78]], null, [["speech", 36.5], ["music", 36.33], ["didgeridoo", 10.63]], [["speech", 28.85], ["groan", 13.62], ["cattle, bovinae", 5.8]], null], "duration": [4.04, 2.62, 1.56, 2.59, 0.74, 7.06, 3.97, 3.37, 0.02, -0.37, 0.62, 0.96, 0.0, 0.24, 4.14, 8.31, 0.63, 3.71, 0.88, 9.89, 2.18, 0.69]} \ No newline at end of file diff --git a/annotations_1/kzf7hr9O00k_filtered.json b/annotations_1/kzf7hr9O00k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f9866c94894100de6a12ce50c0e343154abc4ba --- /dev/null +++ b/annotations_1/kzf7hr9O00k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [14.0, 14.34], [16.0, 17.12], [25.0, 26.16], [40.0, 43.5], [44.0, 43.63], [52.0, 53.67], [56.0, 60.2], [63.0, 67.26], [68.0, 75.68], [81.0, 81.53], [87.0, 88.64], [94.0, 94.56], [105.0, 105.6], [111.0, 112.04], [113.0, 113.39], [122.0, 122.59], [126.0, 126.05], [133.0, 133.22], [141.0, 141.47]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 34.41, 33.93, 35.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 53.46], ["speech", 6.61], ["electronic music", 4.32]], null, null, [["music", 67.92], ["musical instrument", 6.36], ["didgeridoo", 3.8]], [["speech", 48.82], ["music", 35.76], ["throbbing", 3.53]], [["music", 34.12], ["speech", 16.33], ["didgeridoo", 15.29]], null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 0.34, 1.12, 1.16, 3.5, -0.37, 1.67, 4.2, 4.26, 7.68, 0.53, 1.64, 0.56, 0.6, 1.04, 0.39, 0.59, 0.05, 0.22, 0.47]} \ No newline at end of file diff --git a/annotations_1/kzxSZ5zCfXs_filtered.json b/annotations_1/kzxSZ5zCfXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5aa9b16a9f60d67a6bcaf1f387f8699d78656a68 --- /dev/null +++ b/annotations_1/kzxSZ5zCfXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 29.1], [30.0, 34.7], [36.0, 40.37], [41.0, 53.47], [56.0, 58.72], [60.0, 61.2], [64.0, 65.35]], "keep_status": [false, true, true, true, false, false, false], "silence_prob": [28.96, 28.76, 28.91, 29.13, 29.6, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 45.01], ["buzz", 17.46], ["vehicle", 11.94]], [["speech", 44.77], ["vehicle", 20.06], ["hum", 4.91]], [["hum", 27.95], ["mains hum", 18.24], ["breaking", 9.42]], [["speech", 23.24], ["electric shaver, electric razor", 18.65], ["buzz", 15.01]], [["mains hum", 46.39], ["hum", 28.84], ["speech", 7.44]], null, null], "duration": [4.1, 4.7, 4.37, 12.47, 2.72, 1.2, 1.35]} \ No newline at end of file diff --git a/annotations_1/kzxz5xezOAI_filtered.json b/annotations_1/kzxz5xezOAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b896f7ae2c3e50c308d40585c38ed0c20fe00bab --- /dev/null +++ b/annotations_1/kzxz5xezOAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.15], [15.0, 15.85], [23.0, 24.14], [29.0, 30.5], [32.0, 32.95], [34.0, 34.42], [37.0, 38.25], [46.0, 47.53], [54.0, 54.19], [56.0, 57.99], [59.0, 60.03], [62.0, 66.97], [69.0, 70.02], [71.0, 72.03], [73.0, 81.43], [84.0, 84.08]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [44.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.05, 0.0, 0.0, 32.04, 0.0], "audiomae_on_audioset": [[["noise", 26.46], ["hum", 15.62], ["music", 10.78]], null, null, null, null, null, null, null, null, null, null, [["speech", 26.45], ["whale vocalization", 24.88], ["hum", 8.82]], null, null, [["speech", 44.02], ["animal", 7.14], ["electric shaver, electric razor", 6.3]], null], "duration": [7.15, 0.85, 1.14, 1.5, 0.95, 0.42, 1.25, 1.53, 0.19, 1.99, 1.03, 4.97, 1.02, 1.03, 8.43, 0.08]} \ No newline at end of file diff --git a/annotations_1/l-GbvgBXi18_filtered.json b/annotations_1/l-GbvgBXi18_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3b0ab52be4ea68a3321f7283b4b70d5ab6b5dfe --- /dev/null +++ b/annotations_1/l-GbvgBXi18_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.6], [10.0, 13.85], [16.0, 16.63], [18.0, 23.73], [27.0, 26.89], [27.0, 28.32], [29.0, 30.75], [34.0, 37.71], [41.0, 41.62], [44.0, 46.57], [70.0, 71.1], [72.0, 76.99], [78.0, 87.88], [96.0, 96.42], [97.0, 97.51], [98.0, 99.82], [108.0, 133.25], [140.0, 145.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 55.04, 0.0, 35.0, 0.0, 0.0, 0.0, 42.44, 0.0, 99.92, 0.0, 87.55, 60.05, 0.0, 0.0, 0.0, 37.59, 99.65], "audiomae_on_audioset": [null, null, null, [["speech", 64.85], ["whack, thwack", 5.66], ["arrow", 2.1]], null, null, null, [["hum", 36.27], ["whale vocalization", 16.44], ["throbbing", 11.94]], null, null, null, null, null, null, null, null, [["whale vocalization", 81.95], ["rumble", 5.63], ["stomach rumble", 2.14]], null], "duration": [0.6, 3.85, 0.63, 5.73, -0.11, 1.32, 1.75, 3.71, 0.62, 2.57, 1.1, 4.99, 9.88, 0.42, 0.51, 1.82, 25.25, 5.94]} \ No newline at end of file diff --git a/annotations_1/l081UdHizvg_filtered.json b/annotations_1/l081UdHizvg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58626b70210cb0020dbdf7a49eefead172f345a2 --- /dev/null +++ b/annotations_1/l081UdHizvg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.7], [10.0, 13.47], [15.0, 15.4], [20.0, 20.39], [23.0, 23.77], [25.0, 25.22], [27.0, 27.99], [29.0, 30.05], [31.0, 31.7], [35.0, 35.82], [39.0, 38.99], [51.0, 57.72], [62.0, 62.19], [64.0, 64.56], [65.0, 66.09], [69.0, 71.64], [72.0, 73.57], [74.0, 75.15], [76.0, 76.86], [79.0, 80.76], [86.0, 88.43], [89.0, 89.5], [91.0, 91.49], [100.0, 101.8], [103.0, 102.95], [104.0, 105.81], [106.0, 107.18], [108.0, 108.8], [110.0, 112.02], [113.0, 114.02], [117.0, 116.99], [122.0, 122.67], [125.0, 125.54], [129.0, 129.83], [133.0, 133.03], [135.0, 154.74], [173.0, 174.51]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.81, 0.0, 0.0, 0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.47, 0.0], "audiomae_on_audioset": [null, [["music", 24.02], ["speech", 22.13], ["animal", 4.54]], null, null, null, null, null, null, null, null, null, [["hum", 22.94], ["livestock, farm animals, working animals", 12.7], ["cattle, bovinae", 11.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.94], ["foghorn", 7.79], ["musical instrument", 4.8]], null], "duration": [1.7, 3.47, 0.4, 0.39, 0.77, 0.22, 0.99, 1.05, 0.7, 0.82, -0.01, 6.72, 0.19, 0.56, 1.09, 2.64, 1.57, 1.15, 0.86, 1.76, 2.43, 0.5, 0.49, 1.8, -0.05, 1.81, 1.18, 0.8, 2.02, 1.02, -0.01, 0.67, 0.54, 0.83, 0.03, 19.74, 1.51]} \ No newline at end of file diff --git a/annotations_1/l0zmCUVB0Yw_filtered.json b/annotations_1/l0zmCUVB0Yw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7a5c806a6229708f9063d41ab8b399166e8280b --- /dev/null +++ b/annotations_1/l0zmCUVB0Yw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.4], [1.0, 5.49], [12.0, 12.66], [26.0, 25.68], [27.0, 27.46], [41.0, 42.52], [54.0, 53.82], [66.0, 66.01], [72.0, 72.57], [86.0, 86.7], [91.0, 91.45], [93.0, 94.9], [97.0, 97.38], [98.0, 99.45], [100.0, 100.8], [116.0, 116.51], [120.0, 120.8], [122.0, 122.44], [124.0, 124.61], [128.0, 127.89], [132.0, 132.21], [143.0, 143.43], [144.0, 143.95], [145.0, 144.76], [145.0, 145.66], [152.0, 161.81], [172.0, 172.57], [174.0, 174.8]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 32.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.18, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 49.72], ["musical instrument", 5.08], ["speech", 3.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.24], ["synthesizer", 16.42], ["speech", 15.84]], null, null], "duration": [0.4, 4.49, 0.66, -0.32, 0.46, 1.52, -0.18, 0.01, 0.57, 0.7, 0.45, 1.9, 0.38, 1.45, 0.8, 0.51, 0.8, 0.44, 0.61, -0.11, 0.21, 0.43, -0.05, -0.24, 0.66, 9.81, 0.57, 0.8]} \ No newline at end of file diff --git a/annotations_1/l17e0M4TTBA_filtered.json b/annotations_1/l17e0M4TTBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0d3b73326501caf13173162dfbc4de2a7c4f49d --- /dev/null +++ b/annotations_1/l17e0M4TTBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [17.0, 17.44], [19.0, 20.68], [22.0, 22.79], [24.0, 28.0], [30.0, 32.7], [33.0, 36.27], [38.0, 43.34], [44.0, 45.54], [50.0, 51.41], [52.0, 54.48], [57.0, 57.3], [69.0, 70.6], [71.0, 88.65], [91.0, 95.96], [99.0, 104.23], [109.0, 111.72], [116.0, 117.9], [121.0, 122.81], [124.0, 125.85], [130.0, 133.51], [134.0, 135.68], [137.0, 138.23], [144.0, 147.04], [150.0, 151.31], [153.0, 158.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 96.54, 53.59, 97.92, 75.88, 0.0, 0.0, 72.01, 0.0, 0.0, 59.15, 88.46, 99.21, 54.97, 0.0, 0.0, 0.0, 83.34, 0.0, 0.0, 59.33, 0.0, 99.65], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 0.44, 1.68, 0.79, 4.0, 2.7, 3.27, 5.34, 1.54, 1.41, 2.48, 0.3, 1.6, 17.65, 4.96, 5.23, 2.72, 1.9, 1.81, 1.85, 3.51, 1.68, 1.23, 3.04, 1.31, 5.25]} \ No newline at end of file diff --git a/annotations_1/l2zrJ_LZrhg_filtered.json b/annotations_1/l2zrJ_LZrhg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2478a921ad33eb0eb2471972ab4cb2837d6222c2 --- /dev/null +++ b/annotations_1/l2zrJ_LZrhg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.25], [22.0, 26.7], [30.0, 31.02], [32.0, 33.84], [41.0, 41.71], [46.0, 48.88], [59.0, 59.75], [60.0, 65.45], [68.0, 78.95], [86.0, 87.83], [88.0, 89.95], [92.0, 94.49], [98.0, 98.02], [99.0, 103.5], [113.0, 113.46], [117.0, 120.11], [123.0, 131.89], [146.0, 147.12], [151.0, 152.14], [155.0, 157.84], [158.0, 162.06], [165.0, 167.04]], "keep_status": [false, true, false, false, false, true, false, true, false, false, false, true, false, true, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 33.61, 0.0, 0.0, 0.0, 33.9, 0.0, 30.07, 33.22, 0.0, 0.0, 42.74, 0.0, 31.58, 0.0, 90.6, 51.18, 0.0, 0.0, 39.46, 34.79, 39.3], "audiomae_on_audioset": [null, [["speech", 34.27], ["thunk", 17.83], ["whack, thwack", 10.15]], null, null, null, [["hum", 32.05], ["speech", 29.31], ["mains hum", 8.42]], null, [["speech", 36.88], ["sidetone", 14.05], ["music", 13.06]], [["speech", 56.79], ["music", 22.23], ["fart", 4.71]], null, null, [["hum", 17.38], ["throbbing", 16.39], ["music", 14.13]], null, [["livestock, farm animals, working animals", 24.58], ["cattle, bovinae", 20.05], ["moo", 18.87]], null, null, null, null, null, [["music", 53.96], ["musical instrument", 7.06], ["didgeridoo", 4.37]], [["music", 65.83], ["musical instrument", 3.32], ["guitar", 2.0]], [["music", 47.04], ["cello", 10.83], ["double bass", 8.04]]], "duration": [1.25, 4.7, 1.02, 1.84, 0.71, 2.88, 0.75, 5.45, 10.95, 1.83, 1.95, 2.49, 0.02, 4.5, 0.46, 3.11, 8.89, 1.12, 1.14, 2.84, 4.06, 2.04]} \ No newline at end of file diff --git a/annotations_1/l38Qliee6VE_filtered.json b/annotations_1/l38Qliee6VE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a567293154f755fce37d62314e80f91ebf1c54d8 --- /dev/null +++ b/annotations_1/l38Qliee6VE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.6], [10.0, 15.33], [18.0, 19.43], [20.0, 20.38], [25.0, 27.9], [49.0, 51.92], [61.0, 61.3], [62.0, 62.94], [64.0, 65.42], [67.0, 69.18], [70.0, 71.02], [71.0, 87.2], [87.0, 87.37], [87.0, 87.71], [88.0, 87.74], [88.0, 87.98], [88.0, 95.86], [107.0, 108.51], [112.0, 112.11], [113.0, 113.46], [119.0, 127.38], [129.0, 132.38], [134.0, 136.65], [143.0, 151.14], [152.0, 156.39]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 55.25, 0.0, 0.0, 38.11, 59.96, 0.0, 0.0, 0.0, 40.99, 0.0, 31.57, 0.0, 0.0, 0.0, 0.0, 31.75, 0.0, 0.0, 0.0, 40.19, 39.22, 75.23, 78.38, 49.18], "audiomae_on_audioset": [null, null, null, null, [["speech", 29.2], ["wail, moan", 19.16], ["fart", 11.28]], null, null, null, null, [["music", 33.31], ["hum", 6.27], ["musical instrument", 3.69]], null, [["music", 56.52], ["speech", 10.06], ["synthesizer", 9.18]], null, null, null, null, [["music", 56.53], ["sidetone", 14.12], ["speech", 5.12]], null, null, null, [["music", 82.44], ["speech", 4.41], ["musical instrument", 2.06]], [["music", 56.16], ["musical instrument", 4.13], ["hum", 2.77]], null, null, [["music", 28.34], ["speech", 17.1], ["sidetone", 11.26]]], "duration": [-0.4, 5.33, 1.43, 0.38, 2.9, 2.92, 0.3, 0.94, 1.42, 2.18, 1.02, 16.2, 0.37, 0.71, -0.26, -0.02, 7.86, 1.51, 0.11, 0.46, 8.38, 3.38, 2.65, 8.14, 4.39]} \ No newline at end of file diff --git a/annotations_1/l46yjkR0SqU_filtered.json b/annotations_1/l46yjkR0SqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38cd542ff5ea235a39c355dce17e2ac37de81320 --- /dev/null +++ b/annotations_1/l46yjkR0SqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 14.69], [19.0, 20.33], [21.0, 21.47], [23.0, 22.98], [24.0, 36.44], [38.0, 84.97], [85.0, 86.39], [87.0, 100.45], [104.0, 115.13], [120.0, 122.1], [124.0, 125.63], [126.0, 126.79], [130.0, 130.27], [131.0, 134.03], [137.0, 137.24], [138.0, 140.02], [141.0, 158.82], [160.0, 160.37], [163.0, 167.86]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, true], "silence_prob": [35.42, 0.0, 0.0, 0.0, 53.53, 0.0, 0.0, 29.03, 30.52, 62.58, 0.0, 0.0, 0.0, 40.45, 0.0, 43.35, 39.89, 0.0, 37.35], "audiomae_on_audioset": [[["hum", 28.04], ["throbbing", 17.13], ["whale vocalization", 15.07]], null, null, null, null, null, null, [["music", 68.86], ["marimba, xylophone", 4.87], ["musical instrument", 2.74]], [["music", 69.46], ["theremin", 12.56], ["soundtrack music", 1.42]], null, null, null, null, [["cattle, bovinae", 9.82], ["fly, housefly", 9.7], ["speech", 9.15]], null, [["speech", 35.97], ["music", 5.78], ["hum", 4.73]], [["hum", 37.13], ["mains hum", 16.82], ["throbbing", 14.55]], null, [["speech", 32.24], ["music", 8.79], ["mains hum", 7.83]]], "duration": [10.69, 1.33, 0.47, -0.02, 12.44, 46.97, 1.39, 13.45, 11.13, 2.1, 1.63, 0.79, 0.27, 3.03, 0.24, 2.02, 17.82, 0.37, 4.86]} \ No newline at end of file diff --git a/annotations_1/l4S4IBACQCM_filtered.json b/annotations_1/l4S4IBACQCM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a558c0944860c39a9b177beca85e141e80213c26 --- /dev/null +++ b/annotations_1/l4S4IBACQCM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.93], [3.0, 7.15], [8.0, 8.94], [9.0, 10.83], [22.0, 22.69], [25.0, 25.02], [26.0, 26.47], [30.0, 31.56], [32.0, 32.66], [34.0, 34.13], [40.0, 41.39], [51.0, 51.46], [71.0, 108.7], [113.0, 134.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.85], "audiomae_on_audioset": [null, [["music", 53.16], ["brass instrument", 11.65], ["trombone", 9.66]], null, null, null, null, null, null, null, null, null, null, null, [["music", 62.04], ["buzz", 6.35], ["musical instrument", 4.06]]], "duration": [0.93, 4.15, 0.94, 1.83, 0.69, 0.02, 0.47, 1.56, 0.66, 0.13, 1.39, 0.46, 37.7, 21.6]} \ No newline at end of file diff --git a/annotations_1/l6TGERgrXmA_filtered.json b/annotations_1/l6TGERgrXmA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f0477d3030c9f5b3f24fe2ccab26ab3f38baddc3 --- /dev/null +++ b/annotations_1/l6TGERgrXmA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.76], [2.0, 5.68], [19.0, 19.84], [25.0, 26.74], [35.0, 36.02], [38.0, 38.2], [43.0, 45.15], [46.0, 46.57], [54.0, 61.33], [64.0, 64.56], [65.0, 67.07], [68.0, 68.5], [71.0, 71.22], [74.0, 75.03], [82.0, 84.2], [95.0, 98.25], [102.0, 103.13], [115.0, 124.48], [127.0, 130.47], [131.0, 132.68], [133.0, 144.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.95, 0.0, 0.0, 0.0, 0.0, 62.58, 0.0, 61.97, 0.0, 53.84, 0.0, 0.0, 0.0, 56.25, 99.92, 0.0, 90.95, 92.8, 0.0, 96.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.24, 3.68, 0.84, 1.74, 1.02, 0.2, 2.15, 0.57, 7.33, 0.56, 2.07, 0.5, 0.22, 1.03, 2.2, 3.25, 1.13, 9.48, 3.47, 1.68, 11.15]} \ No newline at end of file diff --git a/annotations_1/l7FkN4ooYvA_filtered.json b/annotations_1/l7FkN4ooYvA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a584a05e954f9425d0c9d1535c245c1840f5e41e --- /dev/null +++ b/annotations_1/l7FkN4ooYvA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.3], [13.0, 13.07], [28.0, 27.82], [28.0, 28.24], [28.0, 28.29], [35.0, 38.47], [43.0, 59.8], [61.0, 69.09], [69.0, 69.16], [69.0, 70.78], [77.0, 79.84], [84.0, 95.12], [102.0, 101.88], [108.0, 107.94], [108.0, 108.26], [116.0, 116.51], [119.0, 118.94], [124.0, 129.41], [130.0, 139.38], [142.0, 144.83], [166.0, 169.23], [172.0, 174.31]], "keep_status": [true, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, true, true], "silence_prob": [43.08, 0.0, 0.0, 0.0, 0.0, 33.77, 32.13, 31.81, 0.0, 0.0, 29.05, 32.61, 0.0, 0.0, 0.0, 0.0, 0.0, 37.37, 32.2, 35.53, 29.39, 29.62], "audiomae_on_audioset": [[["music", 41.04], ["bow-wow", 11.26], ["speech", 8.64]], null, null, null, null, [["vehicle", 12.32], ["motorcycle", 12.29], ["siren", 11.47]], [["music", 53.36], ["boing", 32.63], ["speech", 4.03]], [["music", 67.0], ["boing", 10.35], ["scratching (performance technique)", 3.59]], null, null, [["speech", 26.34], ["sidetone", 11.01], ["music", 10.72]], [["music", 55.98], ["theremin", 10.15], ["buzz", 3.46]], null, null, null, null, null, [["music", 71.55], ["speech", 11.47], ["sidetone", 3.01]], [["music", 67.5], ["speech", 6.65], ["groan", 4.84]], [["groan", 34.29], ["music", 23.55], ["boing", 18.51]], [["music", 53.34], ["electronic music", 3.58], ["effects unit", 3.02]], [["music", 23.69], ["speech", 4.54], ["musical instrument", 2.28]]], "duration": [2.3, 0.07, -0.18, 0.24, 0.29, 3.47, 16.8, 8.09, 0.16, 1.78, 2.84, 11.12, -0.12, -0.06, 0.26, 0.51, -0.06, 5.41, 9.38, 2.83, 3.23, 2.31]} \ No newline at end of file diff --git a/annotations_1/l8MFxT9ILKY_filtered.json b/annotations_1/l8MFxT9ILKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5c0933f535b9b625257a6c481f8d7308d96e896 --- /dev/null +++ b/annotations_1/l8MFxT9ILKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.26], [15.0, 26.89], [31.0, 34.96], [37.0, 38.3], [39.0, 46.01], [47.0, 53.87], [60.0, 60.45], [63.0, 74.66], [78.0, 79.2], [80.0, 81.51], [83.0, 89.67], [93.0, 104.14], [106.0, 107.42], [108.0, 144.15], [146.0, 146.11], [148.0, 147.75], [149.0, 160.91], [162.0, 163.76], [165.0, 166.13]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.45, 30.18, 0.0, 33.63, 44.32, 0.0, 41.36, 0.0, 0.0, 34.3, 30.33, 0.0, 0.0, 0.0, 0.0, 30.44, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 36.47], ["vehicle", 8.92], ["hum", 8.59]], [["speech", 45.64], ["hubbub, speech noise, speech babble", 11.15], ["cattle, bovinae", 3.68]], null, [["speech", 64.71], ["theremin", 5.02], ["music", 4.38]], [["speech", 37.49], ["music", 30.69], ["hum", 3.35]], null, [["mains hum", 55.52], ["hum", 38.39], ["speech", 1.05]], null, null, [["music", 67.67], ["hum", 2.68], ["scary music", 2.54]], [["music", 56.25], ["hum", 9.0], ["buzz", 8.47]], null, null, null, null, [["music", 53.96], ["hum", 20.39], ["mains hum", 12.97]], null, null], "duration": [0.26, 11.89, 3.96, 1.3, 7.01, 6.87, 0.45, 11.66, 1.2, 1.51, 6.67, 11.14, 1.42, 36.15, 0.11, -0.25, 11.91, 1.76, 1.13]} \ No newline at end of file diff --git a/annotations_1/l94geYuwNJg_filtered.json b/annotations_1/l94geYuwNJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17ab885ea5eab14dd8a67a2f68be6f2d0ecec6c4 --- /dev/null +++ b/annotations_1/l94geYuwNJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.33]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.33]} \ No newline at end of file diff --git a/annotations_1/lCF6_l8gtdA_filtered.json b/annotations_1/lCF6_l8gtdA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cce6e7183e28c6111d61f1e647e066888cb29f3a --- /dev/null +++ b/annotations_1/lCF6_l8gtdA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.66], [3.0, 4.01], [5.0, 5.34], [6.0, 6.54], [9.0, 11.89], [17.0, 17.2], [37.0, 39.51], [50.0, 51.02], [53.0, 53.27], [53.0, 53.91], [56.0, 56.03], [56.0, 59.31], [61.0, 62.72], [63.0, 65.06], [70.0, 76.52], [81.0, 88.11], [89.0, 89.14], [90.0, 90.29], [92.0, 92.84], [94.0, 94.29], [96.0, 96.3], [100.0, 100.63], [105.0, 107.92], [109.0, 110.42], [111.0, 111.52], [114.0, 114.96], [116.0, 117.9], [125.0, 128.41], [129.0, 133.59], [135.0, 135.31], [136.0, 137.3], [138.0, 139.67], [140.0, 141.02], [144.0, 145.89], [146.0, 146.82], [149.0, 149.23], [150.0, 153.35], [158.0, 163.36], [164.0, 165.27], [168.0, 167.83], [170.0, 170.7], [171.0, 173.18], [174.0, 174.43], [175.0, 176.28], [178.0, 179.64], [181.0, 183.95], [185.0, 185.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 76.04, 0.0, 60.32, 0.0, 0.0, 0.0, 0.0, 43.13, 0.0, 54.43, 76.7, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.27, 0.0, 0.0, 0.0, 0.0, 50.26, 40.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.18, 41.95, 0.0, 0.0, 0.0, 42.88, 0.0, 0.0, 0.0, 53.28, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 14.98], ["noise", 10.72], ["radio", 6.16]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 38.17], ["music", 26.49], ["didgeridoo", 4.99]], null, null, null, null, null, null, null, [["mains hum", 39.35], ["hum", 27.28], ["music", 7.84]], [["hum", 38.88], ["mains hum", 27.15], ["music", 13.12]], null, null, null, [["speech", 17.05], ["mains hum", 17.01], ["sidetone", 15.06]], null, null, null, null, null], "duration": [0.66, 1.01, 0.34, 0.54, 2.89, 0.2, 2.51, 1.02, 0.27, 0.91, 0.03, 3.31, 1.72, 2.06, 6.52, 7.11, 0.14, 0.29, 0.84, 0.29, 0.3, 0.63, 2.92, 1.42, 0.52, 0.96, 1.9, 3.41, 4.59, 0.31, 1.3, 1.67, 1.02, 1.89, 0.82, 0.23, 3.35, 5.36, 1.27, -0.17, 0.7, 2.18, 0.43, 1.28, 1.64, 2.95, 0.97]} \ No newline at end of file diff --git a/annotations_1/lCL7DI3ah40_filtered.json b/annotations_1/lCL7DI3ah40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f7b292f08ab79c96052665c7d7907d42e0b36f9 --- /dev/null +++ b/annotations_1/lCL7DI3ah40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.29], [19.0, 20.28], [30.0, 81.67]], "keep_status": [false, false, false], "silence_prob": [32.33, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 34.42], ["mains hum", 23.92], ["speech", 13.76]], null, null], "duration": [3.29, 1.28, 51.67]} \ No newline at end of file diff --git a/annotations_1/lCcWPDXqKi0_filtered.json b/annotations_1/lCcWPDXqKi0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26aa7aa409eea55b45ddc8943b7a825e74760955 --- /dev/null +++ b/annotations_1/lCcWPDXqKi0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.93], [11.0, 19.18], [20.0, 19.92], [20.0, 23.84], [25.0, 35.29], [37.0, 38.99], [51.0, 52.98], [53.0, 54.13], [57.0, 60.07], [61.0, 60.66], [61.0, 60.79], [61.0, 60.94], [67.0, 69.25], [75.0, 76.0], [76.0, 79.2]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 42.79, 0.0, 45.56, 46.54, 0.0, 0.0, 0.0, 44.18, 0.0, 0.0, 0.0, 45.18, 0.0, 46.64], "audiomae_on_audioset": [null, [["music", 45.85], ["speech", 27.88], ["synthesizer", 2.4]], null, [["music", 20.04], ["hum", 17.55], ["throbbing", 17.11]], [["music", 51.14], ["throbbing", 6.83], ["speech", 5.94]], null, null, null, [["music", 75.25], ["speech", 4.12], ["electronic music", 2.32]], null, null, null, [["music", 42.43], ["frog", 21.2], ["croak", 18.89]], null, [["speech", 24.59], ["music", 23.52], ["animal", 14.34]]], "duration": [1.93, 8.18, -0.08, 3.84, 10.29, 1.99, 1.98, 1.13, 3.07, -0.34, -0.21, -0.06, 2.25, 1.0, 3.2]} \ No newline at end of file diff --git a/annotations_1/lCqHKRjIMu8_filtered.json b/annotations_1/lCqHKRjIMu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfa4890a1b2d8726937e732e5ac8005626273d8f --- /dev/null +++ b/annotations_1/lCqHKRjIMu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.68], [6.0, 7.2], [9.0, 10.64], [14.0, 15.7], [17.0, 17.05], [18.0, 21.74], [26.0, 26.18], [27.0, 27.35], [28.0, 29.12], [30.0, 30.75], [33.0, 33.02], [35.0, 35.14], [35.0, 35.18], [35.0, 35.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 54.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 1.2, 1.64, 1.7, 0.05, 3.74, 0.18, 0.35, 1.12, 0.75, 0.02, 0.14, 0.18, 0.97]} \ No newline at end of file diff --git a/annotations_1/lEykI65QtSQ_filtered.json b/annotations_1/lEykI65QtSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a4fec14d85b7917572e05db8eda9c26dfe361d6 --- /dev/null +++ b/annotations_1/lEykI65QtSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.7], [47.0, 46.95], [59.0, 59.44], [61.0, 60.74], [66.0, 66.19], [67.0, 68.57], [81.0, 82.04], [82.0, 82.7], [85.0, 88.57], [96.0, 97.28], [98.0, 98.34], [99.0, 99.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.31, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["thunk", 66.8], ["speech", 17.16], ["music", 6.64]], null, null, null], "duration": [1.7, -0.05, 0.44, -0.26, 0.19, 1.57, 1.04, 0.7, 3.57, 1.28, 0.34, 0.74]} \ No newline at end of file diff --git a/annotations_1/lF3IIOXn5qU_filtered.json b/annotations_1/lF3IIOXn5qU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfeb210152b1c91560cfb68a2734bc9a194753d8 --- /dev/null +++ b/annotations_1/lF3IIOXn5qU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.08], [13.0, 15.72], [18.0, 18.28], [21.0, 21.71], [33.0, 34.8], [36.0, 37.4], [41.0, 41.66], [53.0, 53.33], [55.0, 55.46], [56.0, 58.99], [73.0, 73.21], [75.0, 75.76], [82.0, 86.48], [88.0, 88.94], [92.0, 94.47], [95.0, 96.25], [102.0, 103.15], [107.0, 108.01], [114.0, 115.25], [116.0, 117.31], [144.0, 145.57], [146.0, 146.84], [153.0, 156.56], [159.0, 158.82]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 29.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.53, 0.0, 0.0, 31.34, 0.0, 31.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.25, 0.0], "audiomae_on_audioset": [null, [["music", 32.21], ["boing", 11.13], ["speech", 9.18]], null, null, null, null, null, null, null, [["music", 22.56], ["livestock, farm animals, working animals", 15.21], ["moo", 9.85]], null, null, [["speech", 24.95], ["whack, thwack", 10.32], ["boing", 9.45]], null, [["music", 31.96], ["sidetone", 27.96], ["speech", 16.69]], null, null, null, null, null, null, null, [["music", 14.66], ["speech", 8.86], ["sheep", 3.7]], null], "duration": [1.08, 2.72, 0.28, 0.71, 1.8, 1.4, 0.66, 0.33, 0.46, 2.99, 0.21, 0.76, 4.48, 0.94, 2.47, 1.25, 1.15, 1.01, 1.25, 1.31, 1.57, 0.84, 3.56, -0.18]} \ No newline at end of file diff --git a/annotations_1/lFGfoPuKx9o_filtered.json b/annotations_1/lFGfoPuKx9o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fef17c86b77d3050e280236e05f07672ca21f905 --- /dev/null +++ b/annotations_1/lFGfoPuKx9o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.6], [6.0, 10.49], [11.0, 11.5], [12.0, 13.24], [14.0, 14.93], [16.0, 26.01], [28.0, 44.02], [45.0, 48.37]], "keep_status": [false, true, false, false, false, true, false, true], "silence_prob": [0.0, 30.3, 0.0, 0.0, 0.0, 31.51, 31.76, 32.48], "audiomae_on_audioset": [null, [["music", 39.88], ["whale vocalization", 10.44], ["hum", 5.13]], null, null, null, [["throbbing", 29.39], ["music", 16.72], ["hum", 15.6]], [["mains hum", 33.06], ["hum", 29.15], ["throbbing", 16.85]], [["music", 27.2], ["hum", 17.34], ["mains hum", 9.63]]], "duration": [1.6, 4.49, 0.5, 1.24, 0.93, 10.01, 16.02, 3.37]} \ No newline at end of file diff --git a/annotations_1/lFyh5QCd6kw_filtered.json b/annotations_1/lFyh5QCd6kw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72f7e761e8d142e0e3282fe918bc8b22e6c07166 --- /dev/null +++ b/annotations_1/lFyh5QCd6kw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 85.82]], "keep_status": [false], "silence_prob": [30.89], "audiomae_on_audioset": [[["music", 64.87], ["explosion", 3.29], ["brass instrument", 1.94]]], "duration": [4.82]} \ No newline at end of file diff --git a/annotations_1/lGAADj8laqo_filtered.json b/annotations_1/lGAADj8laqo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9425b52c9b8b94c7e9b4e1d0f8dccc5d3a36ceb --- /dev/null +++ b/annotations_1/lGAADj8laqo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.71], [10.0, 11.82], [13.0, 16.11], [19.0, 22.13], [23.0, 25.27], [26.0, 28.66], [30.0, 32.12], [33.0, 36.54], [37.0, 38.26], [39.0, 46.67], [48.0, 50.33], [51.0, 54.5], [58.0, 61.86], [63.0, 66.14], [68.0, 72.15], [74.0, 77.5], [83.0, 83.29], [84.0, 84.27], [85.0, 87.59], [89.0, 95.64], [97.0, 105.27], [106.0, 109.21], [111.0, 114.13], [115.0, 123.03]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [84.62, 0.0, 72.75, 98.86, 49.27, 53.16, 44.52, 59.96, 0.0, 98.19, 99.52, 84.43, 56.55, 70.72, 98.66, 64.18, 0.0, 0.0, 99.05, 99.48, 48.39, 50.46, 88.28, 90.6], "audiomae_on_audioset": [null, null, null, null, [["speech", 56.11], ["dial tone", 8.87], ["busy signal", 4.73]], null, [["speech", 39.74], ["music", 8.28], ["hum", 7.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 22.03], ["hum", 18.35], ["heart sounds, heartbeat", 8.34]], null, null, null], "duration": [3.71, 1.82, 3.11, 3.13, 2.27, 2.66, 2.12, 3.54, 1.26, 7.67, 2.33, 3.5, 3.86, 3.14, 4.15, 3.5, 0.29, 0.27, 2.59, 6.64, 8.27, 3.21, 3.13, 8.03]} \ No newline at end of file diff --git a/annotations_1/lGuivq-6xrw_filtered.json b/annotations_1/lGuivq-6xrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c31b49e1fd45fa617f95e69757a23ed635b18d4 --- /dev/null +++ b/annotations_1/lGuivq-6xrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.54], [14.0, 17.29], [32.0, 34.25], [42.0, 44.51], [49.0, 54.36], [66.0, 69.63], [72.0, 80.62], [81.0, 81.38], [83.0, 83.96], [100.0, 100.5], [117.0, 118.4], [136.0, 137.13], [147.0, 150.03], [164.0, 166.45], [171.0, 171.0], [176.0, 192.7], [193.0, 214.46], [223.0, 240.81], [250.0, 254.82], [270.0, 276.57]], "keep_status": [true, true, false, true, true, false, false, false, false, false, false, false, true, false, false, true, false, true, false, false], "silence_prob": [29.77, 30.32, 31.86, 32.28, 29.37, 31.3, 29.83, 0.0, 0.0, 0.0, 0.0, 0.0, 35.42, 28.58, 0.0, 28.79, 29.18, 28.7, 30.48, 29.85], "audiomae_on_audioset": [[["music", 60.46], ["didgeridoo", 2.76], ["theremin", 2.54]], [["speech", 35.78], ["music", 30.68], ["mains hum", 3.48]], [["music", 60.6], ["synthesizer", 8.64], ["speech", 6.23]], [["whack, thwack", 20.16], ["speech", 13.04], ["clang", 12.71]], [["speech", 19.9], ["music", 18.36], ["hum", 17.94]], [["music", 77.24], ["speech", 3.43], ["whale vocalization", 3.03]], [["music", 63.86], ["didgeridoo", 14.09], ["fart", 7.5]], null, null, null, null, null, [["music", 38.01], ["snicker", 12.32], ["speech", 9.38]], [["speech", 52.15], ["music", 14.36], ["vehicle", 6.57]], null, [["music", 40.66], ["speech", 17.0], ["sound effect", 8.15]], [["music", 33.22], ["boing", 25.63], ["synthesizer", 12.91]], [["music", 60.4], ["throbbing", 4.92], ["cacophony", 2.82]], [["speech", 46.63], ["music", 24.54], ["sound effect", 3.84]], [["speech", 52.33], ["music", 17.35], ["explosion", 4.49]]], "duration": [2.54, 3.29, 2.25, 2.51, 5.36, 3.63, 8.62, 0.38, 0.96, 0.5, 1.4, 1.13, 3.03, 2.45, 0.0, 16.7, 21.46, 17.81, 4.82, 6.57]} \ No newline at end of file diff --git a/annotations_1/lHqGIe8AZ1g_filtered.json b/annotations_1/lHqGIe8AZ1g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3457533b8fa0e504d29e96954ff577c50cdee492 --- /dev/null +++ b/annotations_1/lHqGIe8AZ1g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.4], [9.0, 9.76], [12.0, 12.65], [14.0, 14.64], [22.0, 22.06], [26.0, 25.78], [27.0, 28.0], [29.0, 30.18], [36.0, 37.59], [45.0, 46.45], [47.0, 48.71], [50.0, 51.12], [56.0, 57.28], [67.0, 68.69], [72.0, 71.64], [74.0, 76.3], [77.0, 77.08], [85.0, 86.54], [89.0, 88.97], [90.0, 91.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.07, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 0.76, 0.65, 0.64, 0.06, -0.22, 1.0, 1.18, 1.59, 1.45, 1.71, 1.12, 1.28, 1.69, -0.36, 2.3, 0.08, 1.54, -0.03, 1.79]} \ No newline at end of file diff --git a/annotations_1/lHxzWs9NcS0_filtered.json b/annotations_1/lHxzWs9NcS0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df7410f076f221d2f091ed63ea06eedb8147c97e --- /dev/null +++ b/annotations_1/lHxzWs9NcS0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 20.51], [21.0, 24.87], [31.0, 31.9], [35.0, 37.39], [47.0, 50.79], [57.0, 57.7], [62.0, 62.13], [75.0, 74.8], [83.0, 84.89], [87.0, 88.32], [89.0, 88.52], [89.0, 90.1], [96.0, 96.25], [107.0, 109.07], [122.0, 122.69], [127.0, 127.06], [129.0, 128.75], [131.0, 131.06], [137.0, 137.88], [139.0, 148.2], [149.0, 151.02], [156.0, 157.05]], "keep_status": [true, true, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [41.66, 42.88, 0.0, 33.75, 31.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.59, 0.0, 0.0, 0.0, 0.0, 0.0, 29.31, 29.63, 0.0], "audiomae_on_audioset": [[["sidetone", 19.22], ["noise", 16.32], ["speech", 13.5]], [["speech", 36.16], ["beatboxing", 22.28], ["music", 9.35]], null, [["speech", 75.54], ["music", 9.95], ["boing", 1.55]], [["bleat", 16.38], ["sheep", 15.38], ["music", 14.62]], null, null, null, null, null, null, null, null, [["speech", 49.79], ["music", 6.75], ["livestock, farm animals, working animals", 6.52]], null, null, null, null, null, [["music", 80.2], ["whack, thwack", 4.76], ["speech", 2.68]], [["music", 31.24], ["cattle, bovinae", 9.87], ["moo", 9.49]], null], "duration": [8.51, 3.87, 0.9, 2.39, 3.79, 0.7, 0.13, -0.2, 1.89, 1.32, -0.48, 1.1, 0.25, 2.07, 0.69, 0.06, -0.25, 0.06, 0.88, 9.2, 2.02, 1.05]} \ No newline at end of file diff --git a/annotations_1/lISiW7wcIVc_filtered.json b/annotations_1/lISiW7wcIVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d37f053f32c06e542ee35c4210ea20f08a5abd35 --- /dev/null +++ b/annotations_1/lISiW7wcIVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.66], [15.0, 17.29], [21.0, 26.06], [34.0, 34.82], [39.0, 39.38], [43.0, 45.25], [46.0, 46.89], [58.0, 59.16], [60.0, 60.47], [65.0, 67.83], [68.0, 68.28], [80.0, 88.64], [95.0, 102.86], [103.0, 102.95], [103.0, 104.14], [111.0, 111.7], [116.0, 116.14], [117.0, 123.47], [126.0, 139.99], [140.0, 145.94], [151.0, 162.99], [169.0, 169.45], [178.0, 181.95], [186.0, 189.3], [190.0, 190.93], [192.0, 193.63], [195.0, 205.7], [207.0, 207.44], [208.0, 207.94], [212.0, 218.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 74.44, 68.93, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 60.23, 0.0, 60.89, 39.0, 0.0, 0.0, 0.0, 0.0, 77.7, 46.83, 49.09, 39.28, 0.0, 36.22, 35.39, 0.0, 0.0, 56.48, 0.0, 0.0, 64.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.73], ["speech", 14.9], ["synthesizer", 9.77]], null, null, null, null, null, [["music", 51.19], ["speech", 13.2], ["mains hum", 9.44]], [["hum", 32.36], ["mains hum", 14.82], ["sidetone", 9.13]], [["mains hum", 45.75], ["hum", 28.22], ["fly, housefly", 2.86]], null, [["speech", 56.27], ["sidetone", 5.61], ["music", 3.31]], [["insect", 36.38], ["fly, housefly", 30.12], ["mosquito", 14.42]], null, null, null, null, null, null], "duration": [0.66, 2.29, 5.06, 0.82, 0.38, 2.25, 0.89, 1.16, 0.47, 2.83, 0.28, 8.64, 7.86, -0.05, 1.14, 0.7, 0.14, 6.47, 13.99, 5.94, 11.99, 0.45, 3.95, 3.3, 0.93, 1.63, 10.7, 0.44, -0.06, 6.47]} \ No newline at end of file diff --git a/annotations_1/lIbBAWzE6H8_filtered.json b/annotations_1/lIbBAWzE6H8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c01b1aa87e805a43e980ae77c694cf0d9249666 --- /dev/null +++ b/annotations_1/lIbBAWzE6H8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 71.24], [75.0, 75.29], [80.0, 86.16], [100.0, 100.48], [120.0, 122.49], [125.0, 124.83], [134.0, 134.01], [136.0, 136.66], [149.0, 148.83], [155.0, 155.92], [158.0, 180.27], [180.0, 189.97], [197.0, 203.23], [204.0, 204.96]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [30.73, 0.0, 31.27, 0.0, 29.84, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0, 28.93, 31.77, 0.0], "audiomae_on_audioset": [[["music", 72.98], ["throbbing", 3.16], ["musical instrument", 1.96]], null, [["speech", 37.52], ["music", 21.79], ["hum", 8.29]], null, [["music", 53.44], ["crack", 11.16], ["speech", 6.97]], null, null, null, null, null, [["throbbing", 40.9], ["music", 23.35], ["hum", 19.29]], [["music", 38.17], ["livestock, farm animals, working animals", 11.93], ["cattle, bovinae", 6.75]], [["livestock, farm animals, working animals", 47.72], ["cattle, bovinae", 32.51], ["moo", 19.4]], null], "duration": [24.24, 0.29, 6.16, 0.48, 2.49, -0.17, 0.01, 0.66, -0.17, 0.92, 22.27, 9.97, 6.23, 0.96]} \ No newline at end of file diff --git a/annotations_1/lIbKD5ovjok_filtered.json b/annotations_1/lIbKD5ovjok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b993e544e8de19f220e6a4e0f7f0578e1b51482f --- /dev/null +++ b/annotations_1/lIbKD5ovjok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.76], [10.0, 12.23], [13.0, 15.03], [16.0, 22.86], [24.0, 25.51], [26.0, 26.96], [28.0, 28.63], [29.0, 31.36], [32.0, 34.08], [35.0, 38.72], [39.0, 43.41], [44.0, 47.46], [49.0, 50.04], [52.0, 57.54], [60.0, 72.52], [75.0, 77.41], [79.0, 81.9], [86.0, 87.59], [88.0, 92.99], [94.0, 95.01], [95.0, 96.01], [97.0, 98.49], [100.0, 102.3], [104.0, 105.06], [105.0, 106.12], [108.0, 112.77], [114.0, 149.37], [152.0, 164.61], [166.0, 166.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [68.28, 52.51, 99.82, 84.8, 0.0, 0.0, 0.0, 74.44, 66.15, 99.44, 46.94, 61.87, 0.0, 94.81, 38.43, 59.07, 55.53, 0.0, 30.03, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 99.68, 0.0, 68.93, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 32.49], ["music", 9.56], ["hum", 8.84]], null, null, null, [["breaking", 46.51], ["speech", 36.26], ["crack", 4.58]], null, null, null, [["fart", 17.1], ["crushing", 16.16], ["crunch", 11.3]], null, null, null, null, null, null, null, null, null, null], "duration": [3.76, 2.23, 2.03, 6.86, 1.51, 0.96, 0.63, 2.36, 2.08, 3.72, 4.41, 3.46, 1.04, 5.54, 12.52, 2.41, 2.9, 1.59, 4.99, 1.01, 1.01, 1.49, 2.3, 1.06, 1.12, 4.77, 35.37, 12.61, 0.45]} \ No newline at end of file diff --git a/annotations_1/lJ7F2kWLGuE_filtered.json b/annotations_1/lJ7F2kWLGuE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1df98e9800131dec1792704ae53f6a527cb4f4f1 --- /dev/null +++ b/annotations_1/lJ7F2kWLGuE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [1.0, 1.21], [3.0, 2.91], [7.0, 7.99], [14.0, 15.16], [18.0, 21.52], [24.0, 24.44], [27.0, 27.65], [32.0, 33.44], [36.0, 36.37], [58.0, 64.91], [68.0, 69.13], [71.0, 72.08], [79.0, 81.19], [82.0, 83.78], [89.0, 89.82], [94.0, 94.1], [99.0, 100.47], [105.0, 107.91], [109.0, 110.29], [116.0, 117.95], [128.0, 130.49], [131.0, 132.51], [142.0, 143.83], [147.0, 146.82], [148.0, 148.9], [149.0, 151.55], [152.0, 163.14], [165.0, 166.53], [169.0, 171.76], [173.0, 188.01], [191.0, 191.34], [193.0, 198.1], [199.0, 199.72], [202.0, 205.14], [209.0, 211.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 37.85, 0.0, 0.0, 0.0, 0.0, 34.55, 0.0, 0.0, 32.3, 0.0, 0.0, 0.0, 0.0, 38.97, 0.0, 0.0, 36.95, 0.0, 0.0, 0.0, 0.0, 33.83, 28.67, 0.0, 32.56, 28.68, 0.0, 50.46, 0.0, 74.76, 36.59], "audiomae_on_audioset": [null, null, null, null, null, [["music", 61.8], ["synthesizer", 17.46], ["musical instrument", 2.25]], null, null, null, null, [["music", 60.66], ["synthesizer", 6.59], ["cacophony", 4.17]], null, null, [["music", 59.99], ["synthesizer", 14.03], ["cacophony", 2.83]], null, null, null, null, [["music", 76.31], ["synthesizer", 4.57], ["musical instrument", 2.7]], null, null, [["music", 40.27], ["speech", 34.79], ["liquid", 1.85]], null, null, null, null, [["speech", 33.99], ["music", 33.52], ["hum", 7.05]], [["music", 65.02], ["hum", 7.37], ["throbbing", 7.03]], null, [["music", 49.81], ["electronic music", 4.48], ["house music", 2.7]], [["music", 77.89], ["throbbing", 8.92], ["hum", 4.47]], null, null, null, null, [["insect", 26.52], ["fly, housefly", 23.37], ["bee, wasp, etc.", 15.11]]], "duration": [0.0, 0.21, -0.09, 0.99, 1.16, 3.52, 0.44, 0.65, 1.44, 0.37, 6.91, 1.13, 1.08, 2.19, 1.78, 0.82, 0.1, 1.47, 2.91, 1.29, 1.95, 2.49, 1.51, 1.83, -0.18, 0.9, 2.55, 11.14, 1.53, 2.76, 15.01, 0.34, 5.1, 0.72, 3.14, 2.22]} \ No newline at end of file diff --git a/annotations_1/lJf8EW9800o_filtered.json b/annotations_1/lJf8EW9800o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5552831fbbfc2f56927b1286c2ba7e556e471295 --- /dev/null +++ b/annotations_1/lJf8EW9800o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.79], [28.0, 39.23], [43.0, 47.97], [57.0, 71.59], [74.0, 80.4], [82.0, 112.55], [115.0, 115.74], [119.0, 118.71], [119.0, 120.9], [125.0, 129.64], [130.0, 137.44], [142.0, 149.88], [150.0, 154.21], [155.0, 158.5], [159.0, 161.23], [162.0, 162.63]], "keep_status": [true, true, true, true, true, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [29.97, 30.66, 29.52, 29.87, 29.11, 0.0, 0.0, 0.0, 0.0, 54.5, 40.4, 32.41, 61.27, 63.96, 46.09, 0.0], "audiomae_on_audioset": [[["music", 49.89], ["mains hum", 8.81], ["hum", 6.01]], [["music", 41.29], ["vehicle", 7.29], ["hum", 7.04]], [["speech", 40.55], ["vehicle", 23.46], ["car", 5.68]], [["vehicle", 33.56], ["car", 22.07], ["race car, auto racing", 14.02]], [["speech", 37.17], ["vehicle", 10.71], ["foghorn", 7.81]], null, null, null, null, null, [["music", 29.39], ["throbbing", 23.21], ["hum", 8.37]], [["music", 64.04], ["synthesizer", 14.03], ["musical instrument", 3.49]], null, null, [["music", 59.07], ["theremin", 7.11], ["singing bowl", 4.6]], null], "duration": [3.79, 11.23, 4.97, 14.59, 6.4, 30.55, 0.74, -0.29, 1.9, 4.64, 7.44, 7.88, 4.21, 3.5, 2.23, 0.63]} \ No newline at end of file diff --git a/annotations_1/lJjxm4xTVKk_filtered.json b/annotations_1/lJjxm4xTVKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbd09f4b2bf30ee0f11dd2e1f7523f5f3695e177 --- /dev/null +++ b/annotations_1/lJjxm4xTVKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.76], [4.0, 8.04], [9.0, 10.3], [13.0, 15.92], [17.0, 19.18], [24.0, 23.7], [25.0, 25.44], [28.0, 29.74], [32.0, 33.24], [35.0, 36.61], [45.0, 46.53], [48.0, 60.25], [61.0, 64.45], [65.0, 65.84], [66.0, 67.19], [68.0, 69.08], [72.0, 76.23], [77.0, 77.8], [84.0, 85.09], [86.0, 85.95], [88.0, 89.36], [90.0, 90.68], [98.0, 98.17], [99.0, 99.67], [103.0, 102.91], [104.0, 104.28], [105.0, 105.0], [108.0, 108.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.79, 0.0, 42.19, 48.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.4, 30.91, 0.0, 0.0, 0.0, 52.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.12], ["hum", 16.16], ["throbbing", 8.9]], null, [["music", 50.84], ["hum", 14.53], ["throbbing", 7.46]], [["hum", 35.78], ["music", 24.08], ["gong", 11.15]], null, null, null, null, null, null, [["speech", 43.23], ["music", 14.02], ["burst, pop", 9.33]], [["explosion", 18.2], ["music", 12.43], ["hum", 9.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, 4.04, 1.3, 2.92, 2.18, -0.3, 0.44, 1.74, 1.24, 1.61, 1.53, 12.25, 3.45, 0.84, 1.19, 1.08, 4.23, 0.8, 1.09, -0.05, 1.36, 0.68, 0.17, 0.67, -0.09, 0.28, 0.0, 0.63]} \ No newline at end of file diff --git a/annotations_1/lKBbFHMEvDc_filtered.json b/annotations_1/lKBbFHMEvDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92910403568e0c5a347b55a8cc2df572b5561299 --- /dev/null +++ b/annotations_1/lKBbFHMEvDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.97], [7.0, 7.53], [9.0, 9.44], [11.0, 11.91], [13.0, 15.04], [16.0, 29.05], [30.0, 30.92], [33.0, 33.94], [36.0, 37.03], [38.0, 38.33], [39.0, 40.24], [42.0, 42.13], [43.0, 43.48], [44.0, 46.13], [49.0, 54.01], [55.0, 56.54], [57.0, 57.25], [58.0, 58.87], [59.0, 60.22], [61.0, 61.45], [62.0, 64.99], [66.0, 66.09], [67.0, 68.05], [68.0, 69.52], [71.0, 71.86], [73.0, 73.23], [75.0, 76.2], [80.0, 80.76], [83.0, 83.42], [86.0, 87.07], [88.0, 88.38], [89.0, 89.82], [92.0, 92.26], [100.0, 99.79], [102.0, 102.52], [104.0, 104.79], [109.0, 109.73], [112.0, 112.18], [116.0, 117.15], [119.0, 119.89], [121.0, 121.78], [123.0, 125.05], [127.0, 127.2], [129.0, 129.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.64, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.7, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.25, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 58.15], ["sidetone", 9.87], ["dial tone", 5.39]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.93], ["speech", 20.39], ["didgeridoo", 8.48]], null, null], "duration": [0.97, 0.53, 0.44, 0.91, 2.04, 13.05, 0.92, 0.94, 1.03, 0.33, 1.24, 0.13, 0.48, 2.13, 5.01, 1.54, 0.25, 0.87, 1.22, 0.45, 2.99, 0.09, 1.05, 1.52, 0.86, 0.23, 1.2, 0.76, 0.42, 1.07, 0.38, 0.82, 0.26, -0.21, 0.52, 0.79, 0.73, 0.18, 1.15, 0.89, 0.78, 2.05, 0.2, 0.78]} \ No newline at end of file diff --git a/annotations_1/lKStI-3GHDc_filtered.json b/annotations_1/lKStI-3GHDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4091a82bce9b7b518bac37989e3e1236d4392d5 --- /dev/null +++ b/annotations_1/lKStI-3GHDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.99], [9.0, 10.77], [12.0, 16.28], [19.0, 19.33], [25.0, 25.17], [25.0, 29.39], [34.0, 50.87], [55.0, 61.53], [67.0, 67.22], [68.0, 68.34], [70.0, 74.92], [79.0, 86.83], [87.0, 97.85], [104.0, 120.12], [122.0, 124.12]], "keep_status": [false, false, true, false, false, true, false, false, false, false, true, true, true, true, true], "silence_prob": [0.0, 0.0, 30.48, 0.0, 0.0, 29.56, 30.05, 30.03, 0.0, 0.0, 30.52, 29.88, 30.19, 30.34, 29.48], "audiomae_on_audioset": [null, null, [["music", 51.15], ["breaking", 5.47], ["noise", 3.27]], null, null, [["music", 30.41], ["throbbing", 28.9], ["hum", 5.75]], [["music", 51.91], ["throbbing", 17.71], ["hum", 3.71]], [["music", 43.9], ["speech", 20.96], ["throbbing", 11.48]], null, null, [["music", 22.79], ["speech", 19.01], ["fly, housefly", 10.14]], [["music", 37.99], ["cattle, bovinae", 9.1], ["speech", 5.43]], [["throbbing", 22.73], ["music", 14.78], ["hum", 13.85]], [["music", 12.25], ["speech", 11.9], ["hum", 11.21]], [["music", 27.76], ["speech", 7.77], ["electronic music", 6.5]]], "duration": [0.99, 1.77, 4.28, 0.33, 0.17, 4.39, 16.87, 6.53, 0.22, 0.34, 4.92, 7.83, 10.85, 16.12, 2.12]} \ No newline at end of file diff --git a/annotations_1/lKh7qSp6zIc_filtered.json b/annotations_1/lKh7qSp6zIc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2320cef9398ea52abca079cbb500148709bd274a --- /dev/null +++ b/annotations_1/lKh7qSp6zIc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.62], [15.0, 15.11], [17.0, 17.63], [19.0, 18.86], [23.0, 22.81], [25.0, 27.55], [31.0, 32.71], [35.0, 35.7], [42.0, 42.21], [43.0, 43.92], [45.0, 45.6], [46.0, 47.33], [51.0, 51.83], [53.0, 53.7], [57.0, 57.33], [59.0, 59.22], [62.0, 66.75], [68.0, 68.72], [71.0, 74.93], [76.0, 79.89], [84.0, 85.16], [95.0, 96.87]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.59, 0.0, 34.31, 58.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["explosion", 41.97], ["eruption", 13.05], ["burst, pop", 8.96]], null, null, null, null, null, null, null, null, null, null, [["effects unit", 18.09], ["noise", 15.11], ["synthesizer", 11.03]], null, [["explosion", 22.75], ["burst, pop", 18.67], ["gunshot, gunfire", 13.9]], null, null, null], "duration": [0.62, 0.11, 0.63, -0.14, -0.19, 2.55, 1.71, 0.7, 0.21, 0.92, 0.6, 1.33, 0.83, 0.7, 0.33, 0.22, 4.75, 0.72, 3.93, 3.89, 1.16, 1.87]} \ No newline at end of file diff --git a/annotations_1/lKqBsgfSSU8_filtered.json b/annotations_1/lKqBsgfSSU8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbb691fe0507a25b221686c5a6d6c19842bc22c9 --- /dev/null +++ b/annotations_1/lKqBsgfSSU8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.12], [11.0, 13.73], [17.0, 17.74], [22.0, 23.65], [27.0, 32.56], [36.0, 37.18], [38.0, 39.45], [40.0, 42.18], [42.0, 45.15], [47.0, 56.08], [58.0, 62.85], [64.0, 77.65], [81.0, 82.39], [86.0, 88.74], [92.0, 96.75], [97.0, 102.63], [105.0, 108.19], [110.0, 111.13], [112.0, 113.63], [118.0, 122.69], [124.0, 130.33], [132.0, 137.27], [139.0, 141.0], [143.0, 148.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [99.87, 41.12, 0.0, 0.0, 94.37, 0.0, 0.0, 73.82, 50.86, 99.99, 62.17, 66.51, 0.0, 99.98, 89.54, 61.37, 87.74, 0.0, 0.0, 88.46, 63.96, 66.03, 70.02, 36.47], "audiomae_on_audioset": [null, [["sine wave", 45.11], ["speech", 21.99], ["dial tone", 14.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.0], ["singing bowl", 25.96], ["hum", 6.57]]], "duration": [7.12, 2.73, 0.74, 1.65, 5.56, 1.18, 1.45, 2.18, 3.15, 9.08, 4.85, 13.65, 1.39, 2.74, 4.75, 5.63, 3.19, 1.13, 1.63, 4.69, 6.33, 5.27, 2.0, 5.44]} \ No newline at end of file diff --git a/annotations_1/lLItY-Oyvt0_filtered.json b/annotations_1/lLItY-Oyvt0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..39c906b201ac1bc3eb3175d48d08652230059cff --- /dev/null +++ b/annotations_1/lLItY-Oyvt0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.7], [12.0, 12.7], [14.0, 16.53], [20.0, 30.57], [32.0, 42.13], [43.0, 44.78], [46.0, 67.95], [69.0, 94.04], [96.0, 103.45], [104.0, 103.94], [104.0, 104.45], [108.0, 129.36], [130.0, 143.63], [146.0, 150.79], [152.0, 152.17], [153.0, 153.86], [155.0, 157.11], [158.0, 167.34], [171.0, 172.0], [174.0, 190.43], [198.0, 201.43], [202.0, 201.53], [202.0, 201.58], [202.0, 201.63], [202.0, 201.75], [202.0, 204.3]], "keep_status": [false, false, true, true, true, false, true, true, true, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.75, 28.56, 29.53, 0.0, 30.38, 30.4, 30.29, 0.0, 0.0, 28.83, 29.17, 31.07, 0.0, 0.0, 33.83, 29.64, 0.0, 33.01, 32.83, 0.0, 0.0, 0.0, 0.0, 30.34], "audiomae_on_audioset": [null, null, [["rumble", 19.53], ["hum", 18.0], ["mains hum", 12.79]], [["buzz", 27.86], ["music", 12.68], ["vehicle", 11.43]], [["music", 28.05], ["buzz", 15.05], ["hum", 10.2]], null, [["music", 41.07], ["whack, thwack", 13.87], ["speech", 10.92]], [["music", 52.64], ["speech", 7.88], ["didgeridoo", 5.65]], [["music", 30.24], ["mains hum", 23.14], ["fly, housefly", 9.01]], null, null, [["music", 62.73], ["didgeridoo", 7.26], ["mains hum", 5.43]], [["music", 34.44], ["mains hum", 9.88], ["buzz", 7.82]], [["music", 15.8], ["speech", 15.1], ["didgeridoo", 11.91]], null, null, [["music", 72.51], ["speech", 7.2], ["hum", 1.76]], [["music", 32.84], ["buzz", 22.48], ["hum", 13.54]], null, [["music", 38.59], ["speech", 23.34], ["scary music", 11.99]], [["speech", 53.17], ["music", 16.7], ["foghorn", 3.71]], null, null, null, null, [["music", 53.52], ["theremin", 16.3], ["thunk", 9.87]]], "duration": [1.7, 0.7, 2.53, 10.57, 10.13, 1.78, 21.95, 25.04, 7.45, -0.06, 0.45, 21.36, 13.63, 4.79, 0.17, 0.86, 2.11, 9.34, 1.0, 16.43, 3.43, -0.47, -0.42, -0.37, -0.25, 2.3]} \ No newline at end of file diff --git a/annotations_1/lLbWBsRVUAU_filtered.json b/annotations_1/lLbWBsRVUAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6baa86d373e0698e6070e4c235ab2b3c6045ecaa --- /dev/null +++ b/annotations_1/lLbWBsRVUAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.67], [8.0, 9.12], [11.0, 11.25], [13.0, 19.52], [21.0, 24.11], [25.0, 26.35], [34.0, 36.02], [37.0, 37.54], [43.0, 43.71], [45.0, 45.08], [56.0, 56.49], [60.0, 60.4], [62.0, 62.24], [65.0, 65.11], [74.0, 74.83], [77.0, 77.58], [80.0, 80.54], [89.0, 89.38], [92.0, 92.3], [94.0, 94.14], [103.0, 103.91], [105.0, 105.65], [108.0, 108.43], [125.0, 124.8], [127.0, 127.21], [130.0, 131.65], [134.0, 135.01], [135.0, 135.99], [136.0, 145.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 53.22, 64.29, 0.0, 81.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.6], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.67, 1.12, 0.25, 6.52, 3.11, 1.35, 2.02, 0.54, 0.71, 0.08, 0.49, 0.4, 0.24, 0.11, 0.83, 0.58, 0.54, 0.38, 0.3, 0.14, 0.91, 0.65, 0.43, -0.2, 0.21, 1.65, 1.01, 0.99, 9.07]} \ No newline at end of file diff --git a/annotations_1/lLeY8-bhEuQ_filtered.json b/annotations_1/lLeY8-bhEuQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b98846df6e46877346c0c3241858b722087b2d3b --- /dev/null +++ b/annotations_1/lLeY8-bhEuQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 60.59], [62.0, 77.94]], "keep_status": [false, true], "silence_prob": [30.45, 29.75], "audiomae_on_audioset": [[["music", 41.32], ["hum", 24.57], ["mains hum", 12.34]], [["music", 44.43], ["livestock, farm animals, working animals", 10.96], ["whale vocalization", 5.23]]], "duration": [28.59, 15.94]} \ No newline at end of file diff --git a/annotations_1/lLgOrvsA9tw_filtered.json b/annotations_1/lLgOrvsA9tw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a0da1e033c78f0d5c7716ba1410ec700ee8127f --- /dev/null +++ b/annotations_1/lLgOrvsA9tw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.62], [31.0, 32.64], [48.0, 51.33], [57.0, 59.43], [78.0, 80.37], [112.0, 112.67]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 31.31, 35.15, 32.58, 0.0], "audiomae_on_audioset": [null, null, [["music", 71.5], ["didgeridoo", 16.66], ["musical instrument", 2.84]], [["music", 37.99], ["timpani", 11.07], ["musical instrument", 6.93]], [["music", 50.63], ["didgeridoo", 13.74], ["musical instrument", 7.09]], null], "duration": [1.62, 1.64, 3.33, 2.43, 2.37, 0.67]} \ No newline at end of file diff --git a/annotations_1/lMA48vIxajE_filtered.json b/annotations_1/lMA48vIxajE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23f6be0b61332a0b805815df49bfa8fd9a8c560d --- /dev/null +++ b/annotations_1/lMA48vIxajE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.45], [9.0, 9.86], [28.0, 27.78], [30.0, 30.03], [35.0, 34.64], [47.0, 48.25], [53.0, 52.91], [58.0, 58.36], [59.0, 60.74], [62.0, 63.1], [65.0, 67.51], [69.0, 69.85], [78.0, 77.62], [79.0, 85.78], [88.0, 88.59], [93.0, 93.72], [95.0, 95.15], [98.0, 98.31], [101.0, 101.7], [105.0, 105.27], [106.0, 106.66], [113.0, 113.53], [116.0, 116.28], [119.0, 118.88], [121.0, 121.37], [130.0, 130.44], [132.0, 132.68], [134.0, 137.47], [138.0, 138.47], [141.0, 144.34], [146.0, 145.94], [147.0, 147.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 97.22, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.45, 0.86, -0.22, 0.03, -0.36, 1.25, -0.09, 0.36, 1.74, 1.1, 2.51, 0.85, -0.38, 6.78, 0.59, 0.72, 0.15, 0.31, 0.7, 0.27, 0.66, 0.53, 0.28, -0.12, 0.37, 0.44, 0.68, 3.47, 0.47, 3.34, -0.06, 0.48]} \ No newline at end of file diff --git a/annotations_1/lMXVWQCa_MY_filtered.json b/annotations_1/lMXVWQCa_MY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4266f95291d1113d6b8ee100f0bb5bc40af74ae1 --- /dev/null +++ b/annotations_1/lMXVWQCa_MY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 15.13], [19.0, 26.2], [26.0, 26.23], [28.0, 29.62], [30.0, 31.16], [33.0, 45.33], [46.0, 62.11], [62.0, 64.81], [65.0, 69.69], [72.0, 73.84], [76.0, 77.92], [82.0, 81.94], [82.0, 83.96], [85.0, 86.95], [110.0, 111.79], [113.0, 114.12], [116.0, 116.11], [117.0, 117.21], [118.0, 118.59], [119.0, 119.55], [120.0, 120.16], [121.0, 123.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [62.47, 52.27, 0.0, 0.0, 0.0, 86.09, 79.07, 49.78, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.5], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 49.2], ["mains hum", 29.23], ["speech", 6.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.12], ["radio", 11.8], ["hum", 10.87]]], "duration": [10.13, 7.2, 0.23, 1.62, 1.16, 12.33, 16.11, 2.81, 4.69, 1.84, 1.92, -0.06, 1.96, 1.95, 1.79, 1.12, 0.11, 0.21, 0.59, 0.55, 0.16, 2.28]} \ No newline at end of file diff --git a/annotations_1/lMiVewLfZKI_filtered.json b/annotations_1/lMiVewLfZKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cecff14033eb65dc8135b3a8e1e9cfe673afd832 --- /dev/null +++ b/annotations_1/lMiVewLfZKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.39], [11.0, 11.37], [14.0, 25.46], [26.0, 26.47], [30.0, 30.54], [31.0, 158.09]], "keep_status": [false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["mains hum", 23.08], ["hum", 23.03], ["electric shaver, electric razor", 12.27]], null, null, null], "duration": [1.39, 0.37, 11.46, 0.47, 0.54, 127.09]} \ No newline at end of file diff --git a/annotations_1/lMmTZ7oTDRI_filtered.json b/annotations_1/lMmTZ7oTDRI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed5676440c0772efd4b07dcce050d2c3ebf8826e --- /dev/null +++ b/annotations_1/lMmTZ7oTDRI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.82], [11.0, 32.49], [34.0, 37.94], [40.0, 40.71], [43.0, 47.07], [50.0, 51.53], [52.0, 55.53], [56.0, 58.26], [60.0, 67.76], [68.0, 72.67], [74.0, 76.1]], "keep_status": [false, true, true, false, true, false, false, true, true, false, false], "silence_prob": [0.0, 35.71, 46.33, 0.0, 40.59, 0.0, 49.0, 43.85, 42.6, 50.41, 61.27], "audiomae_on_audioset": [null, [["speech", 27.19], ["siren", 17.7], ["emergency vehicle", 14.57]], [["speech", 27.49], ["vehicle", 14.72], ["hum", 7.9]], null, [["mains hum", 21.14], ["hum", 20.6], ["vehicle", 6.47]], null, [["hum", 52.14], ["mains hum", 21.08], ["throbbing", 10.16]], [["hum", 18.47], ["music", 15.58], ["throbbing", 10.71]], [["hum", 28.39], ["speech", 19.34], ["music", 10.3]], null, null], "duration": [1.82, 21.49, 3.94, 0.71, 4.07, 1.53, 3.53, 2.26, 7.76, 4.67, 2.1]} \ No newline at end of file diff --git a/annotations_1/lMtWWls4oas_filtered.json b/annotations_1/lMtWWls4oas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d759de0d200e02a9fe92651f85bc58918801db1b --- /dev/null +++ b/annotations_1/lMtWWls4oas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.25], [3.0, 4.4], [6.0, 6.88], [7.0, 7.94], [20.0, 21.61], [25.0, 25.22], [28.0, 28.98], [32.0, 32.36], [34.0, 35.63], [39.0, 39.28], [42.0, 62.36], [65.0, 86.97], [88.0, 88.79], [92.0, 104.65], [106.0, 107.28], [109.0, 109.19], [115.0, 115.55], [116.0, 116.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.03, 31.82, 0.0, 33.27, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["hum", 43.9], ["music", 34.22], ["throbbing", 7.26]], [["music", 37.16], ["speech", 33.01], ["foghorn", 4.24]], null, [["music", 59.89], ["hum", 11.82], ["mains hum", 7.74]], null, null, null, null], "duration": [0.25, 1.4, 0.88, 0.94, 1.61, 0.22, 0.98, 0.36, 1.63, 0.28, 20.36, 21.97, 0.79, 12.65, 1.28, 0.19, 0.55, 0.78]} \ No newline at end of file diff --git a/annotations_1/lNFbbWOM5FU_filtered.json b/annotations_1/lNFbbWOM5FU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6f454d902adf86650480ec3120cff697cc4ac83 --- /dev/null +++ b/annotations_1/lNFbbWOM5FU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 22.69], [24.0, 31.75], [34.0, 73.82], [74.0, 124.88], [132.0, 132.04], [138.0, 140.48], [141.0, 141.71], [146.0, 146.31], [156.0, 185.84]], "keep_status": [true, false, false, false, false, true, false, false, false], "silence_prob": [38.94, 37.08, 0.0, 0.0, 0.0, 34.04, 0.0, 0.0, 37.74], "audiomae_on_audioset": [[["music", 54.98], ["musical instrument", 6.87], ["vibraphone", 5.26]], [["music", 79.79], ["musical instrument", 6.44], ["synthesizer", 3.15]], null, null, null, [["music", 55.32], ["musical instrument", 7.42], ["theremin", 7.23]], null, null, [["music", 55.11], ["musical instrument", 9.68], ["brass instrument", 9.43]]], "duration": [13.69, 7.75, 39.82, 50.88, 0.04, 2.48, 0.71, 0.31, 29.84]} \ No newline at end of file diff --git a/annotations_1/lNVb-ZNIO-A_filtered.json b/annotations_1/lNVb-ZNIO-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..483b74a6b1662aea32e0aa1b154600a8ad9ee957 --- /dev/null +++ b/annotations_1/lNVb-ZNIO-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 76.42], [77.0, 77.5], [78.0, 79.84], [81.0, 93.8], [97.0, 107.92], [111.0, 111.45], [118.0, 118.15], [119.0, 119.31], [120.0, 133.66], [135.0, 135.6], [137.0, 138.91], [140.0, 141.62], [142.0, 145.69], [147.0, 148.73], [150.0, 150.5], [156.0, 155.95], [161.0, 162.03], [165.0, 169.69], [172.0, 174.65], [176.0, 178.06], [178.0, 186.0], [186.0, 186.19]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 47.82, 33.97, 0.0, 0.0, 0.0, 31.74, 0.0, 0.0, 0.0, 49.59, 0.0, 0.0, 0.0, 0.0, 38.59, 83.7, 67.76, 30.21, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 48.99], ["fart", 10.05], ["synthesizer", 4.58]], [["music", 30.45], ["speech", 22.84], ["throbbing", 10.04]], null, null, null, [["music", 32.69], ["hum", 22.43], ["throbbing", 18.35]], null, null, null, [["insect", 29.35], ["music", 15.33], ["fly, housefly", 8.45]], null, null, null, null, [["livestock, farm animals, working animals", 13.16], ["moo", 11.8], ["fly, housefly", 11.51]], null, null, [["whale vocalization", 23.94], ["livestock, farm animals, working animals", 18.95], ["speech", 14.03]], null], "duration": [60.42, 0.5, 1.84, 12.8, 10.92, 0.45, 0.15, 0.31, 13.66, 0.6, 1.91, 1.62, 3.69, 1.73, 0.5, -0.05, 1.03, 4.69, 2.65, 2.06, 8.0, 0.19]} \ No newline at end of file diff --git a/annotations_1/lP-A8UaVbLE_filtered.json b/annotations_1/lP-A8UaVbLE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..076e7aed57ba93abb208967bb855a2d9080368b3 --- /dev/null +++ b/annotations_1/lP-A8UaVbLE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.69], [9.0, 9.14], [10.0, 11.1], [12.0, 14.2], [16.0, 18.64], [20.0, 20.7], [21.0, 39.28], [46.0, 55.51], [59.0, 65.04], [67.0, 70.82], [71.0, 76.05], [79.0, 79.19], [83.0, 98.46], [105.0, 107.15], [114.0, 116.51], [118.0, 119.4], [123.0, 128.34], [130.0, 146.57], [149.0, 149.74], [150.0, 152.09], [158.0, 161.05], [163.0, 167.48], [173.0, 175.0]], "keep_status": [false, false, false, true, true, false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 41.76, 41.64, 0.0, 29.62, 29.61, 45.4, 64.63, 55.11, 0.0, 38.58, 73.06, 75.07, 0.0, 85.17, 36.68, 0.0, 80.82, 87.74, 77.2, 55.46], "audiomae_on_audioset": [null, null, null, [["speech", 23.51], ["music", 14.15], ["pulse", 6.42]], [["hum", 33.2], ["rumble", 8.64], ["sonar", 8.55]], null, [["mains hum", 52.94], ["hum", 24.12], ["music", 4.66]], [["speech", 69.8], ["explosion", 6.54], ["music", 6.37]], [["sine wave", 18.53], ["chirp tone", 17.27], ["tuning fork", 8.97]], null, null, null, [["music", 20.65], ["throbbing", 19.78], ["hum", 14.96]], null, null, null, null, [["static", 14.44], ["white noise", 12.67], ["hum", 10.44]], null, null, null, null, null], "duration": [1.69, 0.14, 1.1, 2.2, 2.64, 0.7, 18.28, 9.51, 6.04, 3.82, 5.05, 0.19, 15.46, 2.15, 2.51, 1.4, 5.34, 16.57, 0.74, 2.09, 3.05, 4.48, 2.0]} \ No newline at end of file diff --git a/annotations_1/lP8EYYjPEmc_filtered.json b/annotations_1/lP8EYYjPEmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae868302132c56f527f7d998b495f417339f18bd --- /dev/null +++ b/annotations_1/lP8EYYjPEmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 31.48], [33.0, 34.72], [35.0, 37.39], [43.0, 43.34], [44.0, 45.93], [47.0, 48.29], [50.0, 58.48], [59.0, 60.34], [61.0, 61.69], [62.0, 63.59], [81.0, 81.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 1.72, 2.39, 0.34, 1.93, 1.29, 8.48, 1.34, 0.69, 1.59, 0.57]} \ No newline at end of file diff --git a/annotations_1/lPB6exj8Kgo_filtered.json b/annotations_1/lPB6exj8Kgo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0aa201f3746c06c17e1fc08f0e9c925eb7f03825 --- /dev/null +++ b/annotations_1/lPB6exj8Kgo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[58.0, 76.94], [78.0, 175.56]], "keep_status": [true, false], "silence_prob": [41.93, 0.0], "audiomae_on_audioset": [[["animal", 38.49], ["music", 21.66], ["speech", 6.93]], null], "duration": [18.94, 97.56]} \ No newline at end of file diff --git a/annotations_1/lPOo7SzR7Sc_filtered.json b/annotations_1/lPOo7SzR7Sc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b741aa8c58bae2afd949325fd40c5b5636141a59 --- /dev/null +++ b/annotations_1/lPOo7SzR7Sc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.03], [13.0, 13.59], [14.0, 16.5], [22.0, 41.45], [43.0, 46.55], [49.0, 49.69], [50.0, 49.81], [50.0, 53.91], [55.0, 54.94], [55.0, 59.14], [62.0, 64.03], [69.0, 69.74], [71.0, 73.18], [82.0, 84.67], [85.0, 132.36], [133.0, 143.8], [144.0, 145.1], [146.0, 149.45]], "keep_status": [false, false, true, false, false, false, false, true, false, false, true, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 45.62, 38.06, 35.37, 0.0, 0.0, 32.83, 0.0, 28.92, 39.27, 0.0, 39.74, 45.36, 0.0, 29.74, 0.0, 50.46], "audiomae_on_audioset": [null, null, [["speech", 26.26], ["music", 20.21], ["hum", 16.81]], [["music", 37.73], ["hum", 25.61], ["throbbing", 14.8]], [["music", 35.2], ["burping, eructation", 32.43], ["grunt", 7.02]], null, null, [["music", 30.45], ["didgeridoo", 15.23], ["throbbing", 9.46]], null, [["speech", 52.31], ["music", 34.08], ["electric shaver, electric razor", 2.81]], [["croak", 25.18], ["frog", 18.02], ["music", 12.86]], null, [["didgeridoo", 22.66], ["music", 21.7], ["hum", 12.45]], [["music", 59.62], ["hum", 6.35], ["musical instrument", 4.77]], null, [["music", 20.56], ["sound effect", 8.33], ["explosion", 5.74]], null, null], "duration": [0.03, 0.59, 2.5, 19.45, 3.55, 0.69, -0.19, 3.91, -0.06, 4.14, 2.03, 0.74, 2.18, 2.67, 47.36, 10.8, 1.1, 3.45]} \ No newline at end of file diff --git a/annotations_1/lPrJqB8ljAE_filtered.json b/annotations_1/lPrJqB8ljAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56e42eed0f02a09636ade558223461841801526f --- /dev/null +++ b/annotations_1/lPrJqB8ljAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.65], [24.0, 26.3], [28.0, 29.71], [32.0, 56.42], [58.0, 79.86], [81.0, 97.56], [98.0, 98.41], [98.0, 98.51], [99.0, 99.55], [101.0, 103.18], [104.0, 104.53], [107.0, 108.89], [110.0, 110.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.58, 37.53, 0.0, 29.76, 29.97, 31.2, 0.0, 0.0, 0.0, 50.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 41.57], ["music", 17.2], ["throbbing", 14.82]], [["hum", 43.84], ["throbbing", 34.28], ["mains hum", 12.94]], null, [["music", 68.57], ["throbbing", 13.76], ["hum", 8.17]], [["hum", 29.01], ["mains hum", 28.48], ["music", 17.81]], [["music", 53.55], ["speech", 19.8], ["sidetone", 4.4]], null, null, null, null, null, null, null], "duration": [2.65, 2.3, 1.71, 24.42, 21.86, 16.56, 0.41, 0.51, 0.55, 2.18, 0.53, 1.89, 0.98]} \ No newline at end of file diff --git a/annotations_1/lQhQeus0ItY_filtered.json b/annotations_1/lQhQeus0ItY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..846217812d3fe1ca31dea12af69b788b9c2fcfb1 --- /dev/null +++ b/annotations_1/lQhQeus0ItY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.99], [5.0, 4.99], [6.0, 6.07], [7.0, 7.26], [10.0, 10.45], [11.0, 18.5], [19.0, 19.52], [21.0, 21.68], [25.0, 25.68], [27.0, 27.31], [30.0, 31.13], [35.0, 35.48], [37.0, 37.94], [38.0, 39.82], [44.0, 45.15], [45.0, 47.22], [52.0, 57.97], [58.0, 58.72], [62.0, 62.19], [65.0, 66.23], [67.0, 68.44], [70.0, 71.66], [72.0, 72.54], [74.0, 75.1], [78.0, 81.13], [83.0, 84.43], [86.0, 85.95], [86.0, 86.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 46.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.72, 38.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 74.34], ["fart", 5.47], ["beatboxing", 1.96]], null, null, null, null, null, null, null, null, null, [["speech", 83.12], ["dial tone", 5.48], ["busy signal", 3.38]], [["speech", 34.69], ["sidetone", 28.33], ["whale vocalization", 8.18]], null, null, null, null, null, null, null, [["speech", 28.08], ["grunt", 12.07], ["groan", 7.83]], null, null, null], "duration": [0.99, -0.01, 0.07, 0.26, 0.45, 7.5, 0.52, 0.68, 0.68, 0.31, 1.13, 0.48, 0.94, 1.82, 1.15, 2.22, 5.97, 0.72, 0.19, 1.23, 1.44, 1.66, 0.54, 1.1, 3.13, 1.43, -0.05, 0.34]} \ No newline at end of file diff --git a/annotations_1/lQr3va8emXg_filtered.json b/annotations_1/lQr3va8emXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b07720bd99df4593484210373115c6bccd7dcdcf --- /dev/null +++ b/annotations_1/lQr3va8emXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[86.0, 130.44], [134.0, 136.95], [139.0, 205.9], [207.0, 207.52]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 30.05, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 42.11], ["throbbing", 8.65], ["hum", 7.21]], null, null], "duration": [44.44, 2.95, 66.9, 0.52]} \ No newline at end of file diff --git a/annotations_1/lR8KTwcC8fc_filtered.json b/annotations_1/lR8KTwcC8fc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10fb1751d309537ea6bf399ef9acdb6d283bc9a8 --- /dev/null +++ b/annotations_1/lR8KTwcC8fc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.64], [9.0, 9.86], [13.0, 13.81], [19.0, 19.28], [23.0, 24.04], [28.0, 28.83], [29.0, 30.65], [32.0, 32.46], [34.0, 34.8], [41.0, 41.62], [42.0, 43.01], [51.0, 51.38], [52.0, 52.95], [62.0, 62.75], [65.0, 64.94], [68.0, 69.58], [72.0, 78.56], [79.0, 92.7], [94.0, 97.29], [104.0, 106.08], [108.0, 108.41], [109.0, 110.52], [112.0, 112.48], [114.0, 114.27], [117.0, 117.09], [118.0, 126.0], [127.0, 132.81], [138.0, 140.17], [143.0, 143.75], [147.0, 149.94], [155.0, 156.32], [161.0, 162.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.2, 39.94, 43.15, 54.1, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 75.39, 84.07, 0.0, 71.87, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 36.96], ["burst, pop", 17.38], ["explosion", 15.32]], [["telephone dialing, dtmf", 46.55], ["busy signal", 11.47], ["beep, bleep", 8.24]], [["music", 45.73], ["speech", 9.11], ["musical instrument", 1.99]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.86, 0.81, 0.28, 1.04, 0.83, 1.65, 0.46, 0.8, 0.62, 1.01, 0.38, 0.95, 0.75, -0.06, 1.58, 6.56, 13.7, 3.29, 2.08, 0.41, 1.52, 0.48, 0.27, 0.09, 8.0, 5.81, 2.17, 0.75, 2.94, 1.32, 1.14]} \ No newline at end of file diff --git a/annotations_1/lRlgx_GFwyI_filtered.json b/annotations_1/lRlgx_GFwyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/lRlgx_GFwyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/lRpBlNgu8j4_filtered.json b/annotations_1/lRpBlNgu8j4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbb545f65e0d5759b78caedf5c16212da749abb1 --- /dev/null +++ b/annotations_1/lRpBlNgu8j4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.64], [28.0, 28.38], [31.0, 32.05], [35.0, 35.34], [41.0, 42.21], [56.0, 68.1], [69.0, 69.67], [72.0, 73.41], [76.0, 75.69], [77.0, 78.31], [83.0, 82.86], [87.0, 87.67], [92.0, 92.38], [96.0, 96.85], [101.0, 102.15], [108.0, 109.27], [110.0, 110.81], [113.0, 114.27], [119.0, 119.84], [121.0, 122.08], [127.0, 127.77], [129.0, 130.11], [131.0, 166.43], [167.0, 167.68], [168.0, 179.78]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 44.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.45], "audiomae_on_audioset": [null, null, null, null, null, [["music", 33.15], ["musical instrument", 9.12], ["speech", 7.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.84], ["applause", 11.94], ["crowd", 11.12]]], "duration": [0.64, 0.38, 1.05, 0.34, 1.21, 12.1, 0.67, 1.41, -0.31, 1.31, -0.14, 0.67, 0.38, 0.85, 1.15, 1.27, 0.81, 1.27, 0.84, 1.08, 0.77, 1.11, 35.43, 0.68, 11.78]} \ No newline at end of file diff --git a/annotations_1/lS9V0oDrPfs_filtered.json b/annotations_1/lS9V0oDrPfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/lS9V0oDrPfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/lUglQukweZY_filtered.json b/annotations_1/lUglQukweZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..520220ff88f2e8337f93952badac2da2108f319f --- /dev/null +++ b/annotations_1/lUglQukweZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.54], [36.0, 38.31], [77.0, 77.63], [82.0, 83.67], [89.0, 89.72], [99.0, 112.94], [119.0, 119.08], [145.0, 146.58], [155.0, 155.93], [162.0, 162.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 70.02, 0.0, 0.0, 0.0, 37.42, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 80.32], ["reggae", 2.53], ["funk", 1.63]], null, null, null, null], "duration": [0.54, 2.31, 0.63, 1.67, 0.72, 13.94, 0.08, 1.58, 0.93, 0.06]} \ No newline at end of file diff --git a/annotations_1/lV2XAU1JzuI_filtered.json b/annotations_1/lV2XAU1JzuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ea7f32a6a230266fe5bc841d92a8d2bc25bff6d --- /dev/null +++ b/annotations_1/lV2XAU1JzuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.72], [21.0, 22.1], [27.0, 27.14], [35.0, 55.54], [59.0, 59.73], [62.0, 62.38], [64.0, 66.82], [70.0, 73.5], [74.0, 74.61], [75.0, 75.37], [75.0, 75.51], [78.0, 78.53], [81.0, 82.0], [84.0, 86.04], [87.0, 89.56]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 32.5, 0.0, 0.0, 35.26, 32.38, 0.0, 0.0, 0.0, 0.0, 0.0, 37.93, 31.31], "audiomae_on_audioset": [null, null, null, [["music", 30.92], ["trombone", 25.29], ["brass instrument", 24.18]], null, null, [["music", 29.7], ["saxophone", 9.94], ["speech", 7.46]], [["cattle, bovinae", 53.33], ["moo", 36.93], ["livestock, farm animals, working animals", 9.36]], null, null, null, null, null, [["music", 46.73], ["theremin", 4.96], ["hum", 4.77]], [["mantra", 39.25], ["music", 18.2], ["chant", 12.05]]], "duration": [0.72, 1.1, 0.14, 20.54, 0.73, 0.38, 2.82, 3.5, 0.61, 0.37, 0.51, 0.53, 1.0, 2.04, 2.56]} \ No newline at end of file diff --git a/annotations_1/lVSMG8FTnpw_filtered.json b/annotations_1/lVSMG8FTnpw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bed8cdcf03b97584287883f774df9e8ab085d8ab --- /dev/null +++ b/annotations_1/lVSMG8FTnpw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.11], [12.0, 12.66], [13.0, 20.24], [20.0, 21.14], [21.0, 25.66], [31.0, 36.19], [40.0, 50.89], [51.0, 133.71], [134.0, 133.88], [134.0, 153.82]], "keep_status": [true, false, false, false, false, true, false, false, false, true], "silence_prob": [37.33, 0.0, 42.74, 0.0, 39.38, 31.55, 42.67, 0.0, 0.0, 36.98], "audiomae_on_audioset": [[["music", 50.68], ["ambient music", 10.03], ["scary music", 6.46]], null, [["music", 57.43], ["didgeridoo", 17.68], ["hum", 2.71]], null, [["music", 40.39], ["theremin", 30.15], ["synthesizer", 7.47]], [["music", 50.76], ["theremin", 8.31], ["musical instrument", 3.82]], [["civil defense siren", 61.35], ["siren", 30.46], ["music", 4.02]], null, null, [["music", 49.09], ["theremin", 8.6], ["didgeridoo", 6.23]]], "duration": [2.11, 0.66, 7.24, 1.14, 4.66, 5.19, 10.89, 82.71, -0.12, 19.82]} \ No newline at end of file diff --git a/annotations_1/lXS7GWgCBWM_filtered.json b/annotations_1/lXS7GWgCBWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b29dbc23e014a25db8295229d6b2e4f242343890 --- /dev/null +++ b/annotations_1/lXS7GWgCBWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.96], [10.0, 13.44], [15.0, 15.48], [16.0, 22.65], [23.0, 24.71], [28.0, 29.29], [30.0, 30.97], [39.0, 39.04], [41.0, 41.62], [45.0, 46.95], [58.0, 59.51], [62.0, 63.48], [67.0, 67.93], [69.0, 71.31], [74.0, 73.75], [75.0, 75.91], [80.0, 80.57], [81.0, 82.7], [86.0, 86.51], [87.0, 88.43], [89.0, 93.99], [95.0, 151.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.05, 0.0, 60.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.96, 3.44, 0.48, 6.65, 1.71, 1.29, 0.97, 0.04, 0.62, 1.95, 1.51, 1.48, 0.93, 2.31, -0.25, 0.91, 0.57, 1.7, 0.51, 1.43, 4.99, 56.8]} \ No newline at end of file diff --git a/annotations_1/lYCq6x3AHYw_filtered.json b/annotations_1/lYCq6x3AHYw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b64fd6ffa6f8cc3747e71bb8792b17441172d98f --- /dev/null +++ b/annotations_1/lYCq6x3AHYw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 26.08], [26.0, 55.8], [58.0, 62.5], [63.0, 65.55], [67.0, 72.71], [75.0, 117.1], [120.0, 120.36], [126.0, 129.27], [139.0, 139.78], [141.0, 142.32], [147.0, 147.58], [149.0, 162.26], [163.0, 164.47]], "keep_status": [true, false, true, false, true, false, false, true, false, false, false, true, false], "silence_prob": [32.92, 32.43, 34.44, 35.42, 33.51, 0.0, 0.0, 34.57, 0.0, 0.0, 0.0, 37.89, 0.0], "audiomae_on_audioset": [[["music", 26.98], ["bow-wow", 20.12], ["livestock, farm animals, working animals", 6.77]], [["music", 74.67], ["musical instrument", 1.85], ["speech", 1.79]], [["music", 54.19], ["synthesizer", 5.59], ["speech", 5.28]], [["music", 71.58], ["synthesizer", 4.61], ["drum machine", 3.58]], [["cattle, bovinae", 30.76], ["moo", 23.25], ["music", 15.22]], null, null, [["crushing", 39.79], ["whack, thwack", 23.85], ["boing", 3.6]], null, null, null, [["music", 38.22], ["speech", 15.1], ["hum", 9.24]], null], "duration": [23.08, 29.8, 4.5, 2.55, 5.71, 42.1, 0.36, 3.27, 0.78, 1.32, 0.58, 13.26, 1.47]} \ No newline at end of file diff --git a/annotations_1/lZ_r2Q0FQ1A_filtered.json b/annotations_1/lZ_r2Q0FQ1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1614c302e232fbb289441db9ff745873ab2b63a --- /dev/null +++ b/annotations_1/lZ_r2Q0FQ1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 34.94], [35.0, 43.43], [56.0, 77.38], [78.0, 79.2], [80.0, 80.99], [86.0, 86.48], [97.0, 131.04], [133.0, 141.84]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.23, 35.1, 0.0, 0.0, 0.0, 0.0, 32.61], "audiomae_on_audioset": [null, [["music", 32.05], ["hum", 31.42], ["ambient music", 15.51]], [["hum", 40.91], ["mains hum", 18.79], ["music", 17.67]], null, null, null, null, [["music", 76.46], ["mantra", 5.09], ["chant", 3.59]]], "duration": [-0.06, 8.43, 21.38, 1.2, 0.99, 0.48, 34.04, 8.84]} \ No newline at end of file diff --git a/annotations_1/lb6nAmbkk9Y_filtered.json b/annotations_1/lb6nAmbkk9Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20bc857a34dad0428de6902a4c96497271f178f9 --- /dev/null +++ b/annotations_1/lb6nAmbkk9Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.56], [4.0, 4.24], [5.0, 5.76], [7.0, 8.92], [9.0, 9.86], [10.0, 10.74], [14.0, 16.34], [23.0, 23.73], [24.0, 25.29], [28.0, 28.26], [46.0, 47.24], [53.0, 54.72], [56.0, 56.03], [59.0, 61.16], [62.0, 63.29], [65.0, 65.18], [73.0, 74.31], [78.0, 78.76], [79.0, 80.65], [83.0, 84.59], [90.0, 91.4], [95.0, 96.9], [98.0, 98.04], [100.0, 102.37], [104.0, 104.46], [125.0, 127.4], [137.0, 139.24], [142.0, 142.86], [144.0, 145.77], [147.0, 147.51], [156.0, 157.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.56, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 0.24, 0.76, 1.92, 0.86, 0.74, 2.34, 0.73, 1.29, 0.26, 1.24, 1.72, 0.03, 2.16, 1.29, 0.18, 1.31, 0.76, 1.65, 1.59, 1.4, 1.9, 0.04, 2.37, 0.46, 2.4, 2.24, 0.86, 1.77, 0.51, 1.23]} \ No newline at end of file diff --git a/annotations_1/lbqDuUjm4aU_filtered.json b/annotations_1/lbqDuUjm4aU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aa8a53316378b2443b96cc74723015af9621e1b --- /dev/null +++ b/annotations_1/lbqDuUjm4aU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.75], [7.0, 8.99], [12.0, 13.9], [18.0, 20.41], [23.0, 23.85], [27.0, 27.89], [30.0, 31.19], [33.0, 35.24], [37.0, 38.75], [42.0, 42.26], [45.0, 46.67], [49.0, 51.21], [58.0, 58.51], [61.0, 61.42], [62.0, 63.44], [70.0, 71.32], [73.0, 74.71], [80.0, 80.82], [83.0, 84.59], [90.0, 91.37], [93.0, 93.45], [97.0, 97.12], [115.0, 120.04], [121.0, 122.67], [123.0, 125.51], [126.0, 127.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 56.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.75, 1.99, 1.9, 2.41, 0.85, 0.89, 1.19, 2.24, 1.75, 0.26, 1.67, 2.21, 0.51, 0.42, 1.44, 1.32, 1.71, 0.82, 1.59, 1.37, 0.45, 0.12, 5.04, 1.67, 2.51, 1.65]} \ No newline at end of file diff --git a/annotations_1/lcIuJs1vHrg_filtered.json b/annotations_1/lcIuJs1vHrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d41b2f5bd0c7fb7446e0829b74ae3e9aa19e1bbf --- /dev/null +++ b/annotations_1/lcIuJs1vHrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [3.0, 3.54], [4.0, 5.04], [8.0, 7.62], [8.0, 13.04], [14.0, 16.88], [19.0, 20.28], [20.0, 38.04], [38.0, 38.84], [41.0, 45.98], [47.0, 48.93], [49.0, 50.16], [56.0, 74.09], [74.0, 74.75], [75.0, 75.78], [80.0, 80.25], [81.0, 84.43], [87.0, 109.44], [120.0, 138.37], [141.0, 141.56], [143.0, 144.56], [147.0, 169.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 98.19, 0.0, 98.86, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 99.31, 79.76, 97.54, 0.0, 0.0, 58.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 0.54, 1.04, -0.38, 5.04, 2.88, 1.28, 18.04, 0.84, 4.98, 1.93, 1.16, 18.09, 0.75, 0.78, 0.25, 3.43, 22.44, 18.37, 0.56, 1.56, 22.13]} \ No newline at end of file diff --git a/annotations_1/leSpIIaEblk_filtered.json b/annotations_1/leSpIIaEblk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..648b4539942f96866db262885c00adaf12822ef7 --- /dev/null +++ b/annotations_1/leSpIIaEblk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.01], [19.0, 41.17], [45.0, 81.01], [82.0, 82.56], [87.0, 97.24], [100.0, 102.19], [103.0, 127.18]], "keep_status": [false, false, false, false, false, false, true], "silence_prob": [29.92, 29.69, 0.0, 0.0, 31.04, 30.62, 39.52], "audiomae_on_audioset": [[["music", 42.55], ["sidetone", 28.89], ["throbbing", 6.1]], [["music", 63.48], ["throbbing", 22.71], ["hum", 3.52]], null, null, [["throbbing", 30.08], ["music", 24.51], ["speech", 22.82]], [["music", 46.12], ["breaking", 20.6], ["boom", 6.48]], [["music", 45.8], ["throbbing", 14.93], ["electronic music", 6.43]]], "duration": [4.01, 22.17, 36.01, 0.56, 10.24, 2.19, 24.18]} \ No newline at end of file diff --git a/annotations_1/lfKcANi5Zrk_filtered.json b/annotations_1/lfKcANi5Zrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c990a1e6aca30e56ecf2b5a9c32c1e101cb06875 --- /dev/null +++ b/annotations_1/lfKcANi5Zrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.31], [13.0, 13.29], [14.0, 14.27], [14.0, 20.17], [22.0, 23.38], [24.0, 25.19], [30.0, 30.82], [32.0, 34.74], [36.0, 36.42], [37.0, 38.72], [40.0, 41.37], [43.0, 44.02], [45.0, 46.67], [47.0, 49.38], [50.0, 52.24], [54.0, 60.45], [62.0, 63.1], [65.0, 66.34], [67.0, 68.94], [70.0, 71.47], [73.0, 78.38], [80.0, 80.23], [82.0, 86.39], [89.0, 89.7], [91.0, 96.21], [99.0, 99.67], [104.0, 106.25], [109.0, 113.48], [115.0, 115.26], [122.0, 122.99], [125.0, 128.7], [129.0, 128.76], [129.0, 129.15], [129.0, 132.75], [133.0, 133.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 99.1, 100.0, 0.0, 0.0, 0.0, 0.0, 52.27, 0.0, 69.34, 0.0, 79.76, 0.0, 100.0, 97.33, 0.0, 0.0, 89.54, 0.0, 0.0, 68.15, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 0.29, 0.27, 6.17, 1.38, 1.19, 0.82, 2.74, 0.42, 1.72, 1.37, 1.02, 1.67, 2.38, 2.24, 6.45, 1.1, 1.34, 1.94, 1.47, 5.38, 0.23, 4.39, 0.7, 5.21, 0.67, 2.25, 4.48, 0.26, 0.99, 3.7, -0.24, 0.15, 3.75, 0.83]} \ No newline at end of file diff --git a/annotations_1/lfObLA5H4Rg_filtered.json b/annotations_1/lfObLA5H4Rg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b1be62eae7a5c8ae8d5aac69ac54ccf880096de --- /dev/null +++ b/annotations_1/lfObLA5H4Rg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.33], [5.0, 43.63], [44.0, 45.55], [52.0, 54.18], [55.0, 146.01], [147.0, 148.0]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.53, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 56.33], ["mains hum", 9.22], ["hum", 7.71]], null, null], "duration": [0.33, 38.63, 1.55, 2.18, 91.01, 1.0]} \ No newline at end of file diff --git a/annotations_1/lfUlATBIer8_filtered.json b/annotations_1/lfUlATBIer8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..869e16fad0aba3a7730a8fb89e907dc402ffca62 --- /dev/null +++ b/annotations_1/lfUlATBIer8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 27.28], [29.0, 30.55], [34.0, 36.05], [39.0, 43.44], [47.0, 49.55], [51.0, 52.08], [52.0, 56.17], [63.0, 62.94], [68.0, 70.5], [72.0, 72.57], [90.0, 90.1], [121.0, 121.85], [125.0, 125.02], [126.0, 126.71]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [37.35, 0.0, 40.9, 32.24, 33.16, 0.0, 39.12, 0.0, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 64.49], ["synthesizer", 9.82], ["throbbing", 4.34]], null, [["hum", 25.98], ["music", 24.98], ["mains hum", 14.48]], [["music", 41.23], ["throbbing", 18.37], ["hum", 17.23]], [["music", 83.6], ["video game music", 1.88], ["soundtrack music", 1.09]], null, [["music", 50.98], ["speech", 11.12], ["musical instrument", 4.93]], null, null, null, null, null, null, null], "duration": [24.28, 1.55, 2.05, 4.44, 2.55, 1.08, 4.17, -0.06, 2.5, 0.57, 0.1, 0.85, 0.02, 0.71]} \ No newline at end of file diff --git a/annotations_1/lfeYgfKa2cY_filtered.json b/annotations_1/lfeYgfKa2cY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/lfeYgfKa2cY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/lh5IiK9eQhA_filtered.json b/annotations_1/lh5IiK9eQhA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..106a57553fbbc3b3430826e1055aba0cd48c2d97 --- /dev/null +++ b/annotations_1/lh5IiK9eQhA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.01], [19.0, 30.89], [34.0, 33.81], [38.0, 45.69], [47.0, 50.58], [55.0, 59.43], [61.0, 61.75], [62.0, 63.27], [65.0, 73.13], [74.0, 77.68], [80.0, 81.16], [86.0, 89.4], [92.0, 93.04], [95.0, 105.17], [106.0, 107.13], [108.0, 119.77], [122.0, 124.48]], "keep_status": [false, true, false, true, true, true, false, false, true, true, false, true, false, true, false, false, true], "silence_prob": [0.0, 29.91, 0.0, 30.14, 29.87, 30.57, 0.0, 0.0, 29.95, 29.87, 0.0, 30.08, 0.0, 29.64, 0.0, 29.84, 30.6], "audiomae_on_audioset": [null, [["music", 56.88], ["throbbing", 7.79], ["speech", 4.92]], null, [["music", 60.22], ["electronic music", 4.03], ["cacophony", 3.88]], [["music", 56.94], ["electronic music", 9.51], ["throbbing", 3.36]], [["speech", 28.5], ["music", 10.41], ["rumble", 5.85]], null, null, [["vehicle", 19.85], ["music", 17.45], ["car", 16.87]], [["speech", 46.34], ["music", 8.17], ["sound effect", 7.91]], null, [["whale vocalization", 47.55], ["cattle, bovinae", 11.31], ["livestock, farm animals, working animals", 10.41]], null, [["music", 46.63], ["didgeridoo", 7.7], ["electronic music", 5.88]], null, [["music", 45.26], ["throbbing", 22.28], ["hum", 8.01]], [["car", 21.69], ["music", 15.7], ["vehicle", 15.26]]], "duration": [0.01, 11.89, -0.19, 7.69, 3.58, 4.43, 0.75, 1.27, 8.13, 3.68, 1.16, 3.4, 1.04, 10.17, 1.13, 11.77, 2.48]} \ No newline at end of file diff --git a/annotations_1/ljAdSzBv0ug_filtered.json b/annotations_1/ljAdSzBv0ug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7afe786723cf195246f4a689d86215ca682e1b2a --- /dev/null +++ b/annotations_1/ljAdSzBv0ug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.56], [6.0, 7.13], [12.0, 12.85], [14.0, 15.89], [16.0, 20.04], [21.0, 27.84], [31.0, 31.62], [35.0, 36.21], [38.0, 38.62], [41.0, 42.47], [43.0, 44.66], [48.0, 48.63], [58.0, 60.07], [62.0, 61.96], [62.0, 65.8], [66.0, 65.87], [81.0, 81.55], [86.0, 86.63], [87.0, 87.67], [90.0, 92.55], [94.0, 96.3], [97.0, 97.8], [99.0, 99.74], [103.0, 103.2], [104.0, 104.99], [106.0, 106.41], [112.0, 113.78], [116.0, 118.81], [119.0, 121.73], [122.0, 121.76], [122.0, 121.8], [122.0, 121.83], [122.0, 121.86], [122.0, 122.23], [122.0, 124.33], [125.0, 133.64], [136.0, 137.64], [138.0, 139.21], [141.0, 142.08], [146.0, 157.38], [164.0, 165.59], [169.0, 169.57], [175.0, 176.4], [177.0, 178.09], [181.0, 181.04]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.35, 35.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.86, 0.0, 34.96, 0.0, 0.0, 0.0, 0.0, 47.08, 71.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.47, 57.89, 0.0, 0.0, 0.0, 0.0, 0.0, 43.1, 51.55, 0.0, 0.0, 0.0, 32.01, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 60.58], ["music", 12.33], ["noise", 2.4]], [["speech", 25.28], ["clip-clop", 19.0], ["horse", 11.28]], null, null, null, null, null, null, [["hum", 35.15], ["music", 18.81], ["throbbing", 18.41]], null, [["music", 54.24], ["didgeridoo", 12.7], ["speech", 7.6]], null, null, null, null, [["animal", 16.48], ["music", 14.75], ["dog", 6.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.77], ["music", 29.91], ["inside, small room", 4.03]], null, null, null, null, [["music", 52.85], ["speech", 22.8], ["hum", 4.32]], null, null, null, null, null], "duration": [0.56, 1.13, 0.85, 1.89, 4.04, 6.84, 0.62, 1.21, 0.62, 1.47, 1.66, 0.63, 2.07, -0.04, 3.8, -0.13, 0.55, 0.63, 0.67, 2.55, 2.3, 0.8, 0.74, 0.2, 0.99, 0.41, 1.78, 2.81, 2.73, -0.24, -0.2, -0.17, -0.14, 0.23, 2.33, 8.64, 1.64, 1.21, 1.08, 11.38, 1.59, 0.57, 1.4, 1.09, 0.04]} \ No newline at end of file diff --git a/annotations_1/ljMuEDlInLo_filtered.json b/annotations_1/ljMuEDlInLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eea80e80ddbde93355d7ff0b3d53b2d760f5faec --- /dev/null +++ b/annotations_1/ljMuEDlInLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.42], [17.0, 17.91], [22.0, 22.72], [25.0, 27.06], [35.0, 35.61], [36.0, 36.48], [39.0, 39.21], [43.0, 46.45], [50.0, 51.81], [58.0, 58.67], [64.0, 64.66], [67.0, 67.74]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [33.01, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 31.83, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["baby laughter", 18.67], ["echo", 14.09], ["chuckle, chortle", 12.45]], null, null, null, null, null, null, [["laughter", 34.3], ["snicker", 14.92], ["baby laughter", 11.89]], null, null, null, null], "duration": [2.42, 0.91, 0.72, 2.06, 0.61, 0.48, 0.21, 3.45, 1.81, 0.67, 0.66, 0.74]} \ No newline at end of file diff --git a/annotations_1/lkT9aqC6Tqw_filtered.json b/annotations_1/lkT9aqC6Tqw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a28353378e1ce186c54e65c6ac8cddf44ec62ec --- /dev/null +++ b/annotations_1/lkT9aqC6Tqw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 58.35], [66.0, 67.36], [69.0, 69.06]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [37.35, 1.36, 0.06]} \ No newline at end of file diff --git a/annotations_1/lkoWhWGcVR4_filtered.json b/annotations_1/lkoWhWGcVR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc6a3177fed57b41b5b286aafc4fed28eef5b709 --- /dev/null +++ b/annotations_1/lkoWhWGcVR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [8.0, 9.22], [11.0, 12.23], [14.0, 15.08], [18.0, 19.79], [20.0, 20.98], [23.0, 23.67], [24.0, 24.39], [26.0, 30.27], [34.0, 34.55], [37.0, 38.06], [47.0, 47.63], [50.0, 64.56], [69.0, 69.45], [72.0, 72.23], [73.0, 74.6], [75.0, 76.89], [80.0, 94.74], [97.0, 100.01], [102.0, 102.88], [109.0, 109.53], [110.0, 110.64], [116.0, 116.85], [122.0, 122.69], [128.0, 133.19], [135.0, 135.18], [136.0, 137.74], [140.0, 141.17], [144.0, 145.83], [147.0, 147.88], [149.0, 149.42], [153.0, 158.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 0.0, 0.0, 0.0, 52.8, 0.0, 0.0, 0.0, 0.0, 72.75, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 38.08], ["clip-clop", 10.82], ["horse", 9.25]]], "duration": [0.63, 1.22, 1.23, 1.08, 1.79, 0.98, 0.67, 0.39, 4.27, 0.55, 1.06, 0.63, 14.56, 0.45, 0.23, 1.6, 1.89, 14.74, 3.01, 0.88, 0.53, 0.64, 0.85, 0.69, 5.19, 0.18, 1.74, 1.17, 1.83, 0.88, 0.42, 5.84]} \ No newline at end of file diff --git a/annotations_1/llTSaDl6Pcg_filtered.json b/annotations_1/llTSaDl6Pcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b7898b3e5aef9e9fa96b3d04b700f88fc6874c98 --- /dev/null +++ b/annotations_1/llTSaDl6Pcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.19], [6.0, 6.98], [8.0, 10.76], [19.0, 18.77], [19.0, 22.18], [22.0, 22.27], [22.0, 30.65], [31.0, 32.22], [33.0, 34.82], [37.0, 41.72], [44.0, 45.06], [49.0, 50.99], [53.0, 54.24], [56.0, 58.6], [66.0, 67.22], [74.0, 74.53], [76.0, 77.67], [79.0, 81.16], [83.0, 94.96], [95.0, 96.94], [100.0, 101.66], [103.0, 104.7], [107.0, 108.45], [110.0, 112.41], [115.0, 117.53], [119.0, 122.34], [123.0, 125.49], [127.0, 135.7], [137.0, 137.73], [139.0, 143.78], [145.0, 146.64], [150.0, 151.33], [152.0, 154.89], [156.0, 157.2], [158.0, 159.7], [161.0, 165.59], [166.0, 171.48], [177.0, 178.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.97, 0.0, 52.1, 0.0, 80.11, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 99.62, 81.0, 0.0, 0.0, 0.0, 0.0, 99.85, 99.98, 99.93, 86.45, 72.75, 0.0, 53.22, 0.0, 0.0, 73.36, 0.0, 0.0, 98.36, 72.46, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 0.98, 2.76, -0.23, 3.18, 0.27, 8.65, 1.22, 1.82, 4.72, 1.06, 1.99, 1.24, 2.6, 1.22, 0.53, 1.67, 2.16, 11.96, 1.94, 1.66, 1.7, 1.45, 2.41, 2.53, 3.34, 2.49, 8.7, 0.73, 4.78, 1.64, 1.33, 2.89, 1.2, 1.7, 4.59, 5.48, 1.88]} \ No newline at end of file diff --git a/annotations_1/lnPDc4XE77w_filtered.json b/annotations_1/lnPDc4XE77w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb1b217136dc421a5d094a8022506a05178c8283 --- /dev/null +++ b/annotations_1/lnPDc4XE77w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.43], [1.0, 5.61], [6.0, 7.42], [11.0, 16.63], [18.0, 20.36], [21.0, 23.25], [27.0, 31.06], [32.0, 32.73], [36.0, 38.62], [39.0, 38.87], [40.0, 40.61], [42.0, 49.38], [51.0, 51.9], [54.0, 54.01], [56.0, 70.24], [71.0, 72.0], [76.0, 76.49], [82.0, 83.03], [85.0, 89.82], [94.0, 109.92], [114.0, 117.07], [119.0, 120.16], [120.0, 127.13], [132.0, 134.52], [135.0, 144.53], [146.0, 146.57], [150.0, 167.95], [170.0, 171.69], [172.0, 172.57], [176.0, 192.62], [199.0, 201.8]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, true, false, false, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true], "silence_prob": [0.0, 30.91, 0.0, 37.23, 59.42, 84.43, 55.81, 0.0, 37.04, 0.0, 0.0, 36.35, 0.0, 0.0, 34.39, 0.0, 0.0, 0.0, 30.78, 30.86, 33.06, 0.0, 33.14, 30.87, 30.8, 0.0, 29.66, 0.0, 0.0, 29.86, 31.48], "audiomae_on_audioset": [null, [["music", 71.77], ["speech", 7.04], ["didgeridoo", 3.57]], null, [["music", 33.82], ["didgeridoo", 31.01], ["speech", 2.92]], null, null, null, null, [["music", 35.45], ["speech", 17.27], ["noise", 8.94]], null, null, [["music", 30.37], ["livestock, farm animals, working animals", 21.03], ["cattle, bovinae", 7.53]], null, null, [["music", 21.84], ["sound effect", 6.88], ["hum", 6.75]], null, null, null, [["music", 52.88], ["whack, thwack", 17.42], ["smash, crash", 3.16]], [["music", 49.31], ["breaking", 24.55], ["speech", 14.13]], [["music", 72.43], ["boing", 5.73], ["didgeridoo", 2.64]], null, [["music", 65.63], ["speech", 7.7], ["smash, crash", 5.06]], [["clang", 36.17], ["speech", 16.58], ["ding", 10.47]], [["music", 39.33], ["speech", 38.53], ["quack", 3.39]], null, [["cattle, bovinae", 14.9], ["moo", 13.78], ["livestock, farm animals, working animals", 13.49]], null, null, [["whale vocalization", 81.73], ["music", 3.16], ["vehicle", 1.95]], [["speech", 18.66], ["beatboxing", 13.5], ["music", 10.29]]], "duration": [1.43, 4.61, 1.42, 5.63, 2.36, 2.25, 4.06, 0.73, 2.62, -0.13, 0.61, 7.38, 0.9, 0.01, 14.24, 1.0, 0.49, 1.03, 4.82, 15.92, 3.07, 1.16, 7.13, 2.52, 9.53, 0.57, 17.95, 1.69, 0.57, 16.62, 2.8]} \ No newline at end of file diff --git a/annotations_1/lnfpTgAQ0Ys_filtered.json b/annotations_1/lnfpTgAQ0Ys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef525b23219d13c63457607962566ad649491e6c --- /dev/null +++ b/annotations_1/lnfpTgAQ0Ys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.83], [14.0, 18.13], [19.0, 23.99], [25.0, 28.51], [29.0, 34.08], [35.0, 42.55], [44.0, 45.05], [46.0, 46.47], [48.0, 50.08], [53.0, 54.73], [56.0, 60.17], [62.0, 64.66], [66.0, 66.8], [67.0, 69.48], [75.0, 75.49], [77.0, 79.44], [80.0, 81.82], [82.0, 83.2], [84.0, 84.94], [88.0, 88.43], [90.0, 95.76], [102.0, 102.54], [104.0, 105.27], [108.0, 108.3], [113.0, 114.66], [116.0, 119.97], [121.0, 122.42], [124.0, 126.12], [128.0, 129.19], [133.0, 133.24], [140.0, 142.62], [146.0, 152.52], [154.0, 155.22], [156.0, 159.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.92, 72.9, 99.56, 100.0, 96.89, 92.64, 0.0, 0.0, 74.44, 0.0, 89.54, 90.78, 0.0, 99.65, 0.0, 99.85, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 91.13, 0.0, 0.0, 99.84, 99.26, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.83, 4.13, 4.99, 3.51, 5.08, 7.55, 1.05, 0.47, 2.08, 1.73, 4.17, 2.66, 0.8, 2.48, 0.49, 2.44, 1.82, 1.2, 0.94, 0.43, 5.76, 0.54, 1.27, 0.3, 1.66, 3.97, 1.42, 2.12, 1.19, 0.24, 2.62, 6.52, 1.22, 3.88]} \ No newline at end of file diff --git a/annotations_1/lp1s4-tc2U0_filtered.json b/annotations_1/lp1s4-tc2U0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8367f17b85b9586d250ba7366ff90d3a9b9b7830 --- /dev/null +++ b/annotations_1/lp1s4-tc2U0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.67], [11.0, 12.38], [16.0, 18.3], [19.0, 55.95], [58.0, 66.82], [69.0, 141.81], [143.0, 160.47], [166.0, 184.89], [190.0, 216.4]], "keep_status": [false, false, true, false, false, false, true, false, false], "silence_prob": [30.21, 0.0, 30.27, 0.0, 30.65, 0.0, 30.08, 29.93, 31.64], "audiomae_on_audioset": [[["hum", 39.92], ["mains hum", 25.51], ["throbbing", 16.7]], null, [["music", 45.35], ["musical instrument", 6.68], ["thunk", 6.52]], null, [["music", 52.67], ["speech", 21.18], ["synthesizer", 7.76]], null, [["music", 51.42], ["speech", 9.2], ["synthesizer", 4.85]], [["music", 61.9], ["throbbing", 13.68], ["hum", 8.94]], [["hum", 33.6], ["music", 27.8], ["throbbing", 22.84]]], "duration": [4.67, 1.38, 2.3, 36.95, 8.82, 72.81, 17.47, 18.89, 26.4]} \ No newline at end of file diff --git a/annotations_1/lpod4qQzO7Q_filtered.json b/annotations_1/lpod4qQzO7Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ae15b605d58341bbeb7c79e955bc9f73cad6872 --- /dev/null +++ b/annotations_1/lpod4qQzO7Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 29.05], [33.0, 33.89], [36.0, 40.64]], "keep_status": [false, false, false], "silence_prob": [31.03, 0.0, 28.85], "audiomae_on_audioset": [[["music", 62.34], ["theremin", 5.55], ["speech", 5.14]], null, [["music", 36.58], ["mains hum", 28.2], ["hum", 9.61]]], "duration": [2.05, 0.89, 4.64]} \ No newline at end of file diff --git a/annotations_1/lqnKLTA2GVE_filtered.json b/annotations_1/lqnKLTA2GVE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..153ed7709e8a8a041394dabdb6736a06cd8281dc --- /dev/null +++ b/annotations_1/lqnKLTA2GVE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 45.23], [47.0, 48.46], [53.0, 53.79], [55.0, 67.73], [69.0, 70.02], [73.0, 148.96]], "keep_status": [false, false, false, true, false, false], "silence_prob": [58.64, 0.0, 0.0, 31.75, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 48.09], ["hum", 9.83], ["explosion", 6.36]], null, null], "duration": [9.23, 1.46, 0.79, 12.73, 1.02, 75.96]} \ No newline at end of file diff --git a/annotations_1/lr7pyggTmmY_filtered.json b/annotations_1/lr7pyggTmmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21ce3ba4353ac7bd245fd500f44dfd996d46ceeb --- /dev/null +++ b/annotations_1/lr7pyggTmmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.32], [7.0, 7.23], [11.0, 14.15], [19.0, 19.82], [22.0, 23.09], [30.0, 31.36], [35.0, 35.7], [38.0, 38.01], [53.0, 54.94], [63.0, 66.31], [67.0, 67.9], [77.0, 78.11], [81.0, 88.48], [89.0, 90.51], [93.0, 98.51], [100.0, 100.82], [112.0, 121.37], [123.0, 137.37], [139.0, 141.3], [144.0, 149.64], [152.0, 153.22], [154.0, 156.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [99.71, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.82, 0.0, 0.0, 89.54, 0.0, 36.44, 0.0, 62.37, 46.4, 88.83, 33.04, 0.0, 33.49], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 45.73], ["beatboxing", 35.33], ["music", 2.72]], null, null, [["music", 40.49], ["insect", 7.25], ["singing bowl", 5.7]], null, [["music", 13.83], ["mains hum", 9.9], ["noise", 6.25]], null, [["throbbing", 29.31], ["music", 27.97], ["hum", 27.82]]], "duration": [2.32, 0.23, 3.15, 0.82, 1.09, 1.36, 0.7, 0.01, 1.94, 3.31, 0.9, 1.11, 7.48, 1.51, 5.51, 0.82, 9.37, 14.37, 2.3, 5.64, 1.22, 2.49]} \ No newline at end of file diff --git a/annotations_1/lsa5PDPgJmI_filtered.json b/annotations_1/lsa5PDPgJmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e1ce03d5b9b2cb1f3f89c63df1675b497866560 --- /dev/null +++ b/annotations_1/lsa5PDPgJmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.26], [6.0, 8.85], [10.0, 11.8], [13.0, 14.57], [26.0, 26.0], [33.0, 33.24], [34.0, 34.45], [36.0, 38.28], [40.0, 62.82]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 35.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 61.53], ["throbbing", 19.75], ["hum", 8.28]]], "duration": [1.26, 2.85, 1.8, 1.57, 0.0, 0.24, 0.45, 2.28, 22.82]} \ No newline at end of file diff --git a/annotations_1/lsmWjQdGHMI_filtered.json b/annotations_1/lsmWjQdGHMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc75117444146fcdf36798292532199121d91715 --- /dev/null +++ b/annotations_1/lsmWjQdGHMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.16], [12.0, 12.8], [14.0, 15.63], [20.0, 21.0], [23.0, 22.76], [23.0, 23.45], [26.0, 26.91], [29.0, 30.06], [35.0, 36.26], [37.0, 37.42], [38.0, 38.33], [40.0, 41.96], [44.0, 44.85], [48.0, 48.88], [51.0, 52.2], [55.0, 56.34], [57.0, 57.23], [60.0, 60.44], [62.0, 63.63], [65.0, 65.47], [66.0, 68.32], [72.0, 79.51], [81.0, 82.83], [84.0, 85.58], [87.0, 88.7], [91.0, 91.69], [94.0, 95.23], [96.0, 96.97], [98.0, 98.07], [99.0, 100.09], [101.0, 107.15], [108.0, 108.28], [109.0, 109.81], [112.0, 114.35], [119.0, 120.82], [121.0, 123.43], [124.0, 148.09], [149.0, 158.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 59.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.78, 0.0, 0.0, 66.63, 0.0, 73.67, 68.67, 76.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.41], ["singing bowl", 8.06], ["wind instrument, woodwind instrument", 3.68]], null, null, null, null, null, null, null], "duration": [0.16, 0.8, 1.63, 1.0, -0.24, 0.45, 0.91, 1.06, 1.26, 0.42, 0.33, 1.96, 0.85, 0.88, 1.2, 1.34, 0.23, 0.44, 1.63, 0.47, 2.32, 7.51, 1.83, 1.58, 1.7, 0.69, 1.23, 0.97, 0.07, 1.09, 6.15, 0.28, 0.81, 2.35, 1.82, 2.43, 24.09, 9.79]} \ No newline at end of file diff --git a/annotations_1/luF2eyiYlyE_filtered.json b/annotations_1/luF2eyiYlyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76852dd699186b0d3ce167d6a9aaa870f938029b --- /dev/null +++ b/annotations_1/luF2eyiYlyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.97], [7.0, 7.1], [8.0, 8.41], [13.0, 13.34], [15.0, 15.16], [17.0, 18.4], [20.0, 21.64], [22.0, 22.52], [23.0, 23.21], [24.0, 24.16], [34.0, 38.62], [40.0, 40.49], [41.0, 53.08], [58.0, 57.84], [58.0, 58.55], [60.0, 60.17], [62.0, 62.33], [67.0, 67.34], [68.0, 68.55], [91.0, 92.69], [106.0, 106.71], [116.0, 116.87], [120.0, 120.38], [122.0, 121.78], [122.0, 123.01], [147.0, 150.15], [151.0, 151.26], [154.0, 154.25], [156.0, 156.68], [159.0, 159.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.47, 0.0, 34.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.74, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 40.51], ["brass instrument", 8.58], ["speech", 7.49]], null, [["music", 31.13], ["theremin", 23.8], ["speech", 14.83]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.2], ["theremin", 13.29], ["musical instrument", 6.13]], null, null, null, null], "duration": [-0.03, 0.1, 0.41, 0.34, 0.16, 1.4, 1.64, 0.52, 0.21, 0.16, 4.62, 0.49, 12.08, -0.16, 0.55, 0.17, 0.33, 0.34, 0.55, 1.69, 0.71, 0.87, 0.38, -0.22, 1.01, 3.15, 0.26, 0.25, 0.68, 0.26]} \ No newline at end of file diff --git a/annotations_1/lwruhQqFttU_filtered.json b/annotations_1/lwruhQqFttU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..308446a7d5509ae70f256b5fc478eb5e80495c93 --- /dev/null +++ b/annotations_1/lwruhQqFttU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.75], [19.0, 21.24], [22.0, 45.2], [46.0, 49.62], [54.0, 54.33], [56.0, 62.51], [64.0, 68.57], [70.0, 72.79], [74.0, 74.26], [75.0, 77.33], [84.0, 119.91], [123.0, 123.4]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, false], "silence_prob": [0.0, 32.72, 75.55, 36.31, 0.0, 33.58, 31.15, 33.12, 0.0, 35.74, 0.0, 0.0], "audiomae_on_audioset": [null, [["theremin", 77.68], ["music", 14.39], ["musical instrument", 1.42]], null, [["hum", 51.85], ["throbbing", 11.02], ["music", 8.39]], null, [["speech", 42.26], ["gong", 8.21], ["chirp tone", 7.5]], [["music", 35.08], ["chirp tone", 15.94], ["electronic music", 8.47]], [["throbbing", 38.17], ["hum", 30.07], ["mains hum", 5.73]], null, [["music", 14.87], ["effects unit", 10.07], ["distortion", 5.69]], null, null], "duration": [0.75, 2.24, 23.2, 3.62, 0.33, 6.51, 4.57, 2.79, 0.26, 2.33, 35.91, 0.4]} \ No newline at end of file diff --git a/annotations_1/lxlwKE2-3fg_filtered.json b/annotations_1/lxlwKE2-3fg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bf80349ea0c2934f2b054014d9f96b1186aae91 --- /dev/null +++ b/annotations_1/lxlwKE2-3fg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.22], [10.0, 14.15], [21.0, 21.98], [22.0, 23.79], [24.0, 24.36], [29.0, 30.48], [33.0, 36.05], [36.0, 49.25], [56.0, 57.27], [61.0, 60.76], [61.0, 64.29], [65.0, 67.37], [72.0, 72.5], [80.0, 86.1], [87.0, 86.81], [87.0, 87.52], [88.0, 88.94], [91.0, 90.91], [103.0, 103.23], [121.0, 121.22], [122.0, 122.61], [126.0, 127.11], [129.0, 130.44], [138.0, 139.62], [141.0, 142.28]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.26, 100.0, 0.0, 0.0, 0.0, 0.0, 97.33, 98.1, 0.0, 0.0, 65.44, 71.72, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 25.95], ["animal", 14.14], ["fart", 7.65]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.22, 4.15, 0.98, 1.79, 0.36, 1.48, 3.05, 13.25, 1.27, -0.24, 3.29, 2.37, 0.5, 6.1, -0.19, 0.52, 0.94, -0.09, 0.23, 0.22, 0.61, 1.11, 1.44, 1.62, 1.28]} \ No newline at end of file diff --git a/annotations_1/lyM65FpQLlM_filtered.json b/annotations_1/lyM65FpQLlM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9abf89c0bcbf9866e5c5fcc22faf546136efba9 --- /dev/null +++ b/annotations_1/lyM65FpQLlM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.49], [5.0, 6.22], [8.0, 7.94], [13.0, 14.76], [16.0, 20.68], [21.0, 23.85], [25.0, 28.58], [30.0, 32.88], [35.0, 35.58], [37.0, 37.4], [40.0, 42.18], [45.0, 77.57], [80.0, 91.05], [96.0, 107.45], [110.0, 125.41], [126.0, 128.24], [129.0, 129.98], [134.0, 134.57], [136.0, 136.27], [137.0, 137.42], [138.0, 140.61], [141.0, 149.94], [152.0, 163.24], [168.0, 171.49], [172.0, 172.66], [173.0, 181.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.44, 78.04, 99.16, 86.27, 0.0, 0.0, 70.44, 0.0, 34.6, 32.13, 30.49, 79.94, 0.0, 0.0, 0.0, 0.0, 42.15, 68.02, 54.43, 54.63, 0.0, 64.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.36], ["ambient music", 29.84], ["synthesizer", 5.99]], [["music", 58.48], ["theremin", 8.7], ["ambient music", 6.87]], [["music", 47.92], ["speech", 9.81], ["mains hum", 8.98]], null, null, null, null, null, [["music", 61.61], ["effects unit", 10.54], ["synthesizer", 3.49]], null, null, null, null, null], "duration": [0.49, 1.22, -0.06, 1.76, 4.68, 2.85, 3.58, 2.88, 0.58, 0.4, 2.18, 32.57, 11.05, 11.45, 15.41, 2.24, 0.98, 0.57, 0.27, 0.42, 2.61, 8.94, 11.24, 3.49, 0.66, 8.53]} \ No newline at end of file diff --git a/annotations_1/lyd4tC8LH1s_filtered.json b/annotations_1/lyd4tC8LH1s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3fb4bc6099d0ad066ece7f729649187f16183cf --- /dev/null +++ b/annotations_1/lyd4tC8LH1s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.3], [7.0, 21.98], [23.0, 22.99], [24.0, 32.29], [35.0, 52.61], [54.0, 57.32], [58.0, 57.94], [69.0, 69.03], [70.0, 73.77], [75.0, 78.27], [78.0, 78.41], [78.0, 78.92], [87.0, 87.98], [89.0, 107.08], [112.0, 116.33], [118.0, 118.35]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, true, true, false], "silence_prob": [0.0, 30.75, 0.0, 30.85, 31.02, 89.9, 0.0, 0.0, 30.97, 32.28, 0.0, 0.0, 0.0, 36.0, 33.77, 0.0], "audiomae_on_audioset": [null, [["speech", 59.56], ["beatboxing", 17.26], ["didgeridoo", 5.96]], null, [["fart", 48.01], ["speech", 19.38], ["whack, thwack", 8.39]], [["speech", 57.36], ["whack, thwack", 12.23], ["music", 4.98]], null, null, null, [["breaking", 21.08], ["smash, crash", 17.8], ["speech", 9.76]], [["speech", 33.14], ["boing", 27.27], ["music", 9.56]], null, null, null, [["ding", 14.64], ["speech", 12.63], ["animal", 8.53]], [["beatboxing", 32.25], ["speech", 24.09], ["music", 13.37]], null], "duration": [0.3, 14.98, -0.01, 8.29, 17.61, 3.32, -0.06, 0.03, 3.77, 3.27, 0.41, 0.92, 0.98, 18.08, 4.33, 0.35]} \ No newline at end of file diff --git a/annotations_1/lyvAjZw6O_Q_filtered.json b/annotations_1/lyvAjZw6O_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9dcdb290d01ef74b576d2ded650424e49712bc3f --- /dev/null +++ b/annotations_1/lyvAjZw6O_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [6.0, 7.65], [17.0, 18.03], [21.0, 22.06], [26.0, 27.14], [29.0, 29.83], [31.0, 32.95], [39.0, 39.53], [42.0, 42.57], [46.0, 46.84], [52.0, 52.12], [53.0, 53.7], [55.0, 55.81], [58.0, 60.39], [61.0, 62.4], [63.0, 64.08], [68.0, 68.94], [79.0, 81.5], [85.0, 85.77], [88.0, 88.79], [107.0, 107.91], [114.0, 114.51], [117.0, 117.53], [121.0, 121.68], [123.0, 123.99], [126.0, 129.86], [130.0, 131.41], [134.0, 135.58], [141.0, 141.93], [144.0, 144.53], [146.0, 147.16], [150.0, 151.77], [153.0, 154.28], [155.0, 160.71], [162.0, 162.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 1.65, 1.03, 1.06, 1.14, 0.83, 1.95, 0.53, 0.57, 0.84, 0.12, 0.7, 0.81, 2.39, 1.4, 1.08, 0.94, 2.5, 0.77, 0.79, 0.91, 0.51, 0.53, 0.68, 0.99, 3.86, 1.41, 1.58, 0.93, 0.53, 1.16, 1.77, 1.28, 5.71, 0.97]} \ No newline at end of file diff --git a/annotations_1/lz98akbX_NE_filtered.json b/annotations_1/lz98akbX_NE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13a8cd681423f61f9befff951f9b4c2a060ca85b --- /dev/null +++ b/annotations_1/lz98akbX_NE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.13], [15.0, 105.73], [109.0, 108.87], [110.0, 123.09], [124.0, 129.24], [136.0, 136.58], [138.0, 140.41], [142.0, 142.84], [143.0, 148.27], [153.0, 153.64], [156.0, 156.12], [158.0, 158.18], [160.0, 175.93], [178.0, 180.98]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, true, false], "silence_prob": [91.64, 0.0, 0.0, 29.37, 51.55, 0.0, 88.46, 0.0, 35.79, 0.0, 0.0, 0.0, 38.72, 73.82], "audiomae_on_audioset": [null, null, null, [["echo", 47.53], ["whale vocalization", 12.16], ["speech", 7.15]], null, null, null, null, [["noise", 19.25], ["radio", 12.87], ["buzz", 6.14]], null, null, null, [["gurgling", 18.71], ["squish", 9.55], ["music", 9.32]], null], "duration": [7.13, 90.73, -0.13, 13.09, 5.24, 0.58, 2.41, 0.84, 5.27, 0.64, 0.12, 0.18, 15.93, 2.98]} \ No newline at end of file diff --git a/annotations_1/lzJV7k-LiC4_filtered.json b/annotations_1/lzJV7k-LiC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1de9428acb7b78f858750a44cff3c9a892bb11e0 --- /dev/null +++ b/annotations_1/lzJV7k-LiC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.63], [1.0, 0.75], [7.0, 10.71], [11.0, 13.85], [22.0, 29.88], [31.0, 32.51], [35.0, 36.31], [37.0, 37.3], [38.0, 49.62], [54.0, 55.48], [58.0, 58.72], [61.0, 65.18], [68.0, 70.5], [74.0, 77.65], [81.0, 83.56], [89.0, 90.41], [93.0, 93.88], [98.0, 104.38], [106.0, 113.53], [116.0, 143.23], [148.0, 154.68]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 52.62, 55.18, 32.07, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 79.76, 53.4, 49.45, 69.88, 0.0, 0.0, 32.68, 31.63, 31.07, 30.91], "audiomae_on_audioset": [null, null, null, null, [["boing", 27.29], ["speech", 19.04], ["whack, thwack", 10.15]], null, null, null, null, null, null, null, null, [["music", 60.86], ["lullaby", 4.02], ["musical instrument", 3.83]], null, null, null, [["music", 71.18], ["synthesizer", 2.38], ["singing", 2.04]], [["music", 68.38], ["singing", 2.87], ["throbbing", 2.0]], [["music", 71.19], ["singing", 3.92], ["pop music", 2.94]], [["speech", 37.48], ["music", 23.49], ["fart", 6.01]]], "duration": [-0.37, -0.25, 3.71, 2.85, 7.88, 1.51, 1.31, 0.3, 11.62, 1.48, 0.72, 4.18, 2.5, 3.65, 2.56, 1.41, 0.88, 6.38, 7.53, 27.23, 6.68]} \ No newline at end of file diff --git a/annotations_1/lzo2hgdDUDw_filtered.json b/annotations_1/lzo2hgdDUDw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be46567604352748e8eba3524a4d2299a7a9f3a5 --- /dev/null +++ b/annotations_1/lzo2hgdDUDw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.21], [10.0, 14.15], [19.0, 35.4], [38.0, 38.69], [39.0, 39.6], [40.0, 45.0], [47.0, 67.78], [71.0, 91.83]], "keep_status": [false, true, true, false, false, false, true, false], "silence_prob": [0.0, 48.91, 42.0, 0.0, 0.0, 59.51, 36.45, 38.66], "audiomae_on_audioset": [null, [["fly, housefly", 21.48], ["speech", 16.96], ["insect", 10.99]], [["speech", 32.72], ["buzz", 14.25], ["fly, housefly", 6.07]], null, null, null, [["speech", 30.11], ["fly, housefly", 17.37], ["insect", 11.65]], [["music", 64.57], ["didgeridoo", 13.46], ["speech", 3.5]]], "duration": [1.21, 4.15, 16.4, 0.69, 0.6, 5.0, 20.78, 20.83]} \ No newline at end of file diff --git a/annotations_1/m-2WmcLl_PQ_filtered.json b/annotations_1/m-2WmcLl_PQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa9c363c2742ff788a0c09592a8f54bbef84cd97 --- /dev/null +++ b/annotations_1/m-2WmcLl_PQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.9], [4.0, 4.28], [6.0, 6.99], [10.0, 11.28], [12.0, 55.76], [58.0, 89.61], [92.0, 138.32], [140.0, 179.36], [180.0, 179.98]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.9, 0.28, 0.99, 1.28, 43.76, 31.61, 46.32, 39.36, -0.02]} \ No newline at end of file diff --git a/annotations_1/m-3Ohq-bVFA_filtered.json b/annotations_1/m-3Ohq-bVFA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f622398d75c5cf1f38eaf2ec077484ebd21fde12 --- /dev/null +++ b/annotations_1/m-3Ohq-bVFA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.49], [14.0, 15.8], [19.0, 20.61], [21.0, 23.28], [25.0, 26.42], [30.0, 30.99], [33.0, 33.84], [35.0, 36.09], [38.0, 39.55], [41.0, 42.38], [44.0, 45.2], [48.0, 49.05], [51.0, 54.45], [55.0, 57.2], [58.0, 59.29], [61.0, 61.16], [63.0, 62.85], [75.0, 79.83], [90.0, 91.2], [92.0, 94.02], [95.0, 96.25], [97.0, 100.21], [102.0, 102.19], [105.0, 106.62]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [31.73, 0.0, 0.0, 34.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.35, 31.11, 0.0, 0.0, 0.0, 35.37, 0.0, 31.81, 0.0, 83.52, 0.0, 0.0], "audiomae_on_audioset": [[["music", 57.9], ["electronic music", 10.75], ["speech", 7.83]], null, null, [["music", 48.57], ["speech", 14.65], ["electronic music", 3.62]], null, null, null, null, null, null, null, null, [["music", 50.72], ["ambient music", 9.9], ["electronic music", 9.71]], [["music", 51.38], ["hum", 14.83], ["sonar", 6.87]], null, null, null, [["music", 54.78], ["telephone bell ringing", 15.38], ["telephone", 11.98]], null, [["gong", 35.51], ["music", 17.23], ["musical instrument", 9.99]], null, null, null, null], "duration": [2.49, 1.8, 1.61, 2.28, 1.42, 0.99, 0.84, 1.09, 1.55, 1.38, 1.2, 1.05, 3.45, 2.2, 1.29, 0.16, -0.15, 4.83, 1.2, 2.02, 1.25, 3.21, 0.19, 1.62]} \ No newline at end of file diff --git a/annotations_1/m-ETkZmPNiM_filtered.json b/annotations_1/m-ETkZmPNiM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..870861f1971ed86c643857470c2f5f50662c60dc --- /dev/null +++ b/annotations_1/m-ETkZmPNiM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.86], [18.0, 18.6], [24.0, 24.07], [33.0, 33.67], [36.0, 36.44], [40.0, 42.89], [43.0, 44.34], [47.0, 47.93], [48.0, 48.9], [50.0, 50.77], [53.0, 59.81], [64.0, 64.35], [65.0, 65.94], [68.0, 71.32], [73.0, 93.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 0.0, 100.0, 51.34], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.6, 0.07, 0.67, 0.44, 2.89, 1.34, 0.93, 0.9, 0.77, 6.81, 0.35, 0.94, 3.32, 20.23]} \ No newline at end of file diff --git a/annotations_1/m-L3k3ElIQE_filtered.json b/annotations_1/m-L3k3ElIQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..275a324f794abbacdeccf33770ef94949fb880c7 --- /dev/null +++ b/annotations_1/m-L3k3ElIQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.32], [9.0, 10.98], [16.0, 16.43], [20.0, 20.34], [31.0, 31.78], [34.0, 33.99], [37.0, 37.96], [41.0, 41.82], [46.0, 46.08], [47.0, 47.16], [51.0, 50.99], [66.0, 67.66], [70.0, 71.49], [75.0, 75.71], [81.0, 84.65], [86.0, 87.08], [89.0, 89.41], [91.0, 91.03], [91.0, 102.22], [104.0, 105.65], [115.0, 116.75], [119.0, 121.69], [131.0, 132.95], [139.0, 140.75], [142.0, 143.23], [145.0, 145.74], [148.0, 149.72], [158.0, 157.99], [159.0, 160.79], [164.0, 165.75], [168.0, 168.98], [170.0, 171.36], [172.0, 172.81], [180.0, 180.49], [190.0, 191.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.72, 0.0, 0.0, 0.0, 38.1, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 68.47], ["sidetone", 10.06], ["sine wave", 2.32]], null, null, null, [["hum", 43.08], ["mains hum", 25.94], ["speech", 13.45]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 1.98, 0.43, 0.34, 0.78, -0.01, 0.96, 0.82, 0.08, 0.16, -0.01, 1.66, 1.49, 0.71, 3.65, 1.08, 0.41, 0.03, 11.22, 1.65, 1.75, 2.69, 1.95, 1.75, 1.23, 0.74, 1.72, -0.01, 1.79, 1.75, 0.98, 1.36, 0.81, 0.49, 1.81]} \ No newline at end of file diff --git a/annotations_1/m-PsCZ_57MY_filtered.json b/annotations_1/m-PsCZ_57MY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6d28ad14484d731ed290d7d669a6417d858c3ff --- /dev/null +++ b/annotations_1/m-PsCZ_57MY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.59], [5.0, 6.84], [8.0, 13.56], [15.0, 15.57], [16.0, 17.46], [18.0, 19.14], [27.0, 28.14], [33.0, 34.35], [36.0, 36.21], [37.0, 38.47], [39.0, 40.05], [41.0, 43.11], [44.0, 45.5], [49.0, 54.6], [55.0, 59.36], [61.0, 60.93], [62.0, 62.72], [67.0, 67.22], [68.0, 76.27], [77.0, 78.31], [84.0, 85.02], [92.0, 98.69], [103.0, 104.35], [108.0, 109.29], [112.0, 111.99], [118.0, 117.78], [125.0, 127.14], [128.0, 128.92], [130.0, 130.3], [133.0, 138.0], [141.0, 160.14], [164.0, 173.2], [175.0, 175.0]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 29.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.09, 0.0, 29.32, 29.74, 0.0, 0.0, 0.0, 28.97, 0.0, 0.0, 29.77, 0.0, 0.0, 0.0, 0.0, 30.42, 0.0, 0.0, 29.75, 28.39, 29.02, 0.0], "audiomae_on_audioset": [null, null, [["music", 51.86], ["hum", 7.53], ["synthesizer", 7.02]], null, null, null, null, null, null, null, null, [["whoosh, swoosh, swish", 18.02], ["rumble", 14.96], ["whack, thwack", 14.12]], null, [["mains hum", 25.35], ["music", 16.09], ["hum", 15.37]], [["rumble", 14.62], ["hum", 9.17], ["mains hum", 8.6]], null, null, null, [["speech", 66.48], ["hum", 10.55], ["mains hum", 4.29]], null, null, [["music", 54.46], ["whale vocalization", 14.94], ["stomach rumble", 7.78]], null, null, null, null, [["frog", 18.78], ["throbbing", 13.77], ["croak", 13.07]], null, null, [["music", 49.56], ["speech", 20.01], ["throbbing", 2.22]], [["speech", 27.03], ["rumble", 19.25], ["music", 12.91]], [["music", 42.43], ["hum", 22.61], ["mains hum", 8.98]], null], "duration": [0.59, 1.84, 5.56, 0.57, 1.46, 1.14, 1.14, 1.35, 0.21, 1.47, 1.05, 2.11, 1.5, 5.6, 4.36, -0.07, 0.72, 0.22, 8.27, 1.31, 1.02, 6.69, 1.35, 1.29, -0.01, -0.22, 2.14, 0.92, 0.3, 5.0, 19.14, 9.2, 0.0]} \ No newline at end of file diff --git a/annotations_1/m0DbfOnOBQo_filtered.json b/annotations_1/m0DbfOnOBQo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..423c7726876ef6434971b68fc9219f5e5512c1c5 --- /dev/null +++ b/annotations_1/m0DbfOnOBQo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 27.3], [28.0, 48.03], [48.0, 89.45], [90.0, 90.09], [91.0, 100.48], [102.0, 105.0], [106.0, 147.11], [148.0, 151.12], [155.0, 161.59], [163.0, 163.58], [164.0, 175.0], [179.0, 180.5], [182.0, 182.51], [183.0, 183.57], [187.0, 189.19]], "keep_status": [false, true, false, false, false, true, false, true, true, false, true, false, false, false, true], "silence_prob": [100.0, 30.48, 0.0, 0.0, 29.39, 35.11, 0.0, 35.87, 35.2, 0.0, 30.79, 0.0, 0.0, 0.0, 32.7], "audiomae_on_audioset": [null, [["speech", 26.76], ["fly, housefly", 13.96], ["music", 11.18]], null, null, [["music", 67.6], ["whack, thwack", 4.18], ["sound effect", 3.09]], [["creak", 41.38], ["music", 13.57], ["hum", 7.6]], null, [["speech", 54.76], ["livestock, farm animals, working animals", 8.77], ["roaring cats (lions, tigers)", 5.46]], [["music", 19.95], ["animal", 19.28], ["wild animals", 7.54]], null, [["music", 22.72], ["animal", 19.01], ["hum", 13.3]], null, null, null, [["music", 36.37], ["speech", 12.12], ["hum", 10.85]]], "duration": [4.3, 20.03, 41.45, 0.09, 9.48, 3.0, 41.11, 3.12, 6.59, 0.58, 11.0, 1.5, 0.51, 0.57, 2.19]} \ No newline at end of file diff --git a/annotations_1/m0etOugqkPU_filtered.json b/annotations_1/m0etOugqkPU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99f31956df5cab3263c42640bd8cf9e3773feb97 --- /dev/null +++ b/annotations_1/m0etOugqkPU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.65], [15.0, 16.02], [25.0, 40.64], [58.0, 66.5], [68.0, 68.71], [70.0, 77.89], [80.0, 83.37], [90.0, 98.98], [117.0, 118.59], [123.0, 127.04], [127.0, 128.58], [135.0, 138.97], [143.0, 148.54], [149.0, 155.55], [157.0, 159.0], [167.0, 168.0]], "keep_status": [false, false, false, true, false, false, true, true, false, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 29.87, 30.45, 0.0, 31.57, 31.03, 31.92, 0.0, 34.49, 0.0, 36.25, 33.45, 30.73, 31.25, 0.0], "audiomae_on_audioset": [null, null, [["music", 81.99], ["didgeridoo", 1.89], ["carnatic music", 1.52]], [["speech", 25.6], ["music", 22.64], ["mosquito", 5.51]], null, [["speech", 55.38], ["hum", 9.58], ["music", 9.37]], [["music", 52.4], ["speech", 11.99], ["electronic music", 2.68]], [["fly, housefly", 21.8], ["music", 11.27], ["livestock, farm animals, working animals", 10.15]], null, [["music", 38.56], ["speech", 30.61], ["musical instrument", 2.6]], null, [["music", 38.67], ["speech", 15.64], ["hum", 3.91]], [["music", 56.4], ["didgeridoo", 5.35], ["drum and bass", 4.78]], [["music", 77.63], ["hum", 3.55], ["electronic music", 2.71]], [["music", 46.3], ["speech", 14.24], ["boing", 3.74]], null], "duration": [-0.35, 1.02, 15.64, 8.5, 0.71, 7.89, 3.37, 8.98, 1.59, 4.04, 1.58, 3.97, 5.54, 6.55, 2.0, 1.0]} \ No newline at end of file diff --git a/annotations_1/m1JgMM8b9_w_filtered.json b/annotations_1/m1JgMM8b9_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e52913a84901615120cb277b4e6405dadf1bf5a8 --- /dev/null +++ b/annotations_1/m1JgMM8b9_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.37], [29.0, 29.98], [30.0, 32.43], [33.0, 36.44], [38.0, 39.23], [42.0, 43.21], [49.0, 49.17], [50.0, 50.85], [56.0, 59.48], [61.0, 61.86], [64.0, 67.93], [70.0, 81.26], [82.0, 83.74], [85.0, 89.67], [91.0, 93.55], [95.0, 96.16], [98.0, 100.52], [102.0, 102.86], [104.0, 105.43], [106.0, 108.4], [110.0, 110.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 52.68, 70.72, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 86.27, 39.34, 0.0, 56.4, 94.52, 0.0, 82.07, 0.0, 0.0, 66.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 81.77], ["hum", 2.4], ["musical instrument", 1.96]], null, null, null, null, null, null, null, null, null], "duration": [0.37, 0.98, 2.43, 3.44, 1.23, 1.21, 0.17, 0.85, 3.48, 0.86, 3.93, 11.26, 1.74, 4.67, 2.55, 1.16, 2.52, 0.86, 1.43, 2.4, 0.86]} \ No newline at end of file diff --git a/annotations_1/m1p-vJzqPKw_filtered.json b/annotations_1/m1p-vJzqPKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffb64ae10b36f2d88ea5f0f072974228d8934914 --- /dev/null +++ b/annotations_1/m1p-vJzqPKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.11], [17.0, 16.65], [17.0, 17.0], [18.0, 57.89], [60.0, 59.95], [61.0, 76.49], [80.0, 86.36], [88.0, 158.35]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 41.4, 30.77, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 53.99], ["mains hum", 12.26], ["speech", 12.12]], [["speech", 37.07], ["explosion", 12.25], ["rumble", 10.12]], null], "duration": [1.11, -0.35, 0.0, 39.89, -0.05, 15.49, 6.36, 70.35]} \ No newline at end of file diff --git a/annotations_1/m2cUbp6Vkfs_filtered.json b/annotations_1/m2cUbp6Vkfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61a66372793f6680982e73ced7638fcae88bcd8b --- /dev/null +++ b/annotations_1/m2cUbp6Vkfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 17.37], [19.0, 18.71], [19.0, 25.07], [32.0, 32.16], [33.0, 43.93], [47.0, 59.59], [60.0, 61.64], [64.0, 84.67], [92.0, 98.04], [98.0, 104.23], [116.0, 148.1], [172.0, 172.88]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [32.51, 0.0, 32.93, 0.0, 32.93, 33.38, 0.0, 32.86, 32.67, 33.1, 0.0, 0.0], "audiomae_on_audioset": [[["music", 68.92], ["musical instrument", 8.12], ["synthesizer", 4.06]], null, [["music", 59.2], ["trombone", 13.41], ["musical instrument", 3.79]], null, [["music", 79.1], ["trombone", 7.86], ["musical instrument", 2.97]], [["music", 66.46], ["musical instrument", 8.16], ["trombone", 3.7]], null, [["vehicle", 13.26], ["car", 10.39], ["race car, auto racing", 9.77]], [["music", 64.6], ["musical instrument", 6.1], ["effects unit", 5.97]], [["music", 42.05], ["musical instrument", 10.69], ["didgeridoo", 8.85]], null, null], "duration": [6.37, -0.29, 6.07, 0.16, 10.93, 12.59, 1.64, 20.67, 6.04, 6.23, 32.1, 0.88]} \ No newline at end of file diff --git a/annotations_1/m2tk7RatWsk_filtered.json b/annotations_1/m2tk7RatWsk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4983cc731a5a5639596ea0bd7e95b6772f895b67 --- /dev/null +++ b/annotations_1/m2tk7RatWsk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.12], [15.0, 17.98], [19.0, 19.23], [20.0, 64.25], [68.0, 76.91], [78.0, 92.72], [99.0, 112.7], [115.0, 118.94]], "keep_status": [false, false, false, false, true, false, true, true], "silence_prob": [40.09, 52.39, 0.0, 0.0, 46.97, 61.57, 30.27, 33.92], "audiomae_on_audioset": [[["hum", 49.05], ["mains hum", 22.73], ["music", 12.74]], null, null, null, [["hum", 20.94], ["mains hum", 20.15], ["rumble", 15.72]], null, [["hum", 18.17], ["speech", 10.66], ["mains hum", 9.7]], [["music", 28.05], ["throbbing", 12.93], ["hum", 11.46]]], "duration": [7.12, 2.98, 0.23, 44.25, 8.91, 14.72, 13.7, 3.94]} \ No newline at end of file diff --git a/annotations_1/m31MSgGEIAk_filtered.json b/annotations_1/m31MSgGEIAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9439042b286d30162c845456c8825c53846c31b --- /dev/null +++ b/annotations_1/m31MSgGEIAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.32], [34.0, 34.82], [36.0, 37.81], [39.0, 42.42], [43.0, 44.49], [51.0, 55.21], [55.0, 68.79], [73.0, 84.16], [88.0, 89.8], [103.0, 109.63], [114.0, 128.01], [129.0, 129.76], [131.0, 131.52], [136.0, 136.29], [139.0, 138.96], [141.0, 142.18], [144.0, 145.84], [147.0, 148.37], [150.0, 150.67], [151.0, 152.93], [154.0, 154.94], [156.0, 161.45], [162.0, 162.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.25, 0.0, 50.76, 65.32, 37.26, 0.0, 88.83, 67.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 54.62], ["sidetone", 15.81], ["radio", 3.64]], null, null, null, [["speech", 63.7], ["cough", 21.33], ["whack, thwack", 2.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 82.33], ["sidetone", 8.58], ["busy signal", 3.03]], null], "duration": [0.32, 0.82, 1.81, 3.42, 1.49, 4.21, 13.79, 11.16, 1.8, 6.63, 14.01, 0.76, 0.52, 0.29, -0.04, 1.18, 1.84, 1.37, 0.67, 1.93, 0.94, 5.45, 0.43]} \ No newline at end of file diff --git a/annotations_1/m3XsVwEuULw_filtered.json b/annotations_1/m3XsVwEuULw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..734f137bd569b1163e98b7043163cff096d77669 --- /dev/null +++ b/annotations_1/m3XsVwEuULw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.37], [12.0, 13.1], [14.0, 22.52], [27.0, 30.01], [35.0, 44.95], [48.0, 64.83], [65.0, 70.01], [71.0, 71.96], [73.0, 73.03], [73.0, 78.75], [85.0, 87.93], [88.0, 106.64], [108.0, 114.39], [118.0, 120.09], [121.0, 134.32], [138.0, 138.21], [139.0, 142.48], [145.0, 147.63]], "keep_status": [false, false, false, true, true, false, true, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.89, 42.13, 39.08, 34.08, 36.31, 0.0, 0.0, 35.5, 36.41, 36.02, 35.87, 35.36, 54.63, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, [["music", 51.58], ["drum and bass", 13.63], ["speech", 9.2]], [["music", 44.63], ["speech", 9.61], ["drum machine", 4.85]], [["music", 57.85], ["didgeridoo", 8.1], ["musical instrument", 3.98]], [["music", 57.99], ["buzz", 12.16], ["didgeridoo", 5.44]], [["sidetone", 32.78], ["music", 19.94], ["hum", 11.06]], null, null, [["music", 37.13], ["speech", 15.12], ["boing", 14.17]], [["music", 74.33], ["cacophony", 4.47], ["speech", 3.27]], [["music", 58.01], ["boing", 27.32], ["didgeridoo", 1.69]], [["music", 42.06], ["sidetone", 12.8], ["speech", 12.57]], [["music", 54.63], ["speech", 12.05], ["throbbing", 5.31]], null, null, null, null], "duration": [0.37, 1.1, 8.52, 3.01, 9.95, 16.83, 5.01, 0.96, 0.03, 5.75, 2.93, 18.64, 6.39, 2.09, 13.32, 0.21, 3.48, 2.63]} \ No newline at end of file diff --git a/annotations_1/m3qnMx_kA2A_filtered.json b/annotations_1/m3qnMx_kA2A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f69ab121120dd15584280e8e3cf77ec49eb0186 --- /dev/null +++ b/annotations_1/m3qnMx_kA2A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.13], [7.0, 10.32], [17.0, 17.83], [19.0, 19.57], [26.0, 27.5], [30.0, 30.5], [32.0, 34.64], [36.0, 38.25], [39.0, 40.42], [53.0, 52.81], [61.0, 61.67], [62.0, 62.61], [64.0, 63.85], [66.0, 70.95], [76.0, 79.52], [81.0, 86.63], [90.0, 90.95], [91.0, 93.36], [94.0, 97.06], [102.0, 102.09], [103.0, 103.74], [104.0, 107.86], [114.0, 127.8], [128.0, 128.73], [132.0, 132.87], [133.0, 137.37]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, true], "silence_prob": [59.24, 58.89, 0.0, 0.0, 0.0, 0.0, 42.91, 48.48, 0.0, 0.0, 0.0, 0.0, 0.0, 40.68, 50.31, 36.99, 0.0, 36.04, 40.33, 0.0, 0.0, 35.1, 34.67, 0.0, 0.0, 34.01], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 16.39], ["music", 11.23], ["throbbing", 10.57]], [["speech", 37.44], ["frog", 14.95], ["music", 12.23]], null, null, null, null, null, [["music", 26.1], ["speech", 16.62], ["throbbing", 5.28]], null, [["mains hum", 34.8], ["hum", 29.58], ["music", 8.5]], null, [["speech", 56.6], ["fly, housefly", 3.32], ["field recording", 3.11]], [["speech", 15.42], ["music", 15.14], ["gong", 13.25]], null, null, [["music", 45.14], ["speech", 30.01], ["mains hum", 2.22]], [["hum", 31.12], ["music", 28.11], ["throbbing", 18.88]], null, null, [["speech", 30.51], ["music", 28.05], ["mains hum", 7.81]]], "duration": [4.13, 3.32, 0.83, 0.57, 1.5, 0.5, 2.64, 2.25, 1.42, -0.19, 0.67, 0.61, -0.15, 4.95, 3.52, 5.63, 0.95, 2.36, 3.06, 0.09, 0.74, 3.86, 13.8, 0.73, 0.87, 4.37]} \ No newline at end of file diff --git a/annotations_1/m43-bLl6ZwI_filtered.json b/annotations_1/m43-bLl6ZwI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ae46fa6805fdf7d267d6a33f04e7249d17d5afa --- /dev/null +++ b/annotations_1/m43-bLl6ZwI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 25.73], [28.0, 62.92], [64.0, 68.98]], "keep_status": [false, false, false], "silence_prob": [29.59, 0.0, 29.66], "audiomae_on_audioset": [[["hum", 49.53], ["mains hum", 37.73], ["throbbing", 3.04]], null, [["speech", 59.43], ["throbbing", 7.17], ["music", 6.39]]], "duration": [10.73, 34.92, 4.98]} \ No newline at end of file diff --git a/annotations_1/m49ub45c8AI_filtered.json b/annotations_1/m49ub45c8AI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a718d4dc0d1693e1502f4b059b1af754c42dffb9 --- /dev/null +++ b/annotations_1/m49ub45c8AI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[84.0, 108.85], [110.0, 127.21], [129.0, 129.2], [139.0, 142.2]], "keep_status": [true, true, false, false], "silence_prob": [32.22, 28.85, 0.0, 33.97], "audiomae_on_audioset": [[["quack", 20.46], ["duck", 13.62], ["sonar", 10.72]], [["machine gun", 21.54], ["speech", 16.54], ["boom", 11.63]], null, [["whale vocalization", 51.06], ["speech", 35.95], ["music", 1.27]]], "duration": [24.85, 17.21, 0.2, 3.2]} \ No newline at end of file diff --git a/annotations_1/m4SWkyqSFxM_filtered.json b/annotations_1/m4SWkyqSFxM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abc770eb1f76ffeb02f678e54031be72e16cf707 --- /dev/null +++ b/annotations_1/m4SWkyqSFxM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.25], [4.0, 4.62], [7.0, 8.53], [19.0, 20.6], [23.0, 23.45], [40.0, 40.36], [46.0, 47.07], [49.0, 49.15]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.25, 0.62, 1.53, 1.6, 0.45, 0.36, 1.07, 0.15]} \ No newline at end of file diff --git a/annotations_1/m7HLqZP-l7E_filtered.json b/annotations_1/m7HLqZP-l7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9eaaf742755227a0dea99caa3167fe7c684e967 --- /dev/null +++ b/annotations_1/m7HLqZP-l7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.79], [27.0, 27.08], [29.0, 29.44], [32.0, 33.96], [36.0, 36.58], [39.0, 39.21], [42.0, 44.17], [44.0, 46.09], [48.0, 48.83], [49.0, 48.93], [49.0, 48.96], [51.0, 51.29], [52.0, 72.79], [75.0, 93.63], [98.0, 97.77], [104.0, 103.91], [110.0, 123.67], [126.0, 126.64], [128.0, 137.03], [142.0, 170.97], [176.0, 178.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.39, 66.51, 0.0, 0.0, 0.0, 0.0, 29.62, 31.22, 0.0, 0.0, 30.85, 0.0, 29.45, 30.16, 32.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 62.74], ["speech", 20.14], ["musical instrument", 2.67]], [["music", 88.72], ["throbbing", 1.82], ["synthesizer", 1.52]], null, null, [["music", 38.25], ["hum", 21.72], ["throbbing", 18.93]], null, [["cattle, bovinae", 33.89], ["music", 23.22], ["livestock, farm animals, working animals", 17.66]], [["music", 59.81], ["speech", 11.22], ["boing", 4.64]], [["music", 45.33], ["theremin", 18.19], ["musical instrument", 8.55]]], "duration": [0.79, 0.08, 0.44, 1.96, 0.58, 0.21, 2.17, 2.09, 0.83, -0.07, -0.04, 0.29, 20.79, 18.63, -0.23, -0.09, 13.67, 0.64, 9.03, 28.97, 2.66]} \ No newline at end of file diff --git a/annotations_1/m7xTE3rvkDk_filtered.json b/annotations_1/m7xTE3rvkDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..106f4e2095268a4f0ffd6ac354ae181586b9522a --- /dev/null +++ b/annotations_1/m7xTE3rvkDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.12], [9.0, 9.17], [10.0, 11.52], [18.0, 17.85], [19.0, 33.78], [34.0, 34.91], [36.0, 44.9], [48.0, 50.73], [52.0, 56.83], [61.0, 69.94], [71.0, 74.16], [77.0, 88.87], [90.0, 90.12], [91.0, 97.28], [98.0, 125.9], [127.0, 127.62], [129.0, 129.84], [132.0, 132.93], [135.0, 137.22], [138.0, 139.29], [140.0, 148.78], [149.0, 150.9], [154.0, 160.3], [165.0, 182.76], [187.0, 187.1], [188.0, 191.05], [194.0, 196.67]], "keep_status": [true, false, false, false, false, false, false, true, true, true, true, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false], "silence_prob": [40.62, 0.0, 0.0, 0.0, 32.74, 0.0, 31.84, 32.43, 34.18, 31.69, 32.36, 35.05, 0.0, 34.72, 38.67, 0.0, 0.0, 0.0, 33.62, 0.0, 32.32, 0.0, 42.74, 31.16, 0.0, 30.66, 52.56], "audiomae_on_audioset": [[["music", 34.63], ["speech", 14.0], ["throbbing", 9.35]], null, null, null, [["music", 67.82], ["boing", 13.0], ["clang", 2.77]], null, [["music", 66.18], ["throbbing", 8.88], ["hum", 5.9]], [["speech", 44.51], ["artillery fire", 8.36], ["explosion", 4.1]], [["mains hum", 29.46], ["hum", 21.7], ["music", 18.38]], [["music", 30.83], ["speech", 27.99], ["didgeridoo", 7.27]], [["music", 43.38], ["hum", 8.71], ["throbbing", 7.24]], [["music", 67.76], ["throbbing", 5.69], ["hum", 5.03]], null, [["music", 70.39], ["throbbing", 8.8], ["electronic music", 2.57]], [["music", 60.44], ["hum", 6.12], ["throbbing", 5.82]], null, null, null, [["music", 40.24], ["whack, thwack", 7.52], ["throbbing", 7.11]], null, [["music", 42.34], ["speech", 41.59], ["throbbing", 1.51]], null, [["fly, housefly", 29.61], ["music", 13.02], ["mosquito", 11.99]], [["throbbing", 62.62], ["music", 16.92], ["hum", 10.54]], null, [["noise", 26.13], ["throbbing", 16.75], ["hum", 14.05]], null], "duration": [6.12, 0.17, 1.52, -0.15, 14.78, 0.91, 8.9, 2.73, 4.83, 8.94, 3.16, 11.87, 0.12, 6.28, 27.9, 0.62, 0.84, 0.93, 2.22, 1.29, 8.78, 1.9, 6.3, 17.76, 0.1, 3.05, 2.67]} \ No newline at end of file diff --git a/annotations_1/m8lzyaMZ-mA_filtered.json b/annotations_1/m8lzyaMZ-mA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3561340430fe47999607095a646cc8047760abc4 --- /dev/null +++ b/annotations_1/m8lzyaMZ-mA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.08], [3.0, 3.37], [5.0, 5.59], [7.0, 8.95], [11.0, 11.13], [15.0, 15.38], [17.0, 17.66], [21.0, 21.61], [29.0, 29.51], [37.0, 37.44], [41.0, 41.23], [44.0, 44.32], [58.0, 58.33], [61.0, 61.53], [65.0, 65.2], [67.0, 66.78], [68.0, 68.27], [70.0, 70.17], [70.0, 72.1], [91.0, 91.84], [98.0, 98.81], [106.0, 106.34], [114.0, 114.42], [131.0, 131.04], [134.0, 134.0], [136.0, 135.8], [151.0, 151.9], [154.0, 154.87], [168.0, 168.52], [173.0, 172.98], [174.0, 174.51], [176.0, 175.88], [207.0, 206.96], [212.0, 212.21], [213.0, 213.48], [215.0, 214.89], [217.0, 217.71], [222.0, 222.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 0.37, 0.59, 1.95, 0.13, 0.38, 0.66, 0.61, 0.51, 0.44, 0.23, 0.32, 0.33, 0.53, 0.2, -0.22, 0.27, 0.17, 2.1, 0.84, 0.81, 0.34, 0.42, 0.04, 0.0, -0.2, 0.9, 0.87, 0.52, -0.02, 0.51, -0.12, -0.04, 0.21, 0.48, -0.11, 0.71, 0.84]} \ No newline at end of file diff --git a/annotations_1/m9Gg_VQP2zw_filtered.json b/annotations_1/m9Gg_VQP2zw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84e899885390c659d2cebeec058752403fee049d --- /dev/null +++ b/annotations_1/m9Gg_VQP2zw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 25.81], [27.0, 27.19], [29.0, 29.86], [31.0, 33.35], [40.0, 41.37], [45.0, 46.16], [48.0, 48.56], [52.0, 52.44], [54.0, 62.13], [62.0, 102.49], [110.0, 111.38], [115.0, 119.57], [120.0, 126.67], [137.0, 140.05], [140.0, 148.2], [154.0, 157.38], [162.0, 162.24], [162.0, 172.49], [173.0, 172.94]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, false, false], "silence_prob": [30.79, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 0.0, 30.93, 0.0, 0.0, 30.77, 30.49, 31.98, 34.55, 38.08, 0.0, 32.61, 0.0], "audiomae_on_audioset": [[["music", 45.65], ["boing", 16.82], ["speech", 13.45]], null, null, null, null, null, null, null, [["music", 50.05], ["sampler", 9.88], ["electronic music", 4.94]], null, null, [["music", 59.16], ["musical instrument", 7.25], ["synthesizer", 5.69]], [["music", 79.94], ["hum", 4.69], ["grunt", 2.72]], [["speech", 39.19], ["music", 18.63], ["synthesizer", 5.1]], [["speech", 45.29], ["music", 15.86], ["explosion", 11.17]], [["speech", 29.82], ["music", 27.74], ["bleat", 4.05]], null, [["fly, housefly", 45.02], ["insect", 16.7], ["speech", 11.24]], null], "duration": [13.81, 0.19, 0.86, 2.35, 1.37, 1.16, 0.56, 0.44, 8.13, 40.49, 1.38, 4.57, 6.67, 3.05, 8.2, 3.38, 0.24, 10.49, -0.06]} \ No newline at end of file diff --git a/annotations_1/m9aEg5dlFOI_filtered.json b/annotations_1/m9aEg5dlFOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4955a5bbc919cc4ec10ba29f8f27f31e969d9c9 --- /dev/null +++ b/annotations_1/m9aEg5dlFOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 49.81], [50.0, 53.6], [60.0, 65.3], [67.0, 67.66], [70.0, 70.53], [71.0, 71.15], [74.0, 76.79], [79.0, 78.9], [84.0, 85.58], [87.0, 88.33], [89.0, 90.17], [93.0, 95.25], [97.0, 98.93], [100.0, 101.83], [141.0, 141.1], [153.0, 153.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 61.08, 77.2, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 0.0, 54.5, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.19, 3.6, 5.3, 0.66, 0.53, 0.15, 2.79, -0.1, 1.58, 1.33, 1.17, 2.25, 1.93, 1.83, 0.1, 0.22]} \ No newline at end of file diff --git a/annotations_1/mAB-hSPmzjk_filtered.json b/annotations_1/mAB-hSPmzjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..066bb53794fb4ac910b9fe9e9f31fcfc5fa77ece --- /dev/null +++ b/annotations_1/mAB-hSPmzjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 25.84], [29.0, 32.31], [34.0, 37.84], [39.0, 39.93], [42.0, 54.41], [56.0, 60.54], [61.0, 80.37]], "keep_status": [true, true, true, false, false, false, false], "silence_prob": [30.84, 31.76, 30.27, 0.0, 30.37, 30.92, 31.55], "audiomae_on_audioset": [[["hum", 28.51], ["music", 21.67], ["musical instrument", 8.35]], [["music", 46.87], ["hum", 7.8], ["musical instrument", 4.93]], [["hum", 30.94], ["music", 22.78], ["mains hum", 11.04]], null, [["music", 51.94], ["synthesizer", 14.32], ["musical instrument", 8.32]], [["hum", 56.47], ["mains hum", 25.3], ["throbbing", 7.64]], [["music", 44.22], ["hum", 23.36], ["throbbing", 5.88]]], "duration": [5.84, 3.31, 3.84, 0.93, 12.41, 4.54, 19.37]} \ No newline at end of file diff --git a/annotations_1/mAD2gJTRSbI_filtered.json b/annotations_1/mAD2gJTRSbI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73f773ba462a087616f76b5c52644cc3382917aa --- /dev/null +++ b/annotations_1/mAD2gJTRSbI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.19], [6.0, 6.2], [7.0, 8.55], [15.0, 15.53], [18.0, 19.11], [31.0, 30.96], [33.0, 35.38], [37.0, 104.65], [109.0, 110.47], [119.0, 119.01], [119.0, 119.06], [119.0, 119.28], [126.0, 126.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.19, 0.2, 1.55, 0.53, 1.11, -0.04, 2.38, 67.65, 1.47, 0.01, 0.06, 0.28, 0.0]} \ No newline at end of file diff --git a/annotations_1/mBiT0g4TIYc_filtered.json b/annotations_1/mBiT0g4TIYc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be1c32d52f387ddc392a51636900e874f8692bbc --- /dev/null +++ b/annotations_1/mBiT0g4TIYc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [3.0, 2.96], [5.0, 5.46], [6.0, 13.36], [16.0, 15.79], [16.0, 16.63], [19.0, 19.68], [21.0, 21.46], [22.0, 22.03], [25.0, 26.0], [28.0, 28.21], [30.0, 36.39], [38.0, 38.94], [45.0, 45.12], [49.0, 51.66], [61.0, 73.13], [75.0, 82.65], [92.0, 93.48], [95.0, 101.01], [102.0, 102.64], [104.0, 137.54], [140.0, 143.24], [143.0, 143.73], [146.0, 147.53]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 36.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.77, 0.0, 0.0, 29.95, 29.65, 29.05, 0.0, 29.74, 0.0, 0.0, 33.48, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 26.49], ["speech", 15.68], ["mains hum", 11.2]], null, null, null, null, null, null, null, null, null, null, [["speech", 47.13], ["music", 17.81], ["didgeridoo", 2.9]], [["music", 88.27], ["musical instrument", 3.5], ["piano", 0.88]], [["music", 61.22], ["musical instrument", 5.27], ["clarinet", 3.86]], null, [["music", 56.73], ["musical instrument", 9.87], ["brass instrument", 4.36]], null, null, [["throbbing", 45.81], ["music", 18.3], ["heart sounds, heartbeat", 8.36]], null, null], "duration": [0.24, -0.04, 0.46, 7.36, -0.21, 0.63, 0.68, 0.46, 0.03, 1.0, 0.21, 6.39, 0.94, 0.12, 2.66, 12.13, 7.65, 1.48, 6.01, 0.64, 33.54, 3.24, 0.73, 1.53]} \ No newline at end of file diff --git a/annotations_1/mCSno4xODKY_filtered.json b/annotations_1/mCSno4xODKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5238c634b4b0756e9df0616b281d1398f22dba47 --- /dev/null +++ b/annotations_1/mCSno4xODKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.55], [20.0, 20.22], [21.0, 22.72], [25.0, 24.66], [25.0, 27.73], [31.0, 31.67], [33.0, 36.86], [50.0, 65.2], [70.0, 82.83], [83.0, 84.75]], "keep_status": [false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 57.56, 32.21, 58.38, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["throbbing", 26.77], ["hum", 25.4], ["mains hum", 14.93]], null, null], "duration": [0.55, 0.22, 1.72, -0.34, 2.73, 0.67, 3.86, 15.2, 12.83, 1.75]} \ No newline at end of file diff --git a/annotations_1/mCfKPXX19Gw_filtered.json b/annotations_1/mCfKPXX19Gw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0fd8b642ed2e12c3f931d4bcb09d2966b1ba527 --- /dev/null +++ b/annotations_1/mCfKPXX19Gw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 30.06], [33.0, 80.65], [85.0, 106.19], [108.0, 152.63], [154.0, 153.94]], "keep_status": [false, false, true, false, false], "silence_prob": [30.6, 0.0, 33.53, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.41], ["buzzer", 16.18], ["alarm", 11.94]], null, [["music", 47.73], ["hum", 12.14], ["rumble", 9.2]], null, null], "duration": [19.06, 47.65, 21.19, 44.63, -0.06]} \ No newline at end of file diff --git a/annotations_1/mCsu9hGvNEc_filtered.json b/annotations_1/mCsu9hGvNEc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..79b0af36476acf461497fec8a278ae9f6614a7c9 --- /dev/null +++ b/annotations_1/mCsu9hGvNEc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.26], [5.0, 5.29], [8.0, 8.53], [10.0, 11.92], [15.0, 15.52], [16.0, 17.31], [17.0, 18.57], [20.0, 20.46], [28.0, 28.65], [31.0, 30.69], [33.0, 33.12], [36.0, 37.54], [40.0, 40.54], [43.0, 44.15], [50.0, 50.03], [58.0, 68.86], [69.0, 71.68], [73.0, 81.09], [89.0, 89.55], [107.0, 107.96], [109.0, 109.78], [118.0, 121.61], [124.0, 126.72], [127.0, 126.79], [127.0, 150.48], [151.0, 158.84], [164.0, 168.76], [169.0, 177.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 94.22, 0.0, 0.0, 0.0, 99.98, 99.98, 0.0, 99.73, 97.83, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 0.29, 0.53, 1.92, 0.52, 1.31, 1.57, 0.46, 0.65, -0.31, 0.12, 1.54, 0.54, 1.15, 0.03, 10.86, 2.68, 8.09, 0.55, 0.96, 0.78, 3.61, 2.72, -0.21, 23.48, 7.84, 4.76, 8.92]} \ No newline at end of file diff --git a/annotations_1/mExTnHwAcYY_filtered.json b/annotations_1/mExTnHwAcYY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4197a8f89b3ed95e7567ed6568c7bb7cc2e3a96 --- /dev/null +++ b/annotations_1/mExTnHwAcYY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.45], [12.0, 13.47], [17.0, 23.25], [25.0, 25.35], [27.0, 27.14], [30.0, 29.93], [46.0, 51.02], [52.0, 54.04], [54.0, 56.54], [58.0, 58.46], [59.0, 67.74], [69.0, 69.15], [69.0, 74.24], [76.0, 77.9], [80.0, 80.76], [85.0, 88.05], [89.0, 93.01], [94.0, 99.03], [103.0, 104.04], [104.0, 105.11], [107.0, 107.43], [108.0, 108.92], [111.0, 116.82], [119.0, 124.36], [126.0, 127.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.66, 0.0, 84.43, 0.0, 0.0, 0.0, 100.0, 100.0, 99.4, 0.0, 99.68, 0.0, 97.33, 0.0, 0.0, 99.82, 87.37, 98.27, 0.0, 0.0, 0.0, 0.0, 89.19, 95.37, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.45, 1.47, 6.25, 0.35, 0.14, -0.07, 5.02, 2.04, 2.54, 0.46, 8.74, 0.15, 5.24, 1.9, 0.76, 3.05, 4.01, 5.03, 1.04, 1.11, 0.43, 0.92, 5.82, 5.36, 1.06]} \ No newline at end of file diff --git a/annotations_1/mFA9-zsFtt8_filtered.json b/annotations_1/mFA9-zsFtt8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54eaa71e9ac978df423d7687032a7664f6478d90 --- /dev/null +++ b/annotations_1/mFA9-zsFtt8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 29.24], [32.0, 33.49], [36.0, 36.04], [37.0, 38.13], [39.0, 44.41], [46.0, 47.17], [50.0, 50.3], [65.0, 65.7], [68.0, 68.67], [69.0, 72.23], [73.0, 74.09], [78.0, 80.49], [84.0, 89.21], [91.0, 91.71], [95.0, 96.79], [104.0, 104.53], [112.0, 112.29], [116.0, 116.26], [117.0, 118.67], [120.0, 120.63], [121.0, 122.34], [125.0, 125.25], [126.0, 126.05], [126.0, 126.2], [130.0, 130.65], [133.0, 133.64], [140.0, 142.69], [145.0, 146.04], [146.0, 146.97], [149.0, 149.69], [150.0, 162.3], [170.0, 170.11], [171.0, 172.39], [178.0, 182.36], [189.0, 194.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [73.97, 0.0, 0.0, 0.0, 60.98, 0.0, 0.0, 0.0, 0.0, 44.15, 0.0, 43.56, 44.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.89, 0.0, 0.0, 0.0, 35.49, 0.0, 0.0, 36.35, 37.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 57.64], ["hum", 9.42], ["music", 9.02]], null, [["speech", 53.74], ["hum", 9.11], ["music", 4.8]], [["sidetone", 50.39], ["speech", 15.87], ["music", 8.02]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.15], ["throbbing", 5.21], ["hum", 4.17]], null, null, null, [["music", 52.64], ["trance music", 7.31], ["techno", 6.6]], null, null, [["music", 51.53], ["electronic music", 10.27], ["techno", 9.04]], [["music", 65.4], ["electronic music", 5.69], ["techno", 4.65]]], "duration": [8.24, 1.49, 0.04, 1.13, 5.41, 1.17, 0.3, 0.7, 0.67, 3.23, 1.09, 2.49, 5.21, 0.71, 1.79, 0.53, 0.29, 0.26, 1.67, 0.63, 1.34, 0.25, 0.05, 0.2, 0.65, 0.64, 2.69, 1.04, 0.97, 0.69, 12.3, 0.11, 1.39, 4.36, 5.26]} \ No newline at end of file diff --git a/annotations_1/mFH_r2w28rM_filtered.json b/annotations_1/mFH_r2w28rM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c2f47a4926bfc154b42530d439d5064eddb98ee --- /dev/null +++ b/annotations_1/mFH_r2w28rM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.19], [0.0, 0.43], [6.0, 5.85], [8.0, 8.7], [13.0, 15.9], [25.0, 25.15], [26.0, 26.37], [32.0, 32.31], [36.0, 36.21], [38.0, 39.14], [40.0, 40.47], [44.0, 44.47], [51.0, 52.54], [65.0, 74.85], [75.0, 79.24], [80.0, 81.77], [90.0, 89.83], [94.0, 94.29], [95.0, 94.91], [101.0, 103.22], [105.0, 105.44], [106.0, 107.55], [116.0, 117.56], [119.0, 119.23], [121.0, 121.98], [131.0, 130.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.97, 85.35, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.19, 0.43, -0.15, 0.7, 2.9, 0.15, 0.37, 0.31, 0.21, 1.14, 0.47, 0.47, 1.54, 9.85, 4.24, 1.77, -0.17, 0.29, -0.09, 2.22, 0.44, 1.55, 1.56, 0.23, 0.98, -0.26]} \ No newline at end of file diff --git a/annotations_1/mFl8nzZuExE_filtered.json b/annotations_1/mFl8nzZuExE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf9d9438c77bd3fb2773443df32d4bc22be10daf --- /dev/null +++ b/annotations_1/mFl8nzZuExE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.21], [8.0, 10.99], [25.0, 25.59], [29.0, 29.71], [38.0, 37.61], [41.0, 41.93], [44.0, 44.36], [51.0, 51.19], [53.0, 52.66], [53.0, 53.65], [60.0, 61.45], [66.0, 89.26], [90.0, 91.2], [96.0, 96.85], [101.0, 102.76], [110.0, 110.86], [112.0, 113.12], [124.0, 125.0], [136.0, 135.68], [149.0, 149.59], [152.0, 153.01], [170.0, 169.69], [176.0, 176.59], [177.0, 180.06], [184.0, 184.18], [187.0, 187.69], [192.0, 197.29], [197.0, 197.45], [198.0, 198.73], [199.0, 202.15], [210.0, 210.61]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 33.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.2, 0.0, 0.0, 33.89, 0.0, 0.0, 43.0, 0.0], "audiomae_on_audioset": [null, [["thunk", 28.02], ["breaking", 24.32], ["creak", 14.07]], null, null, null, null, null, null, null, null, null, [["music", 72.01], ["breaking", 8.72], ["hum", 2.59]], null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 56.04], ["moo", 22.61], ["livestock, farm animals, working animals", 18.35]], null, null, [["music", 17.42], ["moo", 6.52], ["crowd", 6.49]], null, null, [["music", 60.77], ["speech", 10.0], ["electronic music", 2.52]], null], "duration": [0.21, 2.99, 0.59, 0.71, -0.39, 0.93, 0.36, 0.19, -0.34, 0.65, 1.45, 23.26, 1.2, 0.85, 1.76, 0.86, 1.12, 1.0, -0.32, 0.59, 1.01, -0.31, 0.59, 3.06, 0.18, 0.69, 5.29, 0.45, 0.73, 3.15, 0.61]} \ No newline at end of file diff --git a/annotations_1/mGAaR9KKszs_filtered.json b/annotations_1/mGAaR9KKszs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfb8a6ad29b5a239518d1ec7c71bef5ff0663b3f --- /dev/null +++ b/annotations_1/mGAaR9KKszs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 26.92], [28.0, 28.75], [48.0, 49.49], [50.0, 50.38], [52.0, 53.2], [64.0, 67.44], [68.0, 68.01], [70.0, 70.95], [74.0, 74.28], [76.0, 77.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 47.77], ["music", 26.17], ["thunk", 3.98]], null, null, null, null], "duration": [-0.08, 0.75, 1.49, 0.38, 1.2, 3.44, 0.01, 0.95, 0.28, 1.01]} \ No newline at end of file diff --git a/annotations_1/mG_G5waoSeo_filtered.json b/annotations_1/mG_G5waoSeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25fbaf6d375db6a8452cfd072d4c6e7224c21211 --- /dev/null +++ b/annotations_1/mG_G5waoSeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.56], [8.0, 12.78], [14.0, 14.71], [20.0, 21.27], [24.0, 24.85], [27.0, 27.9], [30.0, 30.84], [45.0, 46.99], [48.0, 54.7], [56.0, 56.57], [57.0, 60.56], [61.0, 66.92], [69.0, 84.27], [87.0, 87.72], [89.0, 100.6], [104.0, 113.98], [116.0, 115.87], [117.0, 126.57], [135.0, 136.58], [156.0, 171.46]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.84, 0.0, 32.34, 30.83, 28.38, 0.0, 28.25, 28.16, 0.0, 28.23, 0.0, 28.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 17.77], ["hum", 14.41], ["firecracker", 8.12]], null, [["fly, housefly", 13.34], ["whack, thwack", 12.49], ["groan", 11.56]], [["speech", 40.07], ["cattle, bovinae", 5.57], ["hubbub, speech noise, speech babble", 4.23]], [["music", 61.26], ["speech", 24.92], ["hum", 2.04]], null, [["music", 92.15], ["electronic music", 1.53], ["speech", 1.4]], [["music", 65.6], ["speech", 7.71], ["throbbing", 3.98]], null, [["music", 70.14], ["cattle, bovinae", 5.48], ["moo", 4.48]], null, [["music", 61.21], ["sidetone", 15.7], ["speech", 5.71]]], "duration": [0.56, 4.78, 0.71, 1.27, 0.85, 0.9, 0.84, 1.99, 6.7, 0.57, 3.56, 5.92, 15.27, 0.72, 11.6, 9.98, -0.13, 9.57, 1.58, 15.46]} \ No newline at end of file diff --git a/annotations_1/mHGHJwXWh1k_filtered.json b/annotations_1/mHGHJwXWh1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fe861aed5757d51726c69ab4a4761b7f3665dc4 --- /dev/null +++ b/annotations_1/mHGHJwXWh1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.35], [14.0, 14.39], [23.0, 25.25], [25.0, 25.29], [26.0, 25.64], [26.0, 26.1], [26.0, 28.93], [30.0, 41.34], [45.0, 45.89], [46.0, 48.24], [50.0, 99.22], [103.0, 105.39], [110.0, 109.7], [110.0, 117.68], [121.0, 122.1], [123.0, 144.21]], "keep_status": [false, false, true, false, false, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 31.92, 0.0, 0.0, 0.0, 34.51, 35.28, 0.0, 32.08, 0.0, 36.14, 0.0, 32.81, 0.0, 32.73], "audiomae_on_audioset": [null, null, [["speech", 57.54], ["fly, housefly", 6.31], ["insect", 3.69]], null, null, null, [["cattle, bovinae", 42.94], ["livestock, farm animals, working animals", 23.92], ["moo", 21.87]], [["music", 67.87], ["speech", 8.71], ["synthesizer", 3.59]], null, [["moo", 25.28], ["cattle, bovinae", 21.59], ["music", 12.32]], null, [["music", 37.52], ["synthesizer", 7.8], ["didgeridoo", 6.18]], null, [["music", 70.01], ["theremin", 6.48], ["didgeridoo", 5.79]], null, [["speech", 35.83], ["music", 23.66], ["musical instrument", 9.17]]], "duration": [0.35, 0.39, 2.25, 0.29, -0.36, 0.1, 2.93, 11.34, 0.89, 2.24, 49.22, 2.39, -0.3, 7.68, 1.1, 21.21]} \ No newline at end of file diff --git a/annotations_1/mHRbCgVCbIA_filtered.json b/annotations_1/mHRbCgVCbIA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eca838ee6b3f9c2eced630dc1d3d24195b04d5ab --- /dev/null +++ b/annotations_1/mHRbCgVCbIA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.1], [21.0, 21.03], [29.0, 29.93], [32.0, 33.37], [34.0, 33.99], [44.0, 44.17], [44.0, 44.36], [59.0, 59.68], [62.0, 71.63], [74.0, 75.61], [83.0, 83.3], [89.0, 89.73], [102.0, 103.06], [106.0, 107.08], [109.0, 109.16], [114.0, 113.9], [116.0, 117.86], [119.0, 119.04], [120.0, 121.37], [133.0, 133.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 77.62], ["animal", 11.03], ["roaring cats (lions, tigers)", 1.27]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.1, 0.03, 0.93, 1.37, -0.01, 0.17, 0.36, 0.68, 9.63, 1.61, 0.3, 0.73, 1.06, 1.08, 0.16, -0.1, 1.86, 0.04, 1.37, 0.44]} \ No newline at end of file diff --git a/annotations_1/mI6O2d4Ieok_filtered.json b/annotations_1/mI6O2d4Ieok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68dacbeafd1ef30258064e164e4f47ef10b752a0 --- /dev/null +++ b/annotations_1/mI6O2d4Ieok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.17], [8.0, 17.86], [18.0, 25.44], [31.0, 34.4], [37.0, 42.99], [48.0, 48.84], [49.0, 51.85], [55.0, 59.09], [63.0, 63.51], [73.0, 85.83], [89.0, 93.72], [100.0, 102.68], [105.0, 116.45], [117.0, 117.29], [118.0, 118.5], [120.0, 134.23], [136.0, 137.4], [146.0, 154.62], [159.0, 174.46]], "keep_status": [false, false, false, true, true, false, true, false, false, true, false, true, true, false, false, false, false, true, true], "silence_prob": [0.0, 33.64, 34.5, 31.45, 32.22, 0.0, 33.15, 31.22, 0.0, 31.62, 34.53, 31.34, 31.63, 0.0, 0.0, 32.35, 0.0, 34.65, 32.26], "audiomae_on_audioset": [null, [["sidetone", 35.38], ["music", 24.63], ["speech", 13.3]], [["music", 46.45], ["hum", 17.03], ["throbbing", 16.29]], [["music", 25.92], ["speech", 15.48], ["electronic music", 8.32]], [["cattle, bovinae", 22.69], ["music", 20.65], ["moo", 20.61]], null, [["music", 41.68], ["speech", 10.68], ["fly, housefly", 4.44]], [["music", 54.44], ["speech", 19.29], ["electronic music", 2.36]], null, [["music", 29.29], ["speech", 18.03], ["hum", 7.02]], [["music", 61.44], ["throbbing", 6.48], ["hum", 6.29]], [["speech", 54.22], ["vehicle", 5.77], ["breaking", 3.89]], [["cattle, bovinae", 26.86], ["livestock, farm animals, working animals", 17.43], ["music", 17.2]], null, null, [["music", 45.34], ["speech", 27.88], ["electric shaver, electric razor", 5.18]], null, [["hum", 34.61], ["mains hum", 27.16], ["speech", 4.45]], [["music", 28.16], ["livestock, farm animals, working animals", 9.21], ["fly, housefly", 6.93]]], "duration": [1.17, 9.86, 7.44, 3.4, 5.99, 0.84, 2.85, 4.09, 0.51, 12.83, 4.72, 2.68, 11.45, 0.29, 0.5, 14.23, 1.4, 8.62, 15.46]} \ No newline at end of file diff --git a/annotations_1/mIGCgzqFR0s_filtered.json b/annotations_1/mIGCgzqFR0s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5bb88932fcae499056b171299baaa5e24fe3dfaa --- /dev/null +++ b/annotations_1/mIGCgzqFR0s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.83], [12.0, 19.28], [20.0, 41.03], [42.0, 42.13], [44.0, 44.63], [46.0, 52.19], [53.0, 54.11], [57.0, 58.33], [63.0, 63.0], [65.0, 64.81], [67.0, 67.76], [71.0, 71.1], [78.0, 79.68], [80.0, 80.89], [85.0, 86.37], [89.0, 88.92], [94.0, 95.69], [96.0, 97.04], [104.0, 104.4], [106.0, 106.3], [110.0, 113.05], [113.0, 113.1], [113.0, 113.16], [114.0, 117.1], [120.0, 120.83], [123.0, 123.92], [131.0, 130.86], [132.0, 133.79], [135.0, 135.53], [140.0, 141.69], [151.0, 151.98], [155.0, 155.22], [169.0, 170.36], [175.0, 175.17], [177.0, 177.75], [180.0, 180.3], [181.0, 181.58], [183.0, 191.78], [193.0, 193.75], [196.0, 195.83], [208.0, 210.37], [213.0, 213.21], [222.0, 222.34], [228.0, 228.6], [235.0, 236.26], [239.0, 239.52], [240.0, 241.47], [246.0, 248.32], [255.0, 255.01], [270.0, 271.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 45.24, 29.16, 0.0, 0.0, 32.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.68, 0.0, 0.0, 35.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.38, 0.0, 0.0, 44.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.72, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.51], ["electronic music", 9.42], ["noise", 6.97]], [["music", 64.11], ["synthesizer", 3.51], ["musical instrument", 3.48]], null, null, [["music", 64.81], ["speech", 10.88], ["animal", 2.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.28], ["music", 37.16], ["theremin", 6.05]], null, null, [["boing", 37.77], ["music", 29.73], ["speech", 7.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.13], ["throat clearing", 10.02], ["oink", 7.27]], null, null, null, null, null, null, [["music", 42.88], ["speech", 18.7], ["synthesizer", 5.93]], null, null], "duration": [-0.17, 7.28, 21.03, 0.13, 0.63, 6.19, 1.11, 1.33, 0.0, -0.19, 0.76, 0.1, 1.68, 0.89, 1.37, -0.08, 1.69, 1.04, 0.4, 0.3, 3.05, 0.1, 0.16, 3.1, 0.83, 0.92, -0.14, 1.79, 0.53, 1.69, 0.98, 0.22, 1.36, 0.17, 0.75, 0.3, 0.58, 8.78, 0.75, -0.17, 2.37, 0.21, 0.34, 0.6, 1.26, 0.52, 1.47, 2.32, 0.01, 1.61]} \ No newline at end of file diff --git a/annotations_1/mIeU7y3CGKQ_filtered.json b/annotations_1/mIeU7y3CGKQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8dfeee5298a3849c9621e9b58999deeb91efbfac --- /dev/null +++ b/annotations_1/mIeU7y3CGKQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.14], [7.0, 10.29], [13.0, 17.31], [17.0, 17.37], [24.0, 26.59], [27.0, 29.78], [31.0, 33.42], [38.0, 43.71], [46.0, 57.37], [58.0, 58.5], [59.0, 58.55], [59.0, 58.62], [63.0, 68.2], [71.0, 83.94]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [30.84, 29.75, 29.89, 0.0, 30.02, 30.06, 30.07, 29.14, 29.08, 0.0, 0.0, 0.0, 29.45, 29.35], "audiomae_on_audioset": [[["music", 67.34], ["electronic music", 4.61], ["speech", 4.0]], [["music", 67.73], ["electronic music", 4.69], ["house music", 3.88]], [["music", 64.78], ["trance music", 10.31], ["sampler", 3.77]], null, [["music", 80.66], ["trance music", 4.76], ["electronic music", 2.94]], [["music", 77.7], ["trance music", 2.85], ["electronic music", 2.67]], [["music", 71.27], ["trance music", 5.42], ["electronic music", 3.91]], [["music", 55.9], ["throbbing", 5.51], ["hum", 4.06]], [["music", 76.47], ["electronic music", 1.73], ["trance music", 1.34]], null, null, null, [["music", 69.19], ["electronic music", 5.57], ["trance music", 2.93]], [["music", 77.99], ["trance music", 3.57], ["house music", 2.44]]], "duration": [2.14, 3.29, 4.31, 0.37, 2.59, 2.78, 2.42, 5.71, 11.37, 0.5, -0.45, -0.38, 5.2, 12.94]} \ No newline at end of file diff --git a/annotations_1/mM5dRMY2u28_filtered.json b/annotations_1/mM5dRMY2u28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..883264843d44f4878c4049face3691171a5aeeb3 --- /dev/null +++ b/annotations_1/mM5dRMY2u28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.04], [16.0, 16.7], [18.0, 19.11], [20.0, 21.49], [45.0, 45.47], [50.0, 50.26], [51.0, 51.56], [52.0, 52.91], [54.0, 54.8], [72.0, 72.4], [84.0, 84.43], [86.0, 87.29], [90.0, 90.71], [109.0, 109.34], [116.0, 117.0], [119.0, 125.51], [126.0, 129.1], [136.0, 137.37], [140.0, 141.81], [147.0, 148.53], [151.0, 151.12], [154.0, 154.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.3, 43.61, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 73.72], ["singing", 1.71], ["folk music", 1.62]], [["music", 82.81], ["singing", 1.74], ["musical instrument", 1.07]], null, null, null, null, null], "duration": [0.04, 0.7, 1.11, 1.49, 0.47, 0.26, 0.56, 0.91, 0.8, 0.4, 0.43, 1.29, 0.71, 0.34, 1.0, 6.51, 3.1, 1.37, 1.81, 1.53, 0.12, 0.89]} \ No newline at end of file diff --git a/annotations_1/mNUnCTKwS8Q_filtered.json b/annotations_1/mNUnCTKwS8Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1652671dc78d85d451c0ef6400f48738ae0a973e --- /dev/null +++ b/annotations_1/mNUnCTKwS8Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 30.4], [31.0, 31.92], [33.0, 45.22], [46.0, 48.88], [49.0, 50.68], [54.0, 54.53], [55.0, 55.95], [58.0, 58.23], [59.0, 59.39], [70.0, 71.96], [78.0, 78.68], [80.0, 80.38], [81.0, 82.12], [83.0, 83.83], [94.0, 97.41], [99.0, 99.28], [99.0, 100.35], [112.0, 122.61], [128.0, 128.98], [130.0, 130.32], [131.0, 133.32], [136.0, 153.77], [159.0, 160.79], [161.0, 160.83], [161.0, 160.86], [164.0, 168.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [30.14, 0.0, 58.13, 65.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 0.0, 84.43, 0.0, 0.0, 74.76, 34.39, 0.0, 0.0, 0.0, 29.8], "audiomae_on_audioset": [[["music", 47.14], ["hum", 18.36], ["mains hum", 11.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 40.1], ["throbbing", 25.61], ["music", 11.29]], null, null, null, [["speech", 40.61], ["music", 20.56], ["whack, thwack", 4.15]]], "duration": [29.4, 0.92, 12.22, 2.88, 1.68, 0.53, 0.95, 0.23, 0.39, 1.96, 0.68, 0.38, 1.12, 0.83, 3.41, 0.28, 1.35, 10.61, 0.98, 0.32, 2.32, 17.77, 1.79, -0.17, -0.14, 4.42]} \ No newline at end of file diff --git a/annotations_1/mNd16XocjBg_filtered.json b/annotations_1/mNd16XocjBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..247dfdd759ff3518071f256373660453908fc7ab --- /dev/null +++ b/annotations_1/mNd16XocjBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [3.0, 3.89], [5.0, 6.64], [8.0, 8.14], [10.0, 10.59], [15.0, 14.99], [17.0, 17.69], [19.0, 18.87], [20.0, 20.6], [23.0, 23.82], [26.0, 27.43], [29.0, 29.51], [33.0, 34.38], [38.0, 38.13], [45.0, 45.86], [48.0, 48.71], [52.0, 54.19], [56.0, 57.52], [61.0, 61.16], [63.0, 63.32], [67.0, 67.22], [70.0, 70.6], [76.0, 77.45], [80.0, 80.86], [82.0, 82.63], [86.0, 85.9], [87.0, 87.56], [92.0, 92.87], [94.0, 94.37], [97.0, 99.66], [102.0, 102.59], [109.0, 109.8], [110.0, 111.57], [115.0, 115.94], [117.0, 117.98], [120.0, 120.48], [121.0, 122.66], [123.0, 124.02], [127.0, 128.98], [133.0, 133.34], [135.0, 135.84], [140.0, 142.03], [143.0, 143.73], [146.0, 146.96], [152.0, 152.54], [153.0, 156.49], [158.0, 160.2], [162.0, 164.47], [170.0, 170.88], [172.0, 173.13], [175.0, 177.65], [179.0, 184.45], [185.0, 187.27], [188.0, 188.55], [190.0, 191.0], [192.0, 192.6], [194.0, 194.83], [197.0, 196.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 100.0, 85.72, 79.76, 0.0, 0.0, 55.11, 64.41, 51.39, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 0.89, 1.64, 0.14, 0.59, -0.01, 0.69, -0.13, 0.6, 0.82, 1.43, 0.51, 1.38, 0.13, 0.86, 0.71, 2.19, 1.52, 0.16, 0.32, 0.22, 0.6, 1.45, 0.86, 0.63, -0.1, 0.56, 0.87, 0.37, 2.66, 0.59, 0.8, 1.57, 0.94, 0.98, 0.48, 1.66, 1.02, 1.98, 0.34, 0.84, 2.03, 0.73, 0.96, 0.54, 3.49, 2.2, 2.47, 0.88, 1.13, 2.65, 5.45, 2.27, 0.55, 1.0, 0.6, 0.83, -0.06]} \ No newline at end of file diff --git a/annotations_1/mOicvmEloyY_filtered.json b/annotations_1/mOicvmEloyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77965f8e141ab7058ded28a42f550e95016b45e0 --- /dev/null +++ b/annotations_1/mOicvmEloyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.34], [10.0, 21.49], [29.0, 31.13], [34.0, 34.8], [37.0, 37.61], [40.0, 43.46], [45.0, 46.14], [47.0, 47.29], [49.0, 49.67], [50.0, 50.65], [53.0, 55.05], [56.0, 57.06], [59.0, 60.2], [61.0, 66.85], [68.0, 69.82], [72.0, 87.08], [88.0, 88.42], [89.0, 111.25], [112.0, 112.65], [113.0, 115.89], [117.0, 118.2], [125.0, 125.85], [127.0, 128.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 86.64, 59.15, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 46.22, 0.0, 71.43, 0.0, 98.8, 0.0, 37.67, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 34.74], ["radio", 18.59], ["noise", 12.12]], null, null, null, null, null, [["bee, wasp, etc.", 46.94], ["fly, housefly", 28.35], ["insect", 17.37]], null, null, null], "duration": [1.34, 11.49, 2.13, 0.8, 0.61, 3.46, 1.14, 0.29, 0.67, 0.65, 2.05, 1.06, 1.2, 5.85, 1.82, 15.08, 0.42, 22.25, 0.65, 2.89, 1.2, 0.85, 1.24]} \ No newline at end of file diff --git a/annotations_1/mPWo1Dsti3c_filtered.json b/annotations_1/mPWo1Dsti3c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0156d2aa951311df033b8abcc390f1ed355e1427 --- /dev/null +++ b/annotations_1/mPWo1Dsti3c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.53], [3.0, 4.29], [6.0, 6.91], [10.0, 10.56], [17.0, 19.85], [20.0, 37.96], [39.0, 40.8], [41.0, 41.81], [51.0, 51.95], [55.0, 55.93], [57.0, 57.32], [58.0, 58.35], [61.0, 76.22], [85.0, 85.36]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.22, 29.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.18, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 16.74], ["noise", 15.54], ["hum", 12.22]], [["music", 36.78], ["speech", 28.92], ["sidetone", 6.89]], null, null, null, null, null, null, [["music", 31.71], ["speech", 23.72], ["throbbing", 18.2]], null], "duration": [1.53, 1.29, 0.91, 0.56, 2.85, 17.96, 1.8, 0.81, 0.95, 0.93, 0.32, 0.35, 15.22, 0.36]} \ No newline at end of file diff --git a/annotations_1/mQTPziHf9Qc_filtered.json b/annotations_1/mQTPziHf9Qc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71f8815e063084e58f9f9a5db64bf97c1c561774 --- /dev/null +++ b/annotations_1/mQTPziHf9Qc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.08], [9.0, 9.78], [19.0, 20.44], [23.0, 24.11], [36.0, 37.83], [40.0, 41.44], [44.0, 43.63], [45.0, 45.42], [49.0, 51.98], [53.0, 53.89], [57.0, 58.11], [63.0, 67.41], [80.0, 80.69], [84.0, 92.1], [95.0, 96.15], [98.0, 100.03], [102.0, 103.86], [110.0, 111.55], [112.0, 116.26], [124.0, 152.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 55.31, 0.0, 33.07, 0.0, 33.95, 0.0, 0.0, 33.92, 48.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 84.09], ["singing", 1.77], ["soul music", 1.37]], null, [["music", 66.13], ["bass guitar", 3.48], ["musical instrument", 3.25]], null, null, [["music", 73.89], ["singing", 6.4], ["song", 1.56]], [["music", 60.15], ["effects unit", 4.3], ["musical instrument", 3.29]]], "duration": [1.08, 0.78, 1.44, 1.11, 1.83, 1.44, -0.37, 0.42, 2.98, 0.89, 1.11, 4.41, 0.69, 8.1, 1.15, 2.03, 1.86, 1.55, 4.26, 28.86]} \ No newline at end of file diff --git a/annotations_1/mRIaK9Vf0Ns_filtered.json b/annotations_1/mRIaK9Vf0Ns_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f3a3d7b1a411fecb3bf0c5fb3028d50f50b8978d --- /dev/null +++ b/annotations_1/mRIaK9Vf0Ns_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 23.35], [25.0, 32.37], [33.0, 41.0], [43.0, 43.66], [44.0, 48.86], [51.0, 98.66], [100.0, 100.8], [107.0, 106.69], [107.0, 109.95], [110.0, 110.94], [114.0, 128.29], [133.0, 136.48], [140.0, 140.86], [142.0, 142.82], [146.0, 147.07], [149.0, 157.96], [159.0, 159.11], [159.0, 159.14], [159.0, 159.17], [159.0, 159.21], [159.0, 159.24], [159.0, 164.93], [167.0, 168.03], [171.0, 172.17], [173.0, 182.11], [183.0, 184.5]], "keep_status": [false, true, true, false, true, false, false, false, true, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, true, false], "silence_prob": [32.61, 33.15, 37.03, 0.0, 36.59, 0.0, 0.0, 0.0, 33.48, 0.0, 32.27, 31.73, 0.0, 0.0, 0.0, 35.93, 0.0, 0.0, 0.0, 0.0, 0.0, 33.46, 0.0, 0.0, 32.07, 0.0], "audiomae_on_audioset": [[["hum", 31.14], ["throbbing", 28.24], ["music", 15.22]], [["speech", 24.89], ["music", 15.82], ["mosquito", 12.01]], [["music", 15.2], ["hum", 9.79], ["fly, housefly", 8.96]], null, [["music", 28.38], ["whale vocalization", 6.28], ["rumble", 3.71]], null, null, null, [["music", 21.22], ["hum", 17.76], ["animal", 7.37]], null, [["music", 33.71], ["speech", 30.13], ["hum", 9.55]], [["music", 41.31], ["hum", 7.8], ["animal", 7.74]], null, null, null, [["speech", 18.17], ["music", 14.95], ["noise", 7.66]], null, null, null, null, null, [["music", 29.91], ["didgeridoo", 9.21], ["cacophony", 7.19]], null, null, [["music", 15.73], ["whale vocalization", 13.17], ["speech", 12.66]], null], "duration": [22.35, 7.37, 8.0, 0.66, 4.86, 47.66, 0.8, -0.31, 2.95, 0.94, 14.29, 3.48, 0.86, 0.82, 1.07, 8.96, 0.11, 0.14, 0.17, 0.21, 0.24, 5.93, 1.03, 1.17, 9.11, 1.5]} \ No newline at end of file diff --git a/annotations_1/mRwKWTGCd7Y_filtered.json b/annotations_1/mRwKWTGCd7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3323689684689be498e7947fd7ab70e583b8b57 --- /dev/null +++ b/annotations_1/mRwKWTGCd7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 16.01], [18.0, 40.12], [41.0, 46.18], [51.0, 53.81], [56.0, 56.46], [62.0, 62.07], [62.0, 76.08], [79.0, 99.76]], "keep_status": [false, false, true, true, false, false, true, true], "silence_prob": [54.63, 45.59, 29.11, 31.92, 0.0, 0.0, 29.51, 30.18], "audiomae_on_audioset": [null, [["music", 36.45], ["hum", 35.53], ["mains hum", 5.96]], [["whack, thwack", 44.12], ["music", 10.69], ["speech", 8.77]], [["music", 30.76], ["speech", 17.36], ["pulse", 17.09]], null, null, [["whack, thwack", 27.11], ["groan", 18.5], ["fly, housefly", 8.82]], [["whack, thwack", 28.15], ["music", 27.8], ["speech", 4.54]]], "duration": [9.01, 22.12, 5.18, 2.81, 0.46, 0.07, 14.08, 20.76]} \ No newline at end of file diff --git a/annotations_1/mS1u_E53e10_filtered.json b/annotations_1/mS1u_E53e10_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f4503f5a5c351bda0e9fdb89c7a8896e383a10c --- /dev/null +++ b/annotations_1/mS1u_E53e10_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.65], [8.0, 8.23], [12.0, 12.95], [15.0, 19.38], [24.0, 24.21], [27.0, 29.83], [33.0, 36.49], [40.0, 41.1], [48.0, 49.47], [51.0, 51.6], [61.0, 64.25], [76.0, 80.89], [82.0, 87.32], [92.0, 94.83], [96.0, 96.72], [108.0, 110.0]], "keep_status": [false, false, false, false, false, true, true, false, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.23, 0.0, 46.61, 32.1, 0.0, 0.0, 0.0, 35.14, 29.82, 30.55, 32.73, 0.0, 64.18], "audiomae_on_audioset": [null, null, null, [["fart", 35.63], ["speech", 33.22], ["fly, housefly", 5.28]], null, [["speech", 17.21], ["fly, housefly", 12.22], ["music", 10.56]], [["speech", 38.5], ["vehicle", 7.78], ["music", 4.54]], null, null, null, [["speech", 30.59], ["animal", 6.55], ["radio", 4.48]], [["moo", 26.88], ["cattle, bovinae", 23.83], ["livestock, farm animals, working animals", 12.43]], [["music", 41.16], ["speech", 36.05], ["electronic music", 5.84]], [["speech", 38.55], ["whale vocalization", 13.66], ["cattle, bovinae", 9.99]], null, null], "duration": [1.65, 0.23, 0.95, 4.38, 0.21, 2.83, 3.49, 1.1, 1.47, 0.6, 3.25, 4.89, 5.32, 2.83, 0.72, 2.0]} \ No newline at end of file diff --git a/annotations_1/mS4njwcS4dw_filtered.json b/annotations_1/mS4njwcS4dw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4ff89bd527fca00365999d05636e5a6f844af06 --- /dev/null +++ b/annotations_1/mS4njwcS4dw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 18.69]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [-0.31]} \ No newline at end of file diff --git a/annotations_1/mT3_2sDEBJQ_filtered.json b/annotations_1/mT3_2sDEBJQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a41d40ca591356a3240003f907aeae0c495381e --- /dev/null +++ b/annotations_1/mT3_2sDEBJQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.2], [8.0, 8.65], [10.0, 9.88], [22.0, 22.0], [35.0, 34.72], [72.0, 73.01]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.2, 0.65, -0.12, 0.0, -0.28, 1.01]} \ No newline at end of file diff --git a/annotations_1/mTYe5PvlRno_filtered.json b/annotations_1/mTYe5PvlRno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19d2556d36f8dfc51f0518334dd4f6a157f87f73 --- /dev/null +++ b/annotations_1/mTYe5PvlRno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.98], [12.0, 14.61], [16.0, 16.71], [18.0, 19.67], [21.0, 22.0], [26.0, 29.37], [30.0, 31.31], [33.0, 33.79], [37.0, 37.32], [52.0, 53.11], [55.0, 58.19], [62.0, 62.23], [63.0, 64.02], [65.0, 66.53], [67.0, 68.49], [71.0, 71.37], [75.0, 77.73], [79.0, 79.95], [81.0, 82.32], [83.0, 84.6], [89.0, 89.67], [103.0, 103.28], [105.0, 106.41], [120.0, 131.87], [134.0, 134.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 62.47, 0.0, 0.0, 0.0, 62.47, 0.0, 0.0, 0.0, 0.0, 40.16, 0.0, 0.0, 0.0, 0.0, 0.0, 33.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 11.2], ["burping, eructation", 7.16], ["groan", 6.71]], null, null, null, null, null, [["speech", 38.72], ["quack", 12.79], ["laughter", 6.75]], null, null, null, null, null, null, null, null], "duration": [-0.02, 2.61, 0.71, 1.67, 1.0, 3.37, 1.31, 0.79, 0.32, 1.11, 3.19, 0.23, 1.02, 1.53, 1.49, 0.37, 2.73, 0.95, 1.32, 1.6, 0.67, 0.28, 1.41, 11.87, 0.72]} \ No newline at end of file diff --git a/annotations_1/mUVup2pr_eM_filtered.json b/annotations_1/mUVup2pr_eM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a29a293c4a4a5006273c3be77db87845dd458e8 --- /dev/null +++ b/annotations_1/mUVup2pr_eM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.67], [1.0, 7.5], [8.0, 9.41], [11.0, 11.84], [12.0, 53.05], [55.0, 55.05], [57.0, 57.13], [58.0, 60.51], [63.0, 71.0], [77.0, 117.37], [119.0, 119.75], [127.0, 127.3], [128.0, 129.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.04, 0.0, 0.0, 0.0, 0.0, 0.0, 33.8, 30.31, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["neigh, whinny", 41.02], ["animal", 22.15], ["horse", 15.68]], null, null, null, null, null, [["music", 70.42], ["didgeridoo", 3.15], ["synthesizer", 3.04]], [["music", 76.18], ["didgeridoo", 6.56], ["musical instrument", 5.89]], null, null, null, null], "duration": [0.67, 6.5, 1.41, 0.84, 41.05, 0.05, 0.13, 2.51, 8.0, 40.37, 0.75, 0.3, 1.73]} \ No newline at end of file diff --git a/annotations_1/mVUQ88T2S6E_filtered.json b/annotations_1/mVUQ88T2S6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d87e472a2b9d88532ff6ba02813d0871779d61ec --- /dev/null +++ b/annotations_1/mVUQ88T2S6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [5.0, 6.27], [11.0, 12.88], [19.0, 23.45], [24.0, 27.14], [28.0, 33.96], [40.0, 43.55], [53.0, 54.43], [57.0, 56.78], [64.0, 64.56], [66.0, 79.14], [82.0, 113.32]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 44.55, 43.25, 39.19, 40.75, 0.0, 0.0, 0.0, 28.4, 0.0], "audiomae_on_audioset": [null, null, null, [["telephone dialing, dtmf", 34.36], ["speech", 27.04], ["sidetone", 13.57]], [["speech", 23.92], ["sidetone", 18.3], ["music", 15.3]], [["speech", 58.3], ["radio", 19.75], ["sidetone", 9.14]], [["sidetone", 54.72], ["speech", 16.75], ["radio", 14.65]], null, null, null, [["mains hum", 58.5], ["hum", 21.25], ["music", 7.69]], null], "duration": [0.29, 1.27, 1.88, 4.45, 3.14, 5.96, 3.55, 1.43, -0.22, 0.56, 13.14, 31.32]} \ No newline at end of file diff --git a/annotations_1/mXvst0jlR9Q_filtered.json b/annotations_1/mXvst0jlR9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f797f93b39297fc73113450b8a9836eee98189c3 --- /dev/null +++ b/annotations_1/mXvst0jlR9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.53], [8.0, 8.07], [9.0, 9.78], [19.0, 18.82], [19.0, 20.16], [21.0, 20.75], [22.0, 22.55], [23.0, 23.46], [24.0, 25.95], [26.0, 27.04], [28.0, 28.44], [29.0, 30.7], [32.0, 34.4], [35.0, 37.02], [38.0, 39.43], [44.0, 45.82], [49.0, 49.54], [51.0, 52.07], [52.0, 52.62], [54.0, 54.53], [56.0, 56.96], [60.0, 68.47], [69.0, 70.28], [70.0, 73.85], [74.0, 75.98], [78.0, 78.92], [80.0, 81.04], [84.0, 100.82], [101.0, 102.37], [103.0, 115.67], [118.0, 121.85], [126.0, 128.44], [129.0, 132.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.67, 60.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 83.34, 0.0, 0.0, 0.0, 98.59, 0.0, 95.37, 80.64, 97.73, 91.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.53, 0.07, 0.78, -0.18, 1.16, -0.25, 0.55, 0.46, 1.95, 1.04, 0.44, 1.7, 2.4, 2.02, 1.43, 1.82, 0.54, 1.07, 0.62, 0.53, 0.96, 8.47, 1.28, 3.85, 1.98, 0.92, 1.04, 16.82, 1.37, 12.67, 3.85, 2.44, 3.83]} \ No newline at end of file diff --git a/annotations_1/mXz39lQAEmY_filtered.json b/annotations_1/mXz39lQAEmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72f28e0ebf425746cd4bb894426d241e4deea3c9 --- /dev/null +++ b/annotations_1/mXz39lQAEmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.63], [6.0, 9.51], [11.0, 11.69], [12.0, 15.08], [19.0, 24.19], [25.0, 26.84], [29.0, 30.82], [37.0, 40.93], [42.0, 43.19], [44.0, 45.1], [46.0, 48.05], [50.0, 53.76], [57.0, 57.42], [60.0, 61.18], [64.0, 66.53], [69.0, 70.34], [75.0, 75.14], [77.0, 78.11], [81.0, 82.58], [83.0, 84.96], [86.0, 88.42], [89.0, 90.9], [92.0, 94.37], [99.0, 101.71], [106.0, 108.04], [113.0, 117.58], [119.0, 119.75], [122.0, 122.99], [123.0, 125.54], [126.0, 128.95], [131.0, 132.92], [134.0, 135.67], [137.0, 139.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.19, 98.27, 0.0, 89.72, 95.64, 0.0, 0.0, 90.43, 0.0, 0.0, 82.43, 91.81, 0.0, 0.0, 78.38, 0.0, 0.0, 0.0, 0.0, 0.0, 90.6, 0.0, 84.25, 97.73, 79.07, 83.7, 0.0, 0.0, 66.27, 57.01, 0.0, 0.0, 73.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.63, 3.51, 0.69, 3.08, 5.19, 1.84, 1.82, 3.93, 1.19, 1.1, 2.05, 3.76, 0.42, 1.18, 2.53, 1.34, 0.14, 1.11, 1.58, 1.96, 2.42, 1.9, 2.37, 2.71, 2.04, 4.58, 0.75, 0.99, 2.54, 2.95, 1.92, 1.67, 2.83]} \ No newline at end of file diff --git a/annotations_1/mZHlantNtwg_filtered.json b/annotations_1/mZHlantNtwg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aea677e2057c726929710231977794acf016d8e8 --- /dev/null +++ b/annotations_1/mZHlantNtwg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.67], [15.0, 17.41], [23.0, 41.22], [47.0, 47.9], [60.0, 60.54], [62.0, 65.52], [66.0, 81.09], [83.0, 89.99], [94.0, 95.2], [96.0, 97.26], [99.0, 99.3], [103.0, 106.27], [109.0, 109.27], [119.0, 118.84], [146.0, 149.23], [151.0, 153.62]], "keep_status": [true, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [34.46, 30.03, 33.06, 0.0, 0.0, 44.84, 31.13, 30.91, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 68.02, 35.74], "audiomae_on_audioset": [[["music", 34.03], ["throbbing", 8.81], ["theremin", 7.28]], [["groan", 27.51], ["speech", 18.45], ["music", 18.35]], [["speech", 65.84], ["music", 19.84], ["explosion", 1.37]], null, null, [["speech", 22.21], ["fly, housefly", 19.66], ["insect", 14.04]], [["music", 55.42], ["speech", 20.31], ["fart", 3.12]], [["music", 54.91], ["hum", 5.53], ["musical instrument", 3.66]], null, null, null, null, null, null, null, [["speech", 45.21], ["chirp tone", 15.39], ["sine wave", 15.33]]], "duration": [4.67, 2.41, 18.22, 0.9, 0.54, 3.52, 15.09, 6.99, 1.2, 1.26, 0.3, 3.27, 0.27, -0.16, 3.23, 2.62]} \ No newline at end of file diff --git a/annotations_1/mZYTLYXT-CQ_filtered.json b/annotations_1/mZYTLYXT-CQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e77f53c96df3e36dce1251230d0e80cf12a91799 --- /dev/null +++ b/annotations_1/mZYTLYXT-CQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 16.77], [18.0, 17.74], [20.0, 24.98], [31.0, 34.82], [40.0, 44.76], [51.0, 52.25], [53.0, 59.49], [61.0, 63.05], [63.0, 73.35], [75.0, 79.44], [82.0, 91.42], [94.0, 117.73], [119.0, 120.34], [121.0, 122.82], [127.0, 128.82], [132.0, 132.71], [134.0, 137.34], [140.0, 144.88], [146.0, 146.92], [148.0, 150.31], [150.0, 152.15], [152.0, 161.49], [162.0, 170.4], [176.0, 176.59]], "keep_status": [true, false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [37.61, 0.0, 34.32, 59.15, 52.68, 0.0, 39.66, 40.04, 49.36, 53.59, 48.61, 53.91, 0.0, 0.0, 0.0, 0.0, 78.55, 54.04, 0.0, 37.26, 38.83, 49.87, 71.57, 0.0], "audiomae_on_audioset": [[["animal", 21.29], ["dog", 17.32], ["domestic animals, pets", 13.82]], null, [["music", 40.51], ["theremin", 14.33], ["speech", 6.61]], null, null, null, [["whale vocalization", 54.29], ["speech", 17.57], ["theremin", 12.45]], [["whale vocalization", 36.16], ["music", 18.08], ["theremin", 17.91]], [["music", 54.86], ["theremin", 6.99], ["speech", 3.61]], null, [["music", 45.77], ["whale vocalization", 10.86], ["speech", 10.2]], null, null, null, null, null, null, null, null, [["fly, housefly", 15.88], ["livestock, farm animals, working animals", 15.25], ["bee, wasp, etc.", 12.85]], [["hum", 31.73], ["speech", 15.17], ["mains hum", 6.35]], [["livestock, farm animals, working animals", 33.79], ["animal", 26.09], ["cattle, bovinae", 7.88]], null, null], "duration": [10.77, -0.26, 4.98, 3.82, 4.76, 1.25, 6.49, 2.05, 10.35, 4.44, 9.42, 23.73, 1.34, 1.82, 1.82, 0.71, 3.34, 4.88, 0.92, 2.31, 2.15, 9.49, 8.4, 0.59]} \ No newline at end of file diff --git a/annotations_1/mbBhikLj86Y_filtered.json b/annotations_1/mbBhikLj86Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cd4800145edd95ca4ba6a3f0c37b57b4b32c6c7 --- /dev/null +++ b/annotations_1/mbBhikLj86Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.27], [19.0, 18.74], [21.0, 21.95], [23.0, 26.0], [28.0, 32.93], [34.0, 42.38], [45.0, 45.79], [47.0, 55.46], [57.0, 58.36], [59.0, 63.27], [64.0, 64.99], [65.0, 72.55], [87.0, 89.04], [92.0, 92.64], [95.0, 96.25], [97.0, 97.09], [97.0, 97.44], [97.0, 99.17], [102.0, 102.07], [103.0, 103.2], [108.0, 108.24], [110.0, 109.98], [115.0, 117.85], [119.0, 119.23]], "keep_status": [true, false, false, true, false, false, false, true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [32.14, 0.0, 0.0, 32.61, 31.93, 31.91, 0.0, 44.26, 0.0, 42.96, 0.0, 34.04, 33.38, 0.0, 0.0, 0.0, 0.0, 32.28, 0.0, 0.0, 0.0, 0.0, 36.08, 0.0], "audiomae_on_audioset": [[["music", 48.58], ["cello", 5.66], ["musical instrument", 5.62]], null, null, [["music", 43.23], ["cello", 10.14], ["bowed string instrument", 5.64]], [["music", 65.69], ["cello", 2.99], ["musical instrument", 2.92]], [["speech", 55.6], ["fart", 19.44], ["whack, thwack", 2.96]], null, [["music", 29.57], ["animal", 10.31], ["frog", 10.23]], null, [["music", 45.6], ["chime", 15.15], ["marimba, xylophone", 4.57]], null, [["speech", 83.0], ["telephone", 1.94], ["fart", 1.85]], [["radio", 7.7], ["telephone", 6.34], ["boing", 6.08]], null, null, null, null, [["speech", 42.67], ["music", 40.63], ["inside, small room", 2.03]], null, null, null, null, [["music", 28.78], ["cello", 14.73], ["musical instrument", 11.59]], null], "duration": [2.27, -0.26, 0.95, 3.0, 4.93, 8.38, 0.79, 8.46, 1.36, 4.27, 0.99, 7.55, 2.04, 0.64, 1.25, 0.09, 0.44, 2.17, 0.07, 0.2, 0.24, -0.02, 2.85, 0.23]} \ No newline at end of file diff --git a/annotations_1/mbKiHp_ljJY_filtered.json b/annotations_1/mbKiHp_ljJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cff073438e3b28456cfb864d2e30172fe3dcde04 --- /dev/null +++ b/annotations_1/mbKiHp_ljJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.49], [15.0, 19.57], [21.0, 25.27], [27.0, 34.67], [36.0, 36.98], [41.0, 41.76], [44.0, 44.44], [48.0, 49.06], [50.0, 50.57], [53.0, 54.46]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [38.83, 63.1, 66.88, 50.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.24], ["speech", 16.54], ["effects unit", 4.65]], null, null, null, null, null, null, null, null, null], "duration": [9.49, 4.57, 4.27, 7.67, 0.98, 0.76, 0.44, 1.06, 0.57, 1.46]} \ No newline at end of file diff --git a/annotations_1/mbTKo5Ylypw_filtered.json b/annotations_1/mbTKo5Ylypw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dfc6497a2ef148602cf97a727b2037d80cf896f --- /dev/null +++ b/annotations_1/mbTKo5Ylypw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.88], [10.0, 10.74], [11.0, 12.65], [18.0, 21.63], [23.0, 23.5], [33.0, 40.71], [44.0, 45.1], [48.0, 48.37], [52.0, 52.02], [61.0, 61.33], [62.0, 62.7], [65.0, 65.58], [70.0, 70.83], [72.0, 73.84], [74.0, 76.77], [78.0, 79.62], [81.0, 88.89], [90.0, 92.08], [93.0, 92.82], [93.0, 95.13], [97.0, 98.9], [102.0, 102.84], [103.0, 104.04], [109.0, 109.41], [110.0, 111.13], [113.0, 115.26], [116.0, 121.37], [123.0, 125.17], [126.0, 125.93], [127.0, 128.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [99.95, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 43.51, 96.17, 0.0, 91.3, 0.0, 0.0, 0.0, 0.0, 0.0, 43.79, 44.63, 68.93, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 19.35], ["hum", 12.16], ["eruption", 8.86]], null, null, null, null, null, null, null, null, [["speech", 89.69], ["dial tone", 2.54], ["telephone", 1.52]], [["speech", 31.4], ["stomach rumble", 10.12], ["hum", 8.68]], null, null, null], "duration": [2.88, 0.74, 1.65, 3.63, 0.5, 7.71, 1.1, 0.37, 0.02, 0.33, 0.7, 0.58, 0.83, 1.84, 2.77, 1.62, 7.89, 2.08, -0.18, 2.13, 1.9, 0.84, 1.04, 0.41, 1.13, 2.26, 5.37, 2.17, -0.07, 1.6]} \ No newline at end of file diff --git a/annotations_1/mbzNdI-1iUc_filtered.json b/annotations_1/mbzNdI-1iUc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/mbzNdI-1iUc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/mcerWHb94yo_filtered.json b/annotations_1/mcerWHb94yo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2058f7b638e9cb94e6d2bf98fbb7d13b5284ded --- /dev/null +++ b/annotations_1/mcerWHb94yo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.22], [7.0, 19.18], [21.0, 23.55], [27.0, 28.36], [31.0, 32.8], [35.0, 42.38], [50.0, 53.47], [56.0, 56.37], [61.0, 70.17], [80.0, 80.65], [83.0, 112.18], [115.0, 116.11], [118.0, 121.91], [125.0, 125.85], [129.0, 141.88], [147.0, 148.47], [150.0, 161.94], [163.0, 227.75]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 71.43, 64.75, 0.0, 0.0, 31.61, 33.33, 0.0, 30.29, 0.0, 29.25, 0.0, 29.51, 0.0, 29.32, 0.0, 28.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 45.45], ["guitar", 12.89], ["musical instrument", 8.4]], [["music", 50.73], ["mantra", 17.98], ["chant", 3.14]], null, [["music", 76.43], ["hum", 2.51], ["throbbing", 1.84]], null, [["music", 79.21], ["musical instrument", 6.91], ["carnatic music", 3.91]], null, [["music", 77.27], ["synthesizer", 1.66], ["boing", 1.11]], null, [["music", 83.3], ["synthetic singing", 1.2], ["musical instrument", 0.79]], null, [["music", 46.22], ["didgeridoo", 22.08], ["theremin", 4.95]], null], "duration": [0.22, 12.18, 2.55, 1.36, 1.8, 7.38, 3.47, 0.37, 9.17, 0.65, 29.18, 1.11, 3.91, 0.85, 12.88, 1.47, 11.94, 64.75]} \ No newline at end of file diff --git a/annotations_1/mdHpbI8Y7Oo_filtered.json b/annotations_1/mdHpbI8Y7Oo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84b89781423593b1e40347b14505f15e725255c9 --- /dev/null +++ b/annotations_1/mdHpbI8Y7Oo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.21], [2.0, 2.4], [3.0, 3.25], [5.0, 5.27], [6.0, 6.67], [8.0, 8.04], [12.0, 14.1], [18.0, 20.41], [24.0, 26.6], [28.0, 41.42], [44.0, 45.18], [49.0, 49.37], [50.0, 50.73], [53.0, 53.64], [63.0, 64.4], [70.0, 70.71], [77.0, 76.72], [79.0, 80.22], [84.0, 84.55], [103.0, 106.34], [108.0, 109.61], [112.0, 112.35], [114.0, 113.98], [116.0, 116.23], [118.0, 118.56], [120.0, 120.82], [123.0, 123.01], [124.0, 124.28], [129.0, 129.24], [132.0, 132.97], [137.0, 150.13], [154.0, 159.68], [161.0, 164.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 100.0, 99.96, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.71, 42.76, 36.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 72.26], ["music", 6.54], ["busy signal", 5.83]], [["animal", 33.37], ["speech", 25.95], ["sheep", 8.41]], [["vehicle", 25.84], ["fly, housefly", 6.45], ["car", 6.05]]], "duration": [0.21, 0.4, 0.25, 0.27, 0.67, 0.04, 2.1, 2.41, 2.6, 13.42, 1.18, 0.37, 0.73, 0.64, 1.4, 0.71, -0.28, 1.22, 0.55, 3.34, 1.61, 0.35, -0.02, 0.23, 0.56, 0.82, 0.01, 0.28, 0.24, 0.97, 13.13, 5.68, 3.96]} \ No newline at end of file diff --git a/annotations_1/mdgbtrpVBm8_filtered.json b/annotations_1/mdgbtrpVBm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63d40a3669ff7466e170a904db02ad6ab704a04b --- /dev/null +++ b/annotations_1/mdgbtrpVBm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.55], [12.0, 13.69], [15.0, 15.67], [17.0, 18.52], [20.0, 22.59], [23.0, 22.91], [26.0, 26.28], [30.0, 30.0], [31.0, 31.6], [38.0, 41.71], [43.0, 44.25], [45.0, 46.84], [47.0, 48.63], [50.0, 50.52], [52.0, 52.17], [53.0, 54.18], [56.0, 56.12], [58.0, 58.48], [59.0, 59.68], [60.0, 66.02], [74.0, 77.8], [79.0, 82.19], [85.0, 86.49], [88.0, 88.87], [90.0, 92.58], [94.0, 95.44], [99.0, 99.62], [100.0, 103.27], [105.0, 106.35], [107.0, 106.89], [107.0, 108.4], [111.0, 112.33], [115.0, 115.1], [120.0, 120.16], [124.0, 125.19]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.57, 0.0, 0.0, 0.0, 50.46, 0.0, 0.0, 0.0, 0.0, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 98.99, 38.25, 0.0, 0.0, 100.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 15.97], ["livestock, farm animals, working animals", 15.3], ["hum", 8.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.28], ["vehicle", 5.47], ["door", 5.27]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.55, 1.69, 0.67, 1.52, 2.59, -0.09, 0.28, 0.0, 0.6, 3.71, 1.25, 1.84, 1.63, 0.52, 0.17, 1.18, 0.12, 0.48, 0.68, 6.02, 3.8, 3.19, 1.49, 0.87, 2.58, 1.44, 0.62, 3.27, 1.35, -0.11, 1.4, 1.33, 0.1, 0.16, 1.19]} \ No newline at end of file diff --git a/annotations_1/melCNhYmwII_filtered.json b/annotations_1/melCNhYmwII_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73ab3386947d69728cfb03df61eba7589f9898b1 --- /dev/null +++ b/annotations_1/melCNhYmwII_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.58], [12.0, 13.68], [14.0, 15.74], [17.0, 18.1], [21.0, 21.51], [25.0, 25.76], [26.0, 27.9], [29.0, 29.35], [30.0, 43.19], [44.0, 47.01], [48.0, 49.72], [58.0, 59.71], [60.0, 59.76], [60.0, 88.65], [89.0, 93.45], [96.0, 100.43], [121.0, 120.9]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [51.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.14, 99.97, 0.0, 0.0, 0.0, 86.64, 40.12, 39.17, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["thunk", 24.83], ["electric shaver, electric razor", 8.07], ["whack, thwack", 7.08]], null, null, null, null, null, [["mains hum", 53.27], ["hum", 42.14], ["speech", 0.65]], [["hum", 30.18], ["mains hum", 26.5], ["speech", 12.52]], null], "duration": [2.58, 1.68, 1.74, 1.1, 0.51, 0.76, 1.9, 0.35, 13.19, 3.01, 1.72, 1.71, -0.24, 28.65, 4.45, 4.43, -0.1]} \ No newline at end of file diff --git a/annotations_1/mfCwgYR1yS8_filtered.json b/annotations_1/mfCwgYR1yS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8defb0c40839016d1f183b601390b1d6de4acae7 --- /dev/null +++ b/annotations_1/mfCwgYR1yS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[113.0, 117.61]], "keep_status": [false], "silence_prob": [35.72], "audiomae_on_audioset": [[["throbbing", 32.64], ["hum", 28.01], ["music", 19.41]]], "duration": [4.61]} \ No newline at end of file diff --git a/annotations_1/mfkzA9zjRdM_filtered.json b/annotations_1/mfkzA9zjRdM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dacd07f70103c38ccb53826ea9d3581cdd6a460a --- /dev/null +++ b/annotations_1/mfkzA9zjRdM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 39.58], [40.0, 40.9], [42.0, 42.92], [44.0, 46.52], [47.0, 53.55], [55.0, 61.43], [64.0, 69.45], [76.0, 93.92], [100.0, 100.97], [103.0, 104.19], [105.0, 105.68], [107.0, 112.63], [117.0, 119.69], [121.0, 121.31]], "keep_status": [true, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [30.21, 0.0, 0.0, 49.87, 40.99, 31.7, 30.83, 29.89, 0.0, 0.0, 0.0, 29.64, 37.64, 0.0], "audiomae_on_audioset": [[["music", 60.22], ["synthesizer", 4.24], ["effects unit", 2.87]], null, null, [["music", 47.59], ["synthesizer", 7.15], ["musical instrument", 4.33]], [["music", 37.84], ["speech", 11.83], ["sidetone", 8.77]], [["music", 67.79], ["throbbing", 5.21], ["hum", 4.76]], [["music", 58.62], ["ambient music", 10.52], ["theremin", 6.35]], [["music", 73.15], ["musical instrument", 5.31], ["ambient music", 2.28]], null, null, null, [["music", 59.07], ["musical instrument", 10.44], ["synthesizer", 8.85]], [["speech", 40.68], ["music", 23.51], ["foghorn", 8.48]], null], "duration": [8.58, 0.9, 0.92, 2.52, 6.55, 6.43, 5.45, 17.92, 0.97, 1.19, 0.68, 5.63, 2.69, 0.31]} \ No newline at end of file diff --git a/annotations_1/mhCiFB07I2w_filtered.json b/annotations_1/mhCiFB07I2w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..407b536a6bad68edcb38194404e8ff8f2557386c --- /dev/null +++ b/annotations_1/mhCiFB07I2w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 37.52], [40.0, 41.49], [42.0, 53.06], [56.0, 75.54], [81.0, 81.04], [83.0, 83.62], [85.0, 85.53], [87.0, 114.47], [119.0, 119.67], [125.0, 129.98], [130.0, 131.26], [134.0, 135.53]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [52.05, 0.0, 32.61, 34.64, 0.0, 0.0, 0.0, 31.69, 0.0, 30.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 12.17], ["police car (siren)", 7.74], ["emergency vehicle", 7.48]], [["hum", 35.96], ["mains hum", 21.98], ["throbbing", 19.87]], null, null, null, [["speech", 49.47], ["noise", 11.07], ["sidetone", 5.59]], null, [["explosion", 43.13], ["speech", 25.68], ["artillery fire", 9.96]], null, null], "duration": [19.52, 1.49, 11.06, 19.54, 0.04, 0.62, 0.53, 27.47, 0.67, 4.98, 1.26, 1.53]} \ No newline at end of file diff --git a/annotations_1/miJ26dYcbBw_filtered.json b/annotations_1/miJ26dYcbBw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/miJ26dYcbBw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/mjuNE5wyMzY_filtered.json b/annotations_1/mjuNE5wyMzY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b8b06c7fb353b18ee297074ca051c0879c7f79c --- /dev/null +++ b/annotations_1/mjuNE5wyMzY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 16.93], [17.0, 24.39], [26.0, 35.99], [39.0, 64.13], [69.0, 105.39], [108.0, 110.54], [115.0, 114.99], [116.0, 131.19], [131.0, 137.59], [140.0, 143.82], [144.0, 148.56], [155.0, 172.66]], "keep_status": [true, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [33.05, 32.33, 31.12, 30.44, 0.0, 33.77, 0.0, 34.18, 31.58, 61.87, 50.76, 30.46], "audiomae_on_audioset": [[["bee, wasp, etc.", 14.47], ["music", 12.37], ["fly, housefly", 11.41]], [["hum", 32.66], ["speech", 23.73], ["music", 20.18]], [["music", 49.18], ["speech", 32.71], ["hum", 2.42]], [["speech", 56.49], ["music", 18.43], ["hum", 4.14]], null, [["music", 37.56], ["didgeridoo", 11.03], ["musical instrument", 6.83]], null, [["music", 80.4], ["didgeridoo", 5.66], ["theremin", 5.29]], [["music", 40.5], ["trombone", 4.87], ["fly, housefly", 4.77]], null, null, [["music", 33.91], ["foghorn", 6.09], ["hum", 4.23]]], "duration": [12.93, 7.39, 9.99, 25.13, 36.39, 2.54, -0.01, 15.19, 6.59, 3.82, 4.56, 17.66]} \ No newline at end of file diff --git a/annotations_1/mkG2YdCogPY_filtered.json b/annotations_1/mkG2YdCogPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78c0f00af27a850f244287022b8eb4f1d0c01bfc --- /dev/null +++ b/annotations_1/mkG2YdCogPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.16], [9.0, 8.85], [12.0, 13.59], [14.0, 15.16], [17.0, 21.15], [28.0, 28.98], [30.0, 31.06], [32.0, 33.37], [35.0, 35.19], [37.0, 37.86], [40.0, 40.93], [42.0, 43.33], [46.0, 47.41], [48.0, 48.15], [49.0, 49.64], [51.0, 52.88], [58.0, 59.48], [60.0, 60.32], [62.0, 63.22], [65.0, 66.36], [67.0, 67.69], [69.0, 70.38], [74.0, 78.58], [79.0, 81.09], [84.0, 85.01], [87.0, 87.42], [90.0, 90.42], [91.0, 91.71], [96.0, 95.89], [99.0, 100.77], [103.0, 103.37], [105.0, 107.37], [112.0, 113.14], [119.0, 119.47], [122.0, 122.3], [123.0, 123.18], [125.0, 126.79], [128.0, 127.9], [130.0, 130.45], [131.0, 132.48], [134.0, 135.06], [136.0, 137.56], [138.0, 139.67], [141.0, 142.3], [144.0, 144.44], [145.0, 145.27], [146.0, 147.39], [148.0, 148.51], [149.0, 149.72], [150.0, 150.36], [152.0, 152.49], [155.0, 155.56], [156.0, 158.53], [159.0, 159.6], [163.0, 163.38], [165.0, 165.28], [166.0, 167.21], [168.0, 169.1], [169.0, 170.02], [170.0, 171.75], [173.0, 173.96], [174.0, 175.04], [176.0, 176.49], [178.0, 178.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 99.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.8], ["boing", 9.54], ["inside, small room", 8.57]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, -0.15, 1.59, 1.16, 4.15, 0.98, 1.06, 1.37, 0.19, 0.86, 0.93, 1.33, 1.41, 0.15, 0.64, 1.88, 1.48, 0.32, 1.22, 1.36, 0.69, 1.38, 4.58, 2.09, 1.01, 0.42, 0.42, 0.71, -0.11, 1.77, 0.37, 2.37, 1.14, 0.47, 0.3, 0.18, 1.79, -0.1, 0.45, 1.48, 1.06, 1.56, 1.67, 1.3, 0.44, 0.27, 1.39, 0.51, 0.72, 0.36, 0.49, 0.56, 2.53, 0.6, 0.38, 0.28, 1.21, 1.1, 1.02, 1.75, 0.96, 1.04, 0.49, 0.7]} \ No newline at end of file diff --git a/annotations_1/mlHF0Vv7yEc_filtered.json b/annotations_1/mlHF0Vv7yEc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..665c3fe2de4d055df7e21eef8c6170515f6b9569 --- /dev/null +++ b/annotations_1/mlHF0Vv7yEc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.79], [16.0, 18.67], [25.0, 27.46], [30.0, 39.21], [42.0, 54.45], [55.0, 87.94], [95.0, 95.25], [98.0, 110.12], [111.0, 110.76], [111.0, 110.79], [111.0, 110.83], [111.0, 118.71], [119.0, 120.31], [125.0, 127.65], [130.0, 133.83], [134.0, 136.21], [140.0, 170.95]], "keep_status": [false, true, false, false, true, false, false, true, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 34.88, 31.72, 32.37, 32.54, 0.0, 0.0, 30.97, 0.0, 0.0, 0.0, 53.34, 0.0, 31.09, 32.24, 32.39, 0.0], "audiomae_on_audioset": [null, [["music", 20.45], ["speech", 11.41], ["boing", 3.2]], [["music", 46.07], ["speech", 30.16], ["cattle, bovinae", 1.75]], [["hum", 46.67], ["throbbing", 18.7], ["speech", 9.03]], [["speech", 37.79], ["music", 16.2], ["buzz", 11.98]], null, null, [["music", 19.41], ["livestock, farm animals, working animals", 17.38], ["sound effect", 7.34]], null, null, null, null, null, [["speech", 26.37], ["crowd", 10.21], ["music", 7.99]], [["vehicle", 33.88], ["speech", 24.69], ["aircraft", 7.56]], [["quack", 43.87], ["music", 36.21], ["duck", 9.18]], null], "duration": [0.79, 2.67, 2.46, 9.21, 12.45, 32.94, 0.25, 12.12, -0.24, -0.21, -0.17, 7.71, 1.31, 2.65, 3.83, 2.21, 30.95]} \ No newline at end of file diff --git a/annotations_1/ml_zSw6yWOE_filtered.json b/annotations_1/ml_zSw6yWOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..265f5cb504e531a0a17598d6657754762b5f434f --- /dev/null +++ b/annotations_1/ml_zSw6yWOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.76], [8.0, 8.58], [12.0, 12.45], [15.0, 16.87], [19.0, 21.22], [24.0, 27.24], [32.0, 33.71], [36.0, 38.04], [42.0, 44.47], [45.0, 46.28], [46.0, 51.83], [53.0, 55.85], [57.0, 59.02], [64.0, 94.98], [95.0, 95.59], [96.0, 96.08], [96.0, 96.21], [96.0, 104.28], [106.0, 118.37], [121.0, 123.47], [128.0, 129.69], [130.0, 135.95], [137.0, 138.28], [139.0, 139.62], [142.0, 141.96], [147.0, 155.93], [157.0, 157.74], [159.0, 161.3]], "keep_status": [false, false, false, false, true, true, false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 38.31, 28.96, 0.0, 29.21, 28.7, 0.0, 28.74, 29.06, 29.54, 0.0, 0.0, 0.0, 0.0, 46.61, 92.64, 45.02, 0.0, 50.26, 0.0, 0.0, 0.0, 76.2, 0.0, 88.64], "audiomae_on_audioset": [null, null, null, null, [["speech", 48.31], ["rumble", 9.58], ["music", 8.01]], [["hum", 28.24], ["mains hum", 14.85], ["throbbing", 12.6]], null, [["hum", 36.38], ["throbbing", 25.3], ["mains hum", 10.76]], [["whack, thwack", 33.59], ["music", 8.95], ["door", 5.05]], null, [["speech", 32.79], ["livestock, farm animals, working animals", 16.85], ["cattle, bovinae", 7.27]], [["music", 39.54], ["throbbing", 23.32], ["hum", 7.56]], [["music", 25.19], ["beatboxing", 16.71], ["speech", 5.43]], null, null, null, null, [["gong", 53.82], ["singing bowl", 13.62], ["music", 7.45]], null, [["speech", 63.69], ["sidetone", 6.05], ["hum", 3.34]], null, null, null, null, null, null, null, null], "duration": [0.76, 0.58, 0.45, 1.87, 2.22, 3.24, 1.71, 2.04, 2.47, 1.28, 5.83, 2.85, 2.02, 30.98, 0.59, 0.08, 0.21, 8.28, 12.37, 2.47, 1.69, 5.95, 1.28, 0.62, -0.04, 8.93, 0.74, 2.3]} \ No newline at end of file diff --git a/annotations_1/mlc2UyZdalQ_filtered.json b/annotations_1/mlc2UyZdalQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b20a12055ba57f85b960cb4153622ab61e8495cb --- /dev/null +++ b/annotations_1/mlc2UyZdalQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.11], [4.0, 6.91], [10.0, 11.67], [12.0, 21.09], [23.0, 23.03], [28.0, 28.53], [31.0, 31.16], [35.0, 37.1], [38.0, 39.02], [41.0, 42.26], [44.0, 46.63], [52.0, 57.37], [59.0, 59.75], [61.0, 61.47], [62.0, 63.15], [67.0, 69.2], [71.0, 71.73], [77.0, 79.42], [80.0, 83.76], [98.0, 98.71], [99.0, 100.06], [101.0, 101.38], [102.0, 102.03], [103.0, 104.19], [105.0, 105.97], [113.0, 113.04], [117.0, 117.42], [118.0, 127.14]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 76.37, 0.0, 30.45, 0.0, 0.0, 0.0, 36.03, 0.0, 0.0, 37.72, 31.0, 0.0, 0.0, 0.0, 38.02, 0.0, 71.43, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.6], "audiomae_on_audioset": [null, null, null, [["music", 40.58], ["speech", 20.85], ["throbbing", 8.32]], null, null, null, [["speech", 40.49], ["sidetone", 33.67], ["busy signal", 3.02]], null, null, [["speech", 54.89], ["chirp tone", 8.46], ["sine wave", 7.35]], [["speech", 21.19], ["music", 9.49], ["foghorn", 8.36]], null, null, null, [["music", 23.78], ["theremin", 16.3], ["synthesizer", 13.02]], null, null, null, null, null, null, null, null, null, null, null, [["music", 67.26], ["theremin", 18.87], ["opera", 6.94]]], "duration": [0.11, 2.91, 1.67, 9.09, 0.03, 0.53, 0.16, 2.1, 1.02, 1.26, 2.63, 5.37, 0.75, 0.47, 1.15, 2.2, 0.73, 2.42, 3.76, 0.71, 1.06, 0.38, 0.03, 1.19, 0.97, 0.04, 0.42, 9.14]} \ No newline at end of file diff --git a/annotations_1/mlkWgiyQ-8g_filtered.json b/annotations_1/mlkWgiyQ-8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b1949cbe932d61dfe5797704eb183aa4333f803 --- /dev/null +++ b/annotations_1/mlkWgiyQ-8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.08], [8.0, 8.48], [10.0, 10.77], [18.0, 17.71], [19.0, 33.22], [34.0, 35.58], [38.0, 38.8], [42.0, 42.35], [44.0, 45.62], [46.0, 46.26], [47.0, 57.67], [59.0, 59.27], [62.0, 62.41], [64.0, 65.62], [66.0, 66.68], [68.0, 68.82], [71.0, 71.25], [72.0, 72.74], [77.0, 77.08], [78.0, 78.71], [87.0, 87.22], [94.0, 93.95], [96.0, 96.8], [98.0, 98.71], [101.0, 102.36], [103.0, 104.57], [105.0, 106.49], [107.0, 109.34], [110.0, 111.08], [112.0, 113.48], [117.0, 117.73], [121.0, 121.14], [124.0, 123.84], [128.0, 127.87], [131.0, 132.26], [133.0, 133.64], [136.0, 136.88], [143.0, 142.8], [149.0, 149.03], [151.0, 152.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.07, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.32], ["hum", 4.16], ["inside, small room", 3.78]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.08, 0.48, 0.77, -0.29, 14.22, 1.58, 0.8, 0.35, 1.62, 0.26, 10.67, 0.27, 0.41, 1.62, 0.68, 0.82, 0.25, 0.74, 0.08, 0.71, 0.22, -0.05, 0.8, 0.71, 1.36, 1.57, 1.49, 2.34, 1.08, 1.48, 0.73, 0.14, -0.16, -0.13, 1.26, 0.64, 0.88, -0.2, 0.03, 1.51]} \ No newline at end of file diff --git a/annotations_1/mlpkQuvDJbs_filtered.json b/annotations_1/mlpkQuvDJbs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6366a042518d02ecb656bcc1bd5e7d565e31e5d8 --- /dev/null +++ b/annotations_1/mlpkQuvDJbs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 78.22], [82.0, 82.14], [83.0, 83.05], [85.0, 86.12], [87.0, 96.42], [101.0, 109.63], [110.0, 118.37], [120.0, 120.56], [122.0, 123.42], [127.0, 128.21], [131.0, 142.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.41, 53.78, 35.48, 0.0, 0.0, 0.0, 30.24], "audiomae_on_audioset": [null, null, null, null, [["hum", 40.38], ["mains hum", 35.09], ["music", 12.57]], null, [["music", 30.75], ["throbbing", 29.01], ["hum", 27.69]], null, null, null, [["noise", 24.26], ["music", 22.71], ["mains hum", 5.47]]], "duration": [36.22, 0.14, 0.05, 1.12, 9.42, 8.63, 8.37, 0.56, 1.42, 1.21, 11.23]} \ No newline at end of file diff --git a/annotations_1/mmH76155CuU_filtered.json b/annotations_1/mmH76155CuU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5ff8e6a689d7130dd272ff3e071174b5beb4787 --- /dev/null +++ b/annotations_1/mmH76155CuU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.42], [21.0, 22.54], [24.0, 25.68], [27.0, 81.48]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.42, 1.54, 1.68, 54.48]} \ No newline at end of file diff --git a/annotations_1/mmdPZs0Nvvg_filtered.json b/annotations_1/mmdPZs0Nvvg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07c38918a312190d8fe007c87556cf0442f0e92f --- /dev/null +++ b/annotations_1/mmdPZs0Nvvg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 28.05], [29.0, 34.01], [37.0, 39.39], [41.0, 42.6], [43.0, 75.64], [77.0, 77.23], [79.0, 85.4], [87.0, 88.77], [90.0, 93.55]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [98.36, 66.51, 96.66, 0.0, 0.0, 0.0, 66.15, 0.0, 44.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["singing bowl", 28.83], ["music", 18.66], ["speech", 16.76]]], "duration": [15.05, 5.01, 2.39, 1.6, 32.64, 0.23, 6.4, 1.77, 3.55]} \ No newline at end of file diff --git a/annotations_1/mpBQ883QIUs_filtered.json b/annotations_1/mpBQ883QIUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90d4d2e7de23e94be7f20936e0310156a6923e22 --- /dev/null +++ b/annotations_1/mpBQ883QIUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.66], [12.0, 12.58], [14.0, 19.84], [21.0, 38.87], [40.0, 43.55], [50.0, 50.19], [52.0, 53.59], [67.0, 69.72], [76.0, 76.87], [82.0, 83.25], [84.0, 84.52], [85.0, 85.6], [88.0, 88.94], [94.0, 94.14], [95.0, 100.28], [102.0, 109.22], [114.0, 120.01], [121.0, 121.32], [123.0, 122.98], [136.0, 145.56], [150.0, 152.74], [159.0, 164.08], [165.0, 167.97], [171.0, 176.94], [179.0, 179.14], [183.0, 183.98], [186.0, 197.41], [198.0, 201.24]], "keep_status": [false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, true, false, false, false, true, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 87.55, 32.61, 48.44, 0.0, 0.0, 34.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 33.31, 32.73, 0.0, 0.0, 36.37, 37.36, 37.28, 38.36, 42.58, 0.0, 0.0, 63.1, 97.73], "audiomae_on_audioset": [null, null, null, [["music", 33.29], ["speech", 12.79], ["groan", 9.13]], [["speech", 29.7], ["inside, small room", 6.16], ["insect", 5.87]], null, null, [["speech", 30.95], ["music", 21.68], ["boing", 8.62]], null, null, null, null, null, null, null, [["speech", 29.33], ["music", 23.8], ["foghorn", 13.44]], [["music", 56.8], ["speech", 19.53], ["whale vocalization", 2.25]], null, null, [["music", 49.02], ["speech", 8.34], ["musical instrument", 3.28]], [["music", 52.19], ["musical instrument", 2.55], ["brass instrument", 2.42]], [["music", 78.44], ["throbbing", 2.11], ["fart", 1.86]], [["speech", 21.47], ["music", 14.23], ["cowbell", 6.81]], [["music", 46.85], ["speech", 26.97], ["synthesizer", 3.41]], null, null, null, null], "duration": [0.66, 0.58, 5.84, 17.87, 3.55, 0.19, 1.59, 2.72, 0.87, 1.25, 0.52, 0.6, 0.94, 0.14, 5.28, 7.22, 6.01, 0.32, -0.02, 9.56, 2.74, 5.08, 2.97, 5.94, 0.14, 0.98, 11.41, 3.24]} \ No newline at end of file diff --git a/annotations_1/mpDGnFwbw0U_filtered.json b/annotations_1/mpDGnFwbw0U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f0d9a25dcf9dad207245c19d63eab0d0eef8765 --- /dev/null +++ b/annotations_1/mpDGnFwbw0U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.37], [8.0, 8.83], [11.0, 11.5], [13.0, 16.6], [22.0, 22.64], [23.0, 25.49], [32.0, 34.94], [38.0, 39.88], [44.0, 52.42], [55.0, 55.85], [56.0, 57.03], [57.0, 58.7], [62.0, 62.46], [91.0, 91.59], [97.0, 101.78], [123.0, 123.36]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 55.04, 0.0, 42.79, 37.62, 0.0, 44.69, 0.0, 0.0, 0.0, 0.0, 0.0, 37.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["creak", 25.14], ["fly, housefly", 15.3], ["insect", 5.84]], [["rumble", 14.01], ["throbbing", 8.43], ["vehicle horn, car horn, honking", 7.2]], null, [["hum", 41.63], ["throbbing", 15.61], ["rumble", 12.77]], null, null, null, null, null, [["speech", 45.32], ["rumble", 17.23], ["hum", 14.94]], null], "duration": [1.37, 0.83, 0.5, 3.6, 0.64, 2.49, 2.94, 1.88, 8.42, 0.85, 1.03, 1.7, 0.46, 0.59, 4.78, 0.36]} \ No newline at end of file diff --git a/annotations_1/mpG7K909Gi4_filtered.json b/annotations_1/mpG7K909Gi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf4de8b958757b6367d0b4acf1a4518adc649ddd --- /dev/null +++ b/annotations_1/mpG7K909Gi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.92], [23.0, 27.7], [29.0, 29.47], [31.0, 31.5], [36.0, 36.81], [38.0, 50.11], [51.0, 51.65], [52.0, 54.8], [60.0, 69.99], [72.0, 77.03], [78.0, 78.36], [80.0, 80.57], [83.0, 83.42], [84.0, 90.24], [93.0, 95.0], [96.0, 97.82], [99.0, 103.2], [104.0, 125.37], [127.0, 127.57], [128.0, 129.86]], "keep_status": [false, true, false, false, false, false, false, true, true, true, false, false, false, true, true, false, false, false, false, false], "silence_prob": [30.96, 30.79, 0.0, 0.0, 0.0, 29.91, 0.0, 32.03, 28.68, 30.02, 0.0, 0.0, 0.0, 35.45, 32.01, 0.0, 32.0, 28.96, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 40.11], ["insect", 35.46], ["bee, wasp, etc.", 10.27]], [["music", 32.41], ["hum", 13.3], ["gong", 9.22]], null, null, null, [["hum", 45.25], ["throbbing", 24.08], ["mains hum", 13.87]], null, [["music", 12.55], ["speech", 11.65], ["animal", 8.66]], [["music", 42.73], ["whale vocalization", 20.46], ["throbbing", 3.8]], [["music", 35.48], ["hum", 17.53], ["throbbing", 16.76]], null, null, null, [["music", 42.9], ["whale vocalization", 14.06], ["theremin", 5.55]], [["music", 46.0], ["giggle", 3.68], ["hum", 3.54]], null, [["hum", 44.15], ["mains hum", 17.67], ["throbbing", 14.6]], [["music", 38.54], ["speech", 30.92], ["buzz", 3.54]], null, null], "duration": [5.92, 4.7, 0.47, 0.5, 0.81, 12.11, 0.65, 2.8, 9.99, 5.03, 0.36, 0.57, 0.42, 6.24, 2.0, 1.82, 4.2, 21.37, 0.57, 1.86]} \ No newline at end of file diff --git a/annotations_1/mpfBH5WLlOA_filtered.json b/annotations_1/mpfBH5WLlOA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bacf228eaf6f064c9a12ab060aef84c05309a18a --- /dev/null +++ b/annotations_1/mpfBH5WLlOA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.69], [15.0, 14.84], [15.0, 15.99], [20.0, 20.46], [20.0, 20.51], [21.0, 20.61], [22.0, 26.59], [27.0, 28.38], [29.0, 38.06], [39.0, 43.73], [49.0, 89.72], [90.0, 96.38], [97.0, 105.36], [106.0, 111.11], [112.0, 116.01], [120.0, 124.68], [126.0, 128.07], [131.0, 131.9]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.37, 0.0, 40.52, 34.23, 0.0, 35.22, 28.88, 28.39, 29.47, 30.23, 35.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 42.79], ["mains hum", 15.43], ["throbbing", 11.82]], [["sine wave", 27.93], ["chirp tone", 15.18], ["speech", 11.37]], null, [["music", 24.23], ["glass", 9.52], ["speech", 7.79]], [["speech", 77.06], ["music", 5.43], ["thunk", 2.0]], [["whack, thwack", 15.57], ["breaking", 15.0], ["hammer", 13.01]], [["gong", 16.91], ["speech", 15.1], ["music", 14.8]], [["whale vocalization", 57.6], ["speech", 10.82], ["music", 9.02]], [["speech", 33.36], ["creak", 13.17], ["music", 11.8]], null], "duration": [1.69, -0.16, 0.99, 0.46, 0.51, -0.39, 4.59, 1.38, 9.06, 4.73, 40.72, 6.38, 8.36, 5.11, 4.01, 4.68, 2.07, 0.9]} \ No newline at end of file diff --git a/annotations_1/mpgaMjGOeJg_filtered.json b/annotations_1/mpgaMjGOeJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6f4f555458cb85c6abda350457dff8fe1bb0427 --- /dev/null +++ b/annotations_1/mpgaMjGOeJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.98], [11.0, 12.48], [13.0, 14.03], [17.0, 19.97], [23.0, 23.67], [26.0, 25.98], [30.0, 31.06], [34.0, 34.43], [38.0, 38.31], [45.0, 46.06], [47.0, 47.71], [48.0, 49.76], [53.0, 53.62], [57.0, 61.89], [63.0, 65.25], [68.0, 68.89], [72.0, 73.36], [76.0, 77.35], [84.0, 88.23], [89.0, 89.77], [92.0, 102.0], [103.0, 111.27], [116.0, 142.91], [146.0, 152.17], [156.0, 157.96], [159.0, 159.78], [162.0, 165.23], [166.0, 171.51], [173.0, 173.77], [175.0, 193.99], [196.0, 212.65], [217.0, 222.44], [223.0, 223.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 60.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 33.13, 0.0, 0.0, 0.0, 30.92, 0.0, 30.87, 30.52, 94.66, 82.79, 0.0, 0.0, 94.22, 68.93, 0.0, 48.19, 35.49, 33.46, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.39], ["groan", 5.58], ["rumble", 2.55]], null, null, null, [["wind instrument, woodwind instrument", 57.65], ["music", 15.01], ["didgeridoo", 10.83]], null, [["animal", 49.45], ["dog", 20.48], ["domestic animals, pets", 12.11]], [["music", 45.02], ["didgeridoo", 9.84], ["wind instrument, woodwind instrument", 9.69]], null, null, null, null, null, null, null, [["music", 75.2], ["synthesizer", 4.05], ["ambient music", 3.49]], [["music", 74.38], ["synthesizer", 5.36], ["soundtrack music", 4.11]], [["music", 65.56], ["speech", 4.07], ["explosion", 3.55]], null], "duration": [-0.02, 1.48, 1.03, 2.97, 0.67, -0.02, 1.06, 0.43, 0.31, 1.06, 0.71, 1.76, 0.62, 4.89, 2.25, 0.89, 1.36, 1.35, 4.23, 0.77, 10.0, 8.27, 26.91, 6.17, 1.96, 0.78, 3.23, 5.51, 0.77, 18.99, 16.65, 5.44, 0.82]} \ No newline at end of file diff --git a/annotations_1/mpr3XG5Tzmk_filtered.json b/annotations_1/mpr3XG5Tzmk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a08cca41cf0dea9ae3e54508965728ce0d329ce --- /dev/null +++ b/annotations_1/mpr3XG5Tzmk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.45], [15.0, 15.6], [17.0, 18.1], [21.0, 24.34], [26.0, 51.92], [53.0, 91.29], [96.0, 97.41], [103.0, 105.19], [110.0, 112.68], [125.0, 126.47], [128.0, 130.67]], "keep_status": [false, false, false, true, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 28.98, 29.66, 0.0, 0.0, 33.02, 30.73, 0.0, 28.57], "audiomae_on_audioset": [null, null, null, [["livestock, farm animals, working animals", 12.77], ["explosion", 8.68], ["insect", 8.44]], [["music", 47.85], ["hum", 14.36], ["electronic music", 8.04]], null, null, [["music", 20.74], ["moo", 7.36], ["frog", 6.44]], [["hum", 25.05], ["music", 25.0], ["mains hum", 11.82]], null, [["buzz", 11.84], ["hum", 8.93], ["fly, housefly", 8.62]]], "duration": [0.45, 0.6, 1.1, 3.34, 25.92, 38.29, 1.41, 2.19, 2.68, 1.47, 2.67]} \ No newline at end of file diff --git a/annotations_1/mqYkD0nMs04_filtered.json b/annotations_1/mqYkD0nMs04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..050218e3a9324744febc7de1dbd3bf1b9e72fe0d --- /dev/null +++ b/annotations_1/mqYkD0nMs04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.18], [10.0, 10.22], [10.0, 15.16], [26.0, 27.28], [40.0, 40.58], [42.0, 43.04], [44.0, 45.47], [50.0, 52.93], [55.0, 55.36], [58.0, 59.21], [79.0, 78.66], [80.0, 81.24], [84.0, 84.18], [89.0, 89.09], [90.0, 90.22]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.59, 0.0, 0.0, 0.0, 0.0, 48.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 65.65], ["speech", 14.66], ["electronic music", 5.37]], null, null, null, null, [["boing", 42.19], ["speech", 16.88], ["dog", 3.81]], null, null, null, null, null, null, null], "duration": [0.18, 0.22, 5.16, 1.28, 0.58, 1.04, 1.47, 2.93, 0.36, 1.21, -0.34, 1.24, 0.18, 0.09, 0.22]} \ No newline at end of file diff --git a/annotations_1/mqhpZ30uNic_filtered.json b/annotations_1/mqhpZ30uNic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18a99747db3a7106ac19977bbf72583f8b6cbf42 --- /dev/null +++ b/annotations_1/mqhpZ30uNic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [3.0, 121.0], [122.0, 130.55], [146.0, 146.1], [152.0, 153.57], [157.0, 163.75], [165.0, 170.78], [172.0, 173.85], [175.0, 184.62]], "keep_status": [false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.45, 0.0, 0.0, 56.4, 36.21, 0.0, 48.27], "audiomae_on_audioset": [null, null, [["music", 34.72], ["hum", 12.78], ["whale vocalization", 5.66]], null, null, null, [["dog", 27.09], ["animal", 26.22], ["bow-wow", 19.09]], null, [["whale vocalization", 85.24], ["speech", 5.43], ["animal", 1.21]]], "duration": [0.66, 118.0, 8.55, 0.1, 1.57, 6.75, 5.78, 1.85, 9.62]} \ No newline at end of file diff --git a/annotations_1/mqkYeGeQ1f4_filtered.json b/annotations_1/mqkYeGeQ1f4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41ada88a4b84fffc2a6af406d805ec29a34021f7 --- /dev/null +++ b/annotations_1/mqkYeGeQ1f4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.5], [27.0, 45.87], [47.0, 80.01], [85.0, 98.98]], "keep_status": [false, true, false, false], "silence_prob": [0.0, 30.3, 0.0, 30.58], "audiomae_on_audioset": [null, [["music", 35.05], ["hum", 12.21], ["mains hum", 6.24]], null, [["music", 51.07], ["hum", 19.01], ["throbbing", 9.3]]], "duration": [0.5, 18.87, 33.01, 13.98]} \ No newline at end of file diff --git a/annotations_1/mr1bVID2qao_filtered.json b/annotations_1/mr1bVID2qao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c96376d4ee14d08f2ee0f5bc666f6fbcd831328 --- /dev/null +++ b/annotations_1/mr1bVID2qao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.91], [12.0, 13.17], [15.0, 15.38], [28.0, 28.43], [59.0, 69.4], [98.0, 97.83], [100.0, 100.62], [129.0, 130.13], [144.0, 144.14], [144.0, 144.17], [145.0, 145.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.21, 0.0, 0.0, 0.0, 32.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 73.61], ["synthesizer", 5.84], ["musical instrument", 3.62]], null, null, null, [["music", 80.57], ["musical instrument", 1.51], ["cello", 1.26]], null, null, null, null, null, null], "duration": [5.91, 1.17, 0.38, 0.43, 10.4, -0.17, 0.62, 1.13, 0.14, 0.17, 0.39]} \ No newline at end of file diff --git a/annotations_1/mr3L2D4yv-0_filtered.json b/annotations_1/mr3L2D4yv-0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d994c5d8769a0b76cb92043d4f7628606fe875e --- /dev/null +++ b/annotations_1/mr3L2D4yv-0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 57.05], [58.0, 64.42], [65.0, 66.04], [66.0, 76.08], [78.0, 83.12], [85.0, 93.38], [95.0, 96.38], [96.0, 96.47], [96.0, 96.52]], "keep_status": [false, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 30.43, 0.0, 31.79, 98.36, 33.21, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 38.92], ["speech", 15.03], ["hum", 4.33]], null, [["music", 42.64], ["smash, crash", 5.61], ["sound effect", 5.28]], null, [["hum", 16.13], ["machine gun", 13.99], ["breaking", 12.44]], null, null, null], "duration": [55.05, 6.42, 1.04, 10.08, 5.12, 8.38, 1.38, 0.47, 0.52]} \ No newline at end of file diff --git a/annotations_1/msSsPzKVzW0_filtered.json b/annotations_1/msSsPzKVzW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46ede202a6de4be4134f01d40ad48a9c6fb05103 --- /dev/null +++ b/annotations_1/msSsPzKVzW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.8], [7.0, 7.55], [9.0, 9.73], [13.0, 14.05], [25.0, 25.35], [30.0, 31.92], [38.0, 38.38], [43.0, 43.06], [47.0, 46.65], [47.0, 48.51], [49.0, 49.05], [53.0, 53.32], [56.0, 56.13], [57.0, 57.55], [59.0, 58.99], [60.0, 60.52], [62.0, 63.14], [67.0, 67.36], [68.0, 68.71], [73.0, 73.21], [75.0, 75.59], [76.0, 77.03], [83.0, 83.12], [93.0, 92.99], [104.0, 104.94], [105.0, 105.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 0.55, 0.73, 1.05, 0.35, 1.92, 0.38, 0.06, -0.35, 1.51, 0.05, 0.32, 0.13, 0.55, -0.01, 0.52, 1.14, 0.36, 0.71, 0.21, 0.59, 1.03, 0.12, -0.01, 0.94, 0.76]} \ No newline at end of file diff --git a/annotations_1/msWWI02CG-o_filtered.json b/annotations_1/msWWI02CG-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbd208f5f0da6ce8d261954af073ede6de45afd7 --- /dev/null +++ b/annotations_1/msWWI02CG-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.94], [14.0, 15.3], [22.0, 23.08], [26.0, 27.09], [35.0, 35.36], [36.0, 37.66], [38.0, 39.55], [44.0, 48.81], [49.0, 50.14], [51.0, 51.41], [52.0, 52.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 65.26], ["electronic music", 5.81], ["techno", 3.01]], null, null, null], "duration": [1.94, 1.3, 1.08, 1.09, 0.36, 1.66, 1.55, 4.81, 1.14, 0.41, 0.22]} \ No newline at end of file diff --git a/annotations_1/ms_ERfOYnqI_filtered.json b/annotations_1/ms_ERfOYnqI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b100fee9f10f5afd48a3e5faa60afbd7f0d334c4 --- /dev/null +++ b/annotations_1/ms_ERfOYnqI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 55.75], [58.0, 70.43], [72.0, 72.4], [73.0, 76.77], [78.0, 79.27], [80.0, 84.28], [87.0, 92.3], [95.0, 101.48]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 29.27, 0.0, 57.72, 0.0, 63.53, 51.94, 57.32], "audiomae_on_audioset": [null, [["sound effect", 12.76], ["speech", 10.79], ["explosion", 9.59]], null, null, null, null, null, null], "duration": [40.75, 12.43, 0.4, 3.77, 1.27, 4.28, 5.3, 6.48]} \ No newline at end of file diff --git a/annotations_1/msoyjm3gCBM_filtered.json b/annotations_1/msoyjm3gCBM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cecdd8993d441d11afd04b2051b709e997e1e6fb --- /dev/null +++ b/annotations_1/msoyjm3gCBM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 120.66], [124.0, 129.22], [131.0, 135.11], [138.0, 139.01], [143.0, 160.57]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 28.16, 28.42, 0.0, 28.29], "audiomae_on_audioset": [null, [["music", 47.76], ["speech", 9.24], ["crowd", 3.85]], [["music", 46.87], ["throbbing", 17.09], ["hum", 12.87]], null, [["music", 66.75], ["vehicle", 3.99], ["car", 3.02]]], "duration": [60.66, 5.22, 4.11, 1.01, 17.57]} \ No newline at end of file diff --git a/annotations_1/msqRzlYXXQE_filtered.json b/annotations_1/msqRzlYXXQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92faf37425291c4d8fd9a260ff94c0201e3baa73 --- /dev/null +++ b/annotations_1/msqRzlYXXQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 72.74]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [58.74]} \ No newline at end of file diff --git a/annotations_1/mtsQ0CR4Z28_filtered.json b/annotations_1/mtsQ0CR4Z28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..add54beeff18f2339ad3673c41aebf4834f02b93 --- /dev/null +++ b/annotations_1/mtsQ0CR4Z28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 68.44], [71.0, 71.83], [72.0, 84.48], [85.0, 86.0], [96.0, 97.23], [99.0, 101.29], [102.0, 108.82], [118.0, 119.75], [120.0, 121.47]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.46, 0.0, 0.0, 67.13, 43.85, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 48.01], ["buzz", 19.7], ["speech", 4.53]], null, null, null, [["music", 60.19], ["theremin", 10.74], ["musical instrument", 5.34]], null, null], "duration": [54.44, 0.83, 12.48, 1.0, 1.23, 2.29, 6.82, 1.75, 1.47]} \ No newline at end of file diff --git a/annotations_1/mvH6IhKpehk_filtered.json b/annotations_1/mvH6IhKpehk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..792049977dced172ca16befcc5cf1f41fc5f97a7 --- /dev/null +++ b/annotations_1/mvH6IhKpehk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.92], [10.0, 11.1], [12.0, 13.17], [18.0, 18.28], [19.0, 19.75], [20.0, 20.88], [21.0, 34.05], [40.0, 44.81], [53.0, 53.25], [63.0, 63.17], [65.0, 65.26], [80.0, 80.57], [91.0, 90.75], [92.0, 92.23], [105.0, 105.68], [108.0, 108.73], [111.0, 112.04], [113.0, 113.19], [133.0, 132.73], [138.0, 138.75], [139.0, 139.53], [140.0, 140.58], [146.0, 146.57], [154.0, 154.14]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 35.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 45.08], ["didgeridoo", 8.71], ["musical instrument", 5.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 1.1, 1.17, 0.28, 0.75, 0.88, 13.05, 4.81, 0.25, 0.17, 0.26, 0.57, -0.25, 0.23, 0.68, 0.73, 1.04, 0.19, -0.27, 0.75, 0.53, 0.58, 0.57, 0.14]} \ No newline at end of file diff --git a/annotations_1/mwMmZ8dtWNM_filtered.json b/annotations_1/mwMmZ8dtWNM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a54c90c18021fa2cc0c8abd734a397d341249ee --- /dev/null +++ b/annotations_1/mwMmZ8dtWNM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.44], [8.0, 8.82], [17.0, 17.49], [22.0, 22.82], [45.0, 45.45], [47.0, 47.95], [54.0, 55.32], [62.0, 62.63], [64.0, 64.0], [71.0, 73.09], [74.0, 77.79], [80.0, 80.99], [84.0, 87.67], [89.0, 91.5], [92.0, 96.4], [103.0, 104.26], [105.0, 105.16], [106.0, 116.21], [122.0, 122.49], [124.0, 140.12], [142.0, 142.64], [144.0, 145.02], [147.0, 150.31], [153.0, 153.66], [168.0, 167.97], [170.0, 171.37], [178.0, 178.85], [185.0, 185.16], [187.0, 187.52], [192.0, 192.89], [194.0, 197.09], [200.0, 201.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44, 99.87, 0.0, 100.0, 98.1, 82.97, 0.0, 0.0, 79.59, 0.0, 50.02, 0.0, 0.0, 46.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.26], ["speech", 6.91], ["musical instrument", 2.62]], null, null, null, null, null, null, null, null, null], "duration": [3.44, 0.82, 0.49, 0.82, 0.45, 0.95, 1.32, 0.63, 0.0, 2.09, 3.79, 0.99, 3.67, 2.5, 4.4, 1.26, 0.16, 10.21, 0.49, 16.12, 0.64, 1.02, 3.31, 0.66, -0.03, 1.37, 0.85, 0.16, 0.52, 0.89, 3.09, 1.23]} \ No newline at end of file diff --git a/annotations_1/mxz_RfabdUo_filtered.json b/annotations_1/mxz_RfabdUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e8960e61349848707711f592c951dc743074060 --- /dev/null +++ b/annotations_1/mxz_RfabdUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [13.0, 13.86], [14.0, 14.23], [23.0, 25.24], [29.0, 29.47], [32.0, 32.24], [33.0, 33.52], [35.0, 36.0], [37.0, 37.22], [39.0, 47.58], [49.0, 50.25], [51.0, 55.09], [56.0, 56.73], [58.0, 58.16], [72.0, 72.22], [75.0, 74.95], [77.0, 76.81], [77.0, 77.38], [80.0, 80.01], [83.0, 83.4], [87.0, 87.76], [94.0, 94.15], [96.0, 97.12], [103.0, 103.94], [106.0, 106.2], [114.0, 115.28], [117.0, 117.41], [131.0, 131.35], [133.0, 133.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.95, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 0.86, 0.23, 2.24, 0.47, 0.24, 0.52, 1.0, 0.22, 8.58, 1.25, 4.09, 0.73, 0.16, 0.22, -0.05, -0.19, 0.38, 0.01, 0.4, 0.76, 0.15, 1.12, 0.94, 0.2, 1.28, 0.41, 0.35, 0.47]} \ No newline at end of file diff --git a/annotations_1/mySMw3VkEBE_filtered.json b/annotations_1/mySMw3VkEBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b288832a6a4df4e5350c8f284df9a05bde6b734d --- /dev/null +++ b/annotations_1/mySMw3VkEBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.31], [5.0, 9.96], [11.0, 14.35], [16.0, 21.54], [24.0, 27.11], [28.0, 30.15], [31.0, 34.26], [36.0, 37.2], [38.0, 39.02], [43.0, 44.51], [46.0, 46.06], [47.0, 48.46], [51.0, 51.26], [54.0, 54.6], [56.0, 61.01], [62.0, 72.06], [77.0, 89.31], [100.0, 101.53], [104.0, 104.82], [120.0, 129.07], [130.0, 132.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.94, 53.72, 99.16, 75.72, 70.86, 99.05, 52.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.92, 56.63, 37.93, 0.0, 0.0, 72.16, 52.92], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["busy signal", 31.57], ["dial tone", 30.06], ["sine wave", 12.16]], null, [["speech", 43.58], ["telephone", 25.47], ["telephone bell ringing", 16.28]], null, null, null, null], "duration": [3.31, 4.96, 3.35, 5.54, 3.11, 2.15, 3.26, 1.2, 1.02, 1.51, 0.06, 1.46, 0.26, 0.6, 5.01, 10.06, 12.31, 1.53, 0.82, 9.07, 2.16]} \ No newline at end of file diff --git a/annotations_1/myZDn8fFRLY_filtered.json b/annotations_1/myZDn8fFRLY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75dabbc259706ba17d32554aff22c9775dd4c971 --- /dev/null +++ b/annotations_1/myZDn8fFRLY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 18.44], [26.0, 27.35], [50.0, 63.58], [69.0, 70.07], [73.0, 72.94], [104.0, 104.25], [107.0, 107.81], [112.0, 112.31], [113.0, 114.12], [115.0, 116.02], [131.0, 132.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [53.47, 0.0, 32.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 55.49], ["speech", 18.28], ["groan", 6.54]], null, null, null, null, null, null, null, null], "duration": [13.44, 1.35, 13.58, 1.07, -0.06, 0.25, 0.81, 0.31, 1.12, 1.02, 1.71]} \ No newline at end of file diff --git a/annotations_1/mycAsRhAr_M_filtered.json b/annotations_1/mycAsRhAr_M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..539bb68871bfd32402fd75705846edb96aff8dcf --- /dev/null +++ b/annotations_1/mycAsRhAr_M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.7], [8.0, 7.74], [8.0, 7.77], [8.0, 7.8], [8.0, 13.78], [15.0, 16.02], [17.0, 19.28], [23.0, 24.38], [26.0, 26.74], [27.0, 32.32], [34.0, 39.26], [40.0, 41.15], [44.0, 45.81], [49.0, 53.43], [54.0, 56.88], [58.0, 62.9], [65.0, 70.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.4, 0.0, 62.99, 0.0, 0.0, 78.21, 95.37, 0.0, 0.0, 51.82, 48.69, 43.1, 43.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.22], ["theremin", 18.15], ["shofar", 13.29]], [["theremin", 50.28], ["music", 22.98], ["speech", 5.53]], [["music", 65.09], ["theremin", 19.74], ["musical instrument", 3.06]]], "duration": [-0.3, -0.26, -0.23, -0.2, 5.78, 1.02, 2.28, 1.38, 0.74, 5.32, 5.26, 1.15, 1.81, 4.43, 2.88, 4.9, 5.28]} \ No newline at end of file diff --git a/annotations_1/mz6dgt11n-E_filtered.json b/annotations_1/mz6dgt11n-E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13ed034baf16b0358f15f9b1290ba5d625e9085c --- /dev/null +++ b/annotations_1/mz6dgt11n-E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.8], [11.0, 12.51], [14.0, 14.84], [15.0, 15.74], [19.0, 22.35], [23.0, 23.77], [24.0, 25.46], [27.0, 29.0], [29.0, 30.55], [37.0, 37.71], [43.0, 43.16], [44.0, 45.03], [51.0, 51.85], [53.0, 53.1], [54.0, 55.21], [56.0, 60.35], [64.0, 65.48], [72.0, 71.88], [75.0, 76.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 1.51, 0.84, 0.74, 3.35, 0.77, 1.46, 2.0, 1.55, 0.71, 0.16, 1.03, 0.85, 0.1, 1.21, 4.35, 1.48, -0.12, 1.94]} \ No newline at end of file diff --git a/annotations_1/n0QO2xOuqp0_filtered.json b/annotations_1/n0QO2xOuqp0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..deac3708f656a93b7c11ef5c6ad1388771e9ba0f --- /dev/null +++ b/annotations_1/n0QO2xOuqp0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.09], [13.0, 23.8], [26.0, 25.84], [28.0, 28.54], [34.0, 34.97], [40.0, 42.36], [44.0, 49.52], [54.0, 57.87], [63.0, 79.02], [83.0, 93.51], [97.0, 98.81], [105.0, 105.21], [110.0, 115.16], [126.0, 132.81], [145.0, 147.56], [154.0, 157.3], [158.0, 158.16], [159.0, 160.88], [162.0, 167.81]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [30.79, 29.02, 0.0, 0.0, 0.0, 28.97, 28.98, 29.49, 28.84, 29.21, 0.0, 0.0, 28.9, 28.81, 29.18, 29.53, 0.0, 0.0, 28.78], "audiomae_on_audioset": [[["music", 60.94], ["throbbing", 9.68], ["sidetone", 2.85]], [["smash, crash", 44.44], ["whack, thwack", 22.46], ["music", 22.03]], null, null, null, [["music", 23.22], ["speech", 16.01], ["cattle, bovinae", 8.83]], [["speech", 39.6], ["vehicle", 12.86], ["music", 9.58]], [["music", 56.91], ["speech", 30.17], ["sidetone", 2.35]], [["music", 78.33], ["speech", 3.14], ["whip", 1.98]], [["music", 52.14], ["cacophony", 8.1], ["throbbing", 7.43]], null, null, [["music", 64.81], ["speech", 14.85], ["boing", 5.07]], [["music", 71.59], ["speech", 5.9], ["musical instrument", 1.61]], [["music", 36.66], ["speech", 27.72], ["electronic music", 7.16]], [["music", 46.65], ["throbbing", 28.08], ["hum", 7.3]], null, null, [["throbbing", 56.65], ["music", 15.17], ["hum", 14.51]]], "duration": [2.09, 10.8, -0.16, 0.54, 0.97, 2.36, 5.52, 3.87, 16.02, 10.51, 1.81, 0.21, 5.16, 6.81, 2.56, 3.3, 0.16, 1.88, 5.81]} \ No newline at end of file diff --git a/annotations_1/n1GlWng3oOQ_filtered.json b/annotations_1/n1GlWng3oOQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bfe1485723b949724312e1117befd2976f27db3a --- /dev/null +++ b/annotations_1/n1GlWng3oOQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 58.31], [59.0, 59.9], [60.0, 62.29], [63.0, 64.64], [66.0, 68.98], [70.0, 78.22], [79.0, 82.46], [84.0, 87.86], [89.0, 90.14], [91.0, 93.82], [95.0, 96.11], [97.0, 99.32], [100.0, 102.07], [103.0, 115.96], [116.0, 119.65], [120.0, 127.95], [131.0, 131.84], [133.0, 133.93], [135.0, 136.41], [138.0, 139.09], [140.0, 148.0], [149.0, 155.56], [156.0, 159.0], [160.0, 164.69], [165.0, 168.84], [170.0, 174.85], [176.0, 177.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [51.23, 0.0, 62.78, 0.0, 64.29, 58.38, 74.29, 85.9, 0.0, 98.36, 0.0, 92.97, 97.33, 58.47, 77.36, 62.99, 0.0, 0.0, 0.0, 0.0, 56.86, 56.86, 69.47, 73.67, 57.89, 53.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.31, 0.9, 2.29, 1.64, 2.98, 8.22, 3.46, 3.86, 1.14, 2.82, 1.11, 2.32, 2.07, 12.96, 3.65, 7.95, 0.84, 0.93, 1.41, 1.09, 8.0, 6.56, 3.0, 4.69, 3.84, 4.85, 1.96]} \ No newline at end of file diff --git a/annotations_1/n1VEmXiaFY4_filtered.json b/annotations_1/n1VEmXiaFY4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9eb77a736ce5b9c542afebc998cdf9f525b60f3 --- /dev/null +++ b/annotations_1/n1VEmXiaFY4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[86.0, 107.08], [108.0, 110.08], [117.0, 120.04], [122.0, 127.04], [129.0, 135.14], [137.0, 143.31], [143.0, 147.72], [148.0, 149.45], [153.0, 155.78], [162.0, 162.5]], "keep_status": [false, true, false, false, false, true, false, false, false, false], "silence_prob": [31.51, 46.68, 64.63, 53.84, 61.37, 48.95, 40.92, 0.0, 99.44, 0.0], "audiomae_on_audioset": [[["music", 61.4], ["hum", 10.88], ["throbbing", 7.79]], [["speech", 26.03], ["music", 20.1], ["hum", 14.09]], null, null, null, [["music", 29.49], ["gong", 13.49], ["singing bowl", 9.7]], [["speech", 67.48], ["music", 19.33], ["sidetone", 2.92]], null, null, null], "duration": [21.08, 2.08, 3.04, 5.04, 6.14, 6.31, 4.72, 1.45, 2.78, 0.5]} \ No newline at end of file diff --git a/annotations_1/n2YCseaZK0Q_filtered.json b/annotations_1/n2YCseaZK0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ae51eef1dfb54ae9d483bc0a3b1c3d9d971f3d6 --- /dev/null +++ b/annotations_1/n2YCseaZK0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.12], [7.0, 8.04], [15.0, 16.02], [19.0, 20.48], [24.0, 27.72], [29.0, 34.13], [35.0, 36.37], [38.0, 38.67], [40.0, 41.84], [43.0, 52.78], [57.0, 61.59], [63.0, 64.13], [70.0, 72.27], [75.0, 75.69], [76.0, 92.6], [94.0, 97.02], [103.0, 109.02], [109.0, 121.85], [122.0, 124.92], [126.0, 127.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 58.98, 51.99, 0.0, 0.0, 0.0, 53.91, 57.97, 0.0, 53.65, 0.0, 48.74, 49.18, 48.87, 40.16, 44.63, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 24.62], ["hum", 20.8], ["throbbing", 13.72]], [["throbbing", 36.44], ["hum", 21.45], ["music", 17.25]], [["throbbing", 45.32], ["hum", 25.45], ["mains hum", 5.77]], [["hum", 45.11], ["throbbing", 17.55], ["mains hum", 14.93]], [["throbbing", 28.32], ["hum", 28.0], ["music", 22.52]], null], "duration": [1.12, 1.04, 1.02, 1.48, 3.72, 5.13, 1.37, 0.67, 1.84, 9.78, 4.59, 1.13, 2.27, 0.69, 16.6, 3.02, 6.02, 12.85, 2.92, 1.63]} \ No newline at end of file diff --git a/annotations_1/n3L8UVTe6Ak_filtered.json b/annotations_1/n3L8UVTe6Ak_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5621d200c92049a4dba6afcbffb2db8551ace9b --- /dev/null +++ b/annotations_1/n3L8UVTe6Ak_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.29], [7.0, 8.5], [12.0, 13.09], [17.0, 17.86], [22.0, 22.98], [26.0, 26.16], [34.0, 36.02], [39.0, 39.88], [40.0, 40.41], [43.0, 45.22], [47.0, 49.65], [51.0, 52.41], [54.0, 54.95], [57.0, 59.17], [69.0, 69.25], [71.0, 71.47], [73.0, 73.99], [77.0, 77.62], [79.0, 80.22], [82.0, 83.07], [85.0, 88.74], [91.0, 147.46], [148.0, 149.37], [153.0, 154.31], [166.0, 167.04], [170.0, 170.65], [175.0, 179.25], [181.0, 196.23], [197.0, 198.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.86, 0.0, 0.0, 64.75, 86.09, 0.0, 0.0, 68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.39, 0.0, 0.0, 0.0, 0.0, 0.0, 49.87, 31.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.15], ["music", 14.2], ["croak", 7.45]], null, null, null, null, null, [["music", 31.26], ["hum", 10.83], ["speech", 7.24]], [["music", 46.67], ["speech", 16.5], ["hum", 8.78]], null], "duration": [0.29, 1.5, 1.09, 0.86, 0.98, 0.16, 2.02, 0.88, 0.41, 2.22, 2.65, 1.41, 0.95, 2.17, 0.25, 0.47, 0.99, 0.62, 1.22, 1.07, 3.74, 56.46, 1.37, 1.31, 1.04, 0.65, 4.25, 15.23, 1.78]} \ No newline at end of file diff --git a/annotations_1/n3tXVrGw3kY_filtered.json b/annotations_1/n3tXVrGw3kY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..480d74950ed52d84939c7357cc92b80a7e870508 --- /dev/null +++ b/annotations_1/n3tXVrGw3kY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.59], [9.0, 9.95], [12.0, 12.56], [21.0, 21.73], [25.0, 25.56], [30.0, 33.2], [39.0, 40.19], [50.0, 51.95], [54.0, 55.56], [62.0, 63.0], [83.0, 84.89], [87.0, 88.11], [91.0, 92.53], [97.0, 96.92], [101.0, 101.78], [118.0, 118.79], [127.0, 128.61]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.41, 0.0, 0.0, 0.0, 0.0, 33.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 36.88], ["fart", 13.92], ["whip", 12.62]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.59, 0.95, 0.56, 0.73, 0.56, 3.2, 1.19, 1.95, 1.56, 1.0, 1.89, 1.11, 1.53, -0.08, 0.78, 0.79, 1.61]} \ No newline at end of file diff --git a/annotations_1/n44APWaJZ58_filtered.json b/annotations_1/n44APWaJZ58_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..932b7f7fcf6f11486d822d4d187660bd70bc6516 --- /dev/null +++ b/annotations_1/n44APWaJZ58_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.61], [8.0, 7.87], [13.0, 14.66], [20.0, 21.15], [27.0, 28.17], [30.0, 30.4], [34.0, 36.51], [38.0, 38.03], [41.0, 41.17], [47.0, 48.63], [49.0, 49.65], [50.0, 53.06], [58.0, 92.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.08, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, -0.13, 1.66, 1.15, 1.17, 0.4, 2.51, 0.03, 0.17, 1.63, 0.65, 3.06, 34.75]} \ No newline at end of file diff --git a/annotations_1/n4bsNkDyF2s_filtered.json b/annotations_1/n4bsNkDyF2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8593977a343a4122e8e7621af53fcb6661e05f49 --- /dev/null +++ b/annotations_1/n4bsNkDyF2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.2], [13.0, 20.39], [23.0, 41.74], [45.0, 60.98]], "keep_status": [false, true, false, true], "silence_prob": [0.0, 43.13, 28.4, 28.3], "audiomae_on_audioset": [null, [["hum", 28.06], ["music", 24.89], ["mains hum", 9.15]], [["music", 76.33], ["speech", 3.77], ["throbbing", 1.9]], [["music", 28.71], ["speech", 13.55], ["explosion", 7.93]]], "duration": [0.2, 7.39, 18.74, 15.98]} \ No newline at end of file diff --git a/annotations_1/n4pUbyGBD18_filtered.json b/annotations_1/n4pUbyGBD18_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..022cbd4a2b7080fd3bcee8ee51d50b1460471b63 --- /dev/null +++ b/annotations_1/n4pUbyGBD18_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.99], [2.0, 2.78], [5.0, 6.61], [8.0, 7.96], [10.0, 10.4], [12.0, 12.88], [19.0, 19.45], [28.0, 31.48], [33.0, 33.05], [34.0, 34.82], [42.0, 42.53], [43.0, 43.85], [46.0, 48.81], [51.0, 51.54], [53.0, 53.64], [55.0, 55.36], [56.0, 56.47], [57.0, 58.16], [59.0, 61.47], [64.0, 64.39], [65.0, 74.21], [77.0, 87.39], [88.0, 88.43], [89.0, 136.19], [139.0, 140.37], [142.0, 143.07]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.86, 0.0, 0.0, 0.0, 0.0, 42.79, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0, 30.85, 48.91, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["sidetone", 25.07], ["hum", 11.98], ["mains hum", 9.89]], null, null, null, null, [["fly, housefly", 46.56], ["bee, wasp, etc.", 17.51], ["insect", 13.29]], null, null, null, null, null, [["fly, housefly", 41.02], ["insect", 16.67], ["bee, wasp, etc.", 9.37]], null, [["music", 17.09], ["hum", 15.72], ["mains hum", 6.0]], [["music", 45.62], ["wind instrument, woodwind instrument", 6.03], ["hum", 5.13]], null, null, null, null], "duration": [-0.01, 0.78, 1.61, -0.04, 0.4, 0.88, 0.45, 3.48, 0.05, 0.82, 0.53, 0.85, 2.81, 0.54, 0.64, 0.36, 0.47, 1.16, 2.47, 0.39, 9.21, 10.39, 0.43, 47.19, 1.37, 1.07]} \ No newline at end of file diff --git a/annotations_1/n59mG9_X35Q_filtered.json b/annotations_1/n59mG9_X35Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db1fd9aa81daa67a9f69850bd6f93c404cfd5f62 --- /dev/null +++ b/annotations_1/n59mG9_X35Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.65], [7.0, 8.18], [14.0, 18.4], [20.0, 20.24], [21.0, 21.49], [28.0, 29.49], [35.0, 39.68], [41.0, 48.25], [52.0, 58.35], [58.0, 58.53], [59.0, 60.44], [62.0, 63.64], [73.0, 73.47], [74.0, 80.5], [86.0, 87.27], [89.0, 90.41], [95.0, 99.84]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.7, 0.0, 0.0, 0.0, 29.06, 30.0, 32.37, 0.0, 0.0, 0.0, 0.0, 36.39, 0.0, 0.0, 32.34], "audiomae_on_audioset": [null, null, [["music", 28.91], ["grunt", 18.4], ["speech", 13.9]], null, null, null, [["music", 39.54], ["throbbing", 19.77], ["hum", 14.23]], [["speech", 43.08], ["music", 34.74], ["throbbing", 2.89]], [["music", 53.7], ["theremin", 13.93], ["soundtrack music", 4.33]], null, null, null, null, [["music", 76.5], ["didgeridoo", 8.69], ["musical instrument", 3.55]], null, null, [["music", 48.87], ["grunt", 22.24], ["animal", 13.24]]], "duration": [0.65, 1.18, 4.4, 0.24, 0.49, 1.49, 4.68, 7.25, 6.35, 0.53, 1.44, 1.64, 0.47, 6.5, 1.27, 1.41, 4.84]} \ No newline at end of file diff --git a/annotations_1/n5tMCxz-9uY_filtered.json b/annotations_1/n5tMCxz-9uY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf5d2b25c94eaab4e83e87cedddd55155709376b --- /dev/null +++ b/annotations_1/n5tMCxz-9uY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.76], [26.0, 30.79], [44.0, 44.12], [50.0, 50.75], [53.0, 53.15], [55.0, 56.78], [58.0, 61.82], [68.0, 68.49], [78.0, 79.14], [93.0, 92.99], [102.0, 102.05], [104.0, 104.57], [111.0, 111.84], [121.0, 122.5], [125.0, 136.78], [140.0, 151.58], [157.0, 157.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 31.2, 0.0, 0.0, 0.0, 0.0, 30.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.32, 30.57, 0.0], "audiomae_on_audioset": [null, [["music", 78.77], ["quack", 2.23], ["boing", 1.9]], null, null, null, null, [["music", 95.33], ["musical instrument", 0.6], ["guitar", 0.44]], null, null, null, null, null, null, null, [["music", 49.87], ["boing", 15.09], ["speech", 4.89]], [["music", 83.62], ["reggae", 1.58], ["drum and bass", 1.27]], null], "duration": [1.76, 4.79, 0.12, 0.75, 0.15, 1.78, 3.82, 0.49, 1.14, -0.01, 0.05, 0.57, 0.84, 1.5, 11.78, 11.58, 0.76]} \ No newline at end of file diff --git a/annotations_1/n6H7zga2Ks0_filtered.json b/annotations_1/n6H7zga2Ks0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c71ab910a32c7db3eb18318f483500ce585d1218 --- /dev/null +++ b/annotations_1/n6H7zga2Ks0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.03], [12.0, 13.26], [16.0, 17.27], [21.0, 23.21], [24.0, 26.05], [28.0, 29.03], [31.0, 33.94], [34.0, 36.0], [38.0, 40.02], [46.0, 45.99], [48.0, 50.6], [55.0, 56.02], [57.0, 58.41], [59.0, 60.03], [62.0, 63.85], [65.0, 66.02], [67.0, 67.49], [69.0, 69.13], [76.0, 78.07], [84.0, 84.47], [85.0, 87.99], [90.0, 95.99], [96.0, 99.42], [102.0, 103.72], [104.0, 105.43], [107.0, 106.98], [108.0, 109.98], [111.0, 112.75], [114.0, 114.67], [115.0, 116.77], [119.0, 119.52], [123.0, 123.82], [124.0, 126.79], [128.0, 128.55], [130.0, 132.27], [133.0, 136.22], [137.0, 138.3], [139.0, 142.82], [143.0, 144.59], [146.0, 148.19]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 0.0, 99.48, 86.82, 0.0, 100.0, 48.91, 83.7, 0.0, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 78.38, 99.95, 99.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.22, 0.0, 100.0, 100.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 54.23], ["sidetone", 10.47], ["hum", 5.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.03, 1.26, 1.27, 2.21, 2.05, 1.03, 2.94, 2.0, 2.02, -0.01, 2.6, 1.02, 1.41, 1.03, 1.85, 1.02, 0.49, 0.13, 2.07, 0.47, 2.99, 5.99, 3.42, 1.72, 1.43, -0.02, 1.98, 1.75, 0.67, 1.77, 0.52, 0.82, 2.79, 0.55, 2.27, 3.22, 1.3, 3.82, 1.59, 2.19]} \ No newline at end of file diff --git a/annotations_1/n7l2RLvI7Ss_filtered.json b/annotations_1/n7l2RLvI7Ss_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4284c47930b9e567aaf44b2883a21470191e68d0 --- /dev/null +++ b/annotations_1/n7l2RLvI7Ss_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.05], [9.0, 9.14], [12.0, 12.7], [18.0, 22.33], [26.0, 26.74], [29.0, 28.78], [30.0, 30.74], [33.0, 33.1], [34.0, 34.97], [35.0, 35.56], [40.0, 40.1], [41.0, 41.07], [49.0, 49.33], [50.0, 50.89], [53.0, 54.21], [56.0, 56.88], [61.0, 61.77], [63.0, 65.94], [66.0, 67.26], [68.0, 68.17], [69.0, 69.18], [69.0, 70.02], [71.0, 71.27], [73.0, 73.8], [76.0, 77.6], [78.0, 78.92], [80.0, 80.0], [81.0, 81.6], [83.0, 82.88], [84.0, 83.91], [84.0, 85.41], [88.0, 88.64], [94.0, 94.09], [96.0, 96.97], [98.0, 98.0], [98.0, 100.14], [102.0, 104.13], [106.0, 107.13], [109.0, 109.41], [110.0, 111.94], [114.0, 114.07], [115.0, 115.45], [116.0, 115.96], [116.0, 117.21], [125.0, 125.02], [130.0, 130.22], [131.0, 130.98], [132.0, 132.22], [134.0, 133.64], [136.0, 136.78], [139.0, 140.17], [141.0, 141.61], [143.0, 143.83], [144.0, 144.88], [146.0, 146.5], [147.0, 147.68], [148.0, 148.46], [151.0, 151.5], [152.0, 152.19], [153.0, 153.39], [156.0, 156.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 97.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.05, 0.14, 0.7, 4.33, 0.74, -0.22, 0.74, 0.1, 0.97, 0.56, 0.1, 0.07, 0.33, 0.89, 1.21, 0.88, 0.77, 2.94, 1.26, 0.17, 0.18, 1.02, 0.27, 0.8, 1.6, 0.92, 0.0, 0.6, -0.12, -0.09, 1.41, 0.64, 0.09, 0.97, 0.0, 2.14, 2.13, 1.13, 0.41, 1.94, 0.07, 0.45, -0.04, 1.21, 0.02, 0.22, -0.02, 0.22, -0.36, 0.78, 1.17, 0.61, 0.83, 0.88, 0.5, 0.68, 0.46, 0.5, 0.19, 0.39, 0.79]} \ No newline at end of file diff --git a/annotations_1/n8yUoQP6Rwo_filtered.json b/annotations_1/n8yUoQP6Rwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..529e93efc5114dfe22f528f8b78693b67cc17e11 --- /dev/null +++ b/annotations_1/n8yUoQP6Rwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.89], [5.0, 5.61], [9.0, 16.66], [22.0, 30.91], [36.0, 41.44], [42.0, 42.62], [44.0, 52.37], [54.0, 56.2], [61.0, 62.14], [64.0, 82.86]], "keep_status": [false, false, false, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 49.59, 30.13, 28.67, 0.0, 29.12, 29.44, 0.0, 29.3], "audiomae_on_audioset": [null, null, [["whale vocalization", 64.52], ["music", 11.4], ["speech", 8.86]], [["whale vocalization", 25.82], ["animal", 11.63], ["buzz", 8.67]], [["animal", 13.18], ["speech", 11.35], ["livestock, farm animals, working animals", 8.82]], null, [["speech", 21.7], ["music", 14.65], ["roar", 8.73]], [["speech", 24.02], ["fly, housefly", 23.68], ["insect", 11.74]], null, [["music", 50.82], ["speech", 12.57], ["groan", 11.49]]], "duration": [0.89, 0.61, 7.66, 8.91, 5.44, 0.62, 8.37, 2.2, 1.14, 18.86]} \ No newline at end of file diff --git a/annotations_1/n94um7eDILg_filtered.json b/annotations_1/n94um7eDILg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c5c9f721c7da72b3e967c80d0117b9d5e8045fe --- /dev/null +++ b/annotations_1/n94um7eDILg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.47], [13.0, 13.46], [15.0, 14.99], [16.0, 19.23], [21.0, 21.25], [22.0, 22.69], [25.0, 25.24], [26.0, 26.5], [39.0, 39.51], [42.0, 47.55], [59.0, 59.0], [61.0, 62.01], [63.0, 63.26], [69.0, 69.58], [71.0, 71.42], [72.0, 72.76], [79.0, 81.23], [84.0, 85.19], [86.0, 87.44], [88.0, 88.96], [90.0, 111.91], [114.0, 114.62]], "keep_status": [true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [32.77, 0.0, 0.0, 32.45, 0.0, 0.0, 0.0, 0.0, 0.0, 36.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.79, 0.0, 0.0, 0.0, 32.73, 0.0], "audiomae_on_audioset": [[["thump, thud", 17.92], ["rumble", 8.86], ["speech", 7.21]], null, null, [["fly, housefly", 28.36], ["insect", 13.81], ["wail, moan", 7.59]], null, null, null, null, null, [["speech", 29.41], ["groan", 18.11], ["grunt", 4.91]], null, null, null, null, null, null, [["music", 9.36], ["cattle, bovinae", 8.58], ["animal", 7.68]], null, null, null, [["music", 17.52], ["fly, housefly", 13.64], ["groan", 8.42]], null], "duration": [2.47, 0.46, -0.01, 3.23, 0.25, 0.69, 0.24, 0.5, 0.51, 5.55, 0.0, 1.01, 0.26, 0.58, 0.42, 0.76, 2.23, 1.19, 1.44, 0.96, 21.91, 0.62]} \ No newline at end of file diff --git a/annotations_1/n9hjsuaj448_filtered.json b/annotations_1/n9hjsuaj448_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/n9hjsuaj448_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/n9uVWlO0GAs_filtered.json b/annotations_1/n9uVWlO0GAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/n9uVWlO0GAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/nA1lAszNSoI_filtered.json b/annotations_1/nA1lAszNSoI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51943b0b231aad71a0802242060e85049886b769 --- /dev/null +++ b/annotations_1/nA1lAszNSoI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 41.13], [42.0, 67.95], [71.0, 78.54], [82.0, 92.94], [93.0, 139.78], [143.0, 154.03]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 29.84, 33.02, 30.21, 0.0, 39.83], "audiomae_on_audioset": [null, [["music", 29.07], ["hum", 21.54], ["throbbing", 17.39]], [["music", 57.28], ["hum", 16.1], ["throbbing", 6.34]], [["hum", 28.68], ["throbbing", 22.88], ["mains hum", 20.17]], null, [["music", 72.96], ["whale vocalization", 10.08], ["ambient music", 4.85]]], "duration": [40.13, 25.95, 7.54, 10.94, 46.78, 11.03]} \ No newline at end of file diff --git a/annotations_1/nAqJV2olXN0_filtered.json b/annotations_1/nAqJV2olXN0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b5bd6bb21d3f49e3f46e58828a6c639e0f1c636 --- /dev/null +++ b/annotations_1/nAqJV2olXN0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.92], [8.0, 9.22], [20.0, 20.12], [21.0, 37.57], [38.0, 38.89], [40.0, 40.8], [41.0, 42.06], [45.0, 46.6], [47.0, 65.04], [67.0, 74.92], [75.0, 75.91], [76.0, 76.86], [82.0, 84.03], [84.0, 85.97], [91.0, 93.88], [95.0, 100.9]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 43.66, 0.0, 0.0, 0.0, 0.0, 48.56, 50.56, 0.0, 0.0, 52.45, 0.0, 44.99, 67.38], "audiomae_on_audioset": [null, null, null, [["speech", 60.49], ["radio", 4.91], ["sidetone", 4.07]], null, null, null, null, [["music", 42.85], ["musical instrument", 7.27], ["guitar", 5.77]], null, null, null, null, null, [["music", 31.47], ["mains hum", 17.88], ["hum", 9.88]], null], "duration": [1.92, 1.22, 0.12, 16.57, 0.89, 0.8, 1.06, 1.6, 18.04, 7.92, 0.91, 0.86, 2.03, 1.97, 2.88, 5.9]} \ No newline at end of file diff --git a/annotations_1/nAuz36A1zG0_filtered.json b/annotations_1/nAuz36A1zG0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88cbce43057702c1cf0bebf02b34face076882d2 --- /dev/null +++ b/annotations_1/nAuz36A1zG0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.95], [14.0, 82.0], [87.0, 88.11]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [-0.05, 68.0, 1.11]} \ No newline at end of file diff --git a/annotations_1/nB9rg6sxHhU_filtered.json b/annotations_1/nB9rg6sxHhU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d8b1566c12ae64abd4bfc0afefd48aaf03bcb00 --- /dev/null +++ b/annotations_1/nB9rg6sxHhU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.53], [12.0, 11.77], [25.0, 25.57], [34.0, 34.91], [36.0, 40.2], [41.0, 42.82], [44.0, 50.21], [55.0, 57.08], [60.0, 61.84], [67.0, 68.84], [72.0, 73.53], [86.0, 86.46], [89.0, 91.2], [96.0, 98.27], [101.0, 103.0], [114.0, 115.72], [123.0, 124.46], [132.0, 131.99], [135.0, 135.84], [136.0, 140.68], [147.0, 148.27], [154.0, 170.51], [173.0, 175.02], [180.0, 182.01], [185.0, 186.63], [197.0, 199.03], [205.0, 207.6], [218.0, 218.62], [220.0, 222.4], [228.0, 232.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 91.13, 0.0, 33.67, 49.13, 0.0, 0.0, 0.0, 0.0, 40.06, 39.99, 40.24, 0.0, 0.0, 0.0, 0.0, 30.86, 0.0, 32.72, 39.54, 38.21, 0.0, 39.78, 30.99, 0.0, 31.98, 30.78], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 43.85], ["theremin", 34.95], ["guitar", 2.8]], [["music", 73.19], ["synthesizer", 3.81], ["musical instrument", 2.11]], null, null, null, null, [["music", 64.47], ["synthesizer", 5.85], ["middle eastern music", 1.65]], [["music", 62.48], ["flute", 5.97], ["carnatic music", 5.12]], [["music", 59.43], ["didgeridoo", 7.15], ["synthesizer", 5.07]], null, null, null, null, [["music", 68.82], ["singing", 2.94], ["swing music", 2.28]], null, [["music", 84.87], ["synthesizer", 0.98], ["keyboard (musical)", 0.8]], [["music", 68.34], ["singing", 3.11], ["musical instrument", 2.38]], [["music", 69.74], ["theremin", 5.46], ["middle eastern music", 2.34]], null, [["music", 30.76], ["double bass", 14.95], ["cello", 10.41]], [["music", 74.35], ["soundtrack music", 2.01], ["sampler", 1.7]], null, [["music", 74.53], ["musical instrument", 3.86], ["synthesizer", 3.58]], [["music", 74.73], ["didgeridoo", 2.45], ["electronic music", 2.05]]], "duration": [1.53, -0.23, 0.57, 0.91, 4.2, 1.82, 6.21, 2.08, 1.84, 1.84, 1.53, 0.46, 2.2, 2.27, 2.0, 1.72, 1.46, -0.01, 0.84, 4.68, 1.27, 16.51, 2.02, 2.01, 1.63, 2.03, 2.6, 0.62, 2.4, 4.06]} \ No newline at end of file diff --git a/annotations_1/nBZ39gX_FlU_filtered.json b/annotations_1/nBZ39gX_FlU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72e28de9204556d8c374c56503c6ace77417876f --- /dev/null +++ b/annotations_1/nBZ39gX_FlU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 22.86], [25.0, 32.27], [33.0, 57.7], [61.0, 91.02], [92.0, 93.61], [95.0, 95.35], [96.0, 96.79], [98.0, 99.64], [103.0, 104.85], [109.0, 116.94], [120.0, 122.77], [134.0, 137.27], [138.0, 142.13], [143.0, 143.82]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, false, false], "silence_prob": [33.14, 30.67, 32.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.5, 32.06, 31.89, 31.75, 0.0], "audiomae_on_audioset": [[["throbbing", 34.52], ["music", 30.14], ["hum", 17.66]], [["hum", 30.56], ["mains hum", 27.63], ["music", 11.88]], [["music", 47.31], ["throbbing", 27.52], ["hum", 10.62]], null, null, null, null, null, null, [["fly, housefly", 34.26], ["mosquito", 9.05], ["insect", 8.53]], [["gong", 20.96], ["music", 19.61], ["sonar", 8.44]], [["moo", 21.9], ["cattle, bovinae", 12.62], ["livestock, farm animals, working animals", 12.05]], [["speech", 34.0], ["hum", 23.24], ["music", 14.7]], null], "duration": [15.86, 7.27, 24.7, 30.02, 1.61, 0.35, 0.79, 1.64, 1.85, 7.94, 2.77, 3.27, 4.13, 0.82]} \ No newline at end of file diff --git a/annotations_1/nBsxbjTIJxs_filtered.json b/annotations_1/nBsxbjTIJxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a20138b5dface444a734105c196a610d78016f8 --- /dev/null +++ b/annotations_1/nBsxbjTIJxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.23], [6.0, 6.03], [9.0, 9.14], [20.0, 20.49], [21.0, 23.45], [26.0, 26.69], [29.0, 29.19], [34.0, 35.8], [46.0, 46.97], [48.0, 48.49], [52.0, 52.79], [54.0, 54.21], [56.0, 56.69], [69.0, 69.96], [87.0, 89.63], [90.0, 90.9], [91.0, 92.33], [95.0, 95.05], [101.0, 101.21], [102.0, 102.81], [105.0, 105.76], [113.0, 113.58], [118.0, 118.59], [127.0, 127.36], [133.0, 133.61], [147.0, 148.07], [149.0, 149.54], [153.0, 152.88], [155.0, 155.95], [158.0, 158.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 0.03, 0.14, 0.49, 2.45, 0.69, 0.19, 1.8, 0.97, 0.49, 0.79, 0.21, 0.69, 0.96, 2.63, 0.9, 1.33, 0.05, 0.21, 0.81, 0.76, 0.58, 0.59, 0.36, 0.61, 1.07, 0.54, -0.12, 0.95, 0.19]} \ No newline at end of file diff --git a/annotations_1/nCWBxPh4dGo_filtered.json b/annotations_1/nCWBxPh4dGo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95b447f18cacead1d4f83505d7b7932c3f733aac --- /dev/null +++ b/annotations_1/nCWBxPh4dGo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.01], [12.0, 25.47], [28.0, 70.87], [73.0, 73.25], [76.0, 80.84], [83.0, 83.66], [85.0, 86.51], [87.0, 104.75], [108.0, 115.67], [119.0, 154.55], [156.0, 158.89], [161.0, 161.13], [165.0, 166.72]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.55, 29.24, 0.0, 0.0, 30.88, 0.0, 0.0, 31.53, 28.92, 0.0, 29.74, 0.0, 0.0], "audiomae_on_audioset": [[["music", 48.89], ["speech", 28.0], ["electronic music", 1.83]], [["music", 30.02], ["speech", 5.95], ["groan", 5.49]], null, null, [["music", 36.22], ["speech", 33.74], ["boing", 10.64]], null, null, [["music", 45.68], ["synthesizer", 22.72], ["keyboard (musical)", 3.54]], [["music", 87.88], ["musical instrument", 1.43], ["rock and roll", 0.75]], null, [["music", 73.54], ["boing", 2.7], ["electronic music", 1.66]], null, null], "duration": [3.01, 13.47, 42.87, 0.25, 4.84, 0.66, 1.51, 17.75, 7.67, 35.55, 2.89, 0.13, 1.72]} \ No newline at end of file diff --git a/annotations_1/nD6DMtXc3mY_filtered.json b/annotations_1/nD6DMtXc3mY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91825cc40c66c563bd230d6d2a66b1639e10434b --- /dev/null +++ b/annotations_1/nD6DMtXc3mY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.39], [9.0, 10.52], [16.0, 16.71], [20.0, 21.59], [22.0, 113.95], [120.0, 120.28], [122.0, 122.93], [123.0, 125.2], [132.0, 133.84], [137.0, 147.51], [149.0, 150.11], [151.0, 158.89], [160.0, 171.64]], "keep_status": [true, false, false, false, false, false, false, true, false, true, false, true, true], "silence_prob": [36.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.22, 0.0, 38.22, 0.0, 30.7, 30.85], "audiomae_on_audioset": [[["music", 33.75], ["hum", 15.33], ["speech", 14.24]], null, null, null, null, null, null, [["music", 53.78], ["didgeridoo", 10.98], ["hum", 4.89]], null, [["music", 31.47], ["didgeridoo", 15.42], ["hum", 14.05]], null, [["whale vocalization", 20.43], ["mains hum", 11.02], ["hum", 9.77]], [["music", 44.13], ["hum", 13.2], ["electronic music", 7.58]]], "duration": [2.39, 1.52, 0.71, 1.59, 91.95, 0.28, 0.93, 2.2, 1.84, 10.51, 1.11, 7.89, 11.64]} \ No newline at end of file diff --git a/annotations_1/nEGbOGGiENU_filtered.json b/annotations_1/nEGbOGGiENU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..994f76b985006f423ca0ad8555c82037c1209047 --- /dev/null +++ b/annotations_1/nEGbOGGiENU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.79], [22.0, 22.25], [23.0, 28.07], [28.0, 29.07], [31.0, 39.61], [40.0, 40.61], [50.0, 51.43], [52.0, 64.76], [65.0, 66.92], [70.0, 84.16], [87.0, 87.12], [95.0, 116.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.6, 0.0, 30.13, 0.0, 0.0, 30.14, 0.0, 29.84, 0.0, 30.14], "audiomae_on_audioset": [null, null, [["music", 41.67], ["speech", 40.76], ["synthesizer", 4.18]], null, [["music", 68.56], ["vehicle", 5.38], ["car", 4.84]], null, null, [["music", 77.14], ["synthesizer", 2.54], ["cacophony", 1.58]], null, [["music", 59.07], ["synthesizer", 7.05], ["throbbing", 4.81]], null, [["music", 49.37], ["car", 13.96], ["vehicle", 8.88]]], "duration": [1.79, 0.25, 5.07, 1.07, 8.61, 0.61, 1.43, 12.76, 1.92, 14.16, 0.12, 21.01]} \ No newline at end of file diff --git a/annotations_1/nEf2ML7wkBE_filtered.json b/annotations_1/nEf2ML7wkBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90023259a86b7f3f6acd514c091d6a1df3441860 --- /dev/null +++ b/annotations_1/nEf2ML7wkBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.39], [15.0, 15.92], [33.0, 33.76], [37.0, 37.72], [50.0, 51.02], [94.0, 94.81], [116.0, 115.75]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.39, 0.92, 0.76, 0.72, 1.02, 0.81, -0.25]} \ No newline at end of file diff --git a/annotations_1/nF74obZFKp8_filtered.json b/annotations_1/nF74obZFKp8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72cc6c82e83e8c3bcbb1835816962a657d594866 --- /dev/null +++ b/annotations_1/nF74obZFKp8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 22.92], [29.0, 35.31], [42.0, 96.85], [100.0, 109.63], [115.0, 140.78], [143.0, 149.82], [151.0, 161.5], [162.0, 165.11], [167.0, 167.49], [170.0, 171.17]], "keep_status": [false, false, false, false, true, false, false, true, false, false], "silence_prob": [28.83, 28.33, 0.0, 28.4, 28.35, 28.56, 28.63, 29.14, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.32], ["throbbing", 31.41], ["hum", 11.14]], [["music", 70.86], ["speech", 13.16], ["throbbing", 3.86]], null, [["music", 61.88], ["throbbing", 12.33], ["hum", 9.42]], [["music", 24.31], ["speech", 14.61], ["vehicle", 5.77]], [["music", 32.93], ["speech", 32.39], ["hum", 6.63]], [["music", 34.5], ["hum", 30.07], ["mains hum", 18.57]], [["music", 48.48], ["hum", 9.69], ["mains hum", 6.01]], null, null], "duration": [16.92, 6.31, 54.85, 9.63, 25.78, 6.82, 10.5, 3.11, 0.49, 1.17]} \ No newline at end of file diff --git a/annotations_1/nGx3WY944DU_filtered.json b/annotations_1/nGx3WY944DU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..beb4144a7279cc9f9965cb26f402e980eb01edd9 --- /dev/null +++ b/annotations_1/nGx3WY944DU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.0], [8.0, 7.84], [12.0, 11.79], [15.0, 18.64], [19.0, 21.02], [22.0, 24.36], [26.0, 40.53], [42.0, 44.66], [50.0, 50.57], [53.0, 54.5], [58.0, 65.35], [67.0, 68.89], [73.0, 80.49], [87.0, 88.72], [90.0, 101.75], [107.0, 108.63], [110.0, 110.69], [112.0, 112.72], [117.0, 117.19], [118.0, 120.48], [122.0, 122.22], [127.0, 127.3], [130.0, 131.04], [132.0, 131.65], [135.0, 135.41], [136.0, 136.76], [140.0, 149.67], [152.0, 152.05], [157.0, 160.91], [162.0, 162.35]], "keep_status": [false, false, false, false, true, false, true, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [56.1, 0.0, 0.0, 37.97, 49.92, 55.89, 38.15, 30.41, 0.0, 0.0, 35.06, 0.0, 35.72, 0.0, 32.3, 0.0, 0.0, 0.0, 0.0, 31.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.97, 0.0, 38.95, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 66.64], ["gong", 16.85], ["electronic music", 3.41]], [["speech", 42.63], ["music", 9.99], ["singing bowl", 6.59]], null, [["music", 51.55], ["hum", 9.59], ["electronic music", 7.21]], [["music", 16.3], ["mosquito", 11.33], ["fly, housefly", 5.44]], null, null, [["speech", 70.37], ["hum", 6.22], ["music", 6.12]], null, [["sheep", 20.03], ["bleat", 12.71], ["speech", 11.84]], null, [["speech", 37.46], ["music", 17.41], ["throbbing", 8.07]], null, null, null, null, [["moo", 40.3], ["cattle, bovinae", 26.82], ["speech", 6.41]], null, null, null, null, null, null, [["crying, sobbing", 26.34], ["whimper", 23.33], ["speech", 14.21]], null, [["moo", 29.32], ["cattle, bovinae", 28.49], ["whale vocalization", 21.38]], null], "duration": [2.0, -0.16, -0.21, 3.64, 2.02, 2.36, 14.53, 2.66, 0.57, 1.5, 7.35, 1.89, 7.49, 1.72, 11.75, 1.63, 0.69, 0.72, 0.19, 2.48, 0.22, 0.3, 1.04, -0.35, 0.41, 0.76, 9.67, 0.05, 3.91, 0.35]} \ No newline at end of file diff --git a/annotations_1/nHcRQhadzhY_filtered.json b/annotations_1/nHcRQhadzhY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0dcaa5d93c4970be2a5fd99857e7a94536886de --- /dev/null +++ b/annotations_1/nHcRQhadzhY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.23], [19.0, 19.68], [21.0, 29.64], [39.0, 40.37], [44.0, 46.5], [59.0, 64.03], [69.0, 78.31], [82.0, 94.37], [95.0, 98.63], [104.0, 125.69], [134.0, 136.95], [147.0, 154.01], [157.0, 157.32], [159.0, 159.83], [162.0, 161.91], [163.0, 163.34], [164.0, 166.68], [169.0, 169.21], [176.0, 192.77], [199.0, 199.15], [201.0, 205.58], [211.0, 211.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [32.12, 0.0, 30.36, 0.0, 31.38, 30.34, 31.35, 31.1, 30.76, 30.48, 29.62, 31.49, 0.0, 0.0, 0.0, 0.0, 38.0, 0.0, 30.02, 0.0, 29.32, 0.0], "audiomae_on_audioset": [[["music", 74.65], ["musical instrument", 4.0], ["guitar", 3.21]], null, [["music", 49.51], ["speech", 27.44], ["rattle (instrument)", 2.32]], null, [["music", 64.87], ["speech", 7.49], ["techno", 3.73]], [["music", 75.23], ["speech", 6.0], ["boing", 2.44]], [["music", 54.45], ["speech", 29.32], ["didgeridoo", 1.77]], [["music", 84.51], ["musical instrument", 2.54], ["speech", 0.88]], [["music", 70.02], ["speech", 11.75], ["electronic music", 2.33]], [["music", 63.23], ["speech", 8.57], ["boing", 2.75]], [["music", 77.45], ["speech", 3.53], ["musical instrument", 1.74]], [["music", 71.45], ["speech", 3.64], ["boing", 3.15]], null, null, null, null, [["speech", 38.35], ["music", 12.04], ["fly, housefly", 10.37]], null, [["music", 65.63], ["throbbing", 5.79], ["cacophony", 3.86]], null, [["music", 29.32], ["hum", 21.97], ["throbbing", 19.42]], null], "duration": [3.23, 0.68, 8.64, 1.37, 2.5, 5.03, 9.31, 12.37, 3.63, 21.69, 2.95, 7.01, 0.32, 0.83, -0.09, 0.34, 2.68, 0.21, 16.77, 0.15, 4.58, 0.94]} \ No newline at end of file diff --git a/annotations_1/nI6agjxMa2s_filtered.json b/annotations_1/nI6agjxMa2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b23b4336f92de1fee35dfc95d11c0a27d0cc9e7 --- /dev/null +++ b/annotations_1/nI6agjxMa2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 18.45], [19.0, 25.59], [30.0, 34.3], [35.0, 56.2], [56.0, 77.21], [78.0, 90.05]], "keep_status": [true, true, true, true, false, false], "silence_prob": [30.95, 30.92, 30.49, 29.63, 29.61, 29.16], "audiomae_on_audioset": [[["speech", 29.48], ["music", 20.67], ["hum", 13.76]], [["music", 44.4], ["trombone", 10.13], ["brass instrument", 9.9]], [["mains hum", 22.71], ["music", 22.65], ["hum", 20.08]], [["music", 24.63], ["speech", 23.34], ["buzz", 10.45]], [["buzz", 56.22], ["music", 16.27], ["fly, housefly", 2.12]], [["speech", 55.78], ["vehicle", 13.83], ["music", 3.38]]], "duration": [5.45, 6.59, 4.3, 21.2, 21.21, 12.05]} \ No newline at end of file diff --git a/annotations_1/nIW73heJdg4_filtered.json b/annotations_1/nIW73heJdg4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8051f577be77b9fd3da4f61214bee348f4d98c93 --- /dev/null +++ b/annotations_1/nIW73heJdg4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.52], [11.0, 12.85], [14.0, 14.34], [48.0, 48.71], [52.0, 53.03], [56.0, 56.17], [65.0, 83.35], [87.0, 131.65]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.39, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["whack, thwack", 31.46], ["whip", 30.2], ["speech", 10.11]], null], "duration": [0.52, 1.85, 0.34, 0.71, 1.03, 0.17, 18.35, 44.65]} \ No newline at end of file diff --git a/annotations_1/nJ1hrmVHUJg_filtered.json b/annotations_1/nJ1hrmVHUJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8227657ec4713ab248e62aecf061e607d2cf4ca --- /dev/null +++ b/annotations_1/nJ1hrmVHUJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.75], [15.0, 15.16], [16.0, 16.65], [19.0, 19.16], [24.0, 25.2], [31.0, 36.37], [39.0, 39.06], [40.0, 40.39], [41.0, 47.12], [56.0, 57.81], [65.0, 64.83], [66.0, 66.85], [69.0, 69.87], [75.0, 89.8], [91.0, 91.45], [94.0, 94.68], [98.0, 97.77], [99.0, 109.8], [115.0, 146.92]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.02, 0.0, 0.0, 38.1, 0.0, 0.0, 0.0, 0.0, 30.22, 0.0, 0.0, 0.0, 29.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 26.66], ["speech", 16.86], ["air horn, truck horn", 4.03]], null, null, [["fly, housefly", 24.8], ["speech", 24.72], ["bee, wasp, etc.", 17.51]], null, null, null, null, [["music", 57.49], ["theremin", 11.66], ["didgeridoo", 6.61]], null, null, null, [["speech", 40.51], ["music", 9.96], ["animal", 7.09]], null], "duration": [0.75, 0.16, 0.65, 0.16, 1.2, 5.37, 0.06, 0.39, 6.12, 1.81, -0.17, 0.85, 0.87, 14.8, 0.45, 0.68, -0.23, 10.8, 31.92]} \ No newline at end of file diff --git a/annotations_1/nJwGWiuonws_filtered.json b/annotations_1/nJwGWiuonws_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52c6e5c37c2963e867232f67312569bfe8b43627 --- /dev/null +++ b/annotations_1/nJwGWiuonws_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.97], [3.0, 5.7], [14.0, 15.15], [16.0, 19.35], [20.0, 20.49], [23.0, 23.48], [28.0, 30.4], [31.0, 31.8], [36.0, 36.19], [39.0, 39.18], [41.0, 42.26], [44.0, 46.06], [47.0, 47.56], [48.0, 48.51], [50.0, 51.26], [54.0, 55.32], [58.0, 58.67], [67.0, 67.37], [83.0, 84.2], [88.0, 88.53], [89.0, 90.85], [92.0, 91.77], [93.0, 93.77], [99.0, 99.39], [101.0, 101.38], [104.0, 104.38], [106.0, 107.2], [116.0, 116.21], [119.0, 119.38], [121.0, 122.35], [123.0, 123.5], [130.0, 132.65], [142.0, 142.47], [144.0, 144.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 67.13, 0.0, 96.77, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.03, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.03, 2.7, 1.15, 3.35, 0.49, 0.48, 2.4, 0.8, 0.19, 0.18, 1.26, 2.06, 0.56, 0.51, 1.26, 1.32, 0.67, 0.37, 1.2, 0.53, 1.85, -0.23, 0.77, 0.39, 0.38, 0.38, 1.2, 0.21, 0.38, 1.35, 0.5, 2.65, 0.47, 0.59]} \ No newline at end of file diff --git a/annotations_1/nKDUDF3cgRA_filtered.json b/annotations_1/nKDUDF3cgRA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..40da527b4a3b15d44762547a6a567995c137a3ac --- /dev/null +++ b/annotations_1/nKDUDF3cgRA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.51], [6.0, 8.9], [11.0, 10.93], [12.0, 28.27], [29.0, 30.4], [31.0, 59.75], [61.0, 83.34], [85.0, 90.95], [92.0, 92.42], [93.0, 94.0], [95.0, 122.08], [123.0, 128.7]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 36.78, 0.0, 43.05, 0.0, 43.33, 41.05, 33.55, 0.0, 0.0, 38.72, 58.22], "audiomae_on_audioset": [null, [["speech", 85.2], ["animal", 1.42], ["electric shaver, electric razor", 1.34]], null, [["speech", 76.55], ["electric shaver, electric razor", 4.85], ["telephone", 3.68]], null, [["music", 37.97], ["speech", 10.21], ["fly, housefly", 4.01]], [["music", 48.04], ["speech", 17.33], ["musical instrument", 6.8]], [["music", 42.46], ["musical instrument", 11.78], ["speech", 8.9]], null, null, [["speech", 82.97], ["beatboxing", 5.88], ["music", 2.71]], null], "duration": [1.51, 2.9, -0.07, 16.27, 1.4, 28.75, 22.34, 5.95, 0.42, 1.0, 27.08, 5.7]} \ No newline at end of file diff --git a/annotations_1/nKISdYhQcvw_filtered.json b/annotations_1/nKISdYhQcvw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77960fe55feb524b12114c1f014fbb4b3bc11e30 --- /dev/null +++ b/annotations_1/nKISdYhQcvw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 23.57], [30.0, 30.59], [31.0, 30.89], [32.0, 32.61], [35.0, 35.82], [36.0, 35.94], [36.0, 53.49], [58.0, 67.98], [69.0, 69.65], [70.0, 136.39], [138.0, 143.82]], "keep_status": [false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [30.49, 0.0, 0.0, 0.0, 0.0, 0.0, 30.64, 32.3, 0.0, 0.0, 34.71], "audiomae_on_audioset": [[["cattle, bovinae", 49.56], ["moo", 28.12], ["livestock, farm animals, working animals", 11.24]], null, null, null, null, null, [["speech", 21.57], ["whack, thwack", 16.05], ["groan", 7.85]], [["whack, thwack", 8.07], ["fart", 6.94], ["speech", 6.83]], null, null, [["grunt", 26.36], ["music", 13.89], ["groan", 9.57]]], "duration": [15.57, 0.59, -0.11, 0.61, 0.82, -0.06, 17.49, 9.98, 0.65, 66.39, 5.82]} \ No newline at end of file diff --git a/annotations_1/nKuJ6UvlGek_filtered.json b/annotations_1/nKuJ6UvlGek_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f8408ae01f7e2627fda8779225e3dd7e9a051cd --- /dev/null +++ b/annotations_1/nKuJ6UvlGek_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.42], [32.0, 32.17], [33.0, 33.86], [40.0, 47.61], [48.0, 51.68], [53.0, 52.96], [56.0, 56.25], [57.0, 58.16], [59.0, 59.53], [61.0, 61.26], [62.0, 64.29], [66.0, 66.72], [68.0, 68.47], [70.0, 70.88], [73.0, 74.49], [76.0, 79.96], [84.0, 86.02], [89.0, 90.53], [93.0, 95.77], [97.0, 97.87], [103.0, 103.76], [116.0, 117.0]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.4, 0.0, 0.0, 32.97, 34.53, 0.0, 0.0, 0.0, 0.0, 0.0, 45.46, 0.0, 0.0, 0.0, 0.0, 34.55, 33.45, 0.0, 33.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 71.88], ["didgeridoo", 6.04], ["musical instrument", 4.85]], null, null, [["noise", 32.15], ["hum", 22.87], ["speech", 11.72]], [["whale vocalization", 40.69], ["sidetone", 17.7], ["speech", 12.51]], null, null, null, null, null, [["mains hum", 40.2], ["hum", 18.66], ["music", 9.16]], null, null, null, null, [["mains hum", 43.94], ["hum", 18.32], ["music", 10.14]], [["theremin", 44.81], ["music", 24.2], ["didgeridoo", 5.63]], null, [["music", 52.24], ["gong", 12.24], ["vehicle", 8.46]], null, null, null], "duration": [3.42, 0.17, 0.86, 7.61, 3.68, -0.04, 0.25, 1.16, 0.53, 0.26, 2.29, 0.72, 0.47, 0.88, 1.49, 3.96, 2.02, 1.53, 2.77, 0.87, 0.76, 1.0]} \ No newline at end of file diff --git a/annotations_1/nL3o4MGY9NQ_filtered.json b/annotations_1/nL3o4MGY9NQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83b3d4efdb9740c3606e2ba40f5b5eb8ebf4db57 --- /dev/null +++ b/annotations_1/nL3o4MGY9NQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 31.23], [32.0, 36.96], [37.0, 37.08], [37.0, 42.28], [43.0, 58.35], [60.0, 125.52], [127.0, 130.11], [131.0, 146.16], [147.0, 153.44], [154.0, 163.46], [164.0, 165.21], [166.0, 166.9]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [72.01, 79.41, 0.0, 79.24, 89.19, 0.0, 99.71, 93.6, 82.79, 42.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 22.14], ["whale vocalization", 18.67], ["theremin", 8.72]], null, null], "duration": [4.23, 4.96, 0.08, 5.28, 15.35, 65.52, 3.11, 15.16, 6.44, 9.46, 1.21, 0.9]} \ No newline at end of file diff --git a/annotations_1/nLDgcHxJ4Sc_filtered.json b/annotations_1/nLDgcHxJ4Sc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bddb039b035b5c63ca6d7098d7e8540ab911f48c --- /dev/null +++ b/annotations_1/nLDgcHxJ4Sc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.34], [7.0, 7.7], [9.0, 9.05], [13.0, 13.8], [15.0, 15.13], [15.0, 16.26], [17.0, 18.71], [20.0, 20.61], [23.0, 25.68], [27.0, 31.29], [33.0, 34.11], [35.0, 37.35], [39.0, 39.99], [41.0, 44.59], [49.0, 57.16], [60.0, 61.25], [63.0, 63.49], [66.0, 66.7], [69.0, 69.96], [80.0, 81.24], [84.0, 90.88], [91.0, 90.91], [93.0, 92.92], [95.0, 97.95], [99.0, 99.93], [101.0, 101.66], [105.0, 105.73], [107.0, 107.7], [109.0, 110.32], [113.0, 113.88], [116.0, 118.74], [126.0, 131.82], [133.0, 141.45], [145.0, 146.03], [149.0, 150.89], [152.0, 151.97], [152.0, 154.04], [155.0, 165.45], [167.0, 167.75], [169.0, 169.69], [172.0, 174.61], [176.0, 177.67], [179.0, 182.38], [183.0, 186.65], [187.0, 194.12], [195.0, 196.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.16, 96.42, 0.0, 97.73, 0.0, 98.86, 68.93, 0.0, 0.0, 0.0, 0.0, 0.0, 61.57, 0.0, 0.0, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.13, 83.88, 99.92, 0.0, 0.0, 0.0, 49.54, 47.54, 0.0, 0.0, 95.78, 0.0, 47.62, 99.91, 99.62, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.76], ["fly, housefly", 15.43], ["insect", 8.5]], [["speech", 34.32], ["grunt", 23.84], ["cattle, bovinae", 6.2]], null, null, null, null, [["speech", 76.11], ["sidetone", 9.98], ["dial tone", 2.7]], null, null, null], "duration": [0.34, 0.7, 0.05, 0.8, 0.13, 1.26, 1.71, 0.61, 2.68, 4.29, 1.11, 2.35, 0.99, 3.59, 8.16, 1.25, 0.49, 0.7, 0.96, 1.24, 6.88, -0.09, -0.08, 2.95, 0.93, 0.66, 0.73, 0.7, 1.32, 0.88, 2.74, 5.82, 8.45, 1.03, 1.89, -0.03, 2.04, 10.45, 0.75, 0.69, 2.61, 1.67, 3.38, 3.65, 7.12, 1.25]} \ No newline at end of file diff --git a/annotations_1/nLMkSN2F2xs_filtered.json b/annotations_1/nLMkSN2F2xs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6fa0528ff6e4ea573c25ccf3110c630e961e0311 --- /dev/null +++ b/annotations_1/nLMkSN2F2xs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.58], [33.0, 93.21], [94.0, 106.47], [108.0, 108.09], [109.0, 118.93], [124.0, 133.74], [140.0, 142.26]], "keep_status": [false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 28.88, 0.0, 28.96, 28.05, 40.41], "audiomae_on_audioset": [null, null, [["speech", 52.67], ["music", 9.98], ["buzz", 9.19]], null, [["speech", 57.09], ["music", 12.49], ["knock", 3.86]], [["speech", 45.12], ["music", 10.07], ["electric shaver, electric razor", 9.26]], [["frog", 26.57], ["croak", 12.88], ["hiccup", 9.24]]], "duration": [1.58, 60.21, 12.47, 0.09, 9.93, 9.74, 2.26]} \ No newline at end of file diff --git a/annotations_1/nLkmfL6IVQs_filtered.json b/annotations_1/nLkmfL6IVQs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0795a601f02be2e5b450cf6a3a74b4464df71a93 --- /dev/null +++ b/annotations_1/nLkmfL6IVQs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.67], [5.0, 11.15], [16.0, 18.42], [20.0, 22.67], [23.0, 24.31], [26.0, 29.15], [33.0, 35.36], [38.0, 38.87], [41.0, 41.5], [48.0, 48.3], [48.0, 49.4], [53.0, 57.18], [77.0, 79.62], [80.0, 84.25], [91.0, 93.39], [100.0, 101.02], [108.0, 109.32], [116.0, 117.85], [130.0, 130.18], [134.0, 136.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 56.03, 66.27, 74.92, 0.0, 83.7, 56.7, 0.0, 0.0, 0.0, 0.0, 30.34, 29.31, 28.89, 30.01, 0.0, 0.0, 0.0, 0.0, 30.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 35.35], ["cattle, bovinae", 11.49], ["moo", 7.83]], [["music", 33.44], ["skateboard", 21.31], ["cattle, bovinae", 7.79]], [["cattle, bovinae", 38.75], ["moo", 37.55], ["livestock, farm animals, working animals", 8.78]], [["music", 57.31], ["moo", 3.23], ["cattle, bovinae", 3.11]], null, null, null, null, [["music", 63.91], ["hum", 6.5], ["throbbing", 3.24]]], "duration": [1.67, 6.15, 2.42, 2.67, 1.31, 3.15, 2.36, 0.87, 0.5, 0.3, 1.4, 4.18, 2.62, 4.25, 2.39, 1.02, 1.32, 1.85, 0.18, 2.22]} \ No newline at end of file diff --git a/annotations_1/nM0h6QXTpHQ_filtered.json b/annotations_1/nM0h6QXTpHQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b54726c66239eaea329096588b096c3a44139922 --- /dev/null +++ b/annotations_1/nM0h6QXTpHQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [9.0, 9.54], [10.0, 11.4], [12.0, 12.46], [16.0, 16.63], [20.0, 20.68], [21.0, 21.57], [23.0, 24.24], [25.0, 35.24], [35.0, 36.66], [38.0, 38.74], [40.0, 46.31], [47.0, 47.8], [50.0, 51.39], [52.0, 52.02], [52.0, 53.43], [54.0, 54.53], [55.0, 56.32], [63.0, 63.37], [64.0, 70.17], [70.0, 71.07], [72.0, 72.55], [73.0, 76.72], [77.0, 77.6], [81.0, 81.36], [86.0, 86.12], [87.0, 88.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 0.54, 1.4, 0.46, 0.63, 0.68, 0.57, 1.24, 10.24, 1.66, 0.74, 6.31, 0.8, 1.39, 0.02, 1.43, 0.53, 1.32, 0.37, 6.17, 1.07, 0.55, 3.72, 0.6, 0.36, 0.12, 1.5]} \ No newline at end of file diff --git a/annotations_1/nNGz1GspkbM_filtered.json b/annotations_1/nNGz1GspkbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7792c84b06795d4caf50f95aed3fbc50baa335fd --- /dev/null +++ b/annotations_1/nNGz1GspkbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[65.0, 75.74], [77.0, 77.65], [81.0, 83.02], [85.0, 85.23], [87.0, 87.67], [89.0, 138.27], [138.0, 143.51], [150.0, 215.86]], "keep_status": [true, false, true, false, false, false, true, false], "silence_prob": [28.42, 0.0, 29.49, 0.0, 0.0, 0.0, 29.05, 0.0], "audiomae_on_audioset": [[["hum", 40.58], ["mains hum", 16.53], ["throbbing", 7.97]], null, [["music", 42.59], ["hum", 10.6], ["electronic music", 8.88]], null, null, null, [["speech", 22.14], ["whale vocalization", 15.89], ["hum", 12.13]], null], "duration": [10.74, 0.65, 2.02, 0.23, 0.67, 49.27, 5.51, 65.86]} \ No newline at end of file diff --git a/annotations_1/nO7qxQsQK44_filtered.json b/annotations_1/nO7qxQsQK44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5b67b79a44d34333f8bfb40ec225651c3fdf443 --- /dev/null +++ b/annotations_1/nO7qxQsQK44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.55], [6.0, 7.47], [8.0, 14.59], [15.0, 16.14], [17.0, 20.87], [21.0, 21.95], [22.0, 24.75], [28.0, 28.39], [46.0, 48.37], [49.0, 55.76], [56.0, 57.89], [59.0, 59.14], [60.0, 60.12], [61.0, 61.43], [61.0, 61.52], [62.0, 62.53], [63.0, 63.22], [65.0, 75.2], [76.0, 77.62], [83.0, 83.64], [85.0, 87.02], [89.0, 89.19], [90.0, 93.18], [94.0, 94.15], [98.0, 104.19], [104.0, 104.85], [107.0, 107.28], [108.0, 109.49], [116.0, 115.97], [119.0, 127.89], [130.0, 133.46], [134.0, 137.91], [140.0, 140.07], [144.0, 144.21], [145.0, 145.83], [149.0, 149.59], [154.0, 153.91], [155.0, 156.03], [160.0, 161.67], [162.0, 162.95]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.78, 0.0, 72.75, 0.0, 50.61, 0.0, 98.59, 55.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.86, 0.0, 0.0, 97.33, 0.0, 35.54, 0.0, 41.78, 0.0, 0.0, 0.0, 0.0, 88.1, 98.73, 92.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 17.1], ["stomach rumble", 14.57], ["hum", 13.37]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 61.35], ["hum", 9.88], ["mains hum", 3.79]], null, null, null, null, [["speech", 29.38], ["beatboxing", 8.74], ["radio", 6.32]], null, [["speech", 89.14], ["radio", 6.24], ["inside, small room", 0.65]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.55, 1.47, 6.59, 1.14, 3.87, 0.95, 2.75, 0.39, 2.37, 6.76, 1.89, 0.14, 0.12, 0.43, 0.52, 0.53, 0.22, 10.2, 1.62, 0.64, 2.02, 0.19, 3.18, 0.15, 6.19, 0.85, 0.28, 1.49, -0.03, 8.89, 3.46, 3.91, 0.07, 0.21, 0.83, 0.59, -0.09, 1.03, 1.67, 0.95]} \ No newline at end of file diff --git a/annotations_1/nP-P4IYLJWY_filtered.json b/annotations_1/nP-P4IYLJWY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e91933dbd275829bca7bad32bbf134b2772f49e --- /dev/null +++ b/annotations_1/nP-P4IYLJWY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.17], [23.0, 40.69], [42.0, 47.73], [49.0, 55.32], [56.0, 73.48], [78.0, 91.64], [94.0, 109.85], [112.0, 125.17], [129.0, 137.88], [140.0, 142.15], [143.0, 143.67], [145.0, 163.43], [166.0, 166.43]], "keep_status": [true, false, false, true, false, false, true, false, true, true, false, true, false], "silence_prob": [29.19, 28.46, 29.07, 28.63, 28.57, 28.91, 28.82, 28.51, 28.63, 30.78, 0.0, 28.64, 0.0], "audiomae_on_audioset": [[["music", 48.64], ["throbbing", 9.59], ["hum", 6.68]], [["music", 74.37], ["cacophony", 3.02], ["throbbing", 2.58]], [["music", 37.57], ["throbbing", 25.76], ["hum", 12.45]], [["sound effect", 17.76], ["music", 17.22], ["hum", 9.93]], [["speech", 62.1], ["music", 19.87], ["hum", 3.02]], [["music", 63.99], ["electronic music", 6.1], ["didgeridoo", 3.54]], [["buzz", 29.13], ["music", 19.13], ["hum", 9.53]], [["speech", 48.91], ["music", 21.64], ["mains hum", 12.35]], [["music", 28.27], ["hum", 20.08], ["throbbing", 17.23]], [["music", 48.57], ["cacophony", 16.12], ["mains hum", 4.47]], null, [["music", 29.41], ["hum", 17.53], ["speech", 16.94]], null], "duration": [5.17, 17.69, 5.73, 6.32, 17.48, 13.64, 15.85, 13.17, 8.88, 2.15, 0.67, 18.43, 0.43]} \ No newline at end of file diff --git a/annotations_1/nPJFSx8RTzo_filtered.json b/annotations_1/nPJFSx8RTzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..470d7927e721a6a2b3843ec1a81d167094aad054 --- /dev/null +++ b/annotations_1/nPJFSx8RTzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.99], [6.0, 6.24], [14.0, 14.27], [19.0, 20.41], [22.0, 22.23], [24.0, 26.22], [30.0, 31.38], [32.0, 32.83], [35.0, 35.97], [40.0, 39.85], [41.0, 41.27], [48.0, 53.16], [54.0, 59.75], [62.0, 67.47], [71.0, 71.71], [76.0, 76.11], [77.0, 77.73], [78.0, 80.87], [83.0, 83.32], [85.0, 86.54], [87.0, 86.88]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.47, 0.0, 0.0, 0.0, 0.0, 0.0, 43.35, 34.28, 36.9, 0.0, 0.0, 0.0, 39.78, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 20.5], ["hum", 19.3], ["mains hum", 17.86]], null, null, null, null, null, [["bee, wasp, etc.", 34.77], ["fly, housefly", 25.56], ["insect", 24.43]], [["mains hum", 39.48], ["hum", 37.46], ["bee, wasp, etc.", 4.14]], [["hum", 44.11], ["mains hum", 20.52], ["speech", 5.72]], null, null, null, [["hum", 21.09], ["speech", 19.68], ["throbbing", 8.24]], null, null, null], "duration": [-0.01, 0.24, 0.27, 1.41, 0.23, 2.22, 1.38, 0.83, 0.97, -0.15, 0.27, 5.16, 5.75, 5.47, 0.71, 0.11, 0.73, 2.87, 0.32, 1.54, -0.12]} \ No newline at end of file diff --git a/annotations_1/nPeH0w6ZXZM_filtered.json b/annotations_1/nPeH0w6ZXZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e95bd08c3a5e9402171cce92ed33fe2d3b747dfc --- /dev/null +++ b/annotations_1/nPeH0w6ZXZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 26.27], [29.0, 29.3], [31.0, 38.11], [39.0, 41.0], [42.0, 69.79], [73.0, 76.44], [78.0, 81.09], [83.0, 83.17], [86.0, 85.56], [86.0, 87.22], [88.0, 90.24], [92.0, 93.18], [95.0, 96.58], [98.0, 98.9], [99.0, 99.81], [102.0, 103.44], [104.0, 105.93]], "keep_status": [false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.11, 0.0, 37.2, 46.86, 31.55, 36.51, 47.58, 0.0, 0.0, 0.0, 63.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 65.14], ["musical instrument", 11.8], ["brass instrument", 6.1]], null, [["music", 65.04], ["theremin", 8.44], ["musical instrument", 5.31]], [["music", 56.36], ["musical instrument", 6.9], ["clarinet", 6.24]], [["music", 61.76], ["musical instrument", 9.97], ["brass instrument", 6.32]], [["music", 42.62], ["musical instrument", 9.58], ["didgeridoo", 7.87]], [["music", 41.38], ["didgeridoo", 11.01], ["musical instrument", 7.84]], null, null, null, null, null, null, null, null, null, null], "duration": [19.27, 0.3, 7.11, 2.0, 27.79, 3.44, 3.09, 0.17, -0.44, 1.22, 2.24, 1.18, 1.58, 0.9, 0.81, 1.44, 1.93]} \ No newline at end of file diff --git a/annotations_1/nQ2Y1gm0fRU_filtered.json b/annotations_1/nQ2Y1gm0fRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09f5162a6dbfa77fda94c627748cb0c10d5f58c1 --- /dev/null +++ b/annotations_1/nQ2Y1gm0fRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.14], [53.0, 53.52], [56.0, 56.49], [62.0, 62.4], [67.0, 68.47], [78.0, 78.93], [97.0, 97.83], [99.0, 102.91], [105.0, 106.71], [116.0, 131.41], [135.0, 151.06], [153.0, 153.44], [154.0, 153.67], [154.0, 153.74], [154.0, 155.19]], "keep_status": [false, false, false, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.07, 0.0, 32.0, 31.93, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 39.1], ["speech", 10.82], ["didgeridoo", 8.44]], null, [["speech", 22.05], ["music", 21.16], ["throbbing", 9.67]], [["music", 36.17], ["throbbing", 10.95], ["speech", 7.56]], null, null, null, null], "duration": [0.14, 0.52, 0.49, 0.4, 1.47, 0.93, 0.83, 3.91, 1.71, 15.41, 16.06, 0.44, -0.33, -0.26, 1.19]} \ No newline at end of file diff --git a/annotations_1/nQeov6j0bsQ_filtered.json b/annotations_1/nQeov6j0bsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e034be0ca862b06c224856e3b819ea2d0f811e2 --- /dev/null +++ b/annotations_1/nQeov6j0bsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[68.0, 98.05], [100.0, 107.16], [110.0, 112.7], [116.0, 123.25], [125.0, 130.52]], "keep_status": [false, false, false, false, true], "silence_prob": [0.0, 33.19, 35.52, 33.6, 34.67], "audiomae_on_audioset": [null, [["music", 27.28], ["hum", 27.19], ["speech", 16.8]], [["music", 58.04], ["sidetone", 11.35], ["throbbing", 5.3]], [["music", 61.46], ["speech", 12.81], ["electronic music", 5.78]], [["music", 46.75], ["speech", 8.9], ["whale vocalization", 5.4]]], "duration": [30.05, 7.16, 2.7, 7.25, 5.52]} \ No newline at end of file diff --git a/annotations_1/nS-0lfCTcrk_filtered.json b/annotations_1/nS-0lfCTcrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eec002fd61f07498aba0ea2d9c9c2362bda98750 --- /dev/null +++ b/annotations_1/nS-0lfCTcrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 18.33], [20.0, 23.23], [24.0, 30.35], [31.0, 53.81], [58.0, 64.88], [75.0, 82.14], [82.0, 114.62], [116.0, 116.23], [116.0, 116.67], [117.0, 120.38], [122.0, 129.83], [131.0, 135.94], [137.0, 139.8], [140.0, 141.45], [142.0, 142.82], [144.0, 148.39]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.44, 34.82, 36.61, 30.64, 31.7, 30.74, 0.0, 0.0, 0.0, 95.37, 100.0, 86.09, 51.18, 0.0, 0.0, 43.25], "audiomae_on_audioset": [[["music", 66.86], ["brass instrument", 5.69], ["musical instrument", 4.23]], [["music", 54.69], ["saxophone", 9.92], ["wind instrument, woodwind instrument", 5.57]], [["music", 50.8], ["musical instrument", 10.96], ["synthesizer", 8.09]], [["music", 55.86], ["musical instrument", 17.3], ["brass instrument", 7.68]], [["saxophone", 39.94], ["music", 18.56], ["brass instrument", 16.93]], [["music", 38.72], ["saxophone", 26.48], ["brass instrument", 10.05]], null, null, null, null, null, null, null, null, null, [["speech", 87.6], ["telephone", 4.49], ["inside, small room", 1.0]]], "duration": [9.33, 3.23, 6.35, 22.81, 6.88, 7.14, 32.62, 0.23, 0.67, 3.38, 7.83, 4.94, 2.8, 1.45, 0.82, 4.39]} \ No newline at end of file diff --git a/annotations_1/nS1ePEA5XeQ_filtered.json b/annotations_1/nS1ePEA5XeQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2ba946e08262c1019ad2823d65e6f9663d70332 --- /dev/null +++ b/annotations_1/nS1ePEA5XeQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.48], [8.0, 8.63], [12.0, 14.77], [34.0, 34.45], [38.0, 38.18], [43.0, 43.44], [47.0, 48.24], [50.0, 57.5], [58.0, 61.15], [63.0, 63.0], [63.0, 63.04], [64.0, 64.3], [64.0, 64.34], [64.0, 72.45], [75.0, 79.03], [79.0, 79.3], [79.0, 99.44], [101.0, 105.39], [109.0, 117.85]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, false, true, true, true], "silence_prob": [0.0, 0.0, 96.04, 0.0, 0.0, 0.0, 0.0, 34.72, 34.89, 0.0, 0.0, 0.0, 0.0, 37.27, 36.97, 0.0, 34.77, 35.55, 33.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 55.88], ["theremin", 5.71], ["speech", 3.22]], [["music", 22.83], ["speech", 22.18], ["hum", 10.75]], null, null, null, null, [["music", 66.58], ["cello", 3.93], ["clarinet", 2.63]], [["music", 44.71], ["trombone", 6.24], ["brass instrument", 6.19]], null, [["music", 39.27], ["speech", 21.22], ["animal", 7.03]], [["music", 34.98], ["speech", 6.04], ["animal", 4.76]], [["speech", 42.7], ["music", 24.13], ["hum", 2.81]]], "duration": [0.48, 0.63, 2.77, 0.45, 0.18, 0.44, 1.24, 7.5, 3.15, 0.0, 0.04, 0.3, 0.34, 8.45, 4.03, 0.3, 20.44, 4.39, 8.85]} \ No newline at end of file diff --git a/annotations_1/nS4Zfx9BSX0_filtered.json b/annotations_1/nS4Zfx9BSX0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bce913d62069fcd71a9407b7df354d460793fd9 --- /dev/null +++ b/annotations_1/nS4Zfx9BSX0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 23.75], [35.0, 41.93], [50.0, 73.09], [75.0, 83.84], [84.0, 84.48], [96.0, 96.55], [98.0, 98.07], [101.0, 101.17], [115.0, 115.8], [118.0, 117.93], [118.0, 122.98]], "keep_status": [true, true, true, true, false, false, false, false, false, false, false], "silence_prob": [34.3, 35.73, 33.82, 38.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.27], "audiomae_on_audioset": [[["music", 56.45], ["theremin", 6.81], ["throbbing", 4.91]], [["music", 54.08], ["didgeridoo", 5.54], ["effects unit", 4.89]], [["music", 54.27], ["guitar", 6.91], ["fart", 6.27]], [["music", 52.24], ["theremin", 12.05], ["musical instrument", 5.04]], null, null, null, null, null, null, [["music", 58.17], ["speech", 18.75], ["vibraphone", 2.32]]], "duration": [3.75, 6.93, 23.09, 8.84, 0.48, 0.55, 0.07, 0.17, 0.8, -0.07, 4.98]} \ No newline at end of file diff --git a/annotations_1/nSH_S3LDUYI_filtered.json b/annotations_1/nSH_S3LDUYI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..668f10b570be9fda8550c7062974024493a5a915 --- /dev/null +++ b/annotations_1/nSH_S3LDUYI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.9], [14.0, 14.89], [20.0, 20.75], [26.0, 26.4], [32.0, 38.74], [41.0, 43.82], [50.0, 51.41], [54.0, 53.77], [57.0, 57.25], [69.0, 69.16], [71.0, 91.4], [95.0, 97.24], [103.0, 104.31], [105.0, 106.59], [107.0, 108.43], [109.0, 110.71], [112.0, 113.22], [115.0, 117.8], [123.0, 130.37], [135.0, 135.97], [137.0, 138.27], [140.0, 142.72], [145.0, 145.3], [147.0, 148.49], [151.0, 152.85], [162.0, 163.75]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.85, 29.45, 0.0, 0.0, 0.0, 0.0, 33.26, 88.83, 0.0, 0.0, 0.0, 0.0, 0.0, 89.36, 33.43, 0.0, 0.0, 32.43, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 78.97], ["static", 1.73], ["reggae", 1.25]], [["music", 49.01], ["carnatic music", 5.36], ["drum machine", 4.01]], null, null, null, null, [["music", 84.02], ["throbbing", 3.05], ["drum and bass", 2.95]], null, null, null, null, null, null, null, [["speech", 35.35], ["music", 25.45], ["throbbing", 13.01]], null, null, [["music", 52.12], ["drum and bass", 13.42], ["throbbing", 6.16]], null, null, null, null], "duration": [-0.1, 0.89, 0.75, 0.4, 6.74, 2.82, 1.41, -0.23, 0.25, 0.16, 20.4, 2.24, 1.31, 1.59, 1.43, 1.71, 1.22, 2.8, 7.37, 0.97, 1.27, 2.72, 0.3, 1.49, 1.85, 1.75]} \ No newline at end of file diff --git a/annotations_1/nSO22k4XGUo_filtered.json b/annotations_1/nSO22k4XGUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1a910b5f01b4778ca7794dbd73761f4dc77855f --- /dev/null +++ b/annotations_1/nSO22k4XGUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.67], [6.0, 8.01], [9.0, 9.71], [16.0, 17.24], [18.0, 17.9], [20.0, 23.06], [24.0, 26.23], [27.0, 28.11], [32.0, 38.21], [40.0, 40.76], [42.0, 48.84], [50.0, 50.01], [58.0, 58.14], [59.0, 60.29], [69.0, 69.62], [78.0, 82.41], [85.0, 85.08], [90.0, 90.54], [91.0, 91.3], [92.0, 92.23], [95.0, 95.3], [110.0, 111.08], [116.0, 116.85], [117.0, 117.49], [120.0, 120.48]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.41, 0.0, 0.0, 0.0, 32.5, 97.22, 0.0, 53.04, 0.0, 34.34, 0.0, 0.0, 0.0, 0.0, 30.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 41.19], ["didgeridoo", 33.38], ["musical instrument", 2.47]], null, null, null, [["music", 41.5], ["didgeridoo", 11.15], ["synthesizer", 7.77]], null, null, null, null, [["speech", 55.33], ["music", 18.94], ["breaking", 8.92]], null, null, null, null, [["speech", 68.68], ["burst, pop", 4.93], ["radio", 3.15]], null, null, null, null, null, null, null, null, null], "duration": [0.67, 2.01, 0.71, 1.24, -0.1, 3.06, 2.23, 1.11, 6.21, 0.76, 6.84, 0.01, 0.14, 1.29, 0.62, 4.41, 0.08, 0.54, 0.3, 0.23, 0.3, 1.08, 0.85, 0.49, 0.48]} \ No newline at end of file diff --git a/annotations_1/nTAYbwY6oeU_filtered.json b/annotations_1/nTAYbwY6oeU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..042282de44d3e4b9c9bcb29772c6086eb4892669 --- /dev/null +++ b/annotations_1/nTAYbwY6oeU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.22], [15.0, 20.8], [21.0, 45.03], [46.0, 56.44], [58.0, 58.65]], "keep_status": [false, true, true, true, false], "silence_prob": [29.76, 30.49, 29.72, 29.63, 0.0], "audiomae_on_audioset": [[["throbbing", 32.9], ["hum", 31.31], ["music", 21.15]], [["music", 48.76], ["throbbing", 10.09], ["electronic music", 7.57]], [["music", 57.57], ["cacophony", 4.76], ["throbbing", 3.45]], [["music", 42.91], ["throbbing", 12.52], ["hum", 9.32]], null], "duration": [4.22, 5.8, 24.03, 10.44, 0.65]} \ No newline at end of file diff --git a/annotations_1/nToATRUkpMI_filtered.json b/annotations_1/nToATRUkpMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a0338e5fb01426e764809dcc23204bdde4e45b6 --- /dev/null +++ b/annotations_1/nToATRUkpMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [4.0, 4.48], [6.0, 6.34], [9.0, 9.64], [11.0, 11.48], [12.0, 13.61], [16.0, 16.95], [25.0, 25.95], [35.0, 36.31], [37.0, 38.1], [39.0, 39.75], [41.0, 42.01], [44.0, 46.74], [52.0, 53.06], [57.0, 56.69], [58.0, 58.89], [60.0, 61.1], [68.0, 68.45], [69.0, 70.07], [72.0, 73.65], [75.0, 75.34], [81.0, 81.68], [103.0, 103.57], [108.0, 108.26], [119.0, 119.77], [124.0, 124.98], [127.0, 128.36], [129.0, 131.03], [132.0, 132.04], [133.0, 134.96], [136.0, 136.78], [138.0, 139.72], [140.0, 141.72], [146.0, 146.33], [154.0, 154.89], [155.0, 155.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 13.07], ["radio", 6.38], ["busy signal", 6.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 79.18], ["speech synthesizer", 2.94], ["inside, small room", 1.93]], null, null, null, null, null, null, null, null], "duration": [0.04, 0.48, 0.34, 0.64, 0.48, 1.61, 0.95, 0.95, 1.31, 1.1, 0.75, 1.01, 2.74, 1.06, -0.31, 0.89, 1.1, 0.45, 1.07, 1.65, 0.34, 0.68, 0.57, 0.26, 0.77, 0.98, 1.36, 2.03, 0.04, 1.96, 0.78, 1.72, 1.72, 0.33, 0.89, 0.9]} \ No newline at end of file diff --git a/annotations_1/nUpmxMzBCjk_filtered.json b/annotations_1/nUpmxMzBCjk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..438888fa1eba5672cd405800bcd5ef878aabd425 --- /dev/null +++ b/annotations_1/nUpmxMzBCjk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.7], [8.0, 12.36], [14.0, 17.9], [25.0, 25.68], [27.0, 27.55], [30.0, 34.67], [35.0, 36.71], [37.0, 38.64], [40.0, 40.91], [42.0, 45.55], [48.0, 48.69], [54.0, 54.09], [56.0, 56.96], [59.0, 63.51], [64.0, 64.37], [84.0, 90.59], [93.0, 93.88], [108.0, 123.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [36.75, 60.14, 68.8, 0.0, 0.0, 47.82, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 36.31, 0.0, 29.6, 0.0, 29.01], "audiomae_on_audioset": [[["music", 42.59], ["trombone", 25.79], ["brass instrument", 9.07]], null, null, null, null, [["speech", 51.64], ["sidetone", 28.04], ["radio", 3.36]], null, null, null, null, null, null, null, [["sidetone", 33.99], ["noise", 8.94], ["music", 8.49]], null, [["speech", 44.57], ["vehicle", 23.4], ["car", 6.47]], null, [["music", 67.61], ["musical instrument", 9.62], ["didgeridoo", 5.21]]], "duration": [3.7, 4.36, 3.9, 0.68, 0.55, 4.67, 1.71, 1.64, 0.91, 3.55, 0.69, 0.09, 0.96, 4.51, 0.37, 6.59, 0.88, 15.82]} \ No newline at end of file diff --git a/annotations_1/nUxHF4O3GYU_filtered.json b/annotations_1/nUxHF4O3GYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41370e49a15feb60be0535fbfc1a65a7252cc267 --- /dev/null +++ b/annotations_1/nUxHF4O3GYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.41], [6.0, 6.96], [12.0, 15.85], [19.0, 19.23], [21.0, 20.75], [22.0, 22.15], [23.0, 24.85], [27.0, 27.43], [34.0, 35.13], [38.0, 39.21], [42.0, 42.67], [44.0, 46.31], [49.0, 51.22], [51.0, 56.76], [58.0, 58.09], [60.0, 62.7], [68.0, 70.16], [72.0, 73.87], [75.0, 75.69], [77.0, 78.51], [80.0, 80.97], [82.0, 86.48], [88.0, 89.65], [93.0, 96.28], [97.0, 99.2], [101.0, 101.26], [104.0, 105.06], [107.0, 108.94], [110.0, 118.56], [119.0, 126.0], [126.0, 129.86], [131.0, 141.62], [143.0, 144.36], [145.0, 146.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 76.04, 32.68, 0.0, 44.57, 76.37, 0.0, 0.0, 0.0, 0.0, 83.34, 0.0, 40.93, 68.15, 0.0, 0.0, 0.0, 65.79, 53.84, 29.99, 57.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 19.8], ["speech", 19.65], ["mechanisms", 11.37]], null, [["music", 27.76], ["hum", 25.22], ["throbbing", 20.22]], null, null, null, null, null, null, null, [["music", 34.71], ["theremin", 28.19], ["speech", 4.35]], null, null, null, null, null, null, [["speech", 44.56], ["thunk", 24.09], ["breaking", 5.06]], null, null, null], "duration": [0.41, 0.96, 3.85, 0.23, -0.25, 0.15, 1.85, 0.43, 1.13, 1.21, 0.67, 2.31, 2.22, 5.76, 0.09, 2.7, 2.16, 1.87, 0.69, 1.51, 0.97, 4.48, 1.65, 3.28, 2.2, 0.26, 1.06, 1.94, 8.56, 7.0, 3.86, 10.62, 1.36, 1.75]} \ No newline at end of file diff --git a/annotations_1/nVvMBs0TFWA_filtered.json b/annotations_1/nVvMBs0TFWA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46c33f6d8227fd594927a2885e2e4b29fc018cea --- /dev/null +++ b/annotations_1/nVvMBs0TFWA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.06], [7.0, 8.02], [11.0, 11.89], [13.0, 15.09], [15.0, 17.93], [20.0, 22.01], [24.0, 41.25], [43.0, 50.9], [53.0, 68.57], [70.0, 70.09], [74.0, 91.07], [92.0, 99.76], [100.0, 100.53], [102.0, 105.54], [106.0, 108.53], [110.0, 117.02], [118.0, 165.87], [168.0, 172.32]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [98.51, 0.0, 0.0, 81.53, 51.28, 99.99, 44.34, 51.6, 45.33, 0.0, 65.67, 82.97, 0.0, 86.64, 79.07, 61.47, 0.0, 36.72], "audiomae_on_audioset": [null, null, null, null, null, null, [["mains hum", 53.77], ["hum", 40.08], ["music", 1.6]], null, [["music", 29.41], ["speech", 10.42], ["didgeridoo", 4.08]], null, null, null, null, null, null, null, null, [["throbbing", 52.39], ["hum", 20.39], ["music", 15.29]]], "duration": [2.06, 1.02, 0.89, 2.09, 2.93, 2.01, 17.25, 7.9, 15.57, 0.09, 17.07, 7.76, 0.53, 3.54, 2.53, 7.02, 47.87, 4.32]} \ No newline at end of file diff --git a/annotations_1/nW92suQFQ5c_filtered.json b/annotations_1/nW92suQFQ5c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24f64d3d1b473ba97cb49292c8405521233a41f4 --- /dev/null +++ b/annotations_1/nW92suQFQ5c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 42.58], [45.0, 46.14], [48.0, 49.67], [52.0, 52.35], [55.0, 55.76], [61.0, 61.57], [63.0, 67.1], [69.0, 81.8]], "keep_status": [false, false, false, false, false, false, true, true], "silence_prob": [57.64, 0.0, 0.0, 0.0, 0.0, 0.0, 40.09, 44.55], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 35.12], ["rumble", 25.09], ["throbbing", 8.95]], [["music", 23.64], ["sine wave", 16.04], ["breaking", 9.09]]], "duration": [3.58, 1.14, 1.67, 0.35, 0.76, 0.57, 4.1, 12.8]} \ No newline at end of file diff --git a/annotations_1/nWd-gLPa5fs_filtered.json b/annotations_1/nWd-gLPa5fs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e18433c51d52494490357f95b008736542f935de --- /dev/null +++ b/annotations_1/nWd-gLPa5fs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.68], [7.0, 8.04], [11.0, 13.22], [16.0, 16.61], [17.0, 18.49], [21.0, 21.88], [25.0, 25.03], [26.0, 28.44], [30.0, 31.38], [32.0, 32.05], [34.0, 34.62], [42.0, 42.99], [45.0, 46.4], [48.0, 51.73], [53.0, 53.81], [57.0, 57.77], [60.0, 59.88], [62.0, 62.38], [63.0, 66.53], [67.0, 68.69], [70.0, 74.39], [76.0, 80.64], [82.0, 86.86], [90.0, 94.51], [96.0, 97.43], [100.0, 101.16], [104.0, 109.49], [110.0, 115.62], [118.0, 121.39], [123.0, 123.57], [130.0, 130.23], [133.0, 133.47], [137.0, 137.2], [139.0, 139.19], [141.0, 141.52], [143.0, 144.58], [154.0, 154.89], [158.0, 159.34], [162.0, 163.11], [166.0, 166.5], [169.0, 169.32], [170.0, 170.85], [174.0, 177.25]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 87.92, 0.0, 0.0, 0.0, 0.0, 44.07, 0.0, 0.0, 0.0, 0.0, 0.0, 35.55, 0.0, 0.0, 0.0, 0.0, 39.19, 0.0, 34.18, 59.24, 90.25, 71.57, 0.0, 0.0, 56.25, 54.36, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.81], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["whale vocalization", 28.76], ["music", 18.71], ["hum", 6.22]], null, null, null, null, null, [["speech", 63.96], ["music", 6.75], ["didgeridoo", 6.63]], null, null, null, null, [["speech", 33.12], ["music", 30.17], ["theremin", 6.1]], null, [["speech", 50.63], ["music", 21.74], ["musical instrument", 3.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, 1.04, 2.22, 0.61, 1.49, 0.88, 0.03, 2.44, 1.38, 0.05, 0.62, 0.99, 1.4, 3.73, 0.81, 0.77, -0.12, 0.38, 3.53, 1.69, 4.39, 4.64, 4.86, 4.51, 1.43, 1.16, 5.49, 5.62, 3.39, 0.57, 0.23, 0.47, 0.2, 0.19, 0.52, 1.58, 0.89, 1.34, 1.11, 0.5, 0.32, 0.85, 3.25]} \ No newline at end of file diff --git a/annotations_1/nWwlcubR7s0_filtered.json b/annotations_1/nWwlcubR7s0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..586f7913c661adca0051e7a34b36fb99f7f219e4 --- /dev/null +++ b/annotations_1/nWwlcubR7s0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.39], [12.0, 13.09], [21.0, 22.27], [24.0, 24.61], [29.0, 30.94], [43.0, 45.64], [47.0, 47.88], [51.0, 53.33], [57.0, 57.99], [66.0, 66.46], [69.0, 71.63], [77.0, 77.4], [80.0, 81.41], [83.0, 83.17], [102.0, 101.71], [113.0, 113.22], [122.0, 121.93], [131.0, 132.9], [144.0, 147.18], [151.0, 151.29], [154.0, 164.25], [165.0, 165.72], [166.0, 166.82]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [35.44, 0.0, 0.0, 0.0, 0.0, 29.54, 0.0, 30.52, 0.0, 0.0, 60.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.04, 0.0, 33.97, 0.0, 0.0], "audiomae_on_audioset": [[["beatboxing", 32.52], ["music", 12.26], ["cough", 11.26]], null, null, null, null, [["music", 60.67], ["speech", 10.53], ["boing", 4.39]], null, [["music", 47.42], ["throbbing", 4.92], ["mains hum", 2.54]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 38.47], ["speech", 24.17], ["sonar", 5.89]], null, null], "duration": [2.39, 1.09, 1.27, 0.61, 1.94, 2.64, 0.88, 2.33, 0.99, 0.46, 2.63, 0.4, 1.41, 0.17, -0.29, 0.22, -0.07, 1.9, 3.18, 0.29, 10.25, 0.72, 0.82]} \ No newline at end of file diff --git a/annotations_1/nXSfDMvXAxw_filtered.json b/annotations_1/nXSfDMvXAxw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce2377b1e19e8a20dc7ac5392b4b1f6b5258eeaf --- /dev/null +++ b/annotations_1/nXSfDMvXAxw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.35], [10.0, 12.72], [20.0, 21.42], [24.0, 24.54], [27.0, 27.65], [33.0, 34.35], [35.0, 36.58], [51.0, 57.06], [57.0, 58.31], [59.0, 64.25], [66.0, 69.45], [71.0, 71.59], [73.0, 73.82], [75.0, 75.02], [76.0, 76.52]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.16, 0.0, 0.0, 0.0, 0.0, 0.0, 48.1, 0.0, 67.13, 58.22, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["fart", 25.51], ["noise", 5.91], ["frog", 4.62]], null, null, null, null, null, [["fly, housefly", 28.26], ["mosquito", 23.77], ["whale vocalization", 5.42]], null, null, null, null, null, null, null], "duration": [1.35, 2.72, 1.42, 0.54, 0.65, 1.35, 1.58, 6.06, 1.31, 5.25, 3.45, 0.59, 0.82, 0.02, 0.52]} \ No newline at end of file diff --git a/annotations_1/nXV8YHeJfOs_filtered.json b/annotations_1/nXV8YHeJfOs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21abc3cde6070ac332715f8d548be3826513ddb8 --- /dev/null +++ b/annotations_1/nXV8YHeJfOs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 28.85], [30.0, 30.72], [31.0, 33.67], [37.0, 45.44], [46.0, 87.83], [89.0, 89.56], [91.0, 92.87], [95.0, 96.01], [97.0, 99.33], [100.0, 107.55], [109.0, 109.8], [111.0, 111.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.49, 0.0, 30.71, 30.34, 0.0, 0.0, 0.0, 0.0, 35.63, 30.55, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 39.71], ["music", 17.7], ["cacophony", 17.17]], null, [["music", 68.75], ["speech", 9.92], ["smash, crash", 2.78]], [["music", 58.05], ["speech", 15.7], ["hum", 4.65]], null, null, null, null, [["music", 47.67], ["throbbing", 22.68], ["hum", 6.85]], [["throbbing", 48.01], ["music", 18.0], ["hum", 16.28]], null, null], "duration": [19.85, 0.72, 2.67, 8.44, 41.83, 0.56, 1.87, 1.01, 2.33, 7.55, 0.8, 0.59]} \ No newline at end of file diff --git a/annotations_1/nXait2wHOQc_filtered.json b/annotations_1/nXait2wHOQc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2d9dbc3d14be197bb501cf73ebae2566a95fe22 --- /dev/null +++ b/annotations_1/nXait2wHOQc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.96], [18.0, 19.13], [26.0, 27.38], [32.0, 32.58], [33.0, 33.74], [34.0, 38.13], [39.0, 39.93], [43.0, 43.14], [47.0, 50.35], [53.0, 54.73], [55.0, 56.67], [58.0, 62.04], [67.0, 67.63], [72.0, 72.44], [75.0, 76.05], [78.0, 79.03], [83.0, 85.02], [86.0, 86.97], [93.0, 93.24], [94.0, 98.15], [107.0, 108.06], [110.0, 112.8], [113.0, 117.29], [117.0, 118.15], [120.0, 125.85], [127.0, 130.3], [132.0, 138.64], [141.0, 149.74], [154.0, 155.9], [158.0, 159.16], [163.0, 163.81], [165.0, 165.6], [167.0, 169.05], [171.0, 171.32], [176.0, 176.47], [180.0, 181.92], [182.0, 182.04], [182.0, 182.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.44, 0.0, 0.0, 0.0, 0.0, 71.87, 0.0, 0.0, 85.35, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 0.0, 49.09, 0.0, 0.0, 91.98, 0.0, 73.82, 89.19, 0.0, 43.66, 44.9, 49.68, 44.4, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.97], ["music", 35.01], ["boing", 3.12]], null, null, null, null, null, null, null, [["speech", 37.17], ["music", 31.95], ["boing", 5.89]], [["speech", 33.06], ["music", 16.09], ["livestock, farm animals, working animals", 7.69]], [["music", 50.53], ["livestock, farm animals, working animals", 7.0], ["boing", 4.87]], [["music", 58.2], ["speech", 11.16], ["boing", 10.57]], null, null, null, null, null, null, null, null, null, null], "duration": [3.96, 1.13, 1.38, 0.58, 0.74, 4.13, 0.93, 0.14, 3.35, 1.73, 1.67, 4.04, 0.63, 0.44, 1.05, 1.03, 2.02, 0.97, 0.24, 4.15, 1.06, 2.8, 4.29, 1.15, 5.85, 3.3, 6.64, 8.74, 1.9, 1.16, 0.81, 0.6, 2.05, 0.32, 0.47, 1.92, 0.04, 0.58]} \ No newline at end of file diff --git a/annotations_1/nXrsB2RMo2w_filtered.json b/annotations_1/nXrsB2RMo2w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e70bcbcaaae8dc635ecbd79e80a8597e78d7eff --- /dev/null +++ b/annotations_1/nXrsB2RMo2w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 55.49], [57.0, 57.82], [59.0, 60.3], [61.0, 62.26], [63.0, 108.87], [110.0, 110.24], [111.0, 113.48], [116.0, 116.09], [116.0, 116.46], [117.0, 118.29], [121.0, 121.88], [123.0, 127.11], [128.0, 129.68], [130.0, 132.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 0.0, 51.02, 0.0, 40.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 55.97], ["speech", 30.32], ["dial tone", 5.23]]], "duration": [38.49, 0.82, 1.3, 1.26, 45.87, 0.24, 2.48, 0.09, 0.46, 1.29, 0.88, 4.11, 1.68, 2.41]} \ No newline at end of file diff --git a/annotations_1/nYvvM0FXKWQ_filtered.json b/annotations_1/nYvvM0FXKWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa677631e4f81621c1812a428b064f0bbac5bad5 --- /dev/null +++ b/annotations_1/nYvvM0FXKWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.13], [10.0, 11.8], [13.0, 16.44], [22.0, 25.12], [28.0, 30.3], [31.0, 33.27], [39.0, 40.51], [42.0, 42.48], [45.0, 49.01], [53.0, 73.31], [85.0, 85.31], [86.0, 86.26], [88.0, 89.78], [94.0, 95.23], [97.0, 97.63], [101.0, 101.49], [102.0, 138.82], [139.0, 139.23], [140.0, 142.08], [148.0, 149.86], [154.0, 154.21], [156.0, 160.1]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 92.8, 89.19, 66.63, 56.55, 0.0, 0.0, 29.99, 49.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 0.0, 32.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 51.3], ["hum", 7.95], ["explosion", 5.34]], [["music", 73.48], ["theremin", 6.99], ["soundtrack music", 3.45]], null, null, null, null, null, null, null, null, null, null, null, [["music", 43.05], ["throbbing", 11.28], ["hum", 4.79]]], "duration": [1.13, 1.8, 3.44, 3.12, 2.3, 2.27, 1.51, 0.48, 4.01, 20.31, 0.31, 0.26, 1.78, 1.23, 0.63, 0.49, 36.82, 0.23, 2.08, 1.86, 0.21, 4.1]} \ No newline at end of file diff --git a/annotations_1/n_3Fsg5qGfk_filtered.json b/annotations_1/n_3Fsg5qGfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa7a32dbbd46625a6978fd6e7972e0ed1eed426f --- /dev/null +++ b/annotations_1/n_3Fsg5qGfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.42], [14.0, 14.44], [15.0, 17.09], [18.0, 32.68], [35.0, 35.55], [39.0, 45.5], [46.0, 45.59], [46.0, 45.64], [46.0, 45.69], [46.0, 45.77], [46.0, 60.0], [63.0, 62.82], [65.0, 66.38], [67.0, 67.64], [68.0, 70.02], [70.0, 73.58], [75.0, 78.21], [82.0, 85.14], [86.0, 87.18], [89.0, 92.13], [93.0, 94.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 96.04, 70.44, 0.0, 31.89, 0.0, 0.0, 0.0, 0.0, 58.64, 0.0, 0.0, 0.0, 33.12, 76.7, 94.81, 91.13, 0.0, 77.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 59.98], ["music", 16.83], ["explosion", 5.29]], null, null, null, null, null, null, null, null, [["speech", 41.19], ["music", 9.35], ["boing", 6.62]], null, null, null, null, null, null], "duration": [0.42, 0.44, 2.09, 14.68, 0.55, 6.5, -0.41, -0.36, -0.31, -0.23, 14.0, -0.18, 1.38, 0.64, 2.02, 3.58, 3.21, 3.14, 1.18, 3.13, 1.44]} \ No newline at end of file diff --git a/annotations_1/n_ci8BbMilc_filtered.json b/annotations_1/n_ci8BbMilc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6cb22331a35606ad74e741daedf08bebb2c5f1e --- /dev/null +++ b/annotations_1/n_ci8BbMilc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.29], [3.0, 3.35], [4.0, 23.28], [49.0, 59.73], [67.0, 68.28], [92.0, 92.84], [100.0, 101.02], [105.0, 105.85], [107.0, 117.58], [119.0, 127.25], [129.0, 128.95], [130.0, 130.96], [131.0, 132.19]], "keep_status": [false, false, true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 41.12, 63.64, 0.0, 0.0, 0.0, 0.0, 30.18, 30.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 50.34], ["musical instrument", 8.34], ["synthesizer", 3.85]], null, null, null, null, null, [["speech", 29.08], ["music", 16.03], ["groan", 5.4]], [["fart", 37.45], ["crying, sobbing", 12.66], ["speech", 11.7]], null, null, null], "duration": [0.29, 0.35, 19.28, 10.73, 1.28, 0.84, 1.02, 0.85, 10.58, 8.25, -0.05, 0.96, 1.19]} \ No newline at end of file diff --git a/annotations_1/n_z0TcZkPzg_filtered.json b/annotations_1/n_z0TcZkPzg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6862282df47460fe370019e8dffc799f88be0a3 --- /dev/null +++ b/annotations_1/n_z0TcZkPzg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.02], [12.0, 12.31], [12.0, 17.09], [25.0, 25.35], [26.0, 26.49], [40.0, 41.15], [42.0, 44.95], [46.0, 46.97], [51.0, 51.73], [54.0, 55.07], [58.0, 69.01], [71.0, 70.95], [71.0, 71.12], [72.0, 84.72], [85.0, 87.99], [90.0, 91.08], [92.0, 93.45], [95.0, 96.85], [99.0, 99.33], [102.0, 102.96], [105.0, 106.22], [113.0, 118.99], [120.0, 120.36], [124.0, 124.92]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [46.19, 0.0, 42.67, 0.0, 0.0, 0.0, 69.07, 0.0, 0.0, 0.0, 54.56, 0.0, 0.0, 97.0, 92.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.0, 0.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 43.44], ["music", 14.62], ["speech", 6.65]], null, [["music", 23.87], ["foghorn", 22.99], ["speech", 12.0]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["busy signal", 16.71], ["speech", 12.05], ["dial tone", 8.23]], null, null], "duration": [4.02, 0.31, 5.09, 0.35, 0.49, 1.15, 2.95, 0.97, 0.73, 1.07, 11.01, -0.05, 0.12, 12.72, 2.99, 1.08, 1.45, 1.85, 0.33, 0.96, 1.22, 5.99, 0.36, 0.92]} \ No newline at end of file diff --git a/annotations_1/nbssDN3Y75Q_filtered.json b/annotations_1/nbssDN3Y75Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d82f2459f87bb11582d3d77fb383e8ed01e94b27 --- /dev/null +++ b/annotations_1/nbssDN3Y75Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 14.67], [15.0, 16.34], [18.0, 19.7], [21.0, 22.08], [22.0, 23.57], [24.0, 25.08], [25.0, 25.19], [26.0, 26.77], [29.0, 31.21], [36.0, 38.4], [40.0, 42.5], [45.0, 50.38], [51.0, 56.13], [58.0, 64.77], [66.0, 69.5], [71.0, 73.5], [74.0, 75.27], [76.0, 83.69], [84.0, 96.8], [98.0, 99.94], [101.0, 101.9], [104.0, 105.24], [106.0, 118.45], [131.0, 130.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, true, false], "silence_prob": [71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.42, 65.44, 80.46, 36.65, 37.59, 62.89, 58.64, 31.29, 0.0, 34.13, 45.24, 0.0, 0.0, 0.0, 32.29, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 40.79], ["music", 22.71], ["hum", 10.37]], [["whale vocalization", 42.36], ["music", 14.83], ["hum", 13.64]], null, null, [["hum", 28.61], ["music", 18.83], ["mains hum", 17.77]], null, [["music", 31.29], ["noise", 13.97], ["hum", 10.21]], [["music", 53.28], ["hum", 7.08], ["didgeridoo", 5.69]], null, null, null, [["music", 43.38], ["didgeridoo", 12.58], ["hum", 8.96]], null], "duration": [5.67, 1.34, 1.7, 1.08, 1.57, 1.08, 0.19, 0.77, 2.21, 2.4, 2.5, 5.38, 5.13, 6.77, 3.5, 2.5, 1.27, 7.69, 12.8, 1.94, 0.9, 1.24, 12.45, -0.09]} \ No newline at end of file diff --git a/annotations_1/nc0LwkqYGpM_filtered.json b/annotations_1/nc0LwkqYGpM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58ccf12e74f6c42ae743ff77cf94f1eadcdb08f5 --- /dev/null +++ b/annotations_1/nc0LwkqYGpM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.17], [39.0, 39.46], [43.0, 42.82], [47.0, 46.84], [61.0, 61.42], [95.0, 97.48]], "keep_status": [false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.57], "audiomae_on_audioset": [null, null, null, null, null, [["noise", 28.83], ["fart", 11.67], ["music", 11.18]]], "duration": [1.17, 0.46, -0.18, -0.16, 0.42, 2.48]} \ No newline at end of file diff --git a/annotations_1/ndpVsMLr424_filtered.json b/annotations_1/ndpVsMLr424_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d59e35b9db381b19db8fc58772ad46d3e30c59f --- /dev/null +++ b/annotations_1/ndpVsMLr424_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.73], [30.0, 30.27], [31.0, 58.09]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 29.99], "audiomae_on_audioset": [null, null, [["music", 60.76], ["throbbing", 14.31], ["hum", 5.13]]], "duration": [0.73, 0.27, 27.09]} \ No newline at end of file diff --git a/annotations_1/nepc-GLWtfc_filtered.json b/annotations_1/nepc-GLWtfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd323da0e7167d2d0e3d4ee078716e606e3471f7 --- /dev/null +++ b/annotations_1/nepc-GLWtfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.21], [7.0, 7.7], [9.0, 9.26], [10.0, 11.62], [12.0, 15.04], [16.0, 16.23], [18.0, 19.11], [21.0, 22.05], [24.0, 26.91], [28.0, 31.5], [34.0, 35.82], [37.0, 37.44], [39.0, 42.45], [48.0, 48.09], [51.0, 52.81], [57.0, 57.01], [59.0, 61.64], [63.0, 75.79], [76.0, 77.55], [78.0, 78.54], [79.0, 80.1], [81.0, 81.51]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.7, 0.0, 0.0, 0.0, 33.52, 42.69, 0.0, 0.0, 96.42, 0.0, 0.0, 0.0, 100.0, 98.86, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 41.77], ["cattle, bovinae", 29.85], ["moo", 28.25]], [["hum", 10.67], ["explosion", 7.76], ["speech", 7.31]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 0.7, 0.26, 1.62, 3.04, 0.23, 1.11, 1.05, 2.91, 3.5, 1.82, 0.44, 3.45, 0.09, 1.81, 0.01, 2.64, 12.79, 1.55, 0.54, 1.1, 0.51]} \ No newline at end of file diff --git a/annotations_1/nfFsHF8guzM_filtered.json b/annotations_1/nfFsHF8guzM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1eb952860edc0e0818efd3a1af7089c3d1da472d --- /dev/null +++ b/annotations_1/nfFsHF8guzM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.3], [10.0, 10.08], [11.0, 24.75], [29.0, 30.5], [31.0, 31.46], [34.0, 36.21], [42.0, 41.94], [43.0, 43.92], [47.0, 47.04], [49.0, 49.11], [54.0, 55.27], [56.0, 56.03], [58.0, 59.02], [61.0, 61.32], [63.0, 63.05], [66.0, 65.65], [67.0, 67.22], [70.0, 70.39], [72.0, 73.26], [74.0, 74.61], [75.0, 75.09], [80.0, 81.62], [84.0, 85.43], [87.0, 89.09], [90.0, 90.96], [98.0, 99.17], [101.0, 101.95], [108.0, 110.96]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 34.11, 0.0, 0.0, 33.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.23, 0.0, 0.0, 0.0, 47.2], "audiomae_on_audioset": [null, null, [["music", 28.34], ["speech", 16.3], ["vehicle", 4.43]], null, null, [["livestock, farm animals, working animals", 38.11], ["cattle, bovinae", 37.86], ["moo", 23.65]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.94], ["speech", 10.34], ["didgeridoo", 4.7]], null, null, null, [["livestock, farm animals, working animals", 37.19], ["cattle, bovinae", 27.62], ["moo", 11.78]]], "duration": [0.3, 0.08, 13.75, 1.5, 0.46, 2.21, -0.06, 0.92, 0.04, 0.11, 1.27, 0.03, 1.02, 0.32, 0.05, -0.35, 0.22, 0.39, 1.26, 0.61, 0.09, 1.62, 1.43, 2.09, 0.96, 1.17, 0.95, 2.96]} \ No newline at end of file diff --git a/annotations_1/nfQr0dDL8jg_filtered.json b/annotations_1/nfQr0dDL8jg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90c0bb5a8665cd07dc4a2435fb134ae7e54e15bd --- /dev/null +++ b/annotations_1/nfQr0dDL8jg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.64], [18.0, 59.64], [61.0, 64.89], [65.0, 97.85]], "keep_status": [false, false, false, false], "silence_prob": [55.18, 0.0, 43.61, 0.0], "audiomae_on_audioset": [null, null, [["music", 64.14], ["didgeridoo", 20.37], ["theremin", 4.04]], null], "duration": [2.64, 41.64, 3.89, 32.85]} \ No newline at end of file diff --git a/annotations_1/ng95gpwSjZU_filtered.json b/annotations_1/ng95gpwSjZU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ed5a72e18bee9f7742a221da760d5fba5cd4575 --- /dev/null +++ b/annotations_1/ng95gpwSjZU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [5.0, 7.1], [9.0, 10.59], [14.0, 15.7], [19.0, 19.11], [22.0, 26.45], [27.0, 29.89], [30.0, 32.09], [38.0, 40.22], [41.0, 42.09], [46.0, 46.18], [46.0, 46.41], [48.0, 48.96], [50.0, 52.83], [61.0, 61.74], [84.0, 84.64], [86.0, 87.12], [88.0, 88.11], [88.0, 89.14], [91.0, 92.89], [98.0, 99.93], [110.0, 110.61], [119.0, 120.83], [129.0, 129.61], [131.0, 132.27], [135.0, 136.41], [141.0, 142.37], [144.0, 145.35], [147.0, 146.82], [148.0, 147.82], [149.0, 149.67], [153.0, 153.3], [159.0, 162.4], [167.0, 167.8], [169.0, 170.33], [174.0, 174.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 40.21, 0.0, 0.0, 0.0, 58.89, 51.71, 55.11, 76.04, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["gong", 40.58], ["music", 28.15], ["singing bowl", 9.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 64.51], ["theremin", 7.06], ["didgeridoo", 2.84]], null, null, null], "duration": [0.22, 2.1, 1.59, 1.7, 0.11, 4.45, 2.89, 2.09, 2.22, 1.09, 0.18, 0.41, 0.96, 2.83, 0.74, 0.64, 1.12, 0.11, 1.14, 1.89, 1.93, 0.61, 1.83, 0.61, 1.27, 1.41, 1.37, 1.35, -0.18, -0.18, 0.67, 0.3, 3.4, 0.8, 1.33, 0.61]} \ No newline at end of file diff --git a/annotations_1/ngLX1uDh-eg_filtered.json b/annotations_1/ngLX1uDh-eg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9bae35ea95a4572fae153321520bc698ec5fc86 --- /dev/null +++ b/annotations_1/ngLX1uDh-eg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.45], [12.0, 13.85], [16.0, 17.27], [18.0, 19.21], [21.0, 50.53], [55.0, 56.02], [65.0, 66.66], [68.0, 69.84], [73.0, 73.67], [80.0, 81.8], [83.0, 83.13], [85.0, 84.87], [93.0, 94.05], [98.0, 99.59], [101.0, 108.99], [110.0, 111.01], [116.0, 116.46], [119.0, 120.18], [120.0, 120.23], [120.0, 122.45], [125.0, 125.68], [131.0, 131.52], [135.0, 135.11], [140.0, 139.75], [154.0, 169.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.97, 0.0, 0.0, 0.0, 0.0, 37.82, 0.0, 0.0, 0.0, 0.0, 36.78], "audiomae_on_audioset": [null, null, null, null, [["music", 71.93], ["electronic music", 3.43], ["drum and bass", 3.4]], null, null, null, null, null, null, null, null, null, [["music", 47.98], ["synthesizer", 22.54], ["keyboard (musical)", 4.39]], null, null, null, null, [["music", 53.58], ["musical instrument", 4.95], ["synthesizer", 4.0]], null, null, null, null, [["music", 55.79], ["didgeridoo", 7.98], ["singing", 3.91]]], "duration": [0.45, 1.85, 1.27, 1.21, 29.53, 1.02, 1.66, 1.84, 0.67, 1.8, 0.13, -0.13, 1.05, 1.59, 7.99, 1.01, 0.46, 1.18, 0.23, 2.45, 0.68, 0.52, 0.11, -0.25, 15.3]} \ No newline at end of file diff --git a/annotations_1/ngRthItc3Yc_filtered.json b/annotations_1/ngRthItc3Yc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bdecbca0080fc7088946684bd6d5d4c45cc4ecf --- /dev/null +++ b/annotations_1/ngRthItc3Yc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 131.67], [141.0, 143.99], [145.0, 146.11], [146.0, 153.15], [155.0, 155.68], [157.0, 157.74]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 31.52, 0.0, 30.82, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 21.8], ["music", 18.99], ["throbbing", 11.68]], null, [["hum", 41.79], ["throbbing", 24.0], ["music", 12.97]], null, null], "duration": [128.67, 2.99, 1.11, 7.15, 0.68, 0.74]} \ No newline at end of file diff --git a/annotations_1/ngSM_wxh0lE_filtered.json b/annotations_1/ngSM_wxh0lE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..063d1350ff13e74f08aa7c41e8ef59cc6cb7d20a --- /dev/null +++ b/annotations_1/ngSM_wxh0lE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 57.55], [79.0, 79.57], [82.0, 83.13], [94.0, 94.68]], "keep_status": [true, false, false, false], "silence_prob": [31.71, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 56.83], ["crowd", 10.08], ["speech", 2.24]], null, null, null], "duration": [16.55, 0.57, 1.13, 0.68]} \ No newline at end of file diff --git a/annotations_1/ngdsRt31sIc_filtered.json b/annotations_1/ngdsRt31sIc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88a973ddf842aff8aa106d0eb401607144c37245 --- /dev/null +++ b/annotations_1/ngdsRt31sIc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.16], [13.0, 31.04], [31.0, 31.14], [31.0, 31.63], [33.0, 35.16], [37.0, 46.33], [48.0, 73.62], [77.0, 77.13], [78.0, 80.35], [82.0, 109.44], [113.0, 113.49], [114.0, 114.94], [116.0, 116.85]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [31.87, 33.54, 0.0, 0.0, 34.27, 30.48, 30.46, 0.0, 75.88, 31.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 47.82], ["music", 8.68], ["explosion", 6.18]], [["speech", 62.58], ["music", 5.48], ["electric shaver, electric razor", 4.81]], null, null, [["speech", 12.83], ["whip", 6.84], ["music", 6.58]], [["music", 47.62], ["speech", 19.76], ["didgeridoo", 15.13]], [["music", 55.79], ["hum", 5.45], ["throbbing", 4.28]], null, null, [["grunt", 68.52], ["music", 7.24], ["groan", 3.86]], null, null, null], "duration": [4.16, 18.04, 0.14, 0.63, 2.16, 9.33, 25.62, 0.13, 2.35, 27.44, 0.49, 0.94, 0.85]} \ No newline at end of file diff --git a/annotations_1/nhvRzLcCk40_filtered.json b/annotations_1/nhvRzLcCk40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..215d3e27547d75c8d888bd29c2ba2611d3d8814f --- /dev/null +++ b/annotations_1/nhvRzLcCk40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.95], [20.0, 24.63], [27.0, 60.67], [63.0, 78.53], [80.0, 112.83], [114.0, 116.43], [119.0, 126.52], [131.0, 175.09], [176.0, 176.1]], "keep_status": [false, false, false, true, false, true, true, false, false], "silence_prob": [57.17, 70.02, 0.0, 30.81, 0.0, 29.62, 33.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 19.88], ["cacophony", 9.74], ["explosion", 8.21]], null, [["music", 33.79], ["hum", 6.3], ["mains hum", 5.33]], [["music", 29.67], ["synthesizer", 18.96], ["hum", 8.56]], null, null], "duration": [4.95, 4.63, 33.67, 15.53, 32.83, 2.43, 7.52, 44.09, 0.1]} \ No newline at end of file diff --git a/annotations_1/nifcKdVjpbw_filtered.json b/annotations_1/nifcKdVjpbw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c8334439369637dc68fdea13c4ce49efdef3236 --- /dev/null +++ b/annotations_1/nifcKdVjpbw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.18], [10.0, 10.57], [23.0, 25.59], [27.0, 27.45], [29.0, 29.05], [36.0, 35.83], [44.0, 46.55], [50.0, 50.62], [52.0, 52.57], [53.0, 53.15], [57.0, 57.64], [59.0, 58.95], [61.0, 61.69], [63.0, 108.24], [115.0, 116.11], [116.0, 119.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.74], ["speech", 34.1], ["hum", 8.1]]], "duration": [0.18, 0.57, 2.59, 0.45, 0.05, -0.17, 2.55, 0.62, 0.57, 0.15, 0.64, -0.05, 0.69, 45.24, 1.11, 3.65]} \ No newline at end of file diff --git a/annotations_1/nixHRzTvCUE_filtered.json b/annotations_1/nixHRzTvCUE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7226b3fcfa28aa54a4f018561350c1f11dd82643 --- /dev/null +++ b/annotations_1/nixHRzTvCUE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 22.82], [24.0, 24.49], [27.0, 29.25], [33.0, 33.13], [35.0, 36.71], [38.0, 40.76], [42.0, 44.04], [44.0, 44.22], [44.0, 44.31], [44.0, 45.62], [46.0, 48.29], [49.0, 50.89], [52.0, 52.83], [54.0, 53.91], [58.0, 59.39], [60.0, 129.47], [129.0, 129.56], [130.0, 145.77], [149.0, 153.01], [156.0, 175.24]], "keep_status": [true, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true], "silence_prob": [31.9, 0.0, 35.02, 0.0, 0.0, 86.27, 46.68, 0.0, 0.0, 0.0, 33.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.02, 28.68, 30.7], "audiomae_on_audioset": [[["hum", 28.05], ["music", 9.44], ["mains hum", 6.24]], null, [["beatboxing", 10.27], ["gasp", 8.03], ["grunt", 7.83]], null, null, null, [["speech", 60.01], ["music", 16.93], ["radio", 3.36]], null, null, null, [["sound effect", 8.41], ["fly, housefly", 8.32], ["music", 7.12]], null, null, null, null, null, null, [["throbbing", 38.53], ["hum", 30.08], ["music", 12.56]], [["mains hum", 37.35], ["hum", 25.8], ["rumble", 4.92]], [["music", 45.38], ["hum", 10.13], ["mains hum", 5.85]]], "duration": [18.82, 0.49, 2.25, 0.13, 1.71, 2.76, 2.04, 0.22, 0.31, 1.62, 2.29, 1.89, 0.83, -0.09, 1.39, 69.47, 0.56, 15.77, 4.01, 19.24]} \ No newline at end of file diff --git a/annotations_1/njfu6wuNC_w_filtered.json b/annotations_1/njfu6wuNC_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5969abc120c5d1d3a705dc65dabeeba877e48851 --- /dev/null +++ b/annotations_1/njfu6wuNC_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.23], [5.0, 6.51], [8.0, 8.6], [11.0, 11.48], [12.0, 13.04], [14.0, 15.08], [19.0, 23.95], [25.0, 28.66], [29.0, 33.0], [34.0, 41.91], [44.0, 43.61], [44.0, 44.95], [47.0, 51.65], [54.0, 58.65], [61.0, 61.62], [63.0, 66.16], [67.0, 69.92], [71.0, 75.78], [78.0, 80.1], [82.0, 82.14], [83.0, 85.14], [88.0, 89.94], [92.0, 103.6], [104.0, 106.42], [107.0, 108.8], [110.0, 112.73], [113.0, 113.46], [116.0, 116.38], [128.0, 128.46], [133.0, 133.73], [137.0, 137.29]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [57.01, 0.0, 0.0, 0.0, 0.0, 0.0, 42.02, 42.39, 36.73, 37.47, 0.0, 0.0, 35.85, 41.3, 0.0, 37.44, 47.82, 47.78, 62.37, 0.0, 51.02, 0.0, 43.4, 35.12, 0.0, 39.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 25.1], ["speech", 20.89], ["mains hum", 14.68]], [["hum", 45.03], ["mains hum", 37.99], ["music", 4.4]], [["speech", 32.54], ["mains hum", 32.26], ["hum", 19.34]], [["hum", 43.62], ["mains hum", 27.24], ["throbbing", 3.85]], null, null, [["speech", 45.23], ["hum", 26.02], ["mains hum", 8.98]], [["hum", 21.51], ["mains hum", 7.66], ["vehicle", 5.4]], null, [["mains hum", 34.78], ["hum", 32.13], ["music", 8.71]], [["hum", 16.39], ["mains hum", 7.97], ["vehicle", 5.81]], [["hum", 13.36], ["vehicle", 8.85], ["mains hum", 6.33]], null, null, null, null, [["hum", 44.26], ["mains hum", 32.43], ["whale vocalization", 8.76]], [["hum", 45.87], ["mains hum", 39.09], ["throbbing", 3.83]], null, [["mains hum", 49.74], ["hum", 37.84], ["throbbing", 1.54]], null, null, null, null, null], "duration": [2.23, 1.51, 0.6, 0.48, 1.04, 1.08, 4.95, 3.66, 4.0, 7.91, -0.39, 0.95, 4.65, 4.65, 0.62, 3.16, 2.92, 4.78, 2.1, 0.14, 2.14, 1.94, 11.6, 2.42, 1.8, 2.73, 0.46, 0.38, 0.46, 0.73, 0.29]} \ No newline at end of file diff --git a/annotations_1/njnCT6sD1Bk_filtered.json b/annotations_1/njnCT6sD1Bk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..680ad3efff3b1dc2daa19cd5ed62956d2f2e3256 --- /dev/null +++ b/annotations_1/njnCT6sD1Bk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.72], [7.0, 10.99], [12.0, 12.78], [17.0, 17.9], [18.0, 19.2], [21.0, 21.59], [25.0, 25.95], [30.0, 37.07], [39.0, 39.43], [41.0, 41.67], [43.0, 45.0], [49.0, 51.66], [53.0, 56.24], [58.0, 58.46]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, true, false], "silence_prob": [39.74, 39.63, 0.0, 0.0, 0.0, 0.0, 0.0, 36.34, 0.0, 0.0, 52.56, 30.8, 31.58, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 41.87], ["moo", 35.17], ["livestock, farm animals, working animals", 18.32]], [["speech", 54.84], ["music", 19.07], ["hum", 3.76]], null, null, null, null, null, [["speech", 16.48], ["music", 14.54], ["fly, housefly", 6.57]], null, null, null, [["whale vocalization", 48.8], ["music", 7.26], ["vehicle", 3.92]], [["speech", 29.28], ["music", 12.38], ["vehicle", 4.83]], null], "duration": [2.72, 3.99, 0.78, 0.9, 1.2, 0.59, 0.95, 7.07, 0.43, 0.67, 2.0, 2.66, 3.24, 0.46]} \ No newline at end of file diff --git a/annotations_1/njq3H2iy2X0_filtered.json b/annotations_1/njq3H2iy2X0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9323f50b976120dc3e6c3e2550a7cecab38884d --- /dev/null +++ b/annotations_1/njq3H2iy2X0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.48], [6.0, 7.32], [8.0, 8.21], [16.0, 17.32], [31.0, 31.29], [40.0, 45.22], [47.0, 48.57], [49.0, 50.62], [58.0, 61.48], [81.0, 81.57], [83.0, 83.59], [85.0, 85.75], [87.0, 87.24], [100.0, 101.46], [104.0, 105.73], [110.0, 110.35], [117.0, 118.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 59.42, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.48, 1.32, 0.21, 1.32, 0.29, 5.22, 1.57, 1.62, 3.48, 0.57, 0.59, 0.75, 0.24, 1.46, 1.73, 0.35, 1.12]} \ No newline at end of file diff --git a/annotations_1/njz1p35e_EU_filtered.json b/annotations_1/njz1p35e_EU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a13359b0f51e5d7226559bd999fe2871677dcea8 --- /dev/null +++ b/annotations_1/njz1p35e_EU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.67], [11.0, 11.42], [24.0, 30.0], [33.0, 32.91], [36.0, 43.14], [43.0, 43.92], [44.0, 57.52], [70.0, 71.78], [75.0, 97.24], [99.0, 108.87], [111.0, 132.39], [132.0, 132.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.24, 0.0, 31.69, 0.0, 31.28, 0.0, 29.94, 29.79, 50.16, 0.0], "audiomae_on_audioset": [null, null, [["music", 76.17], ["theremin", 6.39], ["musical instrument", 4.25]], null, [["speech", 43.97], ["music", 17.29], ["sidetone", 14.87]], null, [["music", 45.4], ["speech", 26.66], ["musical instrument", 2.66]], null, [["music", 41.32], ["gong", 24.64], ["theremin", 9.74]], [["music", 54.32], ["theremin", 27.69], ["musical instrument", 7.08]], null, null], "duration": [1.67, 0.42, 6.0, -0.09, 7.14, 0.92, 13.52, 1.78, 22.24, 9.87, 21.39, 0.53]} \ No newline at end of file diff --git a/annotations_1/nkuKrymtuCg_filtered.json b/annotations_1/nkuKrymtuCg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..863ef5108e83d2184491896c57e988b26a9f633a --- /dev/null +++ b/annotations_1/nkuKrymtuCg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.28], [12.0, 33.4], [34.0, 35.09], [37.0, 37.76], [40.0, 48.24], [49.0, 52.42], [54.0, 54.87], [55.0, 59.17], [60.0, 94.44], [96.0, 100.11], [102.0, 103.17]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [75.23, 33.91, 0.0, 0.0, 99.8, 99.31, 0.0, 78.04, 0.0, 29.48, 0.0], "audiomae_on_audioset": [null, [["breaking", 38.56], ["glass", 6.61], ["boing", 4.54]], null, null, null, null, null, null, null, [["music", 41.88], ["carnatic music", 15.81], ["musical instrument", 7.35]], null], "duration": [9.28, 21.4, 1.09, 0.76, 8.24, 3.42, 0.87, 4.17, 34.44, 4.11, 1.17]} \ No newline at end of file diff --git a/annotations_1/nlJqcYb65o0_filtered.json b/annotations_1/nlJqcYb65o0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d119775aae6df2c60025fdecd3ba032a0e5b2a9 --- /dev/null +++ b/annotations_1/nlJqcYb65o0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[102.0, 136.32], [139.0, 146.65]], "keep_status": [false, true], "silence_prob": [0.0, 32.0], "audiomae_on_audioset": [null, [["music", 48.25], ["speech", 5.68], ["vehicle", 5.0]]], "duration": [34.32, 7.65]} \ No newline at end of file diff --git a/annotations_1/nm86_ZWeUzk_filtered.json b/annotations_1/nm86_ZWeUzk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea59904c509fd5005a1c7376a6fc9f1eaa1716c2 --- /dev/null +++ b/annotations_1/nm86_ZWeUzk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.65], [6.0, 13.02], [13.0, 13.63], [18.0, 22.49], [30.0, 40.14], [45.0, 49.18], [54.0, 60.76], [61.0, 76.32], [85.0, 87.34], [91.0, 96.01], [102.0, 103.25], [107.0, 107.5], [108.0, 108.73], [110.0, 110.29], [122.0, 130.94], [135.0, 135.67], [139.0, 139.4], [139.0, 144.63]], "keep_status": [false, false, false, true, true, true, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 29.12, 0.0, 28.63, 28.66, 34.38, 28.65, 31.97, 36.04, 29.69, 0.0, 0.0, 0.0, 0.0, 28.54, 0.0, 0.0, 28.17], "audiomae_on_audioset": [null, [["mains hum", 36.13], ["hum", 25.19], ["speech", 11.62]], null, [["breaking", 28.92], ["music", 17.03], ["speech", 10.81]], [["music", 48.29], ["cowbell", 5.21], ["thump, thud", 3.55]], [["music", 32.01], ["throbbing", 19.13], ["speech", 14.06]], [["sidetone", 45.08], ["music", 18.7], ["throbbing", 8.59]], [["speech", 37.4], ["music", 37.09], ["didgeridoo", 11.96]], [["speech", 43.2], ["music", 23.02], ["throbbing", 4.25]], [["music", 31.12], ["throbbing", 18.08], ["hum", 11.19]], null, null, null, null, [["explosion", 33.7], ["burst, pop", 8.03], ["smash, crash", 7.51]], null, null, [["speech", 79.61], ["music", 6.24], ["vehicle", 1.75]]], "duration": [0.65, 7.02, 0.63, 4.49, 10.14, 4.18, 6.76, 15.32, 2.34, 5.01, 1.25, 0.5, 0.73, 0.29, 8.94, 0.67, 0.4, 5.63]} \ No newline at end of file diff --git a/annotations_1/nma6daFY6b0_filtered.json b/annotations_1/nma6daFY6b0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..258775f7466f58bfb43a834ce84838160f3ef987 --- /dev/null +++ b/annotations_1/nma6daFY6b0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.79], [5.0, 6.52], [9.0, 9.19], [12.0, 12.29], [13.0, 13.68], [15.0, 16.56], [18.0, 18.5], [20.0, 22.99], [24.0, 29.54], [30.0, 31.06], [36.0, 36.14], [38.0, 38.67], [40.0, 41.05], [43.0, 44.27], [46.0, 47.66], [52.0, 52.54], [55.0, 62.02], [65.0, 66.45], [75.0, 75.78], [77.0, 77.21], [78.0, 87.54], [88.0, 130.35]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.79, 48.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.4, 0.0, 0.0, 0.0, 34.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["throbbing", 32.75], ["hum", 20.64], ["music", 7.06]], [["music", 37.17], ["hum", 12.33], ["electronic music", 9.28]], null, null, null, null, null, null, null, [["throbbing", 52.22], ["hum", 25.49], ["music", 9.36]], null, null, null, [["breaking", 37.95], ["hum", 19.2], ["music", 8.72]], null], "duration": [0.79, 1.52, 0.19, 0.29, 0.68, 1.56, 0.5, 2.99, 5.54, 1.06, 0.14, 0.67, 1.05, 1.27, 1.66, 0.54, 7.02, 1.45, 0.78, 0.21, 9.54, 42.35]} \ No newline at end of file diff --git a/annotations_1/nmaCobIvt2w_filtered.json b/annotations_1/nmaCobIvt2w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ede4a7d56b578ca903b7fa3488dfb55a9f66bf3 --- /dev/null +++ b/annotations_1/nmaCobIvt2w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.94], [10.0, 11.6], [14.0, 15.94], [28.0, 38.31], [44.0, 45.25], [48.0, 48.12], [51.0, 55.43], [58.0, 58.14], [68.0, 68.23], [71.0, 70.7], [73.0, 73.57], [77.0, 81.04], [82.0, 91.83], [103.0, 106.1], [111.0, 135.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 32.48, 0.0, 0.0, 31.85, 0.0, 0.0, 0.0, 0.0, 35.33, 33.7, 38.56, 31.15], "audiomae_on_audioset": [null, null, null, [["music", 64.98], ["electronic music", 8.24], ["trance music", 7.38]], null, null, [["music", 47.78], ["throbbing", 15.77], ["trance music", 10.38]], null, null, null, null, [["music", 61.55], ["speech", 22.48], ["electronic music", 3.2]], [["music", 72.72], ["throbbing", 8.98], ["hum", 6.23]], [["music", 43.1], ["sidetone", 6.52], ["throbbing", 6.19]], [["music", 53.46], ["speech", 4.81], ["throbbing", 4.36]]], "duration": [-0.06, 1.6, 1.94, 10.31, 1.25, 0.12, 4.43, 0.14, 0.23, -0.3, 0.57, 4.04, 9.83, 3.1, 24.57]} \ No newline at end of file diff --git a/annotations_1/no7XR7s8Z7o_filtered.json b/annotations_1/no7XR7s8Z7o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1c2d989e634b0be67a60303a65b416e7f25238e --- /dev/null +++ b/annotations_1/no7XR7s8Z7o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 12.26], [13.0, 53.91]], "keep_status": [false, false], "silence_prob": [30.56, 0.0], "audiomae_on_audioset": [[["music", 77.92], ["skidding", 3.4], ["synthesizer", 3.19]], null], "duration": [11.26, 40.91]} \ No newline at end of file diff --git a/annotations_1/notFMAwEQeM_filtered.json b/annotations_1/notFMAwEQeM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21fcf38e4f69d20056801644a7ace57128b7abff --- /dev/null +++ b/annotations_1/notFMAwEQeM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.54], [10.0, 11.4], [13.0, 17.51], [41.0, 42.35], [49.0, 62.29], [72.0, 71.95], [75.0, 79.37], [89.0, 90.05], [93.0, 93.28], [95.0, 95.67], [100.0, 102.68], [105.0, 107.86], [110.0, 123.69], [128.0, 161.81], [165.0, 165.32], [167.0, 167.22], [169.0, 193.08], [195.0, 195.18], [199.0, 200.01], [201.0, 229.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.8, 0.0, 31.53, 0.0, 37.4, 0.0, 0.0, 0.0, 32.3, 29.43, 29.13, 0.0, 0.0, 0.0, 28.51, 0.0, 0.0, 30.45], "audiomae_on_audioset": [null, null, [["music", 67.02], ["throbbing", 14.08], ["hum", 5.89]], null, [["music", 76.75], ["carnatic music", 4.33], ["musical instrument", 2.88]], null, [["music", 50.9], ["throbbing", 14.82], ["hum", 5.06]], null, null, null, [["hum", 20.94], ["mains hum", 18.94], ["rumble", 11.5]], [["speech", 23.88], ["buzz", 10.25], ["vehicle", 7.13]], [["buzz", 43.65], ["music", 18.1], ["electric shaver, electric razor", 7.11]], null, null, null, [["music", 58.46], ["throbbing", 10.34], ["buzz", 7.36]], null, null, [["music", 67.12], ["scary music", 22.92], ["speech", 3.68]]], "duration": [0.54, 1.4, 4.51, 1.35, 13.29, -0.05, 4.37, 1.05, 0.28, 0.67, 2.68, 2.86, 13.69, 33.81, 0.32, 0.22, 24.08, 0.18, 1.01, 28.78]} \ No newline at end of file diff --git a/annotations_1/npSYPN8LXas_filtered.json b/annotations_1/npSYPN8LXas_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12d09db5fe03e49074c22e34051e01e16c837011 --- /dev/null +++ b/annotations_1/npSYPN8LXas_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.14], [9.0, 10.13], [13.0, 13.49], [15.0, 14.96], [39.0, 39.8], [49.0, 50.08], [51.0, 51.44], [53.0, 53.05], [54.0, 55.19], [59.0, 60.32], [61.0, 61.64], [65.0, 65.58], [68.0, 68.61], [75.0, 76.15], [77.0, 77.79], [78.0, 78.39], [82.0, 82.71], [88.0, 88.77], [105.0, 106.42], [108.0, 108.65], [109.0, 110.02], [111.0, 111.54], [114.0, 115.53], [118.0, 118.03], [122.0, 122.66], [162.0, 162.73], [164.0, 164.86], [167.0, 168.12]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["fly, housefly", 34.37], ["insect", 15.49], ["mosquito", 7.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.14, 1.13, 0.49, -0.04, 0.8, 1.08, 0.44, 0.05, 1.19, 1.32, 0.64, 0.58, 0.61, 1.15, 0.79, 0.39, 0.71, 0.77, 1.42, 0.65, 1.02, 0.54, 1.53, 0.03, 0.66, 0.73, 0.86, 1.12]} \ No newline at end of file diff --git a/annotations_1/npaLKZ0Egus_filtered.json b/annotations_1/npaLKZ0Egus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..575f5e133d6ad7d838a2b65c146a3b725a48524f --- /dev/null +++ b/annotations_1/npaLKZ0Egus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 31.31], [32.0, 33.08], [36.0, 39.06], [43.0, 51.0], [52.0, 52.91], [54.0, 70.23], [71.0, 100.36], [103.0, 127.04], [129.0, 168.39], [169.0, 178.04], [182.0, 181.79], [182.0, 182.44], [187.0, 188.6]], "keep_status": [true, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [30.03, 0.0, 31.65, 30.57, 0.0, 29.13, 29.04, 29.17, 0.0, 33.59, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 53.78], ["didgeridoo", 7.73], ["frog", 4.49]], null, [["music", 33.52], ["throbbing", 16.31], ["hum", 6.91]], [["music", 54.08], ["throbbing", 9.42], ["quack", 5.67]], null, [["speech", 38.02], ["music", 36.41], ["animal", 4.71]], [["music", 40.26], ["speech", 29.8], ["throbbing", 8.82]], [["music", 45.85], ["throbbing", 13.4], ["hum", 4.88]], null, [["speech", 56.06], ["music", 19.6], ["theremin", 3.06]], null, null, null], "duration": [6.31, 1.08, 3.06, 8.0, 0.91, 16.23, 29.36, 24.04, 39.39, 9.04, -0.21, 0.44, 1.6]} \ No newline at end of file diff --git a/annotations_1/npkzgnKAgXU_filtered.json b/annotations_1/npkzgnKAgXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fdf5c7d8fe3b7ef925bec66b788993dbaafa3c42 --- /dev/null +++ b/annotations_1/npkzgnKAgXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.05], [5.0, 6.99], [8.0, 9.19], [15.0, 24.63], [25.0, 32.95], [36.0, 39.63], [42.0, 61.7], [63.0, 71.31], [72.0, 71.96], [72.0, 78.75], [79.0, 80.23], [81.0, 82.17], [83.0, 87.52], [88.0, 88.64], [89.0, 89.31], [92.0, 95.1], [100.0, 106.91], [110.0, 111.2], [113.0, 113.49], [115.0, 117.53], [119.0, 128.82]], "keep_status": [false, false, false, false, true, true, false, true, false, false, false, false, true, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 29.8, 29.74, 30.48, 29.7, 30.75, 0.0, 30.53, 0.0, 0.0, 30.02, 0.0, 0.0, 29.66, 29.6, 0.0, 0.0, 30.17, 29.65], "audiomae_on_audioset": [null, null, null, [["speech", 43.2], ["music", 29.82], ["sidetone", 3.16]], [["music", 17.82], ["cattle, bovinae", 13.06], ["livestock, farm animals, working animals", 12.22]], [["music", 42.39], ["speech", 17.98], ["hum", 5.74]], [["music", 41.81], ["speech", 27.82], ["throbbing", 7.11]], [["music", 51.58], ["whack, thwack", 8.07], ["throbbing", 6.92]], null, [["music", 42.32], ["speech", 24.48], ["hum", 8.33]], null, null, [["music", 42.9], ["speech", 13.28], ["didgeridoo", 7.23]], null, null, [["music", 19.69], ["speech", 10.32], ["hum", 9.98]], [["music", 28.87], ["throbbing", 21.01], ["hum", 13.83]], null, null, [["music", 35.05], ["electronic music", 17.02], ["hum", 12.34]], [["music", 70.74], ["musical instrument", 3.53], ["smash, crash", 2.08]]], "duration": [1.05, 1.99, 1.19, 9.63, 7.95, 3.63, 19.7, 8.31, -0.04, 6.75, 1.23, 1.17, 4.52, 0.64, 0.31, 3.1, 6.91, 1.2, 0.49, 2.53, 9.82]} \ No newline at end of file diff --git a/annotations_1/nprJvYKz3QQ_filtered.json b/annotations_1/nprJvYKz3QQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b023c454c149b224e7ee893c5742925b5bc1c347 --- /dev/null +++ b/annotations_1/nprJvYKz3QQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.12], [15.0, 15.03], [15.0, 15.06], [15.0, 16.5], [25.0, 25.0], [26.0, 26.13], [28.0, 28.14], [30.0, 30.96], [33.0, 33.67], [35.0, 35.38], [37.0, 37.39], [41.0, 40.93], [42.0, 42.63], [44.0, 44.0], [49.0, 49.4], [52.0, 55.98], [56.0, 56.73], [57.0, 74.58], [76.0, 75.96], [77.0, 78.41], [79.0, 81.28], [82.0, 82.83], [83.0, 83.64], [84.0, 84.74], [86.0, 92.13], [92.0, 99.27], [100.0, 100.45], [101.0, 101.55], [107.0, 108.48], [109.0, 109.53], [110.0, 111.91], [114.0, 115.94], [116.0, 117.56], [118.0, 118.69], [120.0, 123.4], [124.0, 125.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.16, 0.0, 36.45, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 85.72, 87.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 22.96], ["speech", 22.7], ["hum", 16.91]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 0.03, 0.06, 1.5, 0.0, 0.13, 0.14, 0.96, 0.67, 0.38, 0.39, -0.07, 0.63, 0.0, 0.4, 3.98, 0.73, 17.58, -0.04, 1.41, 2.28, 0.83, 0.64, 0.74, 6.13, 7.27, 0.45, 0.55, 1.48, 0.53, 1.91, 1.94, 1.56, 0.69, 3.4, 1.95]} \ No newline at end of file diff --git a/annotations_1/npvFfvyT8Pc_filtered.json b/annotations_1/npvFfvyT8Pc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c94d6ba65e14939e6324f229cd940e0ec9b24a3 --- /dev/null +++ b/annotations_1/npvFfvyT8Pc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.13], [7.0, 7.75], [8.0, 9.02], [10.0, 11.08], [14.0, 15.23], [16.0, 17.61], [22.0, 22.65], [24.0, 27.11], [29.0, 30.01], [32.0, 32.0], [34.0, 34.21], [35.0, 36.61], [37.0, 38.31], [41.0, 41.62], [42.0, 43.21], [47.0, 47.7], [53.0, 53.13], [55.0, 55.12], [58.0, 58.46], [61.0, 61.3], [65.0, 66.02], [68.0, 69.03], [70.0, 71.54], [73.0, 73.8], [75.0, 76.69], [80.0, 79.98], [83.0, 84.25], [85.0, 86.48]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 32.13], ["hum", 15.98], ["mains hum", 14.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.13, 0.75, 1.02, 1.08, 1.23, 1.61, 0.65, 3.11, 1.01, 0.0, 0.21, 1.61, 1.31, 0.62, 1.21, 0.7, 0.13, 0.12, 0.46, 0.3, 1.02, 1.03, 1.54, 0.8, 1.69, -0.02, 1.25, 1.48]} \ No newline at end of file diff --git a/annotations_1/nqEL7fP4Rvs_filtered.json b/annotations_1/nqEL7fP4Rvs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8463c25562e40fcaf738b59032f91c00045ed3b4 --- /dev/null +++ b/annotations_1/nqEL7fP4Rvs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 54.75], [57.0, 66.5]], "keep_status": [false, true], "silence_prob": [0.0, 28.35], "audiomae_on_audioset": [null, [["speech", 46.45], ["music", 14.25], ["explosion", 4.45]]], "duration": [44.75, 9.5]} \ No newline at end of file diff --git a/annotations_1/nqF0yFLjiXs_filtered.json b/annotations_1/nqF0yFLjiXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f4c0cfc3c02a361aac384b248c9d7a9d431b3c1 --- /dev/null +++ b/annotations_1/nqF0yFLjiXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.84], [13.0, 14.01], [15.0, 17.32], [17.0, 17.49], [18.0, 17.52], [18.0, 23.79], [24.0, 29.0], [31.0, 30.99], [32.0, 73.31], [75.0, 85.8], [90.0, 92.15], [102.0, 109.65], [112.0, 113.26], [122.0, 133.95], [134.0, 135.62], [137.0, 139.04]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 72.6, 0.0, 0.0, 37.35, 76.04, 0.0, 0.0, 44.09, 35.27, 36.15, 0.0, 30.6, 0.0, 34.64], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 21.42], ["noise", 14.75], ["mains hum", 10.0]], null, null, null, [["speech", 28.47], ["fart", 14.76], ["whale vocalization", 12.78]], [["whale vocalization", 30.31], ["mains hum", 26.95], ["hum", 17.55]], [["hum", 27.35], ["mains hum", 9.81], ["clang", 7.94]], null, [["music", 57.73], ["carnatic music", 9.29], ["musical instrument", 4.33]], null, [["music", 40.81], ["theremin", 4.2], ["musical instrument", 3.45]]], "duration": [-0.16, 1.01, 2.32, 0.49, -0.48, 5.79, 5.0, -0.01, 41.31, 10.8, 2.15, 7.65, 1.26, 11.95, 1.62, 2.04]} \ No newline at end of file diff --git a/annotations_1/nqK7Kk3ZKvY_filtered.json b/annotations_1/nqK7Kk3ZKvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b23995110dfb14c6972e45637b4fa29ed00257c4 --- /dev/null +++ b/annotations_1/nqK7Kk3ZKvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[101.0, 106.54], [107.0, 108.26], [111.0, 115.89]], "keep_status": [false, false, false], "silence_prob": [79.59, 0.0, 67.63], "audiomae_on_audioset": [null, null, null], "duration": [5.54, 1.26, 4.89]} \ No newline at end of file diff --git a/annotations_1/nqzkyfeS2Oo_filtered.json b/annotations_1/nqzkyfeS2Oo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a926665100d94556dae505f8f3d3a683f1fc1183 --- /dev/null +++ b/annotations_1/nqzkyfeS2Oo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.92], [24.0, 29.64], [30.0, 30.92], [32.0, 32.93], [36.0, 38.72], [43.0, 44.17], [45.0, 46.84], [49.0, 53.37], [54.0, 54.87], [56.0, 56.78], [58.0, 59.36], [61.0, 61.7], [62.0, 63.49], [64.0, 71.95], [73.0, 85.99], [88.0, 97.34], [99.0, 99.28], [100.0, 100.62], [102.0, 102.42], [104.0, 111.2], [111.0, 127.79], [129.0, 129.39], [131.0, 131.77], [133.0, 151.21], [152.0, 153.6], [156.0, 156.25], [158.0, 158.45], [160.0, 165.5], [169.0, 171.66], [173.0, 173.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, true, true, false], "silence_prob": [52.98, 92.64, 0.0, 0.0, 56.78, 0.0, 0.0, 76.86, 0.0, 0.0, 0.0, 0.0, 0.0, 53.1, 29.67, 30.32, 0.0, 0.0, 0.0, 35.78, 31.32, 0.0, 0.0, 35.26, 0.0, 0.0, 0.0, 35.56, 44.96, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 26.17], ["music", 15.1], ["mains hum", 14.11]], [["music", 18.12], ["hum", 11.77], ["noise", 10.07]], null, null, null, [["speech", 42.81], ["hum", 25.35], ["mains hum", 9.84]], [["hum", 22.47], ["music", 17.57], ["throbbing", 8.54]], null, null, [["speech", 34.71], ["hum", 24.28], ["music", 17.01]], null, null, null, [["music", 23.12], ["speech", 21.71], ["sidetone", 18.62]], [["music", 33.48], ["hum", 14.59], ["ambient music", 6.9]], null], "duration": [5.92, 5.64, 0.92, 0.93, 2.72, 1.17, 1.84, 4.37, 0.87, 0.78, 1.36, 0.7, 1.49, 7.95, 12.99, 9.34, 0.28, 0.62, 0.42, 7.2, 16.79, 0.39, 0.77, 18.21, 1.6, 0.25, 0.45, 5.5, 2.66, 0.84]} \ No newline at end of file diff --git a/annotations_1/nr1sLngjJXQ_filtered.json b/annotations_1/nr1sLngjJXQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bc923938318c834e924aa7db5082fb3b6260616 --- /dev/null +++ b/annotations_1/nr1sLngjJXQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.61], [9.0, 23.67], [26.0, 80.45], [83.0, 83.47], [83.0, 83.51], [87.0, 146.57], [147.0, 167.91], [171.0, 175.71], [176.0, 177.28]], "keep_status": [true, false, false, false, false, false, true, true, false], "silence_prob": [31.71, 33.63, 0.0, 0.0, 0.0, 0.0, 30.71, 30.89, 0.0], "audiomae_on_audioset": [[["music", 30.49], ["smash, crash", 21.46], ["throbbing", 6.23]], [["music", 71.92], ["throbbing", 4.22], ["hum", 2.82]], null, null, null, null, [["music", 19.39], ["fart", 17.78], ["speech", 16.6]], [["music", 45.63], ["noise", 17.08], ["hum", 6.56]], null], "duration": [2.61, 14.67, 54.45, 0.47, 0.51, 59.57, 20.91, 4.71, 1.28]} \ No newline at end of file diff --git a/annotations_1/ns3j2exbdbU_filtered.json b/annotations_1/ns3j2exbdbU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fa9ea383513586863baeca79345ef03c60c1d5d --- /dev/null +++ b/annotations_1/ns3j2exbdbU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.34], [16.0, 16.33], [19.0, 19.8], [30.0, 32.24], [35.0, 34.86], [73.0, 74.21], [79.0, 80.23], [82.0, 83.98], [89.0, 91.13], [96.0, 121.74], [123.0, 128.93], [131.0, 132.04], [133.0, 133.52], [135.0, 137.27], [145.0, 146.33], [148.0, 149.23], [150.0, 151.5], [152.0, 152.52], [153.0, 153.84], [156.0, 163.38], [164.0, 170.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.95, 0.0, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 100.0, 99.99, 100.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 99.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.34, 0.33, 0.8, 2.24, -0.14, 1.21, 1.23, 1.98, 2.13, 25.74, 5.93, 1.04, 0.52, 2.27, 1.33, 1.23, 1.5, 0.52, 0.84, 7.38, 6.63]} \ No newline at end of file diff --git a/annotations_1/ns7B5fzH11c_filtered.json b/annotations_1/ns7B5fzH11c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c043b551088d4a409a022120806a210650a5e9a0 --- /dev/null +++ b/annotations_1/ns7B5fzH11c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.25], [21.0, 26.1], [31.0, 38.77], [40.0, 39.95], [40.0, 57.48], [59.0, 59.36], [62.0, 62.9], [63.0, 65.1], [67.0, 69.55], [71.0, 80.13]], "keep_status": [false, true, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 38.03, 46.05, 0.0, 38.7, 0.0, 0.0, 55.6, 45.08, 48.69], "audiomae_on_audioset": [null, [["speech", 45.98], ["music", 15.23], ["hum", 5.99]], [["speech", 20.38], ["mains hum", 17.64], ["music", 17.36]], null, [["music", 44.67], ["didgeridoo", 16.22], ["speech", 4.34]], null, null, null, [["didgeridoo", 79.69], ["music", 12.83], ["musical instrument", 1.43]], [["music", 24.37], ["speech", 19.67], ["fart", 18.01]]], "duration": [0.25, 5.1, 7.77, -0.05, 17.48, 0.36, 0.9, 2.1, 2.55, 9.13]} \ No newline at end of file diff --git a/annotations_1/ntKYG1LdbV8_filtered.json b/annotations_1/ntKYG1LdbV8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4911f6dd23e74d43dd67c41df81313f135c5d80f --- /dev/null +++ b/annotations_1/ntKYG1LdbV8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 32.05], [33.0, 34.65], [41.0, 41.79], [46.0, 46.21], [47.0, 48.57]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [1.05, 1.65, 0.79, 0.21, 1.57]} \ No newline at end of file diff --git a/annotations_1/ntirWguFrfM_filtered.json b/annotations_1/ntirWguFrfM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e43a3040777f911bd8e6192cf8fe0e0fed5007bd --- /dev/null +++ b/annotations_1/ntirWguFrfM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [4.0, 4.82], [8.0, 8.06], [10.0, 10.86], [13.0, 12.85], [27.0, 33.44], [40.0, 40.44], [45.0, 45.72], [46.0, 46.67], [77.0, 77.35], [80.0, 82.19], [84.0, 88.3], [90.0, 97.14], [99.0, 100.57], [107.0, 107.84], [110.0, 111.21], [115.0, 115.45], [121.0, 121.88], [123.0, 123.48], [125.0, 126.0], [134.0, 137.59], [143.0, 149.47], [152.0, 157.01], [161.0, 171.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 36.64, 0.0, 0.0, 0.0, 0.0, 94.52, 55.11, 82.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.43, 36.55, 35.18, 38.42], "audiomae_on_audioset": [null, null, null, null, null, [["livestock, farm animals, working animals", 41.26], ["cattle, bovinae", 21.27], ["moo", 16.62]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 18.84], ["cattle, bovinae", 8.3], ["moo", 8.24]], [["music", 48.32], ["whale vocalization", 17.09], ["howl", 4.55]], [["music", 40.95], ["speech", 8.45], ["explosion", 7.4]]], "duration": [0.43, 0.82, 0.06, 0.86, -0.15, 6.44, 0.44, 0.72, 0.67, 0.35, 2.19, 4.3, 7.14, 1.57, 0.84, 1.21, 0.45, 0.88, 0.48, 1.0, 3.59, 6.47, 5.01, 10.96]} \ No newline at end of file diff --git a/annotations_1/ntnqp7-SG7k_filtered.json b/annotations_1/ntnqp7-SG7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4c7e03785dd5bf070e0c2bf2b2d586f49215277 --- /dev/null +++ b/annotations_1/ntnqp7-SG7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.07], [6.0, 9.04], [11.0, 13.44], [14.0, 14.59], [16.0, 29.42], [31.0, 30.94], [32.0, 36.34], [37.0, 47.85], [49.0, 48.84], [50.0, 55.09], [56.0, 61.69], [65.0, 67.44], [68.0, 71.12], [73.0, 72.87], [74.0, 77.77], [79.0, 82.02], [83.0, 86.43], [87.0, 87.84], [89.0, 89.55], [91.0, 91.98], [93.0, 95.27], [96.0, 105.97], [107.0, 110.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.54, 80.64, 99.56, 0.0, 94.37, 0.0, 97.33, 89.01, 0.0, 96.89, 83.88, 74.13, 88.1, 0.0, 82.97, 94.95, 91.64, 0.0, 0.0, 0.0, 87.37, 90.6, 79.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.07, 3.04, 2.44, 0.59, 13.42, -0.06, 4.34, 10.85, -0.16, 5.09, 5.69, 2.44, 3.12, -0.13, 3.77, 3.02, 3.43, 0.84, 0.55, 0.98, 2.27, 9.97, 3.13]} \ No newline at end of file diff --git a/annotations_1/nudL_t9u78o_filtered.json b/annotations_1/nudL_t9u78o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38f0766aec91806cda192cf5242f2b0cdc6e212d --- /dev/null +++ b/annotations_1/nudL_t9u78o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.79], [11.0, 10.86], [11.0, 10.96], [11.0, 11.03], [11.0, 11.06], [11.0, 48.74], [58.0, 78.0], [80.0, 97.63], [100.0, 100.55], [101.0, 108.06], [108.0, 108.36], [108.0, 111.77], [114.0, 145.27], [146.0, 159.34], [160.0, 164.39], [169.0, 175.69], [176.0, 175.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.57, 33.49, 0.0, 34.35, 0.0, 28.99, 0.0, 43.35, 99.84, 31.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 60.56], ["mains hum", 15.18], ["music", 14.24]], [["whale vocalization", 37.45], ["music", 36.98], ["electronic music", 4.49]], null, [["hum", 45.9], ["mains hum", 24.97], ["music", 16.41]], null, [["music", 36.59], ["noise", 14.47], ["speech", 10.94]], null, [["music", 49.06], ["sonar", 9.34], ["singing bowl", 5.33]], null, [["music", 60.06], ["theremin", 5.86], ["hum", 4.66]], null], "duration": [-0.21, -0.14, -0.04, 0.03, 0.06, 37.74, 20.0, 17.63, 0.55, 7.06, 0.36, 3.77, 31.27, 13.34, 4.39, 6.69, -0.05]} \ No newline at end of file diff --git a/annotations_1/nvAZrrDwecI_filtered.json b/annotations_1/nvAZrrDwecI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45e4f6f850577c7531bf07becce518459a7c68fc --- /dev/null +++ b/annotations_1/nvAZrrDwecI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [8.0, 11.04], [12.0, 13.68], [15.0, 15.28], [19.0, 18.76], [29.0, 30.45], [31.0, 31.87], [35.0, 35.8], [39.0, 39.8], [41.0, 40.78], [43.0, 43.7], [46.0, 49.98], [51.0, 52.22], [57.0, 60.84], [61.0, 61.86], [65.0, 66.31], [67.0, 67.2], [73.0, 73.79], [78.0, 79.44], [84.0, 85.36], [86.0, 88.6], [90.0, 91.15], [92.0, 92.87], [96.0, 96.53], [97.0, 111.42], [113.0, 112.77], [113.0, 113.14], [114.0, 115.16], [115.0, 116.41], [116.0, 120.7], [124.0, 124.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.3, 0.0, 74.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 60.23, 0.0, 0.0, 0.0, 0.0, 48.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.61], ["music", 20.98], ["hum", 5.9]], null], "duration": [0.34, 3.04, 1.68, 0.28, -0.24, 1.45, 0.87, 0.8, 0.8, -0.22, 0.7, 3.98, 1.22, 3.84, 0.86, 1.31, 0.2, 0.79, 1.44, 1.36, 2.6, 1.15, 0.87, 0.53, 14.42, -0.23, 0.14, 1.16, 1.41, 4.7, 0.36]} \ No newline at end of file diff --git a/annotations_1/nvldRH4OC_k_filtered.json b/annotations_1/nvldRH4OC_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..294d914ae7669f49166eafb3e72c9344ba129a94 --- /dev/null +++ b/annotations_1/nvldRH4OC_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.64], [18.0, 18.4], [31.0, 37.18], [37.0, 54.45]], "keep_status": [false, false, true, false], "silence_prob": [31.85, 0.0, 29.63, 29.92], "audiomae_on_audioset": [[["music", 39.1], ["boing", 20.45], ["speech", 18.52]], null, [["hum", 34.87], ["music", 16.79], ["mains hum", 16.09]], [["speech", 39.32], ["music", 30.31], ["synthesizer", 6.86]]], "duration": [3.64, 0.4, 6.18, 17.45]} \ No newline at end of file diff --git a/annotations_1/nwrLvq5W58o_filtered.json b/annotations_1/nwrLvq5W58o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..808572335bb2c72fe6dc2b03f1e551609db15aaa --- /dev/null +++ b/annotations_1/nwrLvq5W58o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.62], [11.0, 16.28], [17.0, 16.97], [18.0, 18.84], [27.0, 27.18], [28.0, 33.91], [43.0, 43.97], [47.0, 48.36], [49.0, 48.59], [49.0, 49.0], [54.0, 55.8], [56.0, 57.91], [64.0, 64.3], [67.0, 68.28], [71.0, 109.93], [111.0, 112.36], [113.0, 134.38], [137.0, 137.44], [139.0, 139.38], [141.0, 143.85], [145.0, 145.49], [146.0, 149.49], [151.0, 155.31], [157.0, 161.42], [165.0, 165.11], [169.0, 169.59]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 29.43, 0.0, 0.0, 0.0, 32.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.63, 0.0, 0.0, 29.55, 0.0, 31.39, 30.88, 31.93, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 61.69], ["speech", 18.75], ["sound effect", 2.92]], null, null, null, [["music", 13.9], ["cattle, bovinae", 9.0], ["speech", 8.88]], null, null, null, null, null, null, null, null, null, null, [["music", 83.59], ["theremin", 2.47], ["scary music", 1.54]], null, null, [["music", 30.71], ["sound effect", 10.95], ["speech", 10.21]], null, [["music", 52.76], ["throbbing", 22.35], ["hum", 4.42]], [["whack, thwack", 32.93], ["music", 29.09], ["thunk", 6.15]], [["whack, thwack", 38.41], ["music", 24.84], ["fly, housefly", 7.26]], null, null], "duration": [0.62, 5.28, -0.03, 0.84, 0.18, 5.91, 0.97, 1.36, -0.41, 0.0, 1.8, 1.91, 0.3, 1.28, 38.93, 1.36, 21.38, 0.44, 0.38, 2.85, 0.49, 3.49, 4.31, 4.42, 0.11, 0.59]} \ No newline at end of file diff --git a/annotations_1/nwt-V8xfwkQ_filtered.json b/annotations_1/nwt-V8xfwkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ed540f1de616005525fd6350a859fb678a213cb --- /dev/null +++ b/annotations_1/nwt-V8xfwkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.83], [11.0, 12.06], [13.0, 60.89], [62.0, 62.48], [63.0, 77.94], [79.0, 108.43], [111.0, 124.55], [125.0, 155.61], [156.0, 156.63]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [32.3, 0.0, 0.0, 0.0, 29.5, 29.63, 30.73, 0.0, 0.0], "audiomae_on_audioset": [[["music", 75.46], ["hum", 7.12], ["throbbing", 3.44]], null, null, null, [["speech", 72.9], ["music", 6.87], ["outside, rural or natural", 2.46]], [["hum", 43.82], ["throbbing", 12.0], ["mains hum", 11.98]], [["whack, thwack", 46.34], ["speech", 14.85], ["whip", 12.59]], null, null], "duration": [2.83, 1.06, 47.89, 0.48, 14.94, 29.43, 13.55, 30.61, 0.63]} \ No newline at end of file diff --git a/annotations_1/nxc6kwBYFSM_filtered.json b/annotations_1/nxc6kwBYFSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b805fbb024b092425487d82e9929bbcfa8338e8 --- /dev/null +++ b/annotations_1/nxc6kwBYFSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 22.5], [40.0, 41.0], [42.0, 43.31], [43.0, 51.88], [60.0, 61.97], [69.0, 69.25], [74.0, 75.05], [76.0, 77.85], [83.0, 85.99], [98.0, 98.58], [101.0, 101.55], [105.0, 109.65], [113.0, 115.43], [116.0, 116.5], [126.0, 128.39]], "keep_status": [true, false, false, true, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [30.48, 0.0, 0.0, 31.5, 0.0, 0.0, 0.0, 0.0, 29.7, 0.0, 0.0, 29.54, 36.02, 0.0, 30.74], "audiomae_on_audioset": [[["whale vocalization", 58.02], ["livestock, farm animals, working animals", 4.71], ["moo", 2.64]], null, null, [["speech", 22.41], ["didgeridoo", 9.4], ["fart", 8.1]], null, null, null, null, [["groan", 14.35], ["whale vocalization", 13.34], ["screaming", 13.27]], null, null, [["speech", 49.34], ["groan", 10.42], ["screaming", 7.09]], [["cattle, bovinae", 46.21], ["livestock, farm animals, working animals", 26.15], ["moo", 14.46]], null, [["fart", 18.54], ["beatboxing", 11.65], ["groan", 8.27]]], "duration": [2.5, 1.0, 1.31, 8.88, 1.97, 0.25, 1.05, 1.85, 2.99, 0.58, 0.55, 4.65, 2.43, 0.5, 2.39]} \ No newline at end of file diff --git a/annotations_1/nxmaYsZjnXo_filtered.json b/annotations_1/nxmaYsZjnXo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c33e65509716dd26144b46c3fd2dee1b98652d8a --- /dev/null +++ b/annotations_1/nxmaYsZjnXo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.36], [9.0, 12.07], [14.0, 16.14], [16.0, 17.22], [21.0, 22.01], [24.0, 24.34], [25.0, 31.87], [35.0, 44.68], [49.0, 52.12], [56.0, 56.64], [58.0, 62.36], [64.0, 63.93], [65.0, 67.1], [68.0, 88.67], [91.0, 92.52], [95.0, 96.18], [98.0, 98.47], [99.0, 100.35], [101.0, 102.07], [103.0, 103.72], [105.0, 105.83], [107.0, 108.45], [110.0, 111.0], [114.0, 116.01], [120.0, 120.93], [122.0, 123.2], [125.0, 125.85], [128.0, 130.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.9, 98.1, 99.91, 0.0, 0.0, 0.0, 97.92, 99.05, 100.0, 0.0, 100.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.01, 0.0, 0.0, 0.0, 99.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.36, 3.07, 2.14, 1.22, 1.01, 0.34, 6.87, 9.68, 3.12, 0.64, 4.36, -0.07, 2.1, 20.67, 1.52, 1.18, 0.47, 1.35, 1.07, 0.72, 0.83, 1.45, 1.0, 2.01, 0.93, 1.2, 0.85, 2.06]} \ No newline at end of file diff --git a/annotations_1/o-6E3Hd2OW0_filtered.json b/annotations_1/o-6E3Hd2OW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee49ed42355364dde2ea14b4f8b69291e6052c1e --- /dev/null +++ b/annotations_1/o-6E3Hd2OW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 36.15], [37.0, 63.88], [68.0, 67.86], [75.0, 116.33], [118.0, 121.07], [126.0, 127.3], [128.0, 133.03]], "keep_status": [false, false, false, false, true, false, false], "silence_prob": [38.88, 37.03, 0.0, 0.0, 30.0, 0.0, 31.93], "audiomae_on_audioset": [[["music", 34.23], ["hum", 22.22], ["mains hum", 17.6]], [["hum", 43.11], ["music", 19.12], ["throbbing", 17.78]], null, null, [["explosion", 24.11], ["burst, pop", 11.95], ["whack, thwack", 9.87]], null, [["insect", 35.47], ["fly, housefly", 24.8], ["speech", 11.17]]], "duration": [6.15, 26.88, -0.14, 41.33, 3.07, 1.3, 5.03]} \ No newline at end of file diff --git a/annotations_1/o-OKsTWIVxk_filtered.json b/annotations_1/o-OKsTWIVxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..547062b6f0e71e0455a0fd50948eaa3443c24858 --- /dev/null +++ b/annotations_1/o-OKsTWIVxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.18], [12.0, 17.14], [19.0, 19.28], [34.0, 33.71], [34.0, 33.74], [37.0, 36.83], [47.0, 47.21], [49.0, 49.67], [61.0, 65.16], [69.0, 70.87], [73.0, 85.41], [86.0, 86.8], [100.0, 100.6], [101.0, 101.24], [103.0, 103.74], [105.0, 105.29], [114.0, 114.88], [117.0, 117.07], [126.0, 125.81], [129.0, 129.78], [141.0, 141.24], [142.0, 143.75], [144.0, 144.68], [151.0, 151.07]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.92, 0.0, 30.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 37.47], ["hum", 16.85], ["mains hum", 14.57]], null, null, null, null, null, null, [["sidetone", 37.03], ["music", 34.33], ["speech", 11.38]], null, [["music", 77.34], ["boing", 3.31], ["synthesizer", 3.23]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.18, 5.14, 0.28, -0.29, -0.26, -0.17, 0.21, 0.67, 4.16, 1.87, 12.41, 0.8, 0.6, 0.24, 0.74, 0.29, 0.88, 0.07, -0.19, 0.78, 0.24, 1.75, 0.68, 0.07]} \ No newline at end of file diff --git a/annotations_1/o-_ochO9CFQ_filtered.json b/annotations_1/o-_ochO9CFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eace1008a72ceae8fc77ac43d047f6c72ce5fb65 --- /dev/null +++ b/annotations_1/o-_ochO9CFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [3.0, 3.54], [16.0, 16.9], [27.0, 31.82], [33.0, 34.67], [36.0, 39.26], [42.0, 42.57], [44.0, 44.79], [46.0, 47.48], [49.0, 49.4], [54.0, 54.4], [56.0, 56.76], [58.0, 57.96], [60.0, 60.3], [61.0, 61.62], [62.0, 64.64], [65.0, 66.16], [70.0, 70.75], [71.0, 74.09], [76.0, 75.88], [76.0, 77.75], [81.0, 87.93], [89.0, 90.51], [92.0, 94.36], [95.0, 98.02], [99.0, 104.52], [106.0, 128.9], [130.0, 168.66], [170.0, 172.69], [176.0, 178.41], [179.0, 179.66], [181.0, 182.43], [184.0, 188.74], [191.0, 195.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.59, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.21, 0.0, 0.0, 99.05, 0.0, 0.0, 97.0, 0.0, 99.52, 99.21, 99.96, 94.95, 0.0, 88.28, 99.92, 0.0, 0.0, 81.89, 61.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.42, 0.54, 0.9, 4.82, 1.67, 3.26, 0.57, 0.79, 1.48, 0.4, 0.4, 0.76, -0.04, 0.3, 0.62, 2.64, 1.16, 0.75, 3.09, -0.12, 1.75, 6.93, 1.51, 2.36, 3.02, 5.52, 22.9, 38.66, 2.69, 2.41, 0.66, 1.43, 4.74, 4.13]} \ No newline at end of file diff --git a/annotations_1/o-cA_1F05bU_filtered.json b/annotations_1/o-cA_1F05bU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12acb35a878ca506bfaefcbb984e586cfee2c6da --- /dev/null +++ b/annotations_1/o-cA_1F05bU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.64], [5.0, 6.56], [8.0, 8.16], [10.0, 11.03], [12.0, 13.15], [14.0, 20.14], [21.0, 27.21], [29.0, 29.39], [32.0, 33.67], [35.0, 35.24], [38.0, 38.45], [44.0, 47.58], [49.0, 50.13], [54.0, 54.85], [56.0, 56.83], [58.0, 58.33], [60.0, 60.44], [62.0, 64.44], [66.0, 65.94], [67.0, 83.78], [84.0, 84.38], [86.0, 91.42], [92.0, 102.27], [103.0, 111.37], [122.0, 131.68], [140.0, 142.59]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 30.3, 0.0, 0.0, 0.0, 0.0, 61.37, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 54.23, 0.0, 52.45, 48.14, 31.95, 50.71, 91.3], "audiomae_on_audioset": [null, null, null, null, null, null, [["explosion", 29.28], ["burst, pop", 26.23], ["speech", 13.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.66], ["electric shaver, electric razor", 21.52], ["hum", 12.87]], [["speech", 29.08], ["explosion", 18.85], ["burst, pop", 9.34]], null, null], "duration": [1.64, 1.56, 0.16, 1.03, 1.15, 6.14, 6.21, 0.39, 1.67, 0.24, 0.45, 3.58, 1.13, 0.85, 0.83, 0.33, 0.44, 2.44, -0.06, 16.78, 0.38, 5.42, 10.27, 8.37, 9.68, 2.59]} \ No newline at end of file diff --git a/annotations_1/o-kmndqHfF0_filtered.json b/annotations_1/o-kmndqHfF0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..461273a30e4947570a3408b0b9ce0b6b5d9c4265 --- /dev/null +++ b/annotations_1/o-kmndqHfF0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [11.0, 10.98], [21.0, 21.98], [28.0, 28.44], [29.0, 30.37], [33.0, 33.32], [33.0, 33.37], [38.0, 40.2], [42.0, 47.63], [50.0, 51.0], [54.0, 54.77], [56.0, 56.42], [58.0, 59.39], [60.0, 62.83], [65.0, 64.96], [69.0, 69.82], [71.0, 71.81], [75.0, 75.22], [77.0, 77.25], [80.0, 80.87], [81.0, 81.9], [83.0, 86.81], [88.0, 89.04], [90.0, 90.44], [91.0, 92.47], [93.0, 93.58], [95.0, 96.48], [98.0, 100.99], [103.0, 104.3], [104.0, 105.16], [107.0, 109.0], [113.0, 113.68], [116.0, 122.32], [126.0, 129.73], [130.0, 130.5], [132.0, 132.49], [135.0, 136.19], [137.0, 140.76], [141.0, 143.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.36, 74.29, 0.0, 0.0, 0.0, 0.0, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 69.07, 0.0, 96.04, 50.71, 0.0, 0.0, 0.0, 96.54, 99.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 83.17], ["telephone", 2.61], ["inside, small room", 1.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, -0.02, 0.98, 0.44, 1.37, 0.32, 0.37, 2.2, 5.63, 1.0, 0.77, 0.42, 1.39, 2.83, -0.04, 0.82, 0.81, 0.22, 0.25, 0.87, 0.9, 3.81, 1.04, 0.44, 1.47, 0.58, 1.48, 2.99, 1.3, 1.16, 2.0, 0.68, 6.32, 3.73, 0.5, 0.49, 1.19, 3.76, 2.28]} \ No newline at end of file diff --git a/annotations_1/o1RMSG4bnrg_filtered.json b/annotations_1/o1RMSG4bnrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2b12149865c182d0cf0597075ebd189dca0092d --- /dev/null +++ b/annotations_1/o1RMSG4bnrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.16], [8.0, 8.67], [9.0, 11.74], [12.0, 13.27], [14.0, 15.31], [16.0, 16.75], [18.0, 20.46], [23.0, 23.19], [26.0, 27.03], [29.0, 31.04], [32.0, 32.63], [33.0, 34.35], [37.0, 38.69], [46.0, 47.95], [49.0, 49.17], [52.0, 53.72], [55.0, 56.3], [59.0, 60.59], [61.0, 66.45], [67.0, 68.74], [70.0, 70.75], [73.0, 74.33], [75.0, 75.68], [77.0, 77.41], [78.0, 79.24], [81.0, 83.86], [85.0, 85.53], [88.0, 87.78], [89.0, 90.1], [91.0, 91.88], [96.0, 96.26], [99.0, 99.08], [100.0, 100.82], [111.0, 112.72], [115.0, 117.29], [120.0, 123.31], [129.0, 133.41], [142.0, 153.67], [155.0, 154.99], [156.0, 156.57], [157.0, 157.82], [159.0, 159.16], [160.0, 160.78], [163.0, 163.09], [167.0, 167.88], [171.0, 171.21], [172.0, 171.96], [174.0, 174.75], [178.0, 178.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.02, 0.0, 0.0, 0.0, 97.11, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.37, 32.91, 30.81, 80.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 67.1], ["sidetone", 3.84], ["vehicle", 3.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.01], ["radio", 6.66], ["mains hum", 5.84]], null, null, null, null, null, null, null, null, null, [["gunshot, gunfire", 26.19], ["burst, pop", 8.82], ["explosion", 6.07]], [["noise", 7.91], ["firecracker", 7.65], ["gunshot, gunfire", 7.51]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.67, 2.74, 1.27, 1.31, 0.75, 2.46, 0.19, 1.03, 2.04, 0.63, 1.35, 1.69, 1.95, 0.17, 1.72, 1.3, 1.59, 5.45, 1.74, 0.75, 1.33, 0.68, 0.41, 1.24, 2.86, 0.53, -0.22, 1.1, 0.88, 0.26, 0.08, 0.82, 1.72, 2.29, 3.31, 4.41, 11.67, -0.01, 0.57, 0.82, 0.16, 0.78, 0.09, 0.88, 0.21, -0.04, 0.75, 0.17]} \ No newline at end of file diff --git a/annotations_1/o2wFqjb9AU0_filtered.json b/annotations_1/o2wFqjb9AU0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c13d767a25613527d4c962dd031c9e04e51f1078 --- /dev/null +++ b/annotations_1/o2wFqjb9AU0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 9.56], [11.0, 11.97], [14.0, 16.38], [17.0, 17.9], [21.0, 22.22], [23.0, 27.33], [30.0, 31.35], [33.0, 44.44], [46.0, 46.28], [47.0, 50.26], [51.0, 52.81], [56.0, 56.02], [60.0, 65.3], [67.0, 67.37], [74.0, 74.61], [76.0, 77.72], [78.0, 80.0], [88.0, 88.35], [95.0, 95.01], [96.0, 96.45], [97.0, 98.78], [100.0, 100.72], [102.0, 102.69], [106.0, 107.1], [112.0, 113.14], [114.0, 114.96], [116.0, 117.31], [119.0, 119.2], [120.0, 120.85], [123.0, 123.67], [130.0, 131.08], [133.0, 133.81], [136.0, 140.29], [141.0, 142.6], [143.0, 144.31], [146.0, 147.99], [149.0, 149.98], [151.0, 152.04], [153.0, 154.5], [157.0, 164.76], [166.0, 167.0], [168.0, 177.5], [178.0, 178.51]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [38.04, 0.0, 97.92, 0.0, 0.0, 97.0, 0.0, 63.31, 0.0, 63.21, 0.0, 0.0, 69.47, 0.0, 0.0, 0.0, 84.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.16, 0.0, 32.0, 0.0], "audiomae_on_audioset": [[["whale vocalization", 27.16], ["music", 19.08], ["crying, sobbing", 7.53]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 28.26], ["music", 20.29], ["mains hum", 14.98]], null], "duration": [6.56, 0.97, 2.38, 0.9, 1.22, 4.33, 1.35, 11.44, 0.28, 3.26, 1.81, 0.02, 5.3, 0.37, 0.61, 1.72, 2.0, 0.35, 0.01, 0.45, 1.78, 0.72, 0.69, 1.1, 1.14, 0.96, 1.31, 0.2, 0.85, 0.67, 1.08, 0.81, 4.29, 1.6, 1.31, 1.99, 0.98, 1.04, 1.5, 7.76, 1.0, 9.5, 0.51]} \ No newline at end of file diff --git a/annotations_1/o3ya6zEv3eM_filtered.json b/annotations_1/o3ya6zEv3eM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87edc9a5ce70cf14afbe10c47d80c85d2b3e5218 --- /dev/null +++ b/annotations_1/o3ya6zEv3eM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.84], [24.0, 43.8], [46.0, 93.77], [102.0, 114.67], [120.0, 120.28], [122.0, 121.8], [122.0, 122.76], [132.0, 132.71], [133.0, 150.5], [151.0, 151.56], [156.0, 158.16], [162.0, 161.65], [167.0, 167.36], [172.0, 172.94]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.85, 0.0, 30.26, 0.0, 0.0, 0.0, 0.0, 27.89, 0.0, 33.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 26.68], ["hum", 24.69], ["throbbing", 14.07]], null, [["music", 69.17], ["throbbing", 10.19], ["hum", 6.33]], null, null, null, null, [["music", 73.4], ["electronic music", 12.93], ["hum", 3.17]], null, [["radio", 33.81], ["speech", 30.59], ["sidetone", 25.38]], null, null, null], "duration": [0.84, 19.8, 47.77, 12.67, 0.28, -0.2, 0.76, 0.71, 17.5, 0.56, 2.16, -0.35, 0.36, 0.94]} \ No newline at end of file diff --git a/annotations_1/o4ARk91_ptU_filtered.json b/annotations_1/o4ARk91_ptU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b26ead05096d27237226c6d9aedcc8216b3de2e8 --- /dev/null +++ b/annotations_1/o4ARk91_ptU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.5], [6.0, 8.7], [9.0, 32.29], [36.0, 90.49], [92.0, 101.92], [103.0, 104.52]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 100.0, 37.39, 0.0, 44.49, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 49.74], ["speech", 26.12], ["fly, housefly", 3.07]], null, [["fart", 25.33], ["fly, housefly", 10.57], ["grunt", 9.53]], null], "duration": [1.5, 2.7, 23.29, 54.49, 9.92, 1.52]} \ No newline at end of file diff --git a/annotations_1/o5CBItcNkFs_filtered.json b/annotations_1/o5CBItcNkFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51e072e36970d52b38614ad28ae21d496bb4c716 --- /dev/null +++ b/annotations_1/o5CBItcNkFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 50.41], [51.0, 98.96], [100.0, 103.57], [106.0, 107.15]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 43.98, 0.0], "audiomae_on_audioset": [null, null, [["fart", 21.25], ["speech", 15.54], ["livestock, farm animals, working animals", 10.34]], null], "duration": [0.41, 47.96, 3.57, 1.15]} \ No newline at end of file diff --git a/annotations_1/o6FUdj0_fGY_filtered.json b/annotations_1/o6FUdj0_fGY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1458bb85b2da82fb9215aacc3fc76c0e5508de44 --- /dev/null +++ b/annotations_1/o6FUdj0_fGY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[74.0, 74.19], [97.0, 99.39], [113.0, 116.41], [116.0, 116.53], [117.0, 122.84], [124.0, 125.91], [131.0, 131.45], [142.0, 143.28]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 32.4, 64.41, 0.0, 50.11, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 25.35], ["animal", 12.22], ["grunt", 11.25]], null, null, null, null, null, null], "duration": [0.19, 2.39, 3.41, 0.53, 5.84, 1.91, 0.45, 1.28]} \ No newline at end of file diff --git a/annotations_1/o6Jkz5TQv84_filtered.json b/annotations_1/o6Jkz5TQv84_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6208bb50292741066dc96233a9bd16200fdb368 --- /dev/null +++ b/annotations_1/o6Jkz5TQv84_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.92], [15.0, 15.53], [19.0, 18.93], [29.0, 29.86], [31.0, 31.68], [33.0, 35.58], [36.0, 40.2], [46.0, 46.03], [48.0, 47.98], [49.0, 53.1], [64.0, 66.26], [69.0, 70.95], [77.0, 77.16], [87.0, 87.91], [90.0, 90.48], [101.0, 104.04], [105.0, 108.51], [115.0, 116.24], [119.0, 120.14], [126.0, 126.99], [131.0, 134.16], [135.0, 139.9], [149.0, 149.96], [152.0, 163.71], [164.0, 165.03], [168.0, 172.47]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 66.03, 40.71, 0.0, 0.0, 30.91, 31.48, 0.0, 0.0, 0.0, 0.0, 32.21, 35.2, 0.0, 0.0, 0.0, 38.26, 30.28, 0.0, 32.68, 0.0, 30.01], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 35.02], ["music", 20.99], ["throbbing", 14.97]], null, null, [["electric shaver, electric razor", 30.24], ["mains hum", 16.06], ["hum", 12.9]], [["music", 50.16], ["throbbing", 16.14], ["hum", 11.91]], null, null, null, null, [["music", 46.27], ["throbbing", 16.89], ["hum", 14.14]], [["music", 41.47], ["throbbing", 24.27], ["hum", 14.58]], null, null, null, [["throbbing", 37.41], ["music", 36.47], ["hum", 9.69]], [["hum", 45.06], ["throbbing", 14.87], ["mains hum", 13.49]], null, [["music", 53.26], ["throbbing", 19.87], ["hum", 12.4]], null, [["speech", 35.18], ["music", 12.48], ["hum", 7.9]]], "duration": [1.92, 0.53, -0.07, 0.86, 0.68, 2.58, 4.2, 0.03, -0.02, 4.1, 2.26, 1.95, 0.16, 0.91, 0.48, 3.04, 3.51, 1.24, 1.14, 0.99, 3.16, 4.9, 0.96, 11.71, 1.03, 4.47]} \ No newline at end of file diff --git a/annotations_1/o6MDdOWCCT8_filtered.json b/annotations_1/o6MDdOWCCT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ba11f6a4aeffe8b73aad45e0610bafbec9b3ece --- /dev/null +++ b/annotations_1/o6MDdOWCCT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.6], [12.0, 15.4], [16.0, 16.85], [17.0, 18.03], [18.0, 18.81], [19.0, 21.32], [24.0, 24.17], [35.0, 34.87], [40.0, 41.44], [45.0, 44.76], [110.0, 110.0], [111.0, 112.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.89, 0.0, 0.0, 0.0, 34.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 48.09], ["music", 27.51], ["boing", 12.4]], null, null, null, [["sidetone", 46.6], ["speech", 21.29], ["music", 17.02]], null, null, null, null, null, null], "duration": [1.6, 3.4, 0.85, 1.03, 0.81, 2.32, 0.17, -0.13, 1.44, -0.24, 0.0, 1.13]} \ No newline at end of file diff --git a/annotations_1/o6synmrDXqU_filtered.json b/annotations_1/o6synmrDXqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e351d2716cdc6d6aacb1f1c38c2ccaa3cbd00258 --- /dev/null +++ b/annotations_1/o6synmrDXqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.69], [8.0, 8.46], [26.0, 28.0], [37.0, 39.65], [40.0, 39.68], [40.0, 40.85], [51.0, 51.39], [53.0, 55.24], [59.0, 59.64], [60.0, 60.79], [74.0, 74.58], [79.0, 79.07], [95.0, 101.49], [111.0, 112.01], [113.0, 113.64], [116.0, 116.16], [120.0, 120.34], [122.0, 122.25], [128.0, 133.27], [133.0, 133.49], [134.0, 137.13], [140.0, 141.1], [141.0, 141.18], [144.0, 146.21], [150.0, 164.19]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, true], "silence_prob": [0.0, 0.0, 71.72, 49.09, 0.0, 0.0, 0.0, 60.6, 0.0, 0.0, 0.0, 0.0, 29.84, 0.0, 0.0, 0.0, 0.0, 0.0, 29.72, 0.0, 29.35, 0.0, 0.0, 29.8, 29.57], "audiomae_on_audioset": [null, null, null, [["music", 40.32], ["speech", 23.87], ["theremin", 2.85]], null, null, null, null, null, null, null, null, [["music", 68.21], ["singing", 5.88], ["male singing", 5.86]], null, null, null, null, null, [["music", 56.49], ["singing", 5.89], ["musical instrument", 2.77]], null, [["fly, housefly", 18.85], ["music", 12.13], ["insect", 12.04]], null, null, [["boing", 38.93], ["music", 18.97], ["thunk", 10.42]], [["music", 64.5], ["singing", 3.67], ["pop music", 1.71]]], "duration": [0.69, 0.46, 2.0, 2.65, -0.32, 0.85, 0.39, 2.24, 0.64, 0.79, 0.58, 0.07, 6.49, 1.01, 0.64, 0.16, 0.34, 0.25, 5.27, 0.49, 3.13, 1.1, 0.18, 2.21, 14.19]} \ No newline at end of file diff --git a/annotations_1/o9-cFlOdXn8_filtered.json b/annotations_1/o9-cFlOdXn8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a113604cab9580466dba884005bfd9057c55a472 --- /dev/null +++ b/annotations_1/o9-cFlOdXn8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.78], [10.0, 14.55], [19.0, 40.9], [41.0, 55.53], [59.0, 60.05], [61.0, 60.88], [62.0, 62.92], [63.0, 71.85], [75.0, 75.27], [78.0, 90.91], [94.0, 97.93], [98.0, 107.74], [116.0, 120.45], [122.0, 128.12], [129.0, 131.55]], "keep_status": [true, true, true, false, false, false, false, false, false, true, true, true, false, true, true], "silence_prob": [30.23, 37.17, 36.4, 34.31, 0.0, 0.0, 0.0, 31.97, 0.0, 30.16, 30.21, 40.38, 55.53, 42.6, 44.87], "audiomae_on_audioset": [[["speech", 39.79], ["music", 19.8], ["hum", 4.82]], [["speech", 31.12], ["thunk", 17.18], ["music", 12.76]], [["rumble", 22.41], ["hum", 20.45], ["speech", 18.76]], [["hum", 43.03], ["mains hum", 32.37], ["music", 4.99]], null, null, null, [["music", 45.99], ["didgeridoo", 20.12], ["speech", 13.6]], null, [["explosion", 20.34], ["speech", 15.44], ["burst, pop", 10.07]], [["speech", 21.3], ["whale vocalization", 19.84], ["music", 10.01]], [["speech", 32.05], ["animal", 17.9], ["music", 12.32]], null, [["music", 39.11], ["whale vocalization", 11.0], ["hum", 5.84]], [["music", 43.98], ["mains hum", 8.35], ["hum", 7.78]]], "duration": [4.78, 4.55, 21.9, 14.53, 1.05, -0.12, 0.92, 8.85, 0.27, 12.91, 3.93, 9.74, 4.45, 6.12, 2.55]} \ No newline at end of file diff --git a/annotations_1/o9dLO77OSao_filtered.json b/annotations_1/o9dLO77OSao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81c37caf3571ee6fce33774cc7c6b403e63e46fe --- /dev/null +++ b/annotations_1/o9dLO77OSao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.34], [18.0, 19.55], [21.0, 22.71], [24.0, 26.7], [27.0, 29.15], [32.0, 33.2], [35.0, 35.24], [39.0, 40.14], [43.0, 45.0], [46.0, 47.46], [48.0, 49.18], [50.0, 50.41], [51.0, 52.19], [54.0, 55.41], [56.0, 57.06], [60.0, 63.21], [64.0, 65.18], [66.0, 66.36], [67.0, 68.72], [70.0, 72.1], [74.0, 74.48], [77.0, 78.61], [82.0, 83.15], [88.0, 88.5], [110.0, 112.04], [124.0, 125.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 67.38, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 1.55, 1.71, 2.7, 2.15, 1.2, 0.24, 1.14, 2.0, 1.46, 1.18, 0.41, 1.19, 1.41, 1.06, 3.21, 1.18, 0.36, 1.72, 2.1, 0.48, 1.61, 1.15, 0.5, 2.04, 1.49]} \ No newline at end of file diff --git a/annotations_1/oAjKMLcDlfc_filtered.json b/annotations_1/oAjKMLcDlfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..050fc15cde29c2549aea6a0c23c26cfc3c20098e --- /dev/null +++ b/annotations_1/oAjKMLcDlfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.79], [5.0, 18.64], [20.0, 23.52], [24.0, 30.52], [34.0, 38.67], [48.0, 60.39], [64.0, 65.3], [69.0, 81.92], [83.0, 85.9], [87.0, 87.22], [87.0, 89.19], [94.0, 96.04], [98.0, 104.03], [105.0, 114.81], [120.0, 128.46], [131.0, 132.83]], "keep_status": [false, true, false, true, true, true, false, true, true, false, true, true, true, false, true, false], "silence_prob": [0.0, 29.71, 30.93, 29.48, 29.5, 29.53, 0.0, 29.89, 31.13, 0.0, 30.72, 29.56, 30.66, 29.99, 30.07, 0.0], "audiomae_on_audioset": [null, [["music", 25.36], ["mains hum", 18.58], ["hum", 15.45]], [["music", 60.46], ["didgeridoo", 7.7], ["noise", 6.25]], [["music", 19.2], ["tabla", 16.42], ["throbbing", 11.92]], [["hum", 17.69], ["music", 15.9], ["noise", 15.08]], [["music", 41.27], ["speech", 10.28], ["race car, auto racing", 5.38]], null, [["music", 15.03], ["moo", 7.96], ["fart", 6.2]], [["speech", 24.95], ["music", 18.27], ["meow", 6.64]], null, [["speech", 36.75], ["music", 13.75], ["crowd", 7.28]], [["music", 39.39], ["speech", 27.75], ["electronic music", 2.23]], [["music", 26.0], ["trombone", 12.6], ["musical instrument", 9.62]], [["cattle, bovinae", 40.86], ["moo", 23.01], ["livestock, farm animals, working animals", 10.28]], [["music", 34.71], ["theremin", 15.32], ["speech", 13.62]], null], "duration": [-0.21, 13.64, 3.52, 6.52, 4.67, 12.39, 1.3, 12.92, 2.9, 0.22, 2.19, 2.04, 6.03, 9.81, 8.46, 1.83]} \ No newline at end of file diff --git a/annotations_1/oBURpv30IkA_filtered.json b/annotations_1/oBURpv30IkA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a91320c35089e9af0168bfb7a834ec7b7d4038e8 --- /dev/null +++ b/annotations_1/oBURpv30IkA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.19], [13.0, 14.79], [15.0, 15.8], [16.0, 16.71], [17.0, 17.81], [20.0, 20.21], [34.0, 33.83], [38.0, 37.79], [38.0, 38.52], [39.0, 39.21], [43.0, 43.39], [48.0, 48.54], [60.0, 61.25], [69.0, 71.63], [75.0, 75.52], [83.0, 83.62], [94.0, 93.9], [99.0, 100.95], [101.0, 102.54], [107.0, 107.4], [110.0, 110.44], [112.0, 114.78], [115.0, 118.42], [119.0, 119.79], [120.0, 119.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.17, 35.11, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 51.03], ["speech", 23.97], ["guitar", 8.55]], [["music", 62.24], ["guitar", 11.63], ["musical instrument", 9.96]], null, null], "duration": [0.19, 1.79, 0.8, 0.71, 0.81, 0.21, -0.17, -0.21, 0.52, 0.21, 0.39, 0.54, 1.25, 2.63, 0.52, 0.62, -0.1, 1.95, 1.54, 0.4, 0.44, 2.78, 3.42, 0.79, -0.06]} \ No newline at end of file diff --git a/annotations_1/oDcNKpBgd_0_filtered.json b/annotations_1/oDcNKpBgd_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..895d264d1815d4958c9ed059cfc37bb524a457b6 --- /dev/null +++ b/annotations_1/oDcNKpBgd_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 40.37], [41.0, 74.31], [77.0, 86.31], [88.0, 105.31], [107.0, 107.77], [108.0, 155.68], [157.0, 156.93], [157.0, 157.79], [159.0, 159.48], [160.0, 169.91]], "keep_status": [true, false, true, true, false, false, false, false, false, true], "silence_prob": [27.97, 0.0, 28.15, 27.82, 0.0, 0.0, 0.0, 0.0, 0.0, 27.99], "audiomae_on_audioset": [[["music", 26.67], ["rumble", 9.25], ["sound effect", 4.64]], null, [["music", 32.03], ["grunt", 5.57], ["animal", 5.54]], [["music", 11.28], ["vehicle", 7.41], ["rumble", 4.89]], null, null, null, null, null, [["speech", 29.44], ["explosion", 6.75], ["whoosh, swoosh, swish", 5.65]]], "duration": [20.37, 33.31, 9.31, 17.31, 0.77, 47.68, -0.07, 0.79, 0.48, 9.91]} \ No newline at end of file diff --git a/annotations_1/oDjuY9KCsI8_filtered.json b/annotations_1/oDjuY9KCsI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ddb58b3ed326e514af7439afc317b1b75c02489 --- /dev/null +++ b/annotations_1/oDjuY9KCsI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.76], [5.0, 5.02], [6.0, 6.56], [11.0, 11.43], [20.0, 20.06], [31.0, 32.24], [35.0, 35.8], [38.0, 38.94], [43.0, 43.34], [68.0, 68.17], [75.0, 74.66], [79.0, 79.89], [83.0, 83.12], [87.0, 87.62], [89.0, 89.46], [90.0, 91.35], [92.0, 91.96], [93.0, 93.83], [99.0, 106.46], [107.0, 108.35], [124.0, 124.77], [126.0, 127.06], [129.0, 129.37], [131.0, 132.33], [134.0, 134.59], [135.0, 137.44], [138.0, 139.31], [142.0, 142.75], [143.0, 149.81], [150.0, 151.28], [152.0, 153.6], [155.0, 156.27], [157.0, 158.67], [166.0, 167.04], [169.0, 170.19], [173.0, 174.09], [177.0, 180.66], [182.0, 186.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.64, 0.0, 0.0, 51.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.04, 68.28], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, 0.02, 0.56, 0.43, 0.06, 1.24, 0.8, 0.94, 0.34, 0.17, -0.34, 0.89, 0.12, 0.62, 0.46, 1.35, -0.04, 0.83, 7.46, 1.35, 0.77, 1.06, 0.37, 1.33, 0.59, 2.44, 1.31, 0.75, 6.81, 1.28, 1.6, 1.27, 1.67, 1.04, 1.19, 1.09, 3.66, 4.65]} \ No newline at end of file diff --git a/annotations_1/oEHayxH_YT8_filtered.json b/annotations_1/oEHayxH_YT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8dafcc4ee18283df8cb7c4691a8650270d0e493b --- /dev/null +++ b/annotations_1/oEHayxH_YT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 26.1], [26.0, 57.67], [60.0, 72.52], [74.0, 75.73], [76.0, 80.79], [81.0, 102.3], [105.0, 106.89], [108.0, 114.44], [116.0, 118.4], [119.0, 128.28], [129.0, 139.38], [140.0, 140.34], [141.0, 142.89], [146.0, 146.37]], "keep_status": [true, false, false, false, false, true, false, true, true, true, false, false, false, false], "silence_prob": [30.19, 0.0, 50.36, 0.0, 49.36, 39.01, 0.0, 47.98, 47.5, 47.74, 32.87, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 22.62], ["hum", 15.57], ["throbbing", 14.13]], null, null, null, [["hum", 35.49], ["mains hum", 21.29], ["music", 17.06]], [["music", 31.07], ["hum", 19.1], ["synthesizer", 10.39]], null, [["hum", 25.31], ["throbbing", 17.69], ["music", 17.34]], [["music", 45.05], ["hum", 7.99], ["mains hum", 3.88]], [["speech", 20.83], ["mains hum", 18.86], ["hum", 18.07]], [["hum", 53.68], ["mains hum", 16.84], ["throbbing", 9.36]], null, null, null], "duration": [14.1, 31.67, 12.52, 1.73, 4.79, 21.3, 1.89, 6.44, 2.4, 9.28, 10.38, 0.34, 1.89, 0.37]} \ No newline at end of file diff --git a/annotations_1/oEddtexPCso_filtered.json b/annotations_1/oEddtexPCso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2aea6158bd5ce1c504fc1de3829c69d78cb4d508 --- /dev/null +++ b/annotations_1/oEddtexPCso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 35.61], [43.0, 43.9], [51.0, 52.08], [56.0, 56.27], [57.0, 57.72], [65.0, 65.08], [68.0, 73.36], [74.0, 74.7], [76.0, 76.55], [77.0, 85.16], [87.0, 87.34], [91.0, 91.27], [92.0, 94.9], [98.0, 97.53], [98.0, 100.31], [102.0, 103.99], [113.0, 114.61], [117.0, 123.99], [124.0, 126.86], [130.0, 141.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.71, 0.0, 0.0, 31.48, 0.0, 0.0, 38.35, 0.0, 35.75, 0.0, 0.0, 35.37, 34.61, 31.38], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 53.79], ["fart", 25.43], ["music", 6.05]], null, null, [["speech", 58.52], ["music", 18.85], ["electric shaver, electric razor", 2.99]], null, null, [["music", 44.4], ["speech", 33.73], ["synthesizer", 3.94]], null, [["speech", 30.63], ["music", 20.96], ["sound effect", 5.44]], null, null, [["speech", 41.52], ["music", 28.72], ["telephone bell ringing", 6.01]], [["music", 36.52], ["mains hum", 13.12], ["hum", 7.91]], [["mains hum", 52.19], ["hum", 36.52], ["music", 4.92]]], "duration": [0.61, 0.9, 1.08, 0.27, 0.72, 0.08, 5.36, 0.7, 0.55, 8.16, 0.34, 0.27, 2.9, -0.47, 2.31, 1.99, 1.61, 6.99, 2.86, 11.45]} \ No newline at end of file diff --git a/annotations_1/oG-MKxVWwi4_filtered.json b/annotations_1/oG-MKxVWwi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e345fdcfc3b6ee7f6fc30ec40707b26d61f9bdcf --- /dev/null +++ b/annotations_1/oG-MKxVWwi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.03], [12.0, 13.0], [20.0, 20.07], [22.0, 22.49], [26.0, 28.59], [29.0, 31.58], [32.0, 32.86], [34.0, 35.4], [38.0, 38.75], [40.0, 40.9], [66.0, 66.85], [68.0, 71.05], [75.0, 75.76], [77.0, 78.31], [83.0, 85.65], [87.0, 87.71], [90.0, 90.39], [94.0, 95.2], [97.0, 115.21], [117.0, 118.93], [127.0, 129.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 68.15, 57.81, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 76.04, 0.0, 0.0, 0.0, 70.3, 0.0, 60.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 1.0, 0.07, 0.49, 2.59, 2.58, 0.86, 1.4, 0.75, 0.9, 0.85, 3.05, 0.76, 1.31, 2.65, 0.71, 0.39, 1.2, 18.21, 1.93, 2.17]} \ No newline at end of file diff --git a/annotations_1/oGV14YsOvWo_filtered.json b/annotations_1/oGV14YsOvWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a49df3333498ef55fa2294e6a87c190687ed1c66 --- /dev/null +++ b/annotations_1/oGV14YsOvWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [3.0, 9.19], [10.0, 16.01], [18.0, 20.66], [27.0, 28.85], [29.0, 29.62], [32.0, 32.37], [33.0, 36.76], [47.0, 53.67], [58.0, 60.32], [67.0, 99.62], [100.0, 101.63], [102.0, 106.73], [107.0, 116.09], [117.0, 120.09], [121.0, 123.57], [124.0, 129.22], [136.0, 136.46], [137.0, 139.06], [141.0, 149.28]], "keep_status": [false, false, true, true, false, false, false, true, true, true, false, false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 38.23, 34.49, 34.59, 0.0, 0.0, 0.0, 32.63, 32.97, 33.16, 0.0, 0.0, 73.51, 74.29, 48.35, 59.77, 51.6, 0.0, 34.68, 31.78], "audiomae_on_audioset": [null, [["music", 59.9], ["boing", 16.0], ["speech", 10.71]], [["music", 32.99], ["boing", 18.17], ["wind instrument, woodwind instrument", 17.21]], [["music", 38.41], ["fly, housefly", 8.0], ["sidetone", 7.79]], null, null, null, [["boing", 17.19], ["cattle, bovinae", 16.74], ["music", 13.04]], [["whack, thwack", 26.41], ["music", 23.18], ["quack", 5.98]], [["moo", 37.44], ["cattle, bovinae", 16.33], ["livestock, farm animals, working animals", 16.1]], null, null, null, null, [["speech", 26.45], ["music", 11.59], ["wail, moan", 10.82]], null, null, null, [["speech", 23.94], ["music", 19.82], ["crowd", 7.4]], [["sidetone", 26.7], ["music", 20.27], ["speech", 12.58]]], "duration": [0.35, 6.19, 6.01, 2.66, 1.85, 0.62, 0.37, 3.76, 6.67, 2.32, 32.62, 1.63, 4.73, 9.09, 3.09, 2.57, 5.22, 0.46, 2.06, 8.28]} \ No newline at end of file diff --git a/annotations_1/oH-kAHKtbTE_filtered.json b/annotations_1/oH-kAHKtbTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84673b966d7c2cb260c250f727aeb50cee1b2e76 --- /dev/null +++ b/annotations_1/oH-kAHKtbTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.95], [7.0, 7.43], [10.0, 17.36], [19.0, 23.77], [25.0, 27.78], [29.0, 30.52], [31.0, 35.16], [36.0, 38.4], [50.0, 52.74], [53.0, 66.48], [67.0, 89.88], [92.0, 94.68], [95.0, 95.84], [97.0, 104.97], [108.0, 109.02], [113.0, 151.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 66.39, 90.25, 79.24, 0.0, 83.7, 79.41, 96.77, 82.43, 82.97, 46.79, 0.0, 55.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["dog", 27.03], ["bow-wow", 11.43], ["domestic animals, pets", 8.82]], null, null, null, null], "duration": [1.95, 0.43, 7.36, 4.77, 2.78, 1.52, 4.16, 2.4, 2.74, 13.48, 22.88, 2.68, 0.84, 7.97, 1.02, 38.16]} \ No newline at end of file diff --git a/annotations_1/oIlpo2mj_qk_filtered.json b/annotations_1/oIlpo2mj_qk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..731ae801ecdd3b0b044437fedfe6b5c06b7713cb --- /dev/null +++ b/annotations_1/oIlpo2mj_qk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.91], [12.0, 15.36], [17.0, 19.58], [21.0, 45.33], [47.0, 48.09], [51.0, 53.62], [55.0, 58.35], [60.0, 61.05], [64.0, 65.28], [66.0, 81.03], [82.0, 82.19], [85.0, 86.24], [92.0, 101.73], [103.0, 104.63], [106.0, 108.97]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [74.44, 70.3, 83.7, 68.8, 0.0, 82.07, 30.38, 0.0, 0.0, 32.92, 0.0, 0.0, 33.03, 0.0, 76.37], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 51.43], ["breaking", 8.73], ["fusillade", 4.71]], null, null, [["music", 68.03], ["electronic music", 3.59], ["breaking", 2.94]], null, null, [["music", 57.62], ["hum", 5.28], ["breaking", 4.67]], null, null], "duration": [2.91, 3.36, 2.58, 24.33, 1.09, 2.62, 3.35, 1.05, 1.28, 15.03, 0.19, 1.24, 9.73, 1.63, 2.97]} \ No newline at end of file diff --git a/annotations_1/oK1zfJausVM_filtered.json b/annotations_1/oK1zfJausVM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90c08e620881ba7f4882abb09b12fbfa8a5a76e0 --- /dev/null +++ b/annotations_1/oK1zfJausVM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.16], [10.0, 12.75], [13.0, 13.8], [16.0, 17.42], [21.0, 21.59], [22.0, 22.71], [23.0, 24.09], [24.0, 24.27], [25.0, 25.34], [27.0, 28.16], [29.0, 30.15], [32.0, 31.99], [34.0, 34.6], [39.0, 41.27], [43.0, 44.47], [47.0, 48.42], [49.0, 62.99], [64.0, 67.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 89.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.43, 0.0, 0.0, 29.47, 99.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.71], ["speech", 18.98], ["didgeridoo", 1.99]], null, null, [["whip", 47.34], ["music", 12.05], ["speech", 10.07]], null], "duration": [0.16, 2.75, 0.8, 1.42, 0.59, 0.71, 1.09, 0.27, 0.34, 1.16, 1.15, -0.01, 0.6, 2.27, 1.47, 1.42, 13.99, 3.71]} \ No newline at end of file diff --git a/annotations_1/oLJ7246t3-c_filtered.json b/annotations_1/oLJ7246t3-c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35b4df6829618f85420cf3df30ef9f43f15bb26c --- /dev/null +++ b/annotations_1/oLJ7246t3-c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.45], [6.0, 6.05], [6.0, 9.27], [12.0, 13.09], [17.0, 18.3], [19.0, 20.56], [21.0, 23.08], [24.0, 25.73], [27.0, 31.89], [33.0, 34.1], [38.0, 39.18], [42.0, 43.87], [46.0, 48.66], [50.0, 66.65], [68.0, 68.5], [69.0, 70.66], [73.0, 72.99], [74.0, 74.88], [77.0, 77.18], [78.0, 79.79], [81.0, 80.84], [85.0, 85.6], [87.0, 88.67], [90.0, 91.23], [93.0, 93.61], [96.0, 98.2], [101.0, 102.46], [104.0, 104.35], [109.0, 111.33], [113.0, 113.68], [115.0, 115.62], [119.0, 156.78], [157.0, 164.67], [166.0, 167.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.05, 0.0, 92.97, 0.0, 0.0, 0.0, 99.16, 0.0, 97.54, 0.0, 0.0, 0.0, 99.4, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 97.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.45, 0.05, 3.27, 1.09, 1.3, 1.56, 2.08, 1.73, 4.89, 1.1, 1.18, 1.87, 2.66, 16.65, 0.5, 1.66, -0.01, 0.88, 0.18, 1.79, -0.16, 0.6, 1.67, 1.23, 0.61, 2.2, 1.46, 0.35, 2.33, 0.68, 0.62, 37.78, 7.67, 1.71]} \ No newline at end of file diff --git a/annotations_1/oMH9kIyIl1I_filtered.json b/annotations_1/oMH9kIyIl1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ace4faf5f2025ddf89e849d0f3b2f6fa0c73ec48 --- /dev/null +++ b/annotations_1/oMH9kIyIl1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.09], [25.0, 36.73], [39.0, 38.69], [39.0, 46.74], [52.0, 56.88], [60.0, 70.92], [75.0, 78.97], [83.0, 86.95], [94.0, 95.35]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 30.66, 0.0, 29.41, 29.67, 29.56, 29.64, 29.64, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 43.25], ["cattle, bovinae", 29.36], ["moo", 18.82]], null, [["music", 79.26], ["hum", 3.17], ["cacophony", 2.79]], [["music", 81.6], ["cacophony", 3.75], ["musical instrument", 1.43]], [["music", 80.19], ["rock music", 2.34], ["musical instrument", 2.27]], [["music", 57.24], ["hum", 7.97], ["mains hum", 5.06]], [["music", 58.29], ["throbbing", 5.49], ["hum", 4.97]], null], "duration": [0.09, 11.73, -0.31, 7.74, 4.88, 10.92, 3.97, 3.95, 1.35]} \ No newline at end of file diff --git a/annotations_1/oMt4F9ELo3U_filtered.json b/annotations_1/oMt4F9ELo3U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29aa7447bff986a1fa76ba92293fe26dd9575fd4 --- /dev/null +++ b/annotations_1/oMt4F9ELo3U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.75], [11.0, 12.58], [22.0, 21.74], [24.0, 24.73], [25.0, 24.76], [25.0, 25.17], [25.0, 26.32], [28.0, 29.49], [30.0, 37.49], [41.0, 41.17], [43.0, 43.06], [45.0, 44.78], [46.0, 46.26], [51.0, 50.85], [53.0, 54.4], [58.0, 59.19], [64.0, 72.66], [73.0, 74.55], [78.0, 84.38], [85.0, 85.85], [89.0, 91.4], [91.0, 91.44], [101.0, 101.87], [123.0, 125.96], [139.0, 142.21], [147.0, 149.17], [153.0, 155.26], [157.0, 157.6], [161.0, 161.33], [162.0, 162.73], [168.0, 168.0], [168.0, 170.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.1, 0.0, 41.48, 0.0, 60.6, 0.0, 0.0, 30.36, 29.66, 29.61, 51.34, 0.0, 0.0, 0.0, 0.0, 36.12], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 66.93], ["fly, housefly", 7.26], ["bee, wasp, etc.", 3.41]], null, null, null, null, [["cattle, bovinae", 31.44], ["moo", 25.4], ["speech", 23.51]], [["speech", 59.57], ["electric shaver, electric razor", 5.07], ["vehicle", 4.9]], [["livestock, farm animals, working animals", 17.21], ["cattle, bovinae", 15.17], ["insect", 12.55]], null, null, null, null, null, [["sidetone", 38.57], ["speech", 28.37], ["music", 16.31]]], "duration": [0.75, 1.58, -0.26, 0.73, -0.24, 0.17, 1.32, 1.49, 7.49, 0.17, 0.06, -0.22, 0.26, -0.15, 1.4, 1.19, 8.66, 1.55, 6.38, 0.85, 2.4, 0.44, 0.87, 2.96, 3.21, 2.17, 2.26, 0.6, 0.33, 0.73, 0.0, 2.43]} \ No newline at end of file diff --git a/annotations_1/oNWAiWBup2Q_filtered.json b/annotations_1/oNWAiWBup2Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c548673f8d29910127b20f9cd1fac705774d6d4 --- /dev/null +++ b/annotations_1/oNWAiWBup2Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.67], [15.0, 15.11], [38.0, 38.4], [47.0, 53.89], [56.0, 58.31], [62.0, 62.94], [66.0, 66.5], [68.0, 68.08], [72.0, 83.29], [88.0, 87.84], [90.0, 92.74], [95.0, 108.19], [109.0, 109.59], [110.0, 111.37], [114.0, 115.18], [116.0, 118.39], [120.0, 123.89], [126.0, 127.79], [129.0, 131.14], [131.0, 147.23], [150.0, 154.5], [159.0, 159.02], [164.0, 174.28], [177.0, 184.47], [186.0, 187.08], [206.0, 217.41]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.63, 51.55, 0.0, 0.0, 0.0, 34.04, 0.0, 30.01, 32.91, 0.0, 0.0, 0.0, 35.32, 39.52, 0.0, 34.98, 34.02, 35.0, 0.0, 33.95, 33.88, 0.0, 35.82], "audiomae_on_audioset": [null, null, null, [["music", 53.26], ["didgeridoo", 11.05], ["hum", 9.82]], null, null, null, null, [["music", 31.5], ["speech", 25.39], ["vehicle", 7.66]], null, [["speech", 17.7], ["motorcycle", 11.2], ["sidetone", 8.43]], [["music", 56.5], ["throbbing", 8.71], ["hum", 5.41]], null, null, null, [["music", 47.43], ["theremin", 22.08], ["speech", 2.74]], [["music", 42.95], ["hum", 9.13], ["theremin", 8.24]], null, [["speech", 35.05], ["music", 9.85], ["vehicle", 6.48]], [["hum", 26.37], ["buzz", 16.75], ["music", 16.19]], [["music", 60.79], ["synthesizer", 7.26], ["hum", 5.11]], null, [["music", 81.28], ["synthesizer", 1.62], ["musical instrument", 1.59]], [["music", 41.47], ["speech", 23.26], ["hum", 7.5]], null, [["music", 65.39], ["hum", 9.59], ["throbbing", 6.57]]], "duration": [0.67, 0.11, 0.4, 6.89, 2.31, 0.94, 0.5, 0.08, 11.29, -0.16, 2.74, 13.19, 0.59, 1.37, 1.18, 2.39, 3.89, 1.79, 2.14, 16.23, 4.5, 0.02, 10.28, 7.47, 1.08, 11.41]} \ No newline at end of file diff --git a/annotations_1/oNiW2ftWINg_filtered.json b/annotations_1/oNiW2ftWINg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48c85367d2fb9ea223553585f949e44b59df70db --- /dev/null +++ b/annotations_1/oNiW2ftWINg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [8.0, 8.87], [9.0, 9.56], [11.0, 17.19], [18.0, 18.86], [21.0, 20.98], [23.0, 24.26], [26.0, 27.08], [30.0, 43.75], [47.0, 47.76], [56.0, 57.18], [58.0, 67.36], [68.0, 70.55], [71.0, 72.01], [75.0, 76.57], [78.0, 79.84], [81.0, 85.01], [86.0, 87.24], [87.0, 89.94], [91.0, 91.61], [92.0, 93.26], [97.0, 98.68], [100.0, 104.21], [105.0, 107.05], [109.0, 114.78], [118.0, 119.57], [123.0, 124.21], [126.0, 126.79], [130.0, 131.16], [132.0, 143.21], [144.0, 149.08], [150.0, 154.35], [155.0, 164.34], [165.0, 166.9], [168.0, 171.95], [174.0, 175.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.6, 0.0, 0.0, 0.0, 0.0, 53.4, 0.0, 0.0, 59.59, 85.9, 0.0, 0.0, 0.0, 84.43, 0.0, 56.4, 0.0, 0.0, 0.0, 44.78, 90.25, 73.51, 0.0, 0.0, 0.0, 0.0, 73.82, 88.46, 65.09, 33.05, 0.0, 98.99, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.03], ["didgeridoo", 20.28], ["music", 13.6]], null, null, null, null, null, null, null, null, null, [["speech", 45.65], ["sidetone", 8.01], ["music", 7.53]], null, null, null], "duration": [0.56, 0.87, 0.56, 6.19, 0.86, -0.02, 1.26, 1.08, 13.75, 0.76, 1.18, 9.36, 2.55, 1.01, 1.57, 1.84, 4.01, 1.24, 2.94, 0.61, 1.26, 1.68, 4.21, 2.05, 5.78, 1.57, 1.21, 0.79, 1.16, 11.21, 5.08, 4.35, 9.34, 1.9, 3.95, 1.61]} \ No newline at end of file diff --git a/annotations_1/oNoOFf527GU_filtered.json b/annotations_1/oNoOFf527GU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa47b7c4acd1a31ef73fe7d6bacff700e33c9efa --- /dev/null +++ b/annotations_1/oNoOFf527GU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.63], [7.0, 9.8], [12.0, 12.82], [17.0, 18.12], [19.0, 19.84], [32.0, 32.9], [42.0, 44.47], [48.0, 48.98], [65.0, 65.96], [68.0, 69.23], [73.0, 73.99], [80.0, 81.13], [82.0, 86.19], [89.0, 92.26], [94.0, 94.07], [94.0, 94.1], [94.0, 94.2], [96.0, 100.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [76.2, 90.25, 0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 46.72, 96.17, 0.0, 0.0, 0.0, 98.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 40.85], ["radio", 24.71], ["whale vocalization", 14.92]], null, null, null, null, null], "duration": [3.63, 2.8, 0.82, 1.12, 0.84, 0.9, 2.47, 0.98, 0.96, 1.23, 0.99, 1.13, 4.19, 3.26, 0.07, 0.1, 0.2, 4.55]} \ No newline at end of file diff --git a/annotations_1/oNpeuCWJgCc_filtered.json b/annotations_1/oNpeuCWJgCc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0448572e2d17a267d56d1cfeb9c5a677353ef1c6 --- /dev/null +++ b/annotations_1/oNpeuCWJgCc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.6], [11.0, 11.53], [12.0, 13.76], [17.0, 18.47], [27.0, 32.51], [36.0, 36.98], [40.0, 44.63], [48.0, 59.53], [62.0, 62.92], [64.0, 64.93], [66.0, 73.26], [75.0, 82.54], [86.0, 86.95], [90.0, 91.44], [100.0, 102.19], [107.0, 107.1], [107.0, 111.57], [113.0, 113.76], [115.0, 118.29], [121.0, 122.64]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [30.19, 0.0, 0.0, 0.0, 31.74, 0.0, 30.83, 31.0, 0.0, 0.0, 31.54, 31.45, 0.0, 0.0, 39.75, 0.0, 42.67, 0.0, 30.64, 0.0], "audiomae_on_audioset": [[["music", 41.0], ["speech", 13.48], ["fly, housefly", 8.44]], null, null, null, [["music", 50.83], ["percussion", 4.17], ["musical instrument", 3.66]], null, [["music", 55.67], ["cattle, bovinae", 6.64], ["moo", 4.81]], [["music", 70.7], ["musical instrument", 3.8], ["music of latin america", 2.28]], null, null, [["music", 68.63], ["music of latin america", 3.1], ["musical instrument", 2.44]], [["music", 69.86], ["musical instrument", 4.45], ["swing music", 1.64]], null, null, [["music", 36.78], ["sidetone", 22.94], ["didgeridoo", 10.18]], null, [["music", 53.25], ["didgeridoo", 19.75], ["speech", 4.26]], null, [["music", 61.28], ["cacophony", 9.58], ["cheering", 2.13]], null], "duration": [5.6, 0.53, 1.76, 1.47, 5.51, 0.98, 4.63, 11.53, 0.92, 0.93, 7.26, 7.54, 0.95, 1.44, 2.19, 0.1, 4.57, 0.76, 3.29, 1.64]} \ No newline at end of file diff --git a/annotations_1/oNuGwa5Kd8E_filtered.json b/annotations_1/oNuGwa5Kd8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..843912143b67fa449cdf36b51cc76b057a058c4a --- /dev/null +++ b/annotations_1/oNuGwa5Kd8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 13.73], [24.0, 24.27], [26.0, 26.6], [31.0, 31.68], [33.0, 33.57], [34.0, 34.84], [37.0, 40.17], [41.0, 41.91], [43.0, 43.38], [44.0, 45.03], [49.0, 49.01], [56.0, 56.66], [71.0, 71.52], [73.0, 73.57], [74.0, 74.88], [76.0, 76.81], [77.0, 79.2], [83.0, 83.64], [91.0, 90.76], [93.0, 96.53], [100.0, 111.13], [113.0, 115.86], [124.0, 125.73], [127.0, 129.52], [133.0, 135.21], [137.0, 138.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.57, 0.0, 0.0, 37.07, 35.26, 82.07, 0.0, 43.38, 30.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 61.35], ["musical instrument", 8.55], ["didgeridoo", 3.88]], null, null, null, null, null, null, null, null, null, [["speech", 47.36], ["music", 11.13], ["didgeridoo", 4.83]], null, null, [["music", 35.74], ["speech", 19.49], ["pulse", 11.98]], [["hum", 25.49], ["music", 25.42], ["speech", 18.2]], null, null, [["music", 28.03], ["speech", 25.24], ["hum", 8.52]], [["speech", 50.26], ["fart", 12.56], ["boing", 11.86]], null], "duration": [-0.27, 0.27, 0.6, 0.68, 0.57, 0.84, 3.17, 0.91, 0.38, 1.03, 0.01, 0.66, 0.52, 0.57, 0.88, 0.81, 2.2, 0.64, -0.24, 3.53, 11.13, 2.86, 1.73, 2.52, 2.21, 1.08]} \ No newline at end of file diff --git a/annotations_1/oOWl14GlJx4_filtered.json b/annotations_1/oOWl14GlJx4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b5c2d094317ac0303fd1d07bcdce424f06eef63 --- /dev/null +++ b/annotations_1/oOWl14GlJx4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.08], [7.0, 9.14], [13.0, 15.11], [16.0, 17.61], [19.0, 97.95], [100.0, 101.29], [103.0, 102.74], [104.0, 106.51], [108.0, 110.02], [111.0, 111.82], [113.0, 123.11]], "keep_status": [false, true, true, false, false, false, false, true, true, false, true], "silence_prob": [0.0, 30.63, 31.58, 0.0, 0.0, 0.0, 0.0, 31.62, 32.9, 0.0, 44.23], "audiomae_on_audioset": [null, [["owl", 17.76], ["throbbing", 13.7], ["hoot", 10.08]], [["music", 18.74], ["hum", 14.09], ["explosion", 10.07]], null, null, null, null, [["wind instrument, woodwind instrument", 23.14], ["foghorn", 21.11], ["speech", 19.0]], [["mains hum", 22.82], ["hum", 12.35], ["throbbing", 7.08]], null, [["speech", 16.63], ["hum", 12.44], ["animal", 7.51]]], "duration": [1.08, 2.14, 2.11, 1.61, 78.95, 1.29, -0.26, 2.51, 2.02, 0.82, 10.11]} \ No newline at end of file diff --git a/annotations_1/oQIubudKQQE_filtered.json b/annotations_1/oQIubudKQQE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa90740e0017062d9819120477738c4c8cd00c33 --- /dev/null +++ b/annotations_1/oQIubudKQQE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.23], [9.0, 8.67], [10.0, 13.41], [15.0, 20.98], [23.0, 23.43], [24.0, 25.86], [27.0, 29.73], [35.0, 35.75], [39.0, 39.65], [40.0, 40.32], [40.0, 40.95], [42.0, 42.13], [43.0, 44.07], [52.0, 53.3], [59.0, 62.43], [69.0, 70.53], [72.0, 72.84], [74.0, 75.19], [76.0, 77.09], [82.0, 85.82], [89.0, 91.05], [92.0, 95.25], [98.0, 99.96], [108.0, 108.95], [111.0, 113.36], [114.0, 115.79], [124.0, 125.04], [128.0, 128.36], [133.0, 133.14], [134.0, 143.88], [146.0, 149.37], [150.0, 150.69], [155.0, 156.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 83.7, 69.34, 0.0, 0.0, 82.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 0.0, 99.4, 99.62, 99.98, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 97.11, 93.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, -0.33, 3.41, 5.98, 0.43, 1.86, 2.73, 0.75, 0.65, 0.32, 0.95, 0.13, 1.07, 1.3, 3.43, 1.53, 0.84, 1.19, 1.09, 3.82, 2.05, 3.25, 1.96, 0.95, 2.36, 1.79, 1.04, 0.36, 0.14, 9.88, 3.37, 0.69, 1.64]} \ No newline at end of file diff --git a/annotations_1/oR3h33DSGPM_filtered.json b/annotations_1/oR3h33DSGPM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f549e248c5c0ecb7efb5113c2098b50f77debed --- /dev/null +++ b/annotations_1/oR3h33DSGPM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.04], [14.0, 23.36], [28.0, 40.96], [47.0, 47.8], [49.0, 50.18], [55.0, 55.75], [57.0, 57.32], [58.0, 58.4], [66.0, 66.51], [72.0, 72.57], [87.0, 86.81], [88.0, 89.75], [93.0, 92.7], [97.0, 98.64], [100.0, 102.19], [119.0, 120.53], [127.0, 128.19], [135.0, 136.59], [138.0, 138.65], [140.0, 141.52]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.8, 41.3, 75.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 68.66], ["hum", 7.47], ["music", 6.46]], [["music", 26.49], ["speech", 19.41], ["didgeridoo", 9.6]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.04, 9.36, 12.96, 0.8, 1.18, 0.75, 0.32, 0.4, 0.51, 0.57, -0.19, 1.75, -0.3, 1.64, 2.19, 1.53, 1.19, 1.59, 0.65, 1.52]} \ No newline at end of file diff --git a/annotations_1/oRRupV-lwbU_filtered.json b/annotations_1/oRRupV-lwbU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e88969a5d246d33c2717e83be340cd915b65cf80 --- /dev/null +++ b/annotations_1/oRRupV-lwbU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.34], [9.0, 10.03], [13.0, 19.85], [21.0, 25.03], [28.0, 29.24], [32.0, 33.08], [35.0, 35.72], [44.0, 45.82], [49.0, 50.99], [52.0, 53.38], [55.0, 55.56], [59.0, 58.99], [63.0, 63.24], [65.0, 66.51], [74.0, 74.8], [82.0, 82.53], [83.0, 82.93], [84.0, 86.1], [87.0, 88.16], [91.0, 92.48]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.97, 0.0, 36.98, 33.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0], "audiomae_on_audioset": [[["boing", 60.89], ["music", 9.47], ["speech", 7.5]], null, [["speech", 43.39], ["explosion", 8.17], ["screaming", 6.97]], [["boing", 26.81], ["speech", 14.22], ["cattle, bovinae", 9.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.34, 1.03, 6.85, 4.03, 1.24, 1.08, 0.72, 1.82, 1.99, 1.38, 0.56, -0.01, 0.24, 1.51, 0.8, 0.53, -0.07, 2.1, 1.16, 1.48]} \ No newline at end of file diff --git a/annotations_1/oRe8EuewinY_filtered.json b/annotations_1/oRe8EuewinY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91c63a0d4108613e095d25eba3ab7fac53a8ee26 --- /dev/null +++ b/annotations_1/oRe8EuewinY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.75], [28.0, 28.61], [35.0, 35.56], [37.0, 37.89], [39.0, 39.72], [40.0, 41.67], [44.0, 44.9], [47.0, 47.48], [49.0, 49.45], [51.0, 51.38], [52.0, 53.97], [55.0, 57.21], [58.0, 59.53], [61.0, 85.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 29.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.49], ["didgeridoo", 14.08], ["theremin", 11.45]]], "duration": [1.75, 0.61, 0.56, 0.89, 0.72, 1.67, 0.9, 0.48, 0.45, 0.38, 1.97, 2.21, 1.53, 24.77]} \ No newline at end of file diff --git a/annotations_1/oS6AtbHHjSo_filtered.json b/annotations_1/oS6AtbHHjSo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56fcaa94a1e698a2d658c4f57b9a364d407c40ca --- /dev/null +++ b/annotations_1/oS6AtbHHjSo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 15.11], [16.0, 21.76], [24.0, 24.63], [28.0, 42.94], [51.0, 54.75]], "keep_status": [true, true, false, true, false], "silence_prob": [30.11, 30.39, 0.0, 30.24, 30.24], "audiomae_on_audioset": [[["speech", 42.74], ["music", 16.64], ["vehicle", 2.96]], [["speech", 34.77], ["music", 21.87], ["cacophony", 4.33]], null, [["music", 12.29], ["whack, thwack", 10.69], ["speech", 9.23]], [["music", 54.21], ["speech", 18.75], ["throbbing", 5.31]]], "duration": [10.11, 5.76, 0.63, 14.94, 3.75]} \ No newline at end of file diff --git a/annotations_1/oS_Iap5D9jQ_filtered.json b/annotations_1/oS_Iap5D9jQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab0bbddb877ab91f8f7af999df796188ac250cb9 --- /dev/null +++ b/annotations_1/oS_Iap5D9jQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.68], [8.0, 9.02], [12.0, 92.37], [93.0, 108.36], [111.0, 112.82], [114.0, 117.81], [119.0, 119.99], [121.0, 123.87], [125.0, 148.27], [154.0, 156.9], [159.0, 163.78], [164.0, 165.89], [167.0, 168.05], [168.0, 168.79], [170.0, 186.27], [186.0, 186.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [86.45, 0.0, 0.0, 95.51, 0.0, 96.54, 0.0, 96.54, 83.16, 93.76, 88.64, 0.0, 0.0, 0.0, 95.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.68, 1.02, 80.37, 15.36, 1.82, 3.81, 0.99, 2.87, 23.27, 2.9, 4.78, 1.89, 1.05, 0.79, 16.27, 0.51]} \ No newline at end of file diff --git a/annotations_1/oT_RsXOPjTs_filtered.json b/annotations_1/oT_RsXOPjTs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8984d49d1d338a5793691f16214d80c9be37c8e0 --- /dev/null +++ b/annotations_1/oT_RsXOPjTs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[51.0, 52.79], [55.0, 56.71], [67.0, 67.29], [70.0, 69.84], [78.0, 78.54], [81.0, 81.87], [83.0, 83.79], [84.0, 85.28], [86.0, 86.85], [88.0, 89.43], [91.0, 93.29], [95.0, 118.13], [120.0, 121.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.7, 43.03, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["frog", 21.53], ["gurgling", 13.04], ["whale vocalization", 12.01]], null], "duration": [1.79, 1.71, 0.29, -0.16, 0.54, 0.87, 0.79, 1.28, 0.85, 1.43, 2.29, 23.13, 1.95]} \ No newline at end of file diff --git a/annotations_1/oToIYlwJY9I_filtered.json b/annotations_1/oToIYlwJY9I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..043d80d6c134150fc6bda1e7ca3f91aaf52ef451 --- /dev/null +++ b/annotations_1/oToIYlwJY9I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.27], [4.0, 4.11], [6.0, 9.58], [14.0, 16.11], [18.0, 18.06], [18.0, 19.65], [24.0, 33.42], [34.0, 35.33], [39.0, 39.72], [40.0, 40.34], [41.0, 41.88], [45.0, 59.48], [66.0, 107.06], [108.0, 111.62], [116.0, 117.96], [122.0, 124.6], [128.0, 133.2], [137.0, 137.62], [141.0, 146.89], [147.0, 149.12]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.14, 33.76, 0.0, 0.0, 31.32, 0.0, 0.0, 0.0, 0.0, 32.29, 0.0, 41.34, 0.0, 38.14, 33.95, 0.0, 37.27, 35.5], "audiomae_on_audioset": [null, null, [["music", 49.87], ["speech", 6.1], ["moo", 5.89]], [["music", 74.84], ["speech", 5.36], ["electronic music", 2.94]], null, null, [["music", 78.63], ["speech", 6.9], ["cattle, bovinae", 3.08]], null, null, null, null, [["music", 80.54], ["musical instrument", 2.65], ["didgeridoo", 2.19]], null, [["music", 66.45], ["guitar", 4.12], ["bass guitar", 3.83]], null, [["music", 67.9], ["singing", 3.79], ["dubstep", 3.22]], [["music", 81.41], ["singing", 1.45], ["musical instrument", 0.84]], null, [["music", 65.57], ["bass guitar", 7.55], ["guitar", 5.03]], [["music", 66.7], ["musical instrument", 2.98], ["guitar", 2.87]]], "duration": [1.27, 0.11, 3.58, 2.11, 0.06, 1.65, 9.42, 1.33, 0.72, 0.34, 0.88, 14.48, 41.06, 3.62, 1.96, 2.6, 5.2, 0.62, 5.89, 2.12]} \ No newline at end of file diff --git a/annotations_1/oUKw4qcGHZs_filtered.json b/annotations_1/oUKw4qcGHZs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b317ac65f4269b8e3a8151e2627cc070ba79b4b2 --- /dev/null +++ b/annotations_1/oUKw4qcGHZs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[93.0, 95.89], [96.0, 144.22], [148.0, 148.22], [150.0, 154.41], [155.0, 160.03], [164.0, 165.0]], "keep_status": [false, false, false, false, false, false], "silence_prob": [85.17, 0.0, 0.0, 73.06, 51.6, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [2.89, 48.22, 0.22, 4.41, 5.03, 1.0]} \ No newline at end of file diff --git a/annotations_1/oUo_8mKGHvY_filtered.json b/annotations_1/oUo_8mKGHvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b0cd8ab02a0b4f4c9c3a5d6fee393b1cc362407 --- /dev/null +++ b/annotations_1/oUo_8mKGHvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.61], [12.0, 12.38], [19.0, 19.75], [35.0, 34.86], [41.0, 41.64], [45.0, 46.3], [80.0, 81.01], [83.0, 83.59], [85.0, 86.16], [87.0, 87.49], [88.0, 89.61], [90.0, 90.61], [102.0, 103.38], [105.0, 105.17], [109.0, 109.9], [113.0, 113.02], [120.0, 121.37], [122.0, 123.38], [124.0, 127.08], [127.0, 127.92], [131.0, 131.11], [133.0, 132.87], [136.0, 136.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.66, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 0.38, 0.75, -0.14, 0.64, 1.3, 1.01, 0.59, 1.16, 0.49, 1.61, 0.61, 1.38, 0.17, 0.9, 0.02, 1.37, 1.38, 3.08, 0.92, 0.11, -0.13, 0.61]} \ No newline at end of file diff --git a/annotations_1/oVLfIoIujHE_filtered.json b/annotations_1/oVLfIoIujHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0780bf8586f9e64816cfa4ce1cf89286a54cf05 --- /dev/null +++ b/annotations_1/oVLfIoIujHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 56.61], [66.0, 66.55], [68.0, 71.81], [73.0, 74.43], [76.0, 77.8], [79.0, 85.14], [86.0, 97.33], [99.0, 101.88], [103.0, 109.58], [112.0, 113.29], [116.0, 119.84], [125.0, 125.52], [126.0, 126.49], [128.0, 128.29], [129.0, 130.4], [132.0, 134.42]], "keep_status": [false, false, false, false, false, false, true, true, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 53.78, 0.0, 0.0, 40.31, 35.18, 39.15, 45.95, 0.0, 33.35, 0.0, 0.0, 0.0, 0.0, 36.87], "audiomae_on_audioset": [null, null, null, null, null, [["music", 73.61], ["hum", 5.11], ["musical instrument", 4.23]], [["music", 58.87], ["musical instrument", 5.41], ["speech", 4.97]], [["music", 26.47], ["speech", 5.75], ["musical instrument", 3.14]], [["music", 43.35], ["effects unit", 14.19], ["speech", 5.39]], null, [["music", 23.17], ["sheep", 14.49], ["bleat", 11.14]], null, null, null, null, [["music", 44.14], ["didgeridoo", 16.59], ["mantra", 6.44]]], "duration": [40.61, 0.55, 3.81, 1.43, 1.8, 6.14, 11.33, 2.88, 6.58, 1.29, 3.84, 0.52, 0.49, 0.29, 1.4, 2.42]} \ No newline at end of file diff --git a/annotations_1/oWSIUe5wYvc_filtered.json b/annotations_1/oWSIUe5wYvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..359100c211baea495259a4ebd917655647edd693 --- /dev/null +++ b/annotations_1/oWSIUe5wYvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.3], [11.0, 13.49], [17.0, 60.84], [61.0, 107.81], [109.0, 112.23], [114.0, 126.32]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 60.51, 0.0, 0.0, 100.0, 83.16], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.3, 2.49, 43.84, 46.81, 3.23, 12.32]} \ No newline at end of file diff --git a/annotations_1/oWjtcWh-gyI_filtered.json b/annotations_1/oWjtcWh-gyI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1be8c24d4637a2a48e76219b8c4fb85f15df4cf0 --- /dev/null +++ b/annotations_1/oWjtcWh-gyI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.88], [13.0, 13.59], [16.0, 20.71], [28.0, 29.15], [34.0, 35.75], [36.0, 37.05], [46.0, 53.47], [58.0, 57.92], [59.0, 59.1], [59.0, 60.08], [61.0, 68.47], [89.0, 89.6], [90.0, 90.22], [92.0, 94.07], [96.0, 96.69], [100.0, 121.44], [125.0, 125.44], [127.0, 132.8], [134.0, 135.21], [135.0, 138.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 30.33, 0.0, 0.0, 0.0, 34.01, 0.0, 0.0, 0.0, 35.26, 0.0, 0.0, 41.91, 0.0, 31.05, 0.0, 33.87, 0.0, 32.39], "audiomae_on_audioset": [null, null, [["music", 48.52], ["speech", 35.27], ["electronic music", 2.74]], null, null, null, [["music", 55.83], ["mains hum", 11.57], ["hum", 7.53]], null, null, null, [["music", 56.43], ["didgeridoo", 7.12], ["hum", 5.58]], null, null, [["music", 34.97], ["throbbing", 12.9], ["speech", 11.85]], null, [["electric shaver, electric razor", 33.84], ["speech", 29.83], ["buzz", 11.27]], null, [["speech", 80.84], ["hum", 1.73], ["vehicle", 1.54]], null, [["breaking", 18.43], ["cattle, bovinae", 12.97], ["moo", 11.44]]], "duration": [-0.12, 0.59, 4.71, 1.15, 1.75, 1.05, 7.47, -0.08, 0.1, 1.08, 7.47, 0.6, 0.22, 2.07, 0.69, 21.44, 0.44, 5.8, 1.21, 3.2]} \ No newline at end of file diff --git a/annotations_1/oXpKBkMq_OM_filtered.json b/annotations_1/oXpKBkMq_OM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85fca763c0c3dde4ce2335a7a47272fc09295c52 --- /dev/null +++ b/annotations_1/oXpKBkMq_OM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 26.18], [27.0, 27.26], [29.0, 58.36]], "keep_status": [false, false, true], "silence_prob": [72.75, 0.0, 32.79], "audiomae_on_audioset": [null, null, [["music", 21.87], ["whack, thwack", 16.41], ["speech", 15.43]]], "duration": [6.18, 0.26, 29.36]} \ No newline at end of file diff --git a/annotations_1/oY0spjrKFdM_filtered.json b/annotations_1/oY0spjrKFdM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..653b11ffa4cf08116bf72ca61d4a11dea69b80c8 --- /dev/null +++ b/annotations_1/oY0spjrKFdM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.13], [11.0, 12.68], [17.0, 16.98], [24.0, 24.54], [34.0, 35.14], [38.0, 38.8], [45.0, 44.91], [46.0, 47.01], [59.0, 59.78], [61.0, 61.84], [67.0, 67.22], [71.0, 71.07], [72.0, 130.79], [133.0, 137.22], [142.0, 142.5], [148.0, 148.58], [160.0, 161.16], [164.0, 164.61], [167.0, 168.07], [175.0, 176.13], [180.0, 186.06], [187.0, 187.81], [191.0, 191.52], [198.0, 207.35], [208.0, 209.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.35, 0.0, 0.0, 31.21, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["brass instrument", 26.51], ["music", 24.26], ["trombone", 11.83]], null, null, null, null, null, null, [["music", 85.14], ["foghorn", 2.71], ["theremin", 1.08]], null, null, [["music", 74.86], ["boing", 4.4], ["theremin", 2.16]], null], "duration": [0.13, 1.68, -0.02, 0.54, 1.14, 0.8, -0.09, 1.01, 0.78, 0.84, 0.22, 0.07, 58.79, 4.22, 0.5, 0.58, 1.16, 0.61, 1.07, 1.13, 6.06, 0.81, 0.52, 9.35, 1.02]} \ No newline at end of file diff --git a/annotations_1/oY1tp2HG06w_filtered.json b/annotations_1/oY1tp2HG06w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d18f2f6395142a0f0402cb9c55902665f95ed70 --- /dev/null +++ b/annotations_1/oY1tp2HG06w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.58], [8.0, 18.89], [20.0, 23.4], [25.0, 35.21], [37.0, 38.38], [41.0, 45.2], [53.0, 53.59], [57.0, 57.59], [58.0, 59.36], [60.0, 61.21], [67.0, 68.91], [70.0, 71.68], [76.0, 76.59], [78.0, 78.12], [78.0, 83.07], [83.0, 84.25], [85.0, 98.58], [100.0, 100.79], [104.0, 104.3], [105.0, 106.15], [107.0, 108.18], [110.0, 111.11], [112.0, 114.59], [117.0, 119.16], [121.0, 122.3], [124.0, 124.87], [128.0, 130.27], [136.0, 136.59], [143.0, 144.24], [147.0, 149.37], [151.0, 161.15], [166.0, 167.61], [169.0, 170.06], [171.0, 171.76], [178.0, 178.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 51.99, 64.52, 67.89, 0.0, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.57, 0.0, 66.15, 0.0, 0.0, 0.0, 0.0, 0.0, 43.1, 52.27, 0.0, 0.0, 39.28, 0.0, 0.0, 99.93, 32.66, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 77.43], ["sidetone", 3.12], ["dial tone", 2.75]], null, null, null, [["speech", 24.02], ["music", 5.02], ["buzz", 2.98]], null, null, null, [["music", 38.76], ["domestic animals, pets", 9.33], ["animal", 7.47]], null, null, null, null], "duration": [0.58, 10.89, 3.4, 10.21, 1.38, 4.2, 0.59, 0.59, 1.36, 1.21, 1.91, 1.68, 0.59, 0.12, 5.07, 1.25, 13.58, 0.79, 0.3, 1.15, 1.18, 1.11, 2.59, 2.16, 1.3, 0.87, 2.27, 0.59, 1.24, 2.37, 10.15, 1.61, 1.06, 0.76, 0.12]} \ No newline at end of file diff --git a/annotations_1/oY31D4QSB-Y_filtered.json b/annotations_1/oY31D4QSB-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2dbdb3c675500878b624396fedb1469f3bcd00a2 --- /dev/null +++ b/annotations_1/oY31D4QSB-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.08], [13.0, 18.98], [21.0, 21.88], [22.0, 21.96], [26.0, 28.93], [31.0, 35.82], [37.0, 43.92], [44.0, 77.16], [78.0, 85.11], [89.0, 106.66], [108.0, 114.37], [116.0, 116.01], [118.0, 118.84], [119.0, 121.26], [122.0, 124.8]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [98.8, 32.22, 0.0, 0.0, 70.44, 62.27, 50.26, 0.0, 33.68, 32.17, 32.58, 0.0, 0.0, 58.89, 64.86], "audiomae_on_audioset": [null, [["speech", 34.21], ["music", 23.36], ["outside, rural or natural", 3.38]], null, null, null, null, null, null, [["music", 59.86], ["noise", 19.02], ["cacophony", 2.33]], [["music", 48.34], ["noise", 14.12], ["cacophony", 5.06]], [["whale vocalization", 63.88], ["music", 13.89], ["mosquito", 2.46]], null, null, null, null], "duration": [3.08, 5.98, 0.88, -0.04, 2.93, 4.82, 6.92, 33.16, 7.11, 17.66, 6.37, 0.01, 0.84, 2.26, 2.8]} \ No newline at end of file diff --git a/annotations_1/oYet52yPgu0_filtered.json b/annotations_1/oYet52yPgu0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c158709677b87a31090fda1e7f3ffc57decdac44 --- /dev/null +++ b/annotations_1/oYet52yPgu0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 69.94], [70.0, 70.53], [74.0, 78.24], [80.0, 80.96], [92.0, 91.93], [92.0, 95.57], [101.0, 101.9], [103.0, 103.3], [106.0, 106.88]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.86, 0.0, 0.0, 36.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["hum", 36.23], ["mains hum", 32.1], ["throbbing", 4.46]], null, null, [["speech", 40.45], ["music", 31.29], ["quack", 7.1]], null, null, null], "duration": [-0.06, 0.53, 4.24, 0.96, -0.07, 3.57, 0.9, 0.3, 0.88]} \ No newline at end of file diff --git a/annotations_1/oZ1Mz78d3wI_filtered.json b/annotations_1/oZ1Mz78d3wI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a53c52c6a4edcd2b3606e5c06a3c03ff37ef37e --- /dev/null +++ b/annotations_1/oZ1Mz78d3wI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 38.47], [39.0, 42.7], [43.0, 66.9], [67.0, 66.93], [69.0, 72.1], [75.0, 75.05], [77.0, 78.07], [81.0, 84.96], [85.0, 100.21], [101.0, 102.56], [104.0, 104.68], [107.0, 123.3], [125.0, 125.88], [127.0, 150.72], [151.0, 154.18], [157.0, 168.89]], "keep_status": [false, true, true, false, false, false, false, true, false, false, false, true, false, false, true, false], "silence_prob": [32.77, 31.01, 31.83, 0.0, 38.75, 0.0, 0.0, 40.92, 33.77, 0.0, 0.0, 39.18, 0.0, 32.48, 41.93, 35.47], "audiomae_on_audioset": [[["music", 77.05], ["throbbing", 3.53], ["hum", 1.96]], [["music", 35.19], ["singing", 7.17], ["chant", 6.74]], [["music", 55.09], ["throbbing", 5.6], ["synthesizer", 4.55]], null, [["music", 72.9], ["synthesizer", 6.33], ["pulse", 2.27]], null, null, [["music", 19.25], ["noise", 15.28], ["livestock, farm animals, working animals", 6.77]], [["music", 80.55], ["synthesizer", 3.19], ["noise", 2.58]], null, null, [["music", 29.41], ["fly, housefly", 18.23], ["insect", 9.52]], null, [["music", 77.84], ["groan", 4.35], ["carnatic music", 2.24]], [["music", 39.26], ["hum", 10.21], ["theremin", 9.22]], [["music", 58.07], ["theremin", 16.93], ["ambient music", 4.0]]], "duration": [24.47, 3.7, 23.9, -0.07, 3.1, 0.05, 1.07, 3.96, 15.21, 1.56, 0.68, 16.3, 0.88, 23.72, 3.18, 11.89]} \ No newline at end of file diff --git a/annotations_1/oZ28XpWmN00_filtered.json b/annotations_1/oZ28XpWmN00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..740813c2ac6c493f5e5b9499b2be913af49cc4d9 --- /dev/null +++ b/annotations_1/oZ28XpWmN00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.59], [8.0, 8.33], [12.0, 12.51], [21.0, 21.46], [31.0, 32.86], [36.0, 36.29], [42.0, 58.53], [59.0, 58.85], [60.0, 63.14], [64.0, 64.91], [66.0, 68.23], [71.0, 71.47], [76.0, 77.03], [80.0, 80.55], [82.0, 85.65], [96.0, 100.85], [106.0, 109.85], [112.0, 125.04]], "keep_status": [true, false, false, false, false, false, false, false, true, false, true, false, false, false, true, false, true, true], "silence_prob": [34.17, 0.0, 0.0, 0.0, 0.0, 0.0, 33.34, 0.0, 39.12, 0.0, 35.29, 0.0, 0.0, 0.0, 34.75, 34.63, 31.57, 32.03], "audiomae_on_audioset": [[["speech", 48.33], ["music", 17.43], ["hum", 3.79]], null, null, null, null, null, [["speech", 43.29], ["music", 28.56], ["buzz", 4.64]], null, [["speech", 28.29], ["hum", 15.36], ["mains hum", 11.76]], null, [["eruption", 22.67], ["music", 12.05], ["hum", 10.4]], null, null, null, [["speech", 15.42], ["eruption", 13.37], ["music", 10.89]], [["speech", 58.06], ["explosion", 10.38], ["eruption", 10.33]], [["speech", 33.64], ["music", 8.3], ["whack, thwack", 4.27]], [["music", 29.0], ["hum", 16.89], ["mains hum", 14.92]]], "duration": [3.59, 0.33, 0.51, 0.46, 1.86, 0.29, 16.53, -0.15, 3.14, 0.91, 2.23, 0.47, 1.03, 0.55, 3.65, 4.85, 3.85, 13.04]} \ No newline at end of file diff --git a/annotations_1/oZlQMLXqw0g_filtered.json b/annotations_1/oZlQMLXqw0g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f88c3718b9f0e792cb9d7b3186028c130744f1c --- /dev/null +++ b/annotations_1/oZlQMLXqw0g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.37], [6.0, 8.26], [13.0, 13.27], [17.0, 18.84], [22.0, 22.45], [22.0, 23.67], [29.0, 30.48], [34.0, 34.28], [36.0, 54.13], [59.0, 59.09], [61.0, 62.07], [68.0, 69.04], [70.0, 70.55], [73.0, 74.12], [75.0, 75.54], [83.0, 84.38], [85.0, 85.67], [87.0, 90.32], [99.0, 99.22], [102.0, 101.76], [103.0, 105.14], [108.0, 109.19], [110.0, 111.33], [114.0, 114.44], [115.0, 116.41], [117.0, 125.34], [126.0, 126.87], [128.0, 130.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.13, 0.0, 0.0, 55.89, 0.0, 0.0, 0.0, 0.0, 36.93, 0.0, 36.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.78], ["harp", 31.12], ["musical instrument", 11.24]], null, [["music", 34.88], ["harp", 21.56], ["musical instrument", 17.4]]], "duration": [0.37, 2.26, 0.27, 1.84, 0.45, 1.67, 1.48, 0.28, 18.13, 0.09, 1.07, 1.04, 0.55, 1.12, 0.54, 1.38, 0.67, 3.32, 0.22, -0.24, 2.14, 1.19, 1.33, 0.44, 1.41, 8.34, 0.87, 2.81]} \ No newline at end of file diff --git a/annotations_1/o_3BdeGhzrs_filtered.json b/annotations_1/o_3BdeGhzrs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a778f5b69050fd4910476b12b5b1abcab92db9a --- /dev/null +++ b/annotations_1/o_3BdeGhzrs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 15.8], [19.0, 20.48], [23.0, 43.16], [44.0, 55.44], [62.0, 72.98], [76.0, 145.98], [149.0, 155.9], [156.0, 156.63], [157.0, 157.91], [161.0, 184.57]], "keep_status": [false, false, false, false, true, false, true, false, false, false], "silence_prob": [30.51, 0.0, 30.43, 29.71, 29.85, 0.0, 31.35, 0.0, 0.0, 29.98], "audiomae_on_audioset": [[["speech", 39.54], ["music", 19.98], ["vehicle", 13.11]], null, [["music", 63.92], ["vehicle", 5.91], ["car", 5.03]], [["music", 50.91], ["throbbing", 10.5], ["hum", 9.85]], [["music", 54.92], ["electronic music", 5.48], ["hum", 4.85]], null, [["insect", 30.72], ["fly, housefly", 25.11], ["music", 12.49]], null, null, [["music", 42.68], ["throbbing", 22.27], ["hum", 14.69]]], "duration": [8.8, 1.48, 20.16, 11.44, 10.98, 69.98, 6.9, 0.63, 0.91, 23.57]} \ No newline at end of file diff --git a/annotations_1/oaKjYmfK_Pw_filtered.json b/annotations_1/oaKjYmfK_Pw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..097e3229cb8ceef0117aedb6261c5e7bad422a45 --- /dev/null +++ b/annotations_1/oaKjYmfK_Pw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.32], [3.0, 9.78], [11.0, 11.43], [13.0, 13.42], [15.0, 16.07], [17.0, 19.82], [21.0, 22.22], [23.0, 23.41], [26.0, 27.43], [32.0, 32.63], [35.0, 35.21], [39.0, 39.72], [50.0, 51.49], [52.0, 54.63], [59.0, 59.49], [61.0, 62.24], [63.0, 64.03], [65.0, 66.21], [68.0, 68.49], [73.0, 76.69], [78.0, 79.89], [80.0, 83.54], [85.0, 85.92], [95.0, 96.58], [104.0, 113.43], [116.0, 118.18], [121.0, 120.95], [121.0, 121.1], [123.0, 127.94], [138.0, 139.21], [141.0, 141.2], [143.0, 143.14], [144.0, 146.23], [147.0, 153.3], [154.0, 156.09], [158.0, 170.41], [172.0, 173.28], [174.0, 174.82], [176.0, 177.11], [178.0, 181.9], [184.0, 189.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.17, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.2, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 0.0, 39.49, 0.0, 0.0, 97.33, 99.88, 0.0, 0.0, 58.38, 0.0, 0.0, 0.0, 75.39, 99.84, 99.36, 72.46, 0.0, 0.0, 0.0, 68.15, 69.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 26.7], ["speech", 19.92], ["music", 9.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.32, 6.78, 0.43, 0.42, 1.07, 2.82, 1.22, 0.41, 1.43, 0.63, 0.21, 0.72, 1.49, 2.63, 0.49, 1.24, 1.03, 1.21, 0.49, 3.69, 1.89, 3.54, 0.92, 1.58, 9.43, 2.18, -0.05, 0.1, 4.94, 1.21, 0.2, 0.14, 2.23, 6.3, 2.09, 12.41, 1.28, 0.82, 1.11, 3.9, 5.57]} \ No newline at end of file diff --git a/annotations_1/ob2QomOgStQ_filtered.json b/annotations_1/ob2QomOgStQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e4eba83b3d2d04d2d3c9997f19c663675e500c7 --- /dev/null +++ b/annotations_1/ob2QomOgStQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 117.59], [124.0, 124.17], [124.0, 135.57], [136.0, 156.19], [158.0, 169.43], [171.0, 204.42]], "keep_status": [false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 29.13, 29.54, 30.04, 0.0], "audiomae_on_audioset": [null, null, [["hum", 17.73], ["music", 14.71], ["throbbing", 14.43]], [["music", 50.2], ["hum", 6.58], ["speech", 4.94]], [["music", 65.18], ["synthesizer", 5.48], ["speech", 5.48]], null], "duration": [100.59, 0.17, 11.57, 20.19, 11.43, 33.42]} \ No newline at end of file diff --git a/annotations_1/ob_6XAhj_1U_filtered.json b/annotations_1/ob_6XAhj_1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22af92ece19cf9c06ad0bc09a9fbb2375325edb9 --- /dev/null +++ b/annotations_1/ob_6XAhj_1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.21], [2.0, 2.61], [5.0, 5.73], [10.0, 10.56], [15.0, 16.21], [21.0, 22.2], [23.0, 23.14], [23.0, 24.36], [50.0, 49.96], [60.0, 66.61], [69.0, 69.84], [71.0, 73.67], [74.0, 75.96], [78.0, 78.66], [89.0, 92.42], [99.0, 99.01], [102.0, 102.17], [105.0, 106.17], [108.0, 114.84], [124.0, 126.06], [129.0, 130.91], [133.0, 133.56], [135.0, 136.61], [140.0, 141.69], [142.0, 143.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.4, 0.0, 38.54, 0.0, 0.0, 38.0, 0.0, 0.0, 0.0, 35.64, 39.15, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 43.78], ["hum", 16.6], ["throbbing", 11.34]], null, [["music", 86.93], ["hum", 1.92], ["throbbing", 1.69]], null, null, [["music", 44.48], ["cattle, bovinae", 8.57], ["moo", 6.22]], null, null, null, [["music", 39.7], ["speech", 10.26], ["throbbing", 6.88]], [["music", 31.54], ["speech", 8.18], ["fly, housefly", 5.98]], null, null, null, null, null], "duration": [0.21, 0.61, 0.73, 0.56, 1.21, 1.2, 0.14, 1.36, -0.04, 6.61, 0.84, 2.67, 1.96, 0.66, 3.42, 0.01, 0.17, 1.17, 6.84, 2.06, 1.91, 0.56, 1.61, 1.69, 1.02]} \ No newline at end of file diff --git a/annotations_1/obn9BZj6V-M_filtered.json b/annotations_1/obn9BZj6V-M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7261d2a4fb430b5b10fa07bbcc23a9e2109839d1 --- /dev/null +++ b/annotations_1/obn9BZj6V-M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.41], [5.0, 5.83], [9.0, 10.66], [15.0, 16.01], [18.0, 20.24], [24.0, 27.31], [29.0, 30.84], [33.0, 33.64], [37.0, 43.28], [45.0, 59.58], [61.0, 93.77], [95.0, 96.82], [98.0, 98.42], [100.0, 102.76], [106.0, 110.15], [115.0, 125.1], [127.0, 131.52], [135.0, 136.56], [139.0, 150.67], [153.0, 158.94], [161.0, 164.59], [167.0, 168.05], [170.0, 173.37], [175.0, 194.93], [196.0, 197.16], [198.0, 222.78], [223.0, 224.87], [225.0, 225.58], [227.0, 227.94], [229.0, 229.8]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, true, true, false, true, false, false, false, true, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 45.72, 52.16, 0.0, 0.0, 32.03, 28.78, 0.0, 0.0, 0.0, 30.66, 30.02, 30.77, 34.65, 0.0, 31.54, 30.2, 28.39, 0.0, 33.92, 28.9, 0.0, 28.95, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 29.83], ["singing bowl", 17.36], ["theremin", 10.22]], null, null, null, [["music", 37.93], ["whale vocalization", 13.49], ["synthesizer", 9.39]], [["speech", 62.94], ["music", 26.74], ["outside, rural or natural", 1.15]], null, null, null, [["speech", 15.56], ["foghorn", 14.88], ["civil defense siren", 9.51]], [["music", 36.29], ["fly, housefly", 7.13], ["mains hum", 7.06]], [["music", 46.71], ["theremin", 35.51], ["hum", 4.91]], [["music", 31.35], ["speech", 17.81], ["whale vocalization", 15.01]], null, [["music", 58.85], ["hum", 14.37], ["electronic music", 7.66]], [["mains hum", 26.84], ["hum", 26.81], ["music", 22.19]], [["music", 20.43], ["vehicle", 7.86], ["rumble", 7.57]], null, [["speech", 21.47], ["music", 16.32], ["civil defense siren", 9.71]], [["music", 66.79], ["theremin", 16.73], ["electronic music", 2.78]], null, [["music", 54.79], ["sound effect", 5.23], ["musical instrument", 3.48]], null, null, null, null], "duration": [0.41, 0.83, 1.66, 1.01, 2.24, 3.31, 1.84, 0.64, 6.28, 14.58, 32.77, 1.82, 0.42, 2.76, 4.15, 10.1, 4.52, 1.56, 11.67, 5.94, 3.59, 1.05, 3.37, 19.93, 1.16, 24.78, 1.87, 0.58, 0.94, 0.8]} \ No newline at end of file diff --git a/annotations_1/obnODOdLD7k_filtered.json b/annotations_1/obnODOdLD7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c64d82a9186cf9e806e4e1aeaf407904ec98dde4 --- /dev/null +++ b/annotations_1/obnODOdLD7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.21], [7.0, 7.33], [10.0, 10.02], [16.0, 20.02], [27.0, 30.35], [36.0, 36.44], [39.0, 39.26], [42.0, 42.8], [44.0, 45.22], [45.0, 47.16], [49.0, 49.81], [50.0, 51.44], [52.0, 55.56], [56.0, 58.41], [62.0, 62.28], [63.0, 65.85], [68.0, 67.78], [71.0, 71.46], [72.0, 73.48], [75.0, 75.76], [77.0, 77.45], [78.0, 79.76], [81.0, 83.05], [85.0, 87.18], [89.0, 90.04], [90.0, 91.57], [98.0, 101.04], [101.0, 105.85], [106.0, 106.22], [106.0, 108.35], [109.0, 108.57], [109.0, 118.3], [119.0, 120.92], [121.0, 121.71]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.72, 46.97, 0.0, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 44.87, 73.21, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 99.97, 0.0, 0.0, 98.59, 71.0, 0.0, 66.76, 0.0, 61.87, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 85.12], ["whack, thwack", 5.9], ["thunk", 3.49]], [["radio", 23.39], ["frog", 12.99], ["livestock, farm animals, working animals", 10.66]], null, null, null, null, null, null, null, [["speech", 34.74], ["radio", 14.44], ["whale vocalization", 7.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.21, 0.33, 0.02, 4.02, 3.35, 0.44, 0.26, 0.8, 1.22, 2.16, 0.81, 1.44, 3.56, 2.41, 0.28, 2.85, -0.22, 0.46, 1.48, 0.76, 0.45, 1.76, 2.05, 2.18, 1.04, 1.57, 3.04, 4.85, 0.22, 2.35, -0.43, 9.3, 1.92, 0.71]} \ No newline at end of file diff --git a/annotations_1/oc8bWybEFFI_filtered.json b/annotations_1/oc8bWybEFFI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41baa962a94d32db43d666ee174b2caf0933ee06 --- /dev/null +++ b/annotations_1/oc8bWybEFFI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.62], [17.0, 17.59], [19.0, 19.45], [26.0, 29.64], [32.0, 43.31], [47.0, 48.81], [50.0, 56.94], [62.0, 62.19], [64.0, 64.61], [74.0, 93.88], [94.0, 96.63], [123.0, 124.82], [125.0, 125.79], [127.0, 127.52], [130.0, 130.55], [132.0, 132.81], [134.0, 135.63], [138.0, 138.21], [140.0, 140.05], [142.0, 142.67], [145.0, 149.93], [155.0, 156.2], [165.0, 168.64], [177.0, 177.31], [178.0, 178.61], [179.0, 180.23]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 94.66, 32.21, 0.0, 33.1, 0.0, 0.0, 30.16, 39.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.31, 0.0, 42.02, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["gong", 73.31], ["music", 13.63], ["hum", 2.81]], null, [["mosquito", 66.4], ["fly, housefly", 14.69], ["whip", 5.33]], null, null, [["whack, thwack", 17.83], ["mosquito", 6.97], ["groan", 6.95]], [["music", 38.87], ["sidetone", 31.35], ["speech", 6.67]], null, null, null, null, null, null, null, null, null, [["speech", 27.43], ["fly, housefly", 25.5], ["insect", 19.03]], null, [["fly, housefly", 27.72], ["speech", 15.1], ["insect", 14.47]], null, null, null], "duration": [0.62, 0.59, 0.45, 3.64, 11.31, 1.81, 6.94, 0.19, 0.61, 19.88, 2.63, 1.82, 0.79, 0.52, 0.55, 0.81, 1.63, 0.21, 0.05, 0.67, 4.93, 1.2, 3.64, 0.31, 0.61, 1.23]} \ No newline at end of file diff --git a/annotations_1/ocDL_b6BRE4_filtered.json b/annotations_1/ocDL_b6BRE4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17f314315ebe6f1dcdf60b890b21920bc8da07e9 --- /dev/null +++ b/annotations_1/ocDL_b6BRE4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.08], [6.0, 7.87], [14.0, 14.15], [15.0, 15.9], [31.0, 33.17], [34.0, 35.65], [39.0, 39.07], [42.0, 44.04], [45.0, 47.07], [49.0, 49.81], [53.0, 53.3], [57.0, 57.6], [58.0, 60.72], [63.0, 71.85], [76.0, 78.63], [85.0, 86.58], [91.0, 92.33], [94.0, 95.77], [97.0, 99.5], [101.0, 106.84], [108.0, 109.19], [114.0, 114.49], [117.0, 116.9], [118.0, 118.44], [120.0, 120.77], [123.0, 124.39], [126.0, 128.6], [129.0, 128.63], [147.0, 149.99], [158.0, 158.62], [166.0, 166.46], [169.0, 170.83], [175.0, 178.29], [179.0, 184.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 73.06, 0.0, 0.0, 99.56, 67.89, 0.0, 0.0, 0.0, 73.51, 39.86, 91.98, 0.0, 0.0, 0.0, 77.7, 34.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.97, 0.0, 73.51, 0.0, 0.0, 0.0, 35.88, 90.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 29.99], ["wind instrument, woodwind instrument", 13.72], ["flute", 11.09]], null, null, null, null, null, [["music", 74.97], ["lullaby", 3.52], ["singing bowl", 3.06]], null, null, null, null, null, null, [["music", 63.67], ["theremin", 8.92], ["wind instrument, woodwind instrument", 2.86]], null, null, null, null, null, [["music", 48.16], ["theremin", 19.2], ["synthesizer", 4.37]], null], "duration": [0.08, 1.87, 0.15, 0.9, 2.17, 1.65, 0.07, 2.04, 2.07, 0.81, 0.3, 0.6, 2.72, 8.85, 2.63, 1.58, 1.33, 1.77, 2.5, 5.84, 1.19, 0.49, -0.1, 0.44, 0.77, 1.39, 2.6, -0.37, 2.99, 0.62, 0.46, 1.83, 3.29, 5.86]} \ No newline at end of file diff --git a/annotations_1/od6IxUWPMcs_filtered.json b/annotations_1/od6IxUWPMcs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8df0706b5a6293ff03489b62ab0cdd28466d4db --- /dev/null +++ b/annotations_1/od6IxUWPMcs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.29], [13.0, 13.07], [17.0, 31.45], [35.0, 35.78], [38.0, 39.83], [41.0, 45.25], [51.0, 55.21], [57.0, 57.37], [66.0, 68.52], [70.0, 77.26], [80.0, 81.4], [85.0, 87.35], [93.0, 93.66], [97.0, 97.17], [101.0, 101.24], [104.0, 106.34], [108.0, 110.29], [143.0, 149.15], [152.0, 152.51], [158.0, 159.49], [163.0, 164.94], [166.0, 166.7], [168.0, 172.47]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 33.14, 0.0, 0.0, 79.41, 47.2, 0.0, 54.63, 47.39, 0.0, 48.52, 0.0, 0.0, 0.0, 55.89, 55.18, 43.15, 0.0, 0.0, 0.0, 0.0, 48.14], "audiomae_on_audioset": [null, null, [["throbbing", 38.45], ["hum", 36.44], ["music", 13.98]], null, null, null, [["sidetone", 48.42], ["hum", 18.01], ["mains hum", 10.15]], null, null, [["sidetone", 49.02], ["throbbing", 10.16], ["speech", 9.52]], null, [["hum", 41.76], ["mains hum", 16.76], ["whale vocalization", 8.36]], null, null, null, null, null, [["hum", 31.53], ["speech", 14.26], ["throbbing", 13.92]], null, null, null, null, [["speech", 16.85], ["radio", 11.11], ["hum", 10.98]]], "duration": [0.29, 0.07, 14.45, 0.78, 1.83, 4.25, 4.21, 0.37, 2.52, 7.26, 1.4, 2.35, 0.66, 0.17, 0.24, 2.34, 2.29, 6.15, 0.51, 1.49, 1.94, 0.7, 4.47]} \ No newline at end of file diff --git a/annotations_1/odNZhZSydNc_filtered.json b/annotations_1/odNZhZSydNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34f89f8bf32ac4aac5af5a5bbfd3f4ccb31f12b3 --- /dev/null +++ b/annotations_1/odNZhZSydNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.71], [4.0, 4.53], [9.0, 14.07], [15.0, 15.9], [18.0, 17.64], [19.0, 19.52], [22.0, 22.57], [24.0, 24.8], [26.0, 26.7], [28.0, 28.39], [31.0, 33.27], [35.0, 35.68], [37.0, 37.56], [42.0, 44.64], [45.0, 46.09], [48.0, 48.39], [54.0, 55.17], [59.0, 59.51], [61.0, 61.32], [66.0, 67.71], [68.0, 68.34], [69.0, 69.89], [78.0, 82.76], [85.0, 89.8], [98.0, 98.49], [99.0, 99.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 62.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 0.0, 37.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.56, 29.84, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["wood", 19.79], ["music", 17.7], ["electric shaver, electric razor", 7.01]], null, null, null, null, null, null, null, null, [["mains hum", 44.05], ["hum", 42.9], ["electric shaver, electric razor", 5.28]], [["music", 37.07], ["electric shaver, electric razor", 19.1], ["wail, moan", 5.52]], null, null], "duration": [-0.29, 0.53, 5.07, 0.9, -0.36, 0.52, 0.57, 0.8, 0.7, 0.39, 2.27, 0.68, 0.56, 2.64, 1.09, 0.39, 1.17, 0.51, 0.32, 1.71, 0.34, 0.89, 4.76, 4.8, 0.49, 0.27]} \ No newline at end of file diff --git a/annotations_1/oeF5tq_zeqU_filtered.json b/annotations_1/oeF5tq_zeqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96886b61860237a2142711faf8f34de0c84bc628 --- /dev/null +++ b/annotations_1/oeF5tq_zeqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.51], [4.0, 16.51], [18.0, 20.36], [22.0, 23.72], [27.0, 26.84], [29.0, 33.12], [34.0, 38.31], [39.0, 39.78], [41.0, 44.0], [45.0, 52.1], [53.0, 57.23], [57.0, 58.38], [60.0, 62.06], [63.0, 63.9], [64.0, 66.46], [68.0, 72.23], [73.0, 74.04], [75.0, 75.2], [76.0, 80.77], [85.0, 93.26], [95.0, 95.93], [99.0, 102.81], [108.0, 111.67], [113.0, 114.05], [115.0, 149.91], [152.0, 159.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.16, 99.82, 0.0, 0.0, 65.79, 99.78, 0.0, 50.06, 73.67, 95.37, 0.0, 99.48, 0.0, 42.19, 94.37, 0.0, 0.0, 89.54, 88.28, 0.0, 95.37, 99.78, 0.0, 0.0, 57.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 30.06], ["singing bowl", 24.41], ["music", 9.72]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.51, 12.51, 2.36, 1.72, -0.16, 4.12, 4.31, 0.78, 3.0, 7.1, 4.23, 1.38, 2.06, 0.9, 2.46, 4.23, 1.04, 0.2, 4.77, 8.26, 0.93, 3.81, 3.67, 1.05, 34.91, 7.16]} \ No newline at end of file diff --git a/annotations_1/oeQ4HWhPEdA_filtered.json b/annotations_1/oeQ4HWhPEdA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..533223871b1826228013c068e0ed4384130e7615 --- /dev/null +++ b/annotations_1/oeQ4HWhPEdA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.28], [23.0, 23.95], [31.0, 31.13], [48.0, 47.98], [59.0, 59.12], [64.0, 64.42], [80.0, 80.52]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.28, 0.95, 0.13, -0.02, 0.12, 0.42, 0.52]} \ No newline at end of file diff --git a/annotations_1/oeW9lZBY-VM_filtered.json b/annotations_1/oeW9lZBY-VM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b3831dfa4b8aaa4212f094a3050206f8a3ef73d6 --- /dev/null +++ b/annotations_1/oeW9lZBY-VM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.12], [6.0, 5.83], [12.0, 12.34], [17.0, 21.14], [26.0, 26.67], [30.0, 30.18], [46.0, 46.75], [51.0, 55.71], [56.0, 55.95], [57.0, 59.07], [60.0, 61.97], [72.0, 73.18], [74.0, 75.29], [85.0, 86.7], [95.0, 94.9], [98.0, 103.13], [107.0, 107.5], [108.0, 112.21], [113.0, 114.29], [117.0, 117.76], [123.0, 124.41], [127.0, 127.8], [133.0, 136.58], [138.0, 141.29], [143.0, 142.7], [145.0, 145.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 73.82, 0.0, 0.0, 0.0, 82.79, 0.0, 98.59, 0.0, 0.0, 0.0, 0.0, 0.0, 43.48, 0.0, 90.43, 0.0, 0.0, 0.0, 0.0, 99.21, 93.76, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mantra", 21.12], ["lullaby", 12.91], ["male singing", 10.44]], null, null, null, null, null, null, null, null, null, null], "duration": [0.12, -0.17, 0.34, 4.14, 0.67, 0.18, 0.75, 4.71, -0.05, 2.07, 1.97, 1.18, 1.29, 1.7, -0.1, 5.13, 0.5, 4.21, 1.29, 0.76, 1.41, 0.8, 3.58, 3.29, -0.3, 0.71]} \ No newline at end of file diff --git a/annotations_1/oefn8TJ3_H8_filtered.json b/annotations_1/oefn8TJ3_H8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de8f7011013ba20ba3350c6568ff252194e2ae73 --- /dev/null +++ b/annotations_1/oefn8TJ3_H8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.23], [21.0, 24.43], [26.0, 26.59], [27.0, 30.2], [32.0, 33.12], [34.0, 37.23], [43.0, 44.54], [49.0, 51.29], [52.0, 52.35], [54.0, 54.92], [56.0, 59.85], [63.0, 68.25], [71.0, 73.01], [75.0, 76.3], [78.0, 80.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [61.08, 97.22, 0.0, 73.67, 0.0, 54.9, 0.0, 91.98, 0.0, 0.0, 87.55, 70.16, 92.31, 0.0, 89.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.23, 3.43, 0.59, 3.2, 1.12, 3.23, 1.54, 2.29, 0.35, 0.92, 3.85, 5.25, 2.01, 1.3, 2.32]} \ No newline at end of file diff --git a/annotations_1/oexJPg9rZqo_filtered.json b/annotations_1/oexJPg9rZqo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c13fe57e87a23d61541f6b25bee7d7d8834244a3 --- /dev/null +++ b/annotations_1/oexJPg9rZqo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 50.11], [53.0, 53.94], [55.0, 55.66], [57.0, 60.44], [63.0, 67.29], [71.0, 116.78], [120.0, 119.94], [122.0, 127.36]], "keep_status": [false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 29.11, 33.45, 0.0, 0.0, 29.64], "audiomae_on_audioset": [null, null, null, [["music", 31.42], ["throbbing", 9.22], ["speech", 6.98]], [["music", 40.95], ["speech", 18.44], ["sidetone", 5.63]], null, null, [["sidetone", 30.25], ["speech", 28.89], ["music", 9.7]]], "duration": [32.11, 0.94, 0.66, 3.44, 4.29, 45.78, -0.06, 5.36]} \ No newline at end of file diff --git a/annotations_1/oezKQEF0deY_filtered.json b/annotations_1/oezKQEF0deY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..710c9b50e409698f9a0eb4105e38c48af89fea2d --- /dev/null +++ b/annotations_1/oezKQEF0deY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.2], [11.0, 13.59], [15.0, 22.1], [23.0, 25.66], [27.0, 29.08], [30.0, 33.74], [35.0, 59.44], [64.0, 80.87]], "keep_status": [false, false, false, false, false, false, true, false], "silence_prob": [65.09, 65.2, 58.22, 90.95, 98.51, 96.17, 47.5, 39.11], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 17.82], ["speech", 16.69], ["noise", 11.14]], [["music", 66.62], ["tubular bells", 7.37], ["chime", 3.4]]], "duration": [2.2, 2.59, 7.1, 2.66, 2.08, 3.74, 24.44, 16.87]} \ No newline at end of file diff --git a/annotations_1/of7H9H_aPxg_filtered.json b/annotations_1/of7H9H_aPxg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c4262ddc9b60e2452e1cb767d625420432be7d5 --- /dev/null +++ b/annotations_1/of7H9H_aPxg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.1], [7.0, 7.2], [8.0, 8.36], [10.0, 32.58]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 32.69], "audiomae_on_audioset": [null, null, null, [["hum", 24.32], ["speech", 18.49], ["music", 17.69]]], "duration": [0.1, 0.2, 0.36, 22.58]} \ No newline at end of file diff --git a/annotations_1/oflbCHWZCBU_filtered.json b/annotations_1/oflbCHWZCBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c9e5fe578fbd8ecd73c4ea1d67623d8dda1c8cd8 --- /dev/null +++ b/annotations_1/oflbCHWZCBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.52], [5.0, 5.49], [7.0, 10.62], [11.0, 12.12], [15.0, 15.53], [17.0, 21.14], [24.0, 24.41], [26.0, 27.43], [28.0, 30.1], [31.0, 32.83], [34.0, 37.34], [39.0, 40.59], [42.0, 42.84], [44.0, 46.06], [46.0, 46.2], [46.0, 49.74], [55.0, 56.81], [61.0, 64.18], [66.0, 65.94], [66.0, 66.01], [67.0, 70.19], [71.0, 75.63], [77.0, 91.42], [94.0, 96.21], [97.0, 97.19], [101.0, 102.24], [103.0, 103.99], [106.0, 112.63], [113.0, 114.44], [119.0, 120.7], [126.0, 127.3], [132.0, 134.42], [137.0, 150.5], [155.0, 160.54], [164.0, 167.17], [169.0, 173.35], [180.0, 180.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.18, 0.0, 0.0, 90.43, 0.0, 0.0, 81.53, 0.0, 32.29, 0.0, 0.0, 31.98, 0.0, 31.17, 0.0, 31.3, 0.0, 0.0, 32.14, 31.16, 31.19, 42.48, 0.0, 0.0, 0.0, 36.04, 0.0, 0.0, 0.0, 31.74, 30.24, 30.25, 31.58, 31.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 76.72], ["guitar", 4.98], ["musical instrument", 4.4]], null, null, [["music", 65.76], ["guitar", 5.88], ["plucked string instrument", 4.42]], null, [["music", 71.19], ["boing", 8.47], ["speech", 5.29]], null, [["music", 74.74], ["bass guitar", 3.82], ["country", 2.08]], null, null, [["music", 73.4], ["guitar", 3.27], ["bass guitar", 3.23]], [["music", 48.92], ["musical instrument", 6.1], ["singing", 5.7]], [["music", 85.78], ["country", 2.04], ["musical instrument", 1.99]], [["music", 65.53], ["speech", 1.39], ["musical instrument", 1.23]], null, null, null, [["music", 68.03], ["speech", 3.74], ["musical instrument", 1.87]], null, null, null, [["music", 74.45], ["synthesizer", 4.1], ["musical instrument", 2.82]], [["music", 87.01], ["didgeridoo", 8.42], ["musical instrument", 0.74]], [["music", 76.12], ["didgeridoo", 4.44], ["livestock, farm animals, working animals", 3.16]], [["music", 71.64], ["speech", 3.07], ["guitar", 1.16]], [["music", 80.62], ["musical instrument", 2.26], ["bass guitar", 1.99]], null], "duration": [1.52, 0.49, 3.62, 1.12, 0.53, 4.14, 0.41, 1.43, 2.1, 1.83, 3.34, 1.59, 0.84, 2.06, 0.2, 3.74, 1.81, 3.18, -0.06, 0.01, 3.19, 4.63, 14.42, 2.21, 0.19, 1.24, 0.99, 6.63, 1.44, 1.7, 1.3, 2.42, 13.5, 5.54, 3.17, 4.35, 0.4]} \ No newline at end of file diff --git a/annotations_1/oflnRQP6Woo_filtered.json b/annotations_1/oflnRQP6Woo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..907c8be30404ced43c5786ba600226a4fb80a2b8 --- /dev/null +++ b/annotations_1/oflnRQP6Woo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.75], [23.0, 27.06], [30.0, 33.22], [35.0, 36.85], [37.0, 82.71], [90.0, 90.42], [93.0, 113.22], [114.0, 117.14], [117.0, 118.52], [119.0, 119.7], [120.0, 120.88], [122.0, 122.22], [123.0, 129.03], [131.0, 136.83], [139.0, 144.8], [146.0, 146.13], [147.0, 149.96], [150.0, 151.07], [152.0, 152.36], [154.0, 156.78], [160.0, 171.85], [180.0, 179.56], [182.0, 186.87], [191.0, 191.64]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 36.67, 37.09, 0.0, 0.0, 0.0, 41.52, 39.41, 0.0, 0.0, 0.0, 0.0, 39.83, 62.68, 99.48, 0.0, 67.63, 0.0, 0.0, 34.8, 31.37, 0.0, 33.26, 0.0], "audiomae_on_audioset": [null, [["speech", 38.74], ["music", 21.15], ["hum", 9.43]], [["music", 43.74], ["throbbing", 9.89], ["hum", 9.66]], null, null, null, [["music", 59.43], ["hum", 15.23], ["throbbing", 6.18]], [["speech", 42.65], ["music", 39.68], ["synthesizer", 2.61]], null, null, null, null, [["music", 35.66], ["speech", 20.41], ["animal", 6.42]], null, null, null, null, null, null, [["music", 75.66], ["synthesizer", 7.67], ["musical instrument", 2.44]], [["music", 82.06], ["throbbing", 2.09], ["electronic music", 1.48]], null, [["music", 36.77], ["boing", 15.79], ["speech", 10.89]], null], "duration": [0.75, 4.06, 3.22, 1.85, 45.71, 0.42, 20.22, 3.14, 1.52, 0.7, 0.88, 0.22, 6.03, 5.83, 5.8, 0.13, 2.96, 1.07, 0.36, 2.78, 11.85, -0.44, 4.87, 0.64]} \ No newline at end of file diff --git a/annotations_1/ogUC0Fcvh7g_filtered.json b/annotations_1/ogUC0Fcvh7g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d1d34cbceff3332838a7efaf0c961d0b5167d1f --- /dev/null +++ b/annotations_1/ogUC0Fcvh7g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.59], [5.0, 6.79], [7.0, 8.28], [9.0, 9.56], [10.0, 16.88], [17.0, 22.5], [38.0, 38.55], [55.0, 54.84], [57.0, 57.55], [61.0, 61.82], [68.0, 68.74], [91.0, 91.35], [95.0, 95.45], [104.0, 106.2], [110.0, 109.75], [111.0, 111.38]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.42, 30.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.4, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["bee, wasp, etc.", 20.63], ["insect", 15.14], ["fly, housefly", 9.89]], [["fly, housefly", 37.81], ["insect", 31.99], ["mains hum", 9.52]], null, null, null, null, null, null, null, [["speech", 25.86], ["hum", 12.72], ["sidetone", 7.19]], null, null], "duration": [0.59, 1.79, 1.28, 0.56, 6.88, 5.5, 0.55, -0.16, 0.55, 0.82, 0.74, 0.35, 0.45, 2.2, -0.25, 0.38]} \ No newline at end of file diff --git a/annotations_1/oiQPOmrEAxo_filtered.json b/annotations_1/oiQPOmrEAxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06ba077d92bd4d628a75e2145b0b7dbdf5d3c39f --- /dev/null +++ b/annotations_1/oiQPOmrEAxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.46], [10.0, 24.48], [28.0, 38.77], [43.0, 73.06], [73.0, 73.18], [73.0, 76.69], [79.0, 79.71], [82.0, 90.66], [91.0, 108.3], [108.0, 108.45], [109.0, 116.65], [120.0, 125.46], [127.0, 130.37], [132.0, 134.97], [136.0, 136.95], [137.0, 146.52], [149.0, 182.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 28.92, 29.15, 0.0, 0.0, 29.13, 0.0, 28.82, 28.93, 0.0, 31.36, 34.28, 31.26, 29.54, 0.0, 29.56, 0.0], "audiomae_on_audioset": [null, [["music", 64.88], ["speech", 6.65], ["hum", 5.12]], [["speech", 53.12], ["music", 33.51], ["throbbing", 1.9]], null, null, [["music", 55.31], ["synthesizer", 10.25], ["electronic music", 4.63]], null, [["speech", 46.35], ["music", 41.97], ["hum", 1.63]], [["music", 36.7], ["speech", 36.39], ["throbbing", 4.97]], null, [["music", 46.31], ["electronic music", 16.9], ["soundtrack music", 6.25]], [["music", 28.65], ["synthesizer", 12.53], ["hum", 11.86]], [["music", 59.94], ["speech", 20.98], ["boing", 7.31]], [["music", 63.95], ["stomach rumble", 4.65], ["whale vocalization", 4.59]], null, [["speech", 48.4], ["music", 39.93], ["synthesizer", 1.39]], null], "duration": [0.46, 14.48, 10.77, 30.06, 0.18, 3.69, 0.71, 8.66, 17.3, 0.45, 7.65, 5.46, 3.37, 2.97, 0.95, 9.52, 33.21]} \ No newline at end of file diff --git a/annotations_1/oiYBUM-EE-w_filtered.json b/annotations_1/oiYBUM-EE-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b454e9e94fb34d886f0dae4bd9fdffe5d61f98ce --- /dev/null +++ b/annotations_1/oiYBUM-EE-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 31.83], [37.0, 37.37], [48.0, 48.56], [72.0, 71.83], [81.0, 87.29], [88.0, 92.79], [109.0, 123.48], [126.0, 125.81], [128.0, 127.72]], "keep_status": [true, false, false, false, true, true, true, false, false], "silence_prob": [33.55, 0.0, 0.0, 0.0, 30.64, 29.67, 29.96, 0.0, 0.0], "audiomae_on_audioset": [[["music", 30.25], ["synthesizer", 14.86], ["musical instrument", 9.34]], null, null, null, [["speech", 42.98], ["vehicle", 9.4], ["explosion", 9.11]], [["speech", 32.22], ["explosion", 28.23], ["eruption", 7.13]], [["hum", 15.68], ["noise", 15.06], ["music", 14.92]], null, null], "duration": [4.83, 0.37, 0.56, -0.17, 6.29, 4.79, 14.48, -0.19, -0.28]} \ No newline at end of file diff --git a/annotations_1/ojoC-Kbzpo8_filtered.json b/annotations_1/ojoC-Kbzpo8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcb33f494af3af5e3cf55acbbef7646ebaf10242 --- /dev/null +++ b/annotations_1/ojoC-Kbzpo8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 24.66], [28.0, 27.94], [28.0, 33.12], [33.0, 33.44], [37.0, 38.28], [44.0, 44.49], [79.0, 80.25], [80.0, 81.65], [122.0, 131.72], [133.0, 140.71], [142.0, 157.96], [159.0, 160.61]], "keep_status": [true, false, true, false, false, false, false, false, true, true, true, false], "silence_prob": [37.46, 0.0, 34.82, 0.0, 0.0, 0.0, 0.0, 0.0, 29.42, 30.46, 28.61, 0.0], "audiomae_on_audioset": [[["music", 25.12], ["didgeridoo", 15.09], ["chorus effect", 5.89]], null, [["chant", 16.53], ["music", 14.88], ["didgeridoo", 12.05]], null, null, null, null, null, [["livestock, farm animals, working animals", 17.91], ["music", 12.03], ["cowbell", 8.22]], [["speech", 12.09], ["whack, thwack", 9.57], ["burst, pop", 8.42]], [["livestock, farm animals, working animals", 18.53], ["cattle, bovinae", 14.13], ["moo", 6.23]], null], "duration": [5.66, -0.06, 5.12, 0.44, 1.28, 0.49, 1.25, 1.65, 9.72, 7.71, 15.96, 1.61]} \ No newline at end of file diff --git a/annotations_1/ok6H1OFTmyA_filtered.json b/annotations_1/ok6H1OFTmyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7474fe6e7680c39f0a375ae3e6329f1a98f330c --- /dev/null +++ b/annotations_1/ok6H1OFTmyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.97], [3.0, 3.75], [4.0, 5.81], [9.0, 10.76], [12.0, 13.69], [14.0, 17.02], [18.0, 21.63], [22.0, 23.25], [25.0, 26.69], [29.0, 28.76], [30.0, 31.13], [32.0, 33.66], [35.0, 45.33], [46.0, 47.97], [50.0, 49.92], [52.0, 53.0], [54.0, 56.93], [58.0, 60.37], [61.0, 63.42], [64.0, 67.37], [68.0, 71.24], [72.0, 72.82], [74.0, 74.82], [75.0, 76.47], [78.0, 80.01], [80.0, 82.61], [83.0, 84.21], [86.0, 86.73], [88.0, 88.43], [90.0, 90.34], [91.0, 91.91], [94.0, 95.01], [96.0, 110.91], [113.0, 118.64], [120.0, 123.55], [125.0, 125.44], [126.0, 128.28], [129.0, 133.32], [134.0, 135.84], [137.0, 140.17], [142.0, 142.48], [144.0, 149.25], [151.0, 156.37], [157.0, 160.49], [162.0, 167.24], [168.0, 180.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 60.6, 72.75, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 0.0, 90.43, 88.64, 75.88, 99.73, 84.98, 0.0, 0.0, 0.0, 97.43, 54.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 95.64, 93.91, 0.0, 80.29, 78.38, 0.0, 92.15, 0.0, 93.29, 87.92, 90.95, 89.54, 52.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.03, 0.75, 1.81, 1.76, 1.69, 3.02, 3.63, 1.25, 1.69, -0.24, 1.13, 1.66, 10.33, 1.97, -0.08, 1.0, 2.93, 2.37, 2.42, 3.37, 3.24, 0.82, 0.82, 1.47, 2.01, 2.61, 1.21, 0.73, 0.43, 0.34, 0.91, 1.01, 14.91, 5.64, 3.55, 0.44, 2.28, 4.32, 1.84, 3.17, 0.48, 5.25, 5.37, 3.49, 5.24, 12.23]} \ No newline at end of file diff --git a/annotations_1/onO71_aItKA_filtered.json b/annotations_1/onO71_aItKA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b90978086008c97b04ee3deaea3c8dd4a50d6fa8 --- /dev/null +++ b/annotations_1/onO71_aItKA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.56], [8.0, 10.32], [13.0, 13.12], [15.0, 17.58], [18.0, 21.74], [22.0, 24.06], [25.0, 26.35], [27.0, 32.26], [36.0, 38.25], [40.0, 46.62], [47.0, 48.61], [50.0, 49.77], [52.0, 52.76], [54.0, 54.46], [55.0, 54.62], [55.0, 62.68], [64.0, 75.37], [76.0, 76.55], [79.0, 88.28], [89.0, 89.18], [90.0, 96.62], [108.0, 110.51], [112.0, 112.43], [115.0, 121.41], [122.0, 122.93], [124.0, 127.72], [130.0, 130.82], [131.0, 131.94], [138.0, 139.26], [140.0, 145.76]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 71.57, 0.0, 64.18, 51.12, 48.31, 0.0, 57.32, 75.07, 58.13, 0.0, 0.0, 0.0, 0.0, 0.0, 43.87, 48.74, 0.0, 43.58, 0.0, 32.56, 29.83, 0.0, 28.69, 0.0, 30.14, 0.0, 0.0, 0.0, 35.47], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 40.44], ["sidetone", 26.64], ["throbbing", 5.88]], null, null, null, null, null, null, null, null, null, [["frog", 54.35], ["music", 7.22], ["effects unit", 5.94]], [["hum", 18.88], ["animal", 17.01], ["speech", 10.9]], null, [["speech", 25.79], ["mains hum", 20.16], ["hum", 10.96]], null, [["speech", 65.83], ["didgeridoo", 9.55], ["music", 7.63]], [["speech", 76.81], ["music", 9.3], ["didgeridoo", 2.05]], null, [["gong", 41.24], ["hum", 13.59], ["mains hum", 6.95]], null, [["didgeridoo", 83.92], ["music", 6.06], ["musical instrument", 2.43]], null, null, null, [["music", 44.01], ["speech", 12.05], ["synthesizer", 6.83]]], "duration": [0.56, 2.32, 0.12, 2.58, 3.74, 2.06, 1.35, 5.26, 2.25, 6.62, 1.61, -0.23, 0.76, 0.46, -0.38, 7.68, 11.37, 0.55, 9.28, 0.18, 6.62, 2.51, 0.43, 6.41, 0.93, 3.72, 0.82, 0.94, 1.26, 5.76]} \ No newline at end of file diff --git a/annotations_1/onesjJyXdFQ_filtered.json b/annotations_1/onesjJyXdFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dbefb6828283a0ded696ce4f001fe0096b272ed9 --- /dev/null +++ b/annotations_1/onesjJyXdFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.6], [9.0, 10.34], [12.0, 13.47], [16.0, 18.18], [21.0, 22.54], [24.0, 25.44], [29.0, 29.24], [31.0, 32.02], [35.0, 36.78], [41.0, 40.83], [42.0, 42.77], [45.0, 45.74], [50.0, 50.52], [52.0, 52.89], [56.0, 56.74], [60.0, 62.55], [64.0, 65.16], [69.0, 69.77], [78.0, 78.29], [88.0, 92.31], [93.0, 94.96], [97.0, 98.31], [100.0, 101.44], [102.0, 103.17], [107.0, 110.13], [111.0, 113.39], [119.0, 118.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 92.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.6, 1.34, 1.47, 2.18, 1.54, 1.44, 0.24, 1.02, 1.78, -0.17, 0.77, 0.74, 0.52, 0.89, 0.74, 2.55, 1.16, 0.77, 0.29, 4.31, 1.96, 1.31, 1.44, 1.17, 3.13, 2.39, -0.06]} \ No newline at end of file diff --git a/annotations_1/oo5SkNM3c1Y_filtered.json b/annotations_1/oo5SkNM3c1Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0f5a11302e696669208cde9e7f6d8339fae97e6 --- /dev/null +++ b/annotations_1/oo5SkNM3c1Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.75], [26.0, 26.92], [30.0, 31.24], [36.0, 39.39], [41.0, 43.39], [45.0, 45.27], [48.0, 49.17], [50.0, 52.54], [53.0, 55.36], [56.0, 56.76], [61.0, 60.93], [64.0, 66.48], [67.0, 67.53], [68.0, 68.96], [69.0, 71.34], [73.0, 74.22], [82.0, 82.92], [84.0, 84.75], [90.0, 105.0], [108.0, 109.38], [111.0, 111.01], [112.0, 112.43], [114.0, 120.5], [126.0, 126.93], [128.0, 129.39], [131.0, 132.11], [144.0, 144.49], [146.0, 147.16], [148.0, 152.76], [156.0, 156.56], [160.0, 160.74], [163.0, 163.58], [167.0, 168.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.76, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 60.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.75, 0.92, 1.24, 3.39, 2.39, 0.27, 1.17, 2.54, 2.36, 0.76, -0.07, 2.48, 0.53, 0.96, 2.34, 1.22, 0.92, 0.75, 15.0, 1.38, 0.01, 0.43, 6.5, 0.93, 1.39, 1.11, 0.49, 1.16, 4.76, 0.56, 0.74, 0.58, 1.12]} \ No newline at end of file diff --git a/annotations_1/oo7VlD66ISM_filtered.json b/annotations_1/oo7VlD66ISM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c0a290516cf053cd25c6bb73130fbff6b126187 --- /dev/null +++ b/annotations_1/oo7VlD66ISM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.49], [9.0, 10.67], [21.0, 21.27], [28.0, 28.41], [33.0, 33.81], [37.0, 37.61], [43.0, 43.19], [82.0, 83.35], [92.0, 92.85]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.49, 1.67, 0.27, 0.41, 0.81, 0.61, 0.19, 1.35, 0.85]} \ No newline at end of file diff --git a/annotations_1/ooS5gVdYgRQ_filtered.json b/annotations_1/ooS5gVdYgRQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9bfb04bf5da2e32ee8d56c90ef0126800e9614b8 --- /dev/null +++ b/annotations_1/ooS5gVdYgRQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[64.0, 66.63], [77.0, 78.39], [85.0, 84.79], [88.0, 88.55], [93.0, 93.31]], "keep_status": [true, false, false, false, false], "silence_prob": [29.19, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 37.07], ["explosion", 10.52], ["music", 4.63]], null, null, null, null], "duration": [2.63, 1.39, -0.21, 0.55, 0.31]} \ No newline at end of file diff --git a/annotations_1/opSAGkaqx6Y_filtered.json b/annotations_1/opSAGkaqx6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7a5b6d283a203d11d99ca48757c2a8177bd1d2e --- /dev/null +++ b/annotations_1/opSAGkaqx6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.8], [22.0, 44.76], [46.0, 74.01], [82.0, 81.85], [87.0, 87.42], [98.0, 98.86], [104.0, 103.81], [105.0, 105.61], [110.0, 110.35], [110.0, 111.5], [119.0, 119.25], [124.0, 124.09], [125.0, 126.52], [128.0, 128.16], [129.0, 130.17], [131.0, 130.98], [135.0, 135.87], [138.0, 138.33], [139.0, 140.22], [147.0, 150.9], [153.0, 153.17], [154.0, 155.17], [165.0, 165.3], [174.0, 173.8], [174.0, 175.17], [180.0, 180.5]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.39, 29.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 49.4], ["sine wave", 7.71], ["singing bowl", 6.0]], [["music", 11.45], ["whack, thwack", 8.12], ["hum", 6.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 66.87], ["synthesizer", 4.21], ["hum", 3.08]], null, null, null, null, null, null], "duration": [1.8, 22.76, 28.01, -0.15, 0.42, 0.86, -0.19, 0.61, 0.35, 1.5, 0.25, 0.09, 1.52, 0.16, 1.17, -0.02, 0.87, 0.33, 1.22, 3.9, 0.17, 1.17, 0.3, -0.2, 1.17, 0.5]} \ No newline at end of file diff --git a/annotations_1/opWPxmr2h2s_filtered.json b/annotations_1/opWPxmr2h2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e299f34773867ae066cbe53ff0d00a9fefc748a --- /dev/null +++ b/annotations_1/opWPxmr2h2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.5], [11.0, 12.34], [18.0, 18.49], [20.0, 26.76], [29.0, 29.49], [30.0, 30.54], [38.0, 37.99], [59.0, 59.12], [75.0, 76.96], [78.0, 80.55], [83.0, 85.06], [87.0, 88.23], [89.0, 89.31], [92.0, 93.45], [94.0, 94.63], [96.0, 95.94], [99.0, 99.35], [100.0, 101.11], [108.0, 108.3], [109.0, 109.58], [110.0, 110.62], [111.0, 111.84], [113.0, 116.07], [118.0, 120.24], [122.0, 123.33], [125.0, 126.91], [132.0, 133.66], [137.0, 139.62], [143.0, 144.68]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.04, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 76.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.29, 76.37, 0.0, 0.0, 0.0, 74.6, 0.0], "audiomae_on_audioset": [null, null, null, [["fart", 20.19], ["groan", 16.38], ["grunt", 10.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 1.34, 0.49, 6.76, 0.49, 0.54, -0.01, 0.12, 1.96, 2.55, 2.06, 1.23, 0.31, 1.45, 0.63, -0.06, 0.35, 1.11, 0.3, 0.58, 0.62, 0.84, 3.07, 2.24, 1.33, 1.91, 1.66, 2.62, 1.68]} \ No newline at end of file diff --git a/annotations_1/opXI29YEI5s_filtered.json b/annotations_1/opXI29YEI5s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a1985eedc2d051eadc880c3be88a4b65981c0c40 --- /dev/null +++ b/annotations_1/opXI29YEI5s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.95], [15.0, 15.43], [29.0, 29.62], [33.0, 34.86], [38.0, 37.89], [38.0, 39.09], [40.0, 41.74], [46.0, 46.5], [51.0, 51.73], [54.0, 54.4], [55.0, 102.79], [115.0, 116.36], [119.0, 118.86], [119.0, 165.21], [166.0, 171.39], [172.0, 173.37], [174.0, 182.97], [187.0, 187.1], [193.0, 195.18], [197.0, 198.53], [207.0, 210.07], [211.0, 212.6], [213.0, 215.16], [216.0, 216.68], [221.0, 221.88], [223.0, 223.42], [225.0, 225.9], [231.0, 232.02], [233.0, 233.78], [235.0, 235.01]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.23, 0.0, 39.66, 0.0, 65.67, 0.0, 55.67, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 39.45], ["music", 22.56], ["hum", 6.17]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["vehicle", 21.74], ["car", 11.24], ["buzz", 7.51]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.95, 0.43, 0.62, 1.86, -0.11, 1.09, 1.74, 0.5, 0.73, 0.4, 47.79, 1.36, -0.14, 46.21, 5.39, 1.37, 8.97, 0.1, 2.18, 1.53, 3.07, 1.6, 2.16, 0.68, 0.88, 0.42, 0.9, 1.02, 0.78, 0.01]} \ No newline at end of file diff --git a/annotations_1/opyh8AAgisI_filtered.json b/annotations_1/opyh8AAgisI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..479b3cccc8e407997a68ce7226232fc23d49d421 --- /dev/null +++ b/annotations_1/opyh8AAgisI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.02], [13.0, 16.06], [18.0, 24.81], [28.0, 33.12], [33.0, 35.61], [36.0, 37.29], [38.0, 38.3], [39.0, 48.0], [51.0, 52.49], [53.0, 57.89], [60.0, 62.77], [65.0, 68.94], [72.0, 75.68], [77.0, 77.8], [84.0, 84.1], [88.0, 94.9], [96.0, 97.71], [102.0, 102.74], [104.0, 105.21], [108.0, 112.16], [113.0, 115.97], [116.0, 120.77], [122.0, 126.23], [127.0, 134.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.47, 79.94, 87.0, 94.81, 96.54, 0.0, 0.0, 99.96, 0.0, 98.8, 100.0, 100.0, 100.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 94.66, 92.15, 76.7, 82.25, 87.19], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.02, 3.06, 6.81, 5.12, 2.61, 1.29, 0.3, 9.0, 1.49, 4.89, 2.77, 3.94, 3.68, 0.8, 0.1, 6.9, 1.71, 0.74, 1.21, 4.16, 2.97, 4.77, 4.23, 7.25]} \ No newline at end of file diff --git a/annotations_1/oqGij9ylbAk_filtered.json b/annotations_1/oqGij9ylbAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ada8b4802b0bdefeabbf14d9a15662732db07b04 --- /dev/null +++ b/annotations_1/oqGij9ylbAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.12], [14.0, 24.8], [26.0, 92.2]], "keep_status": [false, true, false], "silence_prob": [0.0, 37.07, 0.0], "audiomae_on_audioset": [null, [["music", 30.01], ["speech", 19.85], ["hum", 9.1]], null], "duration": [0.12, 10.8, 66.2]} \ No newline at end of file diff --git a/annotations_1/oqQGFh5yiWE_filtered.json b/annotations_1/oqQGFh5yiWE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c6ba41dff5e6421a63c8ecb6671a22e7e7ace73e --- /dev/null +++ b/annotations_1/oqQGFh5yiWE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.29], [3.0, 3.69], [9.0, 9.49], [12.0, 12.73], [14.0, 15.42], [20.0, 20.44], [24.0, 25.86], [27.0, 32.22], [35.0, 35.58], [36.0, 37.07], [38.0, 43.5], [45.0, 45.71], [48.0, 48.61], [54.0, 54.45], [62.0, 61.86], [70.0, 70.8], [77.0, 77.67], [81.0, 81.68], [82.0, 82.61], [85.0, 85.08], [92.0, 92.25], [97.0, 98.54], [106.0, 107.05], [113.0, 113.12], [116.0, 116.56], [122.0, 122.12], [126.0, 127.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 36.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 32.72], ["moo", 16.01], ["cattle, bovinae", 13.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 0.69, 0.49, 0.73, 1.42, 0.44, 1.86, 5.22, 0.58, 1.07, 5.5, 0.71, 0.61, 0.45, -0.14, 0.8, 0.67, 0.68, 0.61, 0.08, 0.25, 1.54, 1.05, 0.12, 0.56, 0.12, 1.04]} \ No newline at end of file diff --git a/annotations_1/oqquLzHmH5k_filtered.json b/annotations_1/oqquLzHmH5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f2be9ee6f2ed3dadd73aefd5d6496a7a0ed3cbf --- /dev/null +++ b/annotations_1/oqquLzHmH5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.96], [4.0, 5.27], [6.0, 8.97], [11.0, 13.29], [14.0, 19.35], [22.0, 22.37], [23.0, 24.81], [25.0, 27.94], [31.0, 31.14], [37.0, 37.86], [39.0, 39.65], [40.0, 40.86], [43.0, 43.39], [45.0, 45.96], [48.0, 49.15], [54.0, 54.92], [57.0, 59.24], [63.0, 63.81], [70.0, 72.45], [81.0, 83.15], [87.0, 88.26], [90.0, 91.0], [95.0, 96.87], [100.0, 100.23], [102.0, 103.44], [105.0, 106.0], [108.0, 108.11], [110.0, 109.88], [110.0, 111.16], [113.0, 114.15], [115.0, 115.57], [117.0, 118.15], [120.0, 121.93], [128.0, 128.19], [130.0, 132.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 75.72, 99.93, 99.36, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 87.19, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.96, 1.27, 2.97, 2.29, 5.35, 0.37, 1.81, 2.94, 0.14, 0.86, 0.65, 0.86, 0.39, 0.96, 1.15, 0.92, 2.24, 0.81, 2.45, 2.15, 1.26, 1.0, 1.87, 0.23, 1.44, 1.0, 0.11, -0.12, 1.16, 1.15, 0.57, 1.15, 1.93, 0.19, 2.48]} \ No newline at end of file diff --git a/annotations_1/or6rCLpiS10_filtered.json b/annotations_1/or6rCLpiS10_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..600ac9530b46f81ea7935c736c1493d7d8654ce5 --- /dev/null +++ b/annotations_1/or6rCLpiS10_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 103.59], [107.0, 122.89]], "keep_status": [false, true], "silence_prob": [0.0, 28.48], "audiomae_on_audioset": [null, [["speech", 54.45], ["music", 6.03], ["explosion", 4.75]]], "duration": [94.59, 15.89]} \ No newline at end of file diff --git a/annotations_1/os1x0te4Waw_filtered.json b/annotations_1/os1x0te4Waw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6715e309a819ee16522edf5c35dcae2ee360dc3 --- /dev/null +++ b/annotations_1/os1x0te4Waw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.31], [10.0, 13.46], [15.0, 18.28], [24.0, 24.58], [27.0, 28.29], [32.0, 32.76], [39.0, 41.0], [45.0, 45.82], [52.0, 52.81], [55.0, 54.85], [57.0, 58.09], [63.0, 64.13], [66.0, 66.33], [66.0, 67.73], [72.0, 73.63], [75.0, 77.73], [79.0, 80.87], [84.0, 85.89], [89.0, 96.2], [99.0, 99.52], [100.0, 104.18], [108.0, 124.6]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.73, 52.05, 53.28, 0.0, 0.0, 0.0, 58.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.32, 0.0, 0.0, 68.28, 0.0, 65.67, 31.73], "audiomae_on_audioset": [[["fly, housefly", 11.35], ["insect", 10.03], ["speech", 9.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 51.42], ["speech", 31.15], ["music", 6.09]]], "duration": [2.31, 3.46, 3.28, 0.58, 1.29, 0.76, 2.0, 0.82, 0.81, -0.15, 1.09, 1.13, 0.33, 1.73, 1.63, 2.73, 1.87, 1.89, 7.2, 0.52, 4.18, 16.6]} \ No newline at end of file diff --git a/annotations_1/os7KKfG3QE0_filtered.json b/annotations_1/os7KKfG3QE0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dd8205c58bbd059ada1b74784e59556d5ecad2c --- /dev/null +++ b/annotations_1/os7KKfG3QE0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.11], [13.0, 13.69], [19.0, 20.16], [21.0, 21.54], [23.0, 23.31], [36.0, 39.51], [41.0, 41.67], [44.0, 44.17], [47.0, 51.58], [52.0, 51.61], [52.0, 51.68], [52.0, 51.71], [52.0, 51.75], [54.0, 54.6], [55.0, 55.49], [58.0, 57.72], [61.0, 61.28], [75.0, 75.19], [79.0, 80.94], [82.0, 89.55], [100.0, 100.55], [101.0, 101.9], [105.0, 106.0], [112.0, 112.68], [116.0, 116.04], [117.0, 118.4], [120.0, 119.62], [127.0, 128.12], [130.0, 130.89], [134.0, 134.42], [136.0, 136.24], [140.0, 140.46], [141.0, 143.36], [144.0, 144.69], [146.0, 146.7], [149.0, 149.03], [151.0, 151.14], [156.0, 156.57], [158.0, 165.86], [168.0, 169.86]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 41.32, 0.0, 0.0, 42.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.22, 0.0, 0.0, 0.0, 0.0, 0.0, 30.56, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 28.43], ["fart", 9.16], ["speech", 6.45]], null, null, [["hum", 21.3], ["music", 16.12], ["speech", 11.17]], null, null, null, null, null, null, null, null, null, null, [["music", 25.39], ["whale vocalization", 23.4], ["livestock, farm animals, working animals", 16.31]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.96], ["chirp tone", 8.45], ["music", 8.21]], null, null, null, null, null, [["speech", 30.26], ["livestock, farm animals, working animals", 27.53], ["cattle, bovinae", 7.97]], null], "duration": [1.11, 0.69, 1.16, 0.54, 0.31, 3.51, 0.67, 0.17, 4.58, -0.39, -0.32, -0.29, -0.25, 0.6, 0.49, -0.28, 0.28, 0.19, 1.94, 7.55, 0.55, 0.9, 1.0, 0.68, 0.04, 1.4, -0.38, 1.12, 0.89, 0.42, 0.24, 0.46, 2.36, 0.69, 0.7, 0.03, 0.14, 0.57, 7.86, 1.86]} \ No newline at end of file diff --git a/annotations_1/osE84bZ1jNc_filtered.json b/annotations_1/osE84bZ1jNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cb37968f79266f810fa531a856c4da58fa9c8b6 --- /dev/null +++ b/annotations_1/osE84bZ1jNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.57], [4.0, 4.75], [6.0, 10.62], [12.0, 13.09], [14.0, 14.67], [15.0, 16.19], [18.0, 19.97], [21.0, 24.0], [24.0, 27.04], [30.0, 30.89], [31.0, 32.44], [33.0, 34.79], [38.0, 38.3], [39.0, 40.04], [41.0, 45.17], [46.0, 47.78], [48.0, 48.69], [50.0, 81.35], [82.0, 84.32], [85.0, 90.78], [91.0, 94.83], [95.0, 95.66], [97.0, 97.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 84.98, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 34.04, 29.65, 30.45, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.43], ["theremin", 14.51], ["music", 10.76]], [["didgeridoo", 23.65], ["music", 16.8], ["foghorn", 13.28]], [["fart", 55.98], ["music", 8.6], ["speech", 6.21]], null, null], "duration": [0.57, 0.75, 4.62, 1.09, 0.67, 1.19, 1.97, 3.0, 3.04, 0.89, 1.44, 1.79, 0.3, 1.04, 4.17, 1.78, 0.69, 31.35, 2.32, 5.78, 3.83, 0.66, 0.8]} \ No newline at end of file diff --git a/annotations_1/osLhRtHZ4Gw_filtered.json b/annotations_1/osLhRtHZ4Gw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59a5aca66af652d5656f3a651afa0a0a260d6992 --- /dev/null +++ b/annotations_1/osLhRtHZ4Gw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.75], [11.0, 46.85], [49.0, 49.27], [50.0, 49.92], [51.0, 51.81], [53.0, 53.82], [54.0, 55.86], [56.0, 56.05], [56.0, 56.08], [56.0, 56.12], [56.0, 56.15], [57.0, 61.21], [64.0, 66.77], [68.0, 69.85], [70.0, 71.2], [77.0, 77.8], [79.0, 79.15], [80.0, 80.64], [82.0, 82.63], [84.0, 84.11], [89.0, 89.46], [92.0, 92.62], [93.0, 95.39], [96.0, 96.96], [103.0, 113.19], [115.0, 115.26], [117.0, 117.49], [119.0, 120.11], [121.0, 121.9], [123.0, 123.77], [126.0, 126.67], [128.0, 129.81], [134.0, 138.82], [141.0, 141.39], [143.0, 143.45], [145.0, 146.69], [149.0, 154.62], [155.0, 157.06], [158.0, 158.43], [164.0, 164.1], [167.0, 166.99], [167.0, 171.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.74, 31.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.12, 0.0, 30.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.87, 0.0, 0.0, 0.0, 34.07, 33.5, 0.0, 0.0, 0.0, 32.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.63], ["whack, thwack", 16.6], ["breaking", 9.09]], [["mains hum", 38.6], ["hum", 30.73], ["speech", 6.96]], null, null, null, null, null, null, null, null, null, [["rumble", 25.24], ["speech", 22.28], ["music", 5.16]], null, [["music", 35.7], ["speech", 31.53], ["fart", 5.21]], null, null, null, null, null, null, null, [["speech", 23.16], ["hum", 15.17], ["rumble", 14.91]], null, null, null, [["speech", 49.93], ["music", 7.84], ["hum", 5.52]], [["speech", 55.09], ["music", 11.22], ["whale vocalization", 4.76]], null, null, null, [["whack, thwack", 50.43], ["breaking", 14.66], ["thump, thud", 11.34]]], "duration": [0.75, 35.85, 0.27, -0.08, 0.81, 0.82, 1.86, 0.05, 0.08, 0.12, 0.15, 4.21, 2.77, 1.85, 1.2, 0.8, 0.15, 0.64, 0.63, 0.11, 0.46, 0.62, 2.39, 0.96, 10.19, 0.26, 0.49, 1.11, 0.9, 0.77, 0.67, 1.81, 4.82, 0.39, 0.45, 1.69, 5.62, 2.06, 0.43, 0.1, -0.01, 4.44]} \ No newline at end of file diff --git a/annotations_1/otOIqHsnQZY_filtered.json b/annotations_1/otOIqHsnQZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4329735b6aa37cf743d6413fb060af8120f57336 --- /dev/null +++ b/annotations_1/otOIqHsnQZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.09], [9.0, 9.9], [13.0, 14.23], [25.0, 25.88], [28.0, 28.49], [29.0, 30.13], [36.0, 36.39], [36.0, 38.55], [41.0, 41.52], [43.0, 44.9], [53.0, 54.24], [54.0, 54.73], [61.0, 62.43], [63.0, 64.44], [65.0, 66.46], [67.0, 67.31], [68.0, 68.18], [69.0, 69.03], [69.0, 70.23], [71.0, 70.98], [71.0, 71.64], [72.0, 72.17], [74.0, 74.07], [75.0, 77.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["boing", 49.0], ["speech", 19.38], ["music", 15.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 17.34], ["boing", 12.33], ["smash, crash", 11.55]]], "duration": [1.09, 0.9, 1.23, 0.88, 0.49, 1.13, 0.39, 2.55, 0.52, 1.9, 1.24, 0.73, 1.43, 1.44, 1.46, 0.31, 0.18, 0.03, 1.23, -0.02, 0.64, 0.17, 0.07, 2.67]} \ No newline at end of file diff --git a/annotations_1/ouQG7Pcq1S8_filtered.json b/annotations_1/ouQG7Pcq1S8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd144b512fd3aebaa0c395888ad788f8774b9dac --- /dev/null +++ b/annotations_1/ouQG7Pcq1S8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.53], [18.0, 22.52], [24.0, 25.02], [28.0, 28.27], [31.0, 30.99], [34.0, 34.82], [35.0, 35.09], [35.0, 42.63], [43.0, 46.13], [53.0, 63.27], [65.0, 71.15], [75.0, 76.1], [79.0, 82.04], [83.0, 85.72], [98.0, 111.75], [120.0, 122.25], [123.0, 126.84], [128.0, 128.76], [129.0, 130.69], [134.0, 133.66], [136.0, 136.43], [138.0, 137.89], [142.0, 141.84], [149.0, 149.93], [153.0, 153.37], [154.0, 154.65], [156.0, 156.44]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.7, 32.11, 32.44, 31.55, 0.0, 37.84, 35.77, 77.53, 61.57, 39.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 50.6], ["speech", 19.47], ["boing", 4.24]], null, null, null, null, null, [["music", 52.56], ["speech", 21.93], ["boing", 4.38]], [["music", 43.0], ["bow-wow", 12.37], ["dog", 9.22]], [["boing", 37.38], ["music", 25.73], ["whack, thwack", 24.38]], [["music", 48.03], ["groan", 8.17], ["boing", 4.67]], null, [["speech", 37.89], ["cattle, bovinae", 9.61], ["music", 7.98]], [["hum", 35.24], ["music", 19.38], ["whale vocalization", 8.99]], null, null, [["music", 36.2], ["speech", 32.08], ["hum", 3.3]], null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 4.52, 1.02, 0.27, -0.01, 0.82, 0.09, 7.63, 3.13, 10.27, 6.15, 1.1, 3.04, 2.72, 13.75, 2.25, 3.84, 0.76, 1.69, -0.34, 0.43, -0.11, -0.16, 0.93, 0.37, 0.65, 0.44]} \ No newline at end of file diff --git a/annotations_1/ovFDrgui4a0_filtered.json b/annotations_1/ovFDrgui4a0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2683276f5e886941d239d59c4044d7ced50f8fa --- /dev/null +++ b/annotations_1/ovFDrgui4a0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 13.1], [15.0, 28.51], [31.0, 34.33], [35.0, 36.26], [38.0, 62.06], [63.0, 76.37]], "keep_status": [true, false, true, false, false, true], "silence_prob": [32.6, 36.15, 36.69, 0.0, 32.25, 30.4], "audiomae_on_audioset": [[["music", 50.39], ["hum", 7.94], ["mains hum", 5.04]], [["music", 61.53], ["hum", 6.76], ["ambient music", 6.27]], [["music", 58.9], ["musical instrument", 4.49], ["guitar", 4.07]], null, [["music", 77.31], ["echo", 4.05], ["livestock, farm animals, working animals", 1.99]], [["bow-wow", 26.12], ["music", 16.69], ["yip", 12.25]]], "duration": [12.1, 13.51, 3.33, 1.26, 24.06, 13.37]} \ No newline at end of file diff --git a/annotations_1/ovPXL1WPTMA_filtered.json b/annotations_1/ovPXL1WPTMA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebd4a498990976f377c7082fb54221be6e78af84 --- /dev/null +++ b/annotations_1/ovPXL1WPTMA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 26.81], [29.0, 34.42], [37.0, 40.83], [41.0, 44.51], [46.0, 56.73], [60.0, 61.57], [63.0, 65.03], [67.0, 75.95], [77.0, 77.57]], "keep_status": [false, false, true, true, false, false, true, true, false], "silence_prob": [50.11, 79.41, 40.82, 49.87, 49.36, 0.0, 34.34, 31.09, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.69], ["speech", 22.9], ["hum", 5.52]], [["music", 27.42], ["hum", 13.34], ["fly, housefly", 8.28]], [["music", 73.85], ["synthesizer", 2.52], ["boing", 1.94]], null, [["mosquito", 25.32], ["music", 16.48], ["fly, housefly", 11.81]], [["fly, housefly", 28.11], ["music", 17.38], ["mosquito", 17.34]], null], "duration": [16.81, 5.42, 3.83, 3.51, 10.73, 1.57, 2.03, 8.95, 0.57]} \ No newline at end of file diff --git a/annotations_1/ovxjAnlr7qg_filtered.json b/annotations_1/ovxjAnlr7qg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67d253cb77dea62abeee0b3940ae8b45623cffb9 --- /dev/null +++ b/annotations_1/ovxjAnlr7qg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.53], [20.0, 20.14], [24.0, 24.49], [40.0, 40.86], [42.0, 42.96], [70.0, 69.79], [77.0, 77.14], [77.0, 82.31], [84.0, 86.04], [89.0, 91.0], [92.0, 97.56], [100.0, 100.03], [101.0, 102.52], [104.0, 105.43], [106.0, 113.0], [121.0, 122.4], [130.0, 135.33], [139.0, 142.47], [144.0, 144.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.64, 53.04, 53.28, 33.53, 0.0, 0.0, 0.0, 40.17, 0.0, 41.3, 50.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 67.81], ["didgeridoo", 8.45], ["guitar", 4.86]], null, null, [["speech", 35.23], ["music", 21.25], ["sidetone", 11.03]], null, null, null, [["music", 64.81], ["musical instrument", 3.06], ["speech", 2.62]], null, [["music", 36.89], ["speech", 12.01], ["didgeridoo", 5.81]], null, null], "duration": [1.53, 0.14, 0.49, 0.86, 0.96, -0.21, 0.14, 5.31, 2.04, 2.0, 5.56, 0.03, 1.52, 1.43, 7.0, 1.4, 5.33, 3.47, 0.91]} \ No newline at end of file diff --git a/annotations_1/ow3Pf0LSXwc_filtered.json b/annotations_1/ow3Pf0LSXwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b98f77933a876bf5af8ed9bc017d117b44b30fb6 --- /dev/null +++ b/annotations_1/ow3Pf0LSXwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 24.14], [25.0, 28.17], [30.0, 32.39], [33.0, 33.81], [37.0, 39.24], [48.0, 56.86], [61.0, 71.32], [76.0, 97.58]], "keep_status": [true, true, true, false, false, false, true, false], "silence_prob": [36.11, 38.46, 45.3, 0.0, 38.33, 34.01, 34.07, 32.97], "audiomae_on_audioset": [[["music", 24.86], ["didgeridoo", 11.2], ["hum", 11.01]], [["music", 55.42], ["speech", 6.07], ["theremin", 4.97]], [["music", 55.14], ["synthesizer", 7.36], ["musical instrument", 4.22]], null, [["music", 51.18], ["throbbing", 15.3], ["hum", 7.56]], [["music", 63.76], ["synthesizer", 8.95], ["theremin", 8.21]], [["speech", 45.56], ["hum", 11.89], ["music", 10.98]], [["hum", 45.41], ["mains hum", 42.16], ["music", 5.25]]], "duration": [3.14, 3.17, 2.39, 0.81, 2.24, 8.86, 10.32, 21.58]} \ No newline at end of file diff --git a/annotations_1/ox1SVCutwv4_filtered.json b/annotations_1/ox1SVCutwv4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6e392c242640a7105cba67534cb472860f46c62 --- /dev/null +++ b/annotations_1/ox1SVCutwv4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.65], [30.0, 30.43], [31.0, 32.66], [34.0, 34.38], [35.0, 37.81], [39.0, 59.61], [65.0, 81.43], [83.0, 85.19], [86.0, 92.5], [93.0, 95.91], [97.0, 101.58], [105.0, 119.52], [123.0, 137.08], [140.0, 146.8], [149.0, 152.59], [157.0, 157.4], [158.0, 161.84], [165.0, 166.01], [168.0, 180.1]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.74, 29.34, 29.82, 35.28, 33.14, 38.08, 34.38, 30.46, 29.86, 35.6, 56.03, 0.0, 37.98, 0.0, 35.51], "audiomae_on_audioset": [null, null, null, null, [["music", 22.96], ["breaking", 10.06], ["whack, thwack", 5.58]], [["speech", 36.64], ["music", 31.98], ["cacophony", 8.8]], [["music", 57.89], ["hum", 10.7], ["throbbing", 10.09]], [["music", 30.53], ["throbbing", 28.35], ["hum", 11.32]], [["music", 68.03], ["electronic music", 7.37], ["synthesizer", 4.54]], [["music", 52.13], ["gong", 15.53], ["hum", 7.83]], [["music", 44.1], ["ambient music", 8.18], ["hum", 6.67]], [["music", 31.68], ["hum", 26.3], ["throbbing", 19.98]], [["music", 36.31], ["throbbing", 27.55], ["hum", 19.02]], [["hum", 39.42], ["mains hum", 34.45], ["speech", 5.09]], null, null, [["hum", 17.5], ["heart sounds, heartbeat", 15.18], ["music", 12.62]], null, [["mains hum", 40.24], ["hum", 39.67], ["throbbing", 5.9]]], "duration": [0.65, 0.43, 1.66, 0.38, 2.81, 20.61, 16.43, 2.19, 6.5, 2.91, 4.58, 14.52, 14.08, 6.8, 3.59, 0.4, 3.84, 1.01, 12.1]} \ No newline at end of file diff --git a/annotations_1/oyU6En9HN8E_filtered.json b/annotations_1/oyU6En9HN8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4c1de3da89a1736ec43ddf16b4de643ce353cbd --- /dev/null +++ b/annotations_1/oyU6En9HN8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [8.0, 20.17], [24.0, 24.21], [25.0, 32.58], [34.0, 36.51], [38.0, 38.97], [40.0, 41.98], [44.0, 57.6], [59.0, 59.71], [64.0, 65.91], [72.0, 75.2], [110.0, 109.83], [117.0, 118.74], [128.0, 128.68], [130.0, 130.89], [134.0, 134.37], [135.0, 146.11], [163.0, 164.05], [165.0, 166.43], [166.0, 166.5], [167.0, 167.46]], "keep_status": [false, true, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.74, 0.0, 39.46, 38.1, 0.0, 0.0, 36.07, 0.0, 0.0, 30.98, 0.0, 0.0, 0.0, 0.0, 0.0, 34.3, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 23.87], ["fly, housefly", 12.18], ["buzz", 9.07]], null, [["fly, housefly", 18.63], ["speech", 18.16], ["bee, wasp, etc.", 8.55]], [["music", 17.77], ["throbbing", 13.98], ["hum", 9.26]], null, null, [["livestock, farm animals, working animals", 12.83], ["clip-clop", 12.46], ["horse", 11.92]], null, null, [["beatboxing", 62.41], ["speech", 22.59], ["music", 5.67]], null, null, null, null, null, [["speech", 81.56], ["sidetone", 4.15], ["radio", 3.99]], null, null, null, null], "duration": [0.51, 12.17, 0.21, 7.58, 2.51, 0.97, 1.98, 13.6, 0.71, 1.91, 3.2, -0.17, 1.74, 0.68, 0.89, 0.37, 11.11, 1.05, 1.43, 0.5, 0.46]} \ No newline at end of file diff --git a/annotations_1/oyZblWujofQ_filtered.json b/annotations_1/oyZblWujofQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b6982326ddfc8ac0828ca77fcb742950348780a --- /dev/null +++ b/annotations_1/oyZblWujofQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.84], [8.0, 9.39], [10.0, 10.62], [14.0, 14.34], [16.0, 18.15], [20.0, 20.7], [22.0, 26.81], [27.0, 28.21], [32.0, 60.02], [64.0, 65.4], [67.0, 78.93], [81.0, 81.73], [83.0, 84.94], [85.0, 85.72], [86.0, 86.9]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.63, 0.0, 31.74, 0.0, 30.61, 0.0, 30.17, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["explosion", 27.53], ["music", 17.4], ["burst, pop", 11.81]], null, [["speech", 66.3], ["explosion", 7.82], ["music", 5.03]], null, [["speech", 61.92], ["machine gun", 18.01], ["cacophony", 2.56]], null, [["speech", 26.26], ["machine gun", 9.45], ["explosion", 8.59]], null, null, null, null], "duration": [-0.16, 1.39, 0.62, 0.34, 2.15, 0.7, 4.81, 1.21, 28.02, 1.4, 11.93, 0.73, 1.94, 0.72, 0.9]} \ No newline at end of file diff --git a/annotations_1/oymR3xfYh4c_filtered.json b/annotations_1/oymR3xfYh4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc83d9e4bd4a8d0a8080033fa011fce693020c10 --- /dev/null +++ b/annotations_1/oymR3xfYh4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 44.19], [45.0, 45.47], [46.0, 64.45], [65.0, 65.94], [67.0, 88.55], [91.0, 91.45], [92.0, 105.95], [107.0, 113.12], [115.0, 136.71], [137.0, 147.7], [148.0, 149.89], [150.0, 151.12], [152.0, 174.33], [175.0, 176.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.97, 0.0, 93.29, 0.0, 87.19, 0.0, 56.7, 73.97, 87.74, 39.82, 0.0, 0.0, 61.27, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["sidetone", 37.01], ["speech", 25.14], ["hum", 12.93]], null, null, null, null], "duration": [7.19, 0.47, 18.45, 0.94, 21.55, 0.45, 13.95, 6.12, 21.71, 10.7, 1.89, 1.12, 22.33, 1.0]} \ No newline at end of file diff --git a/annotations_1/oyqIjdFcJVg_filtered.json b/annotations_1/oyqIjdFcJVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5be2ecc7b3e18b2c066b228c4356f2adc429e741 --- /dev/null +++ b/annotations_1/oyqIjdFcJVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 23.82], [26.0, 27.68], [45.0, 45.23], [45.0, 45.87], [47.0, 49.25], [50.0, 50.65], [51.0, 55.41], [56.0, 56.24], [58.0, 59.07]], "keep_status": [true, false, false, false, false, false, true, false, false], "silence_prob": [33.13, 0.0, 0.0, 0.0, 31.67, 0.0, 41.5, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 58.12], ["horse", 4.22], ["radio", 3.65]], null, null, null, [["telephone bell ringing", 48.28], ["telephone", 11.52], ["ringtone", 10.43]], null, [["speech", 46.84], ["radio", 14.97], ["sidetone", 6.92]], null, null], "duration": [12.82, 1.68, 0.23, 0.87, 2.25, 0.65, 4.41, 0.24, 1.07]} \ No newline at end of file diff --git a/annotations_1/oyuHdD6ORAg_filtered.json b/annotations_1/oyuHdD6ORAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0a5d80a3da8366c93ee9d6a559e083123a97cc7 --- /dev/null +++ b/annotations_1/oyuHdD6ORAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.2], [9.0, 13.54], [14.0, 97.77]], "keep_status": [false, false, false], "silence_prob": [0.0, 29.07, 0.0], "audiomae_on_audioset": [null, [["music", 50.94], ["speech", 27.67], ["electronic music", 2.72]], null], "duration": [0.2, 4.54, 83.77]} \ No newline at end of file diff --git a/annotations_1/ozkF8KRjeO8_filtered.json b/annotations_1/ozkF8KRjeO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a03cf282e8614ce338d60638b52bf78b87383fb8 --- /dev/null +++ b/annotations_1/ozkF8KRjeO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.51], [7.0, 19.47], [20.0, 28.93], [32.0, 63.07], [64.0, 64.79], [65.0, 65.99], [67.0, 67.88], [70.0, 72.79], [80.0, 97.97], [99.0, 110.96], [111.0, 112.92], [113.0, 116.78], [122.0, 123.31]], "keep_status": [true, true, true, false, false, false, false, true, false, false, false, true, false], "silence_prob": [35.84, 37.15, 33.61, 0.0, 0.0, 0.0, 0.0, 45.4, 31.11, 29.92, 0.0, 32.37, 0.0], "audiomae_on_audioset": [[["cattle, bovinae", 27.17], ["livestock, farm animals, working animals", 15.77], ["moo", 13.95]], [["cattle, bovinae", 25.68], ["moo", 19.85], ["livestock, farm animals, working animals", 18.92]], [["speech", 38.7], ["vehicle", 18.85], ["buzz", 7.54]], null, null, null, null, [["fly, housefly", 32.52], ["mosquito", 15.84], ["insect", 6.24]], [["music", 75.07], ["synthesizer", 4.99], ["musical instrument", 3.88]], [["music", 80.11], ["grunt", 2.21], ["synthesizer", 1.42]], null, [["cattle, bovinae", 26.42], ["moo", 22.33], ["livestock, farm animals, working animals", 13.52]], null], "duration": [5.51, 12.47, 8.93, 31.07, 0.79, 0.99, 0.88, 2.79, 17.97, 11.96, 1.92, 3.78, 1.31]} \ No newline at end of file diff --git a/annotations_1/p-tvo3Hz3nw_filtered.json b/annotations_1/p-tvo3Hz3nw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..589e01587e61758681f521ffb746d5f4a62ac3ff --- /dev/null +++ b/annotations_1/p-tvo3Hz3nw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 23.41], [32.0, 37.2], [40.0, 45.2], [46.0, 47.76], [50.0, 78.51], [82.0, 82.16], [88.0, 91.74], [93.0, 94.76]], "keep_status": [true, false, true, false, false, false, true, false], "silence_prob": [29.81, 68.28, 33.77, 0.0, 34.57, 0.0, 44.52, 0.0], "audiomae_on_audioset": [[["music", 32.78], ["smash, crash", 15.04], ["whack, thwack", 10.45]], null, [["cattle, bovinae", 15.95], ["livestock, farm animals, working animals", 15.44], ["animal", 7.41]], null, [["hum", 39.33], ["throbbing", 30.2], ["music", 8.32]], null, [["music", 50.14], ["synthesizer", 6.97], ["electronic music", 5.66]], null], "duration": [15.41, 5.2, 5.2, 1.76, 28.51, 0.16, 3.74, 1.76]} \ No newline at end of file diff --git a/annotations_1/p03u3v6GF-Y_filtered.json b/annotations_1/p03u3v6GF-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca84335babd313913e683bc73fdcf67d9d613732 --- /dev/null +++ b/annotations_1/p03u3v6GF-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.98], [10.0, 16.77], [24.0, 28.29], [33.0, 49.18], [56.0, 59.19], [61.0, 79.86], [80.0, 86.02], [93.0, 104.89], [107.0, 116.48], [116.0, 116.51], [117.0, 116.95], [117.0, 127.45], [132.0, 134.0], [137.0, 144.9]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 35.37, 33.3, 32.09, 32.48, 32.47, 32.79, 33.18, 32.09, 0.0, 0.0, 32.66, 36.58, 33.67], "audiomae_on_audioset": [null, [["music", 39.71], ["gong", 31.89], ["musical instrument", 4.81]], [["music", 51.32], ["synthesizer", 10.24], ["musical instrument", 7.9]], [["music", 73.5], ["musical instrument", 7.21], ["echo", 2.73]], [["music", 86.89], ["musical instrument", 2.2], ["echo", 0.83]], [["music", 67.37], ["musical instrument", 7.94], ["trombone", 3.97]], [["music", 81.0], ["musical instrument", 4.96], ["theremin", 4.79]], [["music", 57.08], ["musical instrument", 12.27], ["brass instrument", 9.72]], [["music", 61.37], ["synthesizer", 7.88], ["musical instrument", 7.47]], null, null, [["music", 38.25], ["trombone", 27.28], ["brass instrument", 19.96]], [["music", 48.37], ["theremin", 25.41], ["effects unit", 7.41]], [["gong", 38.01], ["music", 16.39], ["synthesizer", 6.7]]], "duration": [0.98, 6.77, 4.29, 16.18, 3.19, 18.86, 6.02, 11.89, 9.48, 0.51, -0.05, 10.45, 2.0, 7.9]} \ No newline at end of file diff --git a/annotations_1/p07sXB8H3zQ_filtered.json b/annotations_1/p07sXB8H3zQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb5488ec9b043fdea4b14663d67551a5b27b39e8 --- /dev/null +++ b/annotations_1/p07sXB8H3zQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.32], [10.0, 10.2], [12.0, 12.38], [20.0, 24.24], [26.0, 28.7], [31.0, 32.22], [33.0, 34.3], [36.0, 36.36], [38.0, 38.4], [42.0, 42.67], [44.0, 47.53], [58.0, 58.75], [63.0, 67.85], [69.0, 71.61], [76.0, 81.84], [87.0, 89.5]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.27, 31.62, 0.0, 0.0, 0.0, 0.0, 0.0, 36.16, 0.0, 31.41, 32.33, 31.53, 32.68], "audiomae_on_audioset": [null, null, null, [["music", 42.07], ["hum", 20.02], ["electronic music", 6.1]], [["music", 29.26], ["speech", 28.91], ["hum", 6.75]], null, null, null, null, null, [["music", 50.98], ["didgeridoo", 12.18], ["speech", 6.88]], null, [["speech", 47.1], ["whale vocalization", 22.78], ["music", 7.82]], [["speech", 69.45], ["chuckle, chortle", 4.39], ["snicker", 3.75]], [["music", 45.07], ["throbbing", 5.08], ["electronic music", 4.54]], [["music", 63.52], ["didgeridoo", 4.33], ["hum", 4.32]]], "duration": [0.32, 0.2, 0.38, 4.24, 2.7, 1.22, 1.3, 0.36, 0.4, 0.67, 3.53, 0.75, 4.85, 2.61, 5.84, 2.5]} \ No newline at end of file diff --git a/annotations_1/p0CQcDumPh8_filtered.json b/annotations_1/p0CQcDumPh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e037535174280424fca31be0e77fa93b3ba0ec2 --- /dev/null +++ b/annotations_1/p0CQcDumPh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 36.88], [40.0, 44.71], [47.0, 73.77], [76.0, 76.22], [79.0, 81.4], [85.0, 87.69], [94.0, 95.12], [96.0, 96.13], [97.0, 98.51], [104.0, 104.38], [107.0, 107.1], [108.0, 109.34], [111.0, 111.64], [113.0, 113.41], [116.0, 117.69], [118.0, 119.04], [121.0, 121.81], [125.0, 125.66], [129.0, 130.22], [133.0, 135.16], [141.0, 140.78], [144.0, 144.21], [146.0, 146.91], [148.0, 149.25], [150.0, 151.75], [154.0, 154.58], [157.0, 156.91], [159.0, 161.87]], "keep_status": [true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.0, 31.22, 30.12, 0.0, 37.25, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.26], "audiomae_on_audioset": [[["music", 36.16], ["animal", 8.22], ["drum machine", 4.08]], [["music", 53.03], ["speech", 8.84], ["cattle, bovinae", 4.63]], [["music", 64.0], ["cattle, bovinae", 12.75], ["moo", 5.61]], null, [["speech", 24.59], ["telephone", 19.23], ["insect", 6.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.88, 4.71, 26.77, 0.22, 2.4, 2.69, 1.12, 0.13, 1.51, 0.38, 0.1, 1.34, 0.64, 0.41, 1.69, 1.04, 0.81, 0.66, 1.22, 2.16, -0.22, 0.21, 0.91, 1.25, 1.75, 0.58, -0.09, 2.87]} \ No newline at end of file diff --git a/annotations_1/p0cf4-1zuOk_filtered.json b/annotations_1/p0cf4-1zuOk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5832947a174760cf9107c1d52c7b0622564de283 --- /dev/null +++ b/annotations_1/p0cf4-1zuOk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 56.84], [58.0, 58.94], [60.0, 60.29], [63.0, 67.64], [71.0, 73.75], [74.0, 75.29], [75.0, 94.66], [96.0, 111.55], [112.0, 113.43], [114.0, 118.12], [123.0, 124.55]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.63, 30.86, 0.0, 29.94, 31.01, 0.0, 89.9, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 41.8], ["hum", 18.67], ["throbbing", 17.25]], [["music", 79.32], ["meow", 3.86], ["throbbing", 2.88]], null, [["music", 52.54], ["hum", 6.89], ["throbbing", 5.97]], [["music", 40.5], ["didgeridoo", 8.63], ["synthesizer", 5.59]], null, null, null], "duration": [-0.16, 0.94, 0.29, 4.64, 2.75, 1.29, 19.66, 15.55, 1.43, 4.12, 1.55]} \ No newline at end of file diff --git a/annotations_1/p0vZhGqM_Rs_filtered.json b/annotations_1/p0vZhGqM_Rs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9271600cb44b2ad54d2fa4cbdeae1ed5662341f0 --- /dev/null +++ b/annotations_1/p0vZhGqM_Rs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[55.0, 55.41], [56.0, 56.03], [56.0, 69.09], [74.0, 77.31], [80.0, 81.36], [83.0, 84.57], [88.0, 90.37], [93.0, 94.31], [98.0, 100.6], [101.0, 102.2], [106.0, 107.45], [109.0, 111.25], [115.0, 116.11], [119.0, 118.99], [119.0, 119.38], [123.0, 125.95], [136.0, 137.69], [138.0, 142.69], [144.0, 144.93], [146.0, 152.24], [154.0, 153.93], [156.0, 156.83]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.56, 48.39, 0.0, 0.0, 49.73, 0.0, 56.55, 0.0, 0.0, 57.97, 0.0, 0.0, 0.0, 53.72, 0.0, 59.51, 0.0, 55.39, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sonar", 40.19], ["music", 25.05], ["hum", 4.94]], [["music", 15.25], ["sonar", 11.46], ["hum", 6.78]], null, null, [["music", 29.18], ["whale vocalization", 9.69], ["hum", 9.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.41, 0.03, 13.09, 3.31, 1.36, 1.57, 2.37, 1.31, 2.6, 1.2, 1.45, 2.25, 1.11, -0.01, 0.38, 2.95, 1.69, 4.69, 0.93, 6.24, -0.07, 0.83]} \ No newline at end of file diff --git a/annotations_1/p1e3NC3IIF8_filtered.json b/annotations_1/p1e3NC3IIF8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a39ccdfa7c83be52a14075a2162ccd5e4a7b112 --- /dev/null +++ b/annotations_1/p1e3NC3IIF8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.72], [20.0, 24.29], [34.0, 35.48], [37.0, 38.64], [42.0, 43.85], [46.0, 46.77], [50.0, 49.92], [54.0, 53.86], [58.0, 60.02], [61.0, 62.83], [65.0, 65.42], [71.0, 71.04], [72.0, 83.44], [86.0, 86.07], [88.0, 96.84], [97.0, 97.93], [100.0, 104.63], [108.0, 107.79], [121.0, 130.79], [133.0, 132.9], [141.0, 141.3], [141.0, 141.74], [145.0, 144.64], [145.0, 146.16], [148.0, 148.42], [151.0, 155.12], [157.0, 157.6], [161.0, 162.04], [165.0, 166.13], [167.0, 167.44], [171.0, 173.69], [175.0, 178.85], [179.0, 182.24]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 41.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.95, 0.0, 0.0, 0.0, 32.77, 0.0, 38.12, 0.0, 62.27, 0.0, 45.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.7, 0.0, 0.0, 0.0, 0.0, 55.18, 45.14, 44.55], "audiomae_on_audioset": [null, [["music", 45.14], ["didgeridoo", 5.98], ["hum", 5.25]], null, null, null, null, null, null, [["music", 57.82], ["throbbing", 7.95], ["hum", 7.05]], null, null, null, [["music", 40.52], ["hum", 17.17], ["mains hum", 10.43]], null, [["speech", 59.92], ["hum", 16.89], ["mains hum", 4.44]], null, null, null, [["music", 49.61], ["hum", 5.65], ["fly, housefly", 4.28]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 48.46], ["speech", 17.1], ["synthesizer", 3.62]], [["music", 52.37], ["speech", 13.02], ["hum", 7.9]]], "duration": [-0.28, 4.29, 1.48, 1.64, 1.85, 0.77, -0.08, -0.14, 2.02, 1.83, 0.42, 0.04, 11.44, 0.07, 8.84, 0.93, 4.63, -0.21, 9.79, -0.1, 0.3, 0.74, -0.36, 1.16, 0.42, 4.12, 0.6, 1.04, 1.13, 0.44, 2.69, 3.85, 3.24]} \ No newline at end of file diff --git a/annotations_1/p2CR0S7DHyQ_filtered.json b/annotations_1/p2CR0S7DHyQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..232dd42dd278be5801d3180b3a8d6a22197374dc --- /dev/null +++ b/annotations_1/p2CR0S7DHyQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.52], [7.0, 7.86], [9.0, 10.25], [11.0, 11.52], [13.0, 13.63], [14.0, 15.26], [17.0, 17.88], [18.0, 26.89], [27.0, 31.82], [34.0, 36.54], [37.0, 51.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.62, 74.44, 93.91, 81.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.86, 1.25, 0.52, 0.63, 1.26, 0.88, 8.89, 4.82, 2.54, 14.02]} \ No newline at end of file diff --git a/annotations_1/p2QiCFAQ-qQ_filtered.json b/annotations_1/p2QiCFAQ-qQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0527a23576cedb7ade8d11b3093d821beb445105 --- /dev/null +++ b/annotations_1/p2QiCFAQ-qQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.9], [17.0, 18.62], [19.0, 20.51], [23.0, 23.25], [24.0, 24.31], [28.0, 28.46], [33.0, 34.67], [43.0, 43.09], [44.0, 44.32], [45.0, 47.34], [48.0, 48.56], [51.0, 51.34], [55.0, 54.94], [56.0, 57.01], [62.0, 62.07], [65.0, 67.54], [68.0, 69.28], [71.0, 71.78], [76.0, 77.48], [79.0, 81.04], [82.0, 99.0], [99.0, 100.72], [103.0, 103.33], [105.0, 108.46], [116.0, 116.29], [117.0, 117.68], [118.0, 119.55], [120.0, 120.66], [126.0, 125.88], [129.0, 130.35], [134.0, 134.27], [135.0, 135.55], [137.0, 140.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 99.65, 31.16, 0.0, 0.0, 54.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.45], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 49.43], ["speech", 19.26], ["music", 16.98]], null, null, null, null, null, null, null, null, null, null, null, [["music", 71.56], ["breaking", 19.63], ["smash, crash", 2.26]]], "duration": [3.9, 1.62, 1.51, 0.25, 0.31, 0.46, 1.67, 0.09, 0.32, 2.34, 0.56, 0.34, -0.06, 1.01, 0.07, 2.54, 1.28, 0.78, 1.48, 2.04, 17.0, 1.72, 0.33, 3.46, 0.29, 0.68, 1.55, 0.66, -0.12, 1.35, 0.27, 0.55, 3.37]} \ No newline at end of file diff --git a/annotations_1/p2zDdb_MqmI_filtered.json b/annotations_1/p2zDdb_MqmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33a957da0615285a633790464f59a7e96a6cead1 --- /dev/null +++ b/annotations_1/p2zDdb_MqmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.8], [24.0, 24.8], [25.0, 35.01], [35.0, 36.24], [41.0, 42.74], [43.0, 45.22], [50.0, 52.62], [56.0, 61.72], [67.0, 70.7], [81.0, 81.38], [83.0, 93.55], [95.0, 96.5], [99.0, 106.69], [109.0, 109.85], [112.0, 112.51], [117.0, 117.61], [118.0, 117.71], [118.0, 120.02], [121.0, 125.9], [132.0, 143.75], [144.0, 144.75], [147.0, 146.74], [148.0, 150.16], [151.0, 153.79], [158.0, 159.66], [161.0, 161.67], [162.0, 174.65], [176.0, 190.31], [192.0, 193.62]], "keep_status": [true, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, true, true, true, false, false, false, true, false, false, true, true, false], "silence_prob": [34.12, 0.0, 30.33, 0.0, 0.0, 32.69, 31.17, 30.57, 33.24, 0.0, 31.54, 0.0, 30.97, 0.0, 0.0, 0.0, 0.0, 38.94, 36.85, 30.78, 0.0, 0.0, 50.16, 34.43, 0.0, 0.0, 33.12, 30.76, 0.0], "audiomae_on_audioset": [[["music", 28.58], ["speech", 24.64], ["quack", 5.52]], null, [["music", 43.78], ["speech", 29.45], ["vehicle", 3.38]], null, null, [["music", 44.0], ["speech", 26.21], ["trombone", 4.16]], [["music", 49.03], ["speech", 13.7], ["cattle, bovinae", 6.99]], [["music", 60.28], ["throbbing", 4.01], ["cattle, bovinae", 3.42]], [["music", 17.66], ["throbbing", 10.4], ["honk", 7.18]], null, [["livestock, farm animals, working animals", 38.02], ["moo", 23.55], ["cattle, bovinae", 20.52]], null, [["music", 52.15], ["speech", 14.0], ["throbbing", 4.83]], null, null, null, null, [["noise", 14.7], ["livestock, farm animals, working animals", 9.37], ["cattle, bovinae", 9.3]], [["fart", 25.32], ["speech", 24.22], ["noise", 15.26]], [["smash, crash", 22.94], ["livestock, farm animals, working animals", 17.59], ["music", 16.04]], null, null, null, [["music", 17.52], ["fly, housefly", 10.57], ["didgeridoo", 9.2]], null, null, [["music", 37.48], ["throbbing", 12.59], ["hum", 11.83]], [["vehicle", 30.73], ["car", 16.06], ["race car, auto racing", 10.09]], null], "duration": [3.8, 0.8, 10.01, 1.24, 1.74, 2.22, 2.62, 5.72, 3.7, 0.38, 10.55, 1.5, 7.69, 0.85, 0.51, 0.61, -0.29, 2.02, 4.9, 11.75, 0.75, -0.26, 2.16, 2.79, 1.66, 0.67, 12.65, 14.31, 1.62]} \ No newline at end of file diff --git a/annotations_1/p39lIRTEPY4_filtered.json b/annotations_1/p39lIRTEPY4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5379449ce1e19047e240fec7efd11dc85c634a4f --- /dev/null +++ b/annotations_1/p39lIRTEPY4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 46.09], [48.0, 93.45], [95.0, 101.28], [102.0, 131.95]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 92.15, 29.06], "audiomae_on_audioset": [null, null, null, [["music", 21.68], ["breaking", 14.75], ["rumble", 8.77]]], "duration": [42.09, 45.45, 6.28, 29.95]} \ No newline at end of file diff --git a/annotations_1/p3ZnaRMhD_A_filtered.json b/annotations_1/p3ZnaRMhD_A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d69566bb8932521c09c51f098c5ce9bd1c3eeb33 --- /dev/null +++ b/annotations_1/p3ZnaRMhD_A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.39], [8.0, 9.91], [14.0, 16.43], [19.0, 20.04], [22.0, 24.14], [27.0, 33.12], [35.0, 37.35], [40.0, 41.0], [43.0, 44.61], [47.0, 50.13], [51.0, 52.47], [55.0, 56.39], [59.0, 61.28], [63.0, 64.74], [70.0, 70.28], [75.0, 75.78], [85.0, 86.43], [88.0, 90.36], [96.0, 96.77], [98.0, 99.3], [104.0, 104.38], [113.0, 114.4], [115.0, 115.99], [117.0, 119.16], [121.0, 126.57], [128.0, 129.79], [131.0, 133.1], [135.0, 135.75], [139.0, 139.16], [140.0, 140.76], [144.0, 158.36], [161.0, 162.85], [163.0, 168.37], [169.0, 170.11], [171.0, 171.63], [175.0, 176.59], [178.0, 178.63], [180.0, 182.21], [184.0, 185.03], [189.0, 190.17], [193.0, 199.22], [200.0, 201.19], [203.0, 203.82], [210.0, 212.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 73.97, 0.0, 97.54, 99.98, 57.32, 0.0, 0.0, 100.0, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 43.9, 0.0, 0.0, 0.0, 96.17, 0.0, 53.47, 0.0, 0.0, 0.0, 0.0, 90.78, 0.0, 0.0, 66.27, 0.0, 0.0, 97.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["stomach rumble", 41.72], ["sidetone", 7.25], ["effects unit", 6.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 1.91, 2.43, 1.04, 2.14, 6.12, 2.35, 1.0, 1.61, 3.13, 1.47, 1.39, 2.28, 1.74, 0.28, 0.78, 1.43, 2.36, 0.77, 1.3, 0.38, 1.4, 0.99, 2.16, 5.57, 1.79, 2.1, 0.75, 0.16, 0.76, 14.36, 1.85, 5.37, 1.11, 0.63, 1.59, 0.63, 2.21, 1.03, 1.17, 6.22, 1.19, 0.82, 2.58]} \ No newline at end of file diff --git a/annotations_1/p3zb4fwFd3E_filtered.json b/annotations_1/p3zb4fwFd3E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..634ecce56d77c807e4ba1193f4513e06a564c984 --- /dev/null +++ b/annotations_1/p3zb4fwFd3E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[66.0, 119.35], [120.0, 123.33], [124.0, 140.37], [142.0, 161.59], [167.0, 169.94], [172.0, 187.49], [189.0, 190.54]], "keep_status": [false, true, false, false, true, true, false], "silence_prob": [0.0, 39.35, 29.93, 30.66, 33.68, 31.39, 0.0], "audiomae_on_audioset": [null, [["music", 29.36], ["hum", 18.6], ["throbbing", 10.84]], [["hum", 42.93], ["music", 25.55], ["throbbing", 9.96]], [["music", 46.18], ["throbbing", 25.98], ["hum", 7.97]], [["music", 28.64], ["frog", 11.05], ["croak", 6.6]], [["gong", 32.68], ["music", 24.65], ["hum", 11.76]], null], "duration": [53.35, 3.33, 16.37, 19.59, 2.94, 15.49, 1.54]} \ No newline at end of file diff --git a/annotations_1/p4HqnBtsz1I_filtered.json b/annotations_1/p4HqnBtsz1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..215954be729f5debad13ceb620844eac15024c86 --- /dev/null +++ b/annotations_1/p4HqnBtsz1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.54], [4.0, 5.39], [6.0, 6.72], [10.0, 10.12], [12.0, 12.29], [13.0, 13.91], [15.0, 15.45], [16.0, 21.15], [25.0, 29.46], [31.0, 38.25], [41.0, 44.15], [48.0, 53.65], [56.0, 56.61], [58.0, 58.63], [59.0, 59.68], [60.0, 61.15], [62.0, 62.97], [65.0, 65.84], [68.0, 68.99], [70.0, 70.26], [72.0, 73.38], [74.0, 75.83], [78.0, 81.24], [89.0, 90.07], [95.0, 97.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.33, 61.97, 47.46, 55.67, 76.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 99.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 57.81], ["ambient music", 19.46], ["singing bowl", 6.87]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.54, 1.39, 0.72, 0.12, 0.29, 0.91, 0.45, 5.15, 4.46, 7.25, 3.15, 5.65, 0.61, 0.63, 0.68, 1.15, 0.97, 0.84, 0.99, 0.26, 1.38, 1.83, 3.24, 1.07, 2.53]} \ No newline at end of file diff --git a/annotations_1/p4Pq9aZVV9Y_filtered.json b/annotations_1/p4Pq9aZVV9Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1eb5a13c232c250578bd9489575798190b820a76 --- /dev/null +++ b/annotations_1/p4Pq9aZVV9Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.99], [16.0, 17.1], [19.0, 20.66], [27.0, 28.43], [31.0, 35.38], [37.0, 39.18], [42.0, 43.5], [44.0, 44.96], [47.0, 48.47], [50.0, 58.65], [59.0, 58.73], [59.0, 67.15], [69.0, 69.82], [76.0, 82.46], [85.0, 95.23], [102.0, 101.9], [105.0, 105.48], [127.0, 129.64]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.48, 49.68, 0.0, 0.0, 0.0, 45.21, 0.0, 33.15, 0.0, 32.96, 30.17, 0.0, 0.0, 63.74], "audiomae_on_audioset": [null, null, null, null, [["speech", 49.63], ["music", 21.75], ["boing", 3.19]], [["speech", 46.61], ["fireworks", 9.12], ["music", 3.79]], null, null, null, [["speech", 35.42], ["music", 24.87], ["fart", 6.25]], null, [["music", 53.48], ["throbbing", 9.33], ["hum", 6.51]], null, [["music", 60.65], ["speech", 16.76], ["skateboard", 2.5]], [["music", 52.56], ["hum", 9.94], ["throbbing", 3.75]], null, null, null], "duration": [-0.01, 1.1, 1.66, 1.43, 4.38, 2.18, 1.5, 0.96, 1.47, 8.65, -0.27, 8.15, 0.82, 6.46, 10.23, -0.1, 0.48, 2.64]} \ No newline at end of file diff --git a/annotations_1/p4ylvDhfiQw_filtered.json b/annotations_1/p4ylvDhfiQw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45035655a5c69681b7c604a3c8ca9baf3ea96e28 --- /dev/null +++ b/annotations_1/p4ylvDhfiQw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.93], [23.0, 23.14], [26.0, 27.11], [28.0, 34.53], [35.0, 35.45], [37.0, 43.63], [45.0, 45.3], [48.0, 54.18], [69.0, 86.02], [86.0, 87.25], [98.0, 107.4], [110.0, 114.05], [115.0, 115.77], [122.0, 122.3], [128.0, 129.49], [132.0, 133.83], [142.0, 147.36], [150.0, 153.81], [156.0, 164.91], [170.0, 172.34], [176.0, 175.96]], "keep_status": [false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 28.72, 0.0, 28.32, 0.0, 28.21, 28.41, 0.0, 28.57, 28.59, 0.0, 0.0, 0.0, 0.0, 28.62, 28.7, 28.45, 28.71, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 43.92], ["speech", 26.49], ["throbbing", 8.54]], null, [["throbbing", 30.41], ["music", 22.07], ["hum", 10.49]], null, [["whale vocalization", 19.28], ["animal", 15.63], ["music", 6.28]], [["music", 80.89], ["skateboard", 1.63], ["livestock, farm animals, working animals", 1.28]], null, [["music", 57.99], ["speech", 13.42], ["cacophony", 3.1]], [["music", 73.86], ["speech", 6.95], ["didgeridoo", 3.75]], null, null, null, null, [["music", 44.53], ["speech", 27.21], ["throbbing", 3.51]], [["music", 33.02], ["motorcycle", 10.88], ["livestock, farm animals, working animals", 10.07]], [["music", 55.17], ["vehicle", 8.08], ["speech", 7.71]], [["music", 24.01], ["cacophony", 12.09], ["vehicle", 8.08]], null], "duration": [1.93, 0.14, 1.11, 6.53, 0.45, 6.63, 0.3, 6.18, 17.02, 1.25, 9.4, 4.05, 0.77, 0.3, 1.49, 1.83, 5.36, 3.81, 8.91, 2.34, -0.04]} \ No newline at end of file diff --git a/annotations_1/p5BfdwK92UI_filtered.json b/annotations_1/p5BfdwK92UI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71773c08102e49e591ec4fbf701f6dd201ffa657 --- /dev/null +++ b/annotations_1/p5BfdwK92UI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.91], [19.0, 19.57], [21.0, 21.0], [23.0, 22.79], [28.0, 29.07], [32.0, 33.54], [34.0, 35.85], [37.0, 37.89], [39.0, 49.82], [52.0, 52.91], [64.0, 71.09], [73.0, 75.29], [81.0, 82.26], [83.0, 83.35], [84.0, 84.6], [86.0, 88.75], [94.0, 97.34], [100.0, 103.99], [109.0, 115.94], [116.0, 128.71], [134.0, 134.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [82.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.71, 0.0, 42.28, 65.32, 0.0, 0.0, 0.0, 56.48, 34.22, 30.19, 29.6, 31.32, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 54.41], ["speech", 34.92], ["electronic music", 0.53]], null, [["cattle, bovinae", 23.91], ["animal", 17.97], ["moo", 14.15]], null, null, null, null, null, [["music", 51.95], ["throbbing", 5.75], ["sidetone", 3.06]], [["music", 78.05], ["boing", 2.56], ["musical instrument", 2.22]], [["music", 58.78], ["speech", 6.55], ["boing", 6.4]], [["speech", 55.12], ["music", 25.59], ["hum", 1.95]], null], "duration": [2.91, 0.57, 0.0, -0.21, 1.07, 1.54, 1.85, 0.89, 10.82, 0.91, 7.09, 2.29, 1.26, 0.35, 0.6, 2.75, 3.34, 3.99, 6.94, 12.71, 0.35]} \ No newline at end of file diff --git a/annotations_1/p6HbXVaNFfc_filtered.json b/annotations_1/p6HbXVaNFfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59288c0ded8dd75e61db2b30e42d26cb50e664c7 --- /dev/null +++ b/annotations_1/p6HbXVaNFfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.91], [4.0, 4.45], [8.0, 15.3], [16.0, 20.83], [26.0, 48.56], [58.0, 64.99], [65.0, 65.45], [66.0, 65.89], [67.0, 68.39], [69.0, 72.54], [73.0, 96.18], [97.0, 99.18], [101.0, 101.24], [107.0, 115.52], [116.0, 153.55], [157.0, 166.01], [166.0, 190.59], [194.0, 213.49], [216.0, 216.36], [217.0, 217.65], [219.0, 219.01]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 56.1, 34.72, 33.85, 0.0, 0.0, 0.0, 34.42, 34.64, 38.2, 0.0, 35.59, 0.0, 34.69, 35.28, 36.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 82.92], ["funk", 2.55], ["house music", 2.25]], [["music", 76.0], ["funk", 2.89], ["disco", 1.33]], null, null, null, [["music", 60.92], ["synthesizer", 2.13], ["sampler", 2.02]], [["music", 80.49], ["house music", 1.51], ["singing", 1.31]], [["music", 74.26], ["musical instrument", 5.06], ["synthesizer", 2.9]], null, [["music", 81.22], ["funk", 2.83], ["disco", 1.31]], null, [["music", 80.37], ["singing", 1.33], ["middle eastern music", 1.13]], [["music", 78.31], ["house music", 1.59], ["disco", 1.53]], [["music", 62.88], ["clarinet", 2.66], ["musical instrument", 2.42]], null, null, null], "duration": [0.91, 0.45, 7.3, 4.83, 22.56, 6.99, 0.45, -0.11, 1.39, 3.54, 23.18, 2.18, 0.24, 8.52, 37.55, 9.01, 24.59, 19.49, 0.36, 0.65, 0.01]} \ No newline at end of file diff --git a/annotations_1/p6IvB-2jYtY_filtered.json b/annotations_1/p6IvB-2jYtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c97401118d8f65f57bb758c5f29d623fbeb6b0e --- /dev/null +++ b/annotations_1/p6IvB-2jYtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.37], [7.0, 7.59], [11.0, 12.07], [14.0, 16.23], [21.0, 22.23], [23.0, 23.13], [26.0, 28.12], [31.0, 33.24], [35.0, 35.65], [37.0, 42.36], [43.0, 44.59], [46.0, 51.12], [52.0, 57.67], [59.0, 59.44], [61.0, 61.82], [65.0, 67.96], [70.0, 71.39], [74.0, 75.29], [76.0, 77.85], [81.0, 82.95], [87.0, 88.03], [95.0, 96.42], [97.0, 98.41], [100.0, 100.77], [103.0, 107.79], [109.0, 110.73], [112.0, 113.31], [114.0, 114.98], [116.0, 118.91], [120.0, 120.72], [123.0, 123.31], [130.0, 129.71]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 95.78, 0.0, 0.0, 36.09, 85.35, 0.0, 36.2, 0.0, 34.47, 38.6, 0.0, 0.0, 38.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.83, 0.0, 0.0, 0.0, 67.13, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["chant", 12.84], ["mantra", 10.6], ["synthetic singing", 9.61]], null, null, [["theremin", 54.16], ["music", 27.61], ["musical instrument", 2.9]], null, [["theremin", 60.24], ["music", 27.31], ["musical instrument", 2.16]], [["theremin", 90.01], ["music", 3.32], ["wind instrument, woodwind instrument", 1.32]], null, null, [["theremin", 56.1], ["music", 34.57], ["musical instrument", 1.82]], null, null, null, null, null, null, null, null, [["music", 41.91], ["theremin", 29.55], ["synthesizer", 2.44]], null, null, null, null, null, null, null], "duration": [1.37, 0.59, 1.07, 2.23, 1.23, 0.13, 2.12, 2.24, 0.65, 5.36, 1.59, 5.12, 5.67, 0.44, 0.82, 2.96, 1.39, 1.29, 1.85, 1.95, 1.03, 1.42, 1.41, 0.77, 4.79, 1.73, 1.31, 0.98, 2.91, 0.72, 0.31, -0.29]} \ No newline at end of file diff --git a/annotations_1/p6oIR31ZgyA_filtered.json b/annotations_1/p6oIR31ZgyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0eb5eef54a8a6206c83d983193ed24d3e3c545d0 --- /dev/null +++ b/annotations_1/p6oIR31ZgyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 38.08], [39.0, 41.93], [43.0, 45.1], [47.0, 49.08], [51.0, 55.49], [60.0, 65.2], [69.0, 68.84], [72.0, 72.35], [77.0, 80.4], [81.0, 93.21], [95.0, 95.99], [97.0, 98.54], [101.0, 136.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 73.82, 88.1, 89.72, 79.59, 98.86, 0.0, 0.0, 93.13, 58.55, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [34.08, 2.93, 2.1, 2.08, 4.49, 5.2, -0.16, 0.35, 3.4, 12.21, 0.99, 1.54, 35.39]} \ No newline at end of file diff --git a/annotations_1/p70o9g5gcdY_filtered.json b/annotations_1/p70o9g5gcdY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3377d3aeac1e352fc52675a288f1cfcbd1860ce2 --- /dev/null +++ b/annotations_1/p70o9g5gcdY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.61], [12.0, 13.12], [13.0, 13.2], [14.0, 17.04], [17.0, 17.42], [45.0, 45.3], [51.0, 51.7], [53.0, 60.27], [65.0, 78.92], [83.0, 83.39], [85.0, 91.77], [100.0, 100.09], [100.0, 103.2], [105.0, 114.37], [115.0, 122.39]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.3, 0.0, 0.0, 0.0, 31.96, 30.58, 0.0, 31.39, 0.0, 31.45, 30.7, 30.96], "audiomae_on_audioset": [null, null, null, [["music", 86.12], ["musical instrument", 4.0], ["synthesizer", 2.06]], null, null, null, [["music", 73.91], ["boing", 2.98], ["speech", 2.79]], [["music", 64.99], ["sampler", 2.74], ["male singing", 2.18]], null, [["music", 73.16], ["electronic music", 3.04], ["throbbing", 2.67]], null, [["music", 63.07], ["drum machine", 4.14], ["house music", 3.36]], [["music", 84.27], ["funk", 2.69], ["disco", 1.72]], [["music", 66.56], ["funk", 13.79], ["disco", 4.0]]], "duration": [0.61, 1.12, 0.2, 3.04, 0.42, 0.3, 0.7, 7.27, 13.92, 0.39, 6.77, 0.09, 3.2, 9.37, 7.39]} \ No newline at end of file diff --git a/annotations_1/p9Bo67_slJY_filtered.json b/annotations_1/p9Bo67_slJY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c74cdb62cbdcb564874c746b2f8d708d0a07bce0 --- /dev/null +++ b/annotations_1/p9Bo67_slJY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.11], [5.0, 6.56], [8.0, 10.49], [12.0, 12.77], [18.0, 18.06], [23.0, 25.88], [29.0, 29.78], [31.0, 38.94], [39.0, 39.68], [40.0, 40.58], [43.0, 43.33], [46.0, 56.05], [57.0, 58.11], [60.0, 61.21], [63.0, 64.12], [69.0, 69.3], [71.0, 71.68], [72.0, 73.47], [76.0, 76.37], [78.0, 79.62], [85.0, 86.48], [88.0, 88.2], [89.0, 92.64], [94.0, 96.23], [97.0, 98.09], [99.0, 106.0], [107.0, 108.58], [109.0, 111.01], [112.0, 117.41], [119.0, 123.92], [126.0, 126.62]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, true, true, false], "silence_prob": [44.99, 0.0, 44.2, 0.0, 0.0, 44.43, 0.0, 34.93, 0.0, 0.0, 0.0, 32.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.18, 38.8, 0.0, 34.82, 0.0, 38.79, 41.28, 36.69, 0.0], "audiomae_on_audioset": [[["speech", 38.1], ["music", 16.66], ["synthesizer", 3.9]], null, [["music", 26.85], ["throbbing", 8.03], ["fly, housefly", 6.64]], null, null, [["music", 43.36], ["throbbing", 16.65], ["hum", 13.07]], null, [["hum", 38.84], ["music", 21.38], ["mains hum", 16.53]], null, null, null, [["hum", 47.53], ["music", 20.21], ["mains hum", 19.13]], null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 27.19], ["speech", 8.76], ["hum", 7.52]], [["sidetone", 26.74], ["speech", 26.38], ["hum", 7.14]], null, [["hum", 55.43], ["mains hum", 16.67], ["music", 7.49]], null, [["hum", 36.98], ["mains hum", 9.43], ["throbbing", 7.14]], [["hum", 29.42], ["mains hum", 29.39], ["throbbing", 6.66]], [["rumble", 16.29], ["music", 13.75], ["hum", 8.32]], null], "duration": [2.11, 1.56, 2.49, 0.77, 0.06, 2.88, 0.78, 7.94, 0.68, 0.58, 0.33, 10.05, 1.11, 1.21, 1.12, 0.3, 0.68, 1.47, 0.37, 1.62, 1.48, 0.2, 3.64, 2.23, 1.09, 7.0, 1.58, 2.01, 5.41, 4.92, 0.62]} \ No newline at end of file diff --git a/annotations_1/p9W9PhaNGOY_filtered.json b/annotations_1/p9W9PhaNGOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0361e228b76b8585c7ee6effc90647de671e33e6 --- /dev/null +++ b/annotations_1/p9W9PhaNGOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 38.45], [39.0, 56.56], [62.0, 85.8], [86.0, 92.18], [93.0, 95.35]], "keep_status": [false, true, true, false, false], "silence_prob": [0.0, 29.58, 29.77, 34.13, 41.76], "audiomae_on_audioset": [null, [["music", 48.96], ["sidetone", 7.96], ["synthesizer", 5.89]], [["music", 27.01], ["livestock, farm animals, working animals", 8.2], ["speech", 7.31]], [["didgeridoo", 39.07], ["music", 24.53], ["speech", 15.12]], [["music", 64.56], ["didgeridoo", 7.74], ["musical instrument", 4.81]]], "duration": [1.45, 17.56, 23.8, 6.18, 2.35]} \ No newline at end of file diff --git a/annotations_1/p9XIPtizl3s_filtered.json b/annotations_1/p9XIPtizl3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08d2eca572dbda61923191b3ae94b623532daff9 --- /dev/null +++ b/annotations_1/p9XIPtizl3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 14.4], [15.0, 40.12], [40.0, 40.15], [40.0, 40.19], [40.0, 40.22], [40.0, 40.26], [41.0, 40.63], [41.0, 40.66], [41.0, 40.69], [41.0, 40.76], [41.0, 52.74], [60.0, 67.39], [68.0, 68.76], [69.0, 85.89], [86.0, 86.48], [87.0, 88.13], [93.0, 93.45], [94.0, 107.94], [108.0, 144.29], [145.0, 145.66]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, true, false, false], "silence_prob": [29.45, 29.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.86, 29.54, 0.0, 28.93, 0.0, 0.0, 0.0, 33.88, 0.0, 0.0], "audiomae_on_audioset": [[["clang", 42.27], ["ding", 16.65], ["music", 7.37]], [["whack, thwack", 66.13], ["music", 10.49], ["fly, housefly", 2.05]], null, null, null, null, null, null, null, null, [["clang", 22.89], ["music", 16.53], ["speech", 8.81]], [["whack, thwack", 24.42], ["clang", 23.73], ["ding", 10.2]], null, [["music", 30.68], ["whack, thwack", 18.87], ["boing", 9.19]], null, null, null, [["hum", 21.62], ["music", 15.92], ["throbbing", 13.07]], null, null], "duration": [7.4, 25.12, 0.15, 0.19, 0.22, 0.26, -0.37, -0.34, -0.31, -0.24, 11.74, 7.39, 0.76, 16.89, 0.48, 1.13, 0.45, 13.94, 36.29, 0.66]} \ No newline at end of file diff --git a/annotations_1/pAwdeWy9yYM_filtered.json b/annotations_1/pAwdeWy9yYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..744fff4d3298f9a39852a8bd85338d2cf7e70d80 --- /dev/null +++ b/annotations_1/pAwdeWy9yYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 40.0], [44.0, 44.85], [53.0, 53.23], [56.0, 57.25], [58.0, 70.73], [84.0, 84.47], [86.0, 85.78], [89.0, 92.21], [94.0, 94.26], [94.0, 112.19], [113.0, 114.49], [116.0, 116.58], [117.0, 122.84], [126.0, 128.29], [129.0, 139.16], [141.0, 141.0], [144.0, 150.04], [156.0, 160.27], [173.0, 182.31], [187.0, 193.7]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, true, true, true], "silence_prob": [30.78, 0.0, 0.0, 0.0, 33.26, 0.0, 0.0, 36.66, 0.0, 29.74, 0.0, 0.0, 30.29, 52.16, 51.02, 0.0, 31.24, 30.99, 30.22, 31.63], "audiomae_on_audioset": [[["music", 67.47], ["throbbing", 4.9], ["synthesizer", 2.9]], null, null, null, [["hum", 26.1], ["music", 20.48], ["throbbing", 14.45]], null, null, [["music", 23.92], ["boing", 17.96], ["throbbing", 15.12]], null, [["boing", 37.93], ["music", 28.94], ["speech", 15.68]], null, null, [["livestock, farm animals, working animals", 25.37], ["music", 17.95], ["speech", 8.72]], null, null, null, [["cattle, bovinae", 28.04], ["music", 27.56], ["moo", 16.91]], [["music", 30.13], ["fart", 23.84], ["speech", 13.64]], [["throbbing", 36.52], ["music", 17.28], ["hum", 11.95]], [["speech", 27.0], ["throbbing", 24.94], ["hum", 17.46]]], "duration": [26.0, 0.85, 0.23, 1.25, 12.73, 0.47, -0.22, 3.21, 0.26, 18.19, 1.49, 0.58, 5.84, 2.29, 10.16, 0.0, 6.04, 4.27, 9.31, 6.7]} \ No newline at end of file diff --git a/annotations_1/pAwoA-XPzsQ_filtered.json b/annotations_1/pAwoA-XPzsQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..de7c8bdd3a03cc4bde96104c00250ba45cce0e84 --- /dev/null +++ b/annotations_1/pAwoA-XPzsQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[102.0, 102.02], [102.0, 115.42], [117.0, 124.43], [126.0, 127.01], [132.0, 133.15]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 30.71, 31.12, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 42.41], ["speech", 30.18], ["throbbing", 7.07]], [["music", 48.36], ["throbbing", 19.44], ["hum", 7.54]], null, null], "duration": [0.02, 13.42, 7.43, 1.01, 1.15]} \ No newline at end of file diff --git a/annotations_1/pBd7XYjjvRw_filtered.json b/annotations_1/pBd7XYjjvRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdd077ebe54dfedc29f6718d1129f8777c77d4b9 --- /dev/null +++ b/annotations_1/pBd7XYjjvRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [6.0, 12.46], [16.0, 23.58], [24.0, 25.08], [27.0, 27.72], [28.0, 49.11], [50.0, 51.04], [54.0, 55.07], [57.0, 56.94], [59.0, 60.2], [61.0, 62.31], [64.0, 64.42], [65.0, 66.38], [68.0, 69.35], [75.0, 76.25], [81.0, 80.87], [83.0, 82.66], [85.0, 85.4], [91.0, 91.71], [94.0, 95.1], [97.0, 98.41], [103.0, 103.82], [105.0, 105.73], [109.0, 109.36], [112.0, 112.99], [119.0, 119.5], [122.0, 122.62], [124.0, 124.95], [126.0, 126.79], [135.0, 136.0], [137.0, 137.32], [142.0, 143.09], [148.0, 147.85], [152.0, 152.15], [156.0, 157.33], [160.0, 160.24], [162.0, 163.65], [165.0, 166.56], [168.0, 169.3], [171.0, 172.32], [173.0, 174.02]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.17, 72.9, 0.0, 0.0, 45.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["chink, clink", 20.83], ["glass", 13.96], ["tuning fork", 6.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 6.46, 7.58, 1.08, 0.72, 21.11, 1.04, 1.07, -0.06, 1.2, 1.31, 0.42, 1.38, 1.35, 1.25, -0.13, -0.34, 0.4, 0.71, 1.1, 1.41, 0.82, 0.73, 0.36, 0.99, 0.5, 0.62, 0.95, 0.79, 1.0, 0.32, 1.09, -0.15, 0.15, 1.33, 0.24, 1.65, 1.56, 1.3, 1.32, 1.02]} \ No newline at end of file diff --git a/annotations_1/pCFld9GCy_Q_filtered.json b/annotations_1/pCFld9GCy_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49d3cba47abcadbe8b742813bd39b18aa6ddab62 --- /dev/null +++ b/annotations_1/pCFld9GCy_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.93], [28.0, 28.39], [32.0, 31.62], [34.0, 58.68], [60.0, 61.03], [65.0, 75.57], [76.0, 76.76], [80.0, 80.4], [103.0, 103.72], [109.0, 109.58], [110.0, 120.99], [122.0, 122.88], [125.0, 129.22], [130.0, 133.3], [137.0, 137.71], [139.0, 142.21], [143.0, 144.56], [148.0, 149.47], [151.0, 151.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 92.97, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 77.7, 0.0, 94.95, 92.48, 0.0, 97.54, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 66.85], ["sidetone", 10.35], ["music", 3.55]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.93, 0.39, -0.38, 24.68, 1.03, 10.57, 0.76, 0.4, 0.72, 0.58, 10.99, 0.88, 4.22, 3.3, 0.71, 3.21, 1.56, 1.47, 0.6]} \ No newline at end of file diff --git a/annotations_1/pDj1GM3RRWs_filtered.json b/annotations_1/pDj1GM3RRWs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8884596a16091834fbb841aead45ab8e7f62e066 --- /dev/null +++ b/annotations_1/pDj1GM3RRWs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.39], [4.0, 4.24], [6.0, 6.18], [10.0, 10.2], [12.0, 12.34], [19.0, 20.65], [29.0, 30.55], [31.0, 31.21], [32.0, 33.71], [34.0, 36.8], [38.0, 39.46], [64.0, 70.43], [71.0, 72.15], [76.0, 77.16], [81.0, 81.97], [87.0, 91.93], [94.0, 100.45], [104.0, 108.3], [110.0, 110.37], [111.0, 112.68], [113.0, 121.17], [122.0, 140.0], [141.0, 146.45], [147.0, 149.71], [151.0, 158.28], [159.0, 165.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.32, 0.0, 98.36, 0.0, 0.0, 0.0, 99.96, 92.31, 89.9, 0.0, 0.0, 65.79, 63.21, 58.05, 57.81, 61.67, 45.65], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.26], ["speech", 26.51], ["ambient music", 3.54]]], "duration": [0.39, 0.24, 0.18, 0.2, 0.34, 1.65, 1.55, 0.21, 1.71, 2.8, 1.46, 6.43, 1.15, 1.16, 0.97, 4.93, 6.45, 4.3, 0.37, 1.68, 8.17, 18.0, 5.45, 2.71, 7.28, 6.72]} \ No newline at end of file diff --git a/annotations_1/pDjY4qorZrg_filtered.json b/annotations_1/pDjY4qorZrg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1bcc473f31d3304e6eca0c882b4a72d410e0f48 --- /dev/null +++ b/annotations_1/pDjY4qorZrg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 30.89], [33.0, 46.58], [48.0, 48.24], [49.0, 49.84], [52.0, 54.94], [56.0, 64.03], [65.0, 66.82], [69.0, 69.06], [71.0, 71.69], [74.0, 74.65], [82.0, 82.46], [84.0, 85.5], [91.0, 93.16], [94.0, 93.77], [96.0, 97.38], [106.0, 106.91], [112.0, 113.0], [121.0, 121.44], [125.0, 125.1], [136.0, 137.05], [140.0, 141.2], [157.0, 157.3], [157.0, 157.67], [161.0, 161.33], [165.0, 165.15], [166.0, 166.7], [169.0, 170.6], [175.0, 175.91], [177.0, 177.45], [179.0, 192.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [34.02, 30.9, 0.0, 0.0, 32.71, 31.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.05], "audiomae_on_audioset": [[["music", 44.74], ["theremin", 23.97], ["hum", 13.1]], [["music", 46.25], ["speech", 30.53], ["fly, housefly", 2.83]], null, null, [["whale vocalization", 41.86], ["music", 28.5], ["cattle, bovinae", 2.36]], [["speech", 63.9], ["cattle, bovinae", 3.53], ["explosion", 3.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.3], ["music", 11.06], ["vehicle", 4.72]]], "duration": [20.89, 13.58, 0.24, 0.84, 2.94, 8.03, 1.82, 0.06, 0.69, 0.65, 0.46, 1.5, 2.16, -0.23, 1.38, 0.91, 1.0, 0.44, 0.1, 1.05, 1.2, 0.3, 0.67, 0.33, 0.15, 0.7, 1.6, 0.91, 0.45, 13.11]} \ No newline at end of file diff --git a/annotations_1/pE0vTejjWuk_filtered.json b/annotations_1/pE0vTejjWuk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5adeedd3667b9acef5847cd959fb05a196de9ee5 --- /dev/null +++ b/annotations_1/pE0vTejjWuk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.68], [3.0, 2.89], [5.0, 5.36], [7.0, 9.12], [10.0, 26.2], [28.0, 28.61], [30.0, 30.18], [31.0, 31.41], [33.0, 42.03], [44.0, 44.63], [45.0, 45.76], [47.0, 47.71], [50.0, 50.57], [55.0, 55.54], [58.0, 58.82], [60.0, 60.64], [63.0, 63.46], [66.0, 68.01], [70.0, 69.96], [71.0, 71.64], [73.0, 73.72], [75.0, 76.89], [78.0, 79.15], [80.0, 81.38], [84.0, 84.05], [87.0, 88.11], [90.0, 90.39], [92.0, 92.13], [97.0, 97.23], [98.0, 98.76], [100.0, 101.63]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.35, 35.58, 0.0, 0.0, 0.0, 54.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["liquid", 11.82], ["mains hum", 10.66], ["whale vocalization", 9.59]], [["horse", 44.74], ["clip-clop", 25.97], ["hum", 8.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.68, -0.11, 0.36, 2.12, 16.2, 0.61, 0.18, 0.41, 9.03, 0.63, 0.76, 0.71, 0.57, 0.54, 0.82, 0.64, 0.46, 2.01, -0.04, 0.64, 0.72, 1.89, 1.15, 1.38, 0.05, 1.11, 0.39, 0.13, 0.23, 0.76, 1.63]} \ No newline at end of file diff --git a/annotations_1/pFXW-7VNngk_filtered.json b/annotations_1/pFXW-7VNngk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a46f94d309971d513bc31f179cfbf77b8415b636 --- /dev/null +++ b/annotations_1/pFXW-7VNngk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.29], [13.0, 20.87], [25.0, 29.79], [30.0, 44.36], [54.0, 55.11], [72.0, 73.45], [74.0, 74.65], [77.0, 77.18], [79.0, 79.15], [87.0, 91.61], [98.0, 98.74], [101.0, 101.7], [109.0, 109.81], [113.0, 119.31], [120.0, 119.79], [120.0, 120.26], [129.0, 131.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 33.34, 32.96, 30.9, 0.0, 0.0, 0.0, 0.0, 0.0, 31.18, 0.0, 0.0, 0.0, 47.46, 0.0, 0.0, 40.64], "audiomae_on_audioset": [null, [["music", 70.82], ["theremin", 5.15], ["electronic music", 4.52]], [["music", 67.05], ["electronic music", 7.26], ["speech", 6.21]], [["music", 56.68], ["police car (siren)", 9.74], ["siren", 8.19]], null, null, null, null, null, [["music", 55.14], ["hum", 15.7], ["throbbing", 7.29]], null, null, null, [["music", 32.77], ["hum", 26.36], ["mains hum", 17.6]], null, null, [["hum", 40.82], ["mains hum", 19.77], ["music", 9.1]]], "duration": [0.29, 7.87, 4.79, 14.36, 1.11, 1.45, 0.65, 0.18, 0.15, 4.61, 0.74, 0.7, 0.81, 6.31, -0.21, 0.26, 2.9]} \ No newline at end of file diff --git a/annotations_1/pHBKmT6eNGw_filtered.json b/annotations_1/pHBKmT6eNGw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3828ce7561c154ec87e32cc3d18c772818393eb --- /dev/null +++ b/annotations_1/pHBKmT6eNGw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.19], [14.0, 14.66], [16.0, 17.17], [20.0, 23.36], [26.0, 26.23], [28.0, 28.68], [30.0, 32.76], [35.0, 38.18], [39.0, 44.63], [48.0, 52.47], [60.0, 60.22], [60.0, 64.49], [66.0, 65.72], [66.0, 65.82], [67.0, 67.64], [70.0, 69.87], [71.0, 71.39], [72.0, 72.59], [74.0, 74.16], [75.0, 75.56], [78.0, 78.14], [80.0, 81.26], [82.0, 82.98], [88.0, 88.43], [89.0, 89.26], [90.0, 91.37], [92.0, 92.65], [95.0, 95.15], [98.0, 99.42], [103.0, 103.65], [112.0, 112.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 68.93, 0.0, 0.0, 97.64, 89.9, 99.68, 83.34, 0.0, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.19, 0.66, 1.17, 3.36, 0.23, 0.68, 2.76, 3.18, 5.63, 4.47, 0.22, 4.49, -0.28, -0.18, 0.64, -0.13, 0.39, 0.59, 0.16, 0.56, 0.14, 1.26, 0.98, 0.43, 0.26, 1.37, 0.65, 0.15, 1.42, 0.65, 0.21]} \ No newline at end of file diff --git a/annotations_1/pHXL7yantDY_filtered.json b/annotations_1/pHXL7yantDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac2eb5e2da935c76087e81e74e005ce4b99daa01 --- /dev/null +++ b/annotations_1/pHXL7yantDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.62], [8.0, 9.69], [12.0, 12.19], [12.0, 16.88], [22.0, 23.65], [26.0, 30.59], [35.0, 36.22], [37.0, 37.71], [38.0, 39.02], [39.0, 43.14], [44.0, 44.81], [45.0, 45.5], [47.0, 49.35], [51.0, 51.04], [55.0, 60.91], [64.0, 63.85], [65.0, 65.65], [71.0, 72.0], [74.0, 80.5], [81.0, 82.12], [84.0, 84.35], [84.0, 87.25], [88.0, 88.62], [91.0, 93.7], [95.0, 95.27], [98.0, 100.63], [101.0, 100.67], [104.0, 106.57], [108.0, 108.14], [111.0, 126.33], [127.0, 127.63], [132.0, 132.54], [133.0, 137.32], [140.0, 140.76], [143.0, 144.21], [147.0, 149.89], [150.0, 150.77], [153.0, 157.33], [160.0, 160.44], [163.0, 163.8], [167.0, 181.6], [184.0, 185.14], [187.0, 190.02], [193.0, 194.98], [196.0, 196.57], [202.0, 203.15], [206.0, 206.78], [209.0, 209.63], [212.0, 217.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 64.52, 0.0, 60.51, 0.0, 0.0, 0.0, 75.72, 0.0, 0.0, 66.03, 0.0, 32.16, 0.0, 0.0, 0.0, 30.94, 0.0, 0.0, 31.67, 0.0, 31.37, 0.0, 31.72, 0.0, 29.51, 0.0, 31.8, 0.0, 0.0, 30.52, 0.0, 0.0, 30.3, 0.0, 31.82, 0.0, 0.0, 32.46, 0.0, 30.83, 0.0, 0.0, 0.0, 0.0, 0.0, 31.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.26], ["throbbing", 5.93], ["hum", 4.32]], null, null, null, [["music", 71.36], ["reggae", 4.28], ["boing", 3.52]], null, null, [["music", 59.86], ["boing", 15.32], ["didgeridoo", 2.35]], null, [["music", 63.37], ["drum machine", 3.55], ["sampler", 3.16]], null, [["music", 47.92], ["boing", 5.76], ["mosquito", 4.14]], null, [["music", 45.08], ["musical instrument", 3.7], ["livestock, farm animals, working animals", 2.65]], null, [["music", 87.34], ["musical instrument", 2.74], ["piano", 0.68]], null, null, [["music", 55.44], ["boing", 20.2], ["speech", 4.27]], null, null, [["music", 51.1], ["dubstep", 15.24], ["cacophony", 4.46]], null, [["music", 64.43], ["musical instrument", 2.42], ["video game music", 1.56]], null, null, [["music", 82.7], ["sampler", 1.88], ["didgeridoo", 1.67]], null, [["music", 70.71], ["drum machine", 3.63], ["singing", 2.43]], null, null, null, null, null, [["music", 51.96], ["speech", 9.4], ["boing", 5.77]]], "duration": [1.62, 1.69, 0.19, 4.88, 1.65, 4.59, 1.22, 0.71, 1.02, 4.14, 0.81, 0.5, 2.35, 0.04, 5.91, -0.15, 0.65, 1.0, 6.5, 1.12, 0.35, 3.25, 0.62, 2.7, 0.27, 2.63, -0.33, 2.57, 0.14, 15.33, 0.63, 0.54, 4.32, 0.76, 1.21, 2.89, 0.77, 4.33, 0.44, 0.8, 14.6, 1.14, 3.02, 1.98, 0.57, 1.15, 0.78, 0.63, 5.04]} \ No newline at end of file diff --git a/annotations_1/pHrp2OM19t4_filtered.json b/annotations_1/pHrp2OM19t4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d55fb35c8f8a5cfff6bde8d4084602f61cbb7f75 --- /dev/null +++ b/annotations_1/pHrp2OM19t4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 24.14], [25.0, 48.1], [50.0, 53.62], [54.0, 67.47], [69.0, 73.57], [76.0, 86.7], [101.0, 103.25], [104.0, 103.99], [104.0, 105.19], [110.0, 109.76], [118.0, 125.78], [133.0, 132.78], [140.0, 140.93], [144.0, 144.0], [146.0, 149.35], [150.0, 150.97], [151.0, 152.14], [164.0, 178.95], [179.0, 179.04]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [28.82, 29.0, 31.57, 29.39, 29.72, 30.31, 31.71, 0.0, 0.0, 0.0, 29.18, 0.0, 0.0, 0.0, 31.91, 0.0, 0.0, 29.0, 0.0], "audiomae_on_audioset": [[["mosquito", 17.66], ["music", 12.98], ["speech", 12.86]], [["music", 55.11], ["speech", 14.74], ["tabla", 2.61]], [["hum", 42.69], ["throbbing", 32.95], ["mains hum", 15.19]], [["music", 70.11], ["speech", 6.19], ["cacophony", 2.42]], [["fly, housefly", 21.7], ["cattle, bovinae", 16.86], ["moo", 15.33]], [["music", 61.14], ["buzz", 6.08], ["throbbing", 5.2]], [["music", 59.79], ["speech", 20.22], ["musical instrument", 1.13]], null, null, null, [["music", 52.94], ["animal", 18.96], ["dog", 7.7]], null, null, null, [["music", 55.67], ["musical instrument", 10.96], ["plucked string instrument", 9.42]], null, null, [["fly, housefly", 39.11], ["insect", 18.21], ["mosquito", 16.0]], null], "duration": [6.14, 23.1, 3.62, 13.47, 4.57, 10.7, 2.25, -0.01, 1.19, -0.24, 7.78, -0.22, 0.93, 0.0, 3.35, 0.97, 1.14, 14.95, 0.04]} \ No newline at end of file diff --git a/annotations_1/pJCgeOAKXyg_filtered.json b/annotations_1/pJCgeOAKXyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45aa14da90142558c3a4cee60ec883dc6f326f92 --- /dev/null +++ b/annotations_1/pJCgeOAKXyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.06], [34.0, 34.18], [37.0, 36.9], [59.0, 59.95], [61.0, 68.69], [70.0, 78.22], [81.0, 120.75], [122.0, 128.31], [129.0, 138.91], [141.0, 202.2], [203.0, 208.79], [210.0, 225.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.91, 32.32, 0.0, 29.47, 28.43, 0.0, 28.36, 28.54], "audiomae_on_audioset": [null, null, null, null, [["music", 62.39], ["speech", 7.38], ["electronic music", 5.42]], [["music", 55.74], ["ambient music", 11.78], ["electronic music", 5.87]], null, [["hum", 29.94], ["music", 25.5], ["throbbing", 25.47]], [["throbbing", 27.08], ["music", 25.37], ["hum", 18.22]], null, [["livestock, farm animals, working animals", 40.85], ["cattle, bovinae", 14.4], ["moo", 10.05]], [["music", 73.75], ["speech", 3.46], ["hum", 3.17]]], "duration": [0.06, 0.18, -0.1, 0.95, 7.69, 8.22, 39.75, 6.31, 9.91, 61.2, 5.79, 15.61]} \ No newline at end of file diff --git a/annotations_1/pJFZLCoqB9w_filtered.json b/annotations_1/pJFZLCoqB9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b59d40e8f1584535fdf4faf44f7dac041b2d4164 --- /dev/null +++ b/annotations_1/pJFZLCoqB9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.66], [8.0, 11.8], [12.0, 13.42], [14.0, 19.97], [21.0, 21.93], [23.0, 39.14], [40.0, 40.24], [46.0, 52.03], [53.0, 53.76], [58.0, 59.04], [61.0, 61.06], [65.0, 65.03], [67.0, 67.59], [68.0, 69.69], [71.0, 71.56], [73.0, 74.98], [78.0, 79.84], [81.0, 82.95], [84.0, 84.55], [87.0, 88.45], [89.0, 90.63], [96.0, 97.23], [98.0, 98.58], [101.0, 102.36], [104.0, 104.33], [108.0, 108.89], [110.0, 112.67], [114.0, 115.79], [124.0, 128.14]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 99.71, 0.0, 95.64, 0.0, 64.75, 0.0, 40.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 41.12], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 39.13], ["stomach rumble", 14.0], ["sidetone", 11.49]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 55.18], ["hum", 6.98], ["throbbing", 6.91]]], "duration": [0.66, 3.8, 1.42, 5.97, 0.93, 16.14, 0.24, 6.03, 0.76, 1.04, 0.06, 0.03, 0.59, 1.69, 0.56, 1.98, 1.84, 1.95, 0.55, 1.45, 1.63, 1.23, 0.58, 1.36, 0.33, 0.89, 2.67, 1.79, 4.14]} \ No newline at end of file diff --git a/annotations_1/pJIGy4zHo6E_filtered.json b/annotations_1/pJIGy4zHo6E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dbcec2dda3092a2b38bc7e6897c737a8d549233 --- /dev/null +++ b/annotations_1/pJIGy4zHo6E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.65], [5.0, 6.45], [8.0, 8.19], [9.0, 9.64], [10.0, 16.87], [18.0, 58.08], [59.0, 78.81], [81.0, 86.34], [87.0, 88.42], [90.0, 97.95], [102.0, 112.11], [118.0, 121.46]], "keep_status": [false, false, false, false, true, false, false, true, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.53, 0.0, 33.75, 31.18, 0.0, 31.36, 32.16, 30.79], "audiomae_on_audioset": [null, null, null, null, [["music", 53.1], ["livestock, farm animals, working animals", 9.72], ["groan", 4.72]], null, [["hum", 45.66], ["throbbing", 16.02], ["music", 11.37]], [["animal", 16.98], ["bow-wow", 12.81], ["canidae, dogs, wolves", 11.01]], null, [["music", 58.3], ["animal", 5.57], ["theremin", 5.24]], [["vehicle", 34.78], ["car", 6.62], ["music", 6.5]], [["music", 48.68], ["musical instrument", 5.12], ["brass instrument", 4.27]]], "duration": [1.65, 1.45, 0.19, 0.64, 6.87, 40.08, 19.81, 5.34, 1.42, 7.95, 10.11, 3.46]} \ No newline at end of file diff --git a/annotations_1/pJImKCcPIsU_filtered.json b/annotations_1/pJImKCcPIsU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..474b39c1c796901f04c5d8498f5f4e2741746ebf --- /dev/null +++ b/annotations_1/pJImKCcPIsU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.62], [8.0, 10.64], [12.0, 12.68], [13.0, 14.91], [16.0, 16.55], [17.0, 19.89], [29.0, 29.71], [37.0, 38.53], [42.0, 42.69], [44.0, 45.55], [46.0, 49.25], [50.0, 53.72], [57.0, 57.43], [67.0, 67.2], [70.0, 72.79], [75.0, 76.54], [77.0, 78.33], [83.0, 83.98], [84.0, 84.75], [87.0, 87.4], [89.0, 91.15], [93.0, 94.15], [98.0, 99.35], [107.0, 116.21], [117.0, 117.96], [121.0, 120.99], [124.0, 124.51], [125.0, 126.99], [129.0, 129.25], [131.0, 130.89], [139.0, 139.43], [146.0, 147.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.52, 99.62, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 77.36, 72.16, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0, 38.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 55.32], ["hum", 15.61], ["sidetone", 6.13]], null, null, null, null, null, null, null, null], "duration": [4.62, 2.64, 0.68, 1.91, 0.55, 2.89, 0.71, 1.53, 0.69, 1.55, 3.25, 3.72, 0.43, 0.2, 2.79, 1.54, 1.33, 0.98, 0.75, 0.4, 2.15, 1.15, 1.35, 9.21, 0.96, -0.01, 0.51, 1.99, 0.25, -0.11, 0.43, 1.12]} \ No newline at end of file diff --git a/annotations_1/pK35em6gl0Q_filtered.json b/annotations_1/pK35em6gl0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4bb3134234458efb339168e07ed5369477b79986 --- /dev/null +++ b/annotations_1/pK35em6gl0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.91], [16.0, 16.36], [17.0, 23.45], [24.0, 27.06], [28.0, 29.93], [32.0, 32.49], [33.0, 34.13], [35.0, 38.16], [39.0, 39.87], [41.0, 41.72], [43.0, 45.06], [48.0, 49.62], [51.0, 52.15], [53.0, 54.04], [54.0, 55.17], [56.0, 57.47], [58.0, 66.51], [67.0, 76.11], [77.0, 78.53], [80.0, 82.17], [83.0, 93.21], [94.0, 96.18], [100.0, 102.56], [104.0, 105.19], [106.0, 116.36], [117.0, 116.95], [117.0, 118.18], [119.0, 121.69], [125.0, 127.58], [129.0, 129.34], [130.0, 131.09], [133.0, 133.42], [134.0, 135.6], [138.0, 139.24], [140.0, 141.15], [142.0, 143.46], [147.0, 147.36], [148.0, 149.93], [150.0, 157.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [66.88, 0.0, 82.43, 95.09, 0.0, 0.0, 0.0, 55.46, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 0.0, 0.0, 36.97, 31.68, 0.0, 99.1, 58.55, 99.31, 99.52, 0.0, 99.4, 0.0, 0.0, 52.33, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 23.58], ["mains hum", 22.12], ["speech", 20.66]], [["speech", 38.66], ["mains hum", 13.45], ["music", 10.54]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.91, 0.36, 6.45, 3.06, 1.93, 0.49, 1.13, 3.16, 0.87, 0.72, 2.06, 1.62, 1.15, 1.04, 1.17, 1.47, 8.51, 9.11, 1.53, 2.17, 10.21, 2.18, 2.56, 1.19, 10.36, -0.05, 1.18, 2.69, 2.58, 0.34, 1.09, 0.42, 1.6, 1.24, 1.15, 1.46, 0.36, 1.93, 7.27]} \ No newline at end of file diff --git a/annotations_1/pKHAhc31MOI_filtered.json b/annotations_1/pKHAhc31MOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e04f55bf2db9224512124d2da284420220424db1 --- /dev/null +++ b/annotations_1/pKHAhc31MOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.02], [3.0, 12.02], [13.0, 13.83], [17.0, 19.26], [32.0, 34.91], [37.0, 38.62], [52.0, 52.76], [56.0, 56.74], [61.0, 62.28], [76.0, 76.81], [78.0, 78.65], [85.0, 98.58], [99.0, 104.73], [107.0, 108.11], [110.0, 111.79], [115.0, 115.5], [116.0, 116.73], [119.0, 121.58], [133.0, 134.33], [143.0, 148.71], [151.0, 152.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.44, 0.0, 99.56, 96.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.64, 99.62, 0.0, 0.0, 0.0, 0.0, 99.8, 0.0, 99.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.02, 9.02, 0.83, 2.26, 2.91, 1.62, 0.76, 0.74, 1.28, 0.81, 0.65, 13.58, 5.73, 1.11, 1.79, 0.5, 0.73, 2.58, 1.33, 5.71, 1.86]} \ No newline at end of file diff --git a/annotations_1/pKsa_9TFG48_filtered.json b/annotations_1/pKsa_9TFG48_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e213ab32dda989b7fc0436d181748d3ba5149d20 --- /dev/null +++ b/annotations_1/pKsa_9TFG48_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 17.91], [22.0, 22.64], [26.0, 27.08]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [-0.09, 0.64, 1.08]} \ No newline at end of file diff --git a/annotations_1/pLlcwabi5AQ_filtered.json b/annotations_1/pLlcwabi5AQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63e945bb6a6623e70b8e104e2e3dd87845defc6f --- /dev/null +++ b/annotations_1/pLlcwabi5AQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.5], [11.0, 11.75], [39.0, 39.24], [48.0, 47.73], [68.0, 68.86], [70.0, 70.7], [84.0, 85.01], [98.0, 98.64], [132.0, 132.63], [136.0, 137.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.75, 0.24, -0.27, 0.86, 0.7, 1.01, 0.64, 0.63, 1.02]} \ No newline at end of file diff --git a/annotations_1/pLooDtjrhv8_filtered.json b/annotations_1/pLooDtjrhv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11f6f54ec00547c95340d4c92940c6d4a5b73cd9 --- /dev/null +++ b/annotations_1/pLooDtjrhv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.59], [5.0, 7.64], [13.0, 12.75], [17.0, 17.51], [19.0, 20.16], [24.0, 25.07], [26.0, 26.06], [27.0, 31.75], [33.0, 33.56], [34.0, 34.3], [35.0, 35.73], [45.0, 45.25], [50.0, 51.12], [60.0, 60.35], [63.0, 63.15], [78.0, 78.51], [84.0, 84.57], [87.0, 87.44], [87.0, 87.51], [100.0, 99.99], [101.0, 104.82], [108.0, 116.46], [119.0, 130.84], [142.0, 146.45], [146.0, 147.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 55.74, 0.0, 0.0, 0.0, 0.0, 0.0, 59.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.71, 28.81, 28.85, 28.88, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 21.25], ["cattle, bovinae", 19.15], ["music", 18.41]], [["music", 51.19], ["electronic music", 12.07], ["speech", 10.91]], [["speech", 48.65], ["music", 21.75], ["electronic music", 8.09]], [["speech", 22.39], ["cattle, bovinae", 21.75], ["moo", 12.78]], null], "duration": [-0.41, 2.64, -0.25, 0.51, 1.16, 1.07, 0.06, 4.75, 0.56, 0.3, 0.73, 0.25, 1.12, 0.35, 0.15, 0.51, 0.57, 0.44, 0.51, -0.01, 3.82, 8.46, 11.84, 4.45, 1.23]} \ No newline at end of file diff --git a/annotations_1/pLqoZtmyxxk_filtered.json b/annotations_1/pLqoZtmyxxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad42a0b9068ed39f41eac6030d53cce4274710f8 --- /dev/null +++ b/annotations_1/pLqoZtmyxxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 11.25], [13.0, 14.52], [21.0, 24.97], [26.0, 27.03], [29.0, 36.54], [40.0, 42.09], [47.0, 47.43], [48.0, 47.9], [48.0, 47.98], [48.0, 53.08], [55.0, 58.35], [61.0, 74.82], [76.0, 80.76], [86.0, 87.0], [89.0, 124.93], [127.0, 127.87]], "keep_status": [true, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false], "silence_prob": [36.05, 0.0, 67.63, 0.0, 37.73, 54.43, 0.0, 0.0, 0.0, 33.63, 40.28, 38.9, 35.82, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 20.59], ["animal", 14.0], ["livestock, farm animals, working animals", 9.72]], null, null, null, [["music", 58.58], ["synthesizer", 7.48], ["speech", 4.71]], null, null, null, null, [["speech", 26.8], ["music", 22.17], ["cattle, bovinae", 5.0]], [["speech", 25.14], ["music", 19.2], ["radio", 7.16]], [["speech", 34.35], ["music", 31.84], ["radio", 3.98]], [["livestock, farm animals, working animals", 19.33], ["cattle, bovinae", 19.3], ["moo", 18.03]], null, null, null], "duration": [10.25, 1.52, 3.97, 1.03, 7.54, 2.09, 0.43, -0.1, -0.02, 5.08, 3.35, 13.82, 4.76, 1.0, 35.93, 0.87]} \ No newline at end of file diff --git a/annotations_1/pLra48c-SuA_filtered.json b/annotations_1/pLra48c-SuA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9aa77b8523c6b5f2247fb11de364e5f81c88d3ce --- /dev/null +++ b/annotations_1/pLra48c-SuA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 49.33], [52.0, 52.83], [54.0, 57.94], [66.0, 66.55], [68.0, 76.89], [79.0, 78.95], [81.0, 89.8]], "keep_status": [false, false, true, false, true, false, true], "silence_prob": [0.0, 0.0, 41.28, 0.0, 34.58, 0.0, 31.7], "audiomae_on_audioset": [null, null, [["music", 40.33], ["ambient music", 15.48], ["gong", 11.91]], null, [["rumble", 30.04], ["music", 14.13], ["hum", 12.27]], null, [["music", 30.99], ["hum", 20.05], ["mains hum", 11.59]]], "duration": [40.33, 0.83, 3.94, 0.55, 8.89, -0.05, 8.8]} \ No newline at end of file diff --git a/annotations_1/pM87ObBNOk4_filtered.json b/annotations_1/pM87ObBNOk4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..622886fa5781820012a7f0783e13b4334f24a7d1 --- /dev/null +++ b/annotations_1/pM87ObBNOk4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 67.98], [71.0, 70.95], [75.0, 75.24], [88.0, 88.48], [91.0, 95.86], [96.0, 97.02]], "keep_status": [false, false, false, false, true, false], "silence_prob": [40.04, 0.0, 0.0, 0.0, 37.02, 0.0], "audiomae_on_audioset": [[["speech", 55.52], ["sidetone", 10.56], ["whip", 5.76]], null, null, null, [["frog", 17.07], ["fart", 15.19], ["grunt", 8.85]], null], "duration": [17.98, -0.05, 0.24, 0.48, 4.86, 1.02]} \ No newline at end of file diff --git a/annotations_1/pN5RlyFWJBA_filtered.json b/annotations_1/pN5RlyFWJBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abd30550909167e3b065ed0882654637b6f333da --- /dev/null +++ b/annotations_1/pN5RlyFWJBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 38.28], [42.0, 42.3], [45.0, 45.3], [49.0, 49.67], [51.0, 52.34], [56.0, 72.71], [77.0, 78.48], [80.0, 83.47], [88.0, 131.63]], "keep_status": [true, false, false, false, false, true, false, false, false], "silence_prob": [32.38, 0.0, 0.0, 0.0, 0.0, 34.26, 0.0, 34.0, 0.0], "audiomae_on_audioset": [[["music", 19.69], ["didgeridoo", 11.66], ["fly, housefly", 11.16]], null, null, null, null, [["insect", 29.22], ["fly, housefly", 19.71], ["music", 12.12]], null, [["music", 69.0], ["throbbing", 4.79], ["electronic music", 3.45]], null], "duration": [15.28, 0.3, 0.3, 0.67, 1.34, 16.71, 1.48, 3.47, 43.63]} \ No newline at end of file diff --git a/annotations_1/pPCq9SIyHqE_filtered.json b/annotations_1/pPCq9SIyHqE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..966d56714e89d1943afc2ad355936b41b94426ea --- /dev/null +++ b/annotations_1/pPCq9SIyHqE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.99], [6.0, 6.98], [8.0, 8.51], [11.0, 17.05], [21.0, 21.73], [24.0, 30.89], [34.0, 35.72], [37.0, 50.53], [53.0, 68.27], [71.0, 103.86], [104.0, 106.03], [107.0, 113.04], [113.0, 113.86], [116.0, 119.97], [121.0, 121.31], [122.0, 123.21], [126.0, 132.04], [133.0, 136.8], [142.0, 142.21]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 34.49, 0.0, 30.23, 0.0, 30.89, 34.16, 0.0, 32.22, 32.4, 0.0, 30.78, 0.0, 0.0, 32.25, 32.58, 0.0], "audiomae_on_audioset": [null, null, null, [["throbbing", 27.37], ["music", 27.01], ["hum", 22.3]], null, [["car", 37.44], ["vehicle", 20.77], ["hum", 7.95]], null, [["music", 79.3], ["hum", 3.51], ["throbbing", 3.39]], [["speech", 45.15], ["music", 23.19], ["door", 6.09]], null, [["music", 44.87], ["speech", 21.65], ["hum", 7.08]], [["music", 43.9], ["animal", 7.15], ["dog", 6.74]], null, [["speech", 27.1], ["music", 25.39], ["gunshot, gunfire", 10.73]], null, null, [["hum", 28.63], ["throbbing", 25.55], ["music", 24.48]], [["speech", 31.33], ["music", 12.52], ["hum", 11.75]], null], "duration": [0.99, 0.98, 0.51, 6.05, 0.73, 6.89, 1.72, 13.53, 15.27, 32.86, 2.03, 6.04, 0.86, 3.97, 0.31, 1.21, 6.04, 3.8, 0.21]} \ No newline at end of file diff --git a/annotations_1/pPcxCk8YBVs_filtered.json b/annotations_1/pPcxCk8YBVs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b3212c005dd0feacd1b57a400afcb769ad2663d --- /dev/null +++ b/annotations_1/pPcxCk8YBVs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.3], [27.0, 27.18], [29.0, 29.35], [30.0, 37.86], [40.0, 40.15], [42.0, 43.04], [44.0, 63.96], [65.0, 65.5], [68.0, 69.6], [72.0, 77.31], [82.0, 87.42], [90.0, 91.13], [93.0, 108.8], [111.0, 126.37], [129.0, 144.78], [145.0, 146.28], [148.0, 148.17], [150.0, 150.01], [151.0, 151.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.71, 0.0, 0.0, 30.6, 0.0, 0.0, 30.41, 32.54, 0.0, 29.29, 29.05, 33.48, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 41.59], ["speech", 20.68], ["hum", 9.75]], null, null, [["mains hum", 39.19], ["hum", 19.46], ["music", 12.59]], null, null, [["throbbing", 28.13], ["music", 27.19], ["hum", 21.72]], [["rumble", 28.22], ["hum", 18.38], ["mains hum", 17.07]], null, [["music", 34.86], ["mains hum", 24.31], ["hum", 22.1]], [["music", 77.47], ["whip", 3.09], ["outside, rural or natural", 2.2]], [["music", 66.19], ["scary music", 8.09], ["ambient music", 4.11]], null, null, null, null], "duration": [1.3, 0.18, 0.35, 7.86, 0.15, 1.04, 19.96, 0.5, 1.6, 5.31, 5.42, 1.13, 15.8, 15.37, 15.78, 1.28, 0.17, 0.01, 0.82]} \ No newline at end of file diff --git a/annotations_1/pQv0ZtpRdNk_filtered.json b/annotations_1/pQv0ZtpRdNk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..131420d278c9167687bc5e7c378ce4ce06f489f9 --- /dev/null +++ b/annotations_1/pQv0ZtpRdNk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [4.0, 6.15], [7.0, 9.53], [15.0, 20.11], [24.0, 24.51], [32.0, 32.76], [35.0, 39.24], [41.0, 44.02], [46.0, 47.48], [49.0, 52.02], [55.0, 55.46], [59.0, 59.95], [62.0, 62.92], [63.0, 63.1], [64.0, 65.18], [67.0, 68.4], [69.0, 71.46], [72.0, 75.19], [77.0, 79.39], [82.0, 82.7], [87.0, 87.78], [92.0, 93.5], [98.0, 102.96], [108.0, 116.43], [120.0, 120.02], [124.0, 129.12], [132.0, 132.48], [134.0, 135.38], [136.0, 136.76], [138.0, 139.67], [143.0, 143.16], [145.0, 145.99], [148.0, 149.54]], "keep_status": [false, false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 78.89, 68.67, 51.12, 0.0, 0.0, 32.62, 32.4, 0.0, 41.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 55.96, 52.16, 0.0, 0.0, 0.0, 42.69, 40.07, 0.0, 36.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["crowd", 26.19], ["cheering", 9.75], ["vehicle", 8.61]], [["vehicle", 22.58], ["car", 5.8], ["motorcycle", 5.25]], null, [["speech", 45.3], ["music", 21.73], ["busy signal", 2.81]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.08], ["singing bowl", 15.16], ["theremin", 10.77]], [["music", 46.14], ["ambient music", 12.3], ["synthesizer", 5.73]], null, [["music", 41.32], ["whale vocalization", 20.14], ["theremin", 16.36]], null, null, null, null, null, null, null], "duration": [0.72, 2.15, 2.53, 5.11, 0.51, 0.76, 4.24, 3.02, 1.48, 3.02, 0.46, 0.95, 0.92, 0.1, 1.18, 1.4, 2.46, 3.19, 2.39, 0.7, 0.78, 1.5, 4.96, 8.43, 0.02, 5.12, 0.48, 1.38, 0.76, 1.67, 0.16, 0.99, 1.54]} \ No newline at end of file diff --git a/annotations_1/pR8Lt5DyU88_filtered.json b/annotations_1/pR8Lt5DyU88_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd2417176084f3ac38ae1fc80f3411fba130c716 --- /dev/null +++ b/annotations_1/pR8Lt5DyU88_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.51], [24.0, 24.6], [35.0, 35.36], [47.0, 49.91], [58.0, 58.21], [65.0, 70.73], [90.0, 92.8], [114.0, 114.57], [122.0, 123.42], [127.0, 127.18], [129.0, 130.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 48.95, 0.0, 56.18, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 62.42], ["synthesizer", 7.26], ["musical instrument", 2.53]], null, null, null, null, null, null, null], "duration": [0.51, 0.6, 0.36, 2.91, 0.21, 5.73, 2.8, 0.57, 1.42, 0.18, 1.57]} \ No newline at end of file diff --git a/annotations_1/pS-KE1LXpXU_filtered.json b/annotations_1/pS-KE1LXpXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f3a098c0f488cb57e6aac32cfc8112084800b65 --- /dev/null +++ b/annotations_1/pS-KE1LXpXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.37], [3.0, 4.53], [5.0, 6.13], [9.0, 12.18], [14.0, 14.88], [23.0, 23.52], [25.0, 25.34], [29.0, 29.56], [30.0, 32.22], [35.0, 36.69], [42.0, 42.67], [45.0, 53.0], [54.0, 54.84], [56.0, 57.28], [61.0, 61.16], [66.0, 66.85], [68.0, 68.44], [70.0, 70.34], [71.0, 71.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 41.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 87.59], ["speech", 8.8], ["telephone", 0.72]], null, null, null, null, null, null, null], "duration": [1.37, 1.53, 1.13, 3.18, 0.88, 0.52, 0.34, 0.56, 2.22, 1.69, 0.67, 8.0, 0.84, 1.28, 0.16, 0.85, 0.44, 0.34, 0.73]} \ No newline at end of file diff --git a/annotations_1/pUPliO3qy04_filtered.json b/annotations_1/pUPliO3qy04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac3fe63dc4b00e1bfcd7c2da578c3b9c32ee4040 --- /dev/null +++ b/annotations_1/pUPliO3qy04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.42], [12.0, 14.62], [16.0, 18.57], [20.0, 23.62], [25.0, 28.36], [29.0, 31.72], [32.0, 33.88], [35.0, 36.88], [39.0, 45.52], [48.0, 53.25], [54.0, 65.58], [67.0, 67.64], [69.0, 70.73], [72.0, 76.52], [77.0, 79.0], [80.0, 83.08], [83.0, 88.82], [90.0, 95.91], [97.0, 99.32], [101.0, 101.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 61.27, 64.41, 65.91, 76.04, 75.39, 0.0, 0.0, 77.2, 72.75, 61.47, 0.0, 0.0, 45.24, 53.4, 74.29, 46.26, 73.36, 56.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.67], ["didgeridoo", 5.6], ["singing bowl", 4.97]], null, null, [["music", 44.5], ["theremin", 24.05], ["speech", 8.78]], null, null, null], "duration": [0.42, 2.62, 2.57, 3.62, 3.36, 2.72, 1.88, 1.88, 6.52, 5.25, 11.58, 0.64, 1.73, 4.52, 2.0, 3.08, 5.82, 5.91, 2.32, 0.85]} \ No newline at end of file diff --git a/annotations_1/pUmu0VJuwOA_filtered.json b/annotations_1/pUmu0VJuwOA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2df7e248f1e53d00f41243fec9ffa19b2ff01345 --- /dev/null +++ b/annotations_1/pUmu0VJuwOA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.37], [4.0, 4.7], [5.0, 7.69], [10.0, 12.41], [13.0, 13.42], [15.0, 16.23], [17.0, 17.88], [34.0, 35.16], [37.0, 37.2], [40.0, 40.36], [50.0, 51.04], [55.0, 55.24], [55.0, 56.24], [58.0, 58.92], [60.0, 60.69], [63.0, 66.61], [68.0, 68.3], [69.0, 70.04], [83.0, 85.68], [86.0, 88.53], [89.0, 91.37], [94.0, 96.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 44.96, 50.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.01, 0.0, 0.0, 56.18, 51.18, 29.71, 40.19], "audiomae_on_audioset": [null, null, [["speech", 60.76], ["clang", 5.29], ["telephone", 4.3]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.38], ["radio", 10.17], ["music", 8.98]], null, null, null, null, [["music", 41.77], ["explosion", 14.0], ["speech", 10.95]], [["noise", 53.79], ["radio", 12.57], ["sidetone", 7.12]]], "duration": [1.37, 0.7, 2.69, 2.41, 0.42, 1.23, 0.88, 1.16, 0.2, 0.36, 1.04, 0.24, 1.24, 0.92, 0.69, 3.61, 0.3, 1.04, 2.68, 2.53, 2.37, 2.79]} \ No newline at end of file diff --git a/annotations_1/pVB70-zPv5E_filtered.json b/annotations_1/pVB70-zPv5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f00903343030f6dcd2e57f8a9918802bfb170fac --- /dev/null +++ b/annotations_1/pVB70-zPv5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 81.11], [84.0, 89.51], [90.0, 91.37]], "keep_status": [false, true, false], "silence_prob": [0.0, 35.77, 0.0], "audiomae_on_audioset": [null, [["music", 34.98], ["hum", 15.21], ["mains hum", 12.45]], null], "duration": [0.11, 5.51, 1.37]} \ No newline at end of file diff --git a/annotations_1/pVqOcGEbZvo_filtered.json b/annotations_1/pVqOcGEbZvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e9d7b896aeb7b626b2ed2a040b4250ad974c535 --- /dev/null +++ b/annotations_1/pVqOcGEbZvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[94.0, 98.61], [99.0, 98.68], [99.0, 100.03], [101.0, 102.44]], "keep_status": [true, false, false, false], "silence_prob": [31.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 33.02], ["animal", 6.97], ["beatboxing", 3.47]], null, null, null], "duration": [4.61, -0.32, 1.03, 1.44]} \ No newline at end of file diff --git a/annotations_1/pW-ZHlM3RxI_filtered.json b/annotations_1/pW-ZHlM3RxI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15bf869a748cc422d44bbca1c1b66ccfdf53e438 --- /dev/null +++ b/annotations_1/pW-ZHlM3RxI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.0], [6.0, 8.51], [9.0, 12.36], [14.0, 15.52], [18.0, 18.45], [19.0, 19.9], [20.0, 22.17], [23.0, 25.39], [29.0, 30.28], [36.0, 36.29], [51.0, 51.44], [66.0, 66.83], [79.0, 83.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 72.6, 100.0, 0.0, 0.0, 0.0, 99.78, 97.83, 0.0, 0.0, 0.0, 0.0, 99.94], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 2.51, 3.36, 1.52, 0.45, 0.9, 2.17, 2.39, 1.28, 0.29, 0.44, 0.83, 4.71]} \ No newline at end of file diff --git a/annotations_1/pWfB7jrCgxk_filtered.json b/annotations_1/pWfB7jrCgxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97890979693ff59be2324382df70fc83d7e489a8 --- /dev/null +++ b/annotations_1/pWfB7jrCgxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.25], [12.0, 13.26], [26.0, 26.72], [29.0, 31.16], [31.0, 32.14], [33.0, 35.14], [35.0, 36.46], [40.0, 40.36], [51.0, 53.03], [54.0, 58.5], [66.0, 65.77], [79.0, 79.25], [84.0, 84.2], [85.0, 85.56], [86.0, 87.86], [95.0, 96.74], [99.0, 100.14], [104.0, 104.06], [106.0, 106.61], [113.0, 112.87], [116.0, 119.1], [120.0, 124.5], [126.0, 127.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.54, 0.0, 0.0, 63.42, 0.0, 53.34, 0.0, 0.0, 48.27, 45.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 80.82, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 50.7], ["speech", 19.2], ["musical instrument", 4.28]], [["throbbing", 39.99], ["hum", 26.19], ["music", 19.32]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.25, 1.26, 0.72, 2.16, 1.14, 2.14, 1.46, 0.36, 2.03, 4.5, -0.23, 0.25, 0.2, 0.56, 1.86, 1.74, 1.14, 0.06, 0.61, -0.13, 3.1, 4.5, 1.41]} \ No newline at end of file diff --git a/annotations_1/pWt-GnERki0_filtered.json b/annotations_1/pWt-GnERki0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45ab38a33a014b0e94484c45e66b9b5fb908e38b --- /dev/null +++ b/annotations_1/pWt-GnERki0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [7.0, 8.16], [12.0, 12.21], [13.0, 13.44], [16.0, 16.98], [22.0, 22.77], [31.0, 31.68], [61.0, 61.01]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.74, 1.16, 0.21, 0.44, 0.98, 0.77, 0.68, 0.01]} \ No newline at end of file diff --git a/annotations_1/pXGsio9H1xs_filtered.json b/annotations_1/pXGsio9H1xs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d05fe9f07e36ecba51d8ff2421131e479b33b43 --- /dev/null +++ b/annotations_1/pXGsio9H1xs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.56], [5.0, 8.02], [10.0, 10.61], [14.0, 20.44], [22.0, 23.6], [25.0, 27.94], [29.0, 29.98], [31.0, 33.15], [35.0, 43.11], [44.0, 48.42], [51.0, 60.05], [61.0, 62.77], [65.0, 72.35], [73.0, 78.21], [79.0, 85.33], [86.0, 88.23], [90.0, 92.45], [93.0, 94.17], [95.0, 98.76], [100.0, 102.27], [110.0, 111.64], [117.0, 120.02], [120.0, 121.74], [122.0, 122.94], [127.0, 133.02], [134.0, 135.73], [136.0, 137.44], [138.0, 139.94], [141.0, 145.81], [146.0, 152.63], [157.0, 157.38], [162.0, 163.16], [164.0, 164.62], [167.0, 168.35], [177.0, 184.74], [186.0, 192.25], [193.0, 197.13], [197.0, 203.93], [207.0, 207.22]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.43, 0.0, 48.95, 0.0, 99.91, 0.0, 99.98, 90.78, 99.85, 99.93, 0.0, 81.35, 99.62, 95.09, 98.27, 98.8, 0.0, 99.1, 96.04, 0.0, 99.96, 0.0, 0.0, 70.16, 0.0, 0.0, 0.0, 87.37, 96.89, 0.0, 0.0, 0.0, 0.0, 99.94, 67.25, 89.9, 51.71, 0.0], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 59.88], ["cat", 3.87], ["noise", 3.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.56, 3.02, 0.61, 6.44, 1.6, 2.94, 0.98, 2.15, 8.11, 4.42, 9.05, 1.77, 7.35, 5.21, 6.33, 2.23, 2.45, 1.17, 3.76, 2.27, 1.64, 3.02, 1.74, 0.94, 6.02, 1.73, 1.44, 1.94, 4.81, 6.63, 0.38, 1.16, 0.62, 1.35, 7.74, 6.25, 4.13, 6.93, 0.22]} \ No newline at end of file diff --git a/annotations_1/pXrMAjB8ka0_filtered.json b/annotations_1/pXrMAjB8ka0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..36e2ed567f6469a2ce9a0f66965f9517368b63ab --- /dev/null +++ b/annotations_1/pXrMAjB8ka0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.25], [12.0, 13.09], [14.0, 13.95], [26.0, 27.53], [30.0, 30.45], [32.0, 32.14], [33.0, 34.55], [37.0, 41.37], [43.0, 45.13], [46.0, 47.39], [49.0, 49.08], [50.0, 50.26], [53.0, 52.71], [55.0, 56.89], [57.0, 58.4], [59.0, 80.62], [83.0, 83.83], [87.0, 91.25], [94.0, 94.19], [95.0, 95.69], [96.0, 97.31], [100.0, 100.62], [102.0, 103.54], [105.0, 105.73], [107.0, 107.6], [109.0, 109.07], [110.0, 110.93], [112.0, 112.7], [113.0, 120.09], [121.0, 121.96], [123.0, 125.54], [127.0, 127.82], [129.0, 129.47], [130.0, 140.63], [142.0, 145.77], [148.0, 148.0], [149.0, 149.05], [150.0, 150.82], [152.0, 152.61], [153.0, 153.77], [154.0, 154.43], [155.0, 156.05], [157.0, 157.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [32.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.15, 36.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.23, 0.0, 32.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.25, 0.0, 30.92, 0.0, 0.0, 32.02, 30.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 45.36], ["mains hum", 40.15], ["throbbing", 7.12]], null, null, null, null, null, null, [["mains hum", 34.72], ["hum", 34.46], ["buzz", 12.45]], [["mains hum", 40.67], ["hum", 31.23], ["music", 9.08]], null, null, null, null, null, null, [["hum", 54.12], ["mains hum", 27.75], ["music", 9.73]], null, [["hum", 48.86], ["mains hum", 35.52], ["throbbing", 3.94]], null, null, null, null, null, null, null, null, null, null, [["hum", 36.37], ["throbbing", 15.49], ["mains hum", 6.84]], null, [["livestock, farm animals, working animals", 20.84], ["cattle, bovinae", 17.69], ["moo", 16.55]], null, null, [["hum", 28.28], ["buzz", 10.6], ["cattle, bovinae", 8.75]], [["whale vocalization", 36.52], ["livestock, farm animals, working animals", 20.02], ["cattle, bovinae", 7.19]], null, null, null, null, null, null, null, null], "duration": [2.25, 1.09, -0.05, 1.53, 0.45, 0.14, 1.55, 4.37, 2.13, 1.39, 0.08, 0.26, -0.29, 1.89, 1.4, 21.62, 0.83, 4.25, 0.19, 0.69, 1.31, 0.62, 1.54, 0.73, 0.6, 0.07, 0.93, 0.7, 7.09, 0.96, 2.54, 0.82, 0.47, 10.63, 3.77, 0.0, 0.05, 0.82, 0.61, 0.77, 0.43, 1.05, 0.33]} \ No newline at end of file diff --git a/annotations_1/pYaJ7p8RrzM_filtered.json b/annotations_1/pYaJ7p8RrzM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bad8770626021647a503137a7b3522b9a3eafed --- /dev/null +++ b/annotations_1/pYaJ7p8RrzM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 25.41], [26.0, 26.91], [30.0, 43.88], [45.0, 46.08], [47.0, 47.98], [54.0, 54.77], [56.0, 57.43], [58.0, 60.29], [64.0, 65.16], [66.0, 67.96], [70.0, 70.21], [81.0, 82.0]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [33.97, 0.0, 36.9, 0.0, 0.0, 0.0, 0.0, 50.31, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 52.73], ["music", 6.08], ["mains hum", 4.14]], null, [["hum", 24.79], ["music", 14.05], ["throbbing", 9.36]], null, null, null, null, null, null, null, null, null], "duration": [4.41, 0.91, 13.88, 1.08, 0.98, 0.77, 1.43, 2.29, 1.16, 1.96, 0.21, 1.0]} \ No newline at end of file diff --git a/annotations_1/pYmo3PXF_T4_filtered.json b/annotations_1/pYmo3PXF_T4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b44d778dd7e5d8123adfc4321c5400a0db7af46 --- /dev/null +++ b/annotations_1/pYmo3PXF_T4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 32.21], [34.0, 34.69], [35.0, 37.47], [40.0, 40.27], [43.0, 50.79], [53.0, 55.88], [58.0, 62.21], [63.0, 80.77], [84.0, 87.35], [89.0, 96.75], [98.0, 101.26], [102.0, 106.78], [108.0, 109.41], [110.0, 138.96], [140.0, 145.47], [147.0, 147.61], [149.0, 149.23]], "keep_status": [false, false, true, false, false, false, false, false, true, true, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 40.43, 0.0, 28.87, 73.67, 31.13, 29.22, 32.42, 33.99, 35.13, 43.66, 0.0, 37.8, 49.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["beatboxing", 33.07], ["throbbing", 9.93], ["music", 8.86]], null, [["fly, housefly", 42.65], ["insect", 41.32], ["mosquito", 9.54]], null, [["speech", 79.84], ["music", 6.14], ["whack, thwack", 1.31]], [["speech", 35.4], ["music", 29.76], ["cattle, bovinae", 8.29]], [["music", 46.61], ["speech", 10.56], ["echo", 5.06]], [["speech", 38.54], ["chirp tone", 6.45], ["sine wave", 5.88]], [["speech", 70.78], ["sidetone", 4.87], ["groan", 2.76]], [["speech", 25.29], ["burping, eructation", 15.85], ["cough", 13.96]], null, [["speech", 42.48], ["frog", 11.8], ["croak", 4.86]], [["music", 21.34], ["singing bowl", 20.47], ["animal", 4.88]], null, null], "duration": [0.21, 0.69, 2.47, 0.27, 7.79, 2.88, 4.21, 17.77, 3.35, 7.75, 3.26, 4.78, 1.41, 28.96, 5.47, 0.61, 0.23]} \ No newline at end of file diff --git a/annotations_1/pZRDwBXv7T0_filtered.json b/annotations_1/pZRDwBXv7T0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f04692566660a4b0ebc16883d0df86b291c3de2 --- /dev/null +++ b/annotations_1/pZRDwBXv7T0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[162.0, 164.54], [168.0, 168.12], [170.0, 173.87]], "keep_status": [false, false, false], "silence_prob": [35.38, 0.0, 32.29], "audiomae_on_audioset": [[["music", 75.71], ["throbbing", 9.36], ["electronic music", 3.31]], null, [["throbbing", 63.53], ["music", 12.93], ["hum", 10.19]]], "duration": [2.54, 0.12, 3.87]} \ No newline at end of file diff --git a/annotations_1/p_jspptikh8_filtered.json b/annotations_1/p_jspptikh8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..936ab9038983272754b34a10c89bc3eb1850a670 --- /dev/null +++ b/annotations_1/p_jspptikh8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.45], [6.0, 7.05], [9.0, 11.43], [14.0, 14.88], [20.0, 21.44], [24.0, 24.16], [25.0, 25.93], [26.0, 27.33], [29.0, 29.2], [30.0, 30.25], [37.0, 37.72], [41.0, 42.04], [46.0, 45.89], [49.0, 50.33], [51.0, 51.16], [54.0, 54.16], [55.0, 57.92], [58.0, 59.41], [61.0, 61.47], [64.0, 77.41], [80.0, 81.7], [83.0, 84.0], [85.0, 86.1], [89.0, 88.72], [91.0, 91.47], [93.0, 93.77], [95.0, 95.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.73, 0.0, 0.0, 33.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["insect", 24.2], ["fly, housefly", 18.0], ["telephone dialing, dtmf", 10.74]], null, null, null, null, null, null, null], "duration": [0.45, 1.05, 2.43, 0.88, 1.44, 0.16, 0.93, 1.33, 0.2, 0.25, 0.72, 1.04, -0.11, 1.33, 0.16, 0.16, 2.92, 1.41, 0.47, 13.41, 1.7, 1.0, 1.1, -0.28, 0.47, 0.77, 0.37]} \ No newline at end of file diff --git a/annotations_1/p_wCMFyHeUE_filtered.json b/annotations_1/p_wCMFyHeUE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60cb5be6d3c077d53409bb18ddbe77fc78b55c71 --- /dev/null +++ b/annotations_1/p_wCMFyHeUE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 19.75], [21.0, 23.68], [25.0, 27.65], [29.0, 44.04], [46.0, 98.46], [99.0, 99.94]], "keep_status": [false, true, true, false, false, false], "silence_prob": [50.56, 45.62, 46.4, 30.83, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 36.2], ["hum", 10.69], ["throbbing", 10.34]], [["music", 25.79], ["hum", 17.72], ["throbbing", 11.24]], [["speech", 27.83], ["buzz", 25.42], ["mains hum", 17.99]], null, null], "duration": [3.75, 2.68, 2.65, 15.04, 52.46, 0.94]} \ No newline at end of file diff --git a/annotations_1/paPWv3HjXAI_filtered.json b/annotations_1/paPWv3HjXAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6540765abafdcb80d7b36fda498d50a50f170216 --- /dev/null +++ b/annotations_1/paPWv3HjXAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 22.44], [25.0, 58.09]], "keep_status": [false, false], "silence_prob": [42.13, 0.0], "audiomae_on_audioset": [[["music", 61.85], ["ambient music", 19.43], ["synthesizer", 6.21]], null], "duration": [12.44, 33.09]} \ No newline at end of file diff --git a/annotations_1/padXZANlFwE_filtered.json b/annotations_1/padXZANlFwE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e5ba05e3cb7d4b29f9d37f027d570f9e79cca0b --- /dev/null +++ b/annotations_1/padXZANlFwE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.84], [8.0, 9.37], [11.0, 12.31], [13.0, 17.44], [20.0, 21.02], [24.0, 24.11], [26.0, 27.92], [29.0, 30.35], [34.0, 34.59], [37.0, 49.99], [52.0, 75.79], [77.0, 85.65], [88.0, 127.43]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [68.02, 0.0, 0.0, 50.86, 0.0, 0.0, 0.0, 0.0, 0.0, 28.52, 30.1, 65.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 36.17], ["animal", 18.93], ["wild animals", 9.95]], [["music", 73.02], ["throbbing", 4.32], ["hum", 3.31]], null, null], "duration": [2.84, 1.37, 1.31, 4.44, 1.02, 0.11, 1.92, 1.35, 0.59, 12.99, 23.79, 8.65, 39.43]} \ No newline at end of file diff --git a/annotations_1/pb8pWn_yyF4_filtered.json b/annotations_1/pb8pWn_yyF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a19ab59ccaa9394cda773a04fa30e5954a42695b --- /dev/null +++ b/annotations_1/pb8pWn_yyF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 64.1], [64.0, 66.87], [68.0, 77.08], [82.0, 82.73], [83.0, 84.62], [85.0, 87.56], [88.0, 99.3], [100.0, 102.42], [104.0, 104.46], [105.0, 104.57], [105.0, 105.48], [106.0, 108.33], [108.0, 108.48], [108.0, 117.68], [118.0, 117.76], [120.0, 119.75], [120.0, 121.41], [122.0, 122.23], [125.0, 132.7], [146.0, 147.83]], "keep_status": [true, false, false, false, false, true, true, false, false, false, false, true, false, true, false, false, false, false, true, false], "silence_prob": [39.22, 39.91, 41.12, 0.0, 0.0, 40.62, 42.13, 33.89, 0.0, 0.0, 0.0, 32.77, 0.0, 33.26, 0.0, 0.0, 0.0, 0.0, 31.55, 0.0], "audiomae_on_audioset": [[["music", 47.54], ["pizzicato", 5.28], ["musical instrument", 4.55]], [["music", 55.98], ["musical instrument", 14.94], ["guitar", 9.85]], [["music", 64.3], ["guitar", 8.27], ["musical instrument", 7.9]], null, null, [["music", 56.84], ["musical instrument", 5.63], ["didgeridoo", 4.98]], [["music", 42.4], ["guitar", 8.24], ["musical instrument", 7.78]], [["music", 68.13], ["guitar", 5.71], ["musical instrument", 3.37]], null, null, null, [["speech", 44.08], ["music", 14.47], ["fart", 8.63]], null, [["speech", 46.49], ["fart", 18.86], ["fly, housefly", 4.03]], null, null, null, null, [["speech", 61.33], ["explosion", 4.72], ["burst, pop", 2.17]], null], "duration": [25.1, 2.87, 9.08, 0.73, 1.62, 2.56, 11.3, 2.42, 0.46, -0.43, 0.48, 2.33, 0.48, 9.68, -0.24, -0.25, 1.41, 0.23, 7.7, 1.83]} \ No newline at end of file diff --git a/annotations_1/pbv02n_zKvo_filtered.json b/annotations_1/pbv02n_zKvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f300f8c83b413c4f2787c3fab32d8e4737020cb --- /dev/null +++ b/annotations_1/pbv02n_zKvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.37], [9.0, 9.81], [20.0, 20.78], [26.0, 26.5], [30.0, 31.09], [32.0, 32.26], [34.0, 44.83], [48.0, 48.03], [54.0, 54.53], [55.0, 59.27], [62.0, 65.87], [83.0, 83.62], [96.0, 95.94], [97.0, 97.61], [100.0, 101.21], [101.0, 102.15], [106.0, 106.66], [116.0, 116.33], [124.0, 125.71], [127.0, 127.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 97.83, 67.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.37, 0.81, 0.78, 0.5, 1.09, 0.26, 10.83, 0.03, 0.53, 4.27, 3.87, 0.62, -0.06, 0.61, 1.21, 1.15, 0.66, 0.33, 1.71, 0.95]} \ No newline at end of file diff --git a/annotations_1/pdmo-_KXg0Y_filtered.json b/annotations_1/pdmo-_KXg0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b460e0b67003588e052d3d6834a6c9754a88c1c3 --- /dev/null +++ b/annotations_1/pdmo-_KXg0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 39.48], [41.0, 42.45], [52.0, 52.39], [63.0, 63.73], [64.0, 66.26], [68.0, 74.46], [75.0, 77.97], [85.0, 85.13], [87.0, 87.59], [104.0, 106.51], [111.0, 112.8], [117.0, 126.0], [132.0, 131.8]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.78, 70.72, 35.44, 0.0, 0.0, 30.24, 0.0, 29.76, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 26.83], ["speech", 22.54], ["mains hum", 10.62]], null, [["music", 29.53], ["speech", 24.45], ["musical instrument", 2.91]], null, null, [["speech", 46.64], ["music", 26.06], ["grunt", 5.63]], null, [["speech", 68.75], ["outside, rural or natural", 4.45], ["music", 4.08]], null], "duration": [1.48, 1.45, 0.39, 0.73, 2.26, 6.46, 2.97, 0.13, 0.59, 2.51, 1.8, 9.0, -0.2]} \ No newline at end of file diff --git a/annotations_1/pdwGNiv2q4U_filtered.json b/annotations_1/pdwGNiv2q4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7cc6608983bcf3e10e70106d438e84c873b74ae4 --- /dev/null +++ b/annotations_1/pdwGNiv2q4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.76], [23.0, 23.58], [27.0, 27.36], [29.0, 29.78], [31.0, 31.13], [32.0, 33.89], [36.0, 36.8], [38.0, 38.48], [40.0, 46.4], [47.0, 48.19], [51.0, 53.69], [55.0, 58.21], [58.0, 60.1], [60.0, 61.69], [63.0, 63.78], [71.0, 71.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 90.43, 90.6, 71.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.76, 0.58, 0.36, 0.78, 0.13, 1.89, 0.8, 0.48, 6.4, 1.19, 2.69, 3.21, 2.1, 1.69, 0.78, 0.15]} \ No newline at end of file diff --git a/annotations_1/pf0erXl4pwQ_filtered.json b/annotations_1/pf0erXl4pwQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..80e706b49008f659dfa19bf39f568f825e03fdf4 --- /dev/null +++ b/annotations_1/pf0erXl4pwQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.27], [7.0, 8.97], [10.0, 11.21], [15.0, 16.17], [26.0, 26.79], [39.0, 39.19], [41.0, 42.48], [44.0, 45.06], [59.0, 59.21], [72.0, 73.25], [77.0, 77.84], [78.0, 86.61], [88.0, 88.25], [90.0, 92.87], [94.0, 94.85], [99.0, 99.18], [100.0, 101.82], [107.0, 108.18], [112.0, 111.89], [113.0, 116.41], [117.0, 119.52], [123.0, 122.82], [131.0, 133.83], [135.0, 138.97], [139.0, 140.12], [144.0, 144.29], [147.0, 148.8], [153.0, 153.12], [155.0, 156.42], [164.0, 165.2], [172.0, 177.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.4, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 51.6, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 62.15], ["thunk", 21.92], ["thump, thud", 1.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.27, 1.97, 1.21, 1.17, 0.79, 0.19, 1.48, 1.06, 0.21, 1.25, 0.84, 8.61, 0.25, 2.87, 0.85, 0.18, 1.82, 1.18, -0.11, 3.41, 2.52, -0.18, 2.83, 3.97, 1.12, 0.29, 1.8, 0.12, 1.42, 1.2, 5.33]} \ No newline at end of file diff --git a/annotations_1/pfOJfhbqJhY_filtered.json b/annotations_1/pfOJfhbqJhY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d44e348145e9c9a6fb3f1bdccb54d1a43e82322d --- /dev/null +++ b/annotations_1/pfOJfhbqJhY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.18], [27.0, 29.29], [31.0, 32.17], [35.0, 39.63], [40.0, 45.76], [46.0, 53.94], [55.0, 61.6], [62.0, 62.43], [65.0, 71.71], [84.0, 85.04], [85.0, 85.67], [91.0, 92.97]], "keep_status": [false, true, false, true, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 34.06, 0.0, 39.58, 34.09, 34.67, 31.07, 0.0, 31.75, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["whale vocalization", 45.64], ["fart", 11.74], ["creak", 4.72]], null, [["speech", 29.42], ["honk", 11.5], ["hum", 8.88]], [["speech", 53.24], ["animal", 11.61], ["horse", 4.1]], [["horse", 27.51], ["speech", 24.46], ["clip-clop", 12.76]], [["music", 58.54], ["brass instrument", 7.42], ["trombone", 6.17]], null, [["cattle, bovinae", 43.54], ["livestock, farm animals, working animals", 21.69], ["moo", 19.87]], null, null, null], "duration": [0.18, 2.29, 1.17, 4.63, 5.76, 7.94, 6.6, 0.43, 6.71, 1.04, 0.67, 1.97]} \ No newline at end of file diff --git a/annotations_1/phGwatUEyzc_filtered.json b/annotations_1/phGwatUEyzc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5258e7c8fcbfbf4e84bf8ab01b2e7c0bd3dcaeb --- /dev/null +++ b/annotations_1/phGwatUEyzc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [4.0, 4.83], [17.0, 17.22], [19.0, 19.03], [26.0, 27.09], [34.0, 34.26], [37.0, 39.72], [40.0, 40.2], [79.0, 80.52], [84.0, 86.46], [90.0, 90.0], [90.0, 90.53], [94.0, 94.36], [95.0, 96.16], [102.0, 101.8], [103.0, 103.82], [105.0, 106.39], [110.0, 113.48], [115.0, 126.33], [128.0, 129.68], [133.0, 137.24], [138.0, 145.44], [146.0, 146.87], [164.0, 166.08], [168.0, 169.37]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.4, 0.0, 0.0, 36.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.98, 29.39, 0.0, 29.37, 28.92, 0.0, 47.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 27.23], ["speech", 17.38], ["musical instrument", 4.03]], null, null, [["music", 46.17], ["saxophone", 8.12], ["musical instrument", 6.79]], null, null, null, null, null, null, null, [["music", 64.74], ["electronic tuner", 3.41], ["boing", 3.35]], [["music", 71.32], ["carnatic music", 7.22], ["musical instrument", 2.67]], null, [["music", 57.03], ["boing", 5.79], ["harmonic", 3.09]], [["music", 83.14], ["carnatic music", 4.2], ["singing", 1.61]], null, [["foghorn", 19.79], ["music", 14.7], ["speech", 12.61]], null], "duration": [1.1, 0.83, 0.22, 0.03, 1.09, 0.26, 2.72, 0.2, 1.52, 2.46, 0.0, 0.53, 0.36, 1.16, -0.2, 0.82, 1.39, 3.48, 11.33, 1.68, 4.24, 7.44, 0.87, 2.08, 1.37]} \ No newline at end of file diff --git a/annotations_1/piTAjb8dd2Y_filtered.json b/annotations_1/piTAjb8dd2Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d5d8186ad74a9a93394de50f9e6f534b6cbff11 --- /dev/null +++ b/annotations_1/piTAjb8dd2Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.35], [4.0, 4.06], [11.0, 11.01], [20.0, 23.7], [28.0, 39.5], [44.0, 46.97], [48.0, 58.68], [61.0, 61.59], [64.0, 102.12], [107.0, 106.95], [107.0, 107.05], [107.0, 125.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.85, 55.04, 76.37, 56.03, 0.0, 0.0, 0.0, 0.0, 39.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 43.09], ["speech", 27.85], ["musical instrument", 2.67]]], "duration": [0.35, 0.06, 0.01, 3.7, 11.5, 2.97, 10.68, 0.59, 38.12, -0.05, 0.05, 18.47]} \ No newline at end of file diff --git a/annotations_1/pikAt8prREE_filtered.json b/annotations_1/pikAt8prREE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c5ae227f8cae20f2083a563e0b3c4825576e58f --- /dev/null +++ b/annotations_1/pikAt8prREE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[57.0, 58.43], [61.0, 62.5], [72.0, 73.2], [74.0, 73.7], [74.0, 74.33], [75.0, 75.76], [77.0, 78.78], [84.0, 88.48], [97.0, 97.53], [114.0, 114.86], [133.0, 133.29], [141.0, 143.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 0.0, 29.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["moo", 19.25], ["livestock, farm animals, working animals", 18.65], ["cattle, bovinae", 18.09]]], "duration": [1.43, 1.5, 1.2, -0.3, 0.33, 0.76, 1.78, 4.48, 0.53, 0.86, 0.29, 2.33]} \ No newline at end of file diff --git a/annotations_1/pizMaFdtY-s_filtered.json b/annotations_1/pizMaFdtY-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..be4c995b7b60445743893dd577fcb6851455939c --- /dev/null +++ b/annotations_1/pizMaFdtY-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.55], [9.0, 9.26], [13.0, 13.83], [15.0, 15.5], [17.0, 18.06], [20.0, 19.6], [20.0, 20.95], [23.0, 23.73], [25.0, 25.49], [29.0, 29.47], [31.0, 31.65], [32.0, 33.32], [34.0, 36.56], [38.0, 40.39], [45.0, 45.47], [46.0, 47.49], [49.0, 51.02], [53.0, 53.11], [54.0, 55.41], [56.0, 57.15], [58.0, 59.86], [61.0, 65.67], [67.0, 67.73], [70.0, 72.54], [74.0, 81.14], [83.0, 89.65], [92.0, 93.68], [100.0, 101.29], [102.0, 102.95], [103.0, 103.45], [103.0, 103.72], [107.0, 109.58], [110.0, 112.13], [118.0, 118.64], [124.0, 126.12], [129.0, 129.68], [131.0, 130.96], [136.0, 136.43], [137.0, 137.93], [141.0, 176.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.13, 31.13, 0.0, 0.0, 32.62, 0.0, 0.0, 0.0, 0.0, 32.84, 0.0, 32.58, 32.49, 32.06, 0.0, 0.0, 0.0, 0.0, 0.0, 45.43, 49.82, 0.0, 35.93, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 61.18], ["hum", 7.33], ["throbbing", 5.64]], [["music", 68.11], ["electronic music", 4.22], ["guitar", 3.32]], null, null, [["music", 69.88], ["musical instrument", 4.99], ["electronic music", 3.9]], null, null, null, null, [["music", 34.01], ["throbbing", 17.79], ["hum", 6.88]], null, [["music", 68.52], ["electronic music", 9.29], ["hum", 2.36]], [["music", 37.35], ["hum", 24.71], ["throbbing", 15.65]], [["hum", 38.38], ["mains hum", 37.02], ["throbbing", 10.11]], null, null, null, null, null, [["music", 56.36], ["whale vocalization", 3.78], ["hum", 2.99]], [["music", 31.17], ["ambient music", 10.49], ["hum", 10.2]], null, [["music", 48.8], ["electronic music", 12.76], ["whale vocalization", 8.71]], null, null, null, null, null], "duration": [0.55, 0.26, 0.83, 0.5, 1.06, -0.4, 0.95, 0.73, 0.49, 0.47, 0.65, 1.32, 2.56, 2.39, 0.47, 1.49, 2.02, 0.11, 1.41, 1.15, 1.86, 4.67, 0.73, 2.54, 7.14, 6.65, 1.68, 1.29, 0.95, 0.45, 0.72, 2.58, 2.13, 0.64, 2.12, 0.68, -0.04, 0.43, 0.93, 35.59]} \ No newline at end of file diff --git a/annotations_1/pjF6bofXAvQ_filtered.json b/annotations_1/pjF6bofXAvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7980a3d6a95d5fcc7dfd6b9134e37bf1fa66321 --- /dev/null +++ b/annotations_1/pjF6bofXAvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.16], [0.0, 3.06], [10.0, 11.55], [22.0, 23.11], [24.0, 26.55], [30.0, 31.5], [34.0, 33.86], [46.0, 46.65], [49.0, 51.07], [55.0, 57.3], [59.0, 59.63], [67.0, 68.55], [70.0, 73.74], [79.0, 78.78], [83.0, 84.27], [98.0, 98.46], [101.0, 103.22], [106.0, 107.47], [109.0, 111.74], [112.0, 113.61], [127.0, 127.77], [130.0, 130.0], [131.0, 136.16], [137.0, 138.35], [144.0, 145.0], [149.0, 149.52], [152.0, 152.61], [155.0, 155.44], [158.0, 158.8], [161.0, 161.4], [163.0, 163.39], [164.0, 164.44]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 57.89, 0.0, 0.0, 99.9, 0.0, 0.0, 0.0, 48.91, 37.84, 0.0, 0.0, 40.61, 0.0, 0.0, 0.0, 42.08, 0.0, 54.7, 0.0, 0.0, 0.0, 42.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 37.6], ["creak", 8.57], ["musical instrument", 3.78]], [["music", 40.7], ["breaking", 10.98], ["screaming", 9.05]], null, null, [["speech", 67.68], ["music", 7.79], ["breaking", 2.53]], null, null, null, [["music", 10.84], ["livestock, farm animals, working animals", 9.59], ["sheep", 8.17]], null, null, null, null, null, [["music", 43.43], ["screaming", 9.26], ["speech", 8.74]], null, null, null, null, null, null, null, null, null], "duration": [0.16, 3.06, 1.55, 1.11, 2.55, 1.5, -0.14, 0.65, 2.07, 2.3, 0.63, 1.55, 3.74, -0.22, 1.27, 0.46, 2.22, 1.47, 2.74, 1.61, 0.77, 0.0, 5.16, 1.35, 1.0, 0.52, 0.61, 0.44, 0.8, 0.4, 0.39, 0.44]} \ No newline at end of file diff --git a/annotations_1/pkogDQ3CK9E_filtered.json b/annotations_1/pkogDQ3CK9E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4702f308054e484980d805afdb9c09492cd45a3 --- /dev/null +++ b/annotations_1/pkogDQ3CK9E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.62], [18.0, 18.91], [41.0, 42.62], [46.0, 47.7], [56.0, 59.14], [75.0, 75.39], [86.0, 89.9], [105.0, 108.45], [113.0, 113.43], [123.0, 124.12], [140.0, 142.1], [146.0, 151.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 29.81, 0.0, 31.75, 31.57, 0.0, 0.0, 31.11, 30.36], "audiomae_on_audioset": [null, null, null, null, [["music", 44.82], ["grunt", 28.06], ["synthesizer", 5.65]], null, [["music", 62.07], ["grunt", 5.63], ["sound effect", 3.88]], [["music", 40.34], ["throbbing", 20.88], ["hum", 18.53]], null, null, [["hum", 19.79], ["rumble", 13.2], ["music", 11.5]], [["music", 71.5], ["animal", 3.54], ["speech", 1.61]]], "duration": [1.62, 0.91, 1.62, 1.7, 3.14, 0.39, 3.9, 3.45, 0.43, 1.12, 2.1, 5.98]} \ No newline at end of file diff --git a/annotations_1/pkqyDC9YnfM_filtered.json b/annotations_1/pkqyDC9YnfM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5cb43da0568cdf2928c5eef29c41e11dabfdcac1 --- /dev/null +++ b/annotations_1/pkqyDC9YnfM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[59.0, 58.89], [60.0, 71.42], [73.0, 74.11], [75.0, 79.54], [82.0, 85.23], [87.0, 88.32], [92.0, 114.35], [115.0, 122.28], [124.0, 137.27], [137.0, 137.3], [139.0, 142.82], [146.0, 146.45], [151.0, 152.31], [153.0, 153.84], [155.0, 175.39]], "keep_status": [false, true, false, false, true, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 35.3, 0.0, 35.2, 36.7, 0.0, 32.25, 33.23, 38.0, 0.0, 71.0, 0.0, 0.0, 0.0, 32.24], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 16.93], ["electric shaver, electric razor", 16.91], ["music", 11.09]], null, [["music", 62.64], ["didgeridoo", 10.0], ["musical instrument", 5.4]], [["music", 47.22], ["speech", 15.67], ["didgeridoo", 5.81]], null, [["speech", 67.19], ["music", 20.64], ["basketball bounce", 1.56]], [["mains hum", 33.87], ["hum", 20.97], ["speech", 12.81]], [["speech", 62.42], ["explosion", 9.23], ["hum", 5.01]], null, null, null, null, null, [["music", 50.73], ["fly, housefly", 6.66], ["animal", 5.72]]], "duration": [-0.11, 11.42, 1.11, 4.54, 3.23, 1.32, 22.35, 7.28, 13.27, 0.3, 3.82, 0.45, 1.31, 0.84, 20.39]} \ No newline at end of file diff --git a/annotations_1/pkwGEagSVT0_filtered.json b/annotations_1/pkwGEagSVT0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8cdf91906ae498a58ec0714d0c36881374908663 --- /dev/null +++ b/annotations_1/pkwGEagSVT0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 15.74], [18.0, 50.8], [52.0, 52.69], [68.0, 68.47], [92.0, 92.84], [97.0, 130.74]], "keep_status": [false, false, false, false, false, false], "silence_prob": [29.93, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 74.02], ["throbbing", 6.44], ["mantra", 4.13]], null, null, null, null, null], "duration": [12.74, 32.8, 0.69, 0.47, 0.84, 33.74]} \ No newline at end of file diff --git a/annotations_1/pl7JzW6eGZg_filtered.json b/annotations_1/pl7JzW6eGZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9612fa865ea34e116fa65a14f9cfb47d33998fbe --- /dev/null +++ b/annotations_1/pl7JzW6eGZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 36.48], [37.0, 37.79], [38.0, 39.61]], "keep_status": [false, false, false], "silence_prob": [52.22, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [5.48, 0.79, 1.61]} \ No newline at end of file diff --git a/annotations_1/plu5YA3t2l8_filtered.json b/annotations_1/plu5YA3t2l8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cb6526bcbb08c47cd8543880c481e48acd092ec --- /dev/null +++ b/annotations_1/plu5YA3t2l8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 26.33], [27.0, 69.62]], "keep_status": [false, false], "silence_prob": [32.91, 0.0], "audiomae_on_audioset": [[["music", 54.68], ["singing bowl", 10.04], ["ambient music", 6.32]], null], "duration": [19.33, 42.62]} \ No newline at end of file diff --git a/annotations_1/pmAZlEkONa0_filtered.json b/annotations_1/pmAZlEkONa0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..347fcb800e5696bb7cbd9b7c3aaa04c557362439 --- /dev/null +++ b/annotations_1/pmAZlEkONa0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 38.16], [38.0, 40.32], [44.0, 45.84], [46.0, 47.48], [52.0, 52.98], [56.0, 57.11], [58.0, 73.45], [75.0, 78.66], [79.0, 78.98], [79.0, 85.53], [86.0, 87.4], [89.0, 93.72], [94.0, 95.44], [97.0, 98.76], [100.0, 100.09], [101.0, 103.82], [105.0, 128.75], [134.0, 134.67], [136.0, 136.95], [138.0, 150.55]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 40.79, 0.0, 0.0, 0.0, 0.0, 31.02, 30.56, 0.0, 31.39, 0.0, 36.52, 0.0, 0.0, 0.0, 36.49, 30.18, 0.0, 0.0, 29.49], "audiomae_on_audioset": [null, [["music", 26.38], ["didgeridoo", 11.54], ["mains hum", 11.01]], null, null, null, null, [["music", 62.34], ["hum", 7.49], ["throbbing", 7.35]], [["music", 34.07], ["speech", 20.85], ["fart", 18.37]], null, [["music", 51.76], ["throbbing", 6.84], ["breaking", 4.87]], null, [["music", 27.78], ["hum", 12.13], ["noise", 10.84]], null, null, null, [["music", 30.26], ["didgeridoo", 19.17], ["mains hum", 12.86]], [["music", 19.51], ["hum", 15.51], ["speech", 11.73]], null, null, [["speech", 17.36], ["music", 16.74], ["hum", 11.45]]], "duration": [30.16, 2.32, 1.84, 1.48, 0.98, 1.11, 15.45, 3.66, -0.02, 6.53, 1.4, 4.72, 1.44, 1.76, 0.09, 2.82, 23.75, 0.67, 0.95, 12.55]} \ No newline at end of file diff --git a/annotations_1/pmqBmTWq420_filtered.json b/annotations_1/pmqBmTWq420_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2183d317a013d49d8e2c9a5089fc90327a652fc1 --- /dev/null +++ b/annotations_1/pmqBmTWq420_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.8], [16.0, 16.41], [21.0, 22.23], [29.0, 31.6], [38.0, 38.21], [38.0, 38.26], [38.0, 39.56], [42.0, 52.96], [56.0, 58.26], [67.0, 71.19], [78.0, 87.83], [90.0, 91.47], [95.0, 95.99], [99.0, 101.92], [110.0, 110.03], [121.0, 123.33], [128.0, 129.52], [132.0, 136.71], [145.0, 145.94], [149.0, 150.97], [153.0, 153.5]], "keep_status": [false, false, false, false, false, false, false, true, true, true, true, false, false, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 29.22, 0.0, 0.0, 0.0, 28.62, 28.52, 28.6, 28.71, 0.0, 0.0, 28.89, 0.0, 44.34, 0.0, 30.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["livestock, farm animals, working animals", 58.89], ["cattle, bovinae", 20.69], ["moo", 10.59]], null, null, null, [["speech", 26.95], ["music", 15.14], ["explosion", 11.22]], [["speech", 16.25], ["mains hum", 14.88], ["fly, housefly", 9.04]], [["speech", 20.25], ["insect", 16.29], ["fly, housefly", 11.17]], [["music", 61.46], ["buzz", 5.64], ["didgeridoo", 2.71]], null, null, [["music", 48.18], ["groan", 4.44], ["didgeridoo", 4.34]], null, [["music", 49.31], ["speech", 9.68], ["sine wave", 8.15]], null, [["speech", 51.54], ["music", 8.85], ["electric shaver, electric razor", 6.42]], null, null, null], "duration": [0.8, 0.41, 1.23, 2.6, 0.21, 0.26, 1.56, 10.96, 2.26, 4.19, 9.83, 1.47, 0.99, 2.92, 0.03, 2.33, 1.52, 4.71, 0.94, 1.97, 0.5]} \ No newline at end of file diff --git a/annotations_1/po0Gj897Tmk_filtered.json b/annotations_1/po0Gj897Tmk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52d8aa7fec272913bbdb203e958892ae34d8d595 --- /dev/null +++ b/annotations_1/po0Gj897Tmk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.59], [7.0, 7.84], [11.0, 19.7], [20.0, 20.56], [29.0, 29.49], [34.0, 34.26], [52.0, 53.94], [55.0, 55.97], [56.0, 57.16], [65.0, 65.7], [68.0, 72.99], [80.0, 83.42], [87.0, 94.47], [99.0, 112.43], [113.0, 123.47], [124.0, 125.85], [128.0, 147.93], [152.0, 152.27]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 44.69, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.78, 36.23, 34.57, 30.78, 30.21, 0.0, 31.92, 0.0], "audiomae_on_audioset": [null, null, [["music", 12.55], ["telephone dialing, dtmf", 12.42], ["speech", 12.37]], null, null, null, null, null, null, null, [["music", 36.67], ["throbbing", 22.14], ["hum", 14.44]], [["throbbing", 21.21], ["speech", 17.28], ["hum", 14.81]], [["throbbing", 35.38], ["music", 26.39], ["hum", 16.38]], [["hum", 23.61], ["gong", 17.55], ["music", 17.32]], [["music", 36.05], ["gong", 26.52], ["ambient music", 9.68]], null, [["music", 48.59], ["noise", 8.73], ["hum", 7.04]], null], "duration": [0.59, 0.84, 8.7, 0.56, 0.49, 0.26, 1.94, 0.97, 1.16, 0.7, 4.99, 3.42, 7.47, 13.43, 10.47, 1.85, 19.93, 0.27]} \ No newline at end of file diff --git a/annotations_1/poTqVcSgFRE_filtered.json b/annotations_1/poTqVcSgFRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..09486fde35d0080283da62ff71ece04c9e2f064f --- /dev/null +++ b/annotations_1/poTqVcSgFRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [2.0, 2.94], [4.0, 4.95], [7.0, 7.69], [9.0, 10.96], [12.0, 13.32], [15.0, 15.55], [16.0, 17.9], [21.0, 22.42], [36.0, 37.59], [46.0, 47.39], [61.0, 61.42], [64.0, 65.58], [72.0, 73.13], [76.0, 78.04], [80.0, 80.4], [82.0, 83.73], [87.0, 87.25], [98.0, 98.34], [100.0, 100.3], [104.0, 104.6], [106.0, 106.2], [107.0, 107.91], [110.0, 110.47], [113.0, 112.67], [114.0, 122.18], [123.0, 123.92], [125.0, 125.96], [143.0, 144.44], [151.0, 151.09], [164.0, 165.35], [168.0, 168.03], [171.0, 170.85], [172.0, 173.11], [176.0, 177.45], [180.0, 181.11], [183.0, 183.59], [193.0, 194.43], [203.0, 204.53], [205.0, 205.46], [206.0, 206.15], [207.0, 208.47], [209.0, 210.81], [213.0, 213.36], [217.0, 217.43], [218.0, 220.13], [223.0, 224.16], [226.0, 226.61], [230.0, 230.1], [231.0, 232.5], [234.0, 235.84], [242.0, 243.68], [244.0, 245.37], [246.0, 249.18], [250.0, 251.18], [253.0, 254.2], [257.0, 259.78], [260.0, 261.22], [262.0, 264.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 99.31, 0.0, 97.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.04, 0.94, 0.95, 0.69, 1.96, 1.32, 0.55, 1.9, 1.42, 1.59, 1.39, 0.42, 1.58, 1.13, 2.04, 0.4, 1.73, 0.25, 0.34, 0.3, 0.6, 0.2, 0.91, 0.47, -0.33, 8.18, 0.92, 0.96, 1.44, 0.09, 1.35, 0.03, -0.15, 1.11, 1.45, 1.11, 0.59, 1.43, 1.53, 0.46, 0.15, 1.47, 1.81, 0.36, 0.43, 2.13, 1.16, 0.61, 0.1, 1.5, 1.84, 1.68, 1.37, 3.18, 1.18, 1.2, 2.78, 1.22, 2.79]} \ No newline at end of file diff --git a/annotations_1/poU8QxFJjbo_filtered.json b/annotations_1/poU8QxFJjbo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..375b908f5784cfe88aef591726f8c962555b9876 --- /dev/null +++ b/annotations_1/poU8QxFJjbo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 42.84], [44.0, 45.6], [46.0, 66.21], [68.0, 67.93], [69.0, 70.33], [72.0, 108.18], [109.0, 109.59], [112.0, 166.43], [167.0, 169.32], [170.0, 171.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 28.98, 0.0, 0.0, 0.0, 0.0, 0.0, 56.86, 0.0], "audiomae_on_audioset": [null, null, [["music", 81.4], ["hum", 2.51], ["electronic music", 1.78]], null, null, null, null, null, null, null], "duration": [40.84, 1.6, 20.21, -0.07, 1.33, 36.18, 0.59, 54.43, 2.32, 1.44]} \ No newline at end of file diff --git a/annotations_1/poswRRB_2i0_filtered.json b/annotations_1/poswRRB_2i0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0539aecb10e696cfeaa13dec41e32d7b119b592b --- /dev/null +++ b/annotations_1/poswRRB_2i0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.21], [11.0, 11.55], [16.0, 22.0], [23.0, 24.19], [27.0, 29.96], [38.0, 45.27], [48.0, 51.41], [52.0, 58.45], [59.0, 61.96], [65.0, 67.49], [76.0, 77.89], [78.0, 78.39], [81.0, 81.09], [81.0, 85.02], [86.0, 86.36], [88.0, 87.86], [93.0, 96.33], [99.0, 109.11], [111.0, 121.47], [123.0, 126.52], [129.0, 129.66], [131.0, 131.6], [134.0, 134.91], [136.0, 138.28], [142.0, 150.28], [159.0, 160.0], [165.0, 166.8], [168.0, 168.69], [170.0, 170.95], [173.0, 173.57], [179.0, 178.6], [179.0, 179.07], [180.0, 180.17], [181.0, 184.45], [185.0, 185.18], [186.0, 186.56], [193.0, 193.46], [195.0, 196.05], [197.0, 205.68], [209.0, 208.8], [213.0, 213.76], [231.0, 230.79], [231.0, 233.25], [238.0, 240.44], [242.0, 243.19], [244.0, 259.01], [259.0, 261.6], [264.0, 268.74], [271.0, 280.4]], "keep_status": [true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false], "silence_prob": [44.07, 0.0, 44.63, 0.0, 44.32, 49.45, 39.52, 38.83, 55.6, 45.95, 0.0, 0.0, 0.0, 52.56, 0.0, 0.0, 54.76, 67.0, 68.93, 72.01, 0.0, 0.0, 0.0, 57.09, 70.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.5, 0.0, 0.0, 0.0, 0.0, 30.57, 0.0, 0.0, 0.0, 35.14, 39.67, 0.0, 32.44, 37.27, 32.42, 32.21], "audiomae_on_audioset": [[["music", 27.74], ["humming", 7.4], ["theremin", 5.93]], null, [["music", 38.46], ["carnatic music", 8.44], ["vocal music", 8.03]], null, [["music", 33.92], ["humming", 10.02], ["chant", 8.67]], [["music", 66.32], ["carnatic music", 10.55], ["singing", 2.17]], [["music", 75.82], ["singing", 3.35], ["humming", 1.98]], [["music", 46.47], ["speech", 20.45], ["boing", 6.61]], null, [["music", 73.24], ["singing", 1.34], ["song", 1.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 71.03], ["singing", 2.87], ["gospel music", 2.03]], null, null, null, null, [["music", 79.87], ["carnatic music", 3.17], ["singing", 2.62]], null, null, null, [["music", 29.38], ["burping, eructation", 16.06], ["guitar", 4.99]], [["music", 61.27], ["quack", 4.87], ["synthesizer", 2.2]], null, [["music", 89.46], ["singing", 1.18], ["musical instrument", 0.88]], [["music", 35.39], ["guitar", 8.41], ["plucked string instrument", 6.17]], [["music", 76.37], ["gospel music", 1.87], ["carnatic music", 1.84]], [["music", 81.99], ["singing", 2.34], ["musical instrument", 1.98]]], "duration": [4.21, 0.55, 6.0, 1.19, 2.96, 7.27, 3.41, 6.45, 2.96, 2.49, 1.89, 0.39, 0.09, 4.02, 0.36, -0.14, 3.33, 10.11, 10.47, 3.52, 0.66, 0.6, 0.91, 2.28, 8.28, 1.0, 1.8, 0.69, 0.95, 0.57, -0.4, 0.07, 0.17, 3.45, 0.18, 0.56, 0.46, 1.05, 8.68, -0.2, 0.76, -0.21, 2.25, 2.44, 1.19, 15.01, 2.6, 4.74, 9.4]} \ No newline at end of file diff --git a/annotations_1/pppK-fl9a2E_filtered.json b/annotations_1/pppK-fl9a2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dd92b9f1f60822e1d02c104ca33689b5ad2a063 --- /dev/null +++ b/annotations_1/pppK-fl9a2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.75], [4.0, 5.66], [7.0, 8.23], [9.0, 9.58], [11.0, 13.73], [15.0, 16.55], [17.0, 20.6], [22.0, 22.18], [22.0, 23.45], [42.0, 41.89], [44.0, 47.09], [48.0, 51.26], [54.0, 55.26], [56.0, 56.34], [69.0, 69.79], [75.0, 75.66], [76.0, 79.41], [80.0, 83.05], [85.0, 85.16], [87.0, 95.28], [97.0, 97.58], [103.0, 103.47], [107.0, 106.98], [117.0, 118.22], [126.0, 127.26], [134.0, 133.81], [134.0, 134.76], [136.0, 137.15], [138.0, 138.5], [140.0, 141.84], [145.0, 145.3], [147.0, 147.56], [149.0, 149.15], [150.0, 150.58]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 47.9, 0.0, 38.67, 0.0, 0.0, 0.0, 30.78, 28.64, 0.0, 0.0, 0.0, 0.0, 36.75, 33.12, 0.0, 33.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 25.65], ["quack", 7.48], ["croak", 6.29]], null, [["speech", 37.21], ["music", 30.06], ["hum", 3.74]], null, null, null, [["music", 62.8], ["theremin", 7.61], ["ambient music", 7.31]], [["thunk", 27.51], ["whack, thwack", 17.88], ["music", 10.35]], null, null, null, null, [["hum", 21.38], ["music", 19.78], ["mains hum", 15.55]], [["speech", 45.5], ["sidetone", 25.18], ["telephone", 11.9]], null, [["music", 69.87], ["synthesizer", 7.0], ["musical instrument", 5.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.25, 1.66, 1.23, 0.58, 2.73, 1.55, 3.6, 0.18, 1.45, -0.11, 3.09, 3.26, 1.26, 0.34, 0.79, 0.66, 3.41, 3.05, 0.16, 8.28, 0.58, 0.47, -0.02, 1.22, 1.26, -0.19, 0.76, 1.15, 0.5, 1.84, 0.3, 0.56, 0.15, 0.58]} \ No newline at end of file diff --git a/annotations_1/prAOME_9oP8_filtered.json b/annotations_1/prAOME_9oP8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e87585b153cf746fd7a6473d352b883e3893fc52 --- /dev/null +++ b/annotations_1/prAOME_9oP8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 30.94], [32.0, 37.2], [42.0, 42.35], [46.0, 73.72], [76.0, 76.45], [77.0, 78.04], [80.0, 87.81], [89.0, 90.09], [92.0, 121.1], [122.0, 126.45], [129.0, 130.65], [133.0, 142.01], [149.0, 161.45], [166.0, 170.53], [171.0, 175.95]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [30.86, 50.02, 0.0, 42.58, 0.0, 0.0, 38.25, 0.0, 42.51, 33.79, 0.0, 28.96, 32.6, 34.97, 34.42], "audiomae_on_audioset": [[["machine gun", 24.31], ["speech", 23.13], ["music", 17.3]], null, null, [["music", 51.01], ["throbbing", 22.92], ["hum", 8.37]], null, null, [["hum", 40.15], ["speech", 18.52], ["throbbing", 15.28]], null, [["hum", 36.5], ["speech", 24.69], ["throbbing", 15.44]], [["music", 31.69], ["hum", 17.62], ["throbbing", 8.14]], null, [["music", 60.91], ["throbbing", 4.87], ["hum", 4.36]], [["car", 17.36], ["music", 13.51], ["explosion", 11.85]], [["fart", 38.56], ["speech", 28.94], ["noise", 13.62]], [["music", 21.48], ["noise", 7.15], ["thunk", 5.63]]], "duration": [10.94, 5.2, 0.35, 27.72, 0.45, 1.04, 7.81, 1.09, 29.1, 4.45, 1.65, 9.01, 12.45, 4.53, 4.95]} \ No newline at end of file diff --git a/annotations_1/prTlJO34AHE_filtered.json b/annotations_1/prTlJO34AHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7f514216433bcaddc20e2b7ad8b3a1d4332a91b --- /dev/null +++ b/annotations_1/prTlJO34AHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 22.1], [23.0, 22.89], [25.0, 24.71], [25.0, 27.65], [37.0, 37.22], [43.0, 45.64], [46.0, 52.41], [55.0, 56.32], [59.0, 61.13], [65.0, 66.73], [71.0, 79.98], [80.0, 88.6], [95.0, 96.67], [98.0, 98.83], [99.0, 104.19], [107.0, 107.7], [113.0, 115.99], [119.0, 121.0], [125.0, 128.04], [130.0, 131.55], [134.0, 135.5], [142.0, 145.29], [147.0, 152.71], [154.0, 156.57], [157.0, 158.89], [159.0, 167.09], [169.0, 174.06], [174.0, 176.99]], "keep_status": [true, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false, false, true, false, true, false, true, false, true], "silence_prob": [34.58, 0.0, 0.0, 37.85, 0.0, 74.76, 75.88, 0.0, 61.77, 0.0, 31.85, 31.58, 0.0, 0.0, 37.9, 0.0, 50.81, 35.95, 46.43, 0.0, 0.0, 32.92, 32.47, 37.28, 0.0, 34.34, 34.85, 33.65], "audiomae_on_audioset": [[["music", 24.84], ["speech", 20.71], ["didgeridoo", 6.39]], null, null, [["grunt", 32.69], ["speech", 18.82], ["music", 12.71]], null, null, null, null, null, null, [["music", 23.55], ["hum", 19.73], ["throbbing", 11.75]], [["music", 46.42], ["groan", 14.6], ["speech", 9.62]], null, null, [["speech", 50.23], ["music", 32.82], ["groan", 4.14]], null, null, [["music", 29.3], ["sheep", 21.48], ["bleat", 18.25]], [["music", 37.73], ["throbbing", 13.83], ["synthesizer", 7.03]], null, null, [["music", 50.91], ["honk", 9.78], ["goose", 8.01]], [["music", 47.27], ["groan", 22.84], ["speech", 9.05]], [["music", 29.05], ["bow-wow", 10.8], ["animal", 10.44]], null, [["music", 28.08], ["animal", 19.63], ["speech", 9.04]], [["music", 43.53], ["speech", 40.63], ["brass instrument", 2.59]], [["music", 38.4], ["speech", 27.61], ["didgeridoo", 3.4]]], "duration": [5.1, -0.11, -0.29, 2.65, 0.22, 2.64, 6.41, 1.32, 2.13, 1.73, 8.98, 8.6, 1.67, 0.83, 5.19, 0.7, 2.99, 2.0, 3.04, 1.55, 1.5, 3.29, 5.71, 2.57, 1.89, 8.09, 5.06, 2.99]} \ No newline at end of file diff --git a/annotations_1/psDtqypK3hI_filtered.json b/annotations_1/psDtqypK3hI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..056061cc88be3e3136c3ff2dc13f4760e5b1639c --- /dev/null +++ b/annotations_1/psDtqypK3hI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [11.0, 11.91], [16.0, 17.69], [21.0, 20.66], [27.0, 27.65], [32.0, 32.76], [35.0, 36.12], [47.0, 47.17], [57.0, 58.14], [62.0, 62.31], [65.0, 70.68], [73.0, 97.66], [103.0, 183.66], [185.0, 185.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.45, 42.51, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 42.84], ["livestock, farm animals, working animals", 9.99], ["cattle, bovinae", 9.63]], [["music", 69.8], ["wind instrument, woodwind instrument", 10.59], ["flute", 6.73]], null, null], "duration": [0.43, 0.91, 1.69, -0.34, 0.65, 0.76, 1.12, 0.17, 1.14, 0.31, 5.68, 24.66, 80.66, 0.4]} \ No newline at end of file diff --git a/annotations_1/psW7sLoNutA_filtered.json b/annotations_1/psW7sLoNutA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..75a000369b50b05ee8cd6a2f78542b86d4eda597 --- /dev/null +++ b/annotations_1/psW7sLoNutA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.12], [3.0, 3.28], [9.0, 9.9], [11.0, 12.19], [20.0, 20.88], [24.0, 27.24], [31.0, 33.3], [37.0, 37.86], [38.0, 39.8], [41.0, 42.89], [45.0, 45.69], [47.0, 52.08], [53.0, 53.76], [55.0, 55.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 82.97, 89.01, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 0.28, 0.9, 1.19, 0.88, 3.24, 2.3, 0.86, 1.8, 1.89, 0.69, 5.08, 0.76, 0.59]} \ No newline at end of file diff --git a/annotations_1/ptAdtShJa_0_filtered.json b/annotations_1/ptAdtShJa_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57e90ff83d001ae3e8440e611fd51b29d3d77adb --- /dev/null +++ b/annotations_1/ptAdtShJa_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.51], [19.0, 20.49], [21.0, 21.09], [22.0, 21.63], [23.0, 26.1], [27.0, 27.87], [28.0, 29.25], [32.0, 32.71], [34.0, 37.39], [38.0, 38.7], [42.0, 42.8], [49.0, 49.84], [50.0, 50.62], [51.0, 52.15], [53.0, 53.55], [56.0, 58.04], [58.0, 59.16], [62.0, 62.63], [64.0, 65.7], [68.0, 69.33], [71.0, 73.97], [86.0, 86.49], [90.0, 91.0], [93.0, 94.68], [98.0, 100.89], [101.0, 103.94], [104.0, 105.22], [106.0, 106.79], [108.0, 109.63], [114.0, 131.45], [133.0, 148.64], [152.0, 162.89], [166.0, 167.43], [168.0, 170.77], [172.0, 172.34], [174.0, 174.19], [176.0, 176.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 42.88, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 41.95, 0.0, 0.0, 0.0, 88.64, 38.75, 0.0, 0.0, 0.0, 44.29, 45.46, 37.24, 0.0, 35.94, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 38.34], ["speech", 21.07], ["music", 13.42]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.7], ["sidetone", 14.42], ["radio", 3.77]], null, null, null, null, [["speech", 60.77], ["telephone dialing, dtmf", 16.36], ["telephone", 14.44]], null, null, null, [["hum", 27.36], ["music", 19.78], ["mains hum", 19.54]], [["music", 74.58], ["theremin", 3.92], ["cello", 2.35]], [["music", 55.04], ["crack", 4.24], ["thunk", 2.57]], null, [["speech", 46.79], ["music", 21.96], ["radio", 19.33]], null, null, null], "duration": [1.51, 1.49, 0.09, -0.37, 3.1, 0.87, 1.25, 0.71, 3.39, 0.7, 0.8, 0.84, 0.62, 1.15, 0.55, 2.04, 1.16, 0.63, 1.7, 1.33, 2.97, 0.49, 1.0, 1.68, 2.89, 2.94, 1.22, 0.79, 1.63, 17.45, 15.64, 10.89, 1.43, 2.77, 0.34, 0.19, 0.61]} \ No newline at end of file diff --git a/annotations_1/ptJ8x9AERwA_filtered.json b/annotations_1/ptJ8x9AERwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f22c9b0f59a3c0e21d0bf860930d5c3235cf1337 --- /dev/null +++ b/annotations_1/ptJ8x9AERwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.32], [12.0, 18.39], [19.0, 20.41], [23.0, 24.53], [25.0, 26.3], [28.0, 30.15], [31.0, 31.63], [33.0, 34.86], [39.0, 40.91], [42.0, 43.7], [50.0, 50.67], [52.0, 53.79], [56.0, 57.86], [60.0, 66.72], [70.0, 78.58], [81.0, 82.56], [89.0, 90.93], [95.0, 96.33], [98.0, 98.58], [104.0, 104.99], [107.0, 108.57], [111.0, 112.53], [113.0, 114.17], [115.0, 116.5], [118.0, 119.4], [123.0, 124.58], [125.0, 126.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 100.0, 0.0, 0.0, 0.0, 72.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.32, 6.39, 1.41, 1.53, 1.3, 2.15, 0.63, 1.86, 1.91, 1.7, 0.67, 1.79, 1.86, 6.72, 8.58, 1.56, 1.93, 1.33, 0.58, 0.99, 1.57, 1.53, 1.17, 1.5, 1.4, 1.58, 1.08]} \ No newline at end of file diff --git a/annotations_1/ptOc-HdvEW0_filtered.json b/annotations_1/ptOc-HdvEW0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06dce4b5b22997da4a03a8c49522fa717e418958 --- /dev/null +++ b/annotations_1/ptOc-HdvEW0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.57], [8.0, 8.68], [11.0, 11.21], [11.0, 13.73], [28.0, 28.68], [33.0, 33.47], [46.0, 46.99], [48.0, 48.59], [56.0, 56.73], [58.0, 58.92], [87.0, 87.89], [90.0, 90.41], [99.0, 98.96], [109.0, 109.85], [115.0, 115.4], [123.0, 125.02], [126.0, 126.4], [128.0, 129.19], [131.0, 132.26], [138.0, 140.17], [143.0, 148.66], [149.0, 149.18], [150.0, 150.4], [155.0, 155.38], [161.0, 160.78], [162.0, 162.31], [163.0, 163.11], [166.0, 167.75], [169.0, 168.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 0.0, 96.04, 44.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 85.97], ["radio", 3.67], ["telephone", 2.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 76.96], ["radio", 2.79], ["telephone", 1.86]], null, null, null, null, null, null, null, null], "duration": [0.57, 0.68, 0.21, 2.73, 0.68, 0.47, 0.99, 0.59, 0.73, 0.92, 0.89, 0.41, -0.04, 0.85, 0.4, 2.02, 0.4, 1.19, 1.26, 2.17, 5.66, 0.18, 0.4, 0.38, -0.22, 0.31, 0.11, 1.75, -0.02]} \ No newline at end of file diff --git a/annotations_1/ptcDoIfzLtI_filtered.json b/annotations_1/ptcDoIfzLtI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97ba3493b119242333aaf1a6e0d7a5b3f89b8093 --- /dev/null +++ b/annotations_1/ptcDoIfzLtI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 22.87], [36.0, 36.54]], "keep_status": [false, false], "silence_prob": [53.72, 0.0], "audiomae_on_audioset": [null, null], "duration": [2.87, 0.54]} \ No newline at end of file diff --git a/annotations_1/puXiyRw_L6g_filtered.json b/annotations_1/puXiyRw_L6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70bca5df6bf49a41b7e340b0f25282d60b720c30 --- /dev/null +++ b/annotations_1/puXiyRw_L6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.72], [11.0, 14.27], [17.0, 18.59], [27.0, 27.85], [29.0, 29.08], [32.0, 32.32], [34.0, 38.87], [39.0, 40.1], [41.0, 42.65], [44.0, 45.18], [49.0, 49.89], [59.0, 59.86], [61.0, 63.54], [69.0, 68.93], [71.0, 72.49], [79.0, 86.64], [90.0, 108.48], [110.0, 111.79], [113.0, 116.11], [120.0, 126.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 87.19, 0.0, 0.0, 0.0, 0.0, 0.0, 77.87, 0.0, 0.0, 93.91, 97.73, 0.0, 65.44, 69.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 3.27, 1.59, 0.85, 0.08, 0.32, 4.87, 1.1, 1.65, 1.18, 0.89, 0.86, 2.54, -0.07, 1.49, 7.64, 18.48, 1.79, 3.11, 6.96]} \ No newline at end of file diff --git a/annotations_1/puyN3edOOUY_filtered.json b/annotations_1/puyN3edOOUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f5c2c30aaa85e3a7463543e92311184a8b120b1 --- /dev/null +++ b/annotations_1/puyN3edOOUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.81], [16.0, 90.91]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.81, 74.91]} \ No newline at end of file diff --git a/annotations_1/pvACjy-tYFE_filtered.json b/annotations_1/pvACjy-tYFE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..172530cf7e618c97817157cd340a7d6a94e512ca --- /dev/null +++ b/annotations_1/pvACjy-tYFE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.46], [20.0, 27.97], [33.0, 33.56], [34.0, 43.56], [49.0, 48.96], [56.0, 56.59], [62.0, 63.34], [65.0, 67.39], [70.0, 72.99], [75.0, 76.89], [79.0, 83.79], [85.0, 89.95], [92.0, 107.94]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, true, true], "silence_prob": [30.26, 35.48, 0.0, 35.22, 0.0, 0.0, 0.0, 40.21, 29.87, 0.0, 29.16, 29.28, 29.07], "audiomae_on_audioset": [[["speech", 38.75], ["music", 27.85], ["whack, thwack", 4.44]], [["mains hum", 28.95], ["hum", 25.99], ["throbbing", 12.71]], null, [["speech", 30.79], ["hum", 22.08], ["music", 17.45]], null, null, null, [["music", 68.64], ["musical instrument", 8.64], ["synthesizer", 5.16]], [["music", 21.26], ["vehicle", 4.35], ["synthesizer", 4.02]], null, [["music", 43.53], ["throbbing", 20.11], ["static", 6.69]], [["music", 26.01], ["throbbing", 24.66], ["mains hum", 16.89]], [["music", 28.08], ["vehicle", 14.64], ["hum", 9.91]]], "duration": [9.46, 7.97, 0.56, 9.56, -0.04, 0.59, 1.34, 2.39, 2.99, 1.89, 4.79, 4.95, 15.94]} \ No newline at end of file diff --git a/annotations_1/pvNA2JkMfSI_filtered.json b/annotations_1/pvNA2JkMfSI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d34429c242754d93329a8978744c6e3bbcab705e --- /dev/null +++ b/annotations_1/pvNA2JkMfSI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.06], [12.0, 13.24], [17.0, 17.74], [20.0, 20.6], [21.0, 22.11], [25.0, 25.62], [29.0, 29.94], [33.0, 33.2], [36.0, 36.17], [37.0, 39.26], [47.0, 47.16], [49.0, 49.52], [51.0, 54.11], [55.0, 56.74], [58.0, 58.99], [61.0, 61.53], [64.0, 64.64], [65.0, 66.21], [83.0, 84.74], [86.0, 86.66], [87.0, 88.75], [91.0, 92.3], [95.0, 98.44], [100.0, 100.95], [102.0, 102.12], [104.0, 104.7], [106.0, 107.18], [109.0, 109.68], [110.0, 111.1], [113.0, 113.51], [114.0, 115.32], [116.0, 123.04], [126.0, 128.85], [131.0, 130.77], [135.0, 137.07], [139.0, 140.75], [145.0, 146.11], [148.0, 150.33], [153.0, 154.68], [156.0, 156.2], [157.0, 158.5], [163.0, 165.03], [168.0, 169.97], [173.0, 181.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 0.0, 82.97, 0.0, 0.0, 95.91, 0.0, 0.0, 0.0, 97.83, 0.0, 99.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.06, 1.24, 0.74, 0.6, 1.11, 0.62, 0.94, 0.2, 0.17, 2.26, 0.16, 0.52, 3.11, 1.74, 0.99, 0.53, 0.64, 1.21, 1.74, 0.66, 1.75, 1.3, 3.44, 0.95, 0.12, 0.7, 1.18, 0.68, 1.1, 0.51, 1.32, 7.04, 2.85, -0.23, 2.07, 1.75, 1.11, 2.33, 1.68, 0.2, 1.5, 2.03, 1.97, 8.06]} \ No newline at end of file diff --git a/annotations_1/pvS3j8VtanM_filtered.json b/annotations_1/pvS3j8VtanM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56c566591e9ce9eea5e3b0a866db887c2d9f8a89 --- /dev/null +++ b/annotations_1/pvS3j8VtanM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.22], [6.0, 6.1], [7.0, 7.5], [20.0, 20.85], [23.0, 24.16], [28.0, 32.05], [36.0, 36.63], [40.0, 40.1], [41.0, 43.26], [44.0, 46.47], [47.0, 47.73], [48.0, 48.91], [50.0, 51.78], [53.0, 54.36], [56.0, 55.7], [58.0, 60.83], [63.0, 68.01], [69.0, 69.99], [73.0, 75.76], [79.0, 82.43], [89.0, 88.87], [93.0, 93.36], [95.0, 95.0], [96.0, 96.79], [97.0, 97.71], [100.0, 100.65], [102.0, 102.44], [114.0, 117.93], [119.0, 119.3], [121.0, 122.86], [126.0, 128.6], [142.0, 142.35], [146.0, 147.23], [149.0, 149.93], [152.0, 152.32], [154.0, 153.99], [156.0, 156.36], [157.0, 157.0], [158.0, 158.41], [162.0, 163.9]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 39.05, 96.29, 0.0, 0.0, 0.0, 0.0, 0.0, 77.87, 46.15, 0.0, 51.5, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.86, 0.0, 0.0, 48.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 36.91], ["mains hum", 12.56], ["music", 9.47]], null, null, null, null, null, null, null, [["speech", 66.99], ["music", 7.63], ["synthesizer", 2.25]], null, null, null, null, null, null, null, null, null, null, [["speech", 60.6], ["music", 13.64], ["synthesizer", 2.89]], null, null, [["music", 63.91], ["synthesizer", 10.86], ["musical instrument", 5.24]], null, null, null, null, null, null, null, null, null], "duration": [1.22, 0.1, 0.5, 0.85, 1.16, 4.05, 0.63, 0.1, 2.26, 2.47, 0.73, 0.91, 1.78, 1.36, -0.3, 2.83, 5.01, 0.99, 2.76, 3.43, -0.13, 0.36, 0.0, 0.79, 0.71, 0.65, 0.44, 3.93, 0.3, 1.86, 2.6, 0.35, 1.23, 0.93, 0.32, -0.01, 0.36, 0.0, 0.41, 1.9]} \ No newline at end of file diff --git a/annotations_1/pwSkfvXD_ug_filtered.json b/annotations_1/pwSkfvXD_ug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..96eb9c54f226d00f1dd83991a0118f880b23da4a --- /dev/null +++ b/annotations_1/pwSkfvXD_ug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.41], [17.0, 17.59], [19.0, 169.62], [176.0, 177.31], [179.0, 178.92]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.41, 0.59, 150.62, 1.31, -0.08]} \ No newline at end of file diff --git a/annotations_1/pxQNKJWZ-t0_filtered.json b/annotations_1/pxQNKJWZ-t0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eb36fd80a038d10d39e03c6c16807ce2890c1b11 --- /dev/null +++ b/annotations_1/pxQNKJWZ-t0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 20.85], [21.0, 35.83], [41.0, 53.54], [54.0, 62.8], [64.0, 76.05], [77.0, 89.9], [90.0, 90.44], [90.0, 134.05], [138.0, 146.62]], "keep_status": [true, false, false, true, false, true, false, false, true], "silence_prob": [28.96, 29.43, 29.23, 28.51, 29.33, 28.58, 0.0, 0.0, 29.76], "audiomae_on_audioset": [[["speech", 22.53], ["music", 15.97], ["roar", 9.83]], [["music", 26.99], ["hum", 25.54], ["throbbing", 19.09]], [["music", 69.68], ["throbbing", 7.4], ["theremin", 2.58]], [["speech", 16.59], ["music", 14.76], ["rumble", 6.14]], [["music", 41.08], ["speech", 27.92], ["didgeridoo", 3.31]], [["music", 29.56], ["hum", 21.45], ["mains hum", 18.39]], null, null, [["grunt", 53.3], ["roaring cats (lions, tigers)", 7.26], ["sound effect", 5.01]]], "duration": [19.85, 14.83, 12.54, 8.8, 12.05, 12.9, 0.44, 44.05, 8.62]} \ No newline at end of file diff --git a/annotations_1/pxSjP6JkAis_filtered.json b/annotations_1/pxSjP6JkAis_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35b0b27b7e9ae8e451fe562a639f35be50a8753f --- /dev/null +++ b/annotations_1/pxSjP6JkAis_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.59], [4.0, 4.9], [5.0, 6.72], [9.0, 9.66], [10.0, 12.21], [14.0, 14.59], [15.0, 15.75], [19.0, 27.09], [30.0, 31.63], [32.0, 38.84], [40.0, 40.46], [41.0, 51.21], [52.0, 56.03], [57.0, 64.45], [67.0, 69.57], [72.0, 73.21], [74.0, 74.55], [76.0, 77.58], [80.0, 85.97], [87.0, 87.71], [89.0, 90.88], [91.0, 91.03], [91.0, 91.86], [94.0, 96.21], [97.0, 97.23], [98.0, 98.69], [102.0, 104.52], [106.0, 107.3], [109.0, 115.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 99.88, 0.0, 71.0, 0.0, 62.89, 55.39, 43.25, 53.28, 0.0, 0.0, 0.0, 47.7, 0.0, 0.0, 0.0, 0.0, 47.2, 0.0, 0.0, 44.4, 0.0, 42.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 67.96], ["musical instrument", 5.39], ["plucked string instrument", 3.21]], null, null, null, null, [["music", 52.87], ["electric piano", 7.25], ["keyboard (musical)", 5.61]], null, null, null, null, [["music", 54.96], ["lullaby", 6.3], ["vibraphone", 4.81]], null, null, [["music", 39.71], ["electric piano", 12.7], ["keyboard (musical)", 8.31]], null, [["music", 63.37], ["guitar", 5.58], ["plucked string instrument", 4.84]]], "duration": [1.59, 0.9, 1.72, 0.66, 2.21, 0.59, 0.75, 8.09, 1.63, 6.84, 0.46, 10.21, 4.03, 7.45, 2.57, 1.21, 0.55, 1.58, 5.97, 0.71, 1.88, 0.03, 0.86, 2.21, 0.23, 0.69, 2.52, 1.3, 6.91]} \ No newline at end of file diff --git a/annotations_1/py7xqlpvCIk_filtered.json b/annotations_1/py7xqlpvCIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ceae0447940da73a9b7236b5c4396bfe2c8ac632 --- /dev/null +++ b/annotations_1/py7xqlpvCIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [6.0, 39.16], [40.0, 55.54], [56.0, 67.63], [69.0, 101.41], [102.0, 105.48]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.31, 33.43, 0.0, 30.32], "audiomae_on_audioset": [null, null, [["hum", 52.52], ["mains hum", 32.25], ["music", 8.38]], [["music", 40.73], ["hum", 36.47], ["mains hum", 5.36]], null, [["fly, housefly", 45.85], ["insect", 28.17], ["speech", 7.25]]], "duration": [1.13, 33.16, 15.54, 11.63, 32.41, 3.48]} \ No newline at end of file diff --git a/annotations_1/pz6wAzZlnhE_filtered.json b/annotations_1/pz6wAzZlnhE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..019b55ce7ef3b45a306bee4b1f921c7099f4e6d6 --- /dev/null +++ b/annotations_1/pz6wAzZlnhE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.59], [11.0, 18.08], [19.0, 21.19], [24.0, 25.93], [28.0, 30.62], [34.0, 36.46], [39.0, 39.5], [42.0, 49.79], [51.0, 52.69], [54.0, 54.78], [56.0, 56.05], [57.0, 57.45], [58.0, 58.06], [59.0, 84.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 100.0, 0.0, 98.44, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.59, 7.08, 2.19, 1.93, 2.62, 2.46, 0.5, 7.79, 1.69, 0.78, 0.05, 0.45, 0.06, 25.86]} \ No newline at end of file diff --git a/annotations_1/pzE6SVUHAYE_filtered.json b/annotations_1/pzE6SVUHAYE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1411acf4ccd42e255252174482656c82ee145ae8 --- /dev/null +++ b/annotations_1/pzE6SVUHAYE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.18], [5.0, 6.83], [13.0, 13.58], [16.0, 17.32], [24.0, 26.81], [31.0, 31.82], [91.0, 98.29], [99.0, 102.41]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [1.18, 1.83, 0.58, 1.32, 2.81, 0.82, 7.29, 3.41]} \ No newline at end of file diff --git a/annotations_1/pzG1ckuBqpg_filtered.json b/annotations_1/pzG1ckuBqpg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afc73124e4d90e22e7ff7a021932e31027dcafbc --- /dev/null +++ b/annotations_1/pzG1ckuBqpg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.56], [32.0, 49.47], [76.0, 87.96], [90.0, 98.1], [101.0, 104.36], [113.0, 117.15], [125.0, 128.29], [131.0, 131.5], [133.0, 134.54], [135.0, 135.46], [138.0, 139.75], [140.0, 143.19]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [66.39, 31.1, 42.28, 78.04, 78.21, 78.38, 30.67, 0.0, 0.0, 0.0, 0.0, 52.39], "audiomae_on_audioset": [null, [["speech", 83.06], ["boing", 2.28], ["whack, thwack", 1.23]], [["hum", 21.84], ["music", 13.01], ["musical instrument", 10.83]], null, null, null, [["speech", 73.99], ["radio", 11.49], ["speech synthesizer", 3.36]], null, null, null, null, null], "duration": [5.56, 17.47, 11.96, 8.1, 3.36, 4.15, 3.29, 0.5, 1.54, 0.46, 1.75, 3.19]} \ No newline at end of file diff --git a/annotations_1/pzZ9UdUTRNA_filtered.json b/annotations_1/pzZ9UdUTRNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc822d4e1c94bc77ce61c6cc6271fbd89602f873 --- /dev/null +++ b/annotations_1/pzZ9UdUTRNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.54], [5.0, 5.73], [15.0, 16.17], [17.0, 25.69], [27.0, 27.84], [29.0, 29.71], [31.0, 31.78], [32.0, 41.52], [42.0, 43.58], [45.0, 46.79], [50.0, 72.28], [79.0, 80.42], [91.0, 94.27], [99.0, 106.83], [113.0, 131.75], [138.0, 140.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 50.97, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 35.91, 0.0, 76.04, 53.1, 64.97, 45.05], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["machine gun", 58.25], ["speech", 14.24], ["gunshot, gunfire", 8.49]], null, null, null, null, [["music", 48.37], ["electronic music", 6.48], ["scary music", 4.18]]], "duration": [1.54, 0.73, 1.17, 8.69, 0.84, 0.71, 0.78, 9.52, 1.58, 1.79, 22.28, 1.42, 3.27, 7.83, 18.75, 2.88]} \ No newline at end of file diff --git a/annotations_1/q-nQtR-WbIs_filtered.json b/annotations_1/q-nQtR-WbIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..859d5bd8a8db60b8a5bc926d9f78d290652f5aa1 --- /dev/null +++ b/annotations_1/q-nQtR-WbIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 10.99], [15.0, 16.09], [17.0, 18.67], [20.0, 21.05], [23.0, 24.83], [25.0, 27.5], [31.0, 31.35], [33.0, 33.89], [36.0, 42.15], [44.0, 45.4], [49.0, 53.2], [55.0, 57.52], [60.0, 61.84], [63.0, 65.65], [68.0, 70.68], [72.0, 91.34], [93.0, 97.53], [98.0, 101.28], [102.0, 109.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [61.87, 0.0, 0.0, 0.0, 0.0, 60.42, 0.0, 0.0, 63.64, 0.0, 58.3, 80.11, 0.0, 73.51, 46.36, 53.22, 71.57, 53.4, 57.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 42.09], ["musical instrument", 12.16], ["guitar", 5.93]], null, null, null, null], "duration": [4.99, 1.09, 1.67, 1.05, 1.83, 2.5, 0.35, 0.89, 6.15, 1.4, 4.2, 2.52, 1.84, 2.65, 2.68, 19.34, 4.53, 3.28, 7.75]} \ No newline at end of file diff --git a/annotations_1/q1SFvQhjK5I_filtered.json b/annotations_1/q1SFvQhjK5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00e18a206fc89cde1e872484411cd86ffe61c352 --- /dev/null +++ b/annotations_1/q1SFvQhjK5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 41.28], [42.0, 42.26], [43.0, 43.68], [45.0, 45.15], [50.0, 50.8], [53.0, 54.06], [55.0, 56.54], [58.0, 58.8], [65.0, 65.67], [66.0, 67.54], [69.0, 69.52], [70.0, 71.07], [73.0, 73.72], [80.0, 81.82], [84.0, 84.94], [101.0, 101.95], [103.0, 104.45], [105.0, 106.68], [108.0, 109.07], [111.0, 111.54], [112.0, 112.97], [114.0, 114.64], [116.0, 118.1], [129.0, 130.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0], "audiomae_on_audioset": [[["music", 77.7], ["theremin", 2.9], ["throbbing", 1.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [17.28, 0.26, 0.68, 0.15, 0.8, 1.06, 1.54, 0.8, 0.67, 1.54, 0.52, 1.07, 0.72, 1.82, 0.94, 0.95, 1.45, 1.68, 1.07, 0.54, 0.97, 0.64, 2.1, 1.01]} \ No newline at end of file diff --git a/annotations_1/q1bV-D8cSz8_filtered.json b/annotations_1/q1bV-D8cSz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9fdb1cc4765a78d247937cae11041ba0de172c80 --- /dev/null +++ b/annotations_1/q1bV-D8cSz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 37.77], [39.0, 44.68], [49.0, 71.68], [72.0, 72.62], [77.0, 77.25], [79.0, 79.62], [81.0, 82.07], [83.0, 96.45], [96.0, 115.42]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [80.11, 86.82, 72.75, 0.0, 0.0, 0.0, 0.0, 32.66, 33.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 23.95], ["speech", 16.88], ["hum", 14.72]], [["music", 37.04], ["speech", 24.19], ["smash, crash", 9.74]]], "duration": [22.77, 5.68, 22.68, 0.62, 0.25, 0.62, 1.07, 13.45, 19.42]} \ No newline at end of file diff --git a/annotations_1/q289a8P8Ht8_filtered.json b/annotations_1/q289a8P8Ht8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2d827271413ff968398496b2f7db9db8586bd01 --- /dev/null +++ b/annotations_1/q289a8P8Ht8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 116.88], [118.0, 149.82]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [82.88, 31.82]} \ No newline at end of file diff --git a/annotations_1/q2EU-k9I5yg_filtered.json b/annotations_1/q2EU-k9I5yg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf33f8ca162013533cbc139e174d7cf73ac3292f --- /dev/null +++ b/annotations_1/q2EU-k9I5yg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.48], [4.0, 4.45], [10.0, 10.39], [12.0, 12.04], [13.0, 13.61], [19.0, 19.57], [45.0, 45.6], [48.0, 48.61], [58.0, 59.19], [97.0, 97.12], [101.0, 101.33], [102.0, 102.1], [106.0, 107.32], [111.0, 111.91], [113.0, 113.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.48, 0.45, 0.39, 0.04, 0.61, 0.57, 0.6, 0.61, 1.19, 0.12, 0.33, 0.1, 1.32, 0.91, 0.64]} \ No newline at end of file diff --git a/annotations_1/q2YwvMc96VY_filtered.json b/annotations_1/q2YwvMc96VY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ed5fb815cca7de6d97ce2ead61b5a59dd07f0238 --- /dev/null +++ b/annotations_1/q2YwvMc96VY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [5.0, 6.02], [7.0, 7.05], [9.0, 9.81], [11.0, 11.53], [14.0, 14.57], [16.0, 16.44], [20.0, 20.17], [22.0, 64.52], [65.0, 67.37], [68.0, 69.6], [70.0, 72.82], [73.0, 75.36], [76.0, 77.63], [79.0, 79.44], [80.0, 80.76], [83.0, 83.24], [85.0, 86.07], [87.0, 90.54], [91.0, 100.33], [103.0, 104.14], [107.0, 108.8], [109.0, 111.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 57.48, 64.07, 0.0, 0.0, 0.0, 0.0, 0.0, 92.8, 33.63, 0.0, 0.0, 52.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.18], ["speech", 15.51], ["sidetone", 5.07]], null, null, null], "duration": [1.3, 1.02, 0.05, 0.81, 0.53, 0.57, 0.44, 0.17, 42.52, 2.37, 1.6, 2.82, 2.36, 1.63, 0.44, 0.76, 0.24, 1.07, 3.54, 9.33, 1.14, 1.8, 2.92]} \ No newline at end of file diff --git a/annotations_1/q30Pl1M6_DE_filtered.json b/annotations_1/q30Pl1M6_DE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eaac6bf946caee7a2f3fd1483ee6423e6145e19b --- /dev/null +++ b/annotations_1/q30Pl1M6_DE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 110.42], [113.0, 112.9], [114.0, 136.07]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 29.54], "audiomae_on_audioset": [null, null, [["music", 69.57], ["hum", 9.74], ["mains hum", 4.53]]], "duration": [92.42, -0.1, 22.07]} \ No newline at end of file diff --git a/annotations_1/q3Vvto0REuc_filtered.json b/annotations_1/q3Vvto0REuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5f24b32a11034a4bb60f4b37641d5be338fa1fe5 --- /dev/null +++ b/annotations_1/q3Vvto0REuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.05], [28.0, 39.77], [41.0, 41.91], [44.0, 46.67], [48.0, 50.04], [51.0, 52.05], [53.0, 54.06], [56.0, 56.49], [57.0, 58.23], [63.0, 63.83], [65.0, 65.74], [67.0, 70.12], [71.0, 72.1], [73.0, 73.99], [75.0, 75.95], [77.0, 77.53], [79.0, 79.88], [81.0, 82.31], [83.0, 83.47], [85.0, 85.77], [88.0, 91.86], [93.0, 94.86], [97.0, 97.16], [99.0, 99.03], [101.0, 101.61], [102.0, 103.25], [104.0, 104.38], [105.0, 104.94], [107.0, 107.76], [109.0, 109.93], [111.0, 112.24], [115.0, 115.08], [116.0, 117.42], [119.0, 119.57], [122.0, 123.16], [124.0, 124.78], [126.0, 126.69], [128.0, 128.73], [130.0, 130.98], [133.0, 133.32], [134.0, 135.01], [136.0, 137.03], [139.0, 143.16], [148.0, 149.88], [150.0, 152.56], [153.0, 154.75], [156.0, 157.17], [158.0, 160.1], [161.0, 162.08], [164.0, 166.53], [168.0, 168.89], [172.0, 193.24], [194.0, 195.61], [197.0, 197.46], [200.0, 202.95], [204.0, 205.43], [208.0, 215.89], [217.0, 219.06], [219.0, 221.97], [222.0, 224.14], [225.0, 228.33]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 30.57, 0.0, 49.68, 98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 56.18, 0.0, 0.0, 53.84, 0.0, 99.76, 0.0, 94.95, 0.0, 0.0, 78.55, 0.0, 99.88, 62.78, 49.27, 39.63, 99.16], "audiomae_on_audioset": [null, [["fly, housefly", 15.2], ["hum", 15.1], ["music", 13.9]], null, [["speech", 11.13], ["hum", 10.58], ["sneeze", 9.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.07], ["sidetone", 24.02], ["hum", 3.63]], [["speech", 31.75], ["sidetone", 19.56], ["dial tone", 12.14]], null], "duration": [1.05, 11.77, 0.91, 2.67, 2.04, 1.05, 1.06, 0.49, 1.23, 0.83, 0.74, 3.12, 1.1, 0.99, 0.95, 0.53, 0.88, 1.31, 0.47, 0.77, 3.86, 1.86, 0.16, 0.03, 0.61, 1.25, 0.38, -0.06, 0.76, 0.93, 1.24, 0.08, 1.42, 0.57, 1.16, 0.78, 0.69, 0.73, 0.98, 0.32, 1.01, 1.03, 4.16, 1.88, 2.56, 1.75, 1.17, 2.1, 1.08, 2.53, 0.89, 21.24, 1.61, 0.46, 2.95, 1.43, 7.89, 2.06, 2.97, 2.14, 3.33]} \ No newline at end of file diff --git a/annotations_1/q42thgSKkpo_filtered.json b/annotations_1/q42thgSKkpo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71cdd813712ecf42a270c7d28116d0ab2cd15ca6 --- /dev/null +++ b/annotations_1/q42thgSKkpo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 64.52], [67.0, 75.03], [76.0, 81.19], [83.0, 83.44], [84.0, 83.61], [84.0, 99.37], [103.0, 110.79], [116.0, 118.81], [122.0, 132.19], [133.0, 153.87], [155.0, 158.97]], "keep_status": [false, true, true, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 29.06, 30.16, 0.0, 0.0, 29.37, 42.19, 36.52, 35.61, 38.9, 29.26], "audiomae_on_audioset": [null, [["music", 26.49], ["speech", 23.9], ["mains hum", 13.67]], [["music", 25.8], ["mains hum", 6.93], ["foghorn", 6.43]], null, null, [["music", 65.23], ["didgeridoo", 7.31], ["speech", 3.64]], [["music", 41.02], ["speech", 15.76], ["whale vocalization", 7.68]], [["theremin", 36.28], ["music", 31.47], ["wind instrument, woodwind instrument", 4.54]], [["music", 46.12], ["theremin", 25.52], ["whale vocalization", 4.7]], [["didgeridoo", 43.17], ["music", 34.13], ["musical instrument", 2.84]], [["music", 45.52], ["musical instrument", 9.54], ["sound effect", 6.44]]], "duration": [56.52, 8.03, 5.19, 0.44, -0.39, 15.37, 7.79, 2.81, 10.19, 20.87, 3.97]} \ No newline at end of file diff --git a/annotations_1/q5RSKejDWo8_filtered.json b/annotations_1/q5RSKejDWo8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b668e559887e787248df620dda7a746e3cab9f3 --- /dev/null +++ b/annotations_1/q5RSKejDWo8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [5.0, 5.07], [7.0, 9.42], [11.0, 17.31], [26.0, 27.53], [31.0, 31.41], [32.0, 32.49], [33.0, 33.79], [41.0, 40.86], [42.0, 42.82], [44.0, 44.1], [47.0, 48.25], [53.0, 54.24], [55.0, 56.94], [58.0, 60.0], [62.0, 65.6], [69.0, 69.01], [76.0, 76.4], [77.0, 77.06], [80.0, 79.95], [81.0, 81.48], [82.0, 83.07], [83.0, 83.59], [84.0, 87.07], [88.0, 88.64], [89.0, 90.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 85.72, 60.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.88, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.07, 2.42, 6.31, 1.53, 0.41, 0.49, 0.79, -0.14, 0.82, 0.1, 1.25, 1.24, 1.94, 2.0, 3.6, 0.01, 0.4, 0.06, -0.05, 0.48, 1.07, 0.59, 3.07, 0.64, 1.17]} \ No newline at end of file diff --git a/annotations_1/q5eGg_CgBPk_filtered.json b/annotations_1/q5eGg_CgBPk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45bb471648d9e6d024c7cf48e62ce7ef59e4ec6c --- /dev/null +++ b/annotations_1/q5eGg_CgBPk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.0], [14.0, 15.08], [20.0, 36.95], [59.0, 61.13], [65.0, 79.03], [79.0, 79.07], [79.0, 79.1], [79.0, 79.41], [79.0, 79.44], [85.0, 85.11], [92.0, 98.17], [100.0, 102.29], [113.0, 120.5], [128.0, 130.54], [133.0, 148.44]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 32.51, 32.22, 32.7, 0.0, 0.0, 0.0, 0.0, 0.0, 32.88, 34.17, 33.75, 31.01, 35.3], "audiomae_on_audioset": [null, null, [["music", 23.97], ["speech", 18.5], ["breaking", 15.7]], [["speech", 41.2], ["music", 32.48], ["boing", 3.31]], [["speech", 48.29], ["music", 35.28], ["explosion", 2.42]], null, null, null, null, null, [["music", 45.03], ["didgeridoo", 14.62], ["speech", 11.91]], [["music", 41.47], ["theremin", 4.79], ["musical instrument", 4.75]], [["speech", 45.67], ["music", 35.79], ["sidetone", 6.72]], [["music", 41.66], ["trombone", 8.49], ["speech", 7.33]], [["whale vocalization", 40.86], ["theremin", 20.63], ["music", 16.89]]], "duration": [0.0, 1.08, 16.95, 2.13, 14.03, 0.07, 0.1, 0.41, 0.44, 0.11, 6.17, 2.29, 7.5, 2.54, 15.44]} \ No newline at end of file diff --git a/annotations_1/q6ObhNBURyY_filtered.json b/annotations_1/q6ObhNBURyY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7baf5e21a6979e8c05ab339e8bdfcbd6f46fc15 --- /dev/null +++ b/annotations_1/q6ObhNBURyY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 74.87], [76.0, 143.33], [144.0, 143.95], [144.0, 166.08]], "keep_status": [false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 28.5], "audiomae_on_audioset": [null, null, null, [["music", 19.68], ["vehicle", 13.41], ["car", 11.03]]], "duration": [45.87, 67.33, -0.05, 22.08]} \ No newline at end of file diff --git a/annotations_1/q6j_0vS_NNM_filtered.json b/annotations_1/q6j_0vS_NNM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3222a58d5681c35fa936845350d7bdedd05d8a6c --- /dev/null +++ b/annotations_1/q6j_0vS_NNM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.58], [16.0, 18.57], [21.0, 22.17], [23.0, 27.63], [30.0, 36.73], [40.0, 41.08], [45.0, 49.71], [54.0, 54.53], [56.0, 58.04], [60.0, 64.32], [66.0, 76.3], [78.0, 81.97], [85.0, 85.72], [87.0, 99.3], [102.0, 109.26], [114.0, 113.86], [114.0, 113.9], [114.0, 117.98], [126.0, 127.23], [135.0, 136.34], [138.0, 144.41], [146.0, 152.27], [153.0, 154.09], [158.0, 161.25], [162.0, 163.02], [165.0, 173.42], [177.0, 177.04], [180.0, 182.07]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.27, 0.0, 47.12, 39.63, 0.0, 36.55, 0.0, 35.52, 38.93, 36.99, 39.83, 0.0, 35.77, 38.97, 0.0, 0.0, 41.89, 0.0, 0.0, 36.27, 35.59, 0.0, 34.88, 0.0, 37.05, 0.0, 46.64], "audiomae_on_audioset": [null, [["music", 56.9], ["fly, housefly", 5.47], ["insect", 2.84]], null, [["music", 63.09], ["bass guitar", 4.08], ["double bass", 2.84]], [["music", 74.2], ["bass guitar", 2.43], ["double bass", 2.09]], null, [["music", 77.85], ["musical instrument", 1.82], ["mantra", 1.59]], null, [["music", 73.24], ["humming", 3.63], ["carnatic music", 2.71]], [["music", 83.24], ["sad music", 1.23], ["musical instrument", 1.17]], [["music", 67.54], ["double bass", 7.28], ["cello", 5.9]], [["music", 69.54], ["mantra", 3.72], ["carnatic music", 2.64]], null, [["music", 79.48], ["sad music", 3.12], ["cello", 1.98]], [["music", 57.86], ["double bass", 11.95], ["cello", 9.96]], null, null, [["music", 62.64], ["theremin", 6.0], ["cello", 4.46]], null, null, [["music", 78.74], ["guitar", 3.5], ["plucked string instrument", 2.71]], [["music", 81.57], ["mantra", 1.87], ["musical instrument", 1.33]], null, [["music", 73.93], ["mantra", 2.11], ["vocal music", 1.46]], null, [["music", 79.52], ["double bass", 3.29], ["cello", 1.47]], null, [["music", 73.25], ["musical instrument", 1.8], ["scary music", 1.51]]], "duration": [0.58, 2.57, 1.17, 4.63, 6.73, 1.08, 4.71, 0.53, 2.04, 4.32, 10.3, 3.97, 0.72, 12.3, 7.26, -0.14, -0.1, 3.98, 1.23, 1.34, 6.41, 6.27, 1.09, 3.25, 1.02, 8.42, 0.04, 2.07]} \ No newline at end of file diff --git a/annotations_1/q7S2ckr4IkM_filtered.json b/annotations_1/q7S2ckr4IkM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b00bd6ab8f5f647a9f73bb1b0739f6b3ffb48350 --- /dev/null +++ b/annotations_1/q7S2ckr4IkM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.23], [29.0, 29.34], [32.0, 35.02], [35.0, 35.06], [35.0, 35.61], [37.0, 38.16], [45.0, 45.23], [48.0, 48.32], [53.0, 53.32], [54.0, 56.4], [62.0, 62.43], [69.0, 70.39], [71.0, 72.01], [75.0, 75.88], [77.0, 78.12], [80.0, 80.13], [82.0, 82.68], [86.0, 86.56], [89.0, 90.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.23, 0.34, 3.02, 0.06, 0.61, 1.16, 0.23, 0.32, 0.32, 2.4, 0.43, 1.39, 1.01, 0.88, 1.12, 0.13, 0.68, 0.56, 1.59]} \ No newline at end of file diff --git a/annotations_1/q7V1sM0VNaw_filtered.json b/annotations_1/q7V1sM0VNaw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b7635076f4d1842f95547a154cdf524d161e0b6 --- /dev/null +++ b/annotations_1/q7V1sM0VNaw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 14.25], [20.0, 26.97], [28.0, 28.56], [32.0, 33.72], [35.0, 35.51], [37.0, 38.28], [39.0, 39.92], [47.0, 48.24], [49.0, 49.98], [51.0, 52.05], [54.0, 54.5], [56.0, 56.47], [58.0, 59.64], [61.0, 63.48], [64.0, 64.84], [66.0, 67.56], [71.0, 71.96], [76.0, 77.26], [84.0, 84.47], [86.0, 86.49], [89.0, 92.13], [93.0, 93.33], [101.0, 101.97], [105.0, 105.51], [106.0, 106.54], [108.0, 111.92], [113.0, 113.78], [116.0, 115.6], [117.0, 118.64], [120.0, 124.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.86, 31.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 0.0, 0.0, 0.0, 0.0, 58.98, 0.0, 0.0, 0.0, 29.84], "audiomae_on_audioset": [[["music", 54.8], ["sidetone", 11.94], ["speech", 9.01]], [["music", 78.58], ["throbbing", 3.97], ["musical instrument", 2.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.68], ["speech", 12.16], ["applause", 4.75]]], "duration": [4.25, 6.97, 0.56, 1.72, 0.51, 1.28, 0.92, 1.24, 0.98, 1.05, 0.5, 0.47, 1.64, 2.48, 0.84, 1.56, 0.96, 1.26, 0.47, 0.49, 3.13, 0.33, 0.97, 0.51, 0.54, 3.92, 0.78, -0.4, 1.64, 4.77]} \ No newline at end of file diff --git a/annotations_1/q7tLJC4pC14_filtered.json b/annotations_1/q7tLJC4pC14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba25ec36e7b1909c02a59ffce3ee332923263227 --- /dev/null +++ b/annotations_1/q7tLJC4pC14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.34], [13.0, 14.03], [16.0, 23.46], [24.0, 31.4], [33.0, 33.76], [34.0, 35.18], [36.0, 36.34], [37.0, 40.46], [42.0, 43.12], [45.0, 46.43], [49.0, 49.59], [52.0, 53.28], [54.0, 55.0], [56.0, 59.1], [60.0, 61.3], [64.0, 65.7], [68.0, 68.39], [85.0, 85.72], [86.0, 87.0], [89.0, 93.73], [95.0, 95.62], [96.0, 96.57], [98.0, 107.25]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 32.29, 78.38, 0.0, 0.0, 0.0, 52.51, 0.0, 0.0, 0.0, 0.0, 0.0, 43.51, 0.0, 0.0, 0.0, 0.0, 0.0, 49.54, 0.0, 0.0, 31.69], "audiomae_on_audioset": [null, null, [["music", 54.84], ["electronic music", 4.13], ["speech", 2.56]], null, null, null, null, null, null, null, null, null, null, [["music", 31.79], ["speech", 15.51], ["fart", 9.13]], null, null, null, null, null, [["speech", 23.04], ["hum", 16.89], ["mains hum", 8.45]], null, null, [["speech", 16.6], ["animal", 12.71], ["beatboxing", 6.29]]], "duration": [0.34, 1.03, 7.46, 7.4, 0.76, 1.18, 0.34, 3.46, 1.12, 1.43, 0.59, 1.28, 1.0, 3.1, 1.3, 1.7, 0.39, 0.72, 1.0, 4.73, 0.62, 0.57, 9.25]} \ No newline at end of file diff --git a/annotations_1/q8-xQspXFag_filtered.json b/annotations_1/q8-xQspXFag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5e56e219ebbf2aaf766295263bef28b529d6b44 --- /dev/null +++ b/annotations_1/q8-xQspXFag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.85], [8.0, 10.37], [11.0, 11.69], [14.0, 14.99], [18.0, 18.91], [19.0, 22.22], [24.0, 45.0], [47.0, 48.09], [49.0, 53.38], [55.0, 56.1], [56.0, 143.45], [144.0, 143.72], [144.0, 143.75], [144.0, 143.82], [145.0, 147.04], [150.0, 153.52], [155.0, 155.98], [157.0, 164.89], [168.0, 171.39], [174.0, 175.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [98.8, 96.54, 0.0, 0.0, 0.0, 87.92, 79.07, 0.0, 35.54, 0.0, 0.0, 0.0, 0.0, 0.0, 62.47, 47.5, 0.0, 52.27, 61.87, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["whale vocalization", 57.46], ["music", 17.03], ["pigeon, dove", 2.64]], null, null, null, null, null, null, [["thunk", 52.54], ["fart", 4.97], ["hum", 3.99]], null, null, null, null], "duration": [2.85, 2.37, 0.69, 0.99, 0.91, 3.22, 21.0, 1.09, 4.38, 1.1, 87.45, -0.28, -0.25, -0.18, 2.04, 3.52, 0.98, 7.89, 3.39, 1.14]} \ No newline at end of file diff --git a/annotations_1/q8HcMk_IimM_filtered.json b/annotations_1/q8HcMk_IimM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dedbc2fd564897c6352557516b9cf0dd779a902b --- /dev/null +++ b/annotations_1/q8HcMk_IimM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.06], [1.0, 2.44], [5.0, 18.81], [21.0, 42.99], [47.0, 50.14], [51.0, 55.24], [57.0, 57.5], [58.0, 58.87], [61.0, 61.08], [70.0, 77.8], [78.0, 78.07], [79.0, 79.35], [81.0, 81.3], [82.0, 83.03], [84.0, 85.21], [86.0, 86.75], [88.0, 88.13], [91.0, 91.47], [94.0, 99.89], [100.0, 136.7], [137.0, 138.59], [148.0, 172.3]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 30.59, 29.98, 31.63, 29.13, 0.0, 0.0, 0.0, 29.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.08, 0.0, 0.0, 28.58], "audiomae_on_audioset": [null, null, [["music", 61.76], ["didgeridoo", 6.31], ["whack, thwack", 5.87]], [["music", 29.07], ["whack, thwack", 29.02], ["whip", 11.75]], [["music", 79.78], ["boing", 2.78], ["electronic music", 2.75]], [["speech", 37.46], ["music", 30.38], ["burst, pop", 6.86]], null, null, null, [["music", 54.43], ["speech", 13.05], ["radio", 5.79]], null, null, null, null, null, null, null, null, [["music", 75.85], ["didgeridoo", 4.16], ["musical instrument", 2.06]], null, null, [["music", 61.05], ["music of latin america", 6.22], ["funny music", 2.37]]], "duration": [0.06, 1.44, 13.81, 21.99, 3.14, 4.24, 0.5, 0.87, 0.08, 7.8, 0.07, 0.35, 0.3, 1.03, 1.21, 0.75, 0.13, 0.47, 5.89, 36.7, 1.59, 24.3]} \ No newline at end of file diff --git a/annotations_1/q8Wj4buHUtE_filtered.json b/annotations_1/q8Wj4buHUtE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b696a0508b4bd2ad34b5a20496f890b4dc45a6b4 --- /dev/null +++ b/annotations_1/q8Wj4buHUtE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.4], [4.0, 3.94], [5.0, 5.27], [8.0, 8.77], [10.0, 13.02], [15.0, 16.55], [19.0, 20.95], [25.0, 27.73], [29.0, 28.85], [32.0, 32.37], [33.0, 35.77], [38.0, 39.02], [41.0, 40.91], [45.0, 45.86], [47.0, 47.43], [50.0, 52.79], [54.0, 55.83], [58.0, 62.24], [64.0, 65.08], [66.0, 67.78], [68.0, 71.02], [73.0, 78.12], [79.0, 79.61], [83.0, 90.19], [92.0, 102.78], [104.0, 108.14], [114.0, 115.86], [119.0, 121.31], [124.0, 143.67], [146.0, 146.42], [147.0, 157.87]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 54.17, 0.0, 0.0, 49.97, 0.0, 0.0, 36.24, 0.0, 0.0, 0.0, 0.0, 71.29, 0.0, 67.0, 0.0, 0.0, 43.79, 59.15, 0.0, 60.05, 57.64, 75.39, 0.0, 63.1, 54.63, 0.0, 42.42], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 26.0], ["mosquito", 5.93], ["synthesizer", 5.08]], null, null, [["music", 25.13], ["hum", 22.25], ["throbbing", 9.87]], null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 24.17], ["hum", 15.32], ["fly, housefly", 12.26]], null, null, null, null, null, null, null, null, null, [["music", 51.08], ["hum", 17.7], ["mains hum", 6.03]]], "duration": [1.4, -0.06, 0.27, 0.77, 3.02, 1.55, 1.95, 2.73, -0.15, 0.37, 2.77, 1.02, -0.09, 0.86, 0.43, 2.79, 1.83, 4.24, 1.08, 1.78, 3.02, 5.12, 0.61, 7.19, 10.78, 4.14, 1.86, 2.31, 19.67, 0.42, 10.87]} \ No newline at end of file diff --git a/annotations_1/q8nzGlXDvO8_filtered.json b/annotations_1/q8nzGlXDvO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a612c06193b9ca8d5fd1ca7e40c47565bffbcb6 --- /dev/null +++ b/annotations_1/q8nzGlXDvO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.82], [24.0, 24.65], [26.0, 26.42], [27.0, 26.92], [28.0, 28.66], [29.0, 31.89], [33.0, 33.1], [40.0, 39.88], [43.0, 44.69], [47.0, 47.7], [53.0, 53.89], [57.0, 56.96], [58.0, 58.26], [60.0, 62.41], [69.0, 80.32], [82.0, 84.97], [87.0, 105.88], [108.0, 114.08], [117.0, 117.63], [118.0, 124.09]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.3, 51.6, 87.19, 47.54, 74.76, 0.0, 55.04], "audiomae_on_audioset": [null, null, null, null, null, [["music", 30.24], ["speech", 22.55], ["burping, eructation", 7.23]], null, null, null, null, null, null, null, null, null, null, [["music", 81.3], ["guitar", 2.01], ["drum machine", 1.41]], null, null, null], "duration": [1.82, 0.65, 0.42, -0.08, 0.66, 2.89, 0.1, -0.12, 1.69, 0.7, 0.89, -0.04, 0.26, 2.41, 11.32, 2.97, 18.88, 6.08, 0.63, 6.09]} \ No newline at end of file diff --git a/annotations_1/q8woScnBklo_filtered.json b/annotations_1/q8woScnBklo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef28657ad8231fd2a538d5b3c51ff4d2aee8dee8 --- /dev/null +++ b/annotations_1/q8woScnBklo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.85], [10.0, 10.93], [11.0, 14.2], [15.0, 16.39], [18.0, 18.3], [20.0, 34.26], [45.0, 52.89], [59.0, 59.97], [61.0, 62.33], [66.0, 65.77], [68.0, 71.51], [75.0, 84.62], [88.0, 88.4], [89.0, 92.4], [95.0, 100.03], [100.0, 101.49], [103.0, 103.89], [105.0, 105.83], [107.0, 111.43], [113.0, 112.89], [113.0, 113.93], [115.0, 115.13], [116.0, 121.66]], "keep_status": [false, false, true, false, false, true, true, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.52, 0.0, 0.0, 31.53, 30.65, 0.0, 0.0, 0.0, 46.64, 33.69, 0.0, 43.1, 72.75, 0.0, 0.0, 0.0, 67.89, 0.0, 0.0, 0.0, 57.72], "audiomae_on_audioset": [null, null, [["music", 34.39], ["foghorn", 21.29], ["musical instrument", 7.78]], null, null, [["music", 35.93], ["musical instrument", 7.83], ["foghorn", 4.61]], [["music", 41.17], ["foghorn", 11.23], ["quack", 8.46]], null, null, null, [["music", 44.16], ["theremin", 6.76], ["musical instrument", 5.01]], [["music", 46.94], ["musical instrument", 10.55], ["theremin", 8.52]], null, [["music", 53.88], ["theremin", 7.92], ["hum", 4.27]], null, null, null, null, null, null, null, null, null], "duration": [-0.15, 0.93, 3.2, 1.39, 0.3, 14.26, 7.89, 0.97, 1.33, -0.23, 3.51, 9.62, 0.4, 3.4, 5.03, 1.49, 0.89, 0.83, 4.43, -0.11, 0.93, 0.13, 5.66]} \ No newline at end of file diff --git a/annotations_1/q928Wa_h_gg_filtered.json b/annotations_1/q928Wa_h_gg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fc94ab59cb9b93ac30371f48148164bed49be384 --- /dev/null +++ b/annotations_1/q928Wa_h_gg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 29.29], [31.0, 30.82], [31.0, 30.89], [31.0, 40.51], [56.0, 60.88], [68.0, 72.52], [74.0, 75.79], [81.0, 81.57], [87.0, 91.4], [94.0, 95.88]], "keep_status": [false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 31.85, 30.07, 32.84, 0.0, 0.0, 30.54, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 49.63], ["hum", 15.33], ["mains hum", 8.21]], [["fly, housefly", 46.03], ["mosquito", 32.07], ["insect", 15.72]], [["breaking", 20.63], ["gunshot, gunfire", 10.41], ["clang", 9.49]], null, null, [["music", 24.16], ["speech", 17.1], ["whack, thwack", 10.06]], null], "duration": [0.29, -0.18, -0.11, 9.51, 4.88, 4.52, 1.79, 0.57, 4.4, 1.88]} \ No newline at end of file diff --git a/annotations_1/q9FYBjSc3cU_filtered.json b/annotations_1/q9FYBjSc3cU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2b9e63352ae464b4ad76a70f7629c1c37599cfd --- /dev/null +++ b/annotations_1/q9FYBjSc3cU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.74], [16.0, 18.47], [20.0, 21.49], [23.0, 23.06], [27.0, 29.59], [34.0, 54.55], [56.0, 74.73], [75.0, 94.04], [97.0, 100.23], [102.0, 102.54], [103.0, 107.6], [109.0, 111.86], [113.0, 115.38], [117.0, 118.4], [121.0, 124.11], [126.0, 126.57], [129.0, 129.34], [132.0, 132.48], [134.0, 134.96], [137.0, 137.56], [143.0, 145.84], [148.0, 148.12], [152.0, 151.95], [163.0, 165.05], [170.0, 171.27], [172.0, 174.73], [176.0, 177.2], [178.0, 179.1], [180.0, 180.57]], "keep_status": [false, true, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 37.45, 0.0, 0.0, 38.91, 46.86, 32.24, 31.15, 33.2, 0.0, 32.5, 70.02, 93.6, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 76.86, 0.0, 0.0, 57.4, 0.0, 42.06, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 36.92], ["speech", 14.2], ["hum", 8.52]], null, null, [["hum", 41.94], ["mains hum", 12.28], ["throbbing", 11.41]], [["music", 59.53], ["throbbing", 13.08], ["hum", 11.12]], [["music", 57.79], ["throbbing", 17.4], ["hum", 4.98]], [["music", 64.34], ["throbbing", 9.35], ["electronic music", 3.6]], [["speech", 26.25], ["music", 24.69], ["smash, crash", 8.67]], null, [["speech", 70.16], ["fart", 8.9], ["music", 6.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.3], ["ambient music", 10.99], ["hum", 5.41]], null, null, null], "duration": [0.74, 2.47, 1.49, 0.06, 2.59, 20.55, 18.73, 19.04, 3.23, 0.54, 4.6, 2.86, 2.38, 1.4, 3.11, 0.57, 0.34, 0.48, 0.96, 0.56, 2.84, 0.12, -0.05, 2.05, 1.27, 2.73, 1.2, 1.1, 0.57]} \ No newline at end of file diff --git a/annotations_1/q9Wip3v8h40_filtered.json b/annotations_1/q9Wip3v8h40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fa2575a6a8cfb235c65b6cca86bba6cf1bb7bf7 --- /dev/null +++ b/annotations_1/q9Wip3v8h40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.85], [15.0, 15.15], [17.0, 17.56], [18.0, 17.76], [22.0, 24.73], [29.0, 29.51], [30.0, 29.62], [34.0, 40.58], [43.0, 46.23], [48.0, 48.95], [65.0, 65.96], [67.0, 67.12], [68.0, 70.56], [76.0, 79.71], [84.0, 84.45]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.61, 0.0, 0.0, 32.74, 33.9, 0.0, 0.0, 0.0, 34.99, 55.89, 0.0], "audiomae_on_audioset": [null, null, null, null, [["boing", 70.77], ["fly, housefly", 4.33], ["music", 3.48]], null, null, [["music", 68.48], ["musical instrument", 3.57], ["speech", 3.29]], [["music", 26.2], ["speech", 21.96], ["boing", 14.84]], null, null, null, [["cattle, bovinae", 29.44], ["moo", 17.85], ["livestock, farm animals, working animals", 10.88]], null, null], "duration": [1.85, 0.15, 0.56, -0.24, 2.73, 0.51, -0.38, 6.58, 3.23, 0.95, 0.96, 0.12, 2.56, 3.71, 0.45]} \ No newline at end of file diff --git a/annotations_1/q9X6tpvxZyE_filtered.json b/annotations_1/q9X6tpvxZyE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1b01ebdf274dd86ad58c47910653989bfc6d22b --- /dev/null +++ b/annotations_1/q9X6tpvxZyE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.27], [11.0, 13.49], [24.0, 24.44], [27.0, 29.64], [39.0, 40.05], [46.0, 47.66], [49.0, 53.92], [55.0, 55.73], [59.0, 60.54], [61.0, 61.99], [63.0, 63.0], [63.0, 67.36], [69.0, 77.19], [78.0, 83.51], [85.0, 86.7], [89.0, 89.18], [89.0, 90.63], [102.0, 101.92], [117.0, 117.83], [126.0, 126.82], [128.0, 129.46], [130.0, 132.36], [133.0, 133.66], [135.0, 136.36], [142.0, 142.25], [144.0, 144.58], [157.0, 157.0], [158.0, 158.63], [159.0, 163.65], [165.0, 173.53], [174.0, 176.42], [178.0, 181.92], [183.0, 185.4], [186.0, 186.65], [187.0, 188.11], [192.0, 192.97], [193.0, 194.56], [195.0, 195.62], [196.0, 228.8], [230.0, 232.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.36, 0.0, 93.91, 0.0, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 60.79, 99.59, 99.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 94.95, 80.64, 73.67, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["boing", 31.51], ["speech", 26.87], ["music", 14.32]]], "duration": [0.27, 2.49, 0.44, 2.64, 1.05, 1.66, 4.92, 0.73, 1.54, 0.99, 0.0, 4.36, 8.19, 5.51, 1.7, 0.18, 1.63, -0.08, 0.83, 0.82, 1.46, 2.36, 0.66, 1.36, 0.25, 0.58, 0.0, 0.63, 4.65, 8.53, 2.42, 3.92, 2.4, 0.65, 1.11, 0.97, 1.56, 0.62, 32.8, 2.71]} \ No newline at end of file diff --git a/annotations_1/q9sjo2J6hIk_filtered.json b/annotations_1/q9sjo2J6hIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4395663414ad1c72b4a224fc5940e13c49f1a8ee --- /dev/null +++ b/annotations_1/q9sjo2J6hIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 13.07], [15.0, 107.87], [111.0, 111.47], [113.0, 113.59]], "keep_status": [false, false, false, false], "silence_prob": [38.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 30.52], ["cattle, bovinae", 20.28], ["moo", 20.09]], null, null, null], "duration": [9.07, 92.87, 0.47, 0.59]} \ No newline at end of file diff --git a/annotations_1/qA_zzk2c7G8_filtered.json b/annotations_1/qA_zzk2c7G8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6984c2e263016dc5faa08cd39d77e0e015ec3c31 --- /dev/null +++ b/annotations_1/qA_zzk2c7G8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.36], [11.0, 20.11], [28.0, 28.07], [29.0, 28.98], [31.0, 31.62], [34.0, 34.18], [38.0, 38.87], [40.0, 43.75], [44.0, 44.42], [44.0, 51.06], [57.0, 57.77], [60.0, 63.22], [66.0, 66.66], [68.0, 68.28], [69.0, 69.21], [73.0, 74.43], [77.0, 101.51], [103.0, 103.44], [103.0, 103.52], [104.0, 104.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [89.9, 61.18, 0.0, 0.0, 0.0, 0.0, 0.0, 91.47, 0.0, 42.74, 0.0, 49.82, 0.0, 0.0, 0.0, 0.0, 57.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 54.19], ["speech", 10.43], ["mosquito", 8.44]], null, [["music", 43.92], ["speech", 8.82], ["boing", 5.34]], null, null, null, null, null, null, null, null], "duration": [2.36, 9.11, 0.07, -0.02, 0.62, 0.18, 0.87, 3.75, 0.42, 7.06, 0.77, 3.22, 0.66, 0.28, 0.21, 1.43, 24.51, 0.44, 0.52, 0.04]} \ No newline at end of file diff --git a/annotations_1/qAfsU2gI408_filtered.json b/annotations_1/qAfsU2gI408_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20d897ac60e0eecf4505fd2eab878ddc38e54f31 --- /dev/null +++ b/annotations_1/qAfsU2gI408_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.91], [5.0, 5.37], [7.0, 7.21], [10.0, 10.89], [12.0, 12.66], [14.0, 13.66], [15.0, 16.63], [18.0, 21.84], [23.0, 24.16], [25.0, 27.03], [28.0, 29.51], [30.0, 30.77], [32.0, 32.53], [34.0, 34.99], [35.0, 35.78], [36.0, 39.97], [41.0, 42.15], [44.0, 44.22], [44.0, 51.48], [52.0, 53.64], [54.0, 55.27], [58.0, 61.2], [62.0, 62.65], [64.0, 64.59], [65.0, 101.36], [102.0, 106.41], [109.0, 150.18], [152.0, 159.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 0.0, 99.88, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 46.36, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 46.06], ["throbbing", 17.95], ["mains hum", 14.39]], null, null], "duration": [1.91, 0.37, 0.21, 0.89, 0.66, -0.34, 1.63, 3.84, 1.16, 2.03, 1.51, 0.77, 0.53, 0.99, 0.78, 3.97, 1.15, 0.22, 7.48, 1.64, 1.27, 3.2, 0.65, 0.59, 36.36, 4.41, 41.18, 7.24]} \ No newline at end of file diff --git a/annotations_1/qB311wvyggM_filtered.json b/annotations_1/qB311wvyggM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4eb1898d36ed96e54fa2e130763dc83759e9281 --- /dev/null +++ b/annotations_1/qB311wvyggM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 38.01], [39.0, 39.65], [41.0, 55.07], [57.0, 66.8], [68.0, 71.0], [72.0, 92.21]], "keep_status": [false, false, true, false, true, true], "silence_prob": [35.08, 0.0, 41.62, 53.04, 34.69, 33.21], "audiomae_on_audioset": [[["speech", 57.19], ["sidetone", 11.27], ["hum", 6.95]], null, [["speech", 19.4], ["mains hum", 7.7], ["vehicle", 6.73]], null, [["music", 35.53], ["electronic music", 13.64], ["synthesizer", 6.38]], [["hum", 32.82], ["mains hum", 25.34], ["speech", 9.67]]], "duration": [2.01, 0.65, 14.07, 9.8, 3.0, 20.21]} \ No newline at end of file diff --git a/annotations_1/qB93c2JU4uQ_filtered.json b/annotations_1/qB93c2JU4uQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1ea77281ad3289bcba8a9aac58e3f779ac9843b --- /dev/null +++ b/annotations_1/qB93c2JU4uQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.96], [22.0, 22.84], [51.0, 50.92], [57.0, 57.55], [62.0, 65.69], [66.0, 67.78], [68.0, 68.52], [71.0, 70.95], [78.0, 78.43], [79.0, 79.57], [81.0, 105.22], [105.0, 106.42], [111.0, 111.3], [113.0, 136.9], [138.0, 144.02], [146.0, 179.05], [182.0, 199.94], [204.0, 205.43], [206.0, 206.52], [208.0, 209.97], [216.0, 225.96], [227.0, 234.25], [241.0, 243.43]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.7, 0.0, 0.0, 0.0, 0.0, 0.0, 31.42, 0.0, 0.0, 30.01, 30.46, 0.0, 29.95, 0.0, 0.0, 0.0, 30.16, 31.6, 43.48], "audiomae_on_audioset": [null, null, null, null, [["fly, housefly", 34.32], ["music", 12.6], ["insect", 11.09]], null, null, null, null, null, [["mains hum", 36.25], ["hum", 32.72], ["music", 16.55]], null, null, [["throbbing", 27.29], ["hum", 26.7], ["music", 23.85]], [["music", 54.36], ["throbbing", 21.51], ["hum", 10.9]], null, [["music", 44.56], ["speech", 24.95], ["groan", 5.42]], null, null, null, [["music", 40.83], ["boing", 12.0], ["smash, crash", 5.39]], [["music", 52.22], ["throbbing", 15.17], ["hum", 7.9]], [["music", 58.53], ["boing", 5.78], ["musical instrument", 4.11]]], "duration": [0.96, 0.84, -0.08, 0.55, 3.69, 1.78, 0.52, -0.05, 0.43, 0.57, 24.22, 1.42, 0.3, 23.9, 6.02, 33.05, 17.94, 1.43, 0.52, 1.97, 9.96, 7.25, 2.43]} \ No newline at end of file diff --git a/annotations_1/qCYYMqHyPKk_filtered.json b/annotations_1/qCYYMqHyPKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f75dc67f97fdbdf8c2c2422a60b0fb6f265fa0e --- /dev/null +++ b/annotations_1/qCYYMqHyPKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.64], [8.0, 24.63], [28.0, 33.59], [34.0, 38.6], [39.0, 40.66], [52.0, 57.21], [66.0, 69.21], [71.0, 72.67], [80.0, 100.94], [104.0, 124.39]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 52.62, 64.18, 51.6, 0.0, 63.42, 50.61, 0.0, 63.21, 40.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 34.88], ["explosion", 13.29], ["hum", 7.61]]], "duration": [0.64, 16.63, 5.59, 4.6, 1.66, 5.21, 3.21, 1.67, 20.94, 20.39]} \ No newline at end of file diff --git a/annotations_1/qC_pkxnYQfk_filtered.json b/annotations_1/qC_pkxnYQfk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..360d701b4fe3700ca0a876bdd8e74508967cb5cf --- /dev/null +++ b/annotations_1/qC_pkxnYQfk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 44.47], [48.0, 51.76], [52.0, 96.7]], "keep_status": [true, false, false], "silence_prob": [43.9, 28.36, 0.0], "audiomae_on_audioset": [[["music", 56.03], ["hum", 7.02], ["ambient music", 6.41]], [["livestock, farm animals, working animals", 42.48], ["cattle, bovinae", 23.25], ["moo", 15.27]], null], "duration": [26.47, 3.76, 44.7]} \ No newline at end of file diff --git a/annotations_1/qCjSApp2o1E_filtered.json b/annotations_1/qCjSApp2o1E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89d1871fe56ade197c01ae79967949a86ef6a1e9 --- /dev/null +++ b/annotations_1/qCjSApp2o1E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.26], [24.0, 24.33], [28.0, 29.02], [31.0, 33.49], [37.0, 46.04], [51.0, 52.73], [54.0, 57.65], [60.0, 61.21], [64.0, 65.94], [72.0, 72.25], [74.0, 74.56], [78.0, 80.33], [82.0, 81.73], [84.0, 92.4], [96.0, 96.69], [99.0, 99.52], [100.0, 99.55]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 85.9, 31.92, 0.0, 44.72, 0.0, 0.0, 0.0, 0.0, 44.96, 0.0, 28.66, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 47.33], ["sidetone", 22.48], ["music", 11.55]], null, [["hum", 22.74], ["music", 20.05], ["throbbing", 17.06]], null, null, null, null, [["hum", 22.15], ["mains hum", 9.31], ["music", 7.24]], null, [["mains hum", 32.13], ["hum", 21.98], ["music", 19.88]], null, null, null], "duration": [1.26, 0.33, 1.02, 2.49, 9.04, 1.73, 3.65, 1.21, 1.94, 0.25, 0.56, 2.33, -0.27, 8.4, 0.69, 0.52, -0.45]} \ No newline at end of file diff --git a/annotations_1/qDjmN1TyJAU_filtered.json b/annotations_1/qDjmN1TyJAU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cde8d0ef8d7547a8ad1dd5e025823d140313a07c --- /dev/null +++ b/annotations_1/qDjmN1TyJAU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.23], [18.0, 38.5], [45.0, 49.64], [54.0, 60.83], [62.0, 63.14], [66.0, 66.21], [69.0, 69.43], [70.0, 73.08], [74.0, 74.83], [76.0, 75.74], [77.0, 79.69], [84.0, 84.45], [87.0, 90.49], [93.0, 94.46], [96.0, 97.23], [99.0, 100.16], [102.0, 102.59], [104.0, 105.04], [106.0, 108.36], [111.0, 111.35], [117.0, 119.26]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.47, 31.13, 36.52, 91.47, 0.0, 0.0, 0.0, 46.47, 0.0, 0.0, 97.83, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0], "audiomae_on_audioset": [[["speech", 25.88], ["hum", 21.65], ["throbbing", 13.02]], [["vehicle", 35.33], ["boat, water vehicle", 9.01], ["motorboat, speedboat", 7.88]], [["hum", 39.59], ["mains hum", 36.4], ["throbbing", 9.31]], null, null, null, null, [["speech", 71.58], ["sidetone", 11.53], ["dial tone", 3.29]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.23, 20.5, 4.64, 6.83, 1.14, 0.21, 0.43, 3.08, 0.83, -0.26, 2.69, 0.45, 3.49, 1.46, 1.23, 1.16, 0.59, 1.04, 2.36, 0.35, 2.26]} \ No newline at end of file diff --git a/annotations_1/qEH9lnYIndY_filtered.json b/annotations_1/qEH9lnYIndY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82f707bd6804c93d51ec00cd057e84890b3c1541 --- /dev/null +++ b/annotations_1/qEH9lnYIndY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.91], [15.0, 15.52], [24.0, 26.32], [36.0, 39.99], [41.0, 43.73], [45.0, 44.98], [46.0, 50.26], [52.0, 100.6], [105.0, 112.31], [113.0, 114.02], [116.0, 144.44], [147.0, 150.13], [150.0, 152.58], [157.0, 158.45]], "keep_status": [false, false, false, true, true, false, true, false, false, false, true, false, true, false], "silence_prob": [42.26, 0.0, 39.6, 49.09, 40.95, 0.0, 39.49, 0.0, 30.05, 0.0, 29.6, 31.48, 32.23, 0.0], "audiomae_on_audioset": [[["throbbing", 60.41], ["music", 14.57], ["hum", 13.51]], null, [["throbbing", 69.52], ["hum", 12.53], ["music", 5.75]], [["music", 27.6], ["hum", 22.69], ["throbbing", 12.38]], [["hum", 33.51], ["throbbing", 23.85], ["mains hum", 11.8]], null, [["synthesizer", 24.21], ["music", 22.99], ["hum", 12.16]], null, [["speech", 68.23], ["music", 6.34], ["eruption", 4.13]], null, [["speech", 46.97], ["music", 10.1], ["whip", 4.98]], [["music", 73.58], ["synthesizer", 4.19], ["musical instrument", 3.42]], [["speech", 31.34], ["music", 23.03], ["hum", 9.47]], null], "duration": [5.91, 0.52, 2.32, 3.99, 2.73, -0.02, 4.26, 48.6, 7.31, 1.02, 28.44, 3.13, 2.58, 1.45]} \ No newline at end of file diff --git a/annotations_1/qEb51O12XFw_filtered.json b/annotations_1/qEb51O12XFw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdad4ff76927b08faf4023e31e0a72af855b40ad --- /dev/null +++ b/annotations_1/qEb51O12XFw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 24.8], [32.0, 31.8], [32.0, 32.61], [35.0, 37.84], [39.0, 41.2], [42.0, 42.84], [45.0, 45.96], [48.0, 64.98], [70.0, 74.75], [79.0, 106.95], [108.0, 108.53]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 50.81, 49.18, 0.0, 0.0, 29.05, 51.99, 29.44, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 49.69], ["speech", 12.28], ["music", 8.38]], null, null, [["music", 65.3], ["throbbing", 10.91], ["electronic music", 5.42]], null, [["music", 46.18], ["throbbing", 8.14], ["electronic music", 6.81]], null], "duration": [0.8, -0.2, 0.61, 2.84, 2.2, 0.84, 0.96, 16.98, 4.75, 27.95, 0.53]} \ No newline at end of file diff --git a/annotations_1/qFH0mR6eVLg_filtered.json b/annotations_1/qFH0mR6eVLg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd0360000ddf0c5fb9bf1f60f3021ce27ae03773 --- /dev/null +++ b/annotations_1/qFH0mR6eVLg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.87], [12.0, 20.71], [21.0, 22.0], [22.0, 28.16], [29.0, 33.24], [34.0, 36.14], [41.0, 42.18], [43.0, 43.95], [44.0, 46.58], [48.0, 52.08], [52.0, 56.98], [58.0, 59.31], [61.0, 63.0], [63.0, 66.02], [67.0, 68.54], [69.0, 118.79], [120.0, 120.19], [126.0, 129.1]], "keep_status": [false, false, false, true, true, true, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [80.82, 69.74, 0.0, 47.23, 40.62, 41.46, 0.0, 0.0, 55.74, 57.48, 51.82, 0.0, 76.2, 42.67, 0.0, 0.0, 0.0, 37.77], "audiomae_on_audioset": [null, null, null, [["hum", 37.04], ["speech", 25.56], ["throbbing", 5.74]], [["speech", 48.85], ["sidetone", 14.54], ["music", 6.1]], [["speech", 28.86], ["music", 23.67], ["sidetone", 6.78]], null, null, null, null, null, null, null, [["speech", 39.88], ["sidetone", 9.67], ["music", 9.45]], null, null, null, [["whack, thwack", 12.43], ["mosquito", 7.42], ["fly, housefly", 6.96]]], "duration": [5.87, 8.71, 1.0, 6.16, 4.24, 2.14, 1.18, 0.95, 2.58, 4.08, 4.98, 1.31, 2.0, 3.02, 1.54, 49.79, 0.19, 3.1]} \ No newline at end of file diff --git a/annotations_1/qFprLPWDd-Y_filtered.json b/annotations_1/qFprLPWDd-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0554cf4ee5ad16801d0e52b717b245c5f7ca7581 --- /dev/null +++ b/annotations_1/qFprLPWDd-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.36], [13.0, 13.86], [14.0, 14.94], [20.0, 21.83]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [0.36, 0.86, 0.94, 1.83]} \ No newline at end of file diff --git a/annotations_1/qHA5R-Q1Od8_filtered.json b/annotations_1/qHA5R-Q1Od8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ec00b83607f66ea1fd7654f7d87788d8a8aef4b --- /dev/null +++ b/annotations_1/qHA5R-Q1Od8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.76], [16.0, 15.96], [20.0, 21.09], [22.0, 23.87], [24.0, 27.06], [30.0, 30.03], [30.0, 30.38], [35.0, 36.32], [41.0, 41.05], [42.0, 46.23], [48.0, 47.97], [50.0, 50.23], [54.0, 54.85], [57.0, 58.99], [64.0, 64.4], [67.0, 67.81], [74.0, 82.0], [83.0, 86.71], [88.0, 90.69], [91.0, 93.04], [97.0, 98.24], [99.0, 100.97], [102.0, 102.9], [106.0, 106.95], [110.0, 112.45], [113.0, 115.28], [116.0, 118.32], [119.0, 125.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.36, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 85.9, 96.04, 100.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, -0.04, 1.09, 1.87, 3.06, 0.03, 0.38, 1.32, 0.05, 4.23, -0.03, 0.23, 0.85, 1.99, 0.4, 0.81, 8.0, 3.71, 2.69, 2.04, 1.24, 1.97, 0.9, 0.95, 2.45, 2.28, 2.32, 6.61]} \ No newline at end of file diff --git a/annotations_1/qHisKG66fLI_filtered.json b/annotations_1/qHisKG66fLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0d252ccf403986400b92ce1184f588be0adfaa2 --- /dev/null +++ b/annotations_1/qHisKG66fLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.45], [5.0, 20.87], [25.0, 25.79], [30.0, 31.99], [33.0, 34.25], [35.0, 36.09], [39.0, 42.74], [44.0, 44.42], [45.0, 48.88], [51.0, 51.51], [54.0, 59.31], [64.0, 72.17], [78.0, 91.12], [95.0, 96.16], [98.0, 98.52], [100.0, 103.65], [105.0, 107.96], [110.0, 128.8], [130.0, 131.41], [133.0, 137.49], [139.0, 141.25], [143.0, 144.29], [146.0, 147.23], [149.0, 149.07], [151.0, 153.22], [154.0, 154.6], [156.0, 163.75], [166.0, 169.42], [171.0, 171.58], [173.0, 175.86]], "keep_status": [false, true, false, false, false, false, true, false, true, false, true, false, true, false, false, false, true, true, false, true, true, false, false, false, false, false, false, true, false, false], "silence_prob": [39.66, 30.27, 0.0, 0.0, 0.0, 0.0, 36.11, 0.0, 48.56, 0.0, 29.86, 30.27, 29.8, 0.0, 0.0, 53.16, 29.71, 29.11, 0.0, 30.07, 29.39, 0.0, 0.0, 0.0, 47.01, 0.0, 35.3, 48.1, 0.0, 39.77], "audiomae_on_audioset": [[["music", 58.26], ["hum", 11.27], ["singing bowl", 5.72]], [["grunt", 19.16], ["music", 15.51], ["animal", 14.62]], null, null, null, null, [["music", 28.04], ["gong", 18.6], ["hum", 11.89]], null, [["music", 49.86], ["foghorn", 11.51], ["ambient music", 5.47]], null, [["grunt", 39.23], ["music", 12.32], ["wild animals", 6.92]], [["music", 84.06], ["roaring cats (lions, tigers)", 1.99], ["wild animals", 1.74]], [["music", 40.99], ["sound effect", 5.5], ["hum", 5.23]], null, null, null, [["music", 27.42], ["speech", 20.33], ["carnatic music", 6.72]], [["music", 46.15], ["sound effect", 3.43], ["groan", 3.42]], null, [["speech", 28.9], ["music", 20.93], ["didgeridoo", 6.2]], [["hum", 22.7], ["music", 17.88], ["sonar", 8.24]], null, null, null, [["hum", 41.1], ["music", 25.36], ["throbbing", 6.38]], null, [["music", 73.66], ["ambient music", 6.29], ["synthesizer", 4.6]], [["music", 62.33], ["singing bowl", 3.45], ["ambient music", 3.13]], null, [["music", 50.09], ["theremin", 16.36], ["musical instrument", 3.58]]], "duration": [2.45, 15.87, 0.79, 1.99, 1.25, 1.09, 3.74, 0.42, 3.88, 0.51, 5.31, 8.17, 13.12, 1.16, 0.52, 3.65, 2.96, 18.8, 1.41, 4.49, 2.25, 1.29, 1.23, 0.07, 2.22, 0.6, 7.75, 3.42, 0.58, 2.86]} \ No newline at end of file diff --git a/annotations_1/qIalODmFrZk_filtered.json b/annotations_1/qIalODmFrZk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23456326960c6fbf43ac86964edef763ff5448b2 --- /dev/null +++ b/annotations_1/qIalODmFrZk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.51], [12.0, 20.06], [28.0, 28.05], [37.0, 37.22], [40.0, 41.01], [46.0, 47.68], [53.0, 53.28], [61.0, 61.37], [67.0, 70.09], [76.0, 82.61], [92.0, 92.31], [93.0, 94.32], [95.0, 96.7], [110.0, 114.4], [128.0, 128.83], [136.0, 136.49], [139.0, 144.04], [150.0, 157.77], [158.0, 159.56], [165.0, 172.96], [181.0, 182.19], [185.0, 186.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.05, 42.15, 0.0, 0.0, 0.0, 31.0, 0.0, 0.0, 36.08, 36.27, 0.0, 37.17, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 63.53], ["door", 10.11], ["throbbing", 6.08]], null, null, null, null, null, null, [["music", 61.68], ["throbbing", 11.64], ["hum", 8.36]], [["music", 37.87], ["throbbing", 24.8], ["speech", 8.25]], null, null, null, [["music", 43.42], ["speech", 12.76], ["fusillade", 5.97]], null, null, [["music", 29.7], ["shuffling cards", 29.07], ["speech", 15.24]], [["music", 49.91], ["speech", 29.26], ["synthesizer", 3.57]], null, [["music", 68.35], ["chink, clink", 7.55], ["glass", 5.65]], null, null], "duration": [1.51, 8.06, 0.05, 0.22, 1.01, 1.68, 0.28, 0.37, 3.09, 6.61, 0.31, 1.32, 1.7, 4.4, 0.83, 0.49, 5.04, 7.77, 1.56, 7.96, 1.19, 1.11]} \ No newline at end of file diff --git a/annotations_1/qIs2PMXvAmQ_filtered.json b/annotations_1/qIs2PMXvAmQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f007e1ec6bf553bca64f78bcd2c9ddc1b24cf56 --- /dev/null +++ b/annotations_1/qIs2PMXvAmQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.56], [6.0, 6.61], [7.0, 6.81], [7.0, 6.94], [7.0, 8.04], [13.0, 13.76], [19.0, 23.43], [23.0, 23.5], [24.0, 23.73], [24.0, 23.79], [24.0, 23.82], [26.0, 25.74], [28.0, 27.77], [42.0, 43.29], [44.0, 44.71], [46.0, 54.94], [57.0, 57.47], [61.0, 65.18], [66.0, 81.33], [88.0, 93.36], [96.0, 114.49], [118.0, 120.72], [122.0, 123.08], [128.0, 133.12]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.26, 0.0, 30.84, 31.36, 30.94, 31.16, 32.25, 0.0, 31.32], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 44.15], ["speech", 23.65], ["vehicle", 2.09]], null, null, null, null, null, null, null, null, [["music", 69.89], ["synthesizer", 3.37], ["throbbing", 2.45]], null, [["music", 54.92], ["electronic music", 4.55], ["boing", 4.15]], [["speech", 27.07], ["music", 23.96], ["hum", 20.29]], [["music", 46.49], ["speech", 11.78], ["cacophony", 7.78]], [["music", 23.76], ["speech", 23.08], ["buzz", 6.37]], [["music", 34.69], ["speech", 14.1], ["mains hum", 8.26]], null, [["music", 22.53], ["speech", 13.29], ["vehicle", 7.87]]], "duration": [0.56, 0.61, -0.19, -0.06, 1.04, 0.76, 4.43, 0.5, -0.27, -0.21, -0.18, -0.26, -0.23, 1.29, 0.71, 8.94, 0.47, 4.18, 15.33, 5.36, 18.49, 2.72, 1.08, 5.12]} \ No newline at end of file diff --git a/annotations_1/qItvl5cX4-A_filtered.json b/annotations_1/qItvl5cX4-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dd728891c42f4334b75e0c9537f73874508e852 --- /dev/null +++ b/annotations_1/qItvl5cX4-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.39], [7.0, 8.41], [11.0, 19.18], [21.0, 21.86], [23.0, 26.35], [28.0, 31.28], [32.0, 33.76], [36.0, 37.47], [38.0, 39.8], [45.0, 45.39], [50.0, 55.12], [57.0, 57.87], [60.0, 63.48], [67.0, 68.1], [75.0, 76.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 71.0, 0.0, 65.09, 68.8, 0.0, 0.0, 0.0, 0.0, 66.27, 0.0, 64.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 1.41, 8.18, 0.86, 3.35, 3.28, 1.76, 1.47, 1.8, 0.39, 5.12, 0.87, 3.48, 1.1, 1.2]} \ No newline at end of file diff --git a/annotations_1/qJznSue3tEs_filtered.json b/annotations_1/qJznSue3tEs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ebd5b362adc804ffabcaac5d28c3e0d473fae39 --- /dev/null +++ b/annotations_1/qJznSue3tEs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.62], [3.0, 5.58], [7.0, 9.76], [11.0, 13.54], [17.0, 18.99], [20.0, 21.34], [22.0, 23.3], [24.0, 26.69], [27.0, 30.3], [32.0, 31.95], [33.0, 35.78], [37.0, 43.34], [45.0, 47.73], [51.0, 53.94], [57.0, 59.46], [61.0, 65.16], [66.0, 67.17], [68.0, 69.2], [69.0, 69.53], [70.0, 75.25], [76.0, 78.49], [79.0, 87.71], [89.0, 91.23], [92.0, 102.44], [106.0, 108.72], [110.0, 116.5], [118.0, 122.12], [124.0, 126.86], [128.0, 130.06], [131.0, 132.26], [135.0, 148.17], [152.0, 156.27], [157.0, 161.45], [165.0, 167.02], [168.0, 169.67], [171.0, 173.35]], "keep_status": [false, true, true, true, false, false, false, true, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.44, 35.1, 33.78, 0.0, 0.0, 0.0, 35.07, 35.75, 0.0, 35.88, 37.2, 35.0, 59.77, 100.0, 66.76, 0.0, 0.0, 0.0, 62.58, 66.03, 91.98, 70.86, 94.81, 100.0, 100.0, 98.99, 99.73, 97.33, 0.0, 77.2, 80.29, 99.65, 91.47, 0.0, 99.73], "audiomae_on_audioset": [null, [["music", 44.36], ["hum", 8.51], ["throbbing", 6.21]], [["music", 34.77], ["hum", 17.66], ["throbbing", 8.7]], [["music", 36.64], ["didgeridoo", 14.94], ["speech", 8.69]], null, null, null, [["music", 24.52], ["speech", 16.43], ["synthesizer", 11.47]], [["hum", 26.52], ["music", 21.65], ["throbbing", 19.05]], null, [["music", 54.34], ["electronic music", 9.13], ["ambient music", 6.85]], [["music", 32.6], ["ambient music", 9.89], ["speech", 9.6]], [["music", 29.76], ["hum", 27.58], ["mains hum", 9.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.38, 2.58, 2.76, 2.54, 1.99, 1.34, 1.3, 2.69, 3.3, -0.05, 2.78, 6.34, 2.73, 2.94, 2.46, 4.16, 1.17, 1.2, 0.53, 5.25, 2.49, 8.71, 2.23, 10.44, 2.72, 6.5, 4.12, 2.86, 2.06, 1.26, 13.17, 4.27, 4.45, 2.02, 1.67, 2.35]} \ No newline at end of file diff --git a/annotations_1/qL5_xmtFVDo_filtered.json b/annotations_1/qL5_xmtFVDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcbdf0820c53b11801c7c957c429cac2ef3c5c77 --- /dev/null +++ b/annotations_1/qL5_xmtFVDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.95], [5.0, 5.53], [7.0, 8.7], [23.0, 23.87], [34.0, 34.75], [46.0, 46.21], [47.0, 48.57], [56.0, 60.1], [66.0, 67.12], [72.0, 72.2], [78.0, 78.26], [102.0, 101.7], [104.0, 104.3], [112.0, 112.11], [127.0, 127.99], [139.0, 139.19], [140.0, 140.31], [141.0, 140.9], [141.0, 141.03], [157.0, 157.81], [158.0, 158.38], [164.0, 164.02], [165.0, 165.99], [176.0, 177.42], [184.0, 184.05], [193.0, 193.36], [202.0, 201.7], [206.0, 206.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["whale vocalization", 96.87], ["stomach rumble", 0.36], ["liquid", 0.35]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.05, 0.53, 1.7, 0.87, 0.75, 0.21, 1.57, 4.1, 1.12, 0.2, 0.26, -0.3, 0.3, 0.11, 0.99, 0.19, 0.31, -0.1, 0.03, 0.81, 0.38, 0.02, 0.99, 1.42, 0.05, 0.36, -0.3, 0.22]} \ No newline at end of file diff --git a/annotations_1/qLCy66eZrQs_filtered.json b/annotations_1/qLCy66eZrQs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e823c94379300b751b325183678842fc1d6d02f --- /dev/null +++ b/annotations_1/qLCy66eZrQs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [5.0, 6.37], [9.0, 34.45], [38.0, 38.35], [44.0, 45.82], [47.0, 48.2], [53.0, 55.68], [59.0, 59.88], [62.0, 64.25], [67.0, 67.31], [68.0, 69.04], [71.0, 71.74], [77.0, 81.06], [83.0, 84.13], [87.0, 88.16], [90.0, 91.08], [92.0, 95.23], [98.0, 99.08]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 37.09, 0.0, 0.0, 0.0, 87.92, 0.0, 96.04, 0.0, 0.0, 0.0, 71.14, 0.0, 0.0, 0.0, 62.07, 0.0], "audiomae_on_audioset": [null, null, [["music", 26.71], ["musical instrument", 11.07], ["speech", 9.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 1.37, 25.45, 0.35, 1.82, 1.2, 2.68, 0.88, 2.25, 0.31, 1.04, 0.74, 4.06, 1.13, 1.16, 1.08, 3.23, 1.08]} \ No newline at end of file diff --git a/annotations_1/qLFrdv2R8ng_filtered.json b/annotations_1/qLFrdv2R8ng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2120f34919e03ce354156c00b476adf61f456d --- /dev/null +++ b/annotations_1/qLFrdv2R8ng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.75], [16.0, 19.53], [21.0, 22.94], [23.0, 25.05], [26.0, 26.87], [27.0, 28.86], [29.0, 32.64], [34.0, 34.33], [35.0, 39.8], [55.0, 55.44], [62.0, 64.15], [85.0, 85.89], [91.0, 92.53], [100.0, 101.58], [106.0, 106.34], [107.0, 109.16], [110.0, 122.34], [123.0, 124.11], [125.0, 126.71]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 61.57, 0.0, 67.38, 0.0, 0.0, 82.79, 0.0, 36.56, 0.0, 49.04, 0.0, 0.0, 0.0, 0.0, 100.0, 46.57, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 16.11], ["livestock, farm animals, working animals", 9.2], ["cattle, bovinae", 9.01]], null, [["fly, housefly", 32.49], ["sidetone", 29.3], ["insect", 22.03]], null, null, null, null, null, [["whoop", 15.64], ["speech", 11.33], ["crowd", 8.3]], null, null], "duration": [0.75, 3.53, 1.94, 2.05, 0.87, 1.86, 3.64, 0.33, 4.8, 0.44, 2.15, 0.89, 1.53, 1.58, 0.34, 2.16, 12.34, 1.11, 1.71]} \ No newline at end of file diff --git a/annotations_1/qLoufJLKN6Q_filtered.json b/annotations_1/qLoufJLKN6Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a98206dc19e313b223b3d2086def3d5e6d402b53 --- /dev/null +++ b/annotations_1/qLoufJLKN6Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.48], [4.0, 4.95], [6.0, 6.02], [8.0, 30.13], [31.0, 32.39], [34.0, 36.22], [38.0, 39.39], [40.0, 42.67], [48.0, 48.71], [49.0, 50.3], [51.0, 52.39], [57.0, 57.45], [58.0, 58.48], [59.0, 61.55], [66.0, 67.91], [70.0, 69.69], [71.0, 73.75], [75.0, 77.65], [78.0, 79.03], [80.0, 81.89], [85.0, 84.7], [86.0, 87.3], [94.0, 94.8], [104.0, 105.36], [106.0, 106.79], [107.0, 108.46], [111.0, 111.28], [112.0, 113.16], [114.0, 115.37], [116.0, 130.76], [132.0, 133.54], [134.0, 134.55], [135.0, 148.49], [150.0, 152.25], [154.0, 154.97], [156.0, 156.88], [158.0, 160.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 30.65, 0.0, 38.09, 0.0, 42.15, 0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 0.0, 0.0, 50.91, 29.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.43, 0.0, 0.0, 29.6, 33.76, 0.0, 0.0, 35.18], "audiomae_on_audioset": [null, null, null, [["music", 45.35], ["speech", 27.55], ["hum", 7.14]], null, [["music", 52.55], ["hum", 13.76], ["throbbing", 4.12]], null, [["speech", 31.7], ["music", 30.39], ["hum", 8.61]], null, null, null, null, null, [["music", 48.14], ["didgeridoo", 9.46], ["musical instrument", 8.25]], null, null, null, [["mains hum", 26.94], ["music", 20.98], ["hum", 20.18]], null, null, null, null, null, null, null, null, null, null, null, [["hum", 47.56], ["throbbing", 29.01], ["mains hum", 9.68]], null, null, [["music", 53.57], ["electronic music", 5.37], ["hum", 5.21]], [["speech", 58.67], ["rumble", 23.3], ["music", 8.63]], null, null, [["music", 20.58], ["throbbing", 10.29], ["hum", 7.18]]], "duration": [0.48, 0.95, 0.02, 22.13, 1.39, 2.22, 1.39, 2.67, 0.71, 1.3, 1.39, 0.45, 0.48, 2.55, 1.91, -0.31, 2.75, 2.65, 1.03, 1.89, -0.3, 1.3, 0.8, 1.36, 0.79, 1.46, 0.28, 1.16, 1.37, 14.76, 1.54, 0.55, 13.49, 2.25, 0.97, 0.88, 2.07]} \ No newline at end of file diff --git a/annotations_1/qMaZAi73HDo_filtered.json b/annotations_1/qMaZAi73HDo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42c1adf22b5309154e462621788d6fec88e72c93 --- /dev/null +++ b/annotations_1/qMaZAi73HDo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.94], [13.0, 16.68], [18.0, 19.47], [24.0, 23.68], [26.0, 26.33], [30.0, 30.2], [34.0, 33.78], [88.0, 88.16], [91.0, 91.1], [92.0, 99.81], [103.0, 104.08], [105.0, 105.31], [115.0, 115.82]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 39.08], ["foghorn", 12.1], ["theremin", 10.89]], null, null, null, null, null, null, null, [["music", 62.72], ["musical instrument", 4.91], ["sidetone", 3.34]], null, null, null], "duration": [0.94, 3.68, 1.47, -0.32, 0.33, 0.2, -0.22, 0.16, 0.1, 7.81, 1.08, 0.31, 0.82]} \ No newline at end of file diff --git a/annotations_1/qN_sGdVG0Yw_filtered.json b/annotations_1/qN_sGdVG0Yw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e8f4aff076cdd33b202e586bb28728ba51d5011 --- /dev/null +++ b/annotations_1/qN_sGdVG0Yw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.9], [24.0, 25.78], [30.0, 30.86], [33.0, 33.51], [34.0, 60.44], [61.0, 60.57], [62.0, 65.77], [66.0, 66.34], [75.0, 90.02], [92.0, 92.4], [94.0, 96.48], [97.0, 97.16], [99.0, 99.32], [106.0, 108.43], [112.0, 117.91], [118.0, 117.95], [120.0, 121.71], [123.0, 123.4], [127.0, 127.43], [133.0, 133.64]], "keep_status": [true, false, false, false, false, false, true, false, true, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [32.62, 0.0, 0.0, 0.0, 30.75, 0.0, 37.06, 0.0, 31.28, 0.0, 47.31, 0.0, 0.0, 30.31, 40.95, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 44.56], ["speech", 11.2], ["sidetone", 7.1]], null, null, null, [["tuning fork", 49.96], ["music", 24.07], ["breaking", 6.66]], null, [["hum", 14.71], ["fly, housefly", 12.66], ["throbbing", 11.81]], null, [["music", 41.42], ["noise", 10.97], ["hum", 8.81]], null, [["hum", 19.98], ["music", 17.82], ["mains hum", 16.06]], null, null, [["vehicle", 17.85], ["motorcycle", 12.49], ["speech", 10.3]], [["speech", 70.29], ["music", 2.56], ["eruption", 2.46]], null, null, null, null, null], "duration": [3.9, 1.78, 0.86, 0.51, 26.44, -0.43, 3.77, 0.34, 15.02, 0.4, 2.48, 0.16, 0.32, 2.43, 5.91, -0.05, 1.71, 0.4, 0.43, 0.64]} \ No newline at end of file diff --git a/annotations_1/qOeZ9TL0wHs_filtered.json b/annotations_1/qOeZ9TL0wHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eeba59d19251fe3fb45993930295e1e37c58272f --- /dev/null +++ b/annotations_1/qOeZ9TL0wHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.51], [22.0, 25.14], [33.0, 35.87], [39.0, 40.19], [52.0, 54.11], [69.0, 69.21], [82.0, 83.27], [97.0, 103.77], [107.0, 107.49], [110.0, 111.81]], "keep_status": [true, true, true, false, false, false, false, false, false, false], "silence_prob": [42.0, 46.79, 40.71, 0.0, 32.88, 0.0, 0.0, 33.38, 0.0, 0.0], "audiomae_on_audioset": [[["music", 26.3], ["didgeridoo", 20.6], ["fly, housefly", 10.73]], [["music", 51.69], ["theremin", 8.38], ["musical instrument", 3.5]], [["music", 28.05], ["speech", 13.26], ["foghorn", 5.69]], null, [["cattle, bovinae", 41.06], ["moo", 39.08], ["livestock, farm animals, working animals", 19.18]], null, null, [["foghorn", 38.04], ["music", 35.35], ["echo", 3.41]], null, null], "duration": [4.51, 3.14, 2.87, 1.19, 2.11, 0.21, 1.27, 6.77, 0.49, 1.81]} \ No newline at end of file diff --git a/annotations_1/qPkKjKAyJ8I_filtered.json b/annotations_1/qPkKjKAyJ8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a525f939f6dc93b19bcecc29a61624a154e0289 --- /dev/null +++ b/annotations_1/qPkKjKAyJ8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.14], [24.0, 25.27], [26.0, 38.74], [39.0, 39.48], [40.0, 41.13], [42.0, 42.84], [46.0, 46.97], [47.0, 59.41], [64.0, 99.64], [104.0, 108.18], [109.0, 128.9], [130.0, 131.94], [138.0, 144.19], [146.0, 152.29]], "keep_status": [false, false, true, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 31.51, 0.0, 0.0, 0.0, 0.0, 37.17, 0.0, 33.69, 31.65, 0.0, 30.65, 31.72], "audiomae_on_audioset": [null, null, [["music", 47.45], ["buzz", 7.71], ["fly, housefly", 7.04]], null, null, null, null, [["speech", 44.82], ["music", 31.55], ["throbbing", 3.85]], null, [["music", 70.76], ["hum", 6.41], ["electronic music", 4.76]], [["music", 44.55], ["noise", 6.58], ["hum", 6.34]], null, [["music", 24.29], ["mains hum", 19.51], ["hum", 18.63]], [["music", 74.14], ["throbbing", 3.51], ["hum", 3.37]]], "duration": [1.14, 1.27, 12.74, 0.48, 1.13, 0.84, 0.97, 12.41, 35.64, 4.18, 19.9, 1.94, 6.19, 6.29]} \ No newline at end of file diff --git a/annotations_1/qR9MgJkOFJ0_filtered.json b/annotations_1/qR9MgJkOFJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eadbfffb010423d646f76cbcc744b806a015ea9b --- /dev/null +++ b/annotations_1/qR9MgJkOFJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [11.0, 12.09], [18.0, 18.74], [20.0, 21.98], [23.0, 26.11], [29.0, 31.26], [33.0, 33.22], [34.0, 35.53], [36.0, 41.18], [47.0, 47.95], [51.0, 51.04], [54.0, 56.1], [57.0, 61.53], [62.0, 67.09], [70.0, 71.34], [72.0, 78.31], [80.0, 80.6], [83.0, 87.79], [89.0, 97.34], [98.0, 104.65], [106.0, 106.81], [112.0, 111.67], [114.0, 115.33], [116.0, 117.78], [119.0, 125.95], [127.0, 137.84], [143.0, 148.73], [151.0, 154.65], [157.0, 158.58], [160.0, 162.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.96, 99.8, 0.0, 0.0, 99.96, 0.0, 0.0, 99.91, 99.91, 99.98, 0.0, 99.85, 0.0, 100.0, 100.0, 99.98, 0.0, 0.0, 0.0, 0.0, 100.0, 94.37, 84.43, 89.72, 0.0, 73.06], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.81, 1.09, 0.74, 1.98, 3.11, 2.26, 0.22, 1.53, 5.18, 0.95, 0.04, 2.1, 4.53, 5.09, 1.34, 6.31, 0.6, 4.79, 8.34, 6.65, 0.81, -0.33, 1.33, 1.78, 6.95, 10.84, 5.73, 3.65, 1.58, 2.13]} \ No newline at end of file diff --git a/annotations_1/qRQu4tZF1GA_filtered.json b/annotations_1/qRQu4tZF1GA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edeb12bd3eca077282b89e2b84c90aad1a8db517 --- /dev/null +++ b/annotations_1/qRQu4tZF1GA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.82], [16.0, 16.68], [21.0, 21.29], [22.0, 28.19], [34.0, 34.65], [38.0, 38.4], [39.0, 53.81], [57.0, 59.85], [61.0, 63.26], [68.0, 74.7], [80.0, 90.19], [91.0, 91.49], [92.0, 95.54], [103.0, 116.78], [119.0, 119.52], [132.0, 134.69], [136.0, 136.49], [141.0, 141.51]], "keep_status": [false, false, false, true, false, false, false, true, true, true, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 43.2, 0.0, 0.0, 29.94, 30.26, 32.97, 36.61, 30.8, 0.0, 35.84, 29.26, 0.0, 52.68, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 45.13], ["speech", 15.77], ["didgeridoo", 7.15]], null, null, [["throbbing", 46.87], ["music", 35.96], ["hum", 9.43]], [["music", 49.37], ["hum", 10.05], ["throbbing", 8.36]], [["music", 33.75], ["hum", 12.38], ["speech", 6.36]], [["music", 42.61], ["throbbing", 14.26], ["speech", 9.93]], [["speech", 35.04], ["music", 29.04], ["outside, rural or natural", 3.78]], null, [["music", 41.31], ["speech", 27.48], ["throbbing", 6.26]], [["music", 45.17], ["throbbing", 8.03], ["hum", 5.73]], null, null, null, null], "duration": [-0.18, 0.68, 0.29, 6.19, 0.65, 0.4, 14.81, 2.85, 2.26, 6.7, 10.19, 0.49, 3.54, 13.78, 0.52, 2.69, 0.49, 0.51]} \ No newline at end of file diff --git a/annotations_1/qSd4Q3GY7dc_filtered.json b/annotations_1/qSd4Q3GY7dc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf7fd7d148bd2cb53a28bd4a5502e0f53e85c14d --- /dev/null +++ b/annotations_1/qSd4Q3GY7dc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.16], [8.0, 8.23], [11.0, 11.72], [13.0, 13.42], [18.0, 17.76], [20.0, 20.48], [20.0, 20.51], [21.0, 21.86], [32.0, 33.35], [34.0, 34.15], [42.0, 44.51], [51.0, 51.71], [54.0, 53.92], [59.0, 59.31], [62.0, 64.64], [77.0, 82.39], [87.0, 87.99], [90.0, 90.96], [93.0, 97.75], [115.0, 114.64], [116.0, 117.78], [122.0, 122.61], [138.0, 139.08], [144.0, 144.22], [145.0, 147.31], [148.0, 151.26], [164.0, 164.05], [166.0, 165.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37, 0.0, 0.0, 0.0, 97.54, 99.59, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 0.0, 0.0, 50.11, 64.29, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 0.23, 0.72, 0.42, -0.24, 0.48, 0.51, 0.86, 1.35, 0.15, 2.51, 0.71, -0.08, 0.31, 2.64, 5.39, 0.99, 0.96, 4.75, -0.36, 1.78, 0.61, 1.08, 0.22, 2.31, 3.26, 0.05, -0.09]} \ No newline at end of file diff --git a/annotations_1/qTey0qxMboA_filtered.json b/annotations_1/qTey0qxMboA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bac3ba45ec362d58e7dd47e888fcd99eafe5fa2 --- /dev/null +++ b/annotations_1/qTey0qxMboA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[109.0, 134.32]], "keep_status": [true], "silence_prob": [33.69], "audiomae_on_audioset": [[["speech", 33.31], ["music", 18.75], ["sonar", 9.54]]], "duration": [25.32]} \ No newline at end of file diff --git a/annotations_1/qTj4aSPwTBk_filtered.json b/annotations_1/qTj4aSPwTBk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..329be6f1d4680ae41cdedaad63b4484d85ab4089 --- /dev/null +++ b/annotations_1/qTj4aSPwTBk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 75.74], [76.0, 79.49], [80.0, 81.09], [87.0, 126.28], [130.0, 130.79], [138.0, 149.22], [152.0, 157.37], [164.0, 164.61]], "keep_status": [false, true, false, false, false, false, false, false], "silence_prob": [0.0, 40.97, 0.0, 0.0, 0.0, 42.08, 36.74, 0.0], "audiomae_on_audioset": [null, [["music", 23.56], ["speech", 19.7], ["fly, housefly", 6.83]], null, null, null, [["music", 54.55], ["speech", 22.19], ["sidetone", 5.29]], [["speech", 33.72], ["music", 26.18], ["boing", 22.63]], null], "duration": [40.74, 3.49, 1.09, 39.28, 0.79, 11.22, 5.37, 0.61]} \ No newline at end of file diff --git a/annotations_1/qULQCbfqJm8_filtered.json b/annotations_1/qULQCbfqJm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08505f0292cf0bfc383813c3d059560b51409a36 --- /dev/null +++ b/annotations_1/qULQCbfqJm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.92], [11.0, 12.24], [16.0, 17.15], [20.0, 24.17], [44.0, 45.59], [60.0, 61.1], [66.0, 65.97], [92.0, 93.55], [97.0, 97.66], [99.0, 100.53], [108.0, 112.51], [118.0, 118.45], [145.0, 148.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.23, 0.0, 37.26], "audiomae_on_audioset": [null, null, null, [["music", 76.29], ["musical instrument", 5.81], ["synthesizer", 5.4]], null, null, null, null, null, null, [["music", 68.37], ["synthesizer", 3.24], ["theremin", 2.97]], null, [["music", 65.62], ["speech", 6.51], ["flute", 2.75]]], "duration": [-0.08, 1.24, 1.15, 4.17, 1.59, 1.1, -0.03, 1.55, 0.66, 1.53, 4.51, 0.45, 3.42]} \ No newline at end of file diff --git a/annotations_1/qULlmr4lxb0_filtered.json b/annotations_1/qULlmr4lxb0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d3f48f20ae69c840bccff7e5df841844287d984 --- /dev/null +++ b/annotations_1/qULlmr4lxb0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.69], [10.0, 13.31], [13.0, 13.59], [22.0, 23.01], [28.0, 28.51], [34.0, 36.93], [38.0, 37.79], [39.0, 40.22], [43.0, 43.55], [46.0, 48.24], [60.0, 60.89], [66.0, 66.29], [66.0, 67.64], [77.0, 80.91], [82.0, 85.45], [91.0, 94.64], [98.0, 97.82], [101.0, 100.99], [102.0, 109.65], [110.0, 110.59]], "keep_status": [false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 38.03, 0.0, 0.0, 0.0, 39.31, 0.0, 0.0, 0.0, 34.7, 0.0, 0.0, 0.0, 30.81, 32.4, 33.72, 0.0, 0.0, 32.17, 0.0], "audiomae_on_audioset": [null, [["speech", 53.81], ["music", 19.98], ["sidetone", 12.63]], null, null, null, [["speech", 29.9], ["music", 26.22], ["television", 7.28]], null, null, null, [["speech", 30.51], ["music", 19.18], ["sidetone", 6.1]], null, null, null, [["speech", 56.69], ["music", 11.14], ["noise", 4.82]], [["speech", 71.34], ["mains hum", 5.69], ["music", 3.55]], [["speech", 34.07], ["music", 28.35], ["fart", 2.57]], null, null, [["hum", 35.79], ["mains hum", 21.36], ["throbbing", 16.81]], null], "duration": [0.69, 3.31, 0.59, 1.01, 0.51, 2.93, -0.21, 1.22, 0.55, 2.24, 0.89, 0.29, 1.64, 3.91, 3.45, 3.64, -0.18, -0.01, 7.65, 0.59]} \ No newline at end of file diff --git a/annotations_1/qUammhHxd1k_filtered.json b/annotations_1/qUammhHxd1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e8b97fb81d721cbb8a7442ef05ecb1339ae8174 --- /dev/null +++ b/annotations_1/qUammhHxd1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [6.0, 9.69], [12.0, 12.43], [13.0, 13.68], [20.0, 19.82], [28.0, 30.4], [33.0, 33.54], [34.0, 34.89], [37.0, 37.66], [41.0, 45.79], [46.0, 48.63], [49.0, 50.53], [52.0, 63.91], [65.0, 64.94], [66.0, 71.02], [72.0, 82.65], [84.0, 88.5], [91.0, 94.83], [96.0, 126.89], [127.0, 126.98], [130.0, 203.32], [210.0, 212.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.99, 0.0, 0.0, 0.0, 86.27, 0.0, 0.0, 0.0, 83.34, 36.67, 0.0, 30.87, 0.0, 30.21, 29.79, 30.0, 30.47, 0.0, 0.0, 0.0, 30.7], "audiomae_on_audioset": [null, [["speech", 67.7], ["caw", 3.65], ["sine wave", 2.28]], null, null, null, null, null, null, null, null, [["music", 66.07], ["speech", 12.89], ["electronic music", 4.47]], null, [["music", 79.1], ["drum machine", 4.1], ["sampler", 3.81]], null, [["music", 71.58], ["sampler", 4.54], ["synthesizer", 3.31]], [["music", 82.37], ["sampler", 2.1], ["electronic music", 2.03]], [["music", 81.24], ["speech", 1.58], ["house music", 1.52]], [["music", 76.81], ["speech", 8.5], ["electronic music", 2.2]], null, null, null, [["music", 71.32], ["house music", 2.51], ["dance music", 1.94]]], "duration": [1.14, 3.69, 0.43, 0.68, -0.18, 2.4, 0.54, 0.89, 0.66, 4.79, 2.63, 1.53, 11.91, -0.06, 5.02, 10.65, 4.5, 3.83, 30.89, -0.02, 73.32, 2.53]} \ No newline at end of file diff --git a/annotations_1/qVDMu-erGtc_filtered.json b/annotations_1/qVDMu-erGtc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ea346063ed788fa97ae868569ea13cdd8c1ba683 --- /dev/null +++ b/annotations_1/qVDMu-erGtc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 29.0], [32.0, 32.12], [38.0, 38.5], [41.0, 41.72], [48.0, 48.22], [49.0, 58.56], [64.0, 75.51], [80.0, 88.6], [90.0, 90.37], [92.0, 94.05], [97.0, 132.56], [134.0, 166.83], [170.0, 177.5], [179.0, 179.98], [181.0, 181.58], [183.0, 183.71], [184.0, 188.15], [189.0, 194.09], [198.0, 199.45], [200.0, 210.19], [213.0, 223.91]], "keep_status": [false, false, false, false, false, true, true, true, false, true, false, false, false, false, false, false, true, true, false, false, true], "silence_prob": [35.44, 0.0, 0.0, 0.0, 0.0, 29.12, 29.14, 29.48, 0.0, 29.86, 0.0, 0.0, 29.27, 0.0, 0.0, 0.0, 31.87, 29.57, 0.0, 29.59, 30.36], "audiomae_on_audioset": [[["music", 45.3], ["throbbing", 30.1], ["hum", 11.46]], null, null, null, null, [["music", 41.49], ["throbbing", 15.92], ["hum", 7.01]], [["music", 36.49], ["hum", 17.07], ["mains hum", 9.86]], [["music", 22.69], ["speech", 20.29], ["hum", 12.17]], null, [["music", 43.07], ["hum", 8.68], ["electronic music", 7.68]], null, null, [["machine gun", 40.5], ["music", 30.31], ["gunshot, gunfire", 6.14]], null, null, null, [["speech", 38.18], ["music", 19.42], ["hum", 6.23]], [["music", 16.91], ["speech", 11.48], ["mains hum", 11.34]], null, [["throbbing", 31.54], ["music", 31.01], ["hum", 13.63]], [["music", 26.78], ["siren", 7.51], ["vehicle", 6.71]]], "duration": [8.0, 0.12, 0.5, 0.72, 0.22, 9.56, 11.51, 8.6, 0.37, 2.05, 35.56, 32.83, 7.5, 0.98, 0.58, 0.71, 4.15, 5.09, 1.45, 10.19, 10.91]} \ No newline at end of file diff --git a/annotations_1/qWiGcXSaKUc_filtered.json b/annotations_1/qWiGcXSaKUc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0517a789bcea190c43348dc6445ed284d438d0eb --- /dev/null +++ b/annotations_1/qWiGcXSaKUc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.31], [7.0, 9.75], [11.0, 12.65], [14.0, 19.28], [22.0, 22.99], [26.0, 27.13], [29.0, 30.4], [32.0, 34.16], [39.0, 42.28], [44.0, 45.98], [47.0, 48.24], [50.0, 51.19], [55.0, 55.54], [61.0, 64.61], [67.0, 69.94], [70.0, 71.81], [73.0, 78.27], [80.0, 79.83], [87.0, 92.31], [98.0, 98.93], [118.0, 119.11], [128.0, 128.55], [137.0, 137.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [100.0, 100.0, 0.0, 97.73, 0.0, 0.0, 0.0, 99.44, 100.0, 0.0, 0.0, 0.0, 0.0, 99.98, 97.92, 0.0, 68.41, 0.0, 29.74, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.93], ["hum", 5.29], ["fly, housefly", 4.94]], null, null, null, null], "duration": [2.31, 2.75, 1.65, 5.28, 0.99, 1.13, 1.4, 2.16, 3.28, 1.98, 1.24, 1.19, 0.54, 3.61, 2.94, 1.81, 5.27, -0.17, 5.31, 0.93, 1.11, 0.55, 0.15]} \ No newline at end of file diff --git a/annotations_1/qXKeIDlP-ys_filtered.json b/annotations_1/qXKeIDlP-ys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1f5b18ba1b8b4f9bce5c0cc784d66e316a77455 --- /dev/null +++ b/annotations_1/qXKeIDlP-ys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 20.56], [22.0, 22.01], [22.0, 29.71], [31.0, 36.12], [37.0, 36.95], [37.0, 50.6], [52.0, 58.95], [64.0, 67.47], [69.0, 70.23], [72.0, 72.72], [73.0, 75.78], [78.0, 78.98], [80.0, 80.28], [81.0, 94.74], [97.0, 97.88], [100.0, 103.65], [105.0, 105.58], [107.0, 108.85], [109.0, 110.67], [111.0, 161.52]], "keep_status": [true, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.94, 0.0, 43.66, 34.95, 0.0, 43.15, 41.95, 39.44, 0.0, 0.0, 56.93, 0.0, 0.0, 33.5, 0.0, 53.04, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.5], ["groan", 10.58], ["throbbing", 5.04]], null, [["didgeridoo", 38.53], ["music", 30.16], ["fart", 9.64]], [["music", 22.67], ["fly, housefly", 13.05], ["throbbing", 10.5]], null, [["music", 59.07], ["throbbing", 12.65], ["hum", 7.24]], [["mosquito", 37.99], ["fly, housefly", 19.93], ["insect", 5.68]], [["whale vocalization", 42.91], ["music", 10.65], ["mosquito", 9.61]], null, null, null, null, null, [["hum", 43.84], ["throbbing", 25.21], ["music", 13.15]], null, null, null, null, null, null], "duration": [15.56, 0.01, 7.71, 5.12, -0.05, 13.6, 6.95, 3.47, 1.23, 0.72, 2.78, 0.98, 0.28, 13.74, 0.88, 3.65, 0.58, 1.85, 1.67, 50.52]} \ No newline at end of file diff --git a/annotations_1/qY7EPDCU5hc_filtered.json b/annotations_1/qY7EPDCU5hc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7c2be1e4cf562af6913bbfc72225d083c6f01424 --- /dev/null +++ b/annotations_1/qY7EPDCU5hc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.49], [11.0, 12.78], [16.0, 19.33], [24.0, 24.33], [28.0, 36.29], [42.0, 42.74], [58.0, 60.12], [66.0, 66.23], [71.0, 70.98], [83.0, 85.43], [89.0, 89.63], [97.0, 97.17], [98.0, 98.83], [100.0, 103.87], [107.0, 125.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.33, 0.0, 31.57, 0.0, 70.86, 0.0, 0.0, 57.97, 0.0, 0.0, 0.0, 67.63, 30.52], "audiomae_on_audioset": [null, null, [["hum", 37.47], ["throbbing", 23.05], ["heart sounds, heartbeat", 9.7]], null, [["music", 30.42], ["mains hum", 25.72], ["hum", 19.73]], null, null, null, null, null, null, null, null, null, [["music", 78.28], ["didgeridoo", 4.1], ["musical instrument", 3.04]]], "duration": [0.49, 1.78, 3.33, 0.33, 8.29, 0.74, 2.12, 0.23, -0.02, 2.43, 0.63, 0.17, 0.83, 3.87, 18.31]} \ No newline at end of file diff --git a/annotations_1/qYCEXS6Ws_c_filtered.json b/annotations_1/qYCEXS6Ws_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..988681a5f4a9ffc6006bebc5e773c7df73697c36 --- /dev/null +++ b/annotations_1/qYCEXS6Ws_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.52], [17.0, 21.71], [23.0, 32.68], [34.0, 34.77], [36.0, 36.91], [38.0, 54.41], [55.0, 55.75], [57.0, 59.75], [68.0, 70.23], [82.0, 83.84], [86.0, 97.44], [99.0, 101.38], [105.0, 105.83], [114.0, 122.64], [123.0, 124.41], [125.0, 126.1], [126.0, 132.73], [134.0, 135.84], [137.0, 137.56], [142.0, 142.23], [154.0, 154.21], [158.0, 160.05], [161.0, 172.86]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 31.57, 35.14, 0.0, 0.0, 33.87, 0.0, 66.51, 61.97, 0.0, 38.02, 46.97, 0.0, 59.51, 0.0, 0.0, 32.76, 0.0, 0.0, 0.0, 0.0, 99.94, 35.99], "audiomae_on_audioset": [null, [["hum", 9.9], ["music", 9.87], ["speech", 8.16]], [["music", 86.83], ["musical instrument", 2.4], ["guitar", 1.86]], null, null, [["music", 83.58], ["musical instrument", 2.3], ["synthesizer", 2.26]], null, null, null, null, [["music", 74.69], ["electric shaver, electric razor", 8.56], ["buzz", 3.35]], [["animal", 11.53], ["livestock, farm animals, working animals", 10.74], ["speech", 9.39]], null, null, null, null, [["music", 49.14], ["theremin", 31.55], ["foghorn", 4.01]], null, null, null, null, null, [["speech", 14.84], ["crowd", 10.73], ["music", 9.61]]], "duration": [1.52, 4.71, 9.68, 0.77, 0.91, 16.41, 0.75, 2.75, 2.23, 1.84, 11.44, 2.38, 0.83, 8.64, 1.41, 1.1, 6.73, 1.84, 0.56, 0.23, 0.21, 2.05, 11.86]} \ No newline at end of file diff --git a/annotations_1/qYEOmZzqX28_filtered.json b/annotations_1/qYEOmZzqX28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81906d6c6a4808fc9a874c0a109211c3b8bee947 --- /dev/null +++ b/annotations_1/qYEOmZzqX28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.24], [10.0, 11.15], [15.0, 20.44], [21.0, 24.68], [29.0, 30.3], [35.0, 36.05], [54.0, 59.61], [70.0, 70.23], [105.0, 106.0], [106.0, 107.38], [136.0, 137.02], [156.0, 157.72], [161.0, 163.32], [164.0, 177.3], [178.0, 180.79], [182.0, 185.52], [188.0, 188.59], [190.0, 190.58], [196.0, 196.77], [202.0, 211.33]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 33.15, 33.24, 0.0, 0.0, 32.77, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 30.87, 34.89, 36.78, 0.0, 0.0, 0.0, 30.63], "audiomae_on_audioset": [null, null, [["music", 62.25], ["speech", 18.6], ["sidetone", 3.3]], [["music", 48.8], ["hum", 9.63], ["speech", 5.15]], null, null, [["whack, thwack", 63.49], ["speech", 8.65], ["rumble", 3.78]], null, null, null, null, null, null, [["throbbing", 19.71], ["hum", 16.93], ["music", 14.94]], [["throbbing", 34.82], ["hum", 22.21], ["music", 17.47]], [["music", 30.61], ["hum", 23.52], ["mains hum", 8.81]], null, null, null, [["music", 36.22], ["speech", 24.2], ["buzz", 3.25]]], "duration": [1.24, 1.15, 5.44, 3.68, 1.3, 1.05, 5.61, 0.23, 1.0, 1.38, 1.02, 1.72, 2.32, 13.3, 2.79, 3.52, 0.59, 0.58, 0.77, 9.33]} \ No newline at end of file diff --git a/annotations_1/qYZw_tL0j9U_filtered.json b/annotations_1/qYZw_tL0j9U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..faa4b77489c99c916e2436d63e66439c7200c88a --- /dev/null +++ b/annotations_1/qYZw_tL0j9U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.13], [12.0, 13.29], [27.0, 28.17], [30.0, 38.16], [42.0, 53.33], [61.0, 67.44], [73.0, 75.44], [84.0, 84.08], [85.0, 91.34], [96.0, 104.99], [108.0, 108.57], [113.0, 114.17], [114.0, 114.2], [114.0, 122.23], [123.0, 123.48], [127.0, 138.28], [139.0, 145.69], [158.0, 166.77], [168.0, 175.73]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.49, 34.49, 33.36, 33.06, 0.0, 33.74, 34.13, 0.0, 0.0, 0.0, 38.3, 0.0, 39.05, 34.13, 45.62, 68.8], "audiomae_on_audioset": [null, null, null, [["sidetone", 60.91], ["music", 12.27], ["speech", 10.14]], [["music", 54.49], ["speech", 17.8], ["electronic music", 5.52]], [["music", 68.22], ["speech", 9.58], ["electronic music", 5.24]], [["music", 67.35], ["speech", 12.63], ["electronic music", 2.98]], null, [["music", 52.58], ["sidetone", 9.76], ["synthesizer", 7.31]], [["music", 33.54], ["sidetone", 25.57], ["speech", 23.15]], null, null, null, [["music", 64.81], ["house music", 5.88], ["speech", 5.34]], null, [["music", 39.42], ["moo", 11.88], ["cattle, bovinae", 9.28]], [["music", 64.61], ["rattle (instrument)", 8.71], ["musical instrument", 7.85]], [["music", 57.15], ["drum machine", 8.28], ["synthesizer", 5.12]], null], "duration": [1.13, 1.29, 1.17, 8.16, 11.33, 6.44, 2.44, 0.08, 6.34, 8.99, 0.57, 1.17, 0.2, 8.23, 0.48, 11.28, 6.69, 8.77, 7.73]} \ No newline at end of file diff --git a/annotations_1/q_tMagfE-nM_filtered.json b/annotations_1/q_tMagfE-nM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b279448d707e1ed104eaaee0c6d2cf43df2c9489 --- /dev/null +++ b/annotations_1/q_tMagfE-nM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.23], [4.0, 4.58], [5.0, 6.22], [10.0, 12.23], [14.0, 15.28], [19.0, 24.98], [27.0, 28.07], [29.0, 30.87], [33.0, 35.28], [36.0, 39.14], [41.0, 41.99], [44.0, 44.88], [45.0, 49.0], [51.0, 52.93], [54.0, 56.32], [60.0, 62.18], [64.0, 64.67], [68.0, 71.47], [74.0, 74.7], [77.0, 80.03], [83.0, 85.26], [87.0, 88.25], [91.0, 96.47], [100.0, 102.49], [104.0, 105.76], [108.0, 111.05], [113.0, 117.31], [120.0, 122.37], [126.0, 130.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.84, 0.0, 99.1, 0.0, 0.0, 97.11, 99.94, 0.0, 0.0, 95.09, 0.0, 82.25, 99.85, 0.0, 99.99, 0.0, 99.99, 99.71, 0.0, 83.34, 99.98, 0.0, 99.68, 92.64, 100.0, 99.93], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 0.58, 1.22, 2.23, 1.28, 5.98, 1.07, 1.87, 2.28, 3.14, 0.99, 0.88, 4.0, 1.93, 2.32, 2.18, 0.67, 3.47, 0.7, 3.03, 2.26, 1.25, 5.47, 2.49, 1.76, 3.05, 4.31, 2.37, 4.03]} \ No newline at end of file diff --git a/annotations_1/q_u6njqBaB8_filtered.json b/annotations_1/q_u6njqBaB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9cda88c354c8124bed37d5b2ce09c1e1e98087b0 --- /dev/null +++ b/annotations_1/q_u6njqBaB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.04], [34.0, 35.36], [68.0, 68.94], [70.0, 73.58], [74.0, 74.83], [77.0, 77.85], [80.0, 81.75], [92.0, 93.46], [96.0, 96.35], [99.0, 99.33], [101.0, 102.32], [113.0, 125.71], [128.0, 128.04], [130.0, 132.44], [133.0, 134.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 52.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.68, 0.0, 46.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 33.67], ["hum", 10.64], ["music", 9.92]], null, [["speech", 15.2], ["music", 14.9], ["mains hum", 13.02]], null], "duration": [0.04, 1.36, 0.94, 3.58, 0.83, 0.85, 1.75, 1.46, 0.35, 0.33, 1.32, 12.71, 0.04, 2.44, 1.82]} \ No newline at end of file diff --git a/annotations_1/q_v3jNjwHNQ_filtered.json b/annotations_1/q_v3jNjwHNQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53741cc29e8433fdb6864da3b7e7d13e8c83f844 --- /dev/null +++ b/annotations_1/q_v3jNjwHNQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 93.58], [95.0, 141.86], [144.0, 166.75], [167.0, 166.82]], "keep_status": [false, false, false, false], "silence_prob": [34.06, 0.0, 31.38, 0.0], "audiomae_on_audioset": [[["music", 61.85], ["throbbing", 14.66], ["hum", 10.25]], null, [["hum", 36.27], ["music", 28.77], ["mains hum", 14.2]], null], "duration": [18.58, 46.86, 22.75, -0.18]} \ No newline at end of file diff --git a/annotations_1/q_y6O1yflZI_filtered.json b/annotations_1/q_y6O1yflZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2a1df22509cc1aa2b8e6eee23cb667cf110abf9 --- /dev/null +++ b/annotations_1/q_y6O1yflZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[60.0, 61.8], [89.0, 92.72], [117.0, 119.04], [120.0, 121.8], [125.0, 127.28], [128.0, 131.16], [134.0, 134.69], [135.0, 135.41], [138.0, 140.98], [142.0, 142.4], [143.0, 144.49], [148.0, 148.88], [151.0, 155.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 50.71, 98.93, 0.0, 96.42, 99.48, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 3.72, 2.04, 1.8, 2.28, 3.16, 0.69, 0.41, 2.98, 0.4, 1.49, 0.88, 4.33]} \ No newline at end of file diff --git a/annotations_1/qaAz6YklimY_filtered.json b/annotations_1/qaAz6YklimY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1f7d75dabe7b4b09e159fa8be95878777d137d48 --- /dev/null +++ b/annotations_1/qaAz6YklimY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.35], [17.0, 19.45], [20.0, 20.46], [21.0, 23.21], [25.0, 25.74], [28.0, 28.75], [30.0, 34.97]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.35, 2.45, 0.46, 2.21, 0.74, 0.75, 4.97]} \ No newline at end of file diff --git a/annotations_1/qaQQ3LLyKvo_filtered.json b/annotations_1/qaQQ3LLyKvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a375c3b66dad45c21e2f74ee1cb64b599b3ab59e --- /dev/null +++ b/annotations_1/qaQQ3LLyKvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.03], [2.0, 2.07], [2.0, 2.1], [2.0, 2.13], [2.0, 2.17], [2.0, 2.25], [2.0, 2.32], [2.0, 2.49], [3.0, 2.54], [4.0, 4.19], [5.0, 7.69], [8.0, 9.34], [10.0, 15.21], [18.0, 31.95], [33.0, 35.34], [36.0, 39.16], [40.0, 43.28], [44.0, 44.27], [45.0, 45.62], [50.0, 50.53], [52.0, 88.91], [90.0, 95.62], [96.0, 99.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 58.64, 51.55, 63.96, 59.86, 44.49, 0.0, 0.0, 0.0, 0.0, 54.9, 44.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 26.75], ["mains hum", 25.98], ["speech", 8.62]], null, null, null, null, null, [["hum", 27.42], ["theremin", 18.96], ["music", 12.32]]], "duration": [0.03, 0.07, 0.1, 0.13, 0.17, 0.25, 0.32, 0.49, -0.46, 0.19, 2.69, 1.34, 5.21, 13.95, 2.34, 3.16, 3.28, 0.27, 0.62, 0.53, 36.91, 5.62, 3.42]} \ No newline at end of file diff --git a/annotations_1/qabChviGItk_filtered.json b/annotations_1/qabChviGItk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4337d3b83d5b2c0980a107a6c1f25734c206cc1 --- /dev/null +++ b/annotations_1/qabChviGItk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 37.67], [38.0, 53.35], [55.0, 56.05], [59.0, 80.62], [82.0, 93.12], [93.0, 93.82]], "keep_status": [true, false, false, false, false, false], "silence_prob": [30.13, 30.41, 0.0, 30.54, 30.41, 0.0], "audiomae_on_audioset": [[["music", 21.15], ["car", 15.36], ["race car, auto racing", 10.77]], [["throbbing", 38.78], ["music", 31.4], ["hum", 19.37]], null, [["music", 45.8], ["hum", 14.68], ["throbbing", 11.47]], [["music", 56.49], ["smash, crash", 12.36], ["whack, thwack", 8.04]], null], "duration": [11.67, 15.35, 1.05, 21.62, 11.12, 0.82]} \ No newline at end of file diff --git a/annotations_1/qcYPASs4jMQ_filtered.json b/annotations_1/qcYPASs4jMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..907fe2bc31cc7db287545acf390cfe08dba466ed --- /dev/null +++ b/annotations_1/qcYPASs4jMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 21.79], [24.0, 125.14], [128.0, 130.6]], "keep_status": [false, false, true], "silence_prob": [29.67, 0.0, 41.5], "audiomae_on_audioset": [[["eruption", 28.4], ["speech", 28.22], ["explosion", 21.09]], null, [["cattle, bovinae", 10.34], ["whale vocalization", 9.82], ["moo", 9.52]]], "duration": [9.79, 101.14, 2.6]} \ No newline at end of file diff --git a/annotations_1/qcaVM8TcZbA_filtered.json b/annotations_1/qcaVM8TcZbA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0eac198fc08a1828509fa65fa0b5f29192116b1 --- /dev/null +++ b/annotations_1/qcaVM8TcZbA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.89], [15.0, 15.15], [16.0, 16.98], [20.0, 21.1], [23.0, 25.49], [27.0, 29.2], [30.0, 32.98], [34.0, 34.33], [35.0, 36.12], [37.0, 38.3], [41.0, 41.72], [43.0, 45.1], [53.0, 53.22], [58.0, 61.79], [63.0, 63.68], [64.0, 65.67], [68.0, 67.78], [69.0, 70.53], [76.0, 84.47], [92.0, 92.65], [98.0, 99.01], [101.0, 116.02], [119.0, 121.68], [122.0, 124.95], [128.0, 129.54], [133.0, 133.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 90.43, 97.11, 83.7, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 47.66, 0.0, 0.0, 0.0, 0.0, 38.76, 0.0, 0.0, 29.04, 29.93, 29.39, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.44], ["speech", 19.25], ["singing bowl", 5.31]], null, null, null, null, [["music", 41.3], ["ambient music", 13.06], ["speech", 12.38]], null, null, [["music", 40.11], ["hum", 20.18], ["throbbing", 19.47]], [["music", 34.57], ["cattle, bovinae", 12.35], ["moo", 8.79]], [["music", 76.86], ["speech", 9.46], ["throbbing", 1.33]], null, null], "duration": [-0.11, 0.15, 0.98, 1.1, 2.49, 2.2, 2.98, 0.33, 1.12, 1.3, 0.72, 2.1, 0.22, 3.79, 0.68, 1.67, -0.22, 1.53, 8.47, 0.65, 1.01, 15.02, 2.68, 2.95, 1.54, 0.74]} \ No newline at end of file diff --git a/annotations_1/qe8IY41zyCc_filtered.json b/annotations_1/qe8IY41zyCc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64d515d0cdaa298d09475d5ad17a39aacf26f68e --- /dev/null +++ b/annotations_1/qe8IY41zyCc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 66.48], [67.0, 112.04], [113.0, 112.95], [113.0, 120.31]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.1], "audiomae_on_audioset": [null, null, null, [["throbbing", 43.48], ["music", 25.18], ["hum", 19.68]]], "duration": [34.48, 45.04, -0.05, 7.31]} \ No newline at end of file diff --git a/annotations_1/qeaiVveZWD8_filtered.json b/annotations_1/qeaiVveZWD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c2a7d5bee9a35b0b1611f5ae818e380b9870f61 --- /dev/null +++ b/annotations_1/qeaiVveZWD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 47.93], [48.0, 48.15], [49.0, 51.83], [54.0, 89.04], [89.0, 137.1]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.28, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 43.18], ["ambient music", 21.31], ["scary music", 6.17]], null, null], "duration": [1.93, 0.15, 2.83, 35.04, 48.1]} \ No newline at end of file diff --git a/annotations_1/qfq5VozCshY_filtered.json b/annotations_1/qfq5VozCshY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..89e0ad340e3f6ec3473a47eb8ef81fc632d7a0e4 --- /dev/null +++ b/annotations_1/qfq5VozCshY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.33], [2.0, 3.3], [8.0, 9.8], [14.0, 14.67], [17.0, 21.46], [37.0, 41.55], [44.0, 47.48], [55.0, 55.41], [55.0, 55.49], [71.0, 71.1], [75.0, 76.4], [84.0, 84.64], [92.0, 92.69], [100.0, 100.01], [101.0, 103.2], [105.0, 105.53], [108.0, 108.21], [109.0, 109.63], [110.0, 111.28], [112.0, 112.09], [124.0, 124.01], [125.0, 125.44], [126.0, 126.45], [130.0, 134.01], [136.0, 136.8], [156.0, 159.38], [163.0, 163.41], [169.0, 169.57], [174.0, 174.8], [180.0, 180.69], [182.0, 182.28], [185.0, 185.28], [188.0, 188.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.71, 44.46, 37.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.44, 0.0, 57.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["thunk", 60.04], ["music", 25.01], ["door", 3.9]], [["music", 75.07], ["speech", 6.48], ["musical instrument", 3.68]], [["music", 72.79], ["maraca", 4.61], ["musical instrument", 2.59]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.33, 1.3, 1.8, 0.67, 4.46, 4.55, 3.48, 0.41, 0.49, 0.1, 1.4, 0.64, 0.69, 0.01, 2.2, 0.53, 0.21, 0.63, 1.28, 0.09, 0.01, 0.44, 0.45, 4.01, 0.8, 3.38, 0.41, 0.57, 0.8, 0.69, 0.28, 0.28, 0.0]} \ No newline at end of file diff --git a/annotations_1/qgRXFJqB-9Q_filtered.json b/annotations_1/qgRXFJqB-9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91ea6b05666d6e966d5e2ab673cda2e44214d074 --- /dev/null +++ b/annotations_1/qgRXFJqB-9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.8], [13.0, 24.98], [31.0, 43.71], [48.0, 81.6], [82.0, 88.35], [92.0, 92.42], [99.0, 99.39], [100.0, 123.45], [126.0, 140.56], [143.0, 147.23], [152.0, 152.39], [154.0, 156.19], [156.0, 156.25], [158.0, 161.72], [165.0, 173.08]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 28.51, 28.75, 0.0, 28.72, 0.0, 0.0, 29.35, 31.22, 30.59, 0.0, 31.15, 0.0, 29.79, 30.02], "audiomae_on_audioset": [null, [["music", 66.24], ["hum", 7.68], ["throbbing", 3.77]], [["music", 62.14], ["hum", 9.27], ["throbbing", 5.76]], null, [["music", 43.7], ["hum", 6.88], ["speech", 6.81]], null, null, [["music", 75.38], ["throbbing", 6.98], ["electronic music", 5.69]], [["speech", 27.96], ["music", 27.56], ["hum", 12.11]], [["music", 35.51], ["speech", 32.65], ["didgeridoo", 5.27]], null, [["music", 30.55], ["whale vocalization", 7.95], ["vehicle", 7.38]], null, [["music", 49.9], ["speech", 16.8], ["throbbing", 7.33]], [["music", 58.03], ["speech", 15.95], ["cacophony", 4.3]]], "duration": [0.8, 11.98, 12.71, 33.6, 6.35, 0.42, 0.39, 23.45, 14.56, 4.23, 0.39, 2.19, 0.25, 3.72, 8.08]} \ No newline at end of file diff --git a/annotations_1/qgm_ou3TsIs_filtered.json b/annotations_1/qgm_ou3TsIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..128a61fba9426cedc2bce133a48927a713b6ff0b --- /dev/null +++ b/annotations_1/qgm_ou3TsIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.6], [5.0, 5.83], [8.0, 30.96], [34.0, 47.83], [51.0, 53.59], [57.0, 57.37], [59.0, 63.44], [64.0, 65.58], [67.0, 68.74], [70.0, 71.54], [74.0, 74.8], [77.0, 77.28], [78.0, 78.88], [83.0, 91.13], [92.0, 96.77], [99.0, 99.23], [100.0, 107.42], [108.0, 111.87], [115.0, 121.46]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 76.04, 53.28, 66.88, 0.0, 42.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 54.43, 0.0, 35.47, 33.81, 34.42], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 29.01], ["didgeridoo", 9.92], ["fly, housefly", 4.29]], null, null, null, null, null, null, null, null, null, [["music", 42.17], ["clarinet", 16.95], ["musical instrument", 7.38]], [["music", 63.22], ["effects unit", 9.13], ["musical instrument", 9.12]], [["music", 45.12], ["theremin", 33.99], ["musical instrument", 4.57]]], "duration": [0.6, 0.83, 22.96, 13.83, 2.59, 0.37, 4.44, 1.58, 1.74, 1.54, 0.8, 0.28, 0.88, 8.13, 4.77, 0.23, 7.42, 3.87, 6.46]} \ No newline at end of file diff --git a/annotations_1/qj3TqaXp2Mg_filtered.json b/annotations_1/qj3TqaXp2Mg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a76df2a2029fc305038ffeb478b0937a24e1fa35 --- /dev/null +++ b/annotations_1/qj3TqaXp2Mg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.6], [14.0, 14.89], [16.0, 16.17], [18.0, 17.66], [20.0, 20.95], [22.0, 30.35], [35.0, 44.37], [45.0, 48.24], [52.0, 56.84], [59.0, 62.18], [63.0, 63.22], [65.0, 68.91], [72.0, 83.81], [84.0, 87.02], [89.0, 90.34], [95.0, 99.35], [101.0, 101.82], [103.0, 114.34]], "keep_status": [false, false, false, false, false, true, false, false, true, true, false, true, true, true, false, false, false, true], "silence_prob": [42.74, 0.0, 0.0, 0.0, 0.0, 40.29, 41.24, 35.79, 45.14, 44.99, 0.0, 44.37, 39.05, 34.73, 0.0, 44.34, 0.0, 39.21], "audiomae_on_audioset": [[["sidetone", 44.73], ["speech", 28.85], ["whale vocalization", 10.41]], null, null, null, null, [["speech", 25.91], ["didgeridoo", 9.27], ["hum", 8.93]], [["speech", 60.35], ["hum", 9.17], ["sidetone", 6.35]], [["speech", 70.84], ["sidetone", 15.78], ["radio", 3.09]], [["hum", 17.78], ["rumble", 9.72], ["whale vocalization", 9.3]], [["speech", 29.58], ["hum", 10.43], ["rumble", 5.73]], null, [["speech", 29.75], ["noise", 12.82], ["whale vocalization", 6.49]], [["music", 35.0], ["didgeridoo", 11.09], ["hum", 7.49]], [["reverberation", 12.98], ["speech", 6.38], ["animal", 5.86]], null, [["speech", 64.5], ["sidetone", 7.05], ["music", 3.99]], null, [["mains hum", 23.8], ["hum", 16.92], ["fly, housefly", 13.43]]], "duration": [5.6, 0.89, 0.17, -0.34, 0.95, 8.35, 9.37, 3.24, 4.84, 3.18, 0.22, 3.91, 11.81, 3.02, 1.34, 4.35, 0.82, 11.34]} \ No newline at end of file diff --git a/annotations_1/qjJnk3MgNgc_filtered.json b/annotations_1/qjJnk3MgNgc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60fe87650ac0340a722f05a5e7fe3adb07386a25 --- /dev/null +++ b/annotations_1/qjJnk3MgNgc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.86], [10.0, 10.42], [13.0, 13.68], [21.0, 21.51], [29.0, 36.73], [39.0, 38.97], [44.0, 44.15], [47.0, 46.89], [51.0, 51.53], [55.0, 55.46], [57.0, 58.11], [66.0, 66.61], [74.0, 74.24], [75.0, 76.55], [77.0, 78.76], [79.0, 84.1], [86.0, 88.05], [93.0, 95.79], [99.0, 101.53], [104.0, 105.71], [110.0, 110.42], [111.0, 111.55], [112.0, 112.43], [113.0, 113.12], [114.0, 113.97], [119.0, 119.2], [126.0, 127.13], [129.0, 128.92], [132.0, 132.36], [134.0, 138.74], [140.0, 142.3], [143.0, 146.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.34, 51.34, 42.13, 45.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.31, 34.65, 34.42], "audiomae_on_audioset": [null, null, null, null, [["music", 58.55], ["synthesizer", 8.26], ["hum", 7.89]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.91], ["hum", 17.16], ["speech", 7.23]], [["music", 52.24], ["guitar", 6.77], ["plucked string instrument", 5.44]], null, null, null, null, null, null, null, null, null, null, [["music", 57.26], ["synthesizer", 5.78], ["ambient music", 5.28]], [["music", 32.46], ["speech", 31.19], ["synthesizer", 13.93]], [["music", 68.15], ["synthesizer", 7.35], ["electronic music", 6.29]]], "duration": [0.86, 0.42, 0.68, 0.51, 7.73, -0.03, 0.15, -0.11, 0.53, 0.46, 1.11, 0.61, 0.24, 1.55, 1.76, 5.1, 2.05, 2.79, 2.53, 1.71, 0.42, 0.55, 0.43, 0.12, -0.03, 0.2, 1.13, -0.08, 0.36, 4.74, 2.3, 3.16]} \ No newline at end of file diff --git a/annotations_1/qjUsrdzDbuY_filtered.json b/annotations_1/qjUsrdzDbuY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cdee922285d16d159e5627be1429db2e690451a --- /dev/null +++ b/annotations_1/qjUsrdzDbuY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 20.38], [22.0, 22.94], [23.0, 23.16], [27.0, 26.79], [28.0, 28.16], [28.0, 30.03], [31.0, 30.86], [34.0, 34.11], [35.0, 35.73], [37.0, 37.35], [38.0, 39.68], [43.0, 48.25], [50.0, 50.97], [52.0, 66.66], [73.0, 73.72], [74.0, 74.68], [76.0, 76.62], [79.0, 79.88], [82.0, 82.51], [83.0, 84.35], [85.0, 86.09], [90.0, 92.21], [92.0, 94.27], [95.0, 96.23], [97.0, 98.19], [99.0, 98.93], [106.0, 107.27], [110.0, 111.43], [113.0, 114.74], [116.0, 118.66]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [49.45, 0.0, 0.0, 0.0, 0.0, 39.24, 0.0, 0.0, 0.0, 0.0, 0.0, 84.43, 0.0, 37.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.97, 43.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.62], "audiomae_on_audioset": [[["speech", 70.56], ["hum", 4.42], ["radio", 3.2]], null, null, null, null, [["speech", 47.86], ["music", 6.65], ["coin (dropping)", 3.77]], null, null, null, null, null, null, null, [["music", 45.36], ["speech", 23.51], ["sidetone", 6.59]], null, null, null, null, null, null, null, null, [["music", 37.41], ["speech", 9.69], ["singing bowl", 6.84]], null, null, null, null, null, null, [["speech", 33.27], ["music", 17.45], ["hum", 16.64]]], "duration": [9.38, 0.94, 0.16, -0.21, 0.16, 2.03, -0.14, 0.11, 0.73, 0.35, 1.68, 5.25, 0.97, 14.66, 0.72, 0.68, 0.62, 0.88, 0.51, 1.35, 1.09, 2.21, 2.27, 1.23, 1.19, -0.07, 1.27, 1.43, 1.74, 2.66]} \ No newline at end of file diff --git a/annotations_1/qjqJtri_EG4_filtered.json b/annotations_1/qjqJtri_EG4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62670efc11c7a046abeb55f3d614da3c1eecaf7f --- /dev/null +++ b/annotations_1/qjqJtri_EG4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.81], [17.0, 17.09], [28.0, 28.68], [37.0, 38.77], [43.0, 46.23], [51.0, 50.95], [53.0, 54.77], [56.0, 57.1], [58.0, 58.43], [60.0, 61.99], [73.0, 73.63], [90.0, 90.54], [93.0, 93.34], [94.0, 94.56], [95.0, 96.31], [100.0, 100.5], [109.0, 112.95], [122.0, 122.59], [124.0, 125.2], [134.0, 135.57], [137.0, 137.39], [141.0, 141.88], [151.0, 151.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [62.37, 0.0, 0.0, 0.0, 98.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 73.1], ["electronic music", 3.03], ["ambient music", 2.99]], null, null, null, null, null, null], "duration": [2.81, 0.09, 0.68, 1.77, 3.23, -0.05, 1.77, 1.1, 0.43, 1.99, 0.63, 0.54, 0.34, 0.56, 1.31, 0.5, 3.95, 0.59, 1.2, 1.57, 0.39, 0.88, 0.65]} \ No newline at end of file diff --git a/annotations_1/qlfI_AppyIk_filtered.json b/annotations_1/qlfI_AppyIk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce3f04a5f138e2af5576853eaea4cf520b4972a5 --- /dev/null +++ b/annotations_1/qlfI_AppyIk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.81], [4.0, 5.49], [6.0, 6.25], [9.0, 16.5], [20.0, 24.83], [27.0, 32.9], [36.0, 39.26], [42.0, 46.18], [48.0, 53.32], [54.0, 58.85], [70.0, 73.6], [75.0, 92.5], [93.0, 95.79], [96.0, 107.18], [108.0, 117.86], [119.0, 120.53], [121.0, 123.18], [124.0, 130.55]], "keep_status": [false, false, false, false, false, true, false, true, false, true, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 99.98, 42.06, 57.56, 43.23, 81.89, 33.75, 50.71, 37.03, 37.78, 30.45, 76.2, 0.0, 64.07, 69.61], "audiomae_on_audioset": [null, null, null, null, null, [["music", 26.8], ["speech", 12.78], ["singing bowl", 12.33]], null, [["hum", 20.21], ["mains hum", 12.75], ["music", 12.04]], null, [["speech", 40.1], ["hum", 17.27], ["music", 11.73]], null, [["music", 26.94], ["hum", 10.5], ["thunk", 6.48]], [["chirp tone", 29.29], ["sine wave", 26.75], ["music", 10.34]], [["speech", 37.78], ["sonar", 13.11], ["hum", 11.8]], null, null, null, null], "duration": [1.81, 1.49, 0.25, 7.5, 4.83, 5.9, 3.26, 4.18, 5.32, 4.85, 3.6, 17.5, 2.79, 11.18, 9.86, 1.53, 2.18, 6.55]} \ No newline at end of file diff --git a/annotations_1/qnFWCagTOtw_filtered.json b/annotations_1/qnFWCagTOtw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..175d1f3d6b6cf5973d9f9e8c2ef987f127ba5144 --- /dev/null +++ b/annotations_1/qnFWCagTOtw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.21], [26.0, 26.43], [45.0, 45.87], [63.0, 63.59], [64.0, 68.4], [70.0, 70.24], [72.0, 72.12], [73.0, 73.21], [73.0, 74.88], [79.0, 79.12], [80.0, 79.84], [81.0, 81.24], [82.0, 82.05], [87.0, 87.35], [88.0, 89.75], [98.0, 98.76], [113.0, 113.64], [120.0, 120.72], [121.0, 122.34], [127.0, 127.74], [128.0, 128.09], [136.0, 136.53], [137.0, 140.98], [142.0, 143.18], [144.0, 144.66], [145.0, 144.96], [148.0, 149.64], [151.0, 152.0], [161.0, 161.76], [162.0, 165.37], [166.0, 167.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.65, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.21, 0.43, 0.87, 0.59, 4.4, 0.24, 0.12, 0.21, 1.88, 0.12, -0.16, 0.24, 0.05, 0.35, 1.75, 0.76, 0.64, 0.72, 1.34, 0.74, 0.09, 0.53, 3.98, 1.18, 0.66, -0.04, 1.64, 1.0, 0.76, 3.37, 1.19]} \ No newline at end of file diff --git a/annotations_1/qo1cSaFhPiQ_filtered.json b/annotations_1/qo1cSaFhPiQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f8034e0417452d2810dadd4b24bd3851fce7e063 --- /dev/null +++ b/annotations_1/qo1cSaFhPiQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 25.27], [28.0, 28.8], [31.0, 41.4], [46.0, 46.3], [48.0, 47.97], [52.0, 54.33], [55.0, 55.73], [56.0, 58.24], [59.0, 59.37], [59.0, 59.49], [63.0, 63.76], [65.0, 66.16], [68.0, 69.3], [72.0, 72.3], [74.0, 73.84], [76.0, 77.62], [79.0, 82.88]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 33.97, 0.0, 0.0, 44.66, 0.0, 95.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.42], "audiomae_on_audioset": [null, null, [["fly, housefly", 64.72], ["insect", 25.26], ["mosquito", 4.51]], null, null, [["radio", 27.95], ["speech", 25.15], ["sidetone", 5.51]], null, null, null, null, null, null, null, null, null, null, [["speech", 30.2], ["explosion", 10.47], ["burst, pop", 4.22]]], "duration": [1.27, 0.8, 10.4, 0.3, -0.03, 2.33, 0.73, 2.24, 0.37, 0.49, 0.76, 1.16, 1.3, 0.3, -0.16, 1.62, 3.88]} \ No newline at end of file diff --git a/annotations_1/qoXJJin1e7g_filtered.json b/annotations_1/qoXJJin1e7g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..511f1e8191aba0f3a42801a771eea6f4f80a2bb5 --- /dev/null +++ b/annotations_1/qoXJJin1e7g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.85], [19.0, 19.85], [28.0, 28.41], [31.0, 31.7], [34.0, 44.96], [54.0, 54.43], [59.0, 60.66], [62.0, 61.96], [63.0, 70.87], [72.0, 72.62], [74.0, 74.71], [81.0, 82.34], [89.0, 89.88], [93.0, 95.99], [101.0, 103.25], [104.0, 107.91], [109.0, 110.34], [112.0, 112.7]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 49.22, 0.0, 0.0, 0.0, 43.25, 0.0, 0.0, 0.0, 0.0, 45.49, 42.04, 40.86, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 22.93], ["rumble", 17.09], ["music", 15.84]], null, null, null, [["hum", 37.33], ["mains hum", 25.32], ["throbbing", 12.05]], null, null, null, null, [["creak", 19.65], ["vehicle", 5.96], ["fly, housefly", 5.42]], [["telephone", 80.82], ["telephone bell ringing", 13.59], ["ringtone", 1.93]], [["music", 18.99], ["hum", 8.35], ["synthesizer", 7.57]], null, null], "duration": [0.85, 0.85, 0.41, 0.7, 10.96, 0.43, 1.66, -0.04, 7.87, 0.62, 0.71, 1.34, 0.88, 2.99, 2.25, 3.91, 1.34, 0.7]} \ No newline at end of file diff --git a/annotations_1/qp-Jr4oEFWo_filtered.json b/annotations_1/qp-Jr4oEFWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c47b52f5a3220ad5b90e5e1cf00728a6be47fb0 --- /dev/null +++ b/annotations_1/qp-Jr4oEFWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.4], [9.0, 9.8], [11.0, 11.91], [14.0, 16.04], [18.0, 19.01], [23.0, 23.26], [27.0, 26.81], [28.0, 28.27], [29.0, 29.67], [31.0, 33.13], [36.0, 38.37], [41.0, 45.13], [48.0, 49.08], [49.0, 50.52], [52.0, 53.15], [56.0, 56.1], [58.0, 60.03], [62.0, 64.39], [67.0, 70.12], [72.0, 72.2], [74.0, 76.11], [78.0, 78.65], [81.0, 81.5], [82.0, 83.05], [85.0, 86.66], [87.0, 90.51], [103.0, 104.14], [105.0, 106.19], [109.0, 109.49], [122.0, 122.39], [125.0, 127.72], [132.0, 132.34], [145.0, 146.65], [149.0, 151.55], [153.0, 155.16], [155.0, 157.2], [158.0, 159.11], [161.0, 161.47], [170.0, 178.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.82, 0.0, 0.0, 0.0, 0.0, 0.0, 70.58, 100.0, 98.27, 0.0, 0.0, 0.0, 0.0, 100.0, 60.32, 38.78, 0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 43.98, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 0.0, 100.0, 84.98, 36.19, 0.0, 0.0, 98.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 70.41], ["speech synthesizer", 3.04], ["radio", 2.44]], null, null, null, null, null, null, [["speech", 34.96], ["electric shaver, electric razor", 9.01], ["didgeridoo", 6.81]], null, null, null, null, null, null, null, null, null, [["speech", 39.92], ["sidetone", 14.98], ["frog", 7.17]], null, null, null], "duration": [1.4, 0.8, 0.91, 2.04, 1.01, 0.26, -0.19, 0.27, 0.67, 2.13, 2.37, 4.13, 1.08, 1.52, 1.15, 0.1, 2.03, 2.39, 3.12, 0.2, 2.11, 0.65, 0.5, 1.05, 1.66, 3.51, 1.14, 1.19, 0.49, 0.39, 2.72, 0.34, 1.65, 2.55, 2.16, 2.2, 1.11, 0.47, 8.7]} \ No newline at end of file diff --git a/annotations_1/qp-uFNB9jYo_filtered.json b/annotations_1/qp-uFNB9jYo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87602b5008b36762f8281bb70181bf411e962dc4 --- /dev/null +++ b/annotations_1/qp-uFNB9jYo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.32], [8.0, 8.73], [10.0, 14.84], [15.0, 22.64], [23.0, 24.95], [27.0, 28.09], [29.0, 32.17], [33.0, 33.89], [34.0, 36.09], [37.0, 43.5], [45.0, 45.64], [47.0, 49.0], [50.0, 52.14], [54.0, 57.62], [58.0, 60.08], [62.0, 62.58], [65.0, 66.07], [67.0, 67.76], [70.0, 71.95], [73.0, 76.15], [77.0, 78.85], [80.0, 81.3], [85.0, 85.68], [86.0, 87.62], [88.0, 89.58], [90.0, 91.4], [94.0, 95.82], [101.0, 101.71], [104.0, 104.23], [105.0, 107.65], [109.0, 109.17], [112.0, 112.6], [113.0, 113.68], [117.0, 118.17], [123.0, 124.78], [128.0, 128.75], [130.0, 130.45], [139.0, 140.22], [143.0, 143.07], [147.0, 147.21], [148.0, 149.44], [150.0, 151.63], [154.0, 155.49], [158.0, 160.0], [163.0, 167.12], [171.0, 171.78], [173.0, 174.6], [175.0, 178.19], [181.0, 181.33], [187.0, 189.08], [190.0, 196.97], [200.0, 203.49], [205.0, 206.04], [207.0, 207.94], [211.0, 211.76], [213.0, 214.89], [218.0, 220.06], [221.0, 222.78], [223.0, 230.89]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 49.97, 94.95, 0.0, 0.0, 80.46, 0.0, 44.15, 51.6, 0.0, 74.6, 51.82, 74.92, 48.02, 0.0, 0.0, 0.0, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.3, 99.97, 0.0, 0.0, 99.9, 0.0, 95.91, 97.11, 65.67, 0.0, 0.0, 0.0, 0.0, 47.2, 0.0, 51.82], "audiomae_on_audioset": [null, null, [["whale vocalization", 67.11], ["noise", 3.57], ["music", 3.53]], null, null, null, null, null, [["speech", 25.61], ["music", 22.98], ["whale vocalization", 11.63]], null, null, null, null, null, [["mains hum", 43.45], ["hum", 32.14], ["sidetone", 8.63]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.35], ["music", 21.09], ["sidetone", 5.36]], null, null], "duration": [1.32, 0.73, 4.84, 7.64, 1.95, 1.09, 3.17, 0.89, 2.09, 6.5, 0.64, 2.0, 2.14, 3.62, 2.08, 0.58, 1.07, 0.76, 1.95, 3.15, 1.85, 1.3, 0.68, 1.62, 1.58, 1.4, 1.82, 0.71, 0.23, 2.65, 0.17, 0.6, 0.68, 1.17, 1.78, 0.75, 0.45, 1.22, 0.07, 0.21, 1.44, 1.63, 1.49, 2.0, 4.12, 0.78, 1.6, 3.19, 0.33, 2.08, 6.97, 3.49, 1.04, 0.94, 0.76, 1.89, 2.06, 1.78, 7.89]} \ No newline at end of file diff --git a/annotations_1/qpxUYzNSGn0_filtered.json b/annotations_1/qpxUYzNSGn0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1c811bab3e16fc2a512ac7f8aa84f8f370f5f981 --- /dev/null +++ b/annotations_1/qpxUYzNSGn0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 17.73], [30.0, 30.82], [31.0, 32.48], [40.0, 41.42], [44.0, 46.43], [47.0, 49.35], [52.0, 55.05], [63.0, 63.68], [65.0, 65.3], [69.0, 74.7], [76.0, 77.85], [79.0, 79.93], [81.0, 81.82], [83.0, 83.0], [83.0, 83.17], [94.0, 93.92], [120.0, 120.66], [125.0, 125.14], [128.0, 128.51], [130.0, 130.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 66.15, 74.92, 44.32, 0.0, 0.0, 66.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 53.93], ["music", 13.18], ["sidetone", 5.3]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.27, 0.82, 1.48, 1.42, 2.43, 2.35, 3.05, 0.68, 0.3, 5.7, 1.85, 0.93, 0.82, 0.0, 0.17, -0.08, 0.66, 0.14, 0.51, 0.91]} \ No newline at end of file diff --git a/annotations_1/qqAzmt1d8kU_filtered.json b/annotations_1/qqAzmt1d8kU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff6a3a306bc7d7bd55def7035200970dca618475 --- /dev/null +++ b/annotations_1/qqAzmt1d8kU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.67]], "keep_status": [false], "silence_prob": [64.97], "audiomae_on_audioset": [null], "duration": [3.67]} \ No newline at end of file diff --git a/annotations_1/qqSS99m2dQ0_filtered.json b/annotations_1/qqSS99m2dQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87bfd62b27eb302a2b8386105a4e45571211bec2 --- /dev/null +++ b/annotations_1/qqSS99m2dQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.8], [12.0, 13.85], [15.0, 15.15], [16.0, 17.17], [23.0, 23.89], [26.0, 25.84], [26.0, 31.6], [39.0, 39.01], [40.0, 40.15], [43.0, 44.34], [46.0, 46.11], [47.0, 48.3], [51.0, 51.21], [54.0, 53.69], [56.0, 56.76], [57.0, 57.4], [59.0, 60.88], [61.0, 61.87], [67.0, 71.71], [73.0, 76.5], [78.0, 78.58], [80.0, 80.43], [88.0, 89.18], [94.0, 94.19], [95.0, 96.89], [98.0, 98.79], [104.0, 104.65], [105.0, 105.27], [106.0, 105.9], [116.0, 116.55], [119.0, 120.23], [122.0, 125.05], [131.0, 135.48], [136.0, 137.96], [138.0, 138.91], [140.0, 140.48], [141.0, 141.76], [145.0, 144.88], [156.0, 157.35], [159.0, 159.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.07, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.06, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.34], ["fly, housefly", 7.54], ["insect", 6.69]], null, null, null, null, null, null, null, null], "duration": [0.8, 1.85, 0.15, 1.17, 0.89, -0.16, 5.6, 0.01, 0.15, 1.34, 0.11, 1.3, 0.21, -0.31, 0.76, 0.4, 1.88, 0.87, 4.71, 3.5, 0.58, 0.43, 1.18, 0.19, 1.89, 0.79, 0.65, 0.27, -0.1, 0.55, 1.23, 3.05, 4.48, 1.96, 0.91, 0.48, 0.76, -0.12, 1.35, 0.71]} \ No newline at end of file diff --git a/annotations_1/qqZPej42OkE_filtered.json b/annotations_1/qqZPej42OkE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..657824bbfcc91533c223a6ff37d0b482840edd82 --- /dev/null +++ b/annotations_1/qqZPej42OkE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.1], [3.0, 12.01], [13.0, 16.44], [18.0, 20.48], [23.0, 30.28], [31.0, 32.29], [33.0, 37.18]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 89.36, 99.8, 66.27, 72.46, 0.0, 87.92], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.1, 9.01, 3.44, 2.48, 7.28, 1.29, 4.18]} \ No newline at end of file diff --git a/annotations_1/qqhyIIZt87A_filtered.json b/annotations_1/qqhyIIZt87A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dab733a0405cba33bff9909a22d47ce3cce8630f --- /dev/null +++ b/annotations_1/qqhyIIZt87A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.1], [8.0, 8.61], [17.0, 16.66], [46.0, 47.24], [49.0, 50.43], [52.0, 52.22], [54.0, 54.62], [57.0, 59.27], [62.0, 66.95], [71.0, 72.23], [75.0, 76.92], [78.0, 82.97], [85.0, 86.93], [87.0, 88.2], [89.0, 91.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.8, 99.73, 0.0, 0.0, 43.58, 0.0, 0.0, 56.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 61.21], ["drum", 7.12], ["bass drum", 4.62]], null, null, null], "duration": [0.1, 0.61, -0.34, 1.24, 1.43, 0.22, 0.62, 2.27, 4.95, 1.23, 1.92, 4.97, 1.93, 1.2, 2.17]} \ No newline at end of file diff --git a/annotations_1/qrIt5BPvCv8_filtered.json b/annotations_1/qrIt5BPvCv8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57ea0b7a10ebfa5c27b003f147ef1838138c004b --- /dev/null +++ b/annotations_1/qrIt5BPvCv8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.75], [11.0, 14.25], [47.0, 47.92], [50.0, 50.58], [54.0, 54.99], [56.0, 70.95], [75.0, 76.65], [79.0, 82.85], [84.0, 84.97], [86.0, 87.08], [88.0, 89.26], [90.0, 90.68], [92.0, 94.41], [96.0, 96.4], [97.0, 97.9], [101.0, 100.99], [104.0, 106.95], [108.0, 108.41], [110.0, 111.28], [113.0, 114.13], [115.0, 116.06], [117.0, 117.37], [119.0, 120.68], [122.0, 122.66], [123.0, 124.21], [127.0, 126.77], [129.0, 129.25]], "keep_status": [true, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.95, 38.51, 0.0, 0.0, 0.0, 31.07, 0.0, 43.23, 0.0, 0.0, 0.0, 0.0, 49.5, 0.0, 0.0, 0.0, 44.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["noise", 47.79], ["music", 14.96], ["musical instrument", 5.22]], [["speech", 42.47], ["music", 23.66], ["didgeridoo", 5.49]], null, null, null, [["speech", 36.26], ["hum", 10.47], ["vehicle", 6.32]], null, [["music", 21.47], ["hum", 11.86], ["throbbing", 7.18]], null, null, null, null, [["sidetone", 20.0], ["hum", 18.4], ["speech", 11.42]], null, null, null, [["speech", 30.58], ["music", 4.69], ["hum", 3.44]], null, null, null, null, null, null, null, null, null, null], "duration": [3.75, 3.25, 0.92, 0.58, 0.99, 14.95, 1.65, 3.85, 0.97, 1.08, 1.26, 0.68, 2.41, 0.4, 0.9, -0.01, 2.95, 0.41, 1.28, 1.13, 1.06, 0.37, 1.68, 0.66, 1.21, -0.23, 0.25]} \ No newline at end of file diff --git a/annotations_1/qrONj6Srq7M_filtered.json b/annotations_1/qrONj6Srq7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ccb6734f721a39152e31da1ec11b920e3062777 --- /dev/null +++ b/annotations_1/qrONj6Srq7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.46], [3.0, 4.97], [6.0, 12.53], [15.0, 14.66], [16.0, 16.92], [18.0, 19.74], [22.0, 22.89], [23.0, 25.44], [27.0, 28.0], [35.0, 37.17], [37.0, 39.83], [42.0, 44.07], [46.0, 47.93], [51.0, 53.47], [54.0, 54.41], [57.0, 57.15], [58.0, 58.82], [61.0, 62.26], [63.0, 65.62], [66.0, 68.13], [75.0, 75.81], [77.0, 77.65], [79.0, 79.03], [82.0, 84.67], [87.0, 88.33], [89.0, 92.72], [97.0, 99.67], [100.0, 100.77], [104.0, 107.35], [109.0, 110.83], [114.0, 118.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 64.52, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 99.44, 99.68, 74.92, 0.0, 68.67, 0.0, 0.0, 0.0, 0.0, 99.92, 99.93, 0.0, 0.0, 0.0, 99.95, 0.0, 98.19, 99.8, 0.0, 98.01, 0.0, 99.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 1.97, 6.53, -0.34, 0.92, 1.74, 0.89, 2.44, 1.0, 2.17, 2.83, 2.07, 1.93, 2.47, 0.41, 0.15, 0.82, 1.26, 2.62, 2.13, 0.81, 0.65, 0.03, 2.67, 1.33, 3.72, 2.67, 0.77, 3.35, 1.83, 4.59]} \ No newline at end of file diff --git a/annotations_1/qsyYw2x1-js_filtered.json b/annotations_1/qsyYw2x1-js_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f094cc09f4caf8f0378daf11d89a473108a5a23b --- /dev/null +++ b/annotations_1/qsyYw2x1-js_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.02], [5.0, 16.44], [21.0, 26.99], [27.0, 32.54], [34.0, 47.09], [48.0, 82.07], [83.0, 131.45], [132.0, 134.79], [136.0, 147.56], [150.0, 149.54], [151.0, 174.92], [178.0, 178.68]], "keep_status": [true, true, true, true, true, false, false, true, false, false, false, false], "silence_prob": [38.68, 29.57, 29.48, 30.7, 31.58, 0.0, 0.0, 40.99, 29.56, 0.0, 65.79, 0.0], "audiomae_on_audioset": [[["hum", 37.13], ["speech", 18.19], ["music", 11.82]], [["music", 45.9], ["hum", 10.64], ["didgeridoo", 7.17]], [["whack, thwack", 19.16], ["speech", 18.4], ["music", 12.77]], [["speech", 33.01], ["groan", 12.44], ["music", 5.45]], [["music", 19.32], ["speech", 16.57], ["breaking", 7.96]], null, null, [["music", 20.85], ["cello", 15.87], ["foghorn", 10.74]], [["speech", 50.32], ["music", 32.98], ["roar", 1.81]], null, null, null], "duration": [3.02, 11.44, 5.99, 5.54, 13.09, 34.07, 48.45, 2.79, 11.56, -0.46, 23.92, 0.68]} \ No newline at end of file diff --git a/annotations_1/qu68Gym5PvE_filtered.json b/annotations_1/qu68Gym5PvE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f5eaeb7526ed8eb629711920369f1580626ae9c --- /dev/null +++ b/annotations_1/qu68Gym5PvE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 42.06], [49.0, 55.71], [62.0, 65.03], [66.0, 97.34], [98.0, 114.42], [115.0, 116.61], [117.0, 117.19], [120.0, 120.75], [122.0, 126.93], [130.0, 130.6]], "keep_status": [false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 32.31, 31.66, 0.0, 30.39, 0.0, 0.0, 0.0, 49.18, 0.0], "audiomae_on_audioset": [null, [["music", 51.39], ["throbbing", 11.53], ["didgeridoo", 8.03]], [["music", 55.48], ["theremin", 6.8], ["timpani", 5.0]], null, [["music", 40.82], ["speech", 20.7], ["hum", 9.32]], null, null, null, [["fart", 38.31], ["noise", 5.89], ["throbbing", 5.02]], null], "duration": [32.06, 6.71, 3.03, 31.34, 16.42, 1.61, 0.19, 0.75, 4.93, 0.6]} \ No newline at end of file diff --git a/annotations_1/qv4BPYX4B8U_filtered.json b/annotations_1/qv4BPYX4B8U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b372bc90fe24c2df6920c4140042daaf58551e3f --- /dev/null +++ b/annotations_1/qv4BPYX4B8U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [6.0, 6.45], [7.0, 9.91], [12.0, 12.31], [14.0, 14.23], [16.0, 17.17], [19.0, 18.59], [19.0, 19.75], [22.0, 22.49], [23.0, 24.44], [29.0, 31.92], [33.0, 33.42], [38.0, 38.23], [39.0, 39.41], [40.0, 40.22], [43.0, 44.42], [50.0, 51.22], [53.0, 54.35], [56.0, 55.97], [57.0, 57.72], [63.0, 64.54], [67.0, 67.64], [68.0, 69.75], [70.0, 72.3], [74.0, 77.4], [79.0, 78.61], [91.0, 92.08], [96.0, 105.95], [107.0, 108.01], [109.0, 114.44], [115.0, 117.1], [119.0, 119.33], [122.0, 134.16], [135.0, 139.46], [140.0, 141.35], [146.0, 145.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.53, 61.77, 0.0, 0.0, 87.37, 0.0, 85.9, 64.63, 0.0, 58.89, 53.47, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.45, 2.91, 0.31, 0.23, 1.17, -0.41, 0.75, 0.49, 1.44, 2.92, 0.42, 0.23, 0.41, 0.22, 1.42, 1.22, 1.35, -0.03, 0.72, 1.54, 0.64, 1.75, 2.3, 3.4, -0.39, 1.08, 9.95, 1.01, 5.44, 2.1, 0.33, 12.16, 4.46, 1.35, -0.01]} \ No newline at end of file diff --git a/annotations_1/qv_DJYvELTQ_filtered.json b/annotations_1/qv_DJYvELTQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70b16399f661c36df8f840473427a17efc95f8bf --- /dev/null +++ b/annotations_1/qv_DJYvELTQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 19.97], [21.0, 21.76], [26.0, 26.77], [29.0, 30.01], [35.0, 39.8], [41.0, 42.62], [43.0, 45.71], [47.0, 47.85], [48.0, 51.31], [52.0, 58.21], [60.0, 60.61], [62.0, 63.07], [66.0, 69.8], [71.0, 73.31], [74.0, 74.63], [76.0, 77.45], [83.0, 84.23], [86.0, 87.91], [91.0, 92.21], [96.0, 98.37], [102.0, 112.41], [115.0, 116.41], [119.0, 119.87], [121.0, 121.88], [130.0, 132.48], [133.0, 137.19], [137.0, 137.52], [138.0, 144.98], [147.0, 160.89], [165.0, 167.9], [168.0, 170.18], [172.0, 174.65]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, true, true], "silence_prob": [33.56, 0.0, 0.0, 0.0, 66.76, 0.0, 36.61, 0.0, 68.8, 39.8, 0.0, 0.0, 41.52, 36.42, 0.0, 0.0, 0.0, 0.0, 0.0, 62.47, 40.48, 0.0, 0.0, 0.0, 53.65, 29.99, 0.0, 29.41, 36.98, 40.38, 41.18, 30.03], "audiomae_on_audioset": [[["hum", 59.61], ["mains hum", 30.69], ["throbbing", 6.75]], null, null, null, null, null, [["hum", 21.3], ["whale vocalization", 17.31], ["cattle, bovinae", 11.52]], null, null, [["speech", 75.62], ["sidetone", 7.96], ["radio", 2.77]], null, null, [["stomach rumble", 45.24], ["speech", 17.37], ["whale vocalization", 7.16]], [["sidetone", 69.1], ["hum", 9.0], ["music", 5.58]], null, null, null, null, null, null, [["hum", 41.62], ["speech", 25.15], ["mains hum", 7.49]], null, null, null, null, [["speech", 32.58], ["bee, wasp, etc.", 9.01], ["fly, housefly", 7.14]], null, [["speech", 43.04], ["animal", 9.46], ["outside, rural or natural", 5.1]], [["hum", 41.38], ["throbbing", 29.67], ["music", 6.03]], [["speech", 31.53], ["gong", 11.36], ["hum", 8.96]], [["speech", 36.86], ["hum", 20.67], ["whale vocalization", 8.56]], [["speech", 64.04], ["outside, rural or natural", 3.24], ["rumble", 2.01]]], "duration": [7.97, 0.76, 0.77, 1.01, 4.8, 1.62, 2.71, 0.85, 3.31, 6.21, 0.61, 1.07, 3.8, 2.31, 0.63, 1.45, 1.23, 1.91, 1.21, 2.37, 10.41, 1.41, 0.87, 0.88, 2.48, 4.19, 0.52, 6.98, 13.89, 2.9, 2.18, 2.65]} \ No newline at end of file diff --git a/annotations_1/qvvcVzNqXVg_filtered.json b/annotations_1/qvvcVzNqXVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41e68efb62a36ca80d35b4887087d928722a7499 --- /dev/null +++ b/annotations_1/qvvcVzNqXVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.49], [32.0, 35.6], [37.0, 37.62], [52.0, 52.14], [53.0, 54.04], [76.0, 76.33], [88.0, 90.91], [92.0, 92.18], [97.0, 98.58], [100.0, 100.77], [101.0, 103.0], [107.0, 109.44], [110.0, 110.57], [119.0, 120.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 33.06, 0.0, 0.0, 0.0, 0.0, 72.31, 0.0, 0.0, 0.0, 53.16, 34.57, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 72.92], ["boing", 4.02], ["snicker", 3.92]], null, null, null, null, null, null, null, null, null, [["music", 57.44], ["synthesizer", 3.97], ["musical instrument", 3.64]], null, null], "duration": [0.49, 3.6, 0.62, 0.14, 1.04, 0.33, 2.91, 0.18, 1.58, 0.77, 2.0, 2.44, 0.57, 1.92]} \ No newline at end of file diff --git a/annotations_1/qwwLKFCR4K0_filtered.json b/annotations_1/qwwLKFCR4K0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53ceac545e0e1a5c711887a802b257c09ae6c905 --- /dev/null +++ b/annotations_1/qwwLKFCR4K0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.09]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [1.09]} \ No newline at end of file diff --git a/annotations_1/qyXpj-yVjVg_filtered.json b/annotations_1/qyXpj-yVjVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78a1e6018baf2142831163b0640a1bc6518851e4 --- /dev/null +++ b/annotations_1/qyXpj-yVjVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.98], [21.0, 27.57], [28.0, 31.48], [32.0, 36.78], [38.0, 39.41], [40.0, 41.89], [47.0, 49.06], [51.0, 51.09], [54.0, 55.8], [57.0, 58.89], [61.0, 60.62], [64.0, 68.91], [70.0, 72.42], [76.0, 77.3], [79.0, 80.86], [82.0, 82.26], [84.0, 85.77], [87.0, 87.44], [88.0, 88.86], [90.0, 90.21], [92.0, 92.64], [93.0, 93.75], [96.0, 97.09], [101.0, 106.81], [108.0, 109.11], [111.0, 112.16], [113.0, 112.95], [113.0, 114.24], [115.0, 116.36], [117.0, 118.67], [120.0, 120.85], [123.0, 123.58], [124.0, 124.88], [127.0, 127.45], [129.0, 129.05], [130.0, 131.31], [133.0, 133.79], [134.0, 134.96], [136.0, 136.61], [138.0, 138.3], [141.0, 142.82]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.62, 51.82, 77.53, 88.83, 0.0, 0.0, 81.53, 0.0, 0.0, 0.0, 0.0, 46.61, 58.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 47.4], ["speech", 12.35], ["door", 3.9]], null, null, null, null, null, null, null, null, null, null, [["music", 30.33], ["didgeridoo", 14.43], ["mains hum", 12.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.98, 6.57, 3.48, 4.78, 1.41, 1.89, 2.06, 0.09, 1.8, 1.89, -0.38, 4.91, 2.42, 1.3, 1.86, 0.26, 1.77, 0.44, 0.86, 0.21, 0.64, 0.75, 1.09, 5.81, 1.11, 1.16, -0.05, 1.24, 1.36, 1.67, 0.85, 0.58, 0.88, 0.45, 0.05, 1.31, 0.79, 0.96, 0.61, 0.3, 1.82]} \ No newline at end of file diff --git a/annotations_1/qyZXW5Md1HM_filtered.json b/annotations_1/qyZXW5Md1HM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bbe14f204df4538ff2ec3aa8910a949f1732a8c --- /dev/null +++ b/annotations_1/qyZXW5Md1HM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 26.55], [27.0, 28.75], [31.0, 38.62], [50.0, 49.72], [50.0, 53.33], [58.0, 57.94], [64.0, 79.46], [80.0, 94.53], [98.0, 113.53], [115.0, 144.07]], "keep_status": [true, false, false, false, true, false, false, true, false, false], "silence_prob": [30.57, 0.0, 32.53, 0.0, 31.59, 0.0, 31.48, 46.4, 62.07, 36.86], "audiomae_on_audioset": [[["music", 29.42], ["grunt", 12.8], ["speech", 11.34]], null, [["music", 67.53], ["plop", 16.94], ["bass guitar", 2.01]], null, [["speech", 30.63], ["music", 13.24], ["cattle, bovinae", 12.34]], null, [["music", 85.83], ["plop", 1.82], ["bass guitar", 1.11]], [["speech", 14.72], ["hoot", 7.95], ["whimper", 6.41]], null, [["dial tone", 49.58], ["busy signal", 17.26], ["music", 10.29]]], "duration": [3.55, 1.75, 7.62, -0.28, 3.33, -0.06, 15.46, 14.53, 15.53, 29.07]} \ No newline at end of file diff --git a/annotations_1/qyvR5lglbTE_filtered.json b/annotations_1/qyvR5lglbTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7289cad99be09eb2dd88121764ae56cf906e3aa1 --- /dev/null +++ b/annotations_1/qyvR5lglbTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.76], [3.0, 3.64], [4.0, 5.85], [7.0, 9.05], [10.0, 23.97], [25.0, 25.78], [26.0, 35.67], [36.0, 54.36]], "keep_status": [false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 49.36, 28.43, 0.0, 29.09, 28.91], "audiomae_on_audioset": [null, null, null, [["music", 59.81], ["throbbing", 5.3], ["synthesizer", 3.89]], [["vehicle", 43.56], ["speech", 15.69], ["car", 15.03]], null, [["speech", 56.86], ["hum", 12.94], ["music", 10.87]], [["speech", 23.82], ["music", 18.31], ["mains hum", 10.52]]], "duration": [0.76, 0.64, 1.85, 2.05, 13.97, 0.78, 9.67, 18.36]} \ No newline at end of file diff --git a/annotations_1/qzQdwPNUcME_filtered.json b/annotations_1/qzQdwPNUcME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9f9ce998f314abdcb314f14189ef6fbe11f4fb6 --- /dev/null +++ b/annotations_1/qzQdwPNUcME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 13.24], [16.0, 17.24], [18.0, 18.44], [34.0, 37.25], [38.0, 38.25], [40.0, 50.31], [51.0, 53.4], [53.0, 54.94], [56.0, 57.42], [81.0, 81.58], [82.0, 82.75], [83.0, 83.52], [85.0, 85.68], [87.0, 86.66], [87.0, 88.65], [89.0, 90.12], [91.0, 94.04], [98.0, 99.2], [104.0, 104.68], [134.0, 134.94], [149.0, 150.42], [151.0, 153.2], [156.0, 156.83], [158.0, 162.77], [164.0, 166.04]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [47.9, 0.0, 0.0, 31.98, 0.0, 74.76, 53.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 0.0, 0.0, 29.23, 0.0, 27.91, 64.29], "audiomae_on_audioset": [[["fart", 75.97], ["noise", 5.7], ["speech", 5.22]], null, null, [["moo", 23.12], ["speech", 20.34], ["cattle, bovinae", 20.09]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.28], ["didgeridoo", 12.6], ["musical instrument", 2.95]], null, [["speech", 39.2], ["screaming", 10.7], ["explosion", 5.85]], null], "duration": [7.24, 1.24, 0.44, 3.25, 0.25, 10.31, 2.4, 1.94, 1.42, 0.58, 0.75, 0.52, 0.68, -0.34, 1.65, 1.12, 3.04, 1.2, 0.68, 0.94, 1.42, 2.2, 0.83, 4.77, 2.04]} \ No newline at end of file diff --git a/annotations_1/r-IE6wNNbAI_filtered.json b/annotations_1/r-IE6wNNbAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5b3eef65f108ab4bfaf462efb7520529345f1ee --- /dev/null +++ b/annotations_1/r-IE6wNNbAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.43], [4.0, 5.86], [9.0, 10.49], [11.0, 10.93], [24.0, 24.56], [42.0, 47.68], [49.0, 50.75], [52.0, 54.01], [61.0, 60.91], [64.0, 72.03], [73.0, 75.66], [85.0, 105.49], [106.0, 106.61], [108.0, 119.53], [121.0, 122.62], [124.0, 136.93], [138.0, 140.34], [142.0, 154.62]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.66, 0.0, 37.67, 0.0, 31.79, 33.31, 35.22, 0.0, 31.71, 0.0, 33.06, 37.46, 30.36], "audiomae_on_audioset": [null, null, null, null, null, [["music", 20.35], ["speech", 17.84], ["didgeridoo", 13.13]], null, [["music", 79.07], ["musical instrument", 2.48], ["throbbing", 1.94]], null, [["music", 40.14], ["moo", 9.52], ["cattle, bovinae", 8.01]], [["music", 35.19], ["speech", 8.9], ["carnatic music", 4.34]], [["music", 84.39], ["reggae", 1.01], ["funny music", 0.84]], null, [["music", 41.49], ["buzz", 28.27], ["breaking", 9.09]], null, [["music", 62.76], ["speech", 16.05], ["boing", 2.68]], [["music", 68.05], ["speech", 4.58], ["electronic music", 2.4]], [["music", 49.29], ["hum", 13.3], ["throbbing", 6.96]]], "duration": [0.43, 1.86, 1.49, -0.07, 0.56, 5.68, 1.75, 2.01, -0.09, 8.03, 2.66, 20.49, 0.61, 11.53, 1.62, 12.93, 2.34, 12.62]} \ No newline at end of file diff --git a/annotations_1/r0eg-ieT77g_filtered.json b/annotations_1/r0eg-ieT77g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd9cf3e2864417ad1775d4eaf87ce140deee02d2 --- /dev/null +++ b/annotations_1/r0eg-ieT77g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.91], [12.0, 15.62], [18.0, 22.0], [25.0, 26.4], [29.0, 35.92], [39.0, 42.72], [43.0, 46.77], [54.0, 55.38], [57.0, 60.2], [61.0, 68.17], [72.0, 71.85], [74.0, 74.66], [75.0, 83.44], [85.0, 86.53], [91.0, 96.43], [100.0, 111.27], [115.0, 135.24], [140.0, 140.86], [143.0, 144.24], [148.0, 155.34], [156.0, 161.67], [166.0, 166.06]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.05, 32.45, 31.45, 0.0, 33.91, 64.86, 36.15, 0.0, 38.75, 31.39, 0.0, 0.0, 31.13, 0.0, 31.09, 31.37, 30.38, 0.0, 0.0, 32.52, 31.25, 0.0], "audiomae_on_audioset": [[["music", 60.12], ["hum", 6.73], ["throbbing", 3.75]], [["music", 50.72], ["electronic music", 6.42], ["noise", 5.48]], [["music", 32.17], ["speech", 28.13], ["throbbing", 4.23]], null, [["music", 63.13], ["throbbing", 8.8], ["didgeridoo", 5.85]], null, [["music", 50.1], ["boing", 32.52], ["didgeridoo", 1.94]], null, [["music", 54.09], ["theremin", 22.01], ["noise", 5.21]], [["music", 85.3], ["throbbing", 3.44], ["boing", 1.71]], null, null, [["music", 58.12], ["speech", 13.35], ["sidetone", 10.57]], null, [["music", 38.52], ["hum", 17.3], ["throbbing", 15.14]], [["music", 89.05], ["electronic music", 1.4], ["throbbing", 0.89]], [["music", 63.91], ["throbbing", 8.86], ["hum", 6.64]], null, null, [["music", 61.28], ["electronic music", 10.1], ["synthesizer", 5.39]], [["sidetone", 45.35], ["music", 21.03], ["hum", 10.12]], null], "duration": [8.91, 3.62, 4.0, 1.4, 6.92, 3.72, 3.77, 1.38, 3.2, 7.17, -0.15, 0.66, 8.44, 1.53, 5.43, 11.27, 20.24, 0.86, 1.24, 7.34, 5.67, 0.06]} \ No newline at end of file diff --git a/annotations_1/r12JlwSBvVQ_filtered.json b/annotations_1/r12JlwSBvVQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a079be838732742d5119d1132f45b07503653b42 --- /dev/null +++ b/annotations_1/r12JlwSBvVQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.04], [14.0, 16.68], [34.0, 42.38], [53.0, 53.74], [66.0, 68.45], [75.0, 76.27], [77.0, 80.77], [82.0, 82.93], [84.0, 85.28], [98.0, 98.63], [101.0, 102.41], [112.0, 121.58], [126.0, 126.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 68.54, 62.37, 0.0, 82.79, 0.0, 50.06, 0.0, 0.0, 0.0, 0.0, 44.43, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.65], ["applause", 7.29], ["male speech, man speaking", 1.36]], null], "duration": [1.04, 2.68, 8.38, 0.74, 2.45, 1.27, 3.77, 0.93, 1.28, 0.63, 1.41, 9.58, 0.06]} \ No newline at end of file diff --git a/annotations_1/r1N-Xby5AnA_filtered.json b/annotations_1/r1N-Xby5AnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57057f5bec4528181dfdbeb6ef82de3f716a4d3b --- /dev/null +++ b/annotations_1/r1N-Xby5AnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.02], [8.0, 8.48], [11.0, 20.11], [21.0, 21.12], [23.0, 23.31], [25.0, 27.16], [29.0, 48.61], [50.0, 50.79], [52.0, 53.76], [55.0, 69.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 53.53, 0.0, 0.0, 92.8, 34.61, 0.0, 0.0, 33.16], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 74.79], ["throbbing", 2.97], ["synthesizer", 2.14]], null, null, [["music", 63.41], ["speech", 9.89], ["throbbing", 2.77]]], "duration": [0.02, 0.48, 9.11, 0.12, 0.31, 2.16, 19.61, 0.79, 1.76, 14.15]} \ No newline at end of file diff --git a/annotations_1/r1NUy3Rq8n4_filtered.json b/annotations_1/r1NUy3Rq8n4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7af9bd37bedf85f4caa919d974fcb1935f4c96c8 --- /dev/null +++ b/annotations_1/r1NUy3Rq8n4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.65], [21.0, 22.28], [23.0, 23.36], [41.0, 42.2], [51.0, 52.68], [54.0, 54.87], [55.0, 56.88], [59.0, 60.84], [71.0, 73.55], [74.0, 75.25], [78.0, 83.32], [86.0, 89.04], [93.0, 97.83], [99.0, 100.53]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.46, 0.0, 32.85, 33.08, 35.04, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 21.34], ["throbbing", 14.72], ["hum", 9.6]], null, [["music", 38.95], ["speech", 20.84], ["electronic music", 4.11]], [["music", 49.14], ["sidetone", 10.45], ["electronic music", 4.07]], [["music", 60.84], ["speech", 7.71], ["sidetone", 3.9]], null], "duration": [0.65, 1.28, 0.36, 1.2, 1.68, 0.87, 1.88, 1.84, 2.55, 1.25, 5.32, 3.04, 4.83, 1.53]} \ No newline at end of file diff --git a/annotations_1/r29P93wUiMg_filtered.json b/annotations_1/r29P93wUiMg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..800b7b45c3a611e1f6cf9d490f35d0a20522b984 --- /dev/null +++ b/annotations_1/r29P93wUiMg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[98.0, 112.8], [118.0, 131.21]], "keep_status": [false, false], "silence_prob": [29.65, 29.91], "audiomae_on_audioset": [[["music", 29.07], ["throbbing", 28.26], ["hum", 16.06]], [["music", 30.73], ["throbbing", 29.76], ["hum", 15.25]]], "duration": [14.8, 13.21]} \ No newline at end of file diff --git a/annotations_1/r2GpJzIdoYQ_filtered.json b/annotations_1/r2GpJzIdoYQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba69a45351ab056373ddd5f56b5a4a64e60bf9c3 --- /dev/null +++ b/annotations_1/r2GpJzIdoYQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.62], [9.0, 9.51], [10.0, 12.6], [15.0, 16.46], [17.0, 19.41], [21.0, 28.9], [29.0, 30.47], [31.0, 31.8], [37.0, 38.01], [39.0, 39.85], [43.0, 44.12], [47.0, 50.53], [52.0, 59.73], [61.0, 91.96], [96.0, 96.77], [99.0, 100.13], [102.0, 104.09], [105.0, 105.66], [106.0, 108.24], [109.0, 138.3], [139.0, 148.2], [149.0, 150.36], [151.0, 151.68], [154.0, 154.85], [157.0, 159.06], [160.0, 161.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 56.03, 0.0, 82.43, 95.23, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 96.66, 0.0, 0.0, 0.0, 98.51, 0.0, 88.46, 33.41, 41.98, 0.0, 0.0, 0.0, 59.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.83], ["ambient music", 10.8], ["hum", 4.91]], [["music", 73.08], ["musical instrument", 3.29], ["hum", 2.51]], null, null, null, null, null], "duration": [1.62, 0.51, 2.6, 1.46, 2.41, 7.9, 1.47, 0.8, 1.01, 0.85, 1.12, 3.53, 7.73, 30.96, 0.77, 1.13, 2.09, 0.66, 2.24, 29.3, 9.2, 1.36, 0.68, 0.85, 2.06, 1.15]} \ No newline at end of file diff --git a/annotations_1/r2RzBizjKT0_filtered.json b/annotations_1/r2RzBizjKT0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67a5ba5b950a320971d5dfb170756953693fd1b6 --- /dev/null +++ b/annotations_1/r2RzBizjKT0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.8], [7.0, 8.45], [10.0, 10.96], [12.0, 15.38], [16.0, 28.05], [29.0, 38.75], [48.0, 49.89], [51.0, 52.91], [54.0, 57.1], [59.0, 72.77], [75.0, 82.92], [84.0, 85.11], [86.0, 86.34], [89.0, 90.12], [94.0, 104.97], [105.0, 114.27], [115.0, 122.15], [122.0, 122.32], [122.0, 125.39], [127.0, 127.18], [129.0, 128.87], [131.0, 132.04], [135.0, 137.34], [141.0, 141.81], [149.0, 149.47], [150.0, 151.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 93.6, 59.51, 69.47, 0.0, 0.0, 61.37, 60.89, 67.89, 0.0, 0.0, 0.0, 51.44, 38.42, 76.04, 0.0, 43.74, 0.0, 0.0, 0.0, 67.38, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 36.25], ["cattle, bovinae", 32.45], ["moo", 13.65]], null, null, [["speech", 54.19], ["fly, housefly", 4.86], ["hum", 3.71]], null, null, null, null, null, null, null], "duration": [1.8, 1.45, 0.96, 3.38, 12.05, 9.75, 1.89, 1.91, 3.1, 13.77, 7.92, 1.11, 0.34, 1.12, 10.97, 9.27, 7.15, 0.32, 3.39, 0.18, -0.13, 1.04, 2.34, 0.81, 0.47, 1.34]} \ No newline at end of file diff --git a/annotations_1/r2fHzai5ih4_filtered.json b/annotations_1/r2fHzai5ih4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6896e5455c31f5f9f42e9910504e0ec813587dd2 --- /dev/null +++ b/annotations_1/r2fHzai5ih4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.94], [16.0, 16.65], [21.0, 21.41], [32.0, 32.04], [45.0, 45.91], [72.0, 72.82], [73.0, 75.52], [76.0, 75.84], [80.0, 81.41], [85.0, 85.36], [99.0, 100.43], [104.0, 104.73], [105.0, 106.57], [111.0, 113.59], [115.0, 117.09], [118.0, 120.02]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.75, 34.67, 60.51], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 32.03], ["music", 15.68], ["pulse", 7.91]], null, null, null, null, null, null, null, [["music", 34.27], ["theremin", 6.29], ["whale vocalization", 5.1]], null], "duration": [0.94, 0.65, 0.41, 0.04, 0.91, 0.82, 2.52, -0.16, 1.41, 0.36, 1.43, 0.73, 1.57, 2.59, 2.09, 2.02]} \ No newline at end of file diff --git a/annotations_1/r2x4QueC2As_filtered.json b/annotations_1/r2x4QueC2As_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/r2x4QueC2As_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/r3BS4jKjRkc_filtered.json b/annotations_1/r3BS4jKjRkc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b85c01ce188b3ec749b2c3ead2f12a7db7b7ad1b --- /dev/null +++ b/annotations_1/r3BS4jKjRkc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.89], [20.0, 23.9], [24.0, 29.29], [30.0, 34.1], [35.0, 44.76], [47.0, 54.24], [55.0, 55.68], [58.0, 60.67], [64.0, 67.83], [71.0, 89.68], [91.0, 95.1], [96.0, 105.11], [114.0, 115.18], [119.0, 129.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 76.2, 88.28, 97.83, 95.09, 88.28, 0.0, 53.84, 83.88, 57.25, 92.64, 87.37, 0.0, 85.17], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.89, 3.9, 5.29, 4.1, 9.76, 7.24, 0.68, 2.67, 3.83, 18.68, 4.1, 9.11, 1.18, 10.05]} \ No newline at end of file diff --git a/annotations_1/r3L0e0izKG4_filtered.json b/annotations_1/r3L0e0izKG4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b70276e20a52f0599147ac5761ef745474e9e29f --- /dev/null +++ b/annotations_1/r3L0e0izKG4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 55.86], [58.0, 70.53], [73.0, 85.31], [87.0, 87.91], [91.0, 92.57], [97.0, 97.9], [101.0, 117.91], [123.0, 122.94], [125.0, 127.31], [128.0, 132.54], [137.0, 138.35], [139.0, 139.56], [142.0, 142.55], [144.0, 143.95], [146.0, 147.21], [147.0, 148.56], [153.0, 154.31], [155.0, 155.73], [156.0, 166.63], [168.0, 179.61], [182.0, 184.62], [185.0, 185.75], [187.0, 253.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.11, 96.66, 0.0, 0.0, 0.0, 100.0, 0.0, 65.2, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.0, 99.85, 97.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [52.86, 12.53, 12.31, 0.91, 1.57, 0.9, 16.91, -0.06, 2.31, 4.54, 1.35, 0.56, 0.55, -0.05, 1.21, 1.56, 1.31, 0.73, 10.63, 11.61, 2.62, 0.75, 66.84]} \ No newline at end of file diff --git a/annotations_1/r3_IvtMPIi4_filtered.json b/annotations_1/r3_IvtMPIi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c841cca1789528a7fb0be25fe6f60d418de8346 --- /dev/null +++ b/annotations_1/r3_IvtMPIi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.16], [8.0, 10.57], [11.0, 16.95], [17.0, 35.46], [37.0, 43.97], [44.0, 44.78], [48.0, 49.37], [56.0, 58.77], [60.0, 61.32], [66.0, 66.29], [72.0, 72.72], [75.0, 76.72], [77.0, 79.35], [82.0, 83.1], [92.0, 93.38], [95.0, 96.33], [98.0, 99.54], [100.0, 107.91], [110.0, 118.76], [119.0, 121.51], [122.0, 122.62], [123.0, 123.6], [124.0, 129.3], [131.0, 131.52], [133.0, 138.94], [142.0, 152.79], [156.0, 155.68], [158.0, 158.67], [162.0, 164.07], [165.0, 165.43], [166.0, 182.14], [184.0, 185.43], [186.0, 189.73]], "keep_status": [false, true, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 30.92, 30.87, 30.47, 39.99, 0.0, 0.0, 40.02, 0.0, 0.0, 0.0, 0.0, 34.94, 0.0, 0.0, 0.0, 0.0, 38.86, 42.42, 36.94, 0.0, 0.0, 57.17, 0.0, 43.96, 47.74, 0.0, 0.0, 58.47, 0.0, 38.75, 0.0, 32.84], "audiomae_on_audioset": [null, [["music", 53.8], ["speech", 9.08], ["rattle (instrument)", 6.36]], [["music", 45.7], ["speech", 32.87], ["boing", 3.63]], [["music", 49.51], ["speech", 14.01], ["theremin", 10.49]], [["hum", 47.36], ["mains hum", 34.23], ["music", 4.06]], null, null, [["hum", 18.43], ["mains hum", 14.36], ["noise", 11.36]], null, null, null, null, [["speech", 32.15], ["music", 10.05], ["whale vocalization", 8.07]], null, null, null, null, [["speech", 51.62], ["music", 31.72], ["synthesizer", 2.49]], [["hum", 18.44], ["speech", 17.17], ["mains hum", 15.59]], [["speech", 29.25], ["sidetone", 28.94], ["hum", 5.31]], null, null, null, null, [["mains hum", 30.98], ["music", 22.38], ["hum", 15.01]], [["theremin", 58.98], ["music", 17.82], ["hum", 2.39]], null, null, null, null, [["music", 64.1], ["theremin", 8.88], ["hum", 5.44]], null, [["music", 33.22], ["owl", 9.92], ["hum", 8.07]]], "duration": [0.16, 2.57, 5.95, 18.46, 6.97, 0.78, 1.37, 2.77, 1.32, 0.29, 0.72, 1.72, 2.35, 1.1, 1.38, 1.33, 1.54, 7.91, 8.76, 2.51, 0.62, 0.6, 5.3, 0.52, 5.94, 10.79, -0.32, 0.67, 2.07, 0.43, 16.14, 1.43, 3.73]} \ No newline at end of file diff --git a/annotations_1/r3fnCEjvPCQ_filtered.json b/annotations_1/r3fnCEjvPCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7ea6402ae029739151cd472e579f80c3f04cb240 --- /dev/null +++ b/annotations_1/r3fnCEjvPCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.74], [8.0, 10.74], [11.0, 13.73], [14.0, 15.7], [16.0, 29.39]], "keep_status": [true, true, true, false, true], "silence_prob": [34.16, 36.55, 34.74, 0.0, 31.18], "audiomae_on_audioset": [[["music", 20.69], ["hum", 19.68], ["mains hum", 12.93]], [["music", 28.29], ["hum", 12.49], ["speech", 6.9]], [["moo", 19.99], ["cattle, bovinae", 17.23], ["livestock, farm animals, working animals", 12.26]], null, [["hum", 20.61], ["throbbing", 12.85], ["buzz", 10.8]]], "duration": [2.74, 2.74, 2.73, 1.7, 13.39]} \ No newline at end of file diff --git a/annotations_1/r5ilcq9hUZI_filtered.json b/annotations_1/r5ilcq9hUZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f57ebea22616bdf1bce5ea32ced9fba3b4bcb26f --- /dev/null +++ b/annotations_1/r5ilcq9hUZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [7.0, 8.26], [20.0, 23.75], [25.0, 25.83], [28.0, 30.18], [33.0, 33.51], [37.0, 38.08], [41.0, 52.34], [55.0, 56.46], [60.0, 60.3], [61.0, 61.59], [62.0, 63.04], [65.0, 66.41], [67.0, 67.31], [69.0, 69.9], [75.0, 76.64], [79.0, 80.59], [81.0, 84.54], [92.0, 93.58], [96.0, 97.21], [108.0, 109.27], [113.0, 114.47], [115.0, 117.93], [127.0, 132.73], [133.0, 135.5], [137.0, 143.43], [144.0, 145.71], [149.0, 150.9], [153.0, 153.54], [155.0, 162.11], [163.0, 166.7], [167.0, 170.16], [170.0, 174.24], [175.0, 176.64], [178.0, 182.09], [187.0, 188.72], [189.0, 194.31], [195.0, 196.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 76.37, 0.0, 99.82, 0.0, 0.0, 91.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 44.07, 28.91, 52.74, 99.98, 0.0, 0.0, 0.0, 72.46, 99.85, 87.74, 43.85, 0.0, 90.25, 0.0, 45.52, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.31], ["sine wave", 29.07], ["chirp tone", 6.82]], [["crack", 27.78], ["breaking", 11.01], ["animal", 7.31]], null, null, null, null, null, null, null, null, [["speech", 52.24], ["singing bowl", 12.96], ["tuning fork", 10.4]], null, null, null, [["hum", 41.39], ["speech", 31.81], ["throbbing", 8.62]], null], "duration": [1.1, 1.26, 3.75, 0.83, 2.18, 0.51, 1.08, 11.34, 1.46, 0.3, 0.59, 1.04, 1.41, 0.31, 0.9, 1.64, 1.59, 3.54, 1.58, 1.21, 1.27, 1.47, 2.93, 5.73, 2.5, 6.43, 1.71, 1.9, 0.54, 7.11, 3.7, 3.16, 4.24, 1.64, 4.09, 1.72, 5.31, 1.16]} \ No newline at end of file diff --git a/annotations_1/r5zhPLNGAOE_filtered.json b/annotations_1/r5zhPLNGAOE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bbda6f4a6e608eaa1f1e2eba8345ee0ab29a676 --- /dev/null +++ b/annotations_1/r5zhPLNGAOE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [6.0, 7.5], [10.0, 11.45], [19.0, 19.06], [20.0, 20.75], [22.0, 22.77], [24.0, 38.52], [41.0, 71.58], [74.0, 87.93], [91.0, 92.06], [99.0, 99.49], [100.0, 102.96], [105.0, 108.43], [111.0, 121.32], [124.0, 124.93], [127.0, 127.72], [130.0, 138.08], [141.0, 141.24], [144.0, 144.04], [146.0, 149.86], [153.0, 155.16], [159.0, 160.08], [163.0, 164.83], [166.0, 167.34], [170.0, 172.29], [175.0, 176.4], [177.0, 180.74], [181.0, 182.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.63, 0.0, 32.26, 0.0, 0.0, 44.46, 39.22, 95.09, 0.0, 0.0, 83.52, 0.0, 0.0, 96.04, 97.64, 0.0, 0.0, 0.0, 81.89, 0.0, 67.51, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 62.09], ["throbbing", 5.02], ["hum", 4.48]], null, [["whale vocalization", 38.56], ["speech", 35.85], ["music", 6.47]], null, null, [["throbbing", 34.94], ["hum", 31.35], ["music", 13.77]], [["hum", 38.67], ["music", 19.03], ["mains hum", 16.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.38, 1.5, 1.45, 0.06, 0.75, 0.77, 14.52, 30.58, 13.93, 1.06, 0.49, 2.96, 3.43, 10.32, 0.93, 0.72, 8.08, 0.24, 0.04, 3.86, 2.16, 1.08, 1.83, 1.34, 2.29, 1.4, 3.74, 1.6]} \ No newline at end of file diff --git a/annotations_1/r67faKKQyO4_filtered.json b/annotations_1/r67faKKQyO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..542dfbfb59fc45e658263de089c3e0e6cffa2742 --- /dev/null +++ b/annotations_1/r67faKKQyO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.56], [5.0, 6.94], [9.0, 11.33], [15.0, 20.53], [28.0, 29.32], [36.0, 45.94], [47.0, 49.55], [52.0, 60.27], [65.0, 64.89], [69.0, 70.09], [74.0, 80.49], [81.0, 96.13], [98.0, 100.84], [106.0, 113.46], [114.0, 114.39], [120.0, 143.33], [148.0, 152.34], [153.0, 158.73], [164.0, 172.44], [173.0, 173.69], [174.0, 174.46], [178.0, 181.38]], "keep_status": [false, false, true, true, false, false, true, true, false, false, true, true, true, false, false, false, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 32.48, 33.12, 0.0, 33.67, 41.78, 36.06, 0.0, 0.0, 35.08, 34.34, 33.14, 35.94, 0.0, 32.89, 34.66, 31.93, 30.97, 0.0, 0.0, 30.34], "audiomae_on_audioset": [null, null, [["mosquito", 30.83], ["moo", 14.33], ["boing", 10.3]], [["music", 25.98], ["whack, thwack", 21.18], ["fly, housefly", 8.89]], null, [["livestock, farm animals, working animals", 37.7], ["cattle, bovinae", 26.34], ["ding", 12.99]], [["cattle, bovinae", 18.73], ["livestock, farm animals, working animals", 17.84], ["moo", 14.15]], [["music", 38.8], ["boing", 12.05], ["speech", 5.47]], null, null, [["music", 26.93], ["fly, housefly", 19.04], ["breaking", 8.96]], [["hum", 36.82], ["mains hum", 15.69], ["fly, housefly", 10.01]], [["music", 47.47], ["boing", 7.97], ["speech", 3.98]], [["music", 63.02], ["boing", 9.4], ["whip", 7.51]], null, [["speech", 61.0], ["music", 14.19], ["fart", 7.92]], [["mosquito", 61.99], ["fly, housefly", 17.43], ["insect", 3.26]], [["music", 36.64], ["speech", 11.6], ["throbbing", 8.68]], [["music", 35.32], ["noise", 12.68], ["synthesizer", 10.51]], null, null, [["music", 14.6], ["crowd", 10.52], ["whale vocalization", 8.65]]], "duration": [0.56, 1.94, 2.33, 5.53, 1.32, 9.94, 2.55, 8.27, -0.11, 1.09, 6.49, 15.13, 2.84, 7.46, 0.39, 23.33, 4.34, 5.73, 8.44, 0.69, 0.46, 3.38]} \ No newline at end of file diff --git a/annotations_1/r76peMNNiyw_filtered.json b/annotations_1/r76peMNNiyw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bef6d53952800c293deb7e75343ca992665c46a --- /dev/null +++ b/annotations_1/r76peMNNiyw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.56], [19.0, 22.05], [23.0, 24.14], [26.0, 26.11], [28.0, 29.52], [31.0, 32.51]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 55.31, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.56, 3.05, 1.14, 0.11, 1.52, 1.51]} \ No newline at end of file diff --git a/annotations_1/r7aXjBDUk8w_filtered.json b/annotations_1/r7aXjBDUk8w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..642171687e5673c8708344d7738c2b48407f404e --- /dev/null +++ b/annotations_1/r7aXjBDUk8w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.74], [15.0, 15.72], [18.0, 20.22], [22.0, 22.52], [28.0, 32.17], [42.0, 41.88], [49.0, 50.99], [51.0, 51.48], [56.0, 66.07], [68.0, 68.47], [71.0, 74.33], [75.0, 75.46], [76.0, 80.49], [82.0, 91.0], [91.0, 106.78]], "keep_status": [false, false, true, false, true, false, false, false, false, false, true, false, true, true, false], "silence_prob": [64.75, 0.0, 42.35, 0.0, 42.58, 0.0, 0.0, 0.0, 37.01, 0.0, 35.24, 0.0, 35.94, 35.11, 32.06], "audiomae_on_audioset": [null, null, [["sidetone", 16.02], ["fly, housefly", 13.64], ["speech", 10.45]], null, [["music", 43.98], ["hum", 11.83], ["throbbing", 8.89]], null, null, null, [["music", 65.5], ["brass instrument", 5.16], ["musical instrument", 4.95]], null, [["music", 54.16], ["hum", 9.91], ["theremin", 4.9]], null, [["music", 41.57], ["speech", 16.93], ["fly, housefly", 8.44]], [["music", 40.03], ["buzz", 15.82], ["trombone", 10.65]], [["music", 61.88], ["music of latin america", 6.45], ["flamenco", 3.85]]], "duration": [2.74, 0.72, 2.22, 0.52, 4.17, -0.12, 1.99, 0.48, 10.07, 0.47, 3.33, 0.46, 4.49, 9.0, 15.78]} \ No newline at end of file diff --git a/annotations_1/r8-BFx3xFJ4_filtered.json b/annotations_1/r8-BFx3xFJ4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4cbf1b059b55f889653980218abdfd413a7bf047 --- /dev/null +++ b/annotations_1/r8-BFx3xFJ4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[52.0, 64.67], [65.0, 65.64], [67.0, 67.24], [68.0, 69.5], [75.0, 75.69], [77.0, 81.45], [83.0, 91.45], [98.0, 98.39], [100.0, 100.35], [101.0, 114.1], [115.0, 116.87], [139.0, 147.46], [148.0, 148.22], [159.0, 159.95], [162.0, 162.43], [164.0, 165.96], [171.0, 172.81], [174.0, 174.68], [176.0, 175.86], [176.0, 181.94]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [30.42, 0.0, 0.0, 0.0, 0.0, 31.39, 32.13, 0.0, 0.0, 30.55, 0.0, 32.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.72], "audiomae_on_audioset": [[["music", 49.7], ["throbbing", 15.88], ["speech", 8.49]], null, null, null, null, [["music", 57.54], ["speech", 9.65], ["hum", 6.25]], [["music", 32.0], ["throbbing", 31.16], ["hum", 13.2]], null, null, [["music", 56.09], ["speech", 10.35], ["hum", 3.53]], null, [["hum", 26.89], ["music", 25.87], ["throbbing", 16.63]], null, null, null, null, null, null, null, null], "duration": [12.67, 0.64, 0.24, 1.5, 0.69, 4.45, 8.45, 0.39, 0.35, 13.1, 1.87, 8.46, 0.22, 0.95, 0.43, 1.96, 1.81, 0.68, -0.14, 5.94]} \ No newline at end of file diff --git a/annotations_1/r86n2JRUyRc_filtered.json b/annotations_1/r86n2JRUyRc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..760b0f81a9c7739e78c5fc54741372ae10186bda --- /dev/null +++ b/annotations_1/r86n2JRUyRc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.83], [14.0, 13.91], [29.0, 29.98], [32.0, 42.97], [45.0, 88.25], [91.0, 97.02], [99.0, 99.49], [102.0, 112.62], [121.0, 121.58], [128.0, 128.66], [150.0, 149.96], [156.0, 159.11], [159.0, 159.26], [159.0, 159.33], [159.0, 159.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.09, 0.0, 34.41, 0.0, 30.58, 0.0, 0.0, 0.0, 34.71, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 56.61], ["throbbing", 15.86], ["hum", 5.28]], null, [["music", 46.31], ["throbbing", 12.48], ["speech", 11.9]], null, [["music", 39.24], ["smash, crash", 20.44], ["speech", 13.55]], null, null, null, [["speech", 56.99], ["whip", 7.59], ["hubbub, speech noise, speech babble", 4.11]], null, null, null], "duration": [0.83, -0.09, 0.98, 10.97, 43.25, 6.02, 0.49, 10.62, 0.58, 0.66, -0.04, 3.11, 0.26, 0.33, 0.44]} \ No newline at end of file diff --git a/annotations_1/r8swYmKUGJ0_filtered.json b/annotations_1/r8swYmKUGJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5623240b61b849eeb0c5f66814bba5a30395a09f --- /dev/null +++ b/annotations_1/r8swYmKUGJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.2], [40.0, 40.68], [49.0, 49.17], [53.0, 53.16], [55.0, 55.71], [58.0, 57.74], [65.0, 65.84]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [0.2, 0.68, 0.17, 0.16, 0.71, -0.26, 0.84]} \ No newline at end of file diff --git a/annotations_1/r8uOQupi1iQ_filtered.json b/annotations_1/r8uOQupi1iQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37fc61bcaca6be8a010867cc3db34ed1dd71c1e2 --- /dev/null +++ b/annotations_1/r8uOQupi1iQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.42], [18.0, 20.09], [21.0, 22.94], [25.0, 25.52], [26.0, 30.7], [36.0, 36.1], [37.0, 38.4], [47.0, 47.34], [50.0, 50.3], [52.0, 52.44], [55.0, 55.43], [58.0, 61.52], [66.0, 66.95], [68.0, 68.54], [70.0, 72.06], [74.0, 79.76], [83.0, 84.96], [88.0, 88.84], [92.0, 94.47], [96.0, 96.72], [99.0, 101.41], [106.0, 106.44], [106.0, 106.66], [107.0, 106.69], [107.0, 109.31]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, false, true], "silence_prob": [29.69, 33.57, 0.0, 0.0, 29.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.73, 0.0, 0.0, 41.32, 34.54, 0.0, 0.0, 52.68, 0.0, 77.87, 0.0, 0.0, 0.0, 34.97], "audiomae_on_audioset": [[["speech", 51.49], ["music", 25.98], ["whack, thwack", 1.67]], [["music", 41.87], ["hum", 18.67], ["throbbing", 16.07]], null, null, [["speech", 42.2], ["music", 13.93], ["whack, thwack", 9.32]], null, null, null, null, null, null, [["music", 22.23], ["speech", 20.28], ["crushing", 11.22]], null, null, [["cattle, bovinae", 26.83], ["moo", 14.8], ["livestock, farm animals, working animals", 11.85]], [["music", 14.51], ["insect", 12.0], ["fly, housefly", 10.26]], null, null, null, null, null, null, null, null, [["sound effect", 17.1], ["music", 12.2], ["whack, thwack", 9.88]]], "duration": [6.42, 2.09, 1.94, 0.52, 4.7, 0.1, 1.4, 0.34, 0.3, 0.44, 0.43, 3.52, 0.95, 0.54, 2.06, 5.76, 1.96, 0.84, 2.47, 0.72, 2.41, 0.44, 0.66, -0.31, 2.31]} \ No newline at end of file diff --git a/annotations_1/r9ae_frgcpU_filtered.json b/annotations_1/r9ae_frgcpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0240edc9a2a95beef6db4af0e87994eba0938040 --- /dev/null +++ b/annotations_1/r9ae_frgcpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.05], [8.0, 19.45], [22.0, 58.11], [59.0, 63.31], [64.0, 66.41], [69.0, 72.71], [73.0, 74.01], [76.0, 77.5], [78.0, 78.49], [81.0, 81.24], [82.0, 82.17], [82.0, 82.8], [85.0, 87.76], [89.0, 89.56], [91.0, 90.88], [92.0, 103.22], [105.0, 108.85], [113.0, 114.61], [116.0, 117.81], [120.0, 120.82], [122.0, 123.15], [127.0, 128.06], [129.0, 130.98], [133.0, 137.29], [138.0, 138.86], [142.0, 148.49], [149.0, 150.25], [152.0, 153.3], [156.0, 157.11], [161.0, 167.56]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, true, false, true, false, false, false, true], "silence_prob": [31.76, 29.63, 0.0, 48.82, 77.7, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.05, 0.0, 0.0, 30.39, 36.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.41, 0.0, 38.68, 0.0, 0.0, 0.0, 44.07], "audiomae_on_audioset": [[["vehicle", 19.13], ["car", 4.31], ["outside, urban or manmade", 4.15]], [["buzz", 15.15], ["music", 10.3], ["noise", 8.7]], null, [["music", 36.25], ["hum", 13.53], ["whale vocalization", 7.59]], null, null, null, null, null, null, null, null, [["speech", 51.18], ["hum", 13.09], ["sonar", 4.42]], null, null, [["whack, thwack", 30.39], ["clang", 16.73], ["ding", 12.45]], [["hum", 17.04], ["throbbing", 15.99], ["music", 10.49]], null, null, null, null, null, null, [["music", 53.03], ["speech", 5.05], ["musical instrument", 4.87]], null, [["hum", 28.21], ["mains hum", 13.81], ["bee, wasp, etc.", 11.84]], null, null, null, [["music", 35.69], ["speech", 25.11], ["didgeridoo", 8.3]]], "duration": [2.05, 11.45, 36.11, 4.31, 2.41, 3.71, 1.01, 1.5, 0.49, 0.24, 0.17, 0.8, 2.76, 0.56, -0.12, 11.22, 3.85, 1.61, 1.81, 0.82, 1.15, 1.06, 1.98, 4.29, 0.86, 6.49, 1.25, 1.3, 1.11, 6.56]} \ No newline at end of file diff --git a/annotations_1/rA69NDoXRhI_filtered.json b/annotations_1/rA69NDoXRhI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..344807f9d78727251d18de60dc4bc6ac77b4de5c --- /dev/null +++ b/annotations_1/rA69NDoXRhI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 14.39], [19.0, 20.07], [22.0, 45.2], [49.0, 49.99], [52.0, 53.45], [55.0, 55.48], [56.0, 57.15], [59.0, 60.18], [65.0, 66.02], [67.0, 67.63], [77.0, 78.56], [79.0, 79.44], [82.0, 82.68], [93.0, 94.42], [96.0, 96.48], [103.0, 107.86], [109.0, 110.25], [115.0, 115.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.98, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.66, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 48.2], ["singing bowl", 20.54], ["music", 10.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.39, 1.07, 23.2, 0.99, 1.45, 0.48, 1.15, 1.18, 1.02, 0.63, 1.56, 0.44, 0.68, 1.42, 0.48, 4.86, 1.25, 0.77]} \ No newline at end of file diff --git a/annotations_1/rA6AZeHyw8Q_filtered.json b/annotations_1/rA6AZeHyw8Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6fd39a06d7e72d1cd2f521c375af5755fc52909 --- /dev/null +++ b/annotations_1/rA6AZeHyw8Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 13.39], [17.0, 25.79], [28.0, 39.04], [41.0, 63.91], [65.0, 65.87], [67.0, 67.86], [69.0, 70.06], [70.0, 73.25], [73.0, 73.3], [74.0, 74.33], [77.0, 84.33], [86.0, 85.73], [86.0, 102.41], [104.0, 131.55], [133.0, 132.68], [133.0, 132.8], [133.0, 155.11], [157.0, 167.98], [170.0, 170.95], [172.0, 173.33]], "keep_status": [true, false, true, true, false, false, false, true, false, false, true, false, true, true, false, false, false, false, false, false], "silence_prob": [42.06, 44.32, 40.95, 46.29, 0.0, 0.0, 0.0, 40.19, 0.0, 0.0, 46.75, 0.0, 49.97, 46.26, 0.0, 0.0, 48.19, 65.09, 0.0, 0.0], "audiomae_on_audioset": [[["music", 56.95], ["didgeridoo", 4.28], ["electronic music", 3.48]], [["music", 65.27], ["musical instrument", 5.42], ["synthesizer", 2.26]], [["music", 62.24], ["electronic music", 4.2], ["speech", 3.51]], [["music", 31.9], ["sidetone", 8.75], ["cattle, bovinae", 8.37]], null, null, null, [["pigeon, dove", 21.4], ["speech", 21.32], ["bird", 19.06]], null, null, [["speech", 33.81], ["horse", 11.23], ["whale vocalization", 8.36]], null, [["speech", 41.06], ["hum", 6.8], ["fly, housefly", 6.12]], [["speech", 50.24], ["hum", 6.77], ["explosion", 5.07]], null, null, [["hum", 39.57], ["throbbing", 28.94], ["mains hum", 6.27]], null, null, null], "duration": [9.39, 8.79, 11.04, 22.91, 0.87, 0.86, 1.06, 3.25, 0.3, 0.33, 7.33, -0.27, 16.41, 27.55, -0.32, -0.2, 22.11, 10.98, 0.95, 1.33]} \ No newline at end of file diff --git a/annotations_1/rAdvJOAGEmc_filtered.json b/annotations_1/rAdvJOAGEmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..82104a080f474743bae36282099f0a530f540bc4 --- /dev/null +++ b/annotations_1/rAdvJOAGEmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.97], [5.0, 12.88], [14.0, 14.79], [16.0, 17.24], [19.0, 28.27], [32.0, 32.63], [34.0, 36.14], [42.0, 44.76], [49.0, 53.43], [55.0, 55.76], [56.0, 57.69], [58.0, 59.26], [60.0, 61.15], [63.0, 62.94], [71.0, 74.95], [80.0, 83.64], [91.0, 92.94], [101.0, 117.42], [122.0, 122.25], [122.0, 128.12], [133.0, 133.39], [134.0, 134.38], [135.0, 135.28], [141.0, 145.34], [146.0, 149.47]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 37.39, 0.0, 0.0, 38.31, 0.0, 35.65, 35.02, 34.94, 0.0, 0.0, 0.0, 0.0, 0.0, 34.39, 34.55, 0.0, 34.39, 0.0, 48.48, 0.0, 0.0, 0.0, 51.71, 68.67], "audiomae_on_audioset": [null, [["music", 13.73], ["beatboxing", 7.01], ["animal", 6.29]], null, null, [["music", 52.92], ["beatboxing", 7.94], ["didgeridoo", 6.77]], null, [["music", 61.25], ["guitar", 7.76], ["musical instrument", 5.97]], [["music", 70.82], ["musical instrument", 3.12], ["guitar", 2.2]], [["music", 77.87], ["swing music", 2.13], ["musical instrument", 1.75]], null, null, null, null, null, [["music", 69.86], ["swing music", 4.25], ["musical instrument", 2.39]], [["music", 65.48], ["swing music", 4.86], ["musical instrument", 2.86]], null, [["music", 41.59], ["boing", 26.76], ["speech", 9.32]], null, [["animal", 33.42], ["speech", 14.96], ["outside, rural or natural", 4.75]], null, null, null, null, null], "duration": [0.97, 7.88, 0.79, 1.24, 9.27, 0.63, 2.14, 2.76, 4.43, 0.76, 1.69, 1.26, 1.15, -0.06, 3.95, 3.64, 1.94, 16.42, 0.25, 6.12, 0.39, 0.38, 0.28, 4.34, 3.47]} \ No newline at end of file diff --git a/annotations_1/rC9MhZGgJy4_filtered.json b/annotations_1/rC9MhZGgJy4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ff01691bc67e15cd0823126b2ffb065ed06d4881 --- /dev/null +++ b/annotations_1/rC9MhZGgJy4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.97], [7.0, 8.58], [10.0, 10.93], [16.0, 16.09], [22.0, 22.74], [23.0, 28.16], [29.0, 30.08], [39.0, 40.44], [42.0, 43.09], [44.0, 45.89], [46.0, 53.96], [59.0, 59.17], [62.0, 62.33], [66.0, 68.49], [70.0, 70.43], [71.0, 72.33], [80.0, 80.89], [82.0, 83.25], [87.0, 88.8], [90.0, 90.64], [91.0, 93.14], [106.0, 107.59], [109.0, 109.41], [111.0, 112.55], [114.0, 113.86], [116.0, 116.78], [118.0, 119.04], [123.0, 123.63], [126.0, 126.42], [128.0, 128.48], [134.0, 135.03], [136.0, 139.24], [142.0, 143.02], [147.0, 147.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 58.72, 0.0, 0.0, 0.0, 0.0, 41.66, 0.0, 0.0, 53.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.48, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 36.4], ["music", 13.89], ["thunk", 9.3]], null, null, null, null, null, null, null, null, null, [["fly, housefly", 19.24], ["music", 14.16], ["insect", 7.34]], null, null, null, null, null, null, null, null, null, null, [["singing bowl", 24.82], ["gong", 10.72], ["hum", 8.56]], null, null], "duration": [0.97, 1.58, 0.93, 0.09, 0.74, 5.16, 1.08, 1.44, 1.09, 1.89, 7.96, 0.17, 0.33, 2.49, 0.43, 1.33, 0.89, 1.25, 1.8, 0.64, 2.14, 1.59, 0.41, 1.55, -0.14, 0.78, 1.04, 0.63, 0.42, 0.48, 1.03, 3.24, 1.02, 0.66]} \ No newline at end of file diff --git a/annotations_1/rCEbhr55ISU_filtered.json b/annotations_1/rCEbhr55ISU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7b888c71b68b8bcf5dc553bb082c328a98dfded --- /dev/null +++ b/annotations_1/rCEbhr55ISU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [5.0, 4.92], [6.0, 7.47], [8.0, 9.73], [11.0, 13.78], [14.0, 14.59], [17.0, 23.5], [26.0, 26.77], [28.0, 27.9], [29.0, 30.82], [31.0, 31.58], [32.0, 33.1], [36.0, 37.79], [51.0, 51.21], [54.0, 55.58], [63.0, 63.75], [67.0, 67.63], [69.0, 70.51], [73.0, 73.74], [77.0, 77.38], [86.0, 86.56], [94.0, 95.12], [97.0, 98.27], [104.0, 104.65], [105.0, 107.91], [111.0, 117.78], [118.0, 125.63], [126.0, 127.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 51.39, 0.0, 34.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.53, 44.2, 52.92, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 56.86], ["sidetone", 8.61], ["music", 8.18]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.12], ["speech", 7.95], ["hum", 5.27]], null, null], "duration": [0.29, -0.08, 1.47, 1.73, 2.78, 0.59, 6.5, 0.77, -0.1, 1.82, 0.58, 1.1, 1.79, 0.21, 1.58, 0.75, 0.63, 1.51, 0.74, 0.38, 0.56, 1.12, 1.27, 0.65, 2.91, 6.78, 7.63, 1.57]} \ No newline at end of file diff --git a/annotations_1/rCUNazDU2mg_filtered.json b/annotations_1/rCUNazDU2mg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9450c54c611b322bb95584f67928152b8c43aa09 --- /dev/null +++ b/annotations_1/rCUNazDU2mg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 29.24], [30.0, 79.42], [80.0, 97.98], [98.0, 98.04], [101.0, 104.99], [106.0, 110.59], [111.0, 112.14], [115.0, 180.37], [181.0, 181.94]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [30.17, 0.0, 30.06, 0.0, 32.94, 37.17, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 73.56], ["smash, crash", 6.17], ["breaking", 4.28]], null, [["music", 71.16], ["hum", 3.73], ["sound effect", 2.87]], null, [["whale vocalization", 44.81], ["sidetone", 21.37], ["music", 5.61]], [["hum", 31.91], ["music", 20.01], ["throbbing", 13.68]], null, null, null], "duration": [26.24, 49.42, 17.98, 0.04, 3.99, 4.59, 1.14, 65.37, 0.94]} \ No newline at end of file diff --git a/annotations_1/rDTZ6A5zsYc_filtered.json b/annotations_1/rDTZ6A5zsYc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a882679f9827f48e794d9442a8ff2b00bc30bdd --- /dev/null +++ b/annotations_1/rDTZ6A5zsYc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.73], [28.0, 37.08], [38.0, 39.09], [48.0, 59.19], [73.0, 114.22], [116.0, 145.4]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 38.84, 0.0, 55.89, 0.0, 34.4], "audiomae_on_audioset": [null, [["music", 31.66], ["speech", 23.87], ["thunk", 4.36]], null, null, null, [["music", 75.73], ["country", 5.09], ["bluegrass", 1.57]]], "duration": [0.73, 9.08, 1.09, 11.19, 41.22, 29.4]} \ No newline at end of file diff --git a/annotations_1/rDnazOBaF1U_filtered.json b/annotations_1/rDnazOBaF1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7182d79c1d2f5b969faaf7ffae9a9c6e1c8002a2 --- /dev/null +++ b/annotations_1/rDnazOBaF1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.96], [5.0, 5.21], [5.0, 6.3], [8.0, 7.77], [10.0, 13.17], [14.0, 14.32], [17.0, 18.98], [20.0, 22.08], [24.0, 24.75], [27.0, 27.23], [31.0, 32.41], [38.0, 37.94], [40.0, 40.9], [41.0, 46.18], [47.0, 49.1], [50.0, 53.64], [55.0, 55.86], [57.0, 59.04], [59.0, 67.12], [68.0, 73.23], [75.0, 78.76], [85.0, 88.35], [89.0, 89.82], [91.0, 92.5], [95.0, 96.2], [98.0, 98.05], [102.0, 103.87], [105.0, 106.14], [108.0, 109.48], [113.0, 115.57], [116.0, 117.27], [119.0, 120.61], [121.0, 122.86], [127.0, 128.53], [129.0, 131.43], [134.0, 137.47], [143.0, 147.45], [148.0, 150.52], [151.0, 152.93], [154.0, 154.16]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 45.98, 0.0, 0.0, 0.0, 0.0, 0.0, 41.78, 82.79, 92.64, 0.0, 82.97, 60.89, 51.44, 48.48, 47.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.94, 0.0, 0.0, 0.0, 0.0, 37.35, 38.56, 32.09, 35.7, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 43.58], ["sidetone", 12.41], ["sine wave", 7.18]], null, null, null, null, null, [["sidetone", 46.76], ["speech", 13.55], ["sine wave", 11.27]], null, null, null, null, null, null, [["music", 24.63], ["mains hum", 13.42], ["hum", 12.68]], [["music", 31.85], ["marimba, xylophone", 13.48], ["glockenspiel", 6.88]], null, null, null, null, null, null, null, [["music", 51.59], ["musical instrument", 9.07], ["mains hum", 4.97]], null, null, null, null, [["music", 45.44], ["guitar", 6.3], ["musical instrument", 6.04]], [["music", 58.41], ["hum", 4.2], ["synthesizer", 3.7]], [["music", 52.53], ["didgeridoo", 12.12], ["mains hum", 6.79]], [["music", 55.48], ["synthesizer", 8.55], ["musical instrument", 4.14]], null, null], "duration": [1.96, 0.21, 1.3, -0.23, 3.17, 0.32, 1.98, 2.08, 0.75, 0.23, 1.41, -0.06, 0.9, 5.18, 2.1, 3.64, 0.86, 2.04, 8.12, 5.23, 3.76, 3.35, 0.82, 1.5, 1.2, 0.05, 1.87, 1.14, 1.48, 2.57, 1.27, 1.61, 1.86, 1.53, 2.43, 3.47, 4.45, 2.52, 1.93, 0.16]} \ No newline at end of file diff --git a/annotations_1/rFbe4I4SXGg_filtered.json b/annotations_1/rFbe4I4SXGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca3d9c31783504c9a4c041ffc7c3842721cdf360 --- /dev/null +++ b/annotations_1/rFbe4I4SXGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.48], [9.0, 8.8], [13.0, 14.12], [17.0, 18.22], [26.0, 27.18], [30.0, 30.43], [32.0, 33.18], [34.0, 35.23], [36.0, 37.2], [38.0, 38.85], [42.0, 42.69], [48.0, 47.93], [52.0, 54.06], [61.0, 62.31], [69.0, 69.45], [69.0, 69.52], [70.0, 71.46], [72.0, 82.93], [83.0, 86.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 53.72, 64.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, -0.2, 1.12, 1.22, 1.18, 0.43, 1.18, 1.23, 1.2, 0.85, 0.69, -0.07, 2.06, 1.31, 0.45, 0.52, 1.46, 10.93, 3.12]} \ No newline at end of file diff --git a/annotations_1/rGAjkzbV8zw_filtered.json b/annotations_1/rGAjkzbV8zw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5b272a94794693dc09d36d6451ff222f9b9c0f56 --- /dev/null +++ b/annotations_1/rGAjkzbV8zw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.69], [5.0, 6.54], [7.0, 7.79], [9.0, 9.78], [11.0, 11.8], [14.0, 14.44], [18.0, 18.82], [20.0, 22.49], [23.0, 23.77], [26.0, 28.61], [30.0, 30.16], [30.0, 32.63], [33.0, 33.29], [34.0, 34.03], [35.0, 35.55], [38.0, 39.51], [40.0, 41.3], [43.0, 44.12], [46.0, 46.72], [47.0, 52.76], [54.0, 54.68], [55.0, 55.75], [58.0, 59.14], [64.0, 64.17], [64.0, 65.37], [66.0, 66.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.17, 0.0, 100.0, 0.0, 62.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 47.56], ["hum", 12.29], ["mains hum", 5.72]], null, null, null, null, null, null], "duration": [0.69, 1.54, 0.79, 0.78, 0.8, 0.44, 0.82, 2.49, 0.77, 2.61, 0.16, 2.63, 0.29, 0.03, 0.55, 1.51, 1.3, 1.12, 0.72, 5.76, 0.68, 0.75, 1.14, 0.17, 1.37, 0.61]} \ No newline at end of file diff --git a/annotations_1/rGnXd_krGA0_filtered.json b/annotations_1/rGnXd_krGA0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/rGnXd_krGA0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/rGtJbW9sRbo_filtered.json b/annotations_1/rGtJbW9sRbo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0beb3a1058e25a8f122aa5307ef4672c4af2d57 --- /dev/null +++ b/annotations_1/rGtJbW9sRbo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.37], [7.0, 7.5], [13.0, 15.84], [16.0, 21.76], [22.0, 22.4], [23.0, 24.88], [26.0, 26.99], [27.0, 29.71], [30.0, 31.06], [36.0, 37.2], [47.0, 48.66], [50.0, 50.14], [53.0, 53.65], [57.0, 57.16], [58.0, 58.56], [65.0, 65.99], [67.0, 67.64], [69.0, 71.05], [74.0, 74.85], [76.0, 76.01], [80.0, 80.0], [88.0, 90.22], [94.0, 94.31], [100.0, 100.38], [101.0, 101.92], [105.0, 105.16], [109.0, 109.02], [110.0, 123.7], [124.0, 129.88]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 48.39, 51.82, 0.0, 0.0, 0.0, 53.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.47, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 36.65, 50.21], "audiomae_on_audioset": [null, null, [["speech", 47.91], ["animal", 7.73], ["wild animals", 7.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.13], ["fly, housefly", 18.84], ["insect", 7.6]], null], "duration": [1.37, 0.5, 2.84, 5.76, 0.4, 1.88, 0.99, 2.71, 1.06, 1.2, 1.66, 0.14, 0.65, 0.16, 0.56, 0.99, 0.64, 2.05, 0.85, 0.01, 0.0, 2.22, 0.31, 0.38, 0.92, 0.16, 0.02, 13.7, 5.88]} \ No newline at end of file diff --git a/annotations_1/rHIIMIBMvng_filtered.json b/annotations_1/rHIIMIBMvng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fc5568a0ec2b6dd70b2e096ee0961c015521530 --- /dev/null +++ b/annotations_1/rHIIMIBMvng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.4], [12.0, 16.19], [17.0, 26.05], [27.0, 30.15], [32.0, 35.21], [37.0, 74.11]], "keep_status": [true, true, true, true, false, false], "silence_prob": [31.93, 31.59, 29.31, 32.13, 30.89, 0.0], "audiomae_on_audioset": [[["hum", 27.63], ["music", 14.01], ["sine wave", 9.67]], [["hum", 26.56], ["mains hum", 12.46], ["throbbing", 12.3]], [["hum", 22.92], ["music", 19.77], ["static", 14.41]], [["music", 46.98], ["hum", 10.69], ["ambient music", 8.58]], [["music", 64.93], ["ambient music", 8.33], ["synthesizer", 6.05]], null], "duration": [3.4, 4.19, 9.05, 3.15, 3.21, 37.11]} \ No newline at end of file diff --git a/annotations_1/rHvCQEr_ETk_filtered.json b/annotations_1/rHvCQEr_ETk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2404e372ede619415e93f53919feba6e0accc822 --- /dev/null +++ b/annotations_1/rHvCQEr_ETk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.45], [15.0, 20.71], [22.0, 23.57], [24.0, 24.71], [27.0, 27.75], [28.0, 29.17], [32.0, 35.28], [36.0, 45.64], [53.0, 83.17], [83.0, 83.44], [83.0, 102.59], [104.0, 118.27], [122.0, 123.26], [125.0, 129.95], [130.0, 132.6], [139.0, 141.29], [143.0, 145.71], [147.0, 147.36], [149.0, 149.94], [152.0, 152.79], [153.0, 154.25], [155.0, 156.0], [157.0, 157.64], [159.0, 165.01]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 54.36, 0.0, 0.0, 0.0, 0.0, 65.32, 32.3, 0.0, 0.0, 30.34, 31.98, 0.0, 88.83, 43.77, 85.17, 36.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 35.96], ["groan", 20.1], ["fart", 6.92]], null, null, [["music", 38.34], ["speech", 22.46], ["groan", 7.65]], [["music", 66.95], ["grunt", 8.39], ["musical instrument", 2.59]], null, null, [["speech", 42.75], ["sidetone", 17.39], ["music", 4.73]], null, [["music", 56.56], ["didgeridoo", 10.73], ["foghorn", 3.01]], null, null, null, null, null, null, [["music", 56.02], ["electronic music", 8.64], ["sonar", 4.08]]], "duration": [1.45, 5.71, 1.57, 0.71, 0.75, 1.17, 3.28, 9.64, 30.17, 0.44, 19.59, 14.27, 1.26, 4.95, 2.6, 2.29, 2.71, 0.36, 0.94, 0.79, 1.25, 1.0, 0.64, 6.01]} \ No newline at end of file diff --git a/annotations_1/rKUEBIPe5F8_filtered.json b/annotations_1/rKUEBIPe5F8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f92b21c2e1aa3e9e79932a18b66b12d25abe44ed --- /dev/null +++ b/annotations_1/rKUEBIPe5F8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.45], [11.0, 13.17], [16.0, 17.14], [18.0, 23.4], [25.0, 79.34], [86.0, 103.79], [106.0, 145.15], [147.0, 147.11], [149.0, 154.74], [160.0, 161.27], [170.0, 177.45]], "keep_status": [false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [0.0, 73.82, 0.0, 79.59, 0.0, 36.61, 0.0, 0.0, 30.47, 0.0, 29.88], "audiomae_on_audioset": [null, null, null, null, null, [["music", 38.44], ["speech", 16.64], ["electronic music", 9.03]], null, null, [["music", 53.72], ["sound effect", 6.91], ["hum", 4.99]], null, [["music", 37.83], ["hum", 20.64], ["didgeridoo", 9.67]]], "duration": [0.45, 2.17, 1.14, 5.4, 54.34, 17.79, 39.15, 0.11, 5.74, 1.27, 7.45]} \ No newline at end of file diff --git a/annotations_1/rKh4muRk_s0_filtered.json b/annotations_1/rKh4muRk_s0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7f26670503b0718be8c0a538169bd6ef217f4cd --- /dev/null +++ b/annotations_1/rKh4muRk_s0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.15], [10.0, 11.69], [13.0, 13.98], [16.0, 20.04], [22.0, 23.73], [25.0, 45.96], [48.0, 56.62], [59.0, 59.53], [61.0, 81.72], [91.0, 98.59], [99.0, 100.18], [101.0, 101.51], [103.0, 111.0], [113.0, 116.53], [122.0, 126.3], [128.0, 128.75], [130.0, 130.81], [133.0, 137.83], [139.0, 139.53], [150.0, 155.16], [163.0, 164.57], [169.0, 192.6], [194.0, 204.89], [208.0, 209.07], [209.0, 219.47]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true], "silence_prob": [98.1, 0.0, 0.0, 80.11, 0.0, 28.75, 28.99, 0.0, 28.47, 28.54, 0.0, 0.0, 28.32, 28.27, 28.45, 0.0, 0.0, 28.17, 0.0, 28.45, 0.0, 28.49, 28.38, 0.0, 29.06], "audiomae_on_audioset": [null, null, null, null, null, [["music", 69.92], ["synthesizer", 6.24], ["throbbing", 4.88]], [["speech", 32.95], ["vehicle", 8.5], ["music", 6.42]], null, [["speech", 33.16], ["vehicle", 14.31], ["electric shaver, electric razor", 13.6]], [["music", 68.57], ["throbbing", 10.74], ["electronic music", 10.46]], null, null, [["throbbing", 31.03], ["music", 24.47], ["hum", 17.33]], [["music", 71.46], ["cacophony", 8.5], ["musical instrument", 3.9]], [["speech", 68.38], ["vehicle", 10.39], ["music", 6.27]], null, null, [["speech", 55.03], ["music", 20.79], ["electronic music", 2.54]], null, [["speech", 63.97], ["music", 24.63], ["vehicle", 2.08]], null, [["speech", 19.42], ["burst, pop", 7.83], ["music", 7.05]], [["speech", 31.06], ["music", 24.77], ["outside, rural or natural", 3.37]], null, [["music", 58.3], ["musical instrument", 6.33], ["bowed string instrument", 4.53]]], "duration": [3.15, 1.69, 0.98, 4.04, 1.73, 20.96, 8.62, 0.53, 20.72, 7.59, 1.18, 0.51, 8.0, 3.53, 4.3, 0.75, 0.81, 4.83, 0.53, 5.16, 1.57, 23.6, 10.89, 1.07, 10.47]} \ No newline at end of file diff --git a/annotations_1/rKwnRWbuCx4_filtered.json b/annotations_1/rKwnRWbuCx4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe12023117ca82ccccca17a41e1f69b5f8f07a7b --- /dev/null +++ b/annotations_1/rKwnRWbuCx4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.43], [9.0, 11.87], [14.0, 17.88], [19.0, 28.04], [34.0, 34.72], [36.0, 48.3], [58.0, 58.9], [61.0, 61.53], [64.0, 65.15], [68.0, 68.74], [75.0, 75.98], [89.0, 96.9], [101.0, 101.49], [102.0, 103.47], [106.0, 107.4], [109.0, 111.48], [113.0, 114.39], [117.0, 125.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.75, 43.3, 38.83, 0.0, 40.43, 0.0, 0.0, 0.0, 0.0, 0.0, 41.95, 0.0, 0.0, 0.0, 99.4, 0.0, 99.16], "audiomae_on_audioset": [null, [["music", 54.8], ["speech", 12.28], ["sitar", 3.11]], [["music", 77.52], ["theremin", 3.26], ["musical instrument", 2.77]], [["music", 69.44], ["speech", 10.56], ["cattle, bovinae", 2.19]], null, [["music", 64.5], ["theremin", 7.26], ["cello", 4.53]], null, null, null, null, null, [["music", 71.58], ["boing", 3.68], ["speech", 2.05]], null, null, null, null, null, null], "duration": [1.43, 2.87, 3.88, 9.04, 0.72, 12.3, 0.9, 0.53, 1.15, 0.74, 0.98, 7.9, 0.49, 1.47, 1.4, 2.48, 1.39, 8.78]} \ No newline at end of file diff --git a/annotations_1/rLVwKpyUwWI_filtered.json b/annotations_1/rLVwKpyUwWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..85a7bfa102a94f26c976f77eb827e43437cd6289 --- /dev/null +++ b/annotations_1/rLVwKpyUwWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [14.0, 14.49], [30.0, 31.14], [35.0, 35.04], [35.0, 35.21], [41.0, 42.2], [45.0, 47.48], [60.0, 62.72], [65.0, 66.5], [70.0, 73.62], [88.0, 91.84], [129.0, 140.16]], "keep_status": [false, false, false, false, false, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.54, 34.93, 0.0, 34.38, 34.04, 32.23], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 52.62], ["boing", 5.38], ["throbbing", 3.3]], [["music", 49.72], ["drum machine", 5.6], ["funk", 4.09]], null, [["music", 73.48], ["musical instrument", 2.3], ["guitar", 1.15]], [["music", 59.47], ["singing", 5.68], ["funk", 2.67]], [["music", 57.75], ["speech", 14.22], ["throbbing", 9.26]]], "duration": [0.43, 0.49, 1.14, 0.04, 0.21, 1.2, 2.48, 2.72, 1.5, 3.62, 3.84, 11.16]} \ No newline at end of file diff --git a/annotations_1/rLZ5aVNxV84_filtered.json b/annotations_1/rLZ5aVNxV84_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a060ee831ddf0662e6442e248c068dd35163c105 --- /dev/null +++ b/annotations_1/rLZ5aVNxV84_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.31], [9.0, 10.79], [15.0, 15.57], [20.0, 21.46], [30.0, 31.94], [36.0, 35.95], [44.0, 48.39], [52.0, 52.3], [76.0, 77.13], [91.0, 91.1], [96.0, 115.77], [116.0, 116.82], [118.0, 123.47], [126.0, 128.19], [131.0, 131.85], [136.0, 135.68], [145.0, 145.02], [147.0, 147.07], [148.0, 148.09], [150.0, 150.42]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.53, 0.0, 0.0, 0.0, 29.96, 0.0, 32.11, 34.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["groan", 25.06], ["whack, thwack", 23.85], ["screaming", 6.53]], null, null, null, [["livestock, farm animals, working animals", 22.22], ["cattle, bovinae", 12.61], ["groan", 11.4]], null, [["whale vocalization", 76.05], ["animal", 2.35], ["mosquito", 2.35]], [["speech", 30.63], ["fly, housefly", 7.27], ["fart", 5.94]], null, null, null, null, null, null], "duration": [0.31, 1.79, 0.57, 1.46, 1.94, -0.05, 4.39, 0.3, 1.13, 0.1, 19.77, 0.82, 5.47, 2.19, 0.85, -0.32, 0.02, 0.07, 0.09, 0.42]} \ No newline at end of file diff --git a/annotations_1/rM5Bg89j9qo_filtered.json b/annotations_1/rM5Bg89j9qo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b604c4697d3c451ade33f0b014a1c32609ef0607 --- /dev/null +++ b/annotations_1/rM5Bg89j9qo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 74.44]], "keep_status": [true], "silence_prob": [31.29], "audiomae_on_audioset": [[["speech", 50.56], ["rumble", 8.8], ["mains hum", 5.94]]], "duration": [4.44]} \ No newline at end of file diff --git a/annotations_1/rMczYrlPwaw_filtered.json b/annotations_1/rMczYrlPwaw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..100d01ddb953decd64f8ad28f839be30bd197aab --- /dev/null +++ b/annotations_1/rMczYrlPwaw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.8], [20.0, 21.51], [24.0, 24.26], [26.0, 26.49], [27.0, 27.82], [30.0, 30.3], [32.0, 32.54], [34.0, 34.33], [35.0, 37.1], [39.0, 40.44], [45.0, 44.93], [52.0, 57.25], [58.0, 59.8], [61.0, 63.21], [65.0, 66.75], [68.0, 68.84], [71.0, 72.52], [74.0, 75.51], [78.0, 82.38], [84.0, 84.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 95.23, 0.0, 82.97, 0.0, 0.0, 0.0, 0.0, 96.89, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 1.51, 0.26, 0.49, 0.82, 0.3, 0.54, 0.33, 2.1, 1.44, -0.07, 5.25, 1.8, 2.21, 1.75, 0.84, 1.52, 1.51, 4.38, 0.54]} \ No newline at end of file diff --git a/annotations_1/rNP5uIQxAfY_filtered.json b/annotations_1/rNP5uIQxAfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c2ec852c919a09305105f78018390a67f55d633 --- /dev/null +++ b/annotations_1/rNP5uIQxAfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.29], [13.0, 14.27], [20.0, 20.21], [23.0, 30.2], [33.0, 32.98], [34.0, 34.82], [36.0, 36.49], [38.0, 38.91], [42.0, 42.33], [45.0, 46.28], [47.0, 48.69], [51.0, 50.6], [52.0, 54.51], [55.0, 61.47], [63.0, 63.14], [65.0, 65.62], [67.0, 76.86], [78.0, 96.94], [99.0, 100.85], [103.0, 109.02], [110.0, 110.56], [117.0, 117.34], [118.0, 121.68], [127.0, 127.67], [129.0, 129.56], [136.0, 136.43], [138.0, 142.23], [144.0, 145.08], [148.0, 148.15], [149.0, 149.84]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 47.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 95.37, 0.0, 0.0, 95.64, 83.16, 0.0, 96.89, 0.0, 0.0, 95.64, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 18.39], ["glass", 8.26], ["musical instrument", 4.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.29, 1.27, 0.21, 7.2, -0.02, 0.82, 0.49, 0.91, 0.33, 1.28, 1.69, -0.4, 2.51, 6.47, 0.14, 0.62, 9.86, 18.94, 1.85, 6.02, 0.56, 0.34, 3.68, 0.67, 0.56, 0.43, 4.23, 1.08, 0.15, 0.84]} \ No newline at end of file diff --git a/annotations_1/rNxqb6KMtkg_filtered.json b/annotations_1/rNxqb6KMtkg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..779527c2bd6fff35a75dd8b344e2d3645a5c8582 --- /dev/null +++ b/annotations_1/rNxqb6KMtkg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.68], [16.0, 16.23], [18.0, 19.53], [21.0, 21.54], [29.0, 32.39], [35.0, 37.1], [39.0, 40.14], [44.0, 44.93], [46.0, 47.02], [49.0, 49.49], [50.0, 50.65], [53.0, 54.43], [57.0, 57.08], [59.0, 64.18], [65.0, 73.14], [76.0, 78.63]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.73, 0.0, 0.0, 0.0, 98.1, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.72, 30.77, 95.78], "audiomae_on_audioset": [[["speech", 29.41], ["siren", 14.59], ["emergency vehicle", 5.95]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 60.71], ["music", 7.12], ["hum", 4.92]], null], "duration": [2.68, 0.23, 1.53, 0.54, 3.39, 2.1, 1.14, 0.93, 1.02, 0.49, 0.65, 1.43, 0.08, 5.18, 8.14, 2.63]} \ No newline at end of file diff --git a/annotations_1/rOzJnj3UmNE_filtered.json b/annotations_1/rOzJnj3UmNE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ee60b9db5a9fab3fa26b27599c9956ea7c2343e --- /dev/null +++ b/annotations_1/rOzJnj3UmNE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.11], [15.0, 32.9], [37.0, 37.5], [38.0, 39.68], [40.0, 41.17], [41.0, 42.26], [43.0, 50.85], [54.0, 53.6], [54.0, 54.97], [57.0, 57.97], [58.0, 58.31], [59.0, 60.07], [62.0, 73.16], [74.0, 84.35], [86.0, 116.97], [118.0, 130.27], [131.0, 143.04], [143.0, 143.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.73, 68.67, 0.0, 0.0, 0.0, 0.0, 62.17, 0.0, 0.0, 0.0, 0.0, 0.0, 36.38, 39.38, 0.0, 42.39, 31.63, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.83], ["hum", 22.05], ["mains hum", 21.43]], [["hum", 33.66], ["music", 23.25], ["throbbing", 18.96]], null, [["music", 47.3], ["hum", 14.8], ["rumble", 10.47]], [["music", 45.64], ["hum", 18.37], ["throbbing", 10.78]], null], "duration": [5.11, 17.9, 0.5, 1.68, 1.17, 1.26, 7.85, -0.4, 0.97, 0.97, 0.31, 1.07, 11.16, 10.35, 30.97, 12.27, 12.04, 0.5]} \ No newline at end of file diff --git a/annotations_1/rPh94cOW-MI_filtered.json b/annotations_1/rPh94cOW-MI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78a1fe56022ba362d0fdbec56e18d5b199e3a4c8 --- /dev/null +++ b/annotations_1/rPh94cOW-MI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.4], [12.0, 14.17], [19.0, 25.1], [30.0, 34.96], [38.0, 39.34], [44.0, 45.55], [50.0, 50.8], [52.0, 52.79], [54.0, 55.12], [59.0, 60.59], [63.0, 63.53], [65.0, 67.68], [71.0, 71.49], [77.0, 78.54], [80.0, 81.5], [84.0, 84.08], [85.0, 87.4], [90.0, 90.71], [95.0, 96.4], [97.0, 99.15], [101.0, 102.3], [105.0, 111.57], [114.0, 113.85], [115.0, 115.69], [117.0, 118.71], [120.0, 120.21], [123.0, 122.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.43, 43.2, 38.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.18, 0.0, 0.0, 0.0, 0.0, 43.33, 0.0, 0.0, 51.28, 0.0, 51.28, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 50.63], ["theremin", 17.78], ["effects unit", 5.56]], [["music", 74.08], ["fart", 3.16], ["grunt", 1.89]], [["music", 55.46], ["synthesizer", 10.61], ["didgeridoo", 8.11]], null, null, null, null, null, null, null, [["music", 51.69], ["theremin", 18.01], ["effects unit", 5.26]], null, null, null, null, [["music", 29.26], ["theremin", 7.64], ["mosquito", 6.24]], null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 2.17, 6.1, 4.96, 1.34, 1.55, 0.8, 0.79, 1.12, 1.59, 0.53, 2.68, 0.49, 1.54, 1.5, 0.08, 2.4, 0.71, 1.4, 2.15, 1.3, 6.57, -0.15, 0.69, 1.71, 0.21, -0.14]} \ No newline at end of file diff --git a/annotations_1/rPuW7T25Yuw_filtered.json b/annotations_1/rPuW7T25Yuw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9a097e21a41e1780e734bad97a07dd2b2f95142d --- /dev/null +++ b/annotations_1/rPuW7T25Yuw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.62], [8.0, 9.73], [11.0, 15.84], [19.0, 19.52], [23.0, 23.41], [24.0, 26.42], [27.0, 28.44], [32.0, 34.08], [34.0, 34.5], [35.0, 34.62], [35.0, 36.73], [39.0, 39.56], [41.0, 42.65], [45.0, 47.56], [49.0, 56.02], [58.0, 58.83], [61.0, 62.38], [65.0, 68.77], [69.0, 69.38], [70.0, 70.44], [70.0, 70.51], [71.0, 76.87], [86.0, 85.67], [89.0, 93.11], [96.0, 95.89], [98.0, 109.26], [112.0, 114.88], [116.0, 123.8]], "keep_status": [true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.39, 0.0, 42.19, 0.0, 0.0, 36.22, 0.0, 36.7, 0.0, 0.0, 0.0, 0.0, 0.0, 45.4, 42.39, 0.0, 0.0, 37.28, 0.0, 0.0, 0.0, 35.85, 0.0, 36.69, 0.0, 43.71, 51.82, 50.16], "audiomae_on_audioset": [[["music", 47.33], ["didgeridoo", 8.1], ["speech", 4.92]], null, [["music", 31.19], ["speech", 29.57], ["didgeridoo", 5.33]], null, null, [["music", 76.73], ["speech", 5.78], ["throbbing", 2.53]], null, [["music", 28.38], ["hum", 10.97], ["mains hum", 8.41]], null, null, null, null, null, [["music", 78.95], ["musical instrument", 2.85], ["electronic music", 0.88]], [["music", 63.89], ["didgeridoo", 7.34], ["speech", 3.56]], null, null, [["music", 80.56], ["didgeridoo", 2.37], ["musical instrument", 1.71]], null, null, null, [["music", 54.84], ["didgeridoo", 10.03], ["speech", 9.8]], null, [["music", 55.13], ["hum", 11.1], ["mains hum", 8.9]], null, [["music", 63.26], ["theremin", 14.32], ["didgeridoo", 9.4]], null, null], "duration": [2.62, 1.73, 4.84, 0.52, 0.41, 2.42, 1.44, 2.08, 0.5, -0.38, 1.73, 0.56, 1.65, 2.56, 7.02, 0.83, 1.38, 3.77, 0.38, 0.44, 0.51, 5.87, -0.33, 4.11, -0.11, 11.26, 2.88, 7.8]} \ No newline at end of file diff --git a/annotations_1/rQ3Qokn9t_w_filtered.json b/annotations_1/rQ3Qokn9t_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4600af2e89eb6b9cf159de7168cce4a5ba22bf00 --- /dev/null +++ b/annotations_1/rQ3Qokn9t_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.6], [10.0, 23.99], [25.0, 59.9], [60.0, 61.48], [63.0, 102.61], [110.0, 113.14], [115.0, 122.01], [122.0, 122.59], [126.0, 127.99], [129.0, 129.73], [132.0, 131.94]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 41.87, 0.0, 0.0, 0.0, 30.58, 29.37, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 29.32], ["mains hum", 26.33], ["throbbing", 15.31]], null, null, null, [["speech", 53.03], ["beatboxing", 6.94], ["music", 5.28]], [["speech", 27.85], ["fly, housefly", 11.94], ["insect", 8.58]], null, null, null, null], "duration": [1.6, 13.99, 34.9, 1.48, 39.61, 3.14, 7.01, 0.59, 1.99, 0.73, -0.06]} \ No newline at end of file diff --git a/annotations_1/rQABiLDqdVc_filtered.json b/annotations_1/rQABiLDqdVc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b762d6d160c4d8679bb6874a9828ffaaa0de1de2 --- /dev/null +++ b/annotations_1/rQABiLDqdVc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.84], [20.0, 21.0], [24.0, 34.47], [41.0, 52.14], [58.0, 67.54], [68.0, 85.14], [86.0, 115.99]], "keep_status": [false, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 29.66, 29.7, 29.89, 30.45, 30.5], "audiomae_on_audioset": [null, null, [["speech", 42.08], ["music", 16.79], ["eruption", 7.56]], [["speech", 45.97], ["explosion", 18.81], ["music", 14.06]], [["throbbing", 22.87], ["hum", 19.85], ["music", 13.4]], [["fart", 16.5], ["music", 14.5], ["speech", 14.24]], [["throbbing", 30.07], ["speech", 23.38], ["hum", 20.99]]], "duration": [0.84, 1.0, 10.47, 11.14, 9.54, 17.14, 29.99]} \ No newline at end of file diff --git a/annotations_1/rQWpTKfljVg_filtered.json b/annotations_1/rQWpTKfljVg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3b9b2023d6f7802874fe906fbed7bc8ec5a5a4c --- /dev/null +++ b/annotations_1/rQWpTKfljVg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.73], [7.0, 7.6], [9.0, 8.82], [9.0, 13.93], [15.0, 15.74], [17.0, 18.08], [19.0, 20.04], [21.0, 21.71], [25.0, 32.97], [35.0, 36.48], [40.0, 40.85], [46.0, 49.38], [51.0, 64.35], [68.0, 72.77], [74.0, 75.71], [76.0, 77.14], [80.0, 80.32], [81.0, 81.67], [86.0, 87.0], [90.0, 92.97], [95.0, 98.69], [100.0, 101.44], [102.0, 102.24], [104.0, 105.12], [106.0, 107.3], [108.0, 108.5], [113.0, 113.8], [121.0, 121.73], [123.0, 124.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 88.64, 0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 97.64, 75.72, 91.98, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.6, -0.18, 4.93, 0.74, 1.08, 1.04, 0.71, 7.97, 1.48, 0.85, 3.38, 13.35, 4.77, 1.71, 1.14, 0.32, 0.67, 1.0, 2.97, 3.69, 1.44, 0.24, 1.12, 1.3, 0.5, 0.8, 0.73, 1.07]} \ No newline at end of file diff --git a/annotations_1/rRUVmTXpPyg_filtered.json b/annotations_1/rRUVmTXpPyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3d432fcb5ce89854be2bcb3135fc00d57fca9ef --- /dev/null +++ b/annotations_1/rRUVmTXpPyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.91], [7.0, 8.09], [11.0, 11.42], [14.0, 14.61], [17.0, 20.56], [23.0, 24.21], [25.0, 26.57], [31.0, 31.31], [34.0, 35.5], [37.0, 37.49], [38.0, 40.49], [47.0, 47.16], [52.0, 53.0], [63.0, 67.64], [83.0, 83.54], [85.0, 87.3], [92.0, 98.29], [99.0, 101.95], [102.0, 111.79], [114.0, 114.49], [115.0, 127.57], [130.0, 130.1], [138.0, 151.41], [154.0, 158.19], [161.0, 161.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 0.0, 33.31, 0.0, 0.0, 30.35, 0.0, 31.22, 30.21, 29.96, 30.55, 0.0, 29.9, 0.0, 29.16, 32.87, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["mosquito", 35.46], ["fly, housefly", 26.34], ["insect", 10.65]], null, null, [["livestock, farm animals, working animals", 32.76], ["cowbell", 15.75], ["music", 11.84]], null, [["music", 44.74], ["brass instrument", 8.65], ["musical instrument", 8.52]], [["music", 49.94], ["didgeridoo", 11.48], ["musical instrument", 6.43]], [["foghorn", 16.93], ["speech", 8.41], ["mosquito", 8.38]], [["fly, housefly", 48.4], ["insect", 19.9], ["buzz", 11.7]], null, [["fly, housefly", 28.05], ["insect", 10.84], ["music", 10.59]], null, [["music", 40.5], ["speech", 10.84], ["race car, auto racing", 7.8]], [["hum", 41.94], ["music", 17.3], ["mains hum", 14.34]], null], "duration": [1.91, 1.09, 0.42, 0.61, 3.56, 1.21, 1.57, 0.31, 1.5, 0.49, 2.49, 0.16, 1.0, 4.64, 0.54, 2.3, 6.29, 2.95, 9.79, 0.49, 12.57, 0.1, 13.41, 4.19, 0.6]} \ No newline at end of file diff --git a/annotations_1/rRlfzy7Rxdo_filtered.json b/annotations_1/rRlfzy7Rxdo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b8b507bb5c4713b147283630251fbaa3e842086 --- /dev/null +++ b/annotations_1/rRlfzy7Rxdo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[140.0, 142.62], [143.0, 145.12], [146.0, 147.97], [149.0, 151.09], [152.0, 167.81], [172.0, 172.69]], "keep_status": [true, true, false, false, true, false], "silence_prob": [38.87, 37.77, 0.0, 36.72, 29.14, 0.0], "audiomae_on_audioset": [[["hum", 27.31], ["music", 24.71], ["mains hum", 7.04]], [["hum", 32.2], ["throbbing", 19.1], ["music", 15.72]], null, [["hum", 32.06], ["music", 23.56], ["throbbing", 17.79]], [["hum", 40.4], ["mains hum", 15.39], ["throbbing", 10.77]], null], "duration": [2.62, 2.12, 1.97, 2.09, 15.81, 0.69]} \ No newline at end of file diff --git a/annotations_1/rRuulhJ2ARQ_filtered.json b/annotations_1/rRuulhJ2ARQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3746baec07aed264cf84a4fedddae0e5c8156e0b --- /dev/null +++ b/annotations_1/rRuulhJ2ARQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.43], [17.0, 17.32], [18.0, 68.57], [69.0, 112.99], [114.0, 142.77], [143.0, 143.46], [144.0, 145.35], [146.0, 147.16], [150.0, 171.76]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [57.89, 0.0, 0.0, 0.0, 72.6, 0.0, 0.0, 0.0, 34.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 66.86], ["scary music", 8.57], ["ambient music", 7.34]]], "duration": [3.43, 0.32, 50.57, 43.99, 28.77, 0.46, 1.35, 1.16, 21.76]} \ No newline at end of file diff --git a/annotations_1/rS-P78D5US4_filtered.json b/annotations_1/rS-P78D5US4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7715d7ba2ab217f0f2570a96784fdfda1fda714 --- /dev/null +++ b/annotations_1/rS-P78D5US4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.96], [45.0, 45.76], [48.0, 47.58], [48.0, 47.73], [68.0, 68.05], [78.0, 78.73], [126.0, 126.6], [129.0, 130.23], [137.0, 137.15]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [57.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [3.96, 0.76, -0.42, -0.27, 0.05, 0.73, 0.6, 1.23, 0.15]} \ No newline at end of file diff --git a/annotations_1/rS_HIFTV7wM_filtered.json b/annotations_1/rS_HIFTV7wM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cebf2a776bedcfefe6bce3944a64d83de7819952 --- /dev/null +++ b/annotations_1/rS_HIFTV7wM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 52.12], [54.0, 67.86]], "keep_status": [true, true], "silence_prob": [29.76, 29.45], "audiomae_on_audioset": [[["fly, housefly", 43.13], ["mains hum", 6.4], ["bee, wasp, etc.", 6.35]], [["hum", 16.19], ["noise", 15.63], ["mains hum", 8.28]]], "duration": [24.12, 13.86]} \ No newline at end of file diff --git a/annotations_1/rTlfnymyrrQ_filtered.json b/annotations_1/rTlfnymyrrQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..963be3be9925a55590379819d6e3df69fb1f0b92 --- /dev/null +++ b/annotations_1/rTlfnymyrrQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 6.64], [10.0, 27.77], [33.0, 33.35], [35.0, 34.97], [35.0, 36.21], [37.0, 37.91], [38.0, 38.7], [41.0, 42.92], [49.0, 49.06], [51.0, 52.86], [61.0, 68.62], [72.0, 77.85], [82.0, 84.47], [88.0, 93.61], [94.0, 95.15], [96.0, 96.42], [97.0, 97.31], [99.0, 99.03], [100.0, 99.96], [101.0, 101.63], [104.0, 104.75], [106.0, 122.17], [139.0, 140.29], [140.0, 140.34], [141.0, 151.55], [155.0, 157.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [30.09, 30.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.52, 29.98, 31.64, 34.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.02, 0.0, 0.0, 41.62, 84.25], "audiomae_on_audioset": [[["mains hum", 28.62], ["hum", 21.47], ["music", 21.45]], [["music", 73.97], ["electronic music", 3.08], ["explosion", 2.38]], null, null, null, null, null, null, null, null, [["hum", 39.06], ["music", 15.03], ["throbbing", 14.79]], [["music", 22.37], ["speech", 10.72], ["cattle, bovinae", 10.43]], [["hum", 24.78], ["mains hum", 19.47], ["music", 16.94]], [["speech", 56.36], ["music", 13.62], ["throbbing", 11.3]], null, null, null, null, null, null, null, [["speech", 66.56], ["eruption", 5.34], ["explosion", 5.19]], null, null, [["speech", 43.12], ["gunshot, gunfire", 10.78], ["hum", 8.4]], null], "duration": [5.64, 17.77, 0.35, -0.03, 1.21, 0.91, 0.7, 1.92, 0.06, 1.86, 7.62, 5.85, 2.47, 5.61, 1.15, 0.42, 0.31, 0.03, -0.04, 0.63, 0.75, 16.17, 1.29, 0.34, 10.55, 2.03]} \ No newline at end of file diff --git a/annotations_1/rUbY9uikvWc_filtered.json b/annotations_1/rUbY9uikvWc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..87fbd04d847f1fe539f382a506dbc62a33a48f43 --- /dev/null +++ b/annotations_1/rUbY9uikvWc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.59], [6.0, 6.54], [7.0, 8.56], [10.0, 10.77], [17.0, 17.07], [20.0, 19.97], [23.0, 23.23], [27.0, 27.87], [41.0, 41.82], [45.0, 44.85], [50.0, 50.08], [52.0, 51.93], [57.0, 57.6], [58.0, 59.32], [61.0, 62.65], [65.0, 65.69], [72.0, 75.51], [81.0, 81.36], [84.0, 84.57], [86.0, 90.0], [94.0, 95.18], [109.0, 111.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 71.14, 0.0, 98.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 0.54, 1.56, 0.77, 0.07, -0.03, 0.23, 0.87, 0.82, -0.15, 0.08, -0.07, 0.6, 1.32, 1.65, 0.69, 3.51, 0.36, 0.57, 4.0, 1.18, 2.4]} \ No newline at end of file diff --git a/annotations_1/rW1_EfZ2pWU_filtered.json b/annotations_1/rW1_EfZ2pWU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51a9d9dbb3944b3a8ac5437ad3c2c02732022142 --- /dev/null +++ b/annotations_1/rW1_EfZ2pWU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.15], [12.0, 12.56], [13.0, 13.8], [21.0, 21.56], [24.0, 24.27], [26.0, 26.43], [29.0, 29.22], [37.0, 37.62], [40.0, 41.12], [43.0, 44.02], [48.0, 48.17], [50.0, 50.94], [52.0, 52.35], [55.0, 55.16], [58.0, 58.75], [60.0, 60.66], [63.0, 63.56], [70.0, 72.76], [76.0, 76.77], [78.0, 78.07], [79.0, 79.07], [82.0, 82.76], [86.0, 87.81], [89.0, 91.84], [94.0, 94.27], [96.0, 96.94], [101.0, 102.3], [104.0, 104.9], [107.0, 106.86], [109.0, 109.83], [111.0, 110.98], [113.0, 113.09], [115.0, 114.88], [116.0, 116.24], [117.0, 118.49], [120.0, 120.6], [124.0, 124.56], [134.0, 135.06], [136.0, 135.89], [136.0, 137.32], [139.0, 145.05], [146.0, 146.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.35, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["noise", 27.21], ["frog", 16.15], ["grunt", 7.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.15, 0.56, 0.8, 0.56, 0.27, 0.43, 0.22, 0.62, 1.12, 1.02, 0.17, 0.94, 0.35, 0.16, 0.75, 0.66, 0.56, 2.76, 0.77, 0.07, 0.07, 0.76, 1.81, 2.84, 0.27, 0.94, 1.3, 0.9, -0.14, 0.83, -0.02, 0.09, -0.12, 0.24, 1.49, 0.6, 0.56, 1.06, -0.11, 1.32, 6.05, 0.89]} \ No newline at end of file diff --git a/annotations_1/rW59kLTHdBE_filtered.json b/annotations_1/rW59kLTHdBE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ccd073e5b4f7de8b579075303c154e994ce939e --- /dev/null +++ b/annotations_1/rW59kLTHdBE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 44.29], [48.0, 77.06], [80.0, 84.18], [86.0, 87.61]], "keep_status": [true, false, false, false], "silence_prob": [29.03, 29.25, 36.86, 0.0], "audiomae_on_audioset": [[["music", 36.22], ["speech", 24.54], ["groan", 3.71]], [["music", 92.51], ["timpani", 0.5], ["hum", 0.48]], [["music", 54.81], ["didgeridoo", 15.16], ["speech", 7.15]], null], "duration": [23.29, 29.06, 4.18, 1.61]} \ No newline at end of file diff --git a/annotations_1/rWlFWMR9MfY_filtered.json b/annotations_1/rWlFWMR9MfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..796b0bca04731b8bf732386665fe5d400198cb7d --- /dev/null +++ b/annotations_1/rWlFWMR9MfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.12], [4.0, 3.74], [5.0, 6.99], [14.0, 15.52], [27.0, 27.35], [32.0, 31.97], [33.0, 33.81], [47.0, 49.08], [52.0, 52.27], [65.0, 65.77], [74.0, 73.79], [82.0, 82.65], [91.0, 94.8], [96.0, 102.78], [106.0, 106.79], [120.0, 127.4], [130.0, 132.19], [135.0, 148.12], [150.0, 150.72], [154.0, 155.19], [159.0, 159.83], [161.0, 165.42], [167.0, 180.93]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, true, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.33, 0.0, 0.0, 0.0, 0.0, 29.23, 28.97, 0.0, 29.0, 31.46, 29.02, 0.0, 0.0, 0.0, 29.55, 28.59], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["roar", 22.34], ["speech", 18.76], ["music", 12.83]], null, null, null, null, [["music", 46.66], ["sound effect", 10.63], ["reverberation", 8.15]], [["music", 38.63], ["hum", 24.59], ["throbbing", 15.29]], null, [["music", 43.96], ["didgeridoo", 5.49], ["hum", 4.45]], [["music", 18.22], ["musical instrument", 5.16], ["trombone", 4.99]], [["music", 10.08], ["whack, thwack", 7.65], ["speech", 6.6]], null, null, null, [["speech", 41.49], ["rumble", 11.6], ["whoosh, swoosh, swish", 6.1]], [["music", 21.65], ["speech", 19.45], ["buzz", 7.18]]], "duration": [0.12, -0.26, 1.99, 1.52, 0.35, -0.03, 0.81, 2.08, 0.27, 0.77, -0.21, 0.65, 3.8, 6.78, 0.79, 7.4, 2.19, 13.12, 0.72, 1.19, 0.83, 4.42, 13.93]} \ No newline at end of file diff --git a/annotations_1/rX6oUNKUbI8_filtered.json b/annotations_1/rX6oUNKUbI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d624a28f81c821f7670c690f140fd4cdb1fe401 --- /dev/null +++ b/annotations_1/rX6oUNKUbI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.72], [32.0, 32.17], [60.0, 61.01], [69.0, 69.57], [71.0, 71.27], [76.0, 75.68], [91.0, 91.71], [96.0, 95.77], [128.0, 128.07], [130.0, 129.81], [133.0, 135.36], [140.0, 140.22], [160.0, 160.54], [164.0, 164.96], [166.0, 174.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [99.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 45.72], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.47], ["thunk", 16.49], ["whack, thwack", 13.63]]], "duration": [2.72, 0.17, 1.01, 0.57, 0.27, -0.32, 0.71, -0.23, 0.07, -0.19, 2.36, 0.22, 0.54, 0.96, 8.09]} \ No newline at end of file diff --git a/annotations_1/rXxBQRh89AA_filtered.json b/annotations_1/rXxBQRh89AA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2033a4fd3e114e9e0ed5d9b25422792b53d7e6e --- /dev/null +++ b/annotations_1/rXxBQRh89AA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.43], [11.0, 12.24], [13.0, 15.03], [18.0, 19.58], [20.0, 20.85], [27.0, 28.14], [30.0, 30.89], [33.0, 34.21], [35.0, 35.67], [37.0, 38.57], [41.0, 42.7], [44.0, 45.13], [46.0, 47.63], [49.0, 49.18], [49.0, 51.0], [57.0, 57.21], [57.0, 58.09], [61.0, 64.56], [68.0, 68.57], [69.0, 70.87], [71.0, 73.25], [75.0, 75.76], [76.0, 76.6], [78.0, 79.25], [81.0, 82.49], [84.0, 86.27], [89.0, 90.51], [92.0, 97.36], [98.0, 99.52], [100.0, 102.09], [103.0, 104.79], [106.0, 106.91], [108.0, 109.98], [110.0, 121.14], [122.0, 122.18], [123.0, 127.08], [130.0, 132.39], [133.0, 134.77], [142.0, 142.28], [148.0, 152.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 76.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.37, 0.0, 0.0, 53.53, 0.0, 0.0, 36.98, 0.0, 0.0, 0.0, 0.0, 78.21, 0.0, 62.37, 0.0, 38.55, 0.0, 0.0, 0.0, 45.62, 0.0, 48.02, 53.28, 0.0, 0.0, 72.16], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.27], ["music", 21.16], ["hum", 3.91]], null, null, null, null, null, null, null, null, [["speech", 21.7], ["hum", 20.31], ["mains hum", 13.22]], null, null, null, [["fly, housefly", 23.76], ["insect", 14.04], ["speech", 11.62]], null, [["fart", 13.97], ["rumble", 12.78], ["buzz", 9.42]], null, null, null, null], "duration": [1.43, 1.24, 2.03, 1.58, 0.85, 1.14, 0.89, 1.21, 0.67, 1.57, 1.7, 1.13, 1.63, 0.18, 2.0, 0.21, 1.09, 3.56, 0.57, 1.87, 2.25, 0.76, 0.6, 1.25, 1.49, 2.27, 1.51, 5.36, 1.52, 2.09, 1.79, 0.91, 1.98, 11.14, 0.18, 4.08, 2.39, 1.77, 0.28, 4.69]} \ No newline at end of file diff --git a/annotations_1/rYHCZi-tmTE_filtered.json b/annotations_1/rYHCZi-tmTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9af77bc8770939f1ce4c4ecab377a619c075cb1c --- /dev/null +++ b/annotations_1/rYHCZi-tmTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.97], [5.0, 5.71], [7.0, 8.6], [11.0, 14.98], [16.0, 16.36], [18.0, 19.11], [20.0, 20.65], [21.0, 22.01], [37.0, 37.49], [44.0, 44.07], [49.0, 49.3], [65.0, 65.2], [74.0, 76.42], [80.0, 81.18], [82.0, 83.91], [90.0, 90.58], [94.0, 93.97], [95.0, 95.08], [96.0, 97.19], [101.0, 109.48], [138.0, 139.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.87, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.97, 0.71, 1.6, 3.98, 0.36, 1.11, 0.65, 1.01, 0.49, 0.07, 0.3, 0.2, 2.42, 1.18, 1.91, 0.58, -0.03, 0.08, 1.19, 8.48, 1.06]} \ No newline at end of file diff --git a/annotations_1/rYS9mUCFOAk_filtered.json b/annotations_1/rYS9mUCFOAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..831cebef585827996df2f215afff83b90bbe2cb2 --- /dev/null +++ b/annotations_1/rYS9mUCFOAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [34.0, 34.13], [36.0, 35.75], [40.0, 41.07], [45.0, 45.94], [56.0, 56.49], [64.0, 65.16], [74.0, 74.34], [77.0, 77.35], [86.0, 86.04], [93.0, 94.05], [95.0, 94.91], [96.0, 96.74], [98.0, 99.22], [101.0, 102.39], [104.0, 104.36], [113.0, 113.41], [119.0, 119.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.13, -0.25, 1.07, 0.94, 0.49, 1.16, 0.34, 0.35, 0.04, 1.05, -0.09, 0.74, 1.22, 1.39, 0.36, 0.41, 0.91]} \ No newline at end of file diff --git a/annotations_1/rZpeepxXh7I_filtered.json b/annotations_1/rZpeepxXh7I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e1add10aedc242a867bd6301909a3491482c0d6 --- /dev/null +++ b/annotations_1/rZpeepxXh7I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.42], [4.0, 7.2], [7.0, 14.27], [17.0, 17.07], [20.0, 23.06], [25.0, 25.42], [28.0, 28.12], [30.0, 30.69], [32.0, 32.9], [35.0, 35.01], [39.0, 41.34], [43.0, 43.56], [45.0, 45.15], [47.0, 51.0], [52.0, 53.74], [56.0, 64.99], [66.0, 66.78], [68.0, 68.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 68.41, 59.51, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 67.13, 0.0, 0.0, 74.29, 0.0, 33.25, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 16.75], ["explosion", 13.36], ["burst, pop", 9.06]], null, null], "duration": [0.42, 3.2, 7.27, 0.07, 3.06, 0.42, 0.12, 0.69, 0.9, 0.01, 2.34, 0.56, 0.15, 4.0, 1.74, 8.99, 0.78, 0.82]} \ No newline at end of file diff --git a/annotations_1/rZs0ZkhzpsI_filtered.json b/annotations_1/rZs0ZkhzpsI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edc6c419c04d21da56967843f42bc915c09bc86a --- /dev/null +++ b/annotations_1/rZs0ZkhzpsI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.03], [22.0, 25.47], [27.0, 34.2], [36.0, 37.3], [38.0, 38.6], [45.0, 47.75], [53.0, 57.59], [58.0, 60.15], [62.0, 64.69], [66.0, 66.21], [67.0, 68.88], [71.0, 76.01], [76.0, 77.36], [79.0, 84.97], [87.0, 89.04], [94.0, 100.4], [101.0, 103.05], [107.0, 108.57], [109.0, 110.73], [112.0, 113.9], [117.0, 119.79], [121.0, 124.23]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 47.35, 63.64, 0.0, 0.0, 39.37, 98.86, 84.43, 96.77, 0.0, 0.0, 89.9, 0.0, 95.23, 98.27, 98.93, 99.87, 0.0, 0.0, 0.0, 69.88, 68.28], "audiomae_on_audioset": [null, [["music", 10.12], ["speech", 8.05], ["wood", 6.54]], null, null, null, [["speech", 50.52], ["music", 14.22], ["synthesizer", 5.36]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 3.47, 7.2, 1.3, 0.6, 2.75, 4.59, 2.15, 2.69, 0.21, 1.88, 5.01, 1.36, 5.97, 2.04, 6.4, 2.05, 1.57, 1.73, 1.9, 2.79, 3.23]} \ No newline at end of file diff --git a/annotations_1/rZyjko9lXo0_filtered.json b/annotations_1/rZyjko9lXo0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d19bf08fdfdb0c43955c0f544ec0ee2ae827816 --- /dev/null +++ b/annotations_1/rZyjko9lXo0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.59], [24.0, 25.15], [31.0, 33.54], [43.0, 44.27], [47.0, 47.78], [53.0, 55.26], [68.0, 68.98], [75.0, 76.18], [77.0, 78.09], [79.0, 80.59], [84.0, 85.8], [90.0, 91.88], [92.0, 93.26], [98.0, 100.33], [102.0, 102.91], [104.0, 108.9], [112.0, 111.87], [114.0, 114.61], [118.0, 122.59], [129.0, 129.03], [131.0, 132.54], [135.0, 135.48], [137.0, 140.78], [143.0, 146.04], [149.0, 149.4], [150.0, 151.92], [153.0, 156.05], [159.0, 160.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 99.16, 0.0, 0.0, 79.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 63.96, 0.0, 0.0, 82.97, 0.0, 0.0, 0.0, 74.6, 49.45, 0.0, 0.0, 89.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 26.02], ["throbbing", 12.68], ["music", 10.65]], null, null, null, null], "duration": [0.59, 1.15, 2.54, 1.27, 0.78, 2.26, 0.98, 1.18, 1.09, 1.59, 1.8, 1.88, 1.26, 2.33, 0.91, 4.9, -0.13, 0.61, 4.59, 0.03, 1.54, 0.48, 3.78, 3.04, 0.4, 1.92, 3.05, 1.34]} \ No newline at end of file diff --git a/annotations_1/r_3ofu2x8qM_filtered.json b/annotations_1/r_3ofu2x8qM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dfc9c62e11ce199bda64243b76b6a14b5d5a166 --- /dev/null +++ b/annotations_1/r_3ofu2x8qM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.58], [26.0, 26.55], [30.0, 30.47], [31.0, 31.4], [34.0, 104.4], [105.0, 106.47], [109.0, 109.8], [110.0, 111.54], [112.0, 112.41], [120.0, 129.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [1.58, 0.55, 0.47, 0.4, 70.4, 1.47, 0.8, 1.54, 0.41, 9.63]} \ No newline at end of file diff --git a/annotations_1/r_ckU9PkTbM_filtered.json b/annotations_1/r_ckU9PkTbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..416bef00fc88e38ea267fafc8d5ea082da17402a --- /dev/null +++ b/annotations_1/r_ckU9PkTbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.14], [13.0, 14.67], [21.0, 21.37], [22.0, 21.96], [23.0, 24.7], [26.0, 26.18], [28.0, 28.8], [31.0, 31.67], [34.0, 34.3], [36.0, 37.22], [37.0, 37.99], [47.0, 49.11], [55.0, 55.83], [57.0, 56.86], [59.0, 59.81], [61.0, 64.89], [65.0, 66.93], [72.0, 71.9], [73.0, 74.04], [78.0, 78.71], [79.0, 80.15], [81.0, 81.14], [82.0, 82.51], [83.0, 83.84], [87.0, 88.25], [89.0, 96.96], [97.0, 115.13], [116.0, 118.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.93, 0.0, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.72, 53.78, 68.41], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.1], ["music", 10.44], ["buzz", 7.6]], null, null], "duration": [0.14, 1.67, 0.37, -0.04, 1.7, 0.18, 0.8, 0.67, 0.3, 1.22, 0.99, 2.11, 0.83, -0.14, 0.81, 3.89, 1.93, -0.1, 1.04, 0.71, 1.15, 0.14, 0.51, 0.84, 1.25, 7.96, 18.13, 2.61]} \ No newline at end of file diff --git a/annotations_1/r_tl6PA-Rd4_filtered.json b/annotations_1/r_tl6PA-Rd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c326956edef9238d66673bf87bb0ae9bb9e8a76 --- /dev/null +++ b/annotations_1/r_tl6PA-Rd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.85], [3.0, 2.73], [4.0, 7.2], [8.0, 8.51], [14.0, 15.82], [20.0, 20.24], [21.0, 23.04], [24.0, 24.68], [26.0, 26.81], [29.0, 30.2], [31.0, 33.61], [37.0, 39.85], [43.0, 43.7], [44.0, 47.75], [50.0, 51.09], [54.0, 54.73], [57.0, 57.65], [59.0, 61.06], [63.0, 63.42], [64.0, 69.26], [70.0, 69.77], [70.0, 86.44], [88.0, 88.38], [95.0, 100.45], [105.0, 105.66], [108.0, 108.62], [109.0, 109.34], [110.0, 111.11], [113.0, 114.62], [115.0, 119.64], [122.0, 122.71]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 46.5, 0.0, 0.0, 0.0, 53.59, 0.0, 0.0, 0.0, 48.52, 45.24, 0.0, 32.22, 0.0, 0.0, 0.0, 30.05, 0.0, 31.55, 0.0, 31.18, 0.0, 50.76, 0.0, 0.0, 0.0, 0.0, 0.0, 49.73, 0.0], "audiomae_on_audioset": [null, null, [["music", 33.21], ["didgeridoo", 21.21], ["theremin", 8.0]], null, null, null, null, null, null, null, [["music", 49.93], ["didgeridoo", 29.12], ["musical instrument", 2.96]], [["music", 9.91], ["animal", 5.62], ["dog", 5.04]], null, [["music", 65.63], ["speech", 15.57], ["musical instrument", 2.9]], null, null, null, [["music", 69.56], ["musical instrument", 4.34], ["carnatic music", 3.73]], null, [["music", 55.38], ["brass instrument", 11.42], ["musical instrument", 7.11]], null, [["music", 64.21], ["effects unit", 2.26], ["didgeridoo", 2.17]], null, null, null, null, null, null, null, [["bee, wasp, etc.", 24.5], ["speech", 23.42], ["fly, housefly", 20.7]], null], "duration": [-0.15, -0.27, 3.2, 0.51, 1.82, 0.24, 2.04, 0.68, 0.81, 1.2, 2.61, 2.85, 0.7, 3.75, 1.09, 0.73, 0.65, 2.06, 0.42, 5.26, -0.23, 16.44, 0.38, 5.45, 0.66, 0.62, 0.34, 1.11, 1.62, 4.64, 0.71]} \ No newline at end of file diff --git a/annotations_1/ra42YS4NRlY_filtered.json b/annotations_1/ra42YS4NRlY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59bc49d0d5a82843a8d5bdea2b81c1c5e9b3e3b7 --- /dev/null +++ b/annotations_1/ra42YS4NRlY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.78], [6.0, 6.49], [8.0, 7.7], [8.0, 15.09], [23.0, 27.46], [40.0, 40.96], [47.0, 46.89], [49.0, 50.5], [52.0, 52.69], [59.0, 58.89], [60.0, 61.28], [65.0, 65.47], [73.0, 76.65], [77.0, 77.23], [79.0, 81.95], [84.0, 84.5], [87.0, 90.61], [96.0, 96.87], [97.0, 98.68], [99.0, 99.69], [100.0, 100.75], [101.0, 101.61], [106.0, 118.37], [119.0, 123.96], [127.0, 127.14], [129.0, 131.77], [135.0, 135.75]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [54.5, 0.0, 0.0, 40.17, 34.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.37, 0.0, 41.3, 0.0, 32.88, 0.0, 0.0, 0.0, 0.0, 0.0, 40.75, 32.45, 0.0, 37.3, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 40.47], ["bass guitar", 8.63], ["hum", 6.35]], [["music", 21.7], ["hum", 19.6], ["mains hum", 16.35]], null, null, null, null, null, null, null, [["music", 64.35], ["musical instrument", 4.87], ["didgeridoo", 4.75]], null, [["music", 49.5], ["speech", 32.98], ["explosion", 1.6]], null, [["music", 62.07], ["hum", 5.83], ["throbbing", 5.15]], null, null, null, null, null, [["music", 32.71], ["speech", 12.53], ["hum", 10.19]], [["speech", 44.92], ["music", 28.39], ["boing", 8.01]], null, [["hum", 30.02], ["speech", 17.29], ["music", 14.79]], null], "duration": [2.78, 0.49, -0.3, 7.09, 4.46, 0.96, -0.11, 1.5, 0.69, -0.11, 1.28, 0.47, 3.65, 0.23, 2.95, 0.5, 3.61, 0.87, 1.68, 0.69, 0.75, 0.61, 12.37, 4.96, 0.14, 2.77, 0.75]} \ No newline at end of file diff --git a/annotations_1/ra9UQb-OVqQ_filtered.json b/annotations_1/ra9UQb-OVqQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb1b419207e0aa81850985644bb51acbe87772a4 --- /dev/null +++ b/annotations_1/ra9UQb-OVqQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.87], [10.0, 16.88], [22.0, 21.84], [23.0, 23.5], [24.0, 29.86], [31.0, 30.75], [38.0, 41.81], [48.0, 51.61], [53.0, 55.59], [58.0, 61.08], [62.0, 62.95], [66.0, 68.45], [77.0, 77.95]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [34.28, 36.15, 0.0, 0.0, 31.04, 0.0, 33.79, 34.65, 94.22, 46.12, 0.0, 48.65, 0.0], "audiomae_on_audioset": [[["music", 40.28], ["speech", 29.37], ["busy signal", 2.56]], [["music", 53.15], ["speech", 17.1], ["throbbing", 2.56]], null, null, [["music", 52.91], ["speech", 24.68], ["boing", 3.22]], null, [["music", 24.99], ["hum", 16.15], ["mains hum", 10.17]], [["music", 53.55], ["throbbing", 13.4], ["hum", 12.5]], null, [["thunk", 38.05], ["arrow", 29.26], ["animal", 2.88]], null, [["music", 40.8], ["animal", 8.2], ["livestock, farm animals, working animals", 7.64]], null], "duration": [4.87, 6.88, -0.16, 0.5, 5.86, -0.25, 3.81, 3.61, 2.59, 3.08, 0.95, 2.45, 0.95]} \ No newline at end of file diff --git a/annotations_1/raDWhK7iSqU_filtered.json b/annotations_1/raDWhK7iSqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..463a145617ebbbe425141dae61b6c14a69ae7144 --- /dev/null +++ b/annotations_1/raDWhK7iSqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.67], [14.0, 22.77], [33.0, 32.9], [33.0, 34.28], [35.0, 35.77], [37.0, 47.71], [50.0, 52.17], [59.0, 59.31], [60.0, 62.23], [68.0, 79.32], [79.0, 81.63], [83.0, 84.08], [92.0, 96.04], [97.0, 97.02], [98.0, 99.55], [102.0, 102.61], [103.0, 124.82], [132.0, 151.97], [153.0, 153.54], [154.0, 154.7]], "keep_status": [true, false, false, false, false, false, true, false, true, true, true, false, true, false, false, false, false, false, false, false], "silence_prob": [35.28, 35.65, 0.0, 0.0, 0.0, 35.47, 33.07, 0.0, 35.67, 35.18, 33.81, 0.0, 42.79, 0.0, 0.0, 0.0, 34.05, 35.56, 0.0, 0.0], "audiomae_on_audioset": [[["music", 15.24], ["mosquito", 13.2], ["fly, housefly", 10.75]], [["music", 67.48], ["animal", 4.96], ["quack", 2.07]], null, null, null, [["speech", 30.97], ["music", 23.19], ["groan", 16.47]], [["hum", 41.25], ["throbbing", 20.79], ["noise", 5.78]], null, [["music", 28.68], ["groan", 14.52], ["didgeridoo", 9.54]], [["music", 33.21], ["fly, housefly", 8.99], ["moo", 6.36]], [["fly, housefly", 31.21], ["insect", 11.02], ["music", 9.59]], null, [["theremin", 39.08], ["music", 13.45], ["speech", 7.53]], null, null, null, [["music", 58.33], ["didgeridoo", 9.29], ["insect", 4.63]], [["music", 66.08], ["sonar", 16.94], ["didgeridoo", 2.24]], null, null], "duration": [4.67, 8.77, -0.1, 1.28, 0.77, 10.71, 2.17, 0.31, 2.23, 11.32, 2.63, 1.08, 4.04, 0.02, 1.55, 0.61, 21.82, 19.97, 0.54, 0.7]} \ No newline at end of file diff --git a/annotations_1/raM63LAHuwo_filtered.json b/annotations_1/raM63LAHuwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0cf627c1076824bf396a08966a7982e513d3c08c --- /dev/null +++ b/annotations_1/raM63LAHuwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.08], [5.0, 7.3], [10.0, 11.1], [14.0, 19.09], [20.0, 22.2], [23.0, 23.46], [25.0, 31.33], [31.0, 32.8], [35.0, 35.87], [37.0, 38.11], [40.0, 40.78], [44.0, 45.0], [48.0, 49.01], [51.0, 51.44], [52.0, 52.74], [54.0, 56.4], [58.0, 68.59], [70.0, 74.82], [76.0, 79.05], [79.0, 85.06], [85.0, 89.5], [91.0, 91.69], [93.0, 93.29], [94.0, 95.98], [97.0, 97.46], [98.0, 98.52], [100.0, 100.75], [107.0, 107.22], [110.0, 111.03], [112.0, 112.89], [113.0, 113.95], [115.0, 115.65], [118.0, 118.81], [120.0, 145.15], [147.0, 148.93], [151.0, 162.53], [165.0, 164.86], [166.0, 175.29], [176.0, 176.54], [177.0, 177.77], [178.0, 178.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 94.52, 0.0, 97.92, 99.96, 0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 94.95, 83.34, 98.36, 86.82, 71.87, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 51.28, 0.0, 50.91, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.08, 2.3, 1.1, 5.09, 2.2, 0.46, 6.33, 1.8, 0.87, 1.11, 0.78, 1.0, 1.01, 0.44, 0.74, 2.4, 10.59, 4.82, 3.05, 6.06, 4.5, 0.69, 0.29, 1.98, 0.46, 0.52, 0.75, 0.22, 1.03, 0.89, 0.95, 0.65, 0.81, 25.15, 1.93, 11.53, -0.14, 9.29, 0.54, 0.77, 0.12]} \ No newline at end of file diff --git a/annotations_1/raSWINBYtuc_filtered.json b/annotations_1/raSWINBYtuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..088a863688a7557b0320d4fc2458b68d8310ac53 --- /dev/null +++ b/annotations_1/raSWINBYtuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 31.87], [33.0, 33.81], [44.0, 45.25], [52.0, 52.37], [54.0, 54.14], [56.0, 56.27], [60.0, 76.77], [79.0, 82.46], [83.0, 84.81], [86.0, 118.5], [119.0, 119.87], [121.0, 124.34], [130.0, 131.38], [134.0, 148.12], [149.0, 149.17], [151.0, 150.99], [158.0, 158.31], [163.0, 164.17], [165.0, 166.5], [172.0, 173.37]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [30.52, 0.0, 0.0, 0.0, 0.0, 0.0, 29.65, 28.98, 0.0, 0.0, 0.0, 31.05, 0.0, 32.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 39.19], ["hum", 25.86], ["music", 21.01]], null, null, null, null, null, [["music", 36.46], ["throbbing", 23.47], ["hum", 15.81]], [["music", 24.94], ["speech", 23.86], ["explosion", 17.8]], null, null, null, [["music", 44.47], ["mains hum", 10.47], ["didgeridoo", 7.43]], null, [["hum", 48.7], ["mains hum", 42.09], ["buzz", 3.17]], null, null, null, null, null, null], "duration": [15.87, 0.81, 1.25, 0.37, 0.14, 0.27, 16.77, 3.46, 1.81, 32.5, 0.87, 3.34, 1.38, 14.12, 0.17, -0.01, 0.31, 1.17, 1.5, 1.37]} \ No newline at end of file diff --git a/annotations_1/rbYJb_i2czc_filtered.json b/annotations_1/rbYJb_i2czc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f493d2425f651fd91e9771ce892001cbaf89f649 --- /dev/null +++ b/annotations_1/rbYJb_i2czc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.85], [24.0, 25.51], [26.0, 28.43], [34.0, 46.47], [47.0, 47.65], [56.0, 55.92], [57.0, 69.72], [71.0, 71.56], [76.0, 77.89], [79.0, 80.5], [81.0, 87.72], [89.0, 90.69]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 29.42, 30.06, 0.0, 0.0, 30.72, 0.0, 0.0, 0.0, 39.72, 0.0], "audiomae_on_audioset": [null, null, [["music", 33.66], ["hum", 26.0], ["mains hum", 19.21]], [["music", 54.68], ["throbbing", 24.99], ["hum", 8.42]], null, null, [["speech", 20.51], ["thump, thud", 15.29], ["music", 13.4]], null, null, null, [["hum", 31.37], ["speech", 18.7], ["music", 15.32]], null], "duration": [1.85, 1.51, 2.43, 12.47, 0.65, -0.08, 12.72, 0.56, 1.89, 1.5, 6.72, 1.69]} \ No newline at end of file diff --git a/annotations_1/rbhNKSWKWwU_filtered.json b/annotations_1/rbhNKSWKWwU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fddce614a447c49650d76419aedce21bfb71397a --- /dev/null +++ b/annotations_1/rbhNKSWKWwU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.37], [8.0, 10.76], [19.0, 19.4], [32.0, 32.17], [56.0, 56.19], [57.0, 61.7], [63.0, 71.07], [73.0, 73.52], [77.0, 78.58], [87.0, 93.6], [108.0, 110.15], [117.0, 118.54], [120.0, 121.44], [124.0, 128.58], [130.0, 129.73], [142.0, 149.35], [152.0, 153.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [45.92, 82.25, 0.0, 0.0, 0.0, 31.54, 38.7, 0.0, 0.0, 46.12, 31.99, 0.0, 0.0, 31.16, 0.0, 28.73, 0.0], "audiomae_on_audioset": [[["chirp tone", 44.59], ["sine wave", 29.59], ["hum", 7.29]], null, null, null, null, [["music", 71.01], ["speech", 12.62], ["musical instrument", 3.36]], [["chirp tone", 33.98], ["busy signal", 31.48], ["sine wave", 21.35]], null, null, [["chirp tone", 48.19], ["sine wave", 18.68], ["speech", 6.24]], [["speech", 46.24], ["whale vocalization", 10.09], ["hum", 5.71]], null, null, [["speech", 37.67], ["music", 27.12], ["didgeridoo", 6.86]], null, [["speech", 27.59], ["music", 13.04], ["sound effect", 8.09]], null], "duration": [4.37, 2.76, 0.4, 0.17, 0.19, 4.7, 8.07, 0.52, 1.58, 6.6, 2.15, 1.54, 1.44, 4.58, -0.27, 7.35, 1.15]} \ No newline at end of file diff --git a/annotations_1/rbrIQjVNl0E_filtered.json b/annotations_1/rbrIQjVNl0E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2dacc2e2e1da8a2792ee72d2b302c00e03379732 --- /dev/null +++ b/annotations_1/rbrIQjVNl0E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.87], [7.0, 7.57], [10.0, 18.01], [23.0, 23.82], [26.0, 34.45], [36.0, 36.59], [37.0, 38.1], [41.0, 41.47], [42.0, 89.43], [91.0, 93.28], [99.0, 99.64], [102.0, 111.0], [119.0, 132.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 29.88, 0.0, 29.75, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 31.62, 30.88], "audiomae_on_audioset": [null, null, [["music", 61.15], ["throbbing", 6.42], ["sidetone", 5.97]], null, [["speech", 40.4], ["music", 33.59], ["throbbing", 6.51]], null, null, null, null, [["music", 35.57], ["didgeridoo", 25.45], ["speech", 10.62]], null, [["music", 38.5], ["hum", 23.34], ["throbbing", 10.46]], [["music", 45.3], ["hum", 20.59], ["mains hum", 8.48]]], "duration": [-0.13, 0.57, 8.01, 0.82, 8.45, 0.59, 1.1, 0.47, 47.43, 2.28, 0.64, 9.0, 13.88]} \ No newline at end of file diff --git a/annotations_1/rcA0MBnPPM8_filtered.json b/annotations_1/rcA0MBnPPM8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e5d10a77b6e74be3b0428c36cfd566498f9e61e9 --- /dev/null +++ b/annotations_1/rcA0MBnPPM8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.55], [18.0, 22.92], [27.0, 27.75], [35.0, 36.21], [49.0, 55.83]], "keep_status": [false, false, false, false, false], "silence_prob": [33.67, 36.22, 0.0, 0.0, 35.54], "audiomae_on_audioset": [[["music", 60.35], ["didgeridoo", 10.83], ["speech", 4.94]], [["music", 50.67], ["speech", 10.67], ["didgeridoo", 8.77]], null, null, [["music", 56.07], ["didgeridoo", 10.2], ["speech", 9.34]]], "duration": [3.55, 4.92, 0.75, 1.21, 6.83]} \ No newline at end of file diff --git a/annotations_1/rcIfzdLjjxU_filtered.json b/annotations_1/rcIfzdLjjxU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..615ecfd5b337268ca9cdb0c623d47d48bf201bef --- /dev/null +++ b/annotations_1/rcIfzdLjjxU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.56], [10.0, 10.89], [11.0, 15.92], [18.0, 18.44], [19.0, 25.51], [27.0, 28.43], [29.0, 32.56], [36.0, 39.26], [40.0, 46.3], [49.0, 49.62], [52.0, 53.35], [55.0, 56.05], [58.0, 59.51], [61.0, 62.06], [63.0, 64.79], [66.0, 67.27], [69.0, 70.16], [72.0, 72.2], [76.0, 76.0], [79.0, 79.27], [79.0, 79.51], [81.0, 81.67], [83.0, 83.29], [86.0, 87.56], [89.0, 92.2], [92.0, 95.81], [97.0, 97.73], [99.0, 99.37], [102.0, 102.25], [103.0, 103.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.08, 0.0, 47.31, 0.0, 95.23, 44.6, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 57.01, 49.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["sidetone", 47.8], ["music", 21.99], ["speech", 10.24]], null, [["hum", 28.03], ["throbbing", 26.38], ["music", 16.64]], null, null, [["speech", 66.34], ["hum", 2.99], ["outside, rural or natural", 2.85]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 61.11], ["mains hum", 10.51], ["throbbing", 10.04]], null, null, null, null], "duration": [0.56, 0.89, 4.92, 0.44, 6.51, 1.43, 3.56, 3.26, 6.3, 0.62, 1.35, 1.05, 1.51, 1.06, 1.79, 1.27, 1.16, 0.2, 0.0, 0.27, 0.51, 0.67, 0.29, 1.56, 3.2, 3.81, 0.73, 0.37, 0.25, 0.54]} \ No newline at end of file diff --git a/annotations_1/rczP7CJB4Hs_filtered.json b/annotations_1/rczP7CJB4Hs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af285f03f218a71630dcecd57760e81635c7d3b5 --- /dev/null +++ b/annotations_1/rczP7CJB4Hs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.89], [20.0, 21.0], [69.0, 69.13], [79.0, 79.78], [86.0, 86.66], [105.0, 105.61]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [-0.11, 1.0, 0.13, 0.78, 0.66, 0.61]} \ No newline at end of file diff --git a/annotations_1/rd8JDPjEoE0_filtered.json b/annotations_1/rd8JDPjEoE0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..087ed14d1e2cc1f398e2c414800348665722212e --- /dev/null +++ b/annotations_1/rd8JDPjEoE0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [4.0, 8.63], [11.0, 18.76], [20.0, 61.16], [64.0, 88.7], [93.0, 105.36], [107.0, 109.93], [115.0, 150.06], [151.0, 152.66], [153.0, 161.57], [164.0, 175.53]], "keep_status": [false, true, true, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 28.68, 29.98, 0.0, 28.48, 32.86, 30.37, 0.0, 0.0, 65.79, 56.78], "audiomae_on_audioset": [null, [["speech", 57.99], ["vehicle", 8.59], ["car", 3.24]], [["speech", 33.63], ["hum", 23.96], ["music", 11.62]], null, [["speech", 19.17], ["music", 15.77], ["vehicle", 5.7]], [["music", 37.86], ["hum", 29.85], ["mains hum", 16.28]], [["music", 35.66], ["hum", 11.95], ["scary music", 10.51]], null, null, null, null], "duration": [0.57, 4.63, 7.76, 41.16, 24.7, 12.36, 2.93, 35.06, 1.66, 8.57, 11.53]} \ No newline at end of file diff --git a/annotations_1/rdWIo5R10CM_filtered.json b/annotations_1/rdWIo5R10CM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4567c4d28cd345645ec095c09cf50fb1593191a0 --- /dev/null +++ b/annotations_1/rdWIo5R10CM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.06], [9.0, 10.29], [12.0, 42.69], [43.0, 55.92], [60.0, 60.52], [65.0, 65.3], [72.0, 129.02], [131.0, 139.82]], "keep_status": [false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 28.46, 0.0, 0.0, 0.0, 30.75], "audiomae_on_audioset": [null, null, null, [["music", 51.62], ["didgeridoo", 10.88], ["throbbing", 9.93]], null, null, null, [["speech", 34.55], ["radio", 5.33], ["livestock, farm animals, working animals", 4.51]]], "duration": [1.06, 1.29, 30.69, 12.92, 0.52, 0.3, 57.02, 8.82]} \ No newline at end of file diff --git a/annotations_1/re_liKgRGew_filtered.json b/annotations_1/re_liKgRGew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef44432b0ca1585bf1f2904bc34647961c2d2349 --- /dev/null +++ b/annotations_1/re_liKgRGew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.1], [9.0, 51.19], [52.0, 53.4], [54.0, 54.67], [59.0, 58.97], [61.0, 61.8], [63.0, 64.13], [65.0, 66.66], [69.0, 69.45], [70.0, 71.12], [72.0, 72.69], [75.0, 75.52], [84.0, 84.74], [86.0, 87.27], [89.0, 89.14], [90.0, 90.71], [93.0, 93.11], [94.0, 95.0], [99.0, 99.18], [101.0, 102.63], [105.0, 105.53], [107.0, 108.26], [109.0, 113.75], [115.0, 115.5], [118.0, 119.91], [121.0, 123.84], [133.0, 142.74], [143.0, 144.54], [148.0, 149.15], [150.0, 151.43], [152.0, 153.17], [155.0, 155.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.84, 0.0, 0.0, 39.74, 32.44, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 29.81], ["speech", 11.39], ["burst, pop", 8.15]], null, null, [["music", 45.46], ["synthesizer", 22.38], ["drum machine", 5.87]], [["music", 47.11], ["boing", 6.92], ["electric shaver, electric razor", 3.81]], null, null, null, null, null], "duration": [0.1, 42.19, 1.4, 0.67, -0.03, 0.8, 1.13, 1.66, 0.45, 1.12, 0.69, 0.52, 0.74, 1.27, 0.14, 0.71, 0.11, 1.0, 0.18, 1.63, 0.53, 1.26, 4.75, 0.5, 1.91, 2.84, 9.74, 1.54, 1.15, 1.43, 1.17, 0.65]} \ No newline at end of file diff --git a/annotations_1/refu69Hu5R0_filtered.json b/annotations_1/refu69Hu5R0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..baee76e0625b0d0643cd6650478850ea4d2d17b4 --- /dev/null +++ b/annotations_1/refu69Hu5R0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.02], [4.0, 12.19], [14.0, 14.03], [15.0, 15.99], [24.0, 24.6], [26.0, 28.76], [30.0, 32.46], [35.0, 35.82], [38.0, 38.23], [40.0, 43.66], [45.0, 45.72], [51.0, 56.61], [57.0, 65.1], [66.0, 67.31], [69.0, 69.13], [70.0, 70.09], [73.0, 73.82], [75.0, 74.95], [78.0, 78.02], [81.0, 82.26], [83.0, 83.79], [84.0, 84.89], [86.0, 86.41], [90.0, 93.33], [94.0, 94.85], [96.0, 97.12], [99.0, 98.96], [100.0, 102.17], [104.0, 105.36], [106.0, 106.74], [108.0, 108.21], [110.0, 112.83], [113.0, 116.07], [118.0, 118.81], [119.0, 119.33], [125.0, 125.25], [126.0, 126.64], [128.0, 129.47], [130.0, 130.72], [132.0, 133.02], [137.0, 142.5], [144.0, 144.83], [146.0, 147.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 35.67, 0.0, 0.0, 0.0, 61.57, 99.21, 0.0, 0.0, 47.05, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 79.07, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.8, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 64.17], ["explosion", 4.69], ["music", 4.58]], null, null, null, null, null, null, null, [["speech", 57.71], ["whale vocalization", 11.84], ["fart", 2.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["explosion", 27.31], ["burst, pop", 15.22], ["glass", 8.03]], null, null], "duration": [0.02, 8.19, 0.03, 0.99, 0.6, 2.76, 2.46, 0.82, 0.23, 3.66, 0.72, 5.61, 8.1, 1.31, 0.13, 0.09, 0.82, -0.05, 0.02, 1.26, 0.79, 0.89, 0.41, 3.33, 0.85, 1.12, -0.04, 2.17, 1.36, 0.74, 0.21, 2.83, 3.07, 0.81, 0.33, 0.25, 0.64, 1.47, 0.72, 1.02, 5.5, 0.83, 1.02]} \ No newline at end of file diff --git a/annotations_1/relfjwjhscE_filtered.json b/annotations_1/relfjwjhscE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07e7f449b8715c746248cf7bc28dd49289128018 --- /dev/null +++ b/annotations_1/relfjwjhscE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 83.39], [84.0, 95.44], [97.0, 101.11]], "keep_status": [false, true, true], "silence_prob": [0.0, 30.02, 37.61], "audiomae_on_audioset": [null, [["hum", 29.82], ["mains hum", 20.67], ["music", 14.54]], [["hum", 26.22], ["music", 17.18], ["throbbing", 14.89]]], "duration": [66.39, 11.44, 4.11]} \ No newline at end of file diff --git a/annotations_1/reyTknNqDjA_filtered.json b/annotations_1/reyTknNqDjA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8df0ab15fdd44980c4f7cedcf1a967bbf2c1aa07 --- /dev/null +++ b/annotations_1/reyTknNqDjA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 50.46], [52.0, 93.63]], "keep_status": [false, false], "silence_prob": [34.1, 0.0], "audiomae_on_audioset": [[["music", 75.59], ["throbbing", 7.8], ["hum", 2.37]], null], "duration": [14.46, 41.63]} \ No newline at end of file diff --git a/annotations_1/rey_J7jIvno_filtered.json b/annotations_1/rey_J7jIvno_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a561a1cd14041b85e852f833ccc8ea006f1e491 --- /dev/null +++ b/annotations_1/rey_J7jIvno_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.74], [16.0, 61.32], [62.0, 133.05]], "keep_status": [false, false, false], "silence_prob": [33.04, 0.0, 0.0], "audiomae_on_audioset": [[["mains hum", 38.02], ["hum", 33.94], ["music", 15.5]], null, null], "duration": [6.74, 45.32, 71.05]} \ No newline at end of file diff --git a/annotations_1/rezZBgaJGoM_filtered.json b/annotations_1/rezZBgaJGoM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4db5b6159f7adb7eabcdeb2704575bf16b4f2c9 --- /dev/null +++ b/annotations_1/rezZBgaJGoM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [34.0, 34.7], [36.0, 36.83], [37.0, 38.58], [42.0, 44.04], [48.0, 49.08], [52.0, 52.32], [73.0, 73.52], [80.0, 87.62], [99.0, 99.39], [104.0, 106.84], [115.0, 115.57]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 73.36, 0.0, 0.0, 0.0, 30.29, 0.0, 48.61, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["whip", 32.72], ["speech", 19.42], ["whack, thwack", 12.91]], null, [["speech", 29.02], ["sidetone", 17.51], ["sine wave", 14.28]], null], "duration": [0.48, 0.7, 0.83, 1.58, 2.04, 1.08, 0.32, 0.52, 7.62, 0.39, 2.84, 0.57]} \ No newline at end of file diff --git a/annotations_1/rgd8TC1Q09g_filtered.json b/annotations_1/rgd8TC1Q09g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64b6cbe789e6e4957242950898fb62ab85bda8da --- /dev/null +++ b/annotations_1/rgd8TC1Q09g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.06], [15.0, 19.79], [22.0, 28.32], [38.0, 40.68], [58.0, 58.56], [65.0, 66.24], [70.0, 71.07]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [89.19, 99.82, 99.62, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [4.06, 4.79, 6.32, 2.68, 0.56, 1.24, 1.07]} \ No newline at end of file diff --git a/annotations_1/rglfoXHFty8_filtered.json b/annotations_1/rglfoXHFty8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35f9aa9a8a0d74237b702524851fd5075ff05d97 --- /dev/null +++ b/annotations_1/rglfoXHFty8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.09], [6.0, 7.57], [19.0, 20.98], [26.0, 27.24], [29.0, 34.48], [38.0, 38.7], [39.0, 39.6], [51.0, 98.1], [98.0, 100.13], [100.0, 100.5], [101.0, 101.49], [111.0, 111.67], [113.0, 146.01], [148.0, 149.27], [151.0, 153.1], [156.0, 156.07], [161.0, 161.35], [163.0, 163.24], [166.0, 167.39], [169.0, 168.76]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.82, 0.0, 0.0, 0.0, 30.47, 0.0, 0.0, 0.0, 0.0, 0.0, 45.21, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 20.59], ["music", 14.36], ["electric shaver, electric razor", 14.35]], null, null, null, [["music", 65.38], ["speech", 4.57], ["hum", 3.2]], null, null, null, null, null, [["music", 51.81], ["throbbing", 16.52], ["electronic music", 4.42]], null, null, null, null, null], "duration": [1.09, 1.57, 1.98, 1.24, 5.48, 0.7, 0.6, 47.1, 2.13, 0.5, 0.49, 0.67, 33.01, 1.27, 2.1, 0.07, 0.35, 0.24, 1.39, -0.24]} \ No newline at end of file diff --git a/annotations_1/rgmKJYrtmkw_filtered.json b/annotations_1/rgmKJYrtmkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3996f4cb359e7ec100fa6e786434a781511ad7b7 --- /dev/null +++ b/annotations_1/rgmKJYrtmkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.82], [5.0, 5.49], [6.0, 6.47], [8.0, 8.33], [10.0, 10.1], [10.0, 10.64], [12.0, 14.82], [17.0, 19.16], [21.0, 25.61], [27.0, 27.08], [32.0, 39.93], [49.0, 52.51], [55.0, 56.12], [60.0, 61.08], [73.0, 77.62], [78.0, 77.65], [86.0, 87.03], [89.0, 94.93], [118.0, 118.3], [141.0, 142.16]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 100.0, 48.91, 0.0, 39.22, 46.83, 0.0, 0.0, 64.86, 0.0, 0.0, 39.77, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 33.74], ["music", 12.75], ["frog", 12.09]], null, [["speech", 54.19], ["thunk", 26.48], ["music", 5.23]], [["music", 42.52], ["didgeridoo", 7.01], ["animal", 5.66]], null, null, null, null, null, [["music", 39.01], ["speech", 12.27], ["throbbing", 10.22]], null, null], "duration": [1.82, 0.49, 0.47, 0.33, 0.1, 0.64, 2.82, 2.16, 4.61, 0.08, 7.93, 3.51, 1.12, 1.08, 4.62, -0.35, 1.03, 5.93, 0.3, 1.16]} \ No newline at end of file diff --git a/annotations_1/rhFw9HYTReY_filtered.json b/annotations_1/rhFw9HYTReY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edb1ed206b83e6f3217134a63cfe4b84c19a0f49 --- /dev/null +++ b/annotations_1/rhFw9HYTReY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 49.82], [54.0, 104.82]], "keep_status": [false, false], "silence_prob": [30.97, 0.0], "audiomae_on_audioset": [[["music", 42.86], ["didgeridoo", 37.02], ["trombone", 2.53]], null], "duration": [14.82, 50.82]} \ No newline at end of file diff --git a/annotations_1/rhfBzC5A79o_filtered.json b/annotations_1/rhfBzC5A79o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f7385a0480d688d86b5fa64148aad09260f37ac --- /dev/null +++ b/annotations_1/rhfBzC5A79o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 31.83], [34.0, 35.14], [42.0, 41.67], [44.0, 43.8], [48.0, 51.61], [52.0, 54.01], [54.0, 54.09], [54.0, 56.05], [57.0, 62.06], [65.0, 65.6], [70.0, 83.66], [87.0, 89.75], [91.0, 98.25], [102.0, 105.09], [107.0, 106.83], [108.0, 108.97], [110.0, 110.74], [112.0, 113.32], [115.0, 118.3], [119.0, 122.62]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.37, 0.0, 0.0, 0.0, 99.84, 37.32, 0.0, 37.02, 33.41, 0.0, 98.99, 99.85, 95.09, 44.55, 0.0, 0.0, 0.0, 0.0, 99.84, 42.42], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 48.63], ["busy signal", 22.3], ["sine wave", 12.56]], null, [["speech", 29.49], ["noise", 12.99], ["sidetone", 6.85]], [["speech", 55.03], ["whimper", 4.21], ["laughter", 3.79]], null, null, null, null, [["speech", 53.28], ["busy signal", 20.92], ["dial tone", 8.39]], null, null, null, null, null, [["speech", 35.37], ["dial tone", 29.72], ["sine wave", 25.65]]], "duration": [2.83, 1.14, -0.33, -0.2, 3.61, 2.01, 0.09, 2.05, 5.06, 0.6, 13.66, 2.75, 7.25, 3.09, -0.17, 0.97, 0.74, 1.32, 3.3, 3.62]} \ No newline at end of file diff --git a/annotations_1/rhkkbjKcaJ0_filtered.json b/annotations_1/rhkkbjKcaJ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2e9d98b29c726c68302e6b77bf5d396821cac6bd --- /dev/null +++ b/annotations_1/rhkkbjKcaJ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.29], [10.0, 11.77], [12.0, 13.78], [15.0, 17.56], [19.0, 23.38], [25.0, 112.89], [116.0, 138.23], [140.0, 172.22]], "keep_status": [true, false, false, false, true, false, false, false], "silence_prob": [49.22, 0.0, 0.0, 56.63, 43.45, 0.0, 30.86, 0.0], "audiomae_on_audioset": [[["speech", 27.43], ["hum", 12.71], ["mains hum", 6.69]], null, null, null, [["music", 48.21], ["throbbing", 4.78], ["hum", 4.73]], null, [["hum", 50.08], ["mains hum", 28.26], ["music", 5.87]], null], "duration": [2.29, 1.77, 1.78, 2.56, 4.38, 87.89, 22.23, 32.22]} \ No newline at end of file diff --git a/annotations_1/rhnCmErsnYA_filtered.json b/annotations_1/rhnCmErsnYA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..809e3c0deb2f22e0d7fc4e2431b5606a539fe773 --- /dev/null +++ b/annotations_1/rhnCmErsnYA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.96], [14.0, 14.79], [17.0, 19.55], [21.0, 23.46], [24.0, 35.68], [42.0, 44.44], [44.0, 44.51], [45.0, 44.61], [45.0, 55.53], [60.0, 75.36], [77.0, 77.7], [79.0, 82.32], [84.0, 84.08], [86.0, 88.65], [92.0, 128.33], [132.0, 134.45], [136.0, 141.4], [141.0, 141.44], [144.0, 148.14]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 53.72, 31.42, 30.97, 30.53, 0.0, 0.0, 30.62, 30.15, 0.0, 34.18, 0.0, 32.56, 0.0, 30.15, 29.86, 0.0, 31.71], "audiomae_on_audioset": [null, null, null, [["music", 59.41], ["throbbing", 10.16], ["hum", 7.45]], [["music", 79.49], ["electronic music", 3.03], ["speech", 2.28]], [["music", 42.9], ["didgeridoo", 21.09], ["musical instrument", 5.15]], null, null, [["speech", 39.75], ["music", 29.66], ["whack, thwack", 5.17]], [["music", 36.97], ["speech", 33.85], ["whack, thwack", 3.44]], null, [["music", 47.87], ["boing", 19.22], ["synthesizer", 7.29]], null, [["moo", 42.46], ["cattle, bovinae", 38.77], ["livestock, farm animals, working animals", 16.39]], null, [["moo", 36.99], ["livestock, farm animals, working animals", 32.1], ["cattle, bovinae", 29.87]], [["boing", 39.13], ["music", 34.17], ["speech", 11.7]], null, [["speech", 30.72], ["music", 29.89], ["throbbing", 6.45]]], "duration": [1.96, 0.79, 2.55, 2.46, 11.68, 2.44, 0.51, -0.39, 10.53, 15.36, 0.7, 3.32, 0.08, 2.65, 36.33, 2.45, 5.4, 0.44, 4.14]} \ No newline at end of file diff --git a/annotations_1/ri8WqeTAUDE_filtered.json b/annotations_1/ri8WqeTAUDE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abfa6453dcc3160309d8511c88b9d783390978d9 --- /dev/null +++ b/annotations_1/ri8WqeTAUDE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.86], [6.0, 6.51], [11.0, 15.94], [16.0, 21.2], [24.0, 25.2], [27.0, 27.68], [30.0, 30.64], [39.0, 38.85], [50.0, 50.55], [54.0, 54.45], [71.0, 72.27], [75.0, 75.22], [75.0, 76.13], [77.0, 77.8], [79.0, 79.56], [81.0, 88.55], [89.0, 93.56], [100.0, 99.93], [103.0, 103.45], [104.0, 104.11], [106.0, 106.07], [108.0, 111.99], [120.0, 120.56], [128.0, 128.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 65.32, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.81, 99.05, 0.0, 0.0, 0.0, 0.0, 97.64, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.86, 0.51, 4.94, 5.2, 1.2, 0.68, 0.64, -0.15, 0.55, 0.45, 1.27, 0.22, 1.13, 0.8, 0.56, 7.55, 4.56, -0.07, 0.45, 0.11, 0.07, 3.99, 0.56, 0.82]} \ No newline at end of file diff --git a/annotations_1/riSEerXD6nE_filtered.json b/annotations_1/riSEerXD6nE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba1b2831d6959126a0d1df55d07f20dbf6d8e9f0 --- /dev/null +++ b/annotations_1/riSEerXD6nE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.39], [11.0, 11.55], [14.0, 15.13], [20.0, 28.66], [30.0, 31.16], [32.0, 32.12], [33.0, 34.21], [37.0, 38.57], [44.0, 45.71], [52.0, 53.47], [56.0, 56.13], [59.0, 60.76], [61.0, 62.18], [64.0, 63.93], [67.0, 68.67], [69.0, 70.02], [76.0, 77.28], [78.0, 77.7], [78.0, 78.06], [80.0, 80.99], [82.0, 83.81], [85.0, 86.14], [88.0, 87.98], [91.0, 91.86], [92.0, 97.04], [98.0, 98.46], [104.0, 112.35], [113.0, 113.68], [115.0, 119.4], [121.0, 123.89], [124.0, 124.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 71.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.18, 0.0, 86.64, 0.0, 99.94, 30.01, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 44.66], ["musical instrument", 8.93], ["cough", 8.43]], null], "duration": [1.39, 0.55, 1.13, 8.66, 1.16, 0.12, 1.21, 1.57, 1.71, 1.47, 0.13, 1.76, 1.18, -0.07, 1.67, 1.02, 1.28, -0.3, 0.06, 0.99, 1.81, 1.14, -0.02, 0.86, 5.04, 0.46, 8.35, 0.68, 4.4, 2.89, 0.92]} \ No newline at end of file diff --git a/annotations_1/rilZTyv9RLo_filtered.json b/annotations_1/rilZTyv9RLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f65d2808bd2641dac797b359252613ef389916af --- /dev/null +++ b/annotations_1/rilZTyv9RLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.59], [15.0, 19.11], [20.0, 20.51], [25.0, 25.3], [29.0, 29.52], [41.0, 44.74], [49.0, 49.86], [52.0, 54.35], [56.0, 58.78], [60.0, 62.45], [77.0, 78.0], [86.0, 87.18], [91.0, 92.35], [100.0, 102.22], [118.0, 118.54], [120.0, 120.26], [131.0, 131.19]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false], "silence_prob": [42.51, 41.58, 0.0, 0.0, 0.0, 33.17, 0.0, 53.78, 40.12, 31.23, 0.0, 0.0, 0.0, 29.75, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["boing", 59.51], ["music", 17.71], ["speech", 10.73]], [["music", 49.82], ["speech", 34.95], ["scratching (performance technique)", 3.36]], null, null, null, [["music", 56.15], ["theremin", 14.87], ["didgeridoo", 3.38]], null, null, [["music", 26.68], ["synthesizer", 19.76], ["noise", 7.52]], [["speech", 27.35], ["music", 16.91], ["fart", 15.94]], null, null, null, [["music", 35.16], ["speech", 19.89], ["didgeridoo", 6.08]], null, null, null], "duration": [2.59, 4.11, 0.51, 0.3, 0.52, 3.74, 0.86, 2.35, 2.78, 2.45, 1.0, 1.18, 1.35, 2.22, 0.54, 0.26, 0.19]} \ No newline at end of file diff --git a/annotations_1/rjnLGy6uWKc_filtered.json b/annotations_1/rjnLGy6uWKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1763f0436597ca70ac4704b1c9f292069696084 --- /dev/null +++ b/annotations_1/rjnLGy6uWKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.48], [16.0, 16.9], [19.0, 19.79], [28.0, 30.7], [32.0, 33.25], [36.0, 36.69], [42.0, 42.84], [44.0, 45.93], [48.0, 48.52], [55.0, 55.11], [59.0, 60.07], [100.0, 99.96], [101.0, 103.74], [106.0, 109.04], [132.0, 133.64], [135.0, 135.21]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [75.39, 0.0, 0.0, 37.84, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 32.76], ["speech", 14.21], ["mosquito", 9.8]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.48, 0.9, 0.79, 2.7, 1.25, 0.69, 0.84, 1.93, 0.52, 0.11, 1.07, -0.04, 2.74, 3.04, 1.64, 0.21]} \ No newline at end of file diff --git a/annotations_1/rlMANFZdCkk_filtered.json b/annotations_1/rlMANFZdCkk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cdf3e07829e561f27d3080de0d8994aa58d2e67c --- /dev/null +++ b/annotations_1/rlMANFZdCkk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.99], [31.0, 30.77], [31.0, 31.77], [33.0, 33.67], [45.0, 63.14], [76.0, 76.54], [77.0, 78.17], [80.0, 81.55], [82.0, 83.05], [85.0, 85.21], [85.0, 85.6], [98.0, 99.94], [104.0, 104.73], [116.0, 117.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 87.74], ["funk", 0.9], ["musical instrument", 0.79]], null, null, null, null, null, null, null, null, null], "duration": [0.99, -0.23, 0.77, 0.67, 18.14, 0.54, 1.17, 1.55, 1.05, 0.21, 0.6, 1.94, 0.73, 1.09]} \ No newline at end of file diff --git a/annotations_1/rlXKgVlILbM_filtered.json b/annotations_1/rlXKgVlILbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b610c144b5c14d27e61761c1676e887a8b877561 --- /dev/null +++ b/annotations_1/rlXKgVlILbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.61], [2.0, 2.79], [3.0, 3.7], [7.0, 8.31], [16.0, 16.14], [18.0, 18.66], [20.0, 20.82], [25.0, 25.07], [32.0, 33.81], [35.0, 35.09], [37.0, 42.04], [42.0, 42.94], [47.0, 47.55], [62.0, 62.45], [64.0, 65.92], [68.0, 68.55], [73.0, 73.8], [90.0, 89.65], [92.0, 92.57], [108.0, 108.51], [113.0, 112.99], [116.0, 116.19], [117.0, 117.51], [119.0, 118.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.61, 0.79, 0.7, 1.31, 0.14, 0.66, 0.82, 0.07, 1.81, 0.09, 5.04, 0.94, 0.55, 0.45, 1.92, 0.55, 0.8, -0.35, 0.57, 0.51, -0.01, 0.19, 0.51, -0.09]} \ No newline at end of file diff --git a/annotations_1/rlaRlCFXUqk_filtered.json b/annotations_1/rlaRlCFXUqk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..709eaa661c602afe8cdb0333e22b13bc69b1ff77 --- /dev/null +++ b/annotations_1/rlaRlCFXUqk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.62], [6.0, 6.07], [7.0, 8.07], [9.0, 14.08], [15.0, 15.03], [17.0, 18.42], [19.0, 20.02], [21.0, 28.71], [31.0, 31.11], [37.0, 36.69], [43.0, 44.49], [54.0, 55.14], [56.0, 57.1], [67.0, 67.2], [76.0, 77.11], [81.0, 80.92], [81.0, 88.8], [91.0, 91.1], [92.0, 94.61], [99.0, 103.76], [107.0, 108.11], [113.0, 116.16], [121.0, 121.91], [133.0, 133.71], [140.0, 142.97], [145.0, 145.37], [147.0, 147.7], [151.0, 151.82], [155.0, 156.83], [158.0, 159.27], [163.0, 163.0], [166.0, 167.16], [171.0, 172.59]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.54, 0.0, 0.0, 0.0, 49.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.26, 0.0, 65.2, 45.92, 0.0, 49.18, 0.0, 0.0, 66.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 19.79], ["hum", 7.49], ["mains hum", 5.55]], null, null, null, [["hum", 26.06], ["music", 19.06], ["rumble", 18.96]], null, null, null, null, null, null, null, null, [["mains hum", 38.56], ["hum", 31.08], ["speech", 10.8]], null, null, [["music", 44.58], ["electronic music", 10.38], ["gong", 9.96]], null, [["music", 31.05], ["sonar", 9.21], ["ambient music", 7.24]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.07, 1.07, 5.08, 0.03, 1.42, 1.02, 7.71, 0.11, -0.31, 1.49, 1.14, 1.1, 0.2, 1.11, -0.08, 7.8, 0.1, 2.61, 4.76, 1.11, 3.16, 0.91, 0.71, 2.97, 0.37, 0.7, 0.82, 1.83, 1.27, 0.0, 1.16, 1.59]} \ No newline at end of file diff --git a/annotations_1/rmE6nTzmDqI_filtered.json b/annotations_1/rmE6nTzmDqI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28c48cc68b5e71b544465b388dca07d3c1d832a4 --- /dev/null +++ b/annotations_1/rmE6nTzmDqI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 8.48], [11.0, 12.21], [16.0, 16.34], [21.0, 22.22], [25.0, 25.29], [27.0, 28.56], [32.0, 32.63], [37.0, 37.83], [39.0, 69.35], [70.0, 73.08], [74.0, 80.45], [81.0, 87.94], [89.0, 101.65], [104.0, 103.91], [105.0, 105.6], [107.0, 108.8], [110.0, 112.92], [118.0, 119.53], [123.0, 124.7], [126.0, 128.56], [130.0, 139.38], [141.0, 143.83], [145.0, 145.77], [146.0, 149.89], [150.0, 156.17], [160.0, 163.27], [166.0, 166.14], [168.0, 169.45], [171.0, 178.82]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.51, 39.54, 36.62, 47.27, 0.0, 0.0, 0.0, 64.07, 0.0, 0.0, 93.76, 47.54, 75.72, 0.0, 51.66, 54.63, 87.55, 0.0, 0.0, 85.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 29.08], ["synthesizer", 11.46], ["speech", 6.4]], [["music", 23.19], ["synthesizer", 16.03], ["hum", 9.72]], [["music", 30.74], ["hum", 16.56], ["synthesizer", 10.25]], [["speech", 24.52], ["music", 18.94], ["mains hum", 17.2]], null, null, null, null, null, null, null, [["speech", 27.66], ["mains hum", 25.63], ["hum", 14.03]], null, null, null, null, null, null, null, null], "duration": [3.48, 1.21, 0.34, 1.22, 0.29, 1.56, 0.63, 0.83, 30.35, 3.08, 6.45, 6.94, 12.65, -0.09, 0.6, 1.8, 2.92, 1.53, 1.7, 2.56, 9.38, 2.83, 0.77, 3.89, 6.17, 3.27, 0.14, 1.45, 7.82]} \ No newline at end of file diff --git a/annotations_1/rmpFmJfEZXs_filtered.json b/annotations_1/rmpFmJfEZXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e613c599b6357b000c1996d76facac3076fb1de --- /dev/null +++ b/annotations_1/rmpFmJfEZXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 46.43], [46.0, 47.95], [65.0, 69.11], [69.0, 70.04], [71.0, 71.44], [74.0, 74.56], [75.0, 77.57], [81.0, 81.24], [85.0, 85.24], [86.0, 86.59], [89.0, 89.13], [90.0, 89.87], [107.0, 107.87], [111.0, 121.2], [139.0, 139.38], [140.0, 144.91], [181.0, 187.69], [190.0, 194.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [66.76, 0.0, 88.1, 0.0, 0.0, 0.0, 99.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.83, 0.0, 43.9, 38.11, 33.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.08], ["whack, thwack", 10.52], ["hammer", 8.84]], null, [["music", 66.68], ["didgeridoo", 8.57], ["musical instrument", 6.08]], [["speech", 31.91], ["music", 30.03], ["crushing", 13.91]], [["fly, housefly", 39.02], ["music", 21.21], ["mosquito", 14.93]]], "duration": [2.43, 1.95, 4.11, 1.04, 0.44, 0.56, 2.57, 0.24, 0.24, 0.59, 0.13, -0.13, 0.87, 10.2, 0.38, 4.91, 6.69, 4.66]} \ No newline at end of file diff --git a/annotations_1/rnaCi4rBfqw_filtered.json b/annotations_1/rnaCi4rBfqw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d28e6859714c6c7f66f9ba8bf0f97c0f6e3d4e07 --- /dev/null +++ b/annotations_1/rnaCi4rBfqw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.7], [18.0, 18.67], [21.0, 22.0], [22.0, 23.41], [24.0, 24.73], [27.0, 27.6], [35.0, 36.21], [37.0, 37.71], [43.0, 43.19], [43.0, 45.62], [48.0, 48.91], [50.0, 62.58], [65.0, 103.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.15, 0.0, 33.5, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 55.78], ["trombone", 14.21], ["brass instrument", 9.45]], null, [["music", 68.89], ["musical instrument", 7.66], ["effects unit", 2.4]], null], "duration": [0.7, 0.67, 1.0, 1.41, 0.73, 0.6, 1.21, 0.71, 0.19, 2.62, 0.91, 12.58, 38.5]} \ No newline at end of file diff --git a/annotations_1/roLboEc4M-w_filtered.json b/annotations_1/roLboEc4M-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..62b5c3c33709c26f73dc94f3525c65a3dd13c076 --- /dev/null +++ b/annotations_1/roLboEc4M-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.84], [9.0, 9.54], [12.0, 13.46], [14.0, 14.25], [14.0, 14.52], [15.0, 14.61], [18.0, 19.38], [28.0, 33.2], [34.0, 36.37], [37.0, 38.31], [40.0, 41.82], [43.0, 44.22], [45.0, 47.06], [52.0, 53.42], [55.0, 56.0], [64.0, 64.35], [67.0, 68.34], [73.0, 73.63], [76.0, 76.38], [77.0, 79.88], [83.0, 83.22], [84.0, 84.82], [86.0, 88.87], [92.0, 92.52], [95.0, 102.32], [105.0, 106.1], [108.0, 109.76], [111.0, 111.4], [113.0, 113.24], [115.0, 115.25], [116.0, 116.8], [119.0, 124.28], [125.0, 126.01], [128.0, 128.61], [129.0, 129.76], [132.0, 133.68], [136.0, 137.46], [138.0, 144.24], [150.0, 151.66], [153.0, 153.91], [160.0, 161.49], [162.0, 163.31], [164.0, 165.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.82, 76.53, 0.0, 0.0, 0.0, 48.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.39, 0.0, 0.0, 47.12, 0.0, 49.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.84], ["hum", 11.08], ["whale vocalization", 8.36]], null, null, null, null, null, null, null, null, null, [["speech", 29.4], ["music", 25.6], ["hum", 4.96]], null, [["music", 54.85], ["hum", 7.71], ["mains hum", 7.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 0.54, 1.46, 0.25, 0.52, -0.39, 1.38, 5.2, 2.37, 1.31, 1.82, 1.22, 2.06, 1.42, 1.0, 0.35, 1.34, 0.63, 0.38, 2.88, 0.22, 0.82, 2.87, 0.52, 7.32, 1.1, 1.76, 0.4, 0.24, 0.25, 0.8, 5.28, 1.01, 0.61, 0.76, 1.68, 1.46, 6.24, 1.66, 0.91, 1.49, 1.31, 1.52]} \ No newline at end of file diff --git a/annotations_1/roST4TM0ccM_filtered.json b/annotations_1/roST4TM0ccM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5398246235d982e2ab0f68faf99b4a57377e035c --- /dev/null +++ b/annotations_1/roST4TM0ccM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.48], [0.0, 1.09], [2.0, 8.43], [9.0, 13.76], [14.0, 14.5], [15.0, 16.07], [17.0, 35.38], [38.0, 37.81], [40.0, 45.17], [54.0, 56.24], [57.0, 57.1], [58.0, 57.96], [65.0, 65.64], [67.0, 73.92], [77.0, 93.21], [99.0, 108.82], [112.0, 112.14], [114.0, 114.0], [115.0, 132.29], [135.0, 136.11], [136.0, 136.95], [139.0, 153.81], [157.0, 157.27], [158.0, 162.3], [163.0, 171.31], [183.0, 193.94]], "keep_status": [false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false], "silence_prob": [0.0, 0.0, 35.58, 38.35, 0.0, 0.0, 35.68, 0.0, 30.23, 68.8, 0.0, 0.0, 0.0, 40.77, 31.1, 31.45, 0.0, 0.0, 29.19, 0.0, 0.0, 30.43, 0.0, 35.39, 44.55, 51.66], "audiomae_on_audioset": [null, null, [["speech", 17.14], ["livestock, farm animals, working animals", 14.84], ["moo", 12.4]], [["fire", 19.25], ["speech", 12.85], ["rain", 10.11]], null, null, [["music", 30.12], ["speech", 25.34], ["theremin", 15.81]], null, [["speech", 25.41], ["music", 17.4], ["livestock, farm animals, working animals", 5.37]], null, null, null, null, [["throbbing", 34.13], ["hum", 27.63], ["mains hum", 11.46]], [["music", 55.81], ["fart", 7.92], ["groan", 7.91]], [["music", 55.93], ["speech", 18.68], ["throbbing", 4.42]], null, null, [["music", 37.9], ["speech", 27.92], ["whack, thwack", 8.34]], null, null, [["music", 57.27], ["sidetone", 2.88], ["speech", 2.87]], null, [["speech", 37.13], ["music", 22.16], ["noise", 6.26]], [["hum", 35.54], ["mains hum", 17.89], ["music", 15.31]], null], "duration": [0.48, 1.09, 6.43, 4.76, 0.5, 1.07, 18.38, -0.19, 5.17, 2.24, 0.1, -0.04, 0.64, 6.92, 16.21, 9.82, 0.14, 0.0, 17.29, 1.11, 0.95, 14.81, 0.27, 4.3, 8.31, 10.94]} \ No newline at end of file diff --git a/annotations_1/rpPm4pAJQbc_filtered.json b/annotations_1/rpPm4pAJQbc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83e2b4ca1e669867ccfa799871290e3c825c9b47 --- /dev/null +++ b/annotations_1/rpPm4pAJQbc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 24.66], [46.0, 45.66], [46.0, 46.84], [66.0, 66.26], [79.0, 79.2], [79.0, 79.27], [79.0, 79.39], [87.0, 86.71], [89.0, 89.45], [99.0, 99.25]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [28.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 52.05], ["trombone", 13.73], ["musical instrument", 2.66]], null, null, null, null, null, null, null, null, null], "duration": [13.66, -0.34, 0.84, 0.26, 0.2, 0.27, 0.39, -0.29, 0.45, 0.25]} \ No newline at end of file diff --git a/annotations_1/rpqgDDBcmcI_filtered.json b/annotations_1/rpqgDDBcmcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12a3c2106328d982d207deec6dd1704a4df221df --- /dev/null +++ b/annotations_1/rpqgDDBcmcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.33], [6.0, 6.3], [16.0, 22.62], [24.0, 24.66], [26.0, 26.18], [27.0, 36.98], [40.0, 41.49], [42.0, 79.12], [79.0, 79.64], [91.0, 94.83], [95.0, 99.4], [101.0, 111.2], [112.0, 112.89], [116.0, 118.08], [119.0, 128.9], [129.0, 131.95], [133.0, 133.14], [141.0, 160.41], [161.0, 161.3]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, false, false, true, false, false, false, false], "silence_prob": [36.33, 0.0, 29.0, 0.0, 0.0, 29.11, 0.0, 0.0, 0.0, 31.33, 31.41, 29.99, 0.0, 28.99, 29.27, 28.73, 0.0, 29.78, 0.0], "audiomae_on_audioset": [[["music", 50.97], ["throbbing", 18.91], ["hum", 11.56]], null, [["music", 52.95], ["speech", 9.14], ["throbbing", 8.65]], null, null, [["music", 57.68], ["throbbing", 7.67], ["electronic music", 5.97]], null, null, null, [["music", 48.32], ["hum", 8.0], ["throbbing", 5.96]], [["music", 36.18], ["throbbing", 12.82], ["hum", 10.2]], [["speech", 38.29], ["hum", 12.26], ["mains hum", 9.1]], null, [["music", 75.47], ["throbbing", 2.15], ["cacophony", 1.97]], [["vehicle", 34.67], ["car", 16.92], ["music", 16.54]], [["music", 63.03], ["electronic music", 4.24], ["hum", 3.29]], null, [["hum", 42.17], ["throbbing", 16.1], ["mains hum", 12.93]], null], "duration": [3.33, 0.3, 6.62, 0.66, 0.18, 9.98, 1.49, 37.12, 0.64, 3.83, 4.4, 10.2, 0.89, 2.08, 9.9, 2.95, 0.14, 19.41, 0.3]} \ No newline at end of file diff --git a/annotations_1/rpy7vhvX8jw_filtered.json b/annotations_1/rpy7vhvX8jw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7405725b12817c190c4de45871afc71307d7b6cc --- /dev/null +++ b/annotations_1/rpy7vhvX8jw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.61], [7.0, 7.62], [11.0, 11.8], [14.0, 16.33], [18.0, 20.02], [23.0, 24.76], [26.0, 28.56], [31.0, 31.7], [33.0, 35.11], [36.0, 38.06], [41.0, 42.21], [48.0, 51.7], [53.0, 53.94], [58.0, 61.8], [63.0, 63.91], [67.0, 67.93], [69.0, 68.96], [72.0, 76.45], [79.0, 79.0], [82.0, 84.1], [88.0, 88.21], [91.0, 93.18], [94.0, 94.73], [99.0, 100.45], [104.0, 104.18], [104.0, 104.62], [109.0, 110.91], [113.0, 122.18], [123.0, 124.53], [125.0, 128.55], [129.0, 133.64], [136.0, 138.4], [140.0, 140.61], [142.0, 141.84], [144.0, 147.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.16, 89.36, 0.0, 95.23, 0.0, 86.09, 79.94, 0.0, 98.99, 0.0, 68.41, 0.0, 0.0, 0.0, 99.97, 0.0, 97.64, 0.0, 99.16, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 88.64, 99.91, 0.0, 0.0, 96.54], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.61, 0.62, 0.8, 2.33, 2.02, 1.76, 2.56, 0.7, 2.11, 2.06, 1.21, 3.7, 0.94, 3.8, 0.91, 0.93, -0.04, 4.45, 0.0, 2.1, 0.21, 2.18, 0.73, 1.45, 0.18, 0.62, 1.91, 9.18, 1.53, 3.55, 4.64, 2.4, 0.61, -0.16, 3.24]} \ No newline at end of file diff --git a/annotations_1/rqKaJ4Yp_oU_filtered.json b/annotations_1/rqKaJ4Yp_oU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa37dd148f00cf33f39bced5aaaf6c8c7c8cb345 --- /dev/null +++ b/annotations_1/rqKaJ4Yp_oU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.41], [14.0, 14.35], [17.0, 16.85], [18.0, 19.99], [21.0, 22.54], [23.0, 24.63], [25.0, 32.78], [34.0, 53.84], [57.0, 88.67], [89.0, 89.5], [90.0, 91.57], [92.0, 93.04], [96.0, 96.87], [104.0, 111.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.37, 0.0, 0.0, 0.0, 0.0, 0.0, 78.72, 36.25, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 83.94], ["musical instrument", 1.63], ["fart", 1.36]], null, null, null, null, null, null], "duration": [3.41, 0.35, -0.15, 1.99, 1.54, 1.63, 7.78, 19.84, 31.67, 0.5, 1.57, 1.04, 0.87, 7.92]} \ No newline at end of file diff --git a/annotations_1/rqdEaDM2PWM_filtered.json b/annotations_1/rqdEaDM2PWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c12fd68262e7c609ea14d7e405d4930704af7ba --- /dev/null +++ b/annotations_1/rqdEaDM2PWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.63], [18.0, 41.96], [43.0, 44.34], [44.0, 45.71], [48.0, 52.54], [54.0, 62.46], [63.0, 64.44], [66.0, 77.55], [82.0, 83.17], [90.0, 93.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.31, 0.0, 0.0, 97.54, 54.63, 0.0, 64.75, 0.0, 99.82], "audiomae_on_audioset": [null, [["music", 60.75], ["sidetone", 21.58], ["thunk", 3.84]], null, null, null, null, null, null, null, null], "duration": [0.63, 23.96, 1.34, 1.71, 4.54, 8.46, 1.44, 11.55, 1.17, 3.77]} \ No newline at end of file diff --git a/annotations_1/rrMvGHoW7aw_filtered.json b/annotations_1/rrMvGHoW7aw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9a77a0f61cfeac108d82299279d7b83be9878ec --- /dev/null +++ b/annotations_1/rrMvGHoW7aw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 8.88], [12.0, 12.66], [46.0, 46.36], [47.0, 47.16], [67.0, 67.47], [71.0, 71.32], [106.0, 106.68], [109.0, 109.34], [133.0, 133.51], [136.0, 136.56], [146.0, 149.12], [150.0, 151.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.7, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.12, 0.66, 0.36, 0.16, 0.47, 0.32, 0.68, 0.34, 0.51, 0.56, 3.12, 1.31]} \ No newline at end of file diff --git a/annotations_1/rrWLFKZafAc_filtered.json b/annotations_1/rrWLFKZafAc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f257af3f3a26be2309b0a677096a95de4d11adc8 --- /dev/null +++ b/annotations_1/rrWLFKZafAc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 67.15], [68.0, 89.85], [91.0, 91.56], [93.0, 93.72], [97.0, 98.0], [99.0, 100.87], [103.0, 102.95], [116.0, 116.24]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 43.93], ["speech", 20.15], ["throbbing", 8.12]], null, null, null, null, null, null], "duration": [62.15, 21.85, 0.56, 0.72, 1.0, 1.87, -0.05, 0.24]} \ No newline at end of file diff --git a/annotations_1/rsi2WcPIcQ0_filtered.json b/annotations_1/rsi2WcPIcQ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19159bb357689b8d114da24c54523b8382864e2e --- /dev/null +++ b/annotations_1/rsi2WcPIcQ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.83], [8.0, 10.22], [11.0, 13.81], [18.0, 21.27], [23.0, 25.95], [26.0, 26.87], [27.0, 28.88], [30.0, 31.26], [32.0, 32.54], [33.0, 34.05], [34.0, 42.11], [43.0, 45.47], [49.0, 50.25], [53.0, 54.87], [61.0, 61.35], [62.0, 62.24], [63.0, 63.96], [69.0, 70.82], [71.0, 71.54], [73.0, 73.84], [93.0, 93.72], [96.0, 95.86], [112.0, 129.36], [130.0, 131.38], [133.0, 134.1], [136.0, 138.75], [140.0, 141.56], [143.0, 151.95], [153.0, 155.76], [157.0, 158.13], [160.0, 164.91], [166.0, 169.48], [174.0, 175.14]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 99.95, 35.26, 100.0, 56.1, 0.0, 0.0, 0.0, 0.0, 0.0, 53.91, 56.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.26, 0.0, 0.0, 44.34, 0.0, 33.29, 35.63, 0.0, 31.09, 100.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 58.72], ["hum", 5.28], ["music", 3.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 50.01], ["drum", 11.69], ["percussion", 6.44]], null, null, [["music", 65.25], ["electronic music", 6.16], ["synthesizer", 5.66]], null, [["music", 75.13], ["speech", 5.63], ["throbbing", 3.36]], [["music", 63.03], ["throbbing", 13.22], ["electronic music", 3.86]], null, [["music", 46.86], ["whack, thwack", 15.3], ["thunk", 5.47]], null, null], "duration": [-0.17, 2.22, 2.81, 3.27, 2.95, 0.87, 1.88, 1.26, 0.54, 1.05, 8.11, 2.47, 1.25, 1.87, 0.35, 0.24, 0.96, 1.82, 0.54, 0.84, 0.72, -0.14, 17.36, 1.38, 1.1, 2.75, 1.56, 8.95, 2.76, 1.13, 4.91, 3.48, 1.14]} \ No newline at end of file diff --git a/annotations_1/rsktGDtzKhg_filtered.json b/annotations_1/rsktGDtzKhg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b93de1f58be9c2f815256867cab91b837c1a17c1 --- /dev/null +++ b/annotations_1/rsktGDtzKhg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.16], [31.0, 35.29], [35.0, 38.23], [38.0, 40.15], [56.0, 57.54], [70.0, 73.89], [98.0, 101.9], [123.0, 124.04], [130.0, 131.3], [136.0, 136.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [72.16, 35.13, 32.57, 32.5, 0.0, 31.15, 32.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 69.28], ["musical instrument", 1.66], ["guitar", 1.55]], [["music", 68.56], ["funny music", 8.03], ["singing", 4.47]], [["music", 80.2], ["reggae", 1.44], ["funny music", 1.16]], null, [["music", 78.04], ["swing music", 12.92], ["funny music", 2.05]], [["music", 61.92], ["musical instrument", 5.49], ["drum machine", 4.82]], null, null, null], "duration": [5.16, 4.29, 3.23, 2.15, 1.54, 3.89, 3.9, 1.04, 1.3, 0.73]} \ No newline at end of file diff --git a/annotations_1/rsnLwzzkF_Q_filtered.json b/annotations_1/rsnLwzzkF_Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a2ec11656e510edd952eb50db78676295c23674 --- /dev/null +++ b/annotations_1/rsnLwzzkF_Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.66], [3.0, 3.15], [5.0, 11.74], [18.0, 19.06], [23.0, 51.95], [55.0, 55.59], [66.0, 69.3], [70.0, 70.09], [71.0, 70.61], [71.0, 82.05], [83.0, 144.19]], "keep_status": [false, false, true, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 40.14, 0.0, 28.98, 0.0, 29.15, 0.0, 0.0, 28.53, 0.0], "audiomae_on_audioset": [null, null, [["music", 41.39], ["hum", 18.45], ["synthesizer", 7.18]], null, [["music", 32.33], ["frog", 21.89], ["croak", 5.06]], null, [["music", 33.02], ["roar", 19.01], ["livestock, farm animals, working animals", 3.86]], null, null, [["music", 45.15], ["smash, crash", 12.15], ["whack, thwack", 7.84]], null], "duration": [1.66, 0.15, 6.74, 1.06, 28.95, 0.59, 3.3, 0.09, -0.39, 11.05, 61.19]} \ No newline at end of file diff --git a/annotations_1/rsuNowyCF0c_filtered.json b/annotations_1/rsuNowyCF0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee2f3717b29f9ac8e561b5c181d1e3233fb5a866 --- /dev/null +++ b/annotations_1/rsuNowyCF0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.13], [6.0, 8.33], [11.0, 11.08], [12.0, 14.1], [15.0, 16.41], [16.0, 20.12], [26.0, 31.63], [35.0, 35.43], [37.0, 37.74], [38.0, 39.01], [40.0, 42.63], [44.0, 76.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 80.64, 0.0, 71.0, 0.0, 34.79, 39.25, 0.0, 0.0, 0.0, 42.84, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 36.14], ["music", 27.38], ["hum", 13.24]], [["music", 49.28], ["speech", 22.12], ["electronic music", 6.97]], null, null, null, [["music", 59.26], ["throbbing", 7.61], ["electronic music", 5.64]], null], "duration": [0.13, 2.33, 0.08, 2.1, 1.41, 4.12, 5.63, 0.43, 0.74, 1.01, 2.63, 32.84]} \ No newline at end of file diff --git a/annotations_1/rt3FEbzjM3o_filtered.json b/annotations_1/rt3FEbzjM3o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf9797a2ad4f2fd3d4ab9888fe6d772c7b52cce4 --- /dev/null +++ b/annotations_1/rt3FEbzjM3o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.1], [8.0, 9.31], [10.0, 12.97], [14.0, 16.53], [19.0, 32.61], [34.0, 33.83], [35.0, 38.31], [39.0, 40.19], [40.0, 57.23], [59.0, 60.56], [62.0, 63.21], [65.0, 65.48], [75.0, 76.82], [78.0, 79.68], [82.0, 87.47], [90.0, 96.94], [98.0, 104.63], [106.0, 108.62], [109.0, 113.66], [119.0, 129.03]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, true, true, true], "silence_prob": [56.03, 0.0, 72.16, 91.47, 36.09, 0.0, 64.75, 0.0, 51.39, 0.0, 0.0, 0.0, 0.0, 0.0, 42.58, 96.17, 72.9, 46.64, 39.4, 36.48], "audiomae_on_audioset": [null, null, null, null, [["hum", 30.87], ["music", 14.74], ["throbbing", 14.37]], null, null, null, null, null, null, null, null, null, [["music", 41.54], ["synthesizer", 9.29], ["ambient music", 7.65]], null, null, [["music", 32.9], ["hum", 9.16], ["didgeridoo", 7.42]], [["music", 41.51], ["hum", 6.29], ["throbbing", 6.06]], [["sine wave", 33.39], ["music", 16.27], ["sidetone", 7.09]]], "duration": [4.1, 1.31, 2.97, 2.53, 13.61, -0.17, 3.31, 1.19, 17.23, 1.56, 1.21, 0.48, 1.82, 1.68, 5.47, 6.94, 6.63, 2.62, 4.66, 10.03]} \ No newline at end of file diff --git a/annotations_1/rtYKhaQStZE_filtered.json b/annotations_1/rtYKhaQStZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84bbc44d5ca2b31da0c740b6628a239a2f586090 --- /dev/null +++ b/annotations_1/rtYKhaQStZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 20.87], [22.0, 22.52], [23.0, 24.21], [27.0, 27.55], [34.0, 34.57], [35.0, 35.87], [37.0, 38.04], [39.0, 40.2], [44.0, 44.05], [46.0, 46.25], [49.0, 49.01], [53.0, 57.91], [60.0, 63.19], [65.0, 65.06], [68.0, 69.25], [71.0, 72.1], [77.0, 78.06], [79.0, 79.54], [88.0, 88.43], [94.0, 100.87], [102.0, 102.74], [104.0, 105.29], [116.0, 115.97], [117.0, 117.73], [119.0, 119.97], [122.0, 123.65], [125.0, 128.9], [133.0, 133.78], [134.0, 134.99], [136.0, 137.19], [138.0, 139.58], [143.0, 143.75], [145.0, 147.56], [148.0, 148.91], [150.0, 150.63], [154.0, 156.69], [160.0, 162.48], [167.0, 168.91]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.36, 38.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 52.33, 0.0, 0.0, 42.67, 38.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 45.55], ["music", 25.03], ["hum", 20.16]], [["throbbing", 21.68], ["hum", 21.49], ["mains hum", 13.47]], null, null, null, null, null, null, [["hum", 43.98], ["mains hum", 16.19], ["buzz", 13.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.44], ["hum", 13.78], ["throbbing", 5.44]], [["hum", 38.31], ["throbbing", 14.03], ["music", 10.43]], null], "duration": [-0.13, 0.52, 1.21, 0.55, 0.57, 0.87, 1.04, 1.2, 0.05, 0.25, 0.01, 4.91, 3.19, 0.06, 1.25, 1.1, 1.06, 0.54, 0.43, 6.87, 0.74, 1.29, -0.03, 0.73, 0.97, 1.65, 3.9, 0.78, 0.99, 1.19, 1.58, 0.75, 2.56, 0.91, 0.63, 2.69, 2.48, 1.91]} \ No newline at end of file diff --git a/annotations_1/rtn4-lDSB80_filtered.json b/annotations_1/rtn4-lDSB80_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d39dad5d6f717d795e60054a228241f82e32135f --- /dev/null +++ b/annotations_1/rtn4-lDSB80_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 21.56], [24.0, 59.68], [60.0, 106.34]], "keep_status": [false, false, false], "silence_prob": [61.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [7.56, 35.68, 46.34]} \ No newline at end of file diff --git a/annotations_1/ruCFlIoCpJ8_filtered.json b/annotations_1/ruCFlIoCpJ8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd9aeec8887d80f9b832c986188d53b830715115 --- /dev/null +++ b/annotations_1/ruCFlIoCpJ8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [5.0, 9.14], [11.0, 12.11], [14.0, 19.23], [20.0, 21.1], [24.0, 24.68], [25.0, 25.86], [36.0, 37.44], [40.0, 41.0], [43.0, 45.27], [47.0, 49.55], [56.0, 55.86], [58.0, 58.41], [60.0, 60.96], [66.0, 66.43], [67.0, 67.81], [71.0, 76.42], [78.0, 80.16], [87.0, 87.66], [90.0, 91.39], [98.0, 103.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 74.76, 0.0, 75.39, 0.0, 0.0, 0.0, 0.0, 0.0, 51.34, 44.9, 0.0, 0.0, 0.0, 0.0, 0.0, 45.08, 62.17, 0.0, 0.0, 30.68], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 24.83], ["snicker", 6.79], ["fart", 6.38]], null, null, null, null, null, [["burping, eructation", 47.67], ["speech", 12.11], ["sidetone", 6.1]], null, null, null, [["speech", 80.78], ["whack, thwack", 5.39], ["burst, pop", 1.99]]], "duration": [0.45, 4.14, 1.11, 5.23, 1.1, 0.68, 0.86, 1.44, 1.0, 2.27, 2.55, -0.14, 0.41, 0.96, 0.43, 0.81, 5.42, 2.16, 0.66, 1.39, 5.69]} \ No newline at end of file diff --git a/annotations_1/ruwbVFvdfco_filtered.json b/annotations_1/ruwbVFvdfco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc1559363584897d6bb790adc08d4f34df288250 --- /dev/null +++ b/annotations_1/ruwbVFvdfco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 20.22], [23.0, 26.65], [36.0, 37.57], [40.0, 42.55], [55.0, 58.55], [62.0, 64.52], [73.0, 73.08], [74.0, 74.29], [76.0, 81.35], [82.0, 99.45], [102.0, 102.27], [104.0, 104.77], [106.0, 106.3], [108.0, 108.82], [110.0, 110.24], [111.0, 112.92], [116.0, 119.15], [123.0, 124.12], [125.0, 125.71], [128.0, 133.93], [137.0, 137.42], [139.0, 142.84]], "keep_status": [false, true, false, false, true, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.23, 29.08, 0.0, 42.91, 30.14, 29.53, 0.0, 0.0, 30.91, 28.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.25, 0.0, 0.0, 67.51, 0.0, 87.74], "audiomae_on_audioset": [[["mains hum", 39.9], ["hum", 34.89], ["music", 6.93]], [["speech", 48.73], ["sidetone", 8.95], ["music", 5.48]], null, [["music", 58.17], ["throbbing", 10.48], ["hum", 9.36]], [["hum", 26.05], ["mains hum", 25.28], ["music", 6.92]], [["mains hum", 28.64], ["hum", 24.69], ["music", 16.66]], null, null, [["music", 56.39], ["train horn", 4.32], ["hum", 3.89]], [["hum", 32.82], ["music", 19.8], ["mains hum", 19.39]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.22, 3.65, 1.57, 2.55, 3.55, 2.52, 0.08, 0.29, 5.35, 17.45, 0.27, 0.77, 0.3, 0.82, 0.24, 1.92, 3.15, 1.12, 0.71, 5.93, 0.42, 3.84]} \ No newline at end of file diff --git a/annotations_1/rvOq4hFIRJg_filtered.json b/annotations_1/rvOq4hFIRJg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b53822cd2cb6a2530bf602a3f4aa10e10efb698 --- /dev/null +++ b/annotations_1/rvOq4hFIRJg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.01], [9.0, 10.05], [12.0, 12.51], [20.0, 20.53], [21.0, 46.77], [48.0, 49.99], [51.0, 53.0], [53.0, 61.48], [63.0, 70.58], [86.0, 86.14], [96.0, 100.58], [106.0, 107.43], [113.0, 113.24], [123.0, 123.84], [126.0, 127.52], [130.0, 130.33], [131.0, 132.19], [133.0, 133.69], [137.0, 137.89], [138.0, 140.09], [156.0, 156.81], [158.0, 159.66], [161.0, 165.15], [183.0, 183.64], [184.0, 184.71]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.34, 0.0, 98.93, 88.64, 29.77, 0.0, 29.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.83, 0.0, 0.0, 45.36, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 12.61], ["burst, pop", 9.45], ["explosion", 7.9]], null, null, null, [["sonar", 30.97], ["music", 14.57], ["rumble", 8.12]], null, [["hum", 40.98], ["mains hum", 25.96], ["throbbing", 21.18]], null, null, null, null, null, null, null, null, [["speech", 36.58], ["music", 28.61], ["insect", 4.61]], null, null, [["mains hum", 18.12], ["hum", 14.72], ["gasp", 9.31]], null, null], "duration": [1.01, 1.05, 0.51, 0.53, 25.77, 1.99, 2.0, 8.48, 7.58, 0.14, 4.58, 1.43, 0.24, 0.84, 1.52, 0.33, 1.19, 0.69, 0.89, 2.09, 0.81, 1.66, 4.15, 0.64, 0.71]} \ No newline at end of file diff --git a/annotations_1/rvQZ6MdHSEk_filtered.json b/annotations_1/rvQZ6MdHSEk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce319c45c956ba7033c7f8440b0717198bc9e774 --- /dev/null +++ b/annotations_1/rvQZ6MdHSEk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.61], [16.0, 17.15], [19.0, 53.42], [54.0, 61.33], [63.0, 63.69], [65.0, 64.79], [65.0, 67.36], [73.0, 82.83], [86.0, 87.69], [91.0, 91.27], [93.0, 93.34]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.57, 0.0, 0.0, 34.22, 30.02, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 29.21], ["throbbing", 21.75], ["speech", 18.02]], null, null, [["music", 47.61], ["dubstep", 5.14], ["electronic music", 4.21]], [["speech", 43.71], ["music", 23.85], ["sidetone", 7.35]], null, null, null], "duration": [1.61, 1.15, 34.42, 7.33, 0.69, -0.21, 2.36, 9.83, 1.69, 0.27, 0.34]} \ No newline at end of file diff --git a/annotations_1/rvqm61CcOLo_filtered.json b/annotations_1/rvqm61CcOLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6dfebefd02234e13ced301cdfaff6e27262522e5 --- /dev/null +++ b/annotations_1/rvqm61CcOLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.14], [16.0, 17.51], [18.0, 21.73], [23.0, 24.22], [27.0, 40.29], [42.0, 115.06], [119.0, 158.92]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [51.28, 0.0, 51.39, 0.0, 39.24, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 76.01], ["scary music", 6.2], ["hum", 3.57]], null, null], "duration": [4.14, 1.51, 3.73, 1.22, 13.29, 73.06, 39.92]} \ No newline at end of file diff --git a/annotations_1/rwDDgGuCVS0_filtered.json b/annotations_1/rwDDgGuCVS0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/rwDDgGuCVS0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/rwr1IzFzjqA_filtered.json b/annotations_1/rwr1IzFzjqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eb358cb9ed9467b7b2914d2dd9f3de4349cfad7 --- /dev/null +++ b/annotations_1/rwr1IzFzjqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.89], [7.0, 8.46], [13.0, 13.49], [14.0, 14.94], [16.0, 16.31], [27.0, 27.82], [30.0, 31.41], [34.0, 34.2], [37.0, 36.95], [43.0, 45.96], [49.0, 49.67], [55.0, 55.58], [57.0, 57.59], [68.0, 67.86], [78.0, 80.89], [82.0, 82.75], [85.0, 85.7], [92.0, 92.3], [93.0, 93.85], [98.0, 97.93], [102.0, 103.42], [104.0, 103.94], [105.0, 105.43], [106.0, 106.07], [112.0, 111.82], [113.0, 113.86], [114.0, 114.62], [115.0, 115.53], [117.0, 117.31], [118.0, 118.03], [130.0, 130.71]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 1.46, 0.49, 0.94, 0.31, 0.82, 1.41, 0.2, -0.05, 2.96, 0.67, 0.58, 0.59, -0.14, 2.89, 0.75, 0.7, 0.3, 0.85, -0.07, 1.42, -0.06, 0.43, 0.07, -0.18, 0.86, 0.62, 0.53, 0.31, 0.03, 0.71]} \ No newline at end of file diff --git a/annotations_1/rx4sKoITt-Q_filtered.json b/annotations_1/rx4sKoITt-Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc4c2cf0dc7ac804d4fb8eac9c48bebd44a553e6 --- /dev/null +++ b/annotations_1/rx4sKoITt-Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.56], [6.0, 7.23], [19.0, 20.85], [25.0, 25.69], [33.0, 33.12], [34.0, 34.23], [35.0, 36.61], [38.0, 37.61], [42.0, 42.58], [44.0, 44.02], [50.0, 49.71], [51.0, 52.03], [54.0, 55.7], [65.0, 70.33], [73.0, 80.91], [81.0, 81.01], [81.0, 84.69], [86.0, 86.83], [89.0, 90.81], [93.0, 97.93], [104.0, 105.51], [109.0, 109.81], [112.0, 114.2], [119.0, 120.8], [127.0, 129.22], [133.0, 135.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 87.19, 0.0, 55.89, 0.0, 0.0, 100.0, 0.0, 0.0, 99.76, 0.0, 90.95, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 1.23, 1.85, 0.69, 0.12, 0.23, 1.61, -0.39, 0.58, 0.02, -0.29, 1.03, 1.7, 5.33, 7.91, 0.01, 3.69, 0.83, 1.81, 4.93, 1.51, 0.81, 2.2, 1.8, 2.22, 2.78]} \ No newline at end of file diff --git a/annotations_1/rxC2ZWU4IPo_filtered.json b/annotations_1/rxC2ZWU4IPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3580a8ff363a5a51c708034a0b8aac3323931daf --- /dev/null +++ b/annotations_1/rxC2ZWU4IPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.02], [14.0, 14.12], [15.0, 16.48], [22.0, 23.89], [25.0, 29.94], [52.0, 53.87], [60.0, 60.64], [65.0, 65.62], [67.0, 68.94], [73.0, 72.94], [74.0, 74.19], [76.0, 80.96], [86.0, 85.78], [89.0, 89.46], [90.0, 90.78], [92.0, 95.32], [98.0, 100.3], [109.0, 109.53], [110.0, 111.23], [112.0, 113.44], [129.0, 134.16], [135.0, 135.65], [140.0, 141.45], [145.0, 146.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 45.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.76, 0.0, 0.0, 0.0, 77.87, 98.1, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["boing", 96.4], ["speech", 1.71], ["music", 0.72]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.02, 0.12, 1.48, 1.89, 4.94, 1.87, 0.64, 0.62, 1.94, -0.06, 0.19, 4.96, -0.22, 0.46, 0.78, 3.32, 2.3, 0.53, 1.23, 1.44, 5.16, 0.65, 1.45, 1.31]} \ No newline at end of file diff --git a/annotations_1/rxWQfQcLAUA_filtered.json b/annotations_1/rxWQfQcLAUA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d52e6b4724a3d193f278deb2f715641b94d9b940 --- /dev/null +++ b/annotations_1/rxWQfQcLAUA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.87], [21.0, 20.85], [21.0, 22.03], [22.0, 23.72], [26.0, 26.49], [29.0, 29.56], [33.0, 34.89], [43.0, 44.44], [51.0, 55.24], [60.0, 64.79], [66.0, 69.62], [89.0, 91.77], [95.0, 95.94], [102.0, 109.07], [118.0, 126.13], [130.0, 131.14], [133.0, 133.69]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.38, 29.56, 30.26, 28.88, 0.0, 29.5, 30.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 51.03], ["a capella", 10.86], ["vocal music", 9.96]], [["music", 56.08], ["singing", 5.69], ["musical instrument", 5.33]], [["music", 66.7], ["musical instrument", 3.53], ["middle eastern music", 2.65]], [["music", 59.82], ["musical instrument", 6.08], ["synthesizer", 5.6]], null, [["music", 51.19], ["theremin", 7.57], ["didgeridoo", 6.88]], [["music", 53.34], ["tabla", 8.92], ["carnatic music", 5.7]], null, null], "duration": [1.87, -0.15, 1.03, 1.72, 0.49, 0.56, 1.89, 1.44, 4.24, 4.79, 3.62, 2.77, 0.94, 7.07, 8.13, 1.14, 0.69]} \ No newline at end of file diff --git a/annotations_1/rxkB20Tpvx0_filtered.json b/annotations_1/rxkB20Tpvx0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..579ad4072185addf3a726a25e2068bd6926eed91 --- /dev/null +++ b/annotations_1/rxkB20Tpvx0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [5.0, 8.43], [18.0, 20.83], [23.0, 23.94], [25.0, 26.94], [39.0, 39.48], [44.0, 46.45], [48.0, 50.38], [56.0, 69.9], [71.0, 72.52], [82.0, 85.31], [90.0, 91.84], [95.0, 95.17], [98.0, 98.39], [104.0, 104.7], [108.0, 107.91], [110.0, 111.18], [117.0, 145.84], [150.0, 155.44]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 98.19, 34.92, 0.0, 0.0, 0.0, 30.88, 31.48, 31.6, 0.0, 30.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.39, 36.25], "audiomae_on_audioset": [null, null, [["music", 49.34], ["speech", 25.26], ["effects unit", 3.22]], null, null, null, [["music", 40.83], ["didgeridoo", 37.86], ["speech", 4.23]], [["music", 49.52], ["theremin", 18.23], ["musical instrument", 7.71]], [["music", 38.51], ["didgeridoo", 8.2], ["cattle, bovinae", 7.67]], null, [["mains hum", 25.67], ["hum", 19.09], ["fly, housefly", 12.75]], null, null, null, null, null, null, [["theremin", 61.67], ["music", 31.33], ["musical instrument", 0.88]], [["music", 33.19], ["foghorn", 20.06], ["brass instrument", 7.48]]], "duration": [1.42, 3.43, 2.83, 0.94, 1.94, 0.48, 2.45, 2.38, 13.9, 1.52, 3.31, 1.84, 0.17, 0.39, 0.7, -0.09, 1.18, 28.84, 5.44]} \ No newline at end of file diff --git a/annotations_1/rxno2wz0eKc_filtered.json b/annotations_1/rxno2wz0eKc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e72f82131a098dab5748cae2df48610cc2d304e8 --- /dev/null +++ b/annotations_1/rxno2wz0eKc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.46], [3.0, 6.03], [10.0, 10.49], [12.0, 13.24], [18.0, 19.63], [27.0, 29.02], [31.0, 30.86], [32.0, 32.27], [33.0, 33.61], [34.0, 34.69], [37.0, 37.83], [40.0, 40.26], [41.0, 42.63], [48.0, 48.73], [50.0, 50.41], [60.0, 60.78], [63.0, 63.83], [65.0, 66.16], [67.0, 68.64], [69.0, 72.84], [77.0, 76.76], [78.0, 77.99], [82.0, 90.8], [93.0, 98.59], [101.0, 102.93], [104.0, 104.45], [105.0, 107.72], [110.0, 118.34], [119.0, 121.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 87.55, 0.0, 0.0, 0.0, 77.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.95, 0.0, 0.0, 44.18, 49.0, 0.0, 0.0, 45.98, 33.12, 39.15], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 83.08], ["musical instrument", 2.92], ["synthesizer", 2.73]], null, null, [["music", 53.64], ["brass instrument", 12.02], ["trombone", 6.78]], [["music", 78.93], ["thunk", 2.92], ["brass instrument", 2.67]], null, null, [["music", 71.73], ["didgeridoo", 7.42], ["musical instrument", 3.77]], [["music", 34.42], ["speech", 26.62], ["screaming", 8.59]], [["didgeridoo", 47.01], ["music", 36.78], ["musical instrument", 4.71]]], "duration": [0.46, 3.03, 0.49, 1.24, 1.63, 2.02, -0.14, 0.27, 0.61, 0.69, 0.83, 0.26, 1.63, 0.73, 0.41, 0.78, 0.83, 1.16, 1.64, 3.84, -0.24, -0.01, 8.8, 5.59, 1.93, 0.45, 2.72, 8.34, 2.46]} \ No newline at end of file diff --git a/annotations_1/ry55--J4_VQ_filtered.json b/annotations_1/ry55--J4_VQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb2127313177d7dc4fb1ba12a7513e594d905af0 --- /dev/null +++ b/annotations_1/ry55--J4_VQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 25.68], [33.0, 33.03], [36.0, 45.13], [48.0, 49.03], [51.0, 51.04], [52.0, 52.98], [55.0, 56.03], [57.0, 59.48]], "keep_status": [true, false, false, false, false, false, false, true], "silence_prob": [48.44, 0.0, 32.1, 0.0, 0.0, 0.0, 0.0, 48.39], "audiomae_on_audioset": [[["hum", 28.76], ["mains hum", 12.25], ["throbbing", 11.98]], null, [["speech", 67.93], ["sidetone", 7.0], ["music", 4.74]], null, null, null, null, [["hum", 17.05], ["music", 15.52], ["mains hum", 7.55]]], "duration": [2.68, 0.03, 9.13, 1.03, 0.04, 0.98, 1.03, 2.48]} \ No newline at end of file diff --git a/annotations_1/ry9yNbMVeMQ_filtered.json b/annotations_1/ry9yNbMVeMQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd3b368c488068e49e42464d333d80bf142223cf --- /dev/null +++ b/annotations_1/ry9yNbMVeMQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 31.75], [33.0, 36.44], [38.0, 78.14], [81.0, 113.26]], "keep_status": [false, true, false, false], "silence_prob": [31.91, 30.3, 0.0, 0.0], "audiomae_on_audioset": [[["music", 30.43], ["hum", 28.91], ["mains hum", 27.85]], [["mains hum", 26.37], ["hum", 20.15], ["music", 15.23]], null, null], "duration": [27.75, 3.44, 40.14, 32.26]} \ No newline at end of file diff --git a/annotations_1/ryqyAX_lA7w_filtered.json b/annotations_1/ryqyAX_lA7w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b20b5c86e9965444088ea98aa801946a2a60101 --- /dev/null +++ b/annotations_1/ryqyAX_lA7w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 106.37], [108.0, 116.83]], "keep_status": [false, true], "silence_prob": [46.5, 44.26], "audiomae_on_audioset": [[["music", 60.49], ["hum", 8.45], ["ambient music", 3.64]], [["music", 57.87], ["singing bowl", 5.41], ["theremin", 5.32]]], "duration": [25.37, 8.83]} \ No newline at end of file diff --git a/annotations_1/ryyEEyKD9EU_filtered.json b/annotations_1/ryyEEyKD9EU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bec1e41e9edf6b86c8ada2f3598afb6d0daecdd --- /dev/null +++ b/annotations_1/ryyEEyKD9EU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.98], [10.0, 9.86], [12.0, 12.11], [14.0, 13.91], [18.0, 20.26], [27.0, 28.02], [31.0, 31.56], [34.0, 34.18], [35.0, 35.02], [37.0, 38.3], [39.0, 40.56], [42.0, 43.16], [45.0, 46.45], [47.0, 47.8], [52.0, 52.39], [54.0, 54.18], [61.0, 61.72], [64.0, 65.31], [72.0, 73.47], [83.0, 83.1], [85.0, 86.73], [89.0, 90.53], [93.0, 93.24], [94.0, 95.23], [97.0, 111.32], [112.0, 115.23], [117.0, 118.49], [123.0, 124.01], [128.0, 129.52], [131.0, 132.93], [134.0, 135.6], [138.0, 138.52], [139.0, 142.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 86.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.47, 60.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.38], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.98, -0.14, 0.11, -0.09, 2.26, 1.02, 0.56, 0.18, 0.02, 1.3, 1.56, 1.16, 1.45, 0.8, 0.39, 0.18, 0.72, 1.31, 1.47, 0.1, 1.73, 1.53, 0.24, 1.23, 14.32, 3.23, 1.49, 1.01, 1.52, 1.93, 1.6, 0.52, 3.16]} \ No newline at end of file diff --git a/annotations_1/rz2FxTVVJi4_filtered.json b/annotations_1/rz2FxTVVJi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..34ae7171da1b392b0f712ef009cc32a211d28373 --- /dev/null +++ b/annotations_1/rz2FxTVVJi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.8], [11.0, 11.06], [11.0, 11.37], [15.0, 14.84], [28.0, 29.12], [35.0, 36.26], [37.0, 38.35], [44.0, 43.95], [56.0, 56.54], [89.0, 89.82], [90.0, 90.93], [97.0, 98.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.8, 0.06, 0.37, -0.16, 1.12, 1.26, 1.35, -0.05, 0.54, 0.82, 0.93, 1.1]} \ No newline at end of file diff --git a/annotations_1/rzCeSHk3aVY_filtered.json b/annotations_1/rzCeSHk3aVY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c6ca616965008ce3356b9592fcd2d112a99fb46 --- /dev/null +++ b/annotations_1/rzCeSHk3aVY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.13], [3.0, 4.06], [7.0, 7.65], [10.0, 12.21], [18.0, 27.11], [31.0, 31.83], [39.0, 39.38], [42.0, 42.35], [46.0, 45.72], [63.0, 64.91], [66.0, 68.17], [71.0, 71.04], [73.0, 74.31], [75.0, 87.29], [89.0, 97.39], [99.0, 100.47], [109.0, 111.97], [114.0, 115.43], [118.0, 122.42], [124.0, 128.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 98.99, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 0.0, 0.0, 40.38, 61.67, 0.0, 58.38, 0.0, 31.31, 29.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.32], ["electronic music", 14.11], ["hum", 12.83]], null, null, null, null, [["music", 48.32], ["buzz", 4.87], ["mosquito", 3.17]], [["music", 38.04], ["throbbing", 6.68], ["hum", 5.45]]], "duration": [0.13, 1.06, 0.65, 2.21, 9.11, 0.83, 0.38, 0.35, -0.28, 1.91, 2.17, 0.04, 1.31, 12.29, 8.39, 1.47, 2.97, 1.43, 4.42, 4.65]} \ No newline at end of file diff --git a/annotations_1/rzIs51GUVgg_filtered.json b/annotations_1/rzIs51GUVgg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43f8e8b03562d664a7133de3ddf31cfe75e11880 --- /dev/null +++ b/annotations_1/rzIs51GUVgg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.22], [14.0, 14.61], [31.0, 33.96], [39.0, 40.83], [58.0, 59.0], [62.0, 62.87], [65.0, 65.96], [67.0, 68.05], [70.0, 70.17], [79.0, 80.25], [82.0, 83.64], [86.0, 86.73], [89.0, 89.38], [93.0, 94.04], [97.0, 98.42], [102.0, 102.46], [131.0, 131.92]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.55, 0.0, 33.96, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["echo", 19.98], ["moo", 10.31], ["cattle, bovinae", 5.65]], null, [["music", 44.4], ["didgeridoo", 10.43], ["singing", 3.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.22, 0.61, 2.96, 1.83, 1.0, 0.87, 0.96, 1.05, 0.17, 1.25, 1.64, 0.73, 0.38, 1.04, 1.42, 0.46, 0.92]} \ No newline at end of file diff --git a/annotations_1/rzuN9uvnsZI_filtered.json b/annotations_1/rzuN9uvnsZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fb56548e0251d3a6e5b3f8f5f5083e4ba04302c2 --- /dev/null +++ b/annotations_1/rzuN9uvnsZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.73], [6.0, 6.34], [11.0, 11.43], [17.0, 16.66], [22.0, 22.22], [28.0, 29.88], [30.0, 32.32], [33.0, 38.21], [39.0, 83.35], [84.0, 96.45], [98.0, 114.07], [115.0, 125.14], [126.0, 165.21], [167.0, 167.83], [170.0, 171.44], [173.0, 173.87], [177.0, 178.38], [180.0, 189.19], [191.0, 191.67], [192.0, 203.52], [207.0, 209.01], [210.0, 212.18], [213.0, 219.3], [221.0, 236.58], [243.0, 244.34], [247.0, 249.1], [255.0, 255.9], [264.0, 264.56]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.31, 39.15, 0.0, 28.4, 28.26, 28.43, 0.0, 0.0, 0.0, 0.0, 0.0, 28.84, 0.0, 29.75, 33.97, 37.65, 34.09, 51.71, 0.0, 90.08, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["sidetone", 90.73], ["speech", 3.77], ["radio", 3.05]], null, [["speech", 13.29], ["music", 11.18], ["hum", 7.81]], [["buzz", 24.98], ["electric shaver, electric razor", 9.09], ["noise", 4.57]], [["speech", 44.44], ["vehicle", 11.9], ["aircraft", 6.57]], null, null, null, null, null, [["mains hum", 30.33], ["hum", 17.7], ["music", 12.11]], null, [["music", 41.59], ["synthesizer", 13.89], ["noise", 10.13]], [["music", 43.59], ["hum", 6.6], ["electronic music", 4.97]], [["music", 42.3], ["didgeridoo", 34.0], ["musical instrument", 4.07]], [["speech", 33.81], ["music", 30.23], ["didgeridoo", 13.97]], null, null, null, null, null], "duration": [0.73, 0.34, 0.43, -0.34, 0.22, 1.88, 2.32, 5.21, 44.35, 12.45, 16.07, 10.14, 39.21, 0.83, 1.44, 0.87, 1.38, 9.19, 0.67, 11.52, 2.01, 2.18, 6.3, 15.58, 1.34, 2.1, 0.9, 0.56]} \ No newline at end of file diff --git a/annotations_1/s-vP7WgMkpA_filtered.json b/annotations_1/s-vP7WgMkpA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3429ea54609483e0952e11f2da2f7a4c2089a61f --- /dev/null +++ b/annotations_1/s-vP7WgMkpA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[45.0, 45.44]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.44]} \ No newline at end of file diff --git a/annotations_1/s039YJGaP-Y_filtered.json b/annotations_1/s039YJGaP-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1834680fa447d5518ee9955c9291df9d769df82d --- /dev/null +++ b/annotations_1/s039YJGaP-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.14], [1.0, 2.84], [10.0, 10.12], [19.0, 19.53], [22.0, 22.6], [23.0, 23.19], [35.0, 35.73], [40.0, 40.91], [44.0, 44.95], [47.0, 47.16], [50.0, 52.07], [54.0, 54.55], [59.0, 78.14], [81.0, 85.09], [88.0, 88.74], [92.0, 96.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.21, 0.0, 64.41, 52.16, 0.0, 39.28], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 54.02], ["sidetone", 12.84], ["radio", 3.7]], null, null, null, null, [["music", 24.71], ["hum", 12.54], ["mains hum", 9.34]]], "duration": [0.14, 1.84, 0.12, 0.53, 0.6, 0.19, 0.73, 0.91, 0.95, 0.16, 2.07, 0.55, 19.14, 4.09, 0.74, 4.72]} \ No newline at end of file diff --git a/annotations_1/s1QgQny2o5E_filtered.json b/annotations_1/s1QgQny2o5E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11e98fcd87fea16a646bb5ec1501130f845b8d4a --- /dev/null +++ b/annotations_1/s1QgQny2o5E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 29.32], [31.0, 34.11], [37.0, 39.09], [41.0, 44.24], [46.0, 46.9], [49.0, 49.65], [53.0, 53.79], [57.0, 59.64], [63.0, 62.53], [67.0, 71.17], [73.0, 88.57], [89.0, 91.84], [93.0, 94.53], [96.0, 112.19], [114.0, 115.65]], "keep_status": [false, true, true, true, false, false, false, true, false, true, false, true, false, false, false], "silence_prob": [35.73, 34.98, 30.91, 42.28, 0.0, 0.0, 0.0, 38.32, 0.0, 32.7, 29.36, 36.2, 0.0, 32.96, 0.0], "audiomae_on_audioset": [[["music", 41.74], ["hum", 21.17], ["mains hum", 17.4]], [["mains hum", 29.07], ["hum", 19.88], ["music", 9.78]], [["music", 28.04], ["sound effect", 14.85], ["synthesizer", 7.86]], [["music", 29.86], ["gong", 20.4], ["sonar", 7.51]], null, null, null, [["music", 18.71], ["hum", 17.97], ["mains hum", 14.61]], null, [["mains hum", 15.15], ["hum", 12.47], ["speech", 8.57]], [["music", 42.94], ["speech", 24.15], ["hum", 9.26]], [["music", 31.89], ["whale vocalization", 15.45], ["civil defense siren", 11.02]], null, [["music", 78.67], ["scary music", 8.25], ["foghorn", 2.74]], null], "duration": [5.32, 3.11, 2.09, 3.24, 0.9, 0.65, 0.79, 2.64, -0.47, 4.17, 15.57, 2.84, 1.53, 16.19, 1.65]} \ No newline at end of file diff --git a/annotations_1/s2Tpk6RnkaA_filtered.json b/annotations_1/s2Tpk6RnkaA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a923d65123e0d78e39fe093aef8a350e19621d12 --- /dev/null +++ b/annotations_1/s2Tpk6RnkaA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.78], [10.0, 9.88], [14.0, 14.07], [18.0, 17.98], [21.0, 22.03], [23.0, 24.17], [27.0, 27.5], [32.0, 33.0], [35.0, 34.82], [37.0, 37.88], [39.0, 41.23], [47.0, 47.31], [48.0, 48.03], [50.0, 50.45], [54.0, 54.89], [56.0, 57.69], [61.0, 61.38], [63.0, 64.37], [65.0, 65.18], [66.0, 66.21], [68.0, 68.52], [70.0, 70.85], [73.0, 73.04], [84.0, 86.86], [88.0, 90.66], [93.0, 94.49], [96.0, 99.25], [100.0, 100.77], [103.0, 103.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 99.85, 0.0, 98.27, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, -0.12, 0.07, -0.02, 1.03, 1.17, 0.5, 1.0, -0.18, 0.88, 2.23, 0.31, 0.03, 0.45, 0.89, 1.69, 0.38, 1.37, 0.18, 0.21, 0.52, 0.85, 0.04, 2.86, 2.66, 1.49, 3.25, 0.77, 0.42]} \ No newline at end of file diff --git a/annotations_1/s33dP0ETrCo_filtered.json b/annotations_1/s33dP0ETrCo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..623882ddcaa2c1eb516dff1dc021bc2ca30843fb --- /dev/null +++ b/annotations_1/s33dP0ETrCo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.38], [13.0, 19.65], [24.0, 25.12], [29.0, 31.23], [32.0, 33.56], [36.0, 37.52], [40.0, 41.12], [42.0, 43.68], [44.0, 47.06], [51.0, 52.79], [65.0, 65.11], [65.0, 65.8], [73.0, 73.82], [79.0, 79.61], [82.0, 83.86], [87.0, 88.1], [92.0, 92.15], [93.0, 93.6], [95.0, 95.81], [105.0, 105.71], [106.0, 107.18], [112.0, 113.36], [117.0, 117.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.04, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 6.65, 1.12, 2.23, 1.56, 1.52, 1.12, 1.68, 3.06, 1.79, 0.11, 0.8, 0.82, 0.61, 1.86, 1.1, 0.15, 0.6, 0.81, 0.71, 1.18, 1.36, 0.54]} \ No newline at end of file diff --git a/annotations_1/s3mwDA8sv8I_filtered.json b/annotations_1/s3mwDA8sv8I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af9dfbc0fd9e59d81314498bcc3136e9dc95a3a8 --- /dev/null +++ b/annotations_1/s3mwDA8sv8I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.64], [10.0, 10.13], [13.0, 13.54], [15.0, 14.77], [19.0, 20.36], [22.0, 24.09], [26.0, 26.82], [28.0, 29.56], [31.0, 32.76], [35.0, 36.48], [38.0, 38.67], [41.0, 41.01], [42.0, 50.87], [52.0, 62.46], [64.0, 64.93], [66.0, 68.77], [69.0, 78.73], [81.0, 81.63], [84.0, 85.8], [87.0, 90.17], [93.0, 95.94], [97.0, 100.53], [102.0, 102.27], [103.0, 104.53], [106.0, 109.14], [112.0, 115.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.5, 81.35, 0.0, 75.72, 56.33, 0.0, 0.0, 71.29, 64.07, 60.6, 0.0, 0.0, 80.82, 58.89], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 29.12], ["insect", 18.83], ["speech", 15.73]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.64, 0.13, 0.54, -0.23, 1.36, 2.09, 0.82, 1.56, 1.76, 1.48, 0.67, 0.01, 8.87, 10.46, 0.93, 2.77, 9.73, 0.63, 1.8, 3.17, 2.94, 3.53, 0.27, 1.53, 3.14, 3.3]} \ No newline at end of file diff --git a/annotations_1/s43ARFFNrz0_filtered.json b/annotations_1/s43ARFFNrz0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d843ae51f27a09060ed2838e088385c26bd3e2a --- /dev/null +++ b/annotations_1/s43ARFFNrz0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.42], [19.0, 19.08], [20.0, 20.63], [21.0, 21.83], [26.0, 26.32], [52.0, 54.18], [60.0, 60.29], [71.0, 76.4], [77.0, 77.82], [79.0, 88.03]], "keep_status": [true, false, false, false, false, true, false, false, false, false], "silence_prob": [45.59, 0.0, 0.0, 0.0, 0.0, 43.33, 0.0, 62.07, 0.0, 62.47], "audiomae_on_audioset": [[["raindrop", 24.44], ["rain on surface", 16.42], ["rain", 14.5]], null, null, null, null, [["rain on surface", 24.23], ["rain", 16.14], ["raindrop", 12.59]], null, null, null, null], "duration": [3.42, 0.08, 0.63, 0.83, 0.32, 2.18, 0.29, 5.4, 0.82, 9.03]} \ No newline at end of file diff --git a/annotations_1/s4esaE679Wg_filtered.json b/annotations_1/s4esaE679Wg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c92efb29a57712b5c18b0f7cb6c7a3a2a38b46ca --- /dev/null +++ b/annotations_1/s4esaE679Wg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 22.92], [24.0, 27.82], [30.0, 35.09], [46.0, 46.65], [47.0, 47.68], [52.0, 53.59], [56.0, 59.9], [61.0, 62.09], [65.0, 66.02], [68.0, 68.82], [72.0, 84.32], [86.0, 96.48], [96.0, 96.52], [97.0, 96.77], [97.0, 101.75], [103.0, 124.07], [125.0, 165.86], [166.0, 166.45], [167.0, 167.44], [167.0, 167.59]], "keep_status": [true, true, true, false, false, false, true, false, false, false, false, true, false, false, true, true, false, false, false, false], "silence_prob": [27.82, 27.77, 28.68, 0.0, 0.0, 0.0, 31.55, 0.0, 0.0, 0.0, 27.81, 28.01, 0.0, 0.0, 28.17, 27.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 31.73], ["cattle, bovinae", 11.59], ["animal", 8.43]], [["vehicle", 20.08], ["car", 14.77], ["skidding", 12.77]], [["music", 13.86], ["noise", 9.43], ["sound effect", 9.23]], null, null, null, [["music", 56.84], ["cattle, bovinae", 7.04], ["didgeridoo", 5.51]], null, null, null, [["speech", 68.8], ["vehicle", 5.95], ["motorcycle", 3.03]], [["speech", 35.1], ["vehicle", 6.55], ["music", 6.16]], null, null, [["music", 45.72], ["noise", 13.11], ["musical instrument", 7.32]], [["music", 52.24], ["buzz", 5.51], ["fly, housefly", 3.17]], null, null, null, null], "duration": [14.92, 3.82, 5.09, 0.65, 0.68, 1.59, 3.9, 1.09, 1.02, 0.82, 12.32, 10.48, 0.52, -0.23, 4.75, 21.07, 40.86, 0.45, 0.44, 0.59]} \ No newline at end of file diff --git a/annotations_1/s6JmX_n5oeo_filtered.json b/annotations_1/s6JmX_n5oeo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a2b2cfe2e3ff960c1a82feb87092f08e041cd86 --- /dev/null +++ b/annotations_1/s6JmX_n5oeo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.5], [17.0, 20.61], [22.0, 23.23], [26.0, 26.86], [31.0, 31.6], [38.0, 38.6], [40.0, 42.11], [45.0, 45.37], [47.0, 50.92], [55.0, 58.9], [64.0, 65.64], [66.0, 67.63], [71.0, 76.84], [78.0, 79.35], [81.0, 81.55], [82.0, 82.17], [84.0, 83.67], [84.0, 86.64], [88.0, 92.64], [95.0, 95.15], [98.0, 98.91], [99.0, 99.94], [100.0, 102.24], [103.0, 116.09]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [73.82, 99.59, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 47.08, 79.41, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 76.86, 99.26, 0.0, 0.0, 0.0, 72.01, 41.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["stomach rumble", 16.21], ["hum", 13.88], ["throbbing", 7.86]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 17.13], ["tuning fork", 10.93], ["hum", 8.72]]], "duration": [4.5, 3.61, 1.23, 0.86, 0.6, 0.6, 2.11, 0.37, 3.92, 3.9, 1.64, 1.63, 5.84, 1.35, 0.55, 0.17, -0.33, 2.64, 4.64, 0.15, 0.91, 0.94, 2.24, 13.09]} \ No newline at end of file diff --git a/annotations_1/s6moLb_ieqA_filtered.json b/annotations_1/s6moLb_ieqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..399feecbce8c04c43ef29e6235188fb44c9f013d --- /dev/null +++ b/annotations_1/s6moLb_ieqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.61], [2.0, 3.16], [5.0, 5.88], [6.0, 7.43], [10.0, 10.45], [22.0, 46.41], [48.0, 48.17], [54.0, 59.73], [65.0, 64.86], [65.0, 65.64], [68.0, 73.28], [74.0, 79.79], [83.0, 83.15], [83.0, 87.74], [93.0, 103.81], [107.0, 107.87], [109.0, 109.02], [111.0, 112.56], [113.0, 117.78], [122.0, 121.71], [122.0, 123.79], [126.0, 127.58], [128.0, 129.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 62.58, 0.0, 50.91, 0.0, 0.0, 100.0, 99.91, 0.0, 47.9, 32.83, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["thunk", 43.18], ["speech", 34.29], ["music", 4.59]], [["music", 42.63], ["thunk", 13.99], ["whack, thwack", 12.09]], null, null, null, null, null, null, null, null], "duration": [-0.39, 1.16, 0.88, 1.43, 0.45, 24.41, 0.17, 5.73, -0.14, 0.64, 5.28, 5.79, 0.15, 4.74, 10.81, 0.87, 0.02, 1.56, 4.78, -0.29, 1.79, 1.58, 1.0]} \ No newline at end of file diff --git a/annotations_1/s6n8HGwboO4_filtered.json b/annotations_1/s6n8HGwboO4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9f3a8e9b9da144c5d24da71ec7ad444b836ed723 --- /dev/null +++ b/annotations_1/s6n8HGwboO4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.26], [7.0, 9.46], [39.0, 40.8], [43.0, 43.43], [45.0, 46.23], [49.0, 59.56], [63.0, 68.37], [69.0, 74.98], [76.0, 78.19], [79.0, 81.72], [83.0, 83.47], [84.0, 85.46], [87.0, 88.13], [89.0, 90.46], [91.0, 93.02], [94.0, 95.77], [100.0, 100.92], [107.0, 107.54], [111.0, 112.9], [116.0, 117.54], [120.0, 121.78], [125.0, 127.18], [128.0, 129.63], [134.0, 135.89], [138.0, 138.64], [141.0, 144.04]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 81.89, 0.0, 0.0, 0.0, 47.05, 64.52, 56.55, 70.72, 63.64, 0.0, 0.0, 0.0, 0.0, 83.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.19, 0.0, 0.0, 0.0, 59.07], "audiomae_on_audioset": [null, null, null, null, null, [["cello", 34.32], ["music", 17.79], ["bowed string instrument", 12.19]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.22], ["sidetone", 21.66], ["hum", 4.95]], null, null, null, null], "duration": [1.26, 2.46, 1.8, 0.43, 1.23, 10.56, 5.37, 5.98, 2.19, 2.72, 0.47, 1.46, 1.13, 1.46, 2.02, 1.77, 0.92, 0.54, 1.9, 1.54, 1.78, 2.18, 1.63, 1.89, 0.64, 3.04]} \ No newline at end of file diff --git a/annotations_1/s7ougTo-pGg_filtered.json b/annotations_1/s7ougTo-pGg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10e5072149c2a8914c6f6995db0f1d572ae91a70 --- /dev/null +++ b/annotations_1/s7ougTo-pGg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.72], [6.0, 7.43], [15.0, 15.43], [17.0, 17.78], [19.0, 20.33], [28.0, 28.78], [33.0, 34.13], [53.0, 53.54], [55.0, 60.93], [62.0, 66.77], [74.0, 74.66], [84.0, 83.67], [88.0, 88.53], [89.0, 107.64], [111.0, 136.17], [139.0, 149.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.02, 34.34, 0.0, 0.0, 0.0, 33.5, 32.91, 43.03], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 51.19], ["sidetone", 21.31], ["electronic music", 4.52]], [["music", 71.47], ["electronic music", 3.16], ["musical instrument", 2.0]], null, null, null, [["music", 43.31], ["cattle, bovinae", 16.24], ["moo", 12.96]], [["music", 67.98], ["electronic music", 6.39], ["cattle, bovinae", 3.07]], [["music", 73.33], ["didgeridoo", 3.37], ["musical instrument", 2.98]]], "duration": [0.72, 1.43, 0.43, 0.78, 1.33, 0.78, 1.13, 0.54, 5.93, 4.77, 0.66, -0.33, 0.53, 18.64, 25.17, 10.37]} \ No newline at end of file diff --git a/annotations_1/s8cVCsIcGAE_filtered.json b/annotations_1/s8cVCsIcGAE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3841a8769336edf6a035a01421ef7969ed6c10ef --- /dev/null +++ b/annotations_1/s8cVCsIcGAE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 26.11], [27.0, 27.97], [28.0, 29.52], [30.0, 36.14], [38.0, 45.54], [50.0, 77.38], [80.0, 81.4], [84.0, 85.5], [91.0, 93.53], [99.0, 141.81], [144.0, 148.98]], "keep_status": [false, false, false, true, true, false, false, false, true, false, true], "silence_prob": [30.83, 0.0, 0.0, 29.83, 28.63, 28.65, 0.0, 0.0, 28.39, 0.0, 35.22], "audiomae_on_audioset": [[["hum", 33.73], ["speech", 24.09], ["mains hum", 15.53]], null, null, [["speech", 25.99], ["music", 9.71], ["animal", 6.97]], [["music", 15.29], ["speech", 14.55], ["buzz", 11.2]], [["mains hum", 30.79], ["music", 20.13], ["hum", 19.37]], null, null, [["music", 23.38], ["hum", 17.15], ["throbbing", 12.83]], null, [["music", 44.85], ["hum", 12.76], ["speech", 8.67]]], "duration": [10.11, 0.97, 1.52, 6.14, 7.54, 27.38, 1.4, 1.5, 2.53, 42.81, 4.98]} \ No newline at end of file diff --git a/annotations_1/s8tXE43jYho_filtered.json b/annotations_1/s8tXE43jYho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63dbcf8321b800a76bf0193a03e54adc9ab388d5 --- /dev/null +++ b/annotations_1/s8tXE43jYho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.97], [11.0, 14.18], [17.0, 18.2], [21.0, 23.33], [29.0, 29.02], [32.0, 44.42], [46.0, 48.57], [59.0, 64.37], [66.0, 75.22], [77.0, 84.74], [85.0, 85.02], [86.0, 88.2], [91.0, 91.62], [95.0, 102.9], [106.0, 106.59]], "keep_status": [false, false, false, true, false, false, true, true, false, false, false, true, false, true, false], "silence_prob": [0.0, 99.99, 0.0, 46.33, 0.0, 40.64, 36.55, 45.08, 35.54, 35.13, 0.0, 35.3, 0.0, 36.74, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 44.05], ["musical instrument", 10.29], ["guitar", 3.83]], null, [["music", 54.98], ["theremin", 12.17], ["hum", 5.04]], [["music", 31.45], ["speech", 28.75], ["didgeridoo", 5.0]], [["music", 53.79], ["musical instrument", 7.81], ["hum", 4.57]], [["music", 70.96], ["speech", 14.64], ["effects unit", 1.63]], [["music", 72.67], ["speech", 5.53], ["boing", 4.36]], null, [["speech", 21.59], ["music", 11.57], ["dog", 9.34]], null, [["music", 32.57], ["speech", 15.31], ["guitar", 15.29]], null], "duration": [1.97, 3.18, 1.2, 2.33, 0.02, 12.42, 2.57, 5.37, 9.22, 7.74, 0.02, 2.2, 0.62, 7.9, 0.59]} \ No newline at end of file diff --git a/annotations_1/s9TKR7rSFfA_filtered.json b/annotations_1/s9TKR7rSFfA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..83863a81096c0126ce5a686455d25a533343edae --- /dev/null +++ b/annotations_1/s9TKR7rSFfA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.86], [4.0, 3.96], [5.0, 6.64], [8.0, 8.82], [10.0, 10.03], [17.0, 19.77], [21.0, 21.61], [22.0, 23.16], [25.0, 25.34], [27.0, 26.67], [28.0, 28.51], [29.0, 33.71], [37.0, 41.99], [44.0, 44.91], [47.0, 47.22], [47.0, 48.98], [51.0, 54.95], [56.0, 56.03], [57.0, 61.79], [63.0, 64.89], [68.0, 69.43], [74.0, 74.55], [76.0, 77.14], [95.0, 94.85], [96.0, 96.6], [98.0, 100.62], [103.0, 103.94], [108.0, 108.11], [108.0, 108.14], [110.0, 115.05], [116.0, 116.28], [118.0, 118.34]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 62.99, 0.0, 0.0, 0.0, 0.0, 0.0, 77.7, 32.88, 0.0, 0.0, 0.0, 39.08, 0.0, 38.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.75, 0.0, 0.0, 0.0, 83.16, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 24.6], ["noise", 20.02], ["mains hum", 19.38]], null, null, null, [["sidetone", 43.91], ["speech", 27.46], ["hum", 4.22]], null, [["hum", 15.94], ["speech", 15.38], ["mains hum", 12.54]], null, null, null, null, null, null, [["hum", 16.21], ["snicker", 7.6], ["eruption", 6.5]], null, null, null, null, null, null], "duration": [-0.14, -0.04, 1.64, 0.82, 0.03, 2.77, 0.61, 1.16, 0.34, -0.33, 0.51, 4.71, 4.99, 0.91, 0.22, 1.98, 3.95, 0.03, 4.79, 1.89, 1.43, 0.55, 1.14, -0.15, 0.6, 2.62, 0.94, 0.11, 0.14, 5.05, 0.28, 0.34]} \ No newline at end of file diff --git a/annotations_1/sAvGdule3fA_filtered.json b/annotations_1/sAvGdule3fA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef0b1094eaf27534549dda360e2ab5c7a57d96de --- /dev/null +++ b/annotations_1/sAvGdule3fA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.89], [13.0, 13.71], [14.0, 14.32], [15.0, 18.52], [19.0, 20.63], [21.0, 22.74], [25.0, 27.75], [28.0, 28.92], [29.0, 30.87], [32.0, 32.32], [33.0, 33.13], [34.0, 38.47], [39.0, 41.89], [42.0, 43.8], [45.0, 46.16], [47.0, 50.3], [51.0, 53.82], [55.0, 56.07], [57.0, 63.29], [64.0, 65.21], [66.0, 68.79], [69.0, 70.92], [73.0, 73.99], [75.0, 76.11], [77.0, 79.71], [80.0, 81.65], [83.0, 85.9], [87.0, 87.42], [88.0, 87.79], [89.0, 90.29], [91.0, 93.31], [95.0, 94.93], [98.0, 101.6], [105.0, 105.19], [109.0, 113.07], [115.0, 115.3], [116.0, 123.06], [125.0, 128.49], [129.0, 134.5], [135.0, 135.3], [136.0, 137.24], [138.0, 138.82], [140.0, 140.63], [141.0, 150.08], [153.0, 155.31], [157.0, 157.67], [161.0, 162.35], [163.0, 164.96], [166.0, 166.97], [168.0, 169.97], [171.0, 171.96], [173.0, 173.21], [177.0, 184.1], [186.0, 188.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 78.21, 0.0, 0.0, 86.82, 0.0, 0.0, 0.0, 0.0, 87.19, 83.88, 0.0, 0.0, 75.88, 76.86, 0.0, 50.06, 0.0, 53.65, 0.0, 0.0, 0.0, 86.09, 0.0, 64.18, 0.0, 0.0, 0.0, 61.57, 0.0, 53.47, 0.0, 40.38, 0.0, 50.97, 42.33, 39.38, 0.0, 0.0, 0.0, 0.0, 39.94, 47.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.52, 37.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 36.88], ["music", 22.37], ["hum", 13.93]], null, null, [["music", 26.15], ["organ", 13.49], ["musical instrument", 10.53]], [["music", 49.68], ["theremin", 12.61], ["musical instrument", 5.17]], null, null, null, null, [["music", 43.83], ["speech", 24.39], ["foghorn", 13.96]], [["music", 27.07], ["hum", 8.67], ["mains hum", 8.54]], null, null, null, null, null, null, null, [["music", 45.96], ["theremin", 24.0], ["foghorn", 5.16]], [["music", 56.38], ["didgeridoo", 21.33], ["theremin", 4.84]]], "duration": [0.89, 0.71, 0.32, 3.52, 1.63, 1.74, 2.75, 0.92, 1.87, 0.32, 0.13, 4.47, 2.89, 1.8, 1.16, 3.3, 2.82, 1.07, 6.29, 1.21, 2.79, 1.92, 0.99, 1.11, 2.71, 1.65, 2.9, 0.42, -0.21, 1.29, 2.31, -0.07, 3.6, 0.19, 4.07, 0.3, 7.06, 3.49, 5.5, 0.3, 1.24, 0.82, 0.63, 9.08, 2.31, 0.67, 1.35, 1.96, 0.97, 1.97, 0.96, 0.21, 7.1, 2.5]} \ No newline at end of file diff --git a/annotations_1/sC78ImgOLQI_filtered.json b/annotations_1/sC78ImgOLQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0162137acdf68374897c1e991f85912f54531a4 --- /dev/null +++ b/annotations_1/sC78ImgOLQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.23], [4.0, 5.36], [14.0, 13.91], [17.0, 17.14], [18.0, 18.27], [19.0, 50.58], [54.0, 56.03], [57.0, 58.99], [60.0, 60.69], [62.0, 65.8], [67.0, 68.37], [69.0, 70.75], [72.0, 72.47], [73.0, 74.28], [75.0, 82.43], [83.0, 98.1], [98.0, 98.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.46, 0.0, 0.0, 67.25, 0.0, 0.0, 0.0, 0.0, 34.06, 32.06, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 19.53], ["music", 15.96], ["synthesizer", 9.49]], [["music", 25.2], ["synthesizer", 11.78], ["speech", 11.25]], null], "duration": [0.23, 1.36, -0.09, 0.14, 0.27, 31.58, 2.03, 1.99, 0.69, 3.8, 1.37, 1.75, 0.47, 1.28, 7.43, 15.1, 0.9]} \ No newline at end of file diff --git a/annotations_1/sCSTQpBwqqs_filtered.json b/annotations_1/sCSTQpBwqqs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e41add6143718548ec81e38aafe7e5b849449bf3 --- /dev/null +++ b/annotations_1/sCSTQpBwqqs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 42.23], [43.0, 43.95], [44.0, 51.26], [52.0, 53.92], [55.0, 56.34], [57.0, 62.78], [64.0, 79.54], [80.0, 81.67], [82.0, 92.33], [93.0, 96.52], [98.0, 103.44], [104.0, 108.48], [119.0, 119.35], [122.0, 124.75], [125.0, 127.87]], "keep_status": [false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [67.38, 0.0, 88.1, 0.0, 0.0, 71.14, 34.48, 0.0, 46.68, 53.65, 49.5, 37.85, 0.0, 55.6, 47.54], "audiomae_on_audioset": [null, null, null, null, null, null, [["hum", 47.87], ["mains hum", 19.15], ["music", 5.57]], null, [["insect", 40.43], ["animal", 7.48], ["fly, housefly", 6.62]], null, [["fly, housefly", 12.96], ["fireworks", 12.49], ["insect", 11.83]], [["speech", 39.45], ["explosion", 9.48], ["whack, thwack", 4.39]], null, null, [["fly, housefly", 34.31], ["insect", 29.96], ["speech", 10.47]]], "duration": [26.23, 0.95, 7.26, 1.92, 1.34, 5.78, 15.54, 1.67, 10.33, 3.52, 5.44, 4.48, 0.35, 2.75, 2.87]} \ No newline at end of file diff --git a/annotations_1/sCr9YZRDsJA_filtered.json b/annotations_1/sCr9YZRDsJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad652c67a4e6e37c9333b62603c656dbad018c7e --- /dev/null +++ b/annotations_1/sCr9YZRDsJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.45], [8.0, 8.92], [17.0, 17.98], [24.0, 25.69], [30.0, 30.0], [39.0, 39.39], [50.0, 50.55], [54.0, 54.36], [67.0, 74.36], [77.0, 77.7], [78.0, 79.62], [104.0, 104.8], [106.0, 106.1], [111.0, 115.48], [126.0, 127.31], [130.0, 131.14], [133.0, 133.76], [134.0, 135.72], [137.0, 146.38], [147.0, 148.09], [153.0, 155.01], [157.0, 160.3], [164.0, 164.73], [165.0, 174.8], [182.0, 182.63], [184.0, 208.94], [210.0, 213.17], [213.0, 213.34], [213.0, 213.44], [213.0, 213.61], [214.0, 224.34], [231.0, 232.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.51, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 29.31, 0.0, 30.96, 29.03, 0.0, 29.16, 0.0, 30.16, 29.08, 0.0, 0.0, 0.0, 29.48, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 71.84], ["scratching (performance technique)", 7.11], ["electronic music", 3.47]], null, null, null, null, null, null, null, null, null, [["music", 45.33], ["speech", 39.53], ["didgeridoo", 1.94]], null, [["speech", 62.65], ["vehicle", 6.68], ["boat, water vehicle", 3.47]], [["speech", 61.0], ["music", 9.7], ["vehicle", 3.78]], null, [["speech", 18.11], ["livestock, farm animals, working animals", 10.29], ["cattle, bovinae", 5.84]], null, [["speech", 19.36], ["cattle, bovinae", 12.05], ["music", 11.99]], [["music", 47.37], ["whoosh, swoosh, swish", 4.11], ["whack, thwack", 3.61]], null, null, null, [["sidetone", 21.84], ["throbbing", 20.94], ["music", 20.1]], null], "duration": [0.45, 0.92, 0.98, 1.69, 0.0, 0.39, 0.55, 0.36, 7.36, 0.7, 1.62, 0.8, 0.1, 4.48, 1.31, 1.14, 0.76, 1.72, 9.38, 1.09, 2.01, 3.3, 0.73, 9.8, 0.63, 24.94, 3.17, 0.34, 0.44, 0.61, 10.34, 1.36]} \ No newline at end of file diff --git a/annotations_1/sCsMjWjftZs_filtered.json b/annotations_1/sCsMjWjftZs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b59c66a6a1aa76ac969f47d244fb83b090e39f60 --- /dev/null +++ b/annotations_1/sCsMjWjftZs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.5], [11.0, 11.03], [13.0, 13.95], [18.0, 44.76], [48.0, 52.35], [55.0, 62.65], [63.0, 64.96], [71.0, 79.35], [86.0, 87.52], [88.0, 93.38], [94.0, 95.4], [99.0, 101.56], [103.0, 103.89], [106.0, 107.08], [108.0, 136.7], [137.0, 137.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.27, 64.86, 31.58, 0.0, 33.34, 0.0, 35.67, 0.0, 39.69, 0.0, 0.0, 31.65, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 81.98], ["speech", 1.34], ["musical instrument", 0.95]], null, [["music", 77.15], ["theremin", 5.36], ["musical instrument", 3.72]], null, [["music", 75.62], ["throbbing", 11.71], ["hum", 1.78]], null, [["hum", 36.38], ["music", 22.69], ["mains hum", 15.16]], null, [["music", 42.07], ["foghorn", 14.28], ["speech", 2.25]], null, null, [["music", 70.3], ["scary music", 2.9], ["mains hum", 2.65]], null], "duration": [0.5, 0.03, 0.95, 26.76, 4.35, 7.65, 1.96, 8.35, 1.52, 5.38, 1.4, 2.56, 0.89, 1.08, 28.7, 0.94]} \ No newline at end of file diff --git a/annotations_1/sDEWZnPJGRU_filtered.json b/annotations_1/sDEWZnPJGRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef31538318e9f36825d191c5f1d733aa24eeaf40 --- /dev/null +++ b/annotations_1/sDEWZnPJGRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.01], [30.0, 31.51], [33.0, 34.26], [37.0, 45.45], [48.0, 49.23], [49.0, 50.16], [51.0, 56.81], [59.0, 62.26], [71.0, 72.4], [81.0, 83.67], [92.0, 92.97], [94.0, 95.34], [113.0, 115.18], [127.0, 128.14], [131.0, 143.4], [148.0, 155.55], [169.0, 170.26], [171.0, 172.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [51.02, 0.0, 0.0, 33.05, 0.0, 0.0, 32.92, 32.64, 0.0, 31.63, 0.0, 0.0, 36.39, 0.0, 32.3, 31.58, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 30.36], ["mosquito", 27.39], ["insect", 16.12]], null, null, [["music", 67.9], ["didgeridoo", 6.38], ["throbbing", 2.29]], [["music", 66.85], ["didgeridoo", 3.94], ["musical instrument", 1.33]], null, [["music", 67.86], ["carnatic music", 5.67], ["chant", 1.92]], null, null, [["music", 83.32], ["electronic music", 1.61], ["throbbing", 1.38]], null, [["music", 65.81], ["musical instrument", 4.78], ["didgeridoo", 3.08]], [["music", 71.31], ["buzz", 4.0], ["mosquito", 2.6]], null, null], "duration": [2.01, 1.51, 1.26, 8.45, 1.23, 1.16, 5.81, 3.26, 1.4, 2.67, 0.97, 1.34, 2.18, 1.14, 12.4, 7.55, 1.26, 1.42]} \ No newline at end of file diff --git a/annotations_1/sF-j-GhV6xw_filtered.json b/annotations_1/sF-j-GhV6xw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b72e0c970b91bec56f38827b4648e1bc5ccf636 --- /dev/null +++ b/annotations_1/sF-j-GhV6xw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.61], [10.0, 14.62], [17.0, 16.78], [22.0, 23.9], [28.0, 30.52], [32.0, 32.43], [40.0, 40.36], [45.0, 45.54], [51.0, 51.73], [53.0, 54.23], [59.0, 58.77], [62.0, 62.02], [70.0, 70.9], [74.0, 74.53], [75.0, 75.74], [78.0, 79.12], [88.0, 87.98], [91.0, 92.37], [100.0, 102.66], [107.0, 107.15], [112.0, 114.98], [116.0, 116.18], [117.0, 117.96], [132.0, 132.43], [148.0, 149.81], [167.0, 169.69], [172.0, 173.57], [179.0, 187.78], [190.0, 190.56], [191.0, 192.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 36.98, 0.0, 0.0, 81.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.77, 0.0, 53.4, 0.0, 0.0, 0.0, 0.0, 28.85, 0.0, 47.98, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 43.65], ["throbbing", 18.5], ["hum", 8.28]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 30.28], ["hum", 20.33], ["static", 7.34]], null, [["music", 43.74], ["breaking", 15.76], ["buzz", 6.2]], null, null], "duration": [0.61, 4.62, -0.22, 1.9, 2.52, 0.43, 0.36, 0.54, 0.73, 1.23, -0.23, 0.02, 0.9, 0.53, 0.74, 1.12, -0.02, 1.37, 2.66, 0.15, 2.98, 0.18, 0.96, 0.43, 1.81, 2.69, 1.57, 8.78, 0.56, 1.01]} \ No newline at end of file diff --git a/annotations_1/sGLXpKnQfSs_filtered.json b/annotations_1/sGLXpKnQfSs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e80b84603aa6db98d67d5e16f1bc3671915b3c2c --- /dev/null +++ b/annotations_1/sGLXpKnQfSs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 39.09], [40.0, 40.95], [41.0, 41.88], [43.0, 45.59], [55.0, 60.74], [64.0, 84.48], [87.0, 88.84], [92.0, 92.82], [94.0, 122.5], [124.0, 124.46], [125.0, 125.49], [126.0, 126.49], [128.0, 150.3], [151.0, 152.31], [155.0, 155.41], [160.0, 161.65], [163.0, 163.71]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [43.66, 0.0, 0.0, 35.54, 38.58, 33.8, 0.0, 0.0, 33.7, 0.0, 0.0, 0.0, 31.08, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 76.45], ["electronic music", 3.81], ["telephone bell ringing", 3.3]], null, null, [["music", 77.38], ["hum", 2.95], ["throbbing", 2.87]], [["music", 31.4], ["speech", 13.33], ["throbbing", 10.14]], [["music", 45.66], ["speech", 19.73], ["throbbing", 10.39]], null, null, [["music", 69.48], ["didgeridoo", 6.44], ["theremin", 2.3]], null, null, null, [["music", 49.68], ["hum", 9.56], ["cacophony", 6.65]], null, null, null, null], "duration": [28.09, 0.95, 0.88, 2.59, 5.74, 20.48, 1.84, 0.82, 28.5, 0.46, 0.49, 0.49, 22.3, 1.31, 0.41, 1.65, 0.71]} \ No newline at end of file diff --git a/annotations_1/sGPeVmnAFAI_filtered.json b/annotations_1/sGPeVmnAFAI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..463d84d235352428f15f327c082c6666da0f45af --- /dev/null +++ b/annotations_1/sGPeVmnAFAI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.0], [5.0, 6.89], [8.0, 9.63], [13.0, 12.7], [16.0, 16.53], [21.0, 21.88], [23.0, 23.9], [26.0, 26.89], [29.0, 29.78], [33.0, 33.18], [34.0, 35.75], [36.0, 36.07], [38.0, 39.24], [40.0, 39.9], [51.0, 51.8], [53.0, 53.49], [57.0, 57.84], [59.0, 59.54], [61.0, 64.74], [65.0, 66.34], [69.0, 70.44], [71.0, 73.09], [74.0, 77.62], [81.0, 82.29], [83.0, 84.08], [86.0, 87.93], [89.0, 91.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.17, 0.0, 0.0, 53.28, 92.31, 0.0, 0.0, 0.0, 99.62], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 1.89, 1.63, -0.3, 0.53, 0.88, 0.9, 0.89, 0.78, 0.18, 1.75, 0.07, 1.24, -0.1, 0.8, 0.49, 0.84, 0.54, 3.74, 1.34, 1.44, 2.09, 3.62, 1.29, 1.08, 1.93, 2.03]} \ No newline at end of file diff --git a/annotations_1/sH8nzHarprc_filtered.json b/annotations_1/sH8nzHarprc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59960ebf078d57878ac674415bbf65104e13c7cd --- /dev/null +++ b/annotations_1/sH8nzHarprc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.02], [15.0, 21.84], [27.0, 30.01], [34.0, 34.65], [40.0, 41.59], [43.0, 43.48], [51.0, 51.43], [53.0, 54.16], [61.0, 60.94], [68.0, 70.53], [74.0, 98.68], [102.0, 104.41], [108.0, 111.3], [112.0, 137.59], [140.0, 141.59], [144.0, 145.71], [148.0, 149.05]], "keep_status": [true, false, true, false, false, false, false, false, false, true, true, false, true, false, false, false, false], "silence_prob": [34.44, 33.64, 34.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.4, 28.88, 29.9, 29.07, 28.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 28.47], ["hum", 25.11], ["mains hum", 11.25]], [["music", 39.76], ["hum", 25.16], ["throbbing", 13.23]], [["speech", 37.25], ["music", 13.64], ["hum", 4.23]], null, null, null, null, null, null, [["music", 27.06], ["tabla", 11.49], ["carnatic music", 6.39]], [["music", 61.47], ["sound effect", 2.86], ["buzz", 2.78]], [["music", 51.73], ["speech", 23.96], ["buzz", 5.44]], [["music", 46.21], ["speech", 15.24], ["boing", 6.85]], [["music", 49.72], ["speech", 19.7], ["boing", 2.75]], null, null, null], "duration": [4.02, 6.84, 3.01, 0.65, 1.59, 0.48, 0.43, 1.16, -0.06, 2.53, 24.68, 2.41, 3.3, 25.59, 1.59, 1.71, 1.05]} \ No newline at end of file diff --git a/annotations_1/sIDHrcDf-N0_filtered.json b/annotations_1/sIDHrcDf-N0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d680cd37e3df33519a49135b9665e2830a0b319 --- /dev/null +++ b/annotations_1/sIDHrcDf-N0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 21.32], [28.0, 33.62], [34.0, 34.45], [35.0, 34.86], [36.0, 37.03], [41.0, 42.06], [43.0, 43.41], [44.0, 45.12], [48.0, 49.22], [50.0, 61.94], [62.0, 62.58], [63.0, 74.28], [77.0, 78.49], [83.0, 83.61], [87.0, 88.59], [90.0, 107.94], [120.0, 121.39], [123.0, 122.91], [126.0, 128.31], [129.0, 130.52], [132.0, 134.96], [138.0, 137.89], [140.0, 182.19]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [28.49, 28.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.26, 0.0, 28.85, 0.0, 0.0, 0.0, 29.03, 0.0, 0.0, 31.23, 0.0, 29.45, 0.0, 0.0], "audiomae_on_audioset": [[["music", 17.49], ["vehicle", 13.44], ["aircraft", 7.85]], [["speech", 34.39], ["music", 23.27], ["vehicle", 6.43]], null, null, null, null, null, null, null, [["music", 47.01], ["throbbing", 30.9], ["hum", 4.46]], null, [["speech", 56.71], ["vehicle", 8.13], ["music", 5.86]], null, null, null, [["music", 68.48], ["speech", 11.66], ["musical instrument", 2.08]], null, null, [["throbbing", 27.21], ["music", 23.48], ["hum", 16.83]], null, [["music", 45.94], ["tuning fork", 10.24], ["ping", 4.57]], null, null], "duration": [19.32, 5.62, 0.45, -0.14, 1.03, 1.06, 0.41, 1.12, 1.22, 11.94, 0.58, 11.28, 1.49, 0.61, 1.59, 17.94, 1.39, -0.09, 2.31, 1.52, 2.96, -0.11, 42.19]} \ No newline at end of file diff --git a/annotations_1/sILyPxN_1Dc_filtered.json b/annotations_1/sILyPxN_1Dc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35ffc236df44acbf8e73da9356a86502dd20dd1b --- /dev/null +++ b/annotations_1/sILyPxN_1Dc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.73], [16.0, 16.44], [19.0, 20.06], [22.0, 22.67], [47.0, 47.41], [51.0, 50.99], [53.0, 56.24], [58.0, 57.96], [69.0, 71.17], [72.0, 72.59]], "keep_status": [false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.6, 0.0, 73.06, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 46.53], ["animal", 10.62], ["domestic animals, pets", 5.5]], null, null, null], "duration": [0.73, 0.44, 1.06, 0.67, 0.41, -0.01, 3.24, -0.04, 2.17, 0.59]} \ No newline at end of file diff --git a/annotations_1/sISJ7r3kERg_filtered.json b/annotations_1/sISJ7r3kERg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9150d2c356b09690712d06b7446cbdaa92e4d8bf --- /dev/null +++ b/annotations_1/sISJ7r3kERg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.13], [8.0, 8.67], [10.0, 20.8], [21.0, 23.8], [25.0, 26.11], [28.0, 28.27], [28.0, 29.76], [30.0, 30.55], [32.0, 32.26], [33.0, 33.12], [33.0, 34.97], [36.0, 36.91], [38.0, 38.53], [42.0, 43.26], [44.0, 45.79], [47.0, 47.8], [48.0, 48.95], [50.0, 49.92], [51.0, 51.58], [54.0, 57.37], [58.0, 58.82], [59.0, 59.58], [60.0, 61.37], [62.0, 63.98], [65.0, 68.67], [70.0, 69.79], [71.0, 71.95], [73.0, 74.6], [75.0, 75.78], [76.0, 76.96], [78.0, 78.56], [79.0, 79.89], [81.0, 82.21], [82.0, 90.98], [96.0, 96.35], [99.0, 99.25], [101.0, 101.46], [102.0, 107.43], [108.0, 108.01], [108.0, 108.46], [109.0, 114.45], [117.0, 117.27], [118.0, 118.44], [121.0, 127.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [92.8, 0.0, 50.31, 98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.44, 0.0, 0.0, 0.0, 0.0, 51.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.78, 0.0, 0.0, 0.0, 57.56, 0.0, 0.0, 29.87, 0.0, 0.0, 46.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.18], ["wild animals", 15.1], ["animal", 11.72]], null, null, null, null, null, null, [["livestock, farm animals, working animals", 23.86], ["cattle, bovinae", 20.49], ["moo", 18.08]], null, null, [["theremin", 46.15], ["speech", 20.17], ["music", 4.15]]], "duration": [6.13, 0.67, 10.8, 2.8, 1.11, 0.27, 1.76, 0.55, 0.26, 0.12, 1.97, 0.91, 0.53, 1.26, 1.79, 0.8, 0.95, -0.08, 0.58, 3.37, 0.82, 0.58, 1.37, 1.98, 3.67, -0.21, 0.95, 1.6, 0.78, 0.96, 0.56, 0.89, 1.21, 8.98, 0.35, 0.25, 0.46, 5.43, 0.01, 0.46, 5.45, 0.27, 0.44, 6.23]} \ No newline at end of file diff --git a/annotations_1/sIY7BQkbIT8_filtered.json b/annotations_1/sIY7BQkbIT8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a784adb5a939532e36570a0ebbb87612e73e93e --- /dev/null +++ b/annotations_1/sIY7BQkbIT8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[170.0, 170.87], [171.0, 217.11]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.87, 46.11]} \ No newline at end of file diff --git a/annotations_1/sIwsArbH5ck_filtered.json b/annotations_1/sIwsArbH5ck_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..98f43d29d5ee264972bdba2845891f98a9deeab1 --- /dev/null +++ b/annotations_1/sIwsArbH5ck_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.08], [16.0, 15.99], [29.0, 29.83], [30.0, 30.67], [39.0, 42.89], [56.0, 56.13], [57.0, 57.06], [58.0, 58.13], [66.0, 68.76], [69.0, 70.06], [76.0, 77.23], [79.0, 78.98], [81.0, 82.65], [94.0, 95.23], [104.0, 105.11], [106.0, 108.53], [112.0, 114.05], [117.0, 131.19], [134.0, 138.5], [144.0, 144.0], [144.0, 144.48], [154.0, 155.41], [161.0, 168.32]], "keep_status": [false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 36.37, 0.0, 0.0, 0.0, 39.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.49, 36.42, 50.71, 51.77, 0.0, 0.0, 0.0, 53.16], "audiomae_on_audioset": [null, null, null, null, [["hum", 14.7], ["mains hum", 9.27], ["music", 8.79]], null, null, null, [["hum", 13.78], ["throbbing", 10.17], ["music", 9.21]], null, null, null, null, null, null, [["music", 35.43], ["speech", 19.17], ["mains hum", 8.46]], [["speech", 39.01], ["music", 4.02], ["hum", 3.57]], null, null, null, null, null, null], "duration": [1.08, -0.01, 0.83, 0.67, 3.89, 0.13, 0.06, 0.13, 2.76, 1.06, 1.23, -0.02, 1.65, 1.23, 1.11, 2.53, 2.05, 14.19, 4.5, 0.0, 0.48, 1.41, 7.32]} \ No newline at end of file diff --git a/annotations_1/sJsCKwZLztk_filtered.json b/annotations_1/sJsCKwZLztk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6273f2e332cff5626340acbc65b67dc45429f85c --- /dev/null +++ b/annotations_1/sJsCKwZLztk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.67], [3.0, 3.77], [5.0, 5.78], [9.0, 10.34], [15.0, 14.98], [18.0, 17.74], [18.0, 18.33], [20.0, 21.37], [25.0, 38.67], [42.0, 42.99], [46.0, 47.76], [49.0, 61.62], [63.0, 64.05], [66.0, 68.3], [69.0, 69.63], [73.0, 81.19], [84.0, 84.3], [85.0, 85.7], [103.0, 103.3], [105.0, 106.02], [116.0, 117.39], [122.0, 125.19], [128.0, 129.56], [131.0, 130.77], [131.0, 131.23], [133.0, 134.54], [136.0, 136.93], [140.0, 140.36], [147.0, 147.24], [150.0, 157.99], [158.0, 158.31], [160.0, 161.1], [162.0, 162.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.35, 0.0, 0.0, 78.21, 0.0, 41.48, 0.0, 33.12, 0.0, 0.0, 0.0, 0.0, 0.0, 61.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.52, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.17], ["speech", 29.08], ["theremin", 7.56]], null, [["music", 41.97], ["speech", 17.37], ["carnatic music", 12.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.33, 0.77, 0.78, 1.34, -0.02, -0.26, 0.33, 1.37, 13.67, 0.99, 1.76, 12.62, 1.05, 2.3, 0.63, 8.19, 0.3, 0.7, 0.3, 1.02, 1.39, 3.19, 1.56, -0.23, 0.23, 1.54, 0.93, 0.36, 0.24, 7.99, 0.31, 1.1, 0.35]} \ No newline at end of file diff --git a/annotations_1/sJsHcwZsNnI_filtered.json b/annotations_1/sJsHcwZsNnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f32a7fcd1cfa342a688ff5b2f306b1ebee21869 --- /dev/null +++ b/annotations_1/sJsHcwZsNnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 48.17], [54.0, 56.12], [57.0, 61.28], [67.0, 73.55], [74.0, 74.33], [85.0, 85.51], [87.0, 87.91], [90.0, 90.46], [92.0, 96.96], [98.0, 99.08], [107.0, 107.45], [110.0, 134.4], [136.0, 136.14], [137.0, 139.95], [142.0, 151.68]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [32.39, 34.01, 32.56, 30.12, 0.0, 0.0, 0.0, 0.0, 32.25, 0.0, 0.0, 29.92, 0.0, 34.26, 28.82], "audiomae_on_audioset": [[["music", 41.46], ["telephone bell ringing", 23.05], ["telephone", 11.52]], [["music", 68.83], ["throbbing", 7.12], ["hum", 4.33]], [["music", 62.03], ["livestock, farm animals, working animals", 3.53], ["reggae", 3.16]], [["music", 52.1], ["speech", 5.2], ["musical instrument", 4.98]], null, null, null, null, [["music", 70.14], ["theremin", 4.43], ["throbbing", 3.69]], null, null, [["music", 40.71], ["speech", 29.93], ["throbbing", 6.15]], null, [["fly, housefly", 54.67], ["mosquito", 26.49], ["insect", 17.41]], [["music", 46.24], ["speech", 25.16], ["throbbing", 11.91]]], "duration": [5.17, 2.12, 4.28, 6.55, 0.33, 0.51, 0.91, 0.46, 4.96, 1.08, 0.45, 24.4, 0.14, 2.95, 9.68]} \ No newline at end of file diff --git a/annotations_1/sL6gDhH7FpE_filtered.json b/annotations_1/sL6gDhH7FpE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4dcb7954492e5e3c5065d3ce299c8310a02df9b0 --- /dev/null +++ b/annotations_1/sL6gDhH7FpE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.49], [12.0, 15.15], [18.0, 19.94], [28.0, 28.75], [30.0, 30.57], [34.0, 34.28], [36.0, 36.46], [37.0, 37.27], [40.0, 41.64], [43.0, 43.71], [46.0, 47.09], [51.0, 51.26], [54.0, 54.46], [55.0, 55.59], [57.0, 58.6], [87.0, 88.43], [89.0, 90.56], [92.0, 91.79], [94.0, 96.43], [105.0, 105.22], [109.0, 110.42], [113.0, 113.22], [117.0, 117.12], [122.0, 123.65], [134.0, 133.89], [135.0, 135.53], [138.0, 138.75], [139.0, 141.42], [143.0, 146.42], [149.0, 149.82], [151.0, 151.56], [153.0, 154.62], [156.0, 156.91], [159.0, 159.63], [161.0, 161.91], [172.0, 172.23], [174.0, 174.87], [177.0, 177.96], [180.0, 180.89], [190.0, 190.73], [193.0, 193.35], [193.0, 193.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.39, 47.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 15.62], ["hum", 3.95], ["musical instrument", 3.9]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.49, 3.15, 1.94, 0.75, 0.57, 0.28, 0.46, 0.27, 1.64, 0.71, 1.09, 0.26, 0.46, 0.59, 1.6, 1.43, 1.56, -0.21, 2.43, 0.22, 1.42, 0.22, 0.12, 1.65, -0.11, 0.53, 0.75, 2.42, 3.42, 0.82, 0.56, 1.62, 0.91, 0.63, 0.91, 0.23, 0.87, 0.96, 0.89, 0.73, 0.35, 0.48]} \ No newline at end of file diff --git a/annotations_1/sLKnt2jBax4_filtered.json b/annotations_1/sLKnt2jBax4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aba0825d1a0e8ee11d8a1915ad861715682b20c3 --- /dev/null +++ b/annotations_1/sLKnt2jBax4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.18], [14.0, 14.27], [15.0, 15.15], [18.0, 20.51], [24.0, 43.9], [51.0, 51.48], [59.0, 81.18], [82.0, 82.63]], "keep_status": [false, false, false, true, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 33.6, 30.53, 0.0, 32.34, 0.0], "audiomae_on_audioset": [null, null, null, [["cattle, bovinae", 34.2], ["moo", 19.86], ["livestock, farm animals, working animals", 14.82]], [["music", 43.27], ["livestock, farm animals, working animals", 7.78], ["groan", 6.69]], null, [["music", 47.01], ["speech", 7.42], ["livestock, farm animals, working animals", 5.96]], null], "duration": [0.18, 0.27, 0.15, 2.51, 19.9, 0.48, 22.18, 0.63]} \ No newline at end of file diff --git a/annotations_1/sLLp4bO6dDI_filtered.json b/annotations_1/sLLp4bO6dDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b27fc2943ac84c7fafba4eaeab1fec903a4f354 --- /dev/null +++ b/annotations_1/sLLp4bO6dDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.62], [25.0, 30.91], [31.0, 33.91], [35.0, 44.27], [46.0, 84.05], [84.0, 85.5], [86.0, 87.52], [90.0, 102.88], [103.0, 140.58], [142.0, 155.34], [156.0, 162.63], [166.0, 167.0], [168.0, 169.2], [170.0, 173.38], [175.0, 175.51]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 44.52, 40.71, 42.0, 0.0, 0.0, 0.0, 36.11, 0.0, 46.43, 47.86, 0.0, 0.0, 47.12, 0.0], "audiomae_on_audioset": [null, [["music", 25.09], ["speech", 17.46], ["hum", 8.88]], [["speech", 23.16], ["hum", 21.89], ["mains hum", 15.98]], [["hum", 46.3], ["mains hum", 32.32], ["throbbing", 6.88]], null, null, null, [["frog", 78.91], ["owl", 6.66], ["hum", 1.91]], null, [["hum", 61.81], ["mains hum", 16.37], ["throbbing", 11.67]], [["rumble", 32.55], ["hum", 27.28], ["mains hum", 12.8]], null, null, [["hum", 32.45], ["music", 9.28], ["throbbing", 8.92]], null], "duration": [1.62, 5.91, 2.91, 9.27, 38.05, 1.5, 1.52, 12.88, 37.58, 13.34, 6.63, 1.0, 1.2, 3.38, 0.51]} \ No newline at end of file diff --git a/annotations_1/sM1I11qUM44_filtered.json b/annotations_1/sM1I11qUM44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..448c222fb02bf62f335d87484dd4203c5e290b23 --- /dev/null +++ b/annotations_1/sM1I11qUM44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.89], [24.0, 28.51], [34.0, 37.08], [42.0, 43.07], [44.0, 69.06], [73.0, 98.91], [103.0, 106.1], [110.0, 133.19], [134.0, 134.47], [138.0, 140.19], [143.0, 143.18], [144.0, 164.39], [170.0, 188.32], [197.0, 199.0]], "keep_status": [false, true, true, false, true, true, true, true, false, true, false, true, true, false], "silence_prob": [0.0, 33.01, 32.39, 0.0, 32.33, 32.39, 37.84, 32.37, 0.0, 45.27, 0.0, 31.41, 30.34, 33.13], "audiomae_on_audioset": [null, [["speech", 30.62], ["explosion", 17.45], ["burst, pop", 12.96]], [["music", 23.21], ["throbbing", 9.3], ["didgeridoo", 7.95]], null, [["music", 32.27], ["speech", 27.89], ["whack, thwack", 3.38]], [["music", 20.83], ["buzz", 16.84], ["fly, housefly", 10.99]], [["thunk", 44.28], ["music", 13.57], ["creak", 10.15]], [["speech", 35.9], ["whack, thwack", 19.88], ["music", 13.22]], null, [["sine wave", 37.96], ["speech", 14.84], ["music", 9.94]], null, [["music", 57.44], ["speech", 6.72], ["whack, thwack", 4.43]], [["music", 18.88], ["throbbing", 11.2], ["whack, thwack", 7.88]], [["fly, housefly", 46.17], ["insect", 30.73], ["mosquito", 12.25]]], "duration": [0.89, 4.51, 3.08, 1.07, 25.06, 25.91, 3.1, 23.19, 0.47, 2.19, 0.18, 20.39, 18.32, 2.0]} \ No newline at end of file diff --git a/annotations_1/sMLop6XZBEw_filtered.json b/annotations_1/sMLop6XZBEw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5696b287d203fa24ed639bcdede2eab33827b1a7 --- /dev/null +++ b/annotations_1/sMLop6XZBEw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.95], [15.0, 25.05], [30.0, 34.86], [38.0, 38.62], [47.0, 47.21], [49.0, 51.63], [55.0, 54.94], [56.0, 56.73], [58.0, 58.38], [59.0, 60.05], [61.0, 61.55], [63.0, 63.44], [65.0, 72.28], [74.0, 77.3], [83.0, 85.02], [87.0, 87.44], [87.0, 88.82], [97.0, 98.37], [101.0, 105.02], [107.0, 107.42], [111.0, 111.08], [113.0, 113.97], [115.0, 115.89], [116.0, 158.25]], "keep_status": [false, true, true, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 28.76, 28.88, 0.0, 0.0, 35.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.42, 38.2, 34.39, 0.0, 0.0, 0.0, 34.57, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 54.52], ["vehicle", 4.41], ["speech", 4.33]], [["music", 34.24], ["speech", 19.15], ["moo", 13.86]], null, null, [["music", 47.88], ["electronic music", 6.42], ["synthesizer", 4.2]], null, null, null, null, null, null, [["music", 65.1], ["speech", 11.73], ["throbbing", 4.79]], [["music", 49.03], ["synthesizer", 11.17], ["musical instrument", 4.33]], [["music", 28.36], ["theremin", 20.39], ["foghorn", 15.74]], null, null, null, [["didgeridoo", 36.5], ["music", 34.42], ["throbbing", 4.26]], null, null, null, null, null], "duration": [1.95, 10.05, 4.86, 0.62, 0.21, 2.63, -0.06, 0.73, 0.38, 1.05, 0.55, 0.44, 7.28, 3.3, 2.02, 0.44, 1.82, 1.37, 4.02, 0.42, 0.08, 0.97, 0.89, 42.25]} \ No newline at end of file diff --git a/annotations_1/sMjmQzP9D6o_filtered.json b/annotations_1/sMjmQzP9D6o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ee360f5bdd10eb8bd8a132a5d32562ce3d0def7 --- /dev/null +++ b/annotations_1/sMjmQzP9D6o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.51], [10.0, 14.45], [16.0, 17.91], [19.0, 31.68], [32.0, 34.87], [36.0, 45.03], [45.0, 59.05], [62.0, 66.36], [68.0, 73.57], [74.0, 74.61], [75.0, 81.75], [83.0, 85.13], [89.0, 97.07], [103.0, 116.78], [118.0, 131.82], [135.0, 134.94], [137.0, 148.76], [149.0, 149.44], [153.0, 160.27], [161.0, 177.47]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 66.03, 0.0, 59.86, 41.24, 55.6, 47.43, 46.83, 53.04, 0.0, 52.92, 53.04, 36.78, 55.67, 41.89, 0.0, 43.03, 0.0, 37.98, 55.81], "audiomae_on_audioset": [null, null, null, null, [["music", 34.76], ["whale vocalization", 18.04], ["electronic music", 7.47]], null, [["music", 56.6], ["speech", 17.08], ["electronic music", 5.87]], [["music", 50.44], ["didgeridoo", 15.91], ["theremin", 8.77]], null, null, null, null, [["music", 29.04], ["speech", 15.95], ["foghorn", 4.86]], null, [["theremin", 46.08], ["music", 42.29], ["ambient music", 1.56]], null, [["music", 66.95], ["theremin", 10.43], ["ambient music", 2.05]], null, [["music", 56.6], ["carnatic music", 14.43], ["theremin", 9.19]], null], "duration": [0.51, 4.45, 1.91, 12.68, 2.87, 9.03, 14.05, 4.36, 5.57, 0.61, 6.75, 2.13, 8.07, 13.78, 13.82, -0.06, 11.76, 0.44, 7.27, 16.47]} \ No newline at end of file diff --git a/annotations_1/sMrjeejmCpI_filtered.json b/annotations_1/sMrjeejmCpI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6bd7f14d07abaa4f323bd7e48a43073221c4aeb --- /dev/null +++ b/annotations_1/sMrjeejmCpI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.75], [10.0, 14.12], [26.0, 30.05], [32.0, 33.15], [37.0, 41.49], [51.0, 53.11], [67.0, 68.62], [70.0, 70.51], [75.0, 75.57], [87.0, 91.15], [96.0, 96.74], [100.0, 100.23], [102.0, 102.44], [104.0, 104.11], [124.0, 125.44], [154.0, 155.73], [169.0, 170.73], [173.0, 172.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.94, 32.31, 0.0, 32.06, 31.91, 0.0, 0.0, 0.0, 30.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 76.26], ["musical instrument", 3.96], ["synthesizer", 2.9]], [["music", 76.01], ["musical instrument", 2.97], ["funny music", 2.52]], null, [["music", 44.44], ["speech", 18.31], ["sidetone", 7.62]], [["music", 38.14], ["boing", 21.02], ["didgeridoo", 13.02]], null, null, null, [["music", 74.91], ["musical instrument", 7.39], ["didgeridoo", 3.54]], null, null, null, null, null, null, null, null], "duration": [0.75, 4.12, 4.05, 1.15, 4.49, 2.11, 1.62, 0.51, 0.57, 4.15, 0.74, 0.23, 0.44, 0.11, 1.44, 1.73, 1.73, -0.02]} \ No newline at end of file diff --git a/annotations_1/sOBIrjgDZr4_filtered.json b/annotations_1/sOBIrjgDZr4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51772936c4059c14d23e20bebb516ec9576ee67c --- /dev/null +++ b/annotations_1/sOBIrjgDZr4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.89], [5.0, 6.35], [8.0, 10.25], [11.0, 13.58], [17.0, 17.14], [20.0, 19.74], [33.0, 35.28], [37.0, 37.71], [41.0, 42.18], [43.0, 45.12], [50.0, 52.37], [56.0, 56.22], [57.0, 61.3], [65.0, 66.02], [67.0, 67.34], [69.0, 70.01], [72.0, 71.93], [72.0, 72.96], [74.0, 75.69], [77.0, 78.43], [79.0, 80.76], [81.0, 81.77], [82.0, 91.54], [96.0, 101.11], [103.0, 106.37], [110.0, 109.92], [112.0, 162.16], [163.0, 163.58], [166.0, 170.56], [173.0, 173.16], [174.0, 174.33]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.3, 0.0, 76.04, 97.54, 0.0, 0.0, 93.13, 0.0, 0.0, 96.54, 98.44, 0.0, 58.38, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.36, 98.86, 94.37, 0.0, 0.0, 0.0, 79.59, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.89, 1.35, 2.25, 2.58, 0.14, -0.26, 2.28, 0.71, 1.18, 2.12, 2.37, 0.22, 4.3, 1.02, 0.34, 1.01, -0.07, 0.96, 1.69, 1.43, 1.76, 0.77, 9.54, 5.11, 3.37, -0.08, 50.16, 0.58, 4.56, 0.16, 0.33]} \ No newline at end of file diff --git a/annotations_1/sOHoeZYeAeM_filtered.json b/annotations_1/sOHoeZYeAeM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ebd23c130d77e7d7c19b2b6db934c8a027600bd --- /dev/null +++ b/annotations_1/sOHoeZYeAeM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.28], [5.0, 5.75], [7.0, 9.59], [10.0, 15.75], [19.0, 29.12], [30.0, 34.43], [36.0, 61.97], [63.0, 78.0], [79.0, 80.82], [82.0, 84.13], [89.0, 89.16], [91.0, 93.43], [94.0, 97.77], [99.0, 99.33], [102.0, 102.88], [106.0, 107.11], [110.0, 112.26], [115.0, 120.21], [122.0, 123.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.62, 88.83, 99.31, 99.21, 73.97, 30.84, 0.0, 83.16, 0.0, 39.46, 51.88, 0.0, 0.0, 0.0, 66.63, 74.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 31.84], ["electric shaver, electric razor", 27.69], ["thunk", 19.01]], null, null, null, [["speech", 16.38], ["fly, housefly", 13.7], ["bee, wasp, etc.", 5.74]], null, null, null, null, null, null, null], "duration": [1.28, 0.75, 2.59, 5.75, 10.12, 4.43, 25.97, 15.0, 1.82, 2.13, 0.16, 2.43, 3.77, 0.33, 0.88, 1.11, 2.26, 5.21, 1.35]} \ No newline at end of file diff --git a/annotations_1/sPHeq8OM-dU_filtered.json b/annotations_1/sPHeq8OM-dU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..101cfc8c09432274a86510eb40be3a6a03d15ad4 --- /dev/null +++ b/annotations_1/sPHeq8OM-dU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.51], [5.0, 6.35], [7.0, 8.01], [9.0, 13.69], [14.0, 14.88], [15.0, 16.02], [17.0, 16.98], [18.0, 18.42], [19.0, 19.72], [20.0, 20.95], [23.0, 23.26], [24.0, 24.7], [25.0, 25.96], [30.0, 33.44], [34.0, 36.59], [37.0, 37.44], [40.0, 42.45], [47.0, 49.01], [53.0, 58.87], [61.0, 63.12], [65.0, 65.06], [79.0, 79.07], [80.0, 80.64], [92.0, 91.89], [99.0, 100.45], [105.0, 105.12], [107.0, 108.19], [118.0, 118.84], [119.0, 119.62], [123.0, 127.13], [136.0, 136.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 58.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.26, 73.36, 0.0, 47.5, 38.21, 32.08, 72.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.25, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 46.61], ["didgeridoo", 7.34], ["music", 6.81]], null, null, [["music", 86.06], ["carnatic music", 4.41], ["theremin", 1.43]], [["music", 81.46], ["carnatic music", 6.34], ["singing", 3.23]], [["music", 70.37], ["whimper", 4.01], ["speech", 3.41]], null, null, null, null, null, null, null, null, null, null, [["speech", 37.64], ["music", 17.77], ["vehicle", 6.75]], null], "duration": [1.51, 1.35, 1.01, 4.69, 0.88, 1.02, -0.02, 0.42, 0.72, 0.95, 0.26, 0.7, 0.96, 3.44, 2.59, 0.44, 2.45, 2.01, 5.87, 2.12, 0.06, 0.07, 0.64, -0.11, 1.45, 0.12, 1.19, 0.84, 0.62, 4.13, 0.63]} \ No newline at end of file diff --git a/annotations_1/sPlsA3_6hB8_filtered.json b/annotations_1/sPlsA3_6hB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebcc161bc050b93318cd7b5d0166cb648d5086f9 --- /dev/null +++ b/annotations_1/sPlsA3_6hB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 137.0], [138.0, 140.04]], "keep_status": [false, false], "silence_prob": [0.0, 51.71], "audiomae_on_audioset": [null, null], "duration": [129.0, 2.04]} \ No newline at end of file diff --git a/annotations_1/sQA199D8U2g_filtered.json b/annotations_1/sQA199D8U2g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18bf8234039bc859137890d9795a4778f046eca3 --- /dev/null +++ b/annotations_1/sQA199D8U2g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.33], [6.0, 7.64], [14.0, 14.67], [19.0, 20.06], [22.0, 23.58], [25.0, 25.93], [28.0, 33.22], [37.0, 81.41], [85.0, 87.05], [92.0, 91.98], [92.0, 95.34], [97.0, 117.95]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [33.84, 0.0, 0.0, 0.0, 0.0, 0.0, 31.83, 0.0, 71.72, 0.0, 39.93, 29.31], "audiomae_on_audioset": [[["music", 36.66], ["mains hum", 15.14], ["didgeridoo", 13.7]], null, null, null, null, null, [["music", 60.7], ["electronic music", 5.62], ["didgeridoo", 5.58]], null, null, null, [["speech", 46.79], ["music", 11.91], ["hum", 9.86]], [["speech", 51.4], ["music", 18.44], ["sonar", 7.38]]], "duration": [2.33, 1.64, 0.67, 1.06, 1.58, 0.93, 5.22, 44.41, 2.05, -0.02, 3.34, 20.95]} \ No newline at end of file diff --git a/annotations_1/sR0wCC271s4_filtered.json b/annotations_1/sR0wCC271s4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e9965205060d55a79c0093c48e0b74d5b907048 --- /dev/null +++ b/annotations_1/sR0wCC271s4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.87], [16.0, 16.61], [26.0, 27.04], [52.0, 54.03], [70.0, 71.85], [73.0, 78.95], [80.0, 89.01], [94.0, 95.88], [96.0, 97.95], [99.0, 105.68]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 63.21, 0.0, 86.64, 51.66, 0.0, 0.0, 98.8], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [0.87, 0.61, 1.04, 2.03, 1.85, 5.95, 9.01, 1.88, 1.95, 6.68]} \ No newline at end of file diff --git a/annotations_1/sRR3ukzqiGs_filtered.json b/annotations_1/sRR3ukzqiGs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e93b4dd3bd47661dbf66ba40bd43fa5a3a7bed04 --- /dev/null +++ b/annotations_1/sRR3ukzqiGs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.55], [14.0, 17.69], [23.0, 22.86], [27.0, 28.11], [30.0, 31.95], [35.0, 35.9], [38.0, 40.27], [41.0, 40.68], [42.0, 46.45], [61.0, 61.25], [62.0, 62.68], [69.0, 69.25], [73.0, 82.36], [83.0, 83.73], [90.0, 90.58], [94.0, 96.03], [116.0, 119.4], [121.0, 124.68], [128.0, 130.5], [139.0, 139.23]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.06, 0.0, 0.0, 0.0, 0.0, 84.62, 0.0, 45.78, 0.0, 0.0, 0.0, 39.31, 0.0, 0.0, 38.49, 64.29, 66.39, 63.74, 0.0], "audiomae_on_audioset": [null, [["music", 41.93], ["didgeridoo", 5.08], ["fly, housefly", 4.47]], null, null, null, null, null, null, [["music", 69.95], ["musical instrument", 2.66], ["electronic music", 2.34]], null, null, null, [["speech", 38.47], ["music", 27.29], ["fart", 3.74]], null, null, [["music", 75.83], ["musical instrument", 2.93], ["laughter", 2.86]], null, null, null, null], "duration": [0.55, 3.69, -0.14, 1.11, 1.95, 0.9, 2.27, -0.32, 4.45, 0.25, 0.68, 0.25, 9.36, 0.73, 0.58, 2.03, 3.4, 3.68, 2.5, 0.23]} \ No newline at end of file diff --git a/annotations_1/sRUb0GR0ZiE_filtered.json b/annotations_1/sRUb0GR0ZiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8a12f7e7c72a856a6f370aecf551bdce00cdd424 --- /dev/null +++ b/annotations_1/sRUb0GR0ZiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 43.38], [46.0, 47.22], [47.0, 49.54], [50.0, 101.76], [103.0, 110.84], [121.0, 122.96], [127.0, 128.38], [129.0, 131.16], [132.0, 136.17], [137.0, 139.62], [142.0, 144.36], [146.0, 148.71], [150.0, 149.93], [151.0, 153.28], [155.0, 158.06], [159.0, 160.42], [161.0, 167.36], [169.0, 170.13], [172.0, 174.68]], "keep_status": [true, false, false, false, false, false, false, false, true, true, true, false, false, true, true, false, false, false, true], "silence_prob": [34.71, 0.0, 29.71, 0.0, 32.02, 0.0, 0.0, 43.64, 49.78, 49.31, 41.93, 50.41, 0.0, 46.12, 47.58, 0.0, 43.82, 0.0, 47.62], "audiomae_on_audioset": [[["music", 30.98], ["speech", 15.78], ["throbbing", 15.16]], null, [["speech", 60.29], ["music", 12.03], ["crowd", 5.21]], null, [["music", 41.6], ["throbbing", 20.71], ["electronic music", 12.31]], null, null, [["speech", 64.43], ["rumble", 5.63], ["vehicle", 4.37]], [["rumble", 29.07], ["vehicle", 11.94], ["buzz", 8.68]], [["rumble", 18.23], ["hum", 13.6], ["buzz", 5.49]], [["speech", 10.29], ["sidetone", 10.11], ["bee, wasp, etc.", 9.36]], null, null, [["rumble", 32.36], ["vehicle", 6.93], ["car", 5.23]], [["rumble", 24.83], ["vehicle", 15.1], ["car", 6.86]], null, [["speech", 57.7], ["rumble", 20.01], ["hum", 4.54]], null, [["rumble", 20.6], ["cat", 6.93], ["vehicle", 6.24]]], "duration": [6.38, 1.22, 2.54, 51.76, 7.84, 1.96, 1.38, 2.16, 4.17, 2.62, 2.36, 2.71, -0.07, 2.28, 3.06, 1.42, 6.36, 1.13, 2.68]} \ No newline at end of file diff --git a/annotations_1/sR_tidD4M_8_filtered.json b/annotations_1/sR_tidD4M_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..adaa80e0c3fb4658fbda04d201cfc9330d0cde3e --- /dev/null +++ b/annotations_1/sR_tidD4M_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.1], [10.0, 16.56], [17.0, 20.31], [21.0, 29.1], [34.0, 39.93], [43.0, 74.06], [74.0, 104.87], [105.0, 106.41], [108.0, 116.31], [118.0, 117.88], [119.0, 132.63], [134.0, 158.6], [160.0, 177.01]], "keep_status": [false, true, true, true, true, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 41.83, 39.66, 28.69, 29.61, 0.0, 0.0, 0.0, 29.31, 0.0, 28.97, 30.94, 40.61], "audiomae_on_audioset": [null, [["sonar", 23.85], ["sine wave", 11.24], ["chirp tone", 8.52]], [["music", 36.92], ["chirp tone", 14.68], ["sine wave", 10.86]], [["sidetone", 30.28], ["speech", 15.49], ["music", 14.38]], [["speech", 27.73], ["vehicle", 8.32], ["hum", 7.79]], null, null, null, [["vehicle", 26.53], ["car", 16.34], ["motorcycle", 14.48]], null, [["speech", 32.22], ["vehicle", 28.36], ["car", 11.11]], [["music", 22.45], ["speech", 13.15], ["fly, housefly", 12.61]], [["music", 49.77], ["hum", 16.3], ["throbbing", 6.75]]], "duration": [0.1, 6.56, 3.31, 8.1, 5.93, 31.06, 30.87, 1.41, 8.31, -0.12, 13.63, 24.6, 17.01]} \ No newline at end of file diff --git a/annotations_1/sSRmhI94MUs_filtered.json b/annotations_1/sSRmhI94MUs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72f1b41a5c38b2943356d2e6ef764347e636eb32 --- /dev/null +++ b/annotations_1/sSRmhI94MUs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.3], [26.0, 27.21], [29.0, 29.52], [31.0, 31.28], [33.0, 41.23], [42.0, 42.2], [44.0, 55.0], [57.0, 57.32], [59.0, 62.5], [66.0, 66.31], [68.0, 68.99], [72.0, 108.9], [112.0, 125.47], [126.0, 128.33], [130.0, 130.87], [132.0, 132.68], [133.0, 134.72], [136.0, 136.38], [137.0, 137.83], [139.0, 142.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 96.17, 0.0, 36.28, 0.0, 0.0, 0.0, 31.1, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 32.18], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 56.39], ["radio", 34.81], ["sidetone", 2.25]], null, null, null, [["speech", 70.66], ["radio", 4.73], ["creak", 4.7]], null, null, null, null, null, null, [["hum", 23.64], ["bouncing", 8.19], ["noise", 7.73]]], "duration": [0.3, 1.21, 0.52, 0.28, 8.23, 0.2, 11.0, 0.32, 3.5, 0.31, 0.99, 36.9, 13.47, 2.33, 0.87, 0.68, 1.72, 0.38, 0.83, 3.53]} \ No newline at end of file diff --git a/annotations_1/sSc4Y4Z9lsk_filtered.json b/annotations_1/sSc4Y4Z9lsk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..27a9eb6abe4e82741e729fd18a133687f6e8ac4f --- /dev/null +++ b/annotations_1/sSc4Y4Z9lsk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.62], [8.0, 12.23], [13.0, 14.69], [16.0, 19.67], [21.0, 23.41], [24.0, 25.49], [39.0, 38.74], [45.0, 45.1], [50.0, 52.08], [54.0, 57.32], [58.0, 60.98], [62.0, 63.96], [65.0, 67.04], [68.0, 69.75], [71.0, 73.35], [79.0, 79.68], [88.0, 88.8], [96.0, 96.7], [110.0, 110.98], [111.0, 112.23], [113.0, 115.43], [116.0, 122.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.18, 52.92, 0.0, 87.37, 100.0, 0.0, 0.0, 0.0, 85.72, 94.07, 93.45, 0.0, 82.43, 0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 97.73, 82.25], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.62, 4.23, 1.69, 3.67, 2.41, 1.49, -0.26, 0.1, 2.08, 3.32, 2.98, 1.96, 2.04, 1.75, 2.35, 0.68, 0.8, 0.7, 0.98, 1.23, 2.43, 6.54]} \ No newline at end of file diff --git a/annotations_1/sT7Xef0oYLU_filtered.json b/annotations_1/sT7Xef0oYLU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..90eaa0994fe99d2047bc7c4de40aeb2ab36bb583 --- /dev/null +++ b/annotations_1/sT7Xef0oYLU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.34], [20.0, 20.19], [23.0, 24.85], [26.0, 28.16], [30.0, 31.8], [33.0, 35.09], [40.0, 40.54], [42.0, 44.17], [47.0, 48.76], [49.0, 53.97], [55.0, 54.95], [66.0, 67.56], [78.0, 79.1], [83.0, 83.13], [84.0, 90.36], [92.0, 93.75], [100.0, 100.43], [104.0, 104.82], [106.0, 107.42], [109.0, 110.34], [111.0, 122.91], [125.0, 127.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.37, 0.0, 0.0, 49.04, 0.0, 99.99, 0.0, 99.36, 0.0, 37.99, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 0.0, 0.0, 0.0, 45.56, 87.74], "audiomae_on_audioset": [null, null, null, [["speech", 64.49], ["mains hum", 5.75], ["hum", 4.89]], null, null, null, null, null, [["thunk", 51.05], ["speech", 28.98], ["creak", 3.94]], null, null, null, null, null, null, null, null, null, null, [["speech", 40.58], ["thunk", 38.19], ["music", 11.83]], null], "duration": [3.34, 0.19, 1.85, 2.16, 1.8, 2.09, 0.54, 2.17, 1.76, 4.97, -0.05, 1.56, 1.1, 0.13, 6.36, 1.75, 0.43, 0.82, 1.42, 1.34, 11.91, 2.47]} \ No newline at end of file diff --git a/annotations_1/sTbJQwezQZY_filtered.json b/annotations_1/sTbJQwezQZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1fb02449ad50f654c32b5b339081d517e9ecd36 --- /dev/null +++ b/annotations_1/sTbJQwezQZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.31], [11.0, 11.04], [13.0, 15.08], [20.0, 22.87], [31.0, 31.18], [50.0, 51.09], [56.0, 73.5], [75.0, 77.65], [81.0, 91.69], [93.0, 93.56], [95.0, 96.18], [97.0, 97.6], [100.0, 100.89], [102.0, 102.73], [104.0, 107.05], [107.0, 107.11], [108.0, 108.65]], "keep_status": [false, false, true, false, false, false, true, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 30.38, 31.48, 0.0, 0.0, 29.36, 28.11, 29.18, 0.0, 0.0, 0.0, 0.0, 0.0, 29.41, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 26.7], ["hum", 22.23], ["throbbing", 13.64]], [["music", 68.0], ["musical instrument", 8.26], ["guitar", 4.4]], null, null, [["music", 27.82], ["speech", 26.69], ["burst, pop", 7.39]], [["sound effect", 14.94], ["music", 11.71], ["whack, thwack", 5.86]], [["music", 51.4], ["throbbing", 27.12], ["hum", 7.97]], null, null, null, null, null, [["sidetone", 29.7], ["music", 26.23], ["speech", 10.65]], null, null], "duration": [1.31, 0.04, 2.08, 2.87, 0.18, 1.09, 17.5, 2.65, 10.69, 0.56, 1.18, 0.6, 0.89, 0.73, 3.05, 0.11, 0.65]} \ No newline at end of file diff --git a/annotations_1/sTcofHd5IlE_filtered.json b/annotations_1/sTcofHd5IlE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c21eea0c3b995322e8544267996135441fd9086 --- /dev/null +++ b/annotations_1/sTcofHd5IlE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.43], [28.0, 32.27], [34.0, 34.06], [34.0, 44.9], [45.0, 75.86], [76.0, 78.26], [80.0, 89.87], [90.0, 90.73], [95.0, 95.66], [96.0, 96.38], [100.0, 100.55]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 31.19, 0.0, 30.88, 0.0, 51.66, 30.45, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 26.32], ["throbbing", 16.48], ["sidetone", 13.04]], null, [["whack, thwack", 27.32], ["speech", 17.13], ["burst, pop", 16.48]], null, null, [["beatboxing", 29.52], ["whack, thwack", 22.2], ["speech", 20.4]], null, null, null, null], "duration": [0.43, 4.27, 0.06, 10.9, 30.86, 2.26, 9.87, 0.73, 0.66, 0.38, 0.55]} \ No newline at end of file diff --git a/annotations_1/sUQ9cisQpaY_filtered.json b/annotations_1/sUQ9cisQpaY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74eedd5bf324c07cb5a341c5d71d2501e646a861 --- /dev/null +++ b/annotations_1/sUQ9cisQpaY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.02], [15.0, 15.5], [24.0, 24.48], [25.0, 25.62], [26.0, 30.79], [32.0, 32.9], [39.0, 40.76], [44.0, 47.41], [62.0, 62.28], [65.0, 65.18], [106.0, 105.7], [116.0, 122.44], [136.0, 136.39], [140.0, 140.02], [141.0, 141.44], [144.0, 144.34], [146.0, 146.18], [148.0, 149.1], [150.0, 150.9], [158.0, 160.62], [162.0, 163.36], [164.0, 164.34]], "keep_status": [true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [43.3, 0.0, 0.0, 0.0, 45.49, 0.0, 0.0, 38.17, 0.0, 0.0, 0.0, 33.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.43, 0.0, 0.0], "audiomae_on_audioset": [[["music", 59.14], ["mosquito", 3.78], ["fly, housefly", 3.31]], null, null, null, [["music", 48.53], ["theremin", 10.46], ["musical instrument", 3.13]], null, null, [["music", 23.58], ["mains hum", 16.54], ["hum", 14.8]], null, null, null, [["music", 51.15], ["theremin", 19.63], ["musical instrument", 4.47]], null, null, null, null, null, null, null, [["music", 62.83], ["musical instrument", 8.37], ["piano", 5.98]], null, null], "duration": [2.02, 0.5, 0.48, 0.62, 4.79, 0.9, 1.76, 3.41, 0.28, 0.18, -0.3, 6.44, 0.39, 0.02, 0.44, 0.34, 0.18, 1.1, 0.9, 2.62, 1.36, 0.34]} \ No newline at end of file diff --git a/annotations_1/sVZLKLWFDYs_filtered.json b/annotations_1/sVZLKLWFDYs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df544a725027448fa86fee25070937a45b0d894c --- /dev/null +++ b/annotations_1/sVZLKLWFDYs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.21], [10.0, 10.94], [12.0, 16.41], [19.0, 19.3], [22.0, 31.01], [33.0, 35.18], [38.0, 40.69], [42.0, 47.61], [49.0, 50.68], [52.0, 55.54], [60.0, 63.59], [65.0, 65.5], [66.0, 71.25], [76.0, 79.22], [80.0, 82.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.75, 0.0, 85.17, 0.0, 87.74, 86.45, 95.23, 95.09, 0.0, 96.77, 89.19, 0.0, 70.02, 80.64, 70.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.21, 0.94, 4.41, 0.3, 9.01, 2.18, 2.69, 5.61, 1.68, 3.54, 3.59, 0.5, 5.25, 3.22, 2.27]} \ No newline at end of file diff --git a/annotations_1/sVfmACBWnIY_filtered.json b/annotations_1/sVfmACBWnIY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7309a5f708a95f653d2c1521eeaef0e8f1c05379 --- /dev/null +++ b/annotations_1/sVfmACBWnIY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.83], [11.0, 11.65], [14.0, 14.96], [19.0, 19.72], [22.0, 24.02], [26.0, 26.72], [27.0, 35.51], [40.0, 40.74], [44.0, 47.17], [53.0, 54.06], [55.0, 56.94], [58.0, 60.05], [63.0, 63.96], [68.0, 68.34], [70.0, 71.64], [73.0, 74.61], [76.0, 77.48], [79.0, 80.57], [86.0, 90.49], [91.0, 91.91], [98.0, 129.79], [137.0, 141.47], [142.0, 143.04]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 95.91, 0.0, 30.82, 0.0, 36.61, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 0.0, 31.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["explosion", 32.75], ["burst, pop", 11.54], ["speech", 4.78]], null, [["speech", 73.28], ["animal", 3.54], ["duck", 3.22]], null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 29.04], ["mains hum", 28.15], ["whale vocalization", 14.9]], null], "duration": [0.83, 0.65, 0.96, 0.72, 2.02, 0.72, 8.51, 0.74, 3.17, 1.06, 1.94, 2.05, 0.96, 0.34, 1.64, 1.61, 1.48, 1.57, 4.49, 0.91, 31.79, 4.47, 1.04]} \ No newline at end of file diff --git a/annotations_1/sVfuigRSl8g_filtered.json b/annotations_1/sVfuigRSl8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc33262e3b149ac697f5e274c576d4f0b0768080 --- /dev/null +++ b/annotations_1/sVfuigRSl8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 27.63], [31.0, 33.99], [35.0, 37.23], [38.0, 42.18], [49.0, 55.34], [66.0, 67.91], [71.0, 72.55], [74.0, 74.66], [79.0, 78.8], [83.0, 102.86], [106.0, 107.42], [116.0, 116.7], [117.0, 117.49], [118.0, 119.21], [121.0, 123.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.5, 33.5, 35.52, 35.69, 36.43, 0.0, 0.0, 0.0, 0.0, 33.95, 0.0, 0.0, 0.0, 0.0, 80.11], "audiomae_on_audioset": [[["music", 75.32], ["boing", 15.28], ["speech", 2.58]], [["speech", 48.49], ["music", 31.78], ["crack", 2.66]], [["music", 71.8], ["speech", 8.28], ["sidetone", 2.8]], [["music", 46.58], ["boing", 28.49], ["speech", 6.41]], [["music", 70.07], ["speech", 16.06], ["throbbing", 2.22]], null, null, null, null, [["music", 35.65], ["speech", 25.52], ["sidetone", 14.86]], null, null, null, null, null], "duration": [5.63, 2.99, 2.23, 4.18, 6.34, 1.91, 1.55, 0.66, -0.2, 19.86, 1.42, 0.7, 0.49, 1.21, 2.25]} \ No newline at end of file diff --git a/annotations_1/sWCQm58jJsk_filtered.json b/annotations_1/sWCQm58jJsk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac7c0facc7e7bb45ff692e3eec51900ee5670e75 --- /dev/null +++ b/annotations_1/sWCQm58jJsk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.77], [9.0, 9.44], [10.0, 11.53], [12.0, 14.34], [15.0, 17.04], [19.0, 22.64], [25.0, 26.01], [27.0, 27.99], [29.0, 30.4], [31.0, 33.96], [35.0, 38.35], [40.0, 41.57], [43.0, 45.22], [47.0, 48.84], [50.0, 50.7], [52.0, 52.59], [53.0, 55.81], [59.0, 59.71], [62.0, 63.54], [68.0, 69.36], [71.0, 71.37], [72.0, 73.16], [74.0, 75.25], [78.0, 78.46], [79.0, 80.6], [82.0, 82.46], [83.0, 88.37], [97.0, 97.71], [101.0, 102.47], [104.0, 105.51], [108.0, 114.18], [116.0, 116.24], [118.0, 118.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.8, 98.99, 99.99, 0.0, 0.0, 0.0, 87.55, 96.17, 0.0, 99.16, 0.0, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.77, 0.44, 1.53, 2.34, 2.04, 3.64, 1.01, 0.99, 1.4, 2.96, 3.35, 1.57, 2.22, 1.84, 0.7, 0.59, 2.81, 0.71, 1.54, 1.36, 0.37, 1.16, 1.25, 0.46, 1.6, 0.46, 5.37, 0.71, 1.47, 1.51, 6.18, 0.24, 0.59]} \ No newline at end of file diff --git a/annotations_1/sWjVe9dMRHU_filtered.json b/annotations_1/sWjVe9dMRHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ef1c5d8afc46c9c1e79de3ebdcf173877e6d9a2 --- /dev/null +++ b/annotations_1/sWjVe9dMRHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.43], [12.0, 12.68], [14.0, 15.36], [16.0, 38.74], [44.0, 47.21], [48.0, 68.79], [70.0, 69.92], [70.0, 71.81], [72.0, 72.82], [86.0, 86.44], [94.0, 94.83], [95.0, 97.01], [98.0, 97.97], [99.0, 99.71], [101.0, 109.12], [109.0, 116.72], [122.0, 122.44], [131.0, 131.72], [134.0, 134.84], [151.0, 151.24], [155.0, 155.7], [156.0, 155.73], [156.0, 155.97], [156.0, 156.0], [156.0, 156.03], [156.0, 156.27], [157.0, 159.36], [163.0, 172.25], [173.0, 174.09], [175.0, 190.49], [203.0, 204.47], [205.0, 207.67], [212.0, 224.18], [225.0, 224.9]], "keep_status": [true, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [34.13, 0.0, 0.0, 30.87, 42.93, 32.63, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 0.0, 0.0, 46.19, 34.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.73, 31.46, 0.0, 30.69, 0.0, 66.88, 43.58, 0.0], "audiomae_on_audioset": [[["music", 48.13], ["sampler", 6.23], ["musical instrument", 5.11]], null, null, [["music", 60.96], ["speech", 6.85], ["hum", 5.2]], [["music", 54.92], ["speech", 9.41], ["electronic music", 8.83]], [["hum", 31.07], ["music", 19.25], ["mains hum", 14.84]], null, null, null, null, null, null, null, null, [["music", 35.23], ["speech", 26.31], ["sidetone", 4.37]], [["speech", 24.91], ["groan", 24.65], ["music", 19.18]], null, null, null, null, null, null, null, null, null, null, [["music", 29.99], ["fart", 24.96], ["speech", 5.64]], [["music", 36.78], ["speech", 20.34], ["whack, thwack", 17.86]], null, [["music", 54.71], ["speech", 16.97], ["buzz", 2.22]], null, null, [["music", 58.67], ["speech", 27.21], ["thunk", 5.78]], null], "duration": [2.43, 0.68, 1.36, 22.74, 3.21, 20.79, -0.08, 1.81, 0.82, 0.44, 0.83, 2.01, -0.03, 0.71, 8.12, 7.72, 0.44, 0.72, 0.84, 0.24, 0.7, -0.27, -0.03, 0.0, 0.03, 0.27, 2.36, 9.25, 1.09, 15.49, 1.47, 2.67, 12.18, -0.1]} \ No newline at end of file diff --git a/annotations_1/sWqTiz8caoM_filtered.json b/annotations_1/sWqTiz8caoM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6439056605033eb3c2fb9ace0f8340bf9d4ac91 --- /dev/null +++ b/annotations_1/sWqTiz8caoM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.22], [7.0, 10.03], [12.0, 12.46], [27.0, 28.22], [28.0, 28.29], [36.0, 40.56], [46.0, 47.85], [48.0, 52.22], [52.0, 52.57], [53.0, 82.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 80.11, 0.0, 0.0, 0.0, 98.93, 0.0, 75.55, 0.0, 49.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 72.02], ["hum", 3.62], ["zither", 1.93]]], "duration": [0.22, 3.03, 0.46, 1.22, 0.29, 4.56, 1.85, 4.22, 0.57, 29.19]} \ No newline at end of file diff --git a/annotations_1/sYWS5RSmJ-s_filtered.json b/annotations_1/sYWS5RSmJ-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1eb994475fe1765744d0822f33d61fe2c37e7372 --- /dev/null +++ b/annotations_1/sYWS5RSmJ-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.14], [11.0, 11.96], [14.0, 15.21], [20.0, 22.99], [24.0, 47.44], [48.0, 50.13], [52.0, 52.39], [60.0, 60.64], [63.0, 63.64], [70.0, 73.74], [74.0, 74.01], [81.0, 96.65]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 79.76, 47.66, 36.06, 0.0, 0.0, 0.0, 30.16, 0.0, 32.78], "audiomae_on_audioset": [null, null, null, null, [["thunk", 16.02], ["cat", 15.5], ["music", 14.6]], [["speech", 42.31], ["music", 8.63], ["throbbing", 6.81]], null, null, null, [["speech", 67.12], ["music", 10.95], ["whack, thwack", 5.04]], null, [["throbbing", 29.81], ["hum", 23.27], ["music", 9.42]]], "duration": [1.14, 0.96, 1.21, 2.99, 23.44, 2.13, 0.39, 0.64, 0.64, 3.74, 0.01, 15.65]} \ No newline at end of file diff --git a/annotations_1/sYdqpWTQyaI_filtered.json b/annotations_1/sYdqpWTQyaI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16f8555bfc3fbd98c7283b00c9ad8dc1a6656b24 --- /dev/null +++ b/annotations_1/sYdqpWTQyaI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 18.35], [20.0, 19.97], [28.0, 28.21], [42.0, 47.55], [48.0, 73.08], [75.0, 82.26], [83.0, 91.13], [93.0, 95.37], [99.0, 111.15], [114.0, 114.59], [115.0, 114.84], [119.0, 119.92], [120.0, 121.37], [122.0, 134.89], [136.0, 139.82], [141.0, 147.38], [148.0, 149.89], [151.0, 162.28], [163.0, 163.9], [166.0, 166.8], [167.0, 183.73], [187.0, 191.69], [196.0, 215.82], [218.0, 219.55], [221.0, 221.49], [222.0, 225.59]], "keep_status": [false, false, false, false, true, true, true, true, true, false, false, false, false, false, true, false, false, true, false, false, true, false, true, false, false, true], "silence_prob": [31.08, 0.0, 0.0, 30.64, 31.77, 29.42, 31.07, 32.14, 28.67, 0.0, 0.0, 0.0, 0.0, 29.37, 33.0, 30.05, 0.0, 31.4, 0.0, 0.0, 29.58, 31.95, 32.03, 0.0, 0.0, 48.78], "audiomae_on_audioset": [[["fly, housefly", 42.15], ["insect", 15.94], ["speech", 12.12]], null, null, [["mains hum", 35.94], ["hum", 23.4], ["music", 21.12]], [["hum", 24.33], ["music", 22.6], ["speech", 10.9]], [["speech", 40.97], ["music", 18.72], ["whack, thwack", 4.9]], [["music", 10.12], ["didgeridoo", 8.12], ["buzz", 7.36]], [["music", 16.59], ["hum", 14.56], ["speech", 11.58]], [["speech", 57.1], ["music", 3.43], ["buzz", 2.87]], null, null, null, null, [["throbbing", 37.85], ["hum", 20.77], ["music", 13.05]], [["music", 20.41], ["foghorn", 14.03], ["animal", 10.13]], [["music", 66.62], ["throbbing", 4.09], ["hum", 3.67]], null, [["music", 35.81], ["speech", 14.4], ["groan", 4.43]], null, null, [["speech", 21.01], ["music", 19.27], ["breaking", 12.21]], [["music", 58.75], ["musical instrument", 10.26], ["didgeridoo", 6.96]], [["music", 38.79], ["speech", 15.83], ["hum", 7.05]], null, null, [["music", 28.81], ["speech", 20.87], ["hum", 18.94]]], "duration": [5.35, -0.03, 0.21, 5.55, 25.08, 7.26, 8.13, 2.37, 12.15, 0.59, -0.16, 0.92, 1.37, 12.89, 3.82, 6.38, 1.89, 11.28, 0.9, 0.8, 16.73, 4.69, 19.82, 1.55, 0.49, 3.59]} \ No newline at end of file diff --git a/annotations_1/sZ6t_-wKImw_filtered.json b/annotations_1/sZ6t_-wKImw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef47b4205deb614a0e665780b17c769742eb504f --- /dev/null +++ b/annotations_1/sZ6t_-wKImw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 11.58], [12.0, 12.77], [14.0, 29.49], [31.0, 31.18], [33.0, 33.15], [35.0, 35.13], [36.0, 35.73], [37.0, 38.69], [42.0, 42.31], [44.0, 44.46], [47.0, 47.12], [49.0, 56.05], [57.0, 58.23], [61.0, 62.01], [63.0, 63.27], [64.0, 64.3], [66.0, 66.29], [67.0, 68.94], [70.0, 73.33], [75.0, 76.86], [78.0, 83.25], [85.0, 85.19]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [82.97, 0.0, 43.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 32.45, 0.0], "audiomae_on_audioset": [null, null, [["frog", 41.29], ["radio", 12.07], ["speech", 9.01]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 47.03], ["speech", 20.91], ["theremin", 7.48]], null], "duration": [10.58, 0.77, 15.49, 0.18, 0.15, 0.13, -0.27, 1.69, 0.31, 0.46, 0.12, 7.05, 1.23, 1.01, 0.27, 0.3, 0.29, 1.94, 3.33, 1.86, 5.25, 0.19]} \ No newline at end of file diff --git a/annotations_1/s_7PfocHTmc_filtered.json b/annotations_1/s_7PfocHTmc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d3ed1916298c4c54b54d2da264f5595444ca5ec --- /dev/null +++ b/annotations_1/s_7PfocHTmc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.55], [16.0, 16.46], [25.0, 29.57], [30.0, 29.61], [30.0, 34.87], [37.0, 37.12], [37.0, 38.72], [41.0, 41.99], [44.0, 46.57], [51.0, 52.03], [55.0, 59.31], [62.0, 84.18], [86.0, 94.88], [96.0, 95.93], [97.0, 122.91], [127.0, 128.04], [130.0, 157.77]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 40.88, 0.0, 39.78, 0.0, 0.0, 0.0, 48.56, 0.0, 41.66, 47.39, 37.27, 0.0, 29.76, 0.0, 30.27], "audiomae_on_audioset": [null, null, [["music", 39.74], ["theremin", 38.01], ["electronic music", 2.86]], null, [["music", 32.99], ["speech", 19.0], ["theremin", 12.89]], null, null, null, [["music", 43.63], ["theremin", 20.99], ["hum", 6.1]], null, [["music", 73.02], ["didgeridoo", 3.94], ["synthesizer", 3.61]], [["music", 33.27], ["hum", 21.05], ["throbbing", 9.1]], [["music", 65.58], ["synthesizer", 6.02], ["musical instrument", 5.88]], null, [["music", 36.94], ["speech", 23.01], ["theremin", 8.91]], null, [["music", 63.46], ["theremin", 21.23], ["shout", 1.43]]], "duration": [0.55, 0.46, 4.57, -0.39, 4.87, 0.12, 1.72, 0.99, 2.57, 1.03, 4.31, 22.18, 8.88, -0.07, 25.91, 1.04, 27.77]} \ No newline at end of file diff --git a/annotations_1/s_SM1Hly-uw_filtered.json b/annotations_1/s_SM1Hly-uw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd88242063c56af6813c66ec1701c5cb5c2c8503 --- /dev/null +++ b/annotations_1/s_SM1Hly-uw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.82], [4.0, 6.98], [9.0, 10.17], [11.0, 14.3], [16.0, 16.97], [20.0, 22.13], [23.0, 23.31], [25.0, 25.79], [29.0, 36.51], [38.0, 39.18], [47.0, 47.85], [55.0, 56.27], [60.0, 69.33], [73.0, 74.29], [75.0, 78.21], [80.0, 83.84], [85.0, 86.49], [88.0, 90.83], [93.0, 105.39], [110.0, 112.08], [114.0, 115.91], [122.0, 123.35], [124.0, 128.02], [138.0, 139.97], [146.0, 149.17], [151.0, 154.45], [159.0, 162.57], [164.0, 165.25], [167.0, 168.79], [170.0, 171.14]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 73.51, 0.0, 55.89, 0.0, 63.53, 0.0, 0.0, 36.8, 0.0, 0.0, 0.0, 40.62, 0.0, 60.98, 56.78, 0.0, 58.3, 73.21, 92.64, 0.0, 0.0, 62.58, 0.0, 87.74, 98.01, 95.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 22.58], ["speech", 16.64], ["mains hum", 8.89]], null, null, null, [["didgeridoo", 23.69], ["music", 17.39], ["hum", 10.69]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.82, 2.98, 1.17, 3.3, 0.97, 2.13, 0.31, 0.79, 7.51, 1.18, 0.85, 1.27, 9.33, 1.29, 3.21, 3.84, 1.49, 2.83, 12.39, 2.08, 1.91, 1.35, 4.02, 1.97, 3.17, 3.45, 3.57, 1.25, 1.79, 1.14]} \ No newline at end of file diff --git a/annotations_1/s_cz5JFWpzE_filtered.json b/annotations_1/s_cz5JFWpzE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f12b4d601ed70d2bfa13021182aa460ad84d6d4 --- /dev/null +++ b/annotations_1/s_cz5JFWpzE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 26.77], [28.0, 28.97], [30.0, 32.16], [34.0, 34.33], [36.0, 36.61], [37.0, 37.88], [41.0, 41.39], [43.0, 45.77], [49.0, 49.05], [50.0, 50.8], [52.0, 53.06], [60.0, 60.12], [61.0, 62.41], [64.0, 65.01], [66.0, 66.7], [69.0, 70.41], [72.0, 72.17], [76.0, 79.02], [83.0, 84.06], [86.0, 106.74], [108.0, 108.45], [110.0, 110.42], [120.0, 120.07], [123.0, 125.63], [132.0, 133.52], [136.0, 137.57], [138.0, 139.41], [140.0, 142.47], [146.0, 148.44], [149.0, 150.13]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.81, 0.0, 0.0, 0.0, 0.0, 48.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.15, 0.0, 30.76, 0.0, 0.0, 0.0, 35.74, 0.0, 0.0, 0.0, 54.83, 53.78, 0.0], "audiomae_on_audioset": [null, null, [["hum", 34.61], ["music", 27.68], ["speech", 10.32]], null, null, null, null, [["hum", 30.35], ["music", 24.98], ["ambient music", 7.2]], null, null, null, null, null, null, null, null, null, [["music", 59.52], ["electronic music", 10.06], ["ambient music", 3.92]], null, [["hum", 41.91], ["music", 20.05], ["mains hum", 17.96]], null, null, null, [["hum", 31.68], ["music", 30.45], ["throbbing", 19.36]], null, null, null, null, null, null], "duration": [0.77, 0.97, 2.16, 0.33, 0.61, 0.88, 0.39, 2.77, 0.05, 0.8, 1.06, 0.12, 1.41, 1.01, 0.7, 1.41, 0.17, 3.02, 1.06, 20.74, 0.45, 0.42, 0.07, 2.63, 1.52, 1.57, 1.41, 2.47, 2.44, 1.13]} \ No newline at end of file diff --git a/annotations_1/sa9AzlyS9h0_filtered.json b/annotations_1/sa9AzlyS9h0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..562ab1153c1104a94d5871c87fc3f165be47ecbc --- /dev/null +++ b/annotations_1/sa9AzlyS9h0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.19], [9.0, 9.26], [11.0, 12.01], [12.0, 12.9], [14.0, 16.34], [17.0, 47.7], [49.0, 49.5], [53.0, 55.31], [57.0, 57.65], [59.0, 65.92], [67.0, 67.66], [71.0, 72.3], [74.0, 76.32], [79.0, 79.73], [82.0, 86.37], [89.0, 88.74], [92.0, 102.91], [104.0, 104.65], [105.0, 109.21], [112.0, 113.61], [115.0, 116.33], [116.0, 120.63], [125.0, 125.41], [129.0, 129.2], [131.0, 132.07], [136.0, 139.63], [142.0, 142.28], [144.0, 157.44], [159.0, 161.1]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, true, false, true, false, false, false, true, false, false, true, false, false, false, false, false, true, true], "silence_prob": [29.97, 0.0, 0.0, 0.0, 29.51, 0.0, 0.0, 29.32, 0.0, 30.29, 0.0, 0.0, 37.64, 0.0, 29.14, 0.0, 30.77, 0.0, 29.09, 0.0, 0.0, 29.89, 0.0, 0.0, 0.0, 29.27, 0.0, 29.73, 43.15], "audiomae_on_audioset": [[["speech", 65.47], ["radio", 3.79], ["buzz", 3.17]], null, null, null, [["speech", 62.69], ["buzzer", 5.94], ["alarm", 3.63]], null, null, [["cacophony", 19.9], ["speech", 16.62], ["explosion", 10.9]], null, [["hum", 17.85], ["mains hum", 12.32], ["sound effect", 6.36]], null, null, [["music", 18.75], ["noise", 16.84], ["hum", 11.45]], null, [["zipper (clothing)", 17.5], ["sound effect", 11.84], ["speech", 9.27]], null, [["speech", 86.95], ["music", 2.9], ["didgeridoo", 2.3]], null, [["music", 18.86], ["speech", 12.6], ["hum", 9.21]], null, null, [["speech", 54.8], ["sound effect", 5.52], ["music", 5.34]], null, null, null, [["speech", 43.02], ["music", 26.04], ["white noise", 3.33]], null, [["hum", 14.8], ["speech", 11.11], ["mains hum", 6.34]], [["hum", 30.92], ["mains hum", 18.91], ["music", 11.85]]], "duration": [6.19, 0.26, 1.01, 0.9, 2.34, 30.7, 0.5, 2.31, 0.65, 6.92, 0.66, 1.3, 2.32, 0.73, 4.37, -0.26, 10.91, 0.65, 4.21, 1.61, 1.33, 4.63, 0.41, 0.2, 1.07, 3.63, 0.28, 13.44, 2.1]} \ No newline at end of file diff --git a/annotations_1/saTBYjmhcok_filtered.json b/annotations_1/saTBYjmhcok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c712c6fe07c25fa9e56f7bc040c47fbf6a274260 --- /dev/null +++ b/annotations_1/saTBYjmhcok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.32], [14.0, 16.04], [17.0, 17.44], [19.0, 21.42], [22.0, 22.2], [23.0, 24.07], [25.0, 26.11], [28.0, 31.73], [33.0, 33.29], [34.0, 42.11], [43.0, 46.62], [51.0, 53.54], [54.0, 56.56], [60.0, 62.75], [64.0, 65.11], [65.0, 115.33], [118.0, 119.62], [120.0, 121.44], [123.0, 131.45], [133.0, 134.76], [137.0, 137.89], [146.0, 146.79], [149.0, 154.3]], "keep_status": [false, true, false, false, false, false, false, true, false, true, true, true, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [44.09, 48.78, 0.0, 46.43, 0.0, 0.0, 0.0, 47.23, 0.0, 34.79, 44.43, 36.18, 35.52, 42.72, 0.0, 0.0, 0.0, 0.0, 32.37, 0.0, 0.0, 0.0, 47.62], "audiomae_on_audioset": [[["hum", 39.81], ["mains hum", 29.72], ["music", 5.38]], [["music", 37.83], ["speech", 19.52], ["hum", 11.97]], null, [["hum", 33.23], ["mains hum", 28.69], ["music", 9.84]], null, null, null, [["music", 60.08], ["hum", 5.31], ["musical instrument", 4.36]], null, [["music", 29.23], ["hum", 21.15], ["mains hum", 10.02]], [["music", 25.62], ["hum", 19.1], ["mains hum", 11.15]], [["whale vocalization", 16.69], ["music", 7.29], ["hum", 6.14]], [["hum", 36.58], ["music", 21.34], ["throbbing", 10.98]], [["music", 31.94], ["hum", 13.26], ["whale vocalization", 7.97]], null, null, null, null, [["music", 51.17], ["hum", 21.68], ["mains hum", 10.09]], null, null, null, [["mains hum", 47.34], ["hum", 34.8], ["music", 5.13]]], "duration": [2.32, 2.04, 0.44, 2.42, 0.2, 1.07, 1.11, 3.73, 0.29, 8.11, 3.62, 2.54, 2.56, 2.75, 1.11, 50.33, 1.62, 1.44, 8.45, 1.76, 0.89, 0.79, 5.3]} \ No newline at end of file diff --git a/annotations_1/sbIfW_Pf9vk_filtered.json b/annotations_1/sbIfW_Pf9vk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ba82f086490535c75c5b9333925424914e623c0 --- /dev/null +++ b/annotations_1/sbIfW_Pf9vk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.3], [7.0, 7.11], [17.0, 17.71], [19.0, 19.45], [20.0, 20.92], [21.0, 21.95], [23.0, 23.67], [25.0, 25.79], [29.0, 30.25], [32.0, 33.67], [38.0, 39.12], [41.0, 42.85], [49.0, 50.65], [53.0, 54.9], [57.0, 57.65], [61.0, 63.66], [67.0, 68.59], [69.0, 71.07], [80.0, 81.16], [90.0, 91.45], [99.0, 102.63], [103.0, 104.09], [111.0, 111.21], [114.0, 115.62], [116.0, 117.86], [121.0, 121.46], [124.0, 126.18], [127.0, 128.34], [129.0, 131.5], [133.0, 138.77], [145.0, 146.06], [147.0, 148.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 90.95, 0.0, 0.0, 34.36, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 90.25, 89.9, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 23.87], ["moo", 23.28], ["creak", 13.87]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 0.11, 0.71, 0.45, 0.92, 0.95, 0.67, 0.79, 1.25, 1.67, 1.12, 1.85, 1.65, 1.9, 0.65, 2.66, 1.59, 2.07, 1.16, 1.45, 3.63, 1.09, 0.21, 1.62, 1.86, 0.46, 2.18, 1.34, 2.5, 5.77, 1.06, 1.37]} \ No newline at end of file diff --git a/annotations_1/sbZB1drlKWI_filtered.json b/annotations_1/sbZB1drlKWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57368a15cdb4ae801b6c4d426846fdf73749fc6d --- /dev/null +++ b/annotations_1/sbZB1drlKWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.65], [11.0, 11.65], [12.0, 13.09], [15.0, 18.72], [20.0, 26.74], [32.0, 33.1], [36.0, 36.15], [37.0, 40.37], [42.0, 50.13], [51.0, 75.91], [76.0, 80.28], [81.0, 81.6]], "keep_status": [true, false, false, true, true, false, false, false, true, true, true, false], "silence_prob": [35.28, 0.0, 0.0, 36.93, 38.26, 0.0, 0.0, 30.48, 34.17, 31.92, 32.13, 0.0], "audiomae_on_audioset": [[["music", 33.84], ["boing", 7.07], ["didgeridoo", 5.53]], null, null, [["music", 29.53], ["speech", 15.89], ["didgeridoo", 8.57]], [["music", 30.67], ["clip-clop", 10.88], ["horse", 7.63]], null, null, [["cattle, bovinae", 45.11], ["moo", 29.96], ["livestock, farm animals, working animals", 23.44]], [["speech", 36.73], ["music", 16.69], ["horse", 13.72]], [["speech", 20.83], ["music", 14.55], ["clip-clop", 11.7]], [["noise", 31.11], ["hum", 10.77], ["sidetone", 9.16]], null], "duration": [2.65, 0.65, 1.09, 3.72, 6.74, 1.1, 0.15, 3.37, 8.13, 24.91, 4.28, 0.6]} \ No newline at end of file diff --git a/annotations_1/sd2pBde6gkw_filtered.json b/annotations_1/sd2pBde6gkw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6ae7251de4718c02ac37cca9d01a6f0b297879b3 --- /dev/null +++ b/annotations_1/sd2pBde6gkw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 18.79], [19.0, 19.77], [20.0, 24.02], [28.0, 29.02], [31.0, 31.06], [38.0, 39.31], [45.0, 45.96], [47.0, 49.11], [50.0, 51.58], [53.0, 54.43], [55.0, 55.61], [57.0, 58.62], [60.0, 61.11], [62.0, 63.12], [65.0, 67.66], [68.0, 69.2], [69.0, 72.5], [79.0, 80.6], [83.0, 83.84], [85.0, 86.36], [88.0, 88.21], [94.0, 95.15], [108.0, 109.73], [110.0, 112.33], [115.0, 114.79], [118.0, 118.35], [122.0, 122.4], [126.0, 125.98], [128.0, 129.42], [132.0, 132.51], [134.0, 134.5], [135.0, 137.64], [140.0, 142.67], [145.0, 146.33], [148.0, 148.78], [149.0, 150.55], [152.0, 152.56], [153.0, 154.03], [160.0, 160.76], [162.0, 163.38], [164.0, 165.15], [169.0, 173.82], [174.0, 179.91], [181.0, 188.37], [191.0, 191.44], [194.0, 195.13], [197.0, 197.33], [198.0, 219.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [60.79, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 99.96, 62.27, 0.0, 0.0, 0.0, 62.58], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.79, 0.77, 4.02, 1.02, 0.06, 1.31, 0.96, 2.11, 1.58, 1.43, 0.61, 1.62, 1.11, 1.12, 2.66, 1.2, 3.5, 1.6, 0.84, 1.36, 0.21, 1.15, 1.73, 2.33, -0.21, 0.35, 0.4, -0.02, 1.42, 0.51, 0.5, 2.64, 2.67, 1.33, 0.78, 1.55, 0.56, 1.03, 0.76, 1.38, 1.15, 4.82, 5.91, 7.37, 0.44, 1.13, 0.33, 21.96]} \ No newline at end of file diff --git a/annotations_1/sdkgpg4Plxo_filtered.json b/annotations_1/sdkgpg4Plxo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c33aa398b25dafa8b94a86c59ced262b2c31db6 --- /dev/null +++ b/annotations_1/sdkgpg4Plxo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 16.07], [16.0, 19.21], [20.0, 21.12], [22.0, 24.88], [26.0, 27.9], [29.0, 32.29], [33.0, 35.83], [41.0, 45.33], [47.0, 52.78], [54.0, 58.6], [62.0, 62.87], [65.0, 65.69], [67.0, 75.14], [76.0, 93.07], [96.0, 102.22], [103.0, 108.9], [110.0, 112.35]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.34, 40.33, 0.0, 98.51, 0.0, 73.36, 100.0, 87.74, 77.7, 99.87, 0.0, 0.0, 99.98, 99.82, 98.8, 99.98, 79.94], "audiomae_on_audioset": [null, [["speech", 46.56], ["sidetone", 7.06], ["animal", 4.47]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [4.07, 3.21, 1.12, 2.88, 1.9, 3.29, 2.83, 4.33, 5.78, 4.6, 0.87, 0.69, 8.14, 17.07, 6.22, 5.9, 2.35]} \ No newline at end of file diff --git a/annotations_1/sdvrA5qnZo4_filtered.json b/annotations_1/sdvrA5qnZo4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4a9f64f36def3cc73c49a0ce2c53c3c7afeb9d62 --- /dev/null +++ b/annotations_1/sdvrA5qnZo4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.02], [16.0, 16.75], [22.0, 26.91], [29.0, 29.64], [35.0, 42.79], [50.0, 64.57], [68.0, 68.93], [76.0, 76.08], [84.0, 84.25], [89.0, 89.63], [99.0, 101.9], [106.0, 107.16], [109.0, 109.39], [112.0, 112.6], [121.0, 130.92]], "keep_status": [false, false, true, false, true, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 46.05, 0.0, 31.19, 32.66, 0.0, 0.0, 0.0, 0.0, 30.43, 0.0, 0.0, 0.0, 93.45], "audiomae_on_audioset": [null, null, [["music", 34.61], ["bass guitar", 12.01], ["guitar", 11.84]], null, [["livestock, farm animals, working animals", 27.75], ["speech", 18.64], ["cattle, bovinae", 18.33]], [["music", 33.54], ["speech", 27.41], ["burst, pop", 1.92]], null, null, null, null, [["speech", 47.76], ["music", 10.78], ["crowd", 3.85]], null, null, null, null], "duration": [1.02, 0.75, 4.91, 0.64, 7.79, 14.57, 0.93, 0.08, 0.25, 0.63, 2.9, 1.16, 0.39, 0.6, 9.92]} \ No newline at end of file diff --git a/annotations_1/sdwghUH-K14_filtered.json b/annotations_1/sdwghUH-K14_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35333ac8a4d994eeeec0cf105c644425d519d49c --- /dev/null +++ b/annotations_1/sdwghUH-K14_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 8.26], [10.0, 12.99], [20.0, 21.07], [28.0, 32.71], [34.0, 42.67], [46.0, 48.81], [54.0, 58.53], [60.0, 61.99], [62.0, 63.02], [75.0, 107.57], [120.0, 120.83], [122.0, 123.26]], "keep_status": [false, false, false, false, true, true, true, false, false, false, false, false], "silence_prob": [58.13, 90.78, 0.0, 57.81, 37.71, 43.43, 42.55, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 40.37], ["music", 8.78], ["explosion", 7.97]], [["hum", 32.59], ["music", 16.83], ["mains hum", 15.16]], [["music", 24.69], ["speech", 23.87], ["hum", 14.94]], null, null, null, null, null], "duration": [5.26, 2.99, 1.07, 4.71, 8.67, 2.81, 4.53, 1.99, 1.02, 32.57, 0.83, 1.26]} \ No newline at end of file diff --git a/annotations_1/sf2RRCNlz38_filtered.json b/annotations_1/sf2RRCNlz38_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e71b3545607dad32baf103c5ddb0486337073ec --- /dev/null +++ b/annotations_1/sf2RRCNlz38_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[80.0, 90.73], [93.0, 103.33], [105.0, 108.77], [110.0, 145.62], [149.0, 157.57], [160.0, 164.32], [165.0, 165.05], [166.0, 170.09]], "keep_status": [false, true, false, false, true, true, false, true], "silence_prob": [40.52, 39.05, 99.98, 0.0, 34.36, 34.01, 0.0, 31.19], "audiomae_on_audioset": [[["whale vocalization", 48.82], ["livestock, farm animals, working animals", 13.53], ["cattle, bovinae", 9.41]], [["animal", 16.49], ["whale vocalization", 10.54], ["speech", 9.93]], null, null, [["buzz", 26.06], ["speech", 25.58], ["fart", 14.75]], [["throbbing", 15.99], ["speech", 8.19], ["sound effect", 6.3]], null, [["music", 15.15], ["fart", 8.1], ["speech", 7.85]]], "duration": [10.73, 10.33, 3.77, 35.62, 8.57, 4.32, 0.05, 4.09]} \ No newline at end of file diff --git a/annotations_1/sfCQQLSwz3s_filtered.json b/annotations_1/sfCQQLSwz3s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6c9df236b28d3dcd3ee0a159a37829afa2e990dd --- /dev/null +++ b/annotations_1/sfCQQLSwz3s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[74.0, 75.44], [81.0, 81.53], [87.0, 87.94], [89.0, 90.24], [93.0, 105.9], [108.0, 119.35]], "keep_status": [false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.29, 30.66], "audiomae_on_audioset": [null, null, null, null, [["buzz", 30.57], ["mains hum", 13.98], ["speech", 7.6]], [["music", 49.99], ["speech", 9.29], ["hum", 9.12]]], "duration": [1.44, 0.53, 0.94, 1.24, 12.9, 11.35]} \ No newline at end of file diff --git a/annotations_1/sfWe6CUZUtc_filtered.json b/annotations_1/sfWe6CUZUtc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7710c21d55719fd1f0ec49a3dd96d12551a22be --- /dev/null +++ b/annotations_1/sfWe6CUZUtc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.08], [7.0, 10.98], [15.0, 15.62], [23.0, 24.8], [33.0, 34.64], [36.0, 36.75], [37.0, 38.77], [39.0, 39.31], [52.0, 52.25], [57.0, 57.1], [58.0, 59.29], [60.0, 60.74], [63.0, 64.23], [65.0, 68.54], [72.0, 72.32], [72.0, 74.07], [76.0, 77.3], [80.0, 80.65], [88.0, 88.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.97, 68.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.72, 0.0, 97.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.08, 3.98, 0.62, 1.8, 1.64, 0.75, 1.77, 0.31, 0.25, 0.1, 1.29, 0.74, 1.23, 3.54, 0.32, 2.07, 1.3, 0.65, 0.21]} \ No newline at end of file diff --git a/annotations_1/sfgNK5f04iY_filtered.json b/annotations_1/sfgNK5f04iY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c46344de8081f39230bcbc16c75dc099c8b6ae6c --- /dev/null +++ b/annotations_1/sfgNK5f04iY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.56], [6.0, 19.52], [23.0, 35.95], [37.0, 54.36], [56.0, 70.17], [72.0, 83.35], [84.0, 100.09], [102.0, 105.56]], "keep_status": [false, false, false, false, true, false, false, true], "silence_prob": [0.0, 30.34, 30.02, 29.76, 30.09, 30.39, 30.18, 30.74], "audiomae_on_audioset": [null, [["speech", 51.24], ["music", 22.89], ["hum", 10.1]], [["music", 66.33], ["throbbing", 7.3], ["synthesizer", 6.02]], [["music", 63.19], ["throbbing", 18.66], ["hum", 7.17]], [["hum", 29.05], ["music", 22.34], ["throbbing", 16.39]], [["mains hum", 28.96], ["music", 22.96], ["hum", 21.3]], [["music", 67.06], ["speech", 7.0], ["electronic music", 3.61]], [["music", 48.44], ["speech", 6.3], ["throbbing", 4.06]]], "duration": [1.56, 13.52, 12.95, 17.36, 14.17, 11.35, 16.09, 3.56]} \ No newline at end of file diff --git a/annotations_1/sgB8cpEi_zU_filtered.json b/annotations_1/sgB8cpEi_zU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..727b95782a71ec983d7b94caeec594b256998487 --- /dev/null +++ b/annotations_1/sgB8cpEi_zU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 19.08], [21.0, 21.32], [22.0, 22.82], [24.0, 24.17], [25.0, 33.94], [34.0, 52.03], [56.0, 57.43], [58.0, 93.31], [96.0, 146.45], [148.0, 148.34], [149.0, 151.85], [153.0, 154.7], [155.0, 169.25], [170.0, 170.01], [171.0, 171.0], [172.0, 175.09], [176.0, 176.44]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.34, 31.96, 0.0, 0.0, 0.0, 0.0, 37.63, 0.0, 37.54, 0.0, 0.0, 37.82, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 64.11], ["radio", 4.94], ["vehicle", 3.95]], [["gurgling", 13.03], ["whale vocalization", 12.55], ["eruption", 11.67]], null, null, null, null, [["radio", 40.51], ["speech", 20.01], ["sidetone", 3.35]], null, [["frog", 23.53], ["whale vocalization", 16.45], ["gurgling", 13.48]], null, null, [["speech", 20.35], ["radio", 18.83], ["rain", 6.77]], null], "duration": [1.08, 0.32, 0.82, 0.17, 8.94, 18.03, 1.43, 35.31, 50.45, 0.34, 2.85, 1.7, 14.25, 0.01, 0.0, 3.09, 0.44]} \ No newline at end of file diff --git a/annotations_1/shE7b_6NNpU_filtered.json b/annotations_1/shE7b_6NNpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..193c6ab74811c964d07a383554ffff9a09305792 --- /dev/null +++ b/annotations_1/shE7b_6NNpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.18], [5.0, 5.97], [8.0, 8.43], [10.0, 10.67], [13.0, 13.05], [13.0, 14.57], [17.0, 16.93], [18.0, 20.33], [21.0, 25.51], [28.0, 36.12], [37.0, 37.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 63.96, 31.84, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 36.4], ["gong", 23.64], ["timpani", 12.71]], null], "duration": [0.18, 0.97, 0.43, 0.67, 0.05, 1.57, -0.07, 2.33, 4.51, 8.12, 0.49]} \ No newline at end of file diff --git a/annotations_1/shal5AF2Gxc_filtered.json b/annotations_1/shal5AF2Gxc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b501188e09501c2571d783d784cb1be05e37d74 --- /dev/null +++ b/annotations_1/shal5AF2Gxc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.16], [6.0, 7.38], [9.0, 9.75], [11.0, 11.79], [13.0, 14.13], [17.0, 17.42], [18.0, 18.66], [24.0, 24.73], [25.0, 30.5], [34.0, 35.11], [36.0, 40.07], [42.0, 43.19], [43.0, 44.51], [48.0, 60.22], [61.0, 64.89], [86.0, 86.09], [87.0, 110.02], [111.0, 118.4], [119.0, 120.26], [121.0, 122.25], [126.0, 127.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.91, 0.0, 41.52, 0.0, 0.0, 35.16, 43.48, 0.0, 36.52, 37.46, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 52.65], ["beatboxing", 21.12], ["music", 5.69]], null, null, [["speech", 84.75], ["beatboxing", 4.39], ["fart", 4.18]], [["speech", 11.08], ["music", 10.63], ["sheep", 5.47]], null, [["music", 34.64], ["quack", 13.83], ["animal", 6.73]], [["music", 43.04], ["speech", 7.6], ["didgeridoo", 3.36]], null, null, null], "duration": [0.16, 1.38, 0.75, 0.79, 1.13, 0.42, 0.66, 0.73, 5.5, 1.11, 4.07, 1.19, 1.51, 12.22, 3.89, 0.09, 23.02, 7.4, 1.26, 1.25, 1.18]} \ No newline at end of file diff --git a/annotations_1/sjEDF282UvY_filtered.json b/annotations_1/sjEDF282UvY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e21864d84610b8ad41c11a7ed9c5672e4530d118 --- /dev/null +++ b/annotations_1/sjEDF282UvY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 46.95], [47.0, 49.54], [53.0, 54.75], [55.0, 58.33], [61.0, 62.5], [69.0, 71.59], [75.0, 90.48], [92.0, 100.11], [101.0, 105.58], [106.0, 112.29], [113.0, 115.11], [118.0, 123.16], [124.0, 133.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 54.3, 0.0, 67.63, 0.0, 93.45, 90.08, 87.19, 100.0, 99.98, 97.73, 99.94, 89.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [44.95, 2.54, 1.75, 3.33, 1.5, 2.59, 15.48, 8.11, 4.58, 6.29, 2.11, 5.16, 9.95]} \ No newline at end of file diff --git a/annotations_1/sjmh7BViBtg_filtered.json b/annotations_1/sjmh7BViBtg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66c25562920154520e49e15642770362b78e12f3 --- /dev/null +++ b/annotations_1/sjmh7BViBtg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 27.58], [30.0, 33.84], [35.0, 35.78], [39.0, 39.61], [41.0, 41.27], [43.0, 46.21]], "keep_status": [false, false, false, false, false, false], "silence_prob": [39.83, 50.26, 0.0, 0.0, 0.0, 46.4], "audiomae_on_audioset": [[["music", 34.85], ["sonar", 29.91], ["hum", 10.19]], null, null, null, null, [["music", 55.17], ["synthesizer", 12.65], ["ambient music", 5.72]]], "duration": [16.58, 3.84, 0.78, 0.61, 0.27, 3.21]} \ No newline at end of file diff --git a/annotations_1/sk0mjld_eow_filtered.json b/annotations_1/sk0mjld_eow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b36258fec5919e70f963f8de9ddfa777c6b8eb5b --- /dev/null +++ b/annotations_1/sk0mjld_eow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 31.97], [34.0, 58.4], [60.0, 65.69], [67.0, 68.69], [73.0, 72.98], [75.0, 76.91], [82.0, 83.76], [86.0, 91.67], [93.0, 93.48], [93.0, 100.95], [102.0, 102.29], [109.0, 110.76], [114.0, 115.13], [116.0, 117.93], [119.0, 119.28], [122.0, 122.15], [122.0, 128.43], [129.0, 129.34], [130.0, 130.71], [138.0, 138.72], [141.0, 145.64], [147.0, 148.14], [150.0, 151.36], [154.0, 153.89], [155.0, 156.88], [160.0, 160.2], [163.0, 163.32], [164.0, 174.68]], "keep_status": [true, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [29.54, 28.84, 31.34, 0.0, 0.0, 0.0, 0.0, 34.6, 0.0, 31.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.35, 0.0, 0.0, 0.0, 37.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.22], "audiomae_on_audioset": [[["music", 53.74], ["sampler", 6.02], ["didgeridoo", 5.88]], [["music", 18.79], ["vehicle", 18.54], ["speech", 13.01]], [["speech", 11.9], ["sheep", 11.29], ["breaking", 10.53]], null, null, null, null, [["cattle, bovinae", 35.62], ["moo", 28.65], ["livestock, farm animals, working animals", 13.12]], null, [["livestock, farm animals, working animals", 27.15], ["animal", 25.88], ["cattle, bovinae", 11.07]], null, null, null, null, null, null, [["cattle, bovinae", 35.29], ["livestock, farm animals, working animals", 30.95], ["moo", 30.48]], null, null, null, [["moo", 34.06], ["cattle, bovinae", 33.88], ["livestock, farm animals, working animals", 27.54]], null, null, null, null, null, null, [["music", 34.21], ["gunshot, gunfire", 14.91], ["speech", 13.36]]], "duration": [24.97, 24.4, 5.69, 1.69, -0.02, 1.91, 1.76, 5.67, 0.48, 7.95, 0.29, 1.76, 1.13, 1.93, 0.28, 0.15, 6.43, 0.34, 0.71, 0.72, 4.64, 1.14, 1.36, -0.11, 1.88, 0.2, 0.32, 10.68]} \ No newline at end of file diff --git a/annotations_1/skrdyoabmgA_filtered.json b/annotations_1/skrdyoabmgA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0c099680df4d8cb77c3e1c32615806725e2bbe1 --- /dev/null +++ b/annotations_1/skrdyoabmgA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [10.0, 10.15], [15.0, 16.58], [19.0, 25.93], [27.0, 28.63], [30.0, 30.65], [33.0, 33.1], [36.0, 36.05], [40.0, 40.8], [46.0, 47.28], [50.0, 51.65], [56.0, 57.11], [58.0, 59.24], [60.0, 62.07], [63.0, 65.5], [69.0, 70.33], [71.0, 71.17], [73.0, 73.35], [82.0, 85.28], [87.0, 87.17], [89.0, 89.24], [93.0, 93.34], [95.0, 96.21], [98.0, 99.45], [107.0, 109.36], [111.0, 111.13], [124.0, 124.44], [128.0, 129.59], [132.0, 133.34], [136.0, 141.27], [143.0, 142.99], [144.0, 145.32], [149.0, 150.18], [156.0, 156.76], [163.0, 165.45], [168.0, 168.81], [173.0, 172.74], [176.0, 176.17], [177.0, 178.61], [181.0, 181.72], [186.0, 193.77], [197.0, 199.25], [200.0, 202.44], [205.0, 205.66], [213.0, 214.32], [216.0, 216.8], [218.0, 218.93], [222.0, 223.82], [227.0, 227.38], [230.0, 230.61], [235.0, 235.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 72.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.74, 71.43, 0.0, 0.0, 0.0, 33.48, 0.0, 0.0, 0.0, 0.0, 0.0, 32.75, 0.0, 0.0, 0.0, 0.0, 31.61, 0.0, 0.0, 0.0, 0.0, 29.63, 0.0, 0.0, 0.0, 0.0, 0.0, 29.45, 60.51, 48.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 34.85], ["cattle, bovinae", 8.28], ["speech", 5.97]], null, null, null, null, [["music", 31.0], ["throbbing", 14.41], ["hum", 6.53]], null, null, null, null, null, [["music", 25.1], ["synthesizer", 12.87], ["effects unit", 5.84]], null, null, null, null, [["hum", 31.24], ["throbbing", 28.46], ["music", 10.7]], null, null, null, null, [["hum", 20.52], ["throbbing", 12.34], ["mains hum", 7.37]], null, null, null, null, null, [["buzz", 11.58], ["vehicle", 11.32], ["motorcycle", 10.45]], null, [["music", 38.96], ["hum", 11.32], ["ambient music", 5.13]], null, null, null, null, null, null, null, null], "duration": [0.51, 0.15, 1.58, 6.93, 1.63, 0.65, 0.1, 0.05, 0.8, 1.28, 1.65, 1.11, 1.24, 2.07, 2.5, 1.33, 0.17, 0.35, 3.28, 0.17, 0.24, 0.34, 1.21, 1.45, 2.36, 0.13, 0.44, 1.59, 1.34, 5.27, -0.01, 1.32, 1.18, 0.76, 2.45, 0.81, -0.26, 0.17, 1.61, 0.72, 7.77, 2.25, 2.44, 0.66, 1.32, 0.8, 0.93, 1.82, 0.38, 0.61, 0.92]} \ No newline at end of file diff --git a/annotations_1/sm5Zgj8kjD8_filtered.json b/annotations_1/sm5Zgj8kjD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f99ff733292a7048be9b751ff767663daa2e8b3 --- /dev/null +++ b/annotations_1/sm5Zgj8kjD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.07], [9.0, 12.85], [13.0, 14.25], [15.0, 16.51], [18.0, 40.78], [41.0, 43.98], [45.0, 129.98], [133.0, 149.25], [151.0, 153.62], [156.0, 159.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 100.0, 0.0, 0.0, 100.0, 100.0, 0.0, 99.26, 94.07, 95.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [4.07, 3.85, 1.25, 1.51, 22.78, 2.98, 84.98, 16.25, 2.62, 3.58]} \ No newline at end of file diff --git a/annotations_1/snTvACYp8NA_filtered.json b/annotations_1/snTvACYp8NA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..476fd63afdbb986a09fdd9e9628ff8f0619b3b4f --- /dev/null +++ b/annotations_1/snTvACYp8NA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.72], [5.0, 5.53], [6.0, 5.97], [6.0, 7.97]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [-0.28, 0.53, -0.03, 1.97]} \ No newline at end of file diff --git a/annotations_1/sneQ02FCals_filtered.json b/annotations_1/sneQ02FCals_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..91076b8ae5c912708702b432f5f3071b99e0aafb --- /dev/null +++ b/annotations_1/sneQ02FCals_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.93], [14.0, 21.22], [22.0, 30.55], [35.0, 35.65], [39.0, 39.39], [44.0, 44.68], [48.0, 48.41], [53.0, 54.09], [56.0, 57.82], [59.0, 59.36], [60.0, 122.18], [123.0, 123.94], [129.0, 129.56], [130.0, 133.59], [134.0, 136.61], [137.0, 137.46], [148.0, 149.23], [152.0, 152.63], [156.0, 160.07], [163.0, 163.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.58, 50.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.0, 32.48, 0.0, 0.0, 0.0, 97.92, 0.0], "audiomae_on_audioset": [null, [["music", 66.2], ["didgeridoo", 5.35], ["synthesizer", 4.49]], null, null, null, null, null, null, null, null, null, null, null, [["gong", 42.81], ["speech", 19.04], ["music", 11.03]], [["speech", 56.26], ["music", 24.03], ["boing", 4.56]], null, null, null, null, null], "duration": [1.93, 7.22, 8.55, 0.65, 0.39, 0.68, 0.41, 1.09, 1.82, 0.36, 62.18, 0.94, 0.56, 3.59, 2.61, 0.46, 1.23, 0.63, 4.07, 0.58]} \ No newline at end of file diff --git a/annotations_1/sohDA6TQuiE_filtered.json b/annotations_1/sohDA6TQuiE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5623980d1342eef69255455ce1278bd255a584e --- /dev/null +++ b/annotations_1/sohDA6TQuiE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 16.01], [20.0, 28.98], [34.0, 69.8]], "keep_status": [true, true, false], "silence_prob": [30.79, 29.32, 0.0], "audiomae_on_audioset": [[["music", 33.27], ["speech", 12.61], ["throbbing", 12.58]], [["mains hum", 33.75], ["music", 16.65], ["cacophony", 15.43]], null], "duration": [10.01, 8.98, 35.8]} \ No newline at end of file diff --git a/annotations_1/sp0O70Q5FAQ_filtered.json b/annotations_1/sp0O70Q5FAQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fb89f3269318beb8c9967758856809a08f089d4 --- /dev/null +++ b/annotations_1/sp0O70Q5FAQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[95.0, 95.79], [96.0, 97.66], [99.0, 107.01], [108.0, 110.25], [110.0, 113.86], [116.0, 119.87], [121.0, 121.95], [123.0, 123.84], [125.0, 125.76]], "keep_status": [false, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 44.07, 40.64, 37.67, 90.25, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["bouncing", 24.24], ["speech", 10.35], ["radio", 10.06]], [["stomach rumble", 14.69], ["horse", 6.65], ["clip-clop", 5.78]], [["fly, housefly", 24.29], ["insect", 14.14], ["speech", 10.0]], null, null, null, null], "duration": [0.79, 1.66, 8.01, 2.25, 3.86, 3.87, 0.95, 0.84, 0.76]} \ No newline at end of file diff --git a/annotations_1/spy6L78o3-A_filtered.json b/annotations_1/spy6L78o3-A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..691065ca956998c0c255b51d6beb166e9ead9923 --- /dev/null +++ b/annotations_1/spy6L78o3-A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 32.19], [39.0, 43.38], [48.0, 49.2], [51.0, 51.81], [64.0, 65.08], [67.0, 76.52], [82.0, 84.5], [89.0, 111.0], [120.0, 125.15], [131.0, 132.17], [134.0, 136.63], [137.0, 138.84], [148.0, 154.84], [157.0, 158.06], [161.0, 189.31]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, true, false, true], "silence_prob": [30.89, 31.56, 0.0, 0.0, 0.0, 29.87, 29.39, 28.69, 30.64, 0.0, 30.54, 0.0, 31.77, 0.0, 28.69], "audiomae_on_audioset": [[["music", 80.78], ["electronic music", 2.58], ["boing", 1.68]], [["music", 45.27], ["speech", 28.88], ["fart", 8.24]], null, null, null, [["speech", 56.43], ["music", 7.5], ["vehicle", 6.6]], [["music", 22.91], ["sound effect", 6.74], ["siren", 5.37]], [["music", 33.01], ["speech", 15.36], ["livestock, farm animals, working animals", 8.67]], [["music", 37.8], ["vehicle", 9.14], ["buzz", 7.39]], null, [["music", 58.37], ["speech", 23.74], ["electronic music", 4.08]], null, [["music", 42.26], ["vehicle", 12.29], ["car", 9.46]], null, [["music", 31.64], ["vehicle", 18.09], ["car", 9.64]]], "duration": [3.19, 4.38, 1.2, 0.81, 1.08, 9.52, 2.5, 22.0, 5.15, 1.17, 2.63, 1.84, 6.84, 1.06, 28.31]} \ No newline at end of file diff --git a/annotations_1/sqLiTaVHPdo_filtered.json b/annotations_1/sqLiTaVHPdo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1ae4c2e2c6546199c6398dc6107283bb213ab40 --- /dev/null +++ b/annotations_1/sqLiTaVHPdo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.8], [17.0, 18.42], [19.0, 19.95], [21.0, 21.2], [46.0, 45.91], [48.0, 49.17], [51.0, 51.98], [53.0, 55.61], [62.0, 61.64], [71.0, 71.78], [73.0, 73.9], [74.0, 76.79], [91.0, 91.44], [95.0, 95.18], [100.0, 100.47], [103.0, 103.06], [104.0, 105.06], [106.0, 106.86], [108.0, 108.5], [110.0, 110.1], [119.0, 119.25], [120.0, 121.19], [156.0, 156.84], [157.0, 157.96]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.37, 0.0, 0.0, 0.0, 40.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 26.14], ["creak", 7.73], ["guitar", 4.11]], null, null, null, [["music", 57.15], ["speech", 23.69], ["synthesizer", 3.25]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.8, 1.42, 0.95, 0.2, -0.09, 1.17, 0.98, 2.61, -0.36, 0.78, 0.9, 2.79, 0.44, 0.18, 0.47, 0.06, 1.06, 0.86, 0.5, 0.1, 0.25, 1.19, 0.84, 0.96]} \ No newline at end of file diff --git a/annotations_1/sqZ6ZrVIemM_filtered.json b/annotations_1/sqZ6ZrVIemM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0507902286e69fcf0f8e131882b00a4ea99710c1 --- /dev/null +++ b/annotations_1/sqZ6ZrVIemM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.21], [13.0, 19.2], [37.0, 46.3], [47.0, 49.4], [50.0, 54.41], [55.0, 62.87], [63.0, 63.59], [64.0, 67.29], [73.0, 89.26], [90.0, 90.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [96.04, 97.43, 99.4, 96.04, 98.51, 98.86, 0.0, 99.16, 89.9, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [2.21, 6.2, 9.3, 2.4, 4.41, 7.87, 0.59, 3.29, 16.26, 0.15]} \ No newline at end of file diff --git a/annotations_1/srLwGlDe598_filtered.json b/annotations_1/srLwGlDe598_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08bdf809154a8c53315ce90216405e34972241a2 --- /dev/null +++ b/annotations_1/srLwGlDe598_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.58], [5.0, 7.37], [15.0, 15.58], [18.0, 19.95], [21.0, 31.11], [33.0, 36.48], [41.0, 41.64], [46.0, 46.04], [48.0, 47.83], [49.0, 78.95], [80.0, 87.29], [89.0, 122.72]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 60.32, 0.0, 0.0, 39.75, 62.78, 0.0, 0.0, 0.0, 41.26, 51.66, 0.0], "audiomae_on_audioset": [null, null, null, null, [["buzz", 12.63], ["glass", 12.02], ["explosion", 7.85]], null, null, null, null, [["telephone dialing, dtmf", 25.76], ["speech", 11.86], ["sidetone", 6.88]], null, null], "duration": [0.58, 2.37, 0.58, 1.95, 10.11, 3.48, 0.64, 0.04, -0.17, 29.95, 7.29, 33.72]} \ No newline at end of file diff --git a/annotations_1/srpCm9gPmZI_filtered.json b/annotations_1/srpCm9gPmZI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e410ab4136d6b37d2f61c3e0cec94ccd9854704 --- /dev/null +++ b/annotations_1/srpCm9gPmZI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.16], [5.0, 5.88], [7.0, 8.68], [9.0, 9.58], [10.0, 10.13], [12.0, 12.97], [14.0, 32.8], [34.0, 36.56], [41.0, 52.95], [53.0, 53.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.91, 27.95, 27.94, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 75.93], ["electronic music", 3.72], ["drum machine", 3.53]], [["music", 67.92], ["dubstep", 2.97], ["echo", 2.71]], [["music", 88.79], ["electronic music", 1.3], ["funk", 0.94]], null], "duration": [0.16, 0.88, 1.68, 0.58, 0.13, 0.97, 18.8, 2.56, 11.95, 0.2]} \ No newline at end of file diff --git a/annotations_1/ssgm3-sCY-Y_filtered.json b/annotations_1/ssgm3-sCY-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..432f61a404cb4a080dff940a6e6125df84c5c446 --- /dev/null +++ b/annotations_1/ssgm3-sCY-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [4.0, 5.41], [7.0, 7.33], [12.0, 17.1], [22.0, 93.99], [94.0, 103.91]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.02, 0.0, 30.35], "audiomae_on_audioset": [null, null, null, [["music", 41.51], ["hum", 18.87], ["throbbing", 8.5]], null, [["music", 29.63], ["theremin", 26.61], ["hum", 17.11]]], "duration": [1.13, 1.41, 0.33, 5.1, 71.99, 9.91]} \ No newline at end of file diff --git a/annotations_1/ssxqmxjrx2c_filtered.json b/annotations_1/ssxqmxjrx2c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f51f05e52e79c71db7bb3b512dd26a0c5430b19 --- /dev/null +++ b/annotations_1/ssxqmxjrx2c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.83], [21.0, 21.09], [36.0, 38.53], [40.0, 41.49], [45.0, 46.57], [50.0, 50.25], [51.0, 51.19], [55.0, 55.39], [58.0, 59.17], [60.0, 59.78], [63.0, 65.2], [67.0, 67.59], [69.0, 69.96], [79.0, 80.79], [90.0, 90.31], [91.0, 91.35], [97.0, 96.87], [101.0, 102.81], [105.0, 107.7], [113.0, 113.59], [115.0, 116.01], [117.0, 118.08], [119.0, 125.12], [126.0, 131.11], [131.0, 134.3], [135.0, 136.32], [143.0, 144.29], [145.0, 147.55], [151.0, 152.56], [154.0, 154.16], [154.0, 156.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 38.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 75.88, 52.33, 33.12, 0.0, 0.0, 56.1, 0.0, 0.0, 34.47], "audiomae_on_audioset": [null, null, [["speech", 79.56], ["sidetone", 6.82], ["dial tone", 5.4]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 66.91], ["dial tone", 4.89], ["busy signal", 4.82]], null, null, null, null, null, [["music", 10.8], ["synthesizer", 8.48], ["throbbing", 8.22]]], "duration": [0.83, 0.09, 2.53, 1.49, 1.57, 0.25, 0.19, 0.39, 1.17, -0.22, 2.2, 0.59, 0.96, 1.79, 0.31, 0.35, -0.13, 1.81, 2.7, 0.59, 1.01, 1.08, 6.12, 5.11, 3.3, 1.32, 1.29, 2.55, 1.56, 0.16, 2.15]} \ No newline at end of file diff --git a/annotations_1/st8QRZbJdPY_filtered.json b/annotations_1/st8QRZbJdPY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8e17d1db1ce1084b7f831cb1dd13f8a04f1ca6e1 --- /dev/null +++ b/annotations_1/st8QRZbJdPY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.31], [13.0, 21.69], [22.0, 22.76], [24.0, 24.38], [26.0, 26.38], [33.0, 33.71], [35.0, 35.75], [36.0, 37.79], [40.0, 42.74], [43.0, 43.7], [45.0, 44.9], [49.0, 50.13], [52.0, 52.46], [55.0, 55.53], [56.0, 57.06], [58.0, 59.83], [62.0, 64.37], [65.0, 66.16], [68.0, 69.87], [72.0, 73.58], [75.0, 76.71], [79.0, 80.18], [81.0, 81.92], [83.0, 83.42], [84.0, 85.28], [86.0, 87.32], [88.0, 91.79], [93.0, 93.92], [96.0, 97.39], [98.0, 99.32], [101.0, 101.76], [103.0, 103.49], [104.0, 105.29], [107.0, 123.65], [126.0, 126.37], [127.0, 127.74], [129.0, 130.13], [132.0, 147.06], [149.0, 148.76], [149.0, 149.71], [152.0, 158.09], [160.0, 161.27], [162.0, 164.34], [165.0, 166.92], [168.0, 170.99], [176.0, 176.76], [188.0, 188.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 82.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 87.92, 0.0, 99.84, 0.0, 99.52, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 8.69, 0.76, 0.38, 0.38, 0.71, 0.75, 1.79, 2.74, 0.7, -0.1, 1.13, 0.46, 0.53, 1.06, 1.83, 2.37, 1.16, 1.87, 1.58, 1.71, 1.18, 0.92, 0.42, 1.28, 1.32, 3.79, 0.92, 1.39, 1.32, 0.76, 0.49, 1.29, 16.65, 0.37, 0.74, 1.13, 15.06, -0.24, 0.71, 6.09, 1.27, 2.34, 1.92, 2.99, 0.76, 0.32]} \ No newline at end of file diff --git a/annotations_1/suYDvQwikn4_filtered.json b/annotations_1/suYDvQwikn4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4035668dd8b2267386983a825d9a75c432b95cf7 --- /dev/null +++ b/annotations_1/suYDvQwikn4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.95], [15.0, 16.14], [19.0, 20.07], [22.0, 23.21], [27.0, 28.93], [31.0, 40.88], [45.0, 49.01], [53.0, 55.34], [57.0, 66.07], [68.0, 68.49], [72.0, 89.04], [91.0, 91.72], [94.0, 94.56], [97.0, 110.51], [111.0, 114.69], [121.0, 130.28], [133.0, 133.88], [136.0, 141.1], [143.0, 152.15], [153.0, 155.26], [158.0, 161.81], [163.0, 174.31], [174.0, 175.15], [176.0, 176.4], [177.0, 177.62]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.81, 66.51, 70.44, 28.76, 0.0, 40.71, 0.0, 0.0, 46.97, 57.25, 49.78, 0.0, 33.88, 30.36, 51.12, 54.3, 37.69, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["whack, thwack", 39.2], ["speech", 31.93], ["thunk", 17.59]], null, null, [["speech", 34.73], ["music", 27.94], ["drum", 5.75]], null, [["music", 67.93], ["speech", 15.99], ["synthesizer", 2.18]], null, null, [["music", 57.47], ["throbbing", 12.02], ["hum", 10.77]], null, [["music", 62.64], ["synthesizer", 5.82], ["hum", 2.6]], null, [["music", 32.15], ["hum", 21.14], ["mains hum", 14.16]], [["throbbing", 39.54], ["music", 33.76], ["hum", 5.73]], null, null, [["fart", 23.45], ["music", 20.15], ["hum", 9.39]], null, null, null], "duration": [0.95, 1.14, 1.07, 1.21, 1.93, 9.88, 4.01, 2.34, 9.07, 0.49, 17.04, 0.72, 0.56, 13.51, 3.69, 9.28, 0.88, 5.1, 9.15, 2.26, 3.81, 11.31, 1.15, 0.4, 0.62]} \ No newline at end of file diff --git a/annotations_1/svwcgrDZVPw_filtered.json b/annotations_1/svwcgrDZVPw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ba508c9c66f2d5c724295f24bce070d68806956 --- /dev/null +++ b/annotations_1/svwcgrDZVPw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.46], [5.0, 9.14], [48.0, 57.94], [90.0, 90.27], [103.0, 102.81], [105.0, 107.47], [111.0, 111.42], [117.0, 117.68], [124.0, 123.7], [140.0, 139.97], [141.0, 157.37], [160.0, 164.59], [170.0, 170.48], [174.0, 176.07], [179.0, 180.3], [181.0, 183.93], [185.0, 189.4], [190.0, 192.62], [193.0, 195.39], [196.0, 197.34]], "keep_status": [false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, true, true, true, false, false], "silence_prob": [0.0, 35.71, 47.54, 0.0, 0.0, 39.5, 0.0, 0.0, 0.0, 0.0, 31.75, 58.64, 0.0, 53.16, 0.0, 33.6, 32.97, 46.5, 79.94, 0.0], "audiomae_on_audioset": [null, [["music", 62.8], ["theremin", 15.62], ["musical instrument", 3.59]], [["music", 36.38], ["effects unit", 8.98], ["musical instrument", 6.9]], null, null, [["music", 16.48], ["boing", 8.56], ["speech", 7.48]], null, null, null, null, [["music", 39.55], ["noise", 18.1], ["cacophony", 5.25]], null, null, null, null, [["music", 18.71], ["speech", 15.33], ["cattle, bovinae", 14.35]], [["music", 46.76], ["speech", 11.37], ["trombone", 2.22]], [["speech", 31.15], ["music", 22.28], ["gong", 5.35]], null, null], "duration": [0.46, 4.14, 9.94, 0.27, -0.19, 2.47, 0.42, 0.68, -0.3, -0.03, 16.37, 4.59, 0.48, 2.07, 1.3, 2.93, 4.4, 2.62, 2.39, 1.34]} \ No newline at end of file diff --git a/annotations_1/sw1tJoYrs7M_filtered.json b/annotations_1/sw1tJoYrs7M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad00d4795bfcb0c6daf40f590bd419c4796d528a --- /dev/null +++ b/annotations_1/sw1tJoYrs7M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 18.22], [19.0, 20.33], [22.0, 22.84], [25.0, 24.97], [26.0, 38.85], [46.0, 46.18], [48.0, 48.22], [51.0, 51.9], [54.0, 54.89], [58.0, 58.19], [59.0, 59.21], [61.0, 61.26], [63.0, 63.95], [68.0, 69.21], [70.0, 71.68], [72.0, 73.45], [77.0, 90.41], [91.0, 92.37], [105.0, 104.75], [106.0, 106.29], [107.0, 107.81], [109.0, 109.68], [111.0, 112.4], [114.0, 129.69], [131.0, 144.02], [145.0, 146.6], [151.0, 152.0], [153.0, 153.33], [154.0, 154.21], [157.0, 158.62], [160.0, 160.34], [161.0, 182.26], [183.0, 193.33], [200.0, 200.03], [200.0, 201.55], [209.0, 210.05]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.11, 58.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.84, 34.1, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["noise", 33.18], ["vehicle", 14.83], ["aircraft", 7.62]], null, null, null, null, null, null, null, null, null, null, null, [["jet engine", 18.38], ["vehicle", 14.37], ["microwave oven", 5.22]], null, null, null, null, null, null, [["mains hum", 34.06], ["hum", 27.07], ["white noise", 11.31]], null, null, null, null, null, null, null, [["music", 50.42], ["theremin", 24.35], ["musical instrument", 6.77]], [["hum", 26.58], ["music", 25.16], ["mains hum", 10.24]], null, null, null], "duration": [1.22, 1.33, 0.84, -0.03, 12.85, 0.18, 0.22, 0.9, 0.89, 0.19, 0.21, 0.26, 0.95, 1.21, 1.68, 1.45, 13.41, 1.37, -0.25, 0.29, 0.81, 0.68, 1.4, 15.69, 13.02, 1.6, 1.0, 0.33, 0.21, 1.62, 0.34, 21.26, 10.33, 0.03, 1.55, 1.05]} \ No newline at end of file diff --git a/annotations_1/swEgflM5Ol4_filtered.json b/annotations_1/swEgflM5Ol4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41aef4ed90883fe1ae69807915177029fb1ec3b1 --- /dev/null +++ b/annotations_1/swEgflM5Ol4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.91], [14.0, 31.55], [32.0, 33.94], [35.0, 39.53], [41.0, 50.08], [53.0, 54.41], [70.0, 70.33], [78.0, 78.61], [83.0, 83.56], [85.0, 85.94], [87.0, 87.66], [90.0, 98.12], [100.0, 101.71], [107.0, 107.65], [109.0, 113.26], [114.0, 120.66], [121.0, 125.27], [131.0, 131.33], [132.0, 133.79], [136.0, 137.56], [142.0, 149.71], [151.0, 182.01], [184.0, 184.64], [186.0, 188.47], [192.0, 192.03], [192.0, 192.06]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 33.54, 0.0, 48.14, 31.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.59, 0.0, 0.0, 33.92, 31.06, 30.18, 0.0, 0.0, 0.0, 33.78, 0.0, 0.0, 32.64, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 48.62], ["hum", 17.75], ["throbbing", 9.28]], null, [["hum", 21.12], ["bee, wasp, etc.", 19.93], ["mains hum", 14.67]], [["whale vocalization", 20.25], ["buzz", 16.83], ["noise", 13.78]], null, null, null, null, null, null, [["explosion", 40.25], ["artillery fire", 33.26], ["burst, pop", 8.35]], null, null, [["bee, wasp, etc.", 35.85], ["fly, housefly", 27.81], ["insect", 20.25]], [["mains hum", 27.87], ["hum", 21.96], ["speech", 19.14]], [["speech", 30.15], ["music", 11.07], ["buzz", 3.31]], null, null, null, [["animal", 21.82], ["speech", 13.29], ["hum", 7.87]], null, null, [["speech", 73.14], ["radio", 4.48], ["hum", 3.53]], null, null], "duration": [0.91, 17.55, 1.94, 4.53, 9.08, 1.41, 0.33, 0.61, 0.56, 0.94, 0.66, 8.12, 1.71, 0.65, 4.26, 6.66, 4.27, 0.33, 1.79, 1.56, 7.71, 31.01, 0.64, 2.47, 0.03, 0.06]} \ No newline at end of file diff --git a/annotations_1/sxo7GjhsghQ_filtered.json b/annotations_1/sxo7GjhsghQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26466c59344bc3232d360bddf4edf48155c15464 --- /dev/null +++ b/annotations_1/sxo7GjhsghQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.27], [10.0, 14.88], [15.0, 21.96], [22.0, 22.47], [24.0, 35.31], [39.0, 40.59], [41.0, 42.31], [44.0, 53.27], [55.0, 55.49], [56.0, 56.49], [58.0, 58.73]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false], "silence_prob": [0.0, 99.88, 51.07, 0.0, 30.14, 0.0, 0.0, 43.61, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 47.34], ["artillery fire", 9.74], ["explosion", 7.8]], null, null, [["creak", 39.39], ["mechanisms", 16.46], ["noise", 10.39]], null, null, null], "duration": [1.27, 4.88, 6.96, 0.47, 11.31, 1.59, 1.31, 9.27, 0.49, 0.49, 0.73]} \ No newline at end of file diff --git a/annotations_1/szIOuIIbVfQ_filtered.json b/annotations_1/szIOuIIbVfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/szIOuIIbVfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/t-B2zR5O5Ys_filtered.json b/annotations_1/t-B2zR5O5Ys_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b116c03910c6a56573252fd849b6cca955a61236 --- /dev/null +++ b/annotations_1/t-B2zR5O5Ys_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.35], [23.0, 24.17], [52.0, 59.49], [77.0, 81.31], [93.0, 92.75], [98.0, 99.98], [124.0, 127.14], [129.0, 128.78]], "keep_status": [true, false, true, false, false, false, false, false], "silence_prob": [29.41, 0.0, 33.09, 37.82, 0.0, 0.0, 31.99, 0.0], "audiomae_on_audioset": [[["music", 34.41], ["guitar", 12.41], ["musical instrument", 11.07]], null, [["music", 58.5], ["throbbing", 5.48], ["cacophony", 5.25]], [["music", 67.52], ["theremin", 7.81], ["synthesizer", 2.24]], null, null, [["music", 80.85], ["synthesizer", 5.65], ["electronic music", 3.77]], null], "duration": [3.35, 1.17, 7.49, 4.31, -0.25, 1.98, 3.14, -0.22]} \ No newline at end of file diff --git a/annotations_1/t-lIuwPGT9w_filtered.json b/annotations_1/t-lIuwPGT9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73fa6b85a1b6f9e712e901eb08f37bda7b9f5aaf --- /dev/null +++ b/annotations_1/t-lIuwPGT9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.95], [11.0, 11.75], [15.0, 16.12], [19.0, 19.35], [20.0, 21.29], [22.0, 25.19], [25.0, 25.24], [25.0, 36.56], [38.0, 45.1], [47.0, 47.75], [49.0, 48.84], [51.0, 51.26], [53.0, 57.65], [59.0, 63.19], [65.0, 65.84], [67.0, 84.23], [85.0, 87.51], [90.0, 96.82], [99.0, 99.81], [103.0, 162.97]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 62.89, 0.0, 48.56, 47.58, 0.0, 0.0, 0.0, 53.59, 30.31, 0.0, 31.92, 31.28, 28.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 44.1], ["hum", 21.19], ["throbbing", 9.42]], [["hum", 30.45], ["music", 18.7], ["mains hum", 10.18]], null, null, null, null, [["animal", 51.95], ["roaring cats (lions, tigers)", 11.31], ["wild animals", 6.63]], null, [["music", 21.6], ["fly, housefly", 15.81], ["hum", 11.18]], [["music", 23.41], ["whale vocalization", 14.0], ["hum", 13.71]], [["speech", 38.43], ["music", 16.21], ["sidetone", 9.69]], null, null], "duration": [0.95, 0.75, 1.12, 0.35, 1.29, 3.19, 0.24, 11.56, 7.1, 0.75, -0.16, 0.26, 4.65, 4.19, 0.84, 17.23, 2.51, 6.82, 0.81, 59.97]} \ No newline at end of file diff --git a/annotations_1/t-t8eVDckH8_filtered.json b/annotations_1/t-t8eVDckH8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c534c73855a8aa4c63d32fa9565b7a15a3e03c56 --- /dev/null +++ b/annotations_1/t-t8eVDckH8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.66], [2.0, 2.73], [3.0, 11.06], [14.0, 17.56], [23.0, 33.4], [36.0, 63.56], [64.0, 68.37], [69.0, 70.01], [70.0, 96.13], [99.0, 100.38], [100.0, 100.41], [103.0, 153.17], [157.0, 173.38], [174.0, 185.48], [186.0, 219.65]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 28.15, 28.3, 28.11, 28.22, 28.37, 0.0, 28.22, 0.0, 0.0, 0.0, 28.23, 28.65, 0.0], "audiomae_on_audioset": [null, null, [["music", 54.48], ["vehicle", 12.07], ["motorcycle", 8.11]], [["music", 64.74], ["electronic music", 4.95], ["sound effect", 3.98]], [["music", 40.36], ["speech", 16.49], ["electronic music", 6.98]], [["music", 79.8], ["electronic music", 5.42], ["techno", 3.63]], [["music", 65.91], ["speech", 11.43], ["electronic music", 3.61]], null, [["music", 54.71], ["speech", 10.21], ["vehicle", 6.94]], null, null, null, [["music", 65.33], ["throbbing", 7.8], ["electronic music", 5.77]], [["mains hum", 52.9], ["music", 16.99], ["hum", 11.39]], null], "duration": [-0.34, 0.73, 8.06, 3.56, 10.4, 27.56, 4.37, 1.01, 26.13, 1.38, 0.41, 50.17, 16.38, 11.48, 33.65]} \ No newline at end of file diff --git a/annotations_1/t09QqjBkg0c_filtered.json b/annotations_1/t09QqjBkg0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..988ede081e0071872418729966d316826ac94523 --- /dev/null +++ b/annotations_1/t09QqjBkg0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[157.0, 157.37], [159.0, 159.49], [160.0, 162.57]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 62.17], "audiomae_on_audioset": [null, null, null], "duration": [0.37, 0.49, 2.57]} \ No newline at end of file diff --git a/annotations_1/t0oqEjxOUww_filtered.json b/annotations_1/t0oqEjxOUww_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7b5b986b139691a683586ec40fd19bb67920e0b --- /dev/null +++ b/annotations_1/t0oqEjxOUww_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [5.0, 10.23], [13.0, 14.69], [19.0, 20.31], [22.0, 23.18], [26.0, 26.28], [28.0, 29.03], [30.0, 61.67], [62.0, 63.05], [65.0, 69.42], [72.0, 73.45], [80.0, 81.36], [84.0, 85.53], [90.0, 90.64], [95.0, 96.63], [100.0, 100.77], [102.0, 102.52], [107.0, 118.13], [119.0, 120.29], [129.0, 129.05], [131.0, 131.57], [137.0, 141.42], [143.0, 143.78], [147.0, 147.93], [149.0, 152.0], [154.0, 155.02], [159.0, 159.81], [166.0, 172.42], [177.0, 177.47], [178.0, 183.52], [184.0, 184.59], [185.0, 185.75], [187.0, 200.18], [202.0, 205.78], [207.0, 207.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 77.7, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.6, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 95.78, 0.0, 0.0, 60.05, 0.0, 31.14, 0.0, 0.0, 39.86, 92.8, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 57.54], ["music", 14.75], ["didgeridoo", 4.58]], null, null, [["cattle, bovinae", 44.88], ["livestock, farm animals, working animals", 29.33], ["moo", 19.94]], null, null], "duration": [0.88, 5.23, 1.69, 1.31, 1.18, 0.28, 1.03, 31.67, 1.05, 4.42, 1.45, 1.36, 1.53, 0.64, 1.63, 0.77, 0.52, 11.13, 1.29, 0.05, 0.57, 4.42, 0.78, 0.93, 3.0, 1.02, 0.81, 6.42, 0.47, 5.52, 0.59, 0.75, 13.18, 3.78, 0.49]} \ No newline at end of file diff --git a/annotations_1/t0tIXAlLX8s_filtered.json b/annotations_1/t0tIXAlLX8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b7561337796d0c011601b9c312e2c5229f3084f --- /dev/null +++ b/annotations_1/t0tIXAlLX8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [13.0, 15.62], [16.0, 16.63], [24.0, 32.36], [34.0, 36.36], [38.0, 39.38], [41.0, 48.34], [52.0, 123.16], [130.0, 130.1], [131.0, 131.63], [142.0, 143.6], [145.0, 145.34], [149.0, 151.11]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 37.64, 0.0, 31.03, 30.82, 0.0, 30.21, 0.0, 0.0, 0.0, 0.0, 0.0, 32.45], "audiomae_on_audioset": [null, [["speech", 75.25], ["gears", 3.05], ["mechanisms", 2.65]], null, [["speech", 27.61], ["mains hum", 16.66], ["hum", 13.77]], [["music", 43.7], ["speech", 29.6], ["electronic music", 4.38]], null, [["music", 84.45], ["hum", 3.07], ["didgeridoo", 2.72]], null, null, null, null, null, [["speech", 43.58], ["siren", 6.81], ["music", 6.5]]], "duration": [0.67, 2.62, 0.63, 8.36, 2.36, 1.38, 7.34, 71.16, 0.1, 0.63, 1.6, 0.34, 2.11]} \ No newline at end of file diff --git a/annotations_1/t1RkYJaG9bo_filtered.json b/annotations_1/t1RkYJaG9bo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e4526c44f17e7a31835feab3cd2aa8f08426b57 --- /dev/null +++ b/annotations_1/t1RkYJaG9bo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.35], [11.0, 11.6], [13.0, 13.8], [15.0, 16.09], [17.0, 17.71], [19.0, 19.79], [29.0, 29.89], [39.0, 39.63], [111.0, 111.57], [113.0, 113.9], [146.0, 146.28], [149.0, 149.4], [151.0, 151.46], [157.0, 157.44], [159.0, 161.2], [179.0, 178.83], [191.0, 194.76], [213.0, 217.61], [222.0, 224.07], [227.0, 229.9], [232.0, 237.9], [239.0, 240.75], [242.0, 250.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 32.0, 99.36, 64.86, 50.91, 41.54, 0.0, 55.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 68.32], ["speech", 7.62], ["swing music", 2.69]], null, null, null, [["music", 58.27], ["theremin", 13.39], ["singing", 2.07]], null, null], "duration": [0.35, 0.6, 0.8, 1.09, 0.71, 0.79, 0.89, 0.63, 0.57, 0.9, 0.28, 0.4, 0.46, 0.44, 2.2, -0.17, 3.76, 4.61, 2.07, 2.9, 5.9, 1.75, 8.7]} \ No newline at end of file diff --git a/annotations_1/t1Wk3H5Xur0_filtered.json b/annotations_1/t1Wk3H5Xur0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..516ad5ce7c22ca3f8b5e7ca8111362b9c98c5711 --- /dev/null +++ b/annotations_1/t1Wk3H5Xur0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.02], [5.0, 6.59], [13.0, 13.41], [14.0, 16.38], [17.0, 19.41], [24.0, 25.51], [28.0, 28.26], [34.0, 35.19], [37.0, 37.76], [42.0, 43.55], [48.0, 48.83], [51.0, 51.41], [53.0, 53.89], [61.0, 62.24], [69.0, 72.06], [74.0, 76.62], [79.0, 79.84], [85.0, 85.14], [89.0, 90.69], [98.0, 98.42], [109.0, 110.52], [132.0, 133.39], [160.0, 160.57], [163.0, 163.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.23, 99.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.02, 1.59, 0.41, 2.38, 2.41, 1.51, 0.26, 1.19, 0.76, 1.55, 0.83, 0.41, 0.89, 1.24, 3.06, 2.62, 0.84, 0.14, 1.69, 0.42, 1.52, 1.39, 0.57, 0.07]} \ No newline at end of file diff --git a/annotations_1/t2NytKIhd68_filtered.json b/annotations_1/t2NytKIhd68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc55fed4fc6002ad96daac216c20deb181776c6e --- /dev/null +++ b/annotations_1/t2NytKIhd68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.42], [7.0, 22.81], [23.0, 23.95], [28.0, 28.49], [31.0, 37.13], [39.0, 39.65], [41.0, 45.08], [48.0, 51.56], [53.0, 53.43], [55.0, 70.58], [73.0, 76.08], [79.0, 82.86], [85.0, 85.43], [110.0, 115.43], [121.0, 121.1], [123.0, 123.57], [124.0, 125.09], [145.0, 150.35], [157.0, 158.16]], "keep_status": [true, true, false, false, true, false, true, true, false, true, true, true, false, true, false, false, false, false, false], "silence_prob": [35.94, 34.4, 0.0, 0.0, 32.22, 0.0, 32.37, 35.13, 0.0, 30.32, 32.74, 34.28, 0.0, 37.9, 0.0, 0.0, 0.0, 28.9, 0.0], "audiomae_on_audioset": [[["whale vocalization", 27.91], ["speech", 9.51], ["livestock, farm animals, working animals", 9.38]], [["speech", 31.4], ["hum", 13.53], ["mains hum", 10.15]], null, null, [["speech", 16.65], ["music", 13.55], ["vehicle", 2.56]], null, [["music", 34.18], ["hum", 9.64], ["mains hum", 8.39]], [["fly, housefly", 23.15], ["bee, wasp, etc.", 16.39], ["insect", 11.08]], null, [["insect", 23.5], ["fly, housefly", 21.03], ["buzz", 15.49]], [["fly, housefly", 23.89], ["mains hum", 9.04], ["insect", 7.64]], [["mains hum", 17.01], ["hum", 16.37], ["buzz", 9.1]], null, [["thunk", 31.18], ["hum", 22.98], ["mains hum", 8.25]], null, null, null, [["cattle, bovinae", 36.18], ["speech", 18.64], ["moo", 16.96]], null], "duration": [3.42, 15.81, 0.95, 0.49, 6.13, 0.65, 4.08, 3.56, 0.43, 15.58, 3.08, 3.86, 0.43, 5.43, 0.1, 0.57, 1.09, 5.35, 1.16]} \ No newline at end of file diff --git a/annotations_1/t3gqjXINvac_filtered.json b/annotations_1/t3gqjXINvac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69fefbb4f0b79a547701ef468a8edb9df4ebe59d --- /dev/null +++ b/annotations_1/t3gqjXINvac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.15], [12.0, 12.33], [30.0, 30.6], [31.0, 33.32], [36.0, 39.83], [43.0, 44.09], [52.0, 52.88], [54.0, 54.65], [55.0, 56.3], [57.0, 58.89], [60.0, 61.72], [63.0, 63.76], [66.0, 66.38], [72.0, 73.03], [75.0, 76.06], [77.0, 78.61], [80.0, 80.74], [82.0, 84.33], [87.0, 86.88], [108.0, 109.86], [115.0, 116.61], [117.0, 118.86], [120.0, 120.99], [126.0, 127.68], [128.0, 129.59], [130.0, 133.35], [134.0, 135.67], [139.0, 142.67], [144.0, 145.08], [147.0, 148.9], [149.0, 150.97], [157.0, 158.55], [161.0, 162.63], [164.0, 164.37], [165.0, 165.94], [166.0, 170.73], [172.0, 173.33], [174.0, 183.57], [185.0, 185.4]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.97, 0.0, 0.0, 37.12, 44.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 0.0, 47.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.54, 0.0, 65.55, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 21.65], ["speech", 17.38], ["sidetone", 16.41]], [["speech", 14.13], ["burping, eructation", 13.22], ["fly, housefly", 8.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.19], ["sine wave", 4.65], ["insect", 3.57]], null, null, null, null, null, null, null, null, null, null, null], "duration": [2.15, 0.33, 0.6, 2.32, 3.83, 1.09, 0.88, 0.65, 1.3, 1.89, 1.72, 0.76, 0.38, 1.03, 1.06, 1.61, 0.74, 2.33, -0.12, 1.86, 1.61, 1.86, 0.99, 1.68, 1.59, 3.35, 1.67, 3.67, 1.08, 1.9, 1.97, 1.55, 1.63, 0.37, 0.94, 4.73, 1.33, 9.57, 0.4]} \ No newline at end of file diff --git a/annotations_1/t3mwyiOBDrk_filtered.json b/annotations_1/t3mwyiOBDrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c98491cd0f81fcd2d277c96096605ac46e1a0dd3 --- /dev/null +++ b/annotations_1/t3mwyiOBDrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 15.16], [16.0, 17.27], [18.0, 19.55], [20.0, 21.1], [22.0, 23.94], [25.0, 26.15], [28.0, 27.97], [30.0, 70.93], [84.0, 122.93], [124.0, 127.26], [129.0, 131.87], [133.0, 134.38], [135.0, 135.58], [137.0, 137.08], [138.0, 140.21], [141.0, 145.57], [150.0, 151.56], [160.0, 160.61], [165.0, 165.91], [166.0, 167.36], [168.0, 172.18], [174.0, 177.48]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.13, 56.03, 0.0, 0.0, 0.0, 82.43, 99.52, 0.0, 0.0, 0.0, 0.0, 91.64, 86.45], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 21.44], ["whale vocalization", 20.05], ["moo", 8.94]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.16, 1.27, 1.55, 1.1, 1.94, 1.15, -0.03, 40.93, 38.93, 3.26, 2.87, 1.38, 0.58, 0.08, 2.21, 4.57, 1.56, 0.61, 0.91, 1.36, 4.18, 3.48]} \ No newline at end of file diff --git a/annotations_1/t45uy-QuRDU_filtered.json b/annotations_1/t45uy-QuRDU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cd68f6c1ba59acf23ee405302caa461834f49e18 --- /dev/null +++ b/annotations_1/t45uy-QuRDU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.83], [2.0, 3.16], [19.0, 20.73], [22.0, 23.57], [28.0, 31.08], [36.0, 41.62], [42.0, 47.46], [50.0, 55.44], [56.0, 56.56], [57.0, 58.45], [65.0, 65.89], [68.0, 68.3]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 78.04, 36.2, 30.9, 32.99, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 62.16], ["speech", 10.98], ["hum", 2.82]], [["music", 62.07], ["animal", 4.57], ["theremin", 2.58]], [["music", 34.59], ["cattle, bovinae", 12.32], ["moo", 9.73]], null, null, null, null], "duration": [0.83, 1.16, 1.73, 1.57, 3.08, 5.62, 5.46, 5.44, 0.56, 1.45, 0.89, 0.3]} \ No newline at end of file diff --git a/annotations_1/t5GdZx7AS-E_filtered.json b/annotations_1/t5GdZx7AS-E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c28cd632f8e85d6ca4dd57f5a8111caa408413e3 --- /dev/null +++ b/annotations_1/t5GdZx7AS-E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.67], [5.0, 6.64], [7.0, 11.1], [11.0, 17.19], [18.0, 32.86], [34.0, 45.96], [48.0, 50.84], [52.0, 58.18], [60.0, 61.1], [64.0, 102.44], [104.0, 115.23], [122.0, 125.76], [126.0, 127.7], [129.0, 130.44], [131.0, 137.52], [138.0, 146.45], [147.0, 158.08], [158.0, 167.07], [171.0, 172.44], [174.0, 183.22]], "keep_status": [true, false, true, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.57, 0.0, 44.99, 46.72, 44.78, 32.6, 46.05, 34.38, 0.0, 0.0, 31.14, 34.65, 0.0, 0.0, 33.05, 29.51, 36.05, 37.63, 0.0, 29.66], "audiomae_on_audioset": [[["music", 39.3], ["speech", 10.44], ["didgeridoo", 4.32]], null, [["music", 40.96], ["speech", 15.92], ["synthesizer", 6.39]], [["music", 50.62], ["didgeridoo", 25.58], ["speech", 2.2]], [["music", 55.42], ["didgeridoo", 7.9], ["ambient music", 4.27]], [["speech", 27.36], ["music", 13.52], ["explosion", 9.88]], [["music", 40.72], ["speech", 31.17], ["synthesizer", 2.02]], [["music", 38.87], ["hum", 17.3], ["throbbing", 9.58]], null, null, [["music", 80.71], ["soundtrack music", 3.01], ["throbbing", 2.33]], [["hum", 38.12], ["music", 23.19], ["mains hum", 20.81]], null, null, [["speech", 41.78], ["music", 34.46], ["hum", 3.71]], [["music", 74.97], ["throbbing", 3.95], ["hum", 3.93]], [["music", 49.35], ["hum", 11.23], ["sonar", 11.07]], [["music", 44.45], ["hum", 19.69], ["mains hum", 15.05]], null, [["hum", 51.56], ["mains hum", 36.7], ["music", 4.72]]], "duration": [2.67, 1.64, 4.1, 6.19, 14.86, 11.96, 2.84, 6.18, 1.1, 38.44, 11.23, 3.76, 1.7, 1.44, 6.52, 8.45, 11.08, 9.07, 1.44, 9.22]} \ No newline at end of file diff --git a/annotations_1/t5nBikdQ1kE_filtered.json b/annotations_1/t5nBikdQ1kE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1987b7db3093d083e9926b059323c475f8438230 --- /dev/null +++ b/annotations_1/t5nBikdQ1kE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[46.0, 46.62], [50.0, 51.7], [53.0, 54.21], [56.0, 55.7], [57.0, 57.4], [58.0, 58.83], [62.0, 62.43], [64.0, 65.48], [67.0, 66.61], [69.0, 68.82], [71.0, 71.41], [79.0, 80.33], [88.0, 89.45], [95.0, 96.28], [100.0, 100.63], [102.0, 109.41], [111.0, 113.34], [114.0, 114.3], [116.0, 117.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.2, 44.15, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 43.99], ["mains hum", 11.28], ["ambient music", 7.91]], [["speech", 22.42], ["vehicle", 9.84], ["hum", 8.54]], null, null], "duration": [0.62, 1.7, 1.21, -0.3, 0.4, 0.83, 0.43, 1.48, -0.39, -0.18, 0.41, 1.33, 1.45, 1.28, 0.63, 7.41, 2.34, 0.3, 1.9]} \ No newline at end of file diff --git a/annotations_1/t5vDcrQIig0_filtered.json b/annotations_1/t5vDcrQIig0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af1b830f53d3bb653aa68f6bda558a82b9c45755 --- /dev/null +++ b/annotations_1/t5vDcrQIig0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.46], [14.0, 17.22], [18.0, 19.95], [22.0, 21.76], [25.0, 25.76], [27.0, 29.08], [29.0, 39.78], [41.0, 49.47], [51.0, 58.08], [59.0, 66.16], [69.0, 71.27], [73.0, 73.6], [75.0, 79.95], [82.0, 87.71], [89.0, 92.47], [93.0, 93.73], [114.0, 118.0], [120.0, 121.36], [123.0, 125.31], [127.0, 128.56], [131.0, 131.43], [133.0, 133.27], [137.0, 137.73], [143.0, 142.94], [154.0, 154.14], [158.0, 159.06], [162.0, 162.23], [163.0, 164.49]], "keep_status": [false, true, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.37, 0.0, 0.0, 0.0, 44.32, 45.14, 54.97, 47.27, 44.78, 66.88, 0.0, 32.53, 63.96, 99.78, 0.0, 100.0, 0.0, 59.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 46.08], ["musical instrument", 8.01], ["marimba, xylophone", 4.22]], null, null, null, [["music", 54.16], ["synthesizer", 5.16], ["musical instrument", 4.43]], [["music", 54.32], ["speech", 27.21], ["radio", 3.36]], null, [["speech", 42.44], ["music", 28.73], ["marimba, xylophone", 2.91]], [["music", 39.04], ["speech", 20.3], ["musical instrument", 5.22]], null, null, [["music", 53.52], ["musical instrument", 11.24], ["piano", 10.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.46, 3.22, 1.95, -0.24, 0.76, 2.08, 10.78, 8.47, 7.08, 7.16, 2.27, 0.6, 4.95, 5.71, 3.47, 0.73, 4.0, 1.36, 2.31, 1.56, 0.43, 0.27, 0.73, -0.06, 0.14, 1.06, 0.23, 1.49]} \ No newline at end of file diff --git a/annotations_1/t5zrRGTShZA_filtered.json b/annotations_1/t5zrRGTShZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64b5f3c1f0b012c1eb9f205867b1a74ac1351ac9 --- /dev/null +++ b/annotations_1/t5zrRGTShZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.78], [2.0, 2.84], [5.0, 5.9], [7.0, 7.72], [9.0, 9.41], [11.0, 11.87], [12.0, 12.63], [15.0, 15.97], [17.0, 17.34], [23.0, 24.9], [27.0, 27.7], [30.0, 30.21], [33.0, 32.88], [33.0, 33.61], [41.0, 40.81], [42.0, 41.93], [44.0, 43.68], [45.0, 45.32], [47.0, 47.43], [48.0, 48.88], [50.0, 50.01], [52.0, 52.47], [53.0, 53.35], [59.0, 60.45], [61.0, 61.25], [63.0, 63.36], [67.0, 67.26], [67.0, 67.47], [69.0, 70.87], [71.0, 72.81], [73.0, 73.21], [73.0, 75.02], [75.0, 76.5], [78.0, 78.68], [85.0, 85.67], [87.0, 96.18], [96.0, 96.8], [97.0, 96.85], [97.0, 100.74], [103.0, 103.6], [110.0, 110.56], [112.0, 114.72], [116.0, 117.12], [119.0, 126.23], [139.0, 148.8], [164.0, 167.14], [168.0, 168.44], [168.0, 170.16], [172.0, 173.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.0, 0.0, 0.0, 0.0, 67.63, 0.0, 0.0, 57.01, 0.0, 0.0, 61.47, 0.0, 51.55, 34.09, 38.67, 0.0, 34.93, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 31.49], ["whimper", 14.51], ["speech", 3.53]], [["music", 45.42], ["carnatic music", 24.35], ["musical instrument", 3.64]], null, [["music", 55.39], ["carnatic music", 9.3], ["theremin", 6.12]], null], "duration": [0.78, 0.84, 0.9, 0.72, 0.41, 0.87, 0.63, 0.97, 0.34, 1.9, 0.7, 0.21, -0.12, 0.61, -0.19, -0.07, -0.32, 0.32, 0.43, 0.88, 0.01, 0.47, 0.35, 1.45, 0.25, 0.36, 0.26, 0.47, 1.87, 1.81, 0.21, 2.02, 1.5, 0.68, 0.67, 9.18, 0.8, -0.15, 3.74, 0.6, 0.56, 2.72, 1.12, 7.23, 9.8, 3.14, 0.44, 2.16, 1.11]} \ No newline at end of file diff --git a/annotations_1/t6UyEPrqaQI_filtered.json b/annotations_1/t6UyEPrqaQI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0f44bf69a5b28db0b826ae8836125387e507b23 --- /dev/null +++ b/annotations_1/t6UyEPrqaQI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.82], [12.0, 13.39], [14.0, 16.07], [27.0, 41.71], [42.0, 43.21], [49.0, 54.11], [55.0, 55.41], [59.0, 61.99], [63.0, 64.5], [65.0, 73.89], [74.0, 75.3], [78.0, 91.49], [95.0, 149.72], [151.0, 180.59], [182.0, 181.99], [182.0, 182.39], [184.0, 186.83], [187.0, 188.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false], "silence_prob": [99.1, 0.0, 87.92, 87.74, 0.0, 66.03, 0.0, 90.43, 0.0, 58.81, 0.0, 29.78, 0.0, 28.7, 0.0, 0.0, 42.69, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.63], ["gong", 18.15], ["music", 12.22]], null, [["music", 39.87], ["scary music", 26.17], ["hum", 4.48]], null, null, [["music", 32.32], ["whale vocalization", 17.86], ["speech", 8.94]], null], "duration": [2.82, 1.39, 2.07, 14.71, 1.21, 5.11, 0.41, 2.99, 1.5, 8.89, 1.3, 13.49, 54.72, 29.59, -0.01, 0.39, 2.83, 1.74]} \ No newline at end of file diff --git a/annotations_1/t6nqp5MdMp0_filtered.json b/annotations_1/t6nqp5MdMp0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e9c50a7def1735b04302f982c11f256e7fbb042 --- /dev/null +++ b/annotations_1/t6nqp5MdMp0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.46], [11.0, 11.97], [21.0, 23.82], [28.0, 29.17], [29.0, 30.06], [31.0, 43.77], [46.0, 66.55], [69.0, 94.83], [96.0, 103.77], [106.0, 126.54], [129.0, 136.19], [138.0, 138.67], [141.0, 143.06], [144.0, 175.44], [176.0, 176.28], [178.0, 178.28]], "keep_status": [false, false, true, false, false, false, true, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 31.18, 0.0, 0.0, 29.94, 29.08, 29.25, 28.42, 28.75, 28.42, 0.0, 29.03, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 49.57], ["throbbing", 6.91], ["vehicle", 6.59]], null, null, [["music", 62.29], ["hum", 13.02], ["mains hum", 9.49]], [["explosion", 32.5], ["speech", 13.13], ["burst, pop", 8.8]], [["speech", 58.1], ["music", 13.44], ["throbbing", 4.95]], [["music", 28.17], ["cacophony", 8.37], ["sound effect", 4.91]], [["speech", 53.61], ["music", 22.07], ["sound effect", 2.53]], [["speech", 67.32], ["music", 15.25], ["sound effect", 1.91]], null, [["music", 33.66], ["speech", 17.25], ["throbbing", 3.98]], null, null, null], "duration": [1.46, 0.97, 2.82, 1.17, 1.06, 12.77, 20.55, 25.83, 7.77, 20.54, 7.19, 0.67, 2.06, 31.44, 0.28, 0.28]} \ No newline at end of file diff --git a/annotations_1/t794eVHOIvo_filtered.json b/annotations_1/t794eVHOIvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..336eedecca210c0bd9f70405dbb8418e5b651bb2 --- /dev/null +++ b/annotations_1/t794eVHOIvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 9.83], [10.0, 11.64], [12.0, 17.44], [19.0, 19.67], [21.0, 21.61]], "keep_status": [false, false, false, false, false], "silence_prob": [63.21, 0.0, 78.38, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [4.83, 1.64, 5.44, 0.67, 0.61]} \ No newline at end of file diff --git a/annotations_1/t8vRwv9kRjg_filtered.json b/annotations_1/t8vRwv9kRjg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b78316bc45cdec5951396d660b077d4decb91335 --- /dev/null +++ b/annotations_1/t8vRwv9kRjg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 23.52], [26.0, 50.46], [51.0, 56.67], [62.0, 72.55], [78.0, 78.98], [80.0, 80.67], [87.0, 88.42], [94.0, 94.81], [96.0, 98.51], [103.0, 104.21], [105.0, 105.71], [106.0, 108.01], [112.0, 115.86], [117.0, 117.22], [122.0, 125.41], [125.0, 142.97], [144.0, 147.19], [149.0, 150.47], [153.0, 162.65], [163.0, 168.49], [173.0, 174.58]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [33.56, 96.54, 97.33, 84.98, 0.0, 0.0, 0.0, 0.0, 97.33, 0.0, 0.0, 62.37, 70.86, 0.0, 99.62, 61.08, 61.57, 0.0, 51.88, 50.02, 0.0], "audiomae_on_audioset": [[["mains hum", 36.02], ["hum", 24.81], ["music", 15.12]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [19.52, 24.46, 5.67, 10.55, 0.98, 0.67, 1.42, 0.81, 2.51, 1.21, 0.71, 2.01, 3.86, 0.22, 3.41, 17.97, 3.19, 1.47, 9.65, 5.49, 1.58]} \ No newline at end of file diff --git a/annotations_1/t9XjAhGr8us_filtered.json b/annotations_1/t9XjAhGr8us_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..645c125cab37d71b41cea046efbb1102f0292fb9 --- /dev/null +++ b/annotations_1/t9XjAhGr8us_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[44.0, 44.69], [45.0, 45.33], [46.0, 46.14], [50.0, 51.68], [69.0, 70.56], [85.0, 85.72]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [0.69, 0.33, 0.14, 1.68, 1.56, 0.72]} \ No newline at end of file diff --git a/annotations_1/t9vWi2ItxMc_filtered.json b/annotations_1/t9vWi2ItxMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e38415c4d240d2b50bb585d9daa1f8b4237509e0 --- /dev/null +++ b/annotations_1/t9vWi2ItxMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.29], [7.0, 7.32], [11.0, 11.11], [17.0, 17.07], [19.0, 19.43], [20.0, 21.61], [22.0, 24.65], [27.0, 27.36], [28.0, 29.69], [32.0, 35.48], [38.0, 38.97], [50.0, 49.86], [53.0, 59.16], [60.0, 59.97], [71.0, 70.66], [72.0, 71.71], [73.0, 73.68], [74.0, 74.88], [77.0, 77.41], [80.0, 79.79], [94.0, 94.9], [102.0, 101.66], [111.0, 111.7], [118.0, 123.03], [124.0, 124.43], [124.0, 124.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11, 0.0, 0.0, 62.27, 0.0, 0.0, 74.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.75, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 66.29], ["speech", 14.5], ["music", 7.58]], null, null], "duration": [0.29, 0.32, 0.11, 0.07, 0.43, 1.61, 2.65, 0.36, 1.69, 3.48, 0.97, -0.14, 6.16, -0.03, -0.34, -0.29, 0.68, 0.88, 0.41, -0.21, 0.9, -0.34, 0.7, 5.03, 0.43, 0.46]} \ No newline at end of file diff --git a/annotations_1/tAHCa87P8YI_filtered.json b/annotations_1/tAHCa87P8YI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b74015a26206bbec94aaad1cac2c99b678abd7c8 --- /dev/null +++ b/annotations_1/tAHCa87P8YI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 20.39], [22.0, 27.75], [30.0, 31.02], [32.0, 42.47], [51.0, 51.65], [58.0, 61.05], [62.0, 62.56], [64.0, 66.48], [70.0, 69.99], [71.0, 74.24], [77.0, 77.87], [90.0, 90.21], [91.0, 92.28], [100.0, 101.19], [104.0, 104.41], [105.0, 110.51], [113.0, 113.48], [115.0, 122.0], [123.0, 123.63], [131.0, 131.53], [138.0, 139.36], [140.0, 142.79]], "keep_status": [true, true, false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [41.72, 43.61, 0.0, 33.52, 0.0, 35.98, 0.0, 36.86, 0.0, 33.88, 0.0, 0.0, 0.0, 0.0, 0.0, 32.88, 0.0, 30.64, 0.0, 0.0, 0.0, 49.36], "audiomae_on_audioset": [[["whale vocalization", 34.98], ["speech", 21.84], ["hum", 5.34]], [["hum", 39.52], ["whale vocalization", 15.9], ["music", 9.68]], null, [["music", 34.26], ["hum", 17.14], ["synthesizer", 7.82]], null, [["throbbing", 28.59], ["hum", 15.33], ["noise", 14.94]], null, [["throbbing", 38.14], ["hum", 25.01], ["music", 8.61]], null, [["music", 18.69], ["throbbing", 11.96], ["hum", 9.72]], null, null, null, null, null, [["sidetone", 67.97], ["speech", 18.77], ["music", 2.72]], null, [["music", 27.02], ["speech", 18.82], ["throbbing", 13.55]], null, null, null, [["music", 32.63], ["whale vocalization", 8.79], ["didgeridoo", 7.69]]], "duration": [3.39, 5.75, 1.02, 10.47, 0.65, 3.05, 0.56, 2.48, -0.01, 3.24, 0.87, 0.21, 1.28, 1.19, 0.41, 5.51, 0.48, 7.0, 0.63, 0.53, 1.36, 2.79]} \ No newline at end of file diff --git a/annotations_1/tBOZNOYMHEg_filtered.json b/annotations_1/tBOZNOYMHEg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d3594972de23ce6972edf0875c47c43c1975b745 --- /dev/null +++ b/annotations_1/tBOZNOYMHEg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.7], [13.0, 16.41], [18.0, 19.52], [20.0, 22.55], [23.0, 34.7]], "keep_status": [false, true, false, false, true], "silence_prob": [0.0, 34.57, 0.0, 44.99, 29.11], "audiomae_on_audioset": [null, [["singing bowl", 29.6], ["music", 23.12], ["speech", 4.38]], null, [["speech", 37.68], ["music", 27.09], ["singing bowl", 8.57]], [["music", 28.05], ["musical instrument", 9.57], ["sonar", 9.26]]], "duration": [0.7, 3.41, 1.52, 2.55, 11.7]} \ No newline at end of file diff --git a/annotations_1/tD3vc9KZ9lQ_filtered.json b/annotations_1/tD3vc9KZ9lQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6266c833b6f64f65f45bdf5a81e0e2055666038e --- /dev/null +++ b/annotations_1/tD3vc9KZ9lQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 12.07], [19.0, 35.77], [36.0, 37.07], [39.0, 39.33], [42.0, 43.53], [45.0, 100.45], [104.0, 104.87]], "keep_status": [false, true, false, false, false, false, false], "silence_prob": [74.13, 42.69, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 24.17], ["hum", 18.49], ["mains hum", 10.04]], null, null, null, null, null], "duration": [9.07, 16.77, 1.07, 0.33, 1.53, 55.45, 0.87]} \ No newline at end of file diff --git a/annotations_1/tD8f4Xk30bg_filtered.json b/annotations_1/tD8f4Xk30bg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c82b590785a32417bb3a477c24fc0899bc96adaa --- /dev/null +++ b/annotations_1/tD8f4Xk30bg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.01], [15.0, 15.62], [23.0, 22.94], [70.0, 70.68], [79.0, 80.15], [82.0, 82.21], [83.0, 83.61], [84.0, 85.36], [86.0, 91.2]], "keep_status": [false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 28.4], ["speech", 16.8], ["explosion", 7.43]]], "duration": [1.01, 0.62, -0.06, 0.68, 1.15, 0.21, 0.61, 1.36, 5.2]} \ No newline at end of file diff --git a/annotations_1/tD9DfbbK6OE_filtered.json b/annotations_1/tD9DfbbK6OE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8bb228c7ff5a24e93f21bfae9d82d18d69dc987 --- /dev/null +++ b/annotations_1/tD9DfbbK6OE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.74], [8.0, 11.04], [14.0, 14.1], [19.0, 25.05], [26.0, 26.52], [27.0, 53.5], [55.0, 55.04], [59.0, 76.37], [80.0, 87.27], [89.0, 89.38], [91.0, 95.93], [99.0, 119.33], [121.0, 121.37], [121.0, 139.8], [142.0, 142.87], [148.0, 154.68], [156.0, 163.36], [165.0, 166.04]], "keep_status": [false, true, false, false, false, false, false, true, false, false, true, true, false, true, false, false, true, false], "silence_prob": [0.0, 47.54, 0.0, 64.18, 0.0, 40.28, 0.0, 31.97, 31.59, 0.0, 34.46, 34.93, 0.0, 32.74, 0.0, 38.59, 46.29, 0.0], "audiomae_on_audioset": [null, [["whale vocalization", 25.78], ["theremin", 20.74], ["animal", 8.01]], null, null, null, [["music", 51.61], ["theremin", 23.16], ["musical instrument", 4.95]], null, [["music", 46.54], ["theremin", 15.74], ["animal", 3.88]], [["speech", 51.39], ["music", 22.18], ["whale vocalization", 1.84]], null, [["music", 34.22], ["speech", 17.53], ["theremin", 11.39]], [["bee, wasp, etc.", 16.71], ["animal", 14.26], ["music", 13.43]], null, [["music", 48.91], ["theremin", 13.2], ["animal", 4.26]], null, [["music", 39.84], ["theremin", 20.55], ["speech", 9.72]], [["music", 47.14], ["theremin", 5.35], ["speech", 5.18]], null], "duration": [0.74, 3.04, 0.1, 6.05, 0.52, 26.5, 0.04, 17.37, 7.27, 0.38, 4.93, 20.33, 0.37, 18.8, 0.87, 6.68, 7.36, 1.04]} \ No newline at end of file diff --git a/annotations_1/tDD6wnNN-IQ_filtered.json b/annotations_1/tDD6wnNN-IQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3712bf39fdd629f1ac7b4d0b8b9232f94a5e722b --- /dev/null +++ b/annotations_1/tDD6wnNN-IQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 31.26], [32.0, 33.57], [34.0, 36.36], [37.0, 37.72], [38.0, 38.35], [39.0, 40.68], [41.0, 42.08], [42.0, 43.39], [44.0, 45.37], [54.0, 57.91], [61.0, 62.68], [72.0, 75.15], [78.0, 78.58], [81.0, 82.16], [85.0, 84.94], [88.0, 89.21], [92.0, 92.45], [95.0, 95.42], [102.0, 102.91], [115.0, 117.81]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [54.17, 0.0, 52.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.83, 0.0, 32.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.55], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 32.95], ["inside, small room", 17.74], ["cough", 5.19]], null, [["speech", 41.62], ["radio", 7.01], ["whack, thwack", 6.46]], null, null, null, null, null, null, null, [["speech", 44.2], ["beatboxing", 25.69], ["radio", 2.44]]], "duration": [3.26, 1.57, 2.36, 0.72, 0.35, 1.68, 1.08, 1.39, 1.37, 3.91, 1.68, 3.15, 0.58, 1.16, -0.06, 1.21, 0.45, 0.42, 0.91, 2.81]} \ No newline at end of file diff --git a/annotations_1/tDlL6QWvKNk_filtered.json b/annotations_1/tDlL6QWvKNk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c78de0a007f14811caa5f7e9a397cc01315bf383 --- /dev/null +++ b/annotations_1/tDlL6QWvKNk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.23], [12.0, 13.19], [14.0, 14.81], [16.0, 16.41], [21.0, 22.86], [24.0, 24.75], [27.0, 27.51], [29.0, 29.76], [31.0, 32.09], [37.0, 42.63], [43.0, 44.29], [46.0, 46.4], [48.0, 49.99], [53.0, 53.49], [54.0, 54.63], [60.0, 60.59], [61.0, 61.94], [63.0, 63.37], [64.0, 65.3], [66.0, 67.02], [68.0, 74.07], [75.0, 76.57], [79.0, 80.25], [81.0, 81.46], [83.0, 83.12], [83.0, 85.67], [86.0, 89.14], [90.0, 93.61], [95.0, 95.39], [98.0, 99.96], [102.0, 103.44], [104.0, 104.3], [105.0, 105.44], [106.0, 123.65], [124.0, 124.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 62.27, 83.7, 79.07, 0.0, 0.0, 0.0, 0.0, 0.0, 54.5, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 1.19, 0.81, 0.41, 1.86, 0.75, 0.51, 0.76, 1.09, 5.63, 1.29, 0.4, 1.99, 0.49, 0.63, 0.59, 0.94, 0.37, 1.3, 1.02, 6.07, 1.57, 1.25, 0.46, 0.12, 2.67, 3.14, 3.61, 0.39, 1.96, 1.44, 0.3, 0.44, 17.65, 0.9]} \ No newline at end of file diff --git a/annotations_1/tEWLG9sG1VM_filtered.json b/annotations_1/tEWLG9sG1VM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70ff86d91020127be1ec98c90b7165c1052c6bac --- /dev/null +++ b/annotations_1/tEWLG9sG1VM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.41], [13.0, 13.56], [14.0, 17.05], [18.0, 19.36], [21.0, 99.64], [101.0, 101.58], [104.0, 104.75]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.4, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.41, 0.56, 3.05, 1.36, 78.64, 0.58, 0.75]} \ No newline at end of file diff --git a/annotations_1/tEs0OuspG4w_filtered.json b/annotations_1/tEs0OuspG4w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..984de5b8d43a1d7383f76925715362525cd3712a --- /dev/null +++ b/annotations_1/tEs0OuspG4w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 54.8], [55.0, 59.63], [61.0, 61.32], [63.0, 67.39], [68.0, 68.49], [69.0, 71.19], [73.0, 73.14], [76.0, 83.94], [97.0, 97.01], [97.0, 97.5], [103.0, 109.56], [111.0, 128.24], [136.0, 141.13], [146.0, 148.29]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, true, true, true], "silence_prob": [90.43, 52.98, 0.0, 37.81, 0.0, 53.16, 0.0, 31.68, 0.0, 0.0, 28.13, 28.94, 28.32, 29.05], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 17.31], ["frog", 13.63], ["music", 12.16]], null, null, null, [["music", 55.53], ["thunk", 9.64], ["thump, thud", 6.44]], null, null, [["sheep", 17.65], ["speech", 16.24], ["groan", 13.22]], [["hum", 36.21], ["music", 12.28], ["whale vocalization", 11.41]], [["speech", 30.1], ["music", 17.54], ["animal", 4.65]], [["music", 31.58], ["didgeridoo", 19.2], ["throbbing", 4.09]]], "duration": [7.8, 4.63, 0.32, 4.39, 0.49, 2.19, 0.14, 7.94, 0.01, 0.5, 6.56, 17.24, 5.13, 2.29]} \ No newline at end of file diff --git a/annotations_1/tEyY-ijoyaQ_filtered.json b/annotations_1/tEyY-ijoyaQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc82089faa0af5921513ea1b981257d04629253c --- /dev/null +++ b/annotations_1/tEyY-ijoyaQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.94], [9.0, 9.96], [10.0, 11.18], [14.0, 14.37], [15.0, 16.58], [18.0, 18.42], [19.0, 21.81], [23.0, 23.55], [24.0, 24.51], [32.0, 33.59], [34.0, 35.83], [38.0, 41.03], [62.0, 83.22], [84.0, 87.44], [89.0, 89.56], [94.0, 96.26], [98.0, 98.78], [100.0, 100.21], [101.0, 100.85], [104.0, 105.26], [110.0, 110.1], [110.0, 111.94], [115.0, 116.82], [118.0, 118.56], [120.0, 120.61], [122.0, 122.62], [124.0, 125.19], [126.0, 134.45], [135.0, 141.34], [142.0, 144.71], [148.0, 149.0], [150.0, 151.17], [152.0, 155.02], [157.0, 161.42], [165.0, 167.49], [170.0, 175.83], [178.0, 178.77], [180.0, 185.41], [187.0, 189.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.71, 0.0, 0.0, 0.0, 0.0, 41.64, 43.1, 43.15, 0.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.18, 51.18, 59.68, 0.0, 0.0, 53.97, 71.14, 70.86, 55.04, 0.0, 82.79, 73.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 59.56], ["beatboxing", 8.75], ["vocal music", 5.71]], [["music", 13.32], ["speech", 12.15], ["beatboxing", 9.66]], [["music", 72.08], ["didgeridoo", 6.07], ["bass guitar", 4.68]], null, [["sidetone", 41.55], ["speech", 25.54], ["mains hum", 5.26]], null, null, null, null, null, null, null, null, null, null, null, [["music", 42.73], ["synthesizer", 7.52], ["singing bowl", 5.77]], null, null, null, null, null, null, null, null, null, null, null], "duration": [1.94, 0.96, 1.18, 0.37, 1.58, 0.42, 2.81, 0.55, 0.51, 1.59, 1.83, 3.03, 21.22, 3.44, 0.56, 2.26, 0.78, 0.21, -0.15, 1.26, 0.1, 1.94, 1.82, 0.56, 0.61, 0.62, 1.19, 8.45, 6.34, 2.71, 1.0, 1.17, 3.02, 4.42, 2.49, 5.83, 0.77, 5.41, 2.78]} \ No newline at end of file diff --git a/annotations_1/tF3eceBqcik_filtered.json b/annotations_1/tF3eceBqcik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2c6c0a1c4511907ea92dff25e8aa167de0a339d --- /dev/null +++ b/annotations_1/tF3eceBqcik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.49], [4.0, 4.56], [5.0, 5.66], [6.0, 8.41], [13.0, 13.53], [15.0, 16.56], [27.0, 27.14], [38.0, 38.25], [49.0, 51.48], [52.0, 53.87], [64.0, 64.81], [82.0, 82.54], [83.0, 84.1], [87.0, 87.25], [88.0, 91.23], [92.0, 92.92], [96.0, 97.68], [114.0, 115.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 51.66, 0.0, 0.0, 0.0, 0.0, 75.88, 0.0, 0.0, 0.0, 0.0, 0.0, 45.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.16], ["music", 10.75], ["whale vocalization", 2.15]], null, null, null], "duration": [0.49, 0.56, 0.66, 2.41, 0.53, 1.56, 0.14, 0.25, 2.48, 1.87, 0.81, 0.54, 1.1, 0.25, 3.23, 0.92, 1.68, 1.62]} \ No newline at end of file diff --git a/annotations_1/tF6XBuvWdPs_filtered.json b/annotations_1/tF6XBuvWdPs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6694707a3ad8ad3ef2a073f48ee71126124d276c --- /dev/null +++ b/annotations_1/tF6XBuvWdPs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.32], [5.0, 5.75], [9.0, 8.85], [11.0, 11.57], [16.0, 16.34], [18.0, 17.95], [22.0, 22.05], [23.0, 23.28], [25.0, 25.05], [29.0, 29.2], [32.0, 32.78], [34.0, 34.38], [38.0, 38.85], [40.0, 41.15], [43.0, 43.56], [46.0, 46.4], [54.0, 54.06], [55.0, 56.02], [57.0, 58.68], [62.0, 62.07], [64.0, 63.75], [68.0, 69.65], [74.0, 74.06], [77.0, 78.88], [84.0, 84.77], [86.0, 86.0], [90.0, 91.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, 0.75, -0.15, 0.57, 0.34, -0.05, 0.05, 0.28, 0.05, 0.2, 0.78, 0.38, 0.85, 1.15, 0.56, 0.4, 0.06, 1.02, 1.68, 0.07, -0.25, 1.65, 0.06, 1.88, 0.77, 0.0, 1.08]} \ No newline at end of file diff --git a/annotations_1/tFBSGc3v7BI_filtered.json b/annotations_1/tFBSGc3v7BI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a03f6d7257e3d3301c5a5c62a31e1b37fd09d945 --- /dev/null +++ b/annotations_1/tFBSGc3v7BI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [4.0, 4.8], [6.0, 7.74], [9.0, 9.21], [14.0, 17.27], [20.0, 25.22], [26.0, 27.16], [29.0, 30.77], [35.0, 35.5], [36.0, 38.28], [40.0, 41.3], [48.0, 49.89], [56.0, 56.59], [61.0, 60.67], [67.0, 67.22], [70.0, 70.04], [78.0, 80.18], [83.0, 83.81], [86.0, 87.29], [96.0, 97.21], [124.0, 125.27], [128.0, 128.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 87.55, 97.64, 0.0, 0.0, 0.0, 65.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 0.8, 1.74, 0.21, 3.27, 5.22, 1.16, 1.77, 0.5, 2.28, 1.3, 1.89, 0.59, -0.33, 0.22, 0.04, 2.18, 0.81, 1.29, 1.21, 1.27, 0.97]} \ No newline at end of file diff --git a/annotations_1/tFEKMdUMjEk_filtered.json b/annotations_1/tFEKMdUMjEk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..809dd77e041df8479d052120f1342c3ad7c6bfd0 --- /dev/null +++ b/annotations_1/tFEKMdUMjEk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.6], [10.0, 12.6], [15.0, 17.58], [22.0, 22.67], [26.0, 27.94], [29.0, 31.11], [33.0, 35.4], [42.0, 42.43], [43.0, 43.48], [44.0, 47.07], [50.0, 51.83], [53.0, 55.04], [55.0, 59.39], [60.0, 64.29], [65.0, 68.77], [70.0, 74.26], [75.0, 87.2], [87.0, 118.98], [120.0, 122.12], [123.0, 128.73], [129.0, 133.81]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 52.05, 100.0, 0.0, 0.0, 100.0, 64.07, 0.0, 0.0, 99.87, 0.0, 38.87, 66.63, 78.55, 59.42, 84.25, 49.45, 0.0, 41.42, 37.3, 31.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 72.06], ["sidetone", 3.85], ["hum", 3.09]], null, null, null, null, [["speech", 27.3], ["singing bowl", 25.55], ["music", 15.82]], null, [["music", 32.24], ["theremin", 27.83], ["ambient music", 11.94]], [["music", 48.39], ["theremin", 14.38], ["synthesizer", 6.54]], [["music", 36.65], ["speech", 33.48], ["foghorn", 9.94]]], "duration": [0.6, 2.6, 2.58, 0.67, 1.94, 2.11, 2.4, 0.43, 0.48, 3.07, 1.83, 2.04, 4.39, 4.29, 3.77, 4.26, 12.2, 31.98, 2.12, 5.73, 4.81]} \ No newline at end of file diff --git a/annotations_1/tFkpixS3QZQ_filtered.json b/annotations_1/tFkpixS3QZQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..442028d46aa8588cfd5d61050e73381b7d435ac9 --- /dev/null +++ b/annotations_1/tFkpixS3QZQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 40.9], [44.0, 54.99], [55.0, 57.64], [62.0, 89.67], [90.0, 90.96], [91.0, 100.36], [101.0, 102.15], [103.0, 103.44], [104.0, 117.14], [126.0, 126.84], [129.0, 130.25]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 31.41, 41.42, 32.01, 0.0, 33.81, 0.0, 0.0, 37.81, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 41.63], ["speech", 6.85], ["hum", 4.08]], [["music", 56.83], ["ambient music", 14.81], ["scary music", 13.34]], [["music", 71.25], ["scary music", 10.16], ["hum", 6.08]], null, [["mains hum", 37.41], ["hum", 35.89], ["speech", 11.74]], null, null, [["music", 42.23], ["electronic music", 10.48], ["hum", 7.9]], null, null], "duration": [1.9, 10.99, 2.64, 27.67, 0.96, 9.36, 1.15, 0.44, 13.14, 0.84, 1.25]} \ No newline at end of file diff --git a/annotations_1/tG1crFI87ro_filtered.json b/annotations_1/tG1crFI87ro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f19c9891b7625b05080f9a61af0a48019a30ec8d --- /dev/null +++ b/annotations_1/tG1crFI87ro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.65], [5.0, 11.38], [18.0, 18.57], [21.0, 21.3], [22.0, 23.11], [28.0, 28.86], [32.0, 40.39], [44.0, 49.06], [52.0, 59.31], [60.0, 86.41], [91.0, 95.44], [98.0, 97.87], [98.0, 98.32], [100.0, 100.3], [101.0, 103.11], [104.0, 105.19], [107.0, 107.99], [116.0, 115.79], [128.0, 128.26], [138.0, 142.11], [143.0, 145.03], [148.0, 148.95], [150.0, 150.92], [156.0, 156.42], [162.0, 164.54], [166.0, 167.27], [170.0, 170.24], [172.0, 172.47], [174.0, 176.49]], "keep_status": [true, true, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false], "silence_prob": [33.73, 34.16, 0.0, 0.0, 0.0, 0.0, 29.94, 28.55, 31.31, 34.89, 31.7, 0.0, 0.0, 0.0, 40.86, 0.0, 0.0, 0.0, 0.0, 32.61, 31.92, 0.0, 0.0, 0.0, 35.41, 0.0, 0.0, 0.0, 64.07], "audiomae_on_audioset": [[["music", 44.25], ["theremin", 10.42], ["clarinet", 4.57]], [["music", 37.22], ["hum", 15.31], ["speech", 12.01]], null, null, null, null, [["fly, housefly", 13.34], ["mains hum", 8.95], ["boat, water vehicle", 8.74]], [["speech", 48.16], ["music", 7.39], ["foghorn", 4.41]], [["livestock, farm animals, working animals", 46.75], ["cattle, bovinae", 30.08], ["moo", 10.36]], [["cattle, bovinae", 21.76], ["livestock, farm animals, working animals", 15.73], ["moo", 14.41]], [["music", 40.89], ["throbbing", 34.32], ["hum", 9.94]], null, null, null, [["throbbing", 58.42], ["music", 22.78], ["hum", 5.85]], null, null, null, null, [["cattle, bovinae", 29.98], ["moo", 19.3], ["livestock, farm animals, working animals", 13.93]], [["speech", 29.43], ["sidetone", 12.51], ["boing", 6.64]], null, null, null, [["hum", 31.5], ["speech", 14.61], ["throbbing", 6.31]], null, null, null, null], "duration": [2.65, 6.38, 0.57, 0.3, 1.11, 0.86, 8.39, 5.06, 7.31, 26.41, 4.44, -0.13, 0.32, 0.3, 2.11, 1.19, 0.99, -0.21, 0.26, 4.11, 2.03, 0.95, 0.92, 0.42, 2.54, 1.27, 0.24, 0.47, 2.49]} \ No newline at end of file diff --git a/annotations_1/tG2qsoC_-hs_filtered.json b/annotations_1/tG2qsoC_-hs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..894a4ea9055aa1eaf025c474a1c56c44f048d5e3 --- /dev/null +++ b/annotations_1/tG2qsoC_-hs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.62], [8.0, 12.85], [14.0, 16.04], [17.0, 26.33], [27.0, 27.38], [28.0, 28.05], [29.0, 29.96], [32.0, 32.83], [38.0, 40.26], [43.0, 43.97], [47.0, 47.8], [49.0, 49.25], [52.0, 52.61], [58.0, 58.31], [61.0, 61.79], [65.0, 66.24], [76.0, 76.23], [82.0, 82.51], [84.0, 84.52], [86.0, 86.07], [93.0, 93.36], [103.0, 102.98], [106.0, 109.24], [110.0, 111.06], [113.0, 113.02], [120.0, 120.43], [124.0, 124.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 99.73, 99.4, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.92, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 4.85, 2.04, 9.33, 0.38, 0.05, 0.96, 0.83, 2.26, 0.97, 0.8, 0.25, 0.61, 0.31, 0.79, 1.24, 0.23, 0.51, 0.52, 0.07, 0.36, -0.02, 3.24, 1.06, 0.02, 0.43, 0.24]} \ No newline at end of file diff --git a/annotations_1/tGg3h7NtiXs_filtered.json b/annotations_1/tGg3h7NtiXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b80c5149cd6034bfab87e890b5f280c5ed1ad6f --- /dev/null +++ b/annotations_1/tGg3h7NtiXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 40.58], [44.0, 51.11]], "keep_status": [false, true], "silence_prob": [31.99, 46.12], "audiomae_on_audioset": [[["mains hum", 32.2], ["hum", 27.49], ["music", 11.91]], [["animal", 26.9], ["fart", 13.24], ["wild animals", 9.19]]], "duration": [15.58, 7.11]} \ No newline at end of file diff --git a/annotations_1/tHHqfGeeXps_filtered.json b/annotations_1/tHHqfGeeXps_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9773dadc774fe89f24b34ac76f46992a0c4fab9f --- /dev/null +++ b/annotations_1/tHHqfGeeXps_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 17.39], [18.0, 18.76], [22.0, 27.89], [34.0, 34.79], [41.0, 41.3], [44.0, 46.01], [48.0, 49.77], [60.0, 60.42], [60.0, 60.45], [73.0, 75.49], [77.0, 77.11], [82.0, 87.79], [90.0, 90.26], [95.0, 98.05], [99.0, 99.82], [100.0, 105.56], [111.0, 111.5], [112.0, 112.24], [119.0, 119.38], [124.0, 124.63], [125.0, 127.43]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [31.6, 0.0, 38.3, 0.0, 0.0, 99.84, 0.0, 0.0, 0.0, 46.61, 0.0, 31.5, 0.0, 30.41, 0.0, 31.33, 0.0, 0.0, 0.0, 0.0, 31.13], "audiomae_on_audioset": [[["music", 41.14], ["speech", 6.2], ["throbbing", 5.81]], null, [["boing", 23.37], ["hum", 14.57], ["mains hum", 8.57]], null, null, null, null, null, null, [["chirp tone", 55.42], ["sine wave", 8.51], ["boing", 6.95]], null, [["music", 66.29], ["didgeridoo", 10.6], ["synthesizer", 4.1]], null, [["moo", 48.02], ["cattle, bovinae", 34.44], ["livestock, farm animals, working animals", 16.99]], null, [["moo", 20.3], ["cattle, bovinae", 14.99], ["speech", 12.35]], null, null, null, null, [["music", 65.24], ["guitar", 5.35], ["musical instrument", 3.23]]], "duration": [3.39, 0.76, 5.89, 0.79, 0.3, 2.01, 1.77, 0.42, 0.45, 2.49, 0.11, 5.79, 0.26, 3.05, 0.82, 5.56, 0.5, 0.24, 0.38, 0.63, 2.43]} \ No newline at end of file diff --git a/annotations_1/tImxhYu2PG8_filtered.json b/annotations_1/tImxhYu2PG8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..076554f245f6bef00f1c7f369321f0f00e1d4a32 --- /dev/null +++ b/annotations_1/tImxhYu2PG8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [3.0, 3.57], [5.0, 6.18], [7.0, 10.44], [12.0, 12.9], [14.0, 15.33], [17.0, 22.23], [24.0, 24.78], [26.0, 28.54], [30.0, 34.16], [35.0, 35.75], [36.0, 38.7], [39.0, 47.06], [49.0, 51.29], [52.0, 54.09], [55.0, 55.75], [58.0, 59.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 96.54, 0.0, 0.0, 97.22, 0.0, 61.67, 66.88, 0.0, 88.46, 80.82, 97.83, 64.97, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.98, 0.57, 1.18, 3.44, 0.9, 1.33, 5.23, 0.78, 2.54, 4.16, 0.75, 2.7, 8.06, 2.29, 2.09, 0.75, 1.29]} \ No newline at end of file diff --git a/annotations_1/tIy7sQGKtJA_filtered.json b/annotations_1/tIy7sQGKtJA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51b1b9b3740d4cc1b68dcfeb8adb81254f82ce5d --- /dev/null +++ b/annotations_1/tIy7sQGKtJA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 22.6], [24.0, 58.38], [63.0, 64.02], [68.0, 79.24], [81.0, 81.36]], "keep_status": [false, false, false, false, false], "silence_prob": [37.19, 0.0, 0.0, 33.77, 0.0], "audiomae_on_audioset": [[["music", 57.1], ["speech", 11.02], ["whale vocalization", 5.33]], null, null, [["music", 50.43], ["speech", 16.0], ["mains hum", 7.27]], null], "duration": [10.6, 34.38, 1.02, 11.24, 0.36]} \ No newline at end of file diff --git a/annotations_1/tJ1uXsPXyao_filtered.json b/annotations_1/tJ1uXsPXyao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b60751d33c4b3b537345249baa013078b962271d --- /dev/null +++ b/annotations_1/tJ1uXsPXyao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [7.0, 11.7], [13.0, 16.51], [17.0, 18.01], [21.0, 22.27], [25.0, 26.94], [36.0, 44.9], [46.0, 51.66], [55.0, 65.26], [66.0, 78.04], [80.0, 81.73], [83.0, 85.29], [86.0, 88.57], [95.0, 95.52], [97.0, 99.33], [101.0, 102.9], [103.0, 108.48], [111.0, 112.21], [114.0, 114.86], [116.0, 145.86]], "keep_status": [false, false, true, false, false, false, true, true, false, false, false, true, false, false, true, false, true, false, false, false], "silence_prob": [0.0, 28.74, 29.38, 0.0, 0.0, 0.0, 28.8, 30.06, 30.33, 29.33, 0.0, 32.44, 30.5, 0.0, 32.75, 0.0, 29.23, 0.0, 0.0, 29.11], "audiomae_on_audioset": [null, [["speech", 64.76], ["explosion", 10.19], ["outside, rural or natural", 2.49]], [["speech", 32.84], ["music", 24.97], ["throbbing", 3.73]], null, null, null, [["music", 45.85], ["hum", 8.07], ["cacophony", 4.14]], [["speech", 21.07], ["hum", 19.57], ["whale vocalization", 18.06]], [["throbbing", 40.66], ["hum", 20.84], ["music", 19.15]], [["music", 54.86], ["throbbing", 15.35], ["hum", 13.45]], null, [["music", 32.39], ["speech", 26.56], ["musical instrument", 2.84]], [["cattle, bovinae", 46.21], ["moo", 39.6], ["livestock, farm animals, working animals", 13.51]], null, [["cattle, bovinae", 29.58], ["moo", 13.27], ["cowbell", 12.23]], null, [["vehicle", 21.81], ["speech", 21.72], ["motorboat, speedboat", 19.84]], null, null, [["hum", 34.97], ["mains hum", 27.57], ["music", 13.49]]], "duration": [0.5, 4.7, 3.51, 1.01, 1.27, 1.94, 8.9, 5.66, 10.26, 12.04, 1.73, 2.29, 2.57, 0.52, 2.33, 1.9, 5.48, 1.21, 0.86, 29.86]} \ No newline at end of file diff --git a/annotations_1/tJ4H77qrLjI_filtered.json b/annotations_1/tJ4H77qrLjI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..136699e331b10c3c59868dd4ee9cabc2f5011add --- /dev/null +++ b/annotations_1/tJ4H77qrLjI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 17.32], [21.0, 21.1], [22.0, 40.8], [53.0, 53.23], [56.0, 65.91], [67.0, 69.8], [72.0, 74.26], [78.0, 78.43], [81.0, 88.53], [98.0, 115.47], [118.0, 124.56], [125.0, 130.2], [133.0, 138.18], [140.0, 161.05]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, true], "silence_prob": [35.92, 0.0, 33.11, 0.0, 34.49, 34.78, 44.29, 0.0, 36.82, 35.66, 34.37, 35.0, 32.06, 32.49], "audiomae_on_audioset": [[["music", 57.92], ["didgeridoo", 8.28], ["synthesizer", 7.58]], null, [["speech", 47.33], ["music", 27.82], ["quack", 5.59]], null, [["speech", 42.34], ["music", 20.46], ["vehicle", 13.25]], [["music", 41.3], ["speech", 21.02], ["trombone", 7.79]], [["music", 61.6], ["musical instrument", 6.29], ["brass instrument", 3.25]], null, [["fly, housefly", 27.59], ["speech", 16.98], ["mosquito", 12.87]], [["speech", 54.28], ["music", 17.14], ["vehicle", 4.11]], [["speech", 62.78], ["aircraft", 9.88], ["vehicle", 6.6]], [["music", 47.79], ["trombone", 10.09], ["musical instrument", 6.56]], [["music", 46.65], ["speech", 31.29], ["musical instrument", 1.79]], [["music", 53.43], ["trombone", 6.57], ["brass instrument", 3.78]]], "duration": [9.32, 0.1, 18.8, 0.23, 9.91, 2.8, 2.26, 0.43, 7.53, 17.47, 6.56, 5.2, 5.18, 21.05]} \ No newline at end of file diff --git a/annotations_1/tJPokP3FVl8_filtered.json b/annotations_1/tJPokP3FVl8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17b47024f9d185c8d322ce5ad4e20e1d6314ade7 --- /dev/null +++ b/annotations_1/tJPokP3FVl8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 28.66], [31.0, 43.92], [46.0, 67.14], [68.0, 89.01], [92.0, 94.81], [99.0, 99.89], [102.0, 112.14], [112.0, 135.24], [138.0, 141.71]], "keep_status": [true, true, true, true, true, false, false, true, true], "silence_prob": [38.19, 43.08, 34.71, 40.33, 30.09, 0.0, 30.07, 30.9, 34.11], "audiomae_on_audioset": [[["speech", 24.18], ["music", 19.23], ["grunt", 16.91]], [["music", 44.43], ["whale vocalization", 12.72], ["animal", 9.83]], [["sonar", 29.05], ["hum", 16.3], ["music", 7.19]], [["music", 42.93], ["speech", 17.11], ["clang", 8.23]], [["fart", 24.39], ["fly, housefly", 24.31], ["mosquito", 14.23]], null, [["animal", 40.46], ["wild animals", 19.87], ["roaring cats (lions, tigers)", 10.75]], [["music", 44.96], ["speech", 7.84], ["groan", 7.28]], [["explosion", 25.06], ["eruption", 13.23], ["hum", 11.57]]], "duration": [12.66, 12.92, 21.14, 21.01, 2.81, 0.89, 10.14, 23.24, 3.71]} \ No newline at end of file diff --git a/annotations_1/tJya-fbl4R8_filtered.json b/annotations_1/tJya-fbl4R8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d1f1c6292ce5ad298e4c45ca4a695ee85885e89 --- /dev/null +++ b/annotations_1/tJya-fbl4R8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 44.34], [45.0, 60.79], [62.0, 69.36], [70.0, 71.96], [74.0, 74.39], [75.0, 77.09], [79.0, 83.0], [84.0, 85.83], [87.0, 97.66], [99.0, 102.56], [104.0, 106.15], [107.0, 108.84], [109.0, 115.37], [117.0, 124.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 100.0, 99.97, 0.0, 0.0, 99.88, 73.97, 0.0, 84.62, 100.0, 100.0, 0.0, 75.55, 82.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.34, 15.79, 7.36, 1.96, 0.39, 2.09, 4.0, 1.83, 10.66, 3.56, 2.15, 1.84, 6.37, 7.65]} \ No newline at end of file diff --git a/annotations_1/tKei1kTWmKU_filtered.json b/annotations_1/tKei1kTWmKU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95db936e2a341af2328c89bbaedada4b89282afd --- /dev/null +++ b/annotations_1/tKei1kTWmKU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 72.03], [74.0, 100.84], [101.0, 102.41], [104.0, 111.2], [112.0, 112.89], [115.0, 129.22], [133.0, 139.75]], "keep_status": [false, true, false, true, false, true, false], "silence_prob": [0.0, 33.31, 0.0, 46.83, 0.0, 32.18, 78.21], "audiomae_on_audioset": [null, [["music", 43.12], ["throbbing", 18.84], ["hum", 6.56]], null, [["whale vocalization", 11.74], ["fly, housefly", 11.19], ["speech", 11.16]], null, [["whale vocalization", 25.09], ["music", 11.91], ["speech", 7.65]], null], "duration": [37.03, 26.84, 1.41, 7.2, 0.89, 14.22, 6.75]} \ No newline at end of file diff --git a/annotations_1/tLXNDzc-2fA_filtered.json b/annotations_1/tLXNDzc-2fA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..968a5b67145c9c0b1b13ffd84957a18e16249282 --- /dev/null +++ b/annotations_1/tLXNDzc-2fA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 63.44], [67.0, 118.44], [123.0, 123.9], [124.0, 126.96], [129.0, 173.72], [176.0, 176.47], [177.0, 212.33], [218.0, 219.69], [222.0, 222.79], [227.0, 228.73], [231.0, 231.3]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 32.42], ["didgeridoo", 11.79], ["hum", 6.37]], null, null, null, null, null, null, null], "duration": [37.44, 51.44, 0.9, 2.96, 44.72, 0.47, 35.33, 1.69, 0.79, 1.73, 0.3]} \ No newline at end of file diff --git a/annotations_1/tMB7LgnO2Wo_filtered.json b/annotations_1/tMB7LgnO2Wo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92d12569d2e91bf5b4a789d0d03b76eac15f8a9e --- /dev/null +++ b/annotations_1/tMB7LgnO2Wo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.86], [4.0, 5.02], [7.0, 9.04], [11.0, 11.55], [14.0, 16.85], [20.0, 21.03], [21.0, 21.49], [22.0, 21.91], [23.0, 25.51], [26.0, 27.53], [29.0, 32.68], [34.0, 34.48], [36.0, 37.61], [41.0, 42.85], [48.0, 48.09], [49.0, 52.0], [53.0, 55.8], [57.0, 59.05], [60.0, 61.67], [64.0, 63.9], [65.0, 66.48], [69.0, 71.05], [72.0, 77.13], [81.0, 81.4], [85.0, 85.45], [87.0, 88.43], [91.0, 92.55], [94.0, 97.34], [99.0, 100.79], [104.0, 109.76]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.93, 0.0, 51.6, 0.0, 0.0, 0.0, 53.78, 0.0, 57.97, 0.0, 0.0, 0.0, 0.0, 80.29, 40.21, 41.89, 0.0, 0.0, 0.0, 70.86, 70.58, 0.0, 0.0, 0.0, 0.0, 69.88, 0.0, 57.56], "audiomae_on_audioset": [null, null, [["speech", 37.21], ["music", 21.31], ["singing bowl", 11.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.84], ["music", 13.53], ["hum", 6.62]], [["music", 27.3], ["gong", 24.26], ["singing bowl", 10.1]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.14, 1.02, 2.04, 0.55, 2.85, 1.03, 0.49, -0.09, 2.51, 1.53, 3.68, 0.48, 1.61, 1.85, 0.09, 3.0, 2.8, 2.05, 1.67, -0.1, 1.48, 2.05, 5.13, 0.4, 0.45, 1.43, 1.55, 3.34, 1.79, 5.76]} \ No newline at end of file diff --git a/annotations_1/tMYOmMWbUME_filtered.json b/annotations_1/tMYOmMWbUME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0434d204722f5dbd8c8fd21956135f80c44b4b5e --- /dev/null +++ b/annotations_1/tMYOmMWbUME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.05], [14.0, 15.67], [20.0, 19.79], [21.0, 21.52], [28.0, 30.23], [32.0, 35.36], [38.0, 38.21], [39.0, 39.41], [42.0, 41.91], [43.0, 44.42], [46.0, 54.33], [59.0, 62.01], [67.0, 75.36], [80.0, 81.28], [82.0, 92.45], [94.0, 95.94], [97.0, 105.07], [106.0, 109.12], [117.0, 118.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 74.76, 87.37, 0.0, 0.0, 0.0, 0.0, 99.85, 89.54, 36.95, 0.0, 74.29, 0.0, 87.0, 59.24, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["eruption", 13.46], ["speech", 9.63], ["fart", 6.93]], null, null, null, null, null, null], "duration": [1.05, 1.67, -0.21, 0.52, 2.23, 3.36, 0.21, 0.41, -0.09, 1.42, 8.33, 3.01, 8.36, 1.28, 10.45, 1.94, 8.07, 3.12, 1.52]} \ No newline at end of file diff --git a/annotations_1/tMcUZSJ3xDY_filtered.json b/annotations_1/tMcUZSJ3xDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa89db9da6960903df6a1a37aa9042131825f284 --- /dev/null +++ b/annotations_1/tMcUZSJ3xDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 56.83], [64.0, 67.69], [76.0, 153.47]], "keep_status": [false, false, false], "silence_prob": [0.0, 29.75, 0.0], "audiomae_on_audioset": [null, [["music", 59.24], ["speech", 13.85], ["throbbing", 5.35]], null], "duration": [40.83, 3.69, 77.47]} \ No newline at end of file diff --git a/annotations_1/tNuPwipxx94_filtered.json b/annotations_1/tNuPwipxx94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c493df7e8c7b2729ec72151aa34ba2ec94c9f6e4 --- /dev/null +++ b/annotations_1/tNuPwipxx94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.73], [3.0, 4.04], [7.0, 7.55], [12.0, 12.83], [14.0, 15.72], [17.0, 17.47], [20.0, 21.36], [23.0, 23.31], [26.0, 25.98], [28.0, 31.56], [32.0, 33.61], [35.0, 35.88], [38.0, 38.23], [39.0, 39.41], [42.0, 42.52], [50.0, 51.19], [53.0, 53.96], [54.0, 55.38], [56.0, 58.29], [61.0, 61.91], [63.0, 67.63], [69.0, 70.02], [71.0, 71.69], [72.0, 76.1], [77.0, 80.03], [81.0, 81.78], [83.0, 83.49], [85.0, 86.34], [87.0, 87.29], [89.0, 90.63], [92.0, 92.28]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.46, 0.0, 91.3, 0.0, 0.0, 75.88, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 1.04, 0.55, 0.83, 1.72, 0.47, 1.36, 0.31, -0.02, 3.56, 1.61, 0.88, 0.23, 0.41, 0.52, 1.19, 0.96, 1.38, 2.29, 0.91, 4.63, 1.02, 0.69, 4.1, 3.03, 0.78, 0.49, 1.34, 0.29, 1.63, 0.28]} \ No newline at end of file diff --git a/annotations_1/tNvDa9kTDUw_filtered.json b/annotations_1/tNvDa9kTDUw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8587725a03d79c2a483741c37957ce7cc8d5aa6 --- /dev/null +++ b/annotations_1/tNvDa9kTDUw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.74], [33.0, 36.8], [44.0, 44.0], [46.0, 46.58], [47.0, 50.82], [56.0, 56.51]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 36.19, 0.0, 0.0, 34.35, 0.0], "audiomae_on_audioset": [null, [["music", 74.75], ["yodeling", 3.54], ["synthesizer", 2.82]], null, null, [["music", 70.15], ["musical instrument", 2.84], ["funk", 2.4]], null], "duration": [0.74, 3.8, 0.0, 0.58, 3.82, 0.51]} \ No newline at end of file diff --git a/annotations_1/tOcnYAE2i4Q_filtered.json b/annotations_1/tOcnYAE2i4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..45d6e2617ab32f2a39352f5ab1e65665136b4e39 --- /dev/null +++ b/annotations_1/tOcnYAE2i4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.78], [20.0, 20.51], [24.0, 24.49], [25.0, 24.73], [29.0, 31.38], [35.0, 36.85], [38.0, 38.8], [48.0, 49.64], [69.0, 70.75], [76.0, 77.5], [81.0, 81.41], [84.0, 85.6], [87.0, 100.62], [120.0, 120.38]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.66, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.33], ["ambient music", 18.78], ["singing bowl", 5.77]], null], "duration": [1.78, 0.51, 0.49, -0.27, 2.38, 1.85, 0.8, 1.64, 1.75, 1.5, 0.41, 1.6, 13.62, 0.38]} \ No newline at end of file diff --git a/annotations_1/tPJJlCdrJ0M_filtered.json b/annotations_1/tPJJlCdrJ0M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f27139329cb2e149996e91d3780a9920cdfbc8b1 --- /dev/null +++ b/annotations_1/tPJJlCdrJ0M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.47], [6.0, 11.82], [18.0, 28.86], [31.0, 31.23], [31.0, 33.0], [38.0, 40.78], [44.0, 54.82], [57.0, 58.21], [60.0, 62.19], [65.0, 67.63], [69.0, 69.42], [73.0, 76.2], [77.0, 101.97], [103.0, 116.24], [116.0, 117.86], [119.0, 126.98], [128.0, 132.19]], "keep_status": [false, true, true, false, true, true, false, false, true, true, false, false, true, true, false, false, true], "silence_prob": [0.0, 29.65, 29.79, 0.0, 32.15, 29.84, 30.74, 0.0, 30.78, 30.23, 0.0, 30.13, 30.23, 33.92, 0.0, 30.29, 32.26], "audiomae_on_audioset": [null, [["speech", 33.37], ["music", 14.83], ["hum", 14.75]], [["music", 42.6], ["speech", 22.15], ["explosion", 2.44]], null, [["music", 39.11], ["speech", 11.53], ["throbbing", 6.95]], [["music", 53.76], ["hum", 8.22], ["throbbing", 6.04]], [["music", 75.35], ["breaking", 4.32], ["buzz", 2.89]], null, [["music", 33.11], ["speech", 22.85], ["theremin", 7.38]], [["sound effect", 19.48], ["music", 16.1], ["groan", 8.21]], null, [["music", 70.92], ["speech", 3.04], ["noise", 3.0]], [["music", 45.68], ["speech", 14.15], ["sine wave", 5.8]], [["music", 44.62], ["boing", 9.34], ["clarinet", 9.26]], null, [["music", 42.96], ["hum", 15.12], ["throbbing", 12.4]], [["music", 48.29], ["speech", 8.75], ["double bass", 8.23]]], "duration": [1.47, 5.82, 10.86, 0.23, 2.0, 2.78, 10.82, 1.21, 2.19, 2.63, 0.42, 3.2, 24.97, 13.24, 1.86, 7.98, 4.19]} \ No newline at end of file diff --git a/annotations_1/tRRQX1SXcMM_filtered.json b/annotations_1/tRRQX1SXcMM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66548c72bbcc53b0d371d1b23e44fd12746c76db --- /dev/null +++ b/annotations_1/tRRQX1SXcMM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 23.45], [26.0, 26.74], [30.0, 38.96], [40.0, 43.9], [46.0, 62.13], [65.0, 85.55], [87.0, 88.01], [91.0, 97.28], [99.0, 99.71], [100.0, 117.59]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [42.91, 0.0, 30.62, 31.82, 38.71, 39.6, 0.0, 35.22, 0.0, 37.97], "audiomae_on_audioset": [[["speech", 56.86], ["vehicle", 6.28], ["sidetone", 5.65]], null, [["speech", 60.26], ["explosion", 17.02], ["music", 2.64]], [["hum", 39.38], ["mains hum", 17.71], ["throbbing", 14.31]], [["hum", 27.65], ["music", 22.92], ["whale vocalization", 22.57]], [["music", 64.15], ["whale vocalization", 30.36], ["soundtrack music", 1.15]], null, [["music", 61.04], ["whale vocalization", 27.55], ["electronic music", 1.97]], null, [["whale vocalization", 56.6], ["music", 35.97], ["theremin", 1.16]]], "duration": [14.45, 0.74, 8.96, 3.9, 16.13, 20.55, 1.01, 6.28, 0.71, 17.59]} \ No newline at end of file diff --git a/annotations_1/tRx8N7mJU9g_filtered.json b/annotations_1/tRx8N7mJU9g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/tRx8N7mJU9g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/tS36ZnWoR70_filtered.json b/annotations_1/tS36ZnWoR70_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa08342a68ba4b17c4df89e2863607937c7d5c64 --- /dev/null +++ b/annotations_1/tS36ZnWoR70_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.85], [6.0, 8.41], [11.0, 11.08], [12.0, 12.48], [14.0, 14.93], [17.0, 18.1], [20.0, 22.27], [24.0, 24.04], [26.0, 27.35], [30.0, 32.46], [35.0, 38.35], [41.0, 41.61], [45.0, 47.41], [49.0, 50.38], [52.0, 53.64], [55.0, 56.35], [59.0, 60.44], [64.0, 66.07], [68.0, 69.06], [70.0, 71.85], [74.0, 75.1], [76.0, 81.31], [84.0, 83.94], [86.0, 86.41], [88.0, 90.71], [93.0, 94.02], [98.0, 99.59], [102.0, 102.1], [104.0, 106.56], [108.0, 108.99], [112.0, 113.24], [117.0, 118.57], [120.0, 120.83], [122.0, 123.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [84.8, 91.47, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.96, 99.95, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 97.11, 0.0, 0.0, 0.0, 50.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.85, 2.41, 0.08, 0.48, 0.93, 1.1, 2.27, 0.04, 1.35, 2.46, 3.35, 0.61, 2.41, 1.38, 1.64, 1.35, 1.44, 2.07, 1.06, 1.85, 1.1, 5.31, -0.06, 0.41, 2.71, 1.02, 1.59, 0.1, 2.56, 0.99, 1.24, 1.57, 0.83, 1.47]} \ No newline at end of file diff --git a/annotations_1/tSpOMNC3WtQ_filtered.json b/annotations_1/tSpOMNC3WtQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d93ce705864196944eec27c068d736e9837b6c8c --- /dev/null +++ b/annotations_1/tSpOMNC3WtQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.38], [18.0, 18.13], [19.0, 26.38], [31.0, 32.44], [36.0, 36.37], [46.0, 46.58], [49.0, 60.89], [66.0, 73.6], [79.0, 79.57]], "keep_status": [false, false, false, false, false, false, true, false, false], "silence_prob": [99.99, 0.0, 46.83, 0.0, 0.0, 0.0, 37.81, 38.33, 0.0], "audiomae_on_audioset": [null, null, [["speech", 68.73], ["sidetone", 6.08], ["radio", 4.48]], null, null, null, [["music", 38.39], ["bleat", 12.93], ["sheep", 12.89]], [["music", 55.54], ["speech", 14.2], ["radio", 7.35]], null], "duration": [2.38, 0.13, 7.38, 1.44, 0.37, 0.58, 11.89, 7.6, 0.57]} \ No newline at end of file diff --git a/annotations_1/tUiVEKK8rWM_filtered.json b/annotations_1/tUiVEKK8rWM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc9ff6193ce9907ff74749b77c6938913215c09a --- /dev/null +++ b/annotations_1/tUiVEKK8rWM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [3.0, 4.04], [4.0, 4.29], [4.0, 4.43], [7.0, 7.94], [16.0, 16.21], [20.0, 20.48], [23.0, 23.67], [30.0, 30.89], [38.0, 38.62], [42.0, 42.69], [44.0, 44.32], [45.0, 46.52], [49.0, 50.21], [52.0, 53.28], [55.0, 55.46], [67.0, 67.61], [69.0, 69.53], [76.0, 76.08], [78.0, 78.46], [79.0, 82.26], [83.0, 84.7], [87.0, 87.39], [88.0, 89.28], [92.0, 92.25], [103.0, 111.69], [113.0, 118.88], [120.0, 121.88], [124.0, 124.39], [127.0, 128.02], [129.0, 134.57], [138.0, 141.17], [142.0, 143.24], [144.0, 144.64], [148.0, 148.0], [153.0, 153.64], [155.0, 155.22], [157.0, 157.2], [158.0, 159.07], [160.0, 161.08], [166.0, 166.99], [170.0, 171.02], [177.0, 178.31], [182.0, 183.03], [184.0, 183.93], [187.0, 187.79], [193.0, 194.09], [198.0, 198.91], [202.0, 202.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.87, 0.0, 0.0, 0.0, 0.0, 59.96, 88.28, 0.0, 0.0, 0.0, 96.42, 82.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.38, 1.04, 0.29, 0.43, 0.94, 0.21, 0.48, 0.67, 0.89, 0.62, 0.69, 0.32, 1.52, 1.21, 1.28, 0.46, 0.61, 0.53, 0.08, 0.46, 3.26, 1.7, 0.39, 1.28, 0.25, 8.69, 5.88, 1.88, 0.39, 1.02, 5.57, 3.17, 1.24, 0.64, 0.0, 0.64, 0.22, 0.2, 1.07, 1.08, 0.99, 1.02, 1.31, 1.03, -0.07, 0.79, 1.09, 0.91, 0.27]} \ No newline at end of file diff --git a/annotations_1/tV7wQ19UBqg_filtered.json b/annotations_1/tV7wQ19UBqg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..86bcb91979c82523269e6902acffa19ddf2968e3 --- /dev/null +++ b/annotations_1/tV7wQ19UBqg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 17.9], [40.0, 75.79], [76.0, 77.94], [81.0, 82.09], [87.0, 95.61], [97.0, 100.11], [101.0, 102.29], [103.0, 105.92], [108.0, 122.15], [124.0, 125.24], [125.0, 131.9], [133.0, 136.97], [139.0, 139.99], [143.0, 144.71], [146.0, 149.79], [151.0, 151.16], [153.0, 155.11], [160.0, 161.33], [162.0, 162.11], [163.0, 164.52], [168.0, 171.9], [176.0, 178.98], [180.0, 180.3], [184.0, 184.91], [185.0, 189.73], [191.0, 197.99], [199.0, 203.17], [208.0, 211.86], [212.0, 216.67], [219.0, 221.0], [224.0, 225.41], [229.0, 231.33], [232.0, 233.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.86, 0.0, 0.0, 0.0, 100.0, 98.36, 0.0, 99.9, 99.71, 0.0, 91.47, 99.9, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 98.99, 100.0, 0.0, 0.0, 92.31, 99.85, 99.98, 97.11, 99.87, 100.0, 0.0, 97.92, 0.0], "audiomae_on_audioset": [[["speech", 68.57], ["breaking", 10.87], ["whack, thwack", 4.93]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.9, 35.79, 1.94, 1.09, 8.61, 3.11, 1.29, 2.92, 14.15, 1.24, 6.9, 3.97, 0.99, 1.71, 3.79, 0.16, 2.11, 1.33, 0.11, 1.52, 3.9, 2.98, 0.3, 0.91, 4.73, 6.99, 4.17, 3.86, 4.67, 2.0, 1.41, 2.33, 1.44]} \ No newline at end of file diff --git a/annotations_1/tVubEM2oUj4_filtered.json b/annotations_1/tVubEM2oUj4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bc38317c99f1e509ced6320496543d27da65ee2 --- /dev/null +++ b/annotations_1/tVubEM2oUj4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.49], [9.0, 9.85], [17.0, 17.54], [29.0, 31.5], [33.0, 34.77], [37.0, 36.78], [37.0, 37.84], [38.0, 40.2], [45.0, 46.04], [53.0, 55.34], [56.0, 59.48], [61.0, 65.7], [67.0, 75.54], [76.0, 76.65], [78.0, 78.26], [79.0, 79.81], [82.0, 82.54], [85.0, 85.48], [88.0, 90.24], [91.0, 91.54], [96.0, 96.74], [98.0, 99.45], [101.0, 114.42], [116.0, 130.25], [132.0, 139.13], [141.0, 141.44], [143.0, 146.52], [150.0, 150.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 100.0, 99.87, 80.46, 0.0, 0.0, 0.0, 0.0, 0.0, 81.89, 0.0, 0.0, 0.0, 99.76, 99.84, 99.76, 0.0, 99.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.49, 0.85, 0.54, 2.5, 1.77, -0.22, 0.84, 2.2, 1.04, 2.34, 3.48, 4.7, 8.54, 0.65, 0.26, 0.81, 0.54, 0.48, 2.24, 0.54, 0.74, 1.45, 13.42, 14.25, 7.13, 0.44, 3.52, 0.16]} \ No newline at end of file diff --git a/annotations_1/tVxYCeRXzGo_filtered.json b/annotations_1/tVxYCeRXzGo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9945591bb87955c00964853aa6d26d523e5fc096 --- /dev/null +++ b/annotations_1/tVxYCeRXzGo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.83], [6.0, 7.03], [8.0, 9.61], [10.0, 11.79], [13.0, 14.98], [23.0, 25.78], [27.0, 28.56], [35.0, 36.98], [53.0, 54.97], [56.0, 56.81], [57.0, 58.7], [65.0, 65.67], [80.0, 80.65], [85.0, 86.0], [96.0, 97.68], [101.0, 101.88], [106.0, 106.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.83, 1.03, 1.61, 1.79, 1.98, 2.78, 1.56, 1.98, 1.97, 0.81, 1.7, 0.67, 0.65, 1.0, 1.68, 0.88, 0.88]} \ No newline at end of file diff --git a/annotations_1/tXF23iSwW3I_filtered.json b/annotations_1/tXF23iSwW3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..383bb02a1f53557dfe18b9f11bf41914543cc25d --- /dev/null +++ b/annotations_1/tXF23iSwW3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 31.19], [36.0, 36.59]], "keep_status": [false, false], "silence_prob": [33.95, 0.0], "audiomae_on_audioset": [[["music", 44.19], ["hum", 24.1], ["throbbing", 12.37]], null], "duration": [23.19, 0.59]} \ No newline at end of file diff --git a/annotations_1/tXhTaL04ByA_filtered.json b/annotations_1/tXhTaL04ByA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a6350de73e52b9a0adf867c7cfe9181f91f51859 --- /dev/null +++ b/annotations_1/tXhTaL04ByA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.18], [8.0, 8.78], [9.0, 9.64], [11.0, 13.12], [13.0, 16.51], [17.0, 17.37], [19.0, 20.43], [21.0, 21.47], [25.0, 25.41], [32.0, 37.64], [39.0, 40.58], [42.0, 50.8], [52.0, 52.51], [53.0, 62.07], [63.0, 75.44], [76.0, 80.55], [81.0, 81.21], [84.0, 84.32], [86.0, 93.06], [93.0, 93.88], [99.0, 99.22], [100.0, 100.48], [101.0, 101.39], [103.0, 103.91], [109.0, 109.78], [111.0, 111.23], [112.0, 112.67], [114.0, 115.57]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 50.66, 43.35, 0.0, 0.0, 0.0, 0.0, 48.65, 0.0, 35.2, 0.0, 46.75, 31.05, 33.2, 0.0, 0.0, 34.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 66.6], ["telephone", 10.35], ["sidetone", 9.51]], null, null, null, null, [["music", 31.02], ["theremin", 20.11], ["hum", 10.04]], null, [["music", 50.23], ["theremin", 24.25], ["musical instrument", 6.87]], null, [["theremin", 45.3], ["hum", 19.09], ["music", 13.7]], [["theremin", 57.13], ["music", 29.48], ["musical instrument", 3.07]], [["music", 28.92], ["foghorn", 7.98], ["speech", 7.23]], null, null, [["theremin", 23.36], ["music", 17.12], ["synthesizer", 10.42]], null, null, null, null, null, null, null, null, null], "duration": [1.18, 0.78, 0.64, 2.12, 3.51, 0.37, 1.43, 0.47, 0.41, 5.64, 1.58, 8.8, 0.51, 9.07, 12.44, 4.55, 0.21, 0.32, 7.06, 0.88, 0.22, 0.48, 0.39, 0.91, 0.78, 0.23, 0.67, 1.57]} \ No newline at end of file diff --git a/annotations_1/tXrxBy-CDPc_filtered.json b/annotations_1/tXrxBy-CDPc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e222f7cba26b3f6dcc0adf161925dc05bc1cb62d --- /dev/null +++ b/annotations_1/tXrxBy-CDPc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.92], [10.0, 11.65], [12.0, 13.56], [16.0, 18.64], [20.0, 20.58], [21.0, 23.09], [25.0, 28.58], [30.0, 35.7], [37.0, 37.17], [39.0, 39.19], [41.0, 44.1], [45.0, 46.21], [48.0, 50.25], [51.0, 51.71], [52.0, 51.8], [52.0, 52.15], [53.0, 53.49], [54.0, 56.57], [57.0, 57.38], [58.0, 58.72], [59.0, 59.86], [63.0, 63.8], [66.0, 66.99], [74.0, 77.43], [82.0, 83.49], [85.0, 85.72], [87.0, 88.62], [91.0, 91.07], [92.0, 92.7], [94.0, 94.76], [96.0, 97.04], [99.0, 101.61], [103.0, 104.46], [114.0, 115.06], [116.0, 118.3], [120.0, 122.88], [125.0, 125.34], [126.0, 128.09], [131.0, 131.08], [131.0, 132.21], [134.0, 134.23], [138.0, 138.96], [139.0, 140.49], [141.0, 141.44], [142.0, 142.65], [145.0, 146.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 77.36, 0.0, 82.43, 99.84, 64.86, 0.0, 0.0, 69.61, 0.0, 63.31, 0.0, 0.0, 0.0, 0.0, 50.86, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 82.07, 80.82, 0.0, 88.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 1.65, 1.56, 2.64, 0.58, 2.09, 3.58, 5.7, 0.17, 0.19, 3.1, 1.21, 2.25, 0.71, -0.2, 0.15, 0.49, 2.57, 0.38, 0.72, 0.86, 0.8, 0.99, 3.43, 1.49, 0.72, 1.62, 0.07, 0.7, 0.76, 1.04, 2.61, 1.46, 1.06, 2.3, 2.88, 0.34, 2.09, 0.08, 1.21, 0.23, 0.96, 1.49, 0.44, 0.65, 1.65]} \ No newline at end of file diff --git a/annotations_1/tY5el7dZ9H0_filtered.json b/annotations_1/tY5el7dZ9H0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e22040669cd01f24fb537c48a12b740f59ff094d --- /dev/null +++ b/annotations_1/tY5el7dZ9H0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 21.02], [22.0, 22.94], [23.0, 24.14], [25.0, 26.65], [30.0, 31.45], [34.0, 34.97], [36.0, 36.85], [38.0, 39.02], [41.0, 42.2], [44.0, 45.49], [46.0, 46.57], [47.0, 47.73], [49.0, 50.3], [51.0, 51.63], [53.0, 54.26], [56.0, 60.54], [62.0, 62.21], [63.0, 63.73], [69.0, 69.33], [70.0, 70.95], [72.0, 73.03], [74.0, 75.34], [77.0, 76.87], [78.0, 77.73], [81.0, 81.51], [83.0, 83.93], [85.0, 86.14], [90.0, 90.51], [93.0, 93.56], [95.0, 96.45], [98.0, 99.3], [104.0, 106.81], [108.0, 117.86], [120.0, 120.8], [122.0, 126.32], [127.0, 128.26], [130.0, 130.79], [132.0, 132.65], [134.0, 135.24], [137.0, 173.79], [175.0, 176.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [65.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 84.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.4, 77.87, 0.0, 75.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.02, 0.94, 1.14, 1.65, 1.45, 0.97, 0.85, 1.02, 1.2, 1.49, 0.57, 0.73, 1.3, 0.63, 1.26, 4.54, 0.21, 0.73, 0.33, 0.95, 1.03, 1.34, -0.13, -0.27, 0.51, 0.93, 1.14, 0.51, 0.56, 1.45, 1.3, 2.81, 9.86, 0.8, 4.32, 1.26, 0.79, 0.65, 1.24, 36.79, 1.72]} \ No newline at end of file diff --git a/annotations_1/t_9GTwEOdkY_filtered.json b/annotations_1/t_9GTwEOdkY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f824d6da33bab22cdc9c7ac4416e92d70c23fd7f --- /dev/null +++ b/annotations_1/t_9GTwEOdkY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.0], [27.0, 31.92], [37.0, 37.86], [44.0, 52.68], [54.0, 55.7], [57.0, 110.47], [111.0, 112.67], [114.0, 114.51], [118.0, 132.88], [141.0, 141.86], [143.0, 173.58]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 42.37, 0.0, 53.65, 0.0, 0.0, 0.0, 0.0, 41.32, 0.0, 0.0], "audiomae_on_audioset": [null, [["singing bowl", 41.27], ["gong", 18.72], ["music", 8.97]], null, null, null, null, null, null, [["hum", 39.41], ["mains hum", 27.16], ["music", 12.84]], null, null], "duration": [1.0, 4.92, 0.86, 8.68, 1.7, 53.47, 1.67, 0.51, 14.88, 0.86, 30.58]} \ No newline at end of file diff --git a/annotations_1/t_FRWUPcR7Y_filtered.json b/annotations_1/t_FRWUPcR7Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dc91e2d29b7313b6e7a2700a60713d85f0d8acad --- /dev/null +++ b/annotations_1/t_FRWUPcR7Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.12], [13.0, 18.76], [22.0, 22.18], [27.0, 28.19], [36.0, 36.69], [38.0, 38.08], [39.0, 39.55], [41.0, 41.03]], "keep_status": [true, true, false, false, false, false, false, false], "silence_prob": [39.78, 41.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 30.56], ["bouncing", 9.11], ["music", 4.43]], [["noise", 18.0], ["hum", 6.67], ["thunk", 6.63]], null, null, null, null, null, null], "duration": [2.12, 5.76, 0.18, 1.19, 0.69, 0.08, 0.55, 0.03]} \ No newline at end of file diff --git a/annotations_1/t_JOKNfSn1w_filtered.json b/annotations_1/t_JOKNfSn1w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fd8cc60c2821295a3c912ac6f7642b51bf11c40 --- /dev/null +++ b/annotations_1/t_JOKNfSn1w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 52.32], [53.0, 53.18], [54.0, 54.95], [56.0, 58.94], [60.0, 69.03], [70.0, 71.34], [74.0, 78.38], [79.0, 114.3], [116.0, 135.62], [136.0, 140.16], [141.0, 140.95], [141.0, 169.25], [170.0, 172.91], [173.0, 181.84], [182.0, 186.46]], "keep_status": [false, false, false, true, false, false, true, false, true, false, false, false, true, true, true], "silence_prob": [0.0, 0.0, 0.0, 42.96, 31.82, 0.0, 28.77, 0.0, 29.49, 37.03, 0.0, 29.7, 28.75, 29.38, 30.02], "audiomae_on_audioset": [null, null, null, [["hum", 14.07], ["fly, housefly", 11.28], ["moo", 9.39]], [["mains hum", 38.35], ["hum", 28.03], ["fly, housefly", 9.47]], null, [["music", 20.81], ["sound effect", 7.95], ["whoosh, swoosh, swish", 6.27]], null, [["music", 17.71], ["livestock, farm animals, working animals", 10.01], ["throbbing", 7.8]], [["music", 63.28], ["squish", 8.44], ["crackle", 3.46]], null, [["music", 60.42], ["speech", 7.78], ["electronic music", 7.72]], [["rumble", 25.23], ["speech", 11.95], ["music", 6.26]], [["animal", 39.0], ["music", 12.86], ["speech", 6.81]], [["music", 51.09], ["throbbing", 2.45], ["musical instrument", 2.35]]], "duration": [49.32, 0.18, 0.95, 2.94, 9.03, 1.34, 4.38, 35.3, 19.62, 4.16, -0.05, 28.25, 2.91, 8.84, 4.46]} \ No newline at end of file diff --git a/annotations_1/taL06OVt4kQ_filtered.json b/annotations_1/taL06OVt4kQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b818dee21c70fc49eb88fb7dba630262bc40a57 --- /dev/null +++ b/annotations_1/taL06OVt4kQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 15.13], [16.0, 16.88], [18.0, 38.1], [38.0, 39.14], [40.0, 41.17], [42.0, 64.4], [66.0, 67.02], [69.0, 84.91], [85.0, 94.26], [94.0, 138.77], [139.0, 143.95], [146.0, 150.85], [152.0, 159.8], [161.0, 160.83]], "keep_status": [true, false, true, false, false, true, false, true, false, false, false, false, false, false], "silence_prob": [40.28, 0.0, 29.89, 0.0, 0.0, 31.16, 0.0, 46.43, 47.7, 0.0, 78.72, 60.6, 37.88, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 25.6], ["animal", 12.83], ["cattle, bovinae", 12.23]], null, [["music", 25.34], ["hum", 20.81], ["mains hum", 14.99]], null, null, [["explosion", 16.39], ["cattle, bovinae", 12.38], ["burst, pop", 9.78]], null, [["music", 35.67], ["speech", 8.48], ["cough", 8.21]], [["mains hum", 45.38], ["hum", 41.19], ["music", 3.23]], null, null, null, [["music", 47.62], ["mantra", 25.98], ["chant", 13.55]], null], "duration": [13.13, 0.88, 20.1, 1.14, 1.17, 22.4, 1.02, 15.91, 9.26, 44.77, 4.95, 4.85, 7.8, -0.17]} \ No newline at end of file diff --git a/annotations_1/taOda6ZwWyw_filtered.json b/annotations_1/taOda6ZwWyw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..57e228c333302d889d30f22517105d1afc2e0a7c --- /dev/null +++ b/annotations_1/taOda6ZwWyw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.13], [22.0, 24.66], [26.0, 26.37], [27.0, 31.9], [57.0, 57.94], [82.0, 84.52], [89.0, 90.93], [93.0, 109.27], [109.0, 109.46], [109.0, 113.32], [114.0, 118.08], [119.0, 118.98]], "keep_status": [false, false, false, true, false, true, false, true, false, true, true, false], "silence_prob": [0.0, 46.02, 0.0, 31.46, 0.0, 29.92, 0.0, 29.35, 0.0, 29.48, 35.1, 0.0], "audiomae_on_audioset": [null, [["music", 61.17], ["musical instrument", 10.79], ["speech", 7.12]], null, [["music", 30.25], ["speech", 24.51], ["musical instrument", 7.26]], null, [["music", 35.64], ["speech", 10.25], ["throbbing", 7.03]], null, [["music", 41.32], ["animal", 11.02], ["speech", 6.91]], null, [["moo", 27.94], ["music", 21.2], ["livestock, farm animals, working animals", 20.67]], [["music", 24.01], ["didgeridoo", 21.86], ["foghorn", 5.46]], null], "duration": [1.13, 2.66, 0.37, 4.9, 0.94, 2.52, 1.93, 16.27, 0.46, 4.32, 4.08, -0.02]} \ No newline at end of file diff --git a/annotations_1/taf0MZ5VgDc_filtered.json b/annotations_1/taf0MZ5VgDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d0fa991726e7d567a79b83f335b99a5edf0cc1c --- /dev/null +++ b/annotations_1/taf0MZ5VgDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.48], [4.0, 3.75], [4.0, 6.42], [15.0, 14.59], [15.0, 14.62], [22.0, 24.85], [29.0, 44.71], [47.0, 52.74], [55.0, 65.72], [67.0, 67.46], [71.0, 79.78], [83.0, 83.86], [94.0, 95.08], [96.0, 97.19], [102.0, 101.98], [108.0, 113.91]], "keep_status": [false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 43.03, 0.0, 0.0, 60.05, 30.53, 49.68, 32.05, 0.0, 37.86, 0.0, 0.0, 0.0, 0.0, 30.59], "audiomae_on_audioset": [null, null, [["music", 38.66], ["throbbing", 14.01], ["animal", 10.53]], null, null, null, [["music", 70.05], ["throbbing", 5.23], ["whack, thwack", 2.79]], [["hum", 27.87], ["music", 23.8], ["throbbing", 11.17]], [["music", 25.51], ["throbbing", 18.38], ["hum", 9.46]], null, [["speech", 41.88], ["music", 34.31], ["boing", 5.28]], null, null, null, null, [["electric shaver, electric razor", 10.26], ["whack, thwack", 9.4], ["speech", 6.87]]], "duration": [0.48, -0.25, 2.42, -0.41, -0.38, 2.85, 15.71, 5.74, 10.72, 0.46, 8.78, 0.86, 1.08, 1.19, -0.02, 5.91]} \ No newline at end of file diff --git a/annotations_1/tb9kVTItw3I_filtered.json b/annotations_1/tb9kVTItw3I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e156a5971c2feb27d3fc238a66aa3e7899dd87b --- /dev/null +++ b/annotations_1/tb9kVTItw3I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 34.35], [38.0, 47.48], [48.0, 48.79], [53.0, 53.28], [54.0, 54.92], [61.0, 62.34], [72.0, 75.27], [76.0, 77.06], [78.0, 94.9], [99.0, 116.48], [116.0, 116.51], [118.0, 132.88], [134.0, 138.15], [144.0, 149.61]], "keep_status": [true, false, false, false, false, false, true, false, true, true, false, false, true, true], "silence_prob": [29.69, 32.2, 0.0, 0.0, 0.0, 0.0, 32.4, 0.0, 30.21, 31.72, 0.0, 30.56, 31.48, 31.54], "audiomae_on_audioset": [[["whale vocalization", 22.14], ["fart", 8.4], ["fly, housefly", 7.31]], [["music", 64.52], ["didgeridoo", 3.02], ["whale vocalization", 2.71]], null, null, null, null, [["livestock, farm animals, working animals", 24.03], ["cattle, bovinae", 19.9], ["moo", 13.53]], null, [["livestock, farm animals, working animals", 27.56], ["speech", 21.23], ["animal", 12.02]], [["speech", 43.39], ["buzz", 6.9], ["hum", 3.12]], null, [["music", 77.24], ["boing", 2.6], ["didgeridoo", 2.51]], [["music", 20.91], ["cattle, bovinae", 8.43], ["groan", 8.14]], [["roaring cats (lions, tigers)", 23.24], ["wild animals", 20.71], ["music", 16.6]]], "duration": [8.35, 9.48, 0.79, 0.28, 0.92, 1.34, 3.27, 1.06, 16.9, 17.48, 0.51, 14.88, 4.15, 5.61]} \ No newline at end of file diff --git a/annotations_1/tdADTzvJtSY_filtered.json b/annotations_1/tdADTzvJtSY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..872be4a9694b114280101b48733916e45cd833bc --- /dev/null +++ b/annotations_1/tdADTzvJtSY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.17], [10.0, 12.6], [14.0, 15.4], [18.0, 18.96], [22.0, 23.45], [25.0, 26.57], [27.0, 28.75], [32.0, 33.18], [36.0, 38.47], [40.0, 41.18], [42.0, 43.17], [45.0, 47.28], [48.0, 49.57], [51.0, 51.39], [53.0, 61.7], [63.0, 64.13], [66.0, 67.24], [69.0, 69.9], [73.0, 75.14], [77.0, 77.85], [79.0, 80.1], [82.0, 82.9], [89.0, 90.31], [92.0, 94.02], [95.0, 96.18], [97.0, 98.31], [100.0, 103.23], [105.0, 106.1], [110.0, 112.19], [113.0, 113.17], [114.0, 114.4], [115.0, 120.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.4, 99.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 0.0, 0.0, 88.28, 0.0, 0.0, 100.0, 0.0, 73.67, 0.0, 0.0, 75.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.17, 2.6, 1.4, 0.96, 1.45, 1.57, 1.75, 1.18, 2.47, 1.18, 1.17, 2.28, 1.57, 0.39, 8.7, 1.13, 1.24, 0.9, 2.14, 0.85, 1.1, 0.9, 1.31, 2.02, 1.18, 1.31, 3.23, 1.1, 2.19, 0.17, 0.4, 5.48]} \ No newline at end of file diff --git a/annotations_1/tdzX5AKWiDw_filtered.json b/annotations_1/tdzX5AKWiDw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5d715addd71c6291eccfbaaeae4791555c9a41a5 --- /dev/null +++ b/annotations_1/tdzX5AKWiDw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.38], [14.0, 14.52], [15.0, 16.66], [18.0, 18.71], [25.0, 25.88], [26.0, 26.86], [29.0, 30.05], [31.0, 33.24], [35.0, 35.6], [39.0, 40.29], [48.0, 48.17], [53.0, 54.65], [56.0, 57.16], [60.0, 61.84], [64.0, 65.35], [72.0, 72.15], [73.0, 74.01], [77.0, 78.76], [83.0, 83.61], [103.0, 104.85], [107.0, 107.77], [110.0, 111.2], [115.0, 116.58], [121.0, 122.77], [124.0, 125.32], [126.0, 127.25], [128.0, 130.59], [134.0, 135.26], [150.0, 150.62], [152.0, 152.51], [154.0, 155.14], [157.0, 164.51], [165.0, 166.06], [167.0, 168.71], [170.0, 171.49], [180.0, 180.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.3, 0.0, 0.0, 0.0, 0.0, 55.53, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.38, 0.52, 1.66, 0.71, 0.88, 0.86, 1.05, 2.24, 0.6, 1.29, 0.17, 1.65, 1.16, 1.84, 1.35, 0.15, 1.01, 1.76, 0.61, 1.85, 0.77, 1.2, 1.58, 1.77, 1.32, 1.25, 2.59, 1.26, 0.62, 0.51, 1.14, 7.51, 1.06, 1.71, 1.49, 0.5]} \ No newline at end of file diff --git a/annotations_1/te2WMrdJ3yQ_filtered.json b/annotations_1/te2WMrdJ3yQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25ce5b90e764f125f949d3773b585129980844b0 --- /dev/null +++ b/annotations_1/te2WMrdJ3yQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 26.76], [27.0, 26.91], [27.0, 27.58], [29.0, 31.7], [33.0, 33.66], [34.0, 34.97], [36.0, 38.85], [41.0, 42.55], [53.0, 53.89], [60.0, 60.05], [61.0, 63.0], [66.0, 66.58], [68.0, 69.38], [71.0, 71.58], [74.0, 79.37], [82.0, 82.63], [83.0, 82.86], [88.0, 89.87], [97.0, 98.19], [102.0, 102.93], [104.0, 105.27], [107.0, 107.81], [108.0, 111.3], [116.0, 116.36], [121.0, 122.55], [127.0, 131.67], [141.0, 145.93], [146.0, 148.49], [151.0, 155.31], [158.0, 158.75], [159.0, 158.97], [159.0, 178.14], [180.0, 180.18]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 49.87, 0.0, 0.0, 31.85, 0.0, 0.0, 0.0, 46.61, 0.0, 0.0, 0.0, 54.63, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.52, 0.0, 0.0, 70.16, 29.69, 34.94, 31.94, 0.0, 0.0, 30.62, 0.0], "audiomae_on_audioset": [null, null, null, [["whale vocalization", 22.0], ["rumble", 10.77], ["hum", 8.18]], null, null, [["fly, housefly", 40.82], ["mosquito", 21.64], ["insect", 19.11]], null, null, null, [["speech", 31.33], ["hum", 15.45], ["music", 13.26]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.63], ["hum", 15.08], ["throbbing", 10.96]], null, null, null, [["speech", 20.58], ["livestock, farm animals, working animals", 14.47], ["explosion", 9.46]], [["music", 28.27], ["groan", 13.71], ["cattle, bovinae", 6.02]], [["speech", 47.06], ["animal", 4.5], ["boing", 3.71]], null, null, [["music", 50.4], ["speech", 19.99], ["hum", 4.03]], null], "duration": [-0.24, -0.09, 0.58, 2.7, 0.66, 0.97, 2.85, 1.55, 0.89, 0.05, 2.0, 0.58, 1.38, 0.58, 5.37, 0.63, -0.14, 1.87, 1.19, 0.93, 1.27, 0.81, 3.3, 0.36, 1.55, 4.67, 4.93, 2.49, 4.31, 0.75, -0.03, 19.14, 0.18]} \ No newline at end of file diff --git a/annotations_1/tekVuL2mT7A_filtered.json b/annotations_1/tekVuL2mT7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2acf003e321781b8116225365b66bbf75d0b1fa --- /dev/null +++ b/annotations_1/tekVuL2mT7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 12.23], [14.0, 14.17], [15.0, 14.64], [15.0, 14.69], [15.0, 14.94], [16.0, 41.5], [44.0, 46.87], [51.0, 51.38], [52.0, 52.22], [59.0, 63.37], [64.0, 65.5], [67.0, 81.19], [81.0, 82.22], [82.0, 83.62], [119.0, 119.26], [127.0, 128.98], [134.0, 134.08], [134.0, 136.39], [139.0, 142.64], [153.0, 153.22], [154.0, 156.1], [157.0, 158.94], [162.0, 164.86], [166.0, 166.82], [168.0, 172.81], [179.0, 193.56], [197.0, 199.35], [220.0, 222.32], [223.0, 223.4], [230.0, 234.27], [235.0, 236.38]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, true, false], "silence_prob": [95.37, 0.0, 0.0, 0.0, 0.0, 37.66, 35.99, 0.0, 0.0, 31.45, 0.0, 33.96, 0.0, 0.0, 0.0, 0.0, 0.0, 50.36, 63.96, 0.0, 37.55, 0.0, 29.1, 0.0, 29.02, 30.27, 40.47, 41.36, 0.0, 42.22, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 28.53], ["speech", 15.44], ["hum", 11.65]], [["speech", 44.31], ["music", 15.86], ["foghorn", 10.17]], null, null, [["speech", 43.49], ["music", 19.45], ["fart", 13.2]], null, [["fly, housefly", 22.9], ["music", 22.78], ["insect", 15.53]], null, null, null, null, null, null, null, null, [["speech", 56.15], ["moo", 10.12], ["cattle, bovinae", 8.72]], null, [["speech", 19.28], ["music", 19.18], ["cattle, bovinae", 8.39]], null, [["music", 56.34], ["throbbing", 10.7], ["hum", 7.38]], [["boing", 41.08], ["music", 28.09], ["whack, thwack", 8.56]], [["whale vocalization", 18.91], ["fly, housefly", 14.77], ["insect", 12.32]], [["animal", 16.35], ["speech", 13.54], ["canidae, dogs, wolves", 11.11]], null, [["livestock, farm animals, working animals", 18.15], ["cattle, bovinae", 17.2], ["moo", 16.86]], null], "duration": [4.23, 0.17, -0.36, -0.31, -0.06, 25.5, 2.87, 0.38, 0.22, 4.37, 1.5, 14.19, 1.22, 1.62, 0.26, 1.98, 0.08, 2.39, 3.64, 0.22, 2.1, 1.94, 2.86, 0.82, 4.81, 14.56, 2.35, 2.32, 0.4, 4.27, 1.38]} \ No newline at end of file diff --git a/annotations_1/teoyewW1bUY_filtered.json b/annotations_1/teoyewW1bUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42f3bddf8005e7c4ff40637b262d53b31998f41d --- /dev/null +++ b/annotations_1/teoyewW1bUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.9], [10.0, 11.13], [14.0, 16.56], [20.0, 20.76], [22.0, 22.79], [27.0, 28.36], [33.0, 33.99], [36.0, 36.76], [40.0, 40.47], [43.0, 43.5], [45.0, 46.21], [52.0, 53.32], [55.0, 57.77], [59.0, 60.39], [62.0, 64.37], [66.0, 67.0], [68.0, 68.27], [70.0, 70.09], [74.0, 75.3], [77.0, 76.92], [81.0, 81.26], [85.0, 86.81], [92.0, 94.07], [97.0, 99.5], [100.0, 103.54], [107.0, 108.67], [120.0, 121.59], [123.0, 124.17], [125.0, 126.44], [130.0, 131.28], [135.0, 136.39], [138.0, 138.28], [141.0, 141.59], [142.0, 143.78], [146.0, 146.62], [148.0, 150.38], [152.0, 152.34], [155.0, 155.38], [158.0, 158.45], [164.0, 164.86], [167.0, 168.79], [170.0, 171.46], [173.0, 176.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 59.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 99.82, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.82], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.54], ["singing bowl", 20.17], ["gong", 19.83]], null, null, null, null, null, null, [["music", 41.61], ["ambient music", 31.19], ["electronic music", 6.26]]], "duration": [0.9, 1.13, 2.56, 0.76, 0.79, 1.36, 0.99, 0.76, 0.47, 0.5, 1.21, 1.32, 2.77, 1.39, 2.37, 1.0, 0.27, 0.09, 1.3, -0.08, 0.26, 1.81, 2.07, 2.5, 3.54, 1.67, 1.59, 1.17, 1.44, 1.28, 1.39, 0.28, 0.59, 1.78, 0.62, 2.38, 0.34, 0.38, 0.45, 0.86, 1.79, 1.46, 3.22]} \ No newline at end of file diff --git a/annotations_1/tf_RRItKJm0_filtered.json b/annotations_1/tf_RRItKJm0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..badd399cb41239e2c0d582af5567f18eb5aafbef --- /dev/null +++ b/annotations_1/tf_RRItKJm0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 17.17], [20.0, 22.69], [25.0, 48.14], [51.0, 69.52], [74.0, 77.82], [79.0, 79.37], [80.0, 90.53], [98.0, 99.05], [106.0, 106.44], [107.0, 111.59], [122.0, 137.69], [143.0, 146.53]], "keep_status": [true, false, false, false, true, false, true, false, false, true, false, true], "silence_prob": [40.47, 42.53, 32.48, 46.79, 40.84, 0.0, 33.72, 0.0, 0.0, 38.52, 32.48, 32.09], "audiomae_on_audioset": [[["rumble", 28.95], ["hum", 24.54], ["music", 13.81]], [["hum", 31.55], ["music", 22.66], ["throbbing", 18.05]], [["hum", 45.16], ["mains hum", 30.35], ["music", 11.27]], [["music", 77.34], ["ambient music", 3.75], ["theremin", 2.97]], [["music", 48.37], ["electronic music", 12.31], ["hum", 5.73]], null, [["speech", 28.57], ["music", 9.03], ["hum", 8.26]], null, null, [["music", 55.32], ["electronic music", 10.0], ["hum", 3.27]], [["hum", 51.08], ["throbbing", 19.2], ["mains hum", 17.87]], [["music", 36.43], ["speech", 28.48], ["electronic music", 3.97]]], "duration": [4.17, 2.69, 23.14, 18.52, 3.82, 0.37, 10.53, 1.05, 0.44, 4.59, 15.69, 3.53]} \ No newline at end of file diff --git a/annotations_1/tg4jLJ6OiDY_filtered.json b/annotations_1/tg4jLJ6OiDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f416cded8c3172a8b6f336aab3c548a33f81ea0a --- /dev/null +++ b/annotations_1/tg4jLJ6OiDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [5.0, 6.13], [7.0, 8.65], [10.0, 10.89], [12.0, 19.16], [22.0, 23.18], [24.0, 24.19], [25.0, 25.52], [26.0, 29.24], [39.0, 39.45], [43.0, 45.39], [48.0, 47.85], [50.0, 49.96], [53.0, 54.04], [62.0, 64.67], [66.0, 66.93], [74.0, 73.94], [80.0, 80.33], [82.0, 85.41], [86.0, 86.83], [88.0, 88.45], [89.0, 97.24], [100.0, 103.11], [111.0, 112.45], [123.0, 123.82], [128.0, 129.19]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 57.97, 0.0, 0.0, 0.0, 45.43, 0.0, 45.82, 0.0, 0.0, 0.0, 46.02, 0.0, 0.0, 0.0, 60.51, 0.0, 0.0, 76.37, 57.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["dog", 20.92], ["bow-wow", 14.8], ["animal", 12.26]], null, [["music", 49.41], ["speech", 22.31], ["musical instrument", 5.72]], null, null, null, [["music", 72.44], ["synthesizer", 4.64], ["sidetone", 4.29]], null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 1.13, 1.65, 0.89, 7.16, 1.18, 0.19, 0.52, 3.24, 0.45, 2.39, -0.15, -0.04, 1.04, 2.67, 0.93, -0.06, 0.33, 3.41, 0.83, 0.45, 8.24, 3.11, 1.45, 0.82, 1.19]} \ No newline at end of file diff --git a/annotations_1/tgHcYxKjwVE_filtered.json b/annotations_1/tgHcYxKjwVE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d96b3048d9fc723d821c92202f193a7b0d13b622 --- /dev/null +++ b/annotations_1/tgHcYxKjwVE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.09], [16.0, 16.29], [17.0, 18.59], [20.0, 20.8], [22.0, 25.25], [27.0, 28.44], [29.0, 30.0], [31.0, 32.12], [32.0, 33.15], [34.0, 36.76], [37.0, 38.67], [39.0, 39.75], [41.0, 44.88], [46.0, 46.77], [49.0, 49.25], [50.0, 50.75], [52.0, 53.55], [55.0, 58.89], [65.0, 65.5], [68.0, 68.22], [69.0, 69.89], [73.0, 74.16], [79.0, 88.25], [89.0, 91.0], [91.0, 91.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.81, 0.0, 0.0, 0.0, 0.0, 34.29, 0.0, 0.0, 49.82, 0.0, 0.0, 0.0, 0.0, 41.98, 0.0, 0.0, 0.0, 0.0, 88.83, 40.64, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 61.78], ["speech", 14.85], ["whale vocalization", 6.03]], null, null, null, null, [["speech", 57.1], ["sidetone", 20.68], ["dial tone", 5.01]], null, null, [["sidetone", 42.4], ["speech", 25.28], ["chirp tone", 8.31]], null, null, null, null, [["speech", 49.39], ["dial tone", 6.19], ["telephone", 5.09]], null, null, null, null, null, [["livestock, farm animals, working animals", 30.47], ["cattle, bovinae", 14.26], ["fly, housefly", 8.26]], null], "duration": [1.09, 0.29, 1.59, 0.8, 3.25, 1.44, 1.0, 1.12, 1.15, 2.76, 1.67, 0.75, 3.88, 0.77, 0.25, 0.75, 1.55, 3.89, 0.5, 0.22, 0.89, 1.16, 9.25, 2.0, 0.54]} \ No newline at end of file diff --git a/annotations_1/ti39GhRZkrw_filtered.json b/annotations_1/ti39GhRZkrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6219e447cbc518f24705c867bd9f8845df41696 --- /dev/null +++ b/annotations_1/ti39GhRZkrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.06], [9.0, 9.32], [11.0, 13.68], [15.0, 16.41], [22.0, 25.56], [28.0, 31.08], [31.0, 33.61], [38.0, 38.48], [40.0, 40.59], [43.0, 44.04], [46.0, 48.63], [51.0, 51.63], [53.0, 53.62], [56.0, 56.24], [58.0, 59.24], [63.0, 63.24], [68.0, 68.4], [71.0, 71.41], [72.0, 74.49], [76.0, 76.05], [79.0, 79.84], [83.0, 84.42], [88.0, 88.67], [94.0, 95.59], [123.0, 123.06], [124.0, 124.68], [131.0, 130.89], [136.0, 136.36], [142.0, 143.77], [148.0, 150.01], [155.0, 156.22], [161.0, 161.96], [164.0, 163.68]], "keep_status": [false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 42.58, 0.0, 41.87, 45.36, 30.24, 0.0, 0.0, 0.0, 48.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.56, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 35.61], ["hum", 16.0], ["mains hum", 8.31]], null, [["speech", 43.97], ["music", 20.85], ["sonar", 5.39]], [["whip", 30.18], ["sidetone", 10.0], ["crack", 6.5]], [["mains hum", 42.44], ["hum", 22.49], ["music", 7.17]], null, null, null, [["didgeridoo", 32.06], ["music", 29.29], ["whale vocalization", 4.86]], null, null, null, null, null, null, null, [["electric shaver, electric razor", 62.98], ["speech", 25.25], ["mains hum", 3.02]], null, null, null, null, null, null, null, null, null, null, [["music", 27.1], ["hum", 22.76], ["mains hum", 12.03]], null, null, null], "duration": [1.06, 0.32, 2.68, 1.41, 3.56, 3.08, 2.61, 0.48, 0.59, 1.04, 2.63, 0.63, 0.62, 0.24, 1.24, 0.24, 0.4, 0.41, 2.49, 0.05, 0.84, 1.42, 0.67, 1.59, 0.06, 0.68, -0.11, 0.36, 1.77, 2.01, 1.22, 0.96, -0.32]} \ No newline at end of file diff --git a/annotations_1/ti3HSBmEoVU_filtered.json b/annotations_1/ti3HSBmEoVU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c21c6084506c698bfd607483ccd26a5be4b46171 --- /dev/null +++ b/annotations_1/ti3HSBmEoVU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.74], [8.0, 9.05], [12.0, 15.53], [16.0, 20.39], [21.0, 22.54], [26.0, 26.99], [33.0, 33.54], [35.0, 35.68], [36.0, 36.54], [37.0, 37.76], [38.0, 38.69], [39.0, 45.55], [48.0, 48.42], [49.0, 51.53], [52.0, 53.7], [55.0, 67.14], [68.0, 84.33], [85.0, 86.88], [88.0, 117.24], [121.0, 131.5], [135.0, 141.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.36, 0.0, 84.07, 78.04, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.45, 0.0, 59.15, 0.0, 70.3, 93.45, 0.0, 31.61, 31.94, 32.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 69.43], ["musical instrument", 2.65], ["wind instrument, woodwind instrument", 1.99]], [["music", 82.91], ["musical instrument", 1.84], ["guitar", 1.29]], [["music", 65.04], ["didgeridoo", 7.91], ["mosquito", 1.93]]], "duration": [3.74, 1.05, 3.53, 4.39, 1.54, 0.99, 0.54, 0.68, 0.54, 0.76, 0.69, 6.55, 0.42, 2.53, 1.7, 12.14, 16.33, 1.88, 29.24, 10.5, 6.62]} \ No newline at end of file diff --git a/annotations_1/ti9jg0JOK2I_filtered.json b/annotations_1/ti9jg0JOK2I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..32918c2e0a131babd4b9a01b2f9adb73bc9aa424 --- /dev/null +++ b/annotations_1/ti9jg0JOK2I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.61], [19.0, 25.1], [29.0, 28.92], [29.0, 52.19], [53.0, 55.65], [57.0, 57.43], [59.0, 95.37], [98.0, 98.91], [104.0, 106.76], [109.0, 109.02], [111.0, 113.91], [115.0, 115.89], [120.0, 121.2], [132.0, 135.46]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 29.5, 0.0, 27.89, 28.22, 0.0, 0.0, 0.0, 27.99, 0.0, 32.0, 0.0, 0.0, 28.04], "audiomae_on_audioset": [null, [["throbbing", 38.41], ["music", 18.65], ["hum", 14.85]], null, [["speech", 44.2], ["music", 20.7], ["buzz", 7.89]], [["music", 83.05], ["cacophony", 2.39], ["speech", 1.63]], null, null, null, [["breaking", 87.23], ["music", 4.55], ["smash, crash", 2.13]], null, [["music", 27.37], ["speech", 20.77], ["throbbing", 13.91]], null, null, [["music", 58.67], ["boing", 4.66], ["didgeridoo", 3.39]]], "duration": [0.61, 6.1, -0.08, 23.19, 2.65, 0.43, 36.37, 0.91, 2.76, 0.02, 2.91, 0.89, 1.2, 3.46]} \ No newline at end of file diff --git a/annotations_1/tkWWtYRbnq8_filtered.json b/annotations_1/tkWWtYRbnq8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..308c5a18d34e7b4033df4f7faae59347026ab95e --- /dev/null +++ b/annotations_1/tkWWtYRbnq8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.85], [17.0, 22.03], [23.0, 28.46], [31.0, 31.31], [44.0, 43.92], [48.0, 49.91], [53.0, 54.5], [56.0, 56.66], [59.0, 59.05], [61.0, 62.95], [64.0, 68.08], [70.0, 83.96], [88.0, 101.92], [106.0, 114.15], [124.0, 142.97], [145.0, 147.99], [148.0, 148.31], [152.0, 155.28]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false], "silence_prob": [0.0, 42.6, 88.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.43, 43.13, 37.46, 42.02, 33.93, 88.1, 0.0, 63.74], "audiomae_on_audioset": [null, [["speech", 37.67], ["whale vocalization", 14.11], ["music", 13.21]], null, null, null, null, null, null, null, null, [["music", 33.6], ["harp", 18.78], ["speech", 6.88]], [["music", 50.93], ["quack", 21.67], ["duck", 3.75]], [["music", 61.77], ["synthesizer", 6.27], ["speech", 5.27]], [["music", 30.33], ["mains hum", 16.93], ["hum", 13.83]], [["music", 33.07], ["cattle, bovinae", 26.1], ["moo", 19.25]], null, null, null], "duration": [1.85, 5.03, 5.46, 0.31, -0.08, 1.91, 1.5, 0.66, 0.05, 1.95, 4.08, 13.96, 13.92, 8.15, 18.97, 2.99, 0.31, 3.28]} \ No newline at end of file diff --git a/annotations_1/tktoOXBmflI_filtered.json b/annotations_1/tktoOXBmflI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba2cdf43ecc73f8c4190c0625bd81d9421eb0824 --- /dev/null +++ b/annotations_1/tktoOXBmflI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.83], [14.0, 23.06], [24.0, 24.66], [25.0, 27.28], [28.0, 31.41], [32.0, 37.66], [38.0, 52.35], [54.0, 59.73], [61.0, 62.23], [63.0, 63.96], [66.0, 70.61], [73.0, 73.72], [76.0, 76.49], [77.0, 78.31], [82.0, 85.65], [87.0, 96.3], [97.0, 109.17], [110.0, 110.15], [110.0, 111.45], [115.0, 123.67], [128.0, 128.85], [133.0, 135.21], [137.0, 138.01]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [96.89, 70.44, 0.0, 51.66, 49.18, 76.37, 81.17, 99.21, 0.0, 0.0, 31.85, 0.0, 0.0, 0.0, 59.96, 33.82, 53.97, 0.0, 0.0, 79.24, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["boing", 42.32], ["noise", 12.8], ["speech", 8.53]], null, null, null, null, null, [["speech", 60.55], ["echo", 3.77], ["boing", 3.08]], null, null, null, null, [["music", 42.48], ["synthesizer", 8.48], ["musical instrument", 4.6]], null, null, null, null, null, null, null], "duration": [5.83, 9.06, 0.66, 2.28, 3.41, 5.66, 14.35, 5.73, 1.23, 0.96, 4.61, 0.72, 0.49, 1.31, 3.65, 9.3, 12.17, 0.15, 1.45, 8.67, 0.85, 2.21, 1.01]} \ No newline at end of file diff --git a/annotations_1/tlI--ATerwo_filtered.json b/annotations_1/tlI--ATerwo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fd8a6c5b7ff8289e24f9c8197b9819aa82f72d70 --- /dev/null +++ b/annotations_1/tlI--ATerwo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.3], [12.0, 13.27], [14.0, 14.89], [16.0, 16.01], [17.0, 17.17], [22.0, 22.52], [26.0, 26.25], [27.0, 27.7], [29.0, 29.2], [38.0, 38.74], [39.0, 42.03], [43.0, 43.34], [48.0, 47.78], [49.0, 53.97], [56.0, 57.21], [58.0, 58.35], [59.0, 59.81], [61.0, 61.3], [68.0, 68.84], [70.0, 71.02]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.76, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.3, 1.27, 0.89, 0.01, 0.17, 0.52, 0.25, 0.7, 0.2, 0.74, 3.03, 0.34, -0.22, 4.97, 1.21, 0.35, 0.81, 0.3, 0.84, 1.02]} \ No newline at end of file diff --git a/annotations_1/tlJM0tgXu5Q_filtered.json b/annotations_1/tlJM0tgXu5Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5516980b7f4325da16b6306e719896f7e68fec59 --- /dev/null +++ b/annotations_1/tlJM0tgXu5Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.76], [3.0, 112.41]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [0.76, 109.41]} \ No newline at end of file diff --git a/annotations_1/tlLSqeVA_no_filtered.json b/annotations_1/tlLSqeVA_no_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7318273d8cd0a91287e9724359dc28ca9479a076 --- /dev/null +++ b/annotations_1/tlLSqeVA_no_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.26], [21.0, 21.2], [22.0, 22.82], [34.0, 34.26], [35.0, 45.33], [47.0, 51.33], [53.0, 54.57], [57.0, 57.54], [60.0, 66.77], [69.0, 89.73], [90.0, 90.49], [106.0, 106.47], [107.0, 108.46], [112.0, 112.95], [120.0, 120.51], [123.0, 124.16], [128.0, 128.22], [131.0, 135.95]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 39.27, 100.0, 0.0, 0.0, 32.27, 31.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.89], "audiomae_on_audioset": [null, null, null, null, [["crow", 29.48], ["animal", 20.93], ["caw", 14.87]], null, null, null, [["speech", 62.73], ["quack", 6.48], ["duck", 4.72]], [["cattle, bovinae", 40.42], ["livestock, farm animals, working animals", 25.43], ["moo", 14.12]], null, null, null, null, null, null, null, null], "duration": [1.26, 0.2, 0.82, 0.26, 10.33, 4.33, 1.57, 0.54, 6.77, 20.73, 0.49, 0.47, 1.46, 0.95, 0.51, 1.16, 0.22, 4.95]} \ No newline at end of file diff --git a/annotations_1/tlSscKeO9Cc_filtered.json b/annotations_1/tlSscKeO9Cc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb9130c7f3d95367cbe625953ca1c4dbfd30a16f --- /dev/null +++ b/annotations_1/tlSscKeO9Cc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 18.91], [26.0, 27.18], [28.0, 28.63], [29.0, 31.45], [33.0, 33.35], [35.0, 54.09], [56.0, 63.75], [68.0, 76.47], [78.0, 78.43], [80.0, 85.41], [86.0, 92.91], [97.0, 112.04], [114.0, 119.52], [124.0, 131.31], [138.0, 147.77]], "keep_status": [true, false, false, true, false, false, false, true, false, true, false, true, true, true, true], "silence_prob": [29.72, 0.0, 0.0, 31.8, 0.0, 28.73, 28.53, 28.55, 0.0, 29.22, 28.25, 28.37, 30.89, 29.14, 28.65], "audiomae_on_audioset": [[["speech", 36.22], ["aircraft", 11.23], ["vehicle", 9.18]], null, null, [["speech", 17.78], ["music", 17.2], ["mains hum", 4.87]], null, [["music", 72.79], ["synthesizer", 5.33], ["electronic music", 3.88]], [["music", 45.16], ["speech", 13.43], ["hum", 13.0]], [["vehicle", 23.56], ["music", 13.87], ["speech", 11.24]], null, [["vehicle", 29.97], ["speech", 10.6], ["car", 10.36]], [["motorcycle", 62.21], ["vehicle", 8.74], ["speech", 6.45]], [["vehicle", 38.21], ["car", 13.13], ["speech", 11.31]], [["music", 49.09], ["synthesizer", 13.11], ["speech", 5.93]], [["music", 32.66], ["throbbing", 18.22], ["hum", 13.03]], [["music", 32.53], ["speech", 24.53], ["outside, rural or natural", 5.82]]], "duration": [6.91, 1.18, 0.63, 2.45, 0.35, 19.09, 7.75, 8.47, 0.43, 5.41, 6.91, 15.04, 5.52, 7.31, 9.77]} \ No newline at end of file diff --git a/annotations_1/tmUleIek9Fc_filtered.json b/annotations_1/tmUleIek9Fc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f66384053978ff86a3b8d3a4dafb499f3736e969 --- /dev/null +++ b/annotations_1/tmUleIek9Fc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.84], [17.0, 17.47], [18.0, 39.41], [41.0, 41.86], [42.0, 46.21], [48.0, 49.71], [51.0, 51.61], [55.0, 61.72], [64.0, 74.38], [77.0, 77.19], [81.0, 81.65], [85.0, 86.27], [87.0, 88.67], [91.0, 93.5], [94.0, 98.05], [98.0, 99.66], [100.0, 102.66], [104.0, 106.64], [107.0, 107.54], [108.0, 110.15], [111.0, 112.9], [114.0, 115.25], [116.0, 119.35], [120.0, 123.97], [127.0, 129.76], [130.0, 133.81], [135.0, 137.66], [138.0, 140.54], [141.0, 146.77], [147.0, 149.67]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 42.0, 0.0, 53.22, 0.0, 0.0, 63.1, 70.44, 0.0, 0.0, 0.0, 0.0, 99.26, 82.79, 0.0, 98.86, 100.0, 0.0, 93.91, 0.0, 0.0, 96.17, 77.53, 99.85, 61.97, 98.8, 48.14, 91.13, 80.46], "audiomae_on_audioset": [null, null, [["music", 18.13], ["animal", 13.93], ["hum", 9.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 23.05], ["music", 22.09], ["hum", 17.41]], null, null], "duration": [0.84, 0.47, 21.41, 0.86, 4.21, 1.71, 0.61, 6.72, 10.38, 0.19, 0.65, 1.27, 1.67, 2.5, 4.05, 1.66, 2.66, 2.64, 0.54, 2.15, 1.9, 1.25, 3.35, 3.97, 2.76, 3.81, 2.66, 2.54, 5.77, 2.67]} \ No newline at end of file diff --git a/annotations_1/tm_W36kWahM_filtered.json b/annotations_1/tm_W36kWahM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84f938de9916d744c6b94c1287ddaf08b855370b --- /dev/null +++ b/annotations_1/tm_W36kWahM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.6], [16.0, 15.65], [17.0, 17.39], [19.0, 19.57], [33.0, 33.79], [34.0, 38.47], [40.0, 40.81], [41.0, 42.01], [43.0, 44.39], [47.0, 48.66], [51.0, 52.25], [54.0, 54.5], [58.0, 58.51], [60.0, 59.8], [63.0, 67.19], [68.0, 69.65], [76.0, 76.87], [77.0, 80.06], [81.0, 82.39], [87.0, 100.7], [102.0, 102.56], [104.0, 107.2], [109.0, 116.04], [118.0, 120.93], [122.0, 137.17], [138.0, 150.23], [152.0, 154.92]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [37.2, 0.0, 0.0, 0.0, 0.0, 55.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.36, 0.0, 0.0, 48.31, 0.0, 99.99, 0.0, 49.36, 97.11, 82.25, 99.16, 66.27, 99.96], "audiomae_on_audioset": [[["speech", 54.1], ["sidetone", 12.59], ["hum", 8.05]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.73], ["music", 9.99], ["chirp tone", 9.32]], null, null, null, [["speech", 61.64], ["singing bowl", 13.46], ["music", 4.59]], null, null, null, null, null], "duration": [3.6, -0.35, 0.39, 0.57, 0.79, 4.47, 0.81, 1.01, 1.39, 1.66, 1.25, 0.5, 0.51, -0.2, 4.19, 1.65, 0.87, 3.06, 1.39, 13.7, 0.56, 3.2, 7.04, 2.93, 15.17, 12.23, 2.92]} \ No newline at end of file diff --git a/annotations_1/tp1eVLXEXm8_filtered.json b/annotations_1/tp1eVLXEXm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9eac2edfc5c1619693e0d9339cee79b7016c6d5f --- /dev/null +++ b/annotations_1/tp1eVLXEXm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.61], [14.0, 20.92], [21.0, 26.89], [34.0, 52.52], [56.0, 59.37], [62.0, 62.99], [71.0, 72.62], [81.0, 95.05], [111.0, 116.9], [119.0, 122.77], [124.0, 128.46], [131.0, 131.89], [133.0, 135.04], [136.0, 138.47], [139.0, 138.54], [140.0, 147.16]], "keep_status": [false, true, true, false, false, false, false, false, true, true, false, false, false, false, false, true], "silence_prob": [0.0, 37.01, 36.61, 33.24, 36.69, 0.0, 0.0, 32.41, 31.82, 36.99, 57.72, 0.0, 35.48, 34.14, 0.0, 31.65], "audiomae_on_audioset": [null, [["music", 25.68], ["boing", 21.45], ["speech", 18.34]], [["music", 42.67], ["speech", 15.3], ["animal", 4.12]], [["music", 61.94], ["theremin", 16.68], ["speech", 4.14]], [["music", 48.54], ["guitar", 19.03], ["musical instrument", 8.47]], null, null, [["music", 60.04], ["boing", 7.09], ["speech", 5.96]], [["boing", 28.46], ["music", 19.82], ["speech", 13.86]], [["boing", 23.73], ["music", 12.46], ["speech", 11.2]], null, null, [["whale vocalization", 48.77], ["music", 17.06], ["speech", 7.27]], [["fly, housefly", 49.71], ["mosquito", 23.65], ["insect", 18.67]], null, [["music", 38.48], ["speech", 5.21], ["hum", 4.44]]], "duration": [0.61, 6.92, 5.89, 18.52, 3.37, 0.99, 1.62, 14.05, 5.9, 3.77, 4.46, 0.89, 2.04, 2.47, -0.46, 7.16]} \ No newline at end of file diff --git a/annotations_1/tpsGUGc8Ri8_filtered.json b/annotations_1/tpsGUGc8Ri8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..152d5825cbf25b68de588ff88db5727a2933258b --- /dev/null +++ b/annotations_1/tpsGUGc8Ri8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 11.87], [17.0, 31.23], [35.0, 35.21], [39.0, 39.39], [40.0, 41.79], [45.0, 45.32], [45.0, 48.0], [58.0, 59.58], [60.0, 63.37], [64.0, 63.78], [64.0, 76.79], [79.0, 87.52], [88.0, 93.16], [94.0, 99.01], [101.0, 109.09], [109.0, 109.71], [112.0, 150.26], [159.0, 174.8]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [34.88, 31.3, 0.0, 0.0, 0.0, 0.0, 31.12, 0.0, 31.96, 0.0, 30.99, 29.54, 30.36, 29.52, 29.01, 0.0, 0.0, 29.58], "audiomae_on_audioset": [[["sidetone", 36.57], ["speech", 21.45], ["music", 11.88]], [["music", 71.03], ["throbbing", 6.27], ["hum", 5.55]], null, null, null, null, [["music", 51.38], ["speech", 7.04], ["electronic music", 5.05]], null, [["music", 26.7], ["speech", 14.37], ["sidetone", 10.66]], null, [["hum", 33.89], ["throbbing", 24.99], ["mains hum", 24.67]], [["music", 64.25], ["throbbing", 16.23], ["hum", 6.04]], [["music", 73.36], ["speech", 3.59], ["electronic music", 2.44]], [["music", 31.1], ["speech", 21.35], ["breaking", 19.06]], [["music", 70.67], ["speech", 14.8], ["throbbing", 4.18]], null, null, [["music", 61.83], ["hum", 12.24], ["throbbing", 10.77]]], "duration": [4.87, 14.23, 0.21, 0.39, 1.79, 0.32, 3.0, 1.58, 3.37, -0.22, 12.79, 8.52, 5.16, 5.01, 8.09, 0.71, 38.26, 15.8]} \ No newline at end of file diff --git a/annotations_1/tqmbgqyc1bc_filtered.json b/annotations_1/tqmbgqyc1bc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3522141ce643831fd9eb20414d764e26f6018920 --- /dev/null +++ b/annotations_1/tqmbgqyc1bc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 12.73], [14.0, 14.35], [15.0, 22.69], [28.0, 29.44], [33.0, 34.59], [46.0, 87.88], [95.0, 108.9], [112.0, 127.28], [133.0, 139.08], [142.0, 145.4], [147.0, 147.56], [149.0, 150.48], [151.0, 153.39], [154.0, 154.95], [156.0, 158.58], [159.0, 161.03], [162.0, 164.0], [166.0, 176.94]], "keep_status": [false, false, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [50.31, 0.0, 39.8, 0.0, 0.0, 0.0, 29.26, 29.73, 75.88, 41.91, 0.0, 0.0, 59.42, 0.0, 56.33, 57.4, 67.76, 52.1], "audiomae_on_audioset": [null, null, [["music", 32.57], ["speech", 21.39], ["throbbing", 9.28]], null, null, null, [["music", 72.57], ["throbbing", 3.51], ["electronic music", 2.23]], [["music", 46.88], ["mains hum", 7.11], ["speech", 4.65]], null, [["speech", 28.11], ["music", 16.35], ["fly, housefly", 8.77]], null, null, null, null, null, null, null, null], "duration": [5.73, 0.35, 7.69, 1.44, 1.59, 41.88, 13.9, 15.28, 6.08, 3.4, 0.56, 1.48, 2.39, 0.95, 2.58, 2.03, 2.0, 10.94]} \ No newline at end of file diff --git a/annotations_1/tr2hYRUEkHk_filtered.json b/annotations_1/tr2hYRUEkHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d56a3310a5d74e16e5e68abc351abc5101edb161 --- /dev/null +++ b/annotations_1/tr2hYRUEkHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.87], [2.0, 3.82], [5.0, 5.39], [6.0, 8.6], [9.0, 9.15], [12.0, 12.83], [13.0, 13.2], [14.0, 13.85], [15.0, 20.55], [22.0, 23.03], [27.0, 27.41], [28.0, 29.44], [30.0, 30.64], [31.0, 45.6], [47.0, 49.82], [52.0, 57.13], [58.0, 59.46], [60.0, 65.52], [68.0, 70.53], [75.0, 78.27], [80.0, 81.31], [85.0, 85.4], [87.0, 87.45], [90.0, 102.68], [104.0, 109.22], [111.0, 115.77], [117.0, 121.81], [122.0, 123.85], [126.0, 131.95], [133.0, 133.64], [135.0, 135.62], [136.0, 141.15], [142.0, 149.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 98.59, 0.0, 0.0, 0.0, 0.0, 92.64, 0.0, 0.0, 0.0, 0.0, 99.78, 99.52, 99.99, 0.0, 99.87, 99.91, 100.0, 0.0, 0.0, 0.0, 99.52, 99.99, 100.0, 99.99, 0.0, 99.91, 0.0, 0.0, 99.31, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.13, 1.82, 0.39, 2.6, 0.15, 0.83, 0.2, -0.15, 5.55, 1.03, 0.41, 1.44, 0.64, 14.6, 2.82, 5.13, 1.46, 5.52, 2.53, 3.27, 1.31, 0.4, 0.45, 12.68, 5.22, 4.77, 4.81, 1.85, 5.95, 0.64, 0.62, 5.15, 7.55]} \ No newline at end of file diff --git a/annotations_1/tru0WMH7yic_filtered.json b/annotations_1/tru0WMH7yic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16a4e7a27159863fd94f9786cd4b1c45ca03d5bd --- /dev/null +++ b/annotations_1/tru0WMH7yic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.44], [13.0, 14.69], [20.0, 20.55], [23.0, 24.98], [26.0, 26.59], [27.0, 31.53], [32.0, 31.62], [33.0, 51.58], [56.0, 116.85], [118.0, 119.47], [122.0, 132.02], [133.0, 133.32], [134.0, 139.04], [139.0, 142.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 52.8, 0.0, 38.05, 0.0, 0.0, 45.05, 0.0, 96.42, 32.56], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 46.7], ["mains hum", 25.57], ["music", 6.37]], null, null, [["smash, crash", 27.1], ["breaking", 23.68], ["speech", 6.39]], null, null, [["clang", 19.88], ["speech", 10.74], ["ding", 8.12]]], "duration": [0.44, 1.69, 0.55, 1.98, 0.59, 4.53, -0.38, 18.58, 60.85, 1.47, 10.02, 0.32, 5.04, 3.4]} \ No newline at end of file diff --git a/annotations_1/tskpXGAJMhw_filtered.json b/annotations_1/tskpXGAJMhw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e71b4f04ccd22fc31b75b2805b05ff8ba43013d1 --- /dev/null +++ b/annotations_1/tskpXGAJMhw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.25], [6.0, 6.15], [10.0, 10.67], [12.0, 12.07], [16.0, 16.11], [17.0, 17.56], [22.0, 22.54], [29.0, 29.34], [32.0, 33.71], [35.0, 35.46], [37.0, 36.86], [50.0, 51.29], [52.0, 52.56], [66.0, 66.16], [68.0, 68.4], [71.0, 71.29], [77.0, 77.21], [79.0, 79.0], [83.0, 83.44], [87.0, 91.35], [92.0, 95.15], [100.0, 102.05], [110.0, 111.16], [116.0, 116.26], [117.0, 118.64], [122.0, 121.88], [131.0, 131.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 72.01, 35.98, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 20.79], ["speech", 9.29], ["caterwaul", 4.7]], null, null, null, null, null], "duration": [0.25, 0.15, 0.67, 0.07, 0.11, 0.56, 0.54, 0.34, 1.71, 0.46, -0.14, 1.29, 0.56, 0.16, 0.4, 0.29, 0.21, 0.0, 0.44, 4.35, 3.15, 2.05, 1.16, 0.26, 1.64, -0.12, 0.43]} \ No newline at end of file diff --git a/annotations_1/ttEZ7b4Cf9w_filtered.json b/annotations_1/ttEZ7b4Cf9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c182c3d7f3ebfd39ab4129a052b6b7d53df81c6 --- /dev/null +++ b/annotations_1/ttEZ7b4Cf9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 38.15], [39.0, 43.5], [44.0, 45.47], [46.0, 50.63], [52.0, 55.71], [57.0, 58.06], [58.0, 58.92], [60.0, 61.91], [64.0, 114.74], [118.0, 160.91], [168.0, 168.62]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 43.98, 0.0, 46.97, 51.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 30.72], ["hum", 24.75], ["gong", 11.56]], null, [["speech", 53.22], ["music", 25.2], ["hum", 1.91]], null, null, null, null, null, null, null], "duration": [0.15, 4.5, 1.47, 4.63, 3.71, 1.06, 0.92, 1.91, 50.74, 42.91, 0.62]} \ No newline at end of file diff --git a/annotations_1/ttTyXqwsP0o_filtered.json b/annotations_1/ttTyXqwsP0o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..294721e6a85234f34825e488fa7b0457a3e0b1a4 --- /dev/null +++ b/annotations_1/ttTyXqwsP0o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.04], [9.0, 9.37], [12.0, 11.87], [15.0, 15.5], [17.0, 17.31], [19.0, 23.04], [26.0, 29.94], [31.0, 32.12], [34.0, 34.67], [43.0, 50.58], [52.0, 52.22], [54.0, 54.45], [59.0, 59.64], [62.0, 62.8], [66.0, 66.38], [67.0, 68.49], [70.0, 73.55], [74.0, 75.05], [76.0, 76.5], [78.0, 81.75], [84.0, 85.38], [88.0, 93.8], [95.0, 96.48], [99.0, 100.84], [103.0, 104.19], [106.0, 106.88], [111.0, 112.14]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, false, false, false, false, false, true, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.13, 30.33, 0.0, 0.0, 31.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.29, 0.0, 0.0, 34.36, 0.0, 31.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["cattle, bovinae", 19.17], ["speech", 16.77], ["moo", 11.83]], [["hum", 11.04], ["music", 5.95], ["cacophony", 4.42]], null, null, [["noise", 21.7], ["buzz", 12.21], ["vehicle", 10.39]], null, null, null, null, null, null, [["noise", 17.78], ["music", 12.35], ["white noise", 6.55]], null, null, [["speech", 41.07], ["horse", 5.66], ["radio", 5.49]], null, [["vehicle", 17.54], ["fly, housefly", 14.49], ["buzz", 8.98]], null, null, null, null, null], "duration": [1.04, 0.37, -0.13, 0.5, 0.31, 4.04, 3.94, 1.12, 0.67, 7.58, 0.22, 0.45, 0.64, 0.8, 0.38, 1.49, 3.55, 1.05, 0.5, 3.75, 1.38, 5.8, 1.48, 1.84, 1.19, 0.88, 1.14]} \ No newline at end of file diff --git a/annotations_1/ttiEgVcV-Xo_filtered.json b/annotations_1/ttiEgVcV-Xo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..264a3edfc8dbf9842097d5962688eb2d56d5de54 --- /dev/null +++ b/annotations_1/ttiEgVcV-Xo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 35.8], [37.0, 39.16], [44.0, 44.86], [52.0, 54.45], [57.0, 63.07], [64.0, 64.54], [66.0, 65.99], [67.0, 74.09], [77.0, 77.23], [78.0, 80.4], [81.0, 83.54], [84.0, 90.58], [92.0, 101.66], [102.0, 110.81], [111.0, 113.83], [115.0, 121.93], [124.0, 124.9], [127.0, 130.2], [130.0, 133.39], [135.0, 136.56], [138.0, 139.18], [141.0, 153.59], [155.0, 158.03], [158.0, 160.74], [161.0, 164.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 48.06, 0.0, 96.17, 99.87, 0.0, 0.0, 36.26, 0.0, 98.73, 90.95, 91.13, 99.21, 85.54, 66.76, 68.67, 0.0, 64.18, 44.72, 0.0, 0.0, 92.97, 99.48, 94.22, 62.58], "audiomae_on_audioset": [null, [["hum", 66.13], ["mains hum", 30.83], ["speech", 0.62]], null, null, null, null, null, [["thunk", 63.3], ["speech", 31.27], ["thump, thud", 2.78]], null, null, null, null, null, null, null, null, null, null, [["speech", 49.38], ["music", 24.22], ["singing bowl", 4.11]], null, null, null, null, null, null], "duration": [30.8, 2.16, 0.86, 2.45, 6.07, 0.54, -0.01, 7.09, 0.23, 2.4, 2.54, 6.58, 9.66, 8.81, 2.83, 6.93, 0.9, 3.2, 3.39, 1.56, 1.18, 12.59, 3.03, 2.74, 3.13]} \ No newline at end of file diff --git a/annotations_1/tu6FDI4JBDY_filtered.json b/annotations_1/tu6FDI4JBDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a379b64ddf3e72e3ac0d70b4338cf21a97ed85de --- /dev/null +++ b/annotations_1/tu6FDI4JBDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.61], [23.0, 25.51], [27.0, 26.82], [27.0, 35.01], [42.0, 43.7], [44.0, 43.73], [46.0, 56.57], [61.0, 66.46], [68.0, 73.18], [73.0, 74.19], [86.0, 87.34], [89.0, 90.05], [94.0, 94.47], [99.0, 102.68]], "keep_status": [false, true, false, true, false, false, false, true, true, false, false, false, false, true], "silence_prob": [0.0, 30.16, 0.0, 28.97, 0.0, 0.0, 29.29, 29.76, 29.66, 0.0, 0.0, 0.0, 0.0, 31.3], "audiomae_on_audioset": [null, [["throbbing", 24.17], ["hum", 11.64], ["rumble", 11.03]], null, [["music", 27.34], ["hum", 17.71], ["breaking", 9.67]], null, null, [["speech", 39.87], ["music", 32.61], ["smash, crash", 5.89]], [["rumble", 20.91], ["music", 14.44], ["foghorn", 13.14]], [["music", 25.93], ["whack, thwack", 23.6], ["fly, housefly", 7.02]], null, null, null, null, [["speech", 39.53], ["music", 9.43], ["vehicle", 9.11]]], "duration": [0.61, 2.51, -0.18, 8.01, 1.7, -0.27, 10.57, 5.46, 5.18, 1.19, 1.34, 1.05, 0.47, 3.68]} \ No newline at end of file diff --git a/annotations_1/tuXSqMrfVW8_filtered.json b/annotations_1/tuXSqMrfVW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4da216c2b930b0e887a90ffe8f5e6d5c8021cfb3 --- /dev/null +++ b/annotations_1/tuXSqMrfVW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[101.0, 110.42], [111.0, 117.22]], "keep_status": [true, false], "silence_prob": [42.84, 40.73], "audiomae_on_audioset": [[["music", 44.81], ["speech", 6.76], ["buzz", 4.76]], [["music", 54.02], ["grunt", 17.96], ["speech", 3.36]]], "duration": [9.42, 6.22]} \ No newline at end of file diff --git a/annotations_1/tuusFUTcCO8_filtered.json b/annotations_1/tuusFUTcCO8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b2c811b4d713bd0d49d5b181cf174cad154853f --- /dev/null +++ b/annotations_1/tuusFUTcCO8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.18], [12.0, 13.09], [14.0, 15.63], [20.0, 24.22], [44.0, 45.3], [46.0, 47.46], [48.0, 49.47], [58.0, 74.43], [74.0, 74.95], [76.0, 83.83], [89.0, 89.85], [101.0, 101.12], [102.0, 106.79], [126.0, 126.79]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [33.38, 0.0, 0.0, 33.34, 0.0, 0.0, 0.0, 31.32, 0.0, 30.83, 0.0, 0.0, 33.77, 0.0], "audiomae_on_audioset": [[["speech", 33.62], ["music", 12.41], ["hum", 10.79]], null, null, [["speech", 49.05], ["throbbing", 16.25], ["hum", 6.09]], null, null, null, [["speech", 39.3], ["hum", 20.13], ["mains hum", 15.88]], null, [["sidetone", 30.03], ["speech", 26.05], ["music", 10.67]], null, null, [["didgeridoo", 55.97], ["music", 29.07], ["speech", 5.9]], null], "duration": [2.18, 1.09, 1.63, 4.22, 1.3, 1.46, 1.47, 16.43, 0.95, 7.83, 0.85, 0.12, 4.79, 0.79]} \ No newline at end of file diff --git a/annotations_1/tvxjJd08MMc_filtered.json b/annotations_1/tvxjJd08MMc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ffe76d041c9ca51c77699eee4462373853a8751 --- /dev/null +++ b/annotations_1/tvxjJd08MMc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 43.28], [47.0, 63.69], [65.0, 65.35], [67.0, 86.36], [87.0, 96.21], [97.0, 105.19], [107.0, 106.95], [107.0, 118.13], [122.0, 122.57], [126.0, 127.13]], "keep_status": [true, false, false, false, false, true, false, true, false, false], "silence_prob": [34.41, 33.06, 0.0, 33.87, 36.2, 43.15, 0.0, 47.23, 0.0, 0.0], "audiomae_on_audioset": [[["music", 51.18], ["brass instrument", 8.31], ["wind instrument, woodwind instrument", 4.7]], [["music", 67.02], ["brass instrument", 2.92], ["hum", 2.7]], null, [["music", 48.12], ["theremin", 18.99], ["clarinet", 6.29]], [["music", 63.23], ["theremin", 6.45], ["wind instrument, woodwind instrument", 5.8]], [["music", 53.33], ["fart", 5.64], ["didgeridoo", 4.29]], null, [["speech", 35.53], ["wail, moan", 8.95], ["beatboxing", 7.89]], null, null], "duration": [15.28, 16.69, 0.35, 19.36, 9.21, 8.19, -0.05, 11.13, 0.57, 1.13]} \ No newline at end of file diff --git a/annotations_1/tw84SFLxC_o_filtered.json b/annotations_1/tw84SFLxC_o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cbba6e5c04fc67b1557cd18be855c02d30644fa5 --- /dev/null +++ b/annotations_1/tw84SFLxC_o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 21.69], [23.0, 28.49]], "keep_status": [false, false], "silence_prob": [93.6, 90.25], "audiomae_on_audioset": [null, null], "duration": [8.69, 5.49]} \ No newline at end of file diff --git a/annotations_1/txQcaXvbRB8_filtered.json b/annotations_1/txQcaXvbRB8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..327bbe699912fdc25f2a65951f865a5e4cda9f7e --- /dev/null +++ b/annotations_1/txQcaXvbRB8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.97], [13.0, 13.73], [14.0, 13.88], [20.0, 21.17], [22.0, 25.86], [29.0, 28.93], [33.0, 32.8], [38.0, 37.81], [40.0, 46.94], [48.0, 74.58], [77.0, 78.38], [79.0, 79.12], [82.0, 82.39], [91.0, 91.67], [101.0, 101.33], [102.0, 102.81], [108.0, 110.08], [110.0, 111.0], [111.0, 111.89], [116.0, 116.14]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.6, 0.0, 0.0, 0.0, 31.05, 30.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 35.26], ["music", 32.79], ["animal", 3.72]], null, null, null, [["music", 30.42], ["speech", 25.08], ["sidetone", 13.82]], [["music", 57.1], ["vehicle", 8.8], ["speech", 3.89]], null, null, null, null, null, null, null, null, null, null], "duration": [0.97, 0.73, -0.12, 1.17, 3.86, -0.07, -0.2, -0.19, 6.94, 26.58, 1.38, 0.12, 0.39, 0.67, 0.33, 0.81, 2.08, 1.0, 0.89, 0.14]} \ No newline at end of file diff --git a/annotations_1/ty68MEZQPS0_filtered.json b/annotations_1/ty68MEZQPS0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..605eae00a31148e60a6a0dfa6804be3c4684f2d4 --- /dev/null +++ b/annotations_1/ty68MEZQPS0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.01], [4.0, 4.72], [5.0, 8.07], [9.0, 9.81], [11.0, 12.73], [19.0, 19.41], [22.0, 22.94], [38.0, 39.28], [40.0, 40.95], [43.0, 43.01], [49.0, 50.16], [51.0, 51.8], [52.0, 52.62], [57.0, 57.01], [60.0, 60.98], [79.0, 79.08], [83.0, 85.56], [86.0, 87.1], [88.0, 89.16], [92.0, 92.01], [94.0, 94.53], [99.0, 100.43], [102.0, 102.49], [106.0, 107.16], [108.0, 107.91], [109.0, 109.46], [117.0, 117.12], [121.0, 121.2], [142.0, 143.21], [148.0, 148.42], [158.0, 162.28], [163.0, 163.49], [165.0, 165.33], [166.0, 166.6], [169.0, 175.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [44.34, 0.0, 31.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.58, 0.0, 0.0, 0.0, 35.4], "audiomae_on_audioset": [[["hum", 30.25], ["throbbing", 29.98], ["sidetone", 10.29]], null, [["throbbing", 31.91], ["heart sounds, heartbeat", 23.83], ["hum", 22.96]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 27.06], ["insect", 17.19], ["bee, wasp, etc.", 16.46]], null, null, null, [["speech", 22.63], ["boat, water vehicle", 7.26], ["vehicle", 6.65]]], "duration": [2.01, 0.72, 3.07, 0.81, 1.73, 0.41, 0.94, 1.28, 0.95, 0.01, 1.16, 0.8, 0.62, 0.01, 0.98, 0.08, 2.56, 1.1, 1.16, 0.01, 0.53, 1.43, 0.49, 1.16, -0.09, 0.46, 0.12, 0.2, 1.21, 0.42, 4.28, 0.49, 0.33, 0.6, 6.14]} \ No newline at end of file diff --git a/annotations_1/ty_jbbvZDkQ_filtered.json b/annotations_1/ty_jbbvZDkQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e7e8298faf685c3a28cefeb682b1e6e3e4f17ed --- /dev/null +++ b/annotations_1/ty_jbbvZDkQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.93], [12.0, 12.28], [13.0, 14.0], [16.0, 17.9], [18.0, 24.63], [27.0, 28.73], [30.0, 30.75], [35.0, 36.17], [38.0, 37.99], [41.0, 48.19], [49.0, 50.52], [53.0, 56.29], [57.0, 71.44], [77.0, 77.23], [78.0, 87.59], [90.0, 90.58], [98.0, 98.52], [101.0, 102.1], [105.0, 108.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 52.56, 0.0, 0.0, 0.0, 0.0, 42.98, 0.0, 40.62, 82.61, 0.0, 54.9, 0.0, 0.0, 0.0, 40.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 61.43], ["radio", 11.88], ["music", 5.17]], null, [["wood", 20.61], ["hum", 13.01], ["mains hum", 11.7]], null, null, null, null, null, null, [["music", 53.51], ["didgeridoo", 4.67], ["synthesizer", 4.28]]], "duration": [-0.07, 0.28, 1.0, 1.9, 6.63, 1.73, 0.75, 1.17, -0.01, 7.19, 1.52, 3.29, 14.44, 0.23, 9.59, 0.58, 0.52, 1.1, 3.89]} \ No newline at end of file diff --git a/annotations_1/u-eTCyG0jpA_filtered.json b/annotations_1/u-eTCyG0jpA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0377effd39d23a189c4c16cf06698f33d64224ab --- /dev/null +++ b/annotations_1/u-eTCyG0jpA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.58], [16.0, 17.95], [27.0, 27.57], [34.0, 36.48], [37.0, 37.79], [40.0, 49.72], [70.0, 77.72], [82.0, 84.67], [85.0, 88.01], [90.0, 95.5], [98.0, 103.05], [106.0, 114.22], [116.0, 116.01], [126.0, 136.0], [144.0, 150.5], [165.0, 166.78], [169.0, 170.07]], "keep_status": [false, false, false, false, false, true, true, false, true, true, true, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.82, 0.0, 35.54, 29.5, 36.34, 33.77, 29.79, 29.37, 29.07, 0.0, 29.75, 30.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 51.76], ["theremin", 27.78], ["cacophony", 2.98]], null, [["music", 28.49], ["fly, housefly", 21.12], ["insect", 7.26]], [["music", 22.03], ["fart", 13.49], ["speech", 12.4]], [["speech", 40.22], ["music", 28.55], ["throbbing", 10.59]], [["music", 37.77], ["hum", 9.76], ["throbbing", 8.43]], [["music", 22.53], ["whack, thwack", 18.31], ["speech", 9.88]], [["speech", 19.04], ["music", 14.61], ["outside, rural or natural", 6.32]], [["livestock, farm animals, working animals", 25.47], ["moo", 21.82], ["cattle, bovinae", 21.65]], null, [["speech", 52.85], ["music", 9.4], ["outside, rural or natural", 3.59]], [["music", 21.33], ["moo", 20.45], ["livestock, farm animals, working animals", 16.94]], null, null], "duration": [0.58, 1.95, 0.57, 2.48, 0.79, 9.72, 7.72, 2.67, 3.01, 5.5, 5.05, 8.22, 0.01, 10.0, 6.5, 1.78, 1.07]} \ No newline at end of file diff --git a/annotations_1/u-z5139CW1I_filtered.json b/annotations_1/u-z5139CW1I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e502d192daa56a1a059956358b76badeed05828a --- /dev/null +++ b/annotations_1/u-z5139CW1I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.26], [9.0, 11.55], [18.0, 22.49], [27.0, 33.47], [34.0, 36.73], [37.0, 36.95], [37.0, 36.98], [37.0, 37.02], [37.0, 45.91], [47.0, 49.47], [63.0, 73.62], [75.0, 92.37], [93.0, 117.49], [118.0, 117.75]], "keep_status": [false, true, true, false, true, false, false, false, false, true, true, false, false, false], "silence_prob": [49.73, 34.37, 31.65, 32.17, 32.04, 0.0, 0.0, 0.0, 30.85, 31.37, 37.27, 31.65, 91.47, 0.0], "audiomae_on_audioset": [[["fly, housefly", 51.91], ["insect", 23.96], ["mosquito", 13.88]], [["music", 22.27], ["speech", 16.26], ["sonar", 8.91]], [["throbbing", 32.32], ["hum", 28.1], ["mains hum", 7.11]], [["speech", 64.77], ["music", 10.58], ["whack, thwack", 3.99]], [["sidetone", 28.28], ["whack, thwack", 19.62], ["music", 6.65]], null, null, null, [["speech", 68.8], ["music", 4.84], ["sound effect", 2.9]], [["music", 24.1], ["whale vocalization", 21.71], ["synthesizer", 6.56]], [["bee, wasp, etc.", 22.09], ["fly, housefly", 20.42], ["insect", 19.0]], [["fly, housefly", 51.59], ["insect", 18.3], ["mosquito", 14.4]], null, null], "duration": [5.26, 2.55, 4.49, 6.47, 2.73, -0.05, -0.02, 0.02, 8.91, 2.47, 10.62, 17.37, 24.49, -0.25]} \ No newline at end of file diff --git a/annotations_1/u0RqfETo2ok_filtered.json b/annotations_1/u0RqfETo2ok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afccd196d8d2cdcb81e6fdd04060f402adb0eb4c --- /dev/null +++ b/annotations_1/u0RqfETo2ok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.75], [13.0, 13.68], [17.0, 17.22], [19.0, 23.23], [26.0, 26.97], [36.0, 42.11], [44.0, 46.77], [51.0, 51.26], [53.0, 53.6], [59.0, 59.8], [61.0, 61.45], [63.0, 64.47], [67.0, 67.49], [69.0, 69.62], [80.0, 80.82], [90.0, 91.22], [104.0, 106.17], [112.0, 114.32]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 30.13, 0.0, 28.42, 29.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.32, 32.79], "audiomae_on_audioset": [null, null, null, [["speech", 45.76], ["music", 25.83], ["didgeridoo", 4.77]], null, [["speech", 55.85], ["music", 7.03], ["throbbing", 4.83]], [["speech", 49.02], ["crowd", 7.65], ["cheering", 6.03]], null, null, null, null, null, null, null, null, null, [["theremin", 31.45], ["whale vocalization", 20.98], ["music", 15.3]], [["music", 32.63], ["didgeridoo", 5.71], ["gong", 5.69]]], "duration": [1.75, 0.68, 0.22, 4.23, 0.97, 6.11, 2.77, 0.26, 0.6, 0.8, 0.45, 1.47, 0.49, 0.62, 0.82, 1.22, 2.17, 2.32]} \ No newline at end of file diff --git a/annotations_1/u1MRGbWEI9M_filtered.json b/annotations_1/u1MRGbWEI9M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b3f7cd51b88eda055f0a684893fd088cc488cc3 --- /dev/null +++ b/annotations_1/u1MRGbWEI9M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.76], [11.0, 20.09], [21.0, 22.5], [23.0, 24.16], [25.0, 25.64], [27.0, 29.2], [30.0, 31.19], [33.0, 37.0], [38.0, 40.29], [41.0, 81.24], [83.0, 119.58], [120.0, 120.63]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [76.37, 98.99, 0.0, 0.0, 0.0, 99.99, 0.0, 82.07, 45.05, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 49.66], ["burping, eructation", 11.09], ["wail, moan", 6.49]], null, null, null], "duration": [3.76, 9.09, 1.5, 1.16, 0.64, 2.2, 1.19, 4.0, 2.29, 40.24, 36.58, 0.63]} \ No newline at end of file diff --git a/annotations_1/u1Pgftn5H94_filtered.json b/annotations_1/u1Pgftn5H94_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0195920022cfd27933c32f1d33fc9a82ab540414 --- /dev/null +++ b/annotations_1/u1Pgftn5H94_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.95], [17.0, 19.18], [25.0, 25.34], [31.0, 46.5], [49.0, 53.91], [62.0, 62.68], [64.0, 68.34], [71.0, 75.51], [86.0, 87.02], [88.0, 88.97], [96.0, 96.77], [97.0, 111.92], [115.0, 119.99], [121.0, 121.44], [122.0, 128.11], [130.0, 131.5], [140.0, 141.0], [149.0, 151.7], [157.0, 156.76]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, true, true, false, true, false, false, true, false], "silence_prob": [0.0, 99.84, 0.0, 44.2, 47.01, 0.0, 57.25, 30.54, 0.0, 0.0, 0.0, 32.42, 35.95, 0.0, 37.51, 0.0, 0.0, 32.42, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 49.43], ["speech", 15.9], ["outside, rural or natural", 2.28]], [["music", 37.96], ["hum", 12.44], ["throbbing", 9.18]], null, null, [["speech", 67.55], ["hum", 7.26], ["rumble", 4.96]], null, null, null, [["music", 26.36], ["speech", 19.75], ["honk", 13.4]], [["music", 45.37], ["speech", 17.13], ["musical instrument", 4.29]], null, [["music", 58.19], ["double bass", 5.6], ["cello", 4.1]], null, null, [["music", 44.64], ["fart", 9.63], ["fly, housefly", 5.25]], null], "duration": [0.95, 2.18, 0.34, 15.5, 4.91, 0.68, 4.34, 4.51, 1.02, 0.97, 0.77, 14.92, 4.99, 0.44, 6.11, 1.5, 1.0, 2.7, -0.24]} \ No newline at end of file diff --git a/annotations_1/u3oi4L5tWQg_filtered.json b/annotations_1/u3oi4L5tWQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b196a7099123c22fe3ea0a17aa2a73e6a2dc66fc --- /dev/null +++ b/annotations_1/u3oi4L5tWQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 48.39], [49.0, 52.35], [53.0, 55.29], [57.0, 58.56], [61.0, 62.11], [64.0, 64.72], [65.0, 65.92], [68.0, 68.82], [78.0, 78.54], [83.0, 84.08], [85.0, 85.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 90.08, 99.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [31.39, 3.35, 2.29, 1.56, 1.11, 0.72, 0.92, 0.82, 0.54, 1.08, 0.82]} \ No newline at end of file diff --git a/annotations_1/u3xIs0aajN4_filtered.json b/annotations_1/u3xIs0aajN4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6007bb4ec2d7d97e1e78e541823d9d249ec6f80 --- /dev/null +++ b/annotations_1/u3xIs0aajN4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 6.45], [19.0, 22.59], [25.0, 38.79], [40.0, 40.42], [42.0, 45.42], [46.0, 46.26], [48.0, 48.59], [50.0, 54.04], [55.0, 55.61], [63.0, 64.17], [71.0, 74.53], [76.0, 76.67], [85.0, 90.04], [94.0, 95.17], [101.0, 101.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [62.58, 95.91, 91.64, 0.0, 76.53, 0.0, 0.0, 87.19, 0.0, 0.0, 48.35, 0.0, 84.8, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["ping", 11.96], ["music", 8.32], ["synthesizer", 5.47]], null, null, null, null], "duration": [4.45, 3.59, 13.79, 0.42, 3.42, 0.26, 0.59, 4.04, 0.61, 1.17, 3.53, 0.67, 5.04, 1.17, 0.09]} \ No newline at end of file diff --git a/annotations_1/u4T7slD8Mq4_filtered.json b/annotations_1/u4T7slD8Mq4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7956dae195576d80fd1dd1338009633c044220b8 --- /dev/null +++ b/annotations_1/u4T7slD8Mq4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 51.06], [53.0, 83.0], [85.0, 97.24], [98.0, 105.14], [112.0, 122.05]], "keep_status": [false, true, false, false, false], "silence_prob": [0.0, 30.87, 30.2, 31.99, 35.71], "audiomae_on_audioset": [null, [["music", 50.95], ["speech", 7.71], ["breaking", 6.06]], [["music", 55.61], ["throbbing", 24.32], ["hum", 3.8]], [["music", 70.18], ["speech", 12.42], ["thunk", 1.65]], [["music", 55.17], ["speech", 10.46], ["didgeridoo", 10.04]]], "duration": [48.06, 30.0, 12.24, 7.14, 10.05]} \ No newline at end of file diff --git a/annotations_1/u4gz2yNW_Go_filtered.json b/annotations_1/u4gz2yNW_Go_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2aebe7b62b62da8c1ffdd4d9c535087a0a4b7c0 --- /dev/null +++ b/annotations_1/u4gz2yNW_Go_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[48.0, 51.56], [52.0, 75.05], [76.0, 88.92], [93.0, 95.27], [97.0, 97.02], [98.0, 99.3], [100.0, 102.66], [104.0, 105.22], [105.0, 107.82], [109.0, 114.24], [118.0, 132.44], [135.0, 140.63], [147.0, 151.38], [152.0, 152.74], [156.0, 163.56], [168.0, 168.27], [176.0, 175.98], [176.0, 176.01]], "keep_status": [true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [32.44, 31.81, 32.09, 31.36, 0.0, 0.0, 32.5, 0.0, 32.9, 31.6, 30.99, 30.78, 30.62, 0.0, 30.53, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 21.6], ["duck", 14.95], ["quack", 10.51]], [["quack", 46.3], ["music", 18.85], ["animal", 9.53]], [["speech", 37.86], ["music", 26.37], ["fly, housefly", 7.02]], [["livestock, farm animals, working animals", 17.86], ["mosquito", 15.15], ["fly, housefly", 13.81]], null, null, [["music", 71.86], ["musical instrument", 5.42], ["drum", 2.23]], null, [["speech", 34.24], ["music", 23.73], ["fart", 15.55]], [["music", 19.63], ["speech", 13.46], ["fly, housefly", 11.72]], [["cattle, bovinae", 30.83], ["livestock, farm animals, working animals", 26.37], ["moo", 19.11]], [["honk", 42.34], ["goose", 21.57], ["music", 17.53]], [["music", 43.17], ["speech", 30.33], ["whack, thwack", 4.43]], null, [["cattle, bovinae", 53.16], ["moo", 20.71], ["livestock, farm animals, working animals", 18.58]], null, null, null], "duration": [3.56, 23.05, 12.92, 2.27, 0.02, 1.3, 2.66, 1.22, 2.82, 5.24, 14.44, 5.63, 4.38, 0.74, 7.56, 0.27, -0.02, 0.01]} \ No newline at end of file diff --git a/annotations_1/u5hpQ0KeRgY_filtered.json b/annotations_1/u5hpQ0KeRgY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73ea6acd83ac0fe9c8445ae0fcff19cb1ae7f2b2 --- /dev/null +++ b/annotations_1/u5hpQ0KeRgY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 34.37], [35.0, 35.68], [37.0, 47.88], [49.0, 55.58], [56.0, 57.94], [61.0, 61.72], [62.0, 64.25], [66.0, 67.53], [69.0, 70.01], [74.0, 75.52], [77.0, 77.62], [78.0, 79.47], [89.0, 89.53], [94.0, 94.53], [95.0, 95.0], [96.0, 109.14], [110.0, 117.53], [119.0, 127.2], [128.0, 130.08], [131.0, 131.95], [133.0, 133.42]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 94.22, 95.78, 0.0, 0.0, 61.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.07, 53.47, 97.33, 97.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.37, 0.68, 10.88, 6.58, 1.94, 0.72, 2.25, 1.53, 1.01, 1.52, 0.62, 1.47, 0.53, 0.53, 0.0, 13.14, 7.53, 8.2, 2.08, 0.95, 0.42]} \ No newline at end of file diff --git a/annotations_1/u6HHla9ApmI_filtered.json b/annotations_1/u6HHla9ApmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..594308a3a88286c26ca2083b2666b9e5a207e78a --- /dev/null +++ b/annotations_1/u6HHla9ApmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.91], [23.0, 23.21], [23.0, 23.45], [29.0, 30.97], [32.0, 34.35], [36.0, 36.17], [40.0, 42.28], [47.0, 55.39], [61.0, 61.18], [62.0, 65.43], [68.0, 69.03], [79.0, 80.38], [83.0, 83.66], [86.0, 86.8], [87.0, 89.19], [92.0, 93.93], [104.0, 104.82], [110.0, 114.29], [116.0, 117.15], [118.0, 118.2], [124.0, 125.47], [126.0, 127.57], [129.0, 129.25], [137.0, 137.54], [141.0, 141.1], [141.0, 141.15]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.79, 0.0, 30.92, 30.82, 0.0, 30.26, 0.0, 0.0, 0.0, 0.0, 35.64, 0.0, 0.0, 34.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 47.73], ["speech", 23.03], ["boing", 4.98]], null, [["music", 47.2], ["boing", 17.78], ["livestock, farm animals, working animals", 3.69]], [["music", 75.15], ["boing", 5.49], ["speech", 4.9]], null, [["music", 38.51], ["speech", 18.3], ["mosquito", 5.39]], null, null, null, null, [["music", 38.53], ["speech", 25.83], ["boing", 17.83]], null, null, [["speech", 51.31], ["music", 8.1], ["sidetone", 7.08]], null, null, null, null, null, null, null, null], "duration": [1.91, 0.21, 0.45, 1.97, 2.35, 0.17, 2.28, 8.39, 0.18, 3.43, 1.03, 1.38, 0.66, 0.8, 2.19, 1.93, 0.82, 4.29, 1.15, 0.2, 1.47, 1.57, 0.25, 0.54, 0.1, 0.15]} \ No newline at end of file diff --git a/annotations_1/u6IAct0ow4c_filtered.json b/annotations_1/u6IAct0ow4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2773f0c27d9fa0d2d05e4fd4482011838cab6b36 --- /dev/null +++ b/annotations_1/u6IAct0ow4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 11.84], [24.0, 24.85], [40.0, 39.97], [42.0, 41.72], [50.0, 51.36], [54.0, 64.94], [67.0, 70.95], [73.0, 75.54], [77.0, 85.13], [89.0, 89.63], [93.0, 95.62], [102.0, 107.6], [115.0, 116.34], [117.0, 119.03], [123.0, 123.63], [130.0, 130.2], [131.0, 131.26], [132.0, 132.36], [133.0, 133.93], [143.0, 144.26]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.97, 28.28, 40.33, 30.51, 0.0, 33.16, 34.93, 0.0, 33.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 31.35], ["speech", 24.0], ["mains hum", 15.3]], [["didgeridoo", 44.8], ["boing", 7.92], ["music", 7.58]], [["speech", 29.74], ["civil defense siren", 19.09], ["singing bowl", 10.71]], [["explosion", 16.81], ["music", 11.81], ["hum", 6.89]], null, [["speech", 75.91], ["music", 12.04], ["inside, large room or hall", 1.45]], [["music", 53.61], ["hum", 11.43], ["ambient music", 6.42]], null, [["hum", 31.0], ["mains hum", 16.94], ["speech", 11.41]], null, null, null, null, null, null], "duration": [-0.16, 0.85, -0.03, -0.28, 1.36, 10.94, 3.95, 2.54, 8.13, 0.63, 2.62, 5.6, 1.34, 2.03, 0.63, 0.2, 0.26, 0.36, 0.93, 1.26]} \ No newline at end of file diff --git a/annotations_1/u6W5OFK9jpU_filtered.json b/annotations_1/u6W5OFK9jpU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a185a0409a323b633774e560ec2c4ce1f998bd43 --- /dev/null +++ b/annotations_1/u6W5OFK9jpU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.02], [13.0, 13.9], [21.0, 21.86], [25.0, 25.62], [45.0, 46.08], [49.0, 52.15], [54.0, 56.05], [60.0, 61.42]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.18, 65.44, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["cattle, bovinae", 32.81], ["moo", 24.02], ["livestock, farm animals, working animals", 18.48]], null, null], "duration": [1.02, 0.9, 0.86, 0.62, 1.08, 3.15, 2.05, 1.42]} \ No newline at end of file diff --git a/annotations_1/u7DV5coBXSA_filtered.json b/annotations_1/u7DV5coBXSA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8450da1b303cea1a75f58fd0f093a57e7e566c7e --- /dev/null +++ b/annotations_1/u7DV5coBXSA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.54], [11.0, 12.75], [15.0, 15.85], [18.0, 20.34], [21.0, 20.97], [23.0, 22.92], [24.0, 25.03], [31.0, 32.43], [34.0, 39.78], [40.0, 60.24], [61.0, 60.81], [65.0, 75.25]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 65.79, 0.0, 0.0, 0.0, 0.0, 99.16, 65.2, 0.0, 48.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 52.71], ["singing bowl", 21.99], ["chirp tone", 13.24]]], "duration": [-0.46, 1.75, 0.85, 2.34, -0.03, -0.08, 1.03, 1.43, 5.78, 20.24, -0.19, 10.25]} \ No newline at end of file diff --git a/annotations_1/u7IXETT9OEQ_filtered.json b/annotations_1/u7IXETT9OEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49e3a86571ab1938f77b7ef456aadb44708364b6 --- /dev/null +++ b/annotations_1/u7IXETT9OEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.86], [8.0, 8.02], [11.0, 11.45], [13.0, 13.47], [17.0, 17.56], [18.0, 19.2], [21.0, 22.35], [26.0, 27.01], [28.0, 30.6], [32.0, 32.58], [33.0, 34.08], [35.0, 40.15], [41.0, 41.94], [45.0, 45.49], [49.0, 50.97], [54.0, 56.86], [60.0, 60.74], [66.0, 66.68], [68.0, 69.15], [71.0, 72.81], [74.0, 78.49], [79.0, 80.22], [81.0, 83.66], [88.0, 89.73], [92.0, 93.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 83.34, 0.0, 0.0, 0.0, 0.0, 71.72, 0.0, 58.81, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.86, 0.02, 0.45, 0.47, 0.56, 1.2, 1.35, 1.01, 2.6, 0.58, 1.08, 5.15, 0.94, 0.49, 1.97, 2.86, 0.74, 0.68, 1.15, 1.81, 4.49, 1.22, 2.66, 1.73, 1.06]} \ No newline at end of file diff --git a/annotations_1/u7yQ7qs6Zew_filtered.json b/annotations_1/u7yQ7qs6Zew_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4775d4538ab3215b5f906661716ce0790ecf43f --- /dev/null +++ b/annotations_1/u7yQ7qs6Zew_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 62.45], [65.0, 67.71], [68.0, 70.14], [71.0, 76.54], [81.0, 82.12], [92.0, 92.3], [98.0, 100.18], [102.0, 102.27], [103.0, 103.6], [105.0, 105.6], [109.0, 111.06], [112.0, 112.41], [116.0, 116.43], [117.0, 118.05], [124.0, 128.16], [128.0, 128.33], [129.0, 130.35], [134.0, 135.11], [139.0, 140.93], [143.0, 146.01], [148.0, 149.03], [150.0, 152.14], [155.0, 157.92], [159.0, 160.46], [162.0, 163.09], [165.0, 166.45], [167.0, 167.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 78.21, 77.36, 69.2, 0.0, 0.0, 77.36, 0.0, 0.0, 0.0, 45.92, 0.0, 0.0, 0.0, 35.91, 0.0, 0.0, 0.0, 0.0, 39.05, 0.0, 47.74, 43.18, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["whale vocalization", 28.85], ["cattle, bovinae", 9.64], ["theremin", 8.08]], null, null, null, [["music", 42.37], ["speech", 14.72], ["hum", 9.52]], null, null, null, null, [["music", 47.86], ["throbbing", 16.53], ["hum", 5.48]], null, [["music", 31.96], ["hum", 22.75], ["throbbing", 11.16]], [["music", 27.72], ["speech", 23.19], ["throbbing", 10.93]], null, null, null, null], "duration": [50.45, 2.71, 2.14, 5.54, 1.12, 0.3, 2.18, 0.27, 0.6, 0.6, 2.06, 0.41, 0.43, 1.05, 4.16, 0.33, 1.35, 1.11, 1.93, 3.01, 1.03, 2.14, 2.92, 1.46, 1.09, 1.45, 0.63]} \ No newline at end of file diff --git a/annotations_1/uA1Kloz4Ics_filtered.json b/annotations_1/uA1Kloz4Ics_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..195df28ad79041712a21bd0bf40e3c349ea8ac95 --- /dev/null +++ b/annotations_1/uA1Kloz4Ics_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.24], [2.0, 2.42], [4.0, 4.83], [6.0, 6.93], [11.0, 12.01], [13.0, 13.69], [16.0, 20.17], [22.0, 22.52], [26.0, 27.9], [29.0, 30.48], [31.0, 31.29], [33.0, 35.63], [36.0, 37.18], [38.0, 40.26], [45.0, 45.0], [45.0, 46.14], [50.0, 54.62], [56.0, 57.86], [60.0, 62.55], [63.0, 64.45], [65.0, 65.99], [69.0, 71.27], [74.0, 74.26], [77.0, 84.25], [95.0, 96.21], [98.0, 98.51], [99.0, 98.73], [103.0, 103.77], [111.0, 112.13], [114.0, 114.29], [115.0, 117.0], [119.0, 119.94], [122.0, 123.31], [124.0, 124.82], [126.0, 126.23], [127.0, 128.65], [129.0, 142.65], [146.0, 146.96], [148.0, 148.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.39, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 53.84, 0.0, 0.0, 99.95, 0.0, 100.0, 0.0, 0.0, 96.66, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 0.0, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.42, 0.83, 0.93, 1.01, 0.69, 4.17, 0.52, 1.9, 1.48, 0.29, 2.63, 1.18, 2.26, 0.0, 1.14, 4.62, 1.86, 2.55, 1.45, 0.99, 2.27, 0.26, 7.25, 1.21, 0.51, -0.27, 0.77, 1.13, 0.29, 2.0, 0.94, 1.31, 0.82, 0.23, 1.65, 13.65, 0.96, 0.86]} \ No newline at end of file diff --git a/annotations_1/uAjGtAOqMQw_filtered.json b/annotations_1/uAjGtAOqMQw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b60b79efe9e355b45a5ce832ca834ee756407d17 --- /dev/null +++ b/annotations_1/uAjGtAOqMQw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 43.83], [45.0, 52.03], [56.0, 61.13], [62.0, 62.4], [67.0, 77.77], [78.0, 80.18], [81.0, 83.76], [86.0, 89.51], [92.0, 93.92], [95.0, 95.07], [99.0, 113.88], [117.0, 122.52]], "keep_status": [false, true, true, false, true, false, true, true, false, false, false, true], "silence_prob": [32.37, 29.47, 30.48, 0.0, 29.15, 31.96, 31.67, 30.19, 0.0, 0.0, 29.75, 29.45], "audiomae_on_audioset": [[["music", 36.9], ["crack", 26.07], ["single-lens reflex camera", 10.71]], [["music", 22.0], ["thump, thud", 16.26], ["speech", 11.83]], [["music", 18.13], ["hiccup", 9.92], ["speech", 8.86]], null, [["music", 45.08], ["breaking", 12.23], ["speech", 10.92]], [["music", 58.24], ["didgeridoo", 7.96], ["musical instrument", 4.18]], [["music", 21.14], ["throbbing", 7.99], ["didgeridoo", 6.56]], [["speech", 19.81], ["music", 16.92], ["coin (dropping)", 11.7]], null, null, [["music", 69.23], ["sound effect", 4.91], ["hum", 4.87]], [["music", 31.96], ["mains hum", 7.96], ["hum", 7.07]]], "duration": [7.83, 7.03, 5.13, 0.4, 10.77, 2.18, 2.76, 3.51, 1.92, 0.07, 14.88, 5.52]} \ No newline at end of file diff --git a/annotations_1/uAroGB_YCmw_filtered.json b/annotations_1/uAroGB_YCmw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d6b4208dfd9f081a5ef5a574026be6a8bf1311d --- /dev/null +++ b/annotations_1/uAroGB_YCmw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 27.58], [32.0, 33.39], [34.0, 49.94], [57.0, 56.91], [59.0, 67.76], [69.0, 74.06], [78.0, 87.45], [91.0, 102.03], [103.0, 128.04]], "keep_status": [false, false, true, false, false, true, false, true, true], "silence_prob": [30.06, 0.0, 29.89, 0.0, 30.3, 30.36, 31.54, 30.56, 30.32], "audiomae_on_audioset": [[["music", 59.53], ["speech", 13.39], ["quack", 2.44]], null, [["music", 25.46], ["throbbing", 20.25], ["hum", 15.95]], null, [["speech", 50.49], ["music", 23.41], ["throbbing", 2.86]], [["speech", 40.91], ["music", 18.78], ["throbbing", 7.05]], [["music", 44.19], ["didgeridoo", 23.19], ["musical instrument", 5.68]], [["music", 55.7], ["didgeridoo", 7.14], ["musical instrument", 5.3]], [["music", 47.1], ["animal", 7.03], ["cattle, bovinae", 4.53]]], "duration": [17.58, 1.39, 15.94, -0.09, 8.76, 5.06, 9.45, 11.03, 25.04]} \ No newline at end of file diff --git a/annotations_1/uB-53DTWD3k_filtered.json b/annotations_1/uB-53DTWD3k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25b14a5d1b1440d1409e4ea0d6921496b801b01d --- /dev/null +++ b/annotations_1/uB-53DTWD3k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [5.0, 15.53], [16.0, 22.87], [23.0, 23.41], [24.0, 27.33], [29.0, 51.58], [53.0, 57.84], [59.0, 66.23], [67.0, 78.27], [80.0, 80.62]], "keep_status": [false, true, false, false, true, false, true, true, true, false], "silence_prob": [0.0, 30.13, 28.56, 0.0, 30.25, 30.54, 38.6, 28.86, 29.1, 0.0], "audiomae_on_audioset": [null, [["buzz", 49.63], ["speech", 13.05], ["vehicle", 3.36]], [["speech", 59.96], ["vehicle", 8.44], ["boat, water vehicle", 6.81]], null, [["mains hum", 29.05], ["music", 20.94], ["hum", 17.09]], [["speech", 44.63], ["music", 26.94], ["mains hum", 9.99]], [["hum", 22.36], ["music", 16.8], ["mains hum", 16.2]], [["speech", 31.42], ["hum", 14.56], ["mains hum", 14.53]], [["speech", 33.49], ["vehicle", 16.86], ["boat, water vehicle", 7.45]], null], "duration": [0.7, 10.53, 6.87, 0.41, 3.33, 22.58, 4.84, 7.23, 11.27, 0.62]} \ No newline at end of file diff --git a/annotations_1/uB6JMgU50J0_filtered.json b/annotations_1/uB6JMgU50J0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..881c3f4df3417b6986e726dc5994907f75e120fe --- /dev/null +++ b/annotations_1/uB6JMgU50J0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 29.56], [31.0, 31.56], [32.0, 37.05], [39.0, 46.18], [49.0, 51.48], [53.0, 56.08], [74.0, 74.82], [75.0, 86.44], [90.0, 142.87], [143.0, 145.74], [146.0, 154.16], [155.0, 155.49]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [34.3, 0.0, 37.52, 34.45, 31.55, 33.0, 0.0, 38.86, 0.0, 43.77, 36.39, 0.0], "audiomae_on_audioset": [[["music", 57.03], ["speech", 9.1], ["throbbing", 5.86]], null, [["music", 69.91], ["throbbing", 6.39], ["electronic music", 4.87]], [["hum", 32.78], ["throbbing", 28.51], ["music", 28.22]], [["music", 37.96], ["synthesizer", 18.32], ["throbbing", 10.56]], [["music", 65.31], ["didgeridoo", 9.2], ["throbbing", 3.54]], null, [["hum", 43.05], ["throbbing", 22.14], ["music", 9.57]], null, [["speech", 44.13], ["music", 21.69], ["pulse", 5.71]], [["music", 18.61], ["speech", 16.39], ["siren", 16.29]], null], "duration": [11.56, 0.56, 5.05, 7.18, 2.48, 3.08, 0.82, 11.44, 52.87, 2.74, 8.16, 0.49]} \ No newline at end of file diff --git a/annotations_1/uBP8cPLPWrQ_filtered.json b/annotations_1/uBP8cPLPWrQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f279e5f93e9b9ecef6498934d901ea43285599fd --- /dev/null +++ b/annotations_1/uBP8cPLPWrQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.29], [16.0, 18.93], [23.0, 23.55], [26.0, 26.1], [27.0, 29.24], [32.0, 31.94], [35.0, 48.9], [66.0, 66.31], [68.0, 71.51], [73.0, 74.55], [75.0, 76.65], [78.0, 78.95], [79.0, 81.57], [88.0, 88.06], [90.0, 90.73], [92.0, 92.64], [98.0, 98.81], [100.0, 128.06], [133.0, 135.65], [136.0, 137.02], [138.0, 138.18], [139.0, 141.61], [163.0, 163.71], [166.0, 166.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.0, 0.0, 0.0, 55.39, 0.0, 60.23, 0.0, 91.47, 0.0, 0.0, 0.0, 64.75, 0.0, 0.0, 0.0, 0.0, 44.12, 42.86, 0.0, 0.0, 65.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.19], ["thunk", 34.03], ["guitar", 2.7]], [["music", 53.04], ["didgeridoo", 22.27], ["musical instrument", 3.69]], null, null, null, null, null], "duration": [0.29, 2.93, 0.55, 0.1, 2.24, -0.06, 13.9, 0.31, 3.51, 1.55, 1.65, 0.95, 2.57, 0.06, 0.73, 0.64, 0.81, 28.06, 2.65, 1.02, 0.18, 2.61, 0.71, 0.89]} \ No newline at end of file diff --git a/annotations_1/uCG1EiqEAEg_filtered.json b/annotations_1/uCG1EiqEAEg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dff39f10b8ba9f27272b513a028222f048570def --- /dev/null +++ b/annotations_1/uCG1EiqEAEg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.57], [16.0, 18.55], [20.0, 24.17], [28.0, 31.38], [37.0, 37.29], [39.0, 39.55], [40.0, 47.49], [50.0, 50.82], [55.0, 55.14], [56.0, 56.93], [62.0, 62.34], [66.0, 66.93], [68.0, 70.01], [71.0, 71.78], [73.0, 72.84], [75.0, 90.61], [92.0, 97.55], [98.0, 100.33], [102.0, 102.64], [104.0, 115.21], [118.0, 119.53]], "keep_status": [false, false, true, true, false, false, true, false, false, false, false, false, true, false, false, false, true, true, false, true, false], "silence_prob": [94.37, 58.55, 36.8, 29.99, 0.0, 0.0, 31.42, 0.0, 0.0, 0.0, 0.0, 0.0, 49.09, 0.0, 0.0, 41.14, 33.07, 42.62, 0.0, 44.26, 0.0], "audiomae_on_audioset": [null, null, [["music", 21.42], ["breaking", 12.33], ["arrow", 8.09]], [["music", 28.3], ["theremin", 11.01], ["hum", 7.59]], null, null, [["whale vocalization", 26.96], ["speech", 20.13], ["mains hum", 18.36]], null, null, null, null, null, [["hum", 20.61], ["mains hum", 8.41], ["music", 7.15]], null, null, [["hum", 53.34], ["mains hum", 14.99], ["music", 14.16]], [["speech", 18.36], ["hum", 16.0], ["music", 12.93]], [["music", 26.39], ["didgeridoo", 23.21], ["hum", 10.23]], null, [["music", 58.77], ["ambient music", 6.34], ["throbbing", 2.96]], null], "duration": [6.57, 2.55, 4.17, 3.38, 0.29, 0.55, 7.49, 0.82, 0.14, 0.93, 0.34, 0.93, 2.01, 0.78, -0.16, 15.61, 5.55, 2.33, 0.64, 11.21, 1.53]} \ No newline at end of file diff --git a/annotations_1/uCsRqsNpF60_filtered.json b/annotations_1/uCsRqsNpF60_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8dc9849b657da5770e28736e11a4981e0b245cb --- /dev/null +++ b/annotations_1/uCsRqsNpF60_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.5], [5.0, 5.91], [7.0, 7.7], [9.0, 14.72], [16.0, 32.34], [37.0, 38.94], [41.0, 57.96], [60.0, 66.82], [69.0, 73.68], [76.0, 78.02], [82.0, 89.14], [91.0, 91.49], [93.0, 100.23], [106.0, 111.28], [112.0, 111.89], [113.0, 116.8], [117.0, 116.83], [117.0, 116.97], [119.0, 119.74], [124.0, 126.62], [130.0, 147.24], [150.0, 160.66]], "keep_status": [false, false, false, true, false, false, true, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.45, 41.2, 0.0, 40.7, 61.27, 36.15, 46.02, 41.74, 0.0, 40.14, 54.1, 0.0, 43.1, 0.0, 0.0, 0.0, 75.88, 35.16, 34.91], "audiomae_on_audioset": [null, null, null, [["music", 22.82], ["throbbing", 19.03], ["sidetone", 11.65]], [["music", 47.48], ["hum", 20.96], ["mains hum", 7.28]], null, [["music", 36.05], ["hum", 14.87], ["speech", 7.99]], null, [["music", 43.19], ["whack, thwack", 7.44], ["sigh", 4.12]], [["music", 49.86], ["throbbing", 24.09], ["hum", 6.06]], [["throbbing", 33.16], ["music", 21.95], ["moo", 7.5]], null, [["thunk", 85.71], ["music", 6.95], ["door", 1.45]], null, null, [["music", 46.87], ["speech", 15.14], ["didgeridoo", 9.21]], null, null, null, null, [["music", 52.93], ["whack, thwack", 18.01], ["throbbing", 3.81]], [["mains hum", 49.45], ["hum", 31.88], ["music", 7.06]]], "duration": [0.5, 0.91, 0.7, 5.72, 16.34, 1.94, 16.96, 6.82, 4.68, 2.02, 7.14, 0.49, 7.23, 5.28, -0.11, 3.8, -0.17, -0.03, 0.74, 2.62, 17.24, 10.66]} \ No newline at end of file diff --git a/annotations_1/uDAIoSeEoZA_filtered.json b/annotations_1/uDAIoSeEoZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0bc8fafbf9c8c39b3e43a3ba3fb6f70a7bcacac --- /dev/null +++ b/annotations_1/uDAIoSeEoZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.05], [11.0, 11.23], [19.0, 21.56], [38.0, 38.43], [44.0, 45.62], [47.0, 47.95], [54.0, 53.77], [55.0, 55.26], [57.0, 57.75], [62.0, 62.77]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["bee, wasp, etc.", 25.33], ["fly, housefly", 15.28], ["speech", 13.99]], null, null, null, null, null, null, null], "duration": [0.05, 0.23, 2.56, 0.43, 1.62, 0.95, -0.23, 0.26, 0.75, 0.77]} \ No newline at end of file diff --git a/annotations_1/uE8yYJmpxeI_filtered.json b/annotations_1/uE8yYJmpxeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b79a86137bd0360c6d867a3057f0dcc864e31fff --- /dev/null +++ b/annotations_1/uE8yYJmpxeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 31.21], [34.0, 48.57], [49.0, 55.95], [58.0, 64.23], [65.0, 83.37], [86.0, 99.1], [100.0, 120.11], [122.0, 123.57], [126.0, 126.27], [127.0, 130.08], [132.0, 132.87], [134.0, 134.4], [142.0, 143.56], [146.0, 148.26]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.01, 49.92, 31.08, 33.05, 38.11, 29.98, 42.55, 0.0, 0.0, 98.93, 0.0, 0.0, 0.0, 98.86], "audiomae_on_audioset": [[["music", 37.13], ["theremin", 15.07], ["synthesizer", 10.69]], [["music", 49.78], ["thunk", 8.65], ["theremin", 7.45]], [["fly, housefly", 46.2], ["mosquito", 26.24], ["insect", 11.99]], [["speech", 49.44], ["hum", 12.54], ["music", 10.33]], [["quack", 39.79], ["music", 36.47], ["duck", 6.17]], [["music", 57.1], ["whale vocalization", 22.43], ["sound effect", 1.99]], [["music", 49.13], ["bow-wow", 12.11], ["animal", 11.62]], null, null, null, null, null, null, null], "duration": [26.21, 14.57, 6.95, 6.23, 18.37, 13.1, 20.11, 1.57, 0.27, 3.08, 0.87, 0.4, 1.56, 2.26]} \ No newline at end of file diff --git a/annotations_1/uEMTQYe1ro0_filtered.json b/annotations_1/uEMTQYe1ro0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54eb56bd12da0a3f62c9ff06e066a790f121dfa0 --- /dev/null +++ b/annotations_1/uEMTQYe1ro0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 46.63], [47.0, 47.07], [47.0, 63.66], [72.0, 76.45], [78.0, 108.84], [109.0, 110.03], [110.0, 115.77], [117.0, 175.98], [179.0, 221.71], [223.0, 224.38]], "keep_status": [false, false, false, true, false, false, false, false, false, false], "silence_prob": [35.51, 0.0, 30.45, 29.91, 0.0, 0.0, 43.3, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 69.37], ["sine wave", 4.11], ["singing bowl", 3.78]], null, [["music", 75.84], ["musical instrument", 3.02], ["hum", 1.47]], [["fly, housefly", 30.99], ["mosquito", 30.9], ["mains hum", 5.8]], null, null, [["music", 73.07], ["rumble", 3.92], ["roaring cats (lions, tigers)", 3.92]], null, null, null], "duration": [21.63, 0.07, 16.66, 4.45, 30.84, 1.03, 5.77, 58.98, 42.71, 1.38]} \ No newline at end of file diff --git a/annotations_1/uETwKF_fgKw_filtered.json b/annotations_1/uETwKF_fgKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b721b8052d8d11704cdeb97b659fd3e5210de13 --- /dev/null +++ b/annotations_1/uETwKF_fgKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.93], [23.0, 30.89], [33.0, 36.26], [39.0, 40.54], [41.0, 41.27], [42.0, 42.3], [44.0, 44.78], [45.0, 63.37], [68.0, 69.92], [74.0, 74.38], [76.0, 76.57], [78.0, 86.56], [89.0, 93.02], [95.0, 135.94], [136.0, 138.0], [142.0, 142.37], [148.0, 148.37], [155.0, 159.92], [169.0, 168.91], [169.0, 187.44], [190.0, 200.04]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.07, 32.43, 0.0, 0.0, 0.0, 0.0, 34.14, 0.0, 0.0, 0.0, 31.57, 30.36, 0.0, 30.85, 0.0, 0.0, 30.95, 0.0, 30.74, 31.32], "audiomae_on_audioset": [null, [["music", 60.96], ["didgeridoo", 12.62], ["musical instrument", 7.85]], [["music", 43.94], ["didgeridoo", 11.52], ["synthesizer", 5.88]], null, null, null, null, [["music", 79.28], ["synthesizer", 3.37], ["thunk", 2.74]], null, null, null, [["music", 83.92], ["wind instrument, woodwind instrument", 2.31], ["musical instrument", 1.54]], [["music", 60.95], ["didgeridoo", 5.56], ["wind instrument, woodwind instrument", 4.22]], null, [["music", 57.39], ["boing", 13.85], ["quack", 4.87]], null, null, [["music", 53.71], ["speech", 11.34], ["clarinet", 8.56]], null, [["music", 80.01], ["speech", 2.75], ["quack", 2.11]], [["music", 61.9], ["wind instrument, woodwind instrument", 16.84], ["harmonica", 4.76]]], "duration": [0.93, 7.89, 3.26, 1.54, 0.27, 0.3, 0.78, 18.37, 1.92, 0.38, 0.57, 8.56, 4.02, 40.94, 2.0, 0.37, 0.37, 4.92, -0.09, 18.44, 10.04]} \ No newline at end of file diff --git a/annotations_1/uEW0FlmiNec_filtered.json b/annotations_1/uEW0FlmiNec_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e0d3e92273d6fe0783096a07d1d15c87e9730146 --- /dev/null +++ b/annotations_1/uEW0FlmiNec_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.49], [10.0, 10.76], [14.0, 16.8], [19.0, 21.02], [24.0, 24.51], [28.0, 29.03], [30.0, 30.92], [33.0, 33.54], [40.0, 41.12], [42.0, 43.5], [44.0, 44.85], [47.0, 50.9], [52.0, 53.42], [57.0, 58.13], [59.0, 60.72], [64.0, 67.1], [75.0, 76.42], [85.0, 87.2], [90.0, 90.19], [92.0, 95.2], [103.0, 105.51], [111.0, 112.45], [118.0, 117.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 50.21, 39.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 62.89, 0.0, 0.0, 0.0, 53.22, 0.0, 60.42, 0.0, 43.15, 71.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 30.28], ["speech", 28.02], ["synthesizer", 12.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.33], ["speech", 19.03], ["didgeridoo", 10.35]], null, null, null], "duration": [0.49, 0.76, 2.8, 2.02, 0.51, 1.03, 0.92, 0.54, 1.12, 1.5, 0.85, 3.9, 1.42, 1.13, 1.72, 3.1, 1.42, 2.2, 0.19, 3.2, 2.51, 1.45, -0.22]} \ No newline at end of file diff --git a/annotations_1/uFNIrs3jtEQ_filtered.json b/annotations_1/uFNIrs3jtEQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b4120b3d226d54a86c4c8b51070e6644a7d773e8 --- /dev/null +++ b/annotations_1/uFNIrs3jtEQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.23], [12.0, 13.14], [13.0, 17.0], [19.0, 19.4], [21.0, 21.59], [22.0, 23.16], [25.0, 26.42], [27.0, 28.05], [29.0, 29.59], [30.0, 31.83], [37.0, 37.03], [38.0, 38.99], [41.0, 42.75], [43.0, 44.19], [47.0, 49.44], [53.0, 55.49], [57.0, 60.64], [63.0, 63.59], [83.0, 84.28], [85.0, 86.04], [87.0, 87.03], [90.0, 90.71], [94.0, 94.63], [97.0, 99.77], [101.0, 100.89], [102.0, 102.32], [108.0, 109.16], [111.0, 110.89], [115.0, 116.82], [118.0, 117.96], [121.0, 122.67], [125.0, 127.6], [130.0, 135.9], [146.0, 147.88], [150.0, 150.13], [151.0, 150.7], [153.0, 154.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.92, 100.0, 67.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.74, 42.33, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.87], ["telephone", 12.35], ["dial tone", 4.3]], null, null, null, null], "duration": [0.23, 1.14, 4.0, 0.4, 0.59, 1.16, 1.42, 1.05, 0.59, 1.83, 0.03, 0.99, 1.75, 1.19, 2.44, 2.49, 3.64, 0.59, 1.28, 1.04, 0.03, 0.71, 0.63, 2.77, -0.11, 0.32, 1.16, -0.11, 1.82, -0.04, 1.67, 2.6, 5.9, 1.88, 0.13, -0.3, 1.47]} \ No newline at end of file diff --git a/annotations_1/uFTd09NNJzo_filtered.json b/annotations_1/uFTd09NNJzo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec8c8e08b39e5a70785797f2d84891468e37f34f --- /dev/null +++ b/annotations_1/uFTd09NNJzo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.43], [8.0, 9.39], [11.0, 11.35], [15.0, 147.45], [151.0, 152.56]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [0.43, 1.39, 0.35, 132.45, 1.56]} \ No newline at end of file diff --git a/annotations_1/uG_KHjd_PSc_filtered.json b/annotations_1/uG_KHjd_PSc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35b8f42cab7fc85ec23fba0679e377a74555d4a0 --- /dev/null +++ b/annotations_1/uG_KHjd_PSc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.31], [2.0, 2.32], [14.0, 17.58], [19.0, 20.85], [28.0, 32.46], [33.0, 36.81], [39.0, 40.54], [41.0, 42.33], [43.0, 44.02], [47.0, 48.32], [49.0, 50.13], [51.0, 51.81], [56.0, 55.98], [64.0, 65.43], [72.0, 72.55], [75.0, 91.39], [92.0, 93.97], [95.0, 95.69], [97.0, 96.92], [101.0, 104.45], [106.0, 112.36], [115.0, 115.77], [118.0, 118.25], [123.0, 124.29], [127.0, 130.89], [132.0, 133.35], [135.0, 135.01], [139.0, 138.81], [143.0, 145.74], [150.0, 151.34], [153.0, 154.01], [157.0, 157.17], [158.0, 158.3], [160.0, 162.13], [163.0, 163.49], [168.0, 168.84], [171.0, 172.25], [174.0, 177.45]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 33.85, 0.0, 36.78, 36.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.6, 0.0, 0.0, 0.0, 29.0, 29.03, 0.0, 0.0, 0.0, 39.47, 0.0, 0.0, 0.0, 55.89, 0.0, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 0.0, 52.27], "audiomae_on_audioset": [null, null, [["music", 67.49], ["musical instrument", 3.53], ["guitar", 2.31]], null, [["hum", 24.81], ["speech", 11.13], ["mains hum", 8.18]], [["hum", 33.5], ["speech", 16.44], ["mains hum", 6.58]], null, null, null, null, null, null, null, null, null, [["sonar", 25.86], ["music", 17.31], ["hum", 15.76]], null, null, null, [["speech", 23.75], ["music", 9.56], ["radio", 5.12]], [["music", 63.34], ["didgeridoo", 18.3], ["speech", 5.07]], null, null, null, [["speech", 50.48], ["throbbing", 12.62], ["music", 8.11]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.31, 0.32, 3.58, 1.85, 4.46, 3.81, 1.54, 1.33, 1.02, 1.32, 1.13, 0.81, -0.02, 1.43, 0.55, 16.39, 1.97, 0.69, -0.08, 3.45, 6.36, 0.77, 0.25, 1.29, 3.89, 1.35, 0.01, -0.19, 2.74, 1.34, 1.01, 0.17, 0.3, 2.13, 0.49, 0.84, 1.25, 3.45]} \ No newline at end of file diff --git a/annotations_1/uHltDaQU1uc_filtered.json b/annotations_1/uHltDaQU1uc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6f90890f85b525721241f9fb753b2e54a4ec32a7 --- /dev/null +++ b/annotations_1/uHltDaQU1uc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 23.72], [25.0, 27.13], [29.0, 29.69], [34.0, 48.56], [49.0, 48.59], [51.0, 63.36], [67.0, 69.28], [71.0, 72.99], [73.0, 74.46], [86.0, 86.9], [91.0, 92.43], [94.0, 95.13], [100.0, 108.19], [112.0, 125.46], [127.0, 130.08], [131.0, 131.57], [133.0, 133.41], [134.0, 142.87], [146.0, 147.07], [150.0, 153.25], [154.0, 155.07], [157.0, 160.49], [164.0, 165.35], [166.0, 168.94]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false, true], "silence_prob": [42.58, 51.34, 0.0, 33.52, 0.0, 38.4, 37.14, 0.0, 0.0, 0.0, 0.0, 0.0, 31.99, 33.82, 31.96, 0.0, 0.0, 29.18, 0.0, 30.39, 0.0, 37.63, 0.0, 29.41], "audiomae_on_audioset": [[["music", 67.43], ["speech", 9.19], ["electronic music", 3.6]], null, null, [["music", 39.12], ["throbbing", 35.53], ["hum", 6.77]], null, [["music", 56.4], ["didgeridoo", 6.35], ["throbbing", 5.36]], [["music", 69.07], ["throbbing", 8.53], ["hum", 2.23]], null, null, null, null, null, [["music", 82.3], ["musical instrument", 1.07], ["middle eastern music", 0.87]], [["music", 82.7], ["throbbing", 2.97], ["hum", 1.81]], [["music", 32.16], ["hum", 6.9], ["throbbing", 5.32]], null, null, [["speech", 62.41], ["music", 17.13], ["explosion", 4.18]], null, [["throbbing", 22.86], ["music", 22.62], ["scratching (performance technique)", 4.54]], null, [["music", 36.18], ["whale vocalization", 23.3], ["speech", 4.2]], null, [["theremin", 26.15], ["music", 19.59], ["synthesizer", 6.98]]], "duration": [7.72, 2.13, 0.69, 14.56, -0.41, 12.36, 2.28, 1.99, 1.46, 0.9, 1.43, 1.13, 8.19, 13.46, 3.08, 0.57, 0.41, 8.87, 1.07, 3.25, 1.07, 3.49, 1.35, 2.94]} \ No newline at end of file diff --git a/annotations_1/uHuDwL4XEUE_filtered.json b/annotations_1/uHuDwL4XEUE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e2b5f69a23579b23f9920e313384a2b062f9739 --- /dev/null +++ b/annotations_1/uHuDwL4XEUE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.99], [8.0, 9.15], [10.0, 10.27], [11.0, 14.35], [17.0, 17.25], [20.0, 21.44], [25.0, 26.18], [28.0, 33.91], [35.0, 38.43], [39.0, 40.54], [48.0, 52.0], [55.0, 61.57], [63.0, 68.39], [69.0, 72.05], [73.0, 77.45], [78.0, 84.15], [85.0, 86.24], [86.0, 96.01], [99.0, 111.94], [112.0, 112.02], [112.0, 112.16], [115.0, 119.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 90.25, 0.0, 0.0, 0.0, 93.91, 91.3, 0.0, 95.09, 95.09, 92.48, 98.8, 98.36, 95.23, 0.0, 80.64, 99.82, 0.0, 0.0, 99.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 1.15, 0.27, 3.35, 0.25, 1.44, 1.18, 5.91, 3.43, 1.54, 4.0, 6.57, 5.39, 3.05, 4.45, 6.15, 1.24, 10.01, 12.94, 0.02, 0.16, 4.45]} \ No newline at end of file diff --git a/annotations_1/uI7ijvSCHcI_filtered.json b/annotations_1/uI7ijvSCHcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d52a564432690e3c08f41dbe32b253c8a124d43a --- /dev/null +++ b/annotations_1/uI7ijvSCHcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.24], [6.0, 21.12], [21.0, 28.53], [29.0, 54.24], [57.0, 58.51], [73.0, 76.67], [77.0, 88.32], [90.0, 95.05], [100.0, 103.79], [107.0, 119.55], [127.0, 127.72], [145.0, 145.29], [146.0, 146.28], [152.0, 153.4], [157.0, 157.82], [158.0, 161.7], [171.0, 171.73], [172.0, 180.69]], "keep_status": [false, true, true, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.51, 31.89, 32.16, 0.0, 34.05, 32.71, 31.62, 32.38, 32.16, 0.0, 0.0, 0.0, 0.0, 0.0, 32.02, 0.0, 85.17], "audiomae_on_audioset": [null, [["hum", 27.97], ["speech", 17.9], ["throbbing", 15.65]], [["sidetone", 35.4], ["speech", 20.97], ["music", 13.56]], [["music", 23.42], ["livestock, farm animals, working animals", 13.22], ["cattle, bovinae", 8.1]], null, [["fly, housefly", 59.92], ["insect", 28.5], ["mosquito", 4.6]], [["speech", 39.39], ["music", 31.18], ["buzz", 6.12]], [["music", 25.37], ["speech", 23.28], ["hum", 7.54]], [["whale vocalization", 34.86], ["music", 25.48], ["hum", 10.61]], [["music", 50.59], ["theremin", 4.02], ["hum", 3.82]], null, null, null, null, null, [["fly, housefly", 43.5], ["insect", 21.56], ["mosquito", 20.21]], null, null], "duration": [0.24, 15.12, 7.53, 25.24, 1.51, 3.67, 11.32, 5.05, 3.79, 12.55, 0.72, 0.29, 0.28, 1.4, 0.82, 3.7, 0.73, 8.69]} \ No newline at end of file diff --git a/annotations_1/uIsdG0ydS5o_filtered.json b/annotations_1/uIsdG0ydS5o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b219e8be4484805a2f5aeb9717a159d29d893bb6 --- /dev/null +++ b/annotations_1/uIsdG0ydS5o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.42], [8.0, 11.37], [15.0, 16.04], [16.0, 16.07], [16.0, 24.44], [24.0, 27.41], [29.0, 29.93], [50.0, 51.21], [56.0, 58.02], [59.0, 60.98], [71.0, 72.45], [84.0, 84.38], [85.0, 86.05], [96.0, 104.08], [106.0, 108.01], [110.0, 116.02], [120.0, 120.02], [120.0, 120.14], [120.0, 120.65], [125.0, 125.49], [127.0, 127.75], [129.0, 135.55], [142.0, 142.37], [143.0, 145.27], [147.0, 150.99], [154.0, 161.62], [166.0, 166.5], [172.0, 180.15], [182.0, 190.27], [195.0, 196.11], [201.0, 207.17], [210.0, 219.94], [221.0, 221.49], [222.0, 223.91], [225.0, 228.48]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, true, false, true, true, false, false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 38.67, 0.0, 0.0, 29.41, 28.97, 0.0, 0.0, 30.62, 0.0, 0.0, 0.0, 0.0, 34.17, 35.18, 32.1, 0.0, 0.0, 0.0, 0.0, 0.0, 29.96, 0.0, 29.51, 30.8, 29.91, 0.0, 29.97, 30.1, 0.0, 29.89, 36.58, 0.0, 0.0, 28.91], "audiomae_on_audioset": [null, [["music", 59.29], ["throbbing", 7.93], ["hum", 6.35]], null, null, [["music", 53.93], ["throbbing", 18.77], ["hum", 7.8]], [["music", 26.96], ["hum", 12.84], ["animal", 6.44]], null, null, [["speech", 65.53], ["radio", 2.85], ["static", 2.18]], null, null, null, null, [["speech", 36.51], ["music", 17.4], ["hum", 6.58]], [["hum", 33.84], ["throbbing", 26.47], ["music", 16.72]], [["music", 27.73], ["speech", 17.17], ["animal", 11.34]], null, null, null, null, null, [["music", 38.93], ["speech", 23.47], ["throbbing", 6.75]], null, [["speech", 25.35], ["music", 12.09], ["sound effect", 6.41]], [["skateboard", 19.44], ["speech", 12.78], ["whip", 11.5]], [["music", 30.97], ["boing", 28.99], ["speech", 12.75]], null, [["speech", 49.11], ["music", 24.22], ["groan", 3.49]], [["speech", 41.23], ["music", 28.92], ["whack, thwack", 6.64]], null, [["music", 42.11], ["throbbing", 13.88], ["hum", 13.35]], [["music", 49.03], ["speech", 19.18], ["theremin", 9.22]], null, null, [["music", 18.86], ["whack, thwack", 13.89], ["whip", 13.59]]], "duration": [0.42, 3.37, 1.04, 0.07, 8.44, 3.41, 0.93, 1.21, 2.02, 1.98, 1.45, 0.38, 1.05, 8.08, 2.01, 6.02, 0.02, 0.14, 0.65, 0.49, 0.75, 6.55, 0.37, 2.27, 3.99, 7.62, 0.5, 8.15, 8.27, 1.11, 6.17, 9.94, 0.49, 1.91, 3.48]} \ No newline at end of file diff --git a/annotations_1/uLhrOeavvOY_filtered.json b/annotations_1/uLhrOeavvOY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db325f29442a9d33ee3d6c634baa42103e30df34 --- /dev/null +++ b/annotations_1/uLhrOeavvOY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 26.47], [31.0, 31.56], [32.0, 90.44], [91.0, 91.77], [92.0, 91.84], [92.0, 92.11], [93.0, 94.9], [98.0, 113.68], [115.0, 119.77], [121.0, 123.96], [125.0, 148.74]], "keep_status": [false, false, false, false, false, false, false, true, true, true, true], "silence_prob": [41.85, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.21, 47.82, 48.52, 42.98], "audiomae_on_audioset": [[["speech", 45.92], ["music", 24.28], ["musical instrument", 3.4]], null, null, null, null, null, null, [["speech", 23.55], ["music", 20.59], ["breaking", 5.37]], [["music", 37.7], ["splinter", 13.58], ["crushing", 8.54]], [["music", 22.83], ["singing bowl", 15.0], ["gong", 6.86]], [["music", 31.93], ["singing bowl", 16.2], ["ambient music", 10.88]]], "duration": [7.47, 0.56, 58.44, 0.77, -0.16, 0.11, 1.9, 15.68, 4.77, 2.96, 23.74]} \ No newline at end of file diff --git a/annotations_1/uNcKTuAqLag_filtered.json b/annotations_1/uNcKTuAqLag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d6fdb4186a16a7dd557703758d5b643a5d43c41f --- /dev/null +++ b/annotations_1/uNcKTuAqLag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.48], [8.0, 8.45], [10.0, 11.55], [13.0, 13.9], [17.0, 18.01], [23.0, 25.81], [27.0, 27.62], [29.0, 29.79], [35.0, 37.67], [39.0, 39.38], [40.0, 46.87], [51.0, 52.71], [57.0, 58.43], [61.0, 61.86], [64.0, 64.72], [66.0, 68.32], [73.0, 74.22], [80.0, 81.58], [82.0, 83.74], [87.0, 87.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.6, 0.0, 0.0, 0.0, 0.0, 77.7, 0.0, 0.0, 56.4, 0.0, 81.35, 0.0, 0.0, 0.0, 0.0, 55.25, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.48, 0.45, 1.55, 0.9, 1.01, 2.81, 0.62, 0.79, 2.67, 0.38, 6.87, 1.71, 1.43, 0.86, 0.72, 2.32, 1.22, 1.58, 1.74, 0.49]} \ No newline at end of file diff --git a/annotations_1/uNjrnjiEEY8_filtered.json b/annotations_1/uNjrnjiEEY8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1a29cbff34568141c094ff69ee6cf679892aaa3 --- /dev/null +++ b/annotations_1/uNjrnjiEEY8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.19], [13.0, 13.39], [14.0, 15.3], [17.0, 19.04], [21.0, 22.54], [33.0, 32.53], [34.0, 36.63], [41.0, 43.6], [49.0, 48.9], [55.0, 55.71], [56.0, 56.76], [57.0, 56.84], [57.0, 60.76], [64.0, 64.3], [70.0, 74.68], [77.0, 78.97], [87.0, 91.62], [110.0, 110.52], [113.0, 113.39], [116.0, 118.18], [119.0, 119.03], [120.0, 121.26], [123.0, 123.85], [126.0, 126.4], [128.0, 130.2], [135.0, 137.39], [139.0, 140.66], [141.0, 141.86], [144.0, 149.86], [151.0, 151.71], [153.0, 155.36]], "keep_status": [false, false, false, false, false, false, true, true, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 38.46, 0.0, 0.0, 31.46, 33.4, 0.0, 0.0, 0.0, 0.0, 36.02, 0.0, 36.67, 0.0, 97.0, 0.0, 0.0, 69.2, 0.0, 0.0, 0.0, 0.0, 95.37, 94.52, 0.0, 0.0, 64.18, 0.0, 58.64], "audiomae_on_audioset": [null, null, null, [["music", 65.85], ["fart", 7.93], ["mosquito", 1.61]], null, null, [["music", 33.15], ["groan", 13.83], ["bleat", 10.15]], [["boing", 25.48], ["music", 19.1], ["mosquito", 7.66]], null, null, null, null, [["music", 40.99], ["boing", 18.14], ["salsa music", 4.53]], null, [["music", 36.88], ["speech", 11.25], ["boing", 7.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.19, 0.39, 1.3, 2.04, 1.54, -0.47, 2.63, 2.6, -0.1, 0.71, 0.76, -0.16, 3.76, 0.3, 4.68, 1.97, 4.62, 0.52, 0.39, 2.18, 0.03, 1.26, 0.85, 0.4, 2.2, 2.39, 1.66, 0.86, 5.86, 0.71, 2.36]} \ No newline at end of file diff --git a/annotations_1/uOHMPcGgInI_filtered.json b/annotations_1/uOHMPcGgInI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..038f0d3a7abd5669d92ec4d90b018d2d9deb741e --- /dev/null +++ b/annotations_1/uOHMPcGgInI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 23.06], [32.0, 33.34], [33.0, 58.72], [61.0, 77.21], [80.0, 86.66], [88.0, 121.81], [123.0, 123.36], [125.0, 130.05], [131.0, 131.92], [134.0, 135.3], [136.0, 141.12], [144.0, 144.83], [146.0, 155.16], [156.0, 157.47], [158.0, 167.75], [168.0, 177.35]], "keep_status": [true, false, false, true, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [29.33, 0.0, 28.62, 28.74, 30.36, 0.0, 0.0, 30.66, 0.0, 0.0, 29.2, 0.0, 30.15, 0.0, 28.86, 29.57], "audiomae_on_audioset": [[["music", 22.56], ["throbbing", 20.9], ["hum", 12.86]], null, [["music", 56.77], ["speech", 20.53], ["buzz", 7.5]], [["music", 32.45], ["speech", 25.13], ["buzz", 4.39]], [["fly, housefly", 66.01], ["insect", 13.67], ["bee, wasp, etc.", 4.21]], null, null, [["speech", 25.51], ["fly, housefly", 16.78], ["insect", 8.94]], null, null, [["music", 10.17], ["insect", 9.41], ["fly, housefly", 8.89]], null, [["music", 50.09], ["speech", 29.74], ["mains hum", 3.46]], null, [["music", 66.96], ["mains hum", 10.27], ["hum", 3.99]], [["speech", 69.78], ["music", 9.77], ["outside, rural or natural", 1.5]]], "duration": [13.06, 1.34, 25.72, 16.21, 6.66, 33.81, 0.36, 5.05, 0.92, 1.3, 5.12, 0.83, 9.16, 1.47, 9.75, 9.35]} \ No newline at end of file diff --git a/annotations_1/uPFxRUeRfu8_filtered.json b/annotations_1/uPFxRUeRfu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..675e044daa1e4469b1b609eac8a4caf06b9d5f18 --- /dev/null +++ b/annotations_1/uPFxRUeRfu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.05], [8.0, 8.67], [14.0, 32.0], [40.0, 46.43], [47.0, 48.79], [51.0, 55.85], [56.0, 57.55], [58.0, 74.22], [76.0, 102.24]], "keep_status": [false, false, false, true, false, false, false, true, true], "silence_prob": [0.0, 0.0, 29.98, 32.71, 0.0, 42.98, 0.0, 29.78, 29.43], "audiomae_on_audioset": [null, null, [["mains hum", 37.94], ["hum", 28.45], ["music", 12.43]], [["music", 36.72], ["hum", 14.48], ["mains hum", 12.01]], null, [["music", 65.8], ["animal", 4.57], ["speech", 4.51]], null, [["speech", 46.69], ["vehicle", 13.9], ["car", 6.08]], [["fly, housefly", 19.81], ["insect", 10.27], ["music", 9.27]]], "duration": [1.05, 0.67, 18.0, 6.43, 1.79, 4.85, 1.55, 16.22, 26.24]} \ No newline at end of file diff --git a/annotations_1/uPQcsSuWlB4_filtered.json b/annotations_1/uPQcsSuWlB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..54249ee13160168553f0d841d15424448819cb7b --- /dev/null +++ b/annotations_1/uPQcsSuWlB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 23.43], [24.0, 26.27], [30.0, 82.07], [84.0, 85.51], [87.0, 87.2], [88.0, 120.07]], "keep_status": [true, true, false, false, false, false], "silence_prob": [32.24, 33.4, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 40.79], ["music", 17.28], ["hum", 4.97]], [["hum", 19.18], ["speech", 18.53], ["rumble", 15.05]], null, null, null, null], "duration": [2.43, 2.27, 52.07, 1.51, 0.2, 32.07]} \ No newline at end of file diff --git a/annotations_1/uPS3iKFXKR4_filtered.json b/annotations_1/uPS3iKFXKR4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8c4c6f1331625f68f466ccfa19dbd16849e23cc --- /dev/null +++ b/annotations_1/uPS3iKFXKR4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.88], [12.0, 12.65], [16.0, 22.33], [24.0, 25.91], [29.0, 37.3], [39.0, 40.14], [48.0, 47.83], [48.0, 50.16], [52.0, 54.7], [57.0, 57.92], [62.0, 64.61], [66.0, 67.8], [68.0, 69.82], [74.0, 80.32], [83.0, 84.1], [90.0, 91.67], [92.0, 94.1], [100.0, 100.11], [100.0, 124.29], [129.0, 130.32], [131.0, 131.57], [132.0, 133.64], [135.0, 135.67], [137.0, 136.98], [138.0, 138.5], [142.0, 142.55], [143.0, 144.54], [145.0, 155.41], [157.0, 157.69], [163.0, 165.3], [167.0, 170.55], [172.0, 174.36], [175.0, 177.6]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.64, 0.0, 87.55, 0.0, 99.95, 0.0, 0.0, 94.07, 100.0, 0.0, 97.0, 0.0, 0.0, 70.02, 0.0, 0.0, 81.53, 0.0, 34.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.02, 0.0, 62.68, 91.13, 83.52, 79.76], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.27], ["hum", 21.42], ["synthesizer", 9.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.88, 0.65, 6.33, 1.91, 8.3, 1.14, -0.17, 2.16, 2.7, 0.92, 2.61, 1.8, 1.82, 6.32, 1.1, 1.67, 2.1, 0.11, 24.29, 1.32, 0.57, 1.64, 0.67, -0.02, 0.5, 0.55, 1.54, 10.41, 0.69, 2.3, 3.55, 2.36, 2.6]} \ No newline at end of file diff --git a/annotations_1/uQR_i0ydJik_filtered.json b/annotations_1/uQR_i0ydJik_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..893e4b5816f066e6b20d493c86dfdd2dfc834ba2 --- /dev/null +++ b/annotations_1/uQR_i0ydJik_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 19.2], [22.0, 23.16], [24.0, 25.2], [29.0, 29.81], [31.0, 31.75], [33.0, 34.94], [45.0, 46.06], [48.0, 48.9], [54.0, 54.21], [55.0, 55.46], [57.0, 57.3], [61.0, 61.79], [62.0, 63.27], [69.0, 68.81], [73.0, 73.74], [79.0, 79.79], [84.0, 85.53]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [47.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 36.09], ["tubular bells", 13.64], ["singing bowl", 4.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.2, 1.16, 1.2, 0.81, 0.75, 1.94, 1.06, 0.9, 0.21, 0.46, 0.3, 0.79, 1.27, -0.19, 0.74, 0.79, 1.53]} \ No newline at end of file diff --git a/annotations_1/uQ_nGVp6x6U_filtered.json b/annotations_1/uQ_nGVp6x6U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d1f4c656c412879f3d17789709945f30be6108f --- /dev/null +++ b/annotations_1/uQ_nGVp6x6U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.46], [17.0, 18.69], [21.0, 26.45], [27.0, 28.21], [29.0, 29.22], [32.0, 32.26], [37.0, 37.81], [40.0, 42.04], [46.0, 46.57], [47.0, 73.2], [74.0, 76.11], [90.0, 91.59], [96.0, 96.13], [97.0, 97.92], [102.0, 102.9], [107.0, 107.23], [113.0, 114.61], [126.0, 127.16], [129.0, 129.56], [131.0, 132.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.43, 0.0, 0.0, 0.0, 0.0, 54.43, 0.0, 30.09, 31.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 72.63], ["crushing", 4.7], ["animal", 1.82]], null, null, null, null, null, null, [["music", 72.56], ["drum machine", 5.87], ["electronic music", 3.18]], [["music", 74.8], ["musical instrument", 4.68], ["guitar", 4.04]], null, null, null, null, null, null, null, null, null], "duration": [0.46, 1.69, 5.45, 1.21, 0.22, 0.26, 0.81, 2.04, 0.57, 26.2, 2.11, 1.59, 0.13, 0.92, 0.9, 0.23, 1.61, 1.16, 0.56, 1.44]} \ No newline at end of file diff --git a/annotations_1/uQpHx3lBGms_filtered.json b/annotations_1/uQpHx3lBGms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b55df901555e1e3b72732101158555aeff4b404c --- /dev/null +++ b/annotations_1/uQpHx3lBGms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.33], [19.0, 20.04], [22.0, 27.3], [31.0, 49.33], [51.0, 53.42], [60.0, 63.09], [64.0, 66.8], [68.0, 89.13]], "keep_status": [false, false, true, true, true, false, true, true], "silence_prob": [0.0, 0.0, 46.61, 36.27, 36.25, 34.13, 32.85, 28.48], "audiomae_on_audioset": [null, null, [["hum", 29.94], ["mains hum", 24.88], ["throbbing", 11.68]], [["speech", 21.67], ["mains hum", 16.87], ["hum", 14.76]], [["microwave oven", 13.34], ["hum", 12.77], ["vehicle", 8.99]], [["music", 39.12], ["mains hum", 25.84], ["hum", 14.46]], [["music", 34.07], ["mains hum", 17.01], ["hum", 10.05]], [["music", 27.81], ["speech", 18.48], ["hum", 16.09]]], "duration": [0.33, 1.04, 5.3, 18.33, 2.42, 3.09, 2.8, 21.13]} \ No newline at end of file diff --git a/annotations_1/uR7yS87K1tA_filtered.json b/annotations_1/uR7yS87K1tA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33eb59f7fccf5b6db7bf258bead489c24062e6e1 --- /dev/null +++ b/annotations_1/uR7yS87K1tA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.45], [1.0, 3.25], [7.0, 9.14], [10.0, 11.23], [15.0, 15.63], [18.0, 19.13], [23.0, 22.91], [26.0, 26.16], [30.0, 30.79], [33.0, 34.53], [35.0, 37.2], [38.0, 39.61], [41.0, 41.52], [47.0, 48.02], [58.0, 58.65], [60.0, 61.99], [64.0, 65.11], [68.0, 67.71], [71.0, 72.42], [73.0, 74.21], [81.0, 81.7], [83.0, 83.54], [86.0, 86.48], [87.0, 88.23], [95.0, 95.28], [101.0, 102.12], [103.0, 104.87], [107.0, 108.78], [114.0, 113.98], [116.0, 116.55], [118.0, 119.74], [120.0, 121.78], [123.0, 123.79], [124.0, 125.41], [126.0, 126.55], [140.0, 140.37], [141.0, 142.47], [144.0, 146.15], [147.0, 147.77], [153.0, 157.27], [158.0, 160.2], [161.0, 162.55], [163.0, 164.86], [166.0, 168.47], [170.0, 171.54], [173.0, 173.74], [174.0, 179.07], [179.0, 181.35], [183.0, 183.41], [187.0, 188.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.96, 97.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.17, 0.0, 99.99, 99.97, 0.0, 0.0, 99.96, 0.0, 0.0, 90.6, 53.22, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.45, 2.25, 2.14, 1.23, 0.63, 1.13, -0.09, 0.16, 0.79, 1.53, 2.2, 1.61, 0.52, 1.02, 0.65, 1.99, 1.11, -0.29, 1.42, 1.21, 0.7, 0.54, 0.48, 1.23, 0.28, 1.12, 1.87, 1.78, -0.02, 0.55, 1.74, 1.78, 0.79, 1.41, 0.55, 0.37, 1.47, 2.15, 0.77, 4.27, 2.2, 1.55, 1.86, 2.47, 1.54, 0.74, 5.07, 2.35, 0.41, 1.52]} \ No newline at end of file diff --git a/annotations_1/uRjbDsGz2tc_filtered.json b/annotations_1/uRjbDsGz2tc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a62d7272f5431d759fd679c6ffff484782f5554a --- /dev/null +++ b/annotations_1/uRjbDsGz2tc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.42], [8.0, 9.78], [12.0, 14.27], [25.0, 27.84], [29.0, 30.72], [32.0, 40.63], [41.0, 59.49], [60.0, 60.37], [61.0, 61.91], [63.0, 63.41], [68.0, 69.21], [72.0, 72.28], [73.0, 76.38], [81.0, 81.55], [87.0, 87.89], [91.0, 91.74], [95.0, 95.74], [99.0, 99.72], [104.0, 103.64], [107.0, 109.38], [113.0, 115.11], [116.0, 117.56], [118.0, 120.85], [122.0, 123.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [94.22, 0.0, 100.0, 97.92, 0.0, 90.95, 60.42, 0.0, 0.0, 0.0, 0.0, 0.0, 89.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.97, 45.72, 0.0, 51.6, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.58], ["guitar", 13.8], ["musical instrument", 11.16]], null, null, null], "duration": [2.42, 1.78, 2.27, 2.84, 1.72, 8.63, 18.49, 0.37, 0.91, 0.41, 1.21, 0.28, 3.38, 0.55, 0.89, 0.74, 0.74, 0.72, -0.36, 2.38, 2.11, 1.56, 2.85, 1.96]} \ No newline at end of file diff --git a/annotations_1/uSCNsJDEf1M_filtered.json b/annotations_1/uSCNsJDEf1M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f022e590cd6cdbd32545dc0e228f17059326c697 --- /dev/null +++ b/annotations_1/uSCNsJDEf1M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.8], [11.0, 15.18], [17.0, 17.54], [20.0, 34.18], [35.0, 36.9], [37.0, 42.33], [45.0, 51.51], [52.0, 53.52], [59.0, 65.21], [66.0, 66.6], [68.0, 68.88], [70.0, 71.52], [73.0, 73.82], [81.0, 90.24], [91.0, 92.13], [95.0, 99.79], [101.0, 102.54], [103.0, 104.03], [105.0, 106.86], [108.0, 115.35], [117.0, 117.66], [119.0, 119.08], [120.0, 119.77], [120.0, 123.42]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.15, 0.0, 38.95, 0.0, 34.14, 52.39, 0.0, 51.55, 0.0, 0.0, 0.0, 0.0, 51.34, 0.0, 94.22, 0.0, 0.0, 0.0, 46.33, 0.0, 0.0, 0.0, 82.97], "audiomae_on_audioset": [null, [["speech", 57.92], ["sidetone", 29.03], ["music", 2.77]], null, [["crushing", 24.34], ["noise", 18.19], ["music", 10.98]], null, [["speech", 51.88], ["sidetone", 8.5], ["fart", 5.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.4], ["music", 13.78], ["effects unit", 3.86]], null, null, null, null], "duration": [1.8, 4.18, 0.54, 14.18, 1.9, 5.33, 6.51, 1.52, 6.21, 0.6, 0.88, 1.52, 0.82, 9.24, 1.13, 4.79, 1.54, 1.03, 1.86, 7.35, 0.66, 0.08, -0.23, 3.42]} \ No newline at end of file diff --git a/annotations_1/uSLscJ2cY04_filtered.json b/annotations_1/uSLscJ2cY04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5a0c425c7ce666dca99ca7cf12269b2eab36fc5 --- /dev/null +++ b/annotations_1/uSLscJ2cY04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.54], [5.0, 10.37], [15.0, 15.55], [25.0, 25.47], [28.0, 28.65], [35.0, 36.07], [44.0, 44.14], [45.0, 46.94], [58.0, 59.64], [61.0, 61.57], [64.0, 65.33], [69.0, 70.39], [74.0, 74.93], [83.0, 83.4], [89.0, 89.07], [90.0, 91.4], [101.0, 102.27], [106.0, 106.59], [111.0, 111.64], [124.0, 124.55], [125.0, 126.74], [129.0, 128.61], [158.0, 159.14], [162.0, 162.33], [168.0, 169.55], [170.0, 170.83], [173.0, 174.02], [178.0, 178.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 5.37, 0.55, 0.47, 0.65, 1.07, 0.14, 1.94, 1.64, 0.57, 1.33, 1.39, 0.93, 0.4, 0.07, 1.4, 1.27, 0.59, 0.64, 0.55, 1.74, -0.39, 1.14, 0.33, 1.55, 0.83, 1.02, 0.75]} \ No newline at end of file diff --git a/annotations_1/uSMxnpecSZM_filtered.json b/annotations_1/uSMxnpecSZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8ef6fd365fc6852ec3875118fe8761efc9eafc69 --- /dev/null +++ b/annotations_1/uSMxnpecSZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[100.0, 101.22], [103.0, 104.38], [104.0, 120.29], [135.0, 135.65], [140.0, 152.64], [154.0, 155.71]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 31.18, 0.0, 32.91, 0.0], "audiomae_on_audioset": [null, null, [["music", 75.55], ["musical instrument", 4.23], ["trombone", 4.19]], null, [["music", 27.83], ["moo", 13.8], ["cattle, bovinae", 12.49]], null], "duration": [1.22, 1.38, 16.29, 0.65, 12.64, 1.71]} \ No newline at end of file diff --git a/annotations_1/uSZi8oPRUkE_filtered.json b/annotations_1/uSZi8oPRUkE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e07f02fec5119eb6d6ebed29b45ce9aac9db1a81 --- /dev/null +++ b/annotations_1/uSZi8oPRUkE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 17.78], [19.0, 21.14], [24.0, 32.26], [33.0, 34.11], [35.0, 35.01], [36.0, 38.4], [39.0, 40.36], [42.0, 48.78], [49.0, 48.9], [52.0, 58.7], [67.0, 72.28], [74.0, 76.32], [77.0, 80.81], [87.0, 89.07], [90.0, 91.05], [94.0, 102.68], [107.0, 125.29]], "keep_status": [false, false, true, false, false, true, false, true, false, true, true, true, true, false, false, false, true], "silence_prob": [32.11, 50.76, 29.99, 0.0, 0.0, 29.26, 0.0, 37.61, 0.0, 29.98, 35.87, 48.95, 37.16, 33.34, 0.0, 32.21, 31.32], "audiomae_on_audioset": [[["music", 36.59], ["hum", 32.55], ["mains hum", 13.23]], null, [["music", 47.81], ["hum", 12.34], ["mains hum", 5.84]], null, null, [["whale vocalization", 18.75], ["music", 13.47], ["sound effect", 8.37]], null, [["music", 20.5], ["insect", 9.55], ["animal", 8.07]], null, [["fly, housefly", 17.6], ["music", 13.47], ["buzz", 12.15]], [["music", 37.0], ["throbbing", 12.87], ["hum", 12.21]], [["music", 35.73], ["speech", 12.72], ["theremin", 3.62]], [["music", 58.78], ["speech", 6.18], ["electronic music", 3.85]], [["music", 32.75], ["speech", 26.35], ["sidetone", 22.63]], null, [["music", 44.67], ["speech", 34.75], ["outside, rural or natural", 1.31]], [["music", 35.64], ["hum", 10.46], ["speech", 9.74]]], "duration": [10.78, 2.14, 8.26, 1.11, 0.01, 2.4, 1.36, 6.78, -0.1, 6.7, 5.28, 2.32, 3.81, 2.07, 1.05, 8.68, 18.29]} \ No newline at end of file diff --git a/annotations_1/uTOoWlYv95w_filtered.json b/annotations_1/uTOoWlYv95w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c4b45d251e7b241eebb74298bcd62fe10e332319 --- /dev/null +++ b/annotations_1/uTOoWlYv95w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 57.3], [61.0, 61.26], [63.0, 63.21], [64.0, 66.29], [68.0, 113.49], [117.0, 150.03]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 19.54], ["fly, housefly", 14.77], ["speech", 11.71]], null, null], "duration": [30.3, 0.26, 0.21, 2.29, 45.49, 33.03]} \ No newline at end of file diff --git a/annotations_1/uTUupV0ZfBk_filtered.json b/annotations_1/uTUupV0ZfBk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..929b27300bb6dba69182464b2d91bfafc9b7040b --- /dev/null +++ b/annotations_1/uTUupV0ZfBk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.71], [11.0, 11.45], [13.0, 14.44], [18.0, 19.58], [22.0, 23.31], [25.0, 26.06], [29.0, 30.5], [32.0, 32.49], [44.0, 45.23], [47.0, 78.22], [81.0, 108.45]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [39.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.82], "audiomae_on_audioset": [[["music", 31.34], ["noise", 8.27], ["fly, housefly", 4.57]], null, null, null, null, null, null, null, null, null, [["noise", 19.58], ["fly, housefly", 17.87], ["mosquito", 11.37]]], "duration": [2.71, 0.45, 1.44, 1.58, 1.31, 1.06, 1.5, 0.49, 1.23, 31.22, 27.45]} \ No newline at end of file diff --git a/annotations_1/uUEpwPiiGco_filtered.json b/annotations_1/uUEpwPiiGco_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/uUEpwPiiGco_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/uU_ftZ6EfX8_filtered.json b/annotations_1/uU_ftZ6EfX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b7b048b84ec67da29314d3e0c876be3003ad838 --- /dev/null +++ b/annotations_1/uU_ftZ6EfX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [4.0, 4.5], [6.0, 6.67], [8.0, 8.61], [17.0, 18.13], [20.0, 19.82], [35.0, 37.25], [39.0, 59.44], [62.0, 77.16], [94.0, 95.18], [103.0, 104.01], [104.0, 106.44], [113.0, 113.56], [114.0, 128.58], [130.0, 130.45], [131.0, 132.44], [135.0, 145.1], [147.0, 148.41], [153.0, 157.92], [161.0, 161.32], [163.0, 162.68], [164.0, 164.13], [167.0, 168.29], [172.0, 176.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 61.87, 63.31, 0.0, 0.0, 62.78, 0.0, 61.27, 0.0, 0.0, 59.51, 0.0, 77.36, 0.0, 0.0, 0.0, 0.0, 84.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 0.5, 0.67, 0.61, 1.13, -0.18, 2.25, 20.44, 15.16, 1.18, 1.01, 2.44, 0.56, 14.58, 0.45, 1.44, 10.1, 1.41, 4.92, 0.32, -0.32, 0.13, 1.29, 4.35]} \ No newline at end of file diff --git a/annotations_1/uWY60oFlfxs_filtered.json b/annotations_1/uWY60oFlfxs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ebf423c7785def98a79a6f05d0fb908557d6a8ff --- /dev/null +++ b/annotations_1/uWY60oFlfxs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.97], [8.0, 10.64], [14.0, 13.93], [16.0, 17.27], [22.0, 22.74], [23.0, 30.62], [38.0, 38.4], [38.0, 38.5], [39.0, 39.36], [40.0, 40.78], [44.0, 45.15], [49.0, 49.55], [60.0, 61.18], [62.0, 62.28], [64.0, 64.72], [69.0, 69.2], [80.0, 80.52], [85.0, 85.46], [92.0, 94.61], [95.0, 95.49], [96.0, 96.31], [97.0, 97.21], [99.0, 99.87], [100.0, 101.58], [104.0, 106.61], [107.0, 108.75], [112.0, 113.05], [114.0, 116.09]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.31, 0.0, 0.0, 0.0, 95.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.14, 0.0, 0.0, 0.0, 0.0, 0.0, 94.37, 0.0, 0.0, 99.84], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 35.23], ["wail, moan", 8.92], ["animal", 7.74]], null, null, null, null, null, null, null, null, null], "duration": [0.97, 2.64, -0.07, 1.27, 0.74, 7.62, 0.4, 0.5, 0.36, 0.78, 1.15, 0.55, 1.18, 0.28, 0.72, 0.2, 0.52, 0.46, 2.61, 0.49, 0.31, 0.21, 0.87, 1.58, 2.61, 1.75, 1.05, 2.09]} \ No newline at end of file diff --git a/annotations_1/uX7CAoxBNOU_filtered.json b/annotations_1/uX7CAoxBNOU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da1cff89f254e3ea0fe41bbdc9ecdea3827cfe03 --- /dev/null +++ b/annotations_1/uX7CAoxBNOU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [4.0, 5.93], [10.0, 10.29], [13.0, 14.18], [17.0, 18.49], [23.0, 23.97], [26.0, 31.45], [33.0, 32.91], [34.0, 35.19], [36.0, 44.04], [45.0, 50.13], [51.0, 51.09], [52.0, 53.76], [55.0, 55.75], [57.0, 60.91], [62.0, 63.07], [65.0, 65.21], [67.0, 67.8], [68.0, 68.62], [70.0, 69.96], [74.0, 75.61], [76.0, 83.4], [84.0, 84.79], [86.0, 86.53], [88.0, 88.55], [91.0, 90.8], [92.0, 93.06], [99.0, 99.57], [102.0, 103.37], [104.0, 104.21], [114.0, 113.76], [116.0, 116.58], [121.0, 121.2], [124.0, 124.09], [126.0, 126.25], [127.0, 128.93], [129.0, 129.93], [132.0, 132.68], [134.0, 141.24], [144.0, 144.05], [145.0, 146.06], [151.0, 151.14], [152.0, 153.28], [157.0, 159.14]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.42, 0.0, 0.0, 33.48, 38.74, 0.0, 0.0, 0.0, 32.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.22, 0.0, 0.0, 0.0, 0.0, 33.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["beatboxing", 45.63], ["speech", 38.85], ["music", 7.33]], [["music", 59.63], ["drum", 7.51], ["musical instrument", 7.12]], null, null, null, [["music", 19.35], ["theremin", 11.56], ["clapping", 10.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 26.9], ["synthesizer", 15.21], ["didgeridoo", 6.83]], null, null, null, null, [["speech", 54.13], ["fart", 29.58], ["boing", 4.22]]], "duration": [0.57, 1.93, 0.29, 1.18, 1.49, 0.97, 5.45, -0.09, 1.19, 8.04, 5.13, 0.09, 1.76, 0.75, 3.91, 1.07, 0.21, 0.8, 0.62, -0.04, 1.61, 7.4, 0.79, 0.53, 0.55, -0.2, 1.06, 0.57, 1.37, 0.21, -0.24, 0.58, 0.2, 0.09, 0.25, 1.93, 0.93, 0.68, 7.24, 0.05, 1.06, 0.14, 1.28, 2.14]} \ No newline at end of file diff --git a/annotations_1/uXG9v1_X8jc_filtered.json b/annotations_1/uXG9v1_X8jc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65a7b1932075fe35f16ff6b6dd7d2465718b2364 --- /dev/null +++ b/annotations_1/uXG9v1_X8jc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.97], [9.0, 10.37], [11.0, 12.04], [14.0, 14.23], [15.0, 16.31], [18.0, 19.63], [23.0, 23.73], [27.0, 29.76], [32.0, 34.48], [38.0, 43.28], [46.0, 49.2], [50.0, 56.22], [57.0, 64.96], [67.0, 66.95], [67.0, 71.41], [72.0, 72.69], [74.0, 76.11], [78.0, 87.56], [88.0, 95.5], [97.0, 98.1], [98.0, 100.08], [105.0, 106.15], [108.0, 109.07], [119.0, 120.65], [122.0, 123.04], [124.0, 126.74], [129.0, 164.94], [166.0, 166.55]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.78, 54.36, 49.68, 57.72, 48.39, 56.63, 0.0, 31.62, 0.0, 98.8, 80.46, 51.82, 0.0, 54.43, 0.0, 0.0, 0.0, 0.0, 43.05, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["fly, housefly", 33.25], ["insect", 25.07], ["speech", 12.63]], null, [["music", 55.51], ["musical instrument", 7.15], ["guitar", 5.45]], null, [["hum", 34.75], ["mains hum", 27.91], ["music", 8.61]], null, null, [["music", 29.91], ["throbbing", 5.45], ["hum", 5.33]], null, null, null, null, null, null, null, null, null, null, [["hum", 14.41], ["fly, housefly", 11.3], ["insect", 10.09]], null, null], "duration": [0.97, 1.37, 1.04, 0.23, 1.31, 1.63, 0.73, 2.76, 2.48, 5.28, 3.2, 6.22, 7.96, -0.05, 4.41, 0.69, 2.11, 9.56, 7.5, 1.1, 2.08, 1.15, 1.07, 1.65, 1.04, 2.74, 35.94, 0.55]} \ No newline at end of file diff --git a/annotations_1/uZpvHkGMn5k_filtered.json b/annotations_1/uZpvHkGMn5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c731ed2545cc0d9e70824ecad087e67408078436 --- /dev/null +++ b/annotations_1/uZpvHkGMn5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[131.0, 141.22], [142.0, 141.78], [145.0, 145.74], [146.0, 151.11], [153.0, 155.21], [161.0, 167.44]], "keep_status": [true, false, false, true, true, true], "silence_prob": [32.02, 0.0, 0.0, 30.15, 30.08, 30.01], "audiomae_on_audioset": [[["speech", 35.7], ["music", 18.71], ["electric shaver, electric razor", 9.21]], null, null, [["music", 60.42], ["didgeridoo", 3.44], ["speech", 3.01]], [["music", 37.53], ["zipper (clothing)", 13.84], ["musical instrument", 7.4]], [["music", 41.89], ["speech", 9.94], ["electric shaver, electric razor", 8.41]]], "duration": [10.22, -0.22, 0.74, 5.11, 2.21, 6.44]} \ No newline at end of file diff --git a/annotations_1/u_jemmhoj0Q_filtered.json b/annotations_1/u_jemmhoj0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db609cdfc0928c455898c87bc4c4d0b45f05a85d --- /dev/null +++ b/annotations_1/u_jemmhoj0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.98], [5.0, 6.62], [16.0, 16.55], [35.0, 36.95], [38.0, 42.04], [44.0, 45.0], [46.0, 60.52], [62.0, 64.49], [65.0, 65.64], [70.0, 70.34], [77.0, 77.08], [82.0, 83.15], [99.0, 99.05], [100.0, 102.29], [103.0, 103.4], [104.0, 104.63], [106.0, 106.25]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.25, 0.0, 31.07, 31.72, 0.0, 0.0, 0.0, 0.0, 0.0, 85.35, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 27.23], ["speech", 16.36], ["buzz", 5.99]], null, [["music", 53.27], ["buzz", 39.28], ["electric shaver, electric razor", 1.75]], [["music", 31.27], ["moo", 7.38], ["speech", 6.53]], null, null, null, null, null, null, null, null, null], "duration": [0.98, 1.62, 0.55, 1.95, 4.04, 1.0, 14.52, 2.49, 0.64, 0.34, 0.08, 1.15, 0.05, 2.29, 0.4, 0.63, 0.25]} \ No newline at end of file diff --git a/annotations_1/u_n1SEwWmYc_filtered.json b/annotations_1/u_n1SEwWmYc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e82657e480aca04f35e90c91d03c55f19fccb77f --- /dev/null +++ b/annotations_1/u_n1SEwWmYc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.05], [6.0, 6.35], [8.0, 8.43], [10.0, 10.66], [17.0, 17.74], [23.0, 22.67], [27.0, 28.26], [41.0, 43.38], [44.0, 45.13], [50.0, 53.74], [54.0, 54.4], [57.0, 59.36], [63.0, 62.83], [64.0, 67.8], [69.0, 69.72], [74.0, 73.7], [76.0, 76.35], [78.0, 80.16], [100.0, 104.33], [105.0, 105.24], [105.0, 106.74], [107.0, 125.19], [130.0, 131.28], [132.0, 141.94], [143.0, 148.93], [149.0, 151.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 60.79, 0.0, 53.65, 0.0, 33.01, 0.0, 0.0, 0.0, 42.33, 29.93, 0.0, 0.0, 29.45, 0.0, 29.23, 55.25, 62.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 49.65], ["music", 14.05], ["effects unit", 5.23]], null, null, null, [["music", 68.02], ["speech", 6.16], ["musical instrument", 2.82]], [["speech", 46.49], ["music", 22.61], ["explosion", 6.33]], null, null, [["speech", 44.55], ["music", 13.82], ["sound effect", 5.52]], null, [["speech", 23.04], ["music", 20.82], ["explosion", 19.01]], null, null], "duration": [1.05, 0.35, 0.43, 0.66, 0.74, -0.33, 1.26, 2.38, 1.13, 3.74, 0.4, 2.36, -0.17, 3.8, 0.72, -0.3, 0.35, 2.16, 4.33, 0.24, 1.74, 18.19, 1.28, 9.94, 5.93, 2.01]} \ No newline at end of file diff --git a/annotations_1/u_z2ttNkL24_filtered.json b/annotations_1/u_z2ttNkL24_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a4b6b996ace2e0e6881f79a2eb6a3eadf5d1b84a --- /dev/null +++ b/annotations_1/u_z2ttNkL24_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.23], [14.0, 14.57], [15.0, 16.11], [21.0, 26.52], [27.0, 31.53], [33.0, 33.67], [38.0, 38.28], [40.0, 40.71], [41.0, 42.94], [46.0, 50.01], [52.0, 52.61], [53.0, 53.89], [54.0, 54.53], [56.0, 57.79], [60.0, 61.13], [63.0, 64.29], [67.0, 68.18], [69.0, 70.19], [71.0, 73.11], [77.0, 77.57], [82.0, 87.51], [92.0, 96.75], [103.0, 103.65], [108.0, 108.06], [108.0, 110.25], [111.0, 112.4], [116.0, 116.19], [118.0, 119.28], [121.0, 122.0], [122.0, 123.23], [128.0, 135.51], [136.0, 143.73]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 48.44, 75.23, 0.0, 0.0, 0.0, 0.0, 49.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.04, 0.0, 54.7, 47.5, 0.0, 0.0, 49.87, 0.0, 0.0, 0.0, 0.0, 0.0, 59.42, 82.43], "audiomae_on_audioset": [null, null, null, [["mains hum", 54.5], ["hum", 23.21], ["door", 5.72]], null, null, null, null, null, [["mains hum", 28.24], ["speech", 20.75], ["hum", 19.72]], null, null, null, null, null, null, null, null, null, null, null, [["music", 64.79], ["effects unit", 4.1], ["musical instrument", 3.4]], null, null, [["tuning fork", 33.13], ["singing bowl", 17.31], ["speech", 14.56]], null, null, null, null, null, null, null], "duration": [0.23, 0.57, 1.11, 5.52, 4.53, 0.67, 0.28, 0.71, 1.94, 4.01, 0.61, 0.89, 0.53, 1.79, 1.13, 1.29, 1.18, 1.19, 2.11, 0.57, 5.51, 4.75, 0.65, 0.06, 2.25, 1.4, 0.19, 1.28, 1.0, 1.23, 7.51, 7.73]} \ No newline at end of file diff --git a/annotations_1/uabEMv5Sr68_filtered.json b/annotations_1/uabEMv5Sr68_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b97298edd6aa3667e42350a56cf0f004d78edf7 --- /dev/null +++ b/annotations_1/uabEMv5Sr68_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.83], [16.0, 18.17], [20.0, 21.69], [22.0, 24.07], [25.0, 26.28], [27.0, 27.31], [29.0, 29.3], [30.0, 30.16], [34.0, 34.37], [41.0, 45.05], [45.0, 51.51], [53.0, 53.64], [55.0, 55.66], [58.0, 59.61], [60.0, 60.44], [61.0, 61.3], [62.0, 62.85], [63.0, 63.76], [64.0, 64.56], [65.0, 67.64], [68.0, 68.67], [71.0, 71.49], [72.0, 72.1], [73.0, 74.17], [77.0, 80.13], [81.0, 82.66], [84.0, 85.08], [87.0, 89.73], [91.0, 91.2], [92.0, 92.65], [93.0, 94.74], [95.0, 95.66], [97.0, 97.68], [98.0, 99.96], [101.0, 105.46], [106.0, 107.87], [109.0, 114.83], [115.0, 116.72], [118.0, 120.06], [122.0, 122.59], [124.0, 124.58], [128.0, 129.12], [130.0, 131.43], [133.0, 134.82], [137.0, 138.33], [140.0, 143.36], [144.0, 145.93], [146.0, 147.93], [149.0, 150.08], [151.0, 151.85], [153.0, 155.78], [157.0, 164.19], [165.0, 166.36], [167.0, 169.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.76, 0.0, 99.21, 0.0, 0.0, 0.0, 0.0, 0.0, 78.38, 64.41, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.11, 0.0, 99.87, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.65, 67.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.83, 2.17, 1.69, 2.07, 1.28, 0.31, 0.3, 0.16, 0.37, 4.05, 6.51, 0.64, 0.66, 1.61, 0.44, 0.3, 0.85, 0.76, 0.56, 2.64, 0.67, 0.49, 0.1, 1.17, 3.13, 1.66, 1.08, 2.73, 0.2, 0.65, 1.74, 0.66, 0.68, 1.96, 4.46, 1.87, 5.83, 1.72, 2.06, 0.59, 0.58, 1.12, 1.43, 1.82, 1.33, 3.36, 1.93, 1.93, 1.08, 0.85, 2.78, 7.19, 1.36, 2.15]} \ No newline at end of file diff --git a/annotations_1/ucYwV7EWIRU_filtered.json b/annotations_1/ucYwV7EWIRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce796ac3a49628f773ddbbec27b1ae602dc75efb --- /dev/null +++ b/annotations_1/ucYwV7EWIRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 22.84], [25.0, 27.5], [31.0, 60.51], [61.0, 76.0], [80.0, 81.57]], "keep_status": [false, true, false, true, false], "silence_prob": [0.0, 48.39, 30.22, 30.74, 0.0], "audiomae_on_audioset": [null, [["music", 35.41], ["fly, housefly", 8.54], ["musical instrument", 7.76]], [["music", 34.81], ["speech", 33.92], ["explosion", 4.18]], [["music", 34.44], ["speech", 10.23], ["electric shaver, electric razor", 6.4]], null], "duration": [-0.16, 2.5, 29.51, 15.0, 1.57]} \ No newline at end of file diff --git a/annotations_1/uciRaLsFmfM_filtered.json b/annotations_1/uciRaLsFmfM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddee2025c8673fca6ebf31df98d9973dd0077b6e --- /dev/null +++ b/annotations_1/uciRaLsFmfM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.05], [32.0, 35.4], [36.0, 39.99], [40.0, 43.43], [44.0, 46.18], [47.0, 60.12], [60.0, 60.49], [61.0, 61.96], [66.0, 66.88], [74.0, 75.19], [78.0, 78.58], [87.0, 88.26], [96.0, 96.33], [112.0, 117.42], [118.0, 119.2], [124.0, 130.84], [133.0, 134.27], [135.0, 135.82]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 71.43, 67.13, 63.96, 84.07, 35.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.45, 0.0, 28.22, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 56.53], ["synthesizer", 4.72], ["hum", 4.55]], null, null, null, null, null, null, null, [["music", 57.75], ["hum", 13.8], ["mains hum", 8.72]], null, [["music", 19.62], ["hum", 17.25], ["throbbing", 11.9]], null, null], "duration": [0.05, 3.4, 3.99, 3.43, 2.18, 13.12, 0.49, 0.96, 0.88, 1.19, 0.58, 1.26, 0.33, 5.42, 1.2, 6.84, 1.27, 0.82]} \ No newline at end of file diff --git a/annotations_1/uckdiNJ10LE_filtered.json b/annotations_1/uckdiNJ10LE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/uckdiNJ10LE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/udwKI7oFT6Y_filtered.json b/annotations_1/udwKI7oFT6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..06798a97146d5a58c619795d113dfecb03d7f13b --- /dev/null +++ b/annotations_1/udwKI7oFT6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.94], [11.0, 23.18], [24.0, 24.6], [28.0, 29.83], [32.0, 31.89], [32.0, 36.64], [38.0, 77.03], [79.0, 102.24], [107.0, 111.86]], "keep_status": [false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 35.51, 0.0, 0.0, 0.0, 36.0, 0.0, 31.37, 37.35], "audiomae_on_audioset": [null, [["music", 58.57], ["emergency vehicle", 8.67], ["siren", 6.72]], null, null, null, [["speech", 21.41], ["music", 18.69], ["siren", 17.33]], null, [["speech", 40.82], ["music", 12.92], ["gunshot, gunfire", 5.33]], [["speech", 39.59], ["music", 33.91], ["hum", 4.76]]], "duration": [1.94, 12.18, 0.6, 1.83, -0.11, 4.64, 39.03, 23.24, 4.86]} \ No newline at end of file diff --git a/annotations_1/ueMuCbXkDhw_filtered.json b/annotations_1/ueMuCbXkDhw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c63f85aa61055358fef3594b1a2d67b0e0a09ea6 --- /dev/null +++ b/annotations_1/ueMuCbXkDhw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.49], [22.0, 22.32], [26.0, 26.45], [32.0, 45.59], [51.0, 53.0], [58.0, 62.92], [67.0, 89.56]], "keep_status": [false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 31.5, 32.59, 33.58, 45.52], "audiomae_on_audioset": [null, null, null, [["music", 52.83], ["dog", 8.88], ["animal", 7.57]], [["music", 40.12], ["grunt", 11.04], ["musical instrument", 7.68]], [["music", 56.78], ["musical instrument", 7.06], ["synthesizer", 5.9]], [["hum", 34.28], ["music", 26.08], ["throbbing", 11.14]]], "duration": [0.49, 0.32, 0.45, 13.59, 2.0, 4.92, 22.56]} \ No newline at end of file diff --git a/annotations_1/ufllQr0ClXg_filtered.json b/annotations_1/ufllQr0ClXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e85e3b74335ee3d5e95c754db5834f1e1d23d7a7 --- /dev/null +++ b/annotations_1/ufllQr0ClXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 36.02], [40.0, 51.36], [53.0, 54.84], [55.0, 56.12], [59.0, 59.8], [62.0, 62.82], [66.0, 73.21], [73.0, 73.97], [75.0, 84.74], [90.0, 93.46], [95.0, 99.91], [103.0, 103.2], [106.0, 106.44], [115.0, 116.6], [118.0, 127.14], [135.0, 138.81], [139.0, 140.8], [143.0, 143.45], [145.0, 146.47], [148.0, 150.13], [153.0, 159.68], [161.0, 163.49], [169.0, 169.6], [173.0, 174.33], [176.0, 179.85], [186.0, 189.63], [190.0, 191.76], [198.0, 198.61], [203.0, 203.89], [205.0, 205.82], [208.0, 208.5], [209.0, 210.22]], "keep_status": [true, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [42.93, 40.33, 0.0, 0.0, 0.0, 0.0, 73.67, 0.0, 41.7, 49.54, 43.85, 0.0, 0.0, 0.0, 80.29, 51.71, 0.0, 0.0, 0.0, 55.53, 53.28, 76.86, 0.0, 0.0, 52.98, 45.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.18], ["synthesizer", 11.49], ["hum", 11.41]], [["fart", 43.07], ["music", 32.18], ["guitar", 3.34]], null, null, null, null, null, null, [["music", 52.21], ["speech", 12.27], ["cattle, bovinae", 4.77]], [["cattle, bovinae", 28.9], ["moo", 21.52], ["livestock, farm animals, working animals", 13.48]], [["music", 28.98], ["speech", 21.65], ["fly, housefly", 5.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.06], ["musical instrument", 5.4], ["synthesizer", 5.28]], null, null, null, null, null, null], "duration": [19.02, 11.36, 1.84, 1.12, 0.8, 0.82, 7.21, 0.97, 9.74, 3.46, 4.91, 0.2, 0.44, 1.6, 9.14, 3.81, 1.8, 0.45, 1.47, 2.13, 6.68, 2.49, 0.6, 1.33, 3.85, 3.63, 1.76, 0.61, 0.89, 0.82, 0.5, 1.22]} \ No newline at end of file diff --git a/annotations_1/uhBhYnRrOg4_filtered.json b/annotations_1/uhBhYnRrOg4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..679d4a0a7e0a37e62f2cac2e8d25a8e6b861166c --- /dev/null +++ b/annotations_1/uhBhYnRrOg4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.07], [17.0, 17.37], [31.0, 39.45], [48.0, 49.84], [51.0, 58.82], [63.0, 70.24], [77.0, 79.89], [88.0, 89.02], [91.0, 92.89], [95.0, 96.03], [98.0, 98.59], [99.0, 120.85]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 0.0, 35.58, 0.0, 33.05, 35.15, 36.32, 0.0, 0.0, 0.0, 0.0, 32.0], "audiomae_on_audioset": [null, null, [["music", 77.15], ["didgeridoo", 5.04], ["timpani", 1.91]], null, [["music", 47.0], ["synthesizer", 9.34], ["noise", 4.29]], [["cattle, bovinae", 44.84], ["livestock, farm animals, working animals", 29.24], ["moo", 25.88]], [["hum", 24.62], ["throbbing", 19.54], ["music", 8.49]], null, null, null, null, [["speech", 32.85], ["music", 23.47], ["hum", 12.05]]], "duration": [1.07, 0.37, 8.45, 1.84, 7.82, 7.24, 2.89, 1.02, 1.89, 1.03, 0.59, 21.85]} \ No newline at end of file diff --git a/annotations_1/uhDhzHrffBQ_filtered.json b/annotations_1/uhDhzHrffBQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f571c35ed2df36c4af44b9d71761eafdb038ea2 --- /dev/null +++ b/annotations_1/uhDhzHrffBQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.76], [22.0, 26.55], [33.0, 37.57], [42.0, 43.07], [46.0, 46.2], [59.0, 60.91], [62.0, 63.22], [67.0, 71.51], [72.0, 72.79], [75.0, 76.62], [77.0, 77.79], [81.0, 84.57], [85.0, 112.43], [119.0, 145.54], [150.0, 150.63], [151.0, 152.39], [153.0, 154.03], [155.0, 156.09], [165.0, 166.31], [169.0, 169.92], [171.0, 171.91], [173.0, 173.53], [188.0, 188.79], [190.0, 190.46], [193.0, 194.53], [201.0, 202.0], [204.0, 204.26], [205.0, 205.38], [206.0, 206.95], [208.0, 208.6], [211.0, 211.3], [214.0, 214.76], [216.0, 216.21], [218.0, 218.19], [222.0, 222.37], [223.0, 223.67], [224.0, 228.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 29.48, 31.47, 0.0, 0.0, 0.0, 0.0, 36.45, 0.0, 0.0, 0.0, 38.41, 30.43, 29.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.02], "audiomae_on_audioset": [null, [["whip", 52.98], ["speech", 16.73], ["meow", 2.89]], [["speech", 48.8], ["boing", 28.62], ["cacophony", 2.74]], null, null, null, null, [["music", 61.85], ["speech", 5.71], ["foghorn", 3.57]], null, null, null, [["music", 51.98], ["hum", 7.82], ["throbbing", 7.23]], [["music", 78.2], ["speech", 4.55], ["drum machine", 3.46]], [["music", 30.02], ["speech", 16.33], ["smash, crash", 7.56]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.3], ["whale vocalization", 10.85], ["animal", 8.31]]], "duration": [0.76, 4.55, 4.57, 1.07, 0.2, 1.91, 1.22, 4.51, 0.79, 1.62, 0.79, 3.57, 27.43, 26.54, 0.63, 1.39, 1.03, 1.09, 1.31, 0.92, 0.91, 0.53, 0.79, 0.46, 1.53, 1.0, 0.26, 0.38, 0.95, 0.6, 0.3, 0.76, 0.21, 0.19, 0.37, 0.67, 4.53]} \ No newline at end of file diff --git a/annotations_1/uhkfz535fR8_filtered.json b/annotations_1/uhkfz535fR8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cccd5f7956540169ffb16c697acffa59d9b9f408 --- /dev/null +++ b/annotations_1/uhkfz535fR8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.57], [4.0, 4.78], [6.0, 16.56], [18.0, 20.44], [23.0, 23.84], [26.0, 72.67], [75.0, 75.36], [78.0, 79.42], [81.0, 81.11], [82.0, 83.03], [84.0, 83.86], [87.0, 87.37], [89.0, 91.37], [92.0, 109.48], [111.0, 110.74], [112.0, 114.08], [115.0, 115.25], [116.0, 130.54], [136.0, 145.18], [147.0, 147.36], [151.0, 180.54]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 35.71, 40.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.14, 34.22, 0.0, 55.96, 0.0, 33.35, 32.42, 0.0, 33.52], "audiomae_on_audioset": [null, null, [["music", 20.23], ["hum", 12.72], ["vehicle", 8.52]], [["speech", 66.03], ["vehicle", 4.75], ["hum", 4.23]], null, null, null, null, null, null, null, null, [["music", 31.23], ["buzz", 13.23], ["hum", 6.63]], [["throbbing", 23.25], ["music", 19.22], ["hum", 17.84]], null, null, null, [["speech", 45.28], ["music", 31.89], ["didgeridoo", 14.71]], [["music", 49.53], ["throbbing", 7.92], ["drum and bass", 4.51]], null, [["music", 20.37], ["throbbing", 13.07], ["speech", 12.91]]], "duration": [1.57, 0.78, 10.56, 2.44, 0.84, 46.67, 0.36, 1.42, 0.11, 1.03, -0.14, 0.37, 2.37, 17.48, -0.26, 2.08, 0.25, 14.54, 9.18, 0.36, 29.54]} \ No newline at end of file diff --git a/annotations_1/uifDWAJ6rBY_filtered.json b/annotations_1/uifDWAJ6rBY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/uifDWAJ6rBY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/uioT_3dqzXc_filtered.json b/annotations_1/uioT_3dqzXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b100f32339e89a162d98af56091b99747d93d7d7 --- /dev/null +++ b/annotations_1/uioT_3dqzXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.26], [12.0, 31.35], [31.0, 33.72], [35.0, 60.02], [63.0, 89.88], [92.0, 104.67], [107.0, 109.05], [109.0, 109.63]], "keep_status": [true, false, true, true, true, false, true, false], "silence_prob": [30.5, 29.77, 29.73, 30.44, 29.92, 30.26, 30.15, 0.0], "audiomae_on_audioset": [[["music", 35.28], ["mains hum", 17.17], ["musical instrument", 10.04]], [["speech", 79.54], ["vehicle", 7.05], ["music", 3.18]], [["speech", 27.78], ["music", 10.51], ["didgeridoo", 5.97]], [["explosion", 23.35], ["music", 20.66], ["burst, pop", 8.47]], [["music", 47.06], ["hum", 12.6], ["throbbing", 6.13]], [["hum", 46.63], ["mains hum", 39.95], ["throbbing", 5.11]], [["music", 41.82], ["synthesizer", 7.8], ["musical instrument", 7.72]], null], "duration": [2.26, 19.35, 2.72, 25.02, 26.88, 12.67, 2.05, 0.63]} \ No newline at end of file diff --git a/annotations_1/ujA70PK6E7U_filtered.json b/annotations_1/ujA70PK6E7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88ea73b7346adc368fc7f60ff8c6b76933616df1 --- /dev/null +++ b/annotations_1/ujA70PK6E7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 34.38], [36.0, 45.94], [47.0, 53.16], [57.0, 58.9], [64.0, 123.08], [126.0, 152.91], [156.0, 156.47]], "keep_status": [false, true, true, false, false, true, false], "silence_prob": [31.18, 30.85, 32.23, 0.0, 0.0, 30.0, 0.0], "audiomae_on_audioset": [[["speech", 67.57], ["whale vocalization", 19.21], ["music", 7.58]], [["whale vocalization", 30.79], ["vehicle", 11.63], ["music", 11.51]], [["whale vocalization", 23.94], ["music", 20.2], ["speech", 14.29]], null, null, [["speech", 51.95], ["music", 11.4], ["hum", 3.84]], null], "duration": [29.38, 9.94, 6.16, 1.9, 59.08, 26.91, 0.47]} \ No newline at end of file diff --git a/annotations_1/ujFOaYo5QME_filtered.json b/annotations_1/ujFOaYo5QME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae66a4e076bd52964c073a6ec64a4d579f3d0a76 --- /dev/null +++ b/annotations_1/ujFOaYo5QME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.51], [11.0, 12.39], [20.0, 20.58], [23.0, 23.9], [24.0, 24.02], [29.0, 29.54], [37.0, 37.64], [40.0, 40.36], [48.0, 48.88], [59.0, 59.75], [69.0, 69.16], [71.0, 71.9], [74.0, 74.46], [77.0, 77.67], [80.0, 80.43], [89.0, 89.23], [93.0, 93.77], [98.0, 98.41], [102.0, 102.47], [106.0, 106.05], [109.0, 109.05], [110.0, 110.52], [124.0, 124.56], [126.0, 126.69], [130.0, 130.47], [133.0, 134.23], [145.0, 145.35], [153.0, 153.54], [159.0, 159.7], [165.0, 165.4], [167.0, 167.63], [169.0, 168.89], [171.0, 171.17], [173.0, 173.72], [181.0, 181.28], [185.0, 185.95], [189.0, 189.67], [191.0, 191.81], [195.0, 195.1], [196.0, 196.82], [201.0, 202.15], [203.0, 202.88], [204.0, 204.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 1.39, 0.58, 0.9, 0.02, 0.54, 0.64, 0.36, 0.88, 0.75, 0.16, 0.9, 0.46, 0.67, 0.43, 0.23, 0.77, 0.41, 0.47, 0.05, 0.05, 0.52, 0.56, 0.69, 0.47, 1.23, 0.35, 0.54, 0.7, 0.4, 0.63, -0.11, 0.17, 0.72, 0.28, 0.95, 0.67, 0.81, 0.1, 0.82, 1.15, -0.12, 0.23]} \ No newline at end of file diff --git a/annotations_1/ujgbo-_khSM_filtered.json b/annotations_1/ujgbo-_khSM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e585bc48ac1a08ca6f2f02ee3cc046e4cbff20c4 --- /dev/null +++ b/annotations_1/ujgbo-_khSM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.89], [12.0, 13.05], [14.0, 16.46], [27.0, 27.28], [31.0, 31.65], [32.0, 37.61], [43.0, 44.15], [46.0, 45.81], [49.0, 49.94], [56.0, 56.15], [76.0, 76.54], [82.0, 82.05], [88.0, 88.7], [91.0, 91.0], [92.0, 92.79], [97.0, 97.24], [100.0, 103.03], [104.0, 105.44], [107.0, 113.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [63.53, 0.0, 90.95, 0.0, 0.0, 54.17, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 38.06], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 52.93], ["fart", 38.79], ["inside, small room", 2.14]]], "duration": [9.89, 1.05, 2.46, 0.28, 0.65, 5.61, 1.15, -0.19, 0.94, 0.15, 0.54, 0.05, 0.7, 0.0, 0.79, 0.24, 3.03, 1.44, 6.98]} \ No newline at end of file diff --git a/annotations_1/ukNsgDQKqfY_filtered.json b/annotations_1/ukNsgDQKqfY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..619b0d6e206fe10fe2269b316bcb25f671a62327 --- /dev/null +++ b/annotations_1/ukNsgDQKqfY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 44.74], [47.0, 52.22], [53.0, 90.26], [91.0, 91.96], [93.0, 94.07]], "keep_status": [true, false, false, false, false], "silence_prob": [32.13, 41.58, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 38.72], ["quack", 12.22], ["trombone", 3.73]], [["music", 59.62], ["didgeridoo", 11.51], ["musical instrument", 4.55]], null, null, null], "duration": [14.74, 5.22, 37.26, 0.96, 1.07]} \ No newline at end of file diff --git a/annotations_1/ukOx2hZvXkE_filtered.json b/annotations_1/ukOx2hZvXkE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5faf15604807958f07b43155c70eb357f8efa8eb --- /dev/null +++ b/annotations_1/ukOx2hZvXkE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.28], [6.0, 8.5], [11.0, 11.03], [14.0, 14.44], [19.0, 19.26], [21.0, 21.2], [28.0, 29.71], [33.0, 34.89], [36.0, 36.8], [39.0, 42.5], [43.0, 47.43], [48.0, 54.21], [56.0, 56.62], [58.0, 62.04], [67.0, 67.8], [70.0, 72.35], [77.0, 77.72], [79.0, 79.52], [82.0, 82.9], [85.0, 86.37], [88.0, 89.09], [91.0, 91.32], [93.0, 93.97], [96.0, 96.87], [99.0, 103.06], [104.0, 106.37], [110.0, 110.59], [115.0, 116.55], [117.0, 118.39], [119.0, 121.86], [122.0, 123.31], [126.0, 127.58], [129.0, 128.9], [131.0, 131.55], [132.0, 133.27], [136.0, 135.75], [138.0, 137.76], [141.0, 141.0], [142.0, 142.3], [143.0, 145.83], [147.0, 147.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.8, 100.0, 100.0, 0.0, 87.19, 0.0, 95.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.68, 99.59, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.28, 2.5, 0.03, 0.44, 0.26, 0.2, 1.71, 1.89, 0.8, 3.5, 4.43, 6.21, 0.62, 4.04, 0.8, 2.35, 0.72, 0.52, 0.9, 1.37, 1.09, 0.32, 0.97, 0.87, 4.06, 2.37, 0.59, 1.55, 1.39, 2.86, 1.31, 1.58, -0.1, 0.55, 1.27, -0.25, -0.24, 0.0, 0.3, 2.83, 0.78]} \ No newline at end of file diff --git a/annotations_1/ukl9qBvRXfc_filtered.json b/annotations_1/ukl9qBvRXfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bbd14d2ddec900c794c374b7e753d8d97d99caf5 --- /dev/null +++ b/annotations_1/ukl9qBvRXfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.33], [4.0, 4.09], [8.0, 9.04], [20.0, 27.06], [28.0, 28.14], [33.0, 33.35], [45.0, 46.06], [50.0, 53.94], [55.0, 54.94], [59.0, 61.15], [62.0, 62.01], [102.0, 102.24], [112.0, 112.92], [118.0, 119.48], [121.0, 121.51], [122.0, 123.4], [128.0, 128.71], [130.0, 131.95], [137.0, 140.68], [142.0, 145.93], [148.0, 149.3], [150.0, 150.3], [155.0, 159.92], [161.0, 161.92], [162.0, 167.68]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.32, 0.0, 0.0, 0.0, 42.93, 0.0, 36.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.54, 34.4, 0.0, 0.0, 41.87, 0.0, 45.27], "audiomae_on_audioset": [null, null, null, [["music", 47.57], ["speech", 28.52], ["electronic music", 3.06]], null, null, null, [["speech", 42.82], ["music", 22.25], ["wood", 2.14]], null, [["music", 54.42], ["synthesizer", 3.23], ["hum", 1.81]], null, null, null, null, null, null, null, null, null, [["music", 46.51], ["speech", 32.22], ["musical instrument", 2.09]], null, null, [["moo", 25.69], ["music", 19.6], ["cattle, bovinae", 18.95]], null, [["music", 50.11], ["ambient music", 29.17], ["electronic music", 4.41]]], "duration": [0.33, 0.09, 1.04, 7.06, 0.14, 0.35, 1.06, 3.94, -0.06, 2.15, 0.01, 0.24, 0.92, 1.48, 0.51, 1.4, 0.71, 1.95, 3.68, 3.93, 1.3, 0.3, 4.92, 0.92, 5.68]} \ No newline at end of file diff --git a/annotations_1/ukzIFp4Kj90_filtered.json b/annotations_1/ukzIFp4Kj90_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b05156457522f86101d3237fac1e6bf7a17b7da1 --- /dev/null +++ b/annotations_1/ukzIFp4Kj90_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 16.33], [17.0, 18.76], [26.0, 26.77], [28.0, 29.96], [30.0, 30.84], [32.0, 33.03], [36.0, 39.55], [41.0, 42.6], [44.0, 46.28], [48.0, 48.46], [50.0, 50.4], [52.0, 54.13], [57.0, 58.73], [60.0, 60.22], [62.0, 66.73], [68.0, 69.74], [70.0, 70.9], [72.0, 72.86], [74.0, 76.11], [80.0, 80.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.71, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 98.93, 0.0, 0.0, 59.42, 0.0, 0.0, 0.0, 100.0, 0.0], "audiomae_on_audioset": [[["speech", 80.63], ["bouncing", 6.37], ["fart", 1.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [12.33, 1.76, 0.77, 1.96, 0.84, 1.03, 3.55, 1.6, 2.28, 0.46, 0.4, 2.13, 1.73, 0.22, 4.73, 1.74, 0.9, 0.86, 2.11, 0.0]} \ No newline at end of file diff --git a/annotations_1/ulFxMs35-P0_filtered.json b/annotations_1/ulFxMs35-P0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2d4177677fbb7e4d70a86ef725aafcfea5c1eb3 --- /dev/null +++ b/annotations_1/ulFxMs35-P0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.92], [30.0, 30.74], [35.0, 47.9], [50.0, 49.64], [50.0, 53.4], [55.0, 80.13], [81.0, 81.45], [82.0, 92.21]], "keep_status": [false, false, false, false, true, true, false, true], "silence_prob": [0.0, 0.0, 30.02, 0.0, 31.16, 32.09, 0.0, 29.36], "audiomae_on_audioset": [null, null, [["music", 49.51], ["smash, crash", 12.59], ["thump, thud", 11.66]], null, [["music", 38.72], ["hum", 18.29], ["throbbing", 10.35]], [["speech", 21.97], ["hum", 18.1], ["mains hum", 16.36]], null, [["speech", 27.4], ["music", 26.17], ["hum", 11.78]]], "duration": [0.92, 0.74, 12.9, -0.36, 3.4, 25.13, 0.45, 10.21]} \ No newline at end of file diff --git a/annotations_1/ulJXiB5i_q0_filtered.json b/annotations_1/ulJXiB5i_q0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07695e22074e15a3fffb6b164d15fe0c64cad8a0 --- /dev/null +++ b/annotations_1/ulJXiB5i_q0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.56], [7.0, 10.18], [12.0, 14.71], [18.0, 18.89], [21.0, 23.52], [26.0, 28.41], [30.0, 37.23], [41.0, 56.19], [61.0, 63.69], [68.0, 68.74], [70.0, 71.2], [73.0, 73.53], [76.0, 79.37], [83.0, 86.98], [90.0, 94.2], [96.0, 96.74], [97.0, 99.27], [100.0, 102.71], [107.0, 107.0], [107.0, 107.13], [107.0, 108.33], [114.0, 118.44], [124.0, 126.4], [130.0, 134.03], [135.0, 137.52], [139.0, 141.98], [146.0, 159.04], [164.0, 165.97], [170.0, 172.64], [184.0, 188.43], [192.0, 197.19], [201.0, 202.69], [214.0, 216.31], [232.0, 239.97], [241.0, 242.91], [243.0, 244.76], [246.0, 247.18], [248.0, 259.31], [261.0, 265.06], [266.0, 273.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, true, false, false, false, false, false, false, true, false, false], "silence_prob": [100.0, 100.0, 100.0, 0.0, 99.98, 95.23, 100.0, 79.59, 60.6, 0.0, 0.0, 0.0, 38.55, 82.25, 40.54, 0.0, 67.13, 89.9, 0.0, 0.0, 0.0, 64.18, 73.67, 30.43, 48.56, 89.36, 30.33, 0.0, 39.7, 32.7, 34.51, 0.0, 32.34, 36.52, 0.0, 0.0, 0.0, 43.08, 50.97, 99.71], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.65], ["humming", 4.71], ["lullaby", 4.02]], null, [["music", 57.45], ["theremin", 5.99], ["humming", 4.69]], null, null, null, null, null, null, null, null, [["music", 35.6], ["musical instrument", 4.76], ["effects unit", 4.58]], [["fly, housefly", 24.55], ["insect", 15.67], ["music", 13.03]], null, [["music", 51.64], ["theremin", 34.98], ["synthesizer", 1.9]], null, [["music", 72.55], ["musical instrument", 4.35], ["cello", 1.92]], [["music", 38.5], ["brass instrument", 16.58], ["trombone", 12.36]], [["music", 44.58], ["cello", 9.06], ["theremin", 8.57]], null, [["music", 53.27], ["didgeridoo", 17.73], ["theremin", 14.61]], [["theremin", 65.51], ["music", 26.52], ["singing", 0.65]], null, null, null, [["music", 35.08], ["effects unit", 10.06], ["singing", 6.43]], null, null], "duration": [2.56, 3.18, 2.71, 0.89, 2.52, 2.41, 7.23, 15.19, 2.69, 0.74, 1.2, 0.53, 3.37, 3.98, 4.2, 0.74, 2.27, 2.71, 0.0, 0.13, 1.33, 4.44, 2.4, 4.03, 2.52, 2.98, 13.04, 1.97, 2.64, 4.43, 5.19, 1.69, 2.31, 7.97, 1.91, 1.76, 1.18, 11.31, 4.06, 7.67]} \ No newline at end of file diff --git a/annotations_1/umKFAbLoUxQ_filtered.json b/annotations_1/umKFAbLoUxQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe4b9f97b37521ae8f21162a57e5d931a8e8fb0a --- /dev/null +++ b/annotations_1/umKFAbLoUxQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 19.43], [25.0, 30.37], [32.0, 33.89], [34.0, 33.94], [34.0, 34.16], [35.0, 35.9], [37.0, 38.2], [41.0, 41.22], [44.0, 51.06], [52.0, 55.0], [57.0, 60.96], [64.0, 65.5], [67.0, 68.18], [69.0, 72.01], [73.0, 76.99], [78.0, 78.6], [80.0, 81.87], [84.0, 84.77], [87.0, 88.05], [89.0, 89.85], [90.0, 90.46], [92.0, 95.39], [97.0, 98.85], [101.0, 101.56]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.6, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.63, 42.02, 63.21, 0.0, 0.0, 89.01, 61.67, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.46, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 44.7], ["didgeridoo", 24.26], ["theremin", 3.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.43, 5.37, 1.89, -0.06, 0.16, 0.9, 1.2, 0.22, 7.06, 3.0, 3.96, 1.5, 1.18, 3.01, 3.99, 0.6, 1.87, 0.77, 1.05, 0.85, 0.46, 3.39, 1.85, 0.56]} \ No newline at end of file diff --git a/annotations_1/umcyzRBeJtE_filtered.json b/annotations_1/umcyzRBeJtE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7ba94562f2d505c8cda466ca6715be9badd5618 --- /dev/null +++ b/annotations_1/umcyzRBeJtE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 15.53], [20.0, 21.03], [38.0, 41.34], [43.0, 43.21], [45.0, 47.36], [49.0, 48.88], [63.0, 65.47], [71.0, 71.9], [73.0, 73.41], [76.0, 78.19], [81.0, 81.5], [86.0, 88.94], [90.0, 91.62], [92.0, 92.67], [96.0, 96.23], [98.0, 99.47], [101.0, 101.09], [103.0, 103.5], [106.0, 106.37], [107.0, 107.82], [108.0, 108.73], [113.0, 113.1], [114.0, 114.99], [116.0, 116.28], [119.0, 119.64], [123.0, 123.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.98, 0.0, 51.55, 0.0, 83.7, 0.0, 0.0, 77.53, 0.0, 46.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 63.88], ["timpani", 3.54], ["inside, small room", 3.07]], null, null, null, null, null, null, null, null, [["music", 23.0], ["hum", 14.14], ["gong", 11.38]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 1.03, 3.34, 0.21, 2.36, -0.12, 2.47, 0.9, 0.41, 2.19, 0.5, 2.94, 1.62, 0.67, 0.23, 1.47, 0.09, 0.5, 0.37, 0.82, 0.73, 0.1, 0.99, 0.28, 0.64, 0.16]} \ No newline at end of file diff --git a/annotations_1/unWr90pLIvc_filtered.json b/annotations_1/unWr90pLIvc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8e67f0313b1866e6a2c403b6d444582fa1884db --- /dev/null +++ b/annotations_1/unWr90pLIvc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 33.94], [35.0, 37.3], [38.0, 41.27], [43.0, 44.86], [47.0, 49.6], [50.0, 63.88], [70.0, 85.99], [87.0, 90.0], [91.0, 93.21], [97.0, 99.22], [101.0, 102.44], [110.0, 112.65], [114.0, 116.07], [130.0, 136.61], [137.0, 137.96], [140.0, 144.49], [156.0, 156.39], [159.0, 160.05], [171.0, 174.6], [187.0, 188.0], [188.0, 188.69], [189.0, 195.57], [197.0, 199.77], [200.0, 203.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 100.0, 84.43, 0.0, 78.21, 66.15, 71.0, 67.25, 69.2, 77.7, 0.0, 86.27, 73.36, 76.7, 0.0, 78.72, 0.0, 0.0, 61.87, 0.0, 0.0, 81.71, 68.54, 53.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.94, 2.3, 3.27, 1.86, 2.6, 13.88, 15.99, 3.0, 2.21, 2.22, 1.44, 2.65, 2.07, 6.61, 0.96, 4.49, 0.39, 1.05, 3.6, 1.0, 0.69, 6.57, 2.77, 3.13]} \ No newline at end of file diff --git a/annotations_1/up1wTd5shfc_filtered.json b/annotations_1/up1wTd5shfc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd562b5fd2aab93ddd399bb588ed8bffa0931ece --- /dev/null +++ b/annotations_1/up1wTd5shfc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 9.93], [11.0, 41.47], [42.0, 42.67], [44.0, 48.46], [50.0, 51.17], [52.0, 53.57], [55.0, 57.23], [63.0, 64.67], [75.0, 74.85], [79.0, 80.54], [89.0, 91.29], [94.0, 109.17], [112.0, 116.31], [117.0, 126.98], [128.0, 130.23], [132.0, 132.54], [135.0, 136.86], [138.0, 138.38], [141.0, 158.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [54.5, 0.0, 0.0, 97.54, 0.0, 0.0, 98.44, 0.0, 0.0, 0.0, 99.16, 47.2, 57.17, 50.86, 53.78, 0.0, 0.0, 0.0, 34.24], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 53.47], ["musical instrument", 4.15], ["didgeridoo", 3.98]], null, null, null, null, null, null, [["music", 44.66], ["throbbing", 8.24], ["synthesizer", 6.25]]], "duration": [7.93, 30.47, 0.67, 4.46, 1.17, 1.57, 2.23, 1.67, -0.15, 1.54, 2.29, 15.17, 4.31, 9.98, 2.23, 0.54, 1.86, 0.38, 17.21]} \ No newline at end of file diff --git a/annotations_1/upPFFVaVSY4_filtered.json b/annotations_1/upPFFVaVSY4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48dd8a864caaa34876d7140a3352d04617503bf9 --- /dev/null +++ b/annotations_1/upPFFVaVSY4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 20.21], [29.0, 29.32], [31.0, 33.4], [36.0, 37.17], [45.0, 48.41], [52.0, 59.1], [63.0, 64.57], [66.0, 67.68], [68.0, 69.47], [74.0, 75.03], [82.0, 86.32], [90.0, 91.05]], "keep_status": [true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [38.52, 0.0, 40.7, 0.0, 52.1, 93.45, 0.0, 0.0, 0.0, 0.0, 42.3, 0.0], "audiomae_on_audioset": [[["mains hum", 32.4], ["hum", 26.43], ["music", 9.95]], null, [["frog", 26.73], ["sidetone", 25.13], ["speech", 21.95]], null, null, null, null, null, null, null, [["noise", 24.25], ["music", 14.5], ["effects unit", 12.38]], null], "duration": [4.21, 0.32, 2.4, 1.17, 3.41, 7.1, 1.57, 1.68, 1.47, 1.03, 4.32, 1.05]} \ No newline at end of file diff --git a/annotations_1/upoh7LbKZR0_filtered.json b/annotations_1/upoh7LbKZR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c1b1b0a0cec6ccf000245b8116af66c25d12794 --- /dev/null +++ b/annotations_1/upoh7LbKZR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.09], [6.0, 5.97], [6.0, 6.88], [8.0, 8.95], [10.0, 10.57], [12.0, 13.31], [14.0, 30.4], [37.0, 37.45], [38.0, 42.69], [43.0, 43.73], [45.0, 45.62], [46.0, 46.95], [47.0, 47.95], [49.0, 50.14], [51.0, 51.9], [53.0, 53.0], [55.0, 54.9], [55.0, 55.9], [57.0, 57.2], [58.0, 58.75], [60.0, 60.4], [62.0, 62.56], [63.0, 63.15], [65.0, 66.28], [72.0, 72.59], [73.0, 74.41], [76.0, 76.71], [79.0, 79.59], [84.0, 84.23], [86.0, 86.19], [87.0, 87.59], [89.0, 89.53], [92.0, 101.7], [102.0, 102.91], [104.0, 104.46], [106.0, 106.44], [112.0, 112.13], [113.0, 113.73], [115.0, 118.76], [126.0, 145.56], [147.0, 147.01], [147.0, 152.49]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.75, 0.0, 35.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.46, 0.0, 0.0, 0.0, 0.0, 0.0, 32.2, 64.63, 0.0, 99.9], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 28.59], ["ambient music", 11.11], ["didgeridoo", 6.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["throbbing", 22.59], ["hum", 18.95], ["heart murmur", 10.94]], null, null, null, null, null, [["music", 32.71], ["synthesizer", 9.45], ["sidetone", 9.16]], null, null, null], "duration": [1.09, -0.03, 0.88, 0.95, 0.57, 1.31, 16.4, 0.45, 4.69, 0.73, 0.62, 0.95, 0.95, 1.14, 0.9, 0.0, -0.1, 0.9, 0.2, 0.75, 0.4, 0.56, 0.15, 1.28, 0.59, 1.41, 0.71, 0.59, 0.23, 0.19, 0.59, 0.53, 9.7, 0.91, 0.46, 0.44, 0.13, 0.73, 3.76, 19.56, 0.01, 5.49]} \ No newline at end of file diff --git a/annotations_1/uqS2-v7iZr8_filtered.json b/annotations_1/uqS2-v7iZr8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c3d1d92b9de394bf55fe8e1dad255aa8124b48c7 --- /dev/null +++ b/annotations_1/uqS2-v7iZr8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.18], [15.0, 14.94], [15.0, 16.04], [18.0, 50.72], [52.0, 58.11], [60.0, 61.05], [63.0, 64.05], [69.0, 69.48], [73.0, 74.65], [76.0, 78.21], [82.0, 86.46], [88.0, 98.56], [100.0, 114.32], [116.0, 115.99], [117.0, 120.51], [121.0, 122.44]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [28.51, 0.0, 0.0, 0.0, 57.01, 0.0, 0.0, 0.0, 0.0, 45.56, 41.46, 35.82, 34.14, 0.0, 62.17, 0.0], "audiomae_on_audioset": [[["music", 57.39], ["didgeridoo", 6.55], ["musical instrument", 4.94]], null, null, null, null, null, null, null, null, [["music", 52.26], ["theremin", 18.01], ["musical instrument", 8.12]], [["music", 39.35], ["cello", 32.76], ["double bass", 10.67]], [["music", 32.47], ["hum", 20.09], ["mains hum", 14.14]], [["theremin", 87.37], ["music", 8.2], ["musical instrument", 1.1]], null, null, null], "duration": [3.18, -0.06, 1.04, 32.72, 6.11, 1.05, 1.05, 0.48, 1.65, 2.21, 4.46, 10.56, 14.32, -0.01, 3.51, 1.44]} \ No newline at end of file diff --git a/annotations_1/uqVEYJGg3J0_filtered.json b/annotations_1/uqVEYJGg3J0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8fee5add04e5cca4820bcfcaec27c797cbdb0f5e --- /dev/null +++ b/annotations_1/uqVEYJGg3J0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.39], [8.0, 9.39], [10.0, 10.37], [13.0, 13.61], [18.0, 19.68], [22.0, 23.35], [25.0, 25.95], [40.0, 40.71], [42.0, 43.43], [46.0, 47.36], [50.0, 52.02], [52.0, 58.19], [63.0, 67.15], [69.0, 69.43], [73.0, 73.63], [76.0, 77.01], [83.0, 84.77], [87.0, 87.98], [91.0, 93.65], [100.0, 101.92], [103.0, 104.23], [106.0, 107.42], [109.0, 109.22], [111.0, 111.42], [112.0, 112.58], [116.0, 118.25], [121.0, 122.07], [124.0, 126.35], [135.0, 136.0], [138.0, 139.18], [141.0, 141.08], [146.0, 145.67], [150.0, 150.53], [153.0, 155.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.96, 58.89, 99.59, 0.0, 0.0, 0.0, 0.0, 0.0, 32.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.19, 0.0, 91.64, 0.0, 0.0, 0.0, 0.0, 0.0, 65.67], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 69.06], ["radio", 25.01], ["sidetone", 2.02]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.39, 1.39, 0.37, 0.61, 1.68, 1.35, 0.95, 0.71, 1.43, 1.36, 2.02, 6.19, 4.15, 0.43, 0.63, 1.01, 1.77, 0.98, 2.65, 1.92, 1.23, 1.42, 0.22, 0.42, 0.58, 2.25, 1.07, 2.35, 1.0, 1.18, 0.08, -0.33, 0.53, 2.04]} \ No newline at end of file diff --git a/annotations_1/urbo6F_qD5k_filtered.json b/annotations_1/urbo6F_qD5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d1a7f1a06048e87d18356031baf5b0c8ab9b84b --- /dev/null +++ b/annotations_1/urbo6F_qD5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.29], [5.0, 5.37], [8.0, 8.65], [10.0, 10.45], [15.0, 16.07], [17.0, 24.12], [25.0, 26.2], [29.0, 29.0], [31.0, 31.01], [35.0, 37.02], [42.0, 71.32], [72.0, 112.45], [117.0, 119.72], [122.0, 122.39], [128.0, 135.01], [137.0, 143.43], [147.0, 148.76], [149.0, 149.17], [149.0, 150.3], [152.0, 153.15]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true, false, false, false, false], "silence_prob": [76.2, 0.0, 0.0, 0.0, 0.0, 79.94, 0.0, 0.0, 0.0, 29.44, 55.04, 0.0, 33.63, 0.0, 30.02, 29.98, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 11.72], ["vehicle", 8.82], ["buzz", 6.26]], null, null, [["fly, housefly", 28.12], ["insect", 10.88], ["music", 9.39]], null, [["music", 77.91], ["groan", 3.37], ["speech", 1.54]], [["livestock, farm animals, working animals", 34.27], ["cattle, bovinae", 20.66], ["moo", 8.34]], null, null, null, null], "duration": [2.29, 0.37, 0.65, 0.45, 1.07, 7.12, 1.2, 0.0, 0.01, 2.02, 29.32, 40.45, 2.72, 0.39, 7.01, 6.43, 1.76, 0.17, 1.3, 1.15]} \ No newline at end of file diff --git a/annotations_1/usmBCn2WxYU_filtered.json b/annotations_1/usmBCn2WxYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7f18c93ec816edfa7c320353bd5fb429e2ddae5a --- /dev/null +++ b/annotations_1/usmBCn2WxYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 19.33], [22.0, 26.3], [29.0, 31.21], [32.0, 55.49], [59.0, 79.39], [82.0, 110.67], [112.0, 118.61], [121.0, 156.78]], "keep_status": [true, true, true, false, false, false, true, false], "silence_prob": [29.03, 30.02, 30.78, 31.57, 29.86, 29.98, 30.27, 0.0], "audiomae_on_audioset": [[["music", 51.0], ["cacophony", 11.87], ["theremin", 3.93]], [["music", 13.05], ["motorcycle", 10.17], ["vehicle", 9.16]], [["speech", 28.68], ["music", 25.87], ["hum", 11.95]], [["hum", 48.31], ["throbbing", 37.93], ["music", 7.27]], [["music", 44.41], ["throbbing", 32.6], ["hum", 11.17]], [["hum", 58.97], ["mains hum", 10.24], ["music", 9.4]], [["music", 40.34], ["speech", 9.33], ["groan", 3.74]], null], "duration": [4.33, 4.3, 2.21, 23.49, 20.39, 28.67, 6.61, 35.78]} \ No newline at end of file diff --git a/annotations_1/utYsQTUae5w_filtered.json b/annotations_1/utYsQTUae5w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9cc11580a9c96ce088ed9c89795e701f7f550e8 --- /dev/null +++ b/annotations_1/utYsQTUae5w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 20.92], [29.0, 29.05], [43.0, 44.69], [52.0, 53.97], [56.0, 56.32], [63.0, 63.24], [70.0, 72.37], [75.0, 75.22], [80.0, 87.05], [88.0, 88.38], [90.0, 90.56], [93.0, 94.54]], "keep_status": [true, false, false, false, false, false, true, false, true, false, false, false], "silence_prob": [31.07, 0.0, 0.0, 0.0, 0.0, 0.0, 32.72, 0.0, 32.7, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 30.91], ["whip", 9.61], ["explosion", 7.58]], null, null, null, null, null, [["fart", 32.03], ["speech", 17.77], ["sidetone", 5.2]], null, [["speech", 20.59], ["gunshot, gunfire", 15.64], ["artillery fire", 10.64]], null, null, null], "duration": [2.92, 0.05, 1.69, 1.97, 0.32, 0.24, 2.37, 0.22, 7.05, 0.38, 0.56, 1.54]} \ No newline at end of file diff --git a/annotations_1/ut_z2-96X0o_filtered.json b/annotations_1/ut_z2-96X0o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b422d84f9a6a1662a4383ef7da5c307f623afd0e --- /dev/null +++ b/annotations_1/ut_z2-96X0o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 16.01], [17.0, 21.19], [22.0, 28.97], [30.0, 30.45], [31.0, 32.64], [33.0, 36.48], [38.0, 40.34], [41.0, 41.08], [43.0, 42.92], [44.0, 51.0], [52.0, 52.47], [54.0, 53.55], [54.0, 54.33], [55.0, 55.65], [56.0, 57.42], [58.0, 59.73], [61.0, 61.08], [62.0, 63.81], [65.0, 66.93], [68.0, 68.08], [69.0, 69.53], [71.0, 71.31], [72.0, 78.87], [79.0, 79.47], [80.0, 81.31], [82.0, 82.27], [83.0, 83.4], [84.0, 84.59], [85.0, 86.76], [87.0, 90.32], [91.0, 91.71], [93.0, 93.82], [95.0, 96.72], [98.0, 99.4], [101.0, 102.15], [103.0, 103.64], [104.0, 104.62], [105.0, 114.34], [117.0, 118.94], [119.0, 120.33], [121.0, 122.18], [123.0, 125.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.99, 47.58, 100.0, 0.0, 0.0, 81.17, 50.97, 0.0, 0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.9, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, [["sidetone", 44.79], ["speech", 15.65], ["mains hum", 11.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.01, 4.19, 6.97, 0.45, 1.64, 3.48, 2.34, 0.08, -0.08, 7.0, 0.47, -0.45, 0.33, 0.65, 1.42, 1.73, 0.08, 1.81, 1.93, 0.08, 0.53, 0.31, 6.87, 0.47, 1.31, 0.27, 0.4, 0.59, 1.76, 3.32, 0.71, 0.82, 1.72, 1.4, 1.15, 0.64, 0.62, 9.34, 1.94, 1.33, 1.18, 2.83]} \ No newline at end of file diff --git a/annotations_1/uta8BACjLNk_filtered.json b/annotations_1/uta8BACjLNk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dcd0f08813a6f03bde74578fb4740dfe90abaf6b --- /dev/null +++ b/annotations_1/uta8BACjLNk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.62], [7.0, 7.65], [8.0, 9.02], [10.0, 12.82], [14.0, 14.94], [18.0, 19.16], [20.0, 21.34], [23.0, 23.31], [24.0, 24.11], [26.0, 26.13], [35.0, 35.56], [38.0, 39.72], [42.0, 43.19], [45.0, 44.9], [49.0, 49.59], [54.0, 55.07], [56.0, 56.12], [57.0, 59.7], [60.0, 60.49], [61.0, 62.36], [63.0, 64.4], [69.0, 69.55], [72.0, 72.1], [74.0, 74.36], [80.0, 79.64], [84.0, 84.21], [92.0, 92.26], [107.0, 107.08], [110.0, 109.58], [111.0, 111.15], [112.0, 111.91], [113.0, 114.98], [116.0, 117.0], [121.0, 121.73], [122.0, 123.63], [128.0, 129.09], [131.0, 131.82], [134.0, 134.57], [136.0, 139.97], [140.0, 140.75], [144.0, 144.12], [145.0, 146.43]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.85, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.16], ["music", 24.99], ["burst, pop", 5.97]], null, null, null], "duration": [-0.38, 0.65, 1.02, 2.82, 0.94, 1.16, 1.34, 0.31, 0.11, 0.13, 0.56, 1.72, 1.19, -0.1, 0.59, 1.07, 0.12, 2.7, 0.49, 1.36, 1.4, 0.55, 0.1, 0.36, -0.36, 0.21, 0.26, 0.08, -0.42, 0.15, -0.09, 1.98, 1.0, 0.73, 1.63, 1.09, 0.82, 0.57, 3.97, 0.75, 0.12, 1.43]} \ No newline at end of file diff --git a/annotations_1/uuNy1Ibdk_Y_filtered.json b/annotations_1/uuNy1Ibdk_Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6254876eac6c39709a4fcf476d6366c9798823fe --- /dev/null +++ b/annotations_1/uuNy1Ibdk_Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [11.0, 10.94], [13.0, 21.93], [25.0, 28.58], [36.0, 36.41], [37.0, 55.29], [58.0, 60.03], [62.0, 63.29], [64.0, 65.04], [68.0, 76.28], [76.0, 76.54], [79.0, 81.73], [83.0, 84.2], [97.0, 97.71], [111.0, 112.82], [125.0, 126.62], [132.0, 133.42], [142.0, 146.75], [155.0, 156.78], [160.0, 159.76]], "keep_status": [false, false, true, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 47.01, 33.65, 0.0, 30.91, 99.85, 0.0, 0.0, 34.29, 0.0, 38.26, 0.0, 0.0, 0.0, 0.0, 0.0, 39.01, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.35], ["synthesizer", 6.97], ["singing bowl", 5.17]], [["speech", 49.89], ["music", 12.2], ["zipper (clothing)", 6.23]], null, [["music", 48.66], ["electric shaver, electric razor", 11.91], ["speech", 7.92]], null, null, null, [["cattle, bovinae", 15.23], ["livestock, farm animals, working animals", 13.53], ["music", 13.3]], null, [["music", 57.89], ["synthesizer", 6.74], ["drum machine", 6.2]], null, null, null, null, null, [["music", 43.42], ["throbbing", 21.44], ["hum", 18.3]], null, null], "duration": [0.5, -0.06, 8.93, 3.58, 0.41, 18.29, 2.03, 1.29, 1.04, 8.28, 0.54, 2.73, 1.2, 0.71, 1.82, 1.62, 1.42, 4.75, 1.78, -0.24]} \ No newline at end of file diff --git a/annotations_1/uuTeJ6tbyB4_filtered.json b/annotations_1/uuTeJ6tbyB4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7cdc8a2c685ce73df6f2de28bf817e592acfd65 --- /dev/null +++ b/annotations_1/uuTeJ6tbyB4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 65.94], [67.0, 69.13], [70.0, 72.03], [74.0, 75.78], [105.0, 105.33], [108.0, 109.56], [111.0, 111.37], [113.0, 113.07], [114.0, 120.02], [122.0, 126.59], [127.0, 129.59], [131.0, 131.46], [135.0, 135.57], [137.0, 137.71], [141.0, 141.96], [143.0, 144.02], [146.0, 146.94], [151.0, 152.91], [155.0, 155.9], [157.0, 157.25], [158.0, 158.92], [160.0, 161.22], [167.0, 167.31], [168.0, 168.44]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.94, 40.29, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 100.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["echo", 20.81], ["music", 12.6], ["synthesizer", 7.62]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [32.94, 2.13, 2.03, 1.78, 0.33, 1.56, 0.37, 0.07, 6.02, 4.59, 2.59, 0.46, 0.57, 0.71, 0.96, 1.02, 0.94, 1.91, 0.9, 0.25, 0.92, 1.22, 0.31, 0.44]} \ No newline at end of file diff --git a/annotations_1/uuWIaDATbnE_filtered.json b/annotations_1/uuWIaDATbnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..46ce7ce40a9bd8ec714fc6d5ec6b63b4717269ee --- /dev/null +++ b/annotations_1/uuWIaDATbnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.69], [10.0, 12.24], [30.0, 30.84], [35.0, 35.04], [54.0, 54.51], [55.0, 56.22], [57.0, 57.33], [59.0, 59.39], [66.0, 67.59], [83.0, 83.29], [89.0, 89.87], [105.0, 106.14], [107.0, 113.64], [114.0, 116.75], [124.0, 124.48], [129.0, 130.08]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.4, 31.09, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 39.58], ["throbbing", 23.81], ["hum", 5.82]], null, null, null, null, null, null, null, null, null, null, [["music", 46.56], ["speech", 25.24], ["frog", 2.86]], [["moo", 41.93], ["cattle, bovinae", 38.16], ["livestock, farm animals, working animals", 13.49]], null, null], "duration": [-0.31, 2.24, 0.84, 0.04, 0.51, 1.22, 0.33, 0.39, 1.59, 0.29, 0.87, 1.14, 6.64, 2.75, 0.48, 1.08]} \ No newline at end of file diff --git a/annotations_1/uvZImlL51Io_filtered.json b/annotations_1/uvZImlL51Io_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7b1ebbdcc1de9abd3519ebf2d56af2941da073c3 --- /dev/null +++ b/annotations_1/uvZImlL51Io_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.41], [23.0, 23.45], [23.0, 23.52], [24.0, 87.12], [92.0, 104.33], [105.0, 108.26], [109.0, 109.85], [111.0, 111.89]], "keep_status": [false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.51, 32.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 29.87], ["hum", 29.43], ["music", 19.51]], [["speech", 53.04], ["cacophony", 7.31], ["vehicle", 6.84]], null, null], "duration": [0.41, 0.45, 0.52, 63.12, 12.33, 3.26, 0.85, 0.89]} \ No newline at end of file diff --git a/annotations_1/uw7rRlJvEl4_filtered.json b/annotations_1/uw7rRlJvEl4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..019e84a80931fbf5fe992dd0e5be4f0d4d3ad498 --- /dev/null +++ b/annotations_1/uw7rRlJvEl4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 91.39]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [62.39]} \ No newline at end of file diff --git a/annotations_1/uxj3cKArYDI_filtered.json b/annotations_1/uxj3cKArYDI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..173feb9020126aa72fc2378333d78d411e9eea40 --- /dev/null +++ b/annotations_1/uxj3cKArYDI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.25], [6.0, 6.25], [17.0, 17.91], [36.0, 36.49], [39.0, 40.07], [41.0, 41.79], [43.0, 43.48], [48.0, 50.18], [54.0, 54.23], [58.0, 58.63], [90.0, 90.76], [109.0, 109.97], [115.0, 116.6], [120.0, 120.23], [127.0, 127.28], [131.0, 131.28], [137.0, 137.0], [194.0, 194.22], [204.0, 204.75], [225.0, 226.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["mains hum", 29.22], ["speech", 25.06], ["hum", 22.04]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.25, 0.25, 0.91, 0.49, 1.07, 0.79, 0.48, 2.18, 0.23, 0.63, 0.76, 0.97, 1.6, 0.23, 0.28, 0.28, 0.0, 0.22, 0.75, 1.17]} \ No newline at end of file diff --git a/annotations_1/uy4F1IeShVA_filtered.json b/annotations_1/uy4F1IeShVA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43ef0a7152129523def8affaf7a7101240636b66 --- /dev/null +++ b/annotations_1/uy4F1IeShVA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 18.49], [20.0, 24.83], [25.0, 41.79], [42.0, 83.17], [83.0, 83.49], [85.0, 86.21], [87.0, 116.18], [116.0, 118.64], [122.0, 122.99], [124.0, 124.26], [127.0, 127.14]], "keep_status": [true, true, true, false, false, false, true, false, false, false, false], "silence_prob": [40.88, 39.35, 39.49, 0.0, 0.0, 0.0, 37.84, 59.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 41.54], ["theremin", 13.44], ["hum", 5.34]], [["music", 60.81], ["throbbing", 4.57], ["didgeridoo", 3.91]], [["music", 27.87], ["speech", 20.15], ["sidetone", 7.27]], null, null, null, [["music", 34.37], ["speech", 27.32], ["sidetone", 8.26]], null, null, null, null], "duration": [4.49, 4.83, 16.79, 41.17, 0.49, 1.21, 29.18, 2.64, 0.99, 0.26, 0.14]} \ No newline at end of file diff --git a/annotations_1/uydWF18xoCQ_filtered.json b/annotations_1/uydWF18xoCQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..028e4e57668a5c3b73ad3518d285e964d3fec46d --- /dev/null +++ b/annotations_1/uydWF18xoCQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 7.64], [9.0, 57.62], [60.0, 59.59], [62.0, 64.5], [70.0, 71.93], [73.0, 74.63], [76.0, 78.93], [80.0, 84.6], [86.0, 97.7], [99.0, 114.78]], "keep_status": [false, false, false, true, false, false, false, false, false, true], "silence_prob": [32.98, 0.0, 0.0, 32.64, 0.0, 0.0, 52.74, 45.33, 30.59, 29.43], "audiomae_on_audioset": [[["music", 64.28], ["theremin", 9.83], ["musical instrument", 3.54]], null, null, [["music", 50.95], ["gong", 13.83], ["synthesizer", 4.87]], null, null, null, [["music", 67.56], ["percussion", 4.47], ["drum", 4.05]], [["music", 57.92], ["hum", 16.25], ["throbbing", 8.2]], [["hum", 25.7], ["throbbing", 21.52], ["music", 21.23]]], "duration": [4.64, 48.62, -0.41, 2.5, 1.93, 1.63, 2.93, 4.6, 11.7, 15.78]} \ No newline at end of file diff --git a/annotations_1/uzMEc37DGZA_filtered.json b/annotations_1/uzMEc37DGZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9e78a72f69abb97bfd4074b0935770354c9ae1a5 --- /dev/null +++ b/annotations_1/uzMEc37DGZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.2], [7.0, 7.21], [11.0, 11.35], [14.0, 14.03], [17.0, 16.68], [21.0, 20.95], [25.0, 25.41], [30.0, 30.23], [31.0, 31.65], [40.0, 40.59], [43.0, 43.46], [44.0, 44.79], [47.0, 48.52], [54.0, 56.71], [57.0, 60.44], [65.0, 65.74], [67.0, 66.7], [68.0, 68.39], [69.0, 70.29], [72.0, 72.98], [76.0, 76.47], [78.0, 78.71], [81.0, 80.89], [83.0, 83.64], [89.0, 89.48], [90.0, 90.61], [100.0, 100.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.21, 51.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.2, 0.21, 0.35, 0.03, -0.32, -0.05, 0.41, 0.23, 0.65, 0.59, 0.46, 0.79, 1.52, 2.71, 3.44, 0.74, -0.3, 0.39, 1.29, 0.98, 0.47, 0.71, -0.11, 0.64, 0.48, 0.61, 0.82]} \ No newline at end of file diff --git a/annotations_1/uzTuGHYRJ9w_filtered.json b/annotations_1/uzTuGHYRJ9w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..818399577e7ac8fca2823bf145f1304cd6924291 --- /dev/null +++ b/annotations_1/uzTuGHYRJ9w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.82], [10.0, 10.25], [11.0, 12.38], [21.0, 21.69], [25.0, 25.81], [29.0, 48.14], [50.0, 59.05], [60.0, 60.66], [63.0, 62.94], [68.0, 68.03], [71.0, 72.18], [74.0, 74.88], [84.0, 84.89], [87.0, 89.34], [107.0, 133.22], [142.0, 143.5], [152.0, 152.9], [154.0, 157.99], [160.0, 161.69], [163.0, 163.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [38.93, 0.0, 0.0, 0.0, 0.0, 38.54, 28.95, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.11, 30.1, 0.0, 0.0, 38.75, 0.0, 0.0], "audiomae_on_audioset": [[["music", 50.6], ["theremin", 10.63], ["synthesizer", 9.49]], null, null, null, null, [["music", 52.08], ["synthesizer", 17.36], ["electronic music", 4.89]], [["music", 42.68], ["speech", 28.43], ["musical instrument", 4.83]], null, null, null, null, null, null, [["speech", 23.83], ["fart", 23.15], ["laughter", 12.63]], [["music", 18.68], ["fly, housefly", 18.56], ["fart", 13.06]], null, null, [["speech", 56.13], ["whack, thwack", 9.67], ["thunk", 5.66]], null, null], "duration": [2.82, 0.25, 1.38, 0.69, 0.81, 19.14, 9.05, 0.66, -0.06, 0.03, 1.18, 0.88, 0.89, 2.34, 26.22, 1.5, 0.9, 3.99, 1.69, 0.53]} \ No newline at end of file diff --git a/annotations_1/uzeSNmjxyNg_filtered.json b/annotations_1/uzeSNmjxyNg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0a8e2ec7f54cdc72e35da84069020fb15b5898b --- /dev/null +++ b/annotations_1/uzeSNmjxyNg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.63], [7.0, 7.43], [9.0, 12.97], [14.0, 14.84], [16.0, 16.06], [23.0, 23.03], [24.0, 23.84], [26.0, 29.22], [30.0, 30.86], [31.0, 59.44], [61.0, 83.86]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [40.84, 0.0, 60.89, 0.0, 0.0, 0.0, 0.0, 46.94, 0.0, 29.69, 29.72], "audiomae_on_audioset": [[["cattle, bovinae", 32.09], ["moo", 25.71], ["livestock, farm animals, working animals", 16.02]], null, null, null, null, null, null, [["moo", 16.3], ["cattle, bovinae", 9.69], ["livestock, farm animals, working animals", 9.48]], null, [["hum", 17.5], ["music", 15.65], ["whack, thwack", 13.06]], [["hum", 44.79], ["gong", 23.52], ["throbbing", 8.69]]], "duration": [4.63, 0.43, 3.97, 0.84, 0.06, 0.03, -0.16, 3.22, 0.86, 28.44, 22.86]} \ No newline at end of file diff --git a/annotations_1/uzhsjyHUBt8_filtered.json b/annotations_1/uzhsjyHUBt8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56feded97cf54ebe456321fb935d25181bf1c4e8 --- /dev/null +++ b/annotations_1/uzhsjyHUBt8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.76], [7.0, 9.07], [23.0, 22.94], [41.0, 41.54], [57.0, 57.32], [64.0, 65.91], [68.0, 68.4], [69.0, 74.76], [77.0, 77.25], [78.0, 79.81], [81.0, 81.28], [88.0, 88.84], [108.0, 108.58], [109.0, 111.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 57.97, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.76, 2.07, -0.06, 0.54, 0.32, 1.91, 0.4, 5.76, 0.25, 1.81, 0.28, 0.84, 0.58, 2.13]} \ No newline at end of file diff --git a/annotations_1/v00zKyXbfD4_filtered.json b/annotations_1/v00zKyXbfD4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..19322d6cdd7d900fa5d9aa6ed7f87095f3590a38 --- /dev/null +++ b/annotations_1/v00zKyXbfD4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 150.45], [150.0, 150.85]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [140.45, 0.85]} \ No newline at end of file diff --git a/annotations_1/v04j4-SBv9M_filtered.json b/annotations_1/v04j4-SBv9M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..903b06f6059c4a9c733c002e34ef588bc4f23710 --- /dev/null +++ b/annotations_1/v04j4-SBv9M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.46], [2.0, 20.28], [20.0, 21.05], [21.0, 37.44], [39.0, 51.63], [61.0, 61.43], [85.0, 85.53], [86.0, 86.19], [87.0, 87.29], [90.0, 91.77]], "keep_status": [false, true, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 29.89, 0.0, 28.85, 30.46, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 32.69], ["didgeridoo", 12.57], ["gong", 5.22]], null, [["speech", 28.0], ["buzz", 18.83], ["vehicle", 14.03]], [["music", 68.5], ["synthesizer", 4.98], ["hum", 4.91]], null, null, null, null, null], "duration": [0.46, 18.28, 1.05, 16.44, 12.63, 0.43, 0.53, 0.19, 0.29, 1.77]} \ No newline at end of file diff --git a/annotations_1/v0AyEpFDi48_filtered.json b/annotations_1/v0AyEpFDi48_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02513b53273861476ea2e2b0a17ed5749ca14c85 --- /dev/null +++ b/annotations_1/v0AyEpFDi48_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 27.75], [28.0, 44.95], [48.0, 51.0], [52.0, 116.46], [122.0, 148.51], [153.0, 153.57], [154.0, 154.9], [159.0, 159.6], [161.0, 181.04], [183.0, 242.1]], "keep_status": [true, true, true, false, true, false, false, false, true, false], "silence_prob": [28.74, 29.06, 31.48, 0.0, 28.87, 0.0, 0.0, 0.0, 28.87, 0.0], "audiomae_on_audioset": [[["car", 15.52], ["vehicle", 15.48], ["music", 8.33]], [["speech", 22.11], ["hum", 18.88], ["mains hum", 14.79]], [["music", 18.29], ["speech", 15.86], ["whale vocalization", 10.14]], null, [["music", 41.28], ["speech", 12.94], ["mains hum", 6.46]], null, null, null, [["music", 50.0], ["throbbing", 9.85], ["hum", 8.65]], null], "duration": [14.75, 16.95, 3.0, 64.46, 26.51, 0.57, 0.9, 0.6, 20.04, 59.1]} \ No newline at end of file diff --git a/annotations_1/v0gGWiRkjYM_filtered.json b/annotations_1/v0gGWiRkjYM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcf11e09ed433c5b832e0911a9f56c822ae2656f --- /dev/null +++ b/annotations_1/v0gGWiRkjYM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.13], [3.0, 8.73], [11.0, 19.47], [35.0, 39.63], [50.0, 58.06], [66.0, 79.59], [83.0, 93.34], [96.0, 109.49], [116.0, 130.82]], "keep_status": [false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 62.17, 41.1, 31.34, 31.23, 31.35, 31.26, 31.69, 30.66], "audiomae_on_audioset": [null, null, [["music", 37.7], ["keyboard (musical)", 18.53], ["piano", 15.71]], [["music", 56.25], ["speech", 8.94], ["synthesizer", 4.35]], [["music", 84.52], ["swing music", 1.95], ["musical instrument", 0.85]], [["music", 83.31], ["funk", 1.44], ["singing", 0.79]], [["music", 79.37], ["musical instrument", 3.29], ["didgeridoo", 1.61]], [["music", 38.47], ["didgeridoo", 14.93], ["cattle, bovinae", 14.0]], [["music", 81.32], ["didgeridoo", 4.57], ["speech", 2.72]]], "duration": [1.13, 5.73, 8.47, 4.63, 8.06, 13.59, 10.34, 13.49, 14.82]} \ No newline at end of file diff --git a/annotations_1/v2qDlGbaqSQ_filtered.json b/annotations_1/v2qDlGbaqSQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d1010b1f622f91ada30107f928cb210c9ff2dc7 --- /dev/null +++ b/annotations_1/v2qDlGbaqSQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.09], [5.0, 13.19], [18.0, 19.2], [24.0, 26.2], [28.0, 29.13], [31.0, 32.54], [35.0, 35.77], [38.0, 38.92], [42.0, 45.05], [47.0, 47.82], [50.0, 51.7], [55.0, 55.12], [56.0, 58.5], [63.0, 64.77], [75.0, 81.38], [83.0, 84.4], [86.0, 87.45], [90.0, 94.14], [97.0, 96.89], [97.0, 100.11], [105.0, 119.94], [126.0, 126.3], [129.0, 130.79], [135.0, 138.25], [142.0, 147.24], [149.0, 149.28], [154.0, 155.34], [156.0, 158.7], [161.0, 161.76], [163.0, 165.01], [167.0, 166.85], [168.0, 171.75], [174.0, 175.09], [180.0, 183.25], [185.0, 189.33], [199.0, 199.77], [200.0, 200.82], [203.0, 204.01], [210.0, 214.83], [216.0, 221.83], [224.0, 230.32], [233.0, 233.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.46, 70.86, 0.0, 97.64, 0.0, 0.0, 0.0, 0.0, 63.1, 0.0, 0.0, 0.0, 75.88, 0.0, 74.44, 0.0, 0.0, 50.56, 0.0, 60.98, 47.43, 0.0, 0.0, 47.39, 53.78, 0.0, 0.0, 60.32, 0.0, 58.13, 0.0, 59.42, 0.0, 56.63, 53.72, 0.0, 0.0, 0.0, 46.26, 60.51, 63.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.09], ["cello", 6.63], ["double bass", 5.88]], null, null, [["music", 55.6], ["theremin", 24.22], ["cello", 2.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 70.17], ["guitar", 4.09], ["musical instrument", 3.63]], null, null, null], "duration": [2.09, 8.19, 1.2, 2.2, 1.13, 1.54, 0.77, 0.92, 3.05, 0.82, 1.7, 0.12, 2.5, 1.77, 6.38, 1.4, 1.45, 4.14, -0.11, 3.11, 14.94, 0.3, 1.79, 3.25, 5.24, 0.28, 1.34, 2.7, 0.76, 2.01, -0.15, 3.75, 1.09, 3.25, 4.33, 0.77, 0.82, 1.01, 4.83, 5.83, 6.32, 0.54]} \ No newline at end of file diff --git a/annotations_1/v3E4s7VN4xE_filtered.json b/annotations_1/v3E4s7VN4xE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53528e3fd1d76000b76d18bd413b610671ceacf2 --- /dev/null +++ b/annotations_1/v3E4s7VN4xE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.75], [4.0, 6.51], [9.0, 12.38], [20.0, 21.56], [25.0, 26.22], [27.0, 29.32], [32.0, 34.7], [47.0, 48.57], [50.0, 56.78], [60.0, 60.44], [62.0, 64.62], [67.0, 70.17], [73.0, 73.2], [74.0, 75.63], [89.0, 92.18], [93.0, 96.03], [106.0, 108.4], [110.0, 110.46], [111.0, 111.57], [115.0, 117.34]], "keep_status": [false, false, false, false, false, true, true, false, true, false, true, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 100.0, 79.24, 0.0, 0.0, 42.13, 33.6, 0.0, 42.53, 0.0, 33.65, 34.41, 0.0, 0.0, 36.61, 39.67, 42.04, 0.0, 0.0, 99.71], "audiomae_on_audioset": [null, null, null, null, null, [["music", 26.4], ["crow", 6.86], ["speech", 4.33]], [["speech", 38.27], ["music", 25.62], ["hum", 3.96]], null, [["speech", 59.36], ["music", 7.29], ["ding", 3.2]], null, [["music", 39.91], ["synthesizer", 5.61], ["musical instrument", 3.21]], [["music", 46.17], ["speech", 22.06], ["hum", 4.88]], null, null, [["music", 30.36], ["fly, housefly", 15.99], ["insect", 5.12]], [["music", 31.81], ["speech", 27.88], ["musical instrument", 2.78]], [["quack", 43.43], ["music", 32.0], ["duck", 10.71]], null, null, null], "duration": [0.75, 2.51, 3.38, 1.56, 1.22, 2.32, 2.7, 1.57, 6.78, 0.44, 2.62, 3.17, 0.2, 1.63, 3.18, 3.03, 2.4, 0.46, 0.57, 2.34]} \ No newline at end of file diff --git a/annotations_1/v3bWb5qZMu8_filtered.json b/annotations_1/v3bWb5qZMu8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..154d1eeff08f5aa797f6f67fbcf38dec53bd8974 --- /dev/null +++ b/annotations_1/v3bWb5qZMu8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [4.0, 80.72], [81.0, 131.82], [132.0, 138.89], [139.0, 139.55], [140.0, 141.03], [142.0, 142.28], [143.0, 146.96], [147.0, 150.35], [158.0, 170.68], [176.0, 176.49]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 34.87, 0.0, 0.0, 0.0, 45.92, 37.35, 32.81, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 55.2], ["animal", 4.15], ["fowl", 3.69]], null, null, null, [["music", 24.23], ["speech", 23.55], ["electric shaver, electric razor", 6.94]], [["cowbell", 31.44], ["moo", 20.69], ["cattle, bovinae", 19.86]], [["speech", 59.06], ["electric shaver, electric razor", 8.85], ["hum", 4.35]], null], "duration": [0.44, 76.72, 50.82, 6.89, 0.55, 1.03, 0.28, 3.96, 3.35, 12.68, 0.49]} \ No newline at end of file diff --git a/annotations_1/v4U2mAwO6-4_filtered.json b/annotations_1/v4U2mAwO6-4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d04efef44f92c3fb2a9a042917b85bec799bc967 --- /dev/null +++ b/annotations_1/v4U2mAwO6-4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.56], [4.0, 5.46], [6.0, 7.97], [9.0, 9.76], [11.0, 11.15], [11.0, 12.31], [13.0, 15.55], [17.0, 19.18], [20.0, 23.33], [25.0, 28.07], [35.0, 37.12], [45.0, 47.14], [49.0, 53.45], [55.0, 68.64], [70.0, 70.63], [72.0, 73.43], [74.0, 75.39], [76.0, 77.45], [79.0, 79.08], [82.0, 82.63], [84.0, 84.55], [86.0, 87.15], [88.0, 90.07], [91.0, 93.02], [94.0, 95.52], [98.0, 97.73], [98.0, 101.38], [103.0, 106.02], [107.0, 109.54], [110.0, 111.7], [113.0, 113.97], [116.0, 117.8], [119.0, 124.01], [125.0, 126.69], [128.0, 135.23], [138.0, 143.01], [144.0, 145.0], [148.0, 150.72], [152.0, 152.2], [155.0, 157.13], [158.0, 158.6], [161.0, 163.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 94.37, 99.92, 99.48, 93.13, 96.89, 97.73, 93.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 99.68, 0.0, 0.0, 95.51, 84.07, 82.43, 0.0, 0.0, 0.0, 88.46, 0.0, 77.36, 89.01, 0.0, 71.0, 0.0, 75.23, 0.0, 37.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 35.29], ["insect", 9.09], ["fly, housefly", 6.72]]], "duration": [1.56, 1.46, 1.97, 0.76, 0.15, 1.31, 2.55, 2.18, 3.33, 3.07, 2.12, 2.14, 4.45, 13.64, 0.63, 1.43, 1.39, 1.45, 0.08, 0.63, 0.55, 1.15, 2.07, 2.02, 1.52, -0.27, 3.38, 3.02, 2.54, 1.7, 0.97, 1.8, 5.01, 1.69, 7.23, 5.01, 1.0, 2.72, 0.2, 2.13, 0.6, 2.16]} \ No newline at end of file diff --git a/annotations_1/v4np7L0aJd0_filtered.json b/annotations_1/v4np7L0aJd0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c3cde24bb45eaf4105cb294bb4639da42815fe0 --- /dev/null +++ b/annotations_1/v4np7L0aJd0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.75], [6.0, 7.75], [8.0, 8.67], [13.0, 13.85], [18.0, 17.96], [18.0, 19.26], [22.0, 23.63], [28.0, 29.42], [30.0, 37.05], [39.0, 39.72], [43.0, 43.07], [51.0, 52.52], [54.0, 54.82], [56.0, 55.97], [57.0, 57.91], [58.0, 60.29], [61.0, 63.93], [64.0, 65.97], [68.0, 69.69], [72.0, 73.01], [81.0, 81.75], [90.0, 90.17], [92.0, 91.98], [93.0, 94.63], [96.0, 96.03], [99.0, 100.11], [111.0, 112.46], [119.0, 123.28], [124.0, 127.72], [129.0, 149.28]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [37.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.27, 66.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 99.56, 32.08], "audiomae_on_audioset": [[["slam", 18.82], ["thunk", 12.29], ["door", 9.69]], null, null, null, null, null, null, null, [["speech", 39.2], ["moo", 16.35], ["cattle, bovinae", 15.45]], null, null, null, null, null, null, [["speech", 46.95], ["sidetone", 38.49], ["sine wave", 3.32]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 32.46], ["cattle, bovinae", 12.48], ["livestock, farm animals, working animals", 11.69]]], "duration": [3.75, 1.75, 0.67, 0.85, -0.04, 1.26, 1.63, 1.42, 7.05, 0.72, 0.07, 1.52, 0.82, -0.03, 0.91, 2.29, 2.93, 1.97, 1.69, 1.01, 0.75, 0.17, -0.02, 1.63, 0.03, 1.11, 1.46, 4.28, 3.72, 20.28]} \ No newline at end of file diff --git a/annotations_1/v5llnbqhLZM_filtered.json b/annotations_1/v5llnbqhLZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..070dd9682ebe22f488f952a37134530aa7fb9c6c --- /dev/null +++ b/annotations_1/v5llnbqhLZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.34], [5.0, 9.76], [12.0, 13.78], [16.0, 28.86], [32.0, 35.68], [37.0, 66.61], [69.0, 70.75], [73.0, 72.76], [73.0, 77.8], [78.0, 83.03], [87.0, 87.54], [88.0, 88.59], [91.0, 91.35], [97.0, 96.99], [97.0, 102.59], [103.0, 131.58], [134.0, 144.02], [146.0, 166.67], [167.0, 168.94], [171.0, 174.19], [176.0, 178.21]], "keep_status": [false, false, false, true, true, true, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 32.33, 0.0, 30.03, 29.36, 30.98, 0.0, 0.0, 29.79, 31.29, 0.0, 0.0, 0.0, 0.0, 33.14, 29.84, 29.62, 31.15, 0.0, 92.48, 92.64], "audiomae_on_audioset": [null, [["music", 40.32], ["hum", 24.93], ["throbbing", 16.6]], null, [["hum", 31.06], ["music", 29.19], ["speech", 6.47]], [["music", 17.15], ["buzz", 16.02], ["rumble", 9.96]], [["hum", 22.62], ["grunt", 16.27], ["noise", 12.69]], null, null, [["music", 68.07], ["grunt", 11.07], ["didgeridoo", 3.11]], [["music", 53.86], ["scary music", 11.83], ["foghorn", 9.43]], null, null, null, null, [["didgeridoo", 17.03], ["fart", 14.02], ["music", 12.05]], [["music", 38.37], ["hum", 22.16], ["mains hum", 15.79]], [["music", 42.17], ["whale vocalization", 12.24], ["groan", 7.16]], [["hum", 23.23], ["music", 22.15], ["sonar", 16.7]], null, null, null], "duration": [1.34, 4.76, 1.78, 12.86, 3.68, 29.61, 1.75, -0.24, 4.8, 5.03, 0.54, 0.59, 0.35, -0.01, 5.59, 28.58, 10.02, 20.67, 1.94, 3.19, 2.21]} \ No newline at end of file diff --git a/annotations_1/v5nIRiA5W-E_filtered.json b/annotations_1/v5nIRiA5W-E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3be9b3b82f678222ab0c531b35e839f83f0e537 --- /dev/null +++ b/annotations_1/v5nIRiA5W-E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.4], [9.0, 9.53], [16.0, 28.19], [33.0, 34.69], [41.0, 41.35], [45.0, 52.44], [53.0, 52.96], [54.0, 54.67], [55.0, 64.1], [65.0, 100.18]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.87, 0.0, 0.0, 31.03, 0.0, 0.0, 29.42, 0.0], "audiomae_on_audioset": [null, null, [["music", 23.92], ["livestock, farm animals, working animals", 13.93], ["mosquito", 13.1]], null, null, [["speech", 47.2], ["music", 18.88], ["grunt", 8.26]], null, null, [["cattle, bovinae", 38.03], ["livestock, farm animals, working animals", 19.59], ["moo", 19.59]], null], "duration": [1.4, 0.53, 12.19, 1.69, 0.35, 7.44, -0.04, 0.67, 9.1, 35.18]} \ No newline at end of file diff --git a/annotations_1/v757jrOBkng_filtered.json b/annotations_1/v757jrOBkng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b59056a3b740953d0e9fe037b67fa925dd76dff --- /dev/null +++ b/annotations_1/v757jrOBkng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.54], [5.0, 5.21], [7.0, 8.34], [11.0, 11.64], [14.0, 14.91], [18.0, 17.91], [22.0, 22.67], [24.0, 24.73], [28.0, 28.93], [31.0, 30.91], [41.0, 42.6], [44.0, 44.51], [45.0, 45.81], [51.0, 51.41], [56.0, 58.23], [60.0, 60.52], [61.0, 61.64], [65.0, 67.07], [68.0, 70.16], [71.0, 73.67], [78.0, 78.54], [82.0, 84.0], [85.0, 96.85], [98.0, 99.59], [100.0, 102.25], [103.0, 105.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 99.78, 99.56, 0.0, 100.0, 97.54, 0.0, 97.54, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.54, 0.21, 1.34, 0.64, 0.91, -0.09, 0.67, 0.73, 0.93, -0.09, 1.6, 0.51, 0.81, 0.41, 2.23, 0.52, 0.64, 2.07, 2.16, 2.67, 0.54, 2.0, 11.85, 1.59, 2.25, 2.24]} \ No newline at end of file diff --git a/annotations_1/v7QfNBfZT3w_filtered.json b/annotations_1/v7QfNBfZT3w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08c9965c77f0ccb45512bbf5131f9a7b4cc85d1c --- /dev/null +++ b/annotations_1/v7QfNBfZT3w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.79], [8.0, 9.63], [12.0, 14.23], [16.0, 22.25], [23.0, 24.68], [32.0, 33.12], [33.0, 36.98], [43.0, 44.93], [51.0, 55.75], [57.0, 56.61], [58.0, 59.66], [63.0, 63.34], [65.0, 66.7], [67.0, 68.59], [70.0, 71.66], [73.0, 73.63], [76.0, 76.71], [82.0, 83.0], [83.0, 84.01], [85.0, 93.46], [95.0, 96.53], [98.0, 99.91], [106.0, 108.23], [114.0, 115.6], [117.0, 117.14], [119.0, 119.4], [121.0, 122.12], [122.0, 122.79], [124.0, 125.31], [129.0, 129.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 71.0, 45.33, 0.0, 0.0, 45.95, 0.0, 96.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 44.94], ["sidetone", 34.97], ["music", 4.37]], null, null, [["speech", 87.04], ["sidetone", 4.5], ["inside, small room", 0.88]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.79, 1.63, 2.23, 6.25, 1.68, 1.12, 3.98, 1.93, 4.75, -0.39, 1.66, 0.34, 1.7, 1.59, 1.66, 0.63, 0.71, 1.0, 1.01, 8.46, 1.53, 1.91, 2.23, 1.6, 0.14, 0.4, 1.12, 0.79, 1.31, 0.41]} \ No newline at end of file diff --git a/annotations_1/v8CflcvxDJo_filtered.json b/annotations_1/v8CflcvxDJo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d14d110542819689e04bea035e8de354cb45e1d --- /dev/null +++ b/annotations_1/v8CflcvxDJo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 59.98], [61.0, 69.15], [70.0, 73.33], [78.0, 77.85], [80.0, 80.13], [84.0, 83.69], [85.0, 89.61], [94.0, 105.24], [106.0, 107.28], [109.0, 151.95]], "keep_status": [false, true, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 30.54, 30.03, 0.0, 0.0, 0.0, 30.58, 31.69, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 28.4], ["animal", 9.4], ["hum", 3.95]], [["livestock, farm animals, working animals", 20.57], ["moo", 19.82], ["cattle, bovinae", 15.91]], null, null, null, [["music", 61.08], ["throbbing", 9.42], ["electronic music", 4.53]], [["music", 49.63], ["hum", 10.14], ["throbbing", 10.03]], null, null], "duration": [46.98, 8.15, 3.33, -0.15, 0.13, -0.31, 4.61, 11.24, 1.28, 42.95]} \ No newline at end of file diff --git a/annotations_1/v8UDjwdqzKY_filtered.json b/annotations_1/v8UDjwdqzKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33f7d3fcdc51ddc3a1b99112aef728c10b590bba --- /dev/null +++ b/annotations_1/v8UDjwdqzKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.87], [7.0, 6.64], [7.0, 7.87], [9.0, 9.48], [13.0, 13.1], [22.0, 21.74], [29.0, 29.0], [30.0, 30.5], [32.0, 31.73], [33.0, 33.49], [38.0, 38.1], [46.0, 47.51], [49.0, 49.67], [51.0, 52.24], [54.0, 53.82], [55.0, 57.06], [59.0, 61.65], [63.0, 63.71], [64.0, 64.89], [65.0, 65.85], [67.0, 68.22], [69.0, 69.77], [71.0, 70.85], [72.0, 72.74], [74.0, 74.56], [86.0, 85.97], [88.0, 88.62], [91.0, 90.91], [92.0, 92.15], [98.0, 98.22], [101.0, 100.79], [102.0, 102.98], [105.0, 105.66], [115.0, 117.04], [118.0, 117.98], [119.0, 119.74], [120.0, 124.21], [127.0, 129.2], [131.0, 132.65], [134.0, 134.2], [135.0, 136.09], [137.0, 137.44], [138.0, 139.19], [140.0, 140.39], [141.0, 141.45], [142.0, 143.72], [144.0, 144.83], [146.0, 147.26], [148.0, 148.63], [150.0, 151.36], [152.0, 153.45], [154.0, 155.34], [157.0, 157.84], [160.0, 161.23], [162.0, 162.23], [165.0, 165.37], [166.0, 166.08], [167.0, 167.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.87, -0.36, 0.87, 0.48, 0.1, -0.26, 0.0, 0.5, -0.27, 0.49, 0.1, 1.51, 0.67, 1.24, -0.18, 2.06, 2.65, 0.71, 0.89, 0.85, 1.22, 0.77, -0.15, 0.74, 0.56, -0.03, 0.62, -0.09, 0.15, 0.22, -0.21, 0.98, 0.66, 2.04, -0.02, 0.74, 4.21, 2.2, 1.65, 0.2, 1.09, 0.44, 1.19, 0.39, 0.45, 1.72, 0.83, 1.26, 0.63, 1.36, 1.45, 1.34, 0.84, 1.23, 0.23, 0.37, 0.08, 0.7]} \ No newline at end of file diff --git a/annotations_1/v8kB6cqv8qM_filtered.json b/annotations_1/v8kB6cqv8qM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cfb11381f3badc50490197d381fde2ee0cf681d --- /dev/null +++ b/annotations_1/v8kB6cqv8qM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.96], [15.0, 15.16], [22.0, 24.29], [27.0, 29.46], [32.0, 32.43], [37.0, 36.98], [42.0, 51.6], [53.0, 73.82], [82.0, 83.1], [84.0, 89.33], [97.0, 97.36], [104.0, 118.69], [121.0, 121.44]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, true, false], "silence_prob": [0.0, 0.0, 82.79, 31.82, 0.0, 0.0, 29.89, 29.8, 0.0, 29.97, 0.0, 29.17, 0.0], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 16.07], ["music", 12.84], ["insect", 7.78]], null, null, [["speech", 61.56], ["electric shaver, electric razor", 15.77], ["music", 5.77]], [["music", 25.11], ["mains hum", 16.52], ["hum", 16.09]], null, [["throbbing", 28.66], ["music", 26.08], ["hum", 23.75]], null, [["hum", 23.21], ["speech", 22.39], ["music", 15.66]], null], "duration": [0.96, 0.16, 2.29, 2.46, 0.43, -0.02, 9.6, 20.82, 1.1, 5.33, 0.36, 14.69, 0.44]} \ No newline at end of file diff --git a/annotations_1/v9Cq9nThaNs_filtered.json b/annotations_1/v9Cq9nThaNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb489d1a7cf1e6be6c3466eb90cb221a727845d1 --- /dev/null +++ b/annotations_1/v9Cq9nThaNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.72], [1.0, 12.21], [12.0, 12.28], [17.0, 24.88], [30.0, 29.81], [31.0, 40.74], [43.0, 43.87], [55.0, 63.54], [66.0, 66.82], [70.0, 71.88], [74.0, 75.09], [76.0, 76.45], [79.0, 83.39], [85.0, 100.45], [112.0, 131.36], [136.0, 148.69], [153.0, 178.12]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 28.89, 0.0, 28.29, 0.0, 28.95, 0.0, 28.96, 0.0, 0.0, 0.0, 0.0, 29.44, 29.4, 29.07, 29.01, 28.85], "audiomae_on_audioset": [null, [["speech", 51.24], ["music", 21.72], ["vehicle", 5.8]], null, [["vehicle", 34.74], ["music", 18.36], ["car", 18.32]], null, [["music", 47.78], ["speech", 14.1], ["hum", 12.5]], null, [["music", 65.09], ["throbbing", 17.14], ["hum", 7.18]], null, null, null, null, [["music", 81.71], ["throbbing", 4.16], ["electronic music", 3.46]], [["music", 27.94], ["vehicle", 26.41], ["car", 12.19]], [["music", 65.13], ["throbbing", 11.17], ["hum", 7.84]], [["music", 62.36], ["throbbing", 13.21], ["hum", 8.34]], [["music", 48.27], ["throbbing", 21.01], ["hum", 16.25]]], "duration": [-0.28, 11.21, 0.28, 7.88, -0.19, 9.74, 0.87, 8.54, 0.82, 1.88, 1.09, 0.45, 4.39, 15.45, 19.36, 12.69, 25.12]} \ No newline at end of file diff --git a/annotations_1/v9UIDDlnSgA_filtered.json b/annotations_1/v9UIDDlnSgA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6d0fb84bbddab782eb9cf62b70978bb700dd1432 --- /dev/null +++ b/annotations_1/v9UIDDlnSgA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.01], [18.0, 18.39], [18.0, 29.25], [30.0, 40.29], [45.0, 73.36], [74.0, 107.38]], "keep_status": [false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 29.35, 28.86, 29.12, 0.0], "audiomae_on_audioset": [null, null, [["music", 55.36], ["theremin", 10.22], ["whale vocalization", 5.14]], [["speech", 59.31], ["explosion", 5.54], ["hubbub, speech noise, speech babble", 3.71]], [["music", 47.24], ["speech", 15.06], ["vehicle", 5.97]], null], "duration": [1.01, 0.39, 11.25, 10.29, 28.36, 33.38]} \ No newline at end of file diff --git a/annotations_1/v9pZdy4lZ7U_filtered.json b/annotations_1/v9pZdy4lZ7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb01741eabfbcfbd8536cf51a4d060c607c9b0ab --- /dev/null +++ b/annotations_1/v9pZdy4lZ7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.41], [8.0, 10.94], [12.0, 13.9], [16.0, 20.75], [23.0, 24.53], [26.0, 27.65], [32.0, 44.31], [45.0, 45.74], [46.0, 45.81], [46.0, 46.94], [47.0, 46.99], [47.0, 54.43], [58.0, 78.21], [81.0, 84.97], [85.0, 91.64], [97.0, 132.17], [132.0, 132.68], [133.0, 149.98], [150.0, 150.01]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.84, 0.0, 31.67, 0.0, 0.0, 29.46, 0.0, 0.0, 0.0, 0.0, 29.86, 29.72, 29.42, 29.28, 0.0, 0.0, 30.7, 0.0], "audiomae_on_audioset": [null, [["music", 34.91], ["throbbing", 7.14], ["speech", 5.11]], null, [["fly, housefly", 46.28], ["mosquito", 25.69], ["insect", 6.8]], null, null, [["music", 22.32], ["buzz", 6.24], ["rumble", 5.89]], null, null, null, null, [["sound effect", 34.22], ["grunt", 17.69], ["speech", 16.26]], [["hum", 29.74], ["speech", 25.19], ["throbbing", 16.38]], [["hum", 37.56], ["mains hum", 30.12], ["rumble", 6.93]], [["whale vocalization", 48.34], ["hum", 13.01], ["music", 8.66]], null, null, [["music", 34.04], ["hum", 19.38], ["theremin", 19.05]], null], "duration": [0.41, 2.94, 1.9, 4.75, 1.53, 1.65, 12.31, 0.74, -0.19, 0.94, -0.01, 7.43, 20.21, 3.97, 6.64, 35.17, 0.68, 16.98, 0.01]} \ No newline at end of file diff --git a/annotations_1/vA1fVHBWuBU_filtered.json b/annotations_1/vA1fVHBWuBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..594e6bf3278ae44df451298d83adcc84a1d7f7f4 --- /dev/null +++ b/annotations_1/vA1fVHBWuBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.72], [14.0, 14.57], [19.0, 18.76], [45.0, 45.2], [58.0, 58.21], [66.0, 67.0], [69.0, 69.8], [72.0, 75.91], [78.0, 78.09], [80.0, 80.49], [84.0, 84.3], [86.0, 86.7], [88.0, 89.9], [92.0, 96.15], [99.0, 100.58], [105.0, 106.89], [111.0, 111.96], [113.0, 114.52], [116.0, 117.75], [121.0, 123.45], [126.0, 128.24], [132.0, 134.76], [136.0, 138.52], [139.0, 140.16], [145.0, 146.06], [150.0, 151.24]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0, 0.0, 0.0, 0.0, 0.0, 68.8, 99.98, 99.4, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 0.57, -0.24, 0.2, 0.21, 1.0, 0.8, 3.91, 0.09, 0.49, 0.3, 0.7, 1.9, 4.15, 1.58, 1.89, 0.96, 1.52, 1.75, 2.45, 2.24, 2.76, 2.52, 1.16, 1.06, 1.24]} \ No newline at end of file diff --git a/annotations_1/vAYzTJIog1U_filtered.json b/annotations_1/vAYzTJIog1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fd914d012df6c0f456e500ed83013240b9a811f --- /dev/null +++ b/annotations_1/vAYzTJIog1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 25.37], [27.0, 27.9], [31.0, 33.64], [41.0, 41.82], [44.0, 44.49]], "keep_status": [true, false, true, false, false], "silence_prob": [40.84, 0.0, 30.29, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 27.3], ["speech", 14.48], ["music", 14.25]], null, [["sheep", 27.29], ["livestock, farm animals, working animals", 21.1], ["bleat", 13.89]], null, null], "duration": [15.37, 0.9, 2.64, 0.82, 0.49]} \ No newline at end of file diff --git a/annotations_1/vBAK4o8zHF4_filtered.json b/annotations_1/vBAK4o8zHF4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c7d42d98ac3eea5580835776d9c5ee64719e1d5 --- /dev/null +++ b/annotations_1/vBAK4o8zHF4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.15], [17.0, 17.49], [32.0, 33.2], [35.0, 36.71], [48.0, 48.59], [51.0, 52.42], [53.0, 53.65], [58.0, 64.56], [67.0, 72.13], [73.0, 74.28], [97.0, 103.69], [107.0, 108.78], [111.0, 119.45], [120.0, 125.46], [127.0, 127.7], [128.0, 132.43], [134.0, 136.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.51, 50.97, 0.0, 39.66, 0.0, 39.82, 35.59, 0.0, 35.09, 37.83], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 46.58], ["boing", 41.49], ["speech", 9.08]], null, [["music", 55.21], ["speech", 18.86], ["boing", 4.82]], [["music", 63.53], ["fly, housefly", 6.23], ["mosquito", 4.29]], null, [["speech", 40.18], ["music", 18.91], ["synthesizer", 2.85]], [["music", 23.06], ["throbbing", 14.66], ["hum", 8.53]]], "duration": [0.15, 0.49, 1.2, 1.71, 0.59, 1.42, 0.65, 6.56, 5.13, 1.28, 6.69, 1.78, 8.45, 5.46, 0.7, 4.43, 2.41]} \ No newline at end of file diff --git a/annotations_1/vBLcmGPbryg_filtered.json b/annotations_1/vBLcmGPbryg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4c7c583551412519d6c0a02e4f65f65478e0f2d7 --- /dev/null +++ b/annotations_1/vBLcmGPbryg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.2], [7.0, 7.37], [19.0, 20.98], [38.0, 40.85], [42.0, 43.82], [66.0, 66.53], [77.0, 84.5], [88.0, 88.72], [92.0, 91.79], [94.0, 94.56], [97.0, 100.67], [104.0, 107.1], [110.0, 117.42], [127.0, 132.38], [134.0, 167.97], [168.0, 168.64], [172.0, 172.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 52.22, 0.0, 0.0, 41.54, 0.0, 0.0, 0.0, 35.89, 29.42, 30.44, 29.53, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 63.69], ["electronic music", 5.48], ["trance music", 5.03]], null, null, null, [["music", 57.14], ["hum", 5.43], ["throbbing", 4.71]], [["music", 25.43], ["crowd", 20.67], ["cheering", 6.77]], [["music", 63.15], ["didgeridoo", 8.18], ["groan", 2.27]], [["music", 18.38], ["crowd", 9.88], ["groan", 7.2]], null, null, null], "duration": [0.2, 0.37, 1.98, 2.85, 1.82, 0.53, 7.5, 0.72, -0.21, 0.56, 3.67, 3.1, 7.42, 5.38, 33.97, 0.64, 0.2]} \ No newline at end of file diff --git a/annotations_1/vBtG9eqgf2Q_filtered.json b/annotations_1/vBtG9eqgf2Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6e360268b0a6a5b36bf41a243ab7eea2fc70615 --- /dev/null +++ b/annotations_1/vBtG9eqgf2Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 43.63], [47.0, 56.88], [59.0, 61.21], [62.0, 63.04], [65.0, 70.24], [72.0, 74.97], [77.0, 79.54], [90.0, 91.08], [96.0, 97.43], [103.0, 103.74], [104.0, 107.65], [108.0, 111.37], [112.0, 112.6], [113.0, 114.17], [115.0, 138.18], [144.0, 158.25], [161.0, 161.6], [163.0, 163.34], [164.0, 165.52], [167.0, 167.24], [168.0, 169.37], [170.0, 204.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [40.12, 57.32, 95.64, 0.0, 99.21, 99.98, 99.88, 0.0, 0.0, 0.0, 53.91, 45.65, 0.0, 0.0, 32.75, 31.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 91.19], ["throbbing", 1.75], ["electronic music", 0.54]], null, null, null, null, null, null, null, null, null, null, [["music", 68.54], ["synthesizer", 6.11], ["throbbing", 2.7]], null, null, [["music", 84.06], ["didgeridoo", 3.52], ["electronic music", 1.22]], [["music", 72.59], ["synthesizer", 5.75], ["speech", 4.84]], null, null, null, null, null, null], "duration": [29.63, 9.88, 2.21, 1.04, 5.24, 2.97, 2.54, 1.08, 1.43, 0.74, 3.65, 3.37, 0.6, 1.17, 23.18, 14.25, 0.6, 0.34, 1.52, 0.24, 1.37, 34.75]} \ No newline at end of file diff --git a/annotations_1/vD6FkjOtIIs_filtered.json b/annotations_1/vD6FkjOtIIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2ad4ab3b7e4b3b46190283420de0f131769e68e --- /dev/null +++ b/annotations_1/vD6FkjOtIIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [5.0, 5.46], [6.0, 9.9], [11.0, 11.8], [13.0, 14.55], [16.0, 16.28], [17.0, 17.46], [21.0, 21.41], [29.0, 29.98], [34.0, 34.37], [38.0, 39.36], [41.0, 41.67], [43.0, 49.11], [52.0, 61.26], [62.0, 62.83], [65.0, 67.47], [69.0, 69.25], [71.0, 71.61], [72.0, 77.19], [79.0, 80.79], [83.0, 104.3], [106.0, 106.78], [108.0, 108.7], [111.0, 115.1], [116.0, 116.6], [119.0, 120.09], [121.0, 121.37], [122.0, 128.65], [131.0, 131.28], [134.0, 135.11], [136.0, 138.77], [139.0, 140.8]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 34.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.5, 32.94, 0.0, 34.96, 0.0, 0.0, 31.92, 0.0, 31.84, 0.0, 0.0, 93.91, 0.0, 0.0, 0.0, 31.01, 0.0, 0.0, 31.45, 0.0], "audiomae_on_audioset": [null, null, [["civil defense siren", 62.92], ["siren", 20.1], ["whale vocalization", 10.17]], null, null, null, null, null, null, null, null, null, [["music", 48.93], ["speech", 18.21], ["breaking", 13.29]], [["music", 34.53], ["speech", 19.09], ["fly, housefly", 11.99]], null, [["music", 27.92], ["speech", 18.23], ["didgeridoo", 15.6]], null, null, [["fly, housefly", 66.8], ["mosquito", 13.1], ["insect", 6.5]], null, [["music", 46.03], ["speech", 32.28], ["didgeridoo", 2.52]], null, null, null, null, null, null, [["music", 68.77], ["hum", 3.56], ["christmas music", 2.78]], null, null, [["music", 40.77], ["fly, housefly", 5.95], ["mosquito", 5.59]], null], "duration": [0.34, 0.46, 3.9, 0.8, 1.55, 0.28, 0.46, 0.41, 0.98, 0.37, 1.36, 0.67, 6.11, 9.26, 0.83, 2.47, 0.25, 0.61, 5.19, 1.79, 21.3, 0.78, 0.7, 4.1, 0.6, 1.09, 0.37, 6.65, 0.28, 1.11, 2.77, 1.8]} \ No newline at end of file diff --git a/annotations_1/vDzbcWty6m0_filtered.json b/annotations_1/vDzbcWty6m0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93097e411e5b7fac331ed1905e1efde5aed92e46 --- /dev/null +++ b/annotations_1/vDzbcWty6m0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 21.34], [24.0, 24.51], [34.0, 34.69], [36.0, 38.97], [42.0, 44.81], [46.0, 47.55], [50.0, 50.95], [60.0, 61.42], [67.0, 74.04], [81.0, 81.21], [85.0, 86.39], [87.0, 89.16], [94.0, 94.66], [98.0, 98.74], [100.0, 104.45], [105.0, 105.43], [106.0, 106.35], [107.0, 108.26], [109.0, 109.63], [112.0, 111.97], [113.0, 116.36], [119.0, 120.99], [122.0, 125.56]], "keep_status": [true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.61, 0.0, 0.0, 29.53, 66.63, 0.0, 0.0, 0.0, 30.61, 0.0, 0.0, 50.16, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 32.13, 0.0, 86.82], "audiomae_on_audioset": [[["music", 50.7], ["thunk", 11.2], ["effects unit", 4.77]], null, null, [["whack, thwack", 31.23], ["thump, thud", 19.15], ["speech", 5.09]], null, null, null, null, [["speech", 61.68], ["animal", 2.89], ["fart", 2.76]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 41.48], ["music", 23.02], ["beatboxing", 13.79]], null, null], "duration": [5.34, 0.51, 0.69, 2.97, 2.81, 1.55, 0.95, 1.42, 7.04, 0.21, 1.39, 2.16, 0.66, 0.74, 4.45, 0.43, 0.35, 1.26, 0.63, -0.03, 3.36, 1.99, 3.56]} \ No newline at end of file diff --git a/annotations_1/vEWPq-4sa3w_filtered.json b/annotations_1/vEWPq-4sa3w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52c2607dd87e883b6160836d9e83c6c8d28d8178 --- /dev/null +++ b/annotations_1/vEWPq-4sa3w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[70.0, 90.71]], "keep_status": [false], "silence_prob": [28.22], "audiomae_on_audioset": [[["music", 64.65], ["speech", 3.85], ["vehicle", 2.57]]], "duration": [20.71]} \ No newline at end of file diff --git a/annotations_1/vEj9ZwIzk44_filtered.json b/annotations_1/vEj9ZwIzk44_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60ec9e39c56e00f4f9380afb3fea877c06ce020d --- /dev/null +++ b/annotations_1/vEj9ZwIzk44_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.09], [10.0, 11.99], [14.0, 16.5], [17.0, 20.76], [22.0, 34.86], [40.0, 40.24], [40.0, 42.67], [46.0, 46.3], [47.0, 52.62], [55.0, 57.08], [59.0, 62.09], [63.0, 68.03], [69.0, 70.7], [72.0, 73.08], [74.0, 77.45], [78.0, 78.88], [80.0, 88.45], [90.0, 90.61], [93.0, 94.39], [95.0, 97.02], [97.0, 97.06], [97.0, 97.12], [98.0, 98.44], [98.0, 98.58], [99.0, 98.68], [103.0, 115.42], [126.0, 129.41], [131.0, 131.16], [132.0, 134.03], [134.0, 134.82], [137.0, 138.37], [140.0, 140.39], [143.0, 143.36], [144.0, 145.4], [147.0, 153.87], [155.0, 156.09], [158.0, 163.46], [165.0, 166.13], [167.0, 169.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.43, 0.0, 99.96, 99.76, 99.82, 0.0, 99.91, 0.0, 89.72, 99.68, 88.1, 99.76, 0.0, 0.0, 98.01, 0.0, 89.54, 0.0, 0.0, 73.06, 0.0, 0.0, 0.0, 0.0, 0.0, 52.05, 71.57, 0.0, 87.92, 0.0, 0.0, 0.0, 0.0, 0.0, 95.37, 0.0, 87.74, 0.0, 94.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.09, 1.99, 2.5, 3.76, 12.86, 0.24, 2.67, 0.3, 5.62, 2.08, 3.09, 5.03, 1.7, 1.08, 3.45, 0.88, 8.45, 0.61, 1.39, 2.02, 0.06, 0.12, 0.44, 0.58, -0.32, 12.42, 3.41, 0.16, 2.03, 0.82, 1.37, 0.39, 0.36, 1.4, 6.87, 1.09, 5.46, 1.13, 2.72]} \ No newline at end of file diff --git a/annotations_1/vF-tPvPAqhQ_filtered.json b/annotations_1/vF-tPvPAqhQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f6d32521bfc5ff803b5fedccf9e759fbe5d730d --- /dev/null +++ b/annotations_1/vF-tPvPAqhQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.52], [4.0, 5.21], [6.0, 6.54], [8.0, 10.1], [13.0, 31.21], [41.0, 41.23], [44.0, 45.77], [59.0, 62.58], [64.0, 65.67], [67.0, 68.49], [69.0, 69.16], [71.0, 72.55], [74.0, 74.29], [75.0, 79.49], [81.0, 81.3], [84.0, 84.32], [87.0, 88.42], [90.0, 90.88], [93.0, 94.74], [95.0, 94.9], [98.0, 98.47], [104.0, 107.03], [110.0, 111.25], [113.0, 130.82], [133.0, 137.39]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 63.85, 30.73, 0.0, 0.0, 41.58, 0.0, 0.0, 0.0, 0.0, 0.0, 44.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.24, 0.0, 28.82, 36.28], "audiomae_on_audioset": [null, null, null, null, [["speech", 51.87], ["buzz", 13.01], ["music", 10.67]], null, null, [["music", 46.24], ["hands", 10.86], ["synthesizer", 4.4]], null, null, null, null, null, [["mains hum", 28.17], ["hum", 26.97], ["speech", 12.77]], null, null, null, null, null, null, null, [["music", 24.91], ["speech", 24.89], ["hum", 19.9]], null, [["music", 55.9], ["throbbing", 14.95], ["hum", 9.59]], [["music", 62.18], ["synthesizer", 7.8], ["electronic music", 3.53]]], "duration": [1.52, 1.21, 0.54, 2.1, 18.21, 0.23, 1.77, 3.58, 1.67, 1.49, 0.16, 1.55, 0.29, 4.49, 0.3, 0.32, 1.42, 0.88, 1.74, -0.1, 0.47, 3.03, 1.25, 17.82, 4.39]} \ No newline at end of file diff --git a/annotations_1/vFD6BbYg0-0_filtered.json b/annotations_1/vFD6BbYg0-0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbff36cc864af272c8745bf53ad10fa03d0ccf43 --- /dev/null +++ b/annotations_1/vFD6BbYg0-0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.98], [15.0, 17.24], [19.0, 25.39], [26.0, 32.44], [34.0, 41.15], [43.0, 45.47], [47.0, 90.24], [92.0, 127.38]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [49.04, 64.97, 54.56, 52.86, 64.97, 59.33, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 55.08], ["music", 10.16], ["hum", 5.49]], null, null, null, null, null, null, null], "duration": [8.98, 2.24, 6.39, 6.44, 7.15, 2.47, 43.24, 35.38]} \ No newline at end of file diff --git a/annotations_1/vFPRSImZev4_filtered.json b/annotations_1/vFPRSImZev4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..654f6486f0bf61530c7bdcf3d94f5598943b82b6 --- /dev/null +++ b/annotations_1/vFPRSImZev4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.62], [7.0, 8.58], [9.0, 22.77], [24.0, 55.02], [56.0, 59.7], [61.0, 63.02], [63.0, 63.76], [64.0, 75.84], [79.0, 110.13], [111.0, 111.18], [113.0, 114.78], [116.0, 119.1], [120.0, 122.37], [125.0, 128.73], [129.0, 132.88], [136.0, 137.61], [140.0, 143.51], [144.0, 149.15], [150.0, 154.31], [156.0, 156.46], [157.0, 157.17], [157.0, 162.7], [164.0, 165.47], [166.0, 169.67]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.38, 0.0, 58.55, 0.0, 99.99, 82.07, 0.0, 99.36, 0.0, 0.0, 0.0, 99.62, 87.37, 99.99, 97.92, 0.0, 99.95, 99.1, 99.84, 0.0, 0.0, 44.09, 0.0, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 81.34], ["inside, small room", 2.86], ["thunk", 2.34]], null, null], "duration": [2.62, 1.58, 13.77, 31.02, 3.7, 2.02, 0.76, 11.84, 31.13, 0.18, 1.78, 3.1, 2.37, 3.73, 3.88, 1.61, 3.51, 5.15, 4.31, 0.46, 0.17, 5.7, 1.47, 3.67]} \ No newline at end of file diff --git a/annotations_1/vITX2N0hpYE_filtered.json b/annotations_1/vITX2N0hpYE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3cf8da6eaeaf6e7c18556a873778c0f22ce2aac3 --- /dev/null +++ b/annotations_1/vITX2N0hpYE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 23.87], [31.0, 32.97], [34.0, 35.45], [42.0, 42.38], [44.0, 44.71], [47.0, 47.98], [49.0, 50.73], [51.0, 51.71], [54.0, 54.73], [55.0, 55.68], [57.0, 73.01], [75.0, 75.78], [77.0, 78.33], [79.0, 80.23], [81.0, 86.61], [89.0, 91.71], [94.0, 143.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [45.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.65, 0.0, 0.0, 0.0, 40.95, 61.87, 0.0], "audiomae_on_audioset": [[["sidetone", 80.06], ["radio", 4.66], ["hum", 2.81]], null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 22.39], ["moo", 17.54], ["livestock, farm animals, working animals", 12.72]], null, null, null, [["speech", 56.34], ["sidetone", 22.23], ["busy signal", 7.03]], null, null], "duration": [5.87, 1.97, 1.45, 0.38, 0.71, 0.98, 1.73, 0.71, 0.73, 0.68, 16.01, 0.78, 1.33, 1.23, 5.61, 2.71, 49.97]} \ No newline at end of file diff --git a/annotations_1/vI_kMlvUWDw_filtered.json b/annotations_1/vI_kMlvUWDw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edcebd127eed3ec4ce1ac3d04a7abab69a61ae59 --- /dev/null +++ b/annotations_1/vI_kMlvUWDw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.94], [4.0, 5.29], [11.0, 11.62], [23.0, 23.82], [33.0, 35.28], [39.0, 38.79], [40.0, 40.53], [56.0, 56.42], [60.0, 61.84], [64.0, 67.95], [75.0, 75.03], [77.0, 77.36], [86.0, 86.83], [87.0, 99.06], [99.0, 99.66], [102.0, 102.59], [106.0, 106.57], [108.0, 112.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 49.54, 0.0, 0.0, 0.0, 0.0, 32.43, 0.0, 0.0, 0.0, 33.71, 0.0, 0.0, 0.0, 49.54], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 81.68], ["speech", 8.84], ["hum", 1.74]], null, null, null, null, [["speech", 50.68], ["music", 21.47], ["hum", 4.94]], null, null, null, [["speech", 33.73], ["music", 26.91], ["throbbing", 11.59]], null, null, null, [["music", 42.74], ["hum", 11.37], ["didgeridoo", 11.19]]], "duration": [0.94, 1.29, 0.62, 0.82, 2.28, -0.21, 0.53, 0.42, 1.84, 3.95, 0.03, 0.36, 0.83, 12.06, 0.66, 0.59, 0.57, 4.51]} \ No newline at end of file diff --git a/annotations_1/vId4AoKDg2s_filtered.json b/annotations_1/vId4AoKDg2s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe0181fde87643958033d73521735cb6058c24e1 --- /dev/null +++ b/annotations_1/vId4AoKDg2s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [6.0, 8.16], [10.0, 10.93], [16.0, 36.24], [50.0, 51.38], [60.0, 69.65], [71.0, 72.79], [74.0, 76.52], [78.0, 78.41], [80.0, 81.06], [83.0, 83.61], [87.0, 87.52], [88.0, 88.89], [92.0, 92.99], [95.0, 95.2], [97.0, 96.87], [99.0, 99.27], [101.0, 101.09], [103.0, 103.77], [107.0, 108.31], [111.0, 111.0], [112.0, 112.26], [112.0, 114.4], [117.0, 116.87]], "keep_status": [false, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.06, 0.0, 33.48, 0.0, 33.6, 0.0, 42.42, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.08, 0.0], "audiomae_on_audioset": [null, [["music", 51.87], ["didgeridoo", 9.14], ["musical instrument", 4.94]], null, [["music", 44.57], ["speech", 11.38], ["bleat", 5.29]], null, [["music", 67.98], ["crying, sobbing", 1.96], ["musical instrument", 1.95]], null, [["music", 37.77], ["speech", 7.1], ["electronic music", 5.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 2.16, 0.93, 20.24, 1.38, 9.65, 1.79, 2.52, 0.41, 1.06, 0.61, 0.52, 0.89, 0.99, 0.2, -0.13, 0.27, 0.09, 0.77, 1.31, 0.0, 0.26, 2.4, -0.13]} \ No newline at end of file diff --git a/annotations_1/vJ6XJtlqqZo_filtered.json b/annotations_1/vJ6XJtlqqZo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..73dcd87ebf3c450139c73f034c4adcf9f4c78676 --- /dev/null +++ b/annotations_1/vJ6XJtlqqZo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.76], [7.0, 8.02], [10.0, 11.8], [12.0, 14.07], [14.0, 15.5], [19.0, 19.08], [19.0, 21.61], [22.0, 25.59], [30.0, 29.83], [32.0, 32.02], [33.0, 34.08], [36.0, 36.96], [40.0, 41.99], [43.0, 43.01], [45.0, 47.8], [49.0, 49.62], [50.0, 51.97], [56.0, 57.05], [58.0, 59.98], [61.0, 62.72], [67.0, 68.91], [70.0, 70.46], [73.0, 75.2], [77.0, 81.04], [83.0, 85.41], [86.0, 87.25], [88.0, 89.24], [92.0, 93.46], [96.0, 96.52], [97.0, 97.04], [97.0, 98.37], [105.0, 107.1], [108.0, 110.0], [112.0, 113.53], [115.0, 116.95], [119.0, 125.32], [132.0, 143.19], [145.0, 145.32], [146.0, 147.46], [149.0, 153.39], [154.0, 157.91], [167.0, 167.86], [169.0, 173.91], [174.0, 177.35], [178.0, 178.5], [179.0, 178.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 60.79, 0.0, 0.0, 95.78, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 100.0, 91.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 93.13, 0.0, 0.0, 99.68, 99.88, 0.0, 0.0, 100.0, 99.16, 0.0, 37.74, 40.14, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 45.08], ["speech", 24.21], ["sneeze", 3.47]], [["music", 53.24], ["speech", 25.97], ["musical instrument", 6.39]], null, null], "duration": [0.76, 1.02, 1.8, 2.07, 1.5, 0.08, 2.61, 3.59, -0.17, 0.02, 1.08, 0.96, 1.99, 0.01, 2.8, 0.62, 1.97, 1.05, 1.98, 1.72, 1.91, 0.46, 2.2, 4.04, 2.41, 1.25, 1.24, 1.46, 0.52, 0.04, 1.37, 2.1, 2.0, 1.53, 1.95, 6.32, 11.19, 0.32, 1.46, 4.39, 3.91, 0.86, 4.91, 3.35, 0.5, -0.23]} \ No newline at end of file diff --git a/annotations_1/vJZe9sHz10M_filtered.json b/annotations_1/vJZe9sHz10M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c49ff1533fb3f3878874c7964ec84165a06da34e --- /dev/null +++ b/annotations_1/vJZe9sHz10M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.61], [23.0, 23.48], [70.0, 70.78], [81.0, 84.38]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 35.23], "audiomae_on_audioset": [null, null, null, [["speech", 54.73], ["horse", 16.01], ["clip-clop", 11.56]]], "duration": [0.61, 0.48, 0.78, 3.38]} \ No newline at end of file diff --git a/annotations_1/vJhO79OGi20_filtered.json b/annotations_1/vJhO79OGi20_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65f38b105a0db8cdb540b31a6803028a366c8d11 --- /dev/null +++ b/annotations_1/vJhO79OGi20_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.33], [16.0, 18.05], [19.0, 22.99], [27.0, 32.41], [34.0, 33.99], [34.0, 34.8], [37.0, 37.99], [42.0, 42.45], [43.0, 44.69], [45.0, 52.1], [54.0, 54.9], [56.0, 57.97], [59.0, 60.44], [61.0, 67.53], [68.0, 69.21], [76.0, 78.12], [79.0, 83.49], [97.0, 97.39], [105.0, 109.68], [115.0, 116.07], [117.0, 121.22], [128.0, 128.04], [128.0, 128.88], [130.0, 131.57], [132.0, 132.97], [138.0, 140.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, true, false, false, false, false, true], "silence_prob": [82.97, 82.25, 80.11, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 52.92, 0.0, 0.0, 0.0, 33.2, 0.0, 35.93, 39.85, 0.0, 29.8, 0.0, 35.25, 0.0, 0.0, 0.0, 0.0, 29.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 15.17], ["hum", 12.06], ["music", 9.85]], null, [["speech", 76.24], ["music", 8.01], ["gong", 3.42]], [["speech", 26.15], ["music", 11.49], ["hum", 9.41]], null, [["speech", 46.18], ["breaking", 35.59], ["music", 4.58]], null, [["music", 34.29], ["speech", 14.48], ["theremin", 12.62]], null, null, null, null, [["hum", 28.4], ["music", 17.73], ["mains hum", 16.28]]], "duration": [2.33, 2.05, 3.99, 5.41, -0.01, 0.8, 0.99, 0.45, 1.69, 7.1, 0.9, 1.97, 1.44, 6.53, 1.21, 2.12, 4.49, 0.39, 4.68, 1.07, 4.22, 0.04, 0.88, 1.57, 0.97, 2.39]} \ No newline at end of file diff --git a/annotations_1/vJi3kGaAQfo_filtered.json b/annotations_1/vJi3kGaAQfo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28ecff894e8a9a7248555cb600aa78126409221a --- /dev/null +++ b/annotations_1/vJi3kGaAQfo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.03], [13.0, 14.0], [15.0, 17.04], [18.0, 19.52], [21.0, 22.69], [24.0, 24.93], [26.0, 32.46], [33.0, 34.01], [36.0, 36.34], [38.0, 45.6], [46.0, 46.99], [47.0, 47.02], [47.0, 84.01], [87.0, 88.3], [90.0, 97.61], [99.0, 106.52], [109.0, 120.51], [126.0, 127.77], [132.0, 136.53], [137.0, 153.57], [158.0, 160.03], [161.0, 161.81], [162.0, 169.5], [173.0, 184.08]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, true, true, false, true, true, false, false, true, false], "silence_prob": [0.0, 0.0, 51.99, 0.0, 0.0, 0.0, 30.42, 0.0, 0.0, 30.36, 0.0, 0.0, 0.0, 0.0, 36.99, 30.81, 33.61, 0.0, 32.32, 31.96, 34.91, 0.0, 30.6, 48.65], "audiomae_on_audioset": [null, null, null, null, null, null, [["whack, thwack", 15.41], ["speech", 14.68], ["music", 10.43]], null, null, [["throbbing", 30.49], ["speech", 18.47], ["hum", 16.31]], null, null, null, null, [["throbbing", 42.08], ["music", 13.96], ["quack", 8.22]], [["animal", 15.8], ["dog", 14.1], ["music", 13.64]], [["beatboxing", 24.53], ["hum", 16.33], ["mains hum", 11.87]], null, [["livestock, farm animals, working animals", 15.74], ["moo", 14.28], ["speech", 11.37]], [["speech", 30.11], ["hum", 30.09], ["mains hum", 8.68]], [["music", 56.5], ["throbbing", 17.04], ["hum", 11.66]], null, [["music", 43.18], ["whack, thwack", 14.16], ["breaking", 6.0]], [["music", 47.38], ["hum", 15.2], ["sonar", 8.77]]], "duration": [1.03, 1.0, 2.04, 1.52, 1.69, 0.93, 6.46, 1.01, 0.34, 7.6, 0.99, 0.02, 37.01, 1.3, 7.61, 7.52, 11.51, 1.77, 4.53, 16.57, 2.03, 0.81, 7.5, 11.08]} \ No newline at end of file diff --git a/annotations_1/vKcEalTIwfQ_filtered.json b/annotations_1/vKcEalTIwfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d41b670417ed33f89ed6856537e0856d6d62836f --- /dev/null +++ b/annotations_1/vKcEalTIwfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [4.0, 4.38], [4.0, 5.12], [6.0, 6.52], [11.0, 13.64], [18.0, 28.07], [33.0, 32.93], [35.0, 42.96], [46.0, 46.68], [55.0, 56.2], [57.0, 63.31], [66.0, 67.02], [78.0, 79.46], [83.0, 82.97], [84.0, 85.09], [90.0, 90.91], [96.0, 96.47], [101.0, 100.89]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 30.72, 30.11, 0.0, 31.13, 0.0, 0.0, 31.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 35.87], ["hum", 12.3], ["music", 10.69]], [["speech", 47.4], ["hum", 16.56], ["music", 9.1]], null, [["music", 41.49], ["hum", 14.87], ["throbbing", 9.89]], null, null, [["sidetone", 42.31], ["speech", 17.52], ["mains hum", 14.15]], null, null, null, null, null, null, null], "duration": [0.33, 0.38, 1.12, 0.52, 2.64, 10.07, -0.07, 7.96, 0.68, 1.2, 6.31, 1.02, 1.46, -0.03, 1.09, 0.91, 0.47, -0.11]} \ No newline at end of file diff --git a/annotations_1/vKhAdR1G9io_filtered.json b/annotations_1/vKhAdR1G9io_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..44268bac926839ea24b0662c6c2aa1fb42bfd983 --- /dev/null +++ b/annotations_1/vKhAdR1G9io_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [3.0, 4.08], [5.0, 8.18], [12.0, 15.5], [17.0, 18.22], [19.0, 19.67], [20.0, 22.01], [23.0, 25.05], [26.0, 27.4], [35.0, 36.75], [39.0, 40.17], [41.0, 42.25], [43.0, 43.88], [49.0, 48.95], [49.0, 49.4], [53.0, 56.22], [59.0, 63.27], [66.0, 67.41], [72.0, 72.27], [75.0, 78.29], [80.0, 83.81], [85.0, 86.0], [89.0, 89.31], [90.0, 90.39], [91.0, 91.77], [93.0, 99.0], [100.0, 100.6], [102.0, 104.18], [109.0, 111.35], [114.0, 114.74], [119.0, 119.57], [127.0, 128.26]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 0.0, 96.66, 97.92, 0.0, 0.0, 49.54, 45.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.1, 75.72, 0.0, 0.0, 94.95, 97.11, 0.0, 0.0, 0.0, 0.0, 43.18, 0.0, 45.85, 46.64, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["sine wave", 37.95], ["chirp tone", 29.14], ["tuning fork", 9.83]], [["sidetone", 26.79], ["speech", 22.39], ["telephone", 10.27]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 31.03], ["hum", 12.34], ["mains hum", 5.09]], null, [["speech", 17.51], ["fly, housefly", 13.5], ["mosquito", 8.37]], [["mains hum", 12.89], ["hum", 12.62], ["throbbing", 12.11]], null, null, null], "duration": [0.24, 1.08, 3.18, 3.5, 1.22, 0.67, 2.01, 2.05, 1.4, 1.75, 1.17, 1.25, 0.88, -0.05, 0.4, 3.22, 4.27, 1.41, 0.27, 3.29, 3.81, 1.0, 0.31, 0.39, 0.77, 6.0, 0.6, 2.18, 2.35, 0.74, 0.57, 1.26]} \ No newline at end of file diff --git a/annotations_1/vLgTWXjMlWI_filtered.json b/annotations_1/vLgTWXjMlWI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a7a55d490f99089671f89fcb620506f6117d0418 --- /dev/null +++ b/annotations_1/vLgTWXjMlWI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.49], [39.0, 40.59], [42.0, 43.28], [49.0, 49.69], [50.0, 54.89], [56.0, 58.55], [60.0, 62.56], [64.0, 68.5], [71.0, 71.22], [72.0, 72.91], [76.0, 77.84], [88.0, 88.5], [89.0, 89.67], [90.0, 90.26], [91.0, 91.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.78, 99.96, 99.93, 98.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.49, 1.59, 1.28, 0.69, 4.89, 2.55, 2.56, 4.5, 0.22, 0.91, 1.84, 0.5, 0.67, 0.26, 0.77]} \ No newline at end of file diff --git a/annotations_1/vLt5ei598CY_filtered.json b/annotations_1/vLt5ei598CY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1a751fedd8269ce0fe114b9c472245fab9567ae --- /dev/null +++ b/annotations_1/vLt5ei598CY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 22.32], [23.0, 28.0], [29.0, 30.16], [33.0, 36.1], [37.0, 37.94], [39.0, 40.53], [41.0, 52.2], [53.0, 53.03], [57.0, 57.99], [59.0, 60.88], [61.0, 62.31], [66.0, 69.8], [70.0, 70.78], [74.0, 85.6], [89.0, 89.94], [93.0, 106.42], [107.0, 108.35], [109.0, 109.51], [111.0, 113.54], [114.0, 116.56], [118.0, 119.52], [125.0, 141.35], [141.0, 146.1], [147.0, 153.69], [155.0, 155.53], [156.0, 158.94], [159.0, 159.39], [160.0, 160.78], [161.0, 161.49]], "keep_status": [true, true, false, true, false, false, true, false, false, false, false, true, false, true, false, false, false, false, true, true, false, true, false, true, false, false, false, false, false], "silence_prob": [30.61, 31.24, 0.0, 49.73, 0.0, 0.0, 30.73, 0.0, 0.0, 0.0, 0.0, 31.13, 0.0, 34.51, 0.0, 31.53, 0.0, 0.0, 35.33, 34.08, 0.0, 30.15, 30.78, 29.72, 0.0, 30.62, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["electric shaver, electric razor", 14.07], ["music", 13.61], ["buzz", 5.18]], [["whale vocalization", 14.86], ["sheep", 13.66], ["civil defense siren", 11.77]], null, [["hum", 46.18], ["mains hum", 14.98], ["throbbing", 6.06]], null, null, [["vehicle", 22.98], ["boat, water vehicle", 7.27], ["aircraft", 4.93]], null, null, null, null, [["whack, thwack", 22.11], ["speech", 20.64], ["rumble", 7.53]], null, [["buzz", 36.11], ["hum", 13.22], ["speech", 10.77]], null, [["music", 65.78], ["theremin", 7.02], ["electronic music", 2.93]], null, null, [["mains hum", 16.84], ["whale vocalization", 14.24], ["hum", 10.56]], [["hum", 35.34], ["mains hum", 21.67], ["throbbing", 9.91]], null, [["speech", 26.81], ["music", 13.83], ["breaking", 8.42]], [["speech", 49.7], ["vehicle", 12.35], ["music", 8.85]], [["music", 42.06], ["speech", 18.75], ["buzz", 8.42]], null, [["cattle, bovinae", 32.4], ["livestock, farm animals, working animals", 24.83], ["moo", 13.6]], null, null, null], "duration": [18.32, 5.0, 1.16, 3.1, 0.94, 1.53, 11.2, 0.03, 0.99, 1.88, 1.31, 3.8, 0.78, 11.6, 0.94, 13.42, 1.35, 0.51, 2.54, 2.56, 1.52, 16.35, 5.1, 6.69, 0.53, 2.94, 0.39, 0.78, 0.49]} \ No newline at end of file diff --git a/annotations_1/vLw24Xr1zKo_filtered.json b/annotations_1/vLw24Xr1zKo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0d7a546874128d0735db2f5910f96635d61452eb --- /dev/null +++ b/annotations_1/vLw24Xr1zKo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.87], [14.0, 17.95], [23.0, 24.81], [26.0, 32.37], [37.0, 37.91], [43.0, 43.41], [46.0, 66.07], [71.0, 86.78], [88.0, 89.13], [119.0, 119.15], [119.0, 120.92], [122.0, 123.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 51.18, 0.0, 30.47, 0.0, 0.0, 30.05, 39.85, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 42.91], ["music", 35.93], ["explosion", 3.97]], null, null, [["speech", 71.6], ["music", 10.37], ["vehicle", 1.69]], [["speech", 46.83], ["music", 28.97], ["hum", 5.64]], null, null, null, null], "duration": [-0.13, 3.95, 1.81, 6.37, 0.91, 0.41, 20.07, 15.78, 1.13, 0.15, 1.92, 1.04]} \ No newline at end of file diff --git a/annotations_1/vM7QMLTm1so_filtered.json b/annotations_1/vM7QMLTm1so_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aae6356d745b18c6f9315b82ca3caac1a3660430 --- /dev/null +++ b/annotations_1/vM7QMLTm1so_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [8.0, 11.16], [12.0, 15.25], [22.0, 22.76], [23.0, 22.84], [29.0, 31.36], [34.0, 35.04], [37.0, 37.07], [39.0, 39.19], [45.0, 46.04], [48.0, 48.86], [50.0, 51.34], [55.0, 61.77], [64.0, 65.11], [85.0, 85.85], [94.0, 98.42], [99.0, 99.74], [100.0, 124.09], [125.0, 129.69], [131.0, 142.11], [162.0, 164.24], [166.0, 168.24], [173.0, 177.72], [178.0, 177.75], [178.0, 177.79], [178.0, 177.82], [179.0, 194.34], [207.0, 211.82]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, true, false, true, false, false, false, false, true], "silence_prob": [0.0, 29.36, 39.35, 0.0, 0.0, 52.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.61, 0.0, 0.0, 31.48, 0.0, 30.96, 36.44, 32.6, 32.2, 31.78, 30.1, 0.0, 0.0, 0.0, 30.39, 35.35], "audiomae_on_audioset": [null, [["vehicle", 14.28], ["music", 12.82], ["aircraft", 10.38]], [["speech", 35.72], ["music", 15.67], ["hum", 5.93]], null, null, null, null, null, null, null, null, null, [["music", 30.9], ["explosion", 24.39], ["burst, pop", 12.74]], null, null, [["cattle, bovinae", 50.41], ["moo", 39.11], ["livestock, farm animals, working animals", 8.77]], null, [["music", 44.98], ["throbbing", 10.56], ["smash, crash", 6.63]], [["music", 48.5], ["trombone", 15.65], ["brass instrument", 11.54]], [["music", 40.61], ["groan", 27.33], ["whack, thwack", 11.53]], [["speech", 36.72], ["fart", 12.97], ["grunt", 3.43]], [["hum", 29.73], ["music", 22.83], ["throbbing", 20.38]], [["speech", 31.19], ["music", 26.22], ["throbbing", 2.07]], null, null, null, [["speech", 37.23], ["music", 27.24], ["whack, thwack", 6.78]], [["music", 59.03], ["hum", 4.43], ["electronic music", 3.16]]], "duration": [0.51, 3.16, 3.25, 0.76, -0.16, 2.36, 1.04, 0.07, 0.19, 1.04, 0.86, 1.34, 6.77, 1.11, 0.85, 4.42, 0.74, 24.09, 4.69, 11.11, 2.24, 2.24, 4.72, -0.25, -0.21, -0.18, 15.34, 4.82]} \ No newline at end of file diff --git a/annotations_1/vNPCXKmF9LI_filtered.json b/annotations_1/vNPCXKmF9LI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da3b053ac83ceaf781b20d7140f7ef2d18094b6f --- /dev/null +++ b/annotations_1/vNPCXKmF9LI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.53], [3.0, 4.53], [6.0, 6.29], [14.0, 15.08], [16.0, 16.85], [20.0, 20.11], [27.0, 28.39], [37.0, 37.49], [38.0, 38.28], [45.0, 46.57], [47.0, 47.51], [49.0, 50.58], [51.0, 52.22], [55.0, 55.14], [57.0, 57.16], [59.0, 59.59], [60.0, 62.82], [69.0, 69.57], [71.0, 71.88], [75.0, 77.36], [78.0, 78.54], [88.0, 89.36], [91.0, 91.32], [95.0, 99.0], [103.0, 106.81], [114.0, 115.43], [119.0, 119.37], [120.0, 122.77], [123.0, 130.59], [134.0, 135.58], [138.0, 142.3], [144.0, 144.19], [146.0, 169.59], [171.0, 172.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 53.22, 31.14, 0.0, 0.0, 39.57, 32.43, 0.0, 70.58, 0.0, 35.95, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.49], ["music", 15.34], ["gunshot, gunfire", 6.84]], null, null, [["music", 20.28], ["hum", 16.32], ["mains hum", 11.43]], [["speech", 42.68], ["music", 30.01], ["whack, thwack", 3.5]], null, null, null, [["music", 63.97], ["grunt", 5.55], ["breaking", 5.38]], null], "duration": [0.53, 1.53, 0.29, 1.08, 0.85, 0.11, 1.39, 0.49, 0.28, 1.57, 0.51, 1.58, 1.22, 0.14, 0.16, 0.59, 2.82, 0.57, 0.88, 2.36, 0.54, 1.36, 0.32, 4.0, 3.81, 1.43, 0.37, 2.77, 7.59, 1.58, 4.3, 0.19, 23.59, 1.64]} \ No newline at end of file diff --git a/annotations_1/vOQ211AFtLU_filtered.json b/annotations_1/vOQ211AFtLU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ea773b90a6cd86292bd832bfe8d6627aa29b55d --- /dev/null +++ b/annotations_1/vOQ211AFtLU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.71], [25.0, 29.94], [31.0, 36.54], [38.0, 40.66], [41.0, 57.35], [58.0, 59.83], [61.0, 61.65], [65.0, 69.97], [71.0, 75.69], [77.0, 99.54], [101.0, 101.14], [103.0, 104.35], [106.0, 107.42], [109.0, 110.37], [112.0, 112.7], [115.0, 116.41], [117.0, 119.11]], "keep_status": [false, false, false, false, true, false, false, true, false, true, false, false, false, false, false, false, true], "silence_prob": [0.0, 82.79, 76.37, 89.19, 47.9, 0.0, 0.0, 37.32, 57.09, 32.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.06], "audiomae_on_audioset": [null, null, null, null, [["mains hum", 24.06], ["music", 21.51], ["hum", 20.1]], null, null, [["hum", 38.19], ["music", 19.84], ["mains hum", 8.03]], null, [["music", 15.61], ["explosion", 15.07], ["hum", 8.15]], null, null, null, null, null, null, [["music", 42.88], ["speech", 14.63], ["hum", 12.14]]], "duration": [1.71, 4.94, 5.54, 2.66, 16.35, 1.83, 0.65, 4.97, 4.69, 22.54, 0.14, 1.35, 1.42, 1.37, 0.7, 1.41, 2.11]} \ No newline at end of file diff --git a/annotations_1/vOfFVhSiwiA_filtered.json b/annotations_1/vOfFVhSiwiA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97a3a27da2d82fe3ca8bc5ce11bb287dac15eaee --- /dev/null +++ b/annotations_1/vOfFVhSiwiA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 24.07], [25.0, 26.28], [27.0, 33.61], [35.0, 35.87], [39.0, 43.16], [44.0, 44.86], [45.0, 50.04], [50.0, 63.0], [63.0, 80.3], [82.0, 121.63]], "keep_status": [true, false, true, false, true, false, true, false, false, false], "silence_prob": [37.14, 0.0, 40.36, 0.0, 37.55, 0.0, 34.53, 33.45, 28.6, 0.0], "audiomae_on_audioset": [[["music", 39.89], ["hum", 13.11], ["throbbing", 5.6]], null, [["music", 19.29], ["hum", 13.0], ["mains hum", 12.58]], null, [["music", 39.82], ["didgeridoo", 7.54], ["livestock, farm animals, working animals", 6.43]], null, [["hum", 21.68], ["music", 20.47], ["mains hum", 18.66]], [["music", 48.47], ["hum", 17.22], ["throbbing", 8.95]], [["hum", 36.52], ["music", 23.32], ["throbbing", 22.91]], null], "duration": [5.07, 1.28, 6.61, 0.87, 4.16, 0.86, 5.04, 13.0, 17.3, 39.63]} \ No newline at end of file diff --git a/annotations_1/vOoyaqLrZnE_filtered.json b/annotations_1/vOoyaqLrZnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba67ae5e584e01eafdfeb32c3b8c82990aa1939a --- /dev/null +++ b/annotations_1/vOoyaqLrZnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.27], [5.0, 10.79], [12.0, 19.18], [20.0, 21.17], [22.0, 25.02], [27.0, 30.64], [32.0, 32.43], [33.0, 38.4], [39.0, 45.99], [47.0, 47.88], [51.0, 55.49], [58.0, 59.12], [60.0, 61.64], [63.0, 65.45], [68.0, 70.04], [75.0, 75.09], [76.0, 76.52], [78.0, 78.87], [79.0, 79.91], [81.0, 98.49], [104.0, 105.81], [107.0, 108.41], [112.0, 112.62], [113.0, 113.48], [115.0, 115.26], [117.0, 117.53], [122.0, 122.64], [125.0, 125.0], [130.0, 130.44], [136.0, 136.71], [138.0, 140.21], [142.0, 143.63]], "keep_status": [true, true, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [31.87, 38.43, 50.66, 0.0, 50.76, 61.77, 0.0, 42.28, 34.7, 0.0, 54.1, 0.0, 0.0, 31.73, 33.74, 0.0, 0.0, 0.0, 0.0, 29.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0], "audiomae_on_audioset": [[["speech", 16.46], ["music", 12.65], ["throbbing", 9.63]], [["hum", 20.29], ["speech", 19.26], ["mains hum", 14.86]], null, null, null, null, null, [["speech", 29.15], ["didgeridoo", 24.59], ["music", 15.25]], [["thunk", 51.75], ["clang", 9.55], ["ding", 6.42]], null, null, null, null, [["speech", 54.75], ["dial tone", 29.51], ["busy signal", 3.41]], [["speech", 64.55], ["sine wave", 5.34], ["dial tone", 4.5]], null, null, null, null, [["music", 29.07], ["hum", 22.6], ["mains hum", 13.6]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.27, 5.79, 7.18, 1.17, 3.02, 3.64, 0.43, 5.4, 6.99, 0.88, 4.49, 1.12, 1.64, 2.45, 2.04, 0.09, 0.52, 0.87, 0.91, 17.49, 1.81, 1.41, 0.62, 0.48, 0.26, 0.53, 0.64, 0.0, 0.44, 0.71, 2.21, 1.63]} \ No newline at end of file diff --git a/annotations_1/vP7uKAQLwXc_filtered.json b/annotations_1/vP7uKAQLwXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..296a3e7fbf10737fe357978bb908baa93d32808c --- /dev/null +++ b/annotations_1/vP7uKAQLwXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 32.0], [37.0, 43.51], [45.0, 52.05], [54.0, 56.27], [60.0, 86.93]], "keep_status": [false, false, true, true, false], "silence_prob": [28.84, 28.7, 28.39, 28.79, 34.71], "audiomae_on_audioset": [[["music", 38.03], ["vehicle", 26.22], ["car", 19.26]], [["vehicle", 47.55], ["car", 16.4], ["music", 11.21]], [["vehicle", 37.51], ["car", 17.0], ["skidding", 13.39]], [["didgeridoo", 40.15], ["music", 17.69], ["hum", 6.94]], [["music", 46.56], ["hum", 15.29], ["mains hum", 8.68]]], "duration": [23.0, 6.51, 7.05, 2.27, 26.93]} \ No newline at end of file diff --git a/annotations_1/vPYiq9JNq_c_filtered.json b/annotations_1/vPYiq9JNq_c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ee73cbbbf345a89e8371fb87897e53963f2c50f6 --- /dev/null +++ b/annotations_1/vPYiq9JNq_c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.38], [26.0, 26.65], [27.0, 28.76], [29.0, 36.31], [40.0, 43.09], [48.0, 48.44], [51.0, 51.76], [53.0, 53.5], [59.0, 60.39], [65.0, 65.55], [72.0, 73.33], [76.0, 76.5], [95.0, 95.34], [100.0, 100.89], [103.0, 111.86], [112.0, 112.68]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.89, 33.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.31, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 67.66], ["music", 7.89], ["fireworks", 5.77]], [["speech", 47.04], ["cheering", 7.45], ["throbbing", 7.31]], null, null, null, null, null, null, null, null, null, [["speech", 53.1], ["hum", 9.56], ["explosion", 7.78]], null], "duration": [0.38, 0.65, 1.76, 7.31, 3.09, 0.44, 0.76, 0.5, 1.39, 0.55, 1.33, 0.5, 0.34, 0.89, 8.86, 0.68]} \ No newline at end of file diff --git a/annotations_1/vRUQ_q5mivc_filtered.json b/annotations_1/vRUQ_q5mivc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7e2ffb10a50468499dd711810f042376b7bb5f0 --- /dev/null +++ b/annotations_1/vRUQ_q5mivc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.1], [10.0, 12.48], [13.0, 22.94], [24.0, 30.35], [40.0, 42.06], [44.0, 45.23], [46.0, 62.78], [70.0, 83.3], [84.0, 87.34], [88.0, 88.94], [90.0, 94.29], [96.0, 96.52], [100.0, 120.61], [122.0, 131.13], [133.0, 173.85]], "keep_status": [false, false, true, true, true, false, false, true, true, false, false, false, true, true, false], "silence_prob": [0.0, 35.0, 30.08, 29.79, 32.15, 0.0, 30.63, 31.61, 32.84, 0.0, 44.93, 0.0, 35.42, 32.97, 0.0], "audiomae_on_audioset": [null, [["mains hum", 37.51], ["hum", 33.43], ["music", 10.78]], [["sidetone", 24.17], ["fly, housefly", 18.8], ["insect", 11.14]], [["speech", 44.71], ["music", 16.7], ["hum", 7.53]], [["moo", 25.9], ["cattle, bovinae", 21.39], ["livestock, farm animals, working animals", 16.19]], null, [["music", 57.72], ["speech", 14.65], ["theremin", 9.55]], [["fly, housefly", 22.24], ["music", 19.62], ["speech", 6.89]], [["speech", 33.67], ["music", 25.56], ["synthesizer", 4.68]], null, [["whale vocalization", 51.76], ["hum", 9.54], ["music", 9.41]], null, [["music", 50.71], ["ambient music", 7.09], ["hum", 6.78]], [["music", 40.33], ["didgeridoo", 14.01], ["throbbing", 13.27]], null], "duration": [0.1, 2.48, 9.94, 6.35, 2.06, 1.23, 16.78, 13.3, 3.34, 0.94, 4.29, 0.52, 20.61, 9.13, 40.85]} \ No newline at end of file diff --git a/annotations_1/vT3QXNKoZKw_filtered.json b/annotations_1/vT3QXNKoZKw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1abeda8a16fd7a29ca6042bb27e562c7fbf786db --- /dev/null +++ b/annotations_1/vT3QXNKoZKw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 14.55], [15.0, 21.14], [22.0, 22.79], [25.0, 28.88], [30.0, 30.65], [34.0, 39.45], [48.0, 50.63], [53.0, 57.94], [61.0, 63.26], [64.0, 65.4], [66.0, 69.48], [73.0, 73.4], [75.0, 91.94], [93.0, 95.62], [96.0, 102.56], [104.0, 105.26]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false], "silence_prob": [100.0, 99.36, 0.0, 100.0, 0.0, 100.0, 98.27, 48.74, 94.37, 0.0, 79.94, 0.0, 37.0, 38.67, 35.15, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 47.25], ["speech", 19.66], ["singing bowl", 2.2]], null, null, null, null, [["music", 53.08], ["synthesizer", 15.47], ["musical instrument", 3.99]], [["music", 57.38], ["didgeridoo", 6.68], ["synthesizer", 5.05]], [["music", 58.41], ["theremin", 6.15], ["ambient music", 5.27]], null], "duration": [8.55, 6.14, 0.79, 3.88, 0.65, 5.45, 2.63, 4.94, 2.26, 1.4, 3.48, 0.4, 16.94, 2.62, 6.56, 1.26]} \ No newline at end of file diff --git a/annotations_1/vTTzWRdAN4M_filtered.json b/annotations_1/vTTzWRdAN4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26ff529c41c5e086332535c56c4bb79eaeeefca2 --- /dev/null +++ b/annotations_1/vTTzWRdAN4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.86], [11.0, 11.5], [16.0, 17.52], [24.0, 24.63], [26.0, 26.42], [27.0, 49.6], [55.0, 55.81], [61.0, 65.57], [68.0, 69.53], [73.0, 74.9], [78.0, 79.54], [80.0, 80.22], [85.0, 85.24], [90.0, 95.86], [97.0, 97.66], [100.0, 100.75], [109.0, 109.58], [111.0, 111.5], [114.0, 121.17], [135.0, 135.18], [143.0, 146.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [55.46, 0.0, 0.0, 0.0, 0.0, 56.03, 0.0, 56.93, 0.0, 0.0, 0.0, 0.0, 0.0, 31.29, 0.0, 0.0, 0.0, 0.0, 91.3, 0.0, 52.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 54.77], ["fart", 10.43], ["creak", 8.47]], null, null, null, null, null, null, null], "duration": [5.86, 0.5, 1.52, 0.63, 0.42, 22.6, 0.81, 4.57, 1.53, 1.9, 1.54, 0.22, 0.24, 5.86, 0.66, 0.75, 0.58, 0.5, 7.17, 0.18, 3.96]} \ No newline at end of file diff --git a/annotations_1/vUbnqySPN8E_filtered.json b/annotations_1/vUbnqySPN8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5fedca087910de4860dc17240d4fca622da160e5 --- /dev/null +++ b/annotations_1/vUbnqySPN8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.65], [6.0, 7.21], [11.0, 14.84], [15.0, 16.92], [18.0, 19.72], [22.0, 23.25], [24.0, 25.51], [27.0, 27.06], [28.0, 29.27], [30.0, 35.88], [37.0, 40.81], [43.0, 54.73], [55.0, 57.75], [58.0, 63.53], [65.0, 71.31], [74.0, 76.74], [78.0, 100.84], [106.0, 105.71], [106.0, 109.02], [111.0, 117.32], [122.0, 126.98], [133.0, 133.37], [135.0, 140.75], [143.0, 143.26], [145.0, 153.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 100.0, 100.0, 100.0, 100.0, 100.0, 100.0, 65.67, 0.0, 46.57, 59.42, 58.3, 0.0, 59.15, 0.0, 60.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 43.33], ["speech", 11.86], ["ambient music", 2.97]], null, null, null, null, null, null], "duration": [0.65, 1.21, 3.84, 1.92, 1.72, 1.25, 1.51, 0.06, 1.27, 5.88, 3.81, 11.73, 2.75, 5.53, 6.31, 2.74, 22.84, -0.29, 3.02, 6.32, 4.98, 0.37, 5.75, 0.26, 8.94]} \ No newline at end of file diff --git a/annotations_1/vUrgn1Vm86I_filtered.json b/annotations_1/vUrgn1Vm86I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a1bd1de1cd973b1d1577153b787e83e25af5b0e --- /dev/null +++ b/annotations_1/vUrgn1Vm86I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.3], [4.0, 5.86], [10.0, 15.97], [17.0, 19.99], [20.0, 20.44], [22.0, 22.47], [26.0, 28.83], [31.0, 34.32], [35.0, 35.61], [37.0, 36.83], [37.0, 38.74], [40.0, 49.08], [50.0, 80.35], [86.0, 110.47], [117.0, 119.18], [120.0, 123.6], [124.0, 124.92], [126.0, 126.99], [128.0, 129.03], [130.0, 131.25], [132.0, 132.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [85.35, 0.0, 79.76, 52.68, 0.0, 0.0, 97.11, 93.76, 0.0, 0.0, 0.0, 71.14, 0.0, 32.78, 32.28, 42.86, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["electric shaver, electric razor", 25.03], ["mains hum", 19.98], ["music", 14.31]], [["music", 54.16], ["throbbing", 11.69], ["speech", 5.45]], [["speech", 65.24], ["music", 7.26], ["hum", 5.49]], null, null, null, null, null], "duration": [2.3, 1.86, 5.97, 2.99, 0.44, 0.47, 2.83, 3.32, 0.61, -0.17, 1.74, 9.08, 30.35, 24.47, 2.18, 3.6, 0.92, 0.99, 1.03, 1.25, 0.83]} \ No newline at end of file diff --git a/annotations_1/vUzF61mtilA_filtered.json b/annotations_1/vUzF61mtilA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4fd3547092448d027435301e1cde33c2756a8765 --- /dev/null +++ b/annotations_1/vUzF61mtilA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 29.59], [32.0, 43.63], [47.0, 48.03], [49.0, 50.5], [53.0, 53.65], [54.0, 57.54], [58.0, 59.1], [62.0, 63.34], [65.0, 74.22], [77.0, 89.88], [91.0, 95.01], [95.0, 95.27], [95.0, 101.68], [104.0, 117.76], [124.0, 124.53], [125.0, 125.64], [127.0, 138.1], [141.0, 141.62], [145.0, 154.94], [159.0, 172.08], [175.0, 175.05], [176.0, 177.79], [181.0, 182.02]], "keep_status": [true, true, false, false, false, false, false, false, true, true, true, false, false, true, false, false, true, false, false, true, false, false, false], "silence_prob": [32.51, 30.04, 0.0, 0.0, 0.0, 37.3, 0.0, 0.0, 30.52, 31.97, 30.49, 0.0, 30.23, 29.58, 0.0, 0.0, 29.93, 0.0, 30.78, 30.1, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 42.73], ["speech", 20.78], ["electronic music", 4.51]], [["music", 25.5], ["buzz", 18.66], ["speech", 8.9]], null, null, null, [["music", 53.77], ["speech", 12.18], ["synthesizer", 6.19]], null, null, [["livestock, farm animals, working animals", 39.61], ["cattle, bovinae", 14.18], ["vehicle", 10.29]], [["music", 25.17], ["livestock, farm animals, working animals", 23.74], ["throbbing", 13.51]], [["music", 33.03], ["hum", 20.16], ["throbbing", 16.67]], null, [["speech", 52.12], ["music", 24.83], ["noise", 4.49]], [["speech", 22.13], ["hum", 20.52], ["music", 17.22]], null, null, [["hum", 21.68], ["music", 18.55], ["mains hum", 14.75]], null, [["music", 77.09], ["fly, housefly", 4.06], ["speech", 2.0]], [["speech", 28.07], ["music", 24.9], ["hum", 12.76]], null, null, null], "duration": [2.59, 11.63, 1.03, 1.5, 0.65, 3.54, 1.1, 1.34, 9.22, 12.88, 4.01, 0.27, 6.68, 13.76, 0.53, 0.64, 11.1, 0.62, 9.94, 13.08, 0.05, 1.79, 1.02]} \ No newline at end of file diff --git a/annotations_1/vV30irsal-w_filtered.json b/annotations_1/vV30irsal-w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ab139bd736ce85627af832322724fc5cb03ceab9 --- /dev/null +++ b/annotations_1/vV30irsal-w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.43], [31.0, 37.67], [46.0, 46.45], [47.0, 48.15], [60.0, 60.35], [66.0, 65.85], [91.0, 90.93], [95.0, 95.67], [103.0, 106.71], [107.0, 107.99], [109.0, 109.63], [111.0, 111.77], [112.0, 114.96], [128.0, 130.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 32.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.15, 0.0, 0.0, 0.0, 43.66, 88.1], "audiomae_on_audioset": [null, [["music", 72.42], ["speech", 9.55], ["boing", 4.08]], null, null, null, null, null, null, null, null, null, null, [["music", 53.08], ["guitar", 4.73], ["chirp tone", 4.09]], null], "duration": [0.43, 6.67, 0.45, 1.15, 0.35, -0.15, -0.07, 0.67, 3.71, 0.99, 0.63, 0.77, 2.96, 2.3]} \ No newline at end of file diff --git a/annotations_1/vVmZO3W0I1A_filtered.json b/annotations_1/vVmZO3W0I1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5d530ba03d214ae8099d8566773192dfd1788c7 --- /dev/null +++ b/annotations_1/vVmZO3W0I1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.42], [18.0, 18.77], [20.0, 21.1], [23.0, 23.43], [25.0, 25.22], [27.0, 27.33], [28.0, 42.8], [44.0, 47.43], [48.0, 53.03], [54.0, 58.28], [59.0, 68.89], [76.0, 77.77], [79.0, 80.96], [83.0, 86.83], [88.0, 89.7], [92.0, 95.79], [98.0, 99.2], [101.0, 101.73], [116.0, 118.05], [123.0, 124.66], [127.0, 127.18], [128.0, 140.44], [140.0, 140.51]], "keep_status": [true, false, false, false, false, false, false, true, true, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [49.31, 0.0, 0.0, 0.0, 0.0, 0.0, 33.6, 39.47, 30.32, 32.5, 31.37, 0.0, 0.0, 30.9, 0.0, 31.48, 0.0, 0.0, 33.36, 0.0, 0.0, 30.37, 0.0], "audiomae_on_audioset": [[["music", 26.05], ["throbbing", 12.83], ["speech", 7.55]], null, null, null, null, null, [["hum", 44.5], ["throbbing", 20.49], ["music", 13.34]], [["music", 24.73], ["hum", 18.96], ["throbbing", 10.69]], [["breaking", 42.29], ["music", 12.5], ["smash, crash", 10.31]], [["boing", 26.66], ["thunk", 13.04], ["speech", 12.39]], [["throbbing", 44.51], ["music", 30.47], ["hum", 18.83]], null, null, [["speech", 47.1], ["music", 17.42], ["explosion", 5.46]], null, [["speech", 37.83], ["breaking", 34.62], ["smash, crash", 9.84]], null, null, [["foghorn", 50.7], ["music", 17.34], ["hum", 8.89]], null, null, [["music", 37.02], ["throbbing", 31.29], ["speech", 15.18]], null], "duration": [2.42, 0.77, 1.1, 0.43, 0.22, 0.33, 14.8, 3.43, 5.03, 4.28, 9.89, 1.77, 1.96, 3.83, 1.7, 3.79, 1.2, 0.73, 2.05, 1.66, 0.18, 12.44, 0.51]} \ No newline at end of file diff --git a/annotations_1/vVqCU0iWlFM_filtered.json b/annotations_1/vVqCU0iWlFM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0fa867295e4f26ef6a37036d5007a1023a4813cb --- /dev/null +++ b/annotations_1/vVqCU0iWlFM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.78], [2.0, 34.06], [36.0, 67.85], [69.0, 138.65], [139.0, 152.39], [163.0, 164.0], [175.0, 189.46]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 99.9], "audiomae_on_audioset": [null, null, null, null, null, null, null], "duration": [1.78, 32.06, 31.85, 69.65, 13.39, 1.0, 14.46]} \ No newline at end of file diff --git a/annotations_1/vW7-H-GGYwk_filtered.json b/annotations_1/vW7-H-GGYwk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8282f8aee7c58a380f6bb49924db86dd412602f7 --- /dev/null +++ b/annotations_1/vW7-H-GGYwk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 21.74], [25.0, 25.3], [25.0, 38.47], [40.0, 40.83], [47.0, 53.22], [57.0, 71.19], [75.0, 81.24], [82.0, 121.54], [122.0, 122.25]], "keep_status": [false, false, true, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 32.1, 0.0, 31.74, 31.64, 32.77, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 36.41], ["hum", 13.7], ["speech", 11.75]], null, [["music", 36.5], ["hum", 18.92], ["mains hum", 14.66]], [["music", 27.86], ["speech", 15.74], ["vehicle", 13.16]], [["hum", 27.03], ["music", 19.09], ["speech", 16.08]], null, null], "duration": [-0.26, 0.3, 13.47, 0.83, 6.22, 14.19, 6.24, 39.54, 0.25]} \ No newline at end of file diff --git a/annotations_1/vWkJPL2Dt9A_filtered.json b/annotations_1/vWkJPL2Dt9A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8154a3c75e0149f1c24b225aa0e0dc26900a8dcf --- /dev/null +++ b/annotations_1/vWkJPL2Dt9A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.01], [3.0, 4.8], [5.0, 6.86], [8.0, 10.12], [13.0, 14.59], [19.0, 21.36], [23.0, 24.63], [26.0, 28.56], [32.0, 33.74], [37.0, 40.69], [46.0, 47.7], [49.0, 53.6], [54.0, 56.91], [58.0, 89.28], [92.0, 93.14], [95.0, 97.33], [100.0, 100.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 73.82, 0.0, 100.0, 0.0, 100.0, 0.0, 94.37, 0.0, 99.62, 100.0, 0.0, 0.0, 99.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 1.8, 1.86, 2.12, 1.59, 2.36, 1.63, 2.56, 1.74, 3.69, 1.7, 4.6, 2.91, 31.28, 1.14, 2.33, 0.65]} \ No newline at end of file diff --git a/annotations_1/vXQlXYcAksI_filtered.json b/annotations_1/vXQlXYcAksI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7baa237a980bc10f4ff5669138932cdbc28597cc --- /dev/null +++ b/annotations_1/vXQlXYcAksI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.78], [8.0, 15.89], [16.0, 16.01], [16.0, 17.14], [20.0, 20.97], [23.0, 23.73], [27.0, 27.43], [31.0, 30.91], [32.0, 61.15], [69.0, 69.2], [70.0, 70.77], [79.0, 79.57], [81.0, 81.57], [84.0, 84.15], [102.0, 101.82]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 38.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 40.17], ["hum", 15.1], ["throbbing", 8.76]], null, null, null, null, null, null, [["music", 26.77], ["hum", 22.87], ["throbbing", 10.95]], null, null, null, null, null, null], "duration": [0.78, 7.89, 0.01, 1.14, 0.97, 0.73, 0.43, -0.09, 29.15, 0.2, 0.77, 0.57, 0.57, 0.15, -0.18]} \ No newline at end of file diff --git a/annotations_1/vXXDqjLe4Ls_filtered.json b/annotations_1/vXXDqjLe4Ls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f819ee69bde2940340a4f2c4aaa314caee9e75c8 --- /dev/null +++ b/annotations_1/vXXDqjLe4Ls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.7], [5.0, 5.85], [6.0, 6.37], [9.0, 9.58], [11.0, 11.25], [14.0, 14.35], [15.0, 15.84], [16.0, 18.28], [20.0, 20.29], [20.0, 22.18], [24.0, 23.85], [29.0, 29.96], [31.0, 36.46], [38.0, 37.71], [46.0, 47.78], [49.0, 54.89], [56.0, 56.13], [62.0, 63.27], [67.0, 69.04], [70.0, 70.75], [76.0, 83.76], [89.0, 90.64], [91.0, 155.93], [157.0, 159.78], [164.0, 165.21], [166.0, 170.26], [172.0, 180.98], [181.0, 184.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.76, 0.0, 51.82, 0.0, 0.0, 57.97, 0.0, 0.0, 46.15, 0.0, 0.0, 64.41, 0.0, 99.05, 0.0, 0.0, 47.62, 0.0, 76.04, 90.25, 61.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mouse", 20.68], ["speech", 16.12], ["animal", 12.98]], null, null, null, null, null, null, null, [["music", 46.79], ["theremin", 11.92], ["musical instrument", 4.04]], null, null, null, null], "duration": [0.7, 0.85, 0.37, 0.58, 0.25, 0.35, 0.84, 2.28, 0.29, 2.18, -0.15, 0.96, 5.46, -0.29, 1.78, 5.89, 0.13, 1.27, 2.04, 0.75, 7.76, 1.64, 64.93, 2.78, 1.21, 4.26, 8.98, 3.05]} \ No newline at end of file diff --git a/annotations_1/vYH5urNq1Ao_filtered.json b/annotations_1/vYH5urNq1Ao_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c12148993523f5235da56689d07d43bc61e57b34 --- /dev/null +++ b/annotations_1/vYH5urNq1Ao_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.68], [9.0, 9.91], [13.0, 14.69], [16.0, 20.53], [23.0, 23.75], [24.0, 25.27], [32.0, 33.22], [34.0, 35.6], [37.0, 37.76], [40.0, 40.49], [44.0, 53.91], [57.0, 58.58], [70.0, 71.83], [75.0, 74.76], [78.0, 79.83], [82.0, 82.51], [85.0, 88.16], [89.0, 89.83], [94.0, 95.0], [98.0, 98.27], [102.0, 102.51], [104.0, 106.78], [110.0, 116.24], [120.0, 121.1], [122.0, 122.12], [123.0, 123.48], [125.0, 128.8], [133.0, 133.1], [135.0, 145.25], [146.0, 149.99], [151.0, 154.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 54.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.78, 0.0, 0.0, 0.0, 0.0, 0.0, 51.99, 0.0, 0.0, 0.0, 0.0, 52.56, 98.36, 0.0, 0.0, 0.0, 54.9, 0.0, 48.35, 83.52, 81.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 44.39], ["music", 17.79], ["mains hum", 12.76]], null, null], "duration": [1.68, 0.91, 1.69, 4.53, 0.75, 1.27, 1.22, 1.6, 0.76, 0.49, 9.91, 1.58, 1.83, -0.24, 1.83, 0.51, 3.16, 0.83, 1.0, 0.27, 0.51, 2.78, 6.24, 1.1, 0.12, 0.48, 3.8, 0.1, 10.25, 3.99, 3.01]} \ No newline at end of file diff --git a/annotations_1/vYm_2A_cg0Y_filtered.json b/annotations_1/vYm_2A_cg0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..43369ed4fd6b5dd89c6cf3a09021706fbfc9c199 --- /dev/null +++ b/annotations_1/vYm_2A_cg0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.13], [6.0, 6.81], [10.0, 12.16], [16.0, 27.41], [28.0, 46.5], [47.0, 47.48], [50.0, 49.99], [52.0, 99.35], [101.0, 101.19]], "keep_status": [false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 90.08, 40.48, 38.82, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 30.61], ["sidetone", 24.74], ["music", 11.49]], [["music", 32.14], ["throbbing", 23.87], ["electronic music", 13.12]], null, null, null, null], "duration": [1.13, 0.81, 2.16, 11.41, 18.5, 0.48, -0.01, 47.35, 0.19]} \ No newline at end of file diff --git a/annotations_1/vYtc_bS47oM_filtered.json b/annotations_1/vYtc_bS47oM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..928641d69acaa1d4085ec96f43b010e589345988 --- /dev/null +++ b/annotations_1/vYtc_bS47oM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 15.72], [17.0, 25.68], [27.0, 28.8], [31.0, 31.43], [34.0, 36.31], [41.0, 42.06], [45.0, 45.47], [46.0, 46.99], [48.0, 48.07], [49.0, 49.77], [53.0, 55.61], [60.0, 61.5], [64.0, 64.27], [65.0, 66.97], [80.0, 80.57], [85.0, 86.22], [87.0, 87.81], [90.0, 90.96], [95.0, 94.83], [97.0, 97.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [87.37, 97.43, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 60.62], ["fart", 3.77], ["inside, small room", 3.44]], null, null, null, null, null, null, null, null, null], "duration": [6.72, 8.68, 1.8, 0.43, 2.31, 1.06, 0.47, 0.99, 0.07, 0.77, 2.61, 1.5, 0.27, 1.97, 0.57, 1.22, 0.81, 0.96, -0.17, 0.19]} \ No newline at end of file diff --git a/annotations_1/vZ3nHOtlQiU_filtered.json b/annotations_1/vZ3nHOtlQiU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..939ed6a0844082a2f05e8ee9ddfef0f8105ea351 --- /dev/null +++ b/annotations_1/vZ3nHOtlQiU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.88], [12.0, 13.76], [15.0, 17.39], [18.0, 22.84], [27.0, 42.65], [43.0, 43.95], [46.0, 90.61], [92.0, 95.52], [97.0, 102.39], [104.0, 114.93], [118.0, 118.67], [120.0, 121.12], [122.0, 128.51], [129.0, 129.95], [131.0, 130.94]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 58.38, 62.89, 37.26, 0.0, 0.0, 36.69, 35.79, 28.49, 0.0, 0.0, 30.31, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 29.39], ["speech", 13.9], ["fly, housefly", 10.26]], null, null, [["music", 54.32], ["throbbing", 16.14], ["hum", 10.06]], [["music", 52.89], ["hum", 17.17], ["throbbing", 14.95]], [["music", 50.12], ["rumble", 7.83], ["hum", 4.99]], null, null, [["speech", 55.78], ["fart", 11.77], ["groan", 6.05]], null, null], "duration": [1.88, 1.76, 2.39, 4.84, 15.65, 0.95, 44.61, 3.52, 5.39, 10.93, 0.67, 1.12, 6.51, 0.95, -0.06]} \ No newline at end of file diff --git a/annotations_1/vZHS1nXJaGU_filtered.json b/annotations_1/vZHS1nXJaGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76678287cc892954e70af1b6693093dcd44167d7 --- /dev/null +++ b/annotations_1/vZHS1nXJaGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 17.88], [22.0, 22.05], [32.0, 35.63], [38.0, 43.68], [46.0, 46.31], [47.0, 47.01], [48.0, 48.91], [55.0, 55.68], [59.0, 59.98], [64.0, 65.37], [65.0, 65.5], [66.0, 66.97], [68.0, 68.59], [87.0, 87.51], [91.0, 95.3], [97.0, 98.37]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 40.34, 39.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.52, 0.0], "audiomae_on_audioset": [null, null, [["whale vocalization", 24.41], ["speech", 16.8], ["rumble", 15.63]], [["whale vocalization", 70.8], ["hum", 8.21], ["noise", 6.56]], null, null, null, null, null, null, null, null, null, null, [["chirp tone", 18.34], ["sine wave", 13.58], ["music", 9.81]], null], "duration": [-0.12, 0.05, 3.63, 5.68, 0.31, 0.01, 0.91, 0.68, 0.98, 1.37, 0.5, 0.97, 0.59, 0.51, 4.3, 1.37]} \ No newline at end of file diff --git a/annotations_1/vZqr-1GJIAk_filtered.json b/annotations_1/vZqr-1GJIAk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..abe11393b41ecfc5fe0cc17982859ab4e5ddb690 --- /dev/null +++ b/annotations_1/vZqr-1GJIAk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.43], [3.0, 3.43], [6.0, 6.62], [11.0, 11.4], [16.0, 16.48], [17.0, 17.36], [19.0, 19.55], [20.0, 20.68], [26.0, 27.6], [29.0, 30.72], [33.0, 33.18], [35.0, 38.21], [40.0, 41.59], [43.0, 44.46], [47.0, 48.68], [52.0, 53.28], [55.0, 55.51], [57.0, 57.59], [59.0, 60.07], [62.0, 63.59], [72.0, 71.9], [73.0, 74.33], [76.0, 76.55], [77.0, 77.26], [78.0, 80.2], [82.0, 82.11], [83.0, 93.06], [96.0, 110.0], [113.0, 119.57], [122.0, 127.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 67.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.55, 0.0, 58.22, 32.35, 31.93, 31.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 32.72], ["fly, housefly", 18.41], ["noise", 11.88]], [["cattle, bovinae", 48.85], ["moo", 22.57], ["livestock, farm animals, working animals", 8.18]], [["livestock, farm animals, working animals", 31.45], ["cattle, bovinae", 20.89], ["moo", 12.98]]], "duration": [0.43, 0.43, 0.62, 0.4, 0.48, 0.36, 0.55, 0.68, 1.6, 1.72, 0.18, 3.21, 1.59, 1.46, 1.68, 1.28, 0.51, 0.59, 1.07, 1.59, -0.1, 1.33, 0.55, 0.26, 2.2, 0.11, 10.06, 14.0, 6.57, 5.35]} \ No newline at end of file diff --git a/annotations_1/vaCI48KHW1k_filtered.json b/annotations_1/vaCI48KHW1k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52f9476e9d27c39fd7b9db70811c88675de726d9 --- /dev/null +++ b/annotations_1/vaCI48KHW1k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 60.22]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [47.22]} \ No newline at end of file diff --git a/annotations_1/vaJ2yQC_ktY_filtered.json b/annotations_1/vaJ2yQC_ktY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..337a7cac4a4b0d3dee7ddfbef90d64f55d44cc26 --- /dev/null +++ b/annotations_1/vaJ2yQC_ktY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.24], [17.0, 17.58], [30.0, 31.99], [36.0, 39.75], [41.0, 43.38], [44.0, 45.52], [46.0, 46.57], [47.0, 49.08], [49.0, 50.06], [52.0, 56.03], [61.0, 61.59], [62.0, 63.56], [66.0, 71.9], [79.0, 86.46], [87.0, 87.35], [89.0, 90.37], [115.0, 118.69], [127.0, 130.37], [134.0, 134.7], [136.0, 138.32], [141.0, 142.52], [145.0, 145.2], [148.0, 148.96], [152.0, 154.85], [156.0, 158.14], [159.0, 160.62], [163.0, 163.26], [169.0, 169.62], [191.0, 192.82], [195.0, 202.44], [204.0, 205.58], [216.0, 220.65], [223.0, 222.67], [233.0, 232.88], [245.0, 246.1], [246.0, 255.88], [266.0, 269.27]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 32.7, 31.75, 0.0, 0.0, 39.89, 0.0, 38.03, 0.0, 0.0, 42.74, 46.15, 0.0, 0.0, 73.67, 99.8, 0.0, 80.64, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 77.03, 0.0, 59.15, 0.0, 0.0, 0.0, 95.64, 52.86], "audiomae_on_audioset": [null, null, null, [["moo", 28.24], ["cattle, bovinae", 20.63], ["livestock, farm animals, working animals", 12.16]], [["speech", 40.36], ["music", 33.03], ["boing", 4.54]], null, null, [["music", 30.19], ["speech", 16.47], ["musical instrument", 5.93]], null, [["boing", 56.26], ["ding", 15.87], ["clang", 12.33]], null, null, [["speech", 15.58], ["moo", 9.73], ["cattle, bovinae", 8.6]], [["grunt", 61.83], ["speech", 6.59], ["groan", 6.29]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.24, 0.58, 1.99, 3.75, 2.38, 1.52, 0.57, 2.08, 1.06, 4.03, 0.59, 1.56, 5.9, 7.46, 0.35, 1.37, 3.69, 3.37, 0.7, 2.32, 1.52, 0.2, 0.96, 2.85, 2.14, 1.62, 0.26, 0.62, 1.82, 7.44, 1.58, 4.65, -0.33, -0.12, 1.1, 9.88, 3.27]} \ No newline at end of file diff --git a/annotations_1/vagva7xKyE8_filtered.json b/annotations_1/vagva7xKyE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c1f21c3a28c9cf8835e5a30ba579ed2e74e525a --- /dev/null +++ b/annotations_1/vagva7xKyE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 25.91], [27.0, 41.4], [42.0, 42.13], [49.0, 49.23], [58.0, 58.02], [71.0, 70.97], [72.0, 72.5], [77.0, 79.62], [92.0, 94.36], [100.0, 100.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.93, 30.04, 0.0, 0.0, 0.0, 0.0, 0.0, 78.89, 97.73, 0.0], "audiomae_on_audioset": [[["music", 62.5], ["house music", 10.95], ["dance music", 5.59]], [["music", 83.39], ["house music", 6.86], ["dance music", 2.13]], null, null, null, null, null, null, null, null], "duration": [3.91, 14.4, 0.13, 0.23, 0.02, -0.03, 0.5, 2.62, 2.36, 0.11]} \ No newline at end of file diff --git a/annotations_1/vbJsLuL2YzQ_filtered.json b/annotations_1/vbJsLuL2YzQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e77501ccf97047a4e00be4df5fb9076e59e6f80a --- /dev/null +++ b/annotations_1/vbJsLuL2YzQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 13.49], [15.0, 22.99], [24.0, 28.05], [29.0, 30.1], [34.0, 42.3], [43.0, 43.19], [44.0, 44.91], [48.0, 53.33], [54.0, 54.7], [56.0, 65.77], [67.0, 70.9], [75.0, 75.29], [76.0, 77.77], [79.0, 79.81], [82.0, 110.0], [111.0, 112.01], [114.0, 114.24], [119.0, 119.7], [123.0, 127.06]], "keep_status": [true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [42.58, 44.01, 65.67, 0.0, 49.27, 0.0, 0.0, 40.61, 0.0, 34.3, 33.3, 0.0, 0.0, 0.0, 31.73, 0.0, 0.0, 0.0, 70.58], "audiomae_on_audioset": [[["music", 40.44], ["wild animals", 9.56], ["musical instrument", 9.01]], [["music", 61.21], ["speech", 5.36], ["synthesizer", 3.87]], null, null, [["frog", 60.75], ["croak", 12.52], ["music", 11.17]], null, null, [["frog", 82.23], ["music", 4.71], ["croak", 4.0]], null, [["music", 29.36], ["livestock, farm animals, working animals", 19.61], ["animal", 9.62]], [["music", 38.29], ["frog", 13.05], ["animal", 6.64]], null, null, null, [["music", 51.9], ["frog", 20.52], ["groan", 4.77]], null, null, null, null], "duration": [5.49, 7.99, 4.05, 1.1, 8.3, 0.19, 0.91, 5.33, 0.7, 9.77, 3.9, 0.29, 1.77, 0.81, 28.0, 1.01, 0.24, 0.7, 4.06]} \ No newline at end of file diff --git a/annotations_1/vcURIKX8710_filtered.json b/annotations_1/vcURIKX8710_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8595b42ec0d65cc415b4a6d5c38c6bb51d77185c --- /dev/null +++ b/annotations_1/vcURIKX8710_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 16.95], [18.0, 18.67], [26.0, 44.25], [48.0, 51.19], [57.0, 64.49], [66.0, 66.36], [69.0, 70.6], [72.0, 72.67], [73.0, 78.02], [89.0, 91.18], [92.0, 92.94], [100.0, 103.42], [108.0, 108.55], [113.0, 113.32], [122.0, 123.62]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [58.05, 0.0, 30.7, 30.26, 30.42, 0.0, 0.0, 0.0, 58.72, 59.51, 0.0, 73.51, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 22.38], ["speech", 21.92], ["hum", 16.58]], [["music", 44.95], ["speech", 14.06], ["throbbing", 12.93]], [["hum", 24.08], ["music", 20.05], ["speech", 15.78]], null, null, null, null, null, null, null, null, null, null], "duration": [2.95, 0.67, 18.25, 3.19, 7.49, 0.36, 1.6, 0.67, 5.02, 2.18, 0.94, 3.42, 0.55, 0.32, 1.62]} \ No newline at end of file diff --git a/annotations_1/vcdDRblTOmM_filtered.json b/annotations_1/vcdDRblTOmM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..97a31888dc04ade63bd81a4867f4180b24100f87 --- /dev/null +++ b/annotations_1/vcdDRblTOmM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 17.88], [20.0, 27.53], [28.0, 47.31], [47.0, 85.48], [86.0, 85.72], [86.0, 115.99], [118.0, 124.93], [125.0, 128.16], [129.0, 129.0], [133.0, 133.76], [134.0, 138.65]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [29.5, 29.75, 29.42, 0.0, 0.0, 30.17, 28.89, 29.9, 0.0, 0.0, 29.87], "audiomae_on_audioset": [[["hum", 55.74], ["throbbing", 20.43], ["mains hum", 11.48]], [["throbbing", 48.16], ["hum", 40.92], ["music", 5.25]], [["music", 70.42], ["throbbing", 11.69], ["hum", 3.77]], null, null, [["hum", 52.25], ["mains hum", 39.36], ["throbbing", 2.53]], [["whip", 65.98], ["speech", 5.79], ["whoosh, swoosh, swish", 4.38]], [["music", 23.98], ["throbbing", 21.66], ["hum", 15.02]], null, null, [["hum", 51.73], ["mains hum", 20.44], ["throbbing", 4.16]]], "duration": [16.88, 7.53, 19.31, 38.48, -0.28, 29.99, 6.93, 3.16, 0.0, 0.76, 4.65]} \ No newline at end of file diff --git a/annotations_1/vcw4b2U_0nU_filtered.json b/annotations_1/vcw4b2U_0nU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/vcw4b2U_0nU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/vdMEu03CjTk_filtered.json b/annotations_1/vdMEu03CjTk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5920e0e82fd7165e44ed3eaf3f43216a9335583e --- /dev/null +++ b/annotations_1/vdMEu03CjTk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 27.03], [28.0, 65.15], [67.0, 82.22], [84.0, 85.08], [86.0, 87.61], [89.0, 90.69], [93.0, 93.38], [99.0, 100.14], [102.0, 102.32], [104.0, 105.09], [106.0, 106.95], [109.0, 111.15], [113.0, 114.08], [115.0, 116.9], [119.0, 120.46], [122.0, 124.39], [128.0, 127.63], [130.0, 130.99], [133.0, 134.05], [135.0, 136.59], [137.0, 138.05], [141.0, 140.8], [149.0, 155.6], [156.0, 157.65], [159.0, 161.76]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 36.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.67, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.37, 0.0, 84.98], "audiomae_on_audioset": [null, null, [["music", 17.53], ["hum", 16.68], ["breaking", 9.66]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.03, 37.15, 15.22, 1.08, 1.61, 1.69, 0.38, 1.14, 0.32, 1.09, 0.95, 2.15, 1.08, 1.9, 1.46, 2.39, -0.37, 0.99, 1.05, 1.59, 1.05, -0.2, 6.6, 1.65, 2.76]} \ No newline at end of file diff --git a/annotations_1/vejLIHky2HE_filtered.json b/annotations_1/vejLIHky2HE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b8f3de0e329697585a37964c0f6f7f094c682cb --- /dev/null +++ b/annotations_1/vejLIHky2HE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.62], [8.0, 10.96], [13.0, 14.07], [16.0, 17.07], [19.0, 28.66], [30.0, 31.53], [33.0, 34.4], [35.0, 37.07], [39.0, 40.29], [47.0, 47.51], [55.0, 55.56], [67.0, 69.89]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 49.97, 0.0, 0.0, 57.09, 0.0, 0.0, 60.79, 0.0, 0.0, 0.0, 58.72], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 13.97], ["moo", 12.77], ["music", 11.52]], null, null, null, null, null, null, null, null, null, null], "duration": [1.62, 2.96, 1.07, 1.07, 9.66, 1.53, 1.4, 2.07, 1.29, 0.51, 0.56, 2.89]} \ No newline at end of file diff --git a/annotations_1/vfc3TGvcjEY_filtered.json b/annotations_1/vfc3TGvcjEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7bbb0e807669657f5e3f5be9b8f71ef8f9bd134d --- /dev/null +++ b/annotations_1/vfc3TGvcjEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[98.0, 104.14], [106.0, 108.14], [109.0, 110.17], [112.0, 113.27], [115.0, 116.46], [119.0, 120.33], [123.0, 123.3], [124.0, 132.49], [140.0, 169.53], [173.0, 184.5], [188.0, 195.91], [201.0, 202.63]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [35.52, 37.07, 0.0, 0.0, 0.0, 0.0, 0.0, 35.97, 30.28, 30.32, 31.46, 0.0], "audiomae_on_audioset": [[["music", 60.14], ["throbbing", 10.42], ["electronic music", 3.98]], [["music", 62.68], ["electronic music", 5.48], ["dubstep", 4.73]], null, null, null, null, null, [["music", 55.37], ["electronic music", 9.05], ["throbbing", 7.99]], [["music", 41.37], ["fart", 8.58], ["groan", 5.51]], [["music", 36.64], ["speech", 11.27], ["electronic music", 11.0]], [["music", 55.82], ["moo", 8.05], ["livestock, farm animals, working animals", 6.81]], null], "duration": [6.14, 2.14, 1.17, 1.27, 1.46, 1.33, 0.3, 8.49, 29.53, 11.5, 7.91, 1.63]} \ No newline at end of file diff --git a/annotations_1/vgEq476aHxk_filtered.json b/annotations_1/vgEq476aHxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a110e6267c89c7461e03892205b5f175e518e1f --- /dev/null +++ b/annotations_1/vgEq476aHxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.45], [7.0, 16.95], [21.0, 35.63], [36.0, 64.07], [79.0, 79.51], [80.0, 79.61], [82.0, 85.28], [86.0, 110.35], [115.0, 119.3], [124.0, 130.01], [133.0, 133.32], [133.0, 152.93]], "keep_status": [false, true, false, true, false, false, true, true, false, false, false, true], "silence_prob": [0.0, 28.8, 28.79, 28.66, 0.0, 0.0, 29.35, 28.77, 28.47, 28.56, 0.0, 28.46], "audiomae_on_audioset": [null, [["music", 30.0], ["mains hum", 19.73], ["hum", 16.69]], [["speech", 66.75], ["music", 9.21], ["vehicle", 7.09]], [["music", 47.49], ["vehicle", 8.46], ["buzz", 6.04]], null, null, [["vehicle", 26.59], ["music", 25.65], ["buzz", 7.74]], [["buzz", 24.82], ["hum", 19.54], ["music", 14.12]], [["vehicle", 33.74], ["buzz", 27.57], ["car", 9.91]], [["hum", 32.77], ["throbbing", 19.82], ["music", 18.53]], null, [["speech", 45.09], ["music", 19.01], ["whack, thwack", 5.25]]], "duration": [0.45, 9.95, 14.63, 28.07, 0.51, -0.39, 3.28, 24.35, 4.3, 6.01, 0.32, 19.93]} \ No newline at end of file diff --git a/annotations_1/vh-mdPoc92Y_filtered.json b/annotations_1/vh-mdPoc92Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4608dd4276e81d4fb04811e93645e1278af30bb --- /dev/null +++ b/annotations_1/vh-mdPoc92Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.37], [7.0, 8.56], [11.0, 11.03], [12.0, 24.71], [30.0, 35.92], [36.0, 37.17], [39.0, 39.9], [41.0, 41.18], [42.0, 43.14], [44.0, 127.25], [129.0, 130.82], [132.0, 135.9], [137.0, 138.28], [139.0, 143.36], [144.0, 156.02]], "keep_status": [false, false, false, true, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.29, 30.21, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 0.0, 37.42, 34.64], "audiomae_on_audioset": [null, null, null, [["fart", 24.29], ["music", 16.86], ["noise", 10.21]], [["fart", 22.83], ["speech", 11.5], ["whack, thwack", 10.86]], null, null, null, null, null, null, null, null, [["didgeridoo", 61.74], ["music", 24.06], ["musical instrument", 6.1]], [["didgeridoo", 36.59], ["music", 36.37], ["musical instrument", 3.8]]], "duration": [0.37, 1.56, 0.03, 12.71, 5.92, 1.17, 0.9, 0.18, 1.14, 83.25, 1.82, 3.9, 1.28, 4.36, 12.02]} \ No newline at end of file diff --git a/annotations_1/vh7_WKODlE8_filtered.json b/annotations_1/vh7_WKODlE8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..085cfc36998c1e29b1ea9405e0d3176a07d8c2f2 --- /dev/null +++ b/annotations_1/vh7_WKODlE8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.04], [2.0, 2.98], [7.0, 8.63], [10.0, 18.42], [20.0, 21.86], [22.0, 31.08], [33.0, 44.39], [45.0, 47.87], [50.0, 50.8], [51.0, 54.53], [55.0, 60.84], [63.0, 68.28], [69.0, 71.0], [72.0, 76.45], [83.0, 85.23], [87.0, 87.52], [90.0, 90.05], [93.0, 94.0], [98.0, 98.69], [106.0, 106.71], [107.0, 111.1], [112.0, 112.99], [116.0, 116.43], [120.0, 124.78], [129.0, 130.76], [131.0, 134.1], [134.0, 134.18], [135.0, 135.28], [137.0, 138.33], [139.0, 145.12], [146.0, 148.49], [150.0, 151.87], [156.0, 162.97], [164.0, 166.21], [167.0, 169.91], [171.0, 171.93], [173.0, 181.95], [184.0, 184.01]], "keep_status": [false, false, false, false, false, true, true, false, false, true, false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 45.46, 0.0, 41.68, 45.85, 73.82, 0.0, 40.79, 55.96, 44.57, 36.49, 52.51, 56.7, 0.0, 0.0, 0.0, 0.0, 0.0, 33.9, 0.0, 0.0, 33.69, 0.0, 32.83, 0.0, 0.0, 0.0, 35.97, 39.38, 0.0, 71.57, 96.29, 96.29, 0.0, 49.68, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 36.36], ["mains hum", 24.82], ["speech", 8.92]], null, [["speech", 31.27], ["music", 5.49], ["hum", 5.49]], [["speech", 34.65], ["music", 12.12], ["hum", 8.47]], null, null, [["music", 44.18], ["speech", 10.16], ["whale vocalization", 7.42]], null, [["speech", 27.02], ["music", 26.25], ["whale vocalization", 15.58]], [["music", 23.48], ["didgeridoo", 13.95], ["boing", 6.95]], null, null, null, null, null, null, null, [["speech", 21.9], ["sine wave", 19.33], ["chirp tone", 11.7]], null, null, [["music", 32.21], ["beatboxing", 26.68], ["speech", 16.44]], null, [["speech", 57.59], ["gong", 13.01], ["singing bowl", 5.66]], null, null, null, [["speech", 36.92], ["music", 16.96], ["didgeridoo", 5.23]], [["music", 27.61], ["didgeridoo", 17.15], ["speech", 12.61]], null, null, null, null, null, [["speech", 67.34], ["animal", 6.84], ["inside, small room", 3.26]], null], "duration": [0.04, 0.98, 1.63, 8.42, 1.86, 9.08, 11.39, 2.87, 0.8, 3.53, 5.84, 5.28, 2.0, 4.45, 2.23, 0.52, 0.05, 1.0, 0.69, 0.71, 4.1, 0.99, 0.43, 4.78, 1.76, 3.1, 0.18, 0.28, 1.33, 6.12, 2.49, 1.87, 6.97, 2.21, 2.91, 0.93, 8.95, 0.01]} \ No newline at end of file diff --git a/annotations_1/vhEOInyNr54_filtered.json b/annotations_1/vhEOInyNr54_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1265e5e660b760d934eeb2c2de4a19d6a062e05e --- /dev/null +++ b/annotations_1/vhEOInyNr54_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.88], [6.0, 9.24], [13.0, 13.26], [14.0, 13.78], [14.0, 19.55], [21.0, 23.23], [24.0, 24.76], [25.0, 25.69], [27.0, 27.62], [30.0, 31.46], [33.0, 35.45], [37.0, 37.94], [38.0, 40.12], [41.0, 42.13], [43.0, 43.44], [45.0, 45.39], [46.0, 46.18], [47.0, 47.75], [49.0, 49.54], [51.0, 53.32], [54.0, 55.78], [59.0, 59.58], [64.0, 64.25], [67.0, 70.34], [72.0, 74.11], [80.0, 80.4], [83.0, 84.84], [85.0, 86.26], [88.0, 88.7], [90.0, 90.19], [95.0, 95.07], [96.0, 97.29], [100.0, 118.69], [126.0, 126.57], [128.0, 131.6], [133.0, 133.64], [137.0, 136.9], [140.0, 141.27], [142.0, 142.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [78.89, 79.41, 0.0, 0.0, 93.13, 97.83, 0.0, 0.0, 0.0, 0.0, 97.43, 0.0, 43.64, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.92, 0.0, 0.0, 0.0, 76.7, 71.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 46.36, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 28.48], ["sidetone", 20.29], ["sine wave", 8.24]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 53.7], ["musical instrument", 2.91], ["theremin", 2.8]], null, null, null, null], "duration": [2.88, 3.24, 0.26, -0.22, 5.55, 2.23, 0.76, 0.69, 0.62, 1.46, 2.45, 0.94, 2.12, 1.13, 0.44, 0.39, 0.18, 0.75, 0.54, 2.32, 1.78, 0.58, 0.25, 3.34, 2.11, 0.4, 1.84, 1.26, 0.7, 0.19, 0.07, 1.29, 18.69, 0.57, 3.6, 0.64, -0.1, 1.27, 0.64]} \ No newline at end of file diff --git a/annotations_1/vhfk-aOAgIE_filtered.json b/annotations_1/vhfk-aOAgIE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..477e7a580a72d7d9ac6203bfea5b9085700354be --- /dev/null +++ b/annotations_1/vhfk-aOAgIE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 41.15], [47.0, 47.19], [48.0, 70.68]], "keep_status": [false, false, false], "silence_prob": [32.84, 0.0, 33.1], "audiomae_on_audioset": [[["music", 80.27], ["boing", 3.1], ["sampler", 1.62]], null, [["music", 54.47], ["cattle, bovinae", 10.56], ["moo", 10.06]]], "duration": [3.15, 0.19, 22.68]} \ No newline at end of file diff --git a/annotations_1/vhhiJqQBMMY_filtered.json b/annotations_1/vhhiJqQBMMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dbb693a209c5c041e155a21c4f78e464e4b7625 --- /dev/null +++ b/annotations_1/vhhiJqQBMMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.56], [9.0, 10.22], [20.0, 21.63], [23.0, 22.91], [23.0, 24.02], [25.0, 25.56], [27.0, 27.35], [28.0, 28.9], [30.0, 31.38], [33.0, 33.96], [35.0, 37.29], [43.0, 42.87], [44.0, 46.28], [49.0, 49.57], [53.0, 53.72], [54.0, 55.49], [63.0, 68.25], [73.0, 75.07], [75.0, 76.25], [78.0, 78.75], [85.0, 85.78], [100.0, 100.16], [101.0, 101.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.98, 0.0, 37.4, 0.0, 0.0, 0.0, 37.35, 40.82, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 19.35], ["didgeridoo", 9.35], ["speech", 8.65]], null, [["music", 59.02], ["speech", 7.05], ["theremin", 2.88]], null, null, null, [["music", 67.65], ["didgeridoo", 5.53], ["animal", 2.95]], [["speech", 36.2], ["music", 16.15], ["sidetone", 8.13]], null, null, null, null, null], "duration": [1.56, 1.22, 1.63, -0.09, 1.02, 0.56, 0.35, 0.9, 1.38, 0.96, 2.29, -0.13, 2.28, 0.57, 0.72, 1.49, 5.25, 2.07, 1.25, 0.75, 0.78, 0.16, 0.83]} \ No newline at end of file diff --git a/annotations_1/vhmFJKHhdw4_filtered.json b/annotations_1/vhmFJKHhdw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..136db0bfca957966643c7758fe90e37db9cb2990 --- /dev/null +++ b/annotations_1/vhmFJKHhdw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.95], [3.0, 3.48], [5.0, 9.37], [11.0, 14.93], [18.0, 18.57], [22.0, 22.62], [29.0, 30.16], [37.0, 37.54], [46.0, 47.53], [59.0, 59.53], [73.0, 73.82], [76.0, 77.06], [77.0, 80.11], [87.0, 87.62], [94.0, 95.37], [110.0, 135.55], [138.0, 138.57], [142.0, 142.79], [153.0, 153.39], [155.0, 156.88], [166.0, 168.76], [182.0, 182.97], [186.0, 185.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 31.42, 32.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.77, 0.0, 0.0, 47.74, 0.0, 0.0, 0.0, 0.0, 30.5, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 58.15], ["music", 21.28], ["fart", 6.11]], [["music", 67.14], ["musical instrument", 10.89], ["synthesizer", 7.78]], null, null, null, null, null, null, null, null, [["music", 51.77], ["speech", 6.55], ["didgeridoo", 3.75]], null, null, [["music", 58.6], ["musical instrument", 4.78], ["effects unit", 3.32]], null, null, null, null, [["music", 30.0], ["carnatic music", 16.96], ["moo", 6.45]], null, null], "duration": [-0.05, 0.48, 4.37, 3.93, 0.57, 0.62, 1.16, 0.54, 1.53, 0.53, 0.82, 1.06, 3.11, 0.62, 1.37, 25.55, 0.57, 0.79, 0.39, 1.88, 2.76, 0.97, -0.01]} \ No newline at end of file diff --git a/annotations_1/vi9m0JRo71I_filtered.json b/annotations_1/vi9m0JRo71I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d2e0d38701aae2a13207d543137eaf60a4a54fa0 --- /dev/null +++ b/annotations_1/vi9m0JRo71I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.0], [14.0, 17.86], [22.0, 22.42], [24.0, 72.52], [73.0, 75.71], [80.0, 101.38], [110.0, 111.69], [112.0, 112.26], [112.0, 112.29], [113.0, 122.84], [125.0, 139.01]], "keep_status": [true, true, false, false, false, true, false, false, false, true, false], "silence_prob": [46.12, 47.46, 0.0, 0.0, 56.7, 29.41, 0.0, 0.0, 0.0, 29.32, 29.74], "audiomae_on_audioset": [[["rumble", 37.13], ["hum", 11.02], ["throbbing", 9.41]], [["fly, housefly", 20.77], ["bee, wasp, etc.", 15.89], ["speech", 10.08]], null, null, null, [["vehicle", 20.55], ["whale vocalization", 13.26], ["buzz", 12.51]], null, null, null, [["grunt", 35.18], ["whale vocalization", 19.55], ["music", 12.63]], [["speech", 64.06], ["music", 28.4], ["animal", 0.81]]], "duration": [3.0, 3.86, 0.42, 48.52, 2.71, 21.38, 1.69, 0.26, 0.29, 9.84, 14.01]} \ No newline at end of file diff --git a/annotations_1/vjDxkz5LO7A_filtered.json b/annotations_1/vjDxkz5LO7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9dcc632db877e3e88e7d175a533ab265436fc8c --- /dev/null +++ b/annotations_1/vjDxkz5LO7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 5.78], [9.0, 10.2], [14.0, 14.66], [16.0, 16.88], [18.0, 18.72], [19.0, 20.34], [21.0, 21.96], [23.0, 25.19], [28.0, 43.41], [46.0, 48.49], [51.0, 51.41], [53.0, 55.19], [56.0, 56.64], [58.0, 59.07], [61.0, 65.11], [71.0, 72.44], [85.0, 133.76], [136.0, 138.67], [140.0, 158.95]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.25, 57.72, 52.74, 0.0, 53.1, 0.0, 0.0, 31.26, 0.0, 0.0, 31.83, 30.26], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["theremin", 24.28], ["music", 21.12], ["foghorn", 17.67]], null, null, null, null, null, null, [["music", 33.21], ["sonar", 7.74], ["creak", 5.99]], null, null, [["thunk", 28.17], ["mains hum", 18.88], ["whack, thwack", 12.15]], [["music", 83.35], ["didgeridoo", 1.98], ["electronic music", 1.7]]], "duration": [-0.22, 1.2, 0.66, 0.88, 0.72, 1.34, 0.96, 2.19, 15.41, 2.49, 0.41, 2.19, 0.64, 1.07, 4.11, 1.44, 48.76, 2.67, 18.95]} \ No newline at end of file diff --git a/annotations_1/vjmHq57MZso_filtered.json b/annotations_1/vjmHq57MZso_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3f952b8528cb53b6f866ffe77a3806c84894cae8 --- /dev/null +++ b/annotations_1/vjmHq57MZso_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.8], [17.0, 17.52], [20.0, 20.76], [33.0, 33.44], [36.0, 37.98], [39.0, 40.02], [41.0, 41.74], [52.0, 52.24], [60.0, 68.72], [74.0, 75.03], [76.0, 78.31], [81.0, 81.58], [84.0, 84.65], [85.0, 85.77], [87.0, 87.02], [89.0, 92.91], [93.0, 93.88], [95.0, 95.49], [99.0, 99.82], [102.0, 103.2], [107.0, 107.82], [112.0, 118.57], [119.0, 121.09], [123.0, 124.12], [125.0, 126.62], [127.0, 131.36], [134.0, 136.56], [138.0, 147.24], [156.0, 156.78], [158.0, 158.11], [159.0, 159.38], [161.0, 162.85], [163.0, 165.1], [170.0, 174.24], [174.0, 176.49], [178.0, 178.55], [180.0, 180.64], [181.0, 183.24], [184.0, 185.7], [187.0, 189.5], [190.0, 191.3], [193.0, 192.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.25, 0.0, 41.72, 0.0, 0.0, 0.0, 0.0, 53.78, 0.0, 0.0, 0.0, 0.0, 0.0, 74.13, 72.6, 0.0, 0.0, 62.89, 52.51, 33.07, 0.0, 0.0, 0.0, 0.0, 88.46, 61.27, 70.3, 0.0, 0.0, 47.7, 0.0, 51.88, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 61.44], ["music", 6.57], ["boing", 3.01]], null, [["sidetone", 22.4], ["music", 20.79], ["speech", 18.04]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["theremin", 31.34], ["music", 23.2], ["synthesizer", 10.74]], null, null, null, null, null, null, null, null, null, [["speech", 35.05], ["music", 14.25], ["ping", 4.61]], null, null, null, null], "duration": [0.8, 0.52, 0.76, 0.44, 1.98, 1.02, 0.74, 0.24, 8.72, 1.03, 2.31, 0.58, 0.65, 0.77, 0.02, 3.91, 0.88, 0.49, 0.82, 1.2, 0.82, 6.57, 2.09, 1.12, 1.62, 4.36, 2.56, 9.24, 0.78, 0.11, 0.38, 1.85, 2.1, 4.24, 2.49, 0.55, 0.64, 2.24, 1.7, 2.5, 1.3, -0.03]} \ No newline at end of file diff --git a/annotations_1/vk5Kr-zV8AE_filtered.json b/annotations_1/vk5Kr-zV8AE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..38425bc167aa171449bb533e8fafc1e34fba0491 --- /dev/null +++ b/annotations_1/vk5Kr-zV8AE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.51], [12.0, 11.84], [34.0, 34.11], [44.0, 44.83], [59.0, 59.21], [60.0, 61.23], [66.0, 66.43], [69.0, 68.81], [73.0, 73.8], [78.0, 80.32], [82.0, 83.54], [86.0, 104.75], [105.0, 106.27], [127.0, 127.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 0.0, 30.36, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["hum", 35.18], ["music", 25.32], ["throbbing", 13.08]], null, null], "duration": [0.51, -0.16, 0.11, 0.83, 0.21, 1.23, 0.43, -0.19, 0.8, 2.32, 1.54, 18.75, 1.27, 0.62]} \ No newline at end of file diff --git a/annotations_1/vkXY0EqahbY_filtered.json b/annotations_1/vkXY0EqahbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1587958981c7f41ce349836e54f65394a7347315 --- /dev/null +++ b/annotations_1/vkXY0EqahbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.51], [7.0, 6.74], [10.0, 10.29], [15.0, 15.6], [19.0, 19.48], [22.0, 23.16], [25.0, 26.59], [30.0, 30.7], [33.0, 33.71], [35.0, 38.35], [42.0, 42.33], [43.0, 43.06], [47.0, 47.98], [51.0, 50.79], [51.0, 51.98], [54.0, 54.58], [57.0, 58.06], [62.0, 61.94], [63.0, 63.81], [66.0, 66.39], [67.0, 67.04], [71.0, 71.59], [74.0, 76.05], [81.0, 81.04], [84.0, 84.43], [85.0, 85.68], [87.0, 87.39], [91.0, 91.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, -0.26, 0.29, 0.6, 0.48, 1.16, 1.59, 0.7, 0.71, 3.35, 0.33, 0.06, 0.98, -0.21, 0.98, 0.58, 1.06, -0.06, 0.81, 0.39, 0.04, 0.59, 2.05, 0.04, 0.43, 0.68, 0.39, 0.84]} \ No newline at end of file diff --git a/annotations_1/vlK8CMKzWUY_filtered.json b/annotations_1/vlK8CMKzWUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e8e2037b940caa5e3ea08b7a69cd1911ce2dc29 --- /dev/null +++ b/annotations_1/vlK8CMKzWUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.85], [13.0, 13.32], [14.0, 14.67], [18.0, 19.08], [21.0, 21.42], [23.0, 24.7], [26.0, 27.24], [34.0, 33.89], [37.0, 37.12], [43.0, 43.92], [51.0, 52.24], [61.0, 62.95], [64.0, 65.13], [66.0, 71.29], [81.0, 83.51], [85.0, 88.43], [90.0, 90.41], [92.0, 91.98], [95.0, 95.98], [100.0, 101.78], [103.0, 104.19], [106.0, 107.0], [108.0, 108.18], [109.0, 109.56], [114.0, 115.86], [117.0, 118.74], [120.0, 122.76], [127.0, 127.72], [129.0, 130.15], [132.0, 133.03], [138.0, 139.45], [143.0, 143.38], [144.0, 145.5], [146.0, 146.75], [155.0, 156.42], [166.0, 167.21], [169.0, 169.08], [169.0, 170.94], [172.0, 173.33], [175.0, 176.54], [178.0, 177.94], [178.0, 178.02], [178.0, 178.09], [180.0, 182.44], [184.0, 185.25], [187.0, 194.7], [196.0, 196.89]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.75, 32.3, 38.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.79, 0.0, 39.09, 0.0], "audiomae_on_audioset": [[["clapping", 30.81], ["hands", 11.65], ["tap", 11.64]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 20.51], ["hum", 18.69], ["mains hum", 10.64]], [["speech", 23.44], ["didgeridoo", 17.68], ["music", 16.56]], [["music", 46.31], ["synthesizer", 25.45], ["hum", 6.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 56.53], ["thunk", 13.11], ["flamenco", 4.28]], null, [["music", 74.5], ["synthesizer", 6.48], ["musical instrument", 3.14]], null], "duration": [2.85, 0.32, 0.67, 1.08, 0.42, 1.7, 1.24, -0.11, 0.12, 0.92, 1.24, 1.95, 1.13, 5.29, 2.51, 3.43, 0.41, -0.02, 0.98, 1.78, 1.19, 1.0, 0.18, 0.56, 1.86, 1.74, 2.76, 0.72, 1.15, 1.03, 1.45, 0.38, 1.5, 0.75, 1.42, 1.21, 0.08, 1.94, 1.33, 1.54, -0.06, 0.02, 0.09, 2.44, 1.25, 7.7, 0.89]} \ No newline at end of file diff --git a/annotations_1/vlg5VPKbGQg_filtered.json b/annotations_1/vlg5VPKbGQg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..31f2bdacc87c5296609124434428801dcb7012ae --- /dev/null +++ b/annotations_1/vlg5VPKbGQg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [6.0, 7.91], [9.0, 13.07], [14.0, 14.49], [15.0, 20.44], [22.0, 23.16], [24.0, 34.8], [36.0, 39.9], [42.0, 44.46], [46.0, 47.65], [49.0, 52.35], [54.0, 54.63], [57.0, 59.71], [61.0, 62.95], [66.0, 69.87], [71.0, 79.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 93.45, 0.0, 99.62, 0.0, 87.74, 98.51, 100.0, 0.0, 99.97, 0.0, 90.78, 0.0, 99.92, 70.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 1.91, 4.07, 0.49, 5.44, 1.16, 10.8, 3.9, 2.46, 1.65, 3.35, 0.63, 2.71, 1.95, 3.87, 8.88]} \ No newline at end of file diff --git a/annotations_1/vm-rgqRKqz8_filtered.json b/annotations_1/vm-rgqRKqz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84b87a35a70f4ac7550a7c2c4f00505d299ae470 --- /dev/null +++ b/annotations_1/vm-rgqRKqz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.16], [8.0, 19.57], [25.0, 25.3], [31.0, 32.1], [33.0, 49.08], [51.0, 52.54], [60.0, 60.1], [65.0, 66.31], [68.0, 69.31], [70.0, 71.61], [72.0, 73.72], [75.0, 75.12], [78.0, 80.05], [85.0, 86.41], [87.0, 87.17], [88.0, 92.85], [94.0, 110.96], [113.0, 115.13], [121.0, 125.19]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [88.64, 57.09, 0.0, 0.0, 48.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.48, 0.0, 0.0, 48.39, 50.11, 34.08, 40.28], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 23.3], ["hum", 20.23], ["music", 10.58]], null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 21.92], ["sidetone", 18.95], ["bee, wasp, etc.", 13.74]], null, [["cattle, bovinae", 18.52], ["wild animals", 17.1], ["animal", 16.74]], [["music", 59.37], ["theremin", 7.48], ["didgeridoo", 4.18]]], "duration": [2.16, 11.57, 0.3, 1.1, 16.08, 1.54, 0.1, 1.31, 1.31, 1.61, 1.72, 0.12, 2.05, 1.41, 0.17, 4.85, 16.96, 2.13, 4.19]} \ No newline at end of file diff --git a/annotations_1/vmOBZjVBCUo_filtered.json b/annotations_1/vmOBZjVBCUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1d69e83b3a82a800b77bc91d555ef3492656a804 --- /dev/null +++ b/annotations_1/vmOBZjVBCUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 52.69], [54.0, 57.52], [58.0, 60.05], [62.0, 70.33], [75.0, 78.83], [81.0, 81.65], [82.0, 82.63], [87.0, 86.95], [87.0, 87.76], [89.0, 101.83]], "keep_status": [true, false, true, true, false, false, false, false, false, false], "silence_prob": [37.54, 38.78, 35.54, 37.23, 40.48, 0.0, 0.0, 0.0, 0.0, 29.46], "audiomae_on_audioset": [[["speech", 48.22], ["crushing", 5.25], ["music", 4.87]], [["music", 58.88], ["throbbing", 7.33], ["electronic music", 6.94]], [["throbbing", 27.5], ["music", 17.2], ["hum", 12.39]], [["glass", 16.65], ["hum", 11.6], ["throbbing", 9.84]], [["cattle, bovinae", 47.27], ["moo", 17.84], ["livestock, farm animals, working animals", 14.85]], null, null, null, null, [["music", 79.67], ["hum", 3.53], ["throbbing", 2.41]]], "duration": [3.69, 3.52, 2.05, 8.33, 3.83, 0.65, 0.63, -0.05, 0.76, 12.83]} \ No newline at end of file diff --git a/annotations_1/vmWm02fUJ-o_filtered.json b/annotations_1/vmWm02fUJ-o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..411fec309ed9b1034e1baa532269b73e77122698 --- /dev/null +++ b/annotations_1/vmWm02fUJ-o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[24.0, 27.62], [33.0, 37.4], [38.0, 42.63], [44.0, 43.97], [45.0, 46.23], [48.0, 52.35], [55.0, 60.54], [64.0, 92.6], [94.0, 95.1], [97.0, 101.46], [102.0, 106.05], [106.0, 107.06], [110.0, 114.88], [116.0, 119.52], [122.0, 123.58], [124.0, 124.06], [125.0, 126.57], [127.0, 127.5], [129.0, 132.66], [133.0, 134.37], [135.0, 135.78], [143.0, 143.63], [148.0, 148.14], [150.0, 155.24], [156.0, 156.44], [160.0, 160.57], [162.0, 163.46], [165.0, 165.43], [168.0, 168.72], [172.0, 174.51], [176.0, 178.17], [180.0, 183.17], [185.0, 186.88], [188.0, 189.24], [192.0, 195.57], [199.0, 207.1], [207.0, 207.18]], "keep_status": [false, false, true, false, false, true, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false], "silence_prob": [37.92, 33.02, 38.71, 0.0, 0.0, 34.59, 33.94, 31.44, 0.0, 34.72, 36.44, 0.0, 34.37, 43.93, 0.0, 0.0, 0.0, 0.0, 54.3, 0.0, 0.0, 0.0, 0.0, 40.75, 0.0, 0.0, 0.0, 0.0, 0.0, 67.51, 43.4, 41.09, 0.0, 0.0, 34.53, 31.5, 0.0], "audiomae_on_audioset": [[["fly, housefly", 58.83], ["insect", 32.73], ["bee, wasp, etc.", 6.91]], [["fly, housefly", 47.65], ["insect", 38.62], ["bee, wasp, etc.", 10.49]], [["speech", 46.93], ["telephone", 7.72], ["radio", 6.57]], null, null, [["noise", 15.41], ["speech", 10.43], ["music", 9.99]], [["fly, housefly", 58.24], ["insect", 19.67], ["bee, wasp, etc.", 17.42]], [["whale vocalization", 33.9], ["noise", 19.25], ["music", 5.63]], null, [["fly, housefly", 45.7], ["insect", 19.26], ["sidetone", 8.17]], [["fly, housefly", 49.76], ["insect", 26.43], ["bee, wasp, etc.", 14.56]], null, [["music", 30.05], ["didgeridoo", 10.28], ["speech", 6.47]], [["fly, housefly", 36.06], ["insect", 26.62], ["bee, wasp, etc.", 13.8]], null, null, null, null, null, null, null, null, null, [["speech", 52.97], ["radio", 20.76], ["frog", 8.18]], null, null, null, null, null, null, [["music", 17.64], ["hum", 10.3], ["mains hum", 8.73]], [["music", 12.47], ["effects unit", 10.97], ["synthesizer", 10.52]], null, null, [["speech", 42.25], ["music", 19.56], ["beatboxing", 4.86]], [["music", 46.08], ["didgeridoo", 14.85], ["frog", 10.92]], null], "duration": [3.62, 4.4, 4.63, -0.03, 1.23, 4.35, 5.54, 28.6, 1.1, 4.46, 4.05, 1.06, 4.88, 3.52, 1.58, 0.06, 1.57, 0.5, 3.66, 1.37, 0.78, 0.63, 0.14, 5.24, 0.44, 0.57, 1.46, 0.43, 0.72, 2.51, 2.17, 3.17, 1.88, 1.24, 3.57, 8.1, 0.18]} \ No newline at end of file diff --git a/annotations_1/vmynulColPI_filtered.json b/annotations_1/vmynulColPI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7e0f0e53cb47905ce32c473e67097a1802ff3b7a --- /dev/null +++ b/annotations_1/vmynulColPI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.9], [11.0, 12.93], [13.0, 14.39], [15.0, 16.06], [26.0, 26.28], [28.0, 32.19], [35.0, 35.72], [45.0, 45.28], [45.0, 51.21], [52.0, 63.8], [69.0, 68.69], [71.0, 71.39], [77.0, 77.5], [79.0, 79.83], [83.0, 83.51], [86.0, 86.43], [107.0, 107.18], [117.0, 120.51], [121.0, 121.66]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [63.42, 0.0, 0.0, 0.0, 0.0, 29.48, 0.0, 0.0, 29.41, 29.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.42, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 82.4], ["music", 4.37], ["outside, rural or natural", 1.88]], null, null, [["music", 41.99], ["speech", 23.43], ["explosion", 5.71]], [["whack, thwack", 30.53], ["breaking", 7.57], ["livestock, farm animals, working animals", 7.44]], null, null, null, null, null, null, null, [["mains hum", 38.87], ["hum", 32.14], ["music", 15.75]], null], "duration": [3.9, 1.93, 1.39, 1.06, 0.28, 4.19, 0.72, 0.28, 6.21, 11.8, -0.31, 0.39, 0.5, 0.83, 0.51, 0.43, 0.18, 3.51, 0.66]} \ No newline at end of file diff --git a/annotations_1/vn-PJRh_nFQ_filtered.json b/annotations_1/vn-PJRh_nFQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9641036da505392d0609160eb5df7fc3550fa13 --- /dev/null +++ b/annotations_1/vn-PJRh_nFQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.64], [11.0, 11.55], [20.0, 25.12], [30.0, 30.48], [34.0, 35.77], [39.0, 43.56], [47.0, 53.7], [64.0, 99.1], [100.0, 106.34], [110.0, 111.21], [114.0, 115.33], [117.0, 118.64], [120.0, 122.69], [125.0, 125.74], [127.0, 129.19], [130.0, 132.0], [133.0, 133.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [94.22, 0.0, 34.04, 0.0, 0.0, 94.66, 37.98, 0.0, 83.7, 0.0, 0.0, 0.0, 99.92, 0.0, 100.0, 96.89, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.73], ["boing", 8.66], ["pizzicato", 4.6]], null, null, null, [["music", 74.6], ["musical instrument", 3.38], ["keyboard (musical)", 2.46]], null, null, null, null, null, null, null, null, null, null], "duration": [5.64, 0.55, 5.12, 0.48, 1.77, 4.56, 6.7, 35.1, 6.34, 1.21, 1.33, 1.64, 2.69, 0.74, 2.19, 2.0, 0.86]} \ No newline at end of file diff --git a/annotations_1/vn8YIDxEGrw_filtered.json b/annotations_1/vn8YIDxEGrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9d7867edaf1ff151f1e1f0e4f4b5c3889f34963b --- /dev/null +++ b/annotations_1/vn8YIDxEGrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.52], [15.0, 16.34], [18.0, 19.03], [19.0, 21.47], [23.0, 23.33], [24.0, 43.65], [47.0, 54.65], [56.0, 56.66], [57.0, 58.41], [59.0, 59.88], [60.0, 60.61], [61.0, 62.26], [63.0, 84.21], [85.0, 85.33], [87.0, 87.05], [87.0, 98.79], [99.0, 100.31], [101.0, 101.71], [102.0, 101.95], [102.0, 105.97], [108.0, 128.29], [129.0, 129.81], [130.0, 136.07], [137.0, 141.96], [143.0, 146.67], [148.0, 163.61], [164.0, 165.0], [166.0, 177.47], [178.0, 180.77], [184.0, 195.34]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 36.72, 0.0, 32.77, 41.58, 0.0, 0.0, 0.0, 0.0, 0.0, 36.72, 0.0, 0.0, 33.05, 0.0, 0.0, 0.0, 36.63, 41.72, 0.0, 40.73, 63.21, 58.22, 48.23, 0.0, 33.63, 42.51, 35.42], "audiomae_on_audioset": [null, null, null, [["moo", 15.19], ["cattle, bovinae", 14.27], ["speech", 10.06]], null, [["explosion", 16.94], ["speech", 13.74], ["boom", 10.96]], [["hum", 34.78], ["rumble", 34.09], ["mains hum", 7.51]], null, null, null, null, null, [["music", 27.62], ["whale vocalization", 7.05], ["buzz", 6.36]], null, null, [["whack, thwack", 20.4], ["music", 16.11], ["hum", 11.14]], null, null, null, [["speech", 41.28], ["whale vocalization", 21.81], ["music", 11.16]], [["singing bowl", 29.16], ["speech", 26.53], ["rumble", 12.67]], null, [["hum", 36.16], ["mains hum", 30.72], ["speech", 14.24]], null, null, [["music", 62.6], ["electronic music", 4.78], ["hum", 4.36]], null, [["speech", 49.93], ["mains hum", 11.85], ["hum", 9.77]], [["hiccup", 21.18], ["rumble", 19.71], ["heart sounds, heartbeat", 5.76]], [["didgeridoo", 50.22], ["music", 20.86], ["speech", 11.08]]], "duration": [1.52, 1.34, 1.03, 2.47, 0.33, 19.65, 7.65, 0.66, 1.41, 0.88, 0.61, 1.26, 21.21, 0.33, 0.05, 11.79, 1.31, 0.71, -0.05, 3.97, 20.29, 0.81, 6.07, 4.96, 3.67, 15.61, 1.0, 11.47, 2.77, 11.34]} \ No newline at end of file diff --git a/annotations_1/vnL8uiqp6_k_filtered.json b/annotations_1/vnL8uiqp6_k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a86830ef2105ebe0d143296307e94209cc08b797 --- /dev/null +++ b/annotations_1/vnL8uiqp6_k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 1.0], [1.0, 1.12], [5.0, 6.12], [8.0, 8.09], [10.0, 10.91], [14.0, 20.36], [22.0, 23.23], [27.0, 28.54], [30.0, 31.78], [34.0, 43.21], [45.0, 48.91], [50.0, 51.0], [51.0, 52.0], [54.0, 57.72], [61.0, 66.77], [69.0, 72.37], [75.0, 79.73], [81.0, 80.86], [83.0, 91.05], [94.0, 112.45], [119.0, 125.78], [133.0, 134.69], [137.0, 139.31], [144.0, 144.91], [146.0, 148.66], [150.0, 157.86], [161.0, 162.11], [163.0, 165.84]], "keep_status": [false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, true, false, true, true, false, false, true, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.02, 0.0, 0.0, 0.0, 42.79, 45.72, 0.0, 0.0, 53.53, 52.05, 72.31, 49.36, 0.0, 48.14, 34.42, 31.18, 0.0, 43.87, 0.0, 41.89, 37.72, 0.0, 33.35], "audiomae_on_audioset": [null, null, null, null, null, [["music", 9.58], ["baby cry, infant cry", 8.55], ["speech", 7.37]], null, null, null, [["whimper", 19.95], ["baby cry, infant cry", 16.23], ["grunt", 9.75]], [["music", 32.48], ["baby cry, infant cry", 9.56], ["groan", 3.88]], null, null, null, null, null, [["cattle, bovinae", 12.48], ["moo", 11.88], ["livestock, farm animals, working animals", 11.47]], null, [["speech", 48.83], ["music", 16.66], ["crying, sobbing", 3.33]], [["music", 17.14], ["explosion", 12.76], ["artillery fire", 10.62]], [["music", 68.03], ["scary music", 5.89], ["soundtrack music", 4.48]], null, [["music", 58.14], ["singing bowl", 4.17], ["didgeridoo", 4.07]], null, [["music", 18.77], ["hum", 18.75], ["mains hum", 15.88]], [["music", 58.92], ["grunt", 17.26], ["groan", 2.98]], null, [["music", 30.43], ["fly, housefly", 6.81], ["whale vocalization", 6.26]]], "duration": [1.0, 0.12, 1.12, 0.09, 0.91, 6.36, 1.23, 1.54, 1.78, 9.21, 3.91, 1.0, 1.0, 3.72, 5.77, 3.37, 4.73, -0.14, 8.05, 18.45, 6.78, 1.69, 2.31, 0.91, 2.66, 7.86, 1.11, 2.84]} \ No newline at end of file diff --git a/annotations_1/vndiMloYcYU_filtered.json b/annotations_1/vndiMloYcYU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..02ccfc29f4f1f285356491126394446b89bb15de --- /dev/null +++ b/annotations_1/vndiMloYcYU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.38], [5.0, 6.05], [8.0, 9.05], [9.0, 10.05], [11.0, 15.74], [20.0, 21.14], [25.0, 25.59], [27.0, 28.59], [30.0, 30.81], [32.0, 34.35], [35.0, 40.31], [42.0, 42.55], [44.0, 45.13], [46.0, 46.08], [46.0, 47.71], [48.0, 50.28], [51.0, 55.68], [56.0, 57.03], [58.0, 59.46], [63.0, 84.13], [85.0, 86.44], [91.0, 96.7], [97.0, 99.22], [102.0, 101.85], [110.0, 110.37], [113.0, 118.45], [121.0, 122.52], [128.0, 128.61], [132.0, 132.41], [148.0, 150.13], [152.0, 156.2], [157.0, 157.76], [160.0, 160.69], [166.0, 168.54]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 40.01, 0.0, 0.0, 0.0, 0.0, 40.68, 44.72, 0.0, 0.0, 0.0, 0.0, 44.26, 71.0, 0.0, 0.0, 44.46, 0.0, 48.31, 48.1, 0.0, 0.0, 39.7, 0.0, 0.0, 0.0, 77.7, 51.44, 0.0, 0.0, 50.36], "audiomae_on_audioset": [null, null, null, null, [["whale vocalization", 80.33], ["animal", 2.81], ["roaring cats (lions, tigers)", 2.59]], null, null, null, null, [["speech", 42.55], ["music", 10.28], ["inside, small room", 2.88]], [["livestock, farm animals, working animals", 36.45], ["cattle, bovinae", 32.25], ["moo", 21.83]], null, null, null, null, [["speech", 75.14], ["inside, small room", 2.07], ["hum", 1.88]], null, null, null, [["coin (dropping)", 44.28], ["speech", 31.64], ["glass", 2.11]], null, [["speech", 72.68], ["music", 4.29], ["radio", 3.25]], [["fart", 18.25], ["speech", 13.31], ["music", 4.99]], null, null, [["fly, housefly", 31.85], ["mosquito", 24.97], ["speech", 11.07]], null, null, null, null, null, null, null, null], "duration": [1.38, 1.05, 1.05, 1.05, 4.74, 1.14, 0.59, 1.59, 0.81, 2.35, 5.31, 0.55, 1.13, 0.08, 1.71, 2.28, 4.68, 1.03, 1.46, 21.13, 1.44, 5.7, 2.22, -0.15, 0.37, 5.45, 1.52, 0.61, 0.41, 2.13, 4.2, 0.76, 0.69, 2.54]} \ No newline at end of file diff --git a/annotations_1/vnh7gxa0z4Q_filtered.json b/annotations_1/vnh7gxa0z4Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..836402df4bc0c5c39184851167e57f2df8344b92 --- /dev/null +++ b/annotations_1/vnh7gxa0z4Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.98], [11.0, 11.8], [33.0, 34.74], [35.0, 36.9], [39.0, 39.7], [41.0, 41.42], [66.0, 68.86], [75.0, 74.95], [77.0, 78.71], [79.0, 80.33], [84.0, 84.52], [85.0, 90.37], [96.0, 96.5], [98.0, 98.98], [102.0, 103.69], [104.0, 110.69], [112.0, 122.5], [126.0, 126.3], [128.0, 128.31]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.54, 0.0, 0.0, 0.0, 0.0, 29.97, 0.0, 0.0, 0.0, 29.74, 29.25, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.41], ["music", 20.06], ["vehicle", 12.18]], null, null, null, [["speech", 26.49], ["sidetone", 11.26], ["hum", 10.31]], [["speech", 69.58], ["music", 6.07], ["explosion", 1.71]], null, null], "duration": [-0.02, 0.8, 1.74, 1.9, 0.7, 0.42, 2.86, -0.05, 1.71, 1.33, 0.52, 5.37, 0.5, 0.98, 1.69, 6.69, 10.5, 0.3, 0.31]} \ No newline at end of file diff --git a/annotations_1/vo0cUbT4Lh4_filtered.json b/annotations_1/vo0cUbT4Lh4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..304af0c9cdf064d5f73ea3be6da43a0528e1f727 --- /dev/null +++ b/annotations_1/vo0cUbT4Lh4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.82], [14.0, 14.18], [16.0, 16.9], [20.0, 20.17], [24.0, 24.88], [41.0, 41.4], [43.0, 44.9], [47.0, 48.96], [51.0, 51.29]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [1.82, 0.18, 0.9, 0.17, 0.88, 0.4, 1.9, 1.96, 0.29]} \ No newline at end of file diff --git a/annotations_1/vozjOGBUz2I_filtered.json b/annotations_1/vozjOGBUz2I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f06e6684fd38b72c8768246100b194d7ab9ba3cb --- /dev/null +++ b/annotations_1/vozjOGBUz2I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.29], [9.0, 10.74], [12.0, 14.84], [16.0, 17.9], [19.0, 19.72], [21.0, 21.24], [22.0, 22.2], [24.0, 31.06], [42.0, 45.25], [46.0, 46.28], [49.0, 50.19], [51.0, 53.0], [58.0, 58.02], [60.0, 61.15], [63.0, 63.07], [65.0, 65.92], [71.0, 73.35], [76.0, 76.67], [85.0, 88.91], [94.0, 97.93], [101.0, 101.49], [103.0, 103.55], [104.0, 104.87], [106.0, 106.59], [109.0, 112.18], [114.0, 114.79], [119.0, 119.6], [120.0, 120.29], [121.0, 121.64], [123.0, 123.09], [130.0, 129.95], [135.0, 135.28], [138.0, 141.13], [141.0, 141.69], [143.0, 143.18], [143.0, 143.99], [145.0, 149.47]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 74.76, 78.38, 0.0, 0.0, 55.67, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 96.54, 99.68, 0.0, 0.0, 0.0, 0.0, 84.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 0.0, 0.0, 0.0, 50.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.29, 1.74, 2.84, 1.9, 0.72, 0.24, 0.2, 7.06, 3.25, 0.28, 1.19, 2.0, 0.02, 1.15, 0.07, 0.92, 2.35, 0.67, 3.91, 3.93, 0.49, 0.55, 0.87, 0.59, 3.18, 0.79, 0.6, 0.29, 0.64, 0.09, -0.05, 0.28, 3.13, 0.69, 0.18, 0.99, 4.47]} \ No newline at end of file diff --git a/annotations_1/vp7r-h8OLm0_filtered.json b/annotations_1/vp7r-h8OLm0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..474d055e622acd92f64fb44c4c27255d393acefe --- /dev/null +++ b/annotations_1/vp7r-h8OLm0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.8], [6.0, 6.94], [14.0, 14.79], [26.0, 32.73], [34.0, 35.33], [37.0, 37.94], [39.0, 40.9], [43.0, 44.0], [47.0, 49.57], [53.0, 52.76], [56.0, 58.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.52, 0.0, 0.0, 96.77, 0.0, 0.0, 0.0, 0.0, 92.48, 0.0, 98.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [2.8, 0.94, 0.79, 6.73, 1.33, 0.94, 1.9, 1.0, 2.57, -0.24, 2.48]} \ No newline at end of file diff --git a/annotations_1/vpEAO0gIAxE_filtered.json b/annotations_1/vpEAO0gIAxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48c740b66dd905fb6f85de300297c91f2d1c0d41 --- /dev/null +++ b/annotations_1/vpEAO0gIAxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.59], [5.0, 6.39], [8.0, 12.77], [19.0, 21.83], [24.0, 26.76], [27.0, 29.13], [32.0, 34.77], [36.0, 39.29], [41.0, 44.91], [46.0, 48.12], [52.0, 55.29], [57.0, 59.49], [60.0, 62.99], [65.0, 66.7], [69.0, 69.53], [71.0, 72.79], [74.0, 78.8], [80.0, 84.45], [85.0, 90.51], [91.0, 95.22], [98.0, 100.82], [102.0, 105.87], [107.0, 110.37], [113.0, 116.5], [120.0, 123.21], [125.0, 126.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 92.31, 99.36, 99.78, 90.25, 99.97, 99.95, 86.82, 99.96, 99.99, 99.36, 75.55, 0.0, 0.0, 0.0, 97.43, 99.85, 99.76, 90.95, 99.93, 99.84, 99.94, 97.64, 82.61, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.59, 1.39, 4.77, 2.83, 2.76, 2.13, 2.77, 3.29, 3.91, 2.12, 3.29, 2.49, 2.99, 1.7, 0.53, 1.79, 4.8, 4.45, 5.51, 4.22, 2.82, 3.87, 3.37, 3.5, 3.21, 1.87]} \ No newline at end of file diff --git a/annotations_1/vpqzFo0aD0c_filtered.json b/annotations_1/vpqzFo0aD0c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77d25f4bfe0d7c4c5b28859d41900657d6c5b567 --- /dev/null +++ b/annotations_1/vpqzFo0aD0c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.52], [13.0, 13.42], [14.0, 14.55], [36.0, 36.44], [42.0, 42.67], [47.0, 47.61], [50.0, 49.86], [59.0, 59.54], [62.0, 62.14], [66.0, 66.23], [69.0, 69.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [0.52, 0.42, 0.55, 0.44, 0.67, 0.61, -0.14, 0.54, 0.14, 0.23, 0.79]} \ No newline at end of file diff --git a/annotations_1/vq0OqfmArnY_filtered.json b/annotations_1/vq0OqfmArnY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22508c67198f566d0cc0060e871f8cef87ff98b8 --- /dev/null +++ b/annotations_1/vq0OqfmArnY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 32.02], [34.0, 95.37], [99.0, 99.27], [100.0, 100.95], [101.0, 102.91], [103.0, 104.45], [105.0, 108.13], [109.0, 111.57], [113.0, 114.05], [115.0, 121.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 78.21, 0.0, 75.88], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [31.02, 61.37, 0.27, 0.95, 1.91, 1.45, 3.13, 2.57, 1.05, 6.98]} \ No newline at end of file diff --git a/annotations_1/vq6ofw0hqkU_filtered.json b/annotations_1/vq6ofw0hqkU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48e25f24deb1d84d482c721fe0fa1b2a97fe30ce --- /dev/null +++ b/annotations_1/vq6ofw0hqkU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.31], [13.0, 13.78], [18.0, 18.87], [21.0, 22.72], [24.0, 30.4], [34.0, 43.8], [45.0, 50.41], [54.0, 54.4], [56.0, 56.02], [63.0, 63.09], [68.0, 69.03], [70.0, 72.37], [74.0, 75.63], [81.0, 81.43], [84.0, 85.04], [86.0, 88.15], [89.0, 89.87], [96.0, 98.05], [100.0, 101.19], [103.0, 104.21], [106.0, 111.15], [112.0, 115.89], [116.0, 119.85], [122.0, 122.59], [124.0, 125.56], [127.0, 128.43], [129.0, 131.09]], "keep_status": [false, false, false, false, true, true, true, false, false, false, false, true, false, false, false, true, false, true, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 35.38, 35.01, 33.96, 0.0, 0.0, 0.0, 0.0, 32.87, 0.0, 0.0, 0.0, 42.28, 0.0, 44.6, 0.0, 0.0, 41.6, 53.28, 46.61, 0.0, 0.0, 0.0, 42.0], "audiomae_on_audioset": [null, null, null, null, [["noise", 18.17], ["fly, housefly", 11.17], ["breaking", 6.52]], [["breaking", 27.35], ["music", 25.36], ["speech", 14.37]], [["hum", 40.33], ["throbbing", 15.12], ["mains hum", 9.36]], null, null, null, null, [["whale vocalization", 47.07], ["hum", 13.39], ["throbbing", 5.63]], null, null, null, [["hum", 27.7], ["mains hum", 19.4], ["speech", 12.64]], null, [["speech", 32.78], ["mains hum", 19.91], ["hum", 8.64]], null, null, [["hum", 32.46], ["mains hum", 20.27], ["speech", 15.64]], null, [["mains hum", 32.67], ["hum", 29.7], ["music", 9.22]], null, null, null, [["mains hum", 18.58], ["music", 17.6], ["hum", 13.72]]], "duration": [1.31, 0.78, 0.87, 1.72, 6.4, 9.8, 5.41, 0.4, 0.02, 0.09, 1.03, 2.37, 1.63, 0.43, 1.04, 2.15, 0.87, 2.05, 1.19, 1.21, 5.15, 3.89, 3.85, 0.59, 1.56, 1.43, 2.09]} \ No newline at end of file diff --git a/annotations_1/vqPT1IbJrX8_filtered.json b/annotations_1/vqPT1IbJrX8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..baca081c213eed6b1546859a54209b68216fa80d --- /dev/null +++ b/annotations_1/vqPT1IbJrX8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.1], [15.0, 17.83], [19.0, 21.71], [22.0, 23.75], [27.0, 30.03], [31.0, 31.83], [39.0, 39.9], [43.0, 44.78], [47.0, 47.17], [52.0, 60.39], [63.0, 63.56], [67.0, 67.02], [72.0, 72.06], [73.0, 74.01], [74.0, 76.0], [80.0, 80.27], [82.0, 82.8], [85.0, 86.95], [88.0, 105.53], [107.0, 107.67], [108.0, 112.01], [114.0, 114.76], [117.0, 120.02], [123.0, 128.04], [130.0, 132.33], [133.0, 140.88], [145.0, 145.42], [146.0, 152.49], [158.0, 159.83], [162.0, 165.5], [168.0, 169.59], [176.0, 175.91], [180.0, 191.69], [192.0, 194.07], [195.0, 201.5], [202.0, 203.1], [204.0, 206.83], [209.0, 211.3], [214.0, 215.97], [219.0, 221.91], [229.0, 230.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, true, true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 36.06, 56.4, 0.0, 72.16, 0.0, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 48.78, 0.0, 0.0, 0.0, 34.62, 0.0, 33.48, 0.0, 30.79, 30.11, 37.34, 36.53, 0.0, 32.97, 0.0, 37.27, 0.0, 0.0, 34.68, 56.25, 52.39, 0.0, 85.17, 82.25, 0.0, 43.58, 0.0], "audiomae_on_audioset": [null, [["music", 35.6], ["speech", 30.6], ["hum", 4.08]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.03], ["speech", 13.41], ["synthesizer", 8.85]], null, null, null, [["music", 29.45], ["speech", 23.85], ["buzz", 7.79]], null, [["music", 23.23], ["hum", 21.63], ["throbbing", 21.41]], null, [["speech", 20.89], ["music", 12.33], ["electric shaver, electric razor", 3.81]], [["speech", 31.74], ["mains hum", 18.74], ["electric shaver, electric razor", 9.93]], [["music", 45.47], ["speech", 17.74], ["carnatic music", 7.37]], [["speech", 71.38], ["music", 5.92], ["explosion", 1.21]], null, [["music", 49.4], ["musical instrument", 6.04], ["didgeridoo", 5.54]], null, [["music", 46.41], ["speech", 9.11], ["electronic music", 7.54]], null, null, [["throbbing", 40.42], ["hum", 37.31], ["music", 10.18]], null, null, null, null, null, null, [["hum", 36.71], ["speech", 11.79], ["mains hum", 11.38]], null], "duration": [1.1, 2.83, 2.71, 1.75, 3.03, 0.83, 0.9, 1.78, 0.17, 8.39, 0.56, 0.02, 0.06, 1.01, 2.0, 0.27, 0.8, 1.95, 17.53, 0.67, 4.01, 0.76, 3.02, 5.04, 2.33, 7.88, 0.42, 6.49, 1.83, 3.5, 1.59, -0.09, 11.69, 2.07, 6.5, 1.1, 2.83, 2.3, 1.97, 2.91, 1.66]} \ No newline at end of file diff --git a/annotations_1/vqxbLAcIgiw_filtered.json b/annotations_1/vqxbLAcIgiw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b53e993f0c92c241ffc683b1032a63d93d2517f3 --- /dev/null +++ b/annotations_1/vqxbLAcIgiw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 13.37], [24.0, 24.7], [39.0, 39.51], [41.0, 59.1]], "keep_status": [false, false, false, true], "silence_prob": [30.89, 0.0, 0.0, 28.78], "audiomae_on_audioset": [[["hum", 44.15], ["mains hum", 32.87], ["throbbing", 10.07]], null, null, [["music", 22.7], ["speech", 16.57], ["ding", 10.64]]], "duration": [8.37, 0.7, 0.51, 18.1]} \ No newline at end of file diff --git a/annotations_1/vr2jJkcTcxk_filtered.json b/annotations_1/vr2jJkcTcxk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fdff62e0c6961f4f97a27ff797329f9dbd97a63 --- /dev/null +++ b/annotations_1/vr2jJkcTcxk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 18.22], [19.0, 20.01], [21.0, 23.19], [24.0, 24.95], [26.0, 26.35], [29.0, 29.12], [30.0, 31.68], [32.0, 34.64], [37.0, 37.84], [38.0, 39.75], [41.0, 42.72], [44.0, 44.66], [45.0, 46.9], [49.0, 51.22], [53.0, 55.58], [57.0, 58.4], [60.0, 63.1], [65.0, 66.12], [67.0, 68.12], [74.0, 75.59], [79.0, 79.15], [79.0, 83.27], [86.0, 86.91], [87.0, 87.66], [89.0, 89.43], [91.0, 95.42], [96.0, 96.4], [97.0, 98.09], [100.0, 100.62], [102.0, 106.08], [107.0, 108.18], [112.0, 115.72], [117.0, 122.98], [124.0, 125.1]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.64, 0.0, 76.53, 0.0, 0.0, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 0.0, 62.27, 60.79, 0.0, 77.87, 0.0, 0.0, 0.0, 0.0, 39.35, 0.0, 0.0, 0.0, 77.7, 0.0, 0.0, 0.0, 85.35, 0.0, 57.56, 33.11, 0.0], "audiomae_on_audioset": [[["hum", 25.65], ["thunk", 21.15], ["throbbing", 7.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 70.42], ["speech synthesizer", 13.82], ["radio", 3.28]], null, null, null, null, null, null, null, null, null, null, [["music", 65.45], ["throbbing", 5.13], ["synthesizer", 4.29]], null], "duration": [7.22, 1.01, 2.19, 0.95, 0.35, 0.12, 1.68, 2.64, 0.84, 1.75, 1.72, 0.66, 1.9, 2.22, 2.58, 1.4, 3.1, 1.12, 1.12, 1.59, 0.15, 4.27, 0.91, 0.66, 0.43, 4.42, 0.4, 1.09, 0.62, 4.08, 1.18, 3.72, 5.98, 1.1]} \ No newline at end of file diff --git a/annotations_1/vrEjev5DoXc_filtered.json b/annotations_1/vrEjev5DoXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cedc7d461fbf25bbfb92c03e97c4bcca02a6be93 --- /dev/null +++ b/annotations_1/vrEjev5DoXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.67], [6.0, 7.84], [10.0, 11.38], [13.0, 13.47], [15.0, 16.06], [17.0, 18.15], [22.0, 23.03], [24.0, 25.84], [26.0, 27.31], [30.0, 30.75], [33.0, 74.88], [76.0, 76.84], [78.0, 81.43], [85.0, 85.72], [89.0, 92.5], [95.0, 96.43], [99.0, 100.31], [102.0, 105.29], [108.0, 113.59], [116.0, 121.8], [124.0, 130.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.42, 0.0, 34.46, 0.0, 0.0, 33.77, 34.57, 30.02, 28.96], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["mains hum", 41.49], ["hum", 24.06], ["music", 9.5]], null, [["sidetone", 36.63], ["speech", 16.21], ["mains hum", 12.51]], null, null, [["music", 34.44], ["hum", 14.07], ["breaking", 12.88]], [["music", 49.77], ["throbbing", 15.23], ["hum", 11.69]], [["music", 43.96], ["hum", 17.66], ["throbbing", 13.21]], [["music", 50.7], ["hum", 8.85], ["mains hum", 7.9]]], "duration": [0.67, 1.84, 1.38, 0.47, 1.06, 1.15, 1.03, 1.84, 1.31, 0.75, 41.88, 0.84, 3.43, 0.72, 3.5, 1.43, 1.31, 3.29, 5.59, 5.8, 6.27]} \ No newline at end of file diff --git a/annotations_1/vrhgkmAzWvo_filtered.json b/annotations_1/vrhgkmAzWvo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc3201a3b5835ffe57a15678687a6f51e2ab3f14 --- /dev/null +++ b/annotations_1/vrhgkmAzWvo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.36], [18.0, 18.62], [33.0, 33.45], [49.0, 53.13], [55.0, 61.37], [62.0, 63.85], [66.0, 67.54], [82.0, 83.19], [87.0, 90.37], [92.0, 93.72], [95.0, 95.67], [97.0, 97.73], [100.0, 101.83], [107.0, 107.91], [108.0, 109.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 65.2, 72.46, 0.0, 0.0, 0.0, 94.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.36, 0.62, 0.45, 4.13, 6.37, 1.85, 1.54, 1.19, 3.37, 1.72, 0.67, 0.73, 1.83, 0.91, 1.88]} \ No newline at end of file diff --git a/annotations_1/vsQak7aKH30_filtered.json b/annotations_1/vsQak7aKH30_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1725cfaac4c3ff862f095e798aff17a3dee42b8 --- /dev/null +++ b/annotations_1/vsQak7aKH30_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.64], [6.0, 6.45], [8.0, 9.17], [15.0, 15.2], [20.0, 21.25], [23.0, 23.89], [25.0, 26.45], [29.0, 29.17], [38.0, 38.64], [55.0, 55.31], [77.0, 78.0], [87.0, 87.45], [103.0, 104.26], [117.0, 118.02], [124.0, 124.65], [125.0, 133.78], [134.0, 134.59], [135.0, 138.18], [140.0, 140.76], [142.0, 142.2], [144.0, 145.08], [150.0, 150.3], [156.0, 156.02], [157.0, 157.86], [159.0, 163.76], [165.0, 165.35], [166.0, 166.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.15, 0.0, 99.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.64, 0.45, 1.17, 0.2, 1.25, 0.89, 1.45, 0.17, 0.64, 0.31, 1.0, 0.45, 1.26, 1.02, 0.65, 8.78, 0.59, 3.18, 0.76, 0.2, 1.08, 0.3, 0.02, 0.86, 4.76, 0.35, 0.87]} \ No newline at end of file diff --git a/annotations_1/vsU27J8K3Tw_filtered.json b/annotations_1/vsU27J8K3Tw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..48e8bb97c11485c63738e6403515dc3837aba84c --- /dev/null +++ b/annotations_1/vsU27J8K3Tw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[58.0, 66.33], [67.0, 75.68], [77.0, 78.73], [79.0, 81.63], [83.0, 85.41], [87.0, 89.01]], "keep_status": [false, true, false, false, true, false], "silence_prob": [50.06, 48.61, 0.0, 51.34, 38.02, 54.36], "audiomae_on_audioset": [null, [["speech", 38.79], ["sidetone", 15.27], ["hum", 7.92]], null, null, [["whale vocalization", 29.55], ["hum", 15.38], ["music", 8.86]], null], "duration": [8.33, 8.68, 1.73, 2.63, 2.41, 2.01]} \ No newline at end of file diff --git a/annotations_1/vubylfvbMhk_filtered.json b/annotations_1/vubylfvbMhk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c949821bd2fec50aac22dd28bbf71c547178b297 --- /dev/null +++ b/annotations_1/vubylfvbMhk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.65], [24.0, 25.15], [30.0, 30.48], [40.0, 42.25], [53.0, 52.86], [53.0, 53.7], [74.0, 74.46], [77.0, 80.59], [82.0, 94.66], [110.0, 110.67], [112.0, 112.48], [113.0, 113.81]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [92.8, 0.0, 0.0, 87.55, 0.0, 0.0, 0.0, 44.6, 31.33, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 43.99], ["fly, housefly", 6.36], ["theremin", 4.57]], [["speech", 38.34], ["music", 15.49], ["boing", 10.49]], null, null, null], "duration": [2.65, 1.15, 0.48, 2.25, -0.14, 0.7, 0.46, 3.59, 12.66, 0.67, 0.48, 0.81]} \ No newline at end of file diff --git a/annotations_1/vvBW4Szes1U_filtered.json b/annotations_1/vvBW4Szes1U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6511a13cf43d85684ca419ada207e1d21a73128c --- /dev/null +++ b/annotations_1/vvBW4Szes1U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.44], [3.0, 4.35], [6.0, 10.54], [11.0, 15.62], [18.0, 18.32], [19.0, 20.33], [21.0, 22.47], [23.0, 24.85], [26.0, 28.61], [29.0, 31.24], [32.0, 37.29], [38.0, 40.86], [42.0, 43.85], [45.0, 45.17], [46.0, 47.78], [49.0, 50.97], [52.0, 53.97], [55.0, 64.13], [66.0, 72.03], [73.0, 74.33], [75.0, 77.62], [78.0, 105.16], [106.0, 108.38], [109.0, 113.31], [115.0, 119.75], [120.0, 119.87], [122.0, 129.24], [131.0, 130.98]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, true, false], "silence_prob": [0.0, 0.0, 37.09, 42.69, 0.0, 0.0, 0.0, 0.0, 43.93, 69.61, 65.09, 66.63, 0.0, 0.0, 0.0, 0.0, 0.0, 50.91, 53.34, 0.0, 41.81, 34.74, 42.6, 44.69, 37.64, 0.0, 32.06, 0.0], "audiomae_on_audioset": [null, null, [["cough", 18.66], ["throat clearing", 16.77], ["music", 15.26]], [["speech", 48.93], ["music", 27.22], ["inside, small room", 2.96]], null, null, null, null, [["music", 36.7], ["hum", 13.84], ["speech", 12.62]], null, null, null, null, null, null, null, null, null, null, null, [["music", 39.87], ["crushing", 23.11], ["musical instrument", 2.54]], [["music", 59.2], ["hum", 8.43], ["keyboard (musical)", 3.74]], [["music", 50.15], ["musical instrument", 7.08], ["synthesizer", 3.67]], [["music", 65.65], ["didgeridoo", 7.98], ["musical instrument", 4.87]], [["music", 46.8], ["synthesizer", 11.1], ["theremin", 6.18]], null, [["music", 52.09], ["synthesizer", 6.68], ["musical instrument", 5.6]], null], "duration": [0.44, 1.35, 4.54, 4.62, 0.32, 1.33, 1.47, 1.85, 2.61, 2.24, 5.29, 2.86, 1.85, 0.17, 1.78, 1.97, 1.97, 9.13, 6.03, 1.33, 2.62, 27.16, 2.38, 4.31, 4.75, -0.13, 7.24, -0.02]} \ No newline at end of file diff --git a/annotations_1/vw44oj_STSw_filtered.json b/annotations_1/vw44oj_STSw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d8b7748abea6094981f477224b274c66b6441d6d --- /dev/null +++ b/annotations_1/vw44oj_STSw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.34], [29.0, 29.67], [35.0, 35.02], [35.0, 35.24], [36.0, 36.56], [43.0, 43.61], [50.0, 51.19], [69.0, 69.9], [70.0, 70.28], [70.0, 71.0], [72.0, 72.76], [78.0, 78.9], [80.0, 80.72], [85.0, 85.23], [96.0, 97.06], [98.0, 98.54], [100.0, 100.8], [112.0, 112.85], [114.0, 114.54], [118.0, 118.23], [130.0, 131.08], [135.0, 137.34], [138.0, 138.43], [140.0, 141.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.73, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.34, 0.67, 0.02, 0.24, 0.56, 0.61, 1.19, 0.9, 0.28, 1.0, 0.76, 0.9, 0.72, 0.23, 1.06, 0.54, 0.8, 0.85, 0.54, 0.23, 1.08, 2.34, 0.43, 1.17]} \ No newline at end of file diff --git a/annotations_1/vwbryjr2BKg_filtered.json b/annotations_1/vwbryjr2BKg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5ba5ced131f433748e7bc8930877d68bf5283bf7 --- /dev/null +++ b/annotations_1/vwbryjr2BKg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.65], [7.0, 7.2], [10.0, 11.33], [16.0, 16.75], [18.0, 19.5], [23.0, 24.09], [43.0, 44.56], [52.0, 52.88], [53.0, 53.43], [54.0, 54.87], [58.0, 59.19], [60.0, 61.37], [62.0, 67.31], [68.0, 71.36], [74.0, 74.11], [76.0, 77.41], [78.0, 78.95], [80.0, 97.65], [99.0, 99.5], [101.0, 102.83], [105.0, 106.71], [109.0, 109.97], [112.0, 112.78], [115.0, 116.6], [120.0, 119.75], [126.0, 128.51], [129.0, 135.31], [136.0, 137.79], [138.0, 144.42], [145.0, 149.08], [151.0, 150.8], [152.0, 153.37], [154.0, 154.53], [155.0, 158.8], [161.0, 163.04], [164.0, 164.4], [166.0, 167.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44, 99.71, 0.0, 0.0, 0.0, 99.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 98.73, 0.0, 95.09, 98.36, 0.0, 0.0, 0.0, 91.13, 73.67, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.65, 0.2, 1.33, 0.75, 1.5, 1.09, 1.56, 0.88, 0.43, 0.87, 1.19, 1.37, 5.31, 3.36, 0.11, 1.41, 0.95, 17.65, 0.5, 1.83, 1.71, 0.97, 0.78, 1.6, -0.25, 2.51, 6.31, 1.79, 6.42, 4.08, -0.2, 1.37, 0.53, 3.8, 2.04, 0.4, 1.39]} \ No newline at end of file diff --git a/annotations_1/vxFr0xNspFU_filtered.json b/annotations_1/vxFr0xNspFU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2e18c5324c14ea52e75efc134fe49c89efe7896 --- /dev/null +++ b/annotations_1/vxFr0xNspFU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 8.13], [13.0, 22.23], [24.0, 30.64], [31.0, 32.88], [38.0, 39.04], [41.0, 42.69], [43.0, 44.88], [45.0, 50.84]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [45.4, 33.6, 46.19, 0.0, 0.0, 0.0, 0.0, 38.58], "audiomae_on_audioset": [[["music", 47.65], ["squish", 13.02], ["whale vocalization", 9.64]], [["music", 79.41], ["breaking", 5.05], ["buzz", 2.41]], [["music", 56.03], ["whale vocalization", 17.5], ["pour", 3.35]], null, null, null, null, [["music", 50.6], ["whale vocalization", 15.19], ["speech", 7.6]]], "duration": [2.13, 9.23, 6.64, 1.88, 1.04, 1.69, 1.88, 5.84]} \ No newline at end of file diff --git a/annotations_1/vyb2Imfghkg_filtered.json b/annotations_1/vyb2Imfghkg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..517cd324e6771a759e1fe189a8541ac1f40e5e90 --- /dev/null +++ b/annotations_1/vyb2Imfghkg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.52], [11.0, 15.28], [16.0, 17.15], [17.0, 24.73], [27.0, 29.44], [37.0, 42.48], [43.0, 48.96], [54.0, 54.51], [57.0, 57.57], [60.0, 60.34], [62.0, 62.73], [71.0, 71.85], [75.0, 82.36], [87.0, 87.74], [91.0, 91.27], [92.0, 93.34], [94.0, 94.71], [97.0, 98.74], [101.0, 100.97], [102.0, 103.06], [104.0, 104.33], [106.0, 106.91], [109.0, 109.43], [119.0, 119.18], [126.0, 130.18], [131.0, 132.22], [134.0, 133.62], [136.0, 138.47], [140.0, 142.92], [145.0, 146.16], [151.0, 154.4], [155.0, 156.49], [157.0, 157.0], [159.0, 160.98], [169.0, 173.01]], "keep_status": [true, true, false, false, true, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, true, false, false, false, true], "silence_prob": [46.75, 43.2, 0.0, 32.05, 37.09, 42.81, 31.82, 0.0, 0.0, 0.0, 0.0, 0.0, 37.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.65, 0.0, 0.0, 74.92, 49.68, 0.0, 46.79, 0.0, 0.0, 0.0, 42.67], "audiomae_on_audioset": [[["music", 42.79], ["speech", 4.9], ["animal", 4.44]], [["music", 55.19], ["glockenspiel", 4.22], ["speech", 4.02]], null, [["music", 69.27], ["speech", 7.18], ["theremin", 4.52]], [["music", 35.64], ["speech", 12.22], ["foghorn", 9.16]], [["music", 27.16], ["speech", 6.64], ["brass instrument", 6.14]], [["music", 30.44], ["speech", 25.71], ["foghorn", 8.69]], null, null, null, null, null, [["music", 53.23], ["synthesizer", 10.58], ["musical instrument", 3.88]], null, null, null, null, null, null, null, null, null, null, null, [["music", 57.76], ["theremin", 5.93], ["synthesizer", 4.04]], null, null, null, [["mosquito", 32.52], ["fly, housefly", 12.23], ["music", 7.9]], null, [["music", 35.95], ["speech", 7.54], ["didgeridoo", 5.64]], null, null, null, [["music", 34.08], ["mains hum", 13.89], ["hum", 10.44]]], "duration": [2.52, 4.28, 1.15, 7.73, 2.44, 5.48, 5.96, 0.51, 0.57, 0.34, 0.73, 0.85, 7.36, 0.74, 0.27, 1.34, 0.71, 1.74, -0.03, 1.06, 0.33, 0.91, 0.43, 0.18, 4.18, 1.22, -0.38, 2.47, 2.92, 1.16, 3.4, 1.49, 0.0, 1.98, 4.01]} \ No newline at end of file diff --git a/annotations_1/vzzuOkCkHlQ_filtered.json b/annotations_1/vzzuOkCkHlQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..65c6a6406a0bbfac54e5a89b899f197bfb717f59 --- /dev/null +++ b/annotations_1/vzzuOkCkHlQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 4.92], [9.0, 10.0], [11.0, 11.72], [13.0, 13.9], [15.0, 16.78], [18.0, 18.72], [21.0, 22.37], [23.0, 38.08], [40.0, 40.14], [49.0, 49.94], [61.0, 74.26], [81.0, 82.14], [83.0, 83.54], [86.0, 86.27]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.28, 0.0, 0.0, 36.53, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["insect", 12.22], ["fly, housefly", 11.09], ["wild animals", 10.65]], null, null, [["music", 37.08], ["speech", 25.07], ["ice cream truck, ice cream van", 12.24]], null, null, null], "duration": [-0.08, 1.0, 0.72, 0.9, 1.78, 0.72, 1.37, 15.08, 0.14, 0.94, 13.26, 1.14, 0.54, 0.27]} \ No newline at end of file diff --git a/annotations_1/w-6lVMklaKY_filtered.json b/annotations_1/w-6lVMklaKY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7d437dc150cc64a07e68ce943fe6c90892a8cc5 --- /dev/null +++ b/annotations_1/w-6lVMklaKY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 61.23], [61.0, 63.81], [64.0, 65.08], [69.0, 69.3], [72.0, 73.14], [79.0, 89.94], [91.0, 91.57], [94.0, 95.05], [96.0, 100.72], [102.0, 107.89], [109.0, 109.49], [111.0, 114.57], [118.0, 117.95], [119.0, 123.18], [127.0, 130.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [36.94, 41.93, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 99.99, 0.0, 100.0, 0.0, 100.0, 100.0], "audiomae_on_audioset": [[["hum", 54.71], ["mains hum", 18.63], ["throbbing", 17.3]], [["speech", 71.15], ["sidetone", 8.02], ["music", 3.84]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [20.23, 2.81, 1.08, 0.3, 1.14, 10.94, 0.57, 1.05, 4.72, 5.89, 0.49, 3.57, -0.05, 4.18, 3.06]} \ No newline at end of file diff --git a/annotations_1/w0qfQaJtF2E_filtered.json b/annotations_1/w0qfQaJtF2E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1e77e59f2898dff492399ea760fa11f0d7e1aa9 --- /dev/null +++ b/annotations_1/w0qfQaJtF2E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 55.21], [58.0, 69.79], [72.0, 97.61], [99.0, 113.66], [117.0, 130.57], [134.0, 140.9]], "keep_status": [false, true, false, true, false, false], "silence_prob": [31.55, 30.09, 37.24, 35.24, 34.3, 34.27], "audiomae_on_audioset": [[["music", 71.07], ["scary music", 6.23], ["hum", 3.79]], [["music", 37.03], ["speech", 14.29], ["thump, thud", 13.52]], [["music", 53.39], ["hum", 18.8], ["mains hum", 4.92]], [["music", 30.61], ["hum", 26.84], ["mains hum", 11.86]], [["music", 66.17], ["speech", 12.47], ["electronic music", 3.98]], [["music", 48.52], ["hum", 15.07], ["mains hum", 9.42]]], "duration": [21.21, 11.79, 25.61, 14.66, 13.57, 6.9]} \ No newline at end of file diff --git a/annotations_1/w3hwZ-7CWeg_filtered.json b/annotations_1/w3hwZ-7CWeg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1ccdd586fd5d403978351b95f4aa2bdbf50babae --- /dev/null +++ b/annotations_1/w3hwZ-7CWeg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 24.49], [25.0, 28.59], [29.0, 50.8], [51.0, 108.28], [111.0, 116.99], [118.0, 120.01], [121.0, 126.23], [128.0, 132.54]], "keep_status": [true, false, true, false, false, false, true, false], "silence_prob": [43.03, 41.93, 44.72, 0.0, 63.64, 97.64, 30.25, 30.48], "audiomae_on_audioset": [[["hum", 34.0], ["mains hum", 17.93], ["music", 9.69]], [["hum", 43.9], ["mains hum", 19.96], ["sidetone", 10.82]], [["hum", 38.27], ["speech", 20.81], ["whale vocalization", 7.59]], null, null, null, [["animal", 24.61], ["speech", 20.09], ["dog", 19.03]], [["dog", 29.15], ["animal", 25.67], ["domestic animals, pets", 19.44]]], "duration": [15.49, 3.59, 21.8, 57.28, 5.99, 2.01, 5.23, 4.54]} \ No newline at end of file diff --git a/annotations_1/w424xCe0eGQ_filtered.json b/annotations_1/w424xCe0eGQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aa9afa5f95c6441817fe64ee5e53cf8366429b8d --- /dev/null +++ b/annotations_1/w424xCe0eGQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.79], [4.0, 5.26], [7.0, 9.26], [14.0, 16.31], [19.0, 19.58], [23.0, 25.69], [26.0, 27.77], [30.0, 32.46], [33.0, 33.61], [36.0, 36.05], [39.0, 40.71], [41.0, 50.92], [54.0, 56.84], [59.0, 61.55], [64.0, 65.72], [67.0, 68.79], [71.0, 74.95], [77.0, 76.77], [79.0, 83.96], [89.0, 91.03], [95.0, 95.22], [97.0, 102.74], [105.0, 107.16], [111.0, 135.97], [138.0, 140.19], [141.0, 145.61]], "keep_status": [false, false, false, true, false, false, false, true, false, false, false, false, true, false, false, false, true, false, true, true, false, true, true, false, false, true], "silence_prob": [0.0, 0.0, 40.17, 39.11, 0.0, 40.52, 0.0, 42.0, 0.0, 0.0, 0.0, 33.58, 34.37, 35.15, 0.0, 0.0, 37.43, 0.0, 32.36, 30.64, 0.0, 31.89, 33.86, 31.99, 35.59, 38.59], "audiomae_on_audioset": [null, null, [["music", 37.83], ["speech", 28.92], ["hum", 8.84]], [["hum", 32.74], ["throbbing", 18.48], ["music", 16.93]], null, [["speech", 40.59], ["music", 35.71], ["hum", 7.84]], null, [["music", 35.37], ["didgeridoo", 14.97], ["theremin", 7.62]], null, null, null, [["music", 40.22], ["synthesizer", 21.26], ["speech", 8.89]], [["music", 45.27], ["marimba, xylophone", 6.59], ["musical instrument", 5.59]], [["music", 59.47], ["speech", 9.31], ["musical instrument", 4.82]], null, null, [["music", 44.85], ["speech", 15.82], ["hum", 5.17]], null, [["music", 34.43], ["speech", 6.69], ["quack", 5.86]], [["music", 51.5], ["vibraphone", 10.14], ["musical instrument", 7.89]], null, [["music", 54.26], ["musical instrument", 11.18], ["harmonic", 3.97]], [["music", 37.49], ["percussion", 10.88], ["musical instrument", 9.78]], [["music", 68.82], ["musical instrument", 7.71], ["marimba, xylophone", 1.68]], [["music", 48.22], ["throbbing", 19.11], ["hum", 11.09]], [["music", 23.91], ["vibraphone", 19.93], ["marimba, xylophone", 14.16]]], "duration": [0.79, 1.26, 2.26, 2.31, 0.58, 2.69, 1.77, 2.46, 0.61, 0.05, 1.71, 9.92, 2.84, 2.55, 1.72, 1.79, 3.95, -0.23, 4.96, 2.03, 0.22, 5.74, 2.16, 24.97, 2.19, 4.61]} \ No newline at end of file diff --git a/annotations_1/w4TCxFKaqIw_filtered.json b/annotations_1/w4TCxFKaqIw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ac71cfe1770390f8d6b553ce31058a3d71af2c42 --- /dev/null +++ b/annotations_1/w4TCxFKaqIw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 27.4], [29.0, 29.86], [31.0, 32.54], [33.0, 34.13], [36.0, 45.18], [46.0, 47.24], [52.0, 53.42], [58.0, 61.38], [63.0, 63.46], [67.0, 69.43], [70.0, 73.79], [74.0, 76.4], [77.0, 79.69], [83.0, 83.83], [92.0, 92.43], [97.0, 97.44], [98.0, 98.46], [99.0, 99.89], [101.0, 102.32], [104.0, 104.8], [106.0, 106.51]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [36.31, 0.0, 0.0, 0.0, 70.02, 0.0, 0.0, 33.71, 0.0, 36.78, 42.91, 39.22, 36.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 61.32], ["knock", 11.39], ["brass instrument", 3.79]], null, null, null, null, null, null, [["throbbing", 19.78], ["speech", 8.37], ["heart sounds, heartbeat", 6.49]], null, [["speech", 47.44], ["radio", 26.04], ["vehicle", 4.5]], [["speech", 41.07], ["music", 27.18], ["hum", 8.78]], [["hum", 20.39], ["mains hum", 17.61], ["didgeridoo", 13.11]], [["speech", 36.13], ["music", 23.45], ["didgeridoo", 9.68]], null, null, null, null, null, null, null, null], "duration": [5.4, 0.86, 1.54, 1.13, 9.18, 1.24, 1.42, 3.38, 0.46, 2.43, 3.79, 2.4, 2.69, 0.83, 0.43, 0.44, 0.46, 0.89, 1.32, 0.8, 0.51]} \ No newline at end of file diff --git a/annotations_1/w5mtX7FnO3M_filtered.json b/annotations_1/w5mtX7FnO3M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e7d19a7c8d3684f230d69bb1a174b8740f307588 --- /dev/null +++ b/annotations_1/w5mtX7FnO3M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.33], [5.0, 5.39], [6.0, 7.25], [8.0, 8.4], [10.0, 22.28], [23.0, 24.92], [28.0, 44.41], [48.0, 48.88], [50.0, 50.99], [52.0, 53.38], [55.0, 55.39], [57.0, 56.96], [59.0, 61.52], [63.0, 79.07], [80.0, 106.93], [110.0, 113.66], [115.0, 117.66], [120.0, 121.51], [122.0, 122.1], [122.0, 125.44], [133.0, 133.68], [136.0, 136.22], [140.0, 140.53], [142.0, 147.92], [150.0, 151.85], [152.0, 160.73], [162.0, 162.36], [163.0, 171.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.98, 0.0, 0.0, 0.0, 87.55, 0.0, 92.31, 0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 93.6, 98.27, 90.78, 98.51, 0.0, 0.0, 94.95, 0.0, 0.0, 0.0, 71.87, 0.0, 73.36, 0.0, 60.7], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.33, 0.39, 1.25, 0.4, 12.28, 1.92, 16.41, 0.88, 0.99, 1.38, 0.39, -0.04, 2.52, 16.07, 26.93, 3.66, 2.66, 1.51, 0.1, 3.44, 0.68, 0.22, 0.53, 5.92, 1.85, 8.73, 0.36, 8.05]} \ No newline at end of file diff --git a/annotations_1/w5oWgKtku3Q_filtered.json b/annotations_1/w5oWgKtku3Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f900a93fea05cb3652e0d851362bd923d4f275aa --- /dev/null +++ b/annotations_1/w5oWgKtku3Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.45], [8.0, 7.52], [8.0, 9.44], [19.0, 21.34], [22.0, 24.75], [26.0, 29.54], [30.0, 41.82], [42.0, 42.55], [48.0, 49.17], [50.0, 54.53], [57.0, 57.35], [63.0, 68.79], [78.0, 79.15], [82.0, 83.83], [87.0, 89.58], [90.0, 94.73], [96.0, 108.46], [109.0, 113.54], [115.0, 118.18], [122.0, 122.49], [124.0, 124.31]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 54.17, 97.54, 70.16, 31.26, 0.0, 0.0, 47.94, 0.0, 76.86, 0.0, 0.0, 83.52, 43.71, 30.25, 28.99, 29.14, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["fart", 28.45], ["whack, thwack", 17.1], ["speech", 6.04]], null, null, [["speech", 39.31], ["sine wave", 23.58], ["chirp tone", 10.52]], null, null, null, null, null, [["music", 33.22], ["speech", 29.15], ["musical instrument", 5.9]], [["heart sounds, heartbeat", 59.04], ["throbbing", 16.01], ["hum", 8.7]], [["hum", 50.34], ["throbbing", 33.94], ["speech", 6.91]], [["hum", 40.08], ["throbbing", 27.44], ["music", 11.86]], null, null], "duration": [0.45, -0.48, 1.44, 2.34, 2.75, 3.54, 11.82, 0.55, 1.17, 4.53, 0.35, 5.79, 1.15, 1.83, 2.58, 4.73, 12.46, 4.54, 3.18, 0.49, 0.31]} \ No newline at end of file diff --git a/annotations_1/w5yJV_TKOWg_filtered.json b/annotations_1/w5yJV_TKOWg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..185fa79e73dc75766f0531f8c871cf9ad04f2961 --- /dev/null +++ b/annotations_1/w5yJV_TKOWg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.71], [2.0, 4.4], [5.0, 6.32], [26.0, 43.41], [45.0, 45.52], [47.0, 48.36], [51.0, 51.29], [53.0, 56.74], [67.0, 68.66], [70.0, 95.88], [97.0, 97.58], [99.0, 107.01], [110.0, 111.27], [114.0, 121.09]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, true, false, true], "silence_prob": [0.0, 58.64, 0.0, 29.63, 0.0, 0.0, 0.0, 28.74, 0.0, 28.8, 0.0, 28.59, 0.0, 28.73], "audiomae_on_audioset": [null, null, null, [["speech", 64.33], ["music", 11.25], ["hum", 5.16]], null, null, null, [["throbbing", 33.48], ["hum", 26.93], ["music", 17.35]], null, [["speech", 24.77], ["music", 21.28], ["outside, rural or natural", 7.04]], null, [["music", 30.67], ["speech", 20.92], ["groan", 5.44]], null, [["speech", 42.58], ["music", 6.83], ["explosion", 5.19]]], "duration": [0.71, 2.4, 1.32, 17.41, 0.52, 1.36, 0.29, 3.74, 1.66, 25.88, 0.58, 8.01, 1.27, 7.09]} \ No newline at end of file diff --git a/annotations_1/w6YTq-3hmnA_filtered.json b/annotations_1/w6YTq-3hmnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88d6fdb76fdeb5841fc91c40554eff10ad85be35 --- /dev/null +++ b/annotations_1/w6YTq-3hmnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.51], [9.0, 9.27], [14.0, 15.57], [18.0, 18.82], [31.0, 31.29], [33.0, 34.65], [76.0, 76.76], [82.0, 85.18], [93.0, 94.49], [101.0, 101.39], [105.0, 105.56], [114.0, 115.16], [118.0, 120.07]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.08, 0.0, 0.0, 0.0, 0.0, 48.95], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["breaking", 33.67], ["speech", 14.91], ["tuning fork", 12.92]], null, null, null, null, [["music", 62.23], ["throbbing", 5.61], ["hum", 3.09]]], "duration": [0.51, 0.27, 1.57, 0.82, 0.29, 1.65, 0.76, 3.18, 1.49, 0.39, 0.56, 1.16, 2.07]} \ No newline at end of file diff --git a/annotations_1/w6ivjvOqBy0_filtered.json b/annotations_1/w6ivjvOqBy0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..61b8baae16117694ea5b57ebe074f28b20b5ffa8 --- /dev/null +++ b/annotations_1/w6ivjvOqBy0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.29], [14.0, 15.58], [19.0, 18.72], [20.0, 20.95], [24.0, 24.63], [25.0, 25.86], [36.0, 36.66], [39.0, 43.31], [70.0, 71.29], [78.0, 78.83], [79.0, 80.38], [88.0, 91.66], [101.0, 101.04], [101.0, 101.73], [102.0, 102.68], [104.0, 103.89], [107.0, 115.33], [117.0, 121.56], [122.0, 122.66], [123.0, 134.35], [136.0, 138.89], [148.0, 164.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.8, 0.0, 0.0, 0.0, 32.1, 0.0, 0.0, 0.0, 0.0, 30.38, 31.12, 0.0, 28.97, 28.89, 29.1], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 51.8], ["thunk", 11.68], ["whack, thwack", 8.18]], null, null, null, [["music", 33.06], ["speech", 25.43], ["theremin", 10.59]], null, null, null, null, [["whale vocalization", 51.66], ["cattle, bovinae", 13.68], ["moo", 10.43]], [["speech", 47.45], ["music", 18.64], ["explosion", 7.85]], null, [["mosquito", 57.38], ["fly, housefly", 27.18], ["insect", 14.71]], [["speech", 58.46], ["vehicle", 10.17], ["car", 3.09]], [["livestock, farm animals, working animals", 41.32], ["cattle, bovinae", 17.85], ["moo", 13.53]]], "duration": [1.29, 1.58, -0.28, 0.95, 0.63, 0.86, 0.66, 4.31, 1.29, 0.83, 1.38, 3.66, 0.04, 0.73, 0.68, -0.11, 8.33, 4.56, 0.66, 11.35, 2.89, 16.73]} \ No newline at end of file diff --git a/annotations_1/w71pHLUz2i0_filtered.json b/annotations_1/w71pHLUz2i0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db33a535edc9f50ea7f500403ba8d725369b8be8 --- /dev/null +++ b/annotations_1/w71pHLUz2i0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.43], [6.0, 8.58], [10.0, 10.25], [14.0, 14.89], [16.0, 18.55], [20.0, 20.55], [21.0, 21.36], [23.0, 23.89], [31.0, 31.56], [32.0, 35.67], [44.0, 44.37], [46.0, 47.87], [53.0, 54.46], [62.0, 63.21], [65.0, 66.82], [69.0, 76.5], [84.0, 88.01], [89.0, 91.05], [92.0, 97.23], [102.0, 111.94], [115.0, 116.53], [121.0, 121.34], [122.0, 123.33], [125.0, 126.57], [129.0, 130.45], [132.0, 133.34], [134.0, 136.38], [137.0, 137.76], [138.0, 138.74]], "keep_status": [false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 33.35, 0.0, 0.0, 29.99, 0.0, 0.0, 0.0, 0.0, 30.55, 0.0, 0.0, 0.0, 0.0, 0.0, 33.25, 50.91, 44.34, 41.5, 32.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 69.88, 0.0, 0.0], "audiomae_on_audioset": [null, [["throbbing", 34.63], ["hum", 14.15], ["music", 11.36]], null, null, [["speech", 37.42], ["boing", 19.26], ["music", 14.68]], null, null, null, null, [["music", 27.3], ["speech", 22.08], ["boing", 20.32]], null, null, null, null, null, [["boing", 43.5], ["speech", 25.43], ["music", 15.83]], null, [["music", 66.59], ["didgeridoo", 3.65], ["musical instrument", 2.62]], [["music", 45.92], ["speech", 16.95], ["hum", 9.86]], [["mosquito", 21.4], ["music", 15.77], ["fly, housefly", 8.58]], null, null, null, null, null, null, null, null, null], "duration": [0.43, 2.58, 0.25, 0.89, 2.55, 0.55, 0.36, 0.89, 0.56, 3.67, 0.37, 1.87, 1.46, 1.21, 1.82, 7.5, 4.01, 2.05, 5.23, 9.94, 1.53, 0.34, 1.33, 1.57, 1.45, 1.34, 2.38, 0.76, 0.74]} \ No newline at end of file diff --git a/annotations_1/w80ZSg7kNbE_filtered.json b/annotations_1/w80ZSg7kNbE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3ed5cb3757aae95ea5319557abd9cb65bc95c21 --- /dev/null +++ b/annotations_1/w80ZSg7kNbE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.89], [11.0, 14.0], [16.0, 17.41], [18.0, 19.25], [20.0, 21.39], [25.0, 26.96], [45.0, 45.47], [49.0, 58.95], [59.0, 71.36], [73.0, 74.58], [76.0, 77.03], [78.0, 78.04], [80.0, 85.58], [87.0, 87.84], [90.0, 92.82], [93.0, 94.51], [98.0, 99.1], [104.0, 110.56], [111.0, 123.47]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 93.76, 0.0, 0.0, 0.0, 0.0, 0.0, 30.78, 33.69, 0.0, 0.0, 0.0, 99.93, 0.0, 88.28, 0.0, 0.0, 87.37, 52.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 47.06], ["brass instrument", 5.38], ["trombone", 4.37]], [["music", 63.56], ["musical instrument", 4.84], ["effects unit", 4.21]], null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 3.0, 1.41, 1.25, 1.39, 1.96, 0.47, 9.95, 12.36, 1.58, 1.03, 0.04, 5.58, 0.84, 2.82, 1.51, 1.1, 6.56, 12.47]} \ No newline at end of file diff --git a/annotations_1/w80bZTK88mc_filtered.json b/annotations_1/w80bZTK88mc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3fe8b9147fc7627ba8e8f25387601c16d0775c6e --- /dev/null +++ b/annotations_1/w80bZTK88mc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 19.67], [21.0, 24.92], [26.0, 43.92]], "keep_status": [false, false, true], "silence_prob": [0.0, 100.0, 48.35], "audiomae_on_audioset": [null, null, [["speech", 31.98], ["insect", 11.24], ["cricket", 10.61]]], "duration": [0.67, 3.92, 17.92]} \ No newline at end of file diff --git a/annotations_1/w86nTX6Iixo_filtered.json b/annotations_1/w86nTX6Iixo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60880ae2df0e1339ac4d6aa4b397cbd925cd31e1 --- /dev/null +++ b/annotations_1/w86nTX6Iixo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.93], [5.0, 8.61], [11.0, 30.99], [32.0, 32.97], [35.0, 34.67], [36.0, 36.63], [37.0, 37.76], [38.0, 40.26], [42.0, 42.48], [44.0, 48.47], [50.0, 49.86], [50.0, 51.38], [55.0, 56.1], [59.0, 61.94], [62.0, 63.54], [64.0, 65.2], [71.0, 81.73], [82.0, 82.56], [86.0, 86.46], [89.0, 92.08], [94.0, 98.79], [102.0, 102.76], [109.0, 110.52], [111.0, 112.19], [115.0, 116.13], [129.0, 131.62], [135.0, 135.3]], "keep_status": [false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 33.14, 31.55, 0.0, 0.0, 0.0, 0.0, 82.25, 0.0, 50.71, 0.0, 0.0, 0.0, 96.89, 0.0, 0.0, 74.92, 0.0, 0.0, 31.43, 34.49, 0.0, 0.0, 0.0, 0.0, 50.66, 0.0], "audiomae_on_audioset": [null, [["speech", 43.71], ["music", 16.66], ["groan", 3.14]], [["music", 37.31], ["buzz", 14.9], ["didgeridoo", 5.3]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.89], ["theremin", 8.85], ["whale vocalization", 4.49]], [["music", 47.81], ["theremin", 6.43], ["crowd", 4.5]], null, null, null, null, null, null], "duration": [-0.07, 3.61, 19.99, 0.97, -0.33, 0.63, 0.76, 2.26, 0.48, 4.47, -0.14, 1.38, 1.1, 2.94, 1.54, 1.2, 10.73, 0.56, 0.46, 3.08, 4.79, 0.76, 1.52, 1.19, 1.13, 2.62, 0.3]} \ No newline at end of file diff --git a/annotations_1/w8mbmSijd4o_filtered.json b/annotations_1/w8mbmSijd4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9ba619410341bb870e6b8df835be4928a0476913 --- /dev/null +++ b/annotations_1/w8mbmSijd4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.17], [24.0, 26.1], [28.0, 28.66], [29.0, 33.88], [35.0, 41.27], [44.0, 44.74], [46.0, 48.03], [49.0, 49.99], [51.0, 53.25], [57.0, 60.4], [61.0, 60.84], [63.0, 63.53], [69.0, 68.99], [72.0, 71.95], [85.0, 86.56], [89.0, 90.0], [94.0, 94.74], [101.0, 102.22], [105.0, 105.61], [107.0, 107.82], [110.0, 110.22], [111.0, 119.2], [120.0, 129.07], [131.0, 133.35], [133.0, 133.39], [136.0, 136.04], [140.0, 141.52], [145.0, 146.18], [149.0, 149.32], [151.0, 151.14], [153.0, 153.28], [154.0, 154.3], [156.0, 155.87], [157.0, 157.54], [158.0, 158.52], [162.0, 161.97], [163.0, 163.98], [165.0, 165.65], [169.0, 177.36], [179.0, 179.78], [182.0, 182.02], [183.0, 184.35]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.27, 0.0, 33.84, 63.31, 0.0, 65.79, 0.0, 97.83, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.34, 100.0, 46.83, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.26, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 41.22], ["musical instrument", 15.65], ["didgeridoo", 11.8]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.31], ["sidetone", 22.02], ["radio", 20.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.17, 2.1, 0.66, 4.88, 6.27, 0.74, 2.03, 0.99, 2.25, 3.4, -0.16, 0.53, -0.01, -0.05, 1.56, 1.0, 0.74, 1.22, 0.61, 0.82, 0.22, 8.2, 9.07, 2.35, 0.39, 0.04, 1.52, 1.18, 0.32, 0.14, 0.28, 0.3, -0.13, 0.54, 0.52, -0.03, 0.98, 0.65, 8.36, 0.78, 0.02, 1.35]} \ No newline at end of file diff --git a/annotations_1/w9-ylaUijdc_filtered.json b/annotations_1/w9-ylaUijdc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..896ee89d3046fffcc048acd97e52058c540f1dfd --- /dev/null +++ b/annotations_1/w9-ylaUijdc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 27.99], [29.0, 29.91], [33.0, 36.85], [39.0, 41.45], [42.0, 44.42], [48.0, 49.94], [53.0, 56.05], [58.0, 58.13], [64.0, 64.83], [66.0, 68.69], [73.0, 73.3], [76.0, 77.75], [82.0, 82.56], [86.0, 87.57], [90.0, 90.88], [93.0, 93.82], [95.0, 95.76], [97.0, 97.75], [99.0, 98.95], [100.0, 101.11], [102.0, 102.34], [119.0, 119.03], [121.0, 121.64], [126.0, 126.79], [128.0, 128.49], [134.0, 134.77], [145.0, 146.42], [148.0, 148.56], [152.0, 152.29], [157.0, 158.97], [162.0, 162.6], [163.0, 170.43], [173.0, 173.31], [174.0, 175.07]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.94, 0.0, 59.59, 50.86, 41.76, 0.0, 90.25, 0.0, 0.0, 47.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.72, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.14], ["throbbing", 18.74], ["hum", 18.2]], null, null, null, [["speech", 15.02], ["reverberation", 8.0], ["effects unit", 5.3]], null, null, null, null, [["speech", 37.18], ["dial tone", 12.53], ["sidetone", 9.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 60.48], ["musical instrument", 12.0], ["didgeridoo", 5.57]], null, null], "duration": [24.99, 0.91, 3.85, 2.45, 2.42, 1.94, 3.05, 0.13, 0.83, 2.69, 0.3, 1.75, 0.56, 1.57, 0.88, 0.82, 0.76, 0.75, -0.05, 1.11, 0.34, 0.03, 0.64, 0.79, 0.49, 0.77, 1.42, 0.56, 0.29, 1.97, 0.6, 7.43, 0.31, 1.07]} \ No newline at end of file diff --git a/annotations_1/w98xbfLGWro_filtered.json b/annotations_1/w98xbfLGWro_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca8bd7c2d50591c94e56ce55cf5a87733451925b --- /dev/null +++ b/annotations_1/w98xbfLGWro_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 21.27], [22.0, 29.19], [31.0, 31.02], [32.0, 33.4], [35.0, 35.87], [37.0, 37.71], [38.0, 38.74], [39.0, 40.29], [43.0, 43.56], [46.0, 47.49], [49.0, 51.75], [54.0, 54.75], [55.0, 56.1], [57.0, 59.29], [62.0, 65.77], [67.0, 67.8], [82.0, 83.62], [88.0, 90.64], [93.0, 93.8], [96.0, 96.38], [97.0, 98.85], [109.0, 109.49], [115.0, 117.71], [119.0, 119.67], [121.0, 124.02], [126.0, 126.45], [127.0, 127.85], [129.0, 133.54], [135.0, 136.29], [139.0, 142.77], [143.0, 144.51], [145.0, 147.18], [148.0, 150.52], [151.0, 152.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [56.48, 82.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.64, 0.0, 0.0, 99.44, 98.8, 0.0, 0.0, 89.01, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 99.9, 0.0, 0.0, 100.0, 0.0, 99.05, 0.0, 99.94, 92.8, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [9.27, 7.19, 0.02, 1.4, 0.87, 0.71, 0.74, 1.29, 0.56, 1.49, 2.75, 0.75, 1.1, 2.29, 3.77, 0.8, 1.62, 2.64, 0.8, 0.38, 1.85, 0.49, 2.71, 0.67, 3.02, 0.45, 0.85, 4.54, 1.29, 3.77, 1.51, 2.18, 2.52, 1.59]} \ No newline at end of file diff --git a/annotations_1/w9I7PBSMBZw_filtered.json b/annotations_1/w9I7PBSMBZw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad8f98f94e73e22b6aea685827b300870b844e12 --- /dev/null +++ b/annotations_1/w9I7PBSMBZw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.28], [22.0, 32.41], [34.0, 34.2], [35.0, 35.38], [38.0, 38.18], [43.0, 43.29], [45.0, 45.82], [51.0, 52.39], [56.0, 61.94], [62.0, 63.59], [66.0, 100.45], [101.0, 111.15]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 42.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.44, 0.0, 0.0, 38.06], "audiomae_on_audioset": [null, [["music", 71.43], ["soundtrack music", 6.24], ["electronic music", 5.0]], null, null, null, null, null, null, [["speech", 34.19], ["music", 27.23], ["electronic music", 6.42]], null, null, [["music", 62.14], ["speech", 7.56], ["foghorn", 4.5]]], "duration": [0.28, 10.41, 0.2, 0.38, 0.18, 0.29, 0.82, 1.39, 5.94, 1.59, 34.45, 10.15]} \ No newline at end of file diff --git a/annotations_1/wAJQ-yWgSJs_filtered.json b/annotations_1/wAJQ-yWgSJs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a890685024d9b58d9ecdf383915f7bef5b8178ca --- /dev/null +++ b/annotations_1/wAJQ-yWgSJs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.4], [16.0, 16.53], [19.0, 19.3], [23.0, 22.84], [24.0, 26.35], [28.0, 31.16], [34.0, 41.32], [46.0, 46.45], [51.0, 54.41], [87.0, 96.77], [97.0, 98.41], [100.0, 101.68], [109.0, 110.51], [112.0, 117.05], [119.0, 122.1]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 73.97, 93.76, 96.29, 0.0, 97.92, 67.13, 0.0, 0.0, 0.0, 99.98, 75.39], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.4, 0.53, 0.3, -0.16, 2.35, 3.16, 7.32, 0.45, 3.41, 9.77, 1.41, 1.68, 1.51, 5.05, 3.1]} \ No newline at end of file diff --git a/annotations_1/wB2w4t9dr0Y_filtered.json b/annotations_1/wB2w4t9dr0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5405cf09c95a7e8dcaaa8a1550e9263b877d5875 --- /dev/null +++ b/annotations_1/wB2w4t9dr0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.22]], "keep_status": [false], "silence_prob": [0.0], "audiomae_on_audioset": [null], "duration": [0.22]} \ No newline at end of file diff --git a/annotations_1/wBM9Aa_HG8g_filtered.json b/annotations_1/wBM9Aa_HG8g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8502f9b2beb62829ddb88211fce67a491f2b4ac5 --- /dev/null +++ b/annotations_1/wBM9Aa_HG8g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 9.24], [11.0, 11.57], [12.0, 12.06], [19.0, 19.53], [23.0, 25.32], [28.0, 29.42], [33.0, 32.64], [39.0, 41.23], [42.0, 42.53], [44.0, 44.22], [46.0, 51.46], [53.0, 53.69], [56.0, 56.74], [60.0, 60.79], [62.0, 62.16], [71.0, 72.52], [74.0, 75.36], [76.0, 76.76], [79.0, 80.32], [82.0, 82.32], [83.0, 84.1], [86.0, 87.18], [96.0, 96.48], [98.0, 100.53], [101.0, 101.41], [103.0, 103.59], [104.0, 106.25], [108.0, 108.18], [110.0, 111.7], [112.0, 113.39], [114.0, 114.74], [115.0, 116.01], [117.0, 117.32]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [64.18, 0.0, 0.0, 0.0, 45.49, 0.0, 0.0, 99.95, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 90.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 26.78], ["noise", 5.39], ["crushing", 4.41]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [5.24, 0.57, 0.06, 0.53, 2.32, 1.42, -0.36, 2.23, 0.53, 0.22, 5.46, 0.69, 0.74, 0.79, 0.16, 1.52, 1.36, 0.76, 1.32, 0.32, 1.1, 1.18, 0.48, 2.53, 0.41, 0.59, 2.25, 0.18, 1.7, 1.39, 0.74, 1.01, 0.32]} \ No newline at end of file diff --git a/annotations_1/wC4MzUvxVa0_filtered.json b/annotations_1/wC4MzUvxVa0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6f2213a2d90ea33346db7b34863ae0cecc02df7 --- /dev/null +++ b/annotations_1/wC4MzUvxVa0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.74], [8.0, 9.69], [13.0, 13.76], [26.0, 26.7], [28.0, 29.51], [32.0, 34.11], [55.0, 56.78], [59.0, 59.14], [76.0, 76.94], [81.0, 83.35]], "keep_status": [false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 89.19, 0.0, 0.0, 0.0, 47.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 43.26], ["musical instrument", 13.49], ["guitar", 11.86]]], "duration": [0.74, 1.69, 0.76, 0.7, 1.51, 2.11, 1.78, 0.14, 0.94, 2.35]} \ No newline at end of file diff --git a/annotations_1/wDFOO-dC-Nw_filtered.json b/annotations_1/wDFOO-dC-Nw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18c4c46c5e4ff31fba8d658a060aaf38bf7c59f0 --- /dev/null +++ b/annotations_1/wDFOO-dC-Nw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.14], [19.0, 22.44], [25.0, 24.95], [28.0, 36.15], [37.0, 37.89], [39.0, 41.23], [42.0, 42.9], [44.0, 44.19], [45.0, 46.09], [47.0, 51.33], [55.0, 55.49], [56.0, 56.86], [60.0, 82.68], [85.0, 86.04], [87.0, 88.43], [92.0, 93.88], [97.0, 97.36], [98.0, 98.17], [102.0, 103.92], [109.0, 120.58], [122.0, 130.64], [132.0, 142.62], [144.0, 148.19], [157.0, 161.5], [162.0, 163.78]], "keep_status": [false, false, false, true, false, true, false, false, false, true, false, false, true, false, false, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 48.56, 0.0, 31.88, 0.0, 34.85, 0.0, 0.0, 0.0, 31.07, 0.0, 0.0, 44.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.16, 44.69, 62.07, 63.64, 32.16, 0.0], "audiomae_on_audioset": [null, [["music", 65.65], ["throbbing", 6.74], ["synthesizer", 4.33]], null, [["music", 60.92], ["guitar", 2.84], ["musical instrument", 2.76]], null, [["music", 40.92], ["speech", 22.99], ["electronic music", 2.41]], null, null, null, [["music", 45.46], ["hum", 10.25], ["throbbing", 5.61]], null, null, [["fly, housefly", 26.36], ["insect", 16.01], ["hum", 11.55]], null, null, null, null, null, null, [["breaking", 50.36], ["sine wave", 8.79], ["glass", 3.41]], [["hum", 26.21], ["noise", 18.72], ["mains hum", 17.33]], null, null, [["music", 51.38], ["didgeridoo", 11.93], ["synthesizer", 7.12]], null], "duration": [0.14, 3.44, -0.05, 8.15, 0.89, 2.23, 0.9, 0.19, 1.09, 4.33, 0.49, 0.86, 22.68, 1.04, 1.43, 1.88, 0.36, 0.17, 1.92, 11.58, 8.64, 10.62, 4.19, 4.5, 1.78]} \ No newline at end of file diff --git a/annotations_1/wEPZVYQqdMY_filtered.json b/annotations_1/wEPZVYQqdMY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..af204800bb6e4533dca9a02192109d0d5d1e98b9 --- /dev/null +++ b/annotations_1/wEPZVYQqdMY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.25], [6.0, 143.65], [145.0, 152.44], [153.0, 155.29], [157.0, 159.39]], "keep_status": [false, false, false, true, false], "silence_prob": [0.0, 0.0, 34.02, 38.54, 68.41], "audiomae_on_audioset": [null, null, [["music", 76.19], ["synthesizer", 4.28], ["hum", 2.75]], [["speech", 17.29], ["boing", 8.3], ["music", 5.17]], null], "duration": [1.25, 137.65, 7.44, 2.29, 2.39]} \ No newline at end of file diff --git a/annotations_1/wEvSZB_Dhqc_filtered.json b/annotations_1/wEvSZB_Dhqc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2226672dcee08d27b94c1ee94fef5230d1adf1ee --- /dev/null +++ b/annotations_1/wEvSZB_Dhqc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 15.96], [18.0, 19.35], [22.0, 24.66], [28.0, 33.94], [34.0, 34.13], [36.0, 44.46], [49.0, 49.92], [55.0, 60.0], [71.0, 83.89], [89.0, 103.01], [106.0, 106.96], [113.0, 119.28], [139.0, 149.54], [151.0, 151.44], [156.0, 156.29], [157.0, 158.89], [165.0, 174.12], [178.0, 178.83], [181.0, 199.39], [200.0, 203.81], [205.0, 206.47], [213.0, 224.01]], "keep_status": [true, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, true], "silence_prob": [32.74, 0.0, 32.8, 32.34, 0.0, 30.84, 0.0, 31.15, 31.36, 31.36, 0.0, 31.69, 31.28, 0.0, 0.0, 0.0, 30.38, 0.0, 31.63, 56.4, 0.0, 41.46], "audiomae_on_audioset": [[["music", 36.49], ["hum", 15.96], ["throbbing", 11.78]], null, [["music", 39.11], ["speech", 12.65], ["throbbing", 8.88]], [["music", 58.28], ["sidetone", 15.6], ["boing", 3.78]], null, [["music", 42.28], ["throbbing", 16.54], ["hum", 12.51]], null, [["speech", 50.79], ["music", 34.93], ["boing", 2.88]], [["music", 57.16], ["speech", 15.12], ["electronic music", 3.38]], [["music", 75.99], ["speech", 2.84], ["boing", 2.6]], null, [["throbbing", 24.61], ["music", 24.21], ["hum", 9.99]], [["music", 34.09], ["speech", 28.14], ["sidetone", 9.46]], null, null, null, [["speech", 51.0], ["music", 27.01], ["electronic music", 2.01]], null, [["music", 49.25], ["didgeridoo", 8.71], ["livestock, farm animals, working animals", 4.44]], null, null, [["sidetone", 27.38], ["fly, housefly", 16.61], ["speech", 12.94]]], "duration": [3.96, 1.35, 2.66, 5.94, 0.13, 8.46, 0.92, 5.0, 12.89, 14.01, 0.96, 6.28, 10.54, 0.44, 0.29, 1.89, 9.12, 0.83, 18.39, 3.81, 1.47, 11.01]} \ No newline at end of file diff --git a/annotations_1/wH-i4ImreXs_filtered.json b/annotations_1/wH-i4ImreXs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1456753ff89aad89f71702d71e471965ed7077e3 --- /dev/null +++ b/annotations_1/wH-i4ImreXs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.0], [3.0, 3.59], [5.0, 5.88], [7.0, 8.33], [10.0, 10.96], [12.0, 12.39], [15.0, 15.3], [20.0, 22.06], [23.0, 23.41], [25.0, 25.54], [26.0, 26.43], [28.0, 29.73], [30.0, 32.7], [34.0, 34.69], [36.0, 36.32], [38.0, 38.92], [41.0, 42.36], [44.0, 44.17], [45.0, 45.44], [46.0, 47.73], [48.0, 49.59], [51.0, 51.34], [53.0, 58.95], [59.0, 59.93], [63.0, 64.32], [65.0, 65.01], [66.0, 68.27], [70.0, 70.63], [73.0, 74.09], [75.0, 75.66], [78.0, 78.04], [79.0, 80.25], [82.0, 82.11], [83.0, 83.98], [85.0, 85.83], [87.0, 90.95], [92.0, 93.51], [94.0, 95.4], [96.0, 100.11], [102.0, 106.02], [106.0, 114.35], [116.0, 115.94], [117.0, 117.86], [119.0, 119.94], [121.0, 121.9], [123.0, 127.06], [127.0, 128.6], [129.0, 131.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 66.51, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.31, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 99.62, 76.04, 0.0, 0.0, 0.0, 0.0, 98.8, 0.0, 57.97], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.0, 0.59, 0.88, 1.33, 0.96, 0.39, 0.3, 2.06, 0.41, 0.54, 0.43, 1.73, 2.7, 0.69, 0.32, 0.92, 1.36, 0.17, 0.44, 1.73, 1.59, 0.34, 5.95, 0.93, 1.32, 0.01, 2.27, 0.63, 1.09, 0.66, 0.04, 1.25, 0.11, 0.98, 0.83, 3.95, 1.51, 1.4, 4.11, 4.02, 8.35, -0.06, 0.86, 0.94, 0.9, 4.06, 1.6, 2.85]} \ No newline at end of file diff --git a/annotations_1/wHfXZ9jcX3A_filtered.json b/annotations_1/wHfXZ9jcX3A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6729513a8811c77ea6cbf5e7fa4129306fa57de5 --- /dev/null +++ b/annotations_1/wHfXZ9jcX3A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.68], [15.0, 22.38], [23.0, 30.4], [33.0, 46.35], [47.0, 54.3], [58.0, 58.5], [60.0, 64.94], [66.0, 66.61], [74.0, 75.69], [79.0, 79.32], [81.0, 81.65], [83.0, 97.38], [100.0, 102.63], [105.0, 112.9], [114.0, 134.81], [136.0, 136.05], [138.0, 138.96], [141.0, 144.29], [145.0, 147.63], [149.0, 160.27], [161.0, 161.57], [162.0, 163.71]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, false, true, true, true, false, false, true, true, false, false, false], "silence_prob": [29.37, 29.57, 29.65, 29.93, 30.02, 0.0, 30.37, 0.0, 0.0, 0.0, 0.0, 31.66, 30.4, 30.4, 30.75, 0.0, 0.0, 30.01, 31.03, 29.77, 0.0, 0.0], "audiomae_on_audioset": [[["music", 46.14], ["noise", 10.04], ["hum", 6.99]], [["speech", 31.35], ["explosion", 12.62], ["music", 9.22]], [["speech", 52.73], ["vehicle", 19.48], ["car", 12.76]], [["speech", 30.87], ["music", 30.85], ["vehicle", 7.04]], [["throbbing", 61.18], ["music", 22.91], ["hum", 8.33]], null, [["music", 79.47], ["throbbing", 3.35], ["hum", 2.46]], null, null, null, null, [["music", 42.47], ["speech", 24.34], ["hum", 12.6]], [["race car, auto racing", 20.08], ["vehicle", 18.43], ["skidding", 16.75]], [["music", 24.85], ["mains hum", 21.96], ["hum", 17.03]], [["music", 51.91], ["car", 7.65], ["vehicle", 4.52]], null, null, [["music", 39.49], ["hum", 13.18], ["cacophony", 9.7]], [["mains hum", 16.53], ["buzz", 15.82], ["hum", 12.49]], [["throbbing", 32.46], ["hum", 26.05], ["mains hum", 17.07]], null, null], "duration": [3.68, 7.38, 7.4, 13.35, 7.3, 0.5, 4.94, 0.61, 1.69, 0.32, 0.65, 14.38, 2.63, 7.9, 20.81, 0.05, 0.96, 3.29, 2.63, 11.27, 0.57, 1.71]} \ No newline at end of file diff --git a/annotations_1/wHqQzF4JXdE_filtered.json b/annotations_1/wHqQzF4JXdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b12f3b83cc04554bedaf8bf49f572957e0d61d21 --- /dev/null +++ b/annotations_1/wHqQzF4JXdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 44.27], [46.0, 121.29], [125.0, 125.81], [127.0, 128.38], [129.0, 130.37], [133.0, 133.54], [139.0, 139.6], [141.0, 142.06], [149.0, 150.09], [152.0, 152.46], [155.0, 156.36], [157.0, 162.14], [172.0, 173.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.83, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["speech", 51.63], ["music", 13.75], ["whale vocalization", 9.55]], null], "duration": [38.27, 75.29, 0.81, 1.38, 1.37, 0.54, 0.6, 1.06, 1.09, 0.46, 1.36, 5.14, 1.65]} \ No newline at end of file diff --git a/annotations_1/wI1LRBDvSFs_filtered.json b/annotations_1/wI1LRBDvSFs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..eba56edeee4b59447ddbeb6f31ee2ca8045725ab --- /dev/null +++ b/annotations_1/wI1LRBDvSFs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 32.12], [38.0, 38.53], [44.0, 44.44], [46.0, 46.47], [59.0, 59.1], [60.0, 60.89], [64.0, 65.25], [67.0, 68.84], [70.0, 70.02], [71.0, 71.46], [75.0, 76.0]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [51.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [6.12, 0.53, 0.44, 0.47, 0.1, 0.89, 1.25, 1.84, 0.02, 0.46, 1.0]} \ No newline at end of file diff --git a/annotations_1/wIb3cRvQYw8_filtered.json b/annotations_1/wIb3cRvQYw8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e5a992fddadc0a4b3152ddd5697c07f5b8abb52 --- /dev/null +++ b/annotations_1/wIb3cRvQYw8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.32], [27.0, 26.84], [35.0, 35.4], [60.0, 60.69], [62.0, 61.77], [77.0, 77.9], [80.0, 79.88], [91.0, 91.02], [93.0, 93.12], [94.0, 95.32], [118.0, 118.45], [140.0, 140.54], [149.0, 148.86], [166.0, 166.38], [170.0, 171.19]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.32, -0.16, 0.4, 0.69, -0.23, 0.9, -0.12, 0.02, 0.12, 1.32, 0.45, 0.54, -0.14, 0.38, 1.19]} \ No newline at end of file diff --git a/annotations_1/wIloYFMzS6M_filtered.json b/annotations_1/wIloYFMzS6M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e34a5f5749884102f1d155d77da4aeec3934a295 --- /dev/null +++ b/annotations_1/wIloYFMzS6M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[77.0, 104.13], [106.0, 106.74], [108.0, 108.62], [110.0, 110.54], [112.0, 111.94], [112.0, 117.41], [119.0, 118.96], [120.0, 122.08], [126.0, 127.9], [128.0, 129.64], [130.0, 145.29], [146.0, 162.36], [165.0, 173.1], [174.0, 174.23], [174.0, 180.76], [187.0, 187.57], [192.0, 193.68], [195.0, 196.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [90.25, 0.0, 0.0, 0.0, 0.0, 61.67, 0.0, 100.0, 0.0, 0.0, 99.71, 97.0, 66.27, 0.0, 44.09, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 67.46], ["telephone", 7.73], ["music", 5.9]], null, null, null], "duration": [27.13, 0.74, 0.62, 0.54, -0.06, 5.41, -0.04, 2.08, 1.9, 1.64, 15.29, 16.36, 8.1, 0.23, 6.76, 0.57, 1.68, 1.06]} \ No newline at end of file diff --git a/annotations_1/wJZP20y0R2Q_filtered.json b/annotations_1/wJZP20y0R2Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f19d24ba92b686cc0ea4f4cf7bde600c615e86f8 --- /dev/null +++ b/annotations_1/wJZP20y0R2Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.34], [27.0, 29.49], [34.0, 44.73], [48.0, 63.78], [70.0, 70.75], [72.0, 72.2], [74.0, 74.04], [85.0, 85.7], [86.0, 91.66], [92.0, 108.9], [109.0, 109.68], [111.0, 111.52], [112.0, 114.15], [119.0, 119.77], [120.0, 136.24], [146.0, 146.58], [151.0, 151.75]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 39.78, 33.03, 31.65, 0.0, 0.0, 0.0, 0.0, 94.07, 33.64, 0.0, 0.0, 31.3, 0.0, 31.16, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 30.41], ["hum", 10.86], ["speech", 10.42]], [["music", 81.59], ["speech", 3.47], ["radio", 1.32]], [["music", 62.58], ["speech", 16.87], ["buzz", 1.59]], null, null, null, null, null, [["music", 72.15], ["synthesizer", 8.22], ["electronic music", 2.69]], null, null, [["music", 62.77], ["didgeridoo", 3.23], ["electronic music", 2.09]], null, [["music", 76.44], ["didgeridoo", 4.15], ["musical instrument", 1.57]], null, null], "duration": [0.34, 2.49, 10.73, 15.78, 0.75, 0.2, 0.04, 0.7, 5.66, 16.9, 0.68, 0.52, 2.15, 0.77, 16.24, 0.58, 0.75]} \ No newline at end of file diff --git a/annotations_1/wKIL7__ybL0_filtered.json b/annotations_1/wKIL7__ybL0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..58e3537e7b4dbadca8498e0f4df64b2d65c16940 --- /dev/null +++ b/annotations_1/wKIL7__ybL0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.17], [7.0, 8.46], [11.0, 13.26], [16.0, 22.06], [25.0, 43.78], [45.0, 45.17], [47.0, 51.97], [55.0, 58.41], [63.0, 63.88], [65.0, 78.06], [79.0, 109.61], [111.0, 126.45]], "keep_status": [false, false, true, true, true, false, true, true, false, true, false, false], "silence_prob": [37.81, 0.0, 31.63, 30.46, 31.99, 0.0, 31.08, 45.95, 0.0, 31.03, 0.0, 31.17], "audiomae_on_audioset": [[["music", 64.41], ["musical instrument", 3.66], ["guitar", 3.08]], null, [["music", 14.19], ["boing", 10.56], ["hum", 5.91]], [["music", 24.25], ["throbbing", 9.58], ["hum", 7.8]], [["music", 34.4], ["speech", 8.53], ["fart", 3.74]], null, [["music", 49.7], ["speech", 12.24], ["didgeridoo", 7.44]], [["cattle, bovinae", 22.41], ["music", 15.5], ["livestock, farm animals, working animals", 13.76]], null, [["music", 32.37], ["speech", 12.87], ["fart", 3.13]], null, [["music", 72.58], ["didgeridoo", 6.1], ["synthesizer", 4.85]]], "duration": [2.17, 1.46, 2.26, 6.06, 18.78, 0.17, 4.97, 3.41, 0.88, 13.06, 30.61, 15.45]} \ No newline at end of file diff --git a/annotations_1/wKPbi9oL5xU_filtered.json b/annotations_1/wKPbi9oL5xU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6207bb143f97d60aea408e4e26324abe218c0ecb --- /dev/null +++ b/annotations_1/wKPbi9oL5xU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.27], [25.0, 25.71], [28.0, 30.21], [31.0, 32.58], [36.0, 36.39], [37.0, 39.06], [40.0, 40.76], [42.0, 43.78], [45.0, 45.77], [47.0, 49.69], [51.0, 53.08], [54.0, 67.04], [67.0, 67.1], [68.0, 84.74], [85.0, 135.84], [137.0, 137.12], [137.0, 139.78], [140.0, 152.1], [153.0, 154.9], [155.0, 160.05], [160.0, 166.5], [168.0, 169.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.36, 0.0, 0.0, 99.8, 0.0, 0.0, 0.0, 64.97, 100.0, 100.0, 0.0, 99.05, 0.0, 0.0, 91.81, 78.89, 0.0, 99.96, 77.2, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.27, 0.71, 2.21, 1.58, 0.39, 2.06, 0.76, 1.78, 0.77, 2.69, 2.08, 13.04, 0.1, 16.74, 50.84, 0.12, 2.78, 12.1, 1.9, 5.05, 6.5, 1.74]} \ No newline at end of file diff --git a/annotations_1/wKiW5OYjels_filtered.json b/annotations_1/wKiW5OYjels_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..327e00660f70a55abfb32584788b1a647ff6e93a --- /dev/null +++ b/annotations_1/wKiW5OYjels_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.3], [3.0, 6.94], [8.0, 8.34], [11.0, 12.24], [27.0, 27.13], [34.0, 35.28], [36.0, 36.37], [44.0, 57.96], [60.0, 61.06], [62.0, 63.12], [65.0, 71.68], [72.0, 72.79], [75.0, 76.01], [80.0, 82.8], [92.0, 92.99], [94.0, 97.5], [98.0, 100.41], [101.0, 102.83], [105.0, 107.23], [108.0, 108.97], [110.0, 111.3], [112.0, 113.68], [120.0, 120.56], [125.0, 128.21]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.66, 42.65, 0.0, 0.0, 0.0, 0.0, 0.0, 34.6, 0.0, 0.0, 97.54, 0.0, 0.0, 95.23, 0.0, 99.71, 96.29, 0.0, 88.28, 0.0, 0.0, 0.0, 0.0, 77.7], "audiomae_on_audioset": [[["music", 29.66], ["speech", 15.65], ["cattle, bovinae", 8.63]], [["mains hum", 33.28], ["hum", 14.74], ["electric shaver, electric razor", 11.28]], null, null, null, null, null, [["music", 72.44], ["electronic music", 6.86], ["throbbing", 2.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.3, 3.94, 0.34, 1.24, 0.13, 1.28, 0.37, 13.96, 1.06, 1.12, 6.68, 0.79, 1.01, 2.8, 0.99, 3.5, 2.41, 1.83, 2.23, 0.97, 1.3, 1.68, 0.56, 3.21]} \ No newline at end of file diff --git a/annotations_1/wLGpzRMJsVE_filtered.json b/annotations_1/wLGpzRMJsVE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a50a57f094954ca21a98c1b22a67cb534482a16d --- /dev/null +++ b/annotations_1/wLGpzRMJsVE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.78], [7.0, 8.45], [12.0, 12.55], [15.0, 14.77], [17.0, 17.46], [20.0, 21.19], [26.0, 27.21], [27.0, 29.3], [33.0, 48.27], [49.0, 49.25], [52.0, 52.74], [53.0, 86.88], [89.0, 96.89], [98.0, 124.19], [139.0, 139.68]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.07, 29.5, 0.0, 0.0, 0.0, 28.48, 28.4, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["frog", 23.07], ["hum", 21.37], ["rumble", 8.97]], [["mains hum", 42.1], ["hum", 29.08], ["throbbing", 10.04]], null, null, null, [["speech", 35.91], ["music", 22.13], ["whale vocalization", 5.07]], [["music", 61.66], ["didgeridoo", 20.08], ["synthesizer", 4.25]], null], "duration": [0.78, 1.45, 0.55, -0.23, 0.46, 1.19, 1.21, 2.3, 15.27, 0.25, 0.74, 33.88, 7.89, 26.19, 0.68]} \ No newline at end of file diff --git a/annotations_1/wLuRwDl3MrE_filtered.json b/annotations_1/wLuRwDl3MrE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1e891d406794db68f990a612cdc38fef14c43417 --- /dev/null +++ b/annotations_1/wLuRwDl3MrE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.24], [8.0, 9.07], [11.0, 12.01], [15.0, 15.67], [19.0, 20.75], [29.0, 33.76], [39.0, 39.01], [48.0, 48.02], [52.0, 55.56], [60.0, 60.84], [71.0, 72.82], [84.0, 85.48], [94.0, 94.0], [99.0, 99.23], [114.0, 116.14], [122.0, 122.64], [131.0, 131.14], [140.0, 141.37], [150.0, 150.31], [159.0, 159.53], [165.0, 165.3], [167.0, 167.26]], "keep_status": [false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 46.43, 0.0, 0.0, 31.62, 0.0, 0.0, 0.0, 0.0, 0.0, 40.61, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 32.03], ["music", 22.81], ["throbbing", 10.69]], null, null, [["music", 41.85], ["hum", 16.17], ["mains hum", 7.32]], null, null, null, null, null, [["music", 29.57], ["marimba, xylophone", 10.65], ["musical instrument", 9.34]], null, null, null, null, null, null, null], "duration": [0.24, 1.07, 1.01, 0.67, 1.75, 4.76, 0.01, 0.02, 3.56, 0.84, 1.82, 1.48, 0.0, 0.23, 2.14, 0.64, 0.14, 1.37, 0.31, 0.53, 0.3, 0.26]} \ No newline at end of file diff --git a/annotations_1/wM5rRXQZvjU_filtered.json b/annotations_1/wM5rRXQZvjU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..170014aa540a244fad8715c14ebfc08fd8b7416d --- /dev/null +++ b/annotations_1/wM5rRXQZvjU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 31.4], [37.0, 37.5], [39.0, 41.77], [46.0, 46.65], [49.0, 49.87], [52.0, 55.93], [58.0, 58.02], [60.0, 61.96], [63.0, 66.21], [70.0, 70.26], [77.0, 116.99], [117.0, 128.66]], "keep_status": [true, false, false, false, false, true, false, false, true, false, false, true], "silence_prob": [29.98, 0.0, 55.04, 0.0, 0.0, 42.65, 0.0, 0.0, 30.59, 0.0, 0.0, 31.12], "audiomae_on_audioset": [[["music", 35.79], ["fly, housefly", 13.21], ["speech", 10.76]], null, null, null, null, [["music", 27.98], ["speech", 11.06], ["hum", 9.42]], null, null, [["music", 43.66], ["hum", 8.15], ["throbbing", 5.6]], null, null, [["noise", 40.21], ["music", 11.62], ["sound effect", 4.93]]], "duration": [12.4, 0.5, 2.77, 0.65, 0.87, 3.93, 0.02, 1.96, 3.21, 0.26, 39.99, 11.66]} \ No newline at end of file diff --git a/annotations_1/wMr2d10-xf0_filtered.json b/annotations_1/wMr2d10-xf0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1cdcfd8eea68ae665709000c297a1de80317a1af --- /dev/null +++ b/annotations_1/wMr2d10-xf0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 7.23], [10.0, 21.27], [30.0, 33.52], [35.0, 34.97], [36.0, 36.9], [40.0, 41.5], [43.0, 47.07], [49.0, 49.54], [51.0, 52.62], [54.0, 54.19], [56.0, 61.62], [63.0, 69.2], [77.0, 79.3], [86.0, 86.8], [91.0, 105.97], [111.0, 117.36], [122.0, 125.04], [136.0, 138.57], [142.0, 142.52], [144.0, 151.97]], "keep_status": [true, false, true, false, false, false, true, false, false, false, true, true, true, false, false, true, true, true, false, false], "silence_prob": [29.08, 28.76, 28.97, 0.0, 0.0, 0.0, 29.65, 0.0, 0.0, 0.0, 30.11, 29.73, 29.83, 0.0, 28.89, 29.28, 29.56, 33.19, 0.0, 28.78], "audiomae_on_audioset": [[["music", 29.03], ["speech", 22.34], ["foghorn", 17.3]], [["music", 30.35], ["speech", 29.47], ["throbbing", 19.12]], [["music", 27.72], ["speech", 6.06], ["musical instrument", 5.31]], null, null, null, [["music", 43.15], ["didgeridoo", 10.15], ["cattle, bovinae", 3.85]], null, null, null, [["music", 41.58], ["livestock, farm animals, working animals", 6.8], ["moo", 6.18]], [["speech", 37.87], ["hum", 10.3], ["music", 10.25]], [["music", 44.31], ["speech", 18.01], ["boing", 7.53]], null, [["music", 60.52], ["speech", 10.51], ["animal", 4.56]], [["music", 52.19], ["throbbing", 7.69], ["hum", 3.52]], [["speech", 31.37], ["music", 21.72], ["vehicle", 8.18]], [["grunt", 27.98], ["music", 21.58], ["speech", 6.67]], null, [["music", 63.17], ["speech", 11.32], ["didgeridoo", 7.61]]], "duration": [5.23, 11.27, 3.52, -0.03, 0.9, 1.5, 4.07, 0.54, 1.62, 0.19, 5.62, 6.2, 2.3, 0.8, 14.97, 6.36, 3.04, 2.57, 0.52, 7.97]} \ No newline at end of file diff --git a/annotations_1/wN1iAzPTBbM_filtered.json b/annotations_1/wN1iAzPTBbM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae52102a4c3b25baa7bfe0a30d7b8681f265a159 --- /dev/null +++ b/annotations_1/wN1iAzPTBbM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 13.12], [15.0, 14.88], [18.0, 19.75], [23.0, 23.3], [38.0, 38.33], [42.0, 42.42], [44.0, 45.13], [46.0, 47.39], [48.0, 47.7], [52.0, 53.05], [54.0, 54.95], [79.0, 79.86], [88.0, 88.06]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [35.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 24.62], ["grunt", 10.55], ["boing", 5.78]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.12, -0.12, 1.75, 0.3, 0.33, 0.42, 1.13, 1.39, -0.3, 1.05, 0.95, 0.86, 0.06]} \ No newline at end of file diff --git a/annotations_1/wNRvgeiaVXA_filtered.json b/annotations_1/wNRvgeiaVXA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0ca16dc580679ffa77c9723f9a111f79f87c35d --- /dev/null +++ b/annotations_1/wNRvgeiaVXA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.77], [14.0, 15.4], [25.0, 25.51], [26.0, 25.88], [33.0, 34.26], [48.0, 48.17], [49.0, 49.59], [54.0, 54.9], [55.0, 57.06], [61.0, 63.02], [80.0, 80.97], [93.0, 93.41], [97.0, 98.64], [111.0, 112.77], [131.0, 134.01], [136.0, 143.24]], "keep_status": [true, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false], "silence_prob": [32.23, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.37, 44.6, 0.0, 0.0, 0.0, 0.0, 30.97, 31.05], "audiomae_on_audioset": [[["music", 41.93], ["speech", 5.82], ["musical instrument", 4.6]], null, null, null, null, null, null, null, [["music", 21.35], ["speech", 17.57], ["synthesizer", 11.26]], [["music", 41.06], ["musical instrument", 9.74], ["effects unit", 7.65]], null, null, null, null, [["music", 47.48], ["speech", 6.93], ["yodeling", 4.81]], [["moo", 35.84], ["cattle, bovinae", 31.35], ["livestock, farm animals, working animals", 15.37]]], "duration": [3.77, 1.4, 0.51, -0.12, 1.26, 0.17, 0.59, 0.9, 2.06, 2.02, 0.97, 0.41, 1.64, 1.77, 3.01, 7.24]} \ No newline at end of file diff --git a/annotations_1/wO4P6Yz_LZg_filtered.json b/annotations_1/wO4P6Yz_LZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..556c902b86c918b6a1171e584b001a952c6a08c8 --- /dev/null +++ b/annotations_1/wO4P6Yz_LZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 26.96], [29.0, 34.16], [38.0, 64.77], [76.0, 78.11], [79.0, 79.64], [81.0, 104.68], [107.0, 123.01], [123.0, 147.21], [148.0, 149.18], [150.0, 153.32]], "keep_status": [false, false, true, false, false, false, true, true, false, true], "silence_prob": [66.39, 31.65, 28.99, 55.11, 0.0, 30.16, 42.81, 42.84, 0.0, 41.42], "audiomae_on_audioset": [null, [["music", 51.25], ["noise", 15.05], ["musical instrument", 6.8]], [["throbbing", 26.75], ["music", 26.42], ["hum", 11.97]], null, null, [["hum", 46.0], ["throbbing", 24.67], ["mains hum", 16.24]], [["hum", 28.6], ["whack, thwack", 12.21], ["music", 7.84]], [["chime", 23.45], ["wind chime", 20.64], ["music", 15.31]], null, [["music", 45.51], ["rumble", 8.19], ["hum", 4.63]]], "duration": [11.96, 5.16, 26.77, 2.11, 0.64, 23.68, 16.01, 24.21, 1.18, 3.32]} \ No newline at end of file diff --git a/annotations_1/wOSP7YOuOH4_filtered.json b/annotations_1/wOSP7YOuOH4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2382a606099af23f0e073b32ca4f119847793088 --- /dev/null +++ b/annotations_1/wOSP7YOuOH4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.18], [0.0, 0.33], [17.0, 18.4], [22.0, 22.84], [31.0, 31.97], [33.0, 33.89], [36.0, 36.44], [44.0, 44.88], [46.0, 47.29], [53.0, 55.05], [56.0, 56.51], [60.0, 60.4], [61.0, 61.64], [64.0, 63.56], [69.0, 70.5], [71.0, 72.66], [73.0, 75.27], [78.0, 78.07], [79.0, 79.74], [82.0, 82.12], [85.0, 87.4], [91.0, 98.2], [103.0, 102.83]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.42, 0.0, 0.0, 0.0, 39.64, 40.79, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 46.27], ["didgeridoo", 9.72], ["guitar", 7.32]], null, null, null, null, null, null, [["music", 88.25], ["musical instrument", 2.67], ["guitar", 0.8]], null, null, null, [["music", 73.37], ["musical instrument", 4.11], ["guitar", 2.61]], [["music", 69.08], ["boing", 3.08], ["music for children", 2.73]], null], "duration": [0.18, 0.33, 1.4, 0.84, 0.97, 0.89, 0.44, 0.88, 1.29, 2.05, 0.51, 0.4, 0.64, -0.44, 1.5, 1.66, 2.27, 0.07, 0.74, 0.12, 2.4, 7.2, -0.17]} \ No newline at end of file diff --git a/annotations_1/wOuk6V3Dj5A_filtered.json b/annotations_1/wOuk6V3Dj5A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b43881801ca70ad9f4b3abd0d663d14080085b91 --- /dev/null +++ b/annotations_1/wOuk6V3Dj5A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[122.0, 124.01], [128.0, 127.95]], "keep_status": [true, false], "silence_prob": [46.4, 0.0], "audiomae_on_audioset": [[["frog", 18.15], ["crow", 16.06], ["caw", 14.63]], null], "duration": [2.01, -0.05]} \ No newline at end of file diff --git a/annotations_1/wPmgfWpamb0_filtered.json b/annotations_1/wPmgfWpamb0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c64457c19d32d9db8bff666afa7776d0443e9eb6 --- /dev/null +++ b/annotations_1/wPmgfWpamb0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.81], [29.0, 30.72], [32.0, 48.56], [50.0, 51.11], [52.0, 53.05], [54.0, 62.75], [74.0, 83.08], [87.0, 87.99], [92.0, 94.83], [97.0, 103.27], [112.0, 115.5]], "keep_status": [false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 44.81, 0.0, 0.0, 42.19, 35.34, 0.0, 84.25, 44.9, 28.99], "audiomae_on_audioset": [null, null, [["music", 43.14], ["hum", 16.99], ["ambient music", 10.44]], null, null, [["music", 71.73], ["ambient music", 5.14], ["theremin", 4.49]], [["music", 34.52], ["hum", 16.02], ["throbbing", 9.54]], null, null, [["speech", 31.19], ["timpani", 12.39], ["music", 6.67]], [["music", 64.95], ["quack", 5.82], ["duck", 2.55]]], "duration": [1.81, 1.72, 16.56, 1.11, 1.05, 8.75, 9.08, 0.99, 2.83, 6.27, 3.5]} \ No newline at end of file diff --git a/annotations_1/wQc-GpTtnR0_filtered.json b/annotations_1/wQc-GpTtnR0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..92aed9b459e12c1f885b06e71e8ed91558b9383c --- /dev/null +++ b/annotations_1/wQc-GpTtnR0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.11], [8.0, 8.88], [11.0, 11.79], [17.0, 25.37], [30.0, 30.43], [35.0, 34.84], [47.0, 48.1], [63.0, 63.34], [64.0, 64.34], [67.0, 67.69], [69.0, 70.01], [70.0, 70.56], [77.0, 77.67], [82.0, 82.83], [85.0, 85.65], [89.0, 88.94], [108.0, 108.77], [110.0, 112.89], [114.0, 115.79], [117.0, 120.82], [122.0, 124.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.9, 0.0, 0.0, 82.79, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.65, 0.0, 89.36, 82.79], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.11, 0.88, 0.79, 8.37, 0.43, -0.16, 1.1, 0.34, 0.34, 0.69, 1.01, 0.56, 0.67, 0.83, 0.65, -0.06, 0.77, 2.89, 1.79, 3.82, 2.11]} \ No newline at end of file diff --git a/annotations_1/wQj8uFwQP2A_filtered.json b/annotations_1/wQj8uFwQP2A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0b8cf43db9e20026af8e524b9bb3cd15c4d26a68 --- /dev/null +++ b/annotations_1/wQj8uFwQP2A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.12], [15.0, 16.29], [21.0, 21.57], [24.0, 24.26], [27.0, 26.99], [27.0, 28.44], [29.0, 31.41], [40.0, 40.49], [58.0, 64.2], [72.0, 76.67], [78.0, 81.65], [83.0, 83.35], [87.0, 88.26], [89.0, 90.75], [91.0, 91.3], [99.0, 105.6], [117.0, 127.55]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.5, 0.0, 36.06, 59.96, 51.44, 0.0, 0.0, 0.0, 0.0, 31.06, 31.68], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 41.9], ["speech", 24.29], ["didgeridoo", 3.28]], null, [["moo", 23.71], ["cattle, bovinae", 23.07], ["livestock, farm animals, working animals", 16.52]], null, null, null, null, null, null, [["music", 63.95], ["didgeridoo", 6.7], ["singing", 2.61]], [["music", 35.09], ["speech", 12.85], ["fart", 10.64]]], "duration": [1.12, 1.29, 0.57, 0.26, -0.01, 1.44, 2.41, 0.49, 6.2, 4.67, 3.65, 0.35, 1.26, 1.75, 0.3, 6.6, 10.55]} \ No newline at end of file diff --git a/annotations_1/wRN8Q_Lts7k_filtered.json b/annotations_1/wRN8Q_Lts7k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f46311611dacae5bf687186d0722ce592d5a5670 --- /dev/null +++ b/annotations_1/wRN8Q_Lts7k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.4], [11.0, 12.45], [13.0, 18.77], [20.0, 20.65], [22.0, 22.77], [23.0, 34.77], [37.0, 37.79], [39.0, 40.41], [41.0, 43.12], [45.0, 48.9], [52.0, 77.43], [80.0, 104.95], [106.0, 107.97]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 73.82, 0.0, 0.0, 62.37, 0.0, 0.0, 51.66, 37.41, 35.59, 89.01, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 25.38], ["hum", 9.2], ["throbbing", 4.51]], [["music", 46.7], ["didgeridoo", 9.34], ["hum", 5.48]], null, null], "duration": [0.4, 1.45, 5.77, 0.65, 0.77, 11.77, 0.79, 1.41, 2.12, 3.9, 25.43, 24.95, 1.97]} \ No newline at end of file diff --git a/annotations_1/wR_e9lxh7Ds_filtered.json b/annotations_1/wR_e9lxh7Ds_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a5185758de67992af46ece4567ef04c26f8ecdd7 --- /dev/null +++ b/annotations_1/wR_e9lxh7Ds_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.66], [8.0, 8.9], [13.0, 14.94], [16.0, 21.42], [22.0, 25.0], [27.0, 28.21], [32.0, 32.26], [36.0, 36.34], [46.0, 46.68], [52.0, 52.22], [63.0, 66.85], [97.0, 99.05], [101.0, 108.89], [112.0, 114.99]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.59, 96.77, 0.0, 0.0, 0.0, 0.0, 0.0, 38.78, 86.64, 54.76, 43.13], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 24.41], ["cattle, bovinae", 11.22], ["livestock, farm animals, working animals", 9.33]], null, null, [["music", 59.83], ["speech", 24.34], ["musical instrument", 2.52]]], "duration": [0.66, 0.9, 1.94, 5.42, 3.0, 1.21, 0.26, 0.34, 0.68, 0.22, 3.85, 2.05, 7.89, 2.99]} \ No newline at end of file diff --git a/annotations_1/wSOMPH85zvQ_filtered.json b/annotations_1/wSOMPH85zvQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf723f98ecaf533321115bfc8c221251e0fe6d21 --- /dev/null +++ b/annotations_1/wSOMPH85zvQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.11], [6.0, 6.84], [8.0, 9.63], [11.0, 12.75], [16.0, 19.74], [20.0, 21.41], [27.0, 30.77], [35.0, 38.87], [41.0, 41.17], [44.0, 47.93], [55.0, 57.08], [58.0, 59.58], [65.0, 65.91], [67.0, 67.19], [72.0, 74.31], [84.0, 87.76], [91.0, 100.53], [103.0, 139.8], [141.0, 142.35], [146.0, 148.54], [153.0, 157.99], [164.0, 178.01], [179.0, 205.07], [206.0, 209.85], [210.0, 214.05], [216.0, 223.92], [226.0, 228.82]], "keep_status": [false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, true, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 56.33, 0.0, 56.86, 54.76, 0.0, 44.9, 48.69, 0.0, 0.0, 0.0, 34.49, 36.77, 35.88, 0.0, 0.0, 34.42, 34.31, 45.24, 97.11, 96.29, 71.14, 60.79, 74.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 32.36], ["piano", 11.98], ["musical instrument", 10.81]], [["music", 28.69], ["bow-wow", 5.86], ["dog", 5.84]], null, null, null, [["music", 56.38], ["musical instrument", 10.25], ["guitar", 8.02]], [["music", 49.87], ["musical instrument", 10.1], ["piano", 6.34]], [["music", 62.94], ["musical instrument", 5.39], ["guitar", 4.08]], null, null, [["music", 49.36], ["brass instrument", 11.39], ["trombone", 6.19]], [["music", 59.54], ["musical instrument", 6.71], ["synthesizer", 2.79]], [["music", 66.63], ["musical instrument", 3.81], ["keyboard (musical)", 2.59]], null, null, null, null, null], "duration": [1.11, 0.84, 1.63, 1.75, 3.74, 1.41, 3.77, 3.87, 0.17, 3.93, 2.08, 1.58, 0.91, 0.19, 2.31, 3.76, 9.53, 36.8, 1.35, 2.54, 4.99, 14.01, 26.07, 3.85, 4.05, 7.92, 2.82]} \ No newline at end of file diff --git a/annotations_1/wTGRsKLqkGM_filtered.json b/annotations_1/wTGRsKLqkGM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9574f8b10fe5671fc2f7f0ec489c0ecff10ca23 --- /dev/null +++ b/annotations_1/wTGRsKLqkGM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[47.0, 80.2], [83.0, 83.03], [84.0, 84.54], [92.0, 143.23]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null], "duration": [33.2, 0.03, 0.54, 51.23]} \ No newline at end of file diff --git a/annotations_1/wTLo8CdhxGs_filtered.json b/annotations_1/wTLo8CdhxGs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..52c057c08cbba4c0162dbc73f390032710735024 --- /dev/null +++ b/annotations_1/wTLo8CdhxGs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 91.07], [96.0, 98.1], [103.0, 108.6], [109.0, 108.63], [123.0, 122.79], [129.0, 129.52]], "keep_status": [false, false, false, false, false, false], "silence_prob": [29.97, 30.73, 29.86, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 68.55], ["moo", 7.68], ["cattle, bovinae", 4.09]], [["music", 72.4], ["musical instrument", 3.03], ["salsa music", 2.02]], [["music", 57.55], ["speech", 10.96], ["synthesizer", 2.2]], null, null, null], "duration": [16.07, 2.1, 5.6, -0.37, -0.21, 0.52]} \ No newline at end of file diff --git a/annotations_1/wTf4njh9TnE_filtered.json b/annotations_1/wTf4njh9TnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0949aba5eb3acd48751731dda4113158e95b5218 --- /dev/null +++ b/annotations_1/wTf4njh9TnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 20.66], [22.0, 22.89], [26.0, 29.74], [33.0, 35.11], [39.0, 39.75], [43.0, 44.69], [55.0, 55.75], [60.0, 60.42], [62.0, 69.53], [72.0, 72.67], [76.0, 76.84], [78.0, 79.78], [84.0, 87.1], [90.0, 91.88], [94.0, 96.23], [98.0, 98.59], [103.0, 108.28], [110.0, 114.4], [116.0, 118.76], [121.0, 121.39], [126.0, 127.53], [130.0, 131.14]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [50.31, 0.0, 44.2, 61.67, 0.0, 0.0, 0.0, 0.0, 37.72, 0.0, 0.0, 0.0, 37.59, 0.0, 33.97, 0.0, 34.86, 29.51, 32.18, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 29.38], ["hum", 26.86], ["music", 22.21]], null, null, null, null, null, [["speech", 33.63], ["bee, wasp, etc.", 9.21], ["insect", 8.78]], null, null, null, [["music", 56.4], ["throbbing", 15.72], ["hum", 8.48]], null, [["hum", 28.09], ["throbbing", 27.37], ["music", 17.39]], null, [["music", 52.39], ["hum", 9.19], ["throbbing", 8.73]], [["fly, housefly", 19.63], ["insect", 14.44], ["bee, wasp, etc.", 10.53]], [["music", 31.4], ["throbbing", 26.12], ["hum", 24.04]], null, null, null], "duration": [11.66, 0.89, 3.74, 2.11, 0.75, 1.69, 0.75, 0.42, 7.53, 0.67, 0.84, 1.78, 3.1, 1.88, 2.23, 0.59, 5.28, 4.4, 2.76, 0.39, 1.53, 1.14]} \ No newline at end of file diff --git a/annotations_1/wTfbHs4HlPo_filtered.json b/annotations_1/wTfbHs4HlPo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1d975516b81052fbe398ddc130539a5bb2b5c01 --- /dev/null +++ b/annotations_1/wTfbHs4HlPo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.91], [5.0, 5.37], [8.0, 8.56], [11.0, 11.57], [15.0, 16.34], [19.0, 19.04], [20.0, 21.24], [22.0, 24.09], [25.0, 25.41], [26.0, 26.69], [29.0, 29.1], [33.0, 33.94], [39.0, 39.46], [40.0, 51.39], [52.0, 53.47], [55.0, 55.07], [58.0, 58.82], [61.0, 61.72], [63.0, 62.78], [68.0, 71.12], [75.0, 76.54], [78.0, 77.84], [79.0, 79.69], [80.0, 82.93], [87.0, 87.42], [89.0, 89.95], [91.0, 93.58], [95.0, 96.96], [99.0, 103.65], [108.0, 113.83], [114.0, 115.45], [119.0, 120.09], [123.0, 124.87], [127.0, 128.17], [129.0, 130.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, true, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.2, 0.0, 0.0, 0.0, 0.0, 0.0, 54.5, 0.0, 0.0, 0.0, 0.0, 0.0, 31.17, 0.0, 0.0, 0.0, 33.37, 0.0, 0.0, 34.43, 0.0, 33.04, 33.91, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["chirp tone", 16.08], ["sine wave", 14.8], ["whale vocalization", 13.1]], null, null, null, [["music", 32.09], ["speech", 7.46], ["musical instrument", 5.31]], null, null, [["music", 51.91], ["synthesizer", 6.33], ["electronic music", 5.35]], null, [["hum", 26.61], ["speech", 24.87], ["rumble", 11.0]], [["music", 36.01], ["speech", 7.62], ["knock", 5.98]], null, null, null, null, null], "duration": [0.91, 0.37, 0.56, 0.57, 1.34, 0.04, 1.24, 2.09, 0.41, 0.69, 0.1, 0.94, 0.46, 11.39, 1.47, 0.07, 0.82, 0.72, -0.22, 3.12, 1.54, -0.16, 0.69, 2.93, 0.42, 0.95, 2.58, 1.96, 4.65, 5.83, 1.45, 1.09, 1.87, 1.17, 1.4]} \ No newline at end of file diff --git a/annotations_1/wTqLwoaEUmU_filtered.json b/annotations_1/wTqLwoaEUmU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..51ca80850d053e7713f2e3f47fa64890fc3ee7a0 --- /dev/null +++ b/annotations_1/wTqLwoaEUmU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.55], [10.0, 14.18], [15.0, 15.89], [16.0, 17.64], [18.0, 22.77], [26.0, 26.55], [28.0, 29.81], [30.0, 30.94], [32.0, 32.09], [34.0, 34.65], [38.0, 39.29], [41.0, 41.71], [42.0, 42.8], [44.0, 44.54], [47.0, 46.7], [49.0, 49.15], [53.0, 54.3], [56.0, 57.37], [58.0, 59.85], [65.0, 68.62], [71.0, 71.31], [73.0, 75.37], [77.0, 78.02], [80.0, 80.5], [82.0, 81.78], [94.0, 95.17], [98.0, 102.32], [103.0, 103.62], [105.0, 105.63], [107.0, 108.21], [109.0, 109.71], [112.0, 112.09], [113.0, 114.71], [127.0, 127.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 56.55, 0.0, 0.0, 56.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.52, 0.0, 69.74, 0.0, 0.0, 0.0, 0.0, 61.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.55, 4.18, 0.89, 1.64, 4.77, 0.55, 1.81, 0.94, 0.09, 0.65, 1.29, 0.71, 0.8, 0.54, -0.3, 0.15, 1.3, 1.37, 1.85, 3.62, 0.31, 2.37, 1.02, 0.5, -0.22, 1.17, 4.32, 0.62, 0.63, 1.21, 0.71, 0.09, 1.71, 0.82]} \ No newline at end of file diff --git a/annotations_1/wTzfJT3zGz0_filtered.json b/annotations_1/wTzfJT3zGz0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..74f93a445cafa48e39d741f88e3348a32ed71ba4 --- /dev/null +++ b/annotations_1/wTzfJT3zGz0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.62], [23.0, 23.21], [38.0, 52.15], [56.0, 61.28], [65.0, 76.99], [79.0, 79.32], [80.0, 86.73], [92.0, 97.38], [98.0, 101.04], [110.0, 121.26], [124.0, 127.79]], "keep_status": [false, false, true, true, false, false, true, false, false, false, true], "silence_prob": [37.9, 0.0, 31.39, 32.02, 33.72, 0.0, 34.96, 35.18, 35.66, 33.48, 30.22], "audiomae_on_audioset": [[["hum", 39.93], ["throbbing", 27.94], ["music", 10.53]], null, [["cattle, bovinae", 19.77], ["livestock, farm animals, working animals", 16.49], ["moo", 16.46]], [["music", 30.27], ["speech", 17.16], ["mains hum", 14.98]], [["music", 32.29], ["throbbing", 31.45], ["hum", 15.18]], null, [["music", 38.85], ["throbbing", 22.3], ["hum", 6.55]], [["throbbing", 46.5], ["music", 36.69], ["hum", 9.92]], [["music", 54.91], ["throbbing", 14.32], ["hum", 7.77]], [["hum", 37.39], ["speech", 18.98], ["throbbing", 15.09]], [["music", 20.77], ["throbbing", 19.19], ["hum", 17.96]]], "duration": [2.62, 0.21, 14.15, 5.28, 11.99, 0.32, 6.73, 5.38, 3.04, 11.26, 3.79]} \ No newline at end of file diff --git a/annotations_1/wV7vM4-FzJM_filtered.json b/annotations_1/wV7vM4-FzJM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6710e42b6835bb53dcead3ea23afafef6148144 --- /dev/null +++ b/annotations_1/wV7vM4-FzJM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 1.95], [2.0, 3.62], [6.0, 7.92], [8.0, 9.29], [15.0, 15.16], [19.0, 20.01], [29.0, 30.74], [31.0, 32.21], [50.0, 50.8], [52.0, 51.83], [54.0, 53.84], [58.0, 58.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.05, 1.62, 1.92, 1.29, 0.16, 1.01, 1.74, 1.21, 0.8, -0.17, -0.16, 0.63]} \ No newline at end of file diff --git a/annotations_1/wVFNjHAnpcI_filtered.json b/annotations_1/wVFNjHAnpcI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bf9cdb9c54d63ebfd1cd56231ca55ec2b6fe4198 --- /dev/null +++ b/annotations_1/wVFNjHAnpcI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.81], [4.0, 3.75], [4.0, 9.07], [14.0, 15.69], [18.0, 18.71], [36.0, 35.94], [36.0, 43.98], [49.0, 49.74], [52.0, 51.76], [52.0, 53.64], [56.0, 56.05], [58.0, 58.55], [63.0, 66.06], [93.0, 97.09]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.42, 0.0, 0.0, 0.0, 36.36, 0.0, 0.0, 0.0, 0.0, 0.0, 40.41, 99.71], "audiomae_on_audioset": [null, null, [["speech", 44.69], ["computer keyboard", 10.57], ["typewriter", 10.21]], null, null, null, [["speech", 68.54], ["noise", 17.93], ["telephone", 2.66]], null, null, null, null, null, [["speech", 59.73], ["telephone", 8.25], ["radio", 4.52]], null], "duration": [0.81, -0.25, 5.07, 1.69, 0.71, -0.06, 7.98, 0.74, -0.24, 1.64, 0.05, 0.55, 3.06, 4.09]} \ No newline at end of file diff --git a/annotations_1/wWKQ2aOTfN0_filtered.json b/annotations_1/wWKQ2aOTfN0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7acb5b7e3c2653d5561201e64d309691d616207c --- /dev/null +++ b/annotations_1/wWKQ2aOTfN0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.06], [2.0, 2.61], [5.0, 5.75], [9.0, 10.03], [10.0, 11.03], [15.0, 14.76], [15.0, 16.14], [17.0, 29.35], [32.0, 47.21], [51.0, 113.8], [117.0, 118.18], [119.0, 120.12], [121.0, 124.8], [126.0, 127.36]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.59, 29.38, 0.0, 0.0, 0.0, 85.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["livestock, farm animals, working animals", 16.42], ["cattle, bovinae", 10.9], ["grunt", 5.7]], [["hum", 35.07], ["mains hum", 16.96], ["throbbing", 14.83]], null, null, null, null, null], "duration": [0.06, 0.61, 0.75, 1.03, 1.03, -0.24, 1.14, 12.35, 15.21, 62.8, 1.18, 1.12, 3.8, 1.36]} \ No newline at end of file diff --git a/annotations_1/wWRnv1V8iUY_filtered.json b/annotations_1/wWRnv1V8iUY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..42e2292c045d97b58181c1108999d09743babed5 --- /dev/null +++ b/annotations_1/wWRnv1V8iUY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.73], [8.0, 8.6], [10.0, 13.64], [19.0, 22.62], [26.0, 26.52], [27.0, 28.22], [40.0, 40.56], [43.0, 43.88], [44.0, 46.47], [49.0, 50.99], [51.0, 51.9], [54.0, 56.19], [57.0, 57.65], [59.0, 59.49], [62.0, 63.66], [65.0, 66.82], [68.0, 69.16], [72.0, 73.23], [75.0, 76.5], [81.0, 84.28], [90.0, 90.41], [92.0, 96.82], [103.0, 131.13], [133.0, 136.49], [141.0, 141.69], [146.0, 149.42], [152.0, 152.51], [154.0, 158.45]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, true, false, true, true, false, false, true, false, true], "silence_prob": [0.0, 0.0, 96.89, 34.02, 0.0, 0.0, 0.0, 0.0, 46.29, 0.0, 0.0, 32.6, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.06, 0.0, 30.37, 29.82, 97.73, 0.0, 30.33, 0.0, 39.46], "audiomae_on_audioset": [null, null, null, [["theremin", 42.52], ["music", 37.2], ["wind instrument, woodwind instrument", 2.14]], null, null, null, null, [["music", 19.56], ["speech", 16.36], ["musical instrument", 2.49]], null, null, [["music", 41.57], ["noise", 9.57], ["fart", 7.64]], null, null, null, null, null, null, null, [["music", 35.04], ["speech", 10.66], ["foghorn", 7.19]], null, [["music", 42.21], ["speech", 7.99], ["didgeridoo", 5.06]], [["speech", 36.37], ["music", 18.02], ["throbbing", 7.55]], null, null, [["music", 20.78], ["whale vocalization", 10.77], ["musical instrument", 7.86]], null, [["music", 24.47], ["speech", 20.52], ["moo", 9.98]]], "duration": [0.73, 0.6, 3.64, 3.62, 0.52, 1.22, 0.56, 0.88, 2.47, 1.99, 0.9, 2.19, 0.65, 0.49, 1.66, 1.82, 1.16, 1.23, 1.5, 3.28, 0.41, 4.82, 28.13, 3.49, 0.69, 3.42, 0.51, 4.45]} \ No newline at end of file diff --git a/annotations_1/wXDgyuxBuBU_filtered.json b/annotations_1/wXDgyuxBuBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a53be61512e7f1bac882c1a8816816be871c94f --- /dev/null +++ b/annotations_1/wXDgyuxBuBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 22.79], [39.0, 39.34], [41.0, 41.69], [42.0, 43.07], [44.0, 45.72], [47.0, 47.11], [48.0, 49.42], [57.0, 57.57], [60.0, 62.68], [63.0, 63.48], [67.0, 66.92], [67.0, 67.95], [78.0, 78.97], [89.0, 89.31], [91.0, 91.2], [92.0, 101.04], [104.0, 108.57], [111.0, 112.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.55, 38.91, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 54.11], ["speech", 8.71], ["fart", 8.13]], null], "duration": [0.79, 0.34, 0.69, 1.07, 1.72, 0.11, 1.42, 0.57, 2.68, 0.48, -0.08, 0.95, 0.97, 0.31, 0.2, 9.04, 4.57, 1.94]} \ No newline at end of file diff --git a/annotations_1/wXLFg03in2U_filtered.json b/annotations_1/wXLFg03in2U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dd5f6523bcb72dadf24f6b0160abe5ec7a31347c --- /dev/null +++ b/annotations_1/wXLFg03in2U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[39.0, 50.43], [52.0, 52.19], [54.0, 54.87], [57.0, 57.47], [58.0, 88.62], [91.0, 94.61], [96.0, 96.23], [97.0, 99.0], [100.0, 102.39], [104.0, 130.72]], "keep_status": [true, false, false, false, false, false, false, false, false, false], "silence_prob": [30.36, 0.0, 0.0, 0.0, 0.0, 32.36, 0.0, 32.01, 31.4, 30.11], "audiomae_on_audioset": [[["music", 25.7], ["hum", 11.3], ["throbbing", 9.08]], null, null, null, null, [["music", 65.54], ["didgeridoo", 14.17], ["musical instrument", 3.35]], null, [["music", 61.34], ["speech", 17.86], ["throbbing", 9.72]], [["music", 39.64], ["throbbing", 32.07], ["hum", 10.58]], [["music", 54.58], ["speech", 13.34], ["throbbing", 5.78]]], "duration": [11.43, 0.19, 0.87, 0.47, 30.62, 3.61, 0.23, 2.0, 2.39, 26.72]} \ No newline at end of file diff --git a/annotations_1/wXQ1EhVW2xQ_filtered.json b/annotations_1/wXQ1EhVW2xQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1311b53c1c5588e6f1ed3e6837c290fd55b30480 --- /dev/null +++ b/annotations_1/wXQ1EhVW2xQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.94], [4.0, 18.71], [22.0, 24.87], [26.0, 29.05], [30.0, 33.12], [34.0, 36.66], [39.0, 41.34], [42.0, 45.27], [46.0, 49.11], [50.0, 59.98], [60.0, 61.3], [63.0, 65.28], [66.0, 66.72], [67.0, 66.93], [67.0, 70.5], [73.0, 74.09], [76.0, 82.9], [86.0, 90.12], [93.0, 96.52], [97.0, 99.84], [104.0, 105.39], [107.0, 110.51], [119.0, 119.99], [121.0, 121.12], [121.0, 122.18], [124.0, 127.25], [129.0, 130.76], [132.0, 137.59], [138.0, 140.48], [141.0, 144.71], [146.0, 150.06], [152.0, 153.99], [155.0, 156.61], [161.0, 161.59]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 92.97, 87.55, 100.0, 100.0, 100.0, 100.0, 99.73, 99.84, 99.4, 0.0, 85.72, 0.0, 0.0, 68.93, 0.0, 97.54, 99.97, 82.07, 99.56, 0.0, 97.22, 0.0, 0.0, 0.0, 96.04, 0.0, 97.11, 90.43, 94.37, 94.22, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.94, 14.71, 2.87, 3.05, 3.12, 2.66, 2.34, 3.27, 3.11, 9.98, 1.3, 2.28, 0.72, -0.07, 3.5, 1.09, 6.9, 4.12, 3.52, 2.84, 1.39, 3.51, 0.99, 0.12, 1.18, 3.25, 1.76, 5.59, 2.48, 3.71, 4.06, 1.99, 1.61, 0.59]} \ No newline at end of file diff --git a/annotations_1/wZTaXoogvDQ_filtered.json b/annotations_1/wZTaXoogvDQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8423f0066be79f6038d028e9188249b5b3b66ee2 --- /dev/null +++ b/annotations_1/wZTaXoogvDQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.48], [15.0, 19.84], [21.0, 25.89], [28.0, 33.32], [34.0, 37.56], [40.0, 41.44], [43.0, 45.87], [47.0, 48.34], [50.0, 50.41], [51.0, 52.22], [55.0, 55.8], [59.0, 60.54], [64.0, 64.02], [64.0, 65.53], [76.0, 77.63], [78.0, 83.96], [85.0, 88.1], [89.0, 102.22], [102.0, 106.39], [107.0, 108.99], [110.0, 111.87], [113.0, 114.67], [115.0, 117.51], [118.0, 121.31]], "keep_status": [false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [53.22, 41.54, 54.23, 43.3, 63.64, 0.0, 64.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.89, 65.79, 44.34, 30.56, 0.0, 0.0, 0.0, 72.01, 51.28], "audiomae_on_audioset": [null, [["music", 31.56], ["throbbing", 17.33], ["hum", 15.56]], null, [["hum", 27.08], ["mains hum", 22.3], ["speech", 17.17]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["fly, housefly", 49.92], ["insect", 15.39], ["speech", 8.99]], [["speech", 54.33], ["fly, housefly", 7.5], ["mains hum", 4.8]], null, null, null, null, null], "duration": [3.48, 4.84, 4.89, 5.32, 3.56, 1.44, 2.87, 1.34, 0.41, 1.22, 0.8, 1.54, 0.02, 1.53, 1.63, 5.96, 3.1, 13.22, 4.39, 1.99, 1.87, 1.67, 2.51, 3.31]} \ No newline at end of file diff --git a/annotations_1/wZWNmL5VsIs_filtered.json b/annotations_1/wZWNmL5VsIs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c5ee387c30ad8d04b897430f152514ca7c55057d --- /dev/null +++ b/annotations_1/wZWNmL5VsIs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.18], [9.0, 22.35], [27.0, 31.23], [39.0, 39.63], [41.0, 42.15], [43.0, 45.15], [56.0, 56.15], [59.0, 77.18], [82.0, 82.8], [90.0, 90.31], [92.0, 122.18], [136.0, 137.74], [141.0, 143.46], [153.0, 155.44], [159.0, 190.24], [196.0, 196.45], [197.0, 199.0], [200.0, 201.02], [202.0, 204.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true], "silence_prob": [0.0, 34.48, 36.31, 0.0, 0.0, 37.55, 0.0, 34.02, 0.0, 0.0, 0.0, 0.0, 34.75, 31.79, 0.0, 0.0, 65.2, 0.0, 37.88], "audiomae_on_audioset": [null, [["music", 71.29], ["speech", 8.74], ["synthesizer", 4.86]], [["music", 48.03], ["speech", 24.95], ["throbbing", 2.72]], null, null, [["music", 70.48], ["synthesizer", 7.29], ["throbbing", 7.17]], null, [["music", 40.71], ["speech", 38.95], ["quack", 7.92]], null, null, null, null, [["music", 57.49], ["throbbing", 11.76], ["speech", 6.45]], [["music", 35.09], ["throbbing", 20.84], ["speech", 9.81]], null, null, null, null, [["music", 43.92], ["hum", 14.98], ["mains hum", 10.45]]], "duration": [1.18, 13.35, 4.23, 0.63, 1.15, 2.15, 0.15, 18.18, 0.8, 0.31, 30.18, 1.74, 2.46, 2.44, 31.24, 0.45, 2.0, 1.02, 2.16]} \ No newline at end of file diff --git a/annotations_1/wZcRiRs1x-8_filtered.json b/annotations_1/wZcRiRs1x-8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9274f272a0ebd915710269d2952b2fafc769df9b --- /dev/null +++ b/annotations_1/wZcRiRs1x-8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 36.98], [38.0, 43.85], [45.0, 75.57], [76.0, 87.76], [89.0, 111.64], [116.0, 116.67], [122.0, 139.16]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [70.72, 67.38, 0.0, 61.18, 29.77, 0.0, 28.4], "audiomae_on_audioset": [null, null, null, null, [["music", 86.83], ["swing music", 2.99], ["funk", 1.34]], null, [["cattle, bovinae", 44.11], ["moo", 30.89], ["livestock, farm animals, working animals", 24.5]]], "duration": [16.98, 5.85, 30.57, 11.76, 22.64, 0.67, 17.16]} \ No newline at end of file diff --git a/annotations_1/wZl5uWOpepU_filtered.json b/annotations_1/wZl5uWOpepU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a75b3118a28bf199b7edb3de4667edb503c8b7dc --- /dev/null +++ b/annotations_1/wZl5uWOpepU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 24.56], [28.0, 29.22], [39.0, 41.23], [60.0, 61.33], [77.0, 77.58]], "keep_status": [false, false, true, false, false], "silence_prob": [0.0, 0.0, 36.61, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 45.97], ["didgeridoo", 12.42], ["speech", 6.58]], null, null], "duration": [1.56, 1.22, 2.23, 1.33, 0.58]} \ No newline at end of file diff --git a/annotations_1/w_5OidjXy5o_filtered.json b/annotations_1/w_5OidjXy5o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c0cac86111ba558449ec3d62a34505e890486b36 --- /dev/null +++ b/annotations_1/w_5OidjXy5o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 26.64], [33.0, 45.69], [48.0, 48.69], [49.0, 48.79], [49.0, 49.03], [49.0, 49.08], [51.0, 72.39], [73.0, 79.96], [81.0, 90.17], [92.0, 94.91], [96.0, 97.11], [98.0, 117.95], [118.0, 118.44], [118.0, 160.89], [161.0, 161.25], [161.0, 161.33], [161.0, 161.45]], "keep_status": [false, true, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [31.0, 31.21, 0.0, 0.0, 0.0, 0.0, 30.77, 31.67, 31.05, 33.95, 0.0, 31.29, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 29.03], ["throbbing", 23.99], ["mains hum", 19.27]], [["fly, housefly", 22.0], ["music", 20.35], ["buzz", 6.86]], null, null, null, null, [["hum", 36.1], ["music", 23.52], ["throbbing", 14.87]], [["hum", 31.29], ["throbbing", 19.84], ["mains hum", 18.16]], [["hum", 35.35], ["music", 21.01], ["throbbing", 14.85]], [["music", 18.36], ["cacophony", 16.2], ["hum", 10.09]], null, [["hum", 66.65], ["mains hum", 15.8], ["throbbing", 7.85]], null, null, null, null, null], "duration": [16.64, 12.69, 0.69, -0.21, 0.03, 0.08, 21.39, 6.96, 9.17, 2.91, 1.11, 19.95, 0.44, 42.89, 0.25, 0.33, 0.45]} \ No newline at end of file diff --git a/annotations_1/w_92-vVfgrw_filtered.json b/annotations_1/w_92-vVfgrw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4002d6f0f47947fbb748fd8c899c5d3f884a593f --- /dev/null +++ b/annotations_1/w_92-vVfgrw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 33.18], [36.0, 36.78], [39.0, 40.1], [44.0, 45.42], [58.0, 58.62], [74.0, 75.41], [93.0, 93.06], [99.0, 99.03], [102.0, 120.34], [124.0, 132.95], [134.0, 133.95]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.46, 32.72, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 28.08], ["wind chime", 17.6], ["glockenspiel", 10.78]], [["music", 47.15], ["civil defense siren", 10.42], ["siren", 6.07]], null], "duration": [0.18, 0.78, 1.1, 1.42, 0.62, 1.41, 0.06, 0.03, 18.34, 8.95, -0.05]} \ No newline at end of file diff --git a/annotations_1/w_e5kx3ONfs_filtered.json b/annotations_1/w_e5kx3ONfs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..185cd6eaa3fef1ca5ef47fe450429423362d9e67 --- /dev/null +++ b/annotations_1/w_e5kx3ONfs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.53], [15.0, 17.54], [19.0, 19.5], [21.0, 21.79], [23.0, 24.19], [25.0, 25.91], [27.0, 28.38], [31.0, 31.18], [34.0, 35.55], [37.0, 39.38], [41.0, 43.78], [46.0, 46.23], [49.0, 49.98], [52.0, 56.57], [59.0, 61.42], [64.0, 75.42], [78.0, 91.47], [93.0, 95.67], [97.0, 98.15], [102.0, 103.44], [105.0, 106.49]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 56.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.5, 41.16, 0.0, 0.0, 46.72, 43.53, 45.69, 62.68, 96.54, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 48.42], ["mains hum", 5.46], ["ambient music", 4.96]], [["livestock, farm animals, working animals", 32.02], ["cattle, bovinae", 28.95], ["moo", 21.85]], null, null, [["singing bowl", 36.42], ["music", 32.33], ["tubular bells", 6.41]], [["music", 27.66], ["singing bowl", 18.61], ["speech", 7.53]], [["music", 61.17], ["singing bowl", 10.91], ["bell", 6.01]], null, null, null, null, null], "duration": [1.53, 2.54, 0.5, 0.79, 1.19, 0.91, 1.38, 0.18, 1.55, 2.38, 2.78, 0.23, 0.98, 4.57, 2.42, 11.42, 13.47, 2.67, 1.15, 1.44, 1.49]} \ No newline at end of file diff --git a/annotations_1/wa1uJbTy6XE_filtered.json b/annotations_1/wa1uJbTy6XE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b616512aed5293d4cffbe113f3a983f2fe26c9e --- /dev/null +++ b/annotations_1/wa1uJbTy6XE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.63], [14.0, 18.18], [19.0, 30.43], [38.0, 60.37], [61.0, 62.61], [65.0, 79.39], [84.0, 149.72], [152.0, 152.41], [153.0, 155.19], [157.0, 158.14], [164.0, 164.96], [166.0, 168.0], [169.0, 171.59]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 31.49, 32.57, 31.84, 0.0, 32.92, 0.0, 0.0, 95.64, 0.0, 0.0, 40.29, 48.06], "audiomae_on_audioset": [null, [["speech", 59.83], ["music", 3.77], ["rumble", 2.68]], [["livestock, farm animals, working animals", 56.08], ["music", 15.93], ["cattle, bovinae", 10.82]], [["speech", 48.0], ["music", 24.54], ["buzz", 4.08]], null, [["music", 39.43], ["mains hum", 13.45], ["hum", 11.95]], null, null, null, null, null, [["fart", 19.31], ["mosquito", 10.85], ["hum", 10.6]], [["music", 80.44], ["hum", 2.17], ["musical instrument", 2.15]]], "duration": [1.63, 4.18, 11.43, 22.37, 1.61, 14.39, 65.72, 0.41, 2.19, 1.14, 0.96, 2.0, 2.59]} \ No newline at end of file diff --git a/annotations_1/wa_9eIwrEK8_filtered.json b/annotations_1/wa_9eIwrEK8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fbdb653bfa5675ce117fcdf553f4bdff2d879dd --- /dev/null +++ b/annotations_1/wa_9eIwrEK8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 11.67], [15.0, 22.91], [24.0, 41.91], [44.0, 46.8], [48.0, 69.87], [71.0, 71.56], [79.0, 141.84], [143.0, 142.79], [144.0, 144.78], [145.0, 146.42], [148.0, 148.49], [149.0, 151.09], [152.0, 153.54], [156.0, 164.52]], "keep_status": [true, true, true, true, false, false, false, false, false, false, false, true, false, true], "silence_prob": [30.41, 30.78, 29.78, 28.56, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.43, 0.0, 30.52], "audiomae_on_audioset": [[["music", 46.86], ["speech", 15.03], ["didgeridoo", 5.69]], [["music", 38.03], ["speech", 9.27], ["throbbing", 5.29]], [["music", 27.16], ["buzz", 18.54], ["didgeridoo", 7.37]], [["music", 36.68], ["mains hum", 18.89], ["hum", 10.97]], [["speech", 38.93], ["music", 38.07], ["explosion", 3.18]], null, null, null, null, null, null, [["music", 33.35], ["speech", 22.65], ["whale vocalization", 4.14]], null, [["music", 57.24], ["gunshot, gunfire", 5.17], ["speech", 4.45]]], "duration": [3.67, 7.91, 17.91, 2.8, 21.87, 0.56, 62.84, -0.21, 0.78, 1.42, 0.49, 2.09, 1.54, 8.52]} \ No newline at end of file diff --git a/annotations_1/waeNIUB5wz4_filtered.json b/annotations_1/waeNIUB5wz4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5a264f5eafe4ba1061bda8d1b909fe5f59a1d24 --- /dev/null +++ b/annotations_1/waeNIUB5wz4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.49], [14.0, 14.61], [19.0, 19.01], [28.0, 30.25], [35.0, 36.85], [37.0, 38.2], [39.0, 64.66], [69.0, 78.7], [79.0, 88.28], [96.0, 100.85], [101.0, 103.08], [105.0, 113.09], [116.0, 119.25], [122.0, 122.67], [125.0, 126.22], [127.0, 127.3], [128.0, 128.75]], "keep_status": [true, false, false, true, false, false, false, false, true, false, false, true, false, false, false, false, false], "silence_prob": [33.71, 0.0, 0.0, 40.06, 0.0, 0.0, 33.45, 31.37, 31.98, 31.57, 35.4, 33.48, 87.55, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 45.44], ["boing", 6.89], ["musical instrument", 5.14]], null, null, [["cattle, bovinae", 12.29], ["moo", 11.0], ["noise", 10.32]], null, null, [["music", 50.21], ["sidetone", 22.2], ["throbbing", 6.28]], [["music", 30.78], ["sidetone", 24.56], ["speech", 15.87]], [["music", 49.58], ["sidetone", 7.13], ["speech", 5.53]], [["music", 50.67], ["speech", 19.7], ["sidetone", 11.0]], [["music", 60.26], ["speech", 15.45], ["musical instrument", 3.12]], [["fart", 30.71], ["music", 23.07], ["throbbing", 10.24]], null, null, null, null, null], "duration": [2.49, 0.61, 0.01, 2.25, 1.85, 1.2, 25.66, 9.7, 9.28, 4.85, 2.08, 8.09, 3.25, 0.67, 1.22, 0.3, 0.75]} \ No newline at end of file diff --git a/annotations_1/wbROoMNi8Ho_filtered.json b/annotations_1/wbROoMNi8Ho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e52ebfca14b49c482205bbde5ce76a751021905 --- /dev/null +++ b/annotations_1/wbROoMNi8Ho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.73], [5.0, 5.27], [6.0, 27.95], [30.0, 34.57], [35.0, 52.19], [53.0, 55.16], [56.0, 61.6], [62.0, 65.75], [66.0, 72.25], [75.0, 76.15], [76.0, 85.7], [86.0, 88.75], [90.0, 92.3], [94.0, 95.2], [96.0, 99.94], [100.0, 105.41], [107.0, 113.63], [115.0, 117.53], [119.0, 128.92], [134.0, 138.55], [140.0, 139.95], [140.0, 140.02], [141.0, 144.75], [148.0, 151.04], [155.0, 157.74], [158.0, 169.16], [171.0, 176.22], [177.0, 184.42]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.18, 54.5, 39.3, 100.0, 100.0, 99.4, 73.97, 0.0, 62.78, 99.8, 99.97, 0.0, 98.93, 49.64, 92.15, 53.04, 42.91, 88.83, 0.0, 0.0, 99.71, 88.1, 98.01, 42.04, 99.56, 99.96], "audiomae_on_audioset": [null, null, null, null, [["speech", 20.44], ["fly, housefly", 9.7], ["music", 9.57]], null, null, null, null, null, null, null, null, null, null, [["speech", 79.69], ["telephone", 10.38], ["radio", 4.71]], null, null, [["speech", 45.45], ["bouncing", 7.42], ["boing", 4.1]], null, null, null, null, null, null, [["speech", 45.23], ["music", 26.65], ["crack", 17.39]], null, null], "duration": [1.73, 0.27, 21.95, 4.57, 17.19, 2.16, 5.6, 3.75, 6.25, 1.15, 9.7, 2.75, 2.3, 1.2, 3.94, 5.41, 6.63, 2.53, 9.92, 4.55, -0.05, 0.02, 3.75, 3.04, 2.74, 11.16, 5.22, 7.42]} \ No newline at end of file diff --git a/annotations_1/wbwXHxqxDwc_filtered.json b/annotations_1/wbwXHxqxDwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70c480f16eef32ec4f76da2b3b3f08fbbda21cc4 --- /dev/null +++ b/annotations_1/wbwXHxqxDwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 20.82], [24.0, 23.75], [24.0, 25.86], [32.0, 42.74], [44.0, 45.71], [47.0, 47.06], [48.0, 48.37], [49.0, 51.22], [55.0, 55.53], [57.0, 57.92], [58.0, 59.22], [61.0, 63.56], [66.0, 66.24], [67.0, 68.22], [70.0, 70.36], [71.0, 71.32], [72.0, 72.94], [74.0, 77.21], [92.0, 101.04], [105.0, 106.79], [107.0, 111.3], [114.0, 114.56], [117.0, 118.4], [120.0, 120.88], [122.0, 129.19], [129.0, 133.73], [135.0, 135.65], [136.0, 136.53], [138.0, 138.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 57.4, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 0.0, 84.07, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 37.2, 0.0, 36.39, 0.0, 0.0, 0.0, 37.57, 48.1, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 43.15], ["hum", 13.36], ["radio", 8.54]], null, [["speech", 52.04], ["radio", 30.03], ["sidetone", 5.61]], null, null, null, [["noise", 40.09], ["sidetone", 25.25], ["speech", 7.17]], [["whale vocalization", 75.97], ["mains hum", 6.65], ["hum", 2.74]], null, null, null], "duration": [0.82, -0.25, 1.86, 10.74, 1.71, 0.06, 0.37, 2.22, 0.53, 0.92, 1.22, 2.56, 0.24, 1.22, 0.36, 0.32, 0.94, 3.21, 9.04, 1.79, 4.3, 0.56, 1.4, 0.88, 7.19, 4.73, 0.65, 0.53, 0.87]} \ No newline at end of file diff --git a/annotations_1/wcjCEUeC8nk_filtered.json b/annotations_1/wcjCEUeC8nk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6492c5a32507fc43769ec4e4abf5bc8049dbe912 --- /dev/null +++ b/annotations_1/wcjCEUeC8nk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.46], [9.0, 15.94], [16.0, 23.26], [24.0, 24.49], [29.0, 29.4], [36.0, 36.83], [37.0, 39.04], [40.0, 45.33], [47.0, 51.29], [54.0, 69.75], [72.0, 73.87], [75.0, 76.81], [78.0, 78.54], [79.0, 79.32], [84.0, 136.73], [138.0, 139.4], [141.0, 157.28]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 71.0, 36.2, 0.0, 0.0, 0.0, 62.37, 99.05, 48.52, 33.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.52], "audiomae_on_audioset": [null, null, [["speech", 64.5], ["grunt", 6.28], ["beatboxing", 5.17]], null, null, null, null, null, [["speech", 37.37], ["music", 5.14], ["fart", 4.78]], [["music", 67.91], ["speech", 4.45], ["throbbing", 4.09]], null, null, null, null, null, null, [["music", 54.71], ["speech", 11.21], ["theremin", 7.14]]], "duration": [1.46, 6.94, 7.26, 0.49, 0.4, 0.83, 2.04, 5.33, 4.29, 15.75, 1.87, 1.81, 0.54, 0.32, 52.73, 1.4, 16.28]} \ No newline at end of file diff --git a/annotations_1/wdS1l__SWms_filtered.json b/annotations_1/wdS1l__SWms_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67cf93df51e32a873d79996f48079dd515e0b87f --- /dev/null +++ b/annotations_1/wdS1l__SWms_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 14.79], [19.0, 40.58], [42.0, 44.98], [48.0, 81.99], [83.0, 83.07], [84.0, 84.48], [85.0, 91.49], [100.0, 100.08], [100.0, 108.87], [114.0, 119.25], [120.0, 121.07], [123.0, 122.76], [125.0, 125.54], [126.0, 126.6], [128.0, 128.44], [130.0, 130.94], [136.0, 144.22], [146.0, 172.35]], "keep_status": [true, false, true, false, false, false, false, false, true, true, false, false, false, false, false, false, true, true], "silence_prob": [42.88, 31.19, 36.8, 0.0, 0.0, 0.0, 31.44, 0.0, 33.58, 42.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.05, 32.2], "audiomae_on_audioset": [[["music", 36.98], ["speech", 21.4], ["theremin", 5.32]], [["music", 85.67], ["musical instrument", 2.89], ["brass instrument", 2.02]], [["music", 42.69], ["musical instrument", 5.84], ["hum", 4.93]], null, null, null, [["speech", 32.7], ["fart", 22.02], ["music", 18.27]], null, [["speech", 20.83], ["didgeridoo", 18.68], ["music", 15.78]], [["music", 40.28], ["theremin", 9.54], ["whack, thwack", 6.79]], null, null, null, null, null, null, [["music", 45.94], ["speech", 14.4], ["foghorn", 7.23]], [["music", 61.58], ["musical instrument", 4.2], ["theremin", 3.63]]], "duration": [8.79, 21.58, 2.98, 33.99, 0.07, 0.48, 6.49, 0.08, 8.87, 5.25, 1.07, -0.24, 0.54, 0.6, 0.44, 0.94, 8.22, 26.35]} \ No newline at end of file diff --git a/annotations_1/wdVtcHMYAM4_filtered.json b/annotations_1/wdVtcHMYAM4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aed65552475803c2a090608290bb8e03958d297d --- /dev/null +++ b/annotations_1/wdVtcHMYAM4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.94], [3.0, 27.31], [28.0, 28.39], [30.0, 30.32], [32.0, 33.2], [35.0, 35.53], [36.0, 67.31], [71.0, 73.18], [74.0, 76.17], [78.0, 92.33], [101.0, 100.72], [101.0, 102.39]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 42.81, 0.0, 0.0, 0.0, 0.0, 0.0, 75.23, 48.23, 37.97, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 35.25], ["breaking", 26.7], ["thunk", 12.93]], null, null, null, null, null, null, [["frog", 27.76], ["music", 24.01], ["sidetone", 10.19]], [["music", 62.72], ["speech", 13.82], ["echo", 2.32]], null, null], "duration": [-0.06, 24.31, 0.39, 0.32, 1.2, 0.53, 31.31, 2.18, 2.17, 14.33, -0.28, 1.39]} \ No newline at end of file diff --git a/annotations_1/wdcRrpMHIGM_filtered.json b/annotations_1/wdcRrpMHIGM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4eeb61164c312f49cfca5c8be898d4d12370c9d7 --- /dev/null +++ b/annotations_1/wdcRrpMHIGM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.68], [6.0, 7.11], [8.0, 9.71], [11.0, 13.1], [15.0, 20.16], [21.0, 23.99], [25.0, 25.08], [27.0, 29.51], [34.0, 40.15], [42.0, 43.12], [44.0, 45.42], [46.0, 48.17], [50.0, 55.27], [57.0, 62.97], [63.0, 112.5], [114.0, 116.38], [120.0, 120.9], [122.0, 123.69], [125.0, 180.49], [183.0, 184.08], [185.0, 185.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [34.1, 0.0, 0.0, 35.88, 32.61, 37.37, 0.0, 29.84, 42.24, 0.0, 0.0, 34.6, 29.01, 30.38, 0.0, 76.53, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 30.98], ["mains hum", 27.74], ["speech", 16.46]], null, null, [["mains hum", 48.44], ["hum", 25.09], ["music", 8.9]], [["music", 40.74], ["mains hum", 20.32], ["hum", 20.07]], [["mains hum", 35.43], ["hum", 22.75], ["music", 15.08]], null, [["music", 71.94], ["didgeridoo", 7.28], ["theremin", 2.5]], [["music", 56.85], ["hum", 9.96], ["didgeridoo", 7.47]], null, null, [["speech", 26.72], ["mains hum", 26.59], ["hum", 17.16]], [["music", 71.58], ["reverberation", 4.69], ["scary music", 3.13]], [["music", 50.8], ["speech", 21.02], ["mains hum", 5.22]], null, null, null, null, null, null, null], "duration": [3.68, 1.11, 1.71, 2.1, 5.16, 2.99, 0.08, 2.51, 6.15, 1.12, 1.42, 2.17, 5.27, 5.97, 49.5, 2.38, 0.9, 1.69, 55.49, 1.08, 0.79]} \ No newline at end of file diff --git a/annotations_1/weEay_Y4EeE_filtered.json b/annotations_1/weEay_Y4EeE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d94dab36a48dd25b413f0dfffb5509735eb2bf48 --- /dev/null +++ b/annotations_1/weEay_Y4EeE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 35.34], [36.0, 51.41], [52.0, 52.2]], "keep_status": [false, false, false], "silence_prob": [97.64, 83.7, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [8.34, 15.41, 0.2]} \ No newline at end of file diff --git a/annotations_1/wfAfwKUkfHU_filtered.json b/annotations_1/wfAfwKUkfHU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e3d154451d52333e69f12b256f628b1811063561 --- /dev/null +++ b/annotations_1/wfAfwKUkfHU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.32], [16.0, 20.87], [22.0, 44.64], [46.0, 47.68], [49.0, 49.99], [51.0, 53.74], [56.0, 57.81], [59.0, 60.54], [65.0, 65.48], [67.0, 77.62], [78.0, 79.57], [82.0, 83.69], [85.0, 90.83], [94.0, 102.12], [103.0, 107.4], [109.0, 112.08], [116.0, 120.07], [122.0, 123.99], [125.0, 126.28], [130.0, 138.5], [140.0, 141.02], [142.0, 143.94], [147.0, 149.66], [151.0, 153.1], [154.0, 155.88], [158.0, 164.22], [166.0, 170.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 80.46, 59.77, 0.0, 0.0, 97.33, 0.0, 0.0, 0.0, 52.56, 0.0, 0.0, 58.72, 37.08, 53.04, 55.81, 53.4, 0.0, 0.0, 76.2, 0.0, 0.0, 97.33, 98.8, 0.0, 70.86, 45.75], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 71.26], ["soundtrack music", 6.37], ["scary music", 5.65]], null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.51], ["hum", 9.79], ["whale vocalization", 7.19]]], "duration": [1.32, 4.87, 22.64, 1.68, 0.99, 2.74, 1.81, 1.54, 0.48, 10.62, 1.57, 1.69, 5.83, 8.12, 4.4, 3.08, 4.07, 1.99, 1.28, 8.5, 1.02, 1.94, 2.66, 2.1, 1.88, 6.22, 4.36]} \ No newline at end of file diff --git a/annotations_1/wfq7O3AgXdE_filtered.json b/annotations_1/wfq7O3AgXdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc9a5620bc8bfcbbd0e93498df651f931c7ff964 --- /dev/null +++ b/annotations_1/wfq7O3AgXdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.12], [6.0, 7.48], [8.0, 10.02], [15.0, 16.43], [17.0, 17.61], [18.0, 18.99], [20.0, 19.8], [23.0, 24.16], [36.0, 36.73], [39.0, 39.58], [45.0, 45.89], [47.0, 47.22], [49.0, 49.13], [53.0, 53.15], [56.0, 56.62], [61.0, 61.32], [62.0, 69.08], [70.0, 70.51], [71.0, 71.69], [76.0, 76.54], [79.0, 79.89], [82.0, 82.07], [82.0, 84.03], [86.0, 87.22], [88.0, 88.84], [90.0, 90.41], [93.0, 94.14], [94.0, 98.12], [98.0, 101.28], [106.0, 106.78], [108.0, 107.82], [110.0, 126.49], [127.0, 127.62], [128.0, 132.04], [136.0, 136.49], [137.0, 137.81], [141.0, 142.79], [144.0, 144.19], [147.0, 148.2], [149.0, 150.82], [151.0, 152.36], [154.0, 161.27], [163.0, 169.82], [171.0, 174.46], [176.0, 176.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.16, 0.0, 95.37, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.68, 0.0, 0.0, 0.0, 0.0, 0.0, 99.59, 0.0, 0.0, 0.0, 0.0, 99.05, 95.09, 0.0, 0.0, 63.53, 0.0, 85.35, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.43, 86.27, 91.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.12, 1.48, 2.02, 1.43, 0.61, 0.99, -0.2, 1.16, 0.73, 0.58, 0.89, 0.22, 0.13, 0.15, 0.62, 0.32, 7.08, 0.51, 0.69, 0.54, 0.89, 0.07, 2.03, 1.22, 0.84, 0.41, 1.14, 4.12, 3.28, 0.78, -0.18, 16.49, 0.62, 4.04, 0.49, 0.81, 1.79, 0.19, 1.2, 1.82, 1.36, 7.27, 6.82, 3.46, 0.44]} \ No newline at end of file diff --git a/annotations_1/wgkxKdTVrHo_filtered.json b/annotations_1/wgkxKdTVrHo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7d179b4ca00dff06d94cf1f899c28f5cd90a5e87 --- /dev/null +++ b/annotations_1/wgkxKdTVrHo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.4], [3.0, 6.78], [7.0, 7.8], [9.0, 10.64], [14.0, 16.88], [19.0, 24.07], [26.0, 27.4], [28.0, 29.84], [32.0, 43.58], [44.0, 48.3], [50.0, 50.11], [56.0, 56.96], [63.0, 63.48], [64.0, 75.47], [77.0, 79.66], [84.0, 84.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.97, 0.0, 0.0, 99.05, 77.36, 0.0, 0.0, 34.73, 42.58, 0.0, 0.0, 0.0, 54.3, 53.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 71.15], ["musical instrument", 5.17], ["didgeridoo", 3.46]], [["music", 60.8], ["frog", 6.66], ["speech", 6.23]], null, null, null, null, null, null], "duration": [0.4, 3.78, 0.8, 1.64, 2.88, 5.07, 1.4, 1.84, 11.58, 4.3, 0.11, 0.96, 0.48, 11.47, 2.66, 0.62]} \ No newline at end of file diff --git a/annotations_1/whFoAKQ10gY_filtered.json b/annotations_1/whFoAKQ10gY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ca7cbcac144e86918c3d93bcb52e02fe5a714b01 --- /dev/null +++ b/annotations_1/whFoAKQ10gY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.71], [17.0, 19.01], [20.0, 22.1], [23.0, 23.18], [26.0, 34.21], [44.0, 44.76], [55.0, 55.09], [55.0, 56.54]], "keep_status": [false, false, true, false, false, false, false, false], "silence_prob": [0.0, 51.66, 43.71, 0.0, 58.47, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 26.45], ["musical instrument", 6.91], ["guitar", 6.72]], null, null, null, null, null], "duration": [0.71, 2.01, 2.1, 0.18, 8.21, 0.76, 0.09, 1.54]} \ No newline at end of file diff --git a/annotations_1/wjVPv5aO_no_filtered.json b/annotations_1/wjVPv5aO_no_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0098d186b32b27fa18784cb206261cee23472c4c --- /dev/null +++ b/annotations_1/wjVPv5aO_no_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.95], [7.0, 8.02], [10.0, 10.66], [13.0, 12.85], [16.0, 32.83], [36.0, 78.41], [81.0, 93.14], [95.0, 99.67], [102.0, 102.59], [114.0, 114.29], [115.0, 115.62], [127.0, 127.33]], "keep_status": [false, false, false, false, true, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.32, 0.0, 30.16, 32.37, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 22.65], ["screaming", 9.38], ["whack, thwack", 6.76]], null, [["vehicle", 29.18], ["car", 19.56], ["speech", 8.34]], [["speech", 23.7], ["music", 17.85], ["noise", 6.61]], null, null, null, null], "duration": [0.95, 1.02, 0.66, -0.15, 16.83, 42.41, 12.14, 4.67, 0.59, 0.29, 0.62, 0.33]} \ No newline at end of file diff --git a/annotations_1/wkoHQdbhfOc_filtered.json b/annotations_1/wkoHQdbhfOc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b6db43a29fa10ba798bb9e4d64a1b082898415d1 --- /dev/null +++ b/annotations_1/wkoHQdbhfOc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 25.62], [26.0, 53.08], [54.0, 59.63], [62.0, 66.16], [68.0, 70.12], [73.0, 75.63], [88.0, 88.82], [90.0, 90.71], [91.0, 96.31], [98.0, 111.18], [112.0, 115.26], [116.0, 132.26], [133.0, 137.61], [138.0, 145.45], [147.0, 149.52], [152.0, 158.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [79.59, 58.72, 82.25, 98.99, 99.59, 84.98, 0.0, 0.0, 56.55, 73.97, 99.56, 99.48, 87.74, 56.1, 97.33, 98.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [13.62, 27.08, 5.63, 4.16, 2.12, 2.63, 0.82, 0.71, 5.31, 13.18, 3.26, 16.26, 4.61, 7.45, 2.52, 6.9]} \ No newline at end of file diff --git a/annotations_1/wmXFSQdF3PM_filtered.json b/annotations_1/wmXFSQdF3PM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2acc59a8607edf2879b812683ff209d854e19ae6 --- /dev/null +++ b/annotations_1/wmXFSQdF3PM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.1], [8.0, 7.55], [11.0, 12.88], [15.0, 15.01], [17.0, 18.13], [21.0, 21.91], [24.0, 81.95], [83.0, 82.98], [84.0, 102.17], [104.0, 122.86], [123.0, 124.44], [126.0, 140.76], [142.0, 142.75], [146.0, 146.92], [148.0, 148.14], [150.0, 150.96], [152.0, 152.58], [153.0, 155.29], [157.0, 156.76], [158.0, 164.88], [167.0, 167.39]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [30.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.43, 30.33, 0.0, 30.73, 0.0, 0.0, 0.0, 0.0, 0.0, 33.5, 0.0, 35.28, 0.0], "audiomae_on_audioset": [[["fire", 21.1], ["speech", 15.95], ["eruption", 5.63]], null, null, null, null, null, null, null, [["music", 73.07], ["hum", 6.16], ["scary music", 3.01]], [["music", 35.4], ["hum", 13.75], ["speech", 11.42]], null, [["music", 47.58], ["hum", 19.92], ["throbbing", 14.27]], null, null, null, null, null, [["music", 41.17], ["speech", 25.49], ["didgeridoo", 6.32]], null, [["hum", 39.5], ["sidetone", 12.72], ["speech", 9.75]], null], "duration": [2.1, -0.45, 1.88, 0.01, 1.13, 0.91, 57.95, -0.02, 18.17, 18.86, 1.44, 14.76, 0.75, 0.92, 0.14, 0.96, 0.58, 2.29, -0.24, 6.88, 0.39]} \ No newline at end of file diff --git a/annotations_1/wmbN_BXQaho_filtered.json b/annotations_1/wmbN_BXQaho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..67c8c95d471065e9a5164eb90736e296fd18a509 --- /dev/null +++ b/annotations_1/wmbN_BXQaho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.34], [6.0, 7.47], [8.0, 8.19], [11.0, 13.78], [16.0, 16.46], [17.0, 16.8], [18.0, 19.18], [19.0, 21.69], [23.0, 24.34], [25.0, 26.59], [28.0, 28.11], [29.0, 29.1], [30.0, 33.3], [35.0, 50.65], [51.0, 50.7], [51.0, 73.67], [77.0, 81.33], [82.0, 113.97], [119.0, 137.52], [140.0, 140.9], [143.0, 145.79], [147.0, 149.39], [154.0, 154.6], [156.0, 156.61], [158.0, 158.23], [159.0, 160.1], [163.0, 164.08], [166.0, 167.59], [169.0, 175.63]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [67.76, 0.0, 0.0, 70.58, 0.0, 0.0, 0.0, 62.89, 0.0, 0.0, 0.0, 0.0, 73.21, 33.62, 0.0, 33.63, 34.73, 0.0, 37.08, 0.0, 61.97, 70.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.86], ["speech", 17.1], ["fart", 12.38]], null, [["hum", 25.31], ["speech", 15.24], ["sidetone", 8.41]], [["music", 45.13], ["didgeridoo", 7.73], ["musical instrument", 4.52]], null, [["noise", 27.12], ["hum", 17.77], ["mains hum", 11.19]], null, null, null, null, null, null, null, null, null, null], "duration": [3.34, 1.47, 0.19, 2.78, 0.46, -0.2, 1.18, 2.69, 1.34, 1.59, 0.11, 0.1, 3.3, 15.65, -0.3, 22.67, 4.33, 31.97, 18.52, 0.9, 2.79, 2.39, 0.6, 0.61, 0.23, 1.1, 1.08, 1.59, 6.63]} \ No newline at end of file diff --git a/annotations_1/wmu9xg12xuc_filtered.json b/annotations_1/wmu9xg12xuc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..433b38f187b6c8612ddadf117aa03c68e31533af --- /dev/null +++ b/annotations_1/wmu9xg12xuc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.77], [18.0, 26.67], [28.0, 38.57], [41.0, 43.71], [45.0, 48.98], [51.0, 51.63], [56.0, 55.83], [56.0, 58.63], [62.0, 61.59], [64.0, 74.12], [76.0, 81.41], [83.0, 87.81], [91.0, 92.42], [94.0, 96.26], [96.0, 101.95], [106.0, 110.46]], "keep_status": [true, false, true, false, false, false, false, true, false, false, false, true, false, true, false, true], "silence_prob": [37.58, 32.81, 29.12, 29.84, 30.18, 0.0, 0.0, 30.73, 0.0, 29.83, 29.58, 28.95, 0.0, 29.8, 30.27, 28.78], "audiomae_on_audioset": [[["music", 34.14], ["hum", 9.88], ["mains hum", 5.39]], [["speech", 26.07], ["throbbing", 25.78], ["music", 25.3]], [["music", 39.19], ["speech", 22.09], ["vehicle", 4.68]], [["speech", 48.97], ["music", 22.7], ["hum", 4.2]], [["hum", 47.99], ["mains hum", 20.78], ["music", 11.5]], null, null, [["music", 19.49], ["throbbing", 14.93], ["hum", 10.54]], null, [["throbbing", 44.44], ["music", 44.25], ["hum", 5.07]], [["music", 44.19], ["speech", 30.03], ["throbbing", 11.1]], [["music", 40.14], ["speech", 10.37], ["noise", 6.13]], null, [["music", 30.94], ["angry music", 9.29], ["brass instrument", 4.82]], [["throbbing", 66.38], ["music", 13.09], ["hum", 11.29]], [["music", 32.43], ["smash, crash", 17.5], ["throbbing", 15.52]]], "duration": [2.77, 8.67, 10.57, 2.71, 3.98, 0.63, -0.17, 2.63, -0.41, 10.12, 5.41, 4.81, 1.42, 2.26, 5.95, 4.46]} \ No newline at end of file diff --git a/annotations_1/wn-e7FlYRJU_filtered.json b/annotations_1/wn-e7FlYRJU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6d5e8c61c01e9b6b7b64d8091a867ad1943ca2d --- /dev/null +++ b/annotations_1/wn-e7FlYRJU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 26.13], [27.0, 27.65], [50.0, 52.05], [54.0, 53.87], [55.0, 55.85], [62.0, 63.04], [65.0, 65.47], [80.0, 81.58], [84.0, 85.11], [98.0, 98.34], [103.0, 103.62], [106.0, 107.16], [117.0, 116.92], [119.0, 119.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 98.99, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.13, 0.65, 2.05, -0.13, 0.85, 1.04, 0.47, 1.58, 1.11, 0.34, 0.62, 1.16, -0.08, 0.53]} \ No newline at end of file diff --git a/annotations_1/wn_8YBvVugo_filtered.json b/annotations_1/wn_8YBvVugo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1e0a726fc4fc4fd7ff9a0223447c2a53b0c47c2 --- /dev/null +++ b/annotations_1/wn_8YBvVugo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 32.95], [34.0, 34.89], [37.0, 78.16], [80.0, 80.25], [83.0, 83.15], [85.0, 84.86], [95.0, 99.57], [100.0, 100.55], [102.0, 105.04]], "keep_status": [true, false, false, false, false, false, false, false, true], "silence_prob": [31.26, 0.0, 0.0, 0.0, 0.0, 0.0, 34.03, 0.0, 36.46], "audiomae_on_audioset": [[["music", 27.25], ["speech", 16.15], ["throbbing", 7.84]], null, null, null, null, null, [["music", 59.79], ["throbbing", 19.47], ["hum", 12.09]], null, [["music", 37.23], ["speech", 10.74], ["synthesizer", 9.96]]], "duration": [11.95, 0.89, 41.16, 0.25, 0.15, -0.14, 4.57, 0.55, 3.04]} \ No newline at end of file diff --git a/annotations_1/wnvRIdndQdk_filtered.json b/annotations_1/wnvRIdndQdk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71ff9719eb06cada80dce99f9313826cf2e96317 --- /dev/null +++ b/annotations_1/wnvRIdndQdk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.75], [9.0, 17.42], [19.0, 23.57], [24.0, 49.72], [50.0, 49.94], [50.0, 50.52], [53.0, 72.87], [75.0, 97.39], [102.0, 116.67]], "keep_status": [false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 39.46, 52.98, 30.6, 0.0, 0.0, 29.67, 30.32, 29.07], "audiomae_on_audioset": [null, [["didgeridoo", 53.44], ["music", 26.74], ["whale vocalization", 4.51]], null, [["whale vocalization", 16.24], ["hum", 15.0], ["throbbing", 11.43]], null, null, [["music", 55.1], ["throbbing", 10.18], ["outside, rural or natural", 2.88]], [["music", 43.45], ["hum", 22.09], ["mains hum", 9.97]], [["hum", 31.59], ["music", 29.5], ["throbbing", 17.4]]], "duration": [1.75, 8.42, 4.57, 25.72, -0.06, 0.52, 19.87, 22.39, 14.67]} \ No newline at end of file diff --git a/annotations_1/wnwsSOrmEKI_filtered.json b/annotations_1/wnwsSOrmEKI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..995c37ded454e1ff0fce3a1885833944bcf464da --- /dev/null +++ b/annotations_1/wnwsSOrmEKI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 27.48], [28.0, 39.39], [43.0, 44.61], [45.0, 45.35], [45.0, 48.51], [51.0, 53.7], [55.0, 59.7], [66.0, 66.38], [73.0, 73.7], [77.0, 78.76], [79.0, 82.65], [83.0, 84.96], [89.0, 89.92], [90.0, 90.56], [92.0, 91.64], [93.0, 93.21], [99.0, 99.05], [105.0, 105.46], [108.0, 111.37], [114.0, 114.86], [117.0, 126.87], [128.0, 133.27], [136.0, 154.48]], "keep_status": [false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.48, 36.71, 0.0, 0.0, 44.78, 49.82, 64.41, 0.0, 0.0, 0.0, 45.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.61, 0.0, 45.78, 100.0, 85.9], "audiomae_on_audioset": [null, [["speech", 56.65], ["sidetone", 34.42], ["dial tone", 1.41]], null, null, [["speech", 16.93], ["hum", 11.9], ["whale vocalization", 10.14]], [["burping, eructation", 22.88], ["hum", 14.7], ["speech", 8.13]], null, null, null, null, [["fart", 23.22], ["grunt", 13.89], ["growling", 6.55]], null, null, null, null, null, null, null, null, null, [["speech", 83.42], ["grunt", 10.12], ["male speech, man speaking", 2.4]], null, null], "duration": [21.48, 11.39, 1.61, 0.35, 3.51, 2.7, 4.7, 0.38, 0.7, 1.76, 3.65, 1.96, 0.92, 0.56, -0.36, 0.21, 0.05, 0.46, 3.37, 0.86, 9.87, 5.27, 18.48]} \ No newline at end of file diff --git a/annotations_1/woLbaFLoJI8_filtered.json b/annotations_1/woLbaFLoJI8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3e85ce63c46d49c1b3239ca1964932ce6af20650 --- /dev/null +++ b/annotations_1/woLbaFLoJI8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.92], [3.0, 5.14], [6.0, 7.08], [10.0, 11.8], [14.0, 15.03], [16.0, 17.56], [19.0, 19.2], [20.0, 21.41], [23.0, 24.61], [30.0, 30.11], [41.0, 59.41], [63.0, 64.18], [67.0, 68.64], [82.0, 91.94], [93.0, 94.53], [95.0, 95.47], [100.0, 102.64], [113.0, 114.49], [116.0, 119.25], [120.0, 120.48], [121.0, 126.66], [127.0, 129.14], [130.0, 136.61], [138.0, 139.04], [140.0, 140.09], [142.0, 143.13], [145.0, 146.21], [147.0, 147.61], [151.0, 152.04]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 44.46, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.24, 0.0, 0.0, 48.95, 0.0, 0.0, 60.05, 0.0, 72.01, 0.0, 83.16, 99.26, 99.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["theremin", 31.33], ["speech", 14.69], ["music", 14.21]], null, null, null, null, null, null, null, null, [["music", 48.62], ["speech", 17.93], ["hum", 11.06]], null, null, [["speech", 43.62], ["music", 20.59], ["insect", 3.75]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.92, 2.14, 1.08, 1.8, 1.03, 1.56, 0.2, 1.41, 1.61, 0.11, 18.41, 1.18, 1.64, 9.94, 1.53, 0.47, 2.64, 1.49, 3.25, 0.48, 5.66, 2.14, 6.61, 1.04, 0.09, 1.13, 1.21, 0.61, 1.04]} \ No newline at end of file diff --git a/annotations_1/woSj0M9Decw_filtered.json b/annotations_1/woSj0M9Decw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1934d05aa37088690737fb047b33095834ebffb --- /dev/null +++ b/annotations_1/woSj0M9Decw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.67], [15.0, 17.74], [20.0, 30.69], [32.0, 40.59], [42.0, 42.01], [42.0, 48.42], [54.0, 55.53], [57.0, 57.72], [59.0, 59.22], [64.0, 64.5], [69.0, 69.01], [71.0, 89.38], [91.0, 101.83], [104.0, 106.2]], "keep_status": [false, true, true, true, false, true, false, false, false, false, false, false, false, true], "silence_prob": [29.61, 32.32, 30.27, 30.65, 0.0, 29.66, 0.0, 0.0, 0.0, 0.0, 0.0, 30.14, 30.65, 30.07], "audiomae_on_audioset": [[["music", 47.41], ["didgeridoo", 24.42], ["whale vocalization", 7.24]], [["music", 25.11], ["throbbing", 17.58], ["livestock, farm animals, working animals", 13.55]], [["music", 54.81], ["musical instrument", 5.52], ["speech", 4.62]], [["livestock, farm animals, working animals", 31.93], ["cattle, bovinae", 19.66], ["music", 15.58]], null, [["moo", 19.11], ["cattle, bovinae", 19.09], ["speech", 15.94]], null, null, null, null, null, [["theremin", 38.39], ["music", 38.17], ["synthesizer", 4.33]], [["music", 63.87], ["synthesizer", 16.02], ["theremin", 3.6]], [["speech", 29.15], ["sidetone", 10.17], ["music", 10.07]]], "duration": [7.67, 2.74, 10.69, 8.59, 0.01, 6.42, 1.53, 0.72, 0.22, 0.5, 0.01, 18.38, 10.83, 2.2]} \ No newline at end of file diff --git a/annotations_1/wpQ4R1jlFHs_filtered.json b/annotations_1/wpQ4R1jlFHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1bc67522bfbf640a6e092ea1557875b73191b07c --- /dev/null +++ b/annotations_1/wpQ4R1jlFHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[19.0, 20.09], [21.0, 21.91], [23.0, 23.6], [26.0, 31.75], [33.0, 33.56], [35.0, 38.2], [39.0, 41.28], [43.0, 43.09], [44.0, 46.25], [47.0, 49.69], [52.0, 53.59], [59.0, 59.39], [65.0, 67.31], [68.0, 68.62], [72.0, 72.05], [80.0, 80.05], [82.0, 81.87], [84.0, 87.25], [94.0, 94.69], [102.0, 102.3], [104.0, 104.4], [106.0, 106.79], [110.0, 110.54], [111.0, 112.24], [114.0, 116.09], [120.0, 120.5], [122.0, 122.79], [123.0, 123.85], [133.0, 134.33], [137.0, 137.3], [140.0, 141.18], [144.0, 144.34], [146.0, 146.74], [148.0, 148.05]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 39.82, 0.0, 99.52, 65.79, 0.0, 40.68, 30.11, 0.0, 0.0, 51.5, 0.0, 0.0, 0.0, 0.0, 43.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 74.49], ["telephone", 8.42], ["dial tone", 8.3]], null, null, null, null, [["speech", 52.59], ["sidetone", 23.0], ["busy signal", 5.5]], [["speech", 36.98], ["music", 14.06], ["smash, crash", 6.22]], null, null, null, null, null, null, null, [["speech", 40.01], ["fart", 5.35], ["bee, wasp, etc.", 2.98]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.09, 0.91, 0.6, 5.75, 0.56, 3.2, 2.28, 0.09, 2.25, 2.69, 1.59, 0.39, 2.31, 0.62, 0.05, 0.05, -0.13, 3.25, 0.69, 0.3, 0.4, 0.79, 0.54, 1.24, 2.09, 0.5, 0.79, 0.85, 1.33, 0.3, 1.18, 0.34, 0.74, 0.05]} \ No newline at end of file diff --git a/annotations_1/wpci2WuWy4E_filtered.json b/annotations_1/wpci2WuWy4E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22eee6e6d91c2de7d61c17ca85d08faaad3389f4 --- /dev/null +++ b/annotations_1/wpci2WuWy4E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 10.27], [12.0, 14.52], [17.0, 17.24], [18.0, 19.35], [23.0, 24.68], [26.0, 26.72], [30.0, 29.66], [31.0, 31.73], [32.0, 33.44], [34.0, 64.29], [64.0, 78.87], [81.0, 81.68], [82.0, 105.29], [111.0, 115.52], [116.0, 121.56], [123.0, 127.58], [128.0, 128.85], [131.0, 136.8], [141.0, 141.51], [142.0, 143.7], [144.0, 153.05], [154.0, 155.46], [159.0, 159.29], [161.0, 161.33], [164.0, 163.95], [165.0, 168.15], [172.0, 173.33], [175.0, 175.88], [176.0, 190.51], [193.0, 195.86], [199.0, 220.35], [223.0, 224.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, true, true, false, false], "silence_prob": [34.52, 62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.11, 0.0, 30.9, 30.25, 31.33, 30.72, 0.0, 29.8, 0.0, 0.0, 29.35, 0.0, 0.0, 0.0, 0.0, 30.43, 0.0, 0.0, 29.98, 39.37, 63.64, 0.0], "audiomae_on_audioset": [[["mains hum", 34.62], ["hum", 34.53], ["sidetone", 6.51]], null, null, null, null, null, null, null, null, null, [["music", 85.86], ["hum", 4.32], ["throbbing", 2.03]], null, [["music", 63.02], ["throbbing", 4.1], ["hum", 3.68]], [["music", 71.04], ["didgeridoo", 13.53], ["musical instrument", 2.67]], [["music", 75.94], ["synthesizer", 5.02], ["musical instrument", 2.99]], [["music", 51.16], ["didgeridoo", 14.48], ["speech", 9.1]], null, [["music", 24.89], ["noise", 24.51], ["mains hum", 7.17]], null, null, [["music", 47.24], ["hum", 9.69], ["throbbing", 7.97]], null, null, null, null, [["music", 30.14], ["hum", 12.07], ["throbbing", 8.22]], null, null, [["speech", 28.97], ["music", 9.69], ["hum", 7.84]], [["frog", 9.48], ["whale vocalization", 5.62], ["music", 4.88]], null, null], "duration": [7.27, 2.52, 0.24, 1.35, 1.68, 0.72, -0.34, 0.73, 1.44, 30.29, 14.87, 0.68, 23.29, 4.52, 5.56, 4.58, 0.85, 5.8, 0.51, 1.7, 9.05, 1.46, 0.29, 0.33, -0.05, 3.15, 1.33, 0.88, 14.51, 2.86, 21.35, 1.04]} \ No newline at end of file diff --git a/annotations_1/wpxS1xSxUDY_filtered.json b/annotations_1/wpxS1xSxUDY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0aaa3ceaa206839d422716c4dffda5d03c6ba728 --- /dev/null +++ b/annotations_1/wpxS1xSxUDY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.73], [3.0, 3.75], [8.0, 11.23], [13.0, 14.5], [16.0, 17.2], [18.0, 18.87], [21.0, 21.98], [24.0, 24.93], [26.0, 26.42], [30.0, 29.74], [31.0, 32.36], [34.0, 83.49], [86.0, 86.34], [93.0, 94.64], [96.0, 97.9], [98.0, 99.96], [102.0, 102.88], [106.0, 106.84], [109.0, 109.19], [113.0, 114.0], [119.0, 120.8], [123.0, 124.17], [126.0, 127.2], [128.0, 129.25], [131.0, 132.04], [134.0, 154.57], [161.0, 161.15], [161.0, 164.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 99.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.73, 0.0, 41.01], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 39.62], ["mains hum", 21.05], ["throbbing", 10.62]], null, [["music", 60.93], ["electronic music", 3.26], ["synthesizer", 3.05]]], "duration": [0.73, 0.75, 3.23, 1.5, 1.2, 0.87, 0.98, 0.93, 0.42, -0.26, 1.36, 49.49, 0.34, 1.64, 1.9, 1.96, 0.88, 0.84, 0.19, 1.0, 1.8, 1.17, 1.2, 1.25, 1.04, 20.57, 0.15, 3.94]} \ No newline at end of file diff --git a/annotations_1/wr5-v7rYg70_filtered.json b/annotations_1/wr5-v7rYg70_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c691428761c724f3eabdeaed7776db6fa85193ba --- /dev/null +++ b/annotations_1/wr5-v7rYg70_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.99], [12.0, 13.22], [29.0, 30.0], [32.0, 32.54], [41.0, 41.54], [58.0, 58.36], [60.0, 70.5], [97.0, 97.73], [102.0, 104.28], [116.0, 116.26], [117.0, 119.45], [120.0, 121.39], [122.0, 126.0], [127.0, 130.42], [131.0, 132.14], [133.0, 134.01]], "keep_status": [true, false, false, false, false, false, true, false, false, false, true, false, false, true, false, false], "silence_prob": [42.67, 0.0, 0.0, 0.0, 0.0, 0.0, 32.29, 0.0, 31.24, 0.0, 40.62, 0.0, 100.0, 38.23, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.73], ["guitar", 14.82], ["musical instrument", 12.39]], null, null, null, null, null, [["music", 40.22], ["wind instrument, woodwind instrument", 13.27], ["musical instrument", 6.13]], null, [["music", 71.65], ["speech", 9.41], ["boing", 1.91]], null, [["speech", 38.55], ["knock", 9.26], ["whack, thwack", 7.25]], null, null, [["speech", 23.27], ["moo", 18.18], ["cattle, bovinae", 15.99]], null, null], "duration": [2.99, 1.22, 1.0, 0.54, 0.54, 0.36, 10.5, 0.73, 2.28, 0.26, 2.45, 1.39, 4.0, 3.42, 1.14, 1.01]} \ No newline at end of file diff --git a/annotations_1/wsFQrTAEs7A_filtered.json b/annotations_1/wsFQrTAEs7A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dbad93da0efb0214529c3bb09aec8a9d0419245 --- /dev/null +++ b/annotations_1/wsFQrTAEs7A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.88], [19.0, 20.01], [21.0, 22.57], [23.0, 24.06], [25.0, 28.88], [35.0, 35.33], [51.0, 54.35], [71.0, 75.1], [85.0, 89.99], [93.0, 101.8], [109.0, 108.89], [114.0, 114.83], [117.0, 117.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.82, 0.0, 0.0, 0.0, 41.05, 0.0, 33.3, 32.0, 32.33, 33.12, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 61.54], ["musical instrument", 11.42], ["brass instrument", 5.5]], null, null, null, [["music", 54.73], ["musical instrument", 14.65], ["speech", 5.08]], null, [["music", 59.21], ["speech", 9.53], ["didgeridoo", 3.3]], [["music", 53.02], ["theremin", 13.48], ["didgeridoo", 8.98]], [["music", 79.74], ["musical instrument", 5.21], ["synthesizer", 2.4]], [["theremin", 53.78], ["music", 41.66], ["musical instrument", 1.0]], null, null, null], "duration": [2.88, 1.01, 1.57, 1.06, 3.88, 0.33, 3.35, 4.1, 4.99, 8.8, -0.11, 0.83, 0.53]} \ No newline at end of file diff --git a/annotations_1/wsooQlbj934_filtered.json b/annotations_1/wsooQlbj934_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7fb0bed956a3c5065ad665cd849f1911dbdb769f --- /dev/null +++ b/annotations_1/wsooQlbj934_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 18.28], [19.0, 33.88], [41.0, 63.07], [64.0, 76.03], [78.0, 79.73], [82.0, 91.86], [94.0, 94.47], [96.0, 96.7], [99.0, 100.18], [101.0, 102.25], [104.0, 105.66], [109.0, 113.68], [118.0, 127.94], [129.0, 131.4], [134.0, 142.6], [144.0, 144.64], [145.0, 155.14], [156.0, 157.37], [160.0, 162.18], [163.0, 163.76], [165.0, 170.41], [171.0, 174.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, true, false, true, false, true, true], "silence_prob": [29.84, 58.72, 40.04, 34.49, 0.0, 34.22, 0.0, 0.0, 0.0, 0.0, 0.0, 41.24, 31.79, 33.8, 37.28, 0.0, 36.9, 0.0, 41.32, 0.0, 39.33, 44.75], "audiomae_on_audioset": [[["hum", 33.68], ["music", 30.13], ["mains hum", 11.54]], null, [["hum", 50.93], ["mains hum", 24.82], ["throbbing", 8.56]], [["speech", 48.87], ["noise", 13.31], ["whack, thwack", 8.59]], null, [["hum", 50.05], ["mains hum", 23.39], ["buzz", 6.36]], null, null, null, null, null, [["speech", 37.21], ["whale vocalization", 31.2], ["sidetone", 6.48]], [["explosion", 22.2], ["speech", 15.55], ["burst, pop", 10.9]], [["whale vocalization", 44.81], ["livestock, farm animals, working animals", 9.23], ["cattle, bovinae", 6.5]], [["quack", 13.25], ["rumble", 13.08], ["duck", 11.7]], null, [["sidetone", 32.01], ["speech", 29.59], ["throbbing", 4.99]], null, [["whale vocalization", 11.87], ["hum", 11.1], ["rumble", 9.45]], null, [["speech", 30.73], ["hum", 17.59], ["music", 11.31]], [["gong", 26.56], ["music", 15.01], ["sonar", 7.22]]], "duration": [13.28, 14.88, 22.07, 12.03, 1.73, 9.86, 0.47, 0.7, 1.18, 1.25, 1.66, 4.68, 9.94, 2.4, 8.6, 0.64, 10.14, 1.37, 2.18, 0.76, 5.41, 3.88]} \ No newline at end of file diff --git a/annotations_1/wt0klpk3tBA_filtered.json b/annotations_1/wt0klpk3tBA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a0477a58b77df3b653185dcf6707ab1b18a8b2ff --- /dev/null +++ b/annotations_1/wt0klpk3tBA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.01], [10.0, 10.25], [14.0, 14.88], [16.0, 16.98], [23.0, 24.38], [27.0, 29.84], [31.0, 43.61], [44.0, 43.7], [48.0, 60.47], [62.0, 64.05], [66.0, 66.68], [73.0, 73.35], [76.0, 76.35], [78.0, 78.8], [81.0, 83.29], [84.0, 84.7], [85.0, 89.06], [100.0, 104.62], [106.0, 113.32], [114.0, 125.79], [128.0, 128.63], [130.0, 130.5], [132.0, 134.47], [141.0, 143.78], [145.0, 148.27], [149.0, 148.95], [149.0, 156.81], [162.0, 162.95], [164.0, 165.32], [166.0, 168.15], [170.0, 170.34], [171.0, 175.86], [177.0, 178.51], [181.0, 181.89], [183.0, 183.83], [187.0, 193.83], [194.0, 199.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 32.14, 38.19, 0.0, 91.47, 78.21, 0.0, 0.0, 0.0, 0.0, 96.04, 0.0, 93.91, 40.07, 32.44, 30.97, 0.0, 0.0, 61.97, 66.03, 90.6, 0.0, 93.91, 0.0, 0.0, 96.42, 0.0, 99.26, 0.0, 0.0, 0.0, 95.78, 94.22], "audiomae_on_audioset": [null, null, null, null, null, [["hum", 44.0], ["throbbing", 19.18], ["mains hum", 17.4]], [["music", 39.52], ["speech", 27.65], ["electronic music", 4.93]], null, null, null, null, null, null, null, null, null, null, [["speech", 17.93], ["hum", 13.42], ["music", 7.53]], [["hum", 59.3], ["mains hum", 16.16], ["throbbing", 15.83]], [["speech", 26.34], ["livestock, farm animals, working animals", 19.22], ["cattle, bovinae", 8.76]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 0.25, 0.88, 0.98, 1.38, 2.84, 12.61, -0.3, 12.47, 2.05, 0.68, 0.35, 0.35, 0.8, 2.29, 0.7, 4.06, 4.62, 7.32, 11.79, 0.63, 0.5, 2.47, 2.78, 3.27, -0.05, 7.81, 0.95, 1.32, 2.15, 0.34, 4.86, 1.51, 0.89, 0.83, 6.83, 5.61]} \ No newline at end of file diff --git a/annotations_1/wuzbUsy6snc_filtered.json b/annotations_1/wuzbUsy6snc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f616fc37e443f9f67bde32d0872f62ee48c306e8 --- /dev/null +++ b/annotations_1/wuzbUsy6snc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.69], [16.0, 16.12], [18.0, 19.99], [21.0, 22.3], [23.0, 23.16], [25.0, 25.69], [27.0, 28.16], [29.0, 31.95], [38.0, 39.09], [42.0, 43.73], [50.0, 56.84], [61.0, 61.6], [65.0, 86.27], [92.0, 94.88], [96.0, 96.11], [96.0, 105.98]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.48, 0.0, 0.0, 29.75, 0.0, 31.89, 30.17, 0.0, 30.48], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 55.14], ["musical instrument", 6.73], ["guitar", 5.26]], null, null, [["music", 71.85], ["yodeling", 3.43], ["swing music", 2.13]], null, [["music", 53.34], ["synthesizer", 8.18], ["siren", 6.27]], [["music", 60.8], ["synthetic singing", 5.53], ["saxophone", 4.35]], null, [["music", 60.38], ["swing music", 8.76], ["harmonica", 3.17]]], "duration": [0.69, 0.12, 1.99, 1.3, 0.16, 0.69, 1.16, 2.95, 1.09, 1.73, 6.84, 0.6, 21.27, 2.88, 0.11, 9.98]} \ No newline at end of file diff --git a/annotations_1/wwnqJH8OF-I_filtered.json b/annotations_1/wwnqJH8OF-I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bcd83984d9216201420f21800fd76d6c5b69ade1 --- /dev/null +++ b/annotations_1/wwnqJH8OF-I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.33], [12.0, 11.87], [12.0, 11.99], [18.0, 18.39], [19.0, 20.39], [28.0, 30.37], [47.0, 47.76], [53.0, 53.27], [56.0, 57.05], [60.0, 60.05], [61.0, 61.47], [66.0, 70.07], [72.0, 81.85], [83.0, 87.59], [92.0, 92.77], [96.0, 98.12], [102.0, 102.73], [107.0, 107.67], [108.0, 108.51], [116.0, 115.6], [119.0, 122.23], [123.0, 123.42], [130.0, 132.53], [145.0, 145.07], [147.0, 150.62], [157.0, 157.84], [158.0, 158.87]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.8, 0.0, 0.0, 0.0, 0.0, 0.0, 58.13, 87.55, 41.6, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 48.56, 0.0, 40.28, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 58.64], ["groan", 5.8], ["music", 4.3]], null, null, null, null, null, null, null, [["music", 40.04], ["whack, thwack", 6.12], ["fart", 5.92]], null, null, null, null, null, null, [["speech", 48.63], ["ding-dong", 22.55], ["music", 11.79]], null, [["moo", 32.69], ["cattle, bovinae", 30.33], ["livestock, farm animals, working animals", 7.91]], null, null, null, null], "duration": [0.33, -0.13, -0.01, 0.39, 1.39, 2.37, 0.76, 0.27, 1.05, 0.05, 0.47, 4.07, 9.85, 4.59, 0.77, 2.12, 0.73, 0.67, 0.51, -0.4, 3.23, 0.42, 2.53, 0.07, 3.62, 0.84, 0.87]} \ No newline at end of file diff --git a/annotations_1/wx-HWqbwssg_filtered.json b/annotations_1/wx-HWqbwssg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..efaeedb0ec42b7a3480a591a752c815ec958c332 --- /dev/null +++ b/annotations_1/wx-HWqbwssg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.83], [5.0, 6.64], [9.0, 10.59], [11.0, 11.84], [13.0, 14.32], [16.0, 17.22], [20.0, 20.55], [27.0, 31.09], [40.0, 42.47], [46.0, 47.9], [49.0, 50.97], [56.0, 56.42], [60.0, 60.03], [62.0, 62.23], [64.0, 65.65], [68.0, 69.69], [71.0, 71.68], [76.0, 76.42], [77.0, 77.68], [79.0, 80.1], [83.0, 84.72], [85.0, 87.98], [91.0, 91.62], [93.0, 93.95], [97.0, 97.02], [98.0, 99.33], [106.0, 107.1], [108.0, 111.37], [123.0, 126.59], [133.0, 133.34], [134.0, 134.3]], "keep_status": [false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.29, 47.01, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.25, 0.0, 0.0, 0.0, 0.0, 0.0, 33.65, 33.78, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 27.8], ["speech", 14.58], ["hum", 12.68]], [["hum", 31.8], ["mains hum", 11.63], ["dial tone", 9.8]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 27.9], ["mains hum", 11.18], ["hum", 7.91]], null, null, null, null, null, [["music", 47.0], ["hum", 11.61], ["sine wave", 7.32]], [["speech", 23.01], ["chirp tone", 18.7], ["sine wave", 15.09]], null, null], "duration": [1.83, 1.64, 1.59, 0.84, 1.32, 1.22, 0.55, 4.09, 2.47, 1.9, 1.97, 0.42, 0.03, 0.23, 1.65, 1.69, 0.68, 0.42, 0.68, 1.1, 1.72, 2.98, 0.62, 0.95, 0.02, 1.33, 1.1, 3.37, 3.59, 0.34, 0.3]} \ No newline at end of file diff --git a/annotations_1/wxV84RoUr_U_filtered.json b/annotations_1/wxV84RoUr_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..23bf4178cc091200984672566f2acd2529bce478 --- /dev/null +++ b/annotations_1/wxV84RoUr_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.21], [8.0, 8.24], [8.0, 16.23], [22.0, 22.67], [28.0, 29.12], [29.0, 37.42], [39.0, 39.16], [40.0, 45.45], [47.0, 47.14], [51.0, 51.76], [56.0, 56.62], [59.0, 60.3], [62.0, 63.78], [67.0, 68.05], [74.0, 75.22], [77.0, 77.75], [80.0, 80.37], [83.0, 84.2]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.08, 0.0, 30.02, 0.0, 0.0, 32.83, 0.0, 32.65, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 55.29], ["hum", 15.34], ["didgeridoo", 7.46]], null, [["music", 53.51], ["didgeridoo", 14.61], ["hum", 8.72]], null, null, [["music", 68.8], ["hum", 8.39], ["throbbing", 7.77]], null, [["music", 38.71], ["throbbing", 14.15], ["speech", 13.07]], null, null, null, null, null, null, null, null, null, null], "duration": [6.21, 0.24, 8.23, 0.67, 1.12, 8.42, 0.16, 5.45, 0.14, 0.76, 0.62, 1.3, 1.78, 1.05, 1.22, 0.75, 0.37, 1.2]} \ No newline at end of file diff --git a/annotations_1/wxhUTK7xbz8_filtered.json b/annotations_1/wxhUTK7xbz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1a0037de620226e9a99d7d1bab9d07706049422 --- /dev/null +++ b/annotations_1/wxhUTK7xbz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 23.77], [24.0, 25.14], [26.0, 26.18], [28.0, 29.05], [30.0, 31.41], [32.0, 33.42], [34.0, 35.48], [37.0, 37.79], [42.0, 42.84], [44.0, 44.46], [47.0, 47.76], [49.0, 50.41], [52.0, 54.53], [56.0, 59.41], [61.0, 63.27], [65.0, 66.28], [67.0, 69.08], [70.0, 71.19], [73.0, 74.51], [75.0, 76.99], [77.0, 78.75], [80.0, 82.34], [83.0, 87.13], [89.0, 90.81], [92.0, 92.58], [94.0, 93.82], [97.0, 98.34], [104.0, 108.33], [109.0, 111.05], [112.0, 112.45], [114.0, 114.54], [119.0, 121.09], [124.0, 124.77], [126.0, 127.99], [132.0, 136.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [92.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.8, 100.0, 87.37, 0.0, 74.13, 0.0, 0.0, 0.0, 0.0, 99.21, 95.91, 0.0, 0.0, 0.0, 0.0, 96.89, 79.24, 0.0, 0.0, 83.52, 0.0, 0.0, 97.43], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.77, 1.14, 0.18, 1.05, 1.41, 1.42, 1.48, 0.79, 0.84, 0.46, 0.76, 1.41, 2.53, 3.41, 2.27, 1.28, 2.08, 1.19, 1.51, 1.99, 1.75, 2.34, 4.13, 1.81, 0.58, -0.18, 1.34, 4.33, 2.05, 0.45, 0.54, 2.09, 0.77, 1.99, 4.7]} \ No newline at end of file diff --git a/annotations_1/wxlD2wwIgVk_filtered.json b/annotations_1/wxlD2wwIgVk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/wxlD2wwIgVk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/wyHOKleZzFM_filtered.json b/annotations_1/wyHOKleZzFM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..28ffa8d45f08a613b5beef5b353011f3342254c2 --- /dev/null +++ b/annotations_1/wyHOKleZzFM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 12.75], [13.0, 33.49], [34.0, 34.3], [34.0, 44.86], [47.0, 48.83], [54.0, 56.19], [57.0, 56.74], [57.0, 56.86], [57.0, 56.89], [57.0, 58.95], [62.0, 67.46], [68.0, 73.79], [75.0, 75.46], [76.0, 76.94], [78.0, 89.68], [108.0, 114.83], [118.0, 119.28], [120.0, 129.46], [130.0, 133.14]], "keep_status": [false, false, false, true, false, true, false, false, false, false, false, false, false, false, true, true, false, true, false], "silence_prob": [0.0, 42.98, 0.0, 45.36, 0.0, 39.3, 0.0, 0.0, 0.0, 0.0, 42.08, 29.42, 0.0, 0.0, 33.24, 36.52, 0.0, 28.63, 28.76], "audiomae_on_audioset": [null, [["sidetone", 53.03], ["speech", 25.88], ["noise", 5.88]], null, [["speech", 45.22], ["rumble", 4.9], ["whale vocalization", 4.03]], null, [["speech", 34.12], ["cattle, bovinae", 10.63], ["moo", 6.33]], null, null, null, null, [["throbbing", 31.64], ["speech", 26.77], ["hum", 18.5]], [["speech", 45.2], ["explosion", 17.27], ["vehicle", 7.94]], null, null, [["speech", 44.55], ["sidetone", 7.51], ["fly, housefly", 5.25]], [["speech", 40.57], ["fart", 13.61], ["animal", 6.8]], null, [["speech", 17.79], ["outside, rural or natural", 11.66], ["groan", 7.27]], [["whale vocalization", 93.8], ["cattle, bovinae", 1.55], ["livestock, farm animals, working animals", 0.73]]], "duration": [-0.25, 20.49, 0.3, 10.86, 1.83, 2.19, -0.26, -0.14, -0.11, 1.95, 5.46, 5.79, 0.46, 0.94, 11.68, 6.83, 1.28, 9.46, 3.14]} \ No newline at end of file diff --git a/annotations_1/wyQmO-LFF4M_filtered.json b/annotations_1/wyQmO-LFF4M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4ca157425898c347b1b5cae4f33eec8b47d2c24f --- /dev/null +++ b/annotations_1/wyQmO-LFF4M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.86], [6.0, 7.57], [9.0, 10.25], [13.0, 14.03], [15.0, 24.56], [28.0, 29.37], [31.0, 33.49], [35.0, 36.76], [37.0, 38.28], [41.0, 47.36], [48.0, 50.9], [51.0, 54.04], [55.0, 58.51], [60.0, 68.82], [69.0, 71.34], [72.0, 75.76], [78.0, 81.09], [82.0, 83.93], [85.0, 86.43], [89.0, 92.97], [96.0, 121.76], [122.0, 128.48], [132.0, 156.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 97.11, 0.0, 100.0, 0.0, 0.0, 98.66, 100.0, 71.43, 100.0, 99.98, 99.21, 100.0, 99.93, 0.0, 0.0, 52.33, 100.0, 86.27, 99.99], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.86, 1.57, 1.25, 1.03, 9.56, 1.37, 2.49, 1.76, 1.28, 6.36, 2.9, 3.04, 3.51, 8.82, 2.34, 3.76, 3.09, 1.93, 1.43, 3.97, 25.76, 6.48, 24.78]} \ No newline at end of file diff --git a/annotations_1/wySz6ysIDhs_filtered.json b/annotations_1/wySz6ysIDhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..524401c4a0c00238a0b5f3469d05e45352202cc1 --- /dev/null +++ b/annotations_1/wySz6ysIDhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.0], [4.0, 4.75], [6.0, 6.72], [8.0, 9.31], [13.0, 13.54], [14.0, 14.47], [16.0, 15.84], [17.0, 17.41], [19.0, 19.06], [20.0, 20.76], [21.0, 21.56], [23.0, 23.85], [26.0, 26.01], [26.0, 26.69], [30.0, 30.74], [37.0, 37.05], [42.0, 42.3], [45.0, 44.73], [47.0, 47.6], [49.0, 50.13], [52.0, 52.34], [54.0, 54.35], [55.0, 55.7], [57.0, 63.59], [65.0, 66.39], [67.0, 73.74], [74.0, 74.83], [76.0, 76.59], [78.0, 78.6], [79.0, 81.33], [82.0, 82.49], [84.0, 84.32], [85.0, 88.53], [89.0, 89.72], [90.0, 90.9], [92.0, 92.33], [95.0, 95.28], [96.0, 97.8], [98.0, 98.78], [101.0, 101.34], [102.0, 101.85], [102.0, 103.22], [105.0, 106.1], [108.0, 108.23], [109.0, 110.0], [112.0, 112.7], [113.0, 113.98], [115.0, 115.11], [118.0, 118.67], [120.0, 120.45], [121.0, 122.32], [123.0, 124.07], [126.0, 126.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.82, 0.0, 37.0, 0.0, 0.0, 0.0, 65.44, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 71.64], ["music", 4.14], ["thunk", 3.51]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.0, 0.75, 0.72, 1.31, 0.54, 0.47, -0.16, 0.41, 0.06, 0.76, 0.56, 0.85, 0.01, 0.69, 0.74, 0.05, 0.3, -0.27, 0.6, 1.13, 0.34, 0.35, 0.7, 6.59, 1.39, 6.74, 0.83, 0.59, 0.6, 2.33, 0.49, 0.32, 3.53, 0.72, 0.9, 0.33, 0.28, 1.8, 0.78, 0.34, -0.15, 1.22, 1.1, 0.23, 1.0, 0.7, 0.98, 0.11, 0.67, 0.45, 1.32, 1.07, 0.69]} \ No newline at end of file diff --git a/annotations_1/wyifbBO6sAY_filtered.json b/annotations_1/wyifbBO6sAY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..21088980a63ad2831985483d9aa25204be3da01d --- /dev/null +++ b/annotations_1/wyifbBO6sAY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.37], [11.0, 12.29], [17.0, 35.78], [38.0, 67.44], [69.0, 68.94], [69.0, 72.4], [80.0, 91.64], [94.0, 96.9], [97.0, 107.4], [109.0, 117.68], [119.0, 125.54], [131.0, 131.62], [136.0, 136.61], [140.0, 140.85], [142.0, 149.39], [151.0, 152.9], [155.0, 156.17], [157.0, 157.35], [158.0, 164.03], [168.0, 169.74], [170.0, 176.64]], "keep_status": [false, false, false, true, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [85.9, 0.0, 74.6, 36.84, 0.0, 34.04, 37.58, 37.69, 40.47, 33.55, 34.29, 0.0, 0.0, 0.0, 53.97, 0.0, 0.0, 0.0, 71.72, 0.0, 50.97], "audiomae_on_audioset": [null, null, null, [["music", 47.2], ["musical instrument", 11.42], ["guitar", 6.4]], null, [["aircraft", 7.86], ["hum", 7.76], ["mains hum", 6.58]], [["speech", 40.26], ["music", 19.12], ["hum", 8.41]], [["music", 70.22], ["ambient music", 6.89], ["throbbing", 2.83]], [["speech", 42.11], ["music", 17.51], ["hum", 10.64]], [["speech", 46.06], ["music", 19.56], ["musical instrument", 5.5]], [["music", 57.57], ["speech", 21.42], ["hum", 6.18]], null, null, null, null, null, null, null, null, null, null], "duration": [2.37, 1.29, 18.78, 29.44, -0.06, 3.4, 11.64, 2.9, 10.4, 8.68, 6.54, 0.62, 0.61, 0.85, 7.39, 1.9, 1.17, 0.35, 6.03, 1.74, 6.64]} \ No newline at end of file diff --git a/annotations_1/wytpJXfw86w_filtered.json b/annotations_1/wytpJXfw86w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..acc13140513018046d1dace69e81e8276462ff06 --- /dev/null +++ b/annotations_1/wytpJXfw86w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.29], [8.0, 20.02], [24.0, 58.73], [66.0, 65.94], [67.0, 83.13], [84.0, 105.49], [107.0, 118.89], [119.0, 120.33], [121.0, 125.0], [125.0, 145.44], [147.0, 150.47], [152.0, 162.85], [163.0, 165.23], [167.0, 168.89], [169.0, 175.15]], "keep_status": [false, true, false, false, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 29.37, 0.0, 0.0, 46.05, 65.79, 59.42, 0.0, 47.86, 60.79, 73.21, 64.75, 50.21, 0.0, 44.49], "audiomae_on_audioset": [null, [["music", 49.58], ["thump, thud", 5.84], ["hum", 5.38]], null, null, [["hum", 37.45], ["mains hum", 22.54], ["throbbing", 11.75]], null, null, null, [["music", 27.8], ["speech", 17.55], ["hum", 7.3]], null, null, null, null, null, [["music", 20.21], ["speech", 12.52], ["cattle, bovinae", 8.45]]], "duration": [0.29, 12.02, 34.73, -0.06, 16.13, 21.49, 11.89, 1.33, 4.0, 20.44, 3.47, 10.85, 2.23, 1.89, 6.15]} \ No newline at end of file diff --git a/annotations_1/wzZ3S0ZC1Is_filtered.json b/annotations_1/wzZ3S0ZC1Is_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..78ca59ae3ab8cdaa4fdb75593ad561360dc221b3 --- /dev/null +++ b/annotations_1/wzZ3S0ZC1Is_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.13], [3.0, 11.42], [12.0, 12.83], [14.0, 17.34], [20.0, 20.93], [29.0, 34.48], [36.0, 37.44], [39.0, 44.42], [46.0, 47.21], [48.0, 49.49], [50.0, 51.0], [51.0, 51.65], [52.0, 53.42], [56.0, 60.0], [64.0, 64.32], [64.0, 64.35], [67.0, 76.42], [83.0, 88.5], [91.0, 94.42], [100.0, 100.48], [101.0, 101.17], [103.0, 109.41], [110.0, 110.67], [113.0, 113.85], [116.0, 121.66], [122.0, 122.98], [124.0, 124.21], [125.0, 125.2], [127.0, 131.57], [133.0, 138.38], [140.0, 144.83], [153.0, 154.28], [157.0, 156.91], [158.0, 159.81], [161.0, 161.45]], "keep_status": [false, false, false, true, false, true, false, true, false, false, false, false, false, true, false, false, false, true, true, false, false, true, false, false, true, false, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 33.17, 0.0, 34.67, 0.0, 33.67, 0.0, 32.62, 0.0, 0.0, 0.0, 0.0, 0.0, 34.51, 0.0, 0.0, 32.63, 32.41, 32.79, 0.0, 0.0, 32.84, 0.0, 0.0, 32.98, 0.0, 0.0, 0.0, 31.76, 32.45, 33.21, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 55.31], ["musical instrument", 13.76], ["theremin", 3.01]], null, [["music", 29.17], ["trombone", 19.81], ["brass instrument", 16.52]], null, [["music", 43.74], ["musical instrument", 8.97], ["echo", 5.53]], null, [["music", 48.8], ["didgeridoo", 5.26], ["musical instrument", 4.69]], null, null, null, null, null, [["speech", 31.4], ["music", 23.18], ["trombone", 7.96]], null, null, [["music", 64.78], ["musical instrument", 6.2], ["trombone", 4.66]], [["music", 21.83], ["didgeridoo", 12.95], ["theremin", 11.51]], [["music", 44.22], ["musical instrument", 7.35], ["saxophone", 6.36]], null, null, [["music", 43.77], ["brass instrument", 15.83], ["musical instrument", 9.88]], null, null, [["music", 39.88], ["brass instrument", 9.77], ["trombone", 8.56]], null, null, null, [["music", 66.16], ["musical instrument", 6.85], ["brass instrument", 3.07]], [["music", 31.21], ["brass instrument", 14.45], ["trombone", 11.84]], [["music", 36.49], ["brass instrument", 18.68], ["musical instrument", 13.08]], null, null, null, null], "duration": [1.13, 8.42, 0.83, 3.34, 0.93, 5.48, 1.44, 5.42, 1.21, 1.49, 1.0, 0.65, 1.42, 4.0, 0.32, 0.35, 9.42, 5.5, 3.42, 0.48, 0.17, 6.41, 0.67, 0.85, 5.66, 0.98, 0.21, 0.2, 4.57, 5.38, 4.83, 1.28, -0.09, 1.81, 0.45]} \ No newline at end of file diff --git a/annotations_1/x-_17t-v9dA_filtered.json b/annotations_1/x-_17t-v9dA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbefb2e3cc47dc88d09229408d7b5ffe1498e49e --- /dev/null +++ b/annotations_1/x-_17t-v9dA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 17.93], [24.0, 24.33], [25.0, 25.57], [26.0, 26.6], [47.0, 47.41], [111.0, 111.16], [122.0, 121.63], [122.0, 122.4], [132.0, 132.16]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.93, 0.33, 0.57, 0.6, 0.41, 0.16, -0.37, 0.4, 0.16]} \ No newline at end of file diff --git a/annotations_1/x1FhrhoudSE_filtered.json b/annotations_1/x1FhrhoudSE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df345045ff9c37976b2dcafba76ec7bd97513678 --- /dev/null +++ b/annotations_1/x1FhrhoudSE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 17.81], [19.0, 19.09], [24.0, 26.03], [30.0, 30.43], [32.0, 32.14], [33.0, 33.86], [38.0, 38.38], [41.0, 45.15], [48.0, 48.95], [53.0, 53.54], [59.0, 60.57], [65.0, 65.45], [70.0, 70.23], [71.0, 71.66], [74.0, 75.02], [82.0, 81.99], [84.0, 83.88], [89.0, 91.74], [93.0, 93.77], [95.0, 95.81], [97.0, 96.9], [107.0, 107.3], [115.0, 116.51], [122.0, 122.74], [123.0, 123.23], [137.0, 138.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.99, 0.0, 99.26, 0.0, 0.0, 0.0, 0.0, 52.86, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [15.81, 0.09, 2.03, 0.43, 0.14, 0.86, 0.38, 4.15, 0.95, 0.54, 1.57, 0.45, 0.23, 0.66, 1.02, -0.01, -0.12, 2.74, 0.77, 0.81, -0.1, 0.3, 1.51, 0.74, 0.23, 1.52]} \ No newline at end of file diff --git a/annotations_1/x1YvX61qS0Q_filtered.json b/annotations_1/x1YvX61qS0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a42070edf50ef81d923d0a9e2e24037673806aee --- /dev/null +++ b/annotations_1/x1YvX61qS0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [2.0, 6.78], [9.0, 12.39], [15.0, 16.93], [18.0, 18.89], [21.0, 22.38], [24.0, 25.37], [26.0, 28.39], [33.0, 34.28], [35.0, 36.1], [37.0, 38.38], [39.0, 42.89], [43.0, 50.95], [51.0, 51.92], [52.0, 53.18], [58.0, 59.31], [61.0, 71.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 59.86, 58.81, 0.0, 0.0, 0.0, 0.0, 97.83, 0.0, 0.0, 0.0, 95.51, 55.67, 0.0, 0.0, 0.0, 37.47], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.39], ["frog", 8.97], ["fart", 5.64]]], "duration": [0.51, 4.78, 3.39, 1.93, 0.89, 1.38, 1.37, 2.39, 1.28, 1.1, 1.38, 3.89, 7.95, 0.92, 1.18, 1.31, 10.74]} \ No newline at end of file diff --git a/annotations_1/x24Olya2NLk_filtered.json b/annotations_1/x24Olya2NLk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..16de397fb42aaf0707aac76b1c283446a6880ea9 --- /dev/null +++ b/annotations_1/x24Olya2NLk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.26], [9.0, 9.66], [11.0, 12.39], [14.0, 35.63], [37.0, 37.15], [37.0, 41.22], [42.0, 41.57], [42.0, 63.1], [65.0, 72.57], [74.0, 74.55], [76.0, 192.87]], "keep_status": [false, false, false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 28.22, 0.0, 28.26, 0.0, 28.5, 28.55, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 61.84], ["musical instrument", 5.29], ["hum", 4.61]], null, [["music", 24.51], ["whack, thwack", 15.93], ["whip", 7.21]], null, [["music", 18.31], ["hum", 17.61], ["mains hum", 10.57]], [["music", 31.81], ["sound effect", 9.48], ["hum", 7.66]], null, null], "duration": [0.26, 0.66, 1.39, 21.63, 0.15, 4.22, -0.43, 21.1, 7.57, 0.55, 116.87]} \ No newline at end of file diff --git a/annotations_1/x2K8I28zejw_filtered.json b/annotations_1/x2K8I28zejw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..77997e5c7e2a264dc372c51f2e1c684008e7c947 --- /dev/null +++ b/annotations_1/x2K8I28zejw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.56], [12.0, 12.5], [14.0, 21.84], [24.0, 25.66], [30.0, 31.45], [33.0, 33.72], [35.0, 35.29], [37.0, 37.4], [39.0, 39.38], [44.0, 44.15], [45.0, 48.51], [59.0, 59.17], [60.0, 60.32], [62.0, 62.87], [64.0, 67.44], [67.0, 70.16], [74.0, 76.5], [101.0, 101.92], [112.0, 112.85], [123.0, 123.06], [124.0, 124.55], [140.0, 141.34], [154.0, 155.19], [164.0, 165.33], [166.0, 165.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.07, 0.0, 0.0, 0.0, 44.87, 50.66, 35.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 75.88], ["theremin", 3.56], ["throbbing", 2.85]], null, null, null, null, null, null, null, [["speech", 49.77], ["sidetone", 21.14], ["hum", 5.9]], null, null, null, [["music", 26.14], ["hum", 19.11], ["mains hum", 9.0]], null, [["speech", 51.59], ["mains hum", 7.29], ["buzz", 6.86]], null, null, null, null, null, null, null, null], "duration": [0.56, 0.5, 7.84, 1.66, 1.45, 0.72, 0.29, 0.4, 0.38, 0.15, 3.51, 0.17, 0.32, 0.87, 3.44, 3.16, 2.5, 0.92, 0.85, 0.06, 0.55, 1.34, 1.19, 1.33, -0.14]} \ No newline at end of file diff --git a/annotations_1/x2S78gnCkRg_filtered.json b/annotations_1/x2S78gnCkRg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..12d6293bf0aedd7b5b9c0879a14c7ff743a64091 --- /dev/null +++ b/annotations_1/x2S78gnCkRg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[40.0, 41.27], [43.0, 59.1], [61.0, 61.28], [63.0, 63.14], [69.0, 73.04], [74.0, 74.58], [80.0, 80.69], [81.0, 160.54]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 37.31, 0.0, 0.0, 39.34, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 61.56], ["electronic music", 4.9], ["speech", 3.83]], null, null, [["music", 61.54], ["throbbing", 11.51], ["hum", 3.93]], null, null, null], "duration": [1.27, 16.1, 0.28, 0.14, 4.04, 0.58, 0.69, 79.54]} \ No newline at end of file diff --git a/annotations_1/x35VnGsGrFc_filtered.json b/annotations_1/x35VnGsGrFc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b56f5ff524b34f4007523faccdbba06cb8ae8403 --- /dev/null +++ b/annotations_1/x35VnGsGrFc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 21.1], [21.0, 22.18], [25.0, 25.08], [26.0, 26.0], [26.0, 50.67], [52.0, 53.79], [54.0, 102.84], [108.0, 127.99], [130.0, 131.8]], "keep_status": [false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.17, 0.0, 0.0, 30.22, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 47.61], ["speech", 37.61], ["whack, thwack", 2.44]], null, null, [["music", 31.87], ["throbbing", 22.05], ["hum", 14.58]], null], "duration": [0.1, 1.18, 0.08, 0.0, 24.67, 1.79, 48.84, 19.99, 1.8]} \ No newline at end of file diff --git a/annotations_1/x39ZG34sn28_filtered.json b/annotations_1/x39ZG34sn28_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f727625614e0c1841ebbcc296e6b34b6c722e7c --- /dev/null +++ b/annotations_1/x39ZG34sn28_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[71.0, 71.95], [74.0, 77.33], [79.0, 91.42], [92.0, 95.94], [97.0, 101.31], [102.0, 104.87], [105.0, 111.64], [113.0, 114.54], [117.0, 117.02], [118.0, 121.64], [122.0, 122.94], [123.0, 124.12]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 69.61, 68.28, 65.67, 75.39, 83.7, 77.03, 0.0, 0.0, 42.65, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 46.55], ["speech", 17.48], ["hum", 3.06]], null, null], "duration": [0.95, 3.33, 12.42, 3.94, 4.31, 2.87, 6.64, 1.54, 0.02, 3.64, 0.94, 1.12]} \ No newline at end of file diff --git a/annotations_1/x3OTeacsT84_filtered.json b/annotations_1/x3OTeacsT84_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..343bc780f804fce6bf3ec68527ddbcee6ce5d270 --- /dev/null +++ b/annotations_1/x3OTeacsT84_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.42], [5.0, 5.58], [25.0, 28.63], [30.0, 31.77], [33.0, 34.32], [35.0, 36.22], [39.0, 48.59], [50.0, 51.33], [53.0, 55.17], [58.0, 58.13], [59.0, 60.74], [62.0, 62.7], [67.0, 68.34], [72.0, 74.11], [76.0, 76.92], [78.0, 79.69], [81.0, 86.64], [87.0, 89.13], [92.0, 93.75], [96.0, 97.21], [98.0, 101.06], [105.0, 108.92], [109.0, 111.23], [112.0, 113.09], [114.0, 114.49], [117.0, 117.73], [119.0, 129.39], [130.0, 130.6], [132.0, 136.8], [138.0, 138.62], [142.0, 143.72], [145.0, 144.64], [145.0, 147.82], [149.0, 156.98], [162.0, 161.91], [164.0, 164.03], [166.0, 166.23], [167.0, 167.34], [176.0, 176.69], [178.0, 178.02], [183.0, 183.91], [185.0, 187.49], [188.0, 190.14], [191.0, 192.6], [195.0, 195.84], [199.0, 201.48], [203.0, 203.23], [203.0, 206.39], [210.0, 225.22]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 77.87, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 99.52, 0.0, 0.0, 99.95, 99.98, 0.0, 0.0, 90.95, 99.36, 47.86, 0.0, 0.0, 0.0, 98.51, 0.0, 99.73, 0.0, 0.0, 0.0, 32.6, 53.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.92, 53.65, 0.0, 0.0, 64.86, 0.0, 47.9, 38.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 39.22], ["whale vocalization", 15.77], ["hum", 5.46]], null, null, null, null, null, null, null, null, null, [["music", 36.81], ["snicker", 11.26], ["laughter", 10.83]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.13], ["music", 27.96], ["throbbing", 4.74]], [["music", 31.28], ["throbbing", 23.86], ["hum", 20.74]]], "duration": [0.42, 0.58, 3.63, 1.77, 1.32, 1.22, 9.59, 1.33, 2.17, 0.13, 1.74, 0.7, 1.34, 2.11, 0.92, 1.69, 5.64, 2.13, 1.75, 1.21, 3.06, 3.92, 2.23, 1.09, 0.49, 0.73, 10.39, 0.6, 4.8, 0.62, 1.72, -0.36, 2.82, 7.98, -0.09, 0.03, 0.23, 0.34, 0.69, 0.02, 0.91, 2.49, 2.14, 1.6, 0.84, 2.48, 0.23, 3.39, 15.22]} \ No newline at end of file diff --git a/annotations_1/x4IKGG_2L6I_filtered.json b/annotations_1/x4IKGG_2L6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a348615f871f54cd4c053c6441f5da0964a5d01b --- /dev/null +++ b/annotations_1/x4IKGG_2L6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 12.21], [13.0, 13.81], [18.0, 18.5], [25.0, 28.43], [29.0, 33.59], [34.0, 36.07], [39.0, 40.69], [43.0, 47.66], [48.0, 49.4], [50.0, 51.06], [53.0, 54.82], [64.0, 68.64], [73.0, 73.82], [78.0, 79.95], [83.0, 82.9], [83.0, 83.02], [83.0, 84.79], [86.0, 87.0], [89.0, 88.74], [89.0, 89.4], [92.0, 92.85], [95.0, 94.81], [97.0, 97.09], [98.0, 99.2], [100.0, 100.36], [101.0, 101.44], [102.0, 102.81], [107.0, 108.4], [110.0, 113.49], [116.0, 116.65], [118.0, 121.05], [123.0, 126.77], [129.0, 137.1], [139.0, 139.19], [159.0, 159.39], [172.0, 173.97], [176.0, 177.06], [178.0, 181.79]], "keep_status": [false, false, false, false, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true], "silence_prob": [34.26, 0.0, 0.0, 53.22, 39.83, 39.66, 0.0, 49.82, 0.0, 0.0, 0.0, 30.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.2, 0.0, 61.47, 35.98, 42.13, 0.0, 0.0, 0.0, 0.0, 35.59], "audiomae_on_audioset": [[["music", 53.47], ["speech", 33.02], ["sidetone", 1.41]], null, null, null, [["music", 47.13], ["speech", 13.18], ["hum", 3.26]], [["speech", 50.76], ["hum", 9.61], ["music", 6.49]], null, [["sidetone", 67.38], ["speech", 17.51], ["hum", 3.24]], null, null, null, [["fly, housefly", 44.54], ["insect", 13.25], ["speech", 10.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 15.62], ["whack, thwack", 15.12], ["echo", 10.7]], null, null, [["music", 25.59], ["hum", 23.17], ["throbbing", 13.52]], [["throbbing", 36.49], ["hum", 25.06], ["music", 11.33]], null, null, null, null, [["whack, thwack", 10.54], ["music", 10.45], ["throbbing", 7.23]]], "duration": [8.21, 0.81, 0.5, 3.43, 4.59, 2.07, 1.69, 4.66, 1.4, 1.06, 1.82, 4.64, 0.82, 1.95, -0.1, 0.02, 1.79, 1.0, -0.26, 0.4, 0.85, -0.19, 0.09, 1.2, 0.36, 0.44, 0.81, 1.4, 3.49, 0.65, 3.05, 3.77, 8.1, 0.19, 0.39, 1.97, 1.06, 3.79]} \ No newline at end of file diff --git a/annotations_1/x4L81QLGYuM_filtered.json b/annotations_1/x4L81QLGYuM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7204aae38ecfaaf99a18c0cf9764b736526d13ff --- /dev/null +++ b/annotations_1/x4L81QLGYuM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.31], [10.0, 13.93], [16.0, 20.39], [24.0, 24.68], [27.0, 33.91], [34.0, 33.94], [36.0, 36.41], [38.0, 38.18], [39.0, 43.93], [50.0, 51.92], [53.0, 56.98], [60.0, 60.94], [62.0, 63.14], [67.0, 69.11], [69.0, 74.44], [77.0, 88.32], [90.0, 105.51], [107.0, 108.08], [109.0, 108.94], [110.0, 114.51], [116.0, 119.77], [121.0, 122.69], [123.0, 124.12], [125.0, 171.04], [177.0, 180.94], [185.0, 184.84], [185.0, 186.95], [188.0, 192.94], [195.0, 201.41], [202.0, 220.94]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 29.71, 30.65, 0.0, 31.28, 0.0, 0.0, 0.0, 29.62, 0.0, 29.86, 0.0, 0.0, 34.66, 29.49, 30.28, 30.94, 0.0, 0.0, 31.6, 29.95, 0.0, 0.0, 0.0, 34.72, 0.0, 0.0, 28.66, 28.91, 28.97], "audiomae_on_audioset": [null, [["music", 61.79], ["electronic music", 5.32], ["hum", 3.92]], [["music", 54.42], ["throbbing", 14.14], ["hum", 12.71]], null, [["hum", 33.97], ["mains hum", 21.12], ["speech", 15.79]], null, null, null, [["speech", 40.66], ["music", 12.87], ["breaking", 5.61]], null, [["livestock, farm animals, working animals", 54.47], ["cattle, bovinae", 29.8], ["moo", 15.24]], null, null, [["mains hum", 26.58], ["hum", 23.86], ["music", 16.08]], [["speech", 28.8], ["explosion", 18.98], ["burst, pop", 7.04]], [["speech", 68.89], ["music", 14.27], ["sidetone", 1.85]], [["speech", 48.73], ["music", 16.26], ["whack, thwack", 8.57]], null, null, [["music", 55.32], ["hum", 5.19], ["throbbing", 4.75]], [["speech", 50.14], ["music", 12.28], ["thunk", 10.89]], null, null, null, [["music", 49.39], ["hum", 8.0], ["mains hum", 5.97]], null, null, [["music", 19.72], ["cattle, bovinae", 9.5], ["whack, thwack", 9.26]], [["music", 58.62], ["throbbing", 24.23], ["hum", 4.19]], [["music", 57.21], ["speech", 13.2], ["hum", 4.53]]], "duration": [1.31, 3.93, 4.39, 0.68, 6.91, -0.06, 0.41, 0.18, 4.93, 1.92, 3.98, 0.94, 1.14, 2.11, 5.44, 11.32, 15.51, 1.08, -0.06, 4.51, 3.77, 1.69, 1.12, 46.04, 3.94, -0.16, 1.95, 4.94, 6.41, 18.94]} \ No newline at end of file diff --git a/annotations_1/x5Gwzy2FY10_filtered.json b/annotations_1/x5Gwzy2FY10_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b602194e0e2ae26e0518ad6bb0accf68360d3fa4 --- /dev/null +++ b/annotations_1/x5Gwzy2FY10_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.82], [5.0, 7.79], [9.0, 11.64], [13.0, 14.07], [15.0, 15.13], [19.0, 18.99], [19.0, 20.58], [21.0, 22.67], [23.0, 23.45], [27.0, 28.16], [30.0, 32.19], [33.0, 34.21], [41.0, 40.9], [43.0, 43.85], [45.0, 46.62], [49.0, 51.73], [54.0, 54.99], [56.0, 68.3], [72.0, 73.11], [74.0, 74.63], [77.0, 77.53], [79.0, 93.8], [100.0, 100.38], [101.0, 101.14], [103.0, 104.06], [105.0, 105.71], [109.0, 108.9], [109.0, 111.18], [112.0, 113.16], [115.0, 115.53], [116.0, 117.81]], "keep_status": [false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 34.19, 38.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.75, 0.0, 0.0, 0.0, 0.0, 62.27, 0.0, 30.71, 0.0, 0.0, 0.0, 57.97, 0.0, 0.0, 0.0, 0.0, 0.0, 46.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 38.29], ["synthesizer", 12.46], ["electronic music", 7.01]], [["music", 34.77], ["speech", 11.61], ["synthesizer", 7.45]], null, null, null, null, null, null, null, [["music", 15.72], ["boing", 12.17], ["sidetone", 10.33]], null, null, null, null, null, null, [["music", 47.81], ["throbbing", 20.43], ["hum", 13.54]], null, null, null, null, null, null, null, null, null, [["speech", 62.55], ["fart", 3.3], ["burping, eructation", 3.23]], null, null, null], "duration": [0.82, 2.79, 2.64, 1.07, 0.13, -0.01, 1.58, 1.67, 0.45, 1.16, 2.19, 1.21, -0.1, 0.85, 1.62, 2.73, 0.99, 12.3, 1.11, 0.63, 0.53, 14.8, 0.38, 0.14, 1.06, 0.71, -0.1, 2.18, 1.16, 0.53, 1.81]} \ No newline at end of file diff --git a/annotations_1/x5ajdqqytyA_filtered.json b/annotations_1/x5ajdqqytyA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..861d59a65e584c38d411c8850618685fc9606863 --- /dev/null +++ b/annotations_1/x5ajdqqytyA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.03], [12.0, 23.11], [24.0, 27.48], [29.0, 31.97], [33.0, 43.97], [46.0, 59.8], [61.0, 62.87], [64.0, 64.67], [68.0, 73.2], [74.0, 76.69], [80.0, 83.12], [86.0, 97.9], [99.0, 102.15], [103.0, 105.98], [108.0, 113.04], [114.0, 124.65], [127.0, 127.38], [128.0, 128.7], [130.0, 130.94], [134.0, 134.74], [137.0, 138.0], [140.0, 141.83], [144.0, 144.12], [146.0, 147.36], [150.0, 151.66], [152.0, 152.31], [152.0, 152.51], [153.0, 153.66], [155.0, 155.95], [157.0, 158.28], [159.0, 160.51], [162.0, 163.44], [166.0, 167.66], [170.0, 171.71], [173.0, 173.72], [175.0, 175.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.88, 97.22, 98.73, 98.36, 96.77, 65.2, 0.0, 0.0, 55.89, 99.99, 99.91, 97.0, 81.71, 99.8, 99.98, 86.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.03, 11.11, 3.48, 2.97, 10.97, 13.8, 1.87, 0.67, 5.2, 2.69, 3.12, 11.9, 3.15, 2.98, 5.04, 10.65, 0.38, 0.7, 0.94, 0.74, 1.0, 1.83, 0.12, 1.36, 1.66, 0.31, 0.51, 0.66, 0.95, 1.28, 1.51, 1.44, 1.66, 1.71, 0.72, 0.86]} \ No newline at end of file diff --git a/annotations_1/x5z9VZO--G4_filtered.json b/annotations_1/x5z9VZO--G4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9de3d03ab18c540263c61a1089cc74a2a12d2153 --- /dev/null +++ b/annotations_1/x5z9VZO--G4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [3.0, 4.04], [8.0, 7.84], [10.0, 10.72], [20.0, 20.61], [25.0, 24.75], [27.0, 27.62], [28.0, 29.05], [37.0, 39.38], [41.0, 43.31], [44.0, 44.12], [45.0, 46.43], [50.0, 54.16], [55.0, 57.35], [58.0, 60.39], [63.0, 63.9], [67.0, 69.31], [71.0, 71.15], [72.0, 73.09], [75.0, 75.52], [79.0, 81.35], [83.0, 84.77], [87.0, 92.67], [93.0, 95.45], [102.0, 103.11], [105.0, 104.75], [107.0, 112.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.44, 59.77, 0.0, 0.0, 100.0, 100.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 97.73, 0.0, 0.0, 95.78], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.88, 1.04, -0.16, 0.72, 0.61, -0.25, 0.62, 1.05, 2.38, 2.31, 0.12, 1.43, 4.16, 2.35, 2.39, 0.9, 2.31, 0.15, 1.09, 0.52, 2.35, 1.77, 5.67, 2.45, 1.11, -0.25, 5.95]} \ No newline at end of file diff --git a/annotations_1/x7S89GM5N7w_filtered.json b/annotations_1/x7S89GM5N7w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f5205bb556b481d8b1c6da6b77ada457511f3d5f --- /dev/null +++ b/annotations_1/x7S89GM5N7w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 23.11], [26.0, 26.6], [39.0, 41.81], [45.0, 45.06], [45.0, 45.96], [47.0, 47.85], [49.0, 53.3], [59.0, 59.36], [62.0, 62.07], [65.0, 65.06], [68.0, 68.39], [68.0, 68.45], [77.0, 78.17], [87.0, 87.69], [96.0, 95.99], [99.0, 99.86], [100.0, 100.57], [101.0, 102.42], [103.0, 103.69], [105.0, 105.83], [107.0, 108.08], [115.0, 115.26], [121.0, 121.59], [122.0, 121.78], [122.0, 122.22], [123.0, 128.8], [130.0, 130.27]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 86.27, 0.0, 0.0, 0.0, 49.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.62, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["speech", 87.19], ["radio", 4.83], ["telephone", 1.33]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.67], ["radio", 12.68], ["music", 9.04]], null], "duration": [0.11, 0.6, 2.81, 0.06, 0.96, 0.85, 4.3, 0.36, 0.07, 0.06, 0.39, 0.45, 1.17, 0.69, -0.01, 0.86, 0.57, 1.42, 0.69, 0.83, 1.08, 0.26, 0.59, -0.22, 0.22, 5.8, 0.27]} \ No newline at end of file diff --git a/annotations_1/x7qvOFN1QZg_filtered.json b/annotations_1/x7qvOFN1QZg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2550e69c16d03ffb49d00ab46518dc72f6285c30 --- /dev/null +++ b/annotations_1/x7qvOFN1QZg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 17.9], [20.0, 21.42], [22.0, 23.62], [36.0, 37.74], [42.0, 50.67], [51.0, 51.97], [60.0, 60.66], [69.0, 72.98], [74.0, 80.0], [87.0, 89.07], [91.0, 92.64], [94.0, 96.03], [97.0, 97.09], [97.0, 105.19], [106.0, 111.25], [113.0, 136.16], [141.0, 142.33], [146.0, 155.44]], "keep_status": [true, false, false, false, false, false, false, true, true, false, false, true, false, true, true, true, false, true], "silence_prob": [30.98, 0.0, 0.0, 0.0, 30.94, 0.0, 0.0, 32.38, 44.43, 59.96, 0.0, 40.07, 0.0, 43.38, 36.79, 33.08, 0.0, 32.55], "audiomae_on_audioset": [[["breaking", 36.14], ["music", 24.66], ["speech", 6.89]], null, null, null, [["speech", 46.96], ["fart", 15.09], ["music", 11.52]], null, null, [["music", 34.84], ["speech", 26.66], ["electric shaver, electric razor", 4.47]], [["speech", 28.43], ["music", 19.2], ["hum", 18.51]], null, null, [["speech", 24.9], ["hum", 22.34], ["whale vocalization", 5.51]], null, [["whale vocalization", 31.9], ["hum", 27.33], ["mains hum", 8.23]], [["speech", 22.91], ["mains hum", 18.82], ["hum", 16.53]], [["music", 46.82], ["speech", 11.96], ["synthesizer", 5.62]], null, [["speech", 35.48], ["music", 29.46], ["buzz", 4.89]]], "duration": [6.9, 1.42, 1.62, 1.74, 8.67, 0.97, 0.66, 3.98, 6.0, 2.07, 1.64, 2.03, 0.09, 8.19, 5.25, 23.16, 1.33, 9.44]} \ No newline at end of file diff --git a/annotations_1/x7yAcIuyOb4_filtered.json b/annotations_1/x7yAcIuyOb4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db37595bdd6ba4f1eba2047c528e5091b6f9f151 --- /dev/null +++ b/annotations_1/x7yAcIuyOb4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 16.44], [17.0, 22.25], [24.0, 27.19], [28.0, 30.87], [33.0, 46.23], [52.0, 52.78], [61.0, 66.73], [67.0, 67.86], [71.0, 72.3], [75.0, 76.74], [80.0, 81.11], [84.0, 84.7], [86.0, 91.2], [97.0, 97.66], [98.0, 98.78], [101.0, 104.03], [115.0, 117.51], [122.0, 123.31], [140.0, 142.55], [145.0, 145.67], [149.0, 149.57], [161.0, 161.79], [165.0, 165.77], [168.0, 168.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.41, 52.8, 99.1, 99.85, 63.96, 0.0, 86.45, 0.0, 0.0, 0.0, 0.0, 0.0, 73.21, 0.0, 0.0, 55.18, 60.42, 0.0, 58.05, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 69.38], ["musical instrument", 7.15], ["flamenco", 4.74]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.44, 5.25, 3.19, 2.87, 13.23, 0.78, 5.73, 0.86, 1.3, 1.74, 1.11, 0.7, 5.2, 0.66, 0.78, 3.03, 2.51, 1.31, 2.55, 0.67, 0.57, 0.79, 0.77, 0.57]} \ No newline at end of file diff --git a/annotations_1/x9mLSJS0n3Q_filtered.json b/annotations_1/x9mLSJS0n3Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..095a7160f416cc1b24f0dd44af5d3fbcc15a7981 --- /dev/null +++ b/annotations_1/x9mLSJS0n3Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.28], [22.0, 24.54], [27.0, 28.56], [31.0, 31.89], [35.0, 35.36], [39.0, 39.66], [45.0, 46.43], [47.0, 52.17], [53.0, 55.36], [57.0, 61.64], [65.0, 66.39], [69.0, 70.88], [71.0, 75.64], [87.0, 88.72], [92.0, 91.89], [92.0, 92.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.9, 0.0, 0.0, 0.0, 0.0, 0.0, 92.31, 84.25, 95.64, 0.0, 0.0, 92.8, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.28, 2.54, 1.56, 0.89, 0.36, 0.66, 1.43, 5.17, 2.36, 4.64, 1.39, 1.88, 4.64, 1.72, -0.11, 0.03]} \ No newline at end of file diff --git a/annotations_1/xA1Uz_TMzhs_filtered.json b/annotations_1/xA1Uz_TMzhs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99ce588ece5ced19835c17fe5dc75a677f0eadd8 --- /dev/null +++ b/annotations_1/xA1Uz_TMzhs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.59], [8.0, 9.1], [16.0, 16.82], [25.0, 26.84], [28.0, 29.07], [32.0, 32.48], [48.0, 47.88], [50.0, 58.04], [61.0, 62.19], [67.0, 68.77], [73.0, 73.53], [76.0, 76.65], [79.0, 80.38], [90.0, 90.69], [96.0, 98.39], [99.0, 100.3], [102.0, 103.62], [135.0, 135.58], [141.0, 141.74], [155.0, 159.39], [161.0, 161.65]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.75, 0.0, 0.0, 0.0, 0.0, 89.54, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["fart", 40.21], ["fly, housefly", 12.27], ["music", 8.68]], null, null, null, null, null, null], "duration": [1.59, 1.1, 0.82, 1.84, 1.07, 0.48, -0.12, 8.04, 1.19, 1.77, 0.53, 0.65, 1.38, 0.69, 2.39, 1.3, 1.62, 0.58, 0.74, 4.39, 0.65]} \ No newline at end of file diff --git a/annotations_1/xAkmG6uqBd4_filtered.json b/annotations_1/xAkmG6uqBd4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..81cec29e56512b8ef435e68bd5b2c36d775a5554 --- /dev/null +++ b/annotations_1/xAkmG6uqBd4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.43], [13.0, 13.59], [17.0, 17.37], [19.0, 19.31], [23.0, 23.26], [24.0, 28.34], [33.0, 37.32], [40.0, 45.18], [49.0, 53.22], [56.0, 57.18], [58.0, 58.23], [60.0, 59.56], [65.0, 67.09], [78.0, 78.61], [82.0, 83.44], [85.0, 85.24], [93.0, 93.88], [95.0, 95.81], [100.0, 102.95], [103.0, 104.04], [104.0, 104.75], [105.0, 105.53], [111.0, 118.93], [124.0, 132.27], [133.0, 134.3], [135.0, 136.32]], "keep_status": [false, false, false, false, false, true, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [47.05, 0.0, 0.0, 0.0, 0.0, 31.38, 30.6, 31.87, 31.6, 0.0, 0.0, 0.0, 71.57, 0.0, 0.0, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 0.0, 31.95, 31.36, 0.0, 0.0], "audiomae_on_audioset": [[["music", 75.45], ["theremin", 8.72], ["whale vocalization", 1.76]], null, null, null, null, [["music", 46.2], ["didgeridoo", 6.0], ["speech", 5.93]], [["moo", 19.08], ["cattle, bovinae", 7.83], ["music", 7.07]], [["mosquito", 39.93], ["fly, housefly", 21.39], ["insect", 11.43]], [["music", 37.41], ["noise", 24.76], ["theremin", 6.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 34.61], ["fly, housefly", 10.6], ["insect", 6.51]], [["music", 50.3], ["whack, thwack", 30.87], ["smash, crash", 4.32]], null, null], "duration": [2.43, 0.59, 0.37, 0.31, 0.26, 4.34, 4.32, 5.18, 4.22, 1.18, 0.23, -0.44, 2.09, 0.61, 1.44, 0.24, 0.88, 0.81, 2.95, 1.04, 0.75, 0.53, 7.93, 8.27, 1.3, 1.32]} \ No newline at end of file diff --git a/annotations_1/xBI5Rk9qYjU_filtered.json b/annotations_1/xBI5Rk9qYjU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..778caadfd9e99c8a130e5f7ba28eab444ebc7763 --- /dev/null +++ b/annotations_1/xBI5Rk9qYjU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.24], [10.0, 10.61], [12.0, 12.55], [14.0, 14.55], [36.0, 35.97], [41.0, 51.49], [52.0, 57.16], [60.0, 62.73], [65.0, 69.43], [71.0, 71.79], [77.0, 78.33], [92.0, 92.62], [94.0, 95.23], [97.0, 97.28], [107.0, 110.29], [119.0, 119.69], [120.0, 120.28], [121.0, 121.61], [141.0, 144.71], [149.0, 154.03], [157.0, 158.14], [160.0, 160.37], [161.0, 161.18], [161.0, 161.62], [170.0, 173.31]], "keep_status": [false, false, false, false, false, false, true, true, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 34.89, 35.2, 35.16, 41.1, 0.0, 0.0, 0.0, 0.0, 0.0, 73.67, 0.0, 0.0, 0.0, 33.84, 31.06, 0.0, 0.0, 0.0, 0.0, 29.54], "audiomae_on_audioset": [null, null, null, null, null, [["music", 53.56], ["didgeridoo", 36.77], ["musical instrument", 0.57]], [["music", 44.1], ["mosquito", 6.95], ["fly, housefly", 5.58]], [["music", 46.0], ["fly, housefly", 7.07], ["speech", 6.23]], [["fly, housefly", 17.06], ["hum", 13.99], ["insect", 11.9]], null, null, null, null, null, null, null, null, null, [["music", 36.68], ["speech", 23.14], ["boing", 4.53]], [["music", 39.42], ["boing", 14.36], ["speech", 10.49]], null, null, null, null, [["music", 72.85], ["static", 2.47], ["hum", 2.34]]], "duration": [1.24, 0.61, 0.55, 0.55, -0.03, 10.49, 5.16, 2.73, 4.43, 0.79, 1.33, 0.62, 1.23, 0.28, 3.29, 0.69, 0.28, 0.61, 3.71, 5.03, 1.14, 0.37, 0.18, 0.62, 3.31]} \ No newline at end of file diff --git a/annotations_1/xBr1UV3kWqA_filtered.json b/annotations_1/xBr1UV3kWqA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d080852267884988639e3997b9ec8ea0e013e1df --- /dev/null +++ b/annotations_1/xBr1UV3kWqA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.45], [10.0, 10.25], [13.0, 13.09], [21.0, 24.9], [28.0, 28.44], [36.0, 36.46], [38.0, 38.87], [41.0, 43.46], [45.0, 45.77], [46.0, 48.78], [50.0, 51.31], [53.0, 54.87], [58.0, 59.59], [60.0, 67.49], [71.0, 72.87], [83.0, 83.25], [86.0, 101.75], [106.0, 106.46], [115.0, 116.41]], "keep_status": [false, false, false, true, false, false, false, true, false, true, false, false, false, true, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 31.36, 0.0, 0.0, 0.0, 39.02, 0.0, 37.82, 0.0, 0.0, 0.0, 32.09, 0.0, 0.0, 32.03, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 21.33], ["crowd", 12.78], ["livestock, farm animals, working animals", 12.75]], null, null, null, [["speech", 17.87], ["moo", 13.1], ["livestock, farm animals, working animals", 8.08]], null, [["mosquito", 16.86], ["livestock, farm animals, working animals", 14.81], ["moo", 10.97]], null, null, null, [["speech", 27.59], ["moo", 23.16], ["cattle, bovinae", 16.24]], null, null, [["music", 31.9], ["boing", 13.34], ["crowd", 12.05]], null, null], "duration": [0.45, 0.25, 0.09, 3.9, 0.44, 0.46, 0.87, 2.46, 0.77, 2.78, 1.31, 1.87, 1.59, 7.49, 1.87, 0.25, 15.75, 0.46, 1.41]} \ No newline at end of file diff --git a/annotations_1/xC3PGTTjX7E_filtered.json b/annotations_1/xC3PGTTjX7E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a19a8bfa923cfe23a74d413a0f9f9cb49670f7b4 --- /dev/null +++ b/annotations_1/xC3PGTTjX7E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.45], [6.0, 15.13], [16.0, 18.74], [24.0, 28.12], [29.0, 42.15], [51.0, 56.88], [62.0, 65.91], [70.0, 74.41], [84.0, 86.91], [88.0, 90.27], [93.0, 93.55], [94.0, 111.79], [114.0, 115.77], [119.0, 119.52]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, true, false, false], "silence_prob": [0.0, 75.07, 85.35, 95.64, 38.28, 30.88, 29.47, 29.03, 28.98, 28.7, 0.0, 29.16, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 19.04], ["sidetone", 16.73], ["whale vocalization", 13.97]], [["whale vocalization", 47.2], ["music", 12.63], ["hum", 10.93]], [["music", 66.76], ["didgeridoo", 17.25], ["musical instrument", 4.1]], [["music", 62.2], ["didgeridoo", 14.2], ["whale vocalization", 3.45]], [["sidetone", 30.73], ["music", 29.15], ["hum", 10.46]], [["speech", 23.32], ["music", 18.39], ["mains hum", 8.12]], null, [["music", 28.52], ["theremin", 11.53], ["didgeridoo", 8.77]], null, null], "duration": [1.45, 9.13, 2.74, 4.12, 13.15, 5.88, 3.91, 4.41, 2.91, 2.27, 0.55, 17.79, 1.77, 0.52]} \ No newline at end of file diff --git a/annotations_1/xCWkAXGz8W8_filtered.json b/annotations_1/xCWkAXGz8W8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bb459f527425cab75c66af7b42268346f6fa249 --- /dev/null +++ b/annotations_1/xCWkAXGz8W8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 25.41], [38.0, 49.2], [50.0, 51.07], [53.0, 55.0], [60.0, 63.09], [64.0, 67.76], [69.0, 70.6], [73.0, 82.76], [89.0, 89.04], [91.0, 92.77], [96.0, 97.17], [98.0, 100.11], [101.0, 101.71], [106.0, 106.47], [110.0, 115.28], [118.0, 118.5], [121.0, 120.9], [122.0, 122.44]], "keep_status": [true, true, false, true, true, true, false, true, false, false, false, true, false, false, false, false, false, false], "silence_prob": [36.52, 31.5, 0.0, 32.51, 30.77, 33.11, 0.0, 31.58, 0.0, 0.0, 0.0, 32.54, 0.0, 0.0, 29.72, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["busy signal", 42.79], ["sidetone", 9.79], ["dial tone", 9.66]], [["speech", 33.07], ["whack, thwack", 22.41], ["smash, crash", 5.42]], null, [["speech", 25.24], ["music", 17.21], ["fly, housefly", 8.85]], [["music", 21.77], ["speech", 20.98], ["fly, housefly", 13.62]], [["fly, housefly", 43.33], ["mosquito", 13.17], ["speech", 12.87]], null, [["groan", 23.09], ["speech", 22.58], ["music", 17.58]], null, null, null, [["vehicle", 44.59], ["speech", 8.75], ["car", 7.7]], null, null, [["didgeridoo", 35.15], ["music", 31.61], ["noise", 5.06]], null, null, null], "duration": [4.41, 11.2, 1.07, 2.0, 3.09, 3.76, 1.6, 9.76, 0.04, 1.77, 1.17, 2.11, 0.71, 0.47, 5.28, 0.5, -0.1, 0.44]} \ No newline at end of file diff --git a/annotations_1/xCvyw2bipUM_filtered.json b/annotations_1/xCvyw2bipUM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf439b3ac8b5a17209b773a2a4075b88278985c6 --- /dev/null +++ b/annotations_1/xCvyw2bipUM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.45], [13.0, 36.81], [38.0, 61.11], [62.0, 65.96], [67.0, 70.75], [73.0, 73.11], [74.0, 74.41], [77.0, 77.11], [94.0, 94.85], [106.0, 106.46], [111.0, 112.41], [118.0, 141.88], [145.0, 146.25], [147.0, 167.05], [167.0, 167.86], [169.0, 170.16], [171.0, 172.42], [172.0, 172.45], [173.0, 173.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [46.12, 37.49, 34.92, 53.47, 59.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.63, 0.0, 29.97, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 49.37], ["throbbing", 11.21], ["mains hum", 11.08]], [["hum", 65.03], ["mains hum", 14.4], ["throbbing", 9.04]], [["hum", 41.66], ["mains hum", 16.09], ["rumble", 14.55]], null, null, null, null, null, null, null, null, [["hum", 31.8], ["mains hum", 16.51], ["breaking", 16.01]], null, [["speech", 17.19], ["music", 15.43], ["whack, thwack", 9.0]], null, null, null, null, null], "duration": [2.45, 23.81, 23.11, 3.96, 3.75, 0.11, 0.41, 0.11, 0.85, 0.46, 1.41, 23.88, 1.25, 20.05, 0.86, 1.16, 1.42, 0.45, 0.69]} \ No newline at end of file diff --git a/annotations_1/xD9G6rUq_5I_filtered.json b/annotations_1/xD9G6rUq_5I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a179a630b7ce457b35d48aef716012451e7c421 --- /dev/null +++ b/annotations_1/xD9G6rUq_5I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 17.24], [20.0, 21.37], [23.0, 23.23], [25.0, 27.08], [28.0, 29.74], [31.0, 32.27], [33.0, 36.86], [37.0, 60.08], [61.0, 61.65], [63.0, 69.15], [74.0, 110.86]], "keep_status": [true, false, false, false, false, false, false, true, false, false, false], "silence_prob": [41.07, 0.0, 0.0, 46.02, 0.0, 0.0, 71.87, 30.94, 0.0, 52.39, 0.0], "audiomae_on_audioset": [[["music", 40.05], ["speech", 17.49], ["synthesizer", 9.68]], null, null, [["speech", 47.12], ["sidetone", 23.49], ["music", 5.44]], null, null, null, [["music", 33.51], ["gong", 14.42], ["hum", 12.69]], null, null, null], "duration": [8.24, 1.37, 0.23, 2.08, 1.74, 1.27, 3.86, 23.08, 0.65, 6.15, 36.86]} \ No newline at end of file diff --git a/annotations_1/xDZfwTsiLrk_filtered.json b/annotations_1/xDZfwTsiLrk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3869eca524f1f4a4ad02123eb16856f785040b3d --- /dev/null +++ b/annotations_1/xDZfwTsiLrk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.16], [2.0, 2.35], [4.0, 5.36], [6.0, 6.64], [7.0, 7.75], [20.0, 20.24], [21.0, 21.84], [27.0, 29.54], [31.0, 33.84], [35.0, 38.8], [40.0, 42.48], [44.0, 46.53], [47.0, 49.45], [57.0, 57.89], [59.0, 60.61], [61.0, 62.18], [70.0, 70.16], [94.0, 94.37], [99.0, 99.94], [102.0, 103.38]], "keep_status": [false, false, false, false, false, false, false, true, true, true, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.74, 34.61, 36.65, 35.4, 38.8, 30.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 32.78], ["fire alarm", 5.19], ["synthesizer", 4.8]], [["music", 31.58], ["whale vocalization", 29.87], ["synthesizer", 2.84]], [["music", 39.56], ["synthesizer", 6.12], ["buzz", 5.64]], [["music", 47.22], ["ambient music", 11.08], ["hum", 6.66]], [["music", 35.14], ["speech", 16.29], ["mains hum", 5.2]], [["music", 64.66], ["theremin", 7.16], ["synthesizer", 4.37]], null, null, null, null, null, null, null], "duration": [0.16, 0.35, 1.36, 0.64, 0.75, 0.24, 0.84, 2.54, 2.84, 3.8, 2.48, 2.53, 2.45, 0.89, 1.61, 1.18, 0.16, 0.37, 0.94, 1.38]} \ No newline at end of file diff --git a/annotations_1/xDe-990DWEw_filtered.json b/annotations_1/xDe-990DWEw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce1a415de2db34bcab5716551ac826f1db7cddaf --- /dev/null +++ b/annotations_1/xDe-990DWEw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[36.0, 51.73], [53.0, 53.35], [54.0, 55.54], [57.0, 63.02], [65.0, 67.02]], "keep_status": [false, false, false, false, false], "silence_prob": [29.44, 0.0, 0.0, 39.54, 39.22], "audiomae_on_audioset": [[["hum", 40.51], ["mains hum", 38.66], ["music", 9.88]], null, null, [["music", 80.41], ["beatboxing", 3.32], ["speech", 3.19]], [["music", 70.16], ["didgeridoo", 2.59], ["speech", 1.65]]], "duration": [15.73, 0.35, 1.54, 6.02, 2.02]} \ No newline at end of file diff --git a/annotations_1/xDkXQ7uBr5M_filtered.json b/annotations_1/xDkXQ7uBr5M_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7cc5d462bd9581deaec0e96a67f0baaf1a1b0906 --- /dev/null +++ b/annotations_1/xDkXQ7uBr5M_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[33.0, 39.61], [41.0, 42.18], [54.0, 54.3], [55.0, 55.58], [56.0, 58.97], [60.0, 60.45], [61.0, 62.19], [69.0, 70.97], [72.0, 80.37], [82.0, 84.05], [86.0, 89.07], [90.0, 97.28], [98.0, 104.03], [105.0, 109.17], [110.0, 121.19], [121.0, 121.36], [128.0, 129.37], [130.0, 130.54], [131.0, 133.41], [134.0, 137.83], [140.0, 161.06]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, true, true, true], "silence_prob": [97.54, 0.0, 0.0, 0.0, 66.27, 0.0, 0.0, 0.0, 54.3, 80.64, 39.74, 79.94, 72.01, 30.6, 31.3, 0.0, 0.0, 0.0, 30.66, 30.5, 30.49], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["speech", 46.91], ["sidetone", 13.0], ["thunk", 10.69]], null, null, [["speech", 24.05], ["music", 19.52], ["whack, thwack", 9.28]], [["music", 36.37], ["speech", 23.63], ["hum", 7.94]], null, null, null, [["speech", 18.95], ["music", 16.58], ["animal", 2.91]], [["speech", 20.47], ["hum", 17.85], ["music", 17.25]], [["breaking", 25.97], ["music", 24.38], ["whack, thwack", 11.68]]], "duration": [6.61, 1.18, 0.3, 0.58, 2.97, 0.45, 1.19, 1.97, 8.37, 2.05, 3.07, 7.28, 6.03, 4.17, 11.19, 0.36, 1.37, 0.54, 2.41, 3.83, 21.06]} \ No newline at end of file diff --git a/annotations_1/xFoBu7P_Kwc_filtered.json b/annotations_1/xFoBu7P_Kwc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f9cf63ef0f30d234c38b9b97ad7d80ef47f275a0 --- /dev/null +++ b/annotations_1/xFoBu7P_Kwc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.42], [4.0, 4.94], [6.0, 6.98], [8.0, 16.88], [18.0, 24.75], [25.0, 26.52], [28.0, 28.34], [30.0, 34.6], [36.0, 38.99], [43.0, 55.04], [57.0, 57.97], [59.0, 58.95], [60.0, 62.36], [65.0, 74.41], [77.0, 89.7], [90.0, 92.64], [95.0, 95.08], [96.0, 96.97], [99.0, 99.25], [100.0, 117.59], [120.0, 133.93], [138.0, 177.35], [178.0, 184.45], [188.0, 190.63], [196.0, 199.98], [201.0, 201.78], [204.0, 204.2], [205.0, 206.49], [211.0, 212.53], [215.0, 215.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.96, 99.9, 0.0, 0.0, 99.76, 99.62, 63.53, 0.0, 0.0, 68.8, 50.36, 30.88, 100.0, 0.0, 0.0, 0.0, 31.23, 30.72, 0.0, 48.27, 38.37, 99.93, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 14.32], ["gong", 12.92], ["musical instrument", 10.65]], null, null, null, null, [["speech", 50.57], ["explosion", 28.93], ["burst, pop", 8.31]], [["speech", 34.05], ["music", 18.46], ["explosion", 5.47]], null, [["speech", 64.22], ["male speech, man speaking", 6.96], ["hum", 5.65]], [["animal", 33.47], ["cattle, bovinae", 12.46], ["domestic animals, pets", 8.02]], null, null, null, null, null, null], "duration": [1.42, 0.94, 0.98, 8.88, 6.75, 1.52, 0.34, 4.6, 2.99, 12.04, 0.97, -0.05, 2.36, 9.41, 12.7, 2.64, 0.08, 0.97, 0.25, 17.59, 13.93, 39.35, 6.45, 2.63, 3.98, 0.78, 0.2, 1.49, 1.53, 0.64]} \ No newline at end of file diff --git a/annotations_1/xG6__eK9jIE_filtered.json b/annotations_1/xG6__eK9jIE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c784051210bc1b86e5fe6b4136f902018e2b7e97 --- /dev/null +++ b/annotations_1/xG6__eK9jIE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 17.79], [18.0, 27.57], [29.0, 51.88], [53.0, 53.84], [55.0, 79.29], [85.0, 85.68]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 52.33, 39.7, 0.0, 29.65, 0.0], "audiomae_on_audioset": [null, null, [["music", 38.0], ["speech", 29.3], ["hum", 10.13]], null, [["music", 57.2], ["throbbing", 12.74], ["hum", 8.64]], null], "duration": [-0.21, 9.57, 22.88, 0.84, 24.29, 0.68]} \ No newline at end of file diff --git a/annotations_1/xGAAMQLb4ZE_filtered.json b/annotations_1/xGAAMQLb4ZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0e31ff96e0b78cb6b3f2fb4e259c460231354952 --- /dev/null +++ b/annotations_1/xGAAMQLb4ZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.18], [5.0, 6.89], [28.0, 29.89], [30.0, 30.0], [99.0, 100.58], [103.0, 103.84]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.18, 1.89, 1.89, 0.0, 1.58, 0.84]} \ No newline at end of file diff --git a/annotations_1/xGeYzlEV5KY_filtered.json b/annotations_1/xGeYzlEV5KY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..054eb0dfc101909d19d0e37130358fc5cc0a8195 --- /dev/null +++ b/annotations_1/xGeYzlEV5KY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.57], [5.0, 5.19], [22.0, 22.6], [24.0, 24.56], [30.0, 29.81], [30.0, 31.04], [32.0, 32.75], [43.0, 44.66], [46.0, 47.97], [53.0, 53.84], [58.0, 58.99], [61.0, 62.73], [70.0, 72.91], [85.0, 84.91], [88.0, 89.13], [99.0, 107.13], [108.0, 110.76], [112.0, 118.56], [130.0, 131.73], [138.0, 139.72], [141.0, 140.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.9, 0.0, 0.0, 91.13, 92.15, 81.71, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.57, 0.19, 0.6, 0.56, -0.19, 1.04, 0.75, 1.66, 1.97, 0.84, 0.99, 1.73, 2.91, -0.09, 1.13, 8.13, 2.76, 6.56, 1.73, 1.72, -0.07]} \ No newline at end of file diff --git a/annotations_1/xGon_kZAVtU_filtered.json b/annotations_1/xGon_kZAVtU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20096257f62476fb4e87d5796018c3d765431091 --- /dev/null +++ b/annotations_1/xGon_kZAVtU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[61.0, 96.11], [103.0, 103.0], [104.0, 108.43], [114.0, 123.16]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 28.5, 28.49], "audiomae_on_audioset": [null, null, [["speech", 49.88], ["music", 9.54], ["hubbub, speech noise, speech babble", 5.89]], [["speech", 45.22], ["music", 24.77], ["explosion", 2.89]]], "duration": [35.11, 0.0, 4.43, 9.16]} \ No newline at end of file diff --git a/annotations_1/xHDeLp0sWBc_filtered.json b/annotations_1/xHDeLp0sWBc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfe59102950b86c2831949593f0f863cade949d8 --- /dev/null +++ b/annotations_1/xHDeLp0sWBc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.55], [10.0, 13.12], [15.0, 14.99], [23.0, 23.72], [25.0, 25.83], [29.0, 29.78], [30.0, 31.29], [32.0, 32.59], [34.0, 34.72], [36.0, 35.9], [37.0, 37.81], [38.0, 39.33], [40.0, 47.49], [50.0, 63.42], [66.0, 77.03], [77.0, 77.68], [79.0, 80.35], [82.0, 82.97], [85.0, 84.84], [86.0, 86.16], [88.0, 93.12], [95.0, 95.76], [99.0, 100.33], [102.0, 102.57], [105.0, 106.15], [109.0, 109.95], [114.0, 113.88], [115.0, 115.37], [117.0, 121.63], [123.0, 126.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 81.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.88, 98.8, 79.76, 0.0, 0.0, 0.0, 0.0, 0.0, 93.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 99.44], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 3.12, -0.01, 0.72, 0.83, 0.78, 1.29, 0.59, 0.72, -0.1, 0.81, 1.33, 7.49, 13.42, 11.03, 0.68, 1.35, 0.97, -0.16, 0.16, 5.12, 0.76, 1.33, 0.57, 1.15, 0.95, -0.12, 0.37, 4.63, 3.13]} \ No newline at end of file diff --git a/annotations_1/xHtAfA2ctBs_filtered.json b/annotations_1/xHtAfA2ctBs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c7f5acfbeb2636bc741b67230b48cfd8c129bb92 --- /dev/null +++ b/annotations_1/xHtAfA2ctBs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 11.13], [15.0, 130.23]], "keep_status": [false, false], "silence_prob": [32.73, 0.0], "audiomae_on_audioset": [[["speech", 34.46], ["music", 29.45], ["hum", 6.72]], null], "duration": [10.13, 115.23]} \ No newline at end of file diff --git a/annotations_1/xI-ehlRwN8o_filtered.json b/annotations_1/xI-ehlRwN8o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4dbaae73f68e3a218a24b6c6959281da5d5daede --- /dev/null +++ b/annotations_1/xI-ehlRwN8o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 15.36], [16.0, 71.22], [72.0, 72.39], [73.0, 75.24], [87.0, 105.02], [107.0, 112.94], [116.0, 122.37], [125.0, 127.79], [128.0, 159.41], [163.0, 167.56], [169.0, 170.24], [179.0, 180.18], [180.0, 180.99], [182.0, 183.05], [187.0, 186.76], [188.0, 188.79], [189.0, 191.56], [194.0, 198.32], [199.0, 199.99], [202.0, 206.47], [207.0, 207.59], [211.0, 211.15], [211.0, 215.86], [220.0, 221.36], [228.0, 228.63]], "keep_status": [false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 35.45, 33.62, 32.27, 99.36, 0.0, 80.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.79, 87.55, 0.0, 99.99, 0.0, 0.0, 77.87, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 34.28], ["fart", 20.27], ["fly, housefly", 11.84]], [["livestock, farm animals, working animals", 33.35], ["cattle, bovinae", 32.91], ["moo", 24.44]], [["music", 18.94], ["livestock, farm animals, working animals", 13.49], ["moo", 9.55]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.36, 55.22, 0.39, 2.24, 18.02, 5.94, 6.37, 2.79, 31.41, 4.56, 1.24, 1.18, 0.99, 1.05, -0.24, 0.79, 2.56, 4.32, 0.99, 4.47, 0.59, 0.15, 4.86, 1.36, 0.63]} \ No newline at end of file diff --git a/annotations_1/xI4s1uyYIX4_filtered.json b/annotations_1/xI4s1uyYIX4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..20c0a370e2303194a3d403817adf7de9d383e3a6 --- /dev/null +++ b/annotations_1/xI4s1uyYIX4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.22], [4.0, 3.94], [9.0, 63.58], [66.0, 81.6], [85.0, 113.97], [114.0, 114.02], [114.0, 114.05], [115.0, 117.27], [117.0, 119.65], [123.0, 126.5], [127.0, 128.31], [130.0, 146.75], [148.0, 158.38], [161.0, 162.03]], "keep_status": [false, false, false, false, true, false, false, false, true, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.09, 33.14, 0.0, 0.0, 36.57, 32.55, 42.81, 0.0, 30.73, 35.11, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 80.06], ["animal", 4.51], ["livestock, farm animals, working animals", 3.96]], [["music", 21.15], ["noise", 19.14], ["hum", 17.61]], null, null, [["hum", 33.46], ["throbbing", 19.41], ["whale vocalization", 17.45]], [["speech", 31.79], ["hum", 20.69], ["whale vocalization", 11.85]], [["hum", 25.1], ["throbbing", 25.05], ["explosion", 7.54]], null, [["music", 28.75], ["hum", 23.67], ["mains hum", 19.32]], [["hum", 48.59], ["mains hum", 31.78], ["music", 12.19]], null], "duration": [0.22, -0.06, 54.58, 15.6, 28.97, 0.02, 0.05, 2.27, 2.65, 3.5, 1.31, 16.75, 10.38, 1.03]} \ No newline at end of file diff --git a/annotations_1/xI9CLKI1h-g_filtered.json b/annotations_1/xI9CLKI1h-g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b0644d2f6ba0521fa4554b1647852200eddd715 --- /dev/null +++ b/annotations_1/xI9CLKI1h-g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.0], [1.0, 1.68], [4.0, 27.87], [30.0, 47.12], [52.0, 55.85], [58.0, 60.81], [70.0, 73.16], [74.0, 80.87], [84.0, 86.58]], "keep_status": [false, false, false, false, true, false, false, false, true], "silence_prob": [0.0, 0.0, 51.18, 35.21, 46.83, 37.73, 44.9, 31.78, 39.61], "audiomae_on_audioset": [null, null, null, [["radio", 38.55], ["speech", 25.15], ["mains hum", 7.9]], [["throbbing", 17.26], ["music", 16.18], ["hum", 15.4]], [["hum", 51.78], ["throbbing", 17.77], ["mains hum", 11.82]], [["mains hum", 37.67], ["hum", 34.32], ["music", 4.83]], [["whale vocalization", 86.31], ["hum", 6.73], ["throbbing", 2.67]], [["hum", 30.8], ["mains hum", 11.91], ["whale vocalization", 9.0]]], "duration": [0.0, 0.68, 23.87, 17.12, 3.85, 2.81, 3.16, 6.87, 2.58]} \ No newline at end of file diff --git a/annotations_1/xIsVK254RXU_filtered.json b/annotations_1/xIsVK254RXU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5621ecf313d699c48338e8a6b38cd1c0feec71e3 --- /dev/null +++ b/annotations_1/xIsVK254RXU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 25.62], [32.0, 33.4], [35.0, 36.0], [36.0, 41.64], [44.0, 44.61], [47.0, 88.99], [90.0, 91.13], [93.0, 109.66]], "keep_status": [true, false, false, true, false, false, false, false], "silence_prob": [49.5, 0.0, 0.0, 36.38, 0.0, 0.0, 0.0, 29.96], "audiomae_on_audioset": [[["fly, housefly", 27.75], ["insect", 17.19], ["livestock, farm animals, working animals", 8.55]], null, null, [["music", 46.21], ["speech", 4.81], ["didgeridoo", 4.55]], null, null, null, [["speech", 45.43], ["music", 20.74], ["vehicle", 7.84]]], "duration": [12.62, 1.4, 1.0, 5.64, 0.61, 41.99, 1.13, 16.66]} \ No newline at end of file diff --git a/annotations_1/xJb5tOlE1Fs_filtered.json b/annotations_1/xJb5tOlE1Fs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..436cbc30ab8b3f577d9674edb7c9d92111fa5a67 --- /dev/null +++ b/annotations_1/xJb5tOlE1Fs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.66], [4.0, 5.34], [6.0, 6.79], [8.0, 9.32], [11.0, 11.96], [13.0, 13.31], [14.0, 15.48], [16.0, 16.55], [17.0, 17.51], [23.0, 22.87], [25.0, 25.81], [26.0, 26.69], [28.0, 28.24], [29.0, 29.54], [31.0, 31.6], [33.0, 33.51], [35.0, 35.09], [36.0, 37.0], [37.0, 38.06], [40.0, 41.27], [42.0, 43.17], [44.0, 44.68], [45.0, 46.95], [48.0, 48.54], [51.0, 51.02], [53.0, 56.51], [58.0, 73.53], [78.0, 82.31], [84.0, 84.5], [86.0, 85.75], [88.0, 88.28], [89.0, 89.18], [90.0, 90.96], [92.0, 91.72], [94.0, 93.99], [94.0, 94.53], [99.0, 100.9], [102.0, 102.86], [104.0, 105.19], [106.0, 107.52], [109.0, 109.63], [111.0, 111.5], [117.0, 117.78], [118.0, 118.72], [120.0, 124.43], [125.0, 125.0], [125.0, 125.66], [126.0, 127.38], [131.0, 131.11], [132.0, 137.73], [138.0, 140.16], [141.0, 142.86]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 70.3, 87.55, 65.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 75.88, 0.0, 0.0, 0.0, 0.0, 94.37, 72.31, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.66, 1.34, 0.79, 1.32, 0.96, 0.31, 1.48, 0.55, 0.51, -0.13, 0.81, 0.69, 0.24, 0.54, 0.6, 0.51, 0.09, 1.0, 1.06, 1.27, 1.17, 0.68, 1.95, 0.54, 0.02, 3.51, 15.53, 4.31, 0.5, -0.25, 0.28, 0.18, 0.96, -0.28, -0.01, 0.53, 1.9, 0.86, 1.19, 1.52, 0.63, 0.5, 0.78, 0.72, 4.43, 0.0, 0.66, 1.38, 0.11, 5.73, 2.16, 1.86]} \ No newline at end of file diff --git a/annotations_1/xKYgXZQuqm8_filtered.json b/annotations_1/xKYgXZQuqm8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2515f512b9bd8127ccc3525df80a83dc5ee37fc6 --- /dev/null +++ b/annotations_1/xKYgXZQuqm8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.23], [4.0, 5.64], [7.0, 28.21]], "keep_status": [false, false, true], "silence_prob": [0.0, 0.0, 31.34], "audiomae_on_audioset": [null, null, [["speech", 15.37], ["cattle, bovinae", 12.21], ["livestock, farm animals, working animals", 7.68]]], "duration": [1.23, 1.64, 21.21]} \ No newline at end of file diff --git a/annotations_1/xKaCxkf1Ccs_filtered.json b/annotations_1/xKaCxkf1Ccs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ef183e5195088fe53fe5d7dc111bc4f7bac6c66c --- /dev/null +++ b/annotations_1/xKaCxkf1Ccs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.85], [5.0, 5.97], [13.0, 13.81], [16.0, 15.94], [21.0, 23.31], [24.0, 25.03], [30.0, 30.84], [31.0, 32.51], [35.0, 35.56], [37.0, 37.42], [39.0, 42.72], [50.0, 52.07], [54.0, 54.24], [67.0, 66.9], [68.0, 68.42], [75.0, 80.0], [88.0, 89.55], [91.0, 91.72], [92.0, 93.07], [95.0, 95.0], [96.0, 96.69], [105.0, 105.51], [115.0, 115.96], [126.0, 126.45], [131.0, 130.99], [134.0, 136.0], [139.0, 138.92], [140.0, 142.99]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 45.46, 0.0, 0.0, 0.0, 0.0, 0.0, 41.07, 33.25, 0.0, 0.0, 0.0, 39.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 85.72, 0.0, 59.86], "audiomae_on_audioset": [null, null, null, null, [["music", 24.13], ["honk", 9.9], ["musical instrument", 6.63]], null, null, null, null, null, [["music", 35.62], ["speech", 21.31], ["musical instrument", 2.81]], [["livestock, farm animals, working animals", 23.75], ["cattle, bovinae", 16.0], ["moo", 15.07]], null, null, null, [["music", 22.34], ["animal", 17.61], ["bow-wow", 8.36]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.85, 0.97, 0.81, -0.06, 2.31, 1.03, 0.84, 1.51, 0.56, 0.42, 3.72, 2.07, 0.24, -0.1, 0.42, 5.0, 1.55, 0.72, 1.07, 0.0, 0.69, 0.51, 0.96, 0.45, -0.01, 2.0, -0.08, 2.99]} \ No newline at end of file diff --git a/annotations_1/xL3ZOCRgJZM_filtered.json b/annotations_1/xL3ZOCRgJZM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..24c28d406eb9190707af0763043cb1f990562176 --- /dev/null +++ b/annotations_1/xL3ZOCRgJZM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.44], [8.0, 8.72], [10.0, 11.8], [13.0, 22.67], [24.0, 24.9], [25.0, 27.03], [46.0, 50.09], [53.0, 53.91], [54.0, 55.16], [56.0, 56.56], [64.0, 67.15], [70.0, 77.28], [88.0, 94.63], [99.0, 99.59], [100.0, 102.39], [109.0, 119.55], [122.0, 126.27], [127.0, 131.03], [132.0, 133.83], [135.0, 136.36], [138.0, 139.31], [143.0, 143.51], [145.0, 146.03], [153.0, 161.11], [162.0, 168.32], [169.0, 176.52]], "keep_status": [false, false, false, false, false, false, true, false, false, false, true, true, false, false, true, true, false, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 73.51, 0.0, 58.64, 33.1, 0.0, 0.0, 0.0, 35.41, 31.4, 37.77, 0.0, 39.43, 33.54, 93.29, 63.53, 0.0, 0.0, 0.0, 0.0, 0.0, 29.7, 28.55, 29.84], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 51.02], ["speech", 10.07], ["whack, thwack", 8.1]], null, null, null, [["whale vocalization", 18.9], ["grunt", 12.87], ["throbbing", 12.28]], [["speech", 39.32], ["whack, thwack", 9.39], ["music", 7.52]], [["whale vocalization", 89.31], ["livestock, farm animals, working animals", 3.95], ["cattle, bovinae", 3.19]], null, [["whale vocalization", 27.33], ["speech", 19.05], ["sidetone", 12.27]], [["whale vocalization", 28.65], ["speech", 24.56], ["explosion", 9.52]], null, null, null, null, null, null, null, [["music", 15.28], ["speech", 15.12], ["sidetone", 14.17]], [["music", 45.43], ["speech", 15.1], ["electric shaver, electric razor", 3.41]], [["sidetone", 65.9], ["speech", 9.39], ["electric shaver, electric razor", 2.9]]], "duration": [0.44, 0.72, 1.8, 9.67, 0.9, 2.03, 4.09, 0.91, 1.16, 0.56, 3.15, 7.28, 6.63, 0.59, 2.39, 10.55, 4.27, 4.03, 1.83, 1.36, 1.31, 0.51, 1.03, 8.11, 6.32, 7.52]} \ No newline at end of file diff --git a/annotations_1/xLLOmh2nxWQ_filtered.json b/annotations_1/xLLOmh2nxWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4dae8dd16b1cd6d6fc67973b5093b374e839f3f9 --- /dev/null +++ b/annotations_1/xLLOmh2nxWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.84], [3.0, 4.31], [11.0, 11.48], [14.0, 14.47], [15.0, 19.14], [22.0, 22.89], [24.0, 24.31], [25.0, 39.09], [42.0, 45.44], [46.0, 47.51], [48.0, 49.44], [52.0, 53.37], [55.0, 60.0], [63.0, 64.71], [68.0, 68.72], [72.0, 72.59], [74.0, 74.16], [75.0, 91.34], [92.0, 101.09], [102.0, 106.91], [112.0, 112.18], [116.0, 116.77], [120.0, 129.76], [132.0, 134.0], [134.0, 136.61], [159.0, 166.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 78.04, 0.0, 0.0, 51.02, 49.54, 0.0, 0.0, 0.0, 46.09, 0.0, 0.0, 0.0, 0.0, 51.77, 52.62, 54.76, 0.0, 0.0, 62.07, 52.51, 56.25, 60.14], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["music", 70.74], ["musical instrument", 4.18], ["quack", 3.2]], null, null, null, [["music", 61.39], ["speech", 10.77], ["guitar", 6.54]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.84, 1.31, 0.48, 0.47, 4.14, 0.89, 0.31, 14.09, 3.44, 1.51, 1.44, 1.37, 5.0, 1.71, 0.72, 0.59, 0.16, 16.34, 9.09, 4.91, 0.18, 0.77, 9.76, 2.0, 2.61, 7.16]} \ No newline at end of file diff --git a/annotations_1/xLZDij_-ZRw_filtered.json b/annotations_1/xLZDij_-ZRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c49e0f5b8557aeb3dfb5480e455a18488f458bb0 --- /dev/null +++ b/annotations_1/xLZDij_-ZRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.23], [6.0, 6.25], [19.0, 19.13], [24.0, 24.11], [30.0, 30.47], [39.0, 40.34], [53.0, 54.65], [56.0, 57.13], [63.0, 63.22], [66.0, 67.05], [72.0, 72.54], [77.0, 78.29], [79.0, 79.71], [80.0, 81.03], [85.0, 86.41], [87.0, 89.78], [94.0, 94.98], [96.0, 96.89], [102.0, 102.76], [105.0, 105.43], [114.0, 114.34], [124.0, 125.04], [125.0, 129.93], [130.0, 131.67], [136.0, 140.97]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.57, 0.0, 36.52], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 34.17], ["moo", 21.88], ["whale vocalization", 20.05]], null, [["cattle, bovinae", 60.95], ["moo", 25.13], ["livestock, farm animals, working animals", 13.58]]], "duration": [0.23, 0.25, 0.13, 0.11, 0.47, 1.34, 1.65, 1.13, 0.22, 1.05, 0.54, 1.29, 0.71, 1.03, 1.41, 2.78, 0.98, 0.89, 0.76, 0.43, 0.34, 1.04, 4.93, 1.67, 4.97]} \ No newline at end of file diff --git a/annotations_1/xLdIkC6qcow_filtered.json b/annotations_1/xLdIkC6qcow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c33579cb2ee0f8cd492c028015805c75d32ada2 --- /dev/null +++ b/annotations_1/xLdIkC6qcow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.05], [9.0, 10.94], [13.0, 13.88], [15.0, 15.15], [16.0, 17.05], [25.0, 25.07], [26.0, 27.51], [43.0, 49.96], [51.0, 63.88], [65.0, 66.58], [75.0, 75.83], [77.0, 77.87], [78.0, 79.27], [82.0, 82.75], [89.0, 88.82], [89.0, 90.26], [91.0, 92.11], [93.0, 94.73], [97.0, 97.53], [104.0, 105.04], [108.0, 108.23], [119.0, 120.19], [122.0, 123.3], [127.0, 127.13], [129.0, 130.05], [133.0, 132.76], [134.0, 135.04], [138.0, 140.22], [142.0, 143.46]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.66, 53.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.16, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["noise", 15.6], ["hum", 15.57], ["music", 13.67]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.05, 1.94, 0.88, 0.15, 1.05, 0.07, 1.51, 6.96, 12.88, 1.58, 0.83, 0.87, 1.27, 0.75, -0.18, 1.26, 1.11, 1.73, 0.53, 1.04, 0.23, 1.19, 1.3, 0.13, 1.05, -0.24, 1.04, 2.22, 1.46]} \ No newline at end of file diff --git a/annotations_1/xM1MNPKYl5g_filtered.json b/annotations_1/xM1MNPKYl5g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b31919f1791a9d4261b4834c87abecce09b17a7 --- /dev/null +++ b/annotations_1/xM1MNPKYl5g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 13.37], [14.0, 16.68], [17.0, 17.91], [24.0, 24.43], [27.0, 43.5], [44.0, 45.67], [49.0, 49.72], [52.0, 53.1], [54.0, 56.88], [58.0, 81.24], [84.0, 85.24], [87.0, 87.24], [89.0, 89.45], [92.0, 93.87], [97.0, 110.44], [114.0, 115.91], [117.0, 130.2]], "keep_status": [true, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [35.74, 93.29, 0.0, 0.0, 37.46, 0.0, 0.0, 0.0, 57.72, 56.25, 0.0, 0.0, 0.0, 0.0, 32.13, 0.0, 56.86], "audiomae_on_audioset": [[["music", 42.75], ["thunk", 13.02], ["thump, thud", 4.47]], null, null, null, [["music", 39.73], ["thunk", 11.07], ["hum", 10.22]], null, null, null, null, null, null, null, null, null, [["speech", 32.9], ["fly, housefly", 10.36], ["fart", 6.45]], null, null], "duration": [4.37, 2.68, 0.91, 0.43, 16.5, 1.67, 0.72, 1.1, 2.88, 23.24, 1.24, 0.24, 0.45, 1.87, 13.44, 1.91, 13.2]} \ No newline at end of file diff --git a/annotations_1/xME4tintsqs_filtered.json b/annotations_1/xME4tintsqs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d1168963cf7f30d776201e2b1dabb22cc47c1be6 --- /dev/null +++ b/annotations_1/xME4tintsqs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.05], [4.0, 3.91], [7.0, 8.33], [13.0, 13.19], [16.0, 16.58], [19.0, 22.3], [23.0, 24.44], [29.0, 33.67], [36.0, 39.43], [41.0, 74.04], [75.0, 75.0], [76.0, 76.06], [78.0, 97.8], [99.0, 100.77], [103.0, 107.74], [110.0, 110.25], [111.0, 111.5], [112.0, 136.9], [142.0, 143.48], [145.0, 145.74], [149.0, 149.13], [152.0, 152.52], [160.0, 162.48], [164.0, 164.62], [166.0, 166.92], [169.0, 169.62]], "keep_status": [false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 33.49, 0.0, 28.61, 29.13, 0.0, 0.0, 0.0, 43.64, 0.0, 35.75, 0.0, 0.0, 40.61, 0.0, 0.0, 0.0, 0.0, 82.79, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 72.3], ["musical instrument", 3.01], ["hum", 2.35]], null, [["throbbing", 16.84], ["hum", 15.6], ["explosion", 12.65]], [["hum", 30.69], ["music", 25.48], ["throbbing", 22.44]], null, null, null, [["music", 60.79], ["hum", 17.83], ["throbbing", 7.58]], null, [["music", 40.22], ["mains hum", 23.75], ["hum", 10.84]], null, null, [["speech", 26.28], ["music", 23.39], ["hum", 13.14]], null, null, null, null, null, null, null, null], "duration": [1.05, -0.09, 1.33, 0.19, 0.58, 3.3, 1.44, 4.67, 3.43, 33.04, 0.0, 0.06, 19.8, 1.77, 4.74, 0.25, 0.5, 24.9, 1.48, 0.74, 0.13, 0.52, 2.48, 0.62, 0.92, 0.62]} \ No newline at end of file diff --git a/annotations_1/xMjEmE1YLSU_filtered.json b/annotations_1/xMjEmE1YLSU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d389ef93de5e09c518c9ce8cd4e83fd89177906 --- /dev/null +++ b/annotations_1/xMjEmE1YLSU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.96], [7.0, 7.65], [12.0, 12.78], [15.0, 15.72], [19.0, 23.46], [36.0, 56.81], [57.0, 59.07], [69.0, 68.77], [77.0, 77.28], [79.0, 79.88], [86.0, 86.93], [89.0, 89.36], [92.0, 92.84], [94.0, 95.34], [99.0, 100.57], [101.0, 107.42], [109.0, 113.17], [128.0, 129.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 57.89, 39.11, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.13, 99.97, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 45.55], ["music", 34.82], ["electronic music", 1.98]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.96, 0.65, 0.78, 0.72, 4.46, 20.81, 2.07, -0.23, 0.28, 0.88, 0.93, 0.36, 0.84, 1.34, 1.57, 6.42, 4.17, 1.05]} \ No newline at end of file diff --git a/annotations_1/xMoCoTO3d-Y_filtered.json b/annotations_1/xMoCoTO3d-Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..88bf1dc7a86ef1fe2b31753c22f0421dca54d961 --- /dev/null +++ b/annotations_1/xMoCoTO3d-Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.25], [3.0, 3.06], [4.0, 36.85], [41.0, 41.05], [47.0, 47.75], [49.0, 50.97], [52.0, 52.76], [54.0, 54.77], [56.0, 56.03], [60.0, 61.69], [63.0, 64.25], [69.0, 69.8], [76.0, 77.8], [85.0, 86.04], [88.0, 88.3], [97.0, 97.93], [99.0, 99.18], [102.0, 102.22], [103.0, 104.68], [109.0, 109.24], [110.0, 110.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.25, 0.06, 32.85, 0.05, 0.75, 1.97, 0.76, 0.77, 0.03, 1.69, 1.25, 0.8, 1.8, 1.04, 0.3, 0.93, 0.18, 0.22, 1.68, 0.24, 0.49]} \ No newline at end of file diff --git a/annotations_1/xNNd9Uc9J_8_filtered.json b/annotations_1/xNNd9Uc9J_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0377da9ec2b80375dec44e3790d90c7faf1b30f2 --- /dev/null +++ b/annotations_1/xNNd9Uc9J_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.91], [12.0, 19.38], [21.0, 30.5], [35.0, 52.96], [54.0, 53.86], [56.0, 56.34], [57.0, 60.57], [61.0, 69.38], [70.0, 99.99], [103.0, 110.05], [111.0, 112.38], [113.0, 116.87]], "keep_status": [false, false, true, false, false, false, true, true, false, true, false, true], "silence_prob": [0.0, 30.98, 31.21, 30.43, 0.0, 0.0, 29.76, 30.74, 30.56, 46.47, 0.0, 31.56], "audiomae_on_audioset": [null, [["music", 67.0], ["synthesizer", 6.45], ["emergency vehicle", 3.74]], [["music", 47.28], ["hum", 8.35], ["ding", 3.98]], [["music", 65.16], ["musical instrument", 9.87], ["didgeridoo", 3.85]], null, null, [["music", 40.66], ["speech", 12.07], ["electronic music", 4.67]], [["hum", 17.77], ["speech", 16.82], ["music", 12.01]], [["music", 65.78], ["hum", 7.47], ["throbbing", 5.56]], [["music", 42.72], ["hum", 10.8], ["throbbing", 8.45]], null, [["music", 22.98], ["speech", 18.72], ["fly, housefly", 4.66]]], "duration": [1.91, 7.38, 9.5, 17.96, -0.14, 0.34, 3.57, 8.38, 29.99, 7.05, 1.38, 3.87]} \ No newline at end of file diff --git a/annotations_1/xNc951Hq2WA_filtered.json b/annotations_1/xNc951Hq2WA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d0d8b243c545908271a7fd071ac30fc4300d01d9 --- /dev/null +++ b/annotations_1/xNc951Hq2WA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.6], [10.0, 10.84], [12.0, 22.64], [25.0, 46.72], [48.0, 53.81], [56.0, 56.66], [58.0, 58.67], [59.0, 60.67], [62.0, 62.33], [63.0, 65.25], [67.0, 67.09], [71.0, 70.85]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.36, 78.04, 59.07, 0.0, 0.0, 0.0, 0.0, 88.28, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["throbbing", 52.4], ["hum", 32.67], ["music", 5.32]], null, null, null, null, null, null, null, null, null], "duration": [0.6, 0.84, 10.64, 21.72, 5.81, 0.66, 0.67, 1.67, 0.33, 2.25, 0.09, -0.15]} \ No newline at end of file diff --git a/annotations_1/xP7yIQladb0_filtered.json b/annotations_1/xP7yIQladb0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf1121b916638a2f392d4b41e5f6f01319dd93ae --- /dev/null +++ b/annotations_1/xP7yIQladb0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.13], [13.0, 18.69], [33.0, 37.49], [40.0, 42.6], [43.0, 43.55], [47.0, 55.66], [57.0, 67.37], [72.0, 72.37], [74.0, 81.67], [83.0, 83.25], [84.0, 106.95], [112.0, 116.67], [120.0, 124.28]], "keep_status": [true, true, true, true, false, true, true, false, false, false, true, true, true], "silence_prob": [33.2, 29.08, 35.83, 38.05, 0.0, 29.92, 28.68, 0.0, 32.16, 0.0, 29.14, 29.26, 29.62], "audiomae_on_audioset": [[["speech", 43.29], ["livestock, farm animals, working animals", 7.36], ["cattle, bovinae", 5.4]], [["speech", 33.38], ["vehicle", 11.98], ["music", 11.13]], [["speech", 42.63], ["music", 10.44], ["boat, water vehicle", 4.68]], [["speech", 22.95], ["music", 20.14], ["whale vocalization", 5.14]], null, [["music", 23.88], ["vehicle", 22.04], ["buzz", 9.27]], [["buzz", 23.63], ["speech", 12.34], ["livestock, farm animals, working animals", 9.78]], null, [["music", 49.48], ["hum", 18.62], ["throbbing", 15.34]], null, [["music", 16.63], ["vehicle", 8.19], ["hum", 7.24]], [["music", 27.63], ["hum", 4.52], ["speech", 4.11]], [["music", 23.4], ["buzz", 10.12], ["hum", 9.17]]], "duration": [2.13, 5.69, 4.49, 2.6, 0.55, 8.66, 10.37, 0.37, 7.67, 0.25, 22.95, 4.67, 4.28]} \ No newline at end of file diff --git a/annotations_1/xPk6RGGwQC8_filtered.json b/annotations_1/xPk6RGGwQC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3ef631fbf538663d1b38d474dab7335c420ed2b9 --- /dev/null +++ b/annotations_1/xPk6RGGwQC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.64], [8.0, 8.18], [9.0, 10.08], [14.0, 14.61], [18.0, 18.69], [31.0, 32.95], [36.0, 39.61], [41.0, 42.2], [44.0, 45.45], [48.0, 50.13], [59.0, 59.36], [62.0, 63.49], [66.0, 68.28], [69.0, 86.36], [101.0, 108.36], [111.0, 113.21], [119.0, 121.59], [123.0, 123.94], [124.0, 125.68], [127.0, 128.68], [129.0, 129.59], [131.0, 131.55]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.97, 0.0, 0.0, 77.2, 0.0, 0.0, 73.06, 71.43, 71.87, 89.36, 60.42, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.64, 0.18, 1.08, 0.61, 0.69, 1.95, 3.61, 1.2, 1.45, 2.13, 0.36, 1.49, 2.28, 17.36, 7.36, 2.21, 2.59, 0.94, 1.68, 1.68, 0.59, 0.55]} \ No newline at end of file diff --git a/annotations_1/xPwq9go3HDc_filtered.json b/annotations_1/xPwq9go3HDc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..08d7bd71709d9fcb45aa26c4e3028a14ef22e54f --- /dev/null +++ b/annotations_1/xPwq9go3HDc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.12], [12.0, 15.09], [17.0, 23.21], [25.0, 27.04], [28.0, 30.11], [31.0, 32.26], [33.0, 37.05], [38.0, 49.06], [50.0, 60.1], [60.0, 61.94], [63.0, 81.72], [84.0, 87.27], [89.0, 90.34], [91.0, 94.2], [97.0, 98.31], [100.0, 101.6], [108.0, 113.86], [115.0, 117.49], [119.0, 120.83], [122.0, 124.58], [125.0, 131.4], [133.0, 153.66], [155.0, 162.82], [164.0, 179.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [99.26, 99.98, 99.78, 76.04, 98.44, 0.0, 99.65, 99.31, 99.94, 0.0, 89.72, 99.21, 0.0, 71.29, 0.0, 0.0, 98.51, 97.64, 0.0, 94.52, 96.29, 30.64, 96.04, 80.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 37.39], ["hum", 18.68], ["burping, eructation", 8.43]], null, null], "duration": [2.12, 3.09, 6.21, 2.04, 2.11, 1.26, 4.05, 11.06, 10.1, 1.94, 18.72, 3.27, 1.34, 3.2, 1.31, 1.6, 5.86, 2.49, 1.83, 2.58, 6.4, 20.66, 7.82, 15.2]} \ No newline at end of file diff --git a/annotations_1/xQyVBxABGxw_filtered.json b/annotations_1/xQyVBxABGxw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..291d63d993a4fd3e11e0a21c1f253e778762c0d8 --- /dev/null +++ b/annotations_1/xQyVBxABGxw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [4.0, 5.7], [10.0, 10.83], [13.0, 13.85], [17.0, 17.24], [18.0, 18.89], [25.0, 27.33], [29.0, 29.98], [33.0, 36.9], [42.0, 42.38], [46.0, 46.09], [49.0, 49.92], [52.0, 52.76], [57.0, 59.53], [60.0, 72.08], [75.0, 93.51], [95.0, 95.37], [96.0, 96.04], [99.0, 104.84], [107.0, 118.15], [122.0, 122.23], [126.0, 127.48], [128.0, 140.61], [142.0, 144.0], [145.0, 148.04]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.96, 0.0, 75.23, 0.0, 0.0, 0.0, 0.0, 52.39, 33.38, 30.92, 0.0, 0.0, 28.69, 29.65, 0.0, 0.0, 29.6, 32.75, 33.63], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 21.39], ["mains hum", 13.42], ["thunk", 7.75]], [["music", 77.76], ["speech", 6.12], ["throbbing", 3.06]], null, null, [["music", 86.69], ["electronic music", 1.79], ["didgeridoo", 1.29]], [["music", 62.84], ["throbbing", 8.26], ["hum", 7.55]], null, null, [["music", 49.36], ["didgeridoo", 10.97], ["throbbing", 9.54]], [["music", 63.86], ["whale vocalization", 6.33], ["speech", 3.34]], [["music", 32.76], ["hum", 14.0], ["mains hum", 11.87]]], "duration": [0.51, 1.7, 0.83, 0.85, 0.24, 0.89, 2.33, 0.98, 3.9, 0.38, 0.09, 0.92, 0.76, 2.53, 12.08, 18.51, 0.37, 0.04, 5.84, 11.15, 0.23, 1.48, 12.61, 2.0, 3.04]} \ No newline at end of file diff --git a/annotations_1/xR6jSh2HrAA_filtered.json b/annotations_1/xR6jSh2HrAA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0f93284a80faa02777b3eb23d47c4b69cd9cc700 --- /dev/null +++ b/annotations_1/xR6jSh2HrAA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 7.94], [11.0, 29.84], [32.0, 33.07], [38.0, 39.43], [43.0, 54.14], [56.0, 57.25], [59.0, 60.1], [61.0, 62.55], [64.0, 64.34], [65.0, 68.94], [71.0, 73.52], [74.0, 79.22], [80.0, 83.61], [84.0, 85.53], [89.0, 93.01], [94.0, 99.18], [100.0, 101.98], [104.0, 105.16], [106.0, 109.73], [111.0, 134.08], [137.0, 138.35], [139.0, 176.05], [176.0, 177.47]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, true, true, false, false, false], "silence_prob": [0.0, 99.97, 0.0, 0.0, 48.23, 0.0, 0.0, 0.0, 0.0, 41.24, 69.88, 46.5, 34.18, 0.0, 59.68, 44.34, 0.0, 0.0, 37.91, 39.89, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["stomach rumble", 72.52], ["music", 6.74], ["whale vocalization", 5.85]], null, null, null, null, [["music", 24.48], ["whale vocalization", 21.29], ["heart murmur", 15.77]], null, [["whale vocalization", 74.25], ["chirp tone", 3.34], ["rumble", 3.21]], [["music", 40.75], ["whale vocalization", 12.11], ["electronic music", 4.86]], null, null, [["speech", 50.57], ["sidetone", 15.68], ["hum", 6.1]], null, null, [["hum", 33.32], ["throbbing", 19.36], ["music", 15.31]], [["animal", 17.64], ["goat", 11.19], ["stomach rumble", 10.54]], null, null, null], "duration": [-0.06, 18.84, 1.07, 1.43, 11.14, 1.25, 1.1, 1.55, 0.34, 3.94, 2.52, 5.22, 3.61, 1.53, 4.01, 5.18, 1.98, 1.16, 3.73, 23.08, 1.35, 37.05, 1.47]} \ No newline at end of file diff --git a/annotations_1/xRShAxpUZ6Y_filtered.json b/annotations_1/xRShAxpUZ6Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..15adf5f99c1b86f8cd2acce934f5fdb838d8eb4b --- /dev/null +++ b/annotations_1/xRShAxpUZ6Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 15.57], [16.0, 17.9], [18.0, 24.14], [29.0, 33.0], [34.0, 34.82], [40.0, 41.3], [43.0, 43.07], [45.0, 46.5], [52.0, 53.5], [63.0, 66.45], [68.0, 68.28], [73.0, 78.53], [79.0, 79.56], [83.0, 89.16], [90.0, 102.54], [106.0, 112.31], [116.0, 116.41], [117.0, 117.85], [121.0, 128.36], [131.0, 131.21], [134.0, 139.18], [142.0, 156.12], [157.0, 157.44], [158.0, 160.71], [167.0, 171.69], [179.0, 179.85], [181.0, 182.8], [185.0, 185.62], [187.0, 193.41]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, true, false, false, false, true], "silence_prob": [35.63, 0.0, 35.41, 36.54, 0.0, 0.0, 0.0, 0.0, 0.0, 40.04, 0.0, 32.26, 0.0, 29.76, 30.7, 30.41, 0.0, 0.0, 31.37, 0.0, 30.93, 30.62, 0.0, 31.06, 29.45, 0.0, 0.0, 0.0, 30.35], "audiomae_on_audioset": [[["music", 48.74], ["speech", 27.93], ["synthesizer", 2.98]], null, [["music", 69.9], ["synthesizer", 5.61], ["musical instrument", 2.44]], [["music", 38.75], ["speech", 17.66], ["synthesizer", 13.46]], null, null, null, null, null, [["music", 64.04], ["synthesizer", 7.22], ["singing bowl", 2.41]], null, [["music", 54.55], ["speech", 16.16], ["guitar", 7.91]], null, [["music", 61.16], ["speech", 14.63], ["crowd", 3.02]], [["music", 64.82], ["speech", 27.51], ["didgeridoo", 1.18]], [["music", 53.07], ["speech", 32.36], ["boing", 3.81]], null, null, [["music", 57.44], ["didgeridoo", 5.27], ["throbbing", 3.19]], null, [["hum", 19.96], ["mains hum", 16.56], ["breaking", 13.17]], [["music", 26.11], ["hum", 9.31], ["foghorn", 8.24]], null, [["didgeridoo", 65.01], ["music", 18.45], ["speech", 7.67]], [["music", 31.04], ["speech", 13.1], ["thump, thud", 5.47]], null, null, null, [["music", 39.31], ["electronic music", 6.63], ["speech", 5.98]]], "duration": [9.57, 1.9, 6.14, 4.0, 0.82, 1.3, 0.07, 1.5, 1.5, 3.45, 0.28, 5.53, 0.56, 6.16, 12.54, 6.31, 0.41, 0.85, 7.36, 0.21, 5.18, 14.12, 0.44, 2.71, 4.69, 0.85, 1.8, 0.62, 6.41]} \ No newline at end of file diff --git a/annotations_1/xRw3fodr6jY_filtered.json b/annotations_1/xRw3fodr6jY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9d721d31ee2908d3ec9a7b753bd7327f1fafcca --- /dev/null +++ b/annotations_1/xRw3fodr6jY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.65], [20.0, 20.01], [30.0, 31.92], [42.0, 42.35], [58.0, 59.63], [64.0, 64.71], [68.0, 75.71], [78.0, 81.9], [83.0, 83.44], [98.0, 100.57], [101.0, 102.27], [103.0, 106.44], [109.0, 109.05], [118.0, 119.26], [131.0, 136.68], [138.0, 140.56], [157.0, 157.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.53, 40.04, 0.0, 78.72, 0.0, 67.63, 0.0, 0.0, 48.06, 73.36, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 88.46], ["electronic music", 1.92], ["drum and bass", 1.63]], [["electric shaver, electric razor", 35.0], ["hum", 22.95], ["mains hum", 20.28]], null, null, null, null, null, null, [["whistling", 95.4], ["theremin", 1.86], ["whistle", 1.0]], null, null], "duration": [1.65, 0.01, 1.92, 0.35, 1.63, 0.71, 7.71, 3.9, 0.44, 2.57, 1.27, 3.44, 0.05, 1.26, 5.68, 2.56, 0.54]} \ No newline at end of file diff --git a/annotations_1/xSJaxpJHf-s_filtered.json b/annotations_1/xSJaxpJHf-s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4695a95b52bb5374c8374e6046b88ac22a5ee3f7 --- /dev/null +++ b/annotations_1/xSJaxpJHf-s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 29.56], [39.0, 49.05], [55.0, 57.08], [60.0, 61.53], [62.0, 96.36], [100.0, 114.69], [116.0, 117.81], [118.0, 124.93], [128.0, 148.86], [152.0, 167.9], [169.0, 169.16], [170.0, 176.32], [178.0, 180.28], [184.0, 188.69], [202.0, 202.88], [204.0, 249.78]], "keep_status": [false, true, false, false, false, true, false, true, false, false, false, false, false, true, false, false], "silence_prob": [32.01, 32.78, 35.2, 0.0, 0.0, 32.76, 0.0, 34.45, 31.92, 32.53, 0.0, 33.88, 43.61, 33.6, 0.0, 0.0], "audiomae_on_audioset": [[["music", 70.37], ["musical instrument", 3.94], ["cacophony", 3.09]], [["music", 58.85], ["hum", 5.17], ["synthesizer", 4.72]], [["music", 65.01], ["throbbing", 6.71], ["sonar", 5.71]], null, null, [["music", 29.27], ["speech", 10.27], ["animal", 2.32]], null, [["music", 32.04], ["hum", 15.19], ["mains hum", 7.74]], [["music", 35.66], ["mains hum", 22.41], ["hum", 15.06]], [["music", 66.34], ["musical instrument", 4.77], ["percussion", 3.41]], null, [["hum", 39.81], ["throbbing", 22.47], ["mains hum", 16.04]], [["throbbing", 34.96], ["hum", 25.74], ["heart sounds, heartbeat", 15.21]], [["hum", 32.06], ["music", 13.7], ["noise", 12.55]], null, null], "duration": [23.56, 10.05, 2.08, 1.53, 34.36, 14.69, 1.81, 6.93, 20.86, 15.9, 0.16, 6.32, 2.28, 4.69, 0.88, 45.78]} \ No newline at end of file diff --git a/annotations_1/xSM_nz6gKOI_filtered.json b/annotations_1/xSM_nz6gKOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f36e32f723f472bafe7b55a70ad6267758529d6f --- /dev/null +++ b/annotations_1/xSM_nz6gKOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 9.96], [11.0, 12.56], [13.0, 153.84]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [-0.04, 1.56, 140.84]} \ No newline at end of file diff --git a/annotations_1/xSNkZYKC_c0_filtered.json b/annotations_1/xSNkZYKC_c0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4b3d4b219cb3aaa534e97bd3b099cacbe157d9c9 --- /dev/null +++ b/annotations_1/xSNkZYKC_c0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[43.0, 51.39], [56.0, 57.91], [58.0, 87.61], [90.0, 94.95], [96.0, 107.33], [109.0, 126.74], [128.0, 134.86], [137.0, 138.7], [141.0, 143.87], [145.0, 145.42]], "keep_status": [false, false, true, false, false, true, true, false, false, false], "silence_prob": [41.85, 0.0, 29.32, 32.53, 29.52, 29.2, 31.16, 0.0, 31.37, 0.0], "audiomae_on_audioset": [[["mains hum", 24.99], ["hum", 24.81], ["music", 23.06]], null, [["speech", 25.97], ["hum", 21.31], ["music", 17.2]], [["hum", 36.6], ["mains hum", 34.88], ["throbbing", 5.1]], [["hum", 40.98], ["music", 24.61], ["mains hum", 11.72]], [["throbbing", 29.82], ["hum", 24.94], ["speech", 13.45]], [["music", 56.9], ["throbbing", 5.41], ["hum", 2.56]], null, [["speech", 39.92], ["throbbing", 19.93], ["music", 16.62]], null], "duration": [8.39, 1.91, 29.61, 4.95, 11.33, 17.74, 6.86, 1.7, 2.87, 0.42]} \ No newline at end of file diff --git a/annotations_1/xTKfpU41hbY_filtered.json b/annotations_1/xTKfpU41hbY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c1e35ca0224ae35aee00dfdb1704af92fc87e7f6 --- /dev/null +++ b/annotations_1/xTKfpU41hbY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.87], [4.0, 4.41], [4.0, 9.04], [10.0, 27.13], [30.0, 31.87], [33.0, 34.08], [37.0, 44.17], [46.0, 46.95], [52.0, 51.95], [53.0, 57.55], [59.0, 59.26], [60.0, 64.35], [65.0, 65.89], [67.0, 67.36], [70.0, 77.21], [78.0, 79.12], [80.0, 81.77], [83.0, 84.11], [85.0, 86.17], [87.0, 138.77], [144.0, 143.75], [144.0, 149.64], [150.0, 152.79], [154.0, 170.48], [171.0, 172.98]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 28.5, 29.82, 0.0, 0.0, 33.6, 0.0, 0.0, 39.18, 0.0, 39.34, 0.0, 0.0, 49.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.74, 51.99, 39.47, 0.0], "audiomae_on_audioset": [null, null, [["speech", 61.08], ["music", 6.23], ["explosion", 5.44]], [["hum", 24.75], ["mains hum", 20.74], ["music", 14.46]], null, null, [["speech", 35.83], ["hum", 29.92], ["mains hum", 8.87]], null, null, [["throbbing", 41.26], ["music", 19.09], ["hum", 13.25]], null, [["hum", 22.03], ["speech", 20.36], ["mains hum", 15.59]], null, null, [["music", 29.63], ["hum", 7.63], ["crackle", 5.61]], null, null, null, null, null, null, [["music", 21.69], ["speech", 14.33], ["hum", 8.71]], null, [["music", 34.85], ["speech", 19.08], ["hum", 8.45]], null], "duration": [-0.13, 0.41, 5.04, 17.13, 1.87, 1.08, 7.17, 0.95, -0.05, 4.55, 0.26, 4.35, 0.89, 0.36, 7.21, 1.12, 1.77, 1.11, 1.17, 51.77, -0.25, 5.64, 2.79, 16.48, 1.98]} \ No newline at end of file diff --git a/annotations_1/xUHjhz5U1bA_filtered.json b/annotations_1/xUHjhz5U1bA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7dc8b70cecd188add03de7a0fc65964d8f385079 --- /dev/null +++ b/annotations_1/xUHjhz5U1bA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 62.02], [63.0, 66.02], [67.0, 72.32], [78.0, 79.74], [80.0, 82.56], [84.0, 95.22], [96.0, 96.77], [100.0, 100.99], [101.0, 115.91]], "keep_status": [false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 80.46, 45.14, 0.0, 46.19, 33.36, 0.0, 0.0, 29.67], "audiomae_on_audioset": [null, null, [["speech", 38.57], ["music", 29.48], ["singing bowl", 2.86]], null, [["music", 40.74], ["speech", 8.07], ["theremin", 4.62]], [["music", 43.6], ["speech", 32.34], ["electric shaver, electric razor", 1.86]], null, null, [["music", 62.82], ["musical instrument", 4.71], ["hum", 3.52]]], "duration": [48.02, 3.02, 5.32, 1.74, 2.56, 11.22, 0.77, 0.99, 14.91]} \ No newline at end of file diff --git a/annotations_1/xUNy6fZy4WE_filtered.json b/annotations_1/xUNy6fZy4WE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..60edf2e4b47621a8cad932ee873f656824111cca --- /dev/null +++ b/annotations_1/xUNy6fZy4WE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 14.86], [17.0, 17.07], [18.0, 19.48], [21.0, 21.9], [23.0, 24.92], [26.0, 26.33], [32.0, 32.71], [35.0, 36.24], [37.0, 38.4], [39.0, 40.0], [41.0, 43.11], [44.0, 46.95], [48.0, 53.5], [55.0, 56.71], [62.0, 64.03], [67.0, 67.42], [68.0, 69.01], [70.0, 71.2], [72.0, 73.28], [75.0, 75.68], [77.0, 78.24], [79.0, 82.27], [84.0, 84.4], [85.0, 85.41], [87.0, 87.83], [89.0, 91.42], [96.0, 113.56], [114.0, 147.82], [149.0, 153.96], [155.0, 160.51]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [61.08, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.04, 59.42, 57.81, 0.0, 61.47, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.56, 0.0, 0.0, 0.0, 45.65, 31.97, 0.0, 33.4, 37.66], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 63.23], ["effects unit", 5.84], ["musical instrument", 3.65]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 15.03], ["speech", 9.6], ["throbbing", 8.06]], [["speech", 40.83], ["music", 16.53], ["throbbing", 8.35]], null, [["music", 50.76], ["hum", 12.54], ["throbbing", 9.12]], [["throbbing", 49.6], ["music", 28.07], ["hum", 9.5]]], "duration": [3.86, 0.07, 1.48, 0.9, 1.92, 0.33, 0.71, 1.24, 1.4, 1.0, 2.11, 2.95, 5.5, 1.71, 2.03, 0.42, 1.01, 1.2, 1.28, 0.68, 1.24, 3.27, 0.4, 0.41, 0.83, 2.42, 17.56, 33.82, 4.96, 5.51]} \ No newline at end of file diff --git a/annotations_1/xURDJ-IW5YM_filtered.json b/annotations_1/xURDJ-IW5YM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad80d7370ae20e276fed6d9140863ef51ffbe19a --- /dev/null +++ b/annotations_1/xURDJ-IW5YM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.93], [26.0, 27.6], [31.0, 33.47], [34.0, 38.13], [41.0, 41.64], [54.0, 55.27], [60.0, 60.94], [65.0, 65.77], [67.0, 68.15], [70.0, 76.23], [77.0, 77.94], [79.0, 85.55], [97.0, 99.03], [110.0, 114.78], [116.0, 128.93], [136.0, 136.66], [137.0, 138.54], [150.0, 154.68], [157.0, 157.69], [161.0, 161.0], [162.0, 163.49], [164.0, 163.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.93, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.48, 0.0, 58.72, 72.31, 47.82, 42.67, 0.0, 0.0, 47.74, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["music", 73.79], ["musical instrument", 3.04], ["carnatic music", 1.85]], null, null, null, [["music", 64.55], ["mantra", 4.07], ["plucked string instrument", 3.38]], [["music", 74.48], ["humming", 5.19], ["musical instrument", 2.62]], null, null, [["music", 73.65], ["lullaby", 2.92], ["singing", 2.33]], null, null, null, null], "duration": [-0.07, 1.6, 2.47, 4.13, 0.64, 1.27, 0.94, 0.77, 1.15, 6.23, 0.94, 6.55, 2.03, 4.78, 12.93, 0.66, 1.54, 4.68, 0.69, 0.0, 1.49, -0.47]} \ No newline at end of file diff --git a/annotations_1/xVANxG9gI6g_filtered.json b/annotations_1/xVANxG9gI6g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6bdbcaa0d66d0002a1fd5c0fcff1c719f1b3b15d --- /dev/null +++ b/annotations_1/xVANxG9gI6g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 14.23], [22.0, 23.16], [24.0, 29.54], [30.0, 29.62], [31.0, 32.26], [33.0, 33.0], [33.0, 34.33], [38.0, 44.34], [56.0, 67.81], [73.0, 73.4], [82.0, 82.7], [84.0, 84.03], [86.0, 87.3], [98.0, 99.06], [101.0, 102.41], [103.0, 104.97], [107.0, 108.51], [111.0, 112.04], [114.0, 114.27], [116.0, 117.21], [119.0, 120.61], [122.0, 123.09], [129.0, 129.9], [131.0, 132.8], [134.0, 135.03], [136.0, 137.37], [140.0, 140.05], [141.0, 140.9], [144.0, 144.64], [148.0, 148.71], [162.0, 162.33], [166.0, 166.78], [168.0, 169.4]], "keep_status": [false, false, true, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 30.01, 0.0, 0.0, 0.0, 0.0, 29.22, 30.75, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 61.55], ["didgeridoo", 3.82], ["musical instrument", 3.3]], null, null, null, null, [["moo", 22.6], ["cattle, bovinae", 21.78], ["music", 19.34]], [["music", 31.59], ["speech", 28.67], ["cattle, bovinae", 4.79]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.23, 1.16, 5.54, -0.38, 1.26, 0.0, 1.33, 6.34, 11.81, 0.4, 0.7, 0.03, 1.3, 1.06, 1.41, 1.97, 1.51, 1.04, 0.27, 1.21, 1.61, 1.09, 0.9, 1.8, 1.03, 1.37, 0.05, -0.1, 0.64, 0.71, 0.33, 0.78, 1.4]} \ No newline at end of file diff --git a/annotations_1/xVWAp3OLYTM_filtered.json b/annotations_1/xVWAp3OLYTM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3d0f9597495725a0a1b3a12271a61cd83152aa3c --- /dev/null +++ b/annotations_1/xVWAp3OLYTM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.69], [7.0, 16.17], [17.0, 23.58], [25.0, 26.33], [28.0, 28.98], [30.0, 30.86], [35.0, 42.94], [43.0, 49.5], [50.0, 53.59], [54.0, 56.52], [59.0, 68.67], [70.0, 70.21], [72.0, 72.06], [73.0, 73.18], [74.0, 75.56], [76.0, 78.29], [80.0, 84.74], [86.0, 97.9], [98.0, 103.27], [104.0, 104.67], [105.0, 106.1], [108.0, 109.85], [110.0, 114.18], [115.0, 114.94], [115.0, 116.97], [117.0, 117.05], [117.0, 147.51], [149.0, 149.12], [152.0, 154.97], [156.0, 175.53], [177.0, 192.21]], "keep_status": [false, true, false, false, false, false, true, false, true, true, false, false, false, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.16, 40.7, 0.0, 0.0, 0.0, 40.36, 35.18, 43.71, 36.51, 33.08, 0.0, 0.0, 0.0, 0.0, 32.89, 34.52, 32.03, 37.62, 0.0, 0.0, 0.0, 34.52, 0.0, 0.0, 0.0, 0.0, 0.0, 86.64, 62.37, 51.44], "audiomae_on_audioset": [null, [["hum", 28.52], ["whale vocalization", 12.59], ["animal", 8.72]], [["livestock, farm animals, working animals", 46.29], ["cattle, bovinae", 42.42], ["moo", 9.11]], null, null, null, [["speech", 20.18], ["didgeridoo", 19.28], ["whale vocalization", 6.73]], [["hum", 46.18], ["throbbing", 38.55], ["mains hum", 4.27]], [["hum", 19.93], ["throbbing", 11.37], ["rumble", 6.3]], [["music", 33.03], ["hum", 15.97], ["musical instrument", 5.17]], [["livestock, farm animals, working animals", 57.35], ["cattle, bovinae", 31.9], ["moo", 6.59]], null, null, null, null, [["noise", 73.1], ["hum", 4.62], ["groan", 4.31]], [["music", 18.65], ["throbbing", 16.3], ["hum", 14.19]], [["hum", 16.77], ["explosion", 12.84], ["throbbing", 8.55]], [["hum", 45.47], ["throbbing", 29.9], ["music", 11.33]], null, null, null, [["speech", 25.33], ["hum", 13.4], ["whale vocalization", 11.03]], null, null, null, null, null, null, null, null], "duration": [-0.31, 9.17, 6.58, 1.33, 0.98, 0.86, 7.94, 6.5, 3.59, 2.52, 9.67, 0.21, 0.06, 0.18, 1.56, 2.29, 4.74, 11.9, 5.27, 0.67, 1.1, 1.85, 4.18, -0.06, 1.97, 0.05, 30.51, 0.12, 2.97, 19.53, 15.21]} \ No newline at end of file diff --git a/annotations_1/xXi-6s-qrQM_filtered.json b/annotations_1/xXi-6s-qrQM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d036a3821f73a04f0dab9a106153290cb8708713 --- /dev/null +++ b/annotations_1/xXi-6s-qrQM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.7], [7.0, 10.13], [15.0, 23.7], [26.0, 26.69], [30.0, 30.97], [37.0, 40.86], [42.0, 47.06], [57.0, 58.13], [66.0, 66.38], [69.0, 69.48], [70.0, 74.36], [75.0, 76.27], [83.0, 83.84], [87.0, 86.9], [92.0, 92.6], [98.0, 99.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [47.46, 46.5, 88.83, 0.0, 0.0, 77.87, 77.03, 0.0, 0.0, 0.0, 41.95, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 54.75], ["synthesizer", 14.56], ["electronic music", 3.11]], [["music", 60.8], ["hum", 5.71], ["electronic music", 5.52]], null, null, null, null, null, null, null, null, [["frog", 12.55], ["wild animals", 12.42], ["whale vocalization", 10.54]], null, null, null, null, null], "duration": [2.7, 3.13, 8.7, 0.69, 0.97, 3.86, 5.06, 1.13, 0.38, 0.48, 4.36, 1.27, 0.84, -0.1, 0.6, 1.74]} \ No newline at end of file diff --git a/annotations_1/xYHBAXUJ-Zs_filtered.json b/annotations_1/xYHBAXUJ-Zs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bc4f48423ad1872428ea4b744b8c9269a311653c --- /dev/null +++ b/annotations_1/xYHBAXUJ-Zs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 11.01], [17.0, 17.54], [26.0, 26.35], [29.0, 28.88], [32.0, 32.54], [33.0, 33.89], [37.0, 37.61], [43.0, 43.24], [47.0, 47.68], [51.0, 51.41], [81.0, 81.4], [82.0, 83.05], [87.0, 88.6], [92.0, 92.69], [102.0, 102.24], [106.0, 105.9], [109.0, 109.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.01, 0.54, 0.35, -0.12, 0.54, 0.89, 0.61, 0.24, 0.68, 0.41, 0.4, 1.05, 1.6, 0.69, 0.24, -0.1, 0.73]} \ No newline at end of file diff --git a/annotations_1/xYIhxXt58uE_filtered.json b/annotations_1/xYIhxXt58uE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d30125f0fdcfb41a4056004e9da89203a93d1c4c --- /dev/null +++ b/annotations_1/xYIhxXt58uE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 17.24], [21.0, 21.59], [23.0, 22.98], [24.0, 24.31], [29.0, 28.92], [31.0, 31.82], [34.0, 36.61], [38.0, 50.94], [53.0, 167.44], [170.0, 177.3]], "keep_status": [true, false, false, false, false, false, true, false, false, false], "silence_prob": [37.74, 0.0, 0.0, 0.0, 0.0, 0.0, 37.13, 28.46, 0.0, 30.74], "audiomae_on_audioset": [[["sidetone", 30.05], ["speech", 26.58], ["music", 11.47]], null, null, null, null, null, [["hum", 21.22], ["music", 15.81], ["throbbing", 13.29]], [["hum", 38.07], ["throbbing", 27.73], ["music", 20.45]], null, [["music", 45.19], ["whale vocalization", 38.73], ["theremin", 6.56]]], "duration": [2.24, 0.59, -0.02, 0.31, -0.08, 0.82, 2.61, 12.94, 114.44, 7.3]} \ No newline at end of file diff --git a/annotations_1/xYfxboRtKJE_filtered.json b/annotations_1/xYfxboRtKJE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc7972492dc8f487400befbbceac82a6dfa312a9 --- /dev/null +++ b/annotations_1/xYfxboRtKJE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 57.33], [62.0, 62.97], [70.0, 72.45], [75.0, 75.22], [76.0, 78.73], [79.0, 79.78], [82.0, 82.7], [84.0, 83.86], [84.0, 95.1], [97.0, 108.97], [110.0, 110.67], [111.0, 114.89], [116.0, 126.94], [129.0, 129.93], [131.0, 130.98], [132.0, 133.37], [134.0, 134.47]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 35.42, 0.0, 80.82, 0.0, 0.0, 0.0, 77.87, 55.11, 0.0, 63.53, 59.15, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["noise", 8.11], ["cough", 7.29], ["radio", 6.61]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [36.33, 0.97, 2.45, 0.22, 2.73, 0.78, 0.7, -0.14, 11.1, 11.97, 0.67, 3.89, 10.94, 0.93, -0.02, 1.37, 0.47]} \ No newline at end of file diff --git a/annotations_1/x_6ZpxB4xIc_filtered.json b/annotations_1/x_6ZpxB4xIc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49e626a3da5ceb9f87f7bd1a3411895e3092389d --- /dev/null +++ b/annotations_1/x_6ZpxB4xIc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 10.5], [12.0, 15.53], [17.0, 16.92], [25.0, 25.35], [29.0, 29.35], [30.0, 30.74], [32.0, 33.02], [34.0, 35.19], [39.0, 40.98], [43.0, 42.89], [44.0, 45.35], [48.0, 48.64], [51.0, 51.97], [56.0, 56.67], [58.0, 59.48], [62.0, 63.64], [65.0, 65.74], [67.0, 67.19], [77.0, 77.06], [79.0, 80.0], [82.0, 82.83], [86.0, 86.8], [87.0, 88.1], [92.0, 94.27], [95.0, 96.55], [97.0, 98.73], [102.0, 101.92], [106.0, 106.71], [117.0, 117.58], [122.0, 129.03], [133.0, 133.19], [134.0, 134.65], [136.0, 140.02], [143.0, 143.11]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 35.3, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.48, 0.0, 0.0, 0.0, 0.0, 0.0, 43.87, 0.0, 0.0, 57.09, 0.0], "audiomae_on_audioset": [null, [["music", 33.89], ["wind instrument, woodwind instrument", 17.05], ["brass instrument", 8.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 59.55], ["musical instrument", 8.76], ["didgeridoo", 6.84]], null, null, null, null], "duration": [0.5, 3.53, -0.08, 0.35, 0.35, 0.74, 1.02, 1.19, 1.98, -0.11, 1.35, 0.64, 0.97, 0.67, 1.48, 1.64, 0.74, 0.19, 0.06, 1.0, 0.83, 0.8, 1.1, 2.27, 1.55, 1.73, -0.08, 0.71, 0.58, 7.03, 0.19, 0.65, 4.02, 0.11]} \ No newline at end of file diff --git a/annotations_1/x_BYzj4jQEM_filtered.json b/annotations_1/x_BYzj4jQEM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..032bb45b15ad27824b7ccdb20512053d16409783 --- /dev/null +++ b/annotations_1/x_BYzj4jQEM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.95], [16.0, 16.83], [24.0, 25.78], [29.0, 29.52], [31.0, 32.51], [34.0, 36.14], [37.0, 37.32], [39.0, 39.87], [44.0, 44.81], [46.0, 54.51], [71.0, 81.19], [83.0, 84.5], [88.0, 87.89], [89.0, 88.91], [90.0, 91.08], [92.0, 93.77], [96.0, 99.57], [101.0, 109.43], [111.0, 111.92], [112.0, 113.63], [115.0, 115.23], [117.0, 116.83], [118.0, 118.12], [119.0, 118.89], [123.0, 124.19], [125.0, 136.24], [137.0, 137.88], [143.0, 143.56]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 0.0, 0.0, 0.0, 49.59, 89.36, 0.0, 0.0, 0.0, 0.0, 0.0, 99.52, 91.13, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 23.65], ["vehicle", 18.41], ["mains hum", 6.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.95, 0.83, 1.78, 0.52, 1.51, 2.14, 0.32, 0.87, 0.81, 8.51, 10.19, 1.5, -0.11, -0.09, 1.08, 1.77, 3.57, 8.43, 0.92, 1.63, 0.23, -0.17, 0.12, -0.11, 1.19, 11.24, 0.88, 0.56]} \ No newline at end of file diff --git a/annotations_1/xaIlgOMjspo_filtered.json b/annotations_1/xaIlgOMjspo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..37d1852ed60aed88f5bc1e0f2e55a687e2217be4 --- /dev/null +++ b/annotations_1/xaIlgOMjspo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.99], [13.0, 15.79], [19.0, 20.8], [33.0, 33.57], [34.0, 34.92], [41.0, 42.85], [43.0, 42.9], [43.0, 43.51], [50.0, 50.35], [52.0, 53.22], [56.0, 56.22], [66.0, 66.36], [82.0, 83.03], [88.0, 89.41], [118.0, 120.75], [121.0, 122.5]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 96.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.99, 2.79, 1.8, 0.57, 0.92, 1.85, -0.1, 0.51, 0.35, 1.22, 0.22, 0.36, 1.03, 1.41, 2.75, 1.5]} \ No newline at end of file diff --git a/annotations_1/xbhm9F1ST6I_filtered.json b/annotations_1/xbhm9F1ST6I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bb1a1d03e8e4ecf0e9fd1230a9f585c14be680d6 --- /dev/null +++ b/annotations_1/xbhm9F1ST6I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 16.6], [23.0, 23.53], [41.0, 42.01], [46.0, 46.82], [54.0, 54.41], [57.0, 58.6], [59.0, 58.87], [60.0, 60.37], [60.0, 61.75], [62.0, 63.46], [64.0, 64.74], [66.0, 66.45], [68.0, 70.88], [75.0, 83.34], [84.0, 84.6], [85.0, 85.73], [93.0, 95.77], [96.0, 96.11], [106.0, 105.97], [121.0, 121.54], [126.0, 126.54], [127.0, 128.29], [152.0, 153.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.4, 37.99, 0.0, 0.0, 39.28, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 72.24], ["speech", 2.51], ["musical instrument", 1.58]], [["music", 78.96], ["synthesizer", 5.67], ["musical instrument", 1.96]], null, null, [["speech", 40.94], ["moo", 14.02], ["cattle, bovinae", 11.0]], null, null, null, null, null, null], "duration": [1.6, 0.53, 1.01, 0.82, 0.41, 1.6, -0.13, 0.37, 1.75, 1.46, 0.74, 0.45, 2.88, 8.34, 0.6, 0.73, 2.77, 0.11, -0.03, 0.54, 0.54, 1.29, 1.17]} \ No newline at end of file diff --git a/annotations_1/xc2Ctw8pGrc_filtered.json b/annotations_1/xc2Ctw8pGrc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bb41c737480d246d95e532a65cd33c1735221da --- /dev/null +++ b/annotations_1/xc2Ctw8pGrc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.05], [3.0, 3.65], [9.0, 9.41], [10.0, 10.93], [18.0, 21.91], [24.0, 25.71], [29.0, 29.44], [30.0, 31.13], [31.0, 33.24], [36.0, 36.09], [37.0, 37.93], [45.0, 48.17], [49.0, 50.94], [52.0, 58.41], [60.0, 61.7], [63.0, 66.88], [68.0, 69.06], [70.0, 72.08], [73.0, 77.03], [77.0, 92.37], [95.0, 96.55], [97.0, 99.08], [100.0, 112.36], [114.0, 118.27], [119.0, 123.38], [125.0, 134.11], [137.0, 137.54], [140.0, 141.79], [143.0, 143.68], [144.0, 144.85], [146.0, 148.91], [149.0, 149.01], [150.0, 154.06], [155.0, 157.74], [159.0, 181.31], [182.0, 182.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, true, false, false, false, false, true, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 37.33, 0.0, 0.0, 0.0, 50.56, 0.0, 0.0, 52.86, 0.0, 66.15, 0.0, 65.91, 0.0, 40.01, 97.11, 61.57, 0.0, 67.89, 30.93, 31.5, 40.93, 31.06, 0.0, 0.0, 0.0, 0.0, 30.63, 0.0, 33.26, 38.83, 30.83, 0.0], "audiomae_on_audioset": [null, null, null, null, [["sidetone", 45.38], ["mains hum", 21.76], ["hum", 12.29]], null, null, null, null, null, null, null, null, null, null, null, null, [["didgeridoo", 65.72], ["music", 25.42], ["musical instrument", 2.36]], null, null, null, null, [["music", 32.4], ["throbbing", 8.48], ["speech", 8.47]], [["music", 21.0], ["speech", 19.25], ["clang", 10.28]], [["music", 41.24], ["speech", 30.35], ["hum", 6.39]], [["music", 39.56], ["thunk", 11.88], ["throbbing", 9.68]], null, null, null, null, [["speech", 23.04], ["hum", 17.47], ["music", 14.37]], null, [["speech", 27.13], ["music", 15.05], ["electric shaver, electric razor", 9.24]], [["gong", 53.24], ["speech", 17.42], ["hum", 8.8]], [["music", 44.12], ["hum", 17.87], ["mains hum", 7.44]], null], "duration": [0.05, 0.65, 0.41, 0.93, 3.91, 1.71, 0.44, 1.13, 2.24, 0.09, 0.93, 3.17, 1.94, 6.41, 1.7, 3.88, 1.06, 2.08, 4.03, 15.37, 1.55, 2.08, 12.36, 4.27, 4.38, 9.11, 0.54, 1.79, 0.68, 0.85, 2.91, 0.01, 4.06, 2.74, 22.31, 0.95]} \ No newline at end of file diff --git a/annotations_1/xcTK6uPPiAo_filtered.json b/annotations_1/xcTK6uPPiAo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..919d1a82c8818649fe92b3e5513b79b995b31fc0 --- /dev/null +++ b/annotations_1/xcTK6uPPiAo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 7.67], [11.0, 17.52], [19.0, 18.79], [26.0, 39.7], [41.0, 52.79], [54.0, 72.74], [74.0, 120.45], [122.0, 123.26], [123.0, 125.39], [127.0, 129.91], [130.0, 163.38]], "keep_status": [false, false, false, true, false, true, false, false, false, true, false], "silence_prob": [0.0, 47.78, 0.0, 32.72, 32.18, 31.17, 0.0, 0.0, 33.28, 33.51, 0.0], "audiomae_on_audioset": [null, [["music", 59.26], ["throbbing", 15.1], ["hum", 9.98]], null, [["music", 50.3], ["synthesizer", 10.06], ["musical instrument", 4.55]], [["hum", 39.38], ["throbbing", 25.06], ["music", 22.05]], [["music", 57.99], ["speech", 6.87], ["musical instrument", 4.84]], null, null, [["speech", 73.62], ["music", 9.68], ["timpani", 5.03]], [["music", 41.63], ["didgeridoo", 17.39], ["musical instrument", 5.85]], null], "duration": [0.67, 6.52, -0.21, 13.7, 11.79, 18.74, 46.45, 1.26, 2.39, 2.91, 33.38]} \ No newline at end of file diff --git a/annotations_1/xcc3vzgR9QQ_filtered.json b/annotations_1/xcc3vzgR9QQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7dc9d1a99a403aa28fd21b0e52fd81d3c82b2406 --- /dev/null +++ b/annotations_1/xcc3vzgR9QQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 30.45], [33.0, 39.28], [39.0, 71.14], [74.0, 74.7], [79.0, 80.15], [83.0, 83.86], [86.0, 85.95], [90.0, 90.51], [93.0, 94.22], [98.0, 99.23], [106.0, 108.04], [110.0, 111.84], [119.0, 119.01], [121.0, 122.3], [124.0, 124.83], [127.0, 126.64], [128.0, 128.97], [130.0, 132.24], [133.0, 138.06], [142.0, 144.39], [146.0, 149.64], [151.0, 151.44]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [52.92, 51.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.11, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 98.8, 98.86, 80.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [17.45, 6.28, 32.14, 0.7, 1.15, 0.86, -0.05, 0.51, 1.22, 1.23, 2.04, 1.84, 0.01, 1.3, 0.83, -0.36, 0.97, 2.24, 5.06, 2.39, 3.64, 0.44]} \ No newline at end of file diff --git a/annotations_1/xcfYbwSXFVw_filtered.json b/annotations_1/xcfYbwSXFVw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69604e4bde23d79659ce0527b17f6e25e541d27b --- /dev/null +++ b/annotations_1/xcfYbwSXFVw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.89], [6.0, 9.24], [11.0, 12.11], [14.0, 14.0], [15.0, 14.86], [16.0, 16.26], [17.0, 17.36], [22.0, 22.11], [25.0, 25.69], [28.0, 28.76], [38.0, 82.39], [88.0, 89.88], [91.0, 92.3], [93.0, 93.7], [94.0, 94.64], [96.0, 98.58], [100.0, 101.51], [103.0, 115.55], [117.0, 118.03], [121.0, 130.45], [133.0, 134.35], [139.0, 140.19], [148.0, 148.37], [150.0, 151.95], [153.0, 153.06], [161.0, 161.64], [173.0, 172.96], [176.0, 181.95], [182.0, 184.28], [186.0, 186.97], [188.0, 189.35], [190.0, 191.52], [194.0, 194.64], [196.0, 197.53], [203.0, 203.5], [205.0, 205.44], [207.0, 206.88], [209.0, 209.63], [211.0, 211.96], [213.0, 214.17], [215.0, 215.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.6, 0.0, 99.16, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.62, 93.45, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["effects unit", 22.99], ["echo", 10.17], ["distortion", 7.65]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.89, 3.24, 1.11, 0.0, -0.14, 0.26, 0.36, 0.11, 0.69, 0.76, 44.39, 1.88, 1.3, 0.7, 0.64, 2.58, 1.51, 12.55, 1.03, 9.45, 1.35, 1.19, 0.37, 1.95, 0.06, 0.64, -0.04, 5.95, 2.28, 0.97, 1.35, 1.52, 0.64, 1.53, 0.5, 0.44, -0.12, 0.63, 0.96, 1.17, 0.64]} \ No newline at end of file diff --git a/annotations_1/xd9K2o_ZDdU_filtered.json b/annotations_1/xd9K2o_ZDdU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6be5446d7255c32cbf5d92d6c9dc65df7f82925e --- /dev/null +++ b/annotations_1/xd9K2o_ZDdU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.87], [4.0, 4.83], [6.0, 7.75], [11.0, 11.82], [13.0, 15.21], [16.0, 17.93], [18.0, 19.53], [20.0, 22.11], [23.0, 23.06], [23.0, 25.27], [26.0, 28.86], [32.0, 36.9], [38.0, 40.46], [41.0, 41.89], [43.0, 44.44], [45.0, 52.12], [53.0, 53.96], [57.0, 57.52], [58.0, 63.31], [64.0, 76.0], [81.0, 82.17], [82.0, 89.21], [90.0, 95.44], [100.0, 130.71], [132.0, 140.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 100.0, 0.0, 95.78, 100.0, 82.07, 100.0, 0.0, 0.0, 98.66, 0.0, 0.0, 80.29, 49.27, 0.0, 42.69, 35.54, 0.0, 28.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 37.68], ["animal", 13.69], ["horse", 8.97]], null, [["speech", 57.6], ["clip-clop", 15.1], ["horse", 10.63]], [["speech", 47.54], ["throbbing", 12.89], ["hum", 10.39]], null, [["explosion", 44.54], ["groan", 22.81], ["burst, pop", 7.07]]], "duration": [1.87, 0.83, 1.75, 0.82, 2.21, 1.93, 1.53, 2.11, 0.06, 2.27, 2.86, 4.9, 2.46, 0.89, 1.44, 7.12, 0.96, 0.52, 5.31, 12.0, 1.17, 7.21, 5.44, 30.71, 8.88]} \ No newline at end of file diff --git a/annotations_1/xdnibOE5L40_filtered.json b/annotations_1/xdnibOE5L40_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0dda1c7be51c0d8cd4ef0f01f9ee3875d522273a --- /dev/null +++ b/annotations_1/xdnibOE5L40_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.56], [20.0, 20.14], [21.0, 21.63], [24.0, 31.92], [35.0, 35.77], [38.0, 39.95], [42.0, 41.91], [44.0, 44.69], [52.0, 53.82], [57.0, 58.21], [59.0, 59.9], [70.0, 72.13], [73.0, 79.27], [81.0, 85.48], [88.0, 88.72], [102.0, 102.17], [119.0, 122.55], [126.0, 127.25], [129.0, 131.6], [133.0, 133.44], [137.0, 137.35], [138.0, 138.91], [166.0, 168.32], [170.0, 170.36], [172.0, 172.45], [175.0, 175.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 33.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.25, 49.4, 74.44, 0.0, 0.0, 94.52, 0.0, 72.31, 0.0, 0.0, 0.0, 97.43, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 55.92], ["music", 13.07], ["knock", 4.06]], null, null, null, null, null, null, null, null, [["frog", 13.37], ["speech", 9.89], ["hum", 9.65]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.56, 0.14, 0.63, 7.92, 0.77, 1.95, -0.09, 0.69, 1.82, 1.21, 0.9, 2.13, 6.27, 4.48, 0.72, 0.17, 3.55, 1.25, 2.6, 0.44, 0.35, 0.91, 2.32, 0.36, 0.45, 0.95]} \ No newline at end of file diff --git a/annotations_1/xe6kO-SJYCk_filtered.json b/annotations_1/xe6kO-SJYCk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..18704d165c4a467d078220772cd5e45e407041f9 --- /dev/null +++ b/annotations_1/xe6kO-SJYCk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.21], [3.0, 4.56], [8.0, 10.54], [13.0, 13.32], [18.0, 20.12], [23.0, 23.87], [26.0, 26.82], [30.0, 30.32], [32.0, 33.1], [37.0, 37.02], [45.0, 45.18], [47.0, 48.2], [49.0, 48.78], [49.0, 53.25], [57.0, 58.24], [59.0, 59.63], [64.0, 66.83], [68.0, 69.26], [74.0, 75.76], [80.0, 80.99], [84.0, 85.26], [85.0, 101.53], [102.0, 101.7]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 94.07, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 54.63, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.21, 1.56, 2.54, 0.32, 2.12, 0.87, 0.82, 0.32, 1.1, 0.02, 0.18, 1.2, -0.22, 4.25, 1.24, 0.63, 2.83, 1.26, 1.76, 0.99, 1.26, 16.53, -0.3]} \ No newline at end of file diff --git a/annotations_1/xfF-ZL3xvxw_filtered.json b/annotations_1/xfF-ZL3xvxw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f2a19c0c19edd9f80adb6a29a9abfa983716eda3 --- /dev/null +++ b/annotations_1/xfF-ZL3xvxw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 18.13], [22.0, 24.41], [29.0, 29.76], [37.0, 49.22], [73.0, 73.95], [81.0, 81.97], [105.0, 105.17], [108.0, 108.8], [109.0, 109.88], [115.0, 115.5], [134.0, 136.98], [142.0, 157.13], [167.0, 168.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [36.71, 67.51, 0.0, 33.71, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.44, 38.43, 0.0], "audiomae_on_audioset": [[["music", 59.04], ["brass instrument", 5.95], ["musical instrument", 5.77]], null, null, [["music", 50.79], ["speech", 13.05], ["boing", 12.93]], null, null, null, null, null, null, [["livestock, farm animals, working animals", 15.74], ["fly, housefly", 15.0], ["cattle, bovinae", 8.4]], [["music", 44.28], ["boing", 33.79], ["speech", 13.56]], null], "duration": [5.13, 2.41, 0.76, 12.22, 0.95, 0.97, 0.17, 0.8, 0.88, 0.5, 2.98, 15.13, 1.88]} \ No newline at end of file diff --git a/annotations_1/xgX9WrVFO0Q_filtered.json b/annotations_1/xgX9WrVFO0Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba6ee77a3a89569f3545c8ec804ac89d6addd2f2 --- /dev/null +++ b/annotations_1/xgX9WrVFO0Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 14.42], [18.0, 49.72], [50.0, 95.55], [98.0, 127.35], [128.0, 131.99], [136.0, 141.72], [145.0, 147.09], [150.0, 156.95], [160.0, 160.95], [163.0, 168.08]], "keep_status": [true, false, false, true, false, false, false, false, false, false], "silence_prob": [29.42, 0.0, 0.0, 34.96, 62.68, 65.79, 64.75, 33.3, 0.0, 34.34], "audiomae_on_audioset": [[["speech", 44.7], ["music", 7.38], ["fly, housefly", 5.85]], null, null, [["hum", 39.11], ["sidetone", 16.77], ["throbbing", 13.16]], null, null, null, [["music", 56.25], ["theremin", 16.07], ["synthesizer", 8.23]], null, [["theremin", 42.36], ["music", 41.76], ["scary music", 2.79]]], "duration": [6.42, 31.72, 45.55, 29.35, 3.99, 5.72, 2.09, 6.95, 0.95, 5.08]} \ No newline at end of file diff --git a/annotations_1/xgkspBFxLi4_filtered.json b/annotations_1/xgkspBFxLi4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8eff9c82a24cd5d66794a030764d3d67fab6a9a --- /dev/null +++ b/annotations_1/xgkspBFxLi4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.72], [5.0, 6.57], [11.0, 11.64], [15.0, 16.53], [23.0, 23.28], [29.0, 29.71], [36.0, 36.44], [41.0, 42.35], [52.0, 52.96], [54.0, 56.05], [59.0, 59.12], [64.0, 65.01], [66.0, 67.76], [72.0, 72.93], [75.0, 75.56], [98.0, 101.98], [105.0, 106.62], [108.0, 108.6], [110.0, 111.21], [127.0, 129.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.03, 0.0, 0.0, 0.0, 0.0, 0.0, 54.17, 0.0, 0.0, 0.0, 36.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 46.8], ["speech", 24.92], ["foghorn", 12.69]]], "duration": [2.72, 1.57, 0.64, 1.53, 0.28, 0.71, 0.44, 1.35, 0.96, 2.05, 0.12, 1.01, 1.76, 0.93, 0.56, 3.98, 1.62, 0.6, 1.21, 2.15]} \ No newline at end of file diff --git a/annotations_1/xhgWGU6cQ00_filtered.json b/annotations_1/xhgWGU6cQ00_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d539baef45c44b44602c38691fa463696a80bd44 --- /dev/null +++ b/annotations_1/xhgWGU6cQ00_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[17.0, 16.98], [23.0, 25.02], [26.0, 26.52], [28.0, 29.12], [35.0, 35.24], [39.0, 38.74], [44.0, 44.1], [46.0, 47.87], [51.0, 51.16], [60.0, 59.95], [63.0, 63.41], [66.0, 66.33], [68.0, 68.12], [71.0, 71.73], [75.0, 75.42], [78.0, 78.38], [81.0, 82.92], [88.0, 88.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.02, 2.02, 0.52, 1.12, 0.24, -0.26, 0.1, 1.87, 0.16, -0.05, 0.41, 0.33, 0.12, 0.73, 0.42, 0.38, 1.92, 0.45]} \ No newline at end of file diff --git a/annotations_1/xhj4CAFsPt0_filtered.json b/annotations_1/xhj4CAFsPt0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fe373d37d8d0753cef113182ed4cf31d3f866171 --- /dev/null +++ b/annotations_1/xhj4CAFsPt0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.33], [5.0, 7.18], [8.0, 8.5], [20.0, 20.33], [21.0, 21.57], [22.0, 24.39], [26.0, 28.21], [31.0, 31.77], [35.0, 36.39], [37.0, 38.99], [39.0, 39.33], [45.0, 45.23], [52.0, 69.15], [71.0, 71.71], [77.0, 80.23], [89.0, 88.94], [104.0, 105.21], [107.0, 107.79], [108.0, 108.35], [109.0, 110.05], [113.0, 113.43], [114.0, 114.88], [120.0, 120.14], [130.0, 130.49], [131.0, 130.6], [131.0, 133.51], [141.0, 142.13], [144.0, 144.58], [146.0, 145.88], [147.0, 147.46], [151.0, 150.99], [154.0, 161.25], [167.0, 173.74], [175.0, 176.61]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 97.64, 0.0, 0.0, 0.0, 51.23, 91.81, 0.0, 0.0, 0.0, 0.0, 0.0, 56.63, 0.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.09, 0.0, 0.0, 0.0, 0.0, 0.0, 91.13, 87.74, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["boing", 30.75], ["speech", 9.44], ["snicker", 8.57]], null, null, null, null, null, null, null, null], "duration": [0.33, 2.18, 0.5, 0.33, 0.57, 2.39, 2.21, 0.77, 1.39, 1.99, 0.33, 0.23, 17.15, 0.71, 3.23, -0.06, 1.21, 0.79, 0.35, 1.05, 0.43, 0.88, 0.14, 0.49, -0.4, 2.51, 1.13, 0.58, -0.12, 0.46, -0.01, 7.25, 6.74, 1.61]} \ No newline at end of file diff --git a/annotations_1/xihdBpPICZY_filtered.json b/annotations_1/xihdBpPICZY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..628c49c86f594e3696af4afd4e61cba38c88a1db --- /dev/null +++ b/annotations_1/xihdBpPICZY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 33.94], [35.0, 60.12], [61.0, 80.1], [83.0, 146.31]], "keep_status": [false, false, false, false], "silence_prob": [0.0, 28.59, 28.66, 0.0], "audiomae_on_audioset": [null, [["hum", 36.78], ["throbbing", 33.55], ["music", 15.74]], [["music", 64.18], ["hum", 6.37], ["cacophony", 4.49]], null], "duration": [-0.06, 25.12, 19.1, 63.31]} \ No newline at end of file diff --git a/annotations_1/xiwtX0NC0uA_filtered.json b/annotations_1/xiwtX0NC0uA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26340655881141aef33973f7abb569817b2ed0de --- /dev/null +++ b/annotations_1/xiwtX0NC0uA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.67], [12.0, 29.2], [31.0, 48.64], [50.0, 66.02], [70.0, 97.17], [99.0, 107.47], [109.0, 109.66], [116.0, 121.95], [124.0, 131.09], [131.0, 131.45], [131.0, 140.75], [147.0, 147.45], [152.0, 152.1], [153.0, 153.44], [155.0, 156.05]], "keep_status": [false, true, false, false, true, true, false, true, true, false, true, false, false, false, false], "silence_prob": [0.0, 28.48, 28.53, 28.63, 28.66, 28.81, 0.0, 28.62, 28.59, 0.0, 29.83, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 27.76], ["music", 16.71], ["whack, thwack", 16.63]], [["music", 79.56], ["musical instrument", 2.47], ["speech", 1.28]], [["music", 52.69], ["cacophony", 12.8], ["buzz", 4.66]], [["buzz", 41.24], ["music", 18.24], ["speech", 6.34]], [["music", 49.41], ["speech", 5.48], ["cattle, bovinae", 5.03]], null, [["speech", 39.89], ["bang", 10.32], ["explosion", 7.25]], [["buzz", 37.99], ["hum", 18.15], ["music", 11.84]], null, [["speech", 33.16], ["music", 19.03], ["eruption", 11.71]], null, null, null, null], "duration": [1.67, 17.2, 17.64, 16.02, 27.17, 8.47, 0.66, 5.95, 7.09, 0.45, 9.75, 0.45, 0.1, 0.44, 1.05]} \ No newline at end of file diff --git a/annotations_1/xjAHbBY-UUM_filtered.json b/annotations_1/xjAHbBY-UUM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13456a05f1ee16d0f19d11187c703c22da7b7a31 --- /dev/null +++ b/annotations_1/xjAHbBY-UUM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[31.0, 31.46], [32.0, 37.18], [38.0, 45.4], [47.0, 47.78], [48.0, 49.64], [56.0, 57.6], [58.0, 60.47], [62.0, 63.95], [65.0, 65.52], [66.0, 66.38], [67.0, 70.87], [71.0, 71.14], [75.0, 74.75], [75.0, 74.95], [94.0, 95.28], [97.0, 99.18], [100.0, 100.03], [104.0, 105.14], [107.0, 107.55], [123.0, 128.22], [133.0, 135.41], [137.0, 137.49], [138.0, 138.91], [142.0, 143.07], [155.0, 156.61], [158.0, 169.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 64.18, 55.46, 0.0, 0.0, 0.0, 91.64, 0.0, 0.0, 0.0, 62.58, 0.0, 0.0, 0.0, 0.0, 42.04, 0.0, 0.0, 0.0, 78.72, 99.85, 0.0, 0.0, 0.0, 0.0, 42.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["synthesizer", 11.6], ["sidetone", 11.51], ["tuning fork", 7.0]], null, null, null, null, null, null, null, null, null, [["speech", 36.63], ["music", 33.97], ["thunk", 8.82]]], "duration": [0.46, 5.18, 7.4, 0.78, 1.64, 1.6, 2.47, 1.95, 0.52, 0.38, 3.87, 0.14, -0.25, -0.05, 1.28, 2.18, 0.03, 1.14, 0.55, 5.22, 2.41, 0.49, 0.91, 1.07, 1.61, 11.2]} \ No newline at end of file diff --git a/annotations_1/xjdKPS6-8XU_filtered.json b/annotations_1/xjdKPS6-8XU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aef6117d411e6e46a9955783b4c62f6f774c2fd5 --- /dev/null +++ b/annotations_1/xjdKPS6-8XU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.31], [12.0, 12.61], [13.0, 13.24], [14.0, 23.57], [26.0, 26.43], [28.0, 27.78], [31.0, 31.36], [34.0, 34.3], [37.0, 37.61], [40.0, 42.65], [43.0, 44.96], [47.0, 47.88], [49.0, 49.69], [55.0, 55.63], [58.0, 59.51], [62.0, 62.26], [64.0, 64.47], [69.0, 69.6], [71.0, 71.29], [73.0, 72.89], [75.0, 75.05], [77.0, 77.68], [80.0, 80.35], [83.0, 83.27], [85.0, 85.56], [89.0, 89.13], [91.0, 92.04], [94.0, 94.85], [97.0, 97.36], [97.0, 97.44], [103.0, 103.77], [106.0, 106.1], [108.0, 108.38], [114.0, 119.69], [121.0, 121.29], [122.0, 124.07], [126.0, 128.66], [132.0, 133.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 83.52, 0.0, 0.0, 0.0, 0.0, 0.0, 98.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.71, 0.0, 97.64, 96.77, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.31, 0.61, 0.24, 9.57, 0.43, -0.22, 0.36, 0.3, 0.61, 2.65, 1.96, 0.88, 0.69, 0.63, 1.51, 0.26, 0.47, 0.6, 0.29, -0.11, 0.05, 0.68, 0.35, 0.27, 0.56, 0.13, 1.04, 0.85, 0.36, 0.44, 0.77, 0.1, 0.38, 5.69, 0.29, 2.07, 2.66, 1.15]} \ No newline at end of file diff --git a/annotations_1/xkMijsfMZBU_filtered.json b/annotations_1/xkMijsfMZBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..07b5df6c39d070b827422a27964915f83e465757 --- /dev/null +++ b/annotations_1/xkMijsfMZBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.92], [5.0, 6.1], [10.0, 10.83], [15.0, 14.99], [18.0, 18.39], [20.0, 20.63], [29.0, 30.6], [31.0, 32.88], [34.0, 34.89], [36.0, 37.18], [38.0, 42.55], [44.0, 62.41], [64.0, 74.8], [77.0, 88.1], [92.0, 92.48], [94.0, 95.99], [98.0, 98.85], [104.0, 109.34], [113.0, 114.2], [116.0, 119.48], [122.0, 129.44], [130.0, 132.78], [139.0, 144.36], [148.0, 148.66]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, true, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.04, 30.0, 29.03, 29.28, 0.0, 0.0, 0.0, 30.78, 0.0, 30.01, 31.69, 38.46, 29.42, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 53.91], ["crowd", 12.12], ["theremin", 3.4]], [["music", 65.55], ["burst, pop", 4.69], ["fireworks", 3.31]], [["music", 30.5], ["vehicle", 18.62], ["car", 14.86]], null, null, null, [["music", 79.58], ["guitar", 1.95], ["theremin", 1.74]], null, [["music", 57.03], ["speech", 15.19], ["crowd", 6.21]], [["music", 31.37], ["speech", 28.86], ["burst, pop", 6.52]], [["male singing", 16.56], ["speech", 6.88], ["music", 5.99]], [["livestock, farm animals, working animals", 26.35], ["moo", 11.35], ["cattle, bovinae", 10.28]], null], "duration": [0.92, 1.1, 0.83, -0.01, 0.39, 0.63, 1.6, 1.88, 0.89, 1.18, 4.55, 18.41, 10.8, 11.1, 0.48, 1.99, 0.85, 5.34, 1.2, 3.48, 7.44, 2.78, 5.36, 0.66]} \ No newline at end of file diff --git a/annotations_1/xkjfSZtHBXc_filtered.json b/annotations_1/xkjfSZtHBXc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e114d8a4dca3692eb02e7ad5a0495fee48308735 --- /dev/null +++ b/annotations_1/xkjfSZtHBXc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[81.0, 80.82], [82.0, 82.05], [83.0, 83.81], [85.0, 87.34], [89.0, 168.51], [169.0, 168.91]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.21, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["fly, housefly", 24.73], ["insect", 22.12], ["music", 17.0]], null, null], "duration": [-0.18, 0.05, 0.81, 2.34, 79.51, -0.09]} \ No newline at end of file diff --git a/annotations_1/xkzlZGohQ_4_filtered.json b/annotations_1/xkzlZGohQ_4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6406dae8f859d7e16999cc4769672b07506f1362 --- /dev/null +++ b/annotations_1/xkzlZGohQ_4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.85], [34.0, 36.37], [37.0, 39.01], [42.0, 42.75], [48.0, 56.29], [60.0, 62.58], [67.0, 94.56], [100.0, 110.39], [113.0, 115.62], [118.0, 119.52], [120.0, 122.82], [123.0, 124.5], [127.0, 127.95], [130.0, 132.0], [147.0, 151.11], [153.0, 153.59]], "keep_status": [false, false, false, false, false, true, true, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 40.5, 36.37, 0.0, 34.57, 36.1, 29.69, 29.74, 30.75, 0.0, 35.58, 0.0, 0.0, 35.84, 30.0, 0.0], "audiomae_on_audioset": [null, [["music", 38.7], ["speech", 30.72], ["didgeridoo", 4.28]], [["music", 63.75], ["speech", 16.79], ["sidetone", 3.89]], null, [["throbbing", 34.4], ["hum", 29.33], ["music", 20.08]], [["music", 55.66], ["didgeridoo", 7.46], ["hum", 5.2]], [["music", 36.68], ["speech", 14.65], ["throbbing", 10.9]], [["music", 72.18], ["hum", 6.32], ["breaking", 5.28]], [["music", 40.56], ["throbbing", 27.01], ["hum", 12.99]], null, [["music", 59.44], ["didgeridoo", 9.69], ["musical instrument", 5.29]], null, null, [["music", 51.58], ["speech", 9.35], ["hum", 7.62]], [["music", 19.8], ["hum", 17.0], ["throbbing", 12.23]], null], "duration": [0.85, 2.37, 2.01, 0.75, 8.29, 2.58, 27.56, 10.39, 2.62, 1.52, 2.82, 1.5, 0.95, 2.0, 4.11, 0.59]} \ No newline at end of file diff --git a/annotations_1/xlAwSNbAY8E_filtered.json b/annotations_1/xlAwSNbAY8E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a12937302681cdfda255b808b7c166495ed5b479 --- /dev/null +++ b/annotations_1/xlAwSNbAY8E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.91], [5.0, 5.46], [6.0, 6.93], [10.0, 11.89], [13.0, 14.98], [16.0, 16.92], [18.0, 21.12], [23.0, 46.9], [49.0, 50.08], [52.0, 54.38], [57.0, 57.96], [59.0, 60.05], [62.0, 63.32], [66.0, 67.0], [68.0, 69.01], [70.0, 70.83], [74.0, 81.78], [83.0, 89.33], [89.0, 89.43], [89.0, 89.51], [90.0, 89.77], [90.0, 98.98], [100.0, 129.2], [130.0, 130.64], [131.0, 132.22], [135.0, 135.8], [136.0, 138.92], [140.0, 145.77], [149.0, 150.47], [155.0, 156.59], [160.0, 159.81], [160.0, 159.92], [163.0, 163.11], [165.0, 167.17], [169.0, 170.6], [172.0, 180.18]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.37, 54.23, 0.0, 96.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.98, 38.98, 0.0, 0.0, 0.0, 36.57, 32.93, 0.0, 0.0, 0.0, 99.96, 67.38, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 0.0, 50.36], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 65.69], ["sonar", 17.49], ["electronic music", 4.53]], [["music", 44.6], ["hum", 13.24], ["speech", 11.82]], null, null, null, [["music", 68.13], ["throbbing", 9.69], ["electronic music", 6.04]], [["music", 45.33], ["throbbing", 22.36], ["hum", 16.66]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.91, 0.46, 0.93, 1.89, 1.98, 0.92, 3.12, 23.9, 1.08, 2.38, 0.96, 1.05, 1.32, 1.0, 1.01, 0.83, 7.78, 6.33, 0.43, 0.51, -0.23, 8.98, 29.2, 0.64, 1.22, 0.8, 2.92, 5.77, 1.47, 1.59, -0.19, -0.08, 0.11, 2.17, 1.6, 8.18]} \ No newline at end of file diff --git a/annotations_1/xllpnvAmnHE_filtered.json b/annotations_1/xllpnvAmnHE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84c15bbebb1ed75467f5382838a59c4d3003b9a2 --- /dev/null +++ b/annotations_1/xllpnvAmnHE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.39], [5.0, 5.53], [7.0, 7.82], [12.0, 12.21], [20.0, 24.7], [31.0, 32.44], [33.0, 35.9], [36.0, 36.24], [37.0, 48.78], [50.0, 54.01], [54.0, 55.68], [65.0, 65.15], [69.0, 72.49], [78.0, 78.33], [86.0, 87.84], [100.0, 101.34], [102.0, 105.61], [112.0, 112.56], [117.0, 120.36], [124.0, 123.99], [127.0, 127.5], [130.0, 131.03], [139.0, 139.09], [139.0, 140.12], [145.0, 146.72], [148.0, 148.8], [153.0, 155.6]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 33.89, 0.0, 100.0, 0.0, 49.5, 48.19, 0.0, 0.0, 36.75, 0.0, 0.0, 0.0, 50.06, 0.0, 41.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 71.87], "audiomae_on_audioset": [null, null, null, null, [["speech", 33.45], ["thunk", 13.44], ["whack, thwack", 5.92]], null, null, null, [["speech", 85.45], ["sidetone", 7.42], ["whale vocalization", 1.03]], [["speech", 52.32], ["hum", 10.77], ["sidetone", 9.9]], null, null, [["speech", 59.0], ["sidetone", 24.13], ["speech synthesizer", 5.86]], null, null, null, null, null, [["speech", 61.61], ["livestock, farm animals, working animals", 6.48], ["moo", 4.45]], null, null, null, null, null, null, null, null], "duration": [0.39, 0.53, 0.82, 0.21, 4.7, 1.44, 2.9, 0.24, 11.78, 4.01, 1.68, 0.15, 3.49, 0.33, 1.84, 1.34, 3.61, 0.56, 3.36, -0.01, 0.5, 1.03, 0.09, 1.12, 1.72, 0.8, 2.6]} \ No newline at end of file diff --git a/annotations_1/xm2ztDqbbZE_filtered.json b/annotations_1/xm2ztDqbbZE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70adb30390f5d87367d0c6845fcad46ce1464b8d --- /dev/null +++ b/annotations_1/xm2ztDqbbZE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.3], [7.0, 9.21], [10.0, 11.28], [12.0, 17.56], [22.0, 23.72], [25.0, 25.69], [26.0, 27.6], [29.0, 35.01], [46.0, 59.56], [67.0, 67.2], [68.0, 84.96], [88.0, 98.98], [105.0, 110.0]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.81, 0.0, 30.55, 0.0, 0.0, 0.0, 99.98, 30.79, 0.0, 35.03, 31.85, 30.94], "audiomae_on_audioset": [null, [["explosion", 13.41], ["speech", 8.67], ["burst, pop", 7.25]], null, [["speech", 64.66], ["breaking", 15.64], ["explosion", 2.91]], null, null, null, null, [["speech", 49.14], ["noise", 34.07], ["music", 2.83]], null, [["music", 61.12], ["speech", 22.34], ["electronic music", 1.02]], [["speech", 38.91], ["music", 25.72], ["burst, pop", 5.7]], [["music", 60.02], ["speech", 14.37], ["boing", 5.36]]], "duration": [0.3, 2.21, 1.28, 5.56, 1.72, 0.69, 1.6, 6.01, 13.56, 0.2, 16.96, 10.98, 5.0]} \ No newline at end of file diff --git a/annotations_1/xmihht20Z0E_filtered.json b/annotations_1/xmihht20Z0E_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b15b83a2ad0e8f4730c6a6069b897b75170043f --- /dev/null +++ b/annotations_1/xmihht20Z0E_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 3.84], [5.0, 88.15], [89.0, 89.48], [90.0, 91.34], [103.0, 103.54], [106.0, 107.65], [108.0, 108.51], [112.0, 118.1], [119.0, 119.79]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.34, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 49.6], ["music", 14.41], ["vehicle", 10.89]], null], "duration": [-0.16, 83.15, 0.48, 1.34, 0.54, 1.65, 0.51, 6.1, 0.79]} \ No newline at end of file diff --git a/annotations_1/xmzkZ12GMAs_filtered.json b/annotations_1/xmzkZ12GMAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/xmzkZ12GMAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/xof2LkhAFGU_filtered.json b/annotations_1/xof2LkhAFGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ba20aa26dd7490bb771786baf74bbee8742b7802 --- /dev/null +++ b/annotations_1/xof2LkhAFGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.62], [7.0, 7.6], [37.0, 37.29], [44.0, 57.99], [59.0, 63.12], [66.0, 66.8], [68.0, 68.55], [78.0, 77.84], [96.0, 97.24], [99.0, 101.16], [104.0, 105.21], [116.0, 116.82], [118.0, 118.93], [119.0, 126.17], [127.0, 127.5], [130.0, 130.79], [133.0, 135.73], [137.0, 138.72]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 99.21, 84.62, 0.0, 0.0, 0.0, 0.0, 97.22, 0.0, 0.0, 0.0, 63.31, 0.0, 0.0, 63.53, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.62, 0.6, 0.29, 13.99, 4.12, 0.8, 0.55, -0.16, 1.24, 2.16, 1.21, 0.82, 0.93, 7.17, 0.5, 0.79, 2.73, 1.72]} \ No newline at end of file diff --git a/annotations_1/xqeAW5qAHNQ_filtered.json b/annotations_1/xqeAW5qAHNQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..251f4dfe205290a9273396f47c5b919f6abf9db4 --- /dev/null +++ b/annotations_1/xqeAW5qAHNQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 13.83], [15.0, 15.31], [17.0, 36.15], [42.0, 41.88], [52.0, 52.07], [52.0, 55.26], [60.0, 66.53], [68.0, 67.66], [70.0, 70.28]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 84.07, 0.0, 0.0, 40.17, 31.3, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 66.96], ["speech synthesizer", 5.89], ["mechanisms", 3.17]], [["music", 47.2], ["didgeridoo", 24.54], ["speech", 14.9]], null, null], "duration": [1.83, 0.31, 19.15, -0.12, 0.07, 3.26, 6.53, -0.34, 0.28]} \ No newline at end of file diff --git a/annotations_1/xqmqskVELNs_filtered.json b/annotations_1/xqmqskVELNs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..702a682bea69ca8d9f9efbe670cd564aecdf85e4 --- /dev/null +++ b/annotations_1/xqmqskVELNs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[35.0, 37.49], [38.0, 37.61], [38.0, 37.93], [38.0, 41.18], [100.0, 106.29], [119.0, 120.16], [137.0, 137.27], [167.0, 167.59]], "keep_status": [false, false, false, true, false, false, false, false], "silence_prob": [30.6, 0.0, 0.0, 31.63, 30.58, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 61.68], ["musical instrument", 7.22], ["mantra", 4.75]], null, null, [["music", 32.65], ["mantra", 13.38], ["male singing", 5.64]], [["speech", 83.97], ["horse", 2.53], ["outside, rural or natural", 1.69]], null, null, null], "duration": [2.49, -0.39, -0.07, 3.18, 6.29, 1.16, 0.27, 0.59]} \ No newline at end of file diff --git a/annotations_1/xqtbz-pVp2g_filtered.json b/annotations_1/xqtbz-pVp2g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56b903e1db773350c8c967f69490f178920e05ea --- /dev/null +++ b/annotations_1/xqtbz-pVp2g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.75], [10.0, 12.12], [13.0, 13.86], [16.0, 17.02], [31.0, 31.63], [34.0, 37.02], [38.0, 38.42], [41.0, 41.84], [42.0, 43.16], [44.0, 44.41], [45.0, 48.19], [51.0, 51.39], [55.0, 56.86], [63.0, 63.64], [66.0, 66.01], [70.0, 70.61], [72.0, 72.28], [77.0, 77.65], [78.0, 80.99], [83.0, 84.86], [88.0, 91.47], [95.0, 103.64], [108.0, 108.43], [109.0, 109.97], [110.0, 110.89], [112.0, 111.96]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 41.95, 0.0, 0.0, 0.0, 47.23, 0.0, 0.0, 0.0, 0.0, 51.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.23, 0.0, 34.59, 35.01, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 38.64], ["didgeridoo", 31.54], ["speech", 5.01]], null, null, null, [["speech", 31.52], ["radio", 14.65], ["music", 14.34]], null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 42.41], ["music", 15.83], ["radio", 9.2]], null, [["music", 67.42], ["synthesizer", 8.4], ["didgeridoo", 3.2]], [["music", 45.41], ["speech", 19.83], ["doorbell", 12.45]], null, null, null, null], "duration": [0.75, 2.12, 0.86, 1.02, 0.63, 3.02, 0.42, 0.84, 1.16, 0.41, 3.19, 0.39, 1.86, 0.64, 0.01, 0.61, 0.28, 0.65, 2.99, 1.86, 3.47, 8.64, 0.43, 0.97, 0.89, -0.04]} \ No newline at end of file diff --git a/annotations_1/xrO8AQ4CrKk_filtered.json b/annotations_1/xrO8AQ4CrKk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ba0b3ed9cb7c0052ccfacd8ad44730c1ea70d29 --- /dev/null +++ b/annotations_1/xrO8AQ4CrKk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.74], [20.0, 25.42], [26.0, 26.57], [28.0, 145.13], [146.0, 164.44], [165.0, 167.44]], "keep_status": [false, false, false, false, false, false], "silence_prob": [53.16, 51.99, 0.0, 0.0, 29.49, 29.28], "audiomae_on_audioset": [null, null, null, null, [["hum", 43.15], ["mains hum", 28.62], ["music", 9.16]], [["vehicle", 37.37], ["car", 28.74], ["race car, auto racing", 10.17]]], "duration": [3.74, 5.42, 0.57, 117.13, 18.44, 2.44]} \ No newline at end of file diff --git a/annotations_1/xs8jGY2dnCg_filtered.json b/annotations_1/xs8jGY2dnCg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4704beca5b11c4cc738eb67be834721c4fe0be91 --- /dev/null +++ b/annotations_1/xs8jGY2dnCg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.37], [14.0, 19.68], [22.0, 24.22], [25.0, 26.23], [31.0, 44.2], [45.0, 46.43], [50.0, 49.99], [53.0, 55.29], [58.0, 59.24], [63.0, 70.17], [74.0, 74.58], [79.0, 87.35], [92.0, 92.99], [96.0, 101.83], [104.0, 114.34], [117.0, 116.83], [119.0, 130.49], [134.0, 138.28], [142.0, 154.8], [162.0, 163.7], [165.0, 175.74], [177.0, 179.14], [182.0, 189.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [91.98, 100.0, 100.0, 0.0, 97.33, 0.0, 0.0, 80.11, 0.0, 31.4, 0.0, 67.89, 0.0, 30.99, 30.95, 0.0, 30.87, 31.05, 30.62, 0.0, 37.93, 93.76, 64.07], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["speech", 37.94], ["breaking", 27.54], ["inside, small room", 7.34]], null, null, null, [["speech", 39.82], ["whack, thwack", 23.16], ["smash, crash", 12.23]], [["speech", 75.35], ["whack, thwack", 8.69], ["breaking", 4.61]], null, [["whack, thwack", 69.51], ["speech", 6.86], ["fart", 4.84]], [["speech", 40.65], ["thunk", 15.89], ["fart", 15.77]], [["speech", 19.21], ["whack, thwack", 16.63], ["fart", 10.53]], null, [["speech", 64.19], ["crow", 9.41], ["caw", 6.23]], null, null], "duration": [3.37, 5.68, 2.22, 1.23, 13.2, 1.43, -0.01, 2.29, 1.24, 7.17, 0.58, 8.35, 0.99, 5.83, 10.34, -0.17, 11.49, 4.28, 12.8, 1.7, 10.74, 2.14, 7.01]} \ No newline at end of file diff --git a/annotations_1/xsHxWhCydMI_filtered.json b/annotations_1/xsHxWhCydMI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4574177cfb7e028713838312e03261afd841c83 --- /dev/null +++ b/annotations_1/xsHxWhCydMI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 23.19], [30.0, 30.57], [39.0, 39.5], [50.0, 50.03], [55.0, 55.02], [62.0, 61.84], [67.0, 67.29], [75.0, 75.88], [81.0, 82.51], [91.0, 91.88], [99.0, 99.94], [109.0, 110.19], [128.0, 128.8], [140.0, 139.72], [143.0, 144.49]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 50.32], ["wind instrument, woodwind instrument", 10.95], ["speech", 5.78]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [8.19, 0.57, 0.5, 0.03, 0.02, -0.16, 0.29, 0.88, 1.51, 0.88, 0.94, 1.19, 0.8, -0.28, 1.49]} \ No newline at end of file diff --git a/annotations_1/xsK7WF3jWI4_filtered.json b/annotations_1/xsK7WF3jWI4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fa2925c460a0da7b3ed40a2b510c5d51a43260ec --- /dev/null +++ b/annotations_1/xsK7WF3jWI4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.38], [3.0, 4.43], [5.0, 24.27], [26.0, 29.03], [31.0, 31.85], [36.0, 36.54], [40.0, 56.42], [59.0, 59.76], [62.0, 63.02], [66.0, 67.95], [70.0, 70.78], [74.0, 75.68], [77.0, 77.87], [79.0, 81.28], [83.0, 87.78], [90.0, 89.95], [92.0, 92.16], [94.0, 94.63], [98.0, 99.17], [101.0, 102.41], [106.0, 107.11], [109.0, 109.86], [112.0, 119.85], [127.0, 127.8]], "keep_status": [false, false, true, true, false, false, true, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.71, 32.09, 0.0, 0.0, 31.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.25, 31.93, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.8, 0.0], "audiomae_on_audioset": [null, null, [["didgeridoo", 29.74], ["fly, housefly", 15.67], ["music", 15.4]], [["livestock, farm animals, working animals", 16.95], ["cattle, bovinae", 14.84], ["moo", 14.17]], null, null, [["music", 15.61], ["fly, housefly", 13.65], ["buzz", 10.53]], null, null, null, null, null, null, [["moo", 19.08], ["livestock, farm animals, working animals", 18.16], ["cattle, bovinae", 17.21]], [["speech", 32.47], ["sidetone", 15.03], ["vehicle", 6.39]], null, null, null, null, null, null, null, [["speech", 47.48], ["music", 28.21], ["explosion", 1.6]], null], "duration": [0.38, 1.43, 19.27, 3.03, 0.85, 0.54, 16.42, 0.76, 1.02, 1.95, 0.78, 1.68, 0.87, 2.28, 4.78, -0.05, 0.16, 0.63, 1.17, 1.41, 1.11, 0.86, 7.85, 0.8]} \ No newline at end of file diff --git a/annotations_1/xswJpwb7Afs_filtered.json b/annotations_1/xswJpwb7Afs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd839781b508b67dd4379b34954a3cf641f50b6b --- /dev/null +++ b/annotations_1/xswJpwb7Afs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.27], [27.0, 32.0], [32.0, 35.5], [36.0, 35.72], [36.0, 36.14], [39.0, 44.42], [49.0, 57.42], [58.0, 65.1], [70.0, 71.69], [77.0, 82.39], [96.0, 98.04], [100.0, 100.11], [105.0, 105.26], [106.0, 108.06], [110.0, 110.52], [113.0, 113.54], [119.0, 126.93]], "keep_status": [false, true, true, false, false, true, false, false, false, false, false, false, false, true, false, false, true], "silence_prob": [0.0, 29.14, 29.28, 0.0, 0.0, 31.28, 31.74, 31.86, 0.0, 31.16, 70.58, 0.0, 0.0, 47.05, 0.0, 0.0, 32.02], "audiomae_on_audioset": [null, [["livestock, farm animals, working animals", 38.6], ["cattle, bovinae", 16.82], ["moo", 13.54]], [["speech", 42.84], ["music", 20.62], ["mains hum", 4.26]], null, null, [["groan", 20.23], ["music", 12.77], ["animal", 11.08]], [["speech", 50.24], ["music", 29.43], ["groan", 7.3]], [["music", 45.28], ["speech", 37.03], ["electronic music", 1.56]], null, [["music", 61.23], ["speech", 10.92], ["hum", 5.74]], null, null, null, [["music", 39.19], ["speech", 12.71], ["synthesizer", 4.0]], null, null, [["music", 33.81], ["fly, housefly", 13.74], ["breaking", 12.6]]], "duration": [0.27, 5.0, 3.5, -0.28, 0.14, 5.42, 8.42, 7.1, 1.69, 5.39, 2.04, 0.11, 0.26, 2.06, 0.52, 0.54, 7.93]} \ No newline at end of file diff --git a/annotations_1/xuhl1rceZdE_filtered.json b/annotations_1/xuhl1rceZdE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..04ca0fd025ba20a2ccde766491b5acea5dacb86e --- /dev/null +++ b/annotations_1/xuhl1rceZdE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 36.91], [38.0, 40.05], [42.0, 44.14], [46.0, 132.29], [135.0, 166.94]], "keep_status": [true, true, true, false, false], "silence_prob": [29.78, 31.88, 32.31, 0.0, 0.0], "audiomae_on_audioset": [[["music", 23.28], ["speech", 8.16], ["burst, pop", 6.97]], [["music", 14.38], ["speech", 10.41], ["gunshot, gunfire", 9.51]], [["speech", 32.94], ["thunk", 11.33], ["gunshot, gunfire", 10.04]], null, null], "duration": [6.91, 2.05, 2.14, 86.29, 31.94]} \ No newline at end of file diff --git a/annotations_1/xvZRXcg4iS8_filtered.json b/annotations_1/xvZRXcg4iS8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..942ad0e265fe55a7b1d5c1630e094345a008f203 --- /dev/null +++ b/annotations_1/xvZRXcg4iS8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 16.98], [18.0, 19.21], [26.0, 26.18], [28.0, 30.74], [38.0, 41.88], [45.0, 44.88], [55.0, 59.27], [60.0, 60.3], [64.0, 64.54], [65.0, 79.34], [84.0, 90.17], [90.0, 96.16], [98.0, 154.77], [156.0, 157.6], [159.0, 159.36], [160.0, 160.59], [168.0, 168.86], [170.0, 170.21]], "keep_status": [false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 46.9, 67.51, 0.0, 46.47, 0.0, 0.0, 67.51, 40.12, 40.92, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["thunk", 16.82], ["fart", 15.82], ["walk, footsteps", 4.87]], null, null, [["groan", 20.68], ["animal", 18.04], ["grunt", 11.85]], null, null, null, [["music", 63.36], ["guitar", 8.71], ["musical instrument", 5.16]], [["music", 56.02], ["guitar", 9.29], ["musical instrument", 8.89]], null, null, null, null, null, null], "duration": [0.98, 1.21, 0.18, 2.74, 3.88, -0.12, 4.27, 0.3, 0.54, 14.34, 6.17, 6.16, 56.77, 1.6, 0.36, 0.59, 0.86, 0.21]} \ No newline at end of file diff --git a/annotations_1/xwfJyzB6dow_filtered.json b/annotations_1/xwfJyzB6dow_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..984d1bcec3b8b307a5c77d6d709f00ef4cc351ce --- /dev/null +++ b/annotations_1/xwfJyzB6dow_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[37.0, 37.77], [43.0, 44.61], [53.0, 53.32], [57.0, 57.97], [61.0, 62.07], [72.0, 72.39], [78.0, 77.94], [89.0, 88.75]], "keep_status": [false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null], "duration": [0.77, 1.61, 0.32, 0.97, 1.07, 0.39, -0.06, -0.25]} \ No newline at end of file diff --git a/annotations_1/xwjw5TFPKwA_filtered.json b/annotations_1/xwjw5TFPKwA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b0bf078bd12859238abdba79edd45267d6b9528d --- /dev/null +++ b/annotations_1/xwjw5TFPKwA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[49.0, 50.14], [51.0, 51.75], [53.0, 87.3], [88.0, 88.94], [89.0, 119.01], [123.0, 123.04]], "keep_status": [false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null], "duration": [1.14, 0.75, 34.3, 0.94, 30.01, 0.04]} \ No newline at end of file diff --git a/annotations_1/xxGmwvrt4ZA_filtered.json b/annotations_1/xxGmwvrt4ZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a66a495320682983c6d25b9dd17c844b39be71d7 --- /dev/null +++ b/annotations_1/xxGmwvrt4ZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.49], [32.0, 33.18], [48.0, 59.7], [64.0, 73.38], [78.0, 109.63], [116.0, 147.8]], "keep_status": [false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 45.4, 30.32, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 52.66], ["electronic music", 5.8], ["throbbing", 3.71]], [["music", 47.35], ["speech", 11.97], ["hum", 7.87]], null, null], "duration": [0.49, 1.18, 11.7, 9.38, 31.63, 31.8]} \ No newline at end of file diff --git a/annotations_1/xxl1Hrw2eQM_filtered.json b/annotations_1/xxl1Hrw2eQM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11f4cb47d60f9a2f46abc419c0a00beae36d1fcc --- /dev/null +++ b/annotations_1/xxl1Hrw2eQM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.76], [8.0, 15.3], [17.0, 18.89], [19.0, 23.67], [26.0, 26.43], [27.0, 33.56], [34.0, 38.5], [40.0, 41.96], [45.0, 46.82], [47.0, 50.14], [51.0, 52.68], [54.0, 57.03], [67.0, 68.22], [70.0, 73.74], [76.0, 76.87], [78.0, 79.24], [82.0, 89.43], [97.0, 101.83], [103.0, 107.5], [111.0, 110.76], [112.0, 112.65], [114.0, 120.5], [125.0, 130.59], [132.0, 134.1], [137.0, 143.45], [145.0, 145.59], [146.0, 156.32]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, true, true, false, false, true], "silence_prob": [0.0, 42.42, 0.0, 53.72, 0.0, 56.78, 55.46, 0.0, 0.0, 63.21, 0.0, 68.28, 0.0, 59.68, 0.0, 0.0, 77.87, 43.53, 41.89, 0.0, 0.0, 43.77, 36.26, 44.99, 38.72, 0.0, 34.58], "audiomae_on_audioset": [null, [["cattle, bovinae", 22.32], ["livestock, farm animals, working animals", 15.05], ["moo", 9.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 52.04], ["singing bowl", 14.17], ["speech", 11.51]], [["speech", 34.66], ["whale vocalization", 16.54], ["music", 13.84]], null, null, [["music", 54.75], ["speech", 7.0], ["synthesizer", 5.43]], [["music", 34.19], ["fly, housefly", 13.11], ["insect", 6.59]], [["music", 37.36], ["hiccup", 27.15], ["synthesizer", 3.24]], [["music", 66.73], ["marimba, xylophone", 9.08], ["mallet percussion", 2.88]], null, [["music", 40.61], ["fly, housefly", 10.4], ["speech", 4.77]]], "duration": [0.76, 7.3, 1.89, 4.67, 0.43, 6.56, 4.5, 1.96, 1.82, 3.14, 1.68, 3.03, 1.22, 3.74, 0.87, 1.24, 7.43, 4.83, 4.5, -0.24, 0.65, 6.5, 5.59, 2.1, 6.45, 0.59, 10.32]} \ No newline at end of file diff --git a/annotations_1/xxulNn8UDtY_filtered.json b/annotations_1/xxulNn8UDtY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0bead0d49d2f221bd98f42425efbb3f621a227dc --- /dev/null +++ b/annotations_1/xxulNn8UDtY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.96], [6.0, 6.69], [8.0, 14.28], [17.0, 19.26], [34.0, 34.1], [36.0, 37.94], [41.0, 41.86], [43.0, 53.96], [56.0, 61.5], [62.0, 84.5], [86.0, 127.06], [127.0, 127.09], [128.0, 129.98], [130.0, 134.6]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.48, 31.43, 0.0, 0.0, 0.0, 68.28, 96.89, 38.15, 0.0, 0.0, 0.0, 31.16], "audiomae_on_audioset": [null, null, null, [["baby laughter", 13.74], ["livestock, farm animals, working animals", 11.29], ["cattle, bovinae", 10.66]], null, null, null, null, null, [["music", 53.61], ["theremin", 17.41], ["synthesizer", 6.63]], null, null, null, [["music", 61.44], ["speech", 13.78], ["boing", 9.82]]], "duration": [0.96, 0.69, 6.28, 2.26, 0.1, 1.94, 0.86, 10.96, 5.5, 22.5, 41.06, 0.09, 1.98, 4.6]} \ No newline at end of file diff --git a/annotations_1/xz3nif1TPDk_filtered.json b/annotations_1/xz3nif1TPDk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cc516b46aec17c14122ea84662a5fbb0e1a790a9 --- /dev/null +++ b/annotations_1/xz3nif1TPDk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 2.62], [4.0, 14.1], [15.0, 15.99], [18.0, 18.12], [21.0, 21.39], [22.0, 22.2], [24.0, 33.47], [43.0, 48.0], [54.0, 60.08], [67.0, 79.27], [81.0, 89.31], [94.0, 99.13], [99.0, 102.51], [104.0, 111.03], [112.0, 112.31], [113.0, 113.19], [114.0, 115.28], [116.0, 116.73], [118.0, 118.67], [124.0, 125.31], [126.0, 126.89], [136.0, 136.09], [138.0, 138.82], [139.0, 139.14], [142.0, 143.36], [144.0, 145.23], [146.0, 147.5], [150.0, 151.17], [153.0, 153.22], [158.0, 159.58], [162.0, 162.99], [164.0, 164.25], [166.0, 167.09], [168.0, 168.34], [171.0, 172.13], [173.0, 174.19], [175.0, 175.53], [176.0, 175.88], [177.0, 178.07]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [70.72, 73.97, 0.0, 0.0, 0.0, 0.0, 38.12, 46.97, 46.4, 61.47, 50.36, 45.98, 53.22, 62.07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 38.09], ["theremin", 20.61], ["hum", 5.08]], [["music", 49.86], ["hum", 14.28], ["mains hum", 11.77]], [["music", 70.37], ["musical instrument", 3.7], ["effects unit", 3.04]], null, null, [["music", 78.02], ["sonar", 4.19], ["synthesizer", 3.34]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.62, 10.1, 0.99, 0.12, 0.39, 0.2, 9.47, 5.0, 6.08, 12.27, 8.31, 5.13, 3.51, 7.03, 0.31, 0.19, 1.28, 0.73, 0.67, 1.31, 0.89, 0.09, 0.82, 0.14, 1.36, 1.23, 1.5, 1.17, 0.22, 1.58, 0.99, 0.25, 1.09, 0.34, 1.13, 1.19, 0.53, -0.12, 1.07]} \ No newline at end of file diff --git a/annotations_1/xzBC35K-vug_filtered.json b/annotations_1/xzBC35K-vug_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..63628a47dc68ca53626d6885d9b30f28bd18f47a --- /dev/null +++ b/annotations_1/xzBC35K-vug_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.46], [10.0, 9.9], [11.0, 25.78], [37.0, 43.63], [45.0, 45.49], [54.0, 53.86], [56.0, 74.02], [77.0, 78.07], [79.0, 80.15], [83.0, 83.71], [87.0, 87.61], [88.0, 88.37], [89.0, 97.24], [101.0, 101.68], [104.0, 112.18], [117.0, 121.64], [122.0, 126.25], [132.0, 132.83], [136.0, 154.38], [156.0, 157.11], [161.0, 168.13], [169.0, 174.83], [180.0, 181.84], [182.0, 181.89], [186.0, 185.94], [187.0, 190.44], [192.0, 203.12], [204.0, 204.84], [205.0, 206.61]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true, false, false, false, true, true, false, false], "silence_prob": [0.0, 0.0, 30.68, 31.76, 0.0, 0.0, 32.62, 0.0, 0.0, 0.0, 0.0, 0.0, 30.03, 0.0, 29.69, 29.23, 37.57, 0.0, 29.41, 0.0, 29.46, 29.84, 0.0, 0.0, 0.0, 30.51, 30.04, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 77.4], ["electronic music", 4.2], ["speech", 3.87]], [["music", 32.13], ["speech", 15.91], ["cattle, bovinae", 10.69]], null, null, [["music", 72.67], ["electronic music", 5.5], ["techno", 4.16]], null, null, null, null, null, [["music", 33.32], ["hum", 15.15], ["throbbing", 10.81]], null, [["music", 86.8], ["electronic music", 2.93], ["throbbing", 2.68]], [["music", 70.57], ["speech", 11.69], ["boing", 2.64]], [["music", 51.39], ["boing", 20.71], ["speech", 5.84]], null, [["music", 65.66], ["speech", 13.85], ["buzz", 5.01]], null, [["music", 56.76], ["speech", 7.04], ["vehicle", 4.5]], [["speech", 38.65], ["music", 11.54], ["boat, water vehicle", 4.7]], null, null, null, [["speech", 42.43], ["whale vocalization", 16.94], ["vehicle", 6.35]], [["music", 43.26], ["cattle, bovinae", 7.64], ["moo", 7.47]], null, null], "duration": [0.46, -0.1, 14.78, 6.63, 0.49, -0.14, 18.02, 1.07, 1.15, 0.71, 0.61, 0.37, 8.24, 0.68, 8.18, 4.64, 4.25, 0.83, 18.38, 1.11, 7.13, 5.83, 1.84, -0.11, -0.06, 3.44, 11.12, 0.84, 1.61]} \ No newline at end of file diff --git a/annotations_1/y-qCvfXMTlg_filtered.json b/annotations_1/y-qCvfXMTlg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..13ec9e3ab62ec11ad35f977a5e926379739aa9de --- /dev/null +++ b/annotations_1/y-qCvfXMTlg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.24], [13.0, 13.93], [15.0, 16.24], [18.0, 20.09], [23.0, 23.3], [29.0, 29.15], [36.0, 37.15], [40.0, 41.35], [51.0, 51.65], [54.0, 56.62], [59.0, 59.19], [61.0, 63.15], [69.0, 75.88], [78.0, 78.83], [82.0, 83.1], [85.0, 88.53], [89.0, 96.33], [97.0, 98.47], [100.0, 100.82]], "keep_status": [true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [44.72, 0.0, 0.0, 51.28, 0.0, 0.0, 0.0, 0.0, 0.0, 37.13, 0.0, 32.34, 29.93, 0.0, 0.0, 29.12, 59.59, 0.0, 0.0], "audiomae_on_audioset": [[["music", 35.28], ["hum", 14.45], ["throbbing", 8.82]], null, null, null, null, null, null, null, null, [["speech", 33.91], ["sidetone", 17.68], ["music", 5.11]], null, [["throbbing", 39.31], ["hum", 31.88], ["mains hum", 11.16]], [["mains hum", 35.96], ["hum", 33.27], ["speech", 16.61]], null, null, [["breaking", 51.59], ["gong", 19.47], ["whip", 5.03]], null, null, null], "duration": [2.24, 0.93, 1.24, 2.09, 0.3, 0.15, 1.15, 1.35, 0.65, 2.62, 0.19, 2.15, 6.88, 0.83, 1.1, 3.53, 7.33, 1.47, 0.82]} \ No newline at end of file diff --git a/annotations_1/y0DYykDLU0Y_filtered.json b/annotations_1/y0DYykDLU0Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd2531588f429df0f419e06286006e1f4d602588 --- /dev/null +++ b/annotations_1/y0DYykDLU0Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 7.06], [10.0, 60.64], [61.0, 102.19], [105.0, 112.11], [115.0, 117.98], [118.0, 118.29], [118.0, 118.35], [118.0, 118.4], [118.0, 130.44]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [84.43, 0.0, 0.0, 29.16, 30.15, 0.0, 0.0, 0.0, 29.26], "audiomae_on_audioset": [null, null, null, [["music", 54.54], ["speech", 17.83], ["cacophony", 3.7]], [["music", 35.56], ["throbbing", 24.52], ["drum and bass", 13.04]], null, null, null, [["music", 62.22], ["drum and bass", 5.91], ["throbbing", 5.82]]], "duration": [6.06, 50.64, 41.19, 7.11, 2.98, 0.29, 0.35, 0.4, 12.44]} \ No newline at end of file diff --git a/annotations_1/y1-gPBJ-C_U_filtered.json b/annotations_1/y1-gPBJ-C_U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b2a7afe19d40bef0bf04f0c096da52d60c1c4b7 --- /dev/null +++ b/annotations_1/y1-gPBJ-C_U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.95], [14.0, 18.76], [20.0, 23.3], [25.0, 27.21], [28.0, 30.0], [31.0, 32.04], [33.0, 37.57], [39.0, 40.17], [42.0, 46.33], [47.0, 59.98], [62.0, 66.26], [67.0, 90.19], [91.0, 93.46], [94.0, 102.56], [104.0, 107.82], [109.0, 110.34], [112.0, 112.77], [114.0, 116.41], [118.0, 120.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [58.05, 87.0, 98.51, 48.14, 91.47, 0.0, 77.36, 0.0, 60.14, 34.27, 28.77, 29.81, 98.73, 30.27, 74.92, 0.0, 0.0, 82.79, 99.98], "audiomae_on_audioset": [null, null, null, [["speech", 48.6], ["music", 17.6], ["whale vocalization", 6.11]], null, null, null, null, null, [["music", 39.67], ["hum", 20.72], ["mains hum", 10.05]], [["mains hum", 44.95], ["hum", 16.09], ["speech", 11.34]], [["music", 19.81], ["hum", 9.63], ["throbbing", 9.05]], null, [["hum", 34.59], ["throbbing", 20.65], ["mains hum", 12.86]], null, null, null, null, null], "duration": [3.95, 4.76, 3.3, 2.21, 2.0, 1.04, 4.57, 1.17, 4.33, 12.98, 4.26, 23.19, 2.46, 8.56, 3.82, 1.34, 0.77, 2.41, 2.11]} \ No newline at end of file diff --git a/annotations_1/y1OhC9h3flY_filtered.json b/annotations_1/y1OhC9h3flY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afb3d3ea9d2b36ab932936692cd2d5ce42538802 --- /dev/null +++ b/annotations_1/y1OhC9h3flY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.88], [8.0, 8.97], [12.0, 13.95], [16.0, 16.7], [21.0, 21.79], [23.0, 24.16], [28.0, 28.78], [33.0, 34.18], [35.0, 36.8], [38.0, 40.19], [41.0, 42.18], [43.0, 45.39], [46.0, 47.21], [48.0, 50.77], [51.0, 53.43], [54.0, 55.81], [57.0, 59.09], [60.0, 61.97], [63.0, 65.33], [66.0, 66.9], [68.0, 70.02], [72.0, 98.17], [103.0, 103.57], [108.0, 109.95], [111.0, 112.89], [116.0, 118.72], [122.0, 124.55]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, true, false, false, true, false, false, false, false, false], "silence_prob": [48.74, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.51, 0.0, 67.89, 0.0, 98.66, 38.17, 0.0, 43.25, 0.0, 40.61, 0.0, 56.7, 46.57, 0.0, 0.0, 0.0, 92.8, 71.14], "audiomae_on_audioset": [[["sine wave", 18.07], ["tuning fork", 16.12], ["chirp tone", 13.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 30.19], ["speech", 19.21], ["music", 10.79]], null, [["hum", 24.14], ["throbbing", 20.99], ["speech", 18.01]], null, [["speech", 36.95], ["hum", 12.58], ["music", 10.94]], null, null, [["hum", 26.77], ["singing bowl", 10.47], ["gong", 7.27]], null, null, null, null, null], "duration": [4.88, 0.97, 1.95, 0.7, 0.79, 1.16, 0.78, 1.18, 1.8, 2.19, 1.18, 2.39, 1.21, 2.77, 2.43, 1.81, 2.09, 1.97, 2.33, 0.9, 2.02, 26.17, 0.57, 1.95, 1.89, 2.72, 2.55]} \ No newline at end of file diff --git a/annotations_1/y1gkMNjkFiQ_filtered.json b/annotations_1/y1gkMNjkFiQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b91a3431ed89be8e5f92937df121c2d04a2ae09 --- /dev/null +++ b/annotations_1/y1gkMNjkFiQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[54.0, 104.84], [106.0, 106.2], [107.0, 154.62]], "keep_status": [false, false, false], "silence_prob": [0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null], "duration": [50.84, 0.2, 47.62]} \ No newline at end of file diff --git a/annotations_1/y2_oXPF2b3Y_filtered.json b/annotations_1/y2_oXPF2b3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d335437433935d08c9d04115a38195e5a52a5bad --- /dev/null +++ b/annotations_1/y2_oXPF2b3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.0], [7.0, 7.89], [12.0, 13.17], [14.0, 15.94], [18.0, 23.21], [24.0, 27.51], [28.0, 45.01], [48.0, 51.43], [52.0, 52.83], [54.0, 55.07], [59.0, 58.7], [61.0, 61.86], [63.0, 63.12], [65.0, 67.56], [85.0, 89.48], [93.0, 94.66], [96.0, 97.44], [98.0, 100.87], [109.0, 110.25], [111.0, 113.39], [114.0, 114.34], [115.0, 114.76], [115.0, 115.6], [118.0, 119.25], [120.0, 122.89], [124.0, 131.65], [133.0, 137.73], [138.0, 138.79], [139.0, 140.76], [141.0, 148.54]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 58.05, 49.09, 33.81, 57.09, 0.0, 0.0, 0.0, 0.0, 0.0, 67.25, 35.75, 0.0, 0.0, 82.43, 0.0, 39.09, 0.0, 0.0, 0.0, 0.0, 31.1, 99.26, 89.19, 0.0, 0.0, 61.27], "audiomae_on_audioset": [null, null, null, null, null, [["music", 58.63], ["scary music", 11.96], ["ambient music", 4.29]], [["music", 43.35], ["noise", 9.65], ["static", 6.08]], null, null, null, null, null, null, null, [["music", 65.09], ["theremin", 19.73], ["musical instrument", 1.68]], null, null, null, null, [["music", 36.69], ["musical instrument", 7.61], ["theremin", 4.93]], null, null, null, null, [["speech", 48.03], ["creak", 6.98], ["burst, pop", 6.41]], null, null, null, null, null], "duration": [1.0, 0.89, 1.17, 1.94, 5.21, 3.51, 17.01, 3.43, 0.83, 1.07, -0.3, 0.86, 0.12, 2.56, 4.48, 1.66, 1.44, 2.87, 1.25, 2.39, 0.34, -0.24, 0.6, 1.25, 2.89, 7.65, 4.73, 0.79, 1.76, 7.54]} \ No newline at end of file diff --git a/annotations_1/y2wupV34DRk_filtered.json b/annotations_1/y2wupV34DRk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2fa84ef7c803cec9e9ce7f56eb0806d16d666aa --- /dev/null +++ b/annotations_1/y2wupV34DRk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.06], [11.0, 11.58], [18.0, 18.37], [19.0, 19.38], [32.0, 38.92], [42.0, 43.02], [44.0, 45.13], [47.0, 48.36], [51.0, 61.47], [64.0, 81.24], [83.0, 101.36], [106.0, 106.39], [108.0, 112.11], [112.0, 114.12], [115.0, 115.72], [128.0, 128.26], [136.0, 137.81], [138.0, 140.68], [142.0, 143.02], [149.0, 149.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false], "silence_prob": [45.43, 0.0, 0.0, 0.0, 30.43, 0.0, 0.0, 0.0, 30.56, 30.67, 31.14, 0.0, 65.67, 49.36, 0.0, 0.0, 0.0, 44.2, 0.0, 0.0], "audiomae_on_audioset": [[["music", 56.45], ["hum", 8.28], ["mains hum", 5.36]], null, null, null, [["speech", 44.68], ["music", 25.37], ["throbbing", 13.13]], null, null, null, [["throbbing", 28.66], ["music", 28.04], ["hum", 17.76]], [["music", 37.96], ["throbbing", 19.94], ["hum", 14.41]], [["throbbing", 43.64], ["hum", 31.46], ["music", 11.71]], null, null, [["speech", 33.35], ["music", 7.13], ["hum", 6.77]], null, null, null, [["speech", 34.1], ["music", 15.08], ["rumble", 12.65]], null, null], "duration": [2.06, 0.58, 0.37, 0.38, 6.92, 1.02, 1.13, 1.36, 10.47, 17.24, 18.36, 0.39, 4.11, 2.12, 0.72, 0.26, 1.81, 2.68, 1.02, 0.4]} \ No newline at end of file diff --git a/annotations_1/y3NLNK72mzI_filtered.json b/annotations_1/y3NLNK72mzI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8964cd7c163f111d23c29cc61509ddb64fab1c55 --- /dev/null +++ b/annotations_1/y3NLNK72mzI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 18.66], [23.0, 22.91], [31.0, 32.44], [41.0, 42.08], [45.0, 47.38], [53.0, 55.44], [58.0, 61.4], [64.0, 64.77], [65.0, 67.26], [68.0, 69.45], [76.0, 76.55], [77.0, 77.28], [82.0, 87.4], [91.0, 91.61], [94.0, 98.24], [99.0, 101.55], [102.0, 107.65], [113.0, 114.08], [117.0, 118.25], [122.0, 122.88], [125.0, 126.44], [137.0, 137.34], [138.0, 138.38], [139.0, 138.94], [140.0, 140.53]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.97, 97.43, 99.91, 0.0, 91.64, 0.0, 0.0, 0.0, 71.72, 0.0, 99.21, 98.93, 99.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.66, -0.09, 1.44, 1.08, 2.38, 2.44, 3.4, 0.77, 2.26, 1.45, 0.55, 0.28, 5.4, 0.61, 4.24, 2.55, 5.65, 1.08, 1.25, 0.88, 1.44, 0.34, 0.38, -0.06, 0.53]} \ No newline at end of file diff --git a/annotations_1/y4fdm5gdvnE_filtered.json b/annotations_1/y4fdm5gdvnE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..99b1d3f73fe67ac8466fbee97dc2682aec6bc0d5 --- /dev/null +++ b/annotations_1/y4fdm5gdvnE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.88], [4.0, 4.33], [10.0, 10.62], [14.0, 14.71], [20.0, 21.44], [29.0, 34.3], [35.0, 35.33], [39.0, 39.77], [48.0, 49.15], [50.0, 52.05], [57.0, 58.58], [59.0, 59.76], [66.0, 66.53], [79.0, 80.91], [82.0, 83.79], [91.0, 91.44], [96.0, 96.82], [98.0, 98.46], [105.0, 125.49], [130.0, 131.09], [135.0, 135.9], [136.0, 138.92], [143.0, 145.57], [146.0, 146.48], [149.0, 153.6], [155.0, 156.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 31.83, 0.0, 0.0, 0.0, 31.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.96, 0.0, 0.0, 30.12, 30.37, 0.0, 34.75, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 72.58], ["electronic music", 2.82], ["hip hop music", 1.66]], null, null, null, [["music", 65.23], ["musical instrument", 5.16], ["guitar", 3.27]], null, null, null, null, null, null, null, null, [["music", 87.19], ["electronic music", 2.03], ["musical instrument", 1.64]], null, null, [["music", 83.11], ["electronic music", 1.27], ["dubstep", 0.75]], [["music", 59.99], ["reggae", 6.23], ["electronic music", 4.27]], null, [["whack, thwack", 35.54], ["thunk", 16.28], ["breaking", 10.54]], null], "duration": [0.88, 0.33, 0.62, 0.71, 1.44, 5.3, 0.33, 0.77, 1.15, 2.05, 1.58, 0.76, 0.53, 1.91, 1.79, 0.44, 0.82, 0.46, 20.49, 1.09, 0.9, 2.92, 2.57, 0.48, 4.6, 1.17]} \ No newline at end of file diff --git a/annotations_1/y5vxDOma1Ok_filtered.json b/annotations_1/y5vxDOma1Ok_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c1fddb55c90a270785c95ab35c2292bf7a71c3a --- /dev/null +++ b/annotations_1/y5vxDOma1Ok_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 51.65], [52.0, 53.23], [54.0, 55.43], [56.0, 76.71], [77.0, 77.3], [77.0, 90.95], [91.0, 103.33], [104.0, 104.72], [106.0, 119.25], [120.0, 120.78], [121.0, 126.05]], "keep_status": [false, false, false, true, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 30.83, 0.0, 30.99, 31.81, 0.0, 31.0, 0.0, 31.24], "audiomae_on_audioset": [null, null, null, [["music", 30.98], ["hum", 25.02], ["mains hum", 13.89]], null, [["music", 50.47], ["speech", 33.04], ["boing", 2.55]], [["speech", 51.48], ["music", 28.52], ["sidetone", 7.59]], null, [["music", 44.22], ["hum", 12.01], ["mains hum", 8.5]], null, [["music", 41.98], ["mains hum", 18.32], ["hum", 15.08]]], "duration": [49.65, 1.23, 1.43, 20.71, 0.3, 13.95, 12.33, 0.72, 13.25, 0.78, 5.05]} \ No newline at end of file diff --git a/annotations_1/y64QBxHJiqI_filtered.json b/annotations_1/y64QBxHJiqI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b00d705708f4aeef907bbc66e9f254a21ef4985b --- /dev/null +++ b/annotations_1/y64QBxHJiqI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.15], [25.0, 27.28], [29.0, 30.01], [30.0, 31.08], [33.0, 33.81], [35.0, 38.64], [40.0, 44.1], [45.0, 45.23], [47.0, 47.22], [48.0, 50.43], [61.0, 65.26], [73.0, 79.34], [92.0, 99.52], [105.0, 119.8], [122.0, 123.5], [125.0, 126.06], [127.0, 128.43], [130.0, 130.72], [132.0, 133.66], [134.0, 135.7], [136.0, 137.19], [139.0, 142.11], [143.0, 144.56], [146.0, 146.97], [148.0, 154.33], [156.0, 159.0], [161.0, 161.23]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 64.97, 0.0, 0.0, 0.0, 33.89, 33.26, 0.0, 0.0, 80.64, 30.32, 30.6, 30.62, 31.33, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.25, 0.0, 0.0, 50.31, 53.78, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["cattle, bovinae", 28.56], ["whale vocalization", 28.2], ["moo", 20.82]], [["livestock, farm animals, working animals", 29.01], ["cattle, bovinae", 20.02], ["moo", 12.0]], null, null, null, [["livestock, farm animals, working animals", 41.62], ["sheep", 20.52], ["speech", 8.6]], [["music", 16.96], ["vehicle", 12.96], ["skidding", 11.0]], [["music", 74.18], ["drum machine", 2.86], ["sampler", 1.58]], [["music", 64.57], ["throbbing", 10.43], ["speech", 5.1]], null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.15, 2.28, 1.01, 1.08, 0.81, 3.64, 4.1, 0.23, 0.22, 2.43, 4.26, 6.34, 7.52, 14.8, 1.5, 1.06, 1.43, 0.72, 1.66, 1.7, 1.19, 3.11, 1.56, 0.97, 6.33, 3.0, 0.23]} \ No newline at end of file diff --git a/annotations_1/y6uK9wxhl_w_filtered.json b/annotations_1/y6uK9wxhl_w_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0db48025f93e7e15883cb83b4cb862e403c227a7 --- /dev/null +++ b/annotations_1/y6uK9wxhl_w_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.22], [4.0, 5.17], [7.0, 7.45], [11.0, 13.69], [15.0, 15.16], [16.0, 16.65], [19.0, 19.26], [22.0, 22.91], [23.0, 25.73], [29.0, 31.72], [35.0, 36.31], [44.0, 44.41], [46.0, 46.38], [47.0, 47.98], [54.0, 55.51], [63.0, 64.2], [66.0, 66.99], [70.0, 71.85], [73.0, 73.4], [76.0, 77.45], [80.0, 79.96], [82.0, 82.04], [83.0, 84.75], [89.0, 89.48], [91.0, 94.34], [96.0, 97.73], [99.0, 100.55], [102.0, 103.64], [105.0, 111.7], [113.0, 117.88], [119.0, 119.97], [128.0, 128.24], [130.0, 129.69]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 93.13, 0.0, 0.0, 0.0, 0.0, 60.89, 95.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.0, 0.0, 0.0, 0.0, 99.91, 47.16, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 36.58], ["guitar", 19.04], ["plucked string instrument", 9.06]], null, null, null], "duration": [1.22, 1.17, 0.45, 2.69, 0.16, 0.65, 0.26, 0.91, 2.73, 2.72, 1.31, 0.41, 0.38, 0.98, 1.51, 1.2, 0.99, 1.85, 0.4, 1.45, -0.04, 0.04, 1.75, 0.48, 3.34, 1.73, 1.55, 1.64, 6.7, 4.88, 0.97, 0.24, -0.31]} \ No newline at end of file diff --git a/annotations_1/y87LPJHRfOI_filtered.json b/annotations_1/y87LPJHRfOI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53c73197dd04897abc8e932265bc4128b8c4c644 --- /dev/null +++ b/annotations_1/y87LPJHRfOI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.32], [9.0, 13.63], [16.0, 21.81], [23.0, 25.32], [28.0, 31.9], [34.0, 35.78], [38.0, 40.85], [43.0, 44.66], [46.0, 48.86], [50.0, 50.7], [55.0, 56.62], [59.0, 60.89], [62.0, 66.04], [66.0, 67.37], [73.0, 75.41], [82.0, 83.46], [87.0, 90.19], [96.0, 99.05], [100.0, 108.08], [109.0, 110.71], [113.0, 114.67], [118.0, 127.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [99.31, 99.98, 99.84, 99.94, 99.99, 0.0, 99.1, 0.0, 99.87, 0.0, 0.0, 0.0, 99.21, 0.0, 93.6, 0.0, 99.62, 99.93, 99.92, 0.0, 0.0, 95.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.32, 4.63, 5.81, 2.32, 3.9, 1.78, 2.85, 1.66, 2.86, 0.7, 1.62, 1.89, 4.04, 1.37, 2.41, 1.46, 3.19, 3.05, 8.08, 1.71, 1.67, 9.87]} \ No newline at end of file diff --git a/annotations_1/y8i5Nwg_TqU_filtered.json b/annotations_1/y8i5Nwg_TqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f35cec527156ebeae8828f888467c0098a09341 --- /dev/null +++ b/annotations_1/y8i5Nwg_TqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.7], [7.0, 10.84], [15.0, 21.51], [23.0, 24.19], [29.0, 43.75], [44.0, 56.08], [57.0, 71.44], [72.0, 94.53], [96.0, 97.12], [100.0, 100.31], [103.0, 103.94]], "keep_status": [false, false, false, false, true, false, true, true, false, false, false], "silence_prob": [0.0, 99.97, 99.05, 0.0, 36.09, 95.23, 37.66, 41.44, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 17.7], ["glass", 11.2], ["breaking", 11.11]], null, [["music", 33.28], ["flamenco", 9.42], ["hum", 7.47]], [["music", 36.06], ["musical instrument", 10.73], ["effects unit", 9.35]], null, null, null], "duration": [1.7, 3.84, 6.51, 1.19, 14.75, 12.08, 14.44, 22.53, 1.12, 0.31, 0.94]} \ No newline at end of file diff --git a/annotations_1/y9NhqnuoSAs_filtered.json b/annotations_1/y9NhqnuoSAs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..00f7838459732c2bd3aea7a6db7dbe1928699445 --- /dev/null +++ b/annotations_1/y9NhqnuoSAs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[34.0, 63.12], [65.0, 90.17], [91.0, 139.85], [142.0, 142.01]], "keep_status": [true, true, false, false], "silence_prob": [29.59, 28.79, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 24.01], ["music", 14.05], ["thump, thud", 8.49]], [["animal", 24.02], ["sound effect", 13.77], ["roar", 12.49]], null, null], "duration": [29.12, 25.17, 48.85, 0.01]} \ No newline at end of file diff --git a/annotations_1/yAmTu-R5MQM_filtered.json b/annotations_1/yAmTu-R5MQM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8c9bce3b03fae14138975cc40a6cb125926f8b56 --- /dev/null +++ b/annotations_1/yAmTu-R5MQM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.66], [3.0, 4.68], [7.0, 8.18], [9.0, 11.3], [12.0, 12.72], [17.0, 17.64], [19.0, 19.79], [20.0, 21.1], [25.0, 25.42], [30.0, 30.87], [34.0, 36.26], [38.0, 38.06], [48.0, 48.24], [60.0, 61.35], [64.0, 73.31], [74.0, 75.84], [90.0, 90.17], [103.0, 104.01], [108.0, 108.43], [114.0, 114.22], [118.0, 118.13], [122.0, 122.52], [126.0, 129.29], [132.0, 132.97], [138.0, 142.96], [145.0, 145.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 90.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.05, 0.0, 0.0, 0.0, 99.62, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.7, 0.0, 32.08, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 12.53], ["noise", 8.1], ["effects unit", 7.21]], null, [["livestock, farm animals, working animals", 30.1], ["cattle, bovinae", 21.3], ["moo", 20.12]], null], "duration": [0.66, 1.68, 1.18, 2.3, 0.72, 0.64, 0.79, 1.1, 0.42, 0.87, 2.26, 0.06, 0.24, 1.35, 9.31, 1.84, 0.17, 1.01, 0.43, 0.22, 0.13, 0.52, 3.29, 0.97, 4.96, 0.57]} \ No newline at end of file diff --git a/annotations_1/yAo3144gBw4_filtered.json b/annotations_1/yAo3144gBw4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ef2f96ba837301a573971053adbe6ee227ddd25 --- /dev/null +++ b/annotations_1/yAo3144gBw4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 27.14], [29.0, 29.03], [31.0, 32.1], [34.0, 35.61], [41.0, 40.68], [43.0, 43.51], [46.0, 46.43], [48.0, 62.73], [68.0, 75.95]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.8, 95.51], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null], "duration": [0.14, 0.03, 1.1, 1.61, -0.32, 0.51, 0.43, 14.73, 7.95]} \ No newline at end of file diff --git a/annotations_1/yB1w-AypA_s_filtered.json b/annotations_1/yB1w-AypA_s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3e346d5e7543d650ce3a2583c8109d3fb073623 --- /dev/null +++ b/annotations_1/yB1w-AypA_s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.57], [13.0, 14.59], [15.0, 16.14], [17.0, 17.81], [19.0, 20.76], [21.0, 21.73], [23.0, 24.85], [27.0, 27.35], [28.0, 30.11], [32.0, 32.88], [34.0, 51.16], [53.0, 53.57], [56.0, 57.47], [60.0, 60.67], [63.0, 63.46], [66.0, 65.82], [67.0, 109.95], [111.0, 111.86], [113.0, 114.51], [117.0, 122.13], [124.0, 125.79], [126.0, 127.03], [130.0, 143.72], [145.0, 145.88], [147.0, 147.09], [148.0, 148.68], [150.0, 162.33]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [48.14, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.29, 0.0, 58.81, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.11, 0.0, 0.0, 42.74, 0.0, 0.0, 0.0, 32.42], "audiomae_on_audioset": [[["speech", 51.74], ["music", 7.08], ["hum", 6.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.12], ["hum", 20.01], ["throbbing", 10.64]], null, null, [["hum", 41.36], ["mains hum", 19.18], ["music", 10.27]], null, null, null, [["hum", 36.21], ["music", 21.0], ["mains hum", 11.27]]], "duration": [2.57, 1.59, 1.14, 0.81, 1.76, 0.73, 1.85, 0.35, 2.11, 0.88, 17.16, 0.57, 1.47, 0.67, 0.46, -0.18, 42.95, 0.86, 1.51, 5.13, 1.79, 1.03, 13.72, 0.88, 0.09, 0.68, 12.33]} \ No newline at end of file diff --git a/annotations_1/yBd_y4V7vtc_filtered.json b/annotations_1/yBd_y4V7vtc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..952e3a10110d5efcc2ca671fa3ce1f8d7c4faf77 --- /dev/null +++ b/annotations_1/yBd_y4V7vtc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 20.01], [22.0, 22.35], [23.0, 23.25], [35.0, 36.21], [44.0, 44.17], [48.0, 51.19], [51.0, 51.65], [55.0, 56.07], [57.0, 57.28], [64.0, 64.74], [66.0, 66.9], [69.0, 70.41], [71.0, 71.98], [74.0, 75.25], [77.0, 76.86], [78.0, 78.19], [80.0, 80.2], [81.0, 81.78], [82.0, 82.71], [86.0, 86.95], [97.0, 97.01], [98.0, 100.33], [101.0, 101.43], [103.0, 103.77], [105.0, 107.15], [108.0, 108.57], [113.0, 113.66], [114.0, 115.26], [116.0, 119.35], [125.0, 125.44], [127.0, 128.14], [130.0, 133.42], [135.0, 135.53]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, true, false], "silence_prob": [29.94, 0.0, 0.0, 0.0, 0.0, 31.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.28, 0.0, 0.0, 33.77, 0.0, 0.0, 0.0, 30.95, 0.0, 0.0, 33.98, 0.0], "audiomae_on_audioset": [[["speech", 16.87], ["fly, housefly", 15.54], ["mosquito", 10.28]], null, null, null, null, [["pant", 50.89], ["speech", 30.47], ["dog", 4.44]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["whack, thwack", 25.54], ["squeal", 19.48], ["scratch", 4.14]], null, null, [["music", 11.03], ["fly, housefly", 10.21], ["speech", 10.19]], null, null, null, [["speech", 66.93], ["sidetone", 7.82], ["radio", 3.98]], null, null, [["bouncing", 49.53], ["basketball bounce", 12.86], ["whack, thwack", 7.17]], null], "duration": [9.01, 0.35, 0.25, 1.21, 0.17, 3.19, 0.65, 1.07, 0.28, 0.74, 0.9, 1.41, 0.98, 1.25, -0.14, 0.19, 0.2, 0.78, 0.71, 0.95, 0.01, 2.33, 0.43, 0.77, 2.15, 0.57, 0.66, 1.26, 3.35, 0.44, 1.14, 3.42, 0.53]} \ No newline at end of file diff --git a/annotations_1/yCHoWsMt0LY_filtered.json b/annotations_1/yCHoWsMt0LY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1280efd9774a369e152f13f66b27babf8d2c3718 --- /dev/null +++ b/annotations_1/yCHoWsMt0LY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[26.0, 49.37], [50.0, 56.3], [57.0, 58.82], [61.0, 80.54], [82.0, 92.96], [94.0, 94.96], [96.0, 101.29], [105.0, 233.54], [234.0, 244.83], [245.0, 246.32]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [49.27, 45.49, 0.0, 31.78, 52.05, 0.0, 37.85, 0.0, 31.61, 0.0], "audiomae_on_audioset": [[["music", 78.76], ["synthesizer", 7.36], ["theremin", 2.89]], [["music", 75.9], ["single-lens reflex camera", 1.6], ["theremin", 1.44]], null, [["music", 58.23], ["throbbing", 13.71], ["hum", 9.88]], null, null, [["music", 69.44], ["didgeridoo", 7.09], ["theremin", 4.78]], null, [["music", 67.79], ["musical instrument", 4.66], ["synthesizer", 3.58]], null], "duration": [23.37, 6.3, 1.82, 19.54, 10.96, 0.96, 5.29, 128.54, 10.83, 1.32]} \ No newline at end of file diff --git a/annotations_1/yCrq5v5cg1A_filtered.json b/annotations_1/yCrq5v5cg1A_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76afc42d6d6648ba364c3edbe46d00e838a35639 --- /dev/null +++ b/annotations_1/yCrq5v5cg1A_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[41.0, 42.74], [44.0, 44.42], [46.0, 47.01], [48.0, 55.51], [57.0, 58.14], [59.0, 60.05], [61.0, 64.47], [67.0, 67.24], [71.0, 71.15], [73.0, 73.62], [77.0, 78.78], [88.0, 163.71], [165.0, 166.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 75.39, 0.0, 0.0, 77.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.74, 0.42, 1.01, 7.51, 1.14, 1.05, 3.47, 0.24, 0.15, 0.62, 1.78, 75.71, 1.26]} \ No newline at end of file diff --git a/annotations_1/yDxNlPIFWHM_filtered.json b/annotations_1/yDxNlPIFWHM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..654cb584023dc72c5f35879969429b9e273f1a81 --- /dev/null +++ b/annotations_1/yDxNlPIFWHM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.99], [1.0, 3.05], [4.0, 4.95], [6.0, 7.86], [9.0, 16.46], [18.0, 21.22], [22.0, 48.91], [54.0, 139.85], [141.0, 145.18], [147.0, 147.21], [150.0, 150.58], [152.0, 152.02], [153.0, 153.03], [156.0, 156.81], [158.0, 158.46], [160.0, 161.1], [162.0, 163.11], [165.0, 164.98], [167.0, 166.9]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 57.17, 0.0, 0.0, 57.32, 78.21, 31.97, 0.0, 84.25, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["mains hum", 36.72], ["hum", 22.22], ["music", 6.3]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.01, 2.05, 0.95, 1.86, 7.46, 3.22, 26.91, 85.85, 4.18, 0.21, 0.58, 0.02, 0.03, 0.81, 0.46, 1.1, 1.11, -0.02, -0.1]} \ No newline at end of file diff --git a/annotations_1/yEKOx9OHEz8_filtered.json b/annotations_1/yEKOx9OHEz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ec0ca6b09a5572a846a47c2e2d755754837ac9b4 --- /dev/null +++ b/annotations_1/yEKOx9OHEz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.78], [6.0, 7.3], [11.0, 12.5], [14.0, 17.64], [18.0, 19.38], [20.0, 20.36], [21.0, 21.54], [22.0, 24.22], [26.0, 28.12], [29.0, 31.87], [36.0, 36.24], [36.0, 37.83], [41.0, 41.2], [42.0, 42.52], [43.0, 43.34], [47.0, 47.9], [50.0, 50.57], [54.0, 54.8], [58.0, 58.35], [62.0, 62.33], [66.0, 65.77], [72.0, 72.33], [73.0, 73.5], [77.0, 77.72], [78.0, 79.83], [82.0, 84.81], [85.0, 85.68], [93.0, 93.36]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 0.0, 81.89, 99.94, 99.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.13, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.78, 1.3, 1.5, 3.64, 1.38, 0.36, 0.54, 2.22, 2.12, 2.87, 0.24, 1.83, 0.2, 0.52, 0.34, 0.9, 0.57, 0.8, 0.35, 0.33, -0.23, 0.33, 0.5, 0.72, 1.83, 2.81, 0.68, 0.36]} \ No newline at end of file diff --git a/annotations_1/yEeyJzItKAg_filtered.json b/annotations_1/yEeyJzItKAg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..677e01687e668779ca58f3848b0178d7569a1b08 --- /dev/null +++ b/annotations_1/yEeyJzItKAg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 41.25], [66.0, 67.47], [71.0, 99.98], [104.0, 107.55], [110.0, 113.02], [115.0, 119.33], [120.0, 120.72], [125.0, 125.86], [134.0, 140.88], [144.0, 148.59], [150.0, 160.81], [163.0, 182.22], [187.0, 188.16], [191.0, 192.05], [193.0, 193.87], [195.0, 198.88]], "keep_status": [false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 32.12, 31.68, 32.57, 33.17, 0.0, 0.0, 31.48, 31.88, 32.03, 32.3, 0.0, 0.0, 0.0, 38.0], "audiomae_on_audioset": [null, null, [["music", 51.18], ["speech", 8.83], ["electronic music", 6.13]], [["hum", 29.27], ["mains hum", 27.0], ["music", 14.81]], [["music", 37.7], ["speech", 10.21], ["hum", 8.47]], [["music", 49.98], ["hum", 14.38], ["throbbing", 11.68]], null, null, [["hum", 42.53], ["mains hum", 26.02], ["throbbing", 13.12]], [["music", 33.83], ["mains hum", 22.28], ["hum", 20.0]], [["speech", 61.03], ["music", 16.64], ["eruption", 3.65]], [["throbbing", 24.97], ["music", 24.6], ["hum", 21.71]], null, null, null, [["speech", 61.94], ["music", 4.97], ["eruption", 3.3]]], "duration": [31.25, 1.47, 28.98, 3.55, 3.02, 4.33, 0.72, 0.86, 6.88, 4.59, 10.81, 19.22, 1.16, 1.05, 0.87, 3.88]} \ No newline at end of file diff --git a/annotations_1/yEqjnlWEIcg_filtered.json b/annotations_1/yEqjnlWEIcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..079e52f63f52c51b12039eaa99f9002312eea4d4 --- /dev/null +++ b/annotations_1/yEqjnlWEIcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 15.06], [20.0, 22.01], [24.0, 25.49], [29.0, 30.27], [40.0, 40.36], [41.0, 45.06], [64.0, 66.31], [71.0, 72.3], [80.0, 83.93], [89.0, 89.75], [91.0, 91.4], [97.0, 98.05], [105.0, 106.91], [115.0, 115.53], [127.0, 128.19], [129.0, 130.49], [131.0, 130.94], [134.0, 140.21], [141.0, 144.61], [146.0, 146.3]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [50.86, 100.0, 0.0, 0.0, 0.0, 39.64, 44.49, 0.0, 99.05, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.69, 38.47, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 42.84], ["mains hum", 13.28], ["hum", 8.9]], [["music", 45.65], ["theremin", 39.76], ["oink", 2.91]], null, null, null, null, null, null, null, null, null, null, [["breaking", 42.53], ["music", 19.91], ["glass", 6.42]], [["music", 67.46], ["boing", 9.32], ["thunk", 2.64]], null], "duration": [2.06, 2.01, 1.49, 1.27, 0.36, 4.06, 2.31, 1.3, 3.93, 0.75, 0.4, 1.05, 1.91, 0.53, 1.19, 1.49, -0.06, 6.21, 3.61, 0.3]} \ No newline at end of file diff --git a/annotations_1/yEyQgxLmGmI_filtered.json b/annotations_1/yEyQgxLmGmI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8f8667cdd470a079019d4242a97f505035a98d --- /dev/null +++ b/annotations_1/yEyQgxLmGmI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.26], [37.0, 38.23], [41.0, 41.54], [45.0, 46.09], [48.0, 48.93], [50.0, 52.54], [55.0, 55.97], [65.0, 66.61], [72.0, 72.47], [74.0, 75.24], [77.0, 79.84], [83.0, 84.42], [98.0, 98.98]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 1.23, 0.54, 1.09, 0.93, 2.54, 0.97, 1.61, 0.47, 1.24, 2.84, 1.42, 0.98]} \ No newline at end of file diff --git a/annotations_1/yFSvuz5aHy8_filtered.json b/annotations_1/yFSvuz5aHy8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cab3c4e046aeff93097facc2801291cb7a759625 --- /dev/null +++ b/annotations_1/yFSvuz5aHy8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 2.83], [3.0, 3.72], [5.0, 5.48], [6.0, 6.84], [35.0, 36.73], [38.0, 39.36], [40.0, 41.99], [49.0, 50.77], [52.0, 53.97], [61.0, 60.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [-0.17, 0.72, 0.48, 0.84, 1.73, 1.36, 1.99, 1.77, 1.97, -0.43]} \ No newline at end of file diff --git a/annotations_1/yGYPTb9T3MU_filtered.json b/annotations_1/yGYPTb9T3MU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c40fd9c2d36e4f96e661aca6ffff83577825994 --- /dev/null +++ b/annotations_1/yGYPTb9T3MU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 31.28], [32.0, 60.17], [61.0, 68.88], [69.0, 73.41], [74.0, 81.58], [82.0, 87.94], [91.0, 91.42], [94.0, 95.76], [97.0, 98.79], [102.0, 105.46], [106.0, 106.83], [109.0, 110.73], [112.0, 113.09], [114.0, 122.45], [123.0, 129.79], [131.0, 132.51], [136.0, 139.87], [142.0, 142.62], [145.0, 146.6], [150.0, 152.85], [155.0, 156.95], [160.0, 160.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.59, 93.91, 33.02, 79.24, 73.06, 64.75, 0.0, 0.0, 0.0, 99.65, 0.0, 0.0, 0.0, 89.19, 78.21, 0.0, 79.07, 0.0, 0.0, 84.07, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["shofar", 50.72], ["wind instrument, woodwind instrument", 18.54], ["music", 9.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [25.28, 28.17, 7.88, 4.41, 7.58, 5.94, 0.42, 1.76, 1.79, 3.46, 0.83, 1.73, 1.09, 8.45, 6.79, 1.51, 3.87, 0.62, 1.6, 2.85, 1.95, 0.3]} \ No newline at end of file diff --git a/annotations_1/yHjejU3HvRE_filtered.json b/annotations_1/yHjejU3HvRE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..33e555b865bf06575d5d1ba9c19ba33d01241431 --- /dev/null +++ b/annotations_1/yHjejU3HvRE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[58.0, 81.18], [82.0, 82.95], [83.0, 89.67], [90.0, 90.88], [91.0, 92.25], [93.0, 93.68], [94.0, 97.8], [100.0, 101.82], [102.0, 102.12], [105.0, 106.0], [107.0, 108.58], [109.0, 112.35]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false], "silence_prob": [29.81, 0.0, 31.92, 0.0, 0.0, 0.0, 29.55, 0.0, 0.0, 0.0, 0.0, 33.71], "audiomae_on_audioset": [[["music", 73.55], ["synthesizer", 7.04], ["musical instrument", 4.26]], null, [["music", 50.56], ["speech", 10.95], ["throbbing", 8.22]], null, null, null, [["music", 27.16], ["wild animals", 9.93], ["roaring cats (lions, tigers)", 7.29]], null, null, null, null, [["music", 48.96], ["speech", 18.35], ["throbbing", 7.98]]], "duration": [23.18, 0.95, 6.67, 0.88, 1.25, 0.68, 3.8, 1.82, 0.12, 1.0, 1.58, 3.35]} \ No newline at end of file diff --git a/annotations_1/yHw5A9BAZ98_filtered.json b/annotations_1/yHw5A9BAZ98_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fbbb1dfb1a64c1fab8fefaa0efa333da25697904 --- /dev/null +++ b/annotations_1/yHw5A9BAZ98_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.82], [6.0, 7.28], [8.0, 9.37], [14.0, 14.39], [21.0, 21.17], [25.0, 28.73], [30.0, 31.23], [34.0, 34.86], [38.0, 39.45], [42.0, 42.84], [54.0, 53.99], [55.0, 60.37], [60.0, 60.47], [60.0, 60.51], [61.0, 61.79], [63.0, 68.88], [69.0, 71.47], [77.0, 77.33], [79.0, 78.61], [81.0, 82.9], [84.0, 85.63], [88.0, 88.38], [92.0, 98.73], [109.0, 110.12], [116.0, 115.87], [124.0, 124.66], [130.0, 131.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 53.22, 0.0, 0.0, 0.0, 0.0, 0.0, 52.51, 0.0, 0.0, 0.0, 64.63, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 47.9, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.19], ["sidetone", 14.94], ["hum", 4.86]], null, null, null, null], "duration": [1.82, 1.28, 1.37, 0.39, 0.17, 3.73, 1.23, 0.86, 1.45, 0.84, -0.01, 5.37, 0.47, 0.51, 0.79, 5.88, 2.47, 0.33, -0.39, 1.9, 1.63, 0.38, 6.73, 1.12, -0.13, 0.66, 1.87]} \ No newline at end of file diff --git a/annotations_1/yISManYcWqU_filtered.json b/annotations_1/yISManYcWqU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d47ca8c4bc52d86893d04b66f3015865c51bbfb4 --- /dev/null +++ b/annotations_1/yISManYcWqU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 21.2], [23.0, 24.48], [27.0, 47.83], [50.0, 55.24], [56.0, 63.75], [65.0, 67.71], [69.0, 69.48], [73.0, 77.68], [79.0, 134.91], [136.0, 150.11]], "keep_status": [false, false, false, false, true, true, false, true, false, true], "silence_prob": [33.03, 0.0, 34.65, 31.41, 29.56, 33.06, 0.0, 32.0, 0.0, 39.35], "audiomae_on_audioset": [[["music", 39.64], ["speech", 34.13], ["roar", 7.9]], null, [["music", 51.42], ["frog", 15.26], ["croak", 6.56]], [["music", 28.16], ["whale vocalization", 23.56], ["theremin", 20.98]], [["music", 25.39], ["buzz", 23.42], ["speech", 18.6]], [["music", 27.17], ["hum", 13.45], ["speech", 12.74]], null, [["music", 33.36], ["throbbing", 17.21], ["hum", 12.88]], null, [["hum", 27.44], ["throbbing", 20.02], ["gong", 14.51]]], "duration": [10.2, 1.48, 20.83, 5.24, 7.75, 2.71, 0.48, 4.68, 55.91, 14.11]} \ No newline at end of file diff --git a/annotations_1/yJTucB8fH04_filtered.json b/annotations_1/yJTucB8fH04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..29e3f2d92df418deba804e644ec69edea9850a91 --- /dev/null +++ b/annotations_1/yJTucB8fH04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.16], [6.0, 8.7], [11.0, 11.69], [14.0, 14.59], [15.0, 15.04], [21.0, 22.77], [25.0, 28.78], [32.0, 34.23], [38.0, 40.24], [49.0, 51.63], [56.0, 56.94], [66.0, 66.95], [70.0, 71.86], [75.0, 76.74], [80.0, 81.46], [84.0, 85.77], [88.0, 93.24], [94.0, 95.12], [97.0, 99.1], [102.0, 102.49], [103.0, 103.27], [103.0, 108.18], [115.0, 116.55], [122.0, 123.15], [124.0, 125.02], [129.0, 129.66], [132.0, 134.32], [140.0, 143.09], [144.0, 145.52], [147.0, 149.64], [151.0, 151.95], [153.0, 162.87], [163.0, 168.71], [170.0, 171.73], [173.0, 173.08]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 98.59, 0.0, 0.0, 0.0, 0.0, 98.59, 76.37, 99.98, 99.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.07, 0.0, 99.92, 0.0, 0.0, 94.66, 0.0, 0.0, 0.0, 0.0, 64.41, 60.05, 0.0, 57.17, 0.0, 88.46, 58.81, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.16, 2.7, 0.69, 0.59, 0.04, 1.77, 3.78, 2.23, 2.24, 2.63, 0.94, 0.95, 1.86, 1.74, 1.46, 1.77, 5.24, 1.12, 2.1, 0.49, 0.27, 5.18, 1.55, 1.15, 1.02, 0.66, 2.32, 3.09, 1.52, 2.64, 0.95, 9.87, 5.71, 1.73, 0.08]} \ No newline at end of file diff --git a/annotations_1/yJ_3DswWIeI_filtered.json b/annotations_1/yJ_3DswWIeI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c58aa073f1530d50eb392abad42985f7dcbc7a82 --- /dev/null +++ b/annotations_1/yJ_3DswWIeI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.69], [22.0, 22.28], [23.0, 39.73], [41.0, 42.5], [44.0, 45.59], [46.0, 50.68], [52.0, 53.69], [55.0, 56.02], [56.0, 58.58], [61.0, 73.14], [76.0, 78.21], [79.0, 80.6], [84.0, 106.42], [107.0, 107.87], [109.0, 110.67], [113.0, 116.29]], "keep_status": [false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 39.82, 0.0, 0.0, 95.37, 0.0, 0.0, 43.08, 53.34, 100.0, 0.0, 100.0, 0.0, 0.0, 52.39], "audiomae_on_audioset": [null, null, [["hum", 29.22], ["music", 18.87], ["gong", 16.58]], null, null, null, null, null, [["sidetone", 16.65], ["fly, housefly", 15.87], ["insect", 10.78]], null, null, null, null, null, null, null], "duration": [1.69, 0.28, 16.73, 1.5, 1.59, 4.68, 1.69, 1.02, 2.58, 12.14, 2.21, 1.6, 22.42, 0.87, 1.67, 3.29]} \ No newline at end of file diff --git a/annotations_1/yKv7A92MoBY_filtered.json b/annotations_1/yKv7A92MoBY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..558d06e4cb8ce2c9f00477744bf547816f662f98 --- /dev/null +++ b/annotations_1/yKv7A92MoBY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.73], [16.0, 16.11], [17.0, 17.63], [19.0, 19.01], [22.0, 28.54], [33.0, 39.21], [40.0, 49.71], [52.0, 52.54], [54.0, 61.52], [66.0, 71.76], [73.0, 76.82], [78.0, 84.77], [86.0, 92.3], [93.0, 93.26], [94.0, 96.13], [99.0, 99.25], [107.0, 108.19], [110.0, 110.61], [112.0, 112.08], [122.0, 121.66], [125.0, 125.91], [126.0, 126.28], [133.0, 133.29], [136.0, 136.97], [142.0, 142.59]], "keep_status": [false, false, false, false, true, false, false, false, false, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.06, 31.86, 31.49, 0.0, 31.9, 31.93, 38.11, 30.6, 48.31, 0.0, 99.31, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 47.73], ["whack, thwack", 15.41], ["synthesizer", 5.71]], [["music", 50.49], ["didgeridoo", 16.67], ["synthesizer", 2.99]], [["music", 53.45], ["speech", 26.66], ["whack, thwack", 3.36]], null, [["music", 44.83], ["speech", 22.96], ["whack, thwack", 16.83]], [["music", 27.25], ["thunk", 21.08], ["whack, thwack", 18.5]], [["music", 60.03], ["throbbing", 5.68], ["electronica", 3.03]], [["music", 28.31], ["whack, thwack", 28.19], ["speech", 10.17]], [["noise", 28.73], ["speech", 20.48], ["music", 11.07]], null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.73, 0.11, 0.63, 0.01, 6.54, 6.21, 9.71, 0.54, 7.52, 5.76, 3.82, 6.77, 6.3, 0.26, 2.13, 0.25, 1.19, 0.61, 0.08, -0.34, 0.91, 0.28, 0.29, 0.97, 0.59]} \ No newline at end of file diff --git a/annotations_1/yKw8Cw13NmY_filtered.json b/annotations_1/yKw8Cw13NmY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70367753c4cb8a4fadb89966c81a5259c5b676e6 --- /dev/null +++ b/annotations_1/yKw8Cw13NmY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 12.14], [13.0, 14.66], [22.0, 25.54], [26.0, 27.33], [28.0, 33.17], [37.0, 80.28], [81.0, 82.85], [84.0, 99.55], [101.0, 101.6], [103.0, 119.25], [120.0, 122.01], [123.0, 123.53], [124.0, 124.88], [125.0, 126.45], [127.0, 127.89]], "keep_status": [false, false, true, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [37.0, 0.0, 30.79, 0.0, 31.52, 0.0, 0.0, 32.83, 0.0, 31.83, 33.54, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 27.62], ["hum", 27.38], ["throbbing", 20.04]], null, [["music", 41.27], ["speech", 18.17], ["hum", 8.86]], null, [["music", 55.53], ["throbbing", 24.51], ["hum", 6.75]], null, null, [["hum", 26.91], ["mains hum", 14.58], ["speech", 12.8]], null, [["music", 21.09], ["hum", 19.37], ["throbbing", 8.18]], [["hum", 32.09], ["mains hum", 24.37], ["music", 16.97]], null, null, null, null], "duration": [2.14, 1.66, 3.54, 1.33, 5.17, 43.28, 1.85, 15.55, 0.6, 16.25, 2.01, 0.53, 0.88, 1.45, 0.89]} \ No newline at end of file diff --git a/annotations_1/yLFZcXeZymY_filtered.json b/annotations_1/yLFZcXeZymY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2bcac7cf2bd70c98a2be6e1b46a26a5312b4f9dc --- /dev/null +++ b/annotations_1/yLFZcXeZymY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.43], [13.0, 15.16], [18.0, 18.3], [21.0, 21.68], [25.0, 25.34], [26.0, 30.28], [33.0, 33.93], [40.0, 42.08], [44.0, 52.52], [53.0, 53.79], [54.0, 56.98], [60.0, 61.16], [64.0, 64.1], [68.0, 68.55], [70.0, 74.78], [77.0, 77.19], [80.0, 82.53], [85.0, 84.91], [89.0, 91.64], [93.0, 94.59], [99.0, 100.67], [104.0, 105.73], [108.0, 109.97], [112.0, 112.31], [113.0, 117.56], [119.0, 124.01]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [44.49, 54.36, 0.0, 0.0, 0.0, 71.87, 0.0, 67.51, 68.41, 0.0, 62.68, 0.0, 0.0, 0.0, 52.56, 0.0, 98.93, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 99.99, 79.76], "audiomae_on_audioset": [[["music", 28.38], ["throbbing", 18.84], ["speech", 16.5]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.43, 2.16, 0.3, 0.68, 0.34, 4.28, 0.93, 2.08, 8.52, 0.79, 2.98, 1.16, 0.1, 0.55, 4.78, 0.19, 2.53, -0.09, 2.64, 1.59, 1.67, 1.73, 1.97, 0.31, 4.56, 5.01]} \ No newline at end of file diff --git a/annotations_1/yLJ5hUWH0yE_filtered.json b/annotations_1/yLJ5hUWH0yE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f0cd42c5c7ab5f13f369dbf890e7f0e3567c2e3 --- /dev/null +++ b/annotations_1/yLJ5hUWH0yE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[75.0, 137.44], [142.0, 143.63], [145.0, 153.66], [157.0, 157.25]], "keep_status": [false, false, true, false], "silence_prob": [0.0, 0.0, 35.99, 0.0], "audiomae_on_audioset": [null, null, [["noise", 23.36], ["speech", 17.3], ["music", 10.93]], null], "duration": [62.44, 1.63, 8.66, 0.25]} \ No newline at end of file diff --git a/annotations_1/yLm_tJ-ZrNc_filtered.json b/annotations_1/yLm_tJ-ZrNc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e10b1fc33e759083db58b933c5cc95ce3db4095f --- /dev/null +++ b/annotations_1/yLm_tJ-ZrNc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.15], [7.0, 10.66], [17.0, 20.87], [21.0, 36.05], [39.0, 39.87], [42.0, 44.9], [46.0, 48.42], [52.0, 52.1], [54.0, 54.35], [64.0, 65.79], [68.0, 70.21], [71.0, 72.12], [75.0, 76.17], [77.0, 81.03], [82.0, 83.27], [84.0, 85.87], [87.0, 87.03], [88.0, 95.15], [96.0, 96.35], [101.0, 101.73], [103.0, 103.32], [105.0, 105.63], [107.0, 117.64], [118.0, 117.69]], "keep_status": [false, false, true, false, false, true, true, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 52.45, 44.57, 50.46, 0.0, 42.96, 47.54, 0.0, 0.0, 0.0, 41.66, 0.0, 0.0, 32.64, 0.0, 0.0, 0.0, 34.04, 0.0, 0.0, 0.0, 0.0, 35.22, 0.0], "audiomae_on_audioset": [null, null, [["music", 55.05], ["mains hum", 7.41], ["musical instrument", 5.17]], null, null, [["mains hum", 27.23], ["hum", 22.67], ["tick", 10.65]], [["hum", 26.33], ["mains hum", 17.76], ["music", 5.57]], null, null, null, [["hum", 20.98], ["mains hum", 12.22], ["music", 9.9]], null, null, [["fly, housefly", 38.1], ["insect", 18.33], ["rumble", 9.01]], null, null, null, [["music", 64.27], ["throbbing", 12.4], ["hum", 3.25]], null, null, null, null, [["music", 55.63], ["hum", 15.5], ["throbbing", 9.74]], null], "duration": [0.15, 3.66, 3.87, 15.05, 0.87, 2.9, 2.42, 0.1, 0.35, 1.79, 2.21, 1.12, 1.17, 4.03, 1.27, 1.87, 0.03, 7.15, 0.35, 0.73, 0.32, 0.63, 10.64, -0.31]} \ No newline at end of file diff --git a/annotations_1/yLtC-gH6ktw_filtered.json b/annotations_1/yLtC-gH6ktw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..68be008f878d8a58d0293b54ce1fa872edae5c19 --- /dev/null +++ b/annotations_1/yLtC-gH6ktw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 10.67], [12.0, 16.7], [20.0, 21.54], [24.0, 26.76], [29.0, 29.44], [33.0, 37.49], [38.0, 38.84], [40.0, 50.21], [52.0, 57.03], [58.0, 59.81], [61.0, 62.46], [65.0, 65.3], [67.0, 68.01], [69.0, 70.14], [72.0, 73.74], [75.0, 75.39], [76.0, 78.97], [80.0, 85.28], [86.0, 86.93], [94.0, 96.15], [98.0, 100.2], [102.0, 102.79], [107.0, 109.39], [112.0, 116.36], [117.0, 118.67], [119.0, 120.82], [122.0, 123.97], [126.0, 128.8], [132.0, 132.88], [135.0, 136.09], [138.0, 138.77], [145.0, 145.07], [147.0, 148.0], [152.0, 153.37], [154.0, 155.39], [159.0, 166.89]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.47, 92.97, 0.0, 64.52, 0.0, 82.25, 0.0, 93.91, 96.89, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.7, 86.27, 0.0, 91.3, 73.97, 0.0, 80.46, 92.97, 0.0, 0.0, 0.0, 51.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.91], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.67, 4.7, 1.54, 2.76, 0.44, 4.49, 0.84, 10.21, 5.03, 1.81, 1.46, 0.3, 1.01, 1.14, 1.74, 0.39, 2.97, 5.28, 0.93, 2.15, 2.2, 0.79, 2.39, 4.36, 1.67, 1.82, 1.97, 2.8, 0.88, 1.09, 0.77, 0.07, 1.0, 1.37, 1.39, 7.89]} \ No newline at end of file diff --git a/annotations_1/yMiJp1nYlNA_filtered.json b/annotations_1/yMiJp1nYlNA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ae6e75867c793a57b7dceb91ed470c72010e8d36 --- /dev/null +++ b/annotations_1/yMiJp1nYlNA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.38], [2.0, 4.31], [7.0, 10.59], [12.0, 12.07], [14.0, 16.39], [20.0, 21.54], [22.0, 27.57], [28.0, 34.86], [39.0, 39.5], [40.0, 40.09], [43.0, 44.25], [45.0, 46.84], [52.0, 52.95], [56.0, 59.73], [62.0, 62.4], [74.0, 74.7], [80.0, 81.7], [84.0, 84.69], [86.0, 86.68], [91.0, 92.84], [94.0, 94.34], [97.0, 98.61], [100.0, 100.41], [101.0, 104.23], [110.0, 112.58], [119.0, 120.8], [124.0, 125.17], [126.0, 128.55], [130.0, 133.59], [135.0, 140.44], [144.0, 144.86], [159.0, 159.88], [160.0, 161.64]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.5, 99.98, 0.0, 100.0, 0.0, 66.15, 37.84, 0.0, 0.0, 0.0, 0.0, 0.0, 35.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.66, 29.24, 0.0, 0.0, 53.78, 100.0, 100.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 42.82], ["music", 14.44], ["effects unit", 7.17]], null, null, null, null, null, [["theremin", 33.01], ["music", 29.12], ["speech", 12.02]], null, null, null, null, null, [["howl", 16.97], ["hum", 7.26], ["mains hum", 6.45]], null, null, null, null, null, null, null, null, null, [["speech", 63.07], ["inside, small room", 6.24], ["whimper", 4.59]], [["music", 59.67], ["carnatic music", 12.6], ["musical instrument", 6.25]], null, null, null, null, null, null, null, null], "duration": [0.38, 2.31, 3.59, 0.07, 2.39, 1.54, 5.57, 6.86, 0.5, 0.09, 1.25, 1.84, 0.95, 3.73, 0.4, 0.7, 1.7, 0.69, 0.68, 1.84, 0.34, 1.61, 0.41, 3.23, 2.58, 1.8, 1.17, 2.55, 3.59, 5.44, 0.86, 0.88, 1.64]} \ No newline at end of file diff --git a/annotations_1/yMyXgCLhAXk_filtered.json b/annotations_1/yMyXgCLhAXk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..993a4bc2990e4792f659f9e42202dfa2be2e6d38 --- /dev/null +++ b/annotations_1/yMyXgCLhAXk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 20.53], [29.0, 31.13], [33.0, 47.33], [49.0, 66.8], [69.0, 69.33], [70.0, 77.6], [83.0, 84.28], [86.0, 86.85]], "keep_status": [false, true, true, false, false, true, false, false], "silence_prob": [35.4, 40.12, 35.19, 39.18, 0.0, 37.84, 0.0, 0.0], "audiomae_on_audioset": [[["music", 63.15], ["telephone dialing, dtmf", 10.76], ["synthesizer", 6.23]], [["music", 48.92], ["speech", 6.42], ["throbbing", 5.82]], [["music", 44.09], ["hum", 17.34], ["throbbing", 8.42]], [["music", 72.85], ["hum", 2.19], ["musical instrument", 1.93]], null, [["music", 54.92], ["hum", 10.37], ["gong", 4.5]], null, null], "duration": [18.53, 2.13, 14.33, 17.8, 0.33, 7.6, 1.28, 0.85]} \ No newline at end of file diff --git a/annotations_1/yNhbLL3Xvcw_filtered.json b/annotations_1/yNhbLL3Xvcw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b14bdac2b3e9f6388550d3271b028cf3f08cff4f --- /dev/null +++ b/annotations_1/yNhbLL3Xvcw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.13], [6.0, 14.76], [19.0, 19.43], [26.0, 34.69], [37.0, 45.1], [48.0, 56.42], [59.0, 61.42], [61.0, 61.47], [62.0, 65.2]], "keep_status": [false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 64.18, 0.0, 92.48, 79.24, 31.74, 85.9, 0.0, 87.37], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 45.78], ["music", 15.89], ["outside, urban or manmade", 3.07]], null, null, null], "duration": [1.13, 8.76, 0.43, 8.69, 8.1, 8.42, 2.42, 0.47, 3.2]} \ No newline at end of file diff --git a/annotations_1/yNmBX5mZvRw_filtered.json b/annotations_1/yNmBX5mZvRw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2f95c10b6a5f2c17962e1a73807f8ea337b7362 --- /dev/null +++ b/annotations_1/yNmBX5mZvRw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 24.98], [26.0, 26.94], [27.0, 28.32], [28.0, 28.41], [28.0, 28.92], [30.0, 33.24], [35.0, 45.62], [46.0, 49.55], [50.0, 60.37], [65.0, 66.43], [70.0, 71.73], [77.0, 77.4], [78.0, 78.7], [85.0, 86.41], [87.0, 88.48], [89.0, 90.88], [95.0, 95.55], [97.0, 98.68], [99.0, 102.76], [104.0, 112.95], [115.0, 115.72], [117.0, 117.32], [118.0, 117.81], [119.0, 118.64], [121.0, 121.63], [123.0, 123.6], [124.0, 125.0], [125.0, 125.54], [126.0, 126.23], [127.0, 126.79], [127.0, 128.21]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [37.69, 0.0, 0.0, 0.0, 0.0, 49.87, 60.23, 40.61, 38.03, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.29, 41.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 92.59], ["stomach rumble", 2.36], ["television", 0.59]], null, null, null, null, [["insect", 6.58], ["zipper (clothing)", 4.88], ["buzz", 4.71]], null, [["fly, housefly", 44.2], ["insect", 29.37], ["bee, wasp, etc.", 19.2]], [["insect", 40.36], ["fly, housefly", 36.22], ["bee, wasp, etc.", 8.1]], null, null, null, null, null, null, null, null, null, [["fly, housefly", 61.34], ["insect", 19.87], ["bee, wasp, etc.", 14.41]], [["fly, housefly", 41.49], ["insect", 25.96], ["bee, wasp, etc.", 23.64]], null, null, null, null, null, null, null, null, null, null, null], "duration": [3.98, 0.94, 1.32, 0.41, 0.92, 3.24, 10.62, 3.55, 10.37, 1.43, 1.73, 0.4, 0.7, 1.41, 1.48, 1.88, 0.55, 1.68, 3.76, 8.95, 0.72, 0.32, -0.19, -0.36, 0.63, 0.6, 1.0, 0.54, 0.23, -0.21, 1.21]} \ No newline at end of file diff --git a/annotations_1/yPJlBsQE96o_filtered.json b/annotations_1/yPJlBsQE96o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b2a683cf25127e5ef1c869566f7609a8562cd56c --- /dev/null +++ b/annotations_1/yPJlBsQE96o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 7.4], [10.0, 11.03], [16.0, 16.16], [18.0, 20.21], [26.0, 30.38], [31.0, 30.57], [31.0, 32.17], [34.0, 37.83], [40.0, 41.67], [44.0, 45.32], [51.0, 52.29], [54.0, 55.17], [57.0, 60.62], [64.0, 63.85], [65.0, 69.48], [72.0, 73.41], [75.0, 76.65], [83.0, 83.98], [90.0, 94.46], [95.0, 94.53], [95.0, 94.56], [95.0, 94.59], [95.0, 94.63], [95.0, 102.91], [109.0, 112.08], [118.0, 131.3], [132.0, 132.83]], "keep_status": [false, false, false, false, true, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 40.45, 36.45, 0.0, 0.0, 38.79, 0.0, 0.0, 0.0, 0.0, 36.67, 0.0, 34.03, 0.0, 0.0, 0.0, 31.85, 0.0, 0.0, 0.0, 0.0, 31.16, 39.25, 32.45, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 73.05], ["synthesizer", 4.92], ["musical instrument", 2.61]], [["music", 56.55], ["piano", 5.42], ["keyboard (musical)", 5.15]], null, null, [["music", 50.2], ["synthesizer", 12.63], ["electric piano", 6.35]], null, null, null, null, [["music", 56.07], ["musical instrument", 6.24], ["plucked string instrument", 3.61]], null, [["music", 50.54], ["synthesizer", 14.77], ["electric piano", 5.19]], null, null, null, [["music", 83.64], ["guitar", 3.96], ["plucked string instrument", 3.56]], null, null, null, null, [["music", 71.77], ["musical instrument", 4.74], ["synthesizer", 2.9]], [["music", 47.95], ["effects unit", 7.06], ["didgeridoo", 6.23]], [["music", 73.99], ["guitar", 2.83], ["musical instrument", 2.69]], null], "duration": [1.4, 1.03, 0.16, 2.21, 4.38, -0.43, 1.17, 3.83, 1.67, 1.32, 1.29, 1.17, 3.62, -0.15, 4.48, 1.41, 1.65, 0.98, 4.46, -0.47, -0.44, -0.41, -0.37, 7.91, 3.08, 13.3, 0.83]} \ No newline at end of file diff --git a/annotations_1/yQ62WM_w2iM_filtered.json b/annotations_1/yQ62WM_w2iM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..41cc5d4f801ee852143d52f3b3a9052473f73e55 --- /dev/null +++ b/annotations_1/yQ62WM_w2iM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 27.09], [30.0, 60.66], [61.0, 60.71], [64.0, 67.14], [69.0, 70.85], [73.0, 73.85], [76.0, 76.62], [78.0, 78.56], [81.0, 84.97], [89.0, 90.29], [94.0, 97.28], [102.0, 103.0], [116.0, 122.05], [128.0, 127.94], [146.0, 146.38], [150.0, 150.6], [153.0, 153.01], [161.0, 161.67], [163.0, 167.53]], "keep_status": [false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [29.79, 0.0, 0.0, 30.55, 0.0, 0.0, 0.0, 0.0, 36.36, 0.0, 30.72, 0.0, 31.39, 0.0, 0.0, 0.0, 0.0, 0.0, 30.71], "audiomae_on_audioset": [[["music", 58.63], ["trombone", 8.51], ["brass instrument", 8.02]], null, null, [["explosion", 34.91], ["burst, pop", 26.62], ["gunshot, gunfire", 8.24]], null, null, null, null, [["speech", 60.55], ["hum", 6.71], ["sidetone", 4.5]], null, [["cattle, bovinae", 22.7], ["livestock, farm animals, working animals", 16.91], ["animal", 12.02]], null, [["cattle, bovinae", 39.54], ["speech", 23.18], ["moo", 19.09]], null, null, null, null, null, [["music", 36.79], ["trombone", 19.97], ["brass instrument", 10.57]]], "duration": [4.09, 30.66, -0.29, 3.14, 1.85, 0.85, 0.62, 0.56, 3.97, 1.29, 3.28, 1.0, 6.05, -0.06, 0.38, 0.6, 0.01, 0.67, 4.53]} \ No newline at end of file diff --git a/annotations_1/yQVdwJcerjw_filtered.json b/annotations_1/yQVdwJcerjw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b9b38bf2169d3ea50e83a0393ec701d5a7169bd2 --- /dev/null +++ b/annotations_1/yQVdwJcerjw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.55], [14.0, 14.93], [16.0, 24.97], [26.0, 38.89], [48.0, 49.74], [67.0, 67.15], [69.0, 69.67], [76.0, 76.86], [87.0, 87.88], [92.0, 92.79], [111.0, 111.35], [114.0, 114.03], [115.0, 115.87], [119.0, 119.15], [120.0, 120.87], [123.0, 123.63], [124.0, 125.0], [127.0, 129.44], [132.0, 131.99], [135.0, 136.31], [147.0, 149.82], [152.0, 153.18], [156.0, 156.69], [159.0, 160.81], [161.0, 162.08], [168.0, 168.47]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 41.05, 34.78, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.2, 0.0, 0.0, 98.86, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 56.71], ["smash, crash", 11.07], ["synthesizer", 2.54]], [["animal", 35.49], ["roaring cats (lions, tigers)", 18.45], ["wild animals", 9.2]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 0.93, 8.97, 12.89, 1.74, 0.15, 0.67, 0.86, 0.88, 0.79, 0.35, 0.03, 0.87, 0.15, 0.87, 0.63, 1.0, 2.44, -0.01, 1.31, 2.82, 1.18, 0.69, 1.81, 1.08, 0.47]} \ No newline at end of file diff --git a/annotations_1/yQXi94aNwBU_filtered.json b/annotations_1/yQXi94aNwBU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..156a2b22e9305d56373ef8fea943d8f6aee30826 --- /dev/null +++ b/annotations_1/yQXi94aNwBU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.39], [3.0, 3.87], [5.0, 5.76], [17.0, 19.31], [22.0, 23.3], [26.0, 32.59], [34.0, 35.97], [40.0, 41.61], [42.0, 42.47], [43.0, 47.58], [51.0, 59.51], [66.0, 68.45], [69.0, 70.29], [72.0, 79.34], [82.0, 88.16], [89.0, 89.36], [96.0, 101.19], [105.0, 133.44], [135.0, 141.08], [142.0, 148.44], [149.0, 153.94], [160.0, 159.6], [166.0, 167.39], [168.0, 169.26], [169.0, 174.77], [175.0, 177.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 99.62, 0.0, 81.71, 0.0, 0.0, 0.0, 84.07, 73.36, 59.33, 0.0, 76.37, 52.98, 0.0, 60.23, 47.78, 98.8, 98.73, 49.04, 0.0, 0.0, 0.0, 60.7, 46.64], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 53.62], ["speech", 14.98], ["mains hum", 10.84]], null, null, [["speech", 71.87], ["chirp tone", 12.4], ["sine wave", 4.46]], null, null, null, null, [["music", 19.6], ["speech", 18.61], ["grunt", 16.33]]], "duration": [1.39, 0.87, 0.76, 2.31, 1.3, 6.59, 1.97, 1.61, 0.47, 4.58, 8.51, 2.45, 1.29, 7.34, 6.16, 0.36, 5.19, 28.44, 6.08, 6.44, 4.94, -0.4, 1.39, 1.26, 5.77, 2.03]} \ No newline at end of file diff --git a/annotations_1/yQpFQFL-YLI_filtered.json b/annotations_1/yQpFQFL-YLI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ad2acb8fc3b4dc3c03542846e46cd7873f74134b --- /dev/null +++ b/annotations_1/yQpFQFL-YLI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.11], [4.0, 7.59], [9.0, 10.96], [13.0, 13.54], [22.0, 25.07], [30.0, 34.25], [34.0, 36.32], [41.0, 41.84], [44.0, 47.21], [52.0, 54.53], [56.0, 57.69], [60.0, 62.45], [64.0, 72.93], [75.0, 106.1], [112.0, 118.62], [124.0, 126.86], [131.0, 130.86], [133.0, 168.67], [170.0, 187.93]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, true, false, false, false], "silence_prob": [57.64, 98.19, 0.0, 0.0, 98.8, 98.86, 94.07, 0.0, 49.4, 40.14, 0.0, 48.95, 41.95, 0.0, 30.82, 32.5, 0.0, 0.0, 30.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["speech", 55.18], ["music", 11.2], ["sidetone", 8.51]], [["speech", 55.99], ["sidetone", 20.42], ["dial tone", 3.71]], null, [["splinter", 17.34], ["mains hum", 5.68], ["hum", 4.96]], [["insect", 14.36], ["frog", 11.58], ["speech", 11.41]], null, [["music", 60.0], ["hum", 8.49], ["throbbing", 3.91]], [["moo", 15.53], ["cattle, bovinae", 15.3], ["livestock, farm animals, working animals", 8.9]], null, null, [["music", 54.87], ["hum", 17.11], ["scary music", 6.17]]], "duration": [2.11, 3.59, 1.96, 0.54, 3.07, 4.25, 2.32, 0.84, 3.21, 2.53, 1.69, 2.45, 8.93, 31.1, 6.62, 2.86, -0.14, 35.67, 17.93]} \ No newline at end of file diff --git a/annotations_1/yR3zsO8pCMw_filtered.json b/annotations_1/yR3zsO8pCMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2692dab56448ce246fb8ebe4245a633c4ede0c0e --- /dev/null +++ b/annotations_1/yR3zsO8pCMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.89], [5.0, 6.98], [9.0, 10.57], [12.0, 15.13], [16.0, 17.1], [19.0, 20.04], [21.0, 47.38], [48.0, 50.19], [53.0, 52.78], [55.0, 70.09], [73.0, 77.08], [83.0, 102.73], [104.0, 104.68]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 56.55, 0.0, 0.0, 37.21, 46.79, 0.0, 42.26, 30.12, 29.85, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["mains hum", 40.08], ["hum", 28.16], ["music", 18.52]], [["throbbing", 25.59], ["hum", 18.36], ["fly, housefly", 15.71]], null, [["speech", 32.76], ["hum", 28.59], ["mains hum", 8.93]], [["burst, pop", 15.19], ["speech", 13.94], ["eruption", 10.63]], [["music", 48.38], ["vehicle", 5.63], ["didgeridoo", 5.4]], null], "duration": [0.89, 1.98, 1.57, 3.13, 1.1, 1.04, 26.38, 2.19, -0.22, 15.09, 4.08, 19.73, 0.68]} \ No newline at end of file diff --git a/annotations_1/yRlyvNmVWK0_filtered.json b/annotations_1/yRlyvNmVWK0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c47d7b6d82bfff35f58ab6b9b46a787b6356c04 --- /dev/null +++ b/annotations_1/yRlyvNmVWK0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.44], [3.0, 3.87], [5.0, 6.0], [7.0, 7.33], [8.0, 10.0], [12.0, 12.24], [16.0, 18.74], [23.0, 24.73], [27.0, 40.02], [43.0, 49.01], [52.0, 114.94], [117.0, 117.83], [120.0, 127.25], [130.0, 132.9], [137.0, 139.09], [139.0, 141.02], [143.0, 146.28], [149.0, 149.34]], "keep_status": [false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.96, 0.0, 92.64, 0.0, 47.39, 35.22, 0.0, 0.0, 81.35, 80.29, 75.07, 52.1, 79.76, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["hum", 35.43], ["mains hum", 18.63], ["chirp tone", 13.31]], [["speech", 36.27], ["thunk", 17.55], ["thump, thud", 6.21]], null, null, null, null, null, null, null, null], "duration": [1.44, 0.87, 1.0, 0.33, 2.0, 0.24, 2.74, 1.73, 13.02, 6.01, 62.94, 0.83, 7.25, 2.9, 2.09, 2.02, 3.28, 0.34]} \ No newline at end of file diff --git a/annotations_1/ySC245RIiD8_filtered.json b/annotations_1/ySC245RIiD8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e811c2a5e362a37119a3b903c1fb3fa778dccd8 --- /dev/null +++ b/annotations_1/ySC245RIiD8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.26], [7.0, 8.9], [11.0, 12.45], [16.0, 16.9], [17.0, 17.93], [22.0, 22.37], [24.0, 26.01], [27.0, 27.75], [29.0, 31.41], [33.0, 33.96], [36.0, 37.61], [41.0, 42.01], [44.0, 44.0], [47.0, 47.09]], "keep_status": [false, false, false, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.0, 0.0, 44.57, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["sonar", 25.36], ["hum", 21.38], ["chirp tone", 16.0]], null, [["hum", 38.0], ["chirp tone", 11.74], ["throbbing", 8.31]], null, null, null, null, null], "duration": [1.26, 1.9, 1.45, 0.9, 0.93, 0.37, 2.01, 0.75, 2.41, 0.96, 1.61, 1.01, 0.0, 0.09]} \ No newline at end of file diff --git a/annotations_1/yV5UTHVjMME_filtered.json b/annotations_1/yV5UTHVjMME_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..aaaabf9885b865f8a15e27b4d8c7740b1e877924 --- /dev/null +++ b/annotations_1/yV5UTHVjMME_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.27], [14.0, 13.95], [50.0, 49.91], [52.0, 52.07], [59.0, 58.92], [64.0, 64.72], [67.0, 67.56], [77.0, 77.26], [84.0, 85.4], [92.0, 93.02], [95.0, 95.0], [97.0, 100.35], [105.0, 108.6], [113.0, 115.11], [116.0, 116.73], [119.0, 119.74], [122.0, 122.1], [123.0, 124.19], [138.0, 138.67], [147.0, 148.74], [166.0, 166.72], [182.0, 186.39], [206.0, 206.69], [209.0, 209.73], [214.0, 214.3], [215.0, 216.21]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 89.01, 73.36, 68.02, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.6, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 29.95], ["moo", 28.68], ["livestock, farm animals, working animals", 21.1]], null, null, null, null], "duration": [1.27, -0.05, -0.09, 0.07, -0.08, 0.72, 0.56, 0.26, 1.4, 1.02, 0.0, 3.35, 3.6, 2.11, 0.73, 0.74, 0.1, 1.19, 0.67, 1.74, 0.72, 4.39, 0.69, 0.73, 0.3, 1.21]} \ No newline at end of file diff --git a/annotations_1/yV5w71aImSo_filtered.json b/annotations_1/yV5w71aImSo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..84b9f82f2f7128e823f4a95ab3bdbdc1de0b5991 --- /dev/null +++ b/annotations_1/yV5w71aImSo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 107.92], [109.0, 109.49], [113.0, 114.66], [116.0, 118.02], [118.0, 119.21], [124.0, 124.73], [126.0, 130.4], [131.0, 131.5], [133.0, 137.35], [142.0, 142.48]], "keep_status": [false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 64.07, 0.0, 0.0, 54.7, 0.0, 63.85, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null], "duration": [87.92, 0.49, 1.66, 2.02, 1.21, 0.73, 4.4, 0.5, 4.35, 0.48]} \ No newline at end of file diff --git a/annotations_1/yVRmafc7cqQ_filtered.json b/annotations_1/yVRmafc7cqQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..69fa68731c56eb9cc9edb5ca392bed7757c47910 --- /dev/null +++ b/annotations_1/yVRmafc7cqQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.26], [17.0, 18.37], [23.0, 23.75], [32.0, 32.34], [33.0, 34.25], [37.0, 39.83], [41.0, 42.79], [49.0, 50.14], [55.0, 56.42], [60.0, 59.86], [71.0, 72.23], [73.0, 73.3], [76.0, 76.23], [79.0, 79.3], [80.0, 82.98], [84.0, 84.54], [96.0, 95.96], [98.0, 99.76], [100.0, 101.48], [102.0, 105.0], [108.0, 108.75], [111.0, 116.11]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 0.0, 0.0, 0.0, 97.54, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.26, 1.37, 0.75, 0.34, 1.25, 2.83, 1.79, 1.14, 1.42, -0.14, 1.23, 0.3, 0.23, 0.3, 2.98, 0.54, -0.04, 1.76, 1.48, 3.0, 0.75, 5.11]} \ No newline at end of file diff --git a/annotations_1/yWGLNaCYevk_filtered.json b/annotations_1/yWGLNaCYevk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1beb182991df93e2b69cbe658b6ca12842f872f1 --- /dev/null +++ b/annotations_1/yWGLNaCYevk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 30.43], [37.0, 53.96], [56.0, 143.95], [145.0, 181.38], [182.0, 198.81]], "keep_status": [false, false, false, false, true], "silence_prob": [56.1, 57.81, 0.0, 0.0, 35.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 27.83], ["throbbing", 20.66], ["music", 19.41]]], "duration": [18.43, 16.96, 87.95, 36.38, 16.81]} \ No newline at end of file diff --git a/annotations_1/yWP5eC822Ac_filtered.json b/annotations_1/yWP5eC822Ac_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..7a706d383ca9b05d6b39c9091160395d88c22f1e --- /dev/null +++ b/annotations_1/yWP5eC822Ac_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 17.98], [19.0, 20.95], [22.0, 24.46], [26.0, 29.62], [31.0, 34.72], [36.0, 39.34], [41.0, 54.57], [57.0, 65.01], [66.0, 67.05], [69.0, 79.49], [83.0, 96.03], [96.0, 109.86], [112.0, 114.4], [115.0, 141.64], [142.0, 189.5], [193.0, 194.12], [195.0, 196.48], [198.0, 199.2], [200.0, 201.19]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 40.71, 63.1, 59.24, 57.32, 48.87, 60.79, 0.0, 38.17, 37.66, 39.96, 75.72, 29.67, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["music", 19.25], ["speech", 13.33], ["foghorn", 8.4]], null, null, null, [["music", 61.54], ["theremin", 12.97], ["ambient music", 5.1]], null, null, [["music", 56.87], ["foghorn", 9.04], ["didgeridoo", 6.61]], [["music", 43.74], ["theremin", 33.63], ["musical instrument", 4.33]], [["music", 63.17], ["didgeridoo", 10.98], ["foghorn", 5.33]], null, [["music", 32.14], ["speech", 15.96], ["mains hum", 9.73]], null, null, null, null, null], "duration": [1.98, 1.95, 2.46, 3.62, 3.72, 3.34, 13.57, 8.01, 1.05, 10.49, 13.03, 13.86, 2.4, 26.64, 47.5, 1.12, 1.48, 1.2, 1.19]} \ No newline at end of file diff --git a/annotations_1/yWSRVYU_JMo_filtered.json b/annotations_1/yWSRVYU_JMo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..afbf9c632a7ad8a2ce29b7d5cf4ce54a0cf49416 --- /dev/null +++ b/annotations_1/yWSRVYU_JMo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 49.76], [86.0, 86.31]], "keep_status": [false, false], "silence_prob": [36.16, 0.0], "audiomae_on_audioset": [[["music", 74.86], ["keyboard (musical)", 4.79], ["piano", 3.89]], null], "duration": [19.76, 0.31]} \ No newline at end of file diff --git a/annotations_1/yWeMWD-Yagg_filtered.json b/annotations_1/yWeMWD-Yagg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..692a004d10d7528f5131068dfabccc2bc9953372 --- /dev/null +++ b/annotations_1/yWeMWD-Yagg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 28.34], [33.0, 36.17], [69.0, 68.99], [85.0, 87.1], [104.0, 105.41], [116.0, 116.26]], "keep_status": [false, false, false, true, false, false], "silence_prob": [0.0, 77.53, 0.0, 46.26, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["hum", 18.78], ["speech", 15.66], ["sidetone", 12.07]], null, null], "duration": [1.34, 3.17, -0.01, 2.1, 1.41, 0.26]} \ No newline at end of file diff --git a/annotations_1/yWu4GUFpwWo_filtered.json b/annotations_1/yWu4GUFpwWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..713ddffc583408954eda762c2609c198adbd3ffa --- /dev/null +++ b/annotations_1/yWu4GUFpwWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.98], [5.0, 5.26], [6.0, 7.06], [8.0, 9.85], [14.0, 15.23]], "keep_status": [false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null], "duration": [1.98, 0.26, 1.06, 1.85, 1.23]} \ No newline at end of file diff --git a/annotations_1/yXDgPREBssw_filtered.json b/annotations_1/yXDgPREBssw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..66005f8f272a3c55ea5f0cb5949169bd6053023a --- /dev/null +++ b/annotations_1/yXDgPREBssw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.57], [4.0, 12.14], [14.0, 14.15], [15.0, 17.24], [21.0, 33.03], [44.0, 48.61], [51.0, 54.62], [58.0, 65.4], [69.0, 73.99], [75.0, 76.96], [78.0, 78.34], [80.0, 83.3], [85.0, 87.94], [88.0, 91.12], [93.0, 94.46], [97.0, 97.01], [100.0, 100.84], [103.0, 104.28], [106.0, 107.62], [112.0, 113.41], [114.0, 115.21], [116.0, 117.31], [119.0, 119.85], [122.0, 124.31], [125.0, 126.57], [129.0, 131.01], [133.0, 133.49], [140.0, 140.26], [143.0, 144.26], [145.0, 146.1], [148.0, 149.81], [158.0, 158.58], [159.0, 159.68], [167.0, 167.05], [169.0, 170.23], [172.0, 178.71]], "keep_status": [false, false, false, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 99.97, 0.0, 32.19, 31.11, 30.68, 31.97, 31.81, 31.5, 0.0, 0.0, 100.0, 100.0, 80.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.95, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, [["sidetone", 15.28], ["music", 11.84], ["throbbing", 10.74]], [["speech", 46.41], ["music", 11.86], ["whack, thwack", 10.01]], [["music", 35.37], ["speech", 7.62], ["groan", 5.59]], [["sidetone", 31.96], ["speech", 23.63], ["music", 8.52]], [["music", 20.04], ["groan", 13.31], ["sidetone", 12.68]], [["speech", 32.26], ["fly, housefly", 9.02], ["groan", 8.31]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.57, 8.14, 0.15, 2.24, 12.03, 4.61, 3.62, 7.4, 4.99, 1.96, 0.34, 3.3, 2.94, 3.12, 1.46, 0.01, 0.84, 1.28, 1.62, 1.41, 1.21, 1.31, 0.85, 2.31, 1.57, 2.01, 0.49, 0.26, 1.26, 1.1, 1.81, 0.58, 0.68, 0.05, 1.23, 6.71]} \ No newline at end of file diff --git a/annotations_1/yYCVu5ZSki0_filtered.json b/annotations_1/yYCVu5ZSki0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfb9358b223385f69dbe3b8de6d23a2520595256 --- /dev/null +++ b/annotations_1/yYCVu5ZSki0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[29.0, 30.27], [31.0, 31.67], [32.0, 33.07], [35.0, 36.41], [43.0, 43.5], [48.0, 59.73], [68.0, 67.96], [78.0, 78.56], [89.0, 91.03], [100.0, 102.68], [113.0, 113.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 64.41, 60.98, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["telephone bell ringing", 60.38], ["music", 30.56], ["telephone", 2.72]], null, null, null, null, null], "duration": [1.27, 0.67, 1.07, 1.41, 0.5, 11.73, -0.04, 0.56, 2.03, 2.68, 0.75]} \ No newline at end of file diff --git a/annotations_1/yYQtZCaPFaM_filtered.json b/annotations_1/yYQtZCaPFaM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2ad458ecab110441b023bb7044a175298f025739 --- /dev/null +++ b/annotations_1/yYQtZCaPFaM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 11.18], [15.0, 20.83], [23.0, 25.95], [26.0, 36.39], [37.0, 37.77], [38.0, 43.78], [45.0, 68.37], [70.0, 71.81], [74.0, 78.73], [80.0, 88.45], [91.0, 92.04], [92.0, 92.91], [95.0, 107.81], [108.0, 109.16], [110.0, 110.42], [111.0, 112.87], [115.0, 122.86], [125.0, 126.01], [135.0, 138.7], [139.0, 142.42], [144.0, 148.95]], "keep_status": [true, true, true, true, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [35.77, 48.14, 48.23, 37.97, 0.0, 37.06, 34.3, 0.0, 35.8, 43.82, 0.0, 0.0, 40.22, 0.0, 0.0, 0.0, 51.99, 0.0, 63.74, 40.09, 36.54], "audiomae_on_audioset": [[["music", 53.12], ["ambient music", 11.01], ["synthesizer", 4.74]], [["music", 22.01], ["hum", 18.95], ["mains hum", 13.46]], [["music", 52.77], ["singing bowl", 9.55], ["synthesizer", 5.4]], [["music", 46.48], ["synthesizer", 13.32], ["hum", 8.93]], null, [["music", 33.3], ["hum", 18.33], ["speech", 10.36]], [["music", 61.71], ["ambient music", 6.79], ["synthesizer", 5.43]], null, [["music", 60.71], ["synthesizer", 7.8], ["musical instrument", 4.61]], [["music", 44.78], ["ambient music", 13.02], ["synthesizer", 11.9]], null, null, [["music", 36.13], ["singing bowl", 21.91], ["theremin", 19.08]], null, null, null, null, null, null, [["speech", 47.67], ["music", 17.05], ["hum", 4.06]], [["music", 56.86], ["ambient music", 10.31], ["synthesizer", 7.44]]], "duration": [9.18, 5.83, 2.95, 10.39, 0.77, 5.78, 23.37, 1.81, 4.73, 8.45, 1.04, 0.91, 12.81, 1.16, 0.42, 1.87, 7.86, 1.01, 3.7, 3.42, 4.95]} \ No newline at end of file diff --git a/annotations_1/yZ773W4UICY_filtered.json b/annotations_1/yZ773W4UICY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..504847036a83549f1b5ce54bd500243ebb544fb0 --- /dev/null +++ b/annotations_1/yZ773W4UICY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.82], [7.0, 6.99], [8.0, 9.07], [10.0, 10.49], [13.0, 12.97], [32.0, 43.6], [44.0, 46.4], [48.0, 47.82], [51.0, 58.9], [88.0, 88.2], [90.0, 90.36], [93.0, 93.19]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 39.12, 47.62, 0.0, 54.1, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["speech", 62.53], ["radio", 9.04], ["burping, eructation", 1.99]], [["animal", 15.77], ["speech", 11.35], ["insect", 6.59]], null, null, null, null, null], "duration": [0.82, -0.01, 1.07, 0.49, -0.03, 11.6, 2.4, -0.18, 7.9, 0.2, 0.36, 0.19]} \ No newline at end of file diff --git a/annotations_1/yZgf5wSULog_filtered.json b/annotations_1/yZgf5wSULog_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..30a8bb73ed763ce0ad145a13153150e16c7e5c9b --- /dev/null +++ b/annotations_1/yZgf5wSULog_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.59], [4.0, 3.84], [6.0, 5.9], [8.0, 9.0], [10.0, 23.94], [26.0, 32.88], [33.0, 36.05], [37.0, 47.43], [51.0, 51.46], [53.0, 53.28], [53.0, 55.53], [56.0, 55.71], [56.0, 56.02], [56.0, 56.05], [57.0, 56.79], [59.0, 63.05], [66.0, 69.18], [76.0, 80.82], [88.0, 96.5], [102.0, 109.0], [110.0, 110.2], [117.0, 123.89], [125.0, 140.46], [146.0, 146.47], [150.0, 172.03], [173.0, 176.15], [177.0, 176.88], [180.0, 182.16], [183.0, 184.77], [187.0, 192.59], [194.0, 196.37], [197.0, 197.97], [201.0, 205.73], [207.0, 209.87]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, true, true], "silence_prob": [37.98, 0.0, 0.0, 0.0, 35.05, 35.07, 35.91, 34.36, 0.0, 0.0, 37.03, 0.0, 0.0, 0.0, 0.0, 40.7, 40.21, 35.86, 38.21, 36.65, 0.0, 37.84, 39.35, 0.0, 45.43, 52.1, 0.0, 54.83, 0.0, 43.82, 51.94, 0.0, 43.0, 48.91], "audiomae_on_audioset": [[["music", 19.65], ["singing bowl", 14.27], ["sine wave", 7.91]], null, null, null, [["music", 52.07], ["electronic music", 9.93], ["musical instrument", 5.36]], [["music", 63.67], ["musical instrument", 6.39], ["synthesizer", 5.61]], [["music", 56.58], ["synthesizer", 6.11], ["throbbing", 5.07]], [["music", 72.12], ["didgeridoo", 5.19], ["hum", 5.02]], null, null, [["music", 53.38], ["didgeridoo", 19.85], ["musical instrument", 3.44]], null, null, null, null, [["music", 63.69], ["synthesizer", 6.06], ["musical instrument", 4.37]], [["music", 65.54], ["synthesizer", 8.1], ["musical instrument", 4.27]], [["music", 60.24], ["didgeridoo", 8.2], ["synthesizer", 6.95]], [["music", 59.82], ["synthesizer", 6.18], ["sampler", 3.66]], [["music", 61.19], ["synthesizer", 5.73], ["didgeridoo", 5.51]], null, [["music", 72.32], ["didgeridoo", 9.2], ["speech", 3.01]], [["music", 61.33], ["didgeridoo", 12.44], ["synthesizer", 5.88]], null, [["music", 55.91], ["musical instrument", 9.34], ["orchestra", 3.56]], null, null, null, null, [["music", 50.18], ["throbbing", 12.48], ["hum", 8.57]], null, null, [["music", 54.6], ["throbbing", 4.56], ["livestock, farm animals, working animals", 3.67]], [["music", 53.92], ["throbbing", 3.51], ["musical instrument", 2.87]]], "duration": [2.59, -0.16, -0.1, 1.0, 13.94, 6.88, 3.05, 10.43, 0.46, 0.28, 2.53, -0.29, 0.02, 0.05, -0.21, 4.05, 3.18, 4.82, 8.5, 7.0, 0.2, 6.89, 15.46, 0.47, 22.03, 3.15, -0.12, 2.16, 1.77, 5.59, 2.37, 0.97, 4.73, 2.87]} \ No newline at end of file diff --git a/annotations_1/y_LVaQiyLrM_filtered.json b/annotations_1/y_LVaQiyLrM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b1707dcc8350598a94bcb8e55b358132acb5385a --- /dev/null +++ b/annotations_1/y_LVaQiyLrM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 25.64], [26.0, 31.87], [33.0, 34.42], [35.0, 37.67], [38.0, 49.22], [52.0, 53.22], [59.0, 58.63], [66.0, 67.98], [75.0, 76.6], [79.0, 79.79], [81.0, 81.8], [97.0, 99.47], [106.0, 106.93]], "keep_status": [true, true, false, true, false, false, false, false, false, false, false, true, false], "silence_prob": [46.57, 39.11, 0.0, 48.31, 33.49, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.27, 0.0], "audiomae_on_audioset": [[["music", 43.31], ["speech", 8.62], ["glockenspiel", 8.19]], [["music", 40.99], ["speech", 18.48], ["bleat", 4.69]], null, [["music", 28.42], ["speech", 9.11], ["didgeridoo", 6.91]], [["music", 69.54], ["theremin", 3.38], ["moo", 2.55]], null, null, null, null, null, null, [["music", 20.48], ["rumble", 11.68], ["synthesizer", 7.68]], null], "duration": [4.64, 5.87, 1.42, 2.67, 11.22, 1.22, -0.37, 1.98, 1.6, 0.79, 0.8, 2.47, 0.93]} \ No newline at end of file diff --git a/annotations_1/y_Zo1Wg4RAM_filtered.json b/annotations_1/y_Zo1Wg4RAM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2d80ce9bde5837fd0de2c9096551f7eec97362ec --- /dev/null +++ b/annotations_1/y_Zo1Wg4RAM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[14.0, 14.15], [16.0, 20.93], [25.0, 35.61], [38.0, 39.72], [40.0, 43.48], [45.0, 45.22], [47.0, 47.7], [51.0, 52.89], [54.0, 55.17], [57.0, 57.0], [59.0, 59.43], [61.0, 62.63], [64.0, 65.87], [68.0, 69.4], [70.0, 72.54], [74.0, 74.58], [78.0, 79.24], [80.0, 111.23], [112.0, 118.32], [119.0, 120.26], [122.0, 122.54], [123.0, 124.12], [126.0, 128.65], [130.0, 130.4], [131.0, 132.22]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 39.33, 33.86, 0.0, 54.5, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.56, 0.0, 0.0, 0.0, 32.15, 0.0, 0.0, 0.0, 33.71, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 55.14], ["hum", 16.39], ["throbbing", 4.24]], [["music", 16.82], ["hum", 14.8], ["mains hum", 13.81]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 63.76], ["theremin", 14.6], ["musical instrument", 4.55]], null, null, null, [["music", 55.71], ["theremin", 19.87], ["ambient music", 4.11]], null, null], "duration": [0.15, 4.93, 10.61, 1.72, 3.48, 0.22, 0.7, 1.89, 1.17, 0.0, 0.43, 1.63, 1.87, 1.4, 2.54, 0.58, 1.24, 31.23, 6.32, 1.26, 0.54, 1.12, 2.65, 0.4, 1.22]} \ No newline at end of file diff --git a/annotations_1/y_eZw262fhM_filtered.json b/annotations_1/y_eZw262fhM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f70b21e8f0494c126aaf01e0660a2bf538b4e37a --- /dev/null +++ b/annotations_1/y_eZw262fhM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[55.0, 68.81], [78.0, 163.97]], "keep_status": [true, false], "silence_prob": [28.58, 0.0], "audiomae_on_audioset": [[["breaking", 28.02], ["whack, thwack", 21.02], ["smash, crash", 6.8]], null], "duration": [13.81, 85.97]} \ No newline at end of file diff --git a/annotations_1/yaWmlDjvMs8_filtered.json b/annotations_1/yaWmlDjvMs8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..53a388e3be094e18a590f34573f7a71760100311 --- /dev/null +++ b/annotations_1/yaWmlDjvMs8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.04], [5.0, 5.39], [7.0, 8.34], [10.0, 11.6], [14.0, 16.97], [18.0, 35.58], [40.0, 63.1], [66.0, 66.48], [67.0, 67.8], [68.0, 72.93], [75.0, 80.35], [86.0, 94.24], [97.0, 106.54], [108.0, 107.81], [109.0, 108.99], [111.0, 124.39], [128.0, 128.36], [136.0, 136.56], [142.0, 144.02], [145.0, 153.33]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true], "silence_prob": [42.28, 0.0, 0.0, 0.0, 32.12, 30.09, 31.96, 0.0, 0.0, 30.35, 31.27, 33.0, 31.47, 0.0, 0.0, 31.17, 0.0, 0.0, 28.83, 30.29], "audiomae_on_audioset": [[["speech", 36.97], ["whale vocalization", 24.61], ["music", 11.09]], null, null, null, [["boing", 16.33], ["grunt", 12.03], ["clang", 10.85]], [["speech", 43.54], ["music", 33.15], ["throbbing", 3.9]], [["music", 33.71], ["boing", 30.44], ["speech", 21.9]], null, null, [["music", 63.88], ["boing", 8.18], ["speech", 6.18]], [["cattle, bovinae", 48.4], ["moo", 26.47], ["music", 11.1]], [["music", 62.96], ["foghorn", 7.93], ["throbbing", 6.06]], [["music", 63.43], ["throbbing", 3.25], ["hum", 3.21]], null, null, [["music", 42.32], ["livestock, farm animals, working animals", 23.17], ["cattle, bovinae", 8.98]], null, null, [["aircraft", 27.76], ["fixed-wing aircraft, airplane", 22.53], ["propeller, airscrew", 10.43]], [["music", 26.98], ["trombone", 9.21], ["foghorn", 8.61]]], "duration": [2.04, 0.39, 1.34, 1.6, 2.97, 17.58, 23.1, 0.48, 0.8, 4.93, 5.35, 8.24, 9.54, -0.19, -0.01, 13.39, 0.36, 0.56, 2.02, 8.33]} \ No newline at end of file diff --git a/annotations_1/yaoCvjqu_co_filtered.json b/annotations_1/yaoCvjqu_co_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4a58950b387c47a4db831bbffb2668e4d8e014b --- /dev/null +++ b/annotations_1/yaoCvjqu_co_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 23.41], [24.0, 24.85], [27.0, 31.16], [31.0, 31.33], [32.0, 35.68], [36.0, 43.07], [44.0, 52.69], [53.0, 64.2], [65.0, 70.14], [71.0, 71.88], [72.0, 81.36], [85.0, 85.21], [87.0, 101.98], [103.0, 104.13], [105.0, 106.1], [108.0, 109.68], [117.0, 117.17], [119.0, 120.34], [121.0, 122.64], [125.0, 126.17], [128.0, 128.36], [129.0, 130.08], [130.0, 130.94], [132.0, 135.99], [137.0, 149.18], [150.0, 150.55], [152.0, 154.74], [155.0, 161.23]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.53, 0.0, 67.63, 66.51, 64.75, 73.21, 86.64, 0.0, 86.09, 0.0, 69.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.79, 92.97, 0.0, 97.73, 63.74], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.41, 0.85, 4.16, 0.33, 3.68, 7.07, 8.69, 11.2, 5.14, 0.88, 9.36, 0.21, 14.98, 1.13, 1.1, 1.68, 0.17, 1.34, 1.64, 1.17, 0.36, 1.08, 0.94, 3.99, 12.18, 0.55, 2.74, 6.23]} \ No newline at end of file diff --git a/annotations_1/yat2WR8Ishk_filtered.json b/annotations_1/yat2WR8Ishk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2c79568c0e4cf64de1533f73b2d4990bbbd27b4d --- /dev/null +++ b/annotations_1/yat2WR8Ishk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.51], [4.0, 6.49], [8.0, 9.14], [9.0, 11.7], [13.0, 12.92], [14.0, 15.63], [18.0, 17.68], [19.0, 18.96], [20.0, 21.66], [24.0, 24.56], [25.0, 30.59], [31.0, 39.01], [39.0, 39.23], [39.0, 39.63], [40.0, 41.08], [43.0, 47.14], [47.0, 47.38], [48.0, 48.34], [49.0, 68.44], [69.0, 69.94], [71.0, 72.45], [74.0, 75.05], [78.0, 80.03], [84.0, 84.7], [86.0, 86.27], [94.0, 94.76], [95.0, 96.72], [98.0, 98.25], [98.0, 98.29], [98.0, 98.32], [98.0, 98.9], [99.0, 99.12], [99.0, 99.17]], "keep_status": [false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.51, 0.0, 37.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.9, 61.87, 0.0, 0.0, 0.0, 79.94, 0.0, 0.0, 66.76, 0.0, 0.0, 0.0, 99.68, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["buzzer", 44.91], ["fire alarm", 13.17], ["frog", 6.04]], null, [["speech", 72.68], ["busy signal", 5.88], ["sidetone", 5.58]], null, null, null, null, null, null, [["music", 54.22], ["musical instrument", 8.87], ["effects unit", 5.73]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.51, 2.49, 1.14, 2.7, -0.08, 1.63, -0.32, -0.04, 1.66, 0.56, 5.59, 8.01, 0.23, 0.63, 1.08, 4.14, 0.38, 0.34, 19.44, 0.94, 1.45, 1.05, 2.03, 0.7, 0.27, 0.76, 1.72, 0.25, 0.29, 0.32, 0.9, 0.12, 0.17]} \ No newline at end of file diff --git a/annotations_1/ybDsC1DzIPk_filtered.json b/annotations_1/ybDsC1DzIPk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1df3a55fe275c37c55a59a993d274c6006348014 --- /dev/null +++ b/annotations_1/ybDsC1DzIPk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[42.0, 76.81], [79.0, 83.47], [87.0, 89.75], [91.0, 91.12], [91.0, 96.33], [97.0, 132.41], [135.0, 135.45], [137.0, 137.49], [142.0, 142.79], [146.0, 165.23]], "keep_status": [false, true, true, false, true, false, false, false, false, false], "silence_prob": [0.0, 39.22, 36.52, 0.0, 39.64, 0.0, 0.0, 0.0, 0.0, 67.51], "audiomae_on_audioset": [null, [["mains hum", 24.01], ["hum", 14.34], ["music", 11.06]], [["hum", 29.94], ["throbbing", 13.77], ["mains hum", 10.84]], null, [["speech", 37.57], ["music", 22.75], ["fly, housefly", 5.64]], null, null, null, null, null], "duration": [34.81, 4.47, 2.75, 0.12, 5.33, 35.41, 0.45, 0.49, 0.79, 19.23]} \ No newline at end of file diff --git a/annotations_1/ybF7eOf_n4s_filtered.json b/annotations_1/ybF7eOf_n4s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a05aaf736d00fce2fc06d3037b99c88beb9a1c4 --- /dev/null +++ b/annotations_1/ybF7eOf_n4s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.1], [9.0, 12.38], [13.0, 48.98], [51.0, 55.83], [56.0, 64.08], [66.0, 92.91], [94.0, 96.92], [97.0, 98.25], [99.0, 107.84], [109.0, 117.14], [119.0, 120.43], [125.0, 128.28], [137.0, 139.89], [143.0, 143.48], [144.0, 145.13], [154.0, 154.25]], "keep_status": [false, true, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 34.09, 0.0, 42.79, 61.08, 71.0, 48.56, 0.0, 70.86, 71.14, 0.0, 57.01, 76.53, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 37.88], ["foghorn", 11.11], ["musical instrument", 6.01]], null, [["speech", 31.48], ["noise", 11.85], ["music", 10.3]], null, null, [["music", 51.51], ["speech", 11.01], ["animal", 2.89]], null, null, null, null, null, null, null, null, null], "duration": [0.1, 3.38, 35.98, 4.83, 8.08, 26.91, 2.92, 1.25, 8.84, 8.14, 1.43, 3.28, 2.89, 0.48, 1.13, 0.25]} \ No newline at end of file diff --git a/annotations_1/ybRy055wBsw_filtered.json b/annotations_1/ybRy055wBsw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5c76747885daccb41f3e1f7316e532ec5e3040f --- /dev/null +++ b/annotations_1/ybRy055wBsw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 15.74], [18.0, 44.44], [45.0, 61.91], [62.0, 63.53], [70.0, 91.23], [95.0, 107.38], [110.0, 139.4]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [28.99, 28.2, 28.12, 0.0, 28.93, 28.4, 28.2], "audiomae_on_audioset": [[["music", 79.5], ["dubstep", 2.2], ["singing", 1.31]], [["music", 69.55], ["dubstep", 4.07], ["electronic music", 2.73]], [["music", 75.57], ["dubstep", 9.98], ["electronic music", 4.08]], null, [["music", 76.72], ["dubstep", 3.58], ["hum", 2.16]], [["music", 75.62], ["dubstep", 2.17], ["hum", 1.54]], [["music", 73.22], ["dubstep", 7.85], ["electronic music", 3.13]]], "duration": [14.74, 26.44, 16.91, 1.53, 21.23, 12.38, 29.4]} \ No newline at end of file diff --git a/annotations_1/yceziOf95-0_filtered.json b/annotations_1/yceziOf95-0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d7ec81f90e9e4ab99f1e03405599dccf3749236a --- /dev/null +++ b/annotations_1/yceziOf95-0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.88], [16.0, 18.49], [22.0, 22.52], [29.0, 28.78], [30.0, 29.81], [30.0, 30.48], [31.0, 31.73], [36.0, 35.94], [43.0, 43.44], [45.0, 45.5], [46.0, 46.38], [47.0, 47.24], [58.0, 59.19], [63.0, 62.88], [65.0, 68.23], [69.0, 68.86], [69.0, 70.31], [72.0, 72.81], [74.0, 74.33], [80.0, 81.43], [83.0, 83.93], [85.0, 86.81], [87.0, 88.2], [92.0, 93.38], [96.0, 96.01], [97.0, 99.55], [104.0, 104.6], [105.0, 112.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 36.12, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.91, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 66.76, 0.0, 52.74], "audiomae_on_audioset": [null, [["speech", 81.18], ["music", 4.02], ["electric shaver, electric razor", 2.68]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.88, 2.49, 0.52, -0.22, -0.19, 0.48, 0.73, -0.06, 0.44, 0.5, 0.38, 0.24, 1.19, -0.12, 3.23, -0.14, 1.31, 0.81, 0.33, 1.43, 0.93, 1.81, 1.2, 1.38, 0.01, 2.55, 0.6, 7.83]} \ No newline at end of file diff --git a/annotations_1/ye38FmLnLBo_filtered.json b/annotations_1/ye38FmLnLBo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1490881f5d88217e127c4e8083afb1422c96fe35 --- /dev/null +++ b/annotations_1/ye38FmLnLBo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.93], [14.0, 15.06], [22.0, 22.15], [24.0, 30.45], [31.0, 31.89], [38.0, 38.13], [42.0, 42.31], [43.0, 57.42], [59.0, 59.29], [63.0, 71.81], [73.0, 87.69], [88.0, 89.83], [92.0, 103.38], [106.0, 107.43], [108.0, 108.38], [118.0, 119.35]], "keep_status": [false, false, false, true, false, false, false, true, false, true, true, false, false, false, false, false], "silence_prob": [58.22, 0.0, 0.0, 47.5, 0.0, 0.0, 0.0, 38.47, 0.0, 34.58, 41.42, 0.0, 38.68, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["speech", 15.0], ["beatboxing", 11.96], ["music", 9.47]], null, null, null, [["speech", 48.34], ["siren", 10.52], ["emergency vehicle", 5.82]], null, [["crow", 36.5], ["caw", 14.9], ["speech", 13.5]], [["hum", 23.98], ["mains hum", 19.27], ["speech", 9.42]], null, [["speech", 52.79], ["fart", 11.48], ["electric shaver, electric razor", 6.35]], null, null, null], "duration": [3.93, 1.06, 0.15, 6.45, 0.89, 0.13, 0.31, 14.42, 0.29, 8.81, 14.69, 1.83, 11.38, 1.43, 0.38, 1.35]} \ No newline at end of file diff --git a/annotations_1/yfg9cb_9NWQ_filtered.json b/annotations_1/yfg9cb_9NWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b611e5a08476c10ad5644e1a536919d1db37d8fd --- /dev/null +++ b/annotations_1/yfg9cb_9NWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 16.73], [18.0, 18.81], [30.0, 30.23], [31.0, 32.37], [34.0, 35.21], [38.0, 38.18], [42.0, 43.16], [49.0, 50.28], [52.0, 52.95], [54.0, 55.46], [57.0, 57.72], [59.0, 62.13], [67.0, 74.82], [76.0, 81.73], [83.0, 84.28], [86.0, 86.21], [92.0, 92.21], [93.0, 96.3], [97.0, 96.97], [98.0, 98.61], [104.0, 104.57], [106.0, 108.09], [109.0, 109.49], [112.0, 113.48], [115.0, 115.55], [118.0, 118.45], [127.0, 127.57]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [39.52, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 86.09, 54.7, 0.0, 0.0, 0.0, 52.27, 0.0, 0.0, 0.0, 43.61, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 34.6], ["sidetone", 29.55], ["radio", 15.08]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 68.76], ["telephone", 10.0], ["sidetone", 7.05]], null, null, null, null, null], "duration": [8.73, 0.81, 0.23, 1.37, 1.21, 0.18, 1.16, 1.28, 0.95, 1.46, 0.72, 3.13, 7.82, 5.73, 1.28, 0.21, 0.21, 3.3, -0.03, 0.61, 0.57, 2.09, 0.49, 1.48, 0.55, 0.45, 0.57]} \ No newline at end of file diff --git a/annotations_1/yg42xdVf9mM_filtered.json b/annotations_1/yg42xdVf9mM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..889dfb7ed3ec4d70d0ee4d84260b7dc2dd1da6ee --- /dev/null +++ b/annotations_1/yg42xdVf9mM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.4], [12.0, 12.06], [15.0, 15.23], [16.0, 16.78], [19.0, 19.47], [20.0, 20.88], [21.0, 21.42], [27.0, 36.98], [39.0, 44.95], [51.0, 51.51], [53.0, 53.45], [61.0, 61.26], [67.0, 73.89], [82.0, 82.59], [84.0, 85.02], [86.0, 87.61], [89.0, 90.48], [95.0, 99.49]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.2, 36.68, 0.0, 0.0, 0.0, 88.1, 0.0, 0.0, 0.0, 0.0, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, [["explosion", 18.89], ["cattle, bovinae", 11.53], ["moo", 9.22]], null, null, null, null, null, null, null, null, null], "duration": [2.4, 0.06, 0.23, 0.78, 0.47, 0.88, 0.42, 9.98, 5.95, 0.51, 0.45, 0.26, 6.89, 0.59, 1.02, 1.61, 1.48, 4.49]} \ No newline at end of file diff --git a/annotations_1/yi2YuSALRzs_filtered.json b/annotations_1/yi2YuSALRzs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8f154f27c57abf974912ba33f533f99ec674d7b2 --- /dev/null +++ b/annotations_1/yi2YuSALRzs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 5.51], [6.0, 12.38], [13.0, 55.95], [60.0, 64.69], [72.0, 76.59], [78.0, 81.53], [83.0, 86.86], [87.0, 105.8], [109.0, 109.88], [113.0, 114.34], [115.0, 120.56], [123.0, 128.83], [130.0, 130.47], [131.0, 134.06], [135.0, 138.0], [142.0, 143.38], [144.0, 146.74], [148.0, 149.01], [150.0, 152.79], [154.0, 154.36], [155.0, 160.02], [163.0, 168.99], [170.0, 169.94], [171.0, 171.96], [175.0, 175.86], [178.0, 177.72], [178.0, 180.93], [182.0, 183.34], [184.0, 185.21]], "keep_status": [true, true, false, true, false, true, false, false, false, false, false, false, false, true, true, false, false, false, true, false, false, true, false, false, false, false, true, false, false], "silence_prob": [39.09, 33.37, 0.0, 34.03, 52.33, 47.9, 62.47, 30.43, 0.0, 0.0, 30.39, 35.21, 0.0, 30.19, 33.48, 0.0, 38.28, 0.0, 49.36, 0.0, 29.81, 30.45, 0.0, 0.0, 0.0, 0.0, 36.33, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.53], ["theremin", 22.76], ["noise", 16.62]], [["music", 39.39], ["thunk", 4.16], ["speech", 3.81]], null, [["music", 45.01], ["hum", 12.46], ["ambient music", 12.15]], null, [["music", 39.13], ["ambient music", 18.23], ["hum", 8.97]], null, [["music", 64.24], ["hum", 5.62], ["synthesizer", 5.5]], null, null, [["speech", 40.08], ["sidetone", 20.09], ["hum", 12.98]], [["speech", 40.17], ["didgeridoo", 28.25], ["music", 14.99]], null, [["speech", 56.38], ["music", 6.48], ["thunk", 4.92]], [["music", 19.14], ["speech", 14.8], ["mains hum", 5.91]], null, [["speech", 40.33], ["didgeridoo", 19.78], ["music", 16.11]], null, [["music", 18.57], ["hum", 8.33], ["mains hum", 7.52]], null, [["speech", 86.54], ["telephone dialing, dtmf", 1.7], ["whack, thwack", 1.63]], [["hum", 25.31], ["buzz", 15.38], ["music", 12.76]], null, null, null, null, [["music", 25.83], ["speech", 13.25], ["radio", 10.51]], null, null], "duration": [4.51, 6.38, 42.95, 4.69, 4.59, 3.53, 3.86, 18.8, 0.88, 1.34, 5.56, 5.83, 0.47, 3.06, 3.0, 1.38, 2.74, 1.01, 2.79, 0.36, 5.02, 5.99, -0.06, 0.96, 0.86, -0.28, 2.93, 1.34, 1.21]} \ No newline at end of file diff --git a/annotations_1/yiOUEU4KG6s_filtered.json b/annotations_1/yiOUEU4KG6s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..35232f61f00fd884aba54606f732a8b54926392e --- /dev/null +++ b/annotations_1/yiOUEU4KG6s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 8.77], [9.0, 11.25], [12.0, 13.88], [15.0, 18.17], [19.0, 21.49], [22.0, 22.65], [23.0, 24.16], [26.0, 26.79], [29.0, 29.74], [32.0, 32.39], [34.0, 34.37], [37.0, 38.25], [40.0, 41.81], [42.0, 43.55], [45.0, 46.8], [51.0, 52.3], [53.0, 59.26], [61.0, 66.56], [68.0, 71.64], [72.0, 72.72], [74.0, 75.98], [78.0, 82.29], [83.0, 87.96], [89.0, 94.59], [96.0, 96.31], [99.0, 113.1], [114.0, 113.81], [115.0, 116.09], [117.0, 118.5], [121.0, 124.11], [128.0, 129.46], [130.0, 130.17], [131.0, 131.55], [132.0, 151.48], [152.0, 152.78], [153.0, 154.03], [155.0, 155.09], [158.0, 158.77], [160.0, 160.17], [161.0, 161.69]], "keep_status": [false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [69.2, 52.92, 0.0, 43.35, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.98, 75.72, 69.74, 0.0, 0.0, 36.26, 32.26, 38.63, 0.0, 31.72, 0.0, 0.0, 0.0, 28.66, 0.0, 0.0, 0.0, 77.53, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, [["thunk", 24.47], ["tuning fork", 24.01], ["wood", 11.43]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 41.69], ["musical instrument", 15.6], ["hum", 5.79]], [["mains hum", 17.25], ["didgeridoo", 14.34], ["music", 13.65]], [["music", 25.65], ["mains hum", 12.7], ["didgeridoo", 9.58]], null, [["theremin", 46.65], ["music", 34.57], ["wind instrument, woodwind instrument", 3.03]], null, null, null, [["music", 32.77], ["trombone", 22.01], ["foghorn", 11.22]], null, null, null, null, null, null, null, null, null, null], "duration": [6.77, 2.25, 1.88, 3.17, 2.49, 0.65, 1.16, 0.79, 0.74, 0.39, 0.37, 1.25, 1.81, 1.55, 1.8, 1.3, 6.26, 5.56, 3.64, 0.72, 1.98, 4.29, 4.96, 5.59, 0.31, 14.1, -0.19, 1.09, 1.5, 3.11, 1.46, 0.17, 0.55, 19.48, 0.78, 1.03, 0.09, 0.77, 0.17, 0.69]} \ No newline at end of file diff --git a/annotations_1/yiPqxnLMKbs_filtered.json b/annotations_1/yiPqxnLMKbs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..584c5731d0c75a8561a3fa5763d54f0b8d16db53 --- /dev/null +++ b/annotations_1/yiPqxnLMKbs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.59], [3.0, 3.89], [5.0, 6.42], [7.0, 7.67], [9.0, 10.71], [12.0, 12.46], [13.0, 13.29], [16.0, 17.36], [19.0, 20.12], [23.0, 23.46], [26.0, 26.99], [29.0, 29.34], [30.0, 29.98], [32.0, 32.27], [35.0, 37.37], [41.0, 43.14], [44.0, 45.0], [53.0, 53.91], [58.0, 58.06], [61.0, 63.39], [64.0, 64.42], [65.0, 65.31], [66.0, 66.99], [74.0, 74.7], [82.0, 83.3], [90.0, 95.35], [96.0, 99.45]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.18, 62.89, 0.0, 0.0, 0.0, 53.53, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 65.2], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.59, 0.89, 1.42, 0.67, 1.71, 0.46, 0.29, 1.36, 1.12, 0.46, 0.99, 0.34, -0.02, 0.27, 2.37, 2.14, 1.0, 0.91, 0.06, 2.39, 0.42, 0.31, 0.99, 0.7, 1.3, 5.35, 3.45]} \ No newline at end of file diff --git a/annotations_1/yijQXDtxgic_filtered.json b/annotations_1/yijQXDtxgic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3dcaca09cc83cf1673f3400edd6973badc2fa6be --- /dev/null +++ b/annotations_1/yijQXDtxgic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 7.86], [9.0, 10.89], [26.0, 26.22], [30.0, 29.89], [31.0, 31.85], [34.0, 34.94], [35.0, 37.3], [40.0, 41.32], [46.0, 47.87], [49.0, 49.65], [62.0, 61.72], [66.0, 67.14], [80.0, 96.11], [100.0, 100.3], [101.0, 101.98], [109.0, 110.51], [111.0, 111.52]], "keep_status": [true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [42.67, 0.0, 0.0, 0.0, 0.0, 0.0, 31.96, 0.0, 0.0, 0.0, 0.0, 0.0, 32.34, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 28.99], ["speech", 23.65], ["clip-clop", 9.9]], null, null, null, null, null, [["boing", 12.78], ["frog", 11.53], ["animal", 7.22]], null, null, null, null, null, [["music", 53.89], ["speech", 21.17], ["theremin", 5.35]], null, null, null, null], "duration": [3.86, 1.89, 0.22, -0.11, 0.85, 0.94, 2.3, 1.32, 1.87, 0.65, -0.28, 1.14, 16.11, 0.3, 0.98, 1.51, 0.52]} \ No newline at end of file diff --git a/annotations_1/yjrvJkWU_5k_filtered.json b/annotations_1/yjrvJkWU_5k_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..483d72fab08df9587aff80c6963c52e033a489bf --- /dev/null +++ b/annotations_1/yjrvJkWU_5k_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.63], [9.0, 8.9], [11.0, 14.42], [20.0, 26.62], [30.0, 30.91], [32.0, 32.58], [33.0, 36.37], [37.0, 38.06], [41.0, 43.33], [46.0, 46.7], [51.0, 54.87], [63.0, 63.73], [79.0, 80.25], [82.0, 83.39], [89.0, 88.89]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 31.39, 33.05, 0.0, 0.0, 40.16, 0.0, 37.15, 0.0, 38.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["boing", 27.99], ["music", 22.61], ["whale vocalization", 11.64]], [["music", 67.16], ["musical instrument", 5.4], ["synthesizer", 5.22]], null, null, [["cattle, bovinae", 27.04], ["moo", 20.99], ["livestock, farm animals, working animals", 7.27]], null, [["music", 66.38], ["speech", 17.24], ["musical instrument", 4.3]], null, [["music", 62.32], ["synthesizer", 8.62], ["boing", 6.11]], null, null, null, null], "duration": [0.63, -0.1, 3.42, 6.62, 0.91, 0.58, 3.37, 1.06, 2.33, 0.7, 3.87, 0.73, 1.25, 1.39, -0.11]} \ No newline at end of file diff --git a/annotations_1/yk5d161ytXE_filtered.json b/annotations_1/yk5d161ytXE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50ff8ef88d4379f386f63378b68bed12bb5d8920 --- /dev/null +++ b/annotations_1/yk5d161ytXE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 8.95], [12.0, 18.32], [23.0, 26.57], [32.0, 36.51], [41.0, 45.94], [50.0, 50.65], [53.0, 65.89], [67.0, 67.69], [69.0, 78.61], [90.0, 93.61], [99.0, 99.39], [102.0, 116.34], [116.0, 116.58], [117.0, 116.63], [117.0, 116.67], [117.0, 117.53], [118.0, 133.14], [139.0, 153.94], [154.0, 154.04], [154.0, 154.33], [154.0, 154.52], [155.0, 154.57], [155.0, 158.09], [162.0, 165.94], [170.0, 186.38], [188.0, 199.42]], "keep_status": [true, false, false, false, true, false, true, false, true, true, false, true, false, false, false, false, true, true, false, false, false, false, false, false, true, false], "silence_prob": [38.38, 33.99, 35.91, 59.86, 37.32, 0.0, 38.41, 0.0, 37.35, 41.5, 0.0, 34.8, 0.0, 0.0, 0.0, 0.0, 36.7, 34.07, 0.0, 0.0, 0.0, 0.0, 43.23, 39.4, 38.79, 34.33], "audiomae_on_audioset": [[["music", 27.56], ["livestock, farm animals, working animals", 24.49], ["cattle, bovinae", 12.35]], [["speech", 68.3], ["vehicle", 2.83], ["sidetone", 2.57]], [["speech", 65.33], ["car", 3.96], ["music", 3.63]], null, [["speech", 32.15], ["music", 25.11], ["vehicle", 7.56]], null, [["speech", 31.52], ["vehicle", 16.11], ["music", 8.29]], null, [["speech", 32.96], ["vehicle", 19.16], ["livestock, farm animals, working animals", 8.24]], [["music", 16.8], ["fly, housefly", 14.32], ["cattle, bovinae", 12.74]], null, [["speech", 29.95], ["vehicle", 19.69], ["race car, auto racing", 11.49]], null, null, null, null, [["hum", 25.1], ["mains hum", 12.33], ["skidding", 8.54]], [["fly, housefly", 39.2], ["insect", 13.48], ["buzz", 12.5]], null, null, null, null, [["fly, housefly", 37.93], ["insect", 33.54], ["mosquito", 9.86]], [["speech", 46.17], ["music", 25.32], ["explosion", 3.33]], [["music", 39.59], ["speech", 19.73], ["sidetone", 4.79]], [["speech", 49.32], ["music", 34.59], ["radio", 3.31]]], "duration": [4.95, 6.32, 3.57, 4.51, 4.94, 0.65, 12.89, 0.69, 9.61, 3.61, 0.39, 14.34, 0.58, -0.37, -0.33, 0.53, 15.14, 14.94, 0.04, 0.33, 0.52, -0.43, 3.09, 3.94, 16.38, 11.42]} \ No newline at end of file diff --git a/annotations_1/yk73thpx_B8_filtered.json b/annotations_1/yk73thpx_B8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/yk73thpx_B8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/ykBG9mW1yC4_filtered.json b/annotations_1/ykBG9mW1yC4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..df375e3043a86ee77e01c4922b05fbe0c34bc96d --- /dev/null +++ b/annotations_1/ykBG9mW1yC4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.51], [9.0, 9.1], [12.0, 15.42], [17.0, 17.31], [20.0, 19.72], [26.0, 26.55], [28.0, 28.41], [29.0, 29.81], [34.0, 34.65], [35.0, 35.26], [43.0, 43.06], [45.0, 45.94], [50.0, 49.94], [50.0, 50.67], [51.0, 53.01], [63.0, 63.04], [65.0, 70.29], [83.0, 84.32], [88.0, 88.64], [92.0, 94.98], [96.0, 96.13], [99.0, 99.62], [101.0, 106.95], [107.0, 107.91], [112.0, 112.7], [118.0, 118.35]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 84.8, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.88, 0.0, 33.34, 0.0, 0.0, 36.54, 0.0, 0.0, 49.4, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 29.02], ["speech", 21.12], ["hum", 9.29]], null, [["moo", 15.17], ["cattle, bovinae", 11.92], ["boing", 11.61]], null, null, [["speech", 71.13], ["fart", 6.69], ["boing", 4.83]], null, null, [["speech", 52.41], ["grunt", 16.6], ["chirp tone", 9.05]], null, null, null], "duration": [0.51, 0.1, 3.42, 0.31, -0.28, 0.55, 0.41, 0.81, 0.65, 0.26, 0.06, 0.94, -0.06, 0.67, 2.01, 0.04, 5.29, 1.32, 0.64, 2.98, 0.13, 0.62, 5.95, 0.91, 0.7, 0.35]} \ No newline at end of file diff --git a/annotations_1/ykQ9g2HT2sU_filtered.json b/annotations_1/ykQ9g2HT2sU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17d841458d0f43fbe2dfe643a6e524ea6ca75795 --- /dev/null +++ b/annotations_1/ykQ9g2HT2sU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 27.19], [36.0, 36.71], [38.0, 38.16], [43.0, 43.21], [49.0, 51.56], [72.0, 84.52], [92.0, 106.17], [121.0, 123.63], [124.0, 125.47], [129.0, 133.74], [143.0, 143.5], [144.0, 145.57], [150.0, 151.87], [157.0, 159.22], [162.0, 179.9]], "keep_status": [false, false, false, false, false, false, false, true, false, true, false, false, false, true, false], "silence_prob": [31.65, 0.0, 0.0, 0.0, 91.64, 34.03, 33.62, 41.68, 0.0, 36.8, 0.0, 0.0, 0.0, 40.34, 32.1], "audiomae_on_audioset": [[["music", 86.05], ["electronic music", 2.4], ["synthesizer", 2.01]], null, null, null, null, [["music", 78.8], ["boing", 5.85], ["synthesizer", 2.61]], [["music", 42.41], ["speech", 17.53], ["boing", 10.09]], [["music", 39.93], ["speech", 13.71], ["fly, housefly", 8.73]], null, [["music", 41.49], ["speech", 6.83], ["throbbing", 5.7]], null, null, null, [["music", 21.44], ["frog", 18.98], ["croak", 8.81]], [["music", 63.09], ["throbbing", 9.86], ["hum", 5.84]]], "duration": [19.19, 0.71, 0.16, 0.21, 2.56, 12.52, 14.17, 2.63, 1.47, 4.74, 0.5, 1.57, 1.87, 2.22, 17.9]} \ No newline at end of file diff --git a/annotations_1/ykcCGhbl1H4_filtered.json b/annotations_1/ykcCGhbl1H4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..770a41d111a54854945d11ed00229b2530752219 --- /dev/null +++ b/annotations_1/ykcCGhbl1H4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 12.01], [15.0, 15.89], [36.0, 43.39], [48.0, 48.59], [50.0, 50.25], [53.0, 54.48], [64.0, 92.77], [94.0, 102.84], [105.0, 105.66], [109.0, 108.89], [109.0, 116.26], [119.0, 119.75]], "keep_status": [false, false, true, false, false, false, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 30.18, 0.0, 0.0, 0.0, 30.26, 35.0, 0.0, 0.0, 35.69, 0.0], "audiomae_on_audioset": [null, null, [["music", 38.02], ["skidding", 13.3], ["car", 7.08]], null, null, null, [["music", 45.64], ["speech", 17.31], ["vehicle", 9.26]], [["hum", 29.2], ["music", 24.35], ["throbbing", 10.59]], null, null, [["music", 64.02], ["synthesizer", 10.44], ["musical instrument", 5.41]], null], "duration": [1.01, 0.89, 7.39, 0.59, 0.25, 1.48, 28.77, 8.84, 0.66, -0.11, 7.26, 0.75]} \ No newline at end of file diff --git a/annotations_1/ylvh800i85I_filtered.json b/annotations_1/ylvh800i85I_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2acca43f8657aef864b5fccebd4f51314b8581ef --- /dev/null +++ b/annotations_1/ylvh800i85I_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.12], [11.0, 23.09], [28.0, 29.07], [29.0, 31.77], [40.0, 40.96], [42.0, 43.02], [51.0, 57.87], [59.0, 59.59], [62.0, 61.8], [63.0, 63.07], [70.0, 70.92], [74.0, 74.36], [76.0, 76.23], [77.0, 77.41], [78.0, 78.6], [79.0, 79.17], [80.0, 81.03], [107.0, 108.43], [109.0, 110.89], [114.0, 114.02], [116.0, 116.61], [117.0, 117.49], [130.0, 131.48], [134.0, 134.54], [135.0, 136.0], [137.0, 138.43], [147.0, 147.55], [151.0, 151.44], [154.0, 160.22]], "keep_status": [false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 45.36, 0.0, 39.49, 0.0, 0.0, 37.26, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.81], "audiomae_on_audioset": [null, [["music", 61.7], ["speech", 3.39], ["outside, rural or natural", 2.12]], null, [["music", 82.82], ["musical instrument", 3.28], ["boing", 2.17]], null, null, [["music", 58.58], ["speech", 7.31], ["didgeridoo", 3.21]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 12.09, 1.07, 2.77, 0.96, 1.02, 6.87, 0.59, -0.2, 0.07, 0.92, 0.36, 0.23, 0.41, 0.6, 0.17, 1.03, 1.43, 1.89, 0.02, 0.61, 0.49, 1.48, 0.54, 1.0, 1.43, 0.55, 0.44, 6.22]} \ No newline at end of file diff --git a/annotations_1/ymbKDavsVaU_filtered.json b/annotations_1/ymbKDavsVaU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1dd78ee4f90093e50e4dc0472da394bd0eb6da75 --- /dev/null +++ b/annotations_1/ymbKDavsVaU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.96], [13.0, 13.91], [18.0, 28.38], [29.0, 29.74], [32.0, 34.62], [38.0, 38.55], [52.0, 54.57], [55.0, 55.31], [57.0, 60.02], [66.0, 67.86], [71.0, 72.22], [87.0, 87.07], [101.0, 101.82], [108.0, 109.0], [119.0, 120.55], [122.0, 123.04], [153.0, 154.95], [160.0, 160.44], [166.0, 168.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 55.18, 0.0, 57.72, 0.0, 77.2, 0.0, 80.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.86], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.96, 0.91, 10.38, 0.74, 2.62, 0.55, 2.57, 0.31, 3.02, 1.86, 1.22, 0.07, 0.82, 1.0, 1.55, 1.04, 1.95, 0.44, 2.39]} \ No newline at end of file diff --git a/annotations_1/yn2p3AV23-Q_filtered.json b/annotations_1/yn2p3AV23-Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2980bc8a74d25bfb9b2b4599f9f95580255d10af --- /dev/null +++ b/annotations_1/yn2p3AV23-Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 47.19], [48.0, 56.27], [58.0, 61.86], [63.0, 125.71], [131.0, 131.25], [132.0, 133.42]], "keep_status": [true, false, true, false, false, false], "silence_prob": [30.56, 31.26, 35.14, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 25.9], ["hum", 20.17], ["ambient music", 12.18]], [["hum", 49.49], ["throbbing", 16.54], ["mains hum", 14.6]], [["gong", 24.21], ["speech", 20.91], ["music", 19.24]], null, null, null], "duration": [27.19, 8.27, 3.86, 62.71, 0.25, 1.42]} \ No newline at end of file diff --git a/annotations_1/ynC2_22yuGA_filtered.json b/annotations_1/ynC2_22yuGA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3b6f14dc76149c6573a7a5e08c9de06aec669713 --- /dev/null +++ b/annotations_1/ynC2_22yuGA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.97], [6.0, 5.95], [10.0, 10.37], [12.0, 11.8], [14.0, 14.44], [19.0, 21.71], [22.0, 23.8], [26.0, 27.67], [32.0, 32.8], [34.0, 34.75], [39.0, 39.41], [42.0, 42.36], [43.0, 43.58], [44.0, 45.59], [46.0, 52.46], [54.0, 55.7], [57.0, 67.91], [71.0, 73.79], [77.0, 80.62], [83.0, 83.61], [85.0, 85.77], [88.0, 89.6], [91.0, 91.49], [93.0, 94.31], [95.0, 95.39], [99.0, 102.3], [104.0, 106.03], [107.0, 108.9]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.61, 0.0, 40.4, 41.93, 48.27, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.82, 41.81, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 73.12], ["speech", 3.75], ["musical instrument", 1.19]], [["hum", 61.59], ["mains hum", 19.75], ["throbbing", 7.82]], [["music", 32.76], ["fly, housefly", 9.88], ["insect", 7.11]], null, null, null, null, null, null, [["hum", 9.58], ["mains hum", 7.79], ["burping, eructation", 7.09]], [["speech", 20.19], ["frog", 7.49], ["hum", 6.29]], null], "duration": [0.97, -0.05, 0.37, -0.2, 0.44, 2.71, 1.8, 1.67, 0.8, 0.75, 0.41, 0.36, 0.58, 1.59, 6.46, 1.7, 10.91, 2.79, 3.62, 0.61, 0.77, 1.6, 0.49, 1.31, 0.39, 3.3, 2.03, 1.9]} \ No newline at end of file diff --git a/annotations_1/yoYPBCFehng_filtered.json b/annotations_1/yoYPBCFehng_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f940507cd90a08893e9581b469bce374d39ce61 --- /dev/null +++ b/annotations_1/yoYPBCFehng_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[73.0, 81.35]], "keep_status": [false], "silence_prob": [32.35], "audiomae_on_audioset": [[["music", 42.98], ["hum", 18.71], ["mains hum", 9.33]]], "duration": [8.35]} \ No newline at end of file diff --git a/annotations_1/yodVQ5QAc88_filtered.json b/annotations_1/yodVQ5QAc88_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4612f33eba7747902488b95d37ee84b9d9e24417 --- /dev/null +++ b/annotations_1/yodVQ5QAc88_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 11.67], [16.0, 19.3], [20.0, 22.84], [24.0, 25.61], [27.0, 28.88], [34.0, 34.33], [36.0, 41.62], [43.0, 43.06], [45.0, 65.31], [66.0, 68.69], [70.0, 72.01], [76.0, 88.62], [90.0, 91.66], [92.0, 93.26], [95.0, 147.21], [148.0, 149.59]], "keep_status": [false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.81, 33.9, 0.0, 0.0, 0.0, 35.68, 0.0, 29.25, 29.46, 28.64, 28.09, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 66.43], ["sidetone", 9.35], ["hum", 3.99]], [["hum", 35.83], ["noise", 12.8], ["mains hum", 11.72]], null, null, null, [["noise", 27.17], ["music", 18.57], ["whale vocalization", 15.14]], null, [["hum", 44.95], ["mains hum", 19.97], ["throbbing", 17.15]], [["speech", 43.81], ["music", 32.74], ["electronic music", 1.75]], [["music", 39.49], ["speech", 30.64], ["electronic music", 6.17]], [["speech", 42.98], ["music", 20.99], ["vehicle", 7.6]], null, null, null, null], "duration": [0.67, 3.3, 2.84, 1.61, 1.88, 0.33, 5.62, 0.06, 20.31, 2.69, 2.01, 12.62, 1.66, 1.26, 52.21, 1.59]} \ No newline at end of file diff --git a/annotations_1/yprYw3FQUpQ_filtered.json b/annotations_1/yprYw3FQUpQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e6911a183799aefbea84ad410001d6a6875fb0cf --- /dev/null +++ b/annotations_1/yprYw3FQUpQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.13], [5.0, 24.36], [27.0, 46.04], [46.0, 58.63], [60.0, 60.51], [62.0, 62.56], [63.0, 65.92], [67.0, 67.53], [78.0, 78.65], [80.0, 80.1], [81.0, 85.29], [86.0, 86.88], [102.0, 106.25], [107.0, 109.19], [111.0, 113.37], [113.0, 118.57], [119.0, 127.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, true, false], "silence_prob": [0.0, 30.87, 46.15, 36.96, 0.0, 0.0, 43.08, 0.0, 0.0, 0.0, 32.01, 0.0, 31.74, 29.39, 28.88, 29.59, 29.06], "audiomae_on_audioset": [null, [["music", 25.9], ["mains hum", 23.52], ["hum", 20.69]], [["hum", 42.24], ["throbbing", 23.28], ["music", 11.64]], [["speech", 49.26], ["music", 16.1], ["stomach rumble", 5.35]], null, null, [["throbbing", 54.97], ["hum", 20.23], ["music", 6.55]], null, null, null, [["quack", 36.47], ["music", 32.79], ["speech", 13.94]], null, [["music", 40.99], ["speech", 13.78], ["whack, thwack", 2.99]], [["music", 24.89], ["car", 19.21], ["vehicle", 19.03]], [["music", 24.55], ["whoosh, swoosh, swish", 8.43], ["smash, crash", 6.29]], [["speech", 38.03], ["music", 18.78], ["whip", 10.57]], [["music", 70.98], ["trombone", 5.67], ["brass instrument", 3.18]]], "duration": [1.13, 19.36, 19.04, 12.63, 0.51, 0.56, 2.92, 0.53, 0.65, 0.1, 4.29, 0.88, 4.25, 2.19, 2.37, 5.57, 8.95]} \ No newline at end of file diff --git a/annotations_1/yq571gv49HQ_filtered.json b/annotations_1/yq571gv49HQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d9eedbf2b4f4e90f085608dba94b74cbb56ea830 --- /dev/null +++ b/annotations_1/yq571gv49HQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 44.47], [48.0, 50.38], [51.0, 60.03], [64.0, 80.33], [81.0, 96.01], [102.0, 114.02], [119.0, 130.22], [131.0, 144.98], [153.0, 153.52]], "keep_status": [false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 78.04, 70.3, 35.55, 32.4, 34.39, 34.48, 35.13, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 39.89], ["mains hum", 19.99], ["hum", 10.98]], [["music", 63.48], ["didgeridoo", 5.5], ["musical instrument", 3.54]], [["music", 71.96], ["synthesizer", 6.19], ["didgeridoo", 3.37]], [["mains hum", 49.24], ["hum", 20.08], ["music", 13.92]], [["music", 76.41], ["musical instrument", 5.56], ["cacophony", 2.07]], null], "duration": [37.47, 2.38, 9.03, 16.33, 15.01, 12.02, 11.22, 13.98, 0.52]} \ No newline at end of file diff --git a/annotations_1/yqlAjK0PVsU_filtered.json b/annotations_1/yqlAjK0PVsU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f7cf05cd27a5b4f9abfb81a34dcec3d4d3efaab8 --- /dev/null +++ b/annotations_1/yqlAjK0PVsU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[22.0, 48.73], [51.0, 52.74], [56.0, 96.4], [97.0, 97.77], [98.0, 99.33], [100.0, 101.31], [102.0, 104.33], [105.0, 107.16]], "keep_status": [true, false, false, false, false, false, true, true], "silence_prob": [28.22, 0.0, 0.0, 0.0, 0.0, 0.0, 32.53, 34.61], "audiomae_on_audioset": [[["music", 55.21], ["throbbing", 7.37], ["speech", 6.75]], null, null, null, null, null, [["insect", 14.94], ["fly, housefly", 12.35], ["speech", 8.24]], [["hum", 9.63], ["mains hum", 8.78], ["whale vocalization", 7.79]]], "duration": [26.73, 1.74, 40.4, 0.77, 1.33, 1.31, 2.33, 2.16]} \ No newline at end of file diff --git a/annotations_1/yquyze0QbPk_filtered.json b/annotations_1/yquyze0QbPk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cf82ee36413b3a2f62f896067677df2ba4f8586a --- /dev/null +++ b/annotations_1/yquyze0QbPk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.94], [8.0, 8.34], [10.0, 10.86], [11.0, 11.58], [16.0, 16.33], [20.0, 20.78], [21.0, 22.91], [25.0, 32.56], [33.0, 36.86], [37.0, 41.89], [44.0, 44.19], [45.0, 45.54], [47.0, 47.21], [47.0, 49.08], [50.0, 53.99], [54.0, 58.75], [61.0, 61.01], [62.0, 63.05], [64.0, 65.1], [66.0, 67.95], [71.0, 72.25], [74.0, 78.06], [79.0, 80.79], [82.0, 83.56], [84.0, 87.07], [88.0, 96.3]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [89.19, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.98, 99.71, 99.56, 0.0, 0.0, 0.0, 87.19, 85.35, 65.2, 0.0, 0.0, 0.0, 0.0, 0.0, 98.93, 0.0, 0.0, 96.17, 100.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.94, 0.34, 0.86, 0.58, 0.33, 0.78, 1.91, 7.56, 3.86, 4.89, 0.19, 0.54, 0.21, 2.08, 3.99, 4.75, 0.01, 1.05, 1.1, 1.95, 1.25, 4.06, 1.79, 1.56, 3.07, 8.3]} \ No newline at end of file diff --git a/annotations_1/yr-gQl9CKIU_filtered.json b/annotations_1/yr-gQl9CKIU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..76ad73b45553f6e91cc21ea5e544fcdb2550dc7e --- /dev/null +++ b/annotations_1/yr-gQl9CKIU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.55], [8.0, 10.22], [15.0, 15.92], [21.0, 21.68], [23.0, 24.09], [26.0, 26.0], [26.0, 26.74], [27.0, 26.77], [27.0, 27.82], [28.0, 28.27], [29.0, 30.06], [35.0, 34.82], [36.0, 36.76], [47.0, 49.99], [52.0, 53.4], [54.0, 54.28], [56.0, 58.5], [59.0, 59.64], [61.0, 70.38], [73.0, 74.14], [74.0, 75.02], [77.0, 77.45], [82.0, 82.09], [86.0, 86.34], [88.0, 89.68], [95.0, 95.67], [103.0, 103.52], [106.0, 106.35], [124.0, 125.07], [127.0, 127.08], [130.0, 131.18], [137.0, 137.61], [140.0, 144.17], [146.0, 145.76], [147.0, 147.6], [150.0, 150.82], [158.0, 159.65], [173.0, 173.69], [174.0, 174.68], [182.0, 182.61], [184.0, 184.81], [189.0, 189.4], [190.0, 191.79]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 66.15, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.96, 0.0, 0.0, 99.98, 0.0, 44.9, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 44.14], ["fly, housefly", 6.5], ["insect", 4.24]], null, null, null, null, [["speech", 30.09], ["animal", 12.4], ["fly, housefly", 7.46]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 2.22, 0.92, 0.68, 1.09, 0.0, 0.74, -0.23, 0.82, 0.27, 1.06, -0.18, 0.76, 2.99, 1.4, 0.28, 2.5, 0.64, 9.38, 1.14, 1.02, 0.45, 0.09, 0.34, 1.68, 0.67, 0.52, 0.35, 1.07, 0.08, 1.18, 0.61, 4.17, -0.24, 0.6, 0.82, 1.65, 0.69, 0.68, 0.61, 0.81, 0.4, 1.79]} \ No newline at end of file diff --git a/annotations_1/yr5x9xFoI04_filtered.json b/annotations_1/yr5x9xFoI04_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..202f1282ed23c9f1154f81c01406f638c79b4172 --- /dev/null +++ b/annotations_1/yr5x9xFoI04_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 9.8], [18.0, 17.83], [21.0, 21.3], [25.0, 25.02], [29.0, 31.24], [34.0, 35.88], [44.0, 45.3], [49.0, 54.01], [56.0, 57.87]], "keep_status": [true, false, false, false, false, false, false, true, false], "silence_prob": [35.39, 0.0, 0.0, 0.0, 69.88, 0.0, 0.0, 48.23, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 9.22], ["crowd", 8.53], ["cattle, bovinae", 7.97]], null, null, null, null, null, null, [["applause", 13.14], ["sound effect", 6.16], ["music", 6.05]], null], "duration": [2.8, -0.17, 0.3, 0.02, 2.24, 1.88, 1.3, 5.01, 1.87]} \ No newline at end of file diff --git a/annotations_1/yrfpRh2SqIw_filtered.json b/annotations_1/yrfpRh2SqIw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1231da5df14d79bf2017bd7f1bd832fcb8e48aad --- /dev/null +++ b/annotations_1/yrfpRh2SqIw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[25.0, 31.13], [32.0, 77.67], [80.0, 81.5], [84.0, 88.13]], "keep_status": [false, false, false, true], "silence_prob": [29.48, 0.0, 0.0, 30.9], "audiomae_on_audioset": [[["speech", 37.39], ["music", 34.61], ["hum", 2.79]], null, null, [["music", 20.58], ["speech", 17.5], ["explosion", 6.09]]], "duration": [6.13, 45.67, 1.5, 4.13]} \ No newline at end of file diff --git a/annotations_1/ysLBlalu91s_filtered.json b/annotations_1/ysLBlalu91s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11cc20e016898e88ec7a5e5ce8c9ba42d3c394b8 --- /dev/null +++ b/annotations_1/ysLBlalu91s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 16.82], [18.0, 34.53], [35.0, 36.39], [41.0, 42.25], [43.0, 44.2], [46.0, 47.82], [50.0, 51.71], [55.0, 57.69], [58.0, 71.58], [72.0, 79.91], [81.0, 81.53], [82.0, 87.51], [89.0, 88.97], [89.0, 89.11], [90.0, 89.87], [92.0, 92.18], [94.0, 94.9], [97.0, 100.97], [102.0, 111.84], [116.0, 116.73], [120.0, 120.97], [127.0, 129.05], [130.0, 131.52], [132.0, 133.49], [134.0, 135.19], [137.0, 137.3], [144.0, 145.3], [146.0, 151.38], [153.0, 153.72], [156.0, 160.51], [162.0, 164.27], [168.0, 170.4], [171.0, 172.15], [173.0, 174.01], [175.0, 179.14], [180.0, 202.09], [203.0, 205.33], [207.0, 207.96], [209.0, 213.53], [215.0, 216.18], [217.0, 220.29], [221.0, 231.85], [232.0, 232.17], [233.0, 234.1], [236.0, 236.31], [238.0, 237.66]], "keep_status": [false, false, false, false, false, false, false, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, true, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [37.66, 38.93, 0.0, 0.0, 0.0, 0.0, 0.0, 55.81, 43.66, 53.4, 0.0, 41.89, 0.0, 0.0, 0.0, 0.0, 0.0, 63.21, 55.67, 0.0, 0.0, 60.7, 0.0, 0.0, 0.0, 0.0, 0.0, 43.0, 0.0, 42.42, 47.31, 40.66, 0.0, 0.0, 37.69, 30.4, 36.92, 0.0, 46.22, 0.0, 58.47, 37.99, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["hum", 41.4], ["mains hum", 21.44], ["music", 10.97]], [["throbbing", 27.97], ["music", 26.9], ["hum", 19.7]], null, null, null, null, null, null, [["hum", 45.96], ["mains hum", 9.79], ["speech", 7.15]], null, null, [["speech", 18.2], ["fly, housefly", 14.19], ["music", 13.14]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["hum", 20.6], ["speech", 20.48], ["outside, rural or natural", 5.42]], null, [["throbbing", 16.84], ["hum", 12.63], ["music", 11.21]], [["music", 17.55], ["frog", 10.28], ["didgeridoo", 7.95]], [["music", 35.3], ["hum", 6.14], ["rumble", 4.81]], null, null, [["hum", 29.38], ["music", 26.84], ["throbbing", 24.41]], [["hum", 41.63], ["throbbing", 24.16], ["music", 15.48]], [["hum", 44.17], ["mains hum", 15.47], ["music", 14.63]], null, [["hum", 24.11], ["throbbing", 22.39], ["music", 8.6]], null, null, [["hum", 67.2], ["throbbing", 24.33], ["mains hum", 6.96]], null, null, null, null], "duration": [3.82, 16.53, 1.39, 1.25, 1.2, 1.82, 1.71, 2.69, 13.58, 7.91, 0.53, 5.51, -0.03, 0.11, -0.13, 0.18, 0.9, 3.97, 9.84, 0.73, 0.97, 2.05, 1.52, 1.49, 1.19, 0.3, 1.3, 5.38, 0.72, 4.51, 2.27, 2.4, 1.15, 1.01, 4.14, 22.09, 2.33, 0.96, 4.53, 1.18, 3.29, 10.85, 0.17, 1.1, 0.31, -0.34]} \ No newline at end of file diff --git a/annotations_1/ysudBGghmnA_filtered.json b/annotations_1/ysudBGghmnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..71df9a73fa307a7c2013974090f657c74d74f369 --- /dev/null +++ b/annotations_1/ysudBGghmnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 15.4], [16.0, 43.9], [47.0, 59.09], [60.0, 60.76], [73.0, 74.14], [76.0, 76.42], [78.0, 78.97], [80.0, 80.52], [85.0, 85.75], [96.0, 97.21], [101.0, 101.16], [103.0, 104.03], [105.0, 105.76], [116.0, 116.31], [126.0, 129.83], [132.0, 136.27], [138.0, 140.34], [141.0, 156.1], [157.0, 163.39], [164.0, 165.15], [167.0, 167.68], [170.0, 171.04], [172.0, 172.86]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, false, false], "silence_prob": [29.14, 28.59, 34.56, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.31, 47.62, 34.93, 32.2, 34.11, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 57.05], ["hum", 18.6], ["music", 14.26]], [["music", 35.47], ["hum", 26.11], ["throbbing", 23.15]], [["hum", 29.62], ["mains hum", 23.29], ["music", 11.74]], null, null, null, null, null, null, null, null, null, null, null, [["music", 53.23], ["speech", 14.17], ["hum", 9.46]], [["mains hum", 40.88], ["hum", 20.94], ["music", 17.83]], [["music", 43.88], ["hum", 12.69], ["speech", 10.34]], [["music", 38.5], ["hum", 12.03], ["mains hum", 7.34]], [["speech", 45.57], ["hum", 10.97], ["music", 7.61]], null, null, null, null], "duration": [12.4, 27.9, 12.09, 0.76, 1.14, 0.42, 0.97, 0.52, 0.75, 1.21, 0.16, 1.03, 0.76, 0.31, 3.83, 4.27, 2.34, 15.1, 6.39, 1.15, 0.68, 1.04, 0.86]} \ No newline at end of file diff --git a/annotations_1/yt1pZiuyKJE_filtered.json b/annotations_1/yt1pZiuyKJE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cef66be062e4ad8acdd8751bde46bb5b696c62b9 --- /dev/null +++ b/annotations_1/yt1pZiuyKJE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.38], [6.0, 19.48], [20.0, 22.52], [23.0, 24.7], [26.0, 31.38], [33.0, 48.91], [50.0, 50.97], [52.0, 51.85], [52.0, 53.23], [54.0, 55.49], [56.0, 59.27], [67.0, 68.39], [72.0, 75.49], [76.0, 77.25], [85.0, 85.73], [93.0, 93.46], [96.0, 97.92], [101.0, 105.36], [107.0, 107.67], [108.0, 110.4], [115.0, 118.34], [120.0, 120.78], [125.0, 129.12], [131.0, 140.05], [141.0, 142.84], [144.0, 182.65], [184.0, 185.16], [186.0, 186.41], [187.0, 187.52], [189.0, 191.32]], "keep_status": [false, true, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.67, 46.22, 0.0, 29.57, 38.6, 0.0, 0.0, 0.0, 0.0, 53.04, 0.0, 41.34, 0.0, 0.0, 0.0, 0.0, 62.37, 0.0, 62.47, 38.52, 0.0, 32.87, 40.11, 0.0, 0.0, 0.0, 0.0, 0.0, 52.74], "audiomae_on_audioset": [null, [["mains hum", 29.4], ["hum", 26.51], ["explosion", 13.14]], [["speech", 41.54], ["hum", 17.95], ["whale vocalization", 11.72]], null, [["explosion", 30.54], ["breaking", 24.95], ["burst, pop", 8.74]], [["music", 32.58], ["hum", 24.01], ["throbbing", 13.51]], null, null, null, null, null, null, [["music", 34.35], ["speech", 5.88], ["gong", 5.36]], null, null, null, null, null, null, null, [["music", 34.66], ["beatboxing", 13.11], ["electronic music", 5.56]], null, [["music", 62.01], ["synthesizer", 3.96], ["explosion", 3.74]], [["throbbing", 43.96], ["music", 23.34], ["hum", 19.43]], null, null, null, null, null, null], "duration": [1.38, 13.48, 2.52, 1.7, 5.38, 15.91, 0.97, -0.15, 1.23, 1.49, 3.27, 1.39, 3.49, 1.25, 0.73, 0.46, 1.92, 4.36, 0.67, 2.4, 3.34, 0.78, 4.12, 9.05, 1.84, 38.65, 1.16, 0.41, 0.52, 2.32]} \ No newline at end of file diff --git a/annotations_1/ytEsz9ZEh_g_filtered.json b/annotations_1/ytEsz9ZEh_g_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce0195b46624d773d704b5f3b31ae72ed78c0203 --- /dev/null +++ b/annotations_1/ytEsz9ZEh_g_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.73], [8.0, 9.63], [11.0, 14.05], [15.0, 19.47], [22.0, 32.0], [33.0, 35.55], [37.0, 53.47], [54.0, 57.06], [59.0, 60.71], [62.0, 65.35], [66.0, 68.05], [71.0, 74.31], [76.0, 99.64], [102.0, 109.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [98.8, 0.0, 90.6, 62.68, 59.96, 97.54, 97.22, 99.52, 0.0, 99.71, 99.65, 99.87, 83.88, 97.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.73, 1.63, 3.05, 4.47, 10.0, 2.55, 16.47, 3.06, 1.71, 3.35, 2.05, 3.31, 23.64, 7.07]} \ No newline at end of file diff --git a/annotations_1/yuQW4F1siis_filtered.json b/annotations_1/yuQW4F1siis_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9c0ee4e539fc028c373945cdc83c49022da13cfd --- /dev/null +++ b/annotations_1/yuQW4F1siis_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[18.0, 21.2], [23.0, 23.62], [26.0, 31.53], [34.0, 34.32], [35.0, 35.9], [37.0, 40.31], [41.0, 42.21], [43.0, 43.58], [44.0, 46.28], [49.0, 48.91], [52.0, 52.84], [55.0, 54.67], [55.0, 57.13], [58.0, 58.26], [59.0, 61.1], [61.0, 62.01], [65.0, 66.68], [68.0, 69.35], [71.0, 72.99], [74.0, 74.6], [75.0, 79.19], [84.0, 85.55], [94.0, 103.38], [105.0, 105.81], [108.0, 108.13], [108.0, 108.41], [108.0, 115.72], [116.0, 117.59], [119.0, 122.03], [123.0, 124.23], [130.0, 144.75]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true], "silence_prob": [52.74, 0.0, 54.9, 0.0, 0.0, 43.66, 0.0, 0.0, 48.82, 0.0, 0.0, 0.0, 54.36, 0.0, 37.71, 0.0, 0.0, 0.0, 0.0, 0.0, 36.98, 0.0, 42.11, 0.0, 0.0, 0.0, 39.69, 0.0, 50.31, 0.0, 31.05], "audiomae_on_audioset": [null, null, null, null, null, [["music", 23.07], ["hum", 13.32], ["whale vocalization", 7.68]], null, null, [["speech", 67.1], ["whale vocalization", 5.18], ["music", 3.4]], null, null, null, null, null, [["music", 19.07], ["speech", 18.39], ["hum", 17.51]], null, null, null, null, null, [["speech", 60.82], ["sidetone", 14.52], ["music", 8.4]], null, [["hum", 50.15], ["throbbing", 19.6], ["speech", 14.39]], null, null, null, [["hum", 36.64], ["sidetone", 18.99], ["mains hum", 13.13]], null, null, null, [["music", 41.44], ["speech", 25.4], ["didgeridoo", 2.62]]], "duration": [3.2, 0.62, 5.53, 0.32, 0.9, 3.31, 1.21, 0.58, 2.28, -0.09, 0.84, -0.33, 2.13, 0.26, 2.1, 1.01, 1.68, 1.35, 1.99, 0.6, 4.19, 1.55, 9.38, 0.81, 0.13, 0.41, 7.72, 1.59, 3.03, 1.23, 14.75]} \ No newline at end of file diff --git a/annotations_1/yuQipNK_BiQ_filtered.json b/annotations_1/yuQipNK_BiQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a3ea18de0eda287f73d73af12b76ed7a313b198 --- /dev/null +++ b/annotations_1/yuQipNK_BiQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.92], [5.0, 8.33], [9.0, 18.12], [21.0, 21.44], [24.0, 24.68], [26.0, 28.22], [30.0, 30.59], [34.0, 37.2], [39.0, 39.65], [42.0, 42.94], [45.0, 46.57], [48.0, 49.4], [52.0, 52.34], [54.0, 54.82], [55.0, 56.47], [58.0, 62.06], [63.0, 63.12], [64.0, 64.94], [66.0, 69.47], [71.0, 71.81], [79.0, 79.64], [81.0, 82.71], [84.0, 86.21], [90.0, 93.85], [98.0, 99.37], [105.0, 106.29], [107.0, 106.89], [107.0, 111.35], [113.0, 117.27], [119.0, 123.58], [124.0, 126.86], [129.0, 130.62], [132.0, 135.26], [136.0, 136.27], [139.0, 141.94]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [88.83, 93.6, 97.73, 0.0, 0.0, 99.99, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.93, 0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 99.97, 99.96, 0.0, 0.0, 0.0, 99.71, 99.88, 99.97, 99.91, 0.0, 99.91, 0.0, 97.73], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [3.92, 3.33, 9.12, 0.44, 0.68, 2.22, 0.59, 3.2, 0.65, 0.94, 1.57, 1.4, 0.34, 0.82, 1.47, 4.06, 0.12, 0.94, 3.47, 0.81, 0.64, 1.71, 2.21, 3.85, 1.37, 1.29, -0.11, 4.35, 4.27, 4.58, 2.86, 1.62, 3.26, 0.27, 2.94]} \ No newline at end of file diff --git a/annotations_1/yuU4pFcEgWo_filtered.json b/annotations_1/yuU4pFcEgWo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..11a04d4355146a7f7d16577be9da4d441cf905de --- /dev/null +++ b/annotations_1/yuU4pFcEgWo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.93], [23.0, 23.62], [26.0, 27.41], [28.0, 34.7], [45.0, 51.0], [51.0, 80.55], [81.0, 81.72], [83.0, 83.61], [85.0, 85.14], [87.0, 88.03], [92.0, 92.58], [93.0, 93.6], [94.0, 113.73], [117.0, 118.81], [119.0, 121.66], [124.0, 128.75], [131.0, 138.69], [142.0, 142.62], [147.0, 148.02], [149.0, 149.23], [152.0, 152.54], [154.0, 154.97], [159.0, 159.8], [161.0, 165.01]], "keep_status": [true, false, false, true, true, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false], "silence_prob": [29.15, 0.0, 0.0, 29.04, 30.36, 29.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 28.96, 0.0, 34.93, 30.44, 29.2, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 68.02], "audiomae_on_audioset": [[["speech", 24.98], ["foghorn", 22.07], ["music", 18.84]], null, null, [["livestock, farm animals, working animals", 22.82], ["moo", 12.44], ["cattle, bovinae", 10.74]], [["music", 33.37], ["hum", 5.27], ["throbbing", 5.23]], [["music", 65.89], ["speech", 14.43], ["musical instrument", 2.82]], null, null, null, null, null, null, [["music", 69.75], ["theremin", 4.87], ["musical instrument", 3.05]], null, [["speech", 20.62], ["animal", 19.65], ["radio", 8.97]], [["vehicle", 16.75], ["speech", 12.25], ["boat, water vehicle", 11.89]], [["music", 54.56], ["trombone", 15.42], ["echo", 4.81]], null, null, null, null, null, null, null], "duration": [9.93, 0.62, 1.41, 6.7, 6.0, 29.55, 0.72, 0.61, 0.14, 1.03, 0.58, 0.6, 19.73, 1.81, 2.66, 4.75, 7.69, 0.62, 1.02, 0.23, 0.54, 0.97, 0.8, 4.01]} \ No newline at end of file diff --git a/annotations_1/yunEcgw8va0_filtered.json b/annotations_1/yunEcgw8va0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6b4164098c7c13e658f1a7b25b98919a4e30c65f --- /dev/null +++ b/annotations_1/yunEcgw8va0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 9.31], [9.0, 9.49], [10.0, 9.98], [16.0, 17.54], [22.0, 23.75], [28.0, 30.13], [37.0, 37.99], [40.0, 53.96]], "keep_status": [false, false, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 30.81, 0.0, 30.36], "audiomae_on_audioset": [null, null, null, null, null, [["vehicle", 15.71], ["speech", 11.2], ["motorboat, speedboat", 4.9]], null, [["speech", 41.43], ["buzz", 10.62], ["music", 9.3]]], "duration": [1.31, 0.49, -0.02, 1.54, 1.75, 2.13, 0.99, 13.96]} \ No newline at end of file diff --git a/annotations_1/yvD3X3RcK3Y_filtered.json b/annotations_1/yvD3X3RcK3Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e55c1caa1d9993c0cd99177500e4c68b4b648951 --- /dev/null +++ b/annotations_1/yvD3X3RcK3Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 61.59], [62.0, 63.0], [64.0, 64.64], [69.0, 69.01], [70.0, 70.06], [71.0, 79.62], [82.0, 82.8], [85.0, 86.39], [88.0, 88.5], [89.0, 89.19], [90.0, 100.04], [101.0, 109.12], [110.0, 110.76], [112.0, 132.41], [140.0, 140.24], [141.0, 148.81], [150.0, 149.82], [151.0, 150.77], [153.0, 154.28]], "keep_status": [false, false, false, false, false, true, false, false, false, false, true, true, false, true, false, true, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 35.65, 0.0, 0.0, 0.0, 0.0, 33.5, 36.44, 0.0, 34.67, 0.0, 32.88, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["noise", 28.97], ["effects unit", 14.49], ["distortion", 12.02]], null, null, null, null, [["effects unit", 16.26], ["distortion", 12.38], ["music", 10.94]], [["distortion", 11.97], ["effects unit", 11.72], ["animal", 9.87]], null, [["noise", 36.26], ["effects unit", 12.14], ["distortion", 5.92]], null, [["music", 36.86], ["effects unit", 17.56], ["musical instrument", 10.2]], null, null, null], "duration": [56.59, 1.0, 0.64, 0.01, 0.06, 8.62, 0.8, 1.39, 0.5, 0.19, 10.04, 8.12, 0.76, 20.41, 0.24, 7.81, -0.18, -0.23, 1.28]} \ No newline at end of file diff --git a/annotations_1/yvtb9A9ai9Q_filtered.json b/annotations_1/yvtb9A9ai9Q_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f046e468842661bb16baa66e5fd65491eda5a0e0 --- /dev/null +++ b/annotations_1/yvtb9A9ai9Q_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.74], [9.0, 9.78], [12.0, 14.64], [17.0, 20.29], [22.0, 31.18], [33.0, 34.26], [37.0, 56.51], [80.0, 97.78], [99.0, 99.74], [101.0, 123.65], [130.0, 130.91], [132.0, 132.85]], "keep_status": [true, false, false, false, true, false, true, false, false, false, false, false], "silence_prob": [31.49, 0.0, 31.07, 32.04, 30.1, 0.0, 30.34, 30.59, 0.0, 30.86, 0.0, 0.0], "audiomae_on_audioset": [[["throbbing", 43.06], ["music", 15.76], ["hum", 7.82]], null, [["music", 60.97], ["throbbing", 5.51], ["electronic music", 4.71]], [["music", 47.83], ["throbbing", 14.02], ["speech", 13.81]], [["music", 44.35], ["throbbing", 12.74], ["whack, thwack", 6.16]], null, [["speech", 21.27], ["throbbing", 19.24], ["music", 18.87]], [["music", 53.66], ["speech", 12.63], ["electronic music", 5.75]], null, [["hum", 44.16], ["throbbing", 32.29], ["mains hum", 9.07]], null, null], "duration": [2.74, 0.78, 2.64, 3.29, 9.18, 1.26, 19.51, 17.78, 0.74, 22.65, 0.91, 0.85]} \ No newline at end of file diff --git a/annotations_1/yvzmLB30MwM_filtered.json b/annotations_1/yvzmLB30MwM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..894e3267505abb3063986ee3801b922b26b25405 --- /dev/null +++ b/annotations_1/yvzmLB30MwM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.1], [12.0, 16.77], [18.0, 18.33], [19.0, 19.31], [22.0, 22.65], [23.0, 30.11], [38.0, 42.8], [49.0, 53.6], [55.0, 56.37], [57.0, 58.02], [60.0, 61.3], [67.0, 67.58], [68.0, 70.01], [72.0, 80.74], [81.0, 83.35], [88.0, 90.19], [93.0, 114.83], [117.0, 140.39]], "keep_status": [false, false, false, false, false, true, true, true, false, false, false, false, false, false, true, false, true, true], "silence_prob": [29.5, 28.63, 0.0, 0.0, 0.0, 28.84, 28.66, 28.5, 0.0, 0.0, 0.0, 0.0, 30.43, 28.31, 30.04, 33.79, 29.23, 28.43], "audiomae_on_audioset": [[["throbbing", 49.88], ["hum", 20.81], ["music", 19.01]], [["hum", 38.05], ["mains hum", 29.33], ["music", 10.14]], null, null, null, [["speech", 44.1], ["music", 14.42], ["hum", 6.01]], [["music", 63.02], ["speech", 3.09], ["throbbing", 3.02]], [["speech", 33.32], ["music", 26.59], ["rumble", 6.51]], null, null, null, null, [["music", 49.5], ["speech", 21.0], ["hum", 2.95]], [["music", 67.17], ["cacophony", 5.06], ["speech", 2.85]], [["music", 26.57], ["hum", 7.46], ["cattle, bovinae", 7.05]], [["hum", 29.14], ["music", 26.77], ["mains hum", 18.3]], [["music", 48.28], ["speech", 14.37], ["thump, thud", 3.25]], [["speech", 41.17], ["music", 20.61], ["hum", 7.86]]], "duration": [3.1, 4.77, 0.33, 0.31, 0.65, 7.11, 4.8, 4.6, 1.37, 1.02, 1.3, 0.58, 2.01, 8.74, 2.35, 2.19, 21.83, 23.39]} \ No newline at end of file diff --git a/annotations_1/ywRWNlbXD8s_filtered.json b/annotations_1/ywRWNlbXD8s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a23229247509afa089756af6180529a55abb4ca1 --- /dev/null +++ b/annotations_1/ywRWNlbXD8s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.37], [18.0, 25.25], [31.0, 44.34], [48.0, 48.73], [50.0, 50.52], [53.0, 53.77], [55.0, 56.13], [58.0, 65.15], [68.0, 69.26], [70.0, 85.41], [89.0, 93.36], [103.0, 106.41], [107.0, 107.76], [112.0, 124.51], [128.0, 130.77], [137.0, 138.54]], "keep_status": [false, false, true, false, false, false, false, true, false, false, true, true, false, true, true, false], "silence_prob": [0.0, 33.16, 31.73, 0.0, 0.0, 0.0, 0.0, 31.95, 0.0, 66.39, 31.54, 36.84, 0.0, 30.44, 30.95, 0.0], "audiomae_on_audioset": [null, [["music", 42.16], ["hum", 23.53], ["throbbing", 14.46]], [["music", 46.26], ["didgeridoo", 7.17], ["boing", 6.31]], null, null, null, null, [["speech", 26.24], ["explosion", 21.01], ["animal", 6.9]], null, null, [["music", 25.01], ["hum", 21.31], ["gong", 12.07]], [["livestock, farm animals, working animals", 17.29], ["cattle, bovinae", 15.4], ["music", 9.46]], null, [["music", 53.62], ["hum", 9.22], ["mains hum", 6.81]], [["cattle, bovinae", 23.91], ["music", 15.23], ["moo", 10.97]], null], "duration": [1.37, 7.25, 13.34, 0.73, 0.52, 0.77, 1.13, 7.15, 1.26, 15.41, 4.36, 3.41, 0.76, 12.51, 2.77, 1.54]} \ No newline at end of file diff --git a/annotations_1/ywlNZzvlaKE_filtered.json b/annotations_1/ywlNZzvlaKE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e9f72408f1af2f540db4ca6ae5ed3ee55d3e762c --- /dev/null +++ b/annotations_1/ywlNZzvlaKE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 18.4], [19.0, 22.49], [23.0, 25.76], [27.0, 28.29], [29.0, 35.72], [36.0, 47.66], [48.0, 52.93], [54.0, 54.87], [56.0, 58.75], [60.0, 61.55], [62.0, 63.26], [64.0, 65.13], [66.0, 68.52], [70.0, 70.75], [72.0, 87.57], [89.0, 185.94], [186.0, 192.23]], "keep_status": [false, true, true, false, false, true, true, false, true, false, false, false, true, false, true, false, false], "silence_prob": [57.4, 38.84, 37.59, 0.0, 29.84, 28.45, 28.77, 0.0, 29.49, 0.0, 0.0, 0.0, 30.03, 0.0, 29.03, 0.0, 32.96], "audiomae_on_audioset": [null, [["speech", 23.96], ["hum", 20.15], ["music", 12.76]], [["speech", 32.67], ["sidetone", 15.92], ["noise", 6.69]], null, [["music", 58.45], ["noise", 17.19], ["synthesizer", 4.95]], [["music", 28.94], ["speech", 25.55], ["hum", 11.89]], [["speech", 50.85], ["music", 11.89], ["mains hum", 5.95]], null, [["mains hum", 45.54], ["hum", 10.07], ["electric shaver, electric razor", 9.33]], null, null, null, [["music", 24.28], ["didgeridoo", 16.34], ["hum", 5.47]], null, [["music", 34.11], ["didgeridoo", 18.1], ["hum", 17.53]], null, [["gong", 38.87], ["music", 34.64], ["ambient music", 15.71]]], "duration": [3.4, 3.49, 2.76, 1.29, 6.72, 11.66, 4.93, 0.87, 2.75, 1.55, 1.26, 1.13, 2.52, 0.75, 15.57, 96.94, 6.23]} \ No newline at end of file diff --git a/annotations_1/yxlXYm5Uo08_filtered.json b/annotations_1/yxlXYm5Uo08_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f210b424f31a0e81d1c6ec85deb6715c9308b7da --- /dev/null +++ b/annotations_1/yxlXYm5Uo08_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.47], [5.0, 15.69], [17.0, 18.96], [20.0, 23.63], [25.0, 32.16], [35.0, 36.41], [38.0, 40.37], [42.0, 43.38], [45.0, 48.74], [51.0, 51.07], [52.0, 56.62], [57.0, 60.74], [62.0, 67.17], [69.0, 70.17], [74.0, 77.35], [81.0, 81.63], [82.0, 83.42], [84.0, 89.34], [90.0, 90.32], [91.0, 92.38], [93.0, 95.82]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 46.86, 0.0, 96.42, 97.73, 0.0, 100.0, 0.0, 99.44, 0.0, 96.89, 52.27, 56.86, 0.0, 91.3, 0.0, 0.0, 51.5, 0.0, 0.0, 60.98], "audiomae_on_audioset": [null, [["music", 67.26], ["horse", 3.63], ["speech", 2.9]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.47, 10.69, 1.96, 3.63, 7.16, 1.41, 2.37, 1.38, 3.74, 0.07, 4.62, 3.74, 5.17, 1.17, 3.35, 0.63, 1.42, 5.34, 0.32, 1.38, 2.82]} \ No newline at end of file diff --git a/annotations_1/yyPkV_leKEY_filtered.json b/annotations_1/yyPkV_leKEY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..edd43f59c54c7dec10e75914b6f61f95283c258c --- /dev/null +++ b/annotations_1/yyPkV_leKEY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 3.91], [6.0, 7.72], [10.0, 9.93], [10.0, 10.56], [15.0, 16.87], [22.0, 23.63], [27.0, 31.97], [37.0, 38.67], [40.0, 42.57], [46.0, 49.64], [53.0, 53.22], [57.0, 57.59], [61.0, 60.98], [68.0, 68.2], [73.0, 74.16], [85.0, 87.72], [89.0, 90.85], [92.0, 93.51], [94.0, 95.93], [96.0, 98.46], [102.0, 105.31], [107.0, 117.1], [119.0, 120.34], [128.0, 130.57], [133.0, 133.78], [149.0, 154.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.8, 0.0, 77.87, 83.34, 0.0, 0.0, 0.0, 0.0, 0.0, 97.54, 0.0, 0.0, 0.0, 77.2, 75.07, 59.68, 0.0, 55.11, 0.0, 81.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.91, 1.72, -0.07, 0.56, 1.87, 1.63, 4.97, 1.67, 2.57, 3.64, 0.22, 0.59, -0.02, 0.2, 1.16, 2.72, 1.85, 1.51, 1.93, 2.46, 3.31, 10.1, 1.34, 2.57, 0.78, 5.95]} \ No newline at end of file diff --git a/annotations_1/yygNdTxoHus_filtered.json b/annotations_1/yygNdTxoHus_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5219824512ba8f358c5cf96b506007f060922af4 --- /dev/null +++ b/annotations_1/yygNdTxoHus_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.18], [3.0, 3.99], [6.0, 5.88], [10.0, 11.75], [12.0, 14.62], [18.0, 19.04], [21.0, 22.98], [24.0, 29.19], [31.0, 32.14], [32.0, 39.72], [48.0, 58.04], [59.0, 59.12], [60.0, 118.34], [119.0, 143.58], [147.0, 149.42], [155.0, 158.52], [163.0, 171.85], [175.0, 180.4], [187.0, 196.47], [197.0, 197.5], [198.0, 197.56], [198.0, 197.68], [198.0, 197.8], [198.0, 197.95]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 99.62, 0.0, 0.0, 99.8, 0.0, 93.13, 61.47, 0.0, 0.0, 35.62, 35.41, 34.37, 34.93, 34.54, 33.4, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 79.75], ["carnatic music", 3.59], ["theremin", 3.05]], [["music", 53.66], ["throbbing", 6.93], ["synthesizer", 5.23]], [["music", 68.7], ["didgeridoo", 11.8], ["musical instrument", 2.83]], [["music", 52.76], ["didgeridoo", 33.46], ["musical instrument", 2.87]], [["music", 56.83], ["didgeridoo", 12.61], ["beatboxing", 7.31]], [["music", 79.55], ["reggae", 1.72], ["funk", 1.48]], null, null, null, null, null], "duration": [0.18, 0.99, -0.12, 1.75, 2.62, 1.04, 1.98, 5.19, 1.14, 7.72, 10.04, 0.12, 58.34, 24.58, 2.42, 3.52, 8.85, 5.4, 9.47, 0.5, -0.44, -0.32, -0.2, -0.05]} \ No newline at end of file diff --git a/annotations_1/yywlulXZ0ls_filtered.json b/annotations_1/yywlulXZ0ls_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c2d938be61d6b22adf0b60db84a73269e19034cf --- /dev/null +++ b/annotations_1/yywlulXZ0ls_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.52], [18.0, 19.11], [25.0, 30.33], [31.0, 31.6], [35.0, 40.29], [41.0, 50.33], [53.0, 53.33], [54.0, 63.68], [66.0, 66.82], [67.0, 67.41], [68.0, 68.79], [71.0, 73.13]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, true], "silence_prob": [77.53, 0.0, 39.69, 0.0, 43.77, 34.13, 0.0, 43.58, 0.0, 0.0, 0.0, 44.26], "audiomae_on_audioset": [null, null, [["sidetone", 41.55], ["speech", 24.33], ["music", 8.88]], null, [["music", 49.25], ["cattle, bovinae", 6.56], ["moo", 5.36]], [["music", 61.4], ["groan", 13.9], ["synthesizer", 5.49]], null, [["speech", 51.4], ["duck", 11.19], ["quack", 8.51]], null, null, null, [["sidetone", 43.88], ["speech", 10.14], ["music", 6.44]]], "duration": [3.52, 1.11, 5.33, 0.6, 5.29, 9.33, 0.33, 9.68, 0.82, 0.41, 0.79, 2.13]} \ No newline at end of file diff --git a/annotations_1/yzera03y4_0_filtered.json b/annotations_1/yzera03y4_0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3bf3902e5ad46d6e43ce3913d334251f8297b94 --- /dev/null +++ b/annotations_1/yzera03y4_0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 11.89], [13.0, 14.39], [17.0, 23.53], [24.0, 34.15], [35.0, 39.56], [40.0, 42.69], [44.0, 44.68], [46.0, 46.85], [48.0, 49.45], [52.0, 55.7], [57.0, 59.21], [61.0, 64.47], [65.0, 68.69], [70.0, 77.73], [78.0, 78.29]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [63.74, 0.0, 82.61, 99.99, 99.65, 91.13, 0.0, 0.0, 0.0, 100.0, 99.99, 100.0, 98.59, 95.64, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [7.89, 1.39, 6.53, 10.15, 4.56, 2.69, 0.68, 0.85, 1.45, 3.7, 2.21, 3.47, 3.69, 7.73, 0.29]} \ No newline at end of file diff --git a/annotations_1/yzwheD19-PQ_filtered.json b/annotations_1/yzwheD19-PQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e2a41c76337e572c9bc5f491fdb823f9fbabce06 --- /dev/null +++ b/annotations_1/yzwheD19-PQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 12.07], [16.0, 25.46], [26.0, 61.69], [63.0, 91.0], [91.0, 91.66], [92.0, 105.46], [106.0, 108.35], [109.0, 110.19], [111.0, 113.1], [116.0, 116.23], [119.0, 118.89], [120.0, 120.7], [121.0, 122.15], [124.0, 129.73], [130.0, 133.79], [138.0, 168.91], [169.0, 169.94], [170.0, 172.22]], "keep_status": [false, true, false, true, false, false, true, false, false, false, false, false, false, true, true, false, false, false], "silence_prob": [31.5, 29.46, 0.0, 28.33, 0.0, 57.56, 49.18, 0.0, 34.77, 0.0, 0.0, 0.0, 0.0, 33.45, 47.08, 0.0, 0.0, 43.71], "audiomae_on_audioset": [[["speech", 52.4], ["music", 25.09], ["throbbing", 4.68]], [["music", 39.2], ["hum", 17.13], ["whale vocalization", 10.25]], null, [["buzz", 32.6], ["speech", 12.4], ["music", 9.25]], null, null, [["music", 36.43], ["didgeridoo", 8.03], ["hum", 3.49]], null, [["music", 39.79], ["speech", 28.34], ["didgeridoo", 5.83]], null, null, null, null, [["speech", 34.23], ["whack, thwack", 15.55], ["music", 9.69]], [["cattle, bovinae", 19.3], ["livestock, farm animals, working animals", 13.79], ["moo", 11.86]], null, null, [["music", 63.65], ["musical instrument", 5.68], ["guitar", 4.34]]], "duration": [3.07, 9.46, 35.69, 28.0, 0.66, 13.46, 2.35, 1.19, 2.1, 0.23, -0.11, 0.7, 1.15, 5.73, 3.79, 30.91, 0.94, 2.22]} \ No newline at end of file diff --git a/annotations_1/z-4DtLFGzG0_filtered.json b/annotations_1/z-4DtLFGzG0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0c39985f2cbc3101c062b2980ab4ffb3853797ca --- /dev/null +++ b/annotations_1/z-4DtLFGzG0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.22], [2.0, 2.96], [8.0, 8.06], [10.0, 11.42], [15.0, 16.38], [18.0, 18.28], [18.0, 23.09], [25.0, 26.7], [45.0, 46.52], [48.0, 49.1], [52.0, 52.69], [54.0, 58.58], [69.0, 69.31], [118.0, 119.79], [121.0, 121.9], [129.0, 129.24], [130.0, 129.96], [130.0, 130.1], [130.0, 136.7], [138.0, 138.11], [144.0, 144.36], [153.0, 154.31], [156.0, 156.78], [158.0, 159.34], [160.0, 168.02], [169.0, 169.42], [171.0, 171.54]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.1, 0.0, 0.0, 0.0, 0.0, 73.97, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.15, 0.0, 0.0, 0.0, 0.0, 0.0, 29.72, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["speech", 48.56], ["music", 29.45], ["livestock, farm animals, working animals", 6.04]], null, null, null, null, null, [["speech", 28.85], ["sonar", 28.05], ["music", 20.39]], null, null], "duration": [0.22, 0.96, 0.06, 1.42, 1.38, 0.28, 5.09, 1.7, 1.52, 1.1, 0.69, 4.58, 0.31, 1.79, 0.9, 0.24, -0.04, 0.1, 6.7, 0.11, 0.36, 1.31, 0.78, 1.34, 8.02, 0.42, 0.54]} \ No newline at end of file diff --git a/annotations_1/z-fCbA2aAyg_filtered.json b/annotations_1/z-fCbA2aAyg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..6e648f961408c32163f4333225d668f0419fa272 --- /dev/null +++ b/annotations_1/z-fCbA2aAyg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 16.9], [19.0, 19.8], [21.0, 22.57], [35.0, 35.8], [38.0, 38.58], [49.0, 49.98], [52.0, 53.86], [55.0, 55.09], [56.0, 56.94], [58.0, 58.75], [61.0, 64.12], [65.0, 67.58], [68.0, 79.34], [80.0, 80.45], [83.0, 109.61], [114.0, 117.0], [120.0, 130.69], [134.0, 134.25], [134.0, 140.16], [147.0, 150.87], [151.0, 151.23], [152.0, 165.25]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, true, false, false], "silence_prob": [30.73, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 86.27, 31.13, 0.0, 29.69, 30.39, 31.78, 0.0, 30.76, 29.93, 0.0, 30.07], "audiomae_on_audioset": [[["speech", 26.96], ["music", 25.67], ["didgeridoo", 3.75]], null, null, null, null, null, null, null, null, null, null, null, [["speech", 33.53], ["music", 29.63], ["whale vocalization", 5.9]], null, [["music", 35.53], ["mosquito", 6.96], ["whale vocalization", 6.52]], [["electric shaver, electric razor", 22.07], ["music", 6.19], ["buzz", 5.87]], [["music", 55.43], ["theremin", 8.97], ["hum", 8.91]], null, [["music", 43.38], ["speech", 31.81], ["didgeridoo", 2.92]], [["music", 32.81], ["theremin", 10.74], ["speech", 8.86]], null, [["music", 84.69], ["meow", 1.52], ["musical instrument", 1.24]]], "duration": [10.9, 0.8, 1.57, 0.8, 0.58, 0.98, 1.86, 0.09, 0.94, 0.75, 3.12, 2.58, 11.34, 0.45, 26.61, 3.0, 10.69, 0.25, 6.16, 3.87, 0.23, 13.25]} \ No newline at end of file diff --git a/annotations_1/z08tZYDrY_8_filtered.json b/annotations_1/z08tZYDrY_8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..126c783e3ed82abe1de180bf521801ebc8530e53 --- /dev/null +++ b/annotations_1/z08tZYDrY_8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.98], [11.0, 23.46], [24.0, 36.69], [42.0, 46.45], [48.0, 56.19], [59.0, 85.5], [89.0, 105.95], [109.0, 110.46], [113.0, 120.6], [122.0, 133.03]], "keep_status": [false, false, false, true, true, false, false, false, false, true], "silence_prob": [0.0, 28.52, 28.71, 28.64, 28.7, 28.76, 28.89, 0.0, 29.3, 28.32], "audiomae_on_audioset": [null, [["music", 60.35], ["throbbing", 8.47], ["hum", 5.52]], [["music", 51.55], ["cacophony", 17.23], ["sound effect", 4.29]], [["speech", 44.58], ["music", 5.61], ["vehicle", 5.19]], [["music", 32.37], ["mains hum", 14.69], ["hum", 11.85]], [["hum", 29.8], ["throbbing", 24.95], ["mains hum", 19.54]], [["music", 76.9], ["throbbing", 6.63], ["electronic music", 4.57]], null, [["music", 75.92], ["electronic music", 7.33], ["trance music", 4.92]], [["mains hum", 19.77], ["hum", 15.97], ["music", 13.62]]], "duration": [0.98, 12.46, 12.69, 4.45, 8.19, 26.5, 16.95, 1.46, 7.6, 11.03]} \ No newline at end of file diff --git a/annotations_1/z1RLdJwkFZA_filtered.json b/annotations_1/z1RLdJwkFZA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f1f0851e3ba9abd588fb68801f618c1dcf852d0e --- /dev/null +++ b/annotations_1/z1RLdJwkFZA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 30.06], [34.0, 62.85], [64.0, 66.12], [73.0, 72.6], [77.0, 87.67], [89.0, 90.24], [92.0, 98.09], [101.0, 101.71]], "keep_status": [false, false, true, false, true, false, false, false], "silence_prob": [35.22, 32.83, 44.6, 0.0, 33.77, 0.0, 35.8, 0.0], "audiomae_on_audioset": [[["music", 51.74], ["throbbing", 19.64], ["hum", 7.74]], [["throbbing", 38.84], ["music", 27.64], ["hum", 17.79]], [["music", 25.67], ["fly, housefly", 9.23], ["mosquito", 7.55]], null, [["music", 58.61], ["thump, thud", 5.56], ["whack, thwack", 3.42]], null, [["speech", 30.92], ["music", 27.67], ["hum", 18.89]], null], "duration": [17.06, 28.85, 2.12, -0.4, 10.67, 1.24, 6.09, 0.71]} \ No newline at end of file diff --git a/annotations_1/z21tJkx07J8_filtered.json b/annotations_1/z21tJkx07J8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f4684d943b4d2318e544197a19761d40c0fef1da --- /dev/null +++ b/annotations_1/z21tJkx07J8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[67.0, 68.28], [69.0, 122.45]], "keep_status": [false, false], "silence_prob": [0.0, 0.0], "audiomae_on_audioset": [null, null], "duration": [1.28, 53.45]} \ No newline at end of file diff --git a/annotations_1/z23vdob1grU_filtered.json b/annotations_1/z23vdob1grU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..22be788d96ac0db83737774f77f705fd62615aaf --- /dev/null +++ b/annotations_1/z23vdob1grU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 35.77], [38.0, 40.73], [42.0, 52.19], [53.0, 84.08], [86.0, 94.41], [97.0, 99.81], [102.0, 158.31]], "keep_status": [true, false, false, false, false, true, false], "silence_prob": [31.58, 79.76, 59.51, 0.0, 32.94, 33.27, 0.0], "audiomae_on_audioset": [[["speech", 31.13], ["music", 15.45], ["animal", 4.94]], null, null, null, [["mains hum", 33.22], ["hum", 32.79], ["speech", 14.46]], [["music", 31.99], ["theremin", 23.01], ["creak", 2.88]], null], "duration": [22.77, 2.73, 10.19, 31.08, 8.41, 2.81, 56.31]} \ No newline at end of file diff --git a/annotations_1/z2NhPvlzjcg_filtered.json b/annotations_1/z2NhPvlzjcg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ddd8cadebe3c2a5d64e08a890bd813d6e30cc7c5 --- /dev/null +++ b/annotations_1/z2NhPvlzjcg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 14.34], [15.0, 23.6], [24.0, 23.92], [24.0, 24.11], [25.0, 29.57], [32.0, 35.13], [40.0, 44.37], [45.0, 47.66], [51.0, 57.42], [62.0, 71.44], [75.0, 76.55], [78.0, 83.52], [85.0, 85.9], [86.0, 86.29], [87.0, 88.15], [93.0, 112.94], [114.0, 118.05], [121.0, 121.1], [126.0, 134.37], [137.0, 143.11], [144.0, 144.96], [146.0, 146.7], [147.0, 161.96]], "keep_status": [false, true, false, false, true, false, true, true, true, false, false, true, false, false, false, true, true, false, false, true, false, false, false], "silence_prob": [30.73, 29.75, 0.0, 0.0, 31.29, 40.79, 33.83, 34.86, 31.82, 35.28, 0.0, 32.67, 0.0, 0.0, 0.0, 30.05, 33.36, 0.0, 32.23, 30.29, 0.0, 0.0, 29.42], "audiomae_on_audioset": [[["music", 52.58], ["didgeridoo", 19.5], ["animal", 4.09]], [["music", 48.03], ["bow-wow", 14.1], ["animal", 7.33]], null, null, [["music", 42.22], ["brass instrument", 14.92], ["foghorn", 6.59]], [["music", 69.26], ["didgeridoo", 4.47], ["synthesizer", 1.93]], [["music", 20.81], ["animal", 13.1], ["speech", 11.7]], [["theremin", 28.41], ["music", 25.93], ["roar", 7.36]], [["speech", 22.77], ["music", 20.61], ["insect", 7.41]], [["music", 40.26], ["speech", 25.43], ["animal", 6.53]], null, [["music", 29.65], ["speech", 17.17], ["animal", 6.81]], null, null, null, [["music", 43.02], ["animal", 9.59], ["whack, thwack", 6.22]], [["noise", 28.86], ["music", 15.32], ["speech", 12.42]], null, [["music", 68.03], ["speech", 5.23], ["animal", 5.09]], [["music", 30.02], ["speech", 21.09], ["oink", 6.51]], null, null, [["music", 82.34], ["animal", 4.3], ["bow-wow", 2.22]]], "duration": [9.34, 8.6, -0.08, 0.11, 4.57, 3.13, 4.37, 2.66, 6.42, 9.44, 1.55, 5.52, 0.9, 0.29, 1.15, 19.94, 4.05, 0.1, 8.37, 6.11, 0.96, 0.7, 14.96]} \ No newline at end of file diff --git a/annotations_1/z2PH2-yl5Ho_filtered.json b/annotations_1/z2PH2-yl5Ho_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..829efac57e6e4a0f3ae702bcdf54001b98f4fd77 --- /dev/null +++ b/annotations_1/z2PH2-yl5Ho_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 11.72], [13.0, 12.93], [13.0, 17.46], [19.0, 82.29], [83.0, 83.44], [84.0, 92.96], [94.0, 94.68], [95.0, 100.04], [101.0, 110.44], [111.0, 110.59], [112.0, 142.99], [146.0, 154.47]], "keep_status": [false, false, true, false, false, true, false, false, true, false, false, true], "silence_prob": [31.52, 0.0, 33.34, 0.0, 0.0, 29.58, 0.0, 29.14, 29.11, 0.0, 0.0, 28.69], "audiomae_on_audioset": [[["music", 55.77], ["throbbing", 16.61], ["hum", 9.39]], null, [["music", 29.03], ["hum", 25.18], ["speech", 15.4]], null, null, [["music", 43.99], ["hum", 12.22], ["mains hum", 11.39]], null, [["speech", 54.74], ["music", 9.1], ["explosion", 6.44]], [["speech", 36.96], ["music", 17.17], ["throbbing", 8.4]], null, null, [["music", 26.19], ["mains hum", 20.25], ["hum", 14.47]]], "duration": [5.72, -0.07, 4.46, 63.29, 0.44, 8.96, 0.68, 5.04, 9.44, -0.41, 30.99, 8.47]} \ No newline at end of file diff --git a/annotations_1/z542q4dYk-0_filtered.json b/annotations_1/z542q4dYk-0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..59ef065c2f35024d14ec21f3914220279e7a042f --- /dev/null +++ b/annotations_1/z542q4dYk-0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.4], [6.0, 10.44], [13.0, 12.92], [14.0, 15.38], [19.0, 19.21], [20.0, 21.44], [22.0, 23.5], [26.0, 31.14], [34.0, 98.25], [102.0, 105.76], [108.0, 110.79], [112.0, 118.69]], "keep_status": [false, false, false, false, false, false, false, true, false, true, true, true], "silence_prob": [0.0, 66.63, 0.0, 0.0, 0.0, 0.0, 0.0, 30.33, 0.0, 37.18, 29.1, 31.29], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["hum", 24.96], ["mains hum", 17.08], ["speech", 14.6]], null, [["music", 35.72], ["throbbing", 13.26], ["hum", 9.97]], [["speech", 17.66], ["fly, housefly", 14.34], ["vehicle", 12.37]], [["music", 52.85], ["trombone", 5.53], ["musical instrument", 3.19]]], "duration": [1.4, 4.44, -0.08, 1.38, 0.21, 1.44, 1.5, 5.14, 64.25, 3.76, 2.79, 6.69]} \ No newline at end of file diff --git a/annotations_1/z5NuK6qTdBc_filtered.json b/annotations_1/z5NuK6qTdBc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0ea7e97bc806275d0f66dedf79a90ab71dfc6fae --- /dev/null +++ b/annotations_1/z5NuK6qTdBc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 37.5], [39.0, 39.26], [40.0, 51.17], [51.0, 53.32], [57.0, 61.45], [65.0, 65.62], [66.0, 77.77], [85.0, 90.09], [92.0, 92.57], [94.0, 95.49], [97.0, 99.44], [100.0, 102.39], [106.0, 107.76], [109.0, 110.0], [114.0, 116.34], [118.0, 119.38], [120.0, 124.46], [130.0, 131.23], [137.0, 138.25], [139.0, 142.33]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [38.9, 0.0, 33.12, 32.6, 31.23, 0.0, 30.91, 30.7, 0.0, 0.0, 56.93, 33.56, 0.0, 0.0, 42.08, 0.0, 29.58, 0.0, 0.0, 47.2], "audiomae_on_audioset": [[["throbbing", 30.05], ["hum", 20.38], ["speech", 14.6]], null, [["hum", 41.32], ["mains hum", 21.54], ["speech", 15.64]], [["speech", 29.81], ["hum", 29.12], ["music", 12.5]], [["throbbing", 39.38], ["music", 21.35], ["hum", 13.85]], null, [["music", 39.2], ["speech", 27.02], ["whack, thwack", 6.66]], [["speech", 59.61], ["music", 19.13], ["fart", 2.88]], null, null, null, [["speech", 68.72], ["music", 22.05], ["throbbing", 1.04]], null, null, [["music", 84.82], ["throbbing", 1.99], ["scary music", 1.87]], null, [["speech", 50.06], ["music", 21.82], ["thump, thud", 3.37]], null, null, [["music", 37.42], ["hum", 24.85], ["throbbing", 9.98]]], "duration": [9.5, 0.26, 11.17, 2.32, 4.45, 0.62, 11.77, 5.09, 0.57, 1.49, 2.44, 2.39, 1.76, 1.0, 2.34, 1.38, 4.46, 1.23, 1.25, 3.33]} \ No newline at end of file diff --git a/annotations_1/z79ikmr3JY8_filtered.json b/annotations_1/z79ikmr3JY8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..25d44ca0cfafd38b96ea37011cff94b34bf2598b --- /dev/null +++ b/annotations_1/z79ikmr3JY8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[59.0, 59.46], [61.0, 61.67], [67.0, 68.55], [71.0, 71.02], [73.0, 72.84], [75.0, 93.85], [95.0, 98.09], [100.0, 111.67], [114.0, 124.28], [126.0, 146.08], [150.0, 150.47], [151.0, 160.51], [163.0, 165.25], [169.0, 174.77], [177.0, 176.76], [177.0, 187.83], [191.0, 195.67], [196.0, 197.63], [198.0, 201.83]], "keep_status": [false, false, false, false, false, true, true, false, true, false, false, true, true, false, false, false, true, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 29.46, 29.24, 29.52, 28.89, 29.23, 0.0, 29.06, 29.45, 29.32, 0.0, 29.46, 29.81, 0.0, 30.72], "audiomae_on_audioset": [null, null, null, null, null, [["music", 39.59], ["hum", 10.4], ["sound effect", 4.95]], [["rumble", 17.8], ["mains hum", 12.06], ["hum", 8.53]], [["music", 65.25], ["didgeridoo", 8.03], ["speech", 2.22]], [["throbbing", 29.35], ["music", 24.18], ["hum", 9.48]], [["music", 34.18], ["whack, thwack", 18.78], ["smash, crash", 17.49]], null, [["music", 57.57], ["speech", 8.1], ["didgeridoo", 3.93]], [["explosion", 11.7], ["burst, pop", 10.9], ["whip", 10.08]], [["mains hum", 34.26], ["music", 26.13], ["hum", 16.59]], null, [["music", 54.99], ["buzz", 13.83], ["cacophony", 5.91]], [["fly, housefly", 26.96], ["hum", 10.9], ["mosquito", 7.81]], null, [["music", 30.47], ["hum", 14.82], ["throbbing", 8.98]]], "duration": [0.46, 0.67, 1.55, 0.02, -0.16, 18.85, 3.09, 11.67, 10.28, 20.08, 0.47, 9.51, 2.25, 5.77, -0.24, 10.83, 4.67, 1.63, 3.83]} \ No newline at end of file diff --git a/annotations_1/z7J95xF4vW8_filtered.json b/annotations_1/z7J95xF4vW8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/z7J95xF4vW8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/z7fOP7aW1P4_filtered.json b/annotations_1/z7fOP7aW1P4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..dfe1a26d52c9f3edc432be9b3adda2bc9356814e --- /dev/null +++ b/annotations_1/z7fOP7aW1P4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 5.46], [11.0, 11.97], [13.0, 13.68], [15.0, 14.79], [15.0, 19.5], [23.0, 24.31], [25.0, 26.37], [29.0, 30.75], [32.0, 33.42], [34.0, 35.61], [39.0, 42.18], [44.0, 45.5], [47.0, 49.27], [51.0, 51.75], [53.0, 54.23], [57.0, 57.97], [68.0, 71.37], [84.0, 84.33], [95.0, 94.91], [101.0, 101.65], [103.0, 103.84], [106.0, 106.95], [108.0, 109.98], [111.0, 111.81], [113.0, 115.26], [120.0, 121.51], [124.0, 124.19], [128.0, 129.34], [134.0, 135.03], [135.0, 135.31], [139.0, 139.14], [139.0, 146.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.81, 0.0, 0.0, 0.0, 99.98, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 100.0, 0.0, 0.0, 0.0, 45.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.43, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.23], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 40.47], ["guitar", 15.31], ["plucked string instrument", 8.13]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["cattle, bovinae", 30.74], ["speech", 28.42], ["moo", 15.4]]], "duration": [2.46, 0.97, 0.68, -0.21, 4.5, 1.31, 1.37, 1.75, 1.42, 1.61, 3.18, 1.5, 2.27, 0.75, 1.23, 0.97, 3.37, 0.33, -0.09, 0.65, 0.84, 0.95, 1.98, 0.81, 2.26, 1.51, 0.19, 1.34, 1.03, 0.31, 0.14, 7.4]} \ No newline at end of file diff --git a/annotations_1/z7gYF5LF-ec_filtered.json b/annotations_1/z7gYF5LF-ec_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f6aa0078a4b488b89a5583ab48e635c1f82c2f9e --- /dev/null +++ b/annotations_1/z7gYF5LF-ec_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.25], [10.0, 13.34], [15.0, 15.01], [16.0, 16.85], [22.0, 22.67], [30.0, 30.91], [38.0, 40.73], [42.0, 44.39], [46.0, 45.82], [61.0, 62.5], [78.0, 78.51], [80.0, 82.21], [92.0, 95.44], [96.0, 97.19], [98.0, 98.27], [99.0, 99.96]], "keep_status": [false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 38.04, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 79.07, 97.11, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["speech", 28.81], ["fart", 10.0], ["throbbing", 8.58]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.25, 3.34, 0.01, 0.85, 0.67, 0.91, 2.73, 2.39, -0.18, 1.5, 0.51, 2.21, 3.44, 1.19, 0.27, 0.96]} \ No newline at end of file diff --git a/annotations_1/z7siqPhc1qc_filtered.json b/annotations_1/z7siqPhc1qc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4aa1374fdfd3065b6eae91f6e55d4bddb4fdbccb --- /dev/null +++ b/annotations_1/z7siqPhc1qc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 18.03], [19.0, 28.61], [34.0, 35.06], [36.0, 36.21], [39.0, 40.15], [40.0, 42.16], [43.0, 46.41], [49.0, 52.84], [53.0, 54.92], [58.0, 60.27], [61.0, 61.65], [62.0, 63.22], [66.0, 66.09], [69.0, 71.1], [72.0, 71.85], [72.0, 72.6], [76.0, 75.86], [77.0, 77.09], [82.0, 85.09], [94.0, 95.62], [96.0, 98.76], [105.0, 106.05], [108.0, 111.15], [112.0, 112.7], [114.0, 115.38], [116.0, 117.15], [118.0, 122.49], [123.0, 124.26], [125.0, 128.01], [129.0, 129.78], [132.0, 135.6], [136.0, 145.57], [146.0, 148.85], [150.0, 149.94], [152.0, 152.74], [158.0, 162.89], [167.0, 169.45], [173.0, 175.73], [178.0, 183.05], [184.0, 188.72], [191.0, 198.32], [200.0, 203.99]], "keep_status": [false, true, false, false, false, true, true, true, false, true, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, true, true, true, true], "silence_prob": [52.8, 47.27, 0.0, 0.0, 0.0, 35.62, 42.48, 40.14, 0.0, 35.42, 0.0, 0.0, 0.0, 49.5, 0.0, 0.0, 0.0, 0.0, 37.01, 0.0, 35.41, 0.0, 49.54, 0.0, 0.0, 0.0, 69.47, 0.0, 40.84, 0.0, 64.97, 29.74, 31.05, 0.0, 0.0, 29.14, 29.47, 28.79, 28.67, 28.65, 32.64, 38.41], "audiomae_on_audioset": [null, [["speech", 36.58], ["sidetone", 17.91], ["fly, housefly", 11.36]], null, null, null, [["speech", 26.97], ["beatboxing", 9.04], ["grunt", 5.33]], [["animal", 13.47], ["livestock, farm animals, working animals", 11.85], ["moo", 11.74]], [["mains hum", 19.28], ["hum", 18.45], ["music", 9.22]], null, [["electric shaver, electric razor", 14.77], ["mains hum", 12.41], ["frog", 6.67]], null, null, null, [["throbbing", 31.7], ["hum", 26.86], ["speech", 15.63]], null, null, null, null, [["sidetone", 20.53], ["speech", 18.87], ["throbbing", 16.9]], null, [["noise", 36.85], ["frog", 7.82], ["whale vocalization", 6.34]], null, [["whale vocalization", 46.28], ["hum", 17.53], ["throbbing", 12.62]], null, null, null, null, null, [["sidetone", 43.38], ["speech", 17.03], ["whale vocalization", 12.95]], null, null, [["speech", 50.42], ["explosion", 15.32], ["music", 6.54]], [["music", 52.58], ["speech", 8.99], ["sidetone", 5.48]], null, null, [["music", 49.7], ["speech", 29.89], ["crowd", 3.29]], [["music", 73.61], ["electronic music", 4.55], ["trance music", 2.66]], [["music", 43.53], ["speech", 15.54], ["electronic music", 4.32]], [["music", 43.77], ["speech", 5.65], ["electronic music", 5.07]], [["music", 26.19], ["throbbing", 16.66], ["electronic music", 11.24]], [["music", 25.54], ["synthesizer", 13.85], ["fly, housefly", 12.43]], [["animal", 10.15], ["whale vocalization", 8.56], ["music", 5.14]]], "duration": [6.03, 9.61, 1.06, 0.21, 1.15, 2.16, 3.41, 3.84, 1.92, 2.27, 0.65, 1.22, 0.09, 2.1, -0.15, 0.6, -0.14, 0.09, 3.09, 1.62, 2.76, 1.05, 3.15, 0.7, 1.38, 1.15, 4.49, 1.26, 3.01, 0.78, 3.6, 9.57, 2.85, -0.06, 0.74, 4.89, 2.45, 2.73, 5.05, 4.72, 7.32, 3.99]} \ No newline at end of file diff --git a/annotations_1/z7tcVyV7wjw_filtered.json b/annotations_1/z7tcVyV7wjw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..26c0aac2ad3bdeb72db0e86fbe5c71315fc03e7d --- /dev/null +++ b/annotations_1/z7tcVyV7wjw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 4.73], [11.0, 11.8], [13.0, 27.23], [29.0, 29.56], [32.0, 32.39], [33.0, 33.57], [34.0, 34.38], [36.0, 37.54], [46.0, 47.28], [48.0, 48.51], [49.0, 49.17], [51.0, 50.97], [53.0, 53.52], [60.0, 60.71], [62.0, 64.91], [65.0, 66.92], [68.0, 74.17], [76.0, 76.35], [79.0, 80.23], [86.0, 86.17], [87.0, 87.69], [92.0, 93.18], [95.0, 95.39], [97.0, 96.82], [99.0, 99.2], [105.0, 105.63], [107.0, 109.07], [128.0, 129.51], [130.0, 130.98], [137.0, 138.72], [139.0, 143.85], [146.0, 154.48], [155.0, 160.64], [162.0, 162.45], [166.0, 166.85], [169.0, 178.73], [179.0, 178.88]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, true, true, false, false, false, true, false], "silence_prob": [99.92, 0.0, 98.59, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.16, 0.0, 37.98, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.64, 0.0, 0.0, 0.0, 28.85, 31.31, 37.61, 0.0, 0.0, 42.62, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 39.91], ["thunk", 9.7], ["noise", 5.74]], null, [["speech", 26.67], ["music", 26.26], ["boing", 11.59]], null, null, null, null, null, null, null, null, null, [["humming", 20.32], ["synthetic singing", 8.08], ["boing", 7.82]], null, null, null, [["theremin", 24.73], ["hum", 13.93], ["music", 8.57]], [["music", 28.39], ["speech", 11.63], ["whale vocalization", 11.35]], [["speech", 59.23], ["music", 17.66], ["groan", 4.54]], null, null, [["hum", 23.21], ["throbbing", 18.87], ["music", 11.46]], null], "duration": [3.73, 0.8, 14.23, 0.56, 0.39, 0.57, 0.38, 1.54, 1.28, 0.51, 0.17, -0.03, 0.52, 0.71, 2.91, 1.92, 6.17, 0.35, 1.23, 0.17, 0.69, 1.18, 0.39, -0.18, 0.2, 0.63, 2.07, 1.51, 0.98, 1.72, 4.85, 8.48, 5.64, 0.45, 0.85, 9.73, -0.12]} \ No newline at end of file diff --git a/annotations_1/z82GwvEQ3Vc_filtered.json b/annotations_1/z82GwvEQ3Vc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..082d61032923a5d3a134c17d6702203d833c9ff9 --- /dev/null +++ b/annotations_1/z82GwvEQ3Vc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.18], [7.0, 7.35], [11.0, 11.8], [14.0, 22.13], [27.0, 28.09], [34.0, 34.94], [36.0, 37.13], [38.0, 38.62], [41.0, 41.57], [44.0, 48.24], [49.0, 49.82], [51.0, 54.41], [56.0, 56.24], [61.0, 61.21], [62.0, 68.25], [79.0, 80.37], [81.0, 82.48], [87.0, 89.77], [94.0, 95.32], [97.0, 99.76]], "keep_status": [false, false, false, true, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 37.99, 0.0, 0.0, 0.0, 0.0, 0.0, 47.66, 0.0, 31.32, 0.0, 0.0, 30.57, 0.0, 0.0, 31.18, 0.0, 37.2], "audiomae_on_audioset": [null, null, null, [["music", 43.27], ["throbbing", 13.92], ["hum", 9.58]], null, null, null, null, null, [["speech", 32.91], ["hum", 14.55], ["music", 9.85]], null, [["music", 55.11], ["boing", 24.16], ["speech", 9.08]], null, null, [["music", 51.24], ["speech", 19.72], ["whack, thwack", 4.13]], null, null, [["music", 68.99], ["animal", 6.03], ["dog", 4.74]], null, [["speech", 58.18], ["music", 12.98], ["rumble", 6.23]]], "duration": [1.18, 0.35, 0.8, 8.13, 1.09, 0.94, 1.13, 0.62, 0.57, 4.24, 0.82, 3.41, 0.24, 0.21, 6.25, 1.37, 1.48, 2.77, 1.32, 2.76]} \ No newline at end of file diff --git a/annotations_1/z8XPccwMkKE_filtered.json b/annotations_1/z8XPccwMkKE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..50047f1acc751a0c75c3781aa960f9a8a85a324a --- /dev/null +++ b/annotations_1/z8XPccwMkKE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 13.42], [14.0, 15.09], [18.0, 29.42], [30.0, 30.79], [32.0, 38.94], [41.0, 41.23], [42.0, 48.86], [49.0, 51.6], [52.0, 64.0], [65.0, 68.45], [72.0, 76.27]], "keep_status": [false, false, true, false, true, false, false, false, true, false, false], "silence_prob": [33.38, 0.0, 29.54, 0.0, 29.29, 0.0, 29.06, 29.18, 28.78, 28.82, 28.34], "audiomae_on_audioset": [[["hum", 60.05], ["mains hum", 21.26], ["throbbing", 16.83]], null, [["music", 22.05], ["hum", 13.21], ["rumble", 9.83]], null, [["music", 37.19], ["sonar", 9.96], ["rumble", 6.82]], null, [["music", 68.97], ["sidetone", 9.09], ["musical instrument", 5.4]], [["music", 64.83], ["electronic music", 6.14], ["synthesizer", 4.8]], [["music", 43.46], ["electronic music", 14.92], ["sidetone", 3.93]], [["music", 52.2], ["throbbing", 10.04], ["synthesizer", 7.94]], [["speech", 68.38], ["explosion", 8.32], ["burst, pop", 5.79]]], "duration": [6.42, 1.09, 11.42, 0.79, 6.94, 0.23, 6.86, 2.6, 12.0, 3.45, 4.27]} \ No newline at end of file diff --git a/annotations_1/z9OUZNicTGU_filtered.json b/annotations_1/z9OUZNicTGU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3a6e7dad729f44f41ed8e957d8b85f272e536deb --- /dev/null +++ b/annotations_1/z9OUZNicTGU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[28.0, 28.53], [32.0, 32.53], [64.0, 64.18], [73.0, 73.87], [97.0, 98.2], [104.0, 105.36], [107.0, 108.9], [112.0, 112.04], [114.0, 114.34], [116.0, 115.97], [120.0, 120.09], [133.0, 133.3], [143.0, 143.97], [148.0, 148.74]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.53, 0.53, 0.18, 0.87, 1.2, 1.36, 1.9, 0.04, 0.34, -0.03, 0.09, 0.3, 0.97, 0.74]} \ No newline at end of file diff --git a/annotations_1/z9uP9znP-mA_filtered.json b/annotations_1/z9uP9znP-mA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..64bc8203fef32548ee540dcb5a8752ef40af04fd --- /dev/null +++ b/annotations_1/z9uP9znP-mA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 30.4], [35.0, 34.94], [41.0, 41.37], [49.0, 79.3], [83.0, 99.66], [100.0, 105.24], [106.0, 107.15], [108.0, 108.48], [114.0, 116.28], [117.0, 118.08], [126.0, 127.31], [129.0, 148.41], [150.0, 157.03], [159.0, 167.91], [170.0, 181.82], [183.0, 194.54], [202.0, 202.41], [204.0, 204.48]], "keep_status": [true, false, false, false, true, true, false, false, true, false, false, false, false, true, true, false, false, false], "silence_prob": [31.6, 0.0, 0.0, 0.0, 30.59, 31.56, 0.0, 0.0, 42.81, 0.0, 0.0, 31.12, 32.19, 30.9, 31.82, 31.73, 0.0, 0.0], "audiomae_on_audioset": [[["music", 29.51], ["hum", 7.43], ["foghorn", 5.65]], null, null, null, [["music", 48.36], ["throbbing", 12.57], ["hum", 7.99]], [["music", 48.38], ["speech", 12.31], ["buzz", 2.78]], null, null, [["music", 26.79], ["synthesizer", 13.26], ["speech", 8.44]], null, null, [["music", 76.68], ["synthesizer", 4.59], ["theremin", 2.35]], [["music", 72.29], ["throbbing", 3.33], ["cacophony", 2.38]], [["music", 57.16], ["musical instrument", 5.96], ["theremin", 2.91]], [["music", 29.41], ["cowbell", 9.02], ["livestock, farm animals, working animals", 6.14]], [["music", 37.5], ["speech", 20.71], ["buzz", 14.09]], null, null], "duration": [26.4, -0.06, 0.37, 30.3, 16.66, 5.24, 1.15, 0.48, 2.28, 1.08, 1.31, 19.41, 7.03, 8.91, 11.82, 11.54, 0.41, 0.48]} \ No newline at end of file diff --git a/annotations_1/zBLsO7BKVHw_filtered.json b/annotations_1/zBLsO7BKVHw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cfd4cba73f5060795d08bbb03a3b53184bb940bb --- /dev/null +++ b/annotations_1/zBLsO7BKVHw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 9.22], [13.0, 14.57], [15.0, 15.65], [18.0, 110.56], [112.0, 112.31], [117.0, 140.83], [142.0, 150.57], [153.0, 156.52]], "keep_status": [true, false, false, false, false, false, false, false], "silence_prob": [46.36, 0.0, 0.0, 0.0, 0.0, 31.12, 44.96, 81.0], "audiomae_on_audioset": [[["speech", 23.79], ["mains hum", 12.02], ["hum", 10.03]], null, null, null, null, [["music", 77.14], ["trombone", 5.86], ["brass instrument", 4.71]], [["speech", 73.31], ["sidetone", 4.02], ["busy signal", 3.99]], null], "duration": [3.22, 1.57, 0.65, 92.56, 0.31, 23.83, 8.57, 3.52]} \ No newline at end of file diff --git a/annotations_1/zDEPob22tHs_filtered.json b/annotations_1/zDEPob22tHs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9c6d1f8645b06d20f49167e8ef2e24d67ae90c6 --- /dev/null +++ b/annotations_1/zDEPob22tHs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.53], [5.0, 5.58], [7.0, 7.59], [13.0, 14.18], [16.0, 16.9], [22.0, 23.09], [24.0, 25.19], [31.0, 32.78], [34.0, 34.26], [34.0, 35.48], [39.0, 41.67], [43.0, 55.26], [56.0, 57.18], [57.0, 58.89], [60.0, 60.24], [64.0, 64.94], [67.0, 69.48], [72.0, 72.55], [81.0, 81.48], [84.0, 85.68], [87.0, 89.23], [91.0, 92.04], [95.0, 107.74], [108.0, 109.65], [118.0, 119.91], [121.0, 125.29], [126.0, 128.41], [129.0, 131.53], [132.0, 133.05], [135.0, 135.65], [142.0, 142.4]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.96, 62.68, 0.0, 0.0, 0.0, 0.0, 55.18, 0.0, 0.0, 0.0, 50.16, 0.0, 79.76, 0.0, 0.0, 54.1, 43.53, 72.6, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["sidetone", 50.08], ["speech", 19.88], ["hum", 8.1]], null, null, null, null], "duration": [1.53, 0.58, 0.59, 1.18, 0.9, 1.09, 1.19, 1.78, 0.26, 1.48, 2.67, 12.26, 1.18, 1.89, 0.24, 0.94, 2.48, 0.55, 0.48, 1.68, 2.23, 1.04, 12.74, 1.65, 1.91, 4.29, 2.41, 2.53, 1.05, 0.65, 0.4]} \ No newline at end of file diff --git a/annotations_1/zDQHwzF1n4U_filtered.json b/annotations_1/zDQHwzF1n4U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ce84ab7eb5a285e1371b21b4da857a5cb30bda34 --- /dev/null +++ b/annotations_1/zDQHwzF1n4U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[21.0, 22.55], [26.0, 31.48], [32.0, 34.15], [38.0, 40.19], [44.0, 45.74], [50.0, 88.4], [93.0, 103.45], [119.0, 120.72], [130.0, 132.27], [141.0, 171.41]], "keep_status": [false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 30.91, 31.05, 30.88, 0.0, 0.0, 30.81, 0.0, 31.26, 0.0], "audiomae_on_audioset": [null, [["music", 71.34], ["rock and roll", 3.9], ["roll", 3.74]], [["music", 53.76], ["funny music", 2.99], ["sampler", 2.5]], [["music", 62.65], ["throbbing", 8.45], ["musical instrument", 2.21]], null, null, [["music", 66.2], ["roll", 7.77], ["rock and roll", 7.13]], null, [["music", 63.67], ["electronic music", 4.66], ["musical instrument", 3.48]], null], "duration": [1.55, 5.48, 2.15, 2.19, 1.74, 38.4, 10.45, 1.72, 2.27, 30.41]} \ No newline at end of file diff --git a/annotations_1/zElzcOQWLLo_filtered.json b/annotations_1/zElzcOQWLLo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..411a2001c92a69e99ee913ca4098c4a9a48c180a --- /dev/null +++ b/annotations_1/zElzcOQWLLo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 5.49], [8.0, 11.6], [12.0, 37.02], [40.0, 41.64], [43.0, 54.41], [55.0, 55.95], [56.0, 57.38], [59.0, 59.95], [61.0, 69.87], [74.0, 79.3], [83.0, 89.07], [90.0, 95.99], [97.0, 97.19], [100.0, 101.09], [102.0, 102.68], [104.0, 105.41], [107.0, 110.08], [112.0, 113.17], [115.0, 118.29], [124.0, 124.33], [126.0, 130.76], [134.0, 135.72], [138.0, 138.75], [141.0, 142.8], [150.0, 152.32], [158.0, 158.77], [160.0, 160.29], [167.0, 169.32], [176.0, 175.95]], "keep_status": [false, true, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 32.32, 42.72, 0.0, 77.87, 0.0, 0.0, 0.0, 99.48, 58.3, 48.06, 70.72, 0.0, 0.0, 0.0, 0.0, 65.32, 0.0, 97.33, 0.0, 99.59, 0.0, 0.0, 0.0, 99.99, 0.0, 0.0, 99.99, 0.0], "audiomae_on_audioset": [null, [["speech", 26.24], ["music", 24.93], ["electric shaver, electric razor", 9.62]], [["music", 24.09], ["hum", 20.51], ["coin (dropping)", 18.69]], null, null, null, null, null, null, null, [["hiccup", 16.03], ["fart", 13.44], ["laughter", 11.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.49, 3.6, 25.02, 1.64, 11.41, 0.95, 1.38, 0.95, 8.87, 5.3, 6.07, 5.99, 0.19, 1.09, 0.68, 1.41, 3.08, 1.17, 3.29, 0.33, 4.76, 1.72, 0.75, 1.8, 2.32, 0.77, 0.29, 2.32, -0.05]} \ No newline at end of file diff --git a/annotations_1/zErzJxN84iw_filtered.json b/annotations_1/zErzJxN84iw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1a3ffb1a888222df97a72fcf562fb661f28d82d2 --- /dev/null +++ b/annotations_1/zErzJxN84iw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[50.0, 56.84], [59.0, 59.93], [61.0, 61.21], [62.0, 64.37], [70.0, 71.52]], "keep_status": [false, false, false, true, false], "silence_prob": [34.25, 0.0, 0.0, 30.61, 0.0], "audiomae_on_audioset": [[["music", 56.88], ["throbbing", 28.33], ["hum", 2.53]], null, null, [["whip", 25.48], ["music", 17.23], ["speech", 15.48]], null], "duration": [6.84, 0.93, 0.21, 2.37, 1.52]} \ No newline at end of file diff --git a/annotations_1/zFDNg1Swx0s_filtered.json b/annotations_1/zFDNg1Swx0s_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..338b68d109dbba38c0aadf9b963e517f5fce1602 --- /dev/null +++ b/annotations_1/zFDNg1Swx0s_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[23.0, 27.82], [32.0, 49.6], [53.0, 75.02], [75.0, 81.18], [82.0, 83.07], [87.0, 90.48], [93.0, 98.02], [99.0, 103.0], [108.0, 112.11], [114.0, 116.92], [120.0, 125.63], [126.0, 133.3], [135.0, 135.85], [136.0, 137.83], [138.0, 142.37], [143.0, 147.63]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [91.98, 97.22, 49.82, 96.89, 0.0, 99.91, 99.36, 86.45, 99.65, 98.8, 99.65, 99.21, 0.0, 0.0, 46.86, 70.72], "audiomae_on_audioset": [null, null, [["speech", 29.49], ["sidetone", 27.88], ["radio", 12.3]], null, null, null, null, null, null, null, null, null, null, null, [["sine wave", 47.89], ["hum", 11.97], ["chirp tone", 11.33]], null], "duration": [4.82, 17.6, 22.02, 6.18, 1.07, 3.48, 5.02, 4.0, 4.11, 2.92, 5.63, 7.3, 0.85, 1.83, 4.37, 4.63]} \ No newline at end of file diff --git a/annotations_1/zFIHYJAp2rc_filtered.json b/annotations_1/zFIHYJAp2rc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4339f857c7b2743586817be26e99b458a19d6073 --- /dev/null +++ b/annotations_1/zFIHYJAp2rc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 55.59], [56.0, 57.33], [58.0, 63.17], [64.0, 65.01], [66.0, 66.45], [69.0, 71.52], [73.0, 77.85], [79.0, 84.87], [85.0, 87.56], [88.0, 104.94], [111.0, 152.95], [154.0, 156.1], [157.0, 158.31], [159.0, 164.83], [166.0, 166.94]], "keep_status": [true, false, true, false, false, true, false, false, false, false, false, false, false, false, false], "silence_prob": [40.43, 0.0, 46.68, 0.0, 0.0, 39.85, 38.83, 59.59, 71.43, 43.48, 0.0, 59.33, 0.0, 49.27, 0.0], "audiomae_on_audioset": [[["mains hum", 38.19], ["hum", 16.77], ["speech", 10.65]], null, [["speech", 45.04], ["sheep", 15.81], ["goat", 7.38]], null, null, [["speech", 21.91], ["music", 10.66], ["boing", 8.73]], [["whale vocalization", 40.98], ["speech", 30.26], ["music", 3.77]], null, null, [["electric shaver, electric razor", 42.05], ["speech", 26.52], ["hum", 8.82]], null, null, null, [["music", 52.34], ["hum", 14.2], ["throbbing", 9.71]], null], "duration": [25.59, 1.33, 5.17, 1.01, 0.45, 2.52, 4.85, 5.87, 2.56, 16.94, 41.95, 2.1, 1.31, 5.83, 0.94]} \ No newline at end of file diff --git a/annotations_1/zFxkzMB3qCE_filtered.json b/annotations_1/zFxkzMB3qCE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e861972a6a30fd23d22e1801a3bb357e9399efc5 --- /dev/null +++ b/annotations_1/zFxkzMB3qCE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.5], [6.0, 6.54], [8.0, 8.51], [12.0, 12.88], [17.0, 17.54], [20.0, 20.12], [23.0, 23.25], [27.0, 27.68], [31.0, 33.02], [34.0, 34.77], [41.0, 41.62], [43.0, 44.22], [47.0, 49.01], [52.0, 52.73], [55.0, 56.02], [57.0, 58.77]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.29, 0.0, 0.0, 0.0, 94.95, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.5, 0.54, 0.51, 0.88, 0.54, 0.12, 0.25, 0.68, 2.02, 0.77, 0.62, 1.22, 2.01, 0.73, 1.02, 1.77]} \ No newline at end of file diff --git a/annotations_1/zGXxYW_Zisk_filtered.json b/annotations_1/zGXxYW_Zisk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/zGXxYW_Zisk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/zH80pWTYSLg_filtered.json b/annotations_1/zH80pWTYSLg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..49af11371b5b72432368a167b3e937f3e54a4bd8 --- /dev/null +++ b/annotations_1/zH80pWTYSLg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 29.39], [37.0, 43.12], [46.0, 47.48], [51.0, 53.42], [57.0, 57.64], [59.0, 59.34], [61.0, 63.85], [72.0, 72.06], [73.0, 77.25], [77.0, 81.58], [83.0, 85.09], [88.0, 88.33], [90.0, 91.5], [92.0, 93.63], [97.0, 97.63], [100.0, 101.61], [103.0, 103.49], [105.0, 107.25], [108.0, 108.72], [110.0, 115.84], [117.0, 117.95], [123.0, 124.43], [126.0, 126.94], [128.0, 131.21], [133.0, 134.4], [135.0, 135.75], [136.0, 139.45]], "keep_status": [true, true, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [29.84, 33.58, 0.0, 54.63, 0.0, 0.0, 55.31, 0.0, 34.42, 40.77, 43.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.3, 0.0, 54.56, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 54.23], "audiomae_on_audioset": [[["music", 48.24], ["musical instrument", 14.27], ["effects unit", 6.69]], [["music", 25.49], ["theremin", 16.24], ["speech", 6.5]], null, null, null, null, null, null, [["speech", 73.85], ["sidetone", 9.47], ["radio", 5.46]], [["music", 19.46], ["speech", 16.5], ["noise", 9.71]], [["music", 48.36], ["sidetone", 15.0], ["speech", 4.92]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [24.39, 6.12, 1.48, 2.42, 0.64, 0.34, 2.85, 0.06, 4.25, 4.58, 2.09, 0.33, 1.5, 1.63, 0.63, 1.61, 0.49, 2.25, 0.72, 5.84, 0.95, 1.43, 0.94, 3.21, 1.4, 0.75, 3.45]} \ No newline at end of file diff --git a/annotations_1/zHqM-oKCPBY_filtered.json b/annotations_1/zHqM-oKCPBY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..0945e4c7997239679b4c1a539081f7fdaa1700ee --- /dev/null +++ b/annotations_1/zHqM-oKCPBY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[15.0, 52.76], [54.0, 100.77], [101.0, 101.9], [104.0, 124.07], [126.0, 128.46], [130.0, 129.78]], "keep_status": [false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 30.52, 32.55, 0.0], "audiomae_on_audioset": [null, null, null, [["music", 69.69], ["throbbing", 9.87], ["hum", 3.58]], [["music", 47.47], ["boing", 16.56], ["smash, crash", 4.12]], null], "duration": [37.76, 46.77, 0.9, 20.07, 2.46, -0.22]} \ No newline at end of file diff --git a/annotations_1/zHwUR2EqUO0_filtered.json b/annotations_1/zHwUR2EqUO0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a3738b0b0f171477118e03a46c0768520e971e3b --- /dev/null +++ b/annotations_1/zHwUR2EqUO0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.38], [8.0, 8.5], [9.0, 9.17], [9.0, 9.91], [10.0, 10.3], [13.0, 13.88], [16.0, 22.06], [22.0, 30.52], [32.0, 39.46], [42.0, 42.42], [43.0, 52.59], [58.0, 62.28], [62.0, 62.46], [63.0, 64.76], [66.0, 77.04], [78.0, 85.7], [89.0, 111.79], [116.0, 122.28], [123.0, 124.78], [137.0, 144.95], [147.0, 176.66], [179.0, 192.01], [194.0, 204.16], [206.0, 206.25], [208.0, 208.11]], "keep_status": [false, false, false, false, false, false, false, true, false, false, true, true, false, false, false, false, false, false, false, true, false, true, true, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.41, 39.33, 52.92, 0.0, 31.14, 35.77, 0.0, 0.0, 31.97, 32.44, 31.17, 31.55, 0.0, 30.38, 30.58, 30.82, 31.09, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["music", 40.85], ["speech", 17.88], ["breaking", 4.23]], null, null, [["music", 20.55], ["speech", 12.65], ["whack, thwack", 9.36]], [["music", 41.47], ["speech", 14.33], ["throbbing", 13.64]], null, null, [["music", 44.42], ["speech", 25.48], ["whack, thwack", 5.61]], [["music", 67.52], ["throbbing", 13.74], ["hum", 3.45]], [["music", 68.19], ["didgeridoo", 6.91], ["speech", 2.96]], [["fly, housefly", 46.75], ["insect", 21.77], ["mosquito", 11.52]], null, [["music", 29.82], ["throbbing", 25.96], ["hum", 8.58]], [["speech", 43.23], ["music", 37.97], ["throbbing", 7.26]], [["livestock, farm animals, working animals", 31.01], ["cattle, bovinae", 15.52], ["music", 11.99]], [["music", 41.39], ["theremin", 18.93], ["noise", 6.04]], null, null], "duration": [0.38, 0.5, 0.17, 0.91, 0.3, 0.88, 6.06, 8.52, 7.46, 0.42, 9.59, 4.28, 0.46, 1.76, 11.04, 7.7, 22.79, 6.28, 1.78, 7.95, 29.66, 13.01, 10.16, 0.25, 0.11]} \ No newline at end of file diff --git a/annotations_1/zIKq7DqdZa4_filtered.json b/annotations_1/zIKq7DqdZa4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..56d5a5c8044fc9f55790d0e625dba72b5fc4aacf --- /dev/null +++ b/annotations_1/zIKq7DqdZa4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.72], [6.0, 6.99], [7.0, 12.51], [13.0, 15.35], [18.0, 20.73], [22.0, 24.17], [29.0, 28.97], [30.0, 32.81], [34.0, 34.43], [35.0, 47.39], [49.0, 52.07], [54.0, 81.9], [88.0, 95.81], [97.0, 96.85], [102.0, 118.76], [124.0, 124.7], [127.0, 137.69], [139.0, 139.06], [139.0, 140.43], [141.0, 142.03], [143.0, 146.06], [147.0, 147.6], [148.0, 149.07], [150.0, 152.05], [154.0, 155.51], [157.0, 157.49], [162.0, 161.72], [166.0, 166.41], [167.0, 168.39], [170.0, 170.67], [173.0, 173.57]], "keep_status": [false, false, true, true, true, false, false, false, false, false, false, false, true, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 34.68, 47.43, 45.02, 77.87, 0.0, 31.25, 0.0, 70.16, 55.25, 33.27, 30.87, 0.0, 39.33, 0.0, 46.97, 0.0, 0.0, 0.0, 52.86, 0.0, 0.0, 56.4, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 32.36], ["fly, housefly", 16.68], ["insect", 11.34]], [["speech", 42.96], ["hum", 9.89], ["sidetone", 6.3]], [["hum", 26.59], ["mains hum", 24.18], ["speech", 14.37]], null, null, [["speech", 38.03], ["sidetone", 22.64], ["music", 11.39]], null, null, null, [["hum", 39.62], ["throbbing", 20.18], ["mains hum", 13.71]], [["throbbing", 22.4], ["hum", 21.67], ["speech", 19.41]], null, [["fly, housefly", 14.05], ["insect", 13.99], ["hum", 8.17]], null, [["music", 56.23], ["hum", 15.27], ["theremin", 6.64]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.72, 0.99, 5.51, 2.35, 2.73, 2.17, -0.03, 2.81, 0.43, 12.39, 3.07, 27.9, 7.81, -0.15, 16.76, 0.7, 10.69, 0.06, 1.43, 1.03, 3.06, 0.6, 1.07, 2.05, 1.51, 0.49, -0.28, 0.41, 1.39, 0.67, 0.57]} \ No newline at end of file diff --git a/annotations_1/zJ3hgBFfQy0_filtered.json b/annotations_1/zJ3hgBFfQy0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..17cd53bcad8ad50501c6fe4bb4599b13be6b2fd1 --- /dev/null +++ b/annotations_1/zJ3hgBFfQy0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.75], [6.0, 6.62], [8.0, 11.3], [12.0, 13.86], [16.0, 18.23], [19.0, 21.93], [22.0, 24.61], [25.0, 26.22], [27.0, 28.83], [30.0, 31.5], [35.0, 36.59], [38.0, 39.16], [41.0, 42.21], [45.0, 45.57], [48.0, 49.89], [51.0, 52.84]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 100.0, 0.0, 100.0, 91.47, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.75, 0.62, 3.3, 1.86, 2.23, 2.93, 2.61, 1.22, 1.83, 1.5, 1.59, 1.16, 1.21, 0.57, 1.89, 1.84]} \ No newline at end of file diff --git a/annotations_1/zJMCctR8ivc_filtered.json b/annotations_1/zJMCctR8ivc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..983e93f2615eba03a530f29241243e87315af083 --- /dev/null +++ b/annotations_1/zJMCctR8ivc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.5], [8.0, 7.8], [12.0, 12.11], [24.0, 25.39], [27.0, 27.36], [28.0, 29.42], [33.0, 33.59], [36.0, 36.88], [38.0, 38.21], [46.0, 46.89], [49.0, 49.6], [50.0, 50.52], [54.0, 53.74], [56.0, 56.32], [58.0, 70.26], [71.0, 71.12], [72.0, 72.33], [73.0, 73.58], [75.0, 76.23], [78.0, 78.24], [82.0, 83.02], [84.0, 85.38], [87.0, 87.62], [88.0, 88.4], [89.0, 90.29], [95.0, 95.17], [96.0, 96.09], [98.0, 99.22], [103.0, 103.65], [105.0, 105.31], [107.0, 107.22], [109.0, 110.3], [111.0, 112.63], [114.0, 114.07], [116.0, 121.36], [126.0, 126.52], [130.0, 134.87], [136.0, 137.17], [138.0, 137.98], [140.0, 142.79], [146.0, 148.05]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.17, 0.0, 31.59, 0.0, 0.0, 44.15, 53.22], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 16.5], ["speech", 16.37], ["theremin", 9.76]], null, null, [["speech", 31.7], ["throbbing", 8.03], ["hum", 7.66]], null], "duration": [0.5, -0.2, 0.11, 1.39, 0.36, 1.42, 0.59, 0.88, 0.21, 0.89, 0.6, 0.52, -0.26, 0.32, 12.26, 0.12, 0.33, 0.58, 1.23, 0.24, 1.02, 1.38, 0.62, 0.4, 1.29, 0.17, 0.09, 1.22, 0.65, 0.31, 0.22, 1.3, 1.63, 0.07, 5.36, 0.52, 4.87, 1.17, -0.02, 2.79, 2.05]} \ No newline at end of file diff --git a/annotations_1/zKATih1nvVo_filtered.json b/annotations_1/zKATih1nvVo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5015d8a8bceddba19eff344db80c63f65ca5cbce --- /dev/null +++ b/annotations_1/zKATih1nvVo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 13.81], [14.0, 18.5], [20.0, 22.6], [31.0, 38.99], [40.0, 39.85], [45.0, 45.03], [45.0, 56.86], [62.0, 70.31], [73.0, 73.01], [73.0, 80.33], [81.0, 81.4], [83.0, 83.37]], "keep_status": [true, true, true, true, false, false, false, false, false, false, false, false], "silence_prob": [44.84, 46.5, 40.92, 42.88, 0.0, 0.0, 34.32, 49.5, 0.0, 43.87, 0.0, 0.0], "audiomae_on_audioset": [[["speech", 44.09], ["outside, urban or manmade", 11.69], ["run", 7.63]], [["fly, housefly", 19.26], ["whale vocalization", 12.12], ["mosquito", 11.35]], [["speech", 24.5], ["fly, housefly", 20.21], ["mosquito", 14.79]], [["speech", 22.63], ["moo", 14.99], ["whale vocalization", 11.0]], null, null, [["speech", 81.0], ["whack, thwack", 2.93], ["fart", 2.34]], [["speech", 75.71], ["beatboxing", 9.07], ["music", 2.94]], null, [["speech", 92.34], ["fart", 1.53], ["inside, small room", 0.48]], null, null], "duration": [3.81, 4.5, 2.6, 7.99, -0.15, 0.03, 11.86, 8.31, 0.01, 7.33, 0.4, 0.37]} \ No newline at end of file diff --git a/annotations_1/zLkNUykewic_filtered.json b/annotations_1/zLkNUykewic_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..fec6189de497209f5b547a3659cf93c3ae86657f --- /dev/null +++ b/annotations_1/zLkNUykewic_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 5.83], [9.0, 9.1], [10.0, 10.59], [12.0, 12.78], [16.0, 16.53], [17.0, 62.8], [65.0, 86.61]], "keep_status": [false, false, false, false, false, false, false], "silence_prob": [37.55, 0.0, 0.0, 0.0, 0.0, 0.0, 30.55], "audiomae_on_audioset": [[["shofar", 54.0], ["wind instrument, woodwind instrument", 15.45], ["music", 8.17]], null, null, null, null, null, [["mains hum", 38.14], ["hum", 30.25], ["speech", 7.6]]], "duration": [3.83, 0.1, 0.59, 0.78, 0.53, 45.8, 21.61]} \ No newline at end of file diff --git a/annotations_1/zNMpSVorNr0_filtered.json b/annotations_1/zNMpSVorNr0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5dbe22abfc0e655ce220a0bce21251e76ef3b04d --- /dev/null +++ b/annotations_1/zNMpSVorNr0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 8.26], [10.0, 11.15], [25.0, 25.41], [26.0, 26.11], [29.0, 53.77], [60.0, 61.84], [65.0, 66.18], [68.0, 69.9], [72.0, 73.75], [76.0, 77.04], [78.0, 80.47], [86.0, 86.81], [91.0, 94.0], [97.0, 101.76], [107.0, 108.77], [109.0, 110.57], [118.0, 117.9], [119.0, 119.67], [120.0, 130.08], [131.0, 137.17], [138.0, 138.03], [140.0, 141.78], [145.0, 146.53], [148.0, 149.86], [152.0, 159.83]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 41.09, 0.0, 0.0, 0.0, 0.0, 0.0, 47.82, 0.0, 43.53, 41.16, 0.0, 0.0, 0.0, 0.0, 40.17, 49.45, 0.0, 0.0, 0.0, 0.0, 39.74], "audiomae_on_audioset": [null, null, null, null, [["hum", 22.28], ["speech", 20.87], ["mains hum", 12.24]], null, null, null, null, null, [["fart", 60.59], ["speech", 13.99], ["burping, eructation", 3.17]], null, [["throbbing", 21.16], ["hum", 18.13], ["heart sounds, heartbeat", 9.99]], [["speech", 64.38], ["noise", 5.99], ["hum", 5.56]], null, null, null, null, [["speech", 66.93], ["burping, eructation", 5.8], ["animal", 2.46]], [["animal", 15.32], ["fly, housefly", 11.43], ["speech", 6.81]], null, null, null, null, [["speech", 68.32], ["hum", 5.9], ["sheep", 4.2]]], "duration": [1.26, 1.15, 0.41, 0.11, 24.77, 1.84, 1.18, 1.9, 1.75, 1.04, 2.47, 0.81, 3.0, 4.76, 1.77, 1.57, -0.1, 0.67, 10.08, 6.17, 0.03, 1.78, 1.53, 1.86, 7.83]} \ No newline at end of file diff --git a/annotations_1/zNSDAaeIh7U_filtered.json b/annotations_1/zNSDAaeIh7U_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a2d38e6f05171a2869167bea5c950f71ea2cc44c --- /dev/null +++ b/annotations_1/zNSDAaeIh7U_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 9.39], [11.0, 13.41], [15.0, 28.54], [31.0, 36.04], [42.0, 43.97], [46.0, 48.47], [50.0, 50.43], [53.0, 58.75], [63.0, 97.44], [101.0, 113.34], [114.0, 162.68]], "keep_status": [true, false, true, true, false, false, false, true, false, true, false], "silence_prob": [32.16, 84.25, 31.04, 33.56, 0.0, 67.76, 0.0, 29.25, 0.0, 29.74, 0.0], "audiomae_on_audioset": [[["music", 25.02], ["thunk", 17.56], ["theremin", 9.72]], null, [["buzz", 27.19], ["mains hum", 24.27], ["hum", 11.81]], [["hum", 15.13], ["mains hum", 9.68], ["whale vocalization", 9.32]], null, null, null, [["vehicle", 44.55], ["car", 12.81], ["race car, auto racing", 9.12]], null, [["hum", 27.27], ["music", 24.2], ["mains hum", 9.69]], null], "duration": [8.39, 2.41, 13.54, 5.04, 1.97, 2.47, 0.43, 5.75, 34.44, 12.34, 48.68]} \ No newline at end of file diff --git a/annotations_1/zNT4XSI1doU_filtered.json b/annotations_1/zNT4XSI1doU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/zNT4XSI1doU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/zOHL9JZPELk_filtered.json b/annotations_1/zOHL9JZPELk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a9b9176144dce18ad70b95fb69b25b7a466af10c --- /dev/null +++ b/annotations_1/zOHL9JZPELk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.55], [12.0, 12.11], [14.0, 34.69], [45.0, 47.24], [52.0, 53.27], [62.0, 62.33], [64.0, 63.9], [92.0, 92.26], [95.0, 95.77], [100.0, 100.8], [106.0, 106.15], [112.0, 113.05], [120.0, 120.23], [130.0, 130.77], [134.0, 135.68], [136.0, 136.12], [147.0, 148.78], [150.0, 150.36], [152.0, 152.69], [155.0, 156.12], [160.0, 160.62], [165.0, 175.73]], "keep_status": [false, false, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 43.28, 37.36, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 55.04], "audiomae_on_audioset": [null, null, [["mains hum", 25.93], ["hum", 23.43], ["noise", 15.49]], [["music", 16.81], ["synthesizer", 12.15], ["musical instrument", 7.82]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.55, 0.11, 20.69, 2.24, 1.27, 0.33, -0.1, 0.26, 0.77, 0.8, 0.15, 1.05, 0.23, 0.77, 1.68, 0.12, 1.78, 0.36, 0.69, 1.12, 0.62, 10.73]} \ No newline at end of file diff --git a/annotations_1/zOvMmwnFVa0_filtered.json b/annotations_1/zOvMmwnFVa0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2b0ca65bcbaa7f2679e20519b9202d48b8f998d6 --- /dev/null +++ b/annotations_1/zOvMmwnFVa0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[16.0, 19.4], [20.0, 49.71], [51.0, 82.17], [84.0, 85.53], [86.0, 92.87], [93.0, 103.45], [108.0, 107.91], [109.0, 109.48], [111.0, 111.43], [114.0, 115.13], [121.0, 121.34], [122.0, 122.32], [125.0, 125.0], [130.0, 130.0], [136.0, 137.12], [139.0, 143.45], [145.0, 145.89]], "keep_status": [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [30.25, 28.94, 0.0, 0.0, 29.74, 30.82, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0], "audiomae_on_audioset": [[["music", 44.17], ["whale vocalization", 14.22], ["theremin", 10.12]], [["music", 33.25], ["buzz", 24.63], ["hum", 5.69]], null, null, [["speech", 37.29], ["music", 36.01], ["fart", 2.72]], [["speech", 42.29], ["music", 25.77], ["noise", 7.11]], null, null, null, null, null, null, null, null, null, [["throbbing", 42.38], ["music", 23.96], ["hum", 22.76]], null], "duration": [3.4, 29.71, 31.17, 1.53, 6.87, 10.45, -0.09, 0.48, 0.43, 1.13, 0.34, 0.32, 0.0, 0.0, 1.12, 4.45, 0.89]} \ No newline at end of file diff --git a/annotations_1/zPuVP5U-xag_filtered.json b/annotations_1/zPuVP5U-xag_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..da8908822defb0c47ac6b570a0753a787dbc0aa9 --- /dev/null +++ b/annotations_1/zPuVP5U-xag_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[11.0, 10.61], [12.0, 12.26], [19.0, 19.26], [35.0, 37.66], [38.0, 39.09], [49.0, 49.38], [52.0, 52.62], [58.0, 58.08], [68.0, 68.22], [73.0, 73.67], [75.0, 76.62], [78.0, 80.35], [82.0, 83.88], [85.0, 87.35], [91.0, 91.88], [93.0, 95.03]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 86.09, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 97.11, 0.0, 78.04, 0.0, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.39, 0.26, 0.26, 2.66, 1.09, 0.38, 0.62, 0.08, 0.22, 0.67, 1.62, 2.35, 1.88, 2.35, 0.88, 2.03]} \ No newline at end of file diff --git a/annotations_1/zQf0jUhqJYw_filtered.json b/annotations_1/zQf0jUhqJYw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..70f65fe97ec1c2a5f4a48b2bbb2455de0ef7d7dc --- /dev/null +++ b/annotations_1/zQf0jUhqJYw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 15.72], [20.0, 23.5], [24.0, 23.53], [24.0, 23.57], [24.0, 23.6], [28.0, 35.99], [43.0, 44.12], [47.0, 59.49], [61.0, 82.95], [85.0, 85.48], [88.0, 99.5], [100.0, 100.74], [102.0, 144.02], [147.0, 154.53], [158.0, 186.92], [188.0, 193.75], [197.0, 210.69], [214.0, 222.99], [225.0, 245.94], [247.0, 247.21], [248.0, 250.26], [253.0, 262.67]], "keep_status": [false, true, false, false, false, true, false, false, true, false, false, false, false, true, false, true, false, false, true, false, true, true], "silence_prob": [36.06, 44.26, 0.0, 0.0, 0.0, 34.11, 0.0, 31.74, 30.17, 0.0, 30.94, 0.0, 0.0, 30.43, 30.61, 34.39, 32.03, 30.63, 30.76, 0.0, 45.11, 36.06], "audiomae_on_audioset": [[["hum", 48.22], ["throbbing", 13.86], ["mains hum", 12.63]], [["hum", 33.78], ["mains hum", 16.03], ["fly, housefly", 8.01]], null, null, null, [["music", 34.63], ["speech", 16.1], ["buzz", 10.54]], null, [["speech", 56.2], ["music", 10.54], ["buzz", 10.24]], [["music", 24.46], ["livestock, farm animals, working animals", 13.18], ["cattle, bovinae", 11.53]], null, [["music", 55.85], ["speech", 22.2], ["foghorn", 2.36]], null, null, [["hum", 30.22], ["mains hum", 25.92], ["music", 8.77]], [["speech", 60.18], ["vehicle", 6.87], ["boat, water vehicle", 5.11]], [["boing", 30.72], ["music", 22.72], ["noise", 7.13]], [["speech", 39.87], ["music", 39.14], ["vehicle", 2.8]], [["music", 67.17], ["boing", 5.57], ["didgeridoo", 3.6]], [["music", 33.55], ["speech", 10.81], ["livestock, farm animals, working animals", 9.73]], null, [["music", 37.62], ["crushing", 9.53], ["singing bowl", 8.79]], [["music", 25.33], ["hum", 18.58], ["buzz", 14.11]]], "duration": [7.72, 3.5, -0.47, -0.43, -0.4, 7.99, 1.12, 12.49, 21.95, 0.48, 11.5, 0.74, 42.02, 7.53, 28.92, 5.75, 13.69, 8.99, 20.94, 0.21, 2.26, 9.67]} \ No newline at end of file diff --git a/annotations_1/zS41k2xmQUI_filtered.json b/annotations_1/zS41k2xmQUI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8bdd6fcf5882590cf8f5433940cfb8eea119b2cf --- /dev/null +++ b/annotations_1/zS41k2xmQUI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[56.0, 55.95], [65.0, 78.81], [79.0, 80.57], [81.0, 107.82], [111.0, 113.16]], "keep_status": [false, true, false, true, false], "silence_prob": [0.0, 28.8, 0.0, 28.39, 33.1], "audiomae_on_audioset": [null, [["crow", 13.51], ["caw", 9.19], ["sheep", 6.46]], null, [["speech", 28.13], ["animal", 11.31], ["sine wave", 5.19]], [["speech", 71.74], ["vehicle", 3.04], ["fart", 2.51]]], "duration": [-0.05, 13.81, 1.57, 26.82, 2.16]} \ No newline at end of file diff --git a/annotations_1/zSh-Wy2vvHY_filtered.json b/annotations_1/zSh-Wy2vvHY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e4d260d54848d63ba74fe3ff5072612011509562 --- /dev/null +++ b/annotations_1/zSh-Wy2vvHY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 9.73], [11.0, 12.02], [14.0, 16.7], [21.0, 24.22], [25.0, 26.77], [32.0, 34.86], [37.0, 37.88], [58.0, 65.37], [70.0, 71.27], [77.0, 79.76], [82.0, 83.52], [86.0, 92.89], [94.0, 96.21], [104.0, 107.4], [108.0, 109.56], [110.0, 111.33], [113.0, 114.07], [118.0, 120.06], [122.0, 125.37]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 56.03, 51.82, 0.0, 55.31, 0.0, 31.27, 0.0, 51.99, 0.0, 47.86, 52.22, 58.72, 0.0, 0.0, 0.0, 60.79, 50.61], "audiomae_on_audioset": [null, null, null, null, null, null, null, [["speech", 46.98], ["music", 28.58], ["beatboxing", 3.97]], null, null, null, [["hum", 13.47], ["throbbing", 10.31], ["rumble", 8.19]], null, null, null, null, null, null, null], "duration": [0.73, 1.02, 2.7, 3.22, 1.77, 2.86, 0.88, 7.37, 1.27, 2.76, 1.52, 6.89, 2.21, 3.4, 1.56, 1.33, 1.07, 2.06, 3.37]} \ No newline at end of file diff --git a/annotations_1/zSw2bGgrIQQ_filtered.json b/annotations_1/zSw2bGgrIQQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d65f0eb38fe5b314b03545605a28487d0dfaa89f --- /dev/null +++ b/annotations_1/zSw2bGgrIQQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 11.5], [13.0, 14.62], [16.0, 23.25], [24.0, 24.87], [32.0, 32.83], [36.0, 38.2], [43.0, 47.83], [50.0, 50.41], [54.0, 54.97], [55.0, 55.88], [61.0, 62.92], [68.0, 68.25], [71.0, 70.82], [73.0, 74.17], [77.0, 77.23], [78.0, 77.67], [78.0, 78.0], [82.0, 82.95], [88.0, 88.6], [90.0, 90.95], [97.0, 101.71], [112.0, 113.49], [124.0, 125.93], [128.0, 128.01], [129.0, 145.47], [146.0, 145.56], [146.0, 146.45], [147.0, 150.42], [156.0, 157.91], [159.0, 162.58], [163.0, 162.94]], "keep_status": [true, false, true, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, false], "silence_prob": [30.21, 0.0, 28.91, 0.0, 0.0, 36.44, 30.22, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.44, 0.0, 0.0, 0.0, 28.38, 0.0, 0.0, 28.51, 0.0, 34.09, 0.0], "audiomae_on_audioset": [[["speech", 32.43], ["mains hum", 23.41], ["music", 9.86]], null, [["music", 43.79], ["noise", 21.43], ["throbbing", 3.54]], null, null, [["music", 34.19], ["speech", 22.67], ["hum", 5.53]], [["speech", 85.41], ["music", 3.44], ["telephone", 2.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 82.11], ["electronic music", 2.77], ["musical instrument", 1.71]], null, null, null, [["music", 76.44], ["electronic music", 5.23], ["hum", 4.7]], null, null, [["cattle, bovinae", 24.08], ["livestock, farm animals, working animals", 18.21], ["moo", 13.4]], null, [["music", 21.75], ["hum", 13.66], ["mains hum", 12.04]], null], "duration": [2.5, 1.62, 7.25, 0.87, 0.83, 2.2, 4.83, 0.41, 0.97, 0.88, 1.92, 0.25, -0.18, 1.17, 0.23, -0.33, 0.0, 0.95, 0.6, 0.95, 4.71, 1.49, 1.93, 0.01, 16.47, -0.44, 0.45, 3.42, 1.91, 3.58, -0.06]} \ No newline at end of file diff --git a/annotations_1/zUCWPJk-XHk_filtered.json b/annotations_1/zUCWPJk-XHk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..246235eb3178cc4c4c1f052dc8fbb215c69e4419 --- /dev/null +++ b/annotations_1/zUCWPJk-XHk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 3.94], [8.0, 10.59], [13.0, 13.29], [14.0, 15.7], [20.0, 24.14], [26.0, 26.57], [27.0, 27.85], [35.0, 35.53], [49.0, 49.96], [51.0, 51.75], [54.0, 53.84], [55.0, 55.44], [61.0, 61.4], [73.0, 74.07], [95.0, 95.61], [102.0, 102.96], [112.0, 112.41], [114.0, 116.38], [129.0, 129.15]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [0.0, 41.87, 0.0, 0.0, 57.48, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.86, 0.0], "audiomae_on_audioset": [null, [["music", 35.22], ["theremin", 20.89], ["speech", 17.15]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["doorbell", 11.71], ["music", 8.91], ["singing bowl", 8.6]], null], "duration": [0.94, 2.59, 0.29, 1.7, 4.14, 0.57, 0.85, 0.53, 0.96, 0.75, -0.16, 0.44, 0.4, 1.07, 0.61, 0.96, 0.41, 2.38, 0.15]} \ No newline at end of file diff --git a/annotations_1/zUL_yawY6Ks_filtered.json b/annotations_1/zUL_yawY6Ks_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..cb72211a5f8801179eaa7458b22385b8121ba9b5 --- /dev/null +++ b/annotations_1/zUL_yawY6Ks_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 16.17], [17.0, 17.76], [19.0, 22.47], [25.0, 26.92], [34.0, 34.86], [40.0, 41.12], [42.0, 43.71], [46.0, 46.43], [48.0, 55.26], [57.0, 57.25], [61.0, 66.51], [68.0, 69.5], [70.0, 75.19], [75.0, 81.57], [88.0, 88.77], [98.0, 101.17], [103.0, 104.67], [107.0, 122.52], [123.0, 132.87]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [51.88, 0.0, 59.07, 0.0, 0.0, 0.0, 0.0, 0.0, 58.05, 0.0, 57.72, 0.0, 43.69, 48.02, 0.0, 34.26, 0.0, 29.94, 29.14], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, [["music", 70.09], ["speech", 12.15], ["theremin", 1.72]], [["music", 52.89], ["throbbing", 7.15], ["electronic music", 5.64]], null, [["music", 68.83], ["synthesizer", 4.05], ["throbbing", 3.44]], null, [["music", 65.08], ["throbbing", 2.91], ["soundtrack music", 2.62]], [["music", 58.42], ["hum", 10.49], ["throbbing", 8.62]]], "duration": [12.17, 0.76, 3.47, 1.92, 0.86, 1.12, 1.71, 0.43, 7.26, 0.25, 5.51, 1.5, 5.19, 6.57, 0.77, 3.17, 1.67, 15.52, 9.87]} \ No newline at end of file diff --git a/annotations_1/zUhsEXaj_oY_filtered.json b/annotations_1/zUhsEXaj_oY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..95ecc3f9345c23a719effc49b5afae2dfb6850f3 --- /dev/null +++ b/annotations_1/zUhsEXaj_oY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.2], [12.0, 23.73], [25.0, 25.69], [27.0, 27.41], [30.0, 30.25], [33.0, 33.72], [40.0, 40.58], [50.0, 58.31], [59.0, 64.88], [71.0, 85.5], [86.0, 86.78], [87.0, 88.48], [92.0, 92.92], [93.0, 93.78], [96.0, 103.6], [104.0, 113.51], [116.0, 118.29], [122.0, 121.98], [122.0, 124.5], [126.0, 126.05], [126.0, 127.16], [130.0, 142.47], [148.0, 153.62]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 62.37, 0.0, 0.0, 0.0, 0.0, 0.0, 74.6, 75.39, 53.78, 0.0, 0.0, 0.0, 0.0, 48.48, 40.38, 50.66, 0.0, 56.18, 0.0, 0.0, 36.33, 43.3], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 25.68], ["speech", 9.34], ["inside, small room", 5.46]], [["music", 41.37], ["speech", 21.77], ["animal", 9.53]], null, null, null, null, null, [["music", 65.59], ["speech", 5.25], ["boing", 2.92]], [["music", 58.59], ["boing", 5.81], ["harmonica", 4.66]]], "duration": [0.2, 11.73, 0.69, 0.41, 0.25, 0.72, 0.58, 8.31, 5.88, 14.5, 0.78, 1.48, 0.92, 0.78, 7.6, 9.51, 2.29, -0.02, 2.5, 0.05, 1.16, 12.47, 5.62]} \ No newline at end of file diff --git a/annotations_1/zWW_SH8IFnI_filtered.json b/annotations_1/zWW_SH8IFnI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..825f6a00a1cbfb895fa5463c910e9e29389cbbca --- /dev/null +++ b/annotations_1/zWW_SH8IFnI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[38.0, 39.38], [41.0, 42.23], [42.0, 44.25], [46.0, 47.71], [48.0, 58.33], [62.0, 156.71]], "keep_status": [false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 34.68, 0.0, 29.02, 0.0], "audiomae_on_audioset": [null, null, [["music", 57.83], ["musical instrument", 4.36], ["classical music", 2.58]], null, [["music", 34.08], ["hum", 10.34], ["cacophony", 7.89]], null], "duration": [1.38, 1.23, 2.25, 1.71, 10.33, 94.71]} \ No newline at end of file diff --git a/annotations_1/zXF0zcwPGuI_filtered.json b/annotations_1/zXF0zcwPGuI_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b00438666ae73f31d2b96777439500bb561fd50 --- /dev/null +++ b/annotations_1/zXF0zcwPGuI_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 6.91], [11.0, 11.69], [13.0, 13.02], [14.0, 14.81], [23.0, 27.84], [29.0, 29.88], [30.0, 40.22], [40.0, 51.48], [52.0, 53.0], [54.0, 65.89], [71.0, 91.27], [93.0, 94.44], [95.0, 100.08], [107.0, 106.73], [107.0, 111.48], [114.0, 135.09], [136.0, 137.13]], "keep_status": [false, false, false, false, false, false, false, false, false, false, true, false, true, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 52.74, 0.0, 44.04, 44.43, 0.0, 42.35, 39.28, 0.0, 39.54, 0.0, 41.83, 39.77, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 83.63], ["musical instrument", 1.76], ["mantra", 1.53]], [["music", 74.03], ["carnatic music", 3.6], ["speech", 2.1]], null, [["music", 74.3], ["clarinet", 3.67], ["musical instrument", 2.17]], [["music", 37.31], ["theremin", 12.79], ["cello", 6.82]], null, [["music", 52.83], ["musical instrument", 4.71], ["carnatic music", 3.95]], null, [["music", 57.75], ["theremin", 19.6], ["didgeridoo", 1.4]], [["music", 84.25], ["lullaby", 1.93], ["middle eastern music", 1.87]], null], "duration": [-0.09, 0.69, 0.02, 0.81, 4.84, 0.88, 10.22, 11.48, 1.0, 11.89, 20.27, 1.44, 5.08, -0.27, 4.48, 21.09, 1.13]} \ No newline at end of file diff --git a/annotations_1/zXR_4li9ZnA_filtered.json b/annotations_1/zXR_4li9ZnA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8ed17cc389ca2ce6b6aaa48f32570523ca8148f --- /dev/null +++ b/annotations_1/zXR_4li9ZnA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 15.4], [26.0, 26.32], [28.0, 35.24], [36.0, 50.33], [63.0, 67.04], [68.0, 71.95], [89.0, 89.65], [91.0, 91.66], [92.0, 96.85], [103.0, 107.79], [114.0, 114.13], [122.0, 125.73], [131.0, 134.4], [135.0, 136.02], [137.0, 137.49]], "keep_status": [true, false, false, false, true, true, false, false, false, true, false, true, true, false, false], "silence_prob": [31.65, 0.0, 60.6, 43.61, 33.5, 33.22, 0.0, 0.0, 34.28, 30.47, 0.0, 36.31, 38.54, 0.0, 0.0], "audiomae_on_audioset": [[["livestock, farm animals, working animals", 23.62], ["moo", 19.9], ["cattle, bovinae", 12.71]], null, null, [["music", 69.12], ["ambient music", 4.42], ["singing bowl", 3.19]], [["music", 28.95], ["speech", 17.73], ["thunk", 15.17]], [["fart", 20.23], ["music", 19.54], ["speech", 14.62]], null, null, [["music", 40.92], ["speech", 20.33], ["fart", 12.29]], [["speech", 17.45], ["buzz", 17.4], ["music", 8.26]], null, [["music", 38.1], ["didgeridoo", 15.22], ["musical instrument", 8.22]], [["music", 32.61], ["synthesizer", 13.23], ["quack", 6.44]], null, null], "duration": [14.4, 0.32, 7.24, 14.33, 4.04, 3.95, 0.65, 0.66, 4.85, 4.79, 0.13, 3.73, 3.4, 1.02, 0.49]} \ No newline at end of file diff --git a/annotations_1/zYTsJkuEPWQ_filtered.json b/annotations_1/zYTsJkuEPWQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4d6413885af1749561f1bb12735ca8281d70917c --- /dev/null +++ b/annotations_1/zYTsJkuEPWQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 30.48], [33.0, 36.26], [43.0, 44.14], [50.0, 50.67], [51.0, 51.46], [51.0, 51.85]], "keep_status": [false, true, false, false, false, false], "silence_prob": [0.0, 32.7, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, [["music", 50.1], ["cattle, bovinae", 9.81], ["moo", 6.05]], null, null, null, null], "duration": [0.48, 3.26, 1.14, 0.67, 0.46, 0.85]} \ No newline at end of file diff --git a/annotations_1/zZLAinjBShg_filtered.json b/annotations_1/zZLAinjBShg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4f2801cfe92df858d8b78223de3729f4b7606052 --- /dev/null +++ b/annotations_1/zZLAinjBShg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 0.99], [8.0, 75.84], [76.0, 83.47], [86.0, 86.71], [90.0, 91.99], [96.0, 98.93], [102.0, 101.76], [105.0, 125.19], [129.0, 132.38], [134.0, 134.45], [135.0, 135.01], [137.0, 137.22], [139.0, 142.57], [145.0, 145.72], [151.0, 152.96], [157.0, 157.37], [159.0, 159.44], [161.0, 161.97], [165.0, 165.18]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 44.04, 0.0, 0.0, 37.22, 0.0, 42.69, 80.46, 0.0, 0.0, 0.0, 69.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 43.14], ["boing", 24.58], ["music", 14.72]], null, null, [["music", 15.54], ["sidetone", 8.81], ["moo", 8.09]], null, [["thunk", 53.42], ["speech", 22.28], ["music", 13.29]], null, null, null, null, null, null, null, null, null, null, null], "duration": [-0.01, 67.84, 7.47, 0.71, 1.99, 2.93, -0.24, 20.19, 3.38, 0.45, 0.01, 0.22, 3.57, 0.72, 1.96, 0.37, 0.44, 0.97, 0.18]} \ No newline at end of file diff --git a/annotations_1/zZTH3HdE8Sg_filtered.json b/annotations_1/zZTH3HdE8Sg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5c1a46b4431913d95ba09109d8757570ad3a4e02 --- /dev/null +++ b/annotations_1/zZTH3HdE8Sg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.88], [5.0, 6.22], [8.0, 9.09], [12.0, 11.96], [15.0, 16.43], [19.0, 19.28], [24.0, 24.27], [25.0, 27.5], [34.0, 35.01], [38.0, 38.2], [42.0, 55.65], [59.0, 59.31], [65.0, 66.19], [69.0, 71.95], [72.0, 76.05], [77.0, 120.78], [123.0, 122.93], [124.0, 124.17], [127.0, 130.81], [132.0, 165.48], [168.0, 168.52], [169.0, 169.64]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.01, 0.0, 0.0, 99.85, 0.0, 0.0, 78.21, 52.27, 0.0, 0.0, 0.0, 61.67, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.88, 1.22, 1.09, -0.04, 1.43, 0.28, 0.27, 2.5, 1.01, 0.2, 13.65, 0.31, 1.19, 2.95, 4.05, 43.78, -0.07, 0.17, 3.81, 33.48, 0.52, 0.64]} \ No newline at end of file diff --git a/annotations_1/zZcYZmsSGs0_filtered.json b/annotations_1/zZcYZmsSGs0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..1b348c04215ce3880d24a928aeac1c66c4b52d1c --- /dev/null +++ b/annotations_1/zZcYZmsSGs0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[32.0, 33.81], [35.0, 35.82], [45.0, 54.3], [55.0, 55.04], [56.0, 78.85], [79.0, 79.44], [83.0, 92.45], [93.0, 92.53], [93.0, 92.57], [93.0, 104.99], [106.0, 108.43], [110.0, 112.97], [121.0, 122.07]], "keep_status": [false, false, false, false, true, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 87.19, 0.0, 32.72, 0.0, 35.12, 0.0, 0.0, 38.54, 42.42, 39.52, 0.0], "audiomae_on_audioset": [null, null, null, null, [["speech", 37.52], ["screaming", 13.96], ["animal", 3.45]], null, [["speech", 54.41], ["radio", 9.44], ["frog", 8.55]], null, null, [["moo", 19.3], ["cattle, bovinae", 12.03], ["livestock, farm animals, working animals", 10.36]], [["whale vocalization", 63.77], ["sidetone", 4.45], ["frog", 3.04]], [["vehicle", 21.85], ["car", 21.18], ["race car, auto racing", 16.1]], null], "duration": [1.81, 0.82, 9.3, 0.04, 22.85, 0.44, 9.45, -0.47, -0.43, 11.99, 2.43, 2.97, 1.07]} \ No newline at end of file diff --git a/annotations_1/z_a4zak_zk0_filtered.json b/annotations_1/z_a4zak_zk0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4dc42c927cdd086bbf3678409574bfb9d52b7eb0 --- /dev/null +++ b/annotations_1/z_a4zak_zk0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 18.74], [23.0, 38.7], [43.0, 45.91], [47.0, 50.18], [51.0, 57.87], [58.0, 59.85], [62.0, 62.82], [63.0, 63.12], [70.0, 70.98], [72.0, 72.0], [79.0, 79.07], [84.0, 84.5], [89.0, 89.28], [89.0, 90.02], [100.0, 101.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [97.33, 90.08, 82.43, 99.4, 72.16, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [6.74, 15.7, 2.91, 3.18, 6.87, 1.85, 0.82, 0.12, 0.98, 0.0, 0.07, 0.5, 0.28, 1.02, 1.83]} \ No newline at end of file diff --git a/annotations_1/za8FVqsMmZ0_filtered.json b/annotations_1/za8FVqsMmZ0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d44b514e73ea6d84875868b3b36054cd8ca9565d --- /dev/null +++ b/annotations_1/za8FVqsMmZ0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.34], [4.0, 4.68], [8.0, 8.29], [10.0, 10.99], [14.0, 20.98], [23.0, 23.53], [25.0, 58.63], [63.0, 66.77], [68.0, 173.45], [174.0, 175.0], [180.0, 195.76], [197.0, 196.94]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 34.36, 0.0, 0.0, 35.01, 0.0, 0.0, 31.74, 0.0], "audiomae_on_audioset": [null, null, null, null, [["music", 37.8], ["speech", 16.56], ["hum", 12.41]], null, null, [["music", 43.06], ["whale vocalization", 25.44], ["musical instrument", 4.98]], null, null, [["music", 31.14], ["hum", 14.73], ["throbbing", 8.9]], null], "duration": [0.34, 0.68, 0.29, 0.99, 6.98, 0.53, 33.63, 3.77, 105.45, 1.0, 15.76, -0.06]} \ No newline at end of file diff --git a/annotations_1/zaHU1FW_RZk_filtered.json b/annotations_1/zaHU1FW_RZk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a8173a8aa6b1fefaa5ca3a1da162c4122482a048 --- /dev/null +++ b/annotations_1/zaHU1FW_RZk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 2.1], [3.0, 3.96], [6.0, 7.15], [16.0, 16.19], [17.0, 17.34], [19.0, 19.87], [37.0, 47.73], [58.0, 60.64], [62.0, 63.49], [69.0, 71.88], [76.0, 77.79], [79.0, 80.52], [83.0, 83.24], [86.0, 86.19], [88.0, 90.19], [91.0, 92.3], [96.0, 98.37], [106.0, 106.51], [111.0, 112.28], [114.0, 115.23], [117.0, 117.98], [119.0, 129.64]], "keep_status": [false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.56, 31.62, 0.0, 31.89, 0.0, 0.0, 0.0, 0.0, 31.83, 0.0, 31.76, 0.0, 0.0, 0.0, 0.0, 31.83], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 79.03], ["speech", 6.15], ["throbbing", 2.12]], [["music", 76.1], ["didgeridoo", 5.89], ["theremin", 3.88]], null, [["music", 34.06], ["sidetone", 19.06], ["throbbing", 8.57]], null, null, null, null, [["music", 77.68], ["electronic music", 3.7], ["techno", 3.12]], null, [["music", 48.4], ["didgeridoo", 9.26], ["sidetone", 8.5]], null, null, null, null, [["music", 81.18], ["throbbing", 3.31], ["hum", 2.64]]], "duration": [1.1, 0.96, 1.15, 0.19, 0.34, 0.87, 10.73, 2.64, 1.49, 2.88, 1.79, 1.52, 0.24, 0.19, 2.19, 1.3, 2.37, 0.51, 1.28, 1.23, 0.98, 10.64]} \ No newline at end of file diff --git a/annotations_1/zadI5ngwLsM_filtered.json b/annotations_1/zadI5ngwLsM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5db881cc03f3265000898173d7afd33204e7688c --- /dev/null +++ b/annotations_1/zadI5ngwLsM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 4.16], [11.0, 12.33], [20.0, 20.76], [23.0, 24.54], [26.0, 27.26], [29.0, 30.06], [34.0, 34.42], [39.0, 41.49], [42.0, 79.49], [81.0, 87.52], [90.0, 99.55], [100.0, 100.11], [101.0, 101.41], [103.0, 102.84], [104.0, 120.26], [121.0, 130.69], [133.0, 132.98], [133.0, 133.08], [133.0, 133.12], [133.0, 154.43], [155.0, 158.94], [161.0, 168.05], [170.0, 174.01]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 94.81, 0.0, 47.43, 61.27, 0.0, 0.0, 0.0, 32.31, 37.95, 0.0, 0.0, 0.0, 40.52, 45.59, 96.29, 81.53], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, [["hum", 46.41], ["throbbing", 18.89], ["mains hum", 16.5]], null, null, null, null, [["music", 43.3], ["breaking", 20.35], ["ding", 5.56]], [["mains hum", 25.49], ["hum", 20.38], ["rumble", 18.66]], null, null, null, [["speech", 67.6], ["music", 10.41], ["hum", 4.4]], [["speech", 61.0], ["glass", 6.4], ["music", 3.37]], null, null], "duration": [0.16, 1.33, 0.76, 1.54, 1.26, 1.06, 0.42, 2.49, 37.49, 6.52, 9.55, 0.11, 0.41, -0.16, 16.26, 9.69, -0.02, 0.08, 0.12, 21.43, 3.94, 7.05, 4.01]} \ No newline at end of file diff --git a/annotations_1/zb5RJyrk4gc_filtered.json b/annotations_1/zb5RJyrk4gc_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..47f8655d063b1b1702a344d27eafb712642b4e35 --- /dev/null +++ b/annotations_1/zb5RJyrk4gc_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.93], [9.0, 9.76], [11.0, 11.75], [13.0, 13.74], [16.0, 18.12], [29.0, 28.71], [32.0, 32.97], [34.0, 34.38], [36.0, 35.8], [37.0, 37.13], [39.0, 40.56], [41.0, 43.02], [46.0, 46.28], [48.0, 48.98], [51.0, 52.07], [54.0, 59.44], [62.0, 65.21], [81.0, 83.07], [84.0, 84.89], [87.0, 87.51], [89.0, 93.61], [97.0, 98.09], [99.0, 100.87], [107.0, 107.23], [114.0, 127.99], [131.0, 138.06], [139.0, 142.77], [147.0, 157.6], [160.0, 174.9]], "keep_status": [false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, true, true, true, false, false, true, false, false, false, false, false, true, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 32.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.96, 0.0, 0.0, 0.0, 31.27, 30.43, 31.41, 0.0, 0.0, 34.34, 0.0, 0.0, 0.0, 30.63, 30.82, 31.06, 30.31, 30.83], "audiomae_on_audioset": [null, null, null, null, [["music", 55.77], ["speech", 6.04], ["musical instrument", 3.59]], null, null, null, null, null, null, [["speech", 56.61], ["vehicle", 8.15], ["boat, water vehicle", 7.32]], null, null, null, [["speech", 52.17], ["music", 13.95], ["hubbub, speech noise, speech babble", 3.57]], [["vehicle", 15.39], ["speech", 14.39], ["music", 12.6]], [["fly, housefly", 19.88], ["speech", 11.53], ["insect", 9.16]], null, null, [["music", 37.56], ["speech", 10.95], ["throbbing", 4.92]], null, null, null, [["music", 64.53], ["speech", 16.4], ["electronic music", 3.7]], [["hum", 32.31], ["music", 23.75], ["mains hum", 20.35]], [["music", 49.99], ["electronic music", 10.32], ["speech", 5.53]], [["speech", 14.85], ["music", 13.67], ["hum", 13.24]], [["music", 37.64], ["hum", 17.67], ["mains hum", 16.5]]], "duration": [0.93, 0.76, 0.75, 0.74, 2.12, -0.29, 0.97, 0.38, -0.2, 0.13, 1.56, 2.02, 0.28, 0.98, 1.07, 5.44, 3.21, 2.07, 0.89, 0.51, 4.61, 1.09, 1.87, 0.23, 13.99, 7.06, 3.77, 10.6, 14.9]} \ No newline at end of file diff --git a/annotations_1/zbAsqngq2qY_filtered.json b/annotations_1/zbAsqngq2qY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..db1d30e9a2ee830a9e30aa4f79e129cdcc2c2ca1 --- /dev/null +++ b/annotations_1/zbAsqngq2qY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.74], [4.0, 4.33], [5.0, 5.48], [7.0, 7.75], [9.0, 10.07], [10.0, 10.76], [11.0, 11.85], [13.0, 14.99], [18.0, 19.92], [21.0, 22.45], [23.0, 24.97], [26.0, 28.12], [32.0, 42.72], [43.0, 54.78], [55.0, 55.98], [58.0, 58.48], [59.0, 59.29], [61.0, 61.08], [62.0, 79.95], [81.0, 80.91], [84.0, 92.89], [94.0, 104.28], [106.0, 106.81], [107.0, 113.17]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.85, 73.06, 67.51, 0.0, 0.0, 0.0, 0.0, 35.03, 0.0, 61.08, 37.25, 0.0, 32.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["mosquito", 42.14], ["fly, housefly", 11.19], ["music", 8.72]], null, null, [["music", 64.18], ["didgeridoo", 7.04], ["musical instrument", 5.51]], null, [["saxophone", 31.28], ["music", 26.58], ["brass instrument", 13.53]]], "duration": [0.74, 0.33, 0.48, 0.75, 1.07, 0.76, 0.85, 1.99, 1.92, 1.45, 1.97, 2.12, 10.72, 11.78, 0.98, 0.48, 0.29, 0.08, 17.95, -0.09, 8.89, 10.28, 0.81, 6.17]} \ No newline at end of file diff --git a/annotations_1/zbHFgQ419Qs_filtered.json b/annotations_1/zbHFgQ419Qs_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5a6eeacbaf2ebecd1cff15f1667ae007b42a2b29 --- /dev/null +++ b/annotations_1/zbHFgQ419Qs_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 4.58], [5.0, 5.85], [10.0, 18.79], [25.0, 25.42], [26.0, 28.43], [31.0, 34.82], [39.0, 45.3], [47.0, 47.29], [48.0, 48.54], [50.0, 51.0], [52.0, 55.65], [59.0, 61.87], [65.0, 64.79], [67.0, 67.36], [74.0, 74.39], [77.0, 76.81], [79.0, 79.35], [82.0, 82.88], [84.0, 85.45], [87.0, 87.59], [88.0, 88.94], [91.0, 93.55], [96.0, 97.34], [100.0, 105.31], [106.0, 106.17], [108.0, 109.81], [110.0, 111.48], [112.0, 118.05], [119.0, 121.36]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false], "silence_prob": [58.89, 0.0, 54.76, 0.0, 99.68, 99.91, 46.54, 0.0, 0.0, 0.0, 97.33, 70.44, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.95, 0.0, 67.0, 0.0, 0.0, 0.0, 38.67, 55.81], "audiomae_on_audioset": [null, null, null, null, null, null, [["singing bowl", 34.91], ["music", 25.21], ["guitar", 4.1]], null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 33.98], ["speech", 13.87], ["groan", 3.78]], null], "duration": [2.58, 0.85, 8.79, 0.42, 2.43, 3.82, 6.3, 0.29, 0.54, 1.0, 3.65, 2.87, -0.21, 0.36, 0.39, -0.19, 0.35, 0.88, 1.45, 0.59, 0.94, 2.55, 1.34, 5.31, 0.17, 1.81, 1.48, 6.05, 2.36]} \ No newline at end of file diff --git a/annotations_1/zct1tPK1Zk0_filtered.json b/annotations_1/zct1tPK1Zk0_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..747fcbe5c78cdcbef97b7cd1255b32e15c36401b --- /dev/null +++ b/annotations_1/zct1tPK1Zk0_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[7.0, 10.4], [12.0, 13.15], [16.0, 16.85], [21.0, 21.59], [24.0, 24.11], [26.0, 36.9], [49.0, 49.96], [51.0, 55.04], [59.0, 59.98], [60.0, 61.13], [62.0, 64.93], [70.0, 75.76], [80.0, 84.7], [90.0, 95.76], [101.0, 119.42], [122.0, 135.6], [140.0, 159.46]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, true, true, false, true, false], "silence_prob": [35.9, 0.0, 0.0, 0.0, 0.0, 34.24, 0.0, 54.97, 0.0, 0.0, 87.92, 36.16, 49.18, 32.78, 31.57, 32.74, 35.55], "audiomae_on_audioset": [[["music", 28.38], ["sidetone", 9.78], ["musical instrument", 6.82]], null, null, null, null, [["music", 60.61], ["trombone", 8.44], ["musical instrument", 6.97]], null, null, null, null, null, [["effects unit", 13.41], ["music", 11.83], ["hum", 9.49]], [["hum", 42.29], ["roar", 13.28], ["throbbing", 8.66]], [["speech", 26.52], ["music", 12.85], ["radio", 10.4]], [["music", 60.43], ["didgeridoo", 16.68], ["speech", 2.28]], [["music", 28.16], ["vehicle", 10.47], ["effects unit", 9.65]], [["music", 71.83], ["musical instrument", 5.02], ["trombone", 2.27]]], "duration": [3.4, 1.15, 0.85, 0.59, 0.11, 10.9, 0.96, 4.04, 0.98, 1.13, 2.93, 5.76, 4.7, 5.76, 18.42, 13.6, 19.46]} \ No newline at end of file diff --git a/annotations_1/zd6ZUTrW5b4_filtered.json b/annotations_1/zd6ZUTrW5b4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b718b2d786115a056795f1113ad8f7d727a3a5a0 --- /dev/null +++ b/annotations_1/zd6ZUTrW5b4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 6.54], [7.0, 8.83], [9.0, 9.85], [10.0, 11.18], [13.0, 14.77], [15.0, 16.02], [17.0, 17.95], [19.0, 19.94], [21.0, 21.83], [23.0, 23.33], [24.0, 25.27], [27.0, 29.34], [31.0, 33.34], [40.0, 40.17], [43.0, 44.36], [45.0, 45.98], [46.0, 46.36], [47.0, 47.78], [48.0, 49.45], [50.0, 51.43], [54.0, 55.44], [57.0, 57.38], [59.0, 59.26], [61.0, 61.35], [63.0, 65.99], [67.0, 67.76], [72.0, 73.28], [75.0, 75.14], [78.0, 78.14], [81.0, 81.77], [82.0, 83.44], [87.0, 87.32], [89.0, 89.83], [91.0, 91.69], [96.0, 95.98], [102.0, 102.34], [104.0, 104.11], [107.0, 107.92], [109.0, 109.39], [112.0, 113.27], [114.0, 114.3], [118.0, 118.64], [121.0, 122.98], [123.0, 125.22], [126.0, 128.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [87.55, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 93.45, 78.04], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [2.54, 1.83, 0.85, 1.18, 1.77, 1.02, 0.95, 0.94, 0.83, 0.33, 1.27, 2.34, 2.34, 0.17, 1.36, 0.98, 0.36, 0.78, 1.45, 1.43, 1.44, 0.38, 0.26, 0.35, 2.99, 0.76, 1.28, 0.14, 0.14, 0.77, 1.44, 0.32, 0.83, 0.69, -0.02, 0.34, 0.11, 0.92, 0.39, 1.27, 0.3, 0.64, 1.98, 2.22, 2.73]} \ No newline at end of file diff --git a/annotations_1/ze8D_5hdmTE_filtered.json b/annotations_1/ze8D_5hdmTE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..609687c32aebecb2b750af9fdfb600d97ad7b26b --- /dev/null +++ b/annotations_1/ze8D_5hdmTE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[20.0, 21.02], [30.0, 31.4], [45.0, 46.14], [48.0, 48.46], [49.0, 51.12], [51.0, 51.65], [60.0, 64.34], [76.0, 75.68], [86.0, 89.36], [107.0, 110.44], [114.0, 114.56], [116.0, 117.96], [119.0, 125.66], [127.0, 144.63], [146.0, 146.03], [148.0, 148.05], [151.0, 162.21], [165.0, 165.81], [170.0, 171.05], [180.0, 181.01]], "keep_status": [false, false, false, false, true, false, true, false, true, true, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 31.07, 0.0, 28.94, 0.0, 29.33, 28.76, 0.0, 0.0, 29.09, 29.47, 0.0, 0.0, 31.83, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["explosion", 38.76], ["eruption", 14.94], ["burst, pop", 7.18]], null, [["music", 39.06], ["reverberation", 7.46], ["rumble", 4.09]], null, [["speech", 31.55], ["music", 22.5], ["hum", 12.51]], [["speech", 40.13], ["music", 9.51], ["civil defense siren", 4.61]], null, null, [["music", 34.19], ["speech", 23.14], ["didgeridoo", 7.75]], [["music", 56.21], ["speech", 22.08], ["thump, thud", 6.29]], null, null, [["speech", 82.69], ["applause", 1.83], ["music", 1.58]], null, null, null], "duration": [1.02, 1.4, 1.14, 0.46, 2.12, 0.65, 4.34, -0.32, 3.36, 3.44, 0.56, 1.96, 6.66, 17.63, 0.03, 0.05, 11.21, 0.81, 1.05, 1.01]} \ No newline at end of file diff --git a/annotations_1/zeGRvFbWbz8_filtered.json b/annotations_1/zeGRvFbWbz8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..291f492ed434ffe44424c76bb279183985772e6d --- /dev/null +++ b/annotations_1/zeGRvFbWbz8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.46], [8.0, 8.77], [14.0, 14.57], [16.0, 16.71], [19.0, 18.59], [23.0, 24.0], [25.0, 26.92], [29.0, 28.93], [30.0, 31.06], [34.0, 35.06], [37.0, 39.33], [43.0, 50.82], [54.0, 56.37], [59.0, 59.49], [61.0, 65.84], [68.0, 68.66], [71.0, 73.08], [74.0, 75.57], [78.0, 78.97], [80.0, 81.06], [84.0, 91.99], [93.0, 93.68], [98.0, 98.52], [103.0, 103.79], [109.0, 109.29], [112.0, 111.86], [123.0, 124.41], [129.0, 129.42], [132.0, 138.69], [142.0, 142.5], [146.0, 146.74], [149.0, 150.48], [158.0, 164.52], [169.0, 171.68], [177.0, 179.64], [180.0, 180.15], [182.0, 185.46], [187.0, 195.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.75, 34.7, 40.81, 0.0, 37.32, 0.0, 35.45, 0.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.21, 0.0, 0.0, 0.0, 82.79, 50.31, 65.67, 0.0, 63.85, 39.33], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, [["music", 45.34], ["boing", 14.52], ["throbbing", 10.72]], [["music", 49.38], ["speech", 20.54], ["boing", 4.85]], [["music", 72.69], ["fart", 10.84], ["zipper (clothing)", 3.7]], null, [["music", 69.85], ["throbbing", 9.55], ["hum", 7.06]], null, [["music", 54.93], ["throbbing", 8.84], ["hum", 4.24]], null, null, null, [["music", 49.46], ["speech", 12.66], ["hum", 6.72]], null, null, null, null, null, null, null, [["cattle, bovinae", 32.28], ["moo", 25.26], ["livestock, farm animals, working animals", 19.97]], null, null, null, null, null, null, null, null, [["speech", 52.3], ["music", 26.67], ["boing", 3.66]]], "duration": [1.46, 0.77, 0.57, 0.71, -0.41, 1.0, 1.92, -0.07, 1.06, 1.06, 2.33, 7.82, 2.37, 0.49, 4.84, 0.66, 2.08, 1.57, 0.97, 1.06, 7.99, 0.68, 0.52, 0.79, 0.29, -0.14, 1.41, 0.42, 6.69, 0.5, 0.74, 1.48, 6.52, 2.68, 2.64, 0.15, 3.46, 8.52]} \ No newline at end of file diff --git a/annotations_1/zeSe5X9ALXg_filtered.json b/annotations_1/zeSe5X9ALXg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..94f5a1bf9ca383abd74e4c7155247b02dd518651 --- /dev/null +++ b/annotations_1/zeSe5X9ALXg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 11.47], [12.0, 12.8], [14.0, 36.95], [41.0, 41.28], [42.0, 47.22], [50.0, 81.72], [82.0, 83.0], [84.0, 83.89], [87.0, 87.91], [93.0, 93.06], [95.0, 95.57], [97.0, 100.84], [103.0, 112.94]], "keep_status": [false, false, true, false, false, false, false, false, false, false, false, false, true], "silence_prob": [52.39, 0.0, 35.57, 0.0, 30.34, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 58.98, 40.73], "audiomae_on_audioset": [null, null, [["speech", 28.22], ["music", 19.55], ["hum", 19.15]], null, [["whale vocalization", 87.68], ["frog", 1.19], ["speech", 1.09]], null, null, null, null, null, null, null, [["noise", 20.6], ["fly, housefly", 16.61], ["electric shaver, electric razor", 15.42]]], "duration": [6.47, 0.8, 22.95, 0.28, 5.22, 31.72, 1.0, -0.11, 0.91, 0.06, 0.57, 3.84, 9.94]} \ No newline at end of file diff --git a/annotations_1/zeV1-Ito9HM_filtered.json b/annotations_1/zeV1-Ito9HM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f646672c1adf30920486b2e6a0c67862ef9d5992 --- /dev/null +++ b/annotations_1/zeV1-Ito9HM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 26.15], [29.0, 47.39], [48.0, 49.17], [50.0, 52.3], [53.0, 56.57], [58.0, 65.7], [66.0, 73.47], [74.0, 74.9], [77.0, 81.01], [81.0, 81.21], [84.0, 100.2]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [66.27, 99.9, 0.0, 82.25, 92.15, 96.17, 77.53, 0.0, 56.93, 0.0, 85.35], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null], "duration": [14.15, 18.39, 1.17, 2.3, 3.57, 7.7, 7.47, 0.9, 4.01, 0.21, 16.2]} \ No newline at end of file diff --git a/annotations_1/zfUzaYV1xfE_filtered.json b/annotations_1/zfUzaYV1xfE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2a746950e3ca3f0887f9ef54b318b851d2316df1 --- /dev/null +++ b/annotations_1/zfUzaYV1xfE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.17], [7.0, 11.35], [12.0, 14.74], [16.0, 24.51], [25.0, 26.16], [32.0, 33.66], [36.0, 39.36], [41.0, 44.63], [45.0, 46.2], [47.0, 48.52], [49.0, 49.54], [50.0, 51.53], [53.0, 59.05], [63.0, 63.96], [66.0, 66.65], [67.0, 70.75], [71.0, 71.88], [79.0, 81.87], [86.0, 89.75], [93.0, 95.37], [99.0, 100.08], [102.0, 103.01], [105.0, 106.1], [107.0, 109.24], [109.0, 113.93], [115.0, 115.79], [117.0, 118.93], [125.0, 137.4], [139.0, 147.23], [148.0, 149.05]], "keep_status": [false, false, true, false, false, false, true, true, false, false, false, false, true, false, false, false, false, false, true, true, false, false, false, true, false, false, false, true, false, false], "silence_prob": [70.02, 51.39, 44.46, 35.56, 0.0, 0.0, 37.17, 30.94, 0.0, 0.0, 0.0, 0.0, 30.86, 0.0, 0.0, 30.68, 0.0, 28.75, 36.01, 28.57, 0.0, 0.0, 0.0, 29.86, 34.75, 0.0, 0.0, 29.36, 28.35, 0.0], "audiomae_on_audioset": [null, null, [["speech", 25.17], ["music", 21.25], ["hum", 10.35]], [["music", 52.49], ["ambient music", 12.66], ["synthesizer", 4.9]], null, null, [["throbbing", 18.96], ["hum", 17.99], ["mains hum", 16.11]], [["hum", 31.28], ["mains hum", 11.99], ["music", 11.7]], null, null, null, null, [["music", 35.11], ["hum", 12.33], ["speech", 9.63]], null, null, [["music", 62.05], ["hum", 8.15], ["mains hum", 5.61]], null, [["mains hum", 55.78], ["hum", 19.4], ["music", 5.84]], [["hum", 31.76], ["mains hum", 21.9], ["music", 7.31]], [["whack, thwack", 20.38], ["explosion", 12.08], ["fart", 7.43]], null, null, null, [["mains hum", 28.11], ["hum", 18.99], ["buzz", 6.38]], [["bee, wasp, etc.", 40.59], ["fly, housefly", 29.82], ["insect", 10.14]], null, null, [["speech", 24.58], ["mains hum", 21.13], ["hum", 17.88]], [["speech", 47.39], ["fly, housefly", 15.91], ["insect", 9.72]], null], "duration": [3.17, 4.35, 2.74, 8.51, 1.16, 1.66, 3.36, 3.63, 1.2, 1.52, 0.54, 1.53, 6.05, 0.96, 0.65, 3.75, 0.88, 2.87, 3.75, 2.37, 1.08, 1.01, 1.1, 2.24, 4.93, 0.79, 1.93, 12.4, 8.23, 1.05]} \ No newline at end of file diff --git a/annotations_1/zfyDw7VR3Hg_filtered.json b/annotations_1/zfyDw7VR3Hg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bdc37e8a586e086b7d814dcd4e8814f7b86b8490 --- /dev/null +++ b/annotations_1/zfyDw7VR3Hg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 19.68], [22.0, 76.35], [78.0, 109.73], [112.0, 114.12], [121.0, 120.68], [122.0, 122.44], [123.0, 126.5], [127.0, 129.07], [131.0, 134.92], [135.0, 135.87]], "keep_status": [false, false, false, false, false, false, false, false, true, false], "silence_prob": [35.03, 0.0, 0.0, 96.04, 0.0, 0.0, 75.39, 41.91, 36.53, 0.0], "audiomae_on_audioset": [[["music", 65.52], ["hum", 5.91], ["speech", 4.62]], null, null, null, null, null, null, [["speech", 60.8], ["music", 11.08], ["sidetone", 9.32]], [["beatboxing", 27.7], ["speech", 19.13], ["mains hum", 9.06]], null], "duration": [13.68, 54.35, 31.73, 2.12, -0.32, 0.44, 3.5, 2.07, 3.92, 0.87]} \ No newline at end of file diff --git a/annotations_1/zgrvS0PJDrA_filtered.json b/annotations_1/zgrvS0PJDrA_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..f67c24ac427b60fc0d8e9c30d987516c221eb9c5 --- /dev/null +++ b/annotations_1/zgrvS0PJDrA_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.74], [8.0, 10.71], [12.0, 11.99], [16.0, 17.95], [20.0, 20.49], [21.0, 20.85], [21.0, 23.77], [34.0, 33.76], [34.0, 36.71], [40.0, 40.85], [51.0, 52.86], [55.0, 78.16], [82.0, 83.35], [85.0, 88.26], [89.0, 89.99], [97.0, 97.34], [124.0, 124.02], [127.0, 127.63], [129.0, 130.52]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 75.07, 0.0, 0.0, 0.0, 0.0, 65.2, 0.0, 57.81, 0.0, 0.0, 47.74, 0.0, 70.72, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, [["music", 34.63], ["synthesizer", 13.83], ["musical instrument", 4.77]], null, null, null, null, null, null, null], "duration": [0.74, 2.71, -0.01, 1.95, 0.49, -0.15, 2.77, -0.24, 2.71, 0.85, 1.86, 23.16, 1.35, 3.26, 0.99, 0.34, 0.02, 0.63, 1.52]} \ No newline at end of file diff --git a/annotations_1/zha1tYGnAC8_filtered.json b/annotations_1/zha1tYGnAC8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b8e420a58030b5797f106ae6e566a0401e8a6d77 --- /dev/null +++ b/annotations_1/zha1tYGnAC8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 7.01], [9.0, 9.19], [10.0, 12.61], [14.0, 14.18], [15.0, 18.47], [20.0, 20.58], [22.0, 35.94], [41.0, 46.11], [48.0, 100.57], [103.0, 103.57], [105.0, 108.4]], "keep_status": [false, false, true, false, true, false, true, false, false, false, false], "silence_prob": [58.98, 0.0, 32.83, 0.0, 32.66, 0.0, 30.11, 30.89, 0.0, 0.0, 34.74], "audiomae_on_audioset": [null, null, [["music", 37.95], ["noise", 12.71], ["chirp tone", 7.47]], null, [["music", 21.03], ["hum", 19.82], ["mains hum", 15.43]], null, [["music", 40.68], ["buzz", 12.35], ["vehicle", 4.72]], [["music", 46.63], ["throbbing", 20.66], ["hum", 10.32]], null, null, [["hum", 39.8], ["mains hum", 29.45], ["throbbing", 12.58]]], "duration": [2.01, 0.19, 2.61, 0.18, 3.47, 0.58, 13.94, 5.11, 52.57, 0.57, 3.4]} \ No newline at end of file diff --git a/annotations_1/zhhLFNr_Jio_filtered.json b/annotations_1/zhhLFNr_Jio_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d4b0b88834329ceed7528e27b05134e7b6c5bb6b --- /dev/null +++ b/annotations_1/zhhLFNr_Jio_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[4.0, 5.24], [7.0, 13.68], [14.0, 14.57], [19.0, 23.7], [26.0, 28.31], [31.0, 48.07], [48.0, 50.4], [52.0, 86.09], [89.0, 90.12], [92.0, 103.81], [104.0, 126.39], [128.0, 137.17], [137.0, 142.86], [143.0, 144.53], [145.0, 151.56], [155.0, 156.02], [156.0, 156.44]], "keep_status": [false, true, false, true, false, true, true, false, false, true, true, false, true, false, true, false, false], "silence_prob": [0.0, 37.43, 0.0, 47.98, 53.04, 30.91, 30.38, 0.0, 0.0, 43.53, 46.33, 39.25, 41.36, 0.0, 41.91, 0.0, 0.0], "audiomae_on_audioset": [null, [["hum", 22.61], ["music", 16.57], ["synthesizer", 13.85]], null, [["music", 43.66], ["synthesizer", 13.16], ["musical instrument", 3.54]], null, [["speech", 33.25], ["music", 24.93], ["whack, thwack", 5.72]], [["speech", 37.43], ["music", 17.65], ["fart", 4.77]], null, null, [["speech", 20.66], ["hum", 17.31], ["grunt", 12.08]], [["gasp", 34.59], ["speech", 17.81], ["beatboxing", 7.95]], [["throbbing", 45.55], ["hum", 27.0], ["mains hum", 6.95]], [["speech", 22.56], ["hum", 15.3], ["music", 11.6]], null, [["hum", 21.36], ["music", 12.11], ["throbbing", 12.06]], null, null], "duration": [1.24, 6.68, 0.57, 4.7, 2.31, 17.07, 2.4, 34.09, 1.12, 11.81, 22.39, 9.17, 5.86, 1.53, 6.56, 1.02, 0.44]} \ No newline at end of file diff --git a/annotations_1/zjQSWtB7Kp4_filtered.json b/annotations_1/zjQSWtB7Kp4_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..10b62e4cda0fea2b1385733f165798e92c37c2ca --- /dev/null +++ b/annotations_1/zjQSWtB7Kp4_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 61.8], [65.0, 67.47], [74.0, 76.57], [78.0, 83.4]], "keep_status": [false, true, true, true], "silence_prob": [0.0, 39.41, 38.91, 32.62], "audiomae_on_audioset": [null, [["music", 52.86], ["ambient music", 5.29], ["electronic music", 5.01]], [["music", 40.93], ["theremin", 9.81], ["fly, housefly", 6.35]], [["music", 22.46], ["didgeridoo", 15.84], ["firecracker", 10.14]]], "duration": [34.8, 2.47, 2.57, 5.4]} \ No newline at end of file diff --git a/annotations_1/zjXn9UGZt4o_filtered.json b/annotations_1/zjXn9UGZt4o_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..645ed233dade43c959e84451484eec716b75b025 --- /dev/null +++ b/annotations_1/zjXn9UGZt4o_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 3.23], [5.0, 6.51], [7.0, 12.65], [15.0, 15.3], [21.0, 22.13], [23.0, 26.64], [30.0, 31.55], [32.0, 33.03], [34.0, 34.7], [36.0, 35.78], [48.0, 49.1], [55.0, 55.31], [63.0, 64.54], [66.0, 67.53], [72.0, 72.6], [74.0, 77.85], [79.0, 79.32], [80.0, 81.08], [81.0, 82.09], [84.0, 84.38], [86.0, 108.89], [110.0, 113.61], [114.0, 116.38], [117.0, 134.91], [136.0, 141.07], [142.0, 143.8], [147.0, 147.88], [149.0, 150.38]], "keep_status": [false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, true, true, true, false, false, false, false], "silence_prob": [59.96, 0.0, 64.18, 0.0, 0.0, 35.39, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.01, 0.0, 0.0, 0.0, 0.0, 31.16, 38.37, 37.56, 30.68, 34.29, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, [["music", 61.75], ["throbbing", 4.95], ["drum machine", 2.71]], null, null, null, null, null, null, null, null, null, [["music", 51.14], ["didgeridoo", 12.56], ["electronic music", 2.44]], null, null, null, null, [["speech", 67.96], ["music", 11.28], ["whack, thwack", 6.45]], [["music", 38.86], ["hum", 16.57], ["speech", 4.63]], [["speech", 25.8], ["sidetone", 14.05], ["music", 13.68]], [["music", 34.49], ["hum", 10.63], ["speech", 8.89]], [["music", 56.18], ["didgeridoo", 14.12], ["throbbing", 5.62]], null, null, null], "duration": [2.23, 1.51, 5.65, 0.3, 1.13, 3.64, 1.55, 1.03, 0.7, -0.22, 1.1, 0.31, 1.54, 1.53, 0.6, 3.85, 0.32, 1.08, 1.09, 0.38, 22.89, 3.61, 2.38, 17.91, 5.07, 1.8, 0.88, 1.38]} \ No newline at end of file diff --git a/annotations_1/zjdTL3Z77G8_filtered.json b/annotations_1/zjdTL3Z77G8_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b5bb555e772132b4cf4c59667ae36deec667810e --- /dev/null +++ b/annotations_1/zjdTL3Z77G8_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[0.0, 0.26], [10.0, 13.14], [17.0, 17.47], [29.0, 29.64], [44.0, 44.74], [45.0, 49.67], [57.0, 56.81], [66.0, 67.24], [78.0, 78.39], [81.0, 81.97], [85.0, 85.73], [88.0, 87.89], [88.0, 87.93], [88.0, 87.99], [97.0, 97.28], [105.0, 106.95], [112.0, 120.45]], "keep_status": [false, true, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 39.5, 0.0, 0.0, 0.0, 38.58, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.55], "audiomae_on_audioset": [null, [["music", 59.99], ["electronic music", 4.8], ["synthesizer", 3.08]], null, null, null, [["music", 45.87], ["throbbing", 11.91], ["speech", 11.71]], null, null, null, null, null, null, null, null, null, null, [["music", 81.63], ["electronic music", 4.31], ["house music", 2.82]]], "duration": [0.26, 3.14, 0.47, 0.64, 0.74, 4.67, -0.19, 1.24, 0.39, 0.97, 0.73, -0.11, -0.07, -0.01, 0.28, 1.95, 8.45]} \ No newline at end of file diff --git a/annotations_1/zjm_GqK-Kmo_filtered.json b/annotations_1/zjm_GqK-Kmo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1efddf662d8a9722cb547430c7a57d11b211b6c --- /dev/null +++ b/annotations_1/zjm_GqK-Kmo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[13.0, 13.86], [15.0, 16.02], [17.0, 19.94], [22.0, 21.81], [23.0, 25.51], [29.0, 29.46], [32.0, 34.11], [37.0, 37.1], [44.0, 45.15], [47.0, 48.66], [50.0, 50.31], [54.0, 56.1], [57.0, 64.79], [66.0, 68.57], [69.0, 70.66], [72.0, 73.45], [77.0, 79.39]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false], "silence_prob": [0.0, 0.0, 99.68, 0.0, 99.26, 0.0, 99.99, 0.0, 0.0, 0.0, 0.0, 96.66, 75.88, 45.49, 0.0, 0.0, 57.09], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["rumble", 18.04], ["hum", 9.57], ["vehicle", 7.54]], null, null, null], "duration": [0.86, 1.02, 2.94, -0.19, 2.51, 0.46, 2.11, 0.1, 1.15, 1.66, 0.31, 2.1, 7.79, 2.57, 1.66, 1.45, 2.39]} \ No newline at end of file diff --git a/annotations_1/zkRkL94VQxY_filtered.json b/annotations_1/zkRkL94VQxY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c69e29bde00ee3d1e9953aec8d2fe5c8dbf7189f --- /dev/null +++ b/annotations_1/zkRkL94VQxY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[27.0, 32.07], [33.0, 39.26], [43.0, 43.68], [45.0, 45.98], [47.0, 55.34], [57.0, 57.0], [57.0, 57.52], [77.0, 93.97], [95.0, 96.96], [98.0, 99.45], [100.0, 100.53], [102.0, 108.6], [110.0, 110.1], [115.0, 117.0], [118.0, 119.11], [120.0, 120.5], [130.0, 130.2], [148.0, 151.01], [153.0, 154.38], [160.0, 161.64]], "keep_status": [true, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false], "silence_prob": [32.83, 32.26, 0.0, 0.0, 32.3, 0.0, 0.0, 34.93, 0.0, 0.0, 0.0, 31.54, 0.0, 93.91, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0], "audiomae_on_audioset": [[["music", 31.81], ["whack, thwack", 17.25], ["speech", 8.58]], [["music", 55.99], ["boing", 11.35], ["speech", 4.09]], null, null, [["didgeridoo", 41.08], ["music", 36.38], ["musical instrument", 5.86]], null, null, [["music", 56.06], ["throbbing", 18.16], ["hum", 11.62]], null, null, null, [["speech", 16.69], ["music", 11.98], ["whale vocalization", 9.78]], null, null, null, null, null, null, null, null], "duration": [5.07, 6.26, 0.68, 0.98, 8.34, 0.0, 0.52, 16.97, 1.96, 1.45, 0.53, 6.6, 0.1, 2.0, 1.11, 0.5, 0.2, 3.01, 1.38, 1.64]} \ No newline at end of file diff --git a/annotations_1/zkWthOfGYgM_filtered.json b/annotations_1/zkWthOfGYgM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..72061d976a9344e59e2c2691cdcbabc01bb1c417 --- /dev/null +++ b/annotations_1/zkWthOfGYgM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.11], [5.0, 6.02], [8.0, 9.02], [10.0, 10.32], [11.0, 13.68], [16.0, 17.34], [18.0, 20.76], [22.0, 22.38], [23.0, 24.63], [27.0, 27.48], [30.0, 30.33], [45.0, 44.74], [54.0, 55.12], [61.0, 61.89], [63.0, 63.46], [64.0, 64.61], [65.0, 65.77], [66.0, 65.87], [66.0, 67.31], [68.0, 67.63], [69.0, 69.35], [70.0, 71.39], [72.0, 72.76], [75.0, 76.59], [83.0, 83.66], [84.0, 84.74], [85.0, 85.78]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 91.64, 0.0, 85.72, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.11, 1.02, 1.02, 0.32, 2.68, 1.34, 2.76, 0.38, 1.63, 0.48, 0.33, -0.26, 1.12, 0.89, 0.46, 0.61, 0.77, -0.13, 1.31, -0.37, 0.35, 1.39, 0.76, 1.59, 0.66, 0.74, 0.78]} \ No newline at end of file diff --git a/annotations_1/zm9XOZXVyyU_filtered.json b/annotations_1/zm9XOZXVyyU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..687b7256c0efe3ffe1985c1c0dfbd29af734eb49 --- /dev/null +++ b/annotations_1/zm9XOZXVyyU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[12.0, 12.73], [18.0, 18.42], [24.0, 28.22], [32.0, 32.68], [34.0, 37.84], [39.0, 38.99], [39.0, 46.03], [56.0, 56.39], [59.0, 61.91], [64.0, 69.04], [69.0, 70.16], [73.0, 75.44], [78.0, 85.18], [88.0, 93.43], [100.0, 103.99], [107.0, 130.59], [133.0, 134.23], [144.0, 147.24], [149.0, 150.23], [155.0, 155.49], [156.0, 155.53], [161.0, 161.33], [166.0, 166.75]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, true, false, true, true, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 45.46, 0.0, 96.77, 0.0, 30.62, 0.0, 91.81, 30.32, 0.0, 31.55, 30.01, 29.52, 29.41, 28.44, 0.0, 29.83, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, [["speech", 66.61], ["sine wave", 6.4], ["chirp tone", 5.55]], null, null, null, [["speech", 64.98], ["whack, thwack", 9.29], ["fart", 4.29]], null, null, [["moo", 28.81], ["cattle, bovinae", 25.17], ["livestock, farm animals, working animals", 16.67]], null, [["speech", 49.1], ["music", 11.6], ["didgeridoo", 10.57]], [["cattle, bovinae", 22.05], ["livestock, farm animals, working animals", 20.87], ["moo", 20.06]], [["speech", 88.07], ["whack, thwack", 1.09], ["electric shaver, electric razor", 1.01]], [["cattle, bovinae", 25.34], ["livestock, farm animals, working animals", 18.59], ["moo", 17.69]], [["speech", 27.43], ["groan", 11.18], ["whimper", 10.59]], null, [["boing", 66.12], ["speech", 13.16], ["music", 11.66]], null, null, null, null, null], "duration": [0.73, 0.42, 4.22, 0.68, 3.84, -0.01, 7.03, 0.39, 2.91, 5.04, 1.16, 2.44, 7.18, 5.43, 3.99, 23.59, 1.23, 3.24, 1.23, 0.49, -0.47, 0.33, 0.75]} \ No newline at end of file diff --git a/annotations_1/zmdsY7PIJDg_filtered.json b/annotations_1/zmdsY7PIJDg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..873f357a085476d044b49dda4a19cdceadfdf64d --- /dev/null +++ b/annotations_1/zmdsY7PIJDg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 6.03], [8.0, 8.23], [10.0, 10.32], [16.0, 16.29], [22.0, 34.96], [36.0, 39.56], [45.0, 47.68], [56.0, 56.89], [59.0, 59.66], [61.0, 62.55], [63.0, 68.59], [70.0, 75.84], [82.0, 82.61], [88.0, 90.9], [92.0, 93.28], [95.0, 97.66], [98.0, 106.98], [112.0, 112.73], [114.0, 114.81], [115.0, 115.91], [118.0, 120.02], [127.0, 136.81], [137.0, 137.02], [138.0, 138.21], [139.0, 139.29], [144.0, 144.42], [154.0, 154.52], [159.0, 159.39], [160.0, 161.2]], "keep_status": [false, false, false, false, true, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [68.02, 0.0, 0.0, 0.0, 45.82, 55.53, 64.18, 0.0, 0.0, 0.0, 37.31, 55.96, 0.0, 67.89, 0.0, 46.54, 54.36, 0.0, 0.0, 0.0, 99.31, 48.1, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["hum", 29.95], ["music", 23.74], ["synthesizer", 8.15]], null, null, null, null, null, [["music", 23.49], ["didgeridoo", 11.53], ["fart", 9.32]], null, null, null, null, [["speech", 34.32], ["music", 22.25], ["hum", 8.89]], null, null, null, null, null, [["speech", 67.05], ["sidetone", 17.81], ["radio", 3.27]], null, null, null, null, null, null, null], "duration": [3.03, 0.23, 0.32, 0.29, 12.96, 3.56, 2.68, 0.89, 0.66, 1.55, 5.59, 5.84, 0.61, 2.9, 1.28, 2.66, 8.98, 0.73, 0.81, 0.91, 2.02, 9.81, 0.02, 0.21, 0.29, 0.42, 0.52, 0.39, 1.2]} \ No newline at end of file diff --git a/annotations_1/zn9D_4bE0hM_filtered.json b/annotations_1/zn9D_4bE0hM_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..3bf0eed22d73b7da91468465c1c9682f6a578998 --- /dev/null +++ b/annotations_1/zn9D_4bE0hM_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[91.0, 118.27]], "keep_status": [false], "silence_prob": [30.61], "audiomae_on_audioset": [[["speech", 46.01], ["singing bowl", 21.49], ["rumble", 14.68]]], "duration": [27.27]} \ No newline at end of file diff --git a/annotations_1/zoo3aMvQdMw_filtered.json b/annotations_1/zoo3aMvQdMw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..c8f0dd9cc5ed72beebfb25cdde60ce64d6e583a7 --- /dev/null +++ b/annotations_1/zoo3aMvQdMw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[30.0, 31.46], [33.0, 34.52], [37.0, 37.67], [39.0, 39.92], [42.0, 43.66], [44.0, 48.95], [50.0, 51.02], [55.0, 55.02], [56.0, 56.94], [59.0, 58.94], [59.0, 60.52], [63.0, 64.34], [71.0, 71.61], [72.0, 75.56], [76.0, 77.23], [79.0, 97.41], [101.0, 101.17], [102.0, 105.36], [106.0, 107.2], [111.0, 111.86], [114.0, 115.45], [117.0, 117.69], [123.0, 124.77], [129.0, 129.41], [132.0, 132.46], [133.0, 135.41], [136.0, 136.76], [139.0, 141.89], [143.0, 143.48], [144.0, 145.44], [147.0, 149.45], [152.0, 152.83], [158.0, 160.3], [160.0, 161.16]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false, false, false, false, false, false, false, false, true, false, false, false, false, true, false, true, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 99.94, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.16, 0.0, 36.68, 0.0, 61.18, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.67, 0.0, 33.74, 0.0, 0.0, 39.72, 0.0, 31.86, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 49.82], ["didgeridoo", 8.02], ["musical instrument", 6.03]], null, null, null, null, null, null, null, null, null, [["music", 25.95], ["speech", 25.0], ["fireworks", 3.36]], null, [["music", 63.08], ["hum", 11.49], ["throbbing", 8.7]], null, null, [["music", 52.23], ["hum", 7.95], ["didgeridoo", 4.9]], null, [["music", 37.81], ["speech", 13.2], ["rumble", 7.93]], null], "duration": [1.46, 1.52, 0.67, 0.92, 1.66, 4.95, 1.02, 0.02, 0.94, -0.06, 1.52, 1.34, 0.61, 3.56, 1.23, 18.41, 0.17, 3.36, 1.2, 0.86, 1.45, 0.69, 1.77, 0.41, 0.46, 2.41, 0.76, 2.89, 0.48, 1.44, 2.45, 0.83, 2.3, 1.16]} \ No newline at end of file diff --git a/annotations_1/zpsNG-exYxE_filtered.json b/annotations_1/zpsNG-exYxE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..ffa25eeb2ace972a2bdfcc19929d10531d233c49 --- /dev/null +++ b/annotations_1/zpsNG-exYxE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[6.0, 6.98], [8.0, 10.22], [11.0, 12.73], [13.0, 13.83], [16.0, 16.29], [25.0, 25.0], [26.0, 26.11], [41.0, 41.49], [45.0, 46.57], [48.0, 48.1], [49.0, 49.99], [51.0, 51.04], [53.0, 54.63], [55.0, 57.79], [58.0, 58.56], [59.0, 60.98], [61.0, 62.11], [63.0, 68.79], [71.0, 71.51], [78.0, 79.49]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true, false, false], "silence_prob": [0.0, 85.54, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.9, 0.0, 0.0, 0.0, 36.62, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 27.15], ["hum", 27.09], ["speech", 21.78]], null, null, null, [["music", 60.65], ["musical instrument", 3.62], ["throbbing", 3.28]], null, null], "duration": [0.98, 2.22, 1.73, 0.83, 0.29, 0.0, 0.11, 0.49, 1.57, 0.1, 0.99, 0.04, 1.63, 2.79, 0.56, 1.98, 1.11, 5.79, 0.51, 1.49]} \ No newline at end of file diff --git a/annotations_1/zqv3YesdtRU_filtered.json b/annotations_1/zqv3YesdtRU_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..4e46633e0a9608bffbc2bb9d55775657827a856d --- /dev/null +++ b/annotations_1/zqv3YesdtRU_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[10.0, 31.23], [51.0, 52.14], [56.0, 59.0], [63.0, 65.58], [80.0, 82.43], [88.0, 103.64], [105.0, 110.76], [111.0, 111.32], [131.0, 133.64], [148.0, 150.74], [165.0, 171.0], [178.0, 178.36], [222.0, 222.62], [226.0, 226.27], [227.0, 230.05], [231.0, 231.23], [231.0, 232.53]], "keep_status": [false, false, true, true, true, false, false, false, true, true, true, false, false, false, true, false, false], "silence_prob": [30.82, 0.0, 30.48, 30.81, 30.85, 31.52, 30.55, 0.0, 29.96, 30.26, 30.67, 0.0, 0.0, 0.0, 30.03, 0.0, 0.0], "audiomae_on_audioset": [[["music", 58.25], ["theremin", 28.77], ["hum", 1.23]], null, [["music", 55.55], ["electronic music", 3.6], ["trance music", 3.58]], [["music", 45.35], ["house music", 3.26], ["electronic music", 2.66]], [["music", 58.57], ["house music", 5.15], ["sampler", 4.22]], [["music", 81.06], ["disco", 2.49], ["theremin", 1.87]], [["music", 76.13], ["christmas music", 1.51], ["singing", 1.48]], null, [["music", 60.66], ["sampler", 3.84], ["electronic music", 2.3]], [["music", 56.65], ["singing", 2.41], ["electronic music", 2.29]], [["music", 61.96], ["swing music", 3.14], ["singing", 1.85]], null, null, null, [["music", 56.47], ["electronic music", 3.05], ["house music", 2.65]], null, null], "duration": [21.23, 1.14, 3.0, 2.58, 2.43, 15.64, 5.76, 0.32, 2.64, 2.74, 6.0, 0.36, 0.62, 0.27, 3.05, 0.23, 1.53]} \ No newline at end of file diff --git a/annotations_1/zt4ek_5zQgY_filtered.json b/annotations_1/zt4ek_5zQgY_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..e1fa1eb83283b29ab0de35a7d7037058e86e666a --- /dev/null +++ b/annotations_1/zt4ek_5zQgY_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 4.19], [6.0, 7.37], [9.0, 10.05], [11.0, 13.78], [14.0, 24.29], [25.0, 26.5], [27.0, 29.39], [30.0, 33.25], [34.0, 36.64], [37.0, 38.1], [40.0, 41.98], [43.0, 45.25], [46.0, 48.64], [50.0, 54.46], [55.0, 63.8], [64.0, 68.01], [69.0, 70.98], [72.0, 74.24], [75.0, 76.94], [78.0, 78.97], [81.0, 82.24], [83.0, 86.24], [88.0, 88.82], [90.0, 90.88], [92.0, 92.64], [94.0, 95.66], [97.0, 98.81], [99.0, 101.87], [104.0, 105.43], [110.0, 112.63], [113.0, 119.45], [121.0, 123.43], [124.0, 126.28], [128.0, 133.07]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 100.0, 100.0, 0.0, 100.0, 99.84, 100.0, 0.0, 0.0, 100.0, 100.0, 100.0, 100.0, 99.96, 0.0, 100.0, 0.0, 0.0, 0.0, 99.76, 0.0, 0.0, 0.0, 0.0, 0.0, 98.66, 0.0, 100.0, 100.0, 100.0, 99.73, 99.98], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.19, 1.37, 1.05, 2.78, 10.29, 1.5, 2.39, 3.25, 2.64, 1.1, 1.98, 2.25, 2.64, 4.46, 8.8, 4.01, 1.98, 2.24, 1.94, 0.97, 1.24, 3.24, 0.82, 0.88, 0.64, 1.66, 1.81, 2.87, 1.43, 2.63, 6.45, 2.43, 2.28, 5.07]} \ No newline at end of file diff --git a/annotations_1/zuSBq10_5go_filtered.json b/annotations_1/zuSBq10_5go_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..bd4f2dbe2da2fc2f9b7d0ccd785ec1490d23f442 --- /dev/null +++ b/annotations_1/zuSBq10_5go_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 74.06], [76.0, 78.75], [80.0, 108.72], [112.0, 114.44], [115.0, 117.64], [120.0, 123.38], [125.0, 125.25], [125.0, 146.87], [150.0, 157.32], [159.0, 159.7], [160.0, 186.06]], "keep_status": [false, false, true, true, true, true, false, false, true, false, false], "silence_prob": [0.0, 33.11, 29.49, 33.53, 34.85, 31.3, 0.0, 29.32, 43.25, 0.0, 28.63], "audiomae_on_audioset": [null, [["music", 48.98], ["theremin", 22.42], ["synthesizer", 5.4]], [["music", 18.53], ["hum", 18.42], ["mains hum", 17.62]], [["hum", 32.92], ["throbbing", 18.66], ["music", 17.06]], [["speech", 42.9], ["music", 21.08], ["mains hum", 4.84]], [["hum", 35.68], ["throbbing", 18.67], ["music", 12.81]], null, [["music", 60.94], ["speech", 31.12], ["hum", 1.08]], [["bee, wasp, etc.", 34.34], ["fly, housefly", 15.97], ["insect", 13.76]], null, [["music", 44.69], ["whale vocalization", 34.19], ["speech", 3.31]]], "duration": [71.06, 2.75, 28.72, 2.44, 2.64, 3.38, 0.25, 21.87, 7.32, 0.7, 26.06]} \ No newline at end of file diff --git a/annotations_1/zvGA7DNmxmw_filtered.json b/annotations_1/zvGA7DNmxmw_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..9b97e8f639be9245012af6f24507e7ef9a6ccaf1 --- /dev/null +++ b/annotations_1/zvGA7DNmxmw_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[8.0, 8.48], [12.0, 11.72], [14.0, 15.01], [23.0, 24.92], [31.0, 33.22], [34.0, 35.34], [45.0, 46.26], [60.0, 61.15], [67.0, 67.91], [71.0, 71.93], [83.0, 85.5], [87.0, 88.43], [99.0, 99.59], [102.0, 102.19], [112.0, 118.2], [120.0, 121.53], [123.0, 123.75], [126.0, 126.4], [128.0, 128.83]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 49.68, 0.0, 0.0, 0.0, 0.0, 0.0, 71.87, 0.0, 0.0, 0.0, 57.97, 0.0, 0.0, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, [["fly, housefly", 80.51], ["insect", 12.19], ["bee, wasp, etc.", 5.25]], null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [0.48, -0.28, 1.01, 1.92, 2.22, 1.34, 1.26, 1.15, 0.91, 0.93, 2.5, 1.43, 0.59, 0.19, 6.2, 1.53, 0.75, 0.4, 0.83]} \ No newline at end of file diff --git a/annotations_1/zvY-EPgYB4Y_filtered.json b/annotations_1/zvY-EPgYB4Y_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..93a9ec78a2087389feb0393c9a7fbc25eb2842a9 --- /dev/null +++ b/annotations_1/zvY-EPgYB4Y_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[2.0, 2.29], [3.0, 4.11], [9.0, 9.37], [13.0, 13.76], [16.0, 17.83], [22.0, 22.81], [24.0, 48.84], [50.0, 94.53], [97.0, 98.02], [101.0, 101.65], [106.0, 111.57], [112.0, 116.29], [119.0, 128.46], [130.0, 130.59], [131.0, 131.35], [132.0, 188.01], [188.0, 199.59], [201.0, 215.6]], "keep_status": [false, false, false, false, false, false, true, false, false, false, false, true, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.65, 0.0, 0.0, 0.0, 81.71, 46.79, 43.64, 0.0, 0.0, 0.0, 33.32, 31.67], "audiomae_on_audioset": [null, null, null, null, null, null, [["music", 38.2], ["fart", 19.05], ["groan", 8.82]], null, null, null, null, [["speech", 41.3], ["busy signal", 16.44], ["sonar", 8.47]], [["music", 45.41], ["speech", 26.43], ["timpani", 9.47]], null, null, null, [["music", 81.91], ["speech", 2.4], ["throbbing", 1.25]], [["gong", 33.87], ["music", 27.45], ["didgeridoo", 5.64]]], "duration": [0.29, 1.11, 0.37, 0.76, 1.83, 0.81, 24.84, 44.53, 1.02, 0.65, 5.57, 4.29, 9.46, 0.59, 0.35, 56.01, 11.59, 14.6]} \ No newline at end of file diff --git a/annotations_1/zvn05TBxdUo_filtered.json b/annotations_1/zvn05TBxdUo_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..b73e233c874ff9f8610a6e5aecddca80c8ad7518 --- /dev/null +++ b/annotations_1/zvn05TBxdUo_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.38], [4.0, 4.94], [8.0, 9.24], [12.0, 13.46], [18.0, 19.13], [23.0, 24.61], [27.0, 26.92], [27.0, 27.46], [28.0, 29.94], [31.0, 31.58], [33.0, 39.14], [40.0, 42.82], [49.0, 49.17], [50.0, 51.14], [52.0, 53.23], [56.0, 58.02], [58.0, 61.38], [63.0, 72.94], [76.0, 76.72], [80.0, 81.09], [82.0, 83.52], [90.0, 90.31], [93.0, 98.63], [102.0, 112.38], [113.0, 122.37], [123.0, 123.57], [127.0, 128.41]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.24, 72.75, 0.0, 0.0, 0.0, 99.96, 50.02, 77.03, 0.0, 0.0, 0.0, 0.0, 28.52, 28.33, 28.4, 0.0, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 62.08], ["rattle (instrument)", 15.43], ["afrobeat", 5.48]], [["music", 79.4], ["musical instrument", 3.95], ["rattle (instrument)", 2.66]], [["music", 78.96], ["crowd", 6.03], ["didgeridoo", 1.42]], null, null], "duration": [0.38, 0.94, 1.24, 1.46, 1.13, 1.61, -0.08, 0.46, 1.94, 0.58, 6.14, 2.82, 0.17, 1.14, 1.23, 2.02, 3.38, 9.94, 0.72, 1.09, 1.52, 0.31, 5.63, 10.38, 9.37, 0.57, 1.41]} \ No newline at end of file diff --git a/annotations_1/zvy5tDkETfQ_filtered.json b/annotations_1/zvy5tDkETfQ_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..8621e24c1c7227f0cd8b5f665cd5302a6b191575 --- /dev/null +++ b/annotations_1/zvy5tDkETfQ_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[5.0, 6.12], [6.0, 7.89], [9.0, 9.8], [14.0, 15.42], [18.0, 18.6], [22.0, 21.91], [38.0, 38.47], [43.0, 43.8], [46.0, 46.6], [53.0, 53.22], [55.0, 55.8], [58.0, 61.7], [63.0, 63.8], [65.0, 65.18], [68.0, 69.38], [72.0, 73.16], [74.0, 75.32], [91.0, 91.02], [104.0, 107.37], [108.0, 110.52], [112.0, 113.41], [116.0, 117.26], [120.0, 123.96]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 96.77, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 79.94, 99.62, 0.0, 0.0, 81.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null], "duration": [1.12, 1.89, 0.8, 1.42, 0.6, -0.09, 0.47, 0.8, 0.6, 0.22, 0.8, 3.7, 0.8, 0.18, 1.38, 1.16, 1.32, 0.02, 3.37, 2.52, 1.41, 1.26, 3.96]} \ No newline at end of file diff --git a/annotations_1/zwLOflhZOBg_filtered.json b/annotations_1/zwLOflhZOBg_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..a63fa83055958229deaf04000361d14d43157457 --- /dev/null +++ b/annotations_1/zwLOflhZOBg_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [], "keep_status": [], "silence_prob": [], "audiomae_on_audioset": [], "duration": []} \ No newline at end of file diff --git a/annotations_1/zyaOnPSzcPE_filtered.json b/annotations_1/zyaOnPSzcPE_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..2f911bf6965c59c502089caa840213b5a7ce3eaf --- /dev/null +++ b/annotations_1/zyaOnPSzcPE_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[9.0, 10.02], [12.0, 13.91], [15.0, 36.73], [41.0, 42.21], [42.0, 42.25], [42.0, 42.28], [51.0, 52.19], [53.0, 56.62], [58.0, 58.08], [68.0, 68.62], [78.0, 78.75], [80.0, 81.21], [83.0, 83.15], [85.0, 85.24], [88.0, 91.0], [97.0, 104.73]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, true], "silence_prob": [0.0, 0.0, 95.51, 0.0, 0.0, 0.0, 0.0, 51.88, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.86, 38.37], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 65.47], ["speech", 10.87], ["quack", 9.39]], [["music", 48.78], ["quack", 11.76], ["speech", 6.76]]], "duration": [1.02, 1.91, 21.73, 1.21, 0.25, 0.28, 1.19, 3.62, 0.08, 0.62, 0.75, 1.21, 0.15, 0.24, 3.0, 7.73]} \ No newline at end of file diff --git a/annotations_1/zzORtbUYE4c_filtered.json b/annotations_1/zzORtbUYE4c_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..d361ec5e7b61ac63e8d7085a2ea8337083af0702 --- /dev/null +++ b/annotations_1/zzORtbUYE4c_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[1.0, 1.19], [6.0, 6.61], [10.0, 12.99], [14.0, 15.33], [16.0, 20.09], [25.0, 33.64], [34.0, 33.88], [34.0, 36.39], [40.0, 43.48], [43.0, 43.58], [44.0, 44.2], [44.0, 90.39], [91.0, 93.31], [95.0, 95.79], [97.0, 98.09], [98.0, 100.01], [101.0, 102.69], [104.0, 104.89], [106.0, 106.42], [110.0, 109.93], [111.0, 113.12], [114.0, 118.44], [120.0, 121.14], [122.0, 121.56], [122.0, 122.74], [126.0, 127.26], [129.0, 141.45], [143.0, 152.39], [154.0, 154.26]], "keep_status": [false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], "silence_prob": [0.0, 0.0, 99.9, 0.0, 99.93, 62.27, 0.0, 95.78, 92.15, 0.0, 0.0, 0.0, 65.44, 0.0, 0.0, 50.02, 0.0, 0.0, 0.0, 0.0, 54.1, 56.4, 0.0, 0.0, 0.0, 0.0, 56.33, 44.57, 0.0], "audiomae_on_audioset": [null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, null, [["music", 65.78], ["guitar", 7.13], ["musical instrument", 5.47]], null], "duration": [0.19, 0.61, 2.99, 1.33, 4.09, 8.64, -0.12, 2.39, 3.48, 0.58, 0.2, 46.39, 2.31, 0.79, 1.09, 2.01, 1.69, 0.89, 0.42, -0.07, 2.12, 4.44, 1.14, -0.44, 0.74, 1.26, 12.45, 9.39, 0.26]} \ No newline at end of file diff --git a/annotations_1/zzabhummvzk_filtered.json b/annotations_1/zzabhummvzk_filtered.json new file mode 100644 index 0000000000000000000000000000000000000000..5e4058f4f0644ad0ce18b59c1c47148017169a7e --- /dev/null +++ b/annotations_1/zzabhummvzk_filtered.json @@ -0,0 +1 @@ +{"non_speech_segments": [[3.0, 11.11], [12.0, 25.95], [28.0, 41.27], [44.0, 50.11], [51.0, 91.44]], "keep_status": [false, true, true, true, false], "silence_prob": [29.57, 29.31, 29.04, 29.33, 0.0], "audiomae_on_audioset": [[["throbbing", 35.11], ["hum", 33.39], ["music", 17.62]], [["car", 26.39], ["vehicle", 20.28], ["music", 12.08]], [["music", 34.13], ["buzz", 9.72], ["hum", 6.72]], [["music", 25.26], ["hum", 17.64], ["mains hum", 11.71]], null], "duration": [8.11, 13.95, 13.27, 6.11, 40.44]} \ No newline at end of file